| // Ceres Solver - A fast non-linear least squares minimizer |
| // Copyright 2010, 2011, 2012 Google Inc. All rights reserved. |
| // http://code.google.com/p/ceres-solver/ |
| // |
| // Redistribution and use in source and binary forms, with or without |
| // modification, are permitted provided that the following conditions are met: |
| // |
| // * Redistributions of source code must retain the above copyright notice, |
| // this list of conditions and the following disclaimer. |
| // * Redistributions in binary form must reproduce the above copyright notice, |
| // this list of conditions and the following disclaimer in the documentation |
| // and/or other materials provided with the distribution. |
| // * Neither the name of Google Inc. nor the names of its contributors may be |
| // used to endorse or promote products derived from this software without |
| // specific prior written permission. |
| // |
| // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" |
| // AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE |
| // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE |
| // ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE |
| // LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR |
| // CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF |
| // SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS |
| // INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN |
| // CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) |
| // ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE |
| // POSSIBILITY OF SUCH DAMAGE. |
| // |
| // Author: sameeragarwal@google.com (Sameer Agarwal) |
| |
| #include <algorithm> |
| #include <ctime> |
| #include <set> |
| #include <vector> |
| |
| #ifndef CERES_NO_CXSPARSE |
| #include "cs.h" |
| #endif // CERES_NO_CXSPARSE |
| |
| #include "Eigen/Dense" |
| #include "ceres/block_random_access_dense_matrix.h" |
| #include "ceres/block_random_access_matrix.h" |
| #include "ceres/block_random_access_sparse_matrix.h" |
| #include "ceres/block_sparse_matrix.h" |
| #include "ceres/block_structure.h" |
| #include "ceres/detect_structure.h" |
| #include "ceres/linear_solver.h" |
| #include "ceres/schur_complement_solver.h" |
| #include "ceres/suitesparse.h" |
| #include "ceres/triplet_sparse_matrix.h" |
| #include "ceres/internal/eigen.h" |
| #include "ceres/internal/port.h" |
| #include "ceres/internal/scoped_ptr.h" |
| #include "ceres/types.h" |
| |
| |
| namespace ceres { |
| namespace internal { |
| |
| LinearSolver::Summary SchurComplementSolver::SolveImpl( |
| BlockSparseMatrixBase* A, |
| const double* b, |
| const LinearSolver::PerSolveOptions& per_solve_options, |
| double* x) { |
| const time_t start_time = time(NULL); |
| if (eliminator_.get() == NULL) { |
| InitStorage(A->block_structure()); |
| DetectStructure(*A->block_structure(), |
| options_.num_eliminate_blocks, |
| &options_.row_block_size, |
| &options_.e_block_size, |
| &options_.f_block_size); |
| eliminator_.reset(CHECK_NOTNULL(SchurEliminatorBase::Create(options_))); |
| eliminator_->Init(options_.num_eliminate_blocks, A->block_structure()); |
| }; |
| const time_t init_time = time(NULL); |
| fill(x, x + A->num_cols(), 0.0); |
| |
| LinearSolver::Summary summary; |
| summary.num_iterations = 1; |
| summary.termination_type = FAILURE; |
| eliminator_->Eliminate(A, b, per_solve_options.D, lhs_.get(), rhs_.get()); |
| const time_t eliminate_time = time(NULL); |
| |
| double* reduced_solution = x + A->num_cols() - lhs_->num_cols(); |
| const bool status = SolveReducedLinearSystem(reduced_solution); |
| const time_t solve_time = time(NULL); |
| |
| if (!status) { |
| return summary; |
| } |
| |
| eliminator_->BackSubstitute(A, b, per_solve_options.D, reduced_solution, x); |
| const time_t backsubstitute_time = time(NULL); |
| summary.termination_type = TOLERANCE; |
| |
| VLOG(2) << "time (sec) total: " << (backsubstitute_time - start_time) |
| << " init: " << (init_time - start_time) |
| << " eliminate: " << (eliminate_time - init_time) |
| << " solve: " << (solve_time - eliminate_time) |
| << " backsubstitute: " << (backsubstitute_time - solve_time); |
| return summary; |
| } |
| |
| // Initialize a BlockRandomAccessDenseMatrix to store the Schur |
| // complement. |
| void DenseSchurComplementSolver::InitStorage( |
| const CompressedRowBlockStructure* bs) { |
| const int num_eliminate_blocks = options().num_eliminate_blocks; |
| const int num_col_blocks = bs->cols.size(); |
| |
| vector<int> blocks(num_col_blocks - num_eliminate_blocks, 0); |
| for (int i = num_eliminate_blocks, j = 0; |
| i < num_col_blocks; |
| ++i, ++j) { |
| blocks[j] = bs->cols[i].size; |
| } |
| |
| set_lhs(new BlockRandomAccessDenseMatrix(blocks)); |
| set_rhs(new double[lhs()->num_rows()]); |
| } |
| |
| // Solve the system Sx = r, assuming that the matrix S is stored in a |
| // BlockRandomAccessDenseMatrix. The linear system is solved using |
| // Eigen's Cholesky factorization. |
| bool DenseSchurComplementSolver::SolveReducedLinearSystem(double* solution) { |
| const BlockRandomAccessDenseMatrix* m = |
| down_cast<const BlockRandomAccessDenseMatrix*>(lhs()); |
| const int num_rows = m->num_rows(); |
| |
| // The case where there are no f blocks, and the system is block |
| // diagonal. |
| if (num_rows == 0) { |
| return true; |
| } |
| |
| // TODO(sameeragarwal): Add proper error handling; this completely ignores |
| // the quality of the solution to the solve. |
| VectorRef(solution, num_rows) = |
| ConstMatrixRef(m->values(), num_rows, num_rows) |
| .selfadjointView<Eigen::Upper>() |
| .ldlt() |
| .solve(ConstVectorRef(rhs(), num_rows)); |
| |
| return true; |
| } |
| |
| |
| SparseSchurComplementSolver::SparseSchurComplementSolver( |
| const LinearSolver::Options& options) |
| : SchurComplementSolver(options) { |
| #ifndef CERES_NO_SUITESPARSE |
| factor_ = NULL; |
| #endif // CERES_NO_SUITESPARSE |
| } |
| |
| SparseSchurComplementSolver::~SparseSchurComplementSolver() { |
| #ifndef CERES_NO_SUITESPARSE |
| if (factor_ != NULL) { |
| ss_.Free(factor_); |
| factor_ = NULL; |
| } |
| #endif // CERES_NO_SUITESPARSE |
| } |
| |
| // Determine the non-zero blocks in the Schur Complement matrix, and |
| // initialize a BlockRandomAccessSparseMatrix object. |
| void SparseSchurComplementSolver::InitStorage( |
| const CompressedRowBlockStructure* bs) { |
| const int num_eliminate_blocks = options().num_eliminate_blocks; |
| const int num_col_blocks = bs->cols.size(); |
| const int num_row_blocks = bs->rows.size(); |
| |
| blocks_.resize(num_col_blocks - num_eliminate_blocks, 0); |
| for (int i = num_eliminate_blocks; i < num_col_blocks; ++i) { |
| blocks_[i - num_eliminate_blocks] = bs->cols[i].size; |
| } |
| |
| set<pair<int, int> > block_pairs; |
| for (int i = 0; i < blocks_.size(); ++i) { |
| block_pairs.insert(make_pair(i, i)); |
| } |
| |
| int r = 0; |
| while (r < num_row_blocks) { |
| int e_block_id = bs->rows[r].cells.front().block_id; |
| if (e_block_id >= num_eliminate_blocks) { |
| break; |
| } |
| vector<int> f_blocks; |
| |
| // Add to the chunk until the first block in the row is |
| // different than the one in the first row for the chunk. |
| for (; r < num_row_blocks; ++r) { |
| const CompressedRow& row = bs->rows[r]; |
| if (row.cells.front().block_id != e_block_id) { |
| break; |
| } |
| |
| // Iterate over the blocks in the row, ignoring the first |
| // block since it is the one to be eliminated. |
| for (int c = 1; c < row.cells.size(); ++c) { |
| const Cell& cell = row.cells[c]; |
| f_blocks.push_back(cell.block_id - num_eliminate_blocks); |
| } |
| } |
| |
| sort(f_blocks.begin(), f_blocks.end()); |
| f_blocks.erase(unique(f_blocks.begin(), f_blocks.end()), f_blocks.end()); |
| for (int i = 0; i < f_blocks.size(); ++i) { |
| for (int j = i + 1; j < f_blocks.size(); ++j) { |
| block_pairs.insert(make_pair(f_blocks[i], f_blocks[j])); |
| } |
| } |
| } |
| |
| // Remaing rows do not contribute to the chunks and directly go |
| // into the schur complement via an outer product. |
| for (; r < num_row_blocks; ++r) { |
| const CompressedRow& row = bs->rows[r]; |
| CHECK_GE(row.cells.front().block_id, num_eliminate_blocks); |
| for (int i = 0; i < row.cells.size(); ++i) { |
| int r_block1_id = row.cells[i].block_id - num_eliminate_blocks; |
| for (int j = 0; j < row.cells.size(); ++j) { |
| int r_block2_id = row.cells[j].block_id - num_eliminate_blocks; |
| if (r_block1_id <= r_block2_id) { |
| block_pairs.insert(make_pair(r_block1_id, r_block2_id)); |
| } |
| } |
| } |
| } |
| |
| set_lhs(new BlockRandomAccessSparseMatrix(blocks_, block_pairs)); |
| set_rhs(new double[lhs()->num_rows()]); |
| } |
| |
| bool SparseSchurComplementSolver::SolveReducedLinearSystem(double* solution) { |
| switch (options().sparse_linear_algebra_library) { |
| case SUITE_SPARSE: |
| return SolveReducedLinearSystemUsingSuiteSparse(solution); |
| case CX_SPARSE: |
| return SolveReducedLinearSystemUsingCXSparse(solution); |
| default: |
| LOG(FATAL) << "Unknown sparse linear algebra library : " |
| << options().sparse_linear_algebra_library; |
| } |
| |
| LOG(FATAL) << "Unknown sparse linear algebra library : " |
| << options().sparse_linear_algebra_library; |
| return false; |
| } |
| |
| #ifndef CERES_NO_SUITESPARSE |
| // Solve the system Sx = r, assuming that the matrix S is stored in a |
| // BlockRandomAccessSparseMatrix. The linear system is solved using |
| // CHOLMOD's sparse cholesky factorization routines. |
| bool SparseSchurComplementSolver::SolveReducedLinearSystemUsingSuiteSparse( |
| double* solution) { |
| const time_t start_time = time(NULL); |
| |
| TripletSparseMatrix* tsm = |
| const_cast<TripletSparseMatrix*>( |
| down_cast<const BlockRandomAccessSparseMatrix*>(lhs())->matrix()); |
| |
| const int num_rows = tsm->num_rows(); |
| |
| // The case where there are no f blocks, and the system is block |
| // diagonal. |
| if (num_rows == 0) { |
| return true; |
| } |
| |
| cholmod_sparse* cholmod_lhs = ss_.CreateSparseMatrix(tsm); |
| // The matrix is symmetric, and the upper triangular part of the |
| // matrix contains the values. |
| cholmod_lhs->stype = 1; |
| const time_t lhs_time = time(NULL); |
| |
| cholmod_dense* cholmod_rhs = |
| ss_.CreateDenseVector(const_cast<double*>(rhs()), num_rows, num_rows); |
| const time_t rhs_time = time(NULL); |
| |
| // Symbolic factorization is computed if we don't already have one handy. |
| if (factor_ == NULL) { |
| if (options().use_block_amd) { |
| factor_ = ss_.BlockAnalyzeCholesky(cholmod_lhs, blocks_, blocks_); |
| } else { |
| factor_ = ss_.AnalyzeCholesky(cholmod_lhs); |
| } |
| } |
| |
| if (VLOG_IS_ON(2)) { |
| cholmod_print_common("Symbolic Analysis", ss_.mutable_cc()); |
| } |
| |
| CHECK_NOTNULL(factor_); |
| |
| const time_t symbolic_time = time(NULL); |
| cholmod_dense* cholmod_solution = |
| ss_.SolveCholesky(cholmod_lhs, factor_, cholmod_rhs); |
| |
| const time_t solve_time = time(NULL); |
| |
| ss_.Free(cholmod_lhs); |
| cholmod_lhs = NULL; |
| ss_.Free(cholmod_rhs); |
| cholmod_rhs = NULL; |
| |
| if (cholmod_solution == NULL) { |
| LOG(ERROR) << "CHOLMOD solve failed."; |
| return false; |
| } |
| |
| VectorRef(solution, num_rows) |
| = VectorRef(static_cast<double*>(cholmod_solution->x), num_rows); |
| ss_.Free(cholmod_solution); |
| const time_t final_time = time(NULL); |
| VLOG(2) << "time: " << (final_time - start_time) |
| << " lhs : " << (lhs_time - start_time) |
| << " rhs: " << (rhs_time - lhs_time) |
| << " analyze: " << (symbolic_time - rhs_time) |
| << " factor_and_solve: " << (solve_time - symbolic_time) |
| << " cleanup: " << (final_time - solve_time); |
| return true; |
| } |
| #else |
| bool SparseSchurComplementSolver::SolveReducedLinearSystemUsingSuiteSparse( |
| double* solution) { |
| LOG(FATAL) << "No SuiteSparse support in Ceres."; |
| return false; |
| } |
| #endif // CERES_NO_SUITESPARSE |
| |
| #ifndef CERES_NO_CXSPARSE |
| // Solve the system Sx = r, assuming that the matrix S is stored in a |
| // BlockRandomAccessSparseMatrix. The linear system is solved using |
| // CXSparse's sparse cholesky factorization routines. |
| bool SparseSchurComplementSolver::SolveReducedLinearSystemUsingCXSparse( |
| double* solution) { |
| // Extract the TripletSparseMatrix that is used for actually storing S. |
| TripletSparseMatrix* tsm = |
| const_cast<TripletSparseMatrix*>( |
| down_cast<const BlockRandomAccessSparseMatrix*>(lhs())->matrix()); |
| |
| const int num_rows = tsm->num_rows(); |
| |
| // The case where there are no f blocks, and the system is block |
| // diagonal. |
| if (num_rows == 0) { |
| return true; |
| } |
| |
| cs_di_sparse tsm_wrapper; |
| tsm_wrapper.nzmax = tsm->num_nonzeros(); |
| tsm_wrapper.m = num_rows; |
| tsm_wrapper.n = num_rows; |
| tsm_wrapper.p = tsm->mutable_cols(); |
| tsm_wrapper.i = tsm->mutable_rows(); |
| tsm_wrapper.x = tsm->mutable_values(); |
| tsm_wrapper.nz = tsm->num_nonzeros(); |
| |
| cs_di_sparse* lhs = cs_compress(&tsm_wrapper); |
| VectorRef(solution, num_rows) = ConstVectorRef(rhs(), num_rows); |
| |
| // It maybe worth caching the ordering here, but for now we are |
| // going to go with the simple cholsol based implementation. |
| int ok = cs_di_cholsol(1, lhs, solution); |
| cs_free(lhs); |
| return ok; |
| } |
| #else |
| bool SparseSchurComplementSolver::SolveReducedLinearSystemUsingCXSparse( |
| double* solution) { |
| LOG(FATAL) << "No CXSparse support in Ceres."; |
| return false; |
| } |
| #endif // CERES_NO_CXPARSE |
| |
| } // namespace internal |
| } // namespace ceres |