internal/ceres/schur_complement_solver.cc - ceres-solver - Git at Google

 // Ceres Solver - A fast non-linear least squares minimizer
 // Copyright 2022 Google Inc. All rights reserved.
 // http://ceres-solver.org/
 //
 // Redistribution and use in source and binary forms, with or without
 // modification, are permitted provided that the following conditions are met:
 //
 // * Redistributions of source code must retain the above copyright notice,
 //   this list of conditions and the following disclaimer.
 // * Redistributions in binary form must reproduce the above copyright notice,
 //   this list of conditions and the following disclaimer in the documentation
 //   and/or other materials provided with the distribution.
 // * Neither the name of Google Inc. nor the names of its contributors may be
 //   used to endorse or promote products derived from this software without
 //   specific prior written permission.
 //
 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 // AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 // ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 // LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 // CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 // SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 // INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 // CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 // ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 // POSSIBILITY OF SUCH DAMAGE.
 //
 // Author: sameeragarwal@google.com (Sameer Agarwal)

 #include "ceres/schur_complement_solver.h"

 #include <algorithm>
 #include <ctime>
 #include <memory>
 #include <set>
 #include <utility>
 #include <vector>

 #include "Eigen/Dense"
 #include "Eigen/SparseCore"
 #include "ceres/block_random_access_dense_matrix.h"
 #include "ceres/block_random_access_matrix.h"
 #include "ceres/block_random_access_sparse_matrix.h"
 #include "ceres/block_sparse_matrix.h"
 #include "ceres/block_structure.h"
 #include "ceres/conjugate_gradients_solver.h"
 #include "ceres/detect_structure.h"
 #include "ceres/internal/eigen.h"
 #include "ceres/linear_solver.h"
 #include "ceres/sparse_cholesky.h"
 #include "ceres/triplet_sparse_matrix.h"
 #include "ceres/types.h"
 #include "ceres/wall_time.h"

 namespace ceres::internal {
 namespace {

 class BlockRandomAccessSparseMatrixAdapter final
     : public ConjugateGradientsLinearOperator<Vector> {
  public:
   explicit BlockRandomAccessSparseMatrixAdapter(
       const BlockRandomAccessSparseMatrix& m)
       : m_(m) {}

   void RightMultiplyAndAccumulate(const Vector& x, Vector& y) final {
     m_.SymmetricRightMultiplyAndAccumulate(x.data(), y.data());
   }

  private:
   const BlockRandomAccessSparseMatrix& m_;
 };

 class BlockRandomAccessDiagonalMatrixAdapter final
     : public ConjugateGradientsLinearOperator<Vector> {
  public:
   explicit BlockRandomAccessDiagonalMatrixAdapter(
       const BlockRandomAccessDiagonalMatrix& m)
       : m_(m) {}

   // y = y + Ax;
   void RightMultiplyAndAccumulate(const Vector& x, Vector& y) final {
     m_.RightMultiplyAndAccumulate(x.data(), y.data());
   }

  private:
   const BlockRandomAccessDiagonalMatrix& m_;
 };

 }  // namespace

 SchurComplementSolver::SchurComplementSolver(
     const LinearSolver::Options& options)
     : options_(options) {
   CHECK_GT(options.elimination_groups.size(), 1);
   CHECK_GT(options.elimination_groups[0], 0);
   CHECK(options.context != nullptr);
 }

 LinearSolver::Summary SchurComplementSolver::SolveImpl(
     BlockSparseMatrix* A,
     const double* b,
     const LinearSolver::PerSolveOptions& per_solve_options,
     double* x) {
   EventLogger event_logger("SchurComplementSolver::Solve");

   const CompressedRowBlockStructure* bs = A->block_structure();
   if (eliminator_ == nullptr) {
     const int num_eliminate_blocks = options_.elimination_groups[0];
     const int num_f_blocks = bs->cols.size() - num_eliminate_blocks;

     InitStorage(bs);
     DetectStructure(*bs,
                     num_eliminate_blocks,
                     &options_.row_block_size,
                     &options_.e_block_size,
                     &options_.f_block_size);

     // For the special case of the static structure <2,3,6> with
     // exactly one f block use the SchurEliminatorForOneFBlock.
     //
     // TODO(sameeragarwal): A more scalable template specialization
     // mechanism that does not cause binary bloat.
     if (options_.row_block_size == 2 && options_.e_block_size == 3 &&
         options_.f_block_size == 6 && num_f_blocks == 1) {
       eliminator_ = std::make_unique<SchurEliminatorForOneFBlock<2, 3, 6>>();
     } else {
       eliminator_ = SchurEliminatorBase::Create(options_);
     }

     CHECK(eliminator_);
     const bool kFullRankETE = true;
     eliminator_->Init(num_eliminate_blocks, kFullRankETE, bs);
   }

   std::fill(x, x + A->num_cols(), 0.0);
   event_logger.AddEvent("Setup");

   eliminator_->Eliminate(BlockSparseMatrixData(*A),
                          b,
                          per_solve_options.D,
                          lhs_.get(),
                          rhs_.data());
   event_logger.AddEvent("Eliminate");

   double* reduced_solution = x + A->num_cols() - lhs_->num_cols();
   const LinearSolver::Summary summary =
       SolveReducedLinearSystem(per_solve_options, reduced_solution);
   event_logger.AddEvent("ReducedSolve");

   if (summary.termination_type == LinearSolverTerminationType::SUCCESS) {
     eliminator_->BackSubstitute(
         BlockSparseMatrixData(*A), b, per_solve_options.D, reduced_solution, x);
     event_logger.AddEvent("BackSubstitute");
   }

   return summary;
 }
 DenseSchurComplementSolver::DenseSchurComplementSolver(
     const LinearSolver::Options& options)
     : SchurComplementSolver(options),
       cholesky_(DenseCholesky::Create(options)) {}

 DenseSchurComplementSolver::~DenseSchurComplementSolver() = default;

 // Initialize a BlockRandomAccessDenseMatrix to store the Schur
 // complement.
 void DenseSchurComplementSolver::InitStorage(
     const CompressedRowBlockStructure* bs) {
   const int num_eliminate_blocks = options().elimination_groups[0];
   const int num_col_blocks = bs->cols.size();
   auto blocks = Tail(bs->cols, num_col_blocks - num_eliminate_blocks);
   set_lhs(std::make_unique<BlockRandomAccessDenseMatrix>(blocks));
   ResizeRhs(lhs()->num_rows());
 }

 // Solve the system Sx = r, assuming that the matrix S is stored in a
 // BlockRandomAccessDenseMatrix. The linear system is solved using
 // Eigen's Cholesky factorization.
 LinearSolver::Summary DenseSchurComplementSolver::SolveReducedLinearSystem(
     const LinearSolver::PerSolveOptions& per_solve_options, double* solution) {
   LinearSolver::Summary summary;
   summary.num_iterations = 0;
   summary.termination_type = LinearSolverTerminationType::SUCCESS;
   summary.message = "Success.";

   auto* m = down_cast<BlockRandomAccessDenseMatrix*>(mutable_lhs());
   const int num_rows = m->num_rows();

   // The case where there are no f blocks, and the system is block
   // diagonal.
   if (num_rows == 0) {
     return summary;
   }

   summary.num_iterations = 1;
   summary.termination_type = cholesky_->FactorAndSolve(
       num_rows, m->mutable_values(), rhs().data(), solution, &summary.message);
   return summary;
 }

 SparseSchurComplementSolver::SparseSchurComplementSolver(
     const LinearSolver::Options& options)
     : SchurComplementSolver(options) {
   if (options.type != ITERATIVE_SCHUR) {
     sparse_cholesky_ = SparseCholesky::Create(options);
   }
 }

 SparseSchurComplementSolver::~SparseSchurComplementSolver() {
   for (int i = 0; i < 4; ++i) {
     if (scratch_[i]) {
       delete scratch_[i];
       scratch_[i] = nullptr;
     }
   }
 }

 // Determine the non-zero blocks in the Schur Complement matrix, and
 // initialize a BlockRandomAccessSparseMatrix object.
 void SparseSchurComplementSolver::InitStorage(
     const CompressedRowBlockStructure* bs) {
   const int num_eliminate_blocks = options().elimination_groups[0];
   const int num_col_blocks = bs->cols.size();
   const int num_row_blocks = bs->rows.size();

   blocks_ = Tail(bs->cols, num_col_blocks - num_eliminate_blocks);

   std::set<std::pair<int, int>> block_pairs;
   for (int i = 0; i < blocks_.size(); ++i) {
     block_pairs.emplace(i, i);
   }

   int r = 0;
   while (r < num_row_blocks) {
     int e_block_id = bs->rows[r].cells.front().block_id;
     if (e_block_id >= num_eliminate_blocks) {
       break;
     }
     std::vector<int> f_blocks;

     // Add to the chunk until the first block in the row is
     // different than the one in the first row for the chunk.
     for (; r < num_row_blocks; ++r) {
       const CompressedRow& row = bs->rows[r];
       if (row.cells.front().block_id != e_block_id) {
         break;
       }

       // Iterate over the blocks in the row, ignoring the first
       // block since it is the one to be eliminated.
       for (int c = 1; c < row.cells.size(); ++c) {
         const Cell& cell = row.cells[c];
         f_blocks.push_back(cell.block_id - num_eliminate_blocks);
       }
     }

     sort(f_blocks.begin(), f_blocks.end());
     f_blocks.erase(unique(f_blocks.begin(), f_blocks.end()), f_blocks.end());
     for (int i = 0; i < f_blocks.size(); ++i) {
       for (int j = i + 1; j < f_blocks.size(); ++j) {
         block_pairs.emplace(f_blocks[i], f_blocks[j]);
       }
     }
   }

   // Remaining rows do not contribute to the chunks and directly go
   // into the schur complement via an outer product.
   for (; r < num_row_blocks; ++r) {
     const CompressedRow& row = bs->rows[r];
     CHECK_GE(row.cells.front().block_id, num_eliminate_blocks);
     for (int i = 0; i < row.cells.size(); ++i) {
       int r_block1_id = row.cells[i].block_id - num_eliminate_blocks;
       for (const auto& cell : row.cells) {
         int r_block2_id = cell.block_id - num_eliminate_blocks;
         if (r_block1_id <= r_block2_id) {
           block_pairs.emplace(r_block1_id, r_block2_id);
         }
       }
     }
   }

   set_lhs(
       std::make_unique<BlockRandomAccessSparseMatrix>(blocks_, block_pairs));
   ResizeRhs(lhs()->num_rows());
 }

 LinearSolver::Summary SparseSchurComplementSolver::SolveReducedLinearSystem(
     const LinearSolver::PerSolveOptions& per_solve_options, double* solution) {
   if (options().type == ITERATIVE_SCHUR) {
     return SolveReducedLinearSystemUsingConjugateGradients(per_solve_options,
                                                            solution);
   }

   LinearSolver::Summary summary;
   summary.num_iterations = 0;
   summary.termination_type = LinearSolverTerminationType::SUCCESS;
   summary.message = "Success.";

   const TripletSparseMatrix* tsm =
       down_cast<const BlockRandomAccessSparseMatrix*>(lhs())->matrix();
   if (tsm->num_rows() == 0) {
     return summary;
   }

   std::unique_ptr<CompressedRowSparseMatrix> lhs;
   const CompressedRowSparseMatrix::StorageType storage_type =
       sparse_cholesky_->StorageType();
   if (storage_type ==
       CompressedRowSparseMatrix::StorageType::UPPER_TRIANGULAR) {
     lhs = CompressedRowSparseMatrix::FromTripletSparseMatrix(*tsm);
     lhs->set_storage_type(
         CompressedRowSparseMatrix::StorageType::UPPER_TRIANGULAR);
   } else {
     lhs = CompressedRowSparseMatrix::FromTripletSparseMatrixTransposed(*tsm);
     lhs->set_storage_type(
         CompressedRowSparseMatrix::StorageType::LOWER_TRIANGULAR);
   }

   *lhs->mutable_col_blocks() = blocks_;
   *lhs->mutable_row_blocks() = blocks_;

   summary.num_iterations = 1;
   summary.termination_type = sparse_cholesky_->FactorAndSolve(
       lhs.get(), rhs().data(), solution, &summary.message);
   return summary;
 }

 LinearSolver::Summary
 SparseSchurComplementSolver::SolveReducedLinearSystemUsingConjugateGradients(
     const LinearSolver::PerSolveOptions& per_solve_options, double* solution) {
   CHECK(options().use_explicit_schur_complement);
   const int num_rows = lhs()->num_rows();
   // The case where there are no f blocks, and the system is block
   // diagonal.
   if (num_rows == 0) {
     LinearSolver::Summary summary;
     summary.num_iterations = 0;
     summary.termination_type = LinearSolverTerminationType::SUCCESS;
     summary.message = "Success.";
     return summary;
   }

   // Only SCHUR_JACOBI is supported over here right now.
   CHECK_EQ(options().preconditioner_type, SCHUR_JACOBI);

   if (preconditioner_ == nullptr) {
     preconditioner_ =
         std::make_unique<BlockRandomAccessDiagonalMatrix>(blocks_);
   }

   auto* sc = down_cast<BlockRandomAccessSparseMatrix*>(mutable_lhs());

   // Extract block diagonal from the Schur complement to construct the
   // schur_jacobi preconditioner.
   for (int i = 0; i < blocks_.size(); ++i) {
     const int block_size = blocks_[i].size;

     int sc_r, sc_c, sc_row_stride, sc_col_stride;
     CellInfo* sc_cell_info =
         sc->GetCell(i, i, &sc_r, &sc_c, &sc_row_stride, &sc_col_stride);
     CHECK(sc_cell_info != nullptr);
     MatrixRef sc_m(sc_cell_info->values, sc_row_stride, sc_col_stride);

     int pre_r, pre_c, pre_row_stride, pre_col_stride;
     CellInfo* pre_cell_info = preconditioner_->GetCell(
         i, i, &pre_r, &pre_c, &pre_row_stride, &pre_col_stride);
     CHECK(pre_cell_info != nullptr);
     MatrixRef pre_m(pre_cell_info->values, pre_row_stride, pre_col_stride);

     pre_m.block(pre_r, pre_c, block_size, block_size) =
         sc_m.block(sc_r, sc_c, block_size, block_size);
   }
   preconditioner_->Invert();

   VectorRef(solution, num_rows).setZero();

   auto lhs = std::make_unique<BlockRandomAccessSparseMatrixAdapter>(*sc);
   auto preconditioner =
       std::make_unique<BlockRandomAccessDiagonalMatrixAdapter>(
           *preconditioner_);

   ConjugateGradientsSolverOptions cg_options;
   cg_options.min_num_iterations = options().min_num_iterations;
   cg_options.max_num_iterations = options().max_num_iterations;
   cg_options.residual_reset_period = options().residual_reset_period;
   cg_options.q_tolerance = per_solve_options.q_tolerance;
   cg_options.r_tolerance = per_solve_options.r_tolerance;

   cg_solution_ = Vector::Zero(sc->num_rows());
   for (int i = 0; i < 4; ++i) {
     if (scratch_[i] == nullptr) {
       scratch_[i] = new Vector(sc->num_rows());
     }
   }
   auto summary = ConjugateGradientsSolver<Vector>(
       cg_options, *lhs, rhs(), *preconditioner, scratch_, cg_solution_);
   VectorRef(solution, sc->num_rows()) = cg_solution_;
   return summary;
 }

 }  // namespace ceres::internal
	// Ceres Solver - A fast non-linear least squares minimizer
	// Copyright 2022 Google Inc. All rights reserved.
	// http://ceres-solver.org/
	//
	// Redistribution and use in source and binary forms, with or without
	// modification, are permitted provided that the following conditions are met:
	//
	// * Redistributions of source code must retain the above copyright notice,
	// this list of conditions and the following disclaimer.
	// * Redistributions in binary form must reproduce the above copyright notice,
	// this list of conditions and the following disclaimer in the documentation
	// and/or other materials provided with the distribution.
	// * Neither the name of Google Inc. nor the names of its contributors may be
	// used to endorse or promote products derived from this software without
	// specific prior written permission.
	//
	// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
	// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
	// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
	// ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
	// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
	// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
	// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
	// INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
	// CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
	// ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
	// POSSIBILITY OF SUCH DAMAGE.
	//
	// Author: sameeragarwal@google.com (Sameer Agarwal)

	#include "ceres/schur_complement_solver.h"

	#include <algorithm>
	#include <ctime>
	#include <memory>
	#include <set>
	#include <utility>
	#include <vector>

	#include "Eigen/Dense"
	#include "Eigen/SparseCore"
	#include "ceres/block_random_access_dense_matrix.h"
	#include "ceres/block_random_access_matrix.h"
	#include "ceres/block_random_access_sparse_matrix.h"
	#include "ceres/block_sparse_matrix.h"
	#include "ceres/block_structure.h"
	#include "ceres/conjugate_gradients_solver.h"
	#include "ceres/detect_structure.h"
	#include "ceres/internal/eigen.h"
	#include "ceres/linear_solver.h"
	#include "ceres/sparse_cholesky.h"
	#include "ceres/triplet_sparse_matrix.h"
	#include "ceres/types.h"
	#include "ceres/wall_time.h"

	namespace ceres::internal {
	namespace {

	class BlockRandomAccessSparseMatrixAdapter final
	: public ConjugateGradientsLinearOperator<Vector> {
	public:
	explicit BlockRandomAccessSparseMatrixAdapter(
	const BlockRandomAccessSparseMatrix& m)
	: m_(m) {}

	void RightMultiplyAndAccumulate(const Vector& x, Vector& y) final {
	m_.SymmetricRightMultiplyAndAccumulate(x.data(), y.data());
	}

	private:
	const BlockRandomAccessSparseMatrix& m_;
	};

	class BlockRandomAccessDiagonalMatrixAdapter final
	: public ConjugateGradientsLinearOperator<Vector> {
	public:
	explicit BlockRandomAccessDiagonalMatrixAdapter(
	const BlockRandomAccessDiagonalMatrix& m)
	: m_(m) {}

	// y = y + Ax;
	void RightMultiplyAndAccumulate(const Vector& x, Vector& y) final {
	m_.RightMultiplyAndAccumulate(x.data(), y.data());
	}

	private:
	const BlockRandomAccessDiagonalMatrix& m_;
	};

	} // namespace

	SchurComplementSolver::SchurComplementSolver(
	const LinearSolver::Options& options)
	: options_(options) {
	CHECK_GT(options.elimination_groups.size(), 1);
	CHECK_GT(options.elimination_groups[0], 0);
	CHECK(options.context != nullptr);
	}

	LinearSolver::Summary SchurComplementSolver::SolveImpl(
	BlockSparseMatrix* A,
	const double* b,
	const LinearSolver::PerSolveOptions& per_solve_options,
	double* x) {
	EventLogger event_logger("SchurComplementSolver::Solve");

	const CompressedRowBlockStructure* bs = A->block_structure();
	if (eliminator_ == nullptr) {
	const int num_eliminate_blocks = options_.elimination_groups[0];
	const int num_f_blocks = bs->cols.size() - num_eliminate_blocks;

	InitStorage(bs);
	DetectStructure(*bs,
	num_eliminate_blocks,
	&options_.row_block_size,
	&options_.e_block_size,
	&options_.f_block_size);

	// For the special case of the static structure <2,3,6> with
	// exactly one f block use the SchurEliminatorForOneFBlock.
	//
	// TODO(sameeragarwal): A more scalable template specialization
	// mechanism that does not cause binary bloat.
	if (options_.row_block_size == 2 && options_.e_block_size == 3 &&
	options_.f_block_size == 6 && num_f_blocks == 1) {
	eliminator_ = std::make_unique<SchurEliminatorForOneFBlock<2, 3, 6>>();
	} else {
	eliminator_ = SchurEliminatorBase::Create(options_);
	}

	CHECK(eliminator_);
	const bool kFullRankETE = true;
	eliminator_->Init(num_eliminate_blocks, kFullRankETE, bs);
	}

	std::fill(x, x + A->num_cols(), 0.0);
	event_logger.AddEvent("Setup");

	eliminator_->Eliminate(BlockSparseMatrixData(*A),
	b,
	per_solve_options.D,
	lhs_.get(),
	rhs_.data());
	event_logger.AddEvent("Eliminate");

	double* reduced_solution = x + A->num_cols() - lhs_->num_cols();
	const LinearSolver::Summary summary =
	SolveReducedLinearSystem(per_solve_options, reduced_solution);
	event_logger.AddEvent("ReducedSolve");

	if (summary.termination_type == LinearSolverTerminationType::SUCCESS) {
	eliminator_->BackSubstitute(
	BlockSparseMatrixData(*A), b, per_solve_options.D, reduced_solution, x);
	event_logger.AddEvent("BackSubstitute");
	}

	return summary;
	}
	DenseSchurComplementSolver::DenseSchurComplementSolver(
	const LinearSolver::Options& options)
	: SchurComplementSolver(options),
	cholesky_(DenseCholesky::Create(options)) {}

	DenseSchurComplementSolver::~DenseSchurComplementSolver() = default;

	// Initialize a BlockRandomAccessDenseMatrix to store the Schur
	// complement.
	void DenseSchurComplementSolver::InitStorage(
	const CompressedRowBlockStructure* bs) {
	const int num_eliminate_blocks = options().elimination_groups[0];
	const int num_col_blocks = bs->cols.size();
	auto blocks = Tail(bs->cols, num_col_blocks - num_eliminate_blocks);
	set_lhs(std::make_unique<BlockRandomAccessDenseMatrix>(blocks));
	ResizeRhs(lhs()->num_rows());
	}

	// Solve the system Sx = r, assuming that the matrix S is stored in a
	// BlockRandomAccessDenseMatrix. The linear system is solved using
	// Eigen's Cholesky factorization.
	LinearSolver::Summary DenseSchurComplementSolver::SolveReducedLinearSystem(
	const LinearSolver::PerSolveOptions& per_solve_options, double* solution) {
	LinearSolver::Summary summary;
	summary.num_iterations = 0;
	summary.termination_type = LinearSolverTerminationType::SUCCESS;
	summary.message = "Success.";

	auto* m = down_cast<BlockRandomAccessDenseMatrix*>(mutable_lhs());
	const int num_rows = m->num_rows();

	// The case where there are no f blocks, and the system is block
	// diagonal.
	if (num_rows == 0) {
	return summary;
	}

	summary.num_iterations = 1;
	summary.termination_type = cholesky_->FactorAndSolve(
	num_rows, m->mutable_values(), rhs().data(), solution, &summary.message);
	return summary;
	}

	SparseSchurComplementSolver::SparseSchurComplementSolver(
	const LinearSolver::Options& options)
	: SchurComplementSolver(options) {
	if (options.type != ITERATIVE_SCHUR) {
	sparse_cholesky_ = SparseCholesky::Create(options);
	}
	}

	SparseSchurComplementSolver::~SparseSchurComplementSolver() {
	for (int i = 0; i < 4; ++i) {
	if (scratch_[i]) {
	delete scratch_[i];
	scratch_[i] = nullptr;
	}
	}
	}

	// Determine the non-zero blocks in the Schur Complement matrix, and
	// initialize a BlockRandomAccessSparseMatrix object.
	void SparseSchurComplementSolver::InitStorage(
	const CompressedRowBlockStructure* bs) {
	const int num_eliminate_blocks = options().elimination_groups[0];
	const int num_col_blocks = bs->cols.size();
	const int num_row_blocks = bs->rows.size();

	blocks_ = Tail(bs->cols, num_col_blocks - num_eliminate_blocks);

	std::set<std::pair<int, int>> block_pairs;
	for (int i = 0; i < blocks_.size(); ++i) {
	block_pairs.emplace(i, i);
	}

	int r = 0;
	while (r < num_row_blocks) {
	int e_block_id = bs->rows[r].cells.front().block_id;
	if (e_block_id >= num_eliminate_blocks) {
	break;
	}
	std::vector<int> f_blocks;

	// Add to the chunk until the first block in the row is
	// different than the one in the first row for the chunk.
	for (; r < num_row_blocks; ++r) {
	const CompressedRow& row = bs->rows[r];
	if (row.cells.front().block_id != e_block_id) {
	break;
	}

	// Iterate over the blocks in the row, ignoring the first
	// block since it is the one to be eliminated.
	for (int c = 1; c < row.cells.size(); ++c) {
	const Cell& cell = row.cells[c];
	f_blocks.push_back(cell.block_id - num_eliminate_blocks);
	}
	}

	sort(f_blocks.begin(), f_blocks.end());
	f_blocks.erase(unique(f_blocks.begin(), f_blocks.end()), f_blocks.end());
	for (int i = 0; i < f_blocks.size(); ++i) {
	for (int j = i + 1; j < f_blocks.size(); ++j) {
	block_pairs.emplace(f_blocks[i], f_blocks[j]);
	}
	}
	}

	// Remaining rows do not contribute to the chunks and directly go
	// into the schur complement via an outer product.
	for (; r < num_row_blocks; ++r) {
	const CompressedRow& row = bs->rows[r];
	CHECK_GE(row.cells.front().block_id, num_eliminate_blocks);
	for (int i = 0; i < row.cells.size(); ++i) {
	int r_block1_id = row.cells[i].block_id - num_eliminate_blocks;
	for (const auto& cell : row.cells) {
	int r_block2_id = cell.block_id - num_eliminate_blocks;
	if (r_block1_id <= r_block2_id) {
	block_pairs.emplace(r_block1_id, r_block2_id);
	}
	}
	}
	}

	set_lhs(
	std::make_unique<BlockRandomAccessSparseMatrix>(blocks_, block_pairs));
	ResizeRhs(lhs()->num_rows());
	}

	LinearSolver::Summary SparseSchurComplementSolver::SolveReducedLinearSystem(
	const LinearSolver::PerSolveOptions& per_solve_options, double* solution) {
	if (options().type == ITERATIVE_SCHUR) {
	return SolveReducedLinearSystemUsingConjugateGradients(per_solve_options,
	solution);
	}

	LinearSolver::Summary summary;
	summary.num_iterations = 0;
	summary.termination_type = LinearSolverTerminationType::SUCCESS;
	summary.message = "Success.";

	const TripletSparseMatrix* tsm =
	down_cast<const BlockRandomAccessSparseMatrix*>(lhs())->matrix();
	if (tsm->num_rows() == 0) {
	return summary;
	}

	std::unique_ptr<CompressedRowSparseMatrix> lhs;
	const CompressedRowSparseMatrix::StorageType storage_type =
	sparse_cholesky_->StorageType();
	if (storage_type ==
	CompressedRowSparseMatrix::StorageType::UPPER_TRIANGULAR) {
	lhs = CompressedRowSparseMatrix::FromTripletSparseMatrix(*tsm);
	lhs->set_storage_type(
	CompressedRowSparseMatrix::StorageType::UPPER_TRIANGULAR);
	} else {
	lhs = CompressedRowSparseMatrix::FromTripletSparseMatrixTransposed(*tsm);
	lhs->set_storage_type(
	CompressedRowSparseMatrix::StorageType::LOWER_TRIANGULAR);
	}

	*lhs->mutable_col_blocks() = blocks_;
	*lhs->mutable_row_blocks() = blocks_;

	summary.num_iterations = 1;
	summary.termination_type = sparse_cholesky_->FactorAndSolve(
	lhs.get(), rhs().data(), solution, &summary.message);
	return summary;
	}

	LinearSolver::Summary
	SparseSchurComplementSolver::SolveReducedLinearSystemUsingConjugateGradients(
	const LinearSolver::PerSolveOptions& per_solve_options, double* solution) {
	CHECK(options().use_explicit_schur_complement);
	const int num_rows = lhs()->num_rows();
	// The case where there are no f blocks, and the system is block
	// diagonal.
	if (num_rows == 0) {
	LinearSolver::Summary summary;
	summary.num_iterations = 0;
	summary.termination_type = LinearSolverTerminationType::SUCCESS;
	summary.message = "Success.";
	return summary;
	}

	// Only SCHUR_JACOBI is supported over here right now.
	CHECK_EQ(options().preconditioner_type, SCHUR_JACOBI);

	if (preconditioner_ == nullptr) {
	preconditioner_ =
	std::make_unique<BlockRandomAccessDiagonalMatrix>(blocks_);
	}

	auto* sc = down_cast<BlockRandomAccessSparseMatrix*>(mutable_lhs());

	// Extract block diagonal from the Schur complement to construct the
	// schur_jacobi preconditioner.
	for (int i = 0; i < blocks_.size(); ++i) {
	const int block_size = blocks_[i].size;

	int sc_r, sc_c, sc_row_stride, sc_col_stride;
	CellInfo* sc_cell_info =
	sc->GetCell(i, i, &sc_r, &sc_c, &sc_row_stride, &sc_col_stride);
	CHECK(sc_cell_info != nullptr);
	MatrixRef sc_m(sc_cell_info->values, sc_row_stride, sc_col_stride);

	int pre_r, pre_c, pre_row_stride, pre_col_stride;
	CellInfo* pre_cell_info = preconditioner_->GetCell(
	i, i, &pre_r, &pre_c, &pre_row_stride, &pre_col_stride);
	CHECK(pre_cell_info != nullptr);
	MatrixRef pre_m(pre_cell_info->values, pre_row_stride, pre_col_stride);

	pre_m.block(pre_r, pre_c, block_size, block_size) =
	sc_m.block(sc_r, sc_c, block_size, block_size);
	}
	preconditioner_->Invert();

	VectorRef(solution, num_rows).setZero();

	auto lhs = std::make_unique<BlockRandomAccessSparseMatrixAdapter>(*sc);
	auto preconditioner =
	std::make_unique<BlockRandomAccessDiagonalMatrixAdapter>(
	*preconditioner_);

	ConjugateGradientsSolverOptions cg_options;
	cg_options.min_num_iterations = options().min_num_iterations;
	cg_options.max_num_iterations = options().max_num_iterations;
	cg_options.residual_reset_period = options().residual_reset_period;
	cg_options.q_tolerance = per_solve_options.q_tolerance;
	cg_options.r_tolerance = per_solve_options.r_tolerance;

	cg_solution_ = Vector::Zero(sc->num_rows());
	for (int i = 0; i < 4; ++i) {
	if (scratch_[i] == nullptr) {
	scratch_[i] = new Vector(sc->num_rows());
	}
	}
	auto summary = ConjugateGradientsSolver<Vector>(
	cg_options, lhs, rhs(), preconditioner, scratch_, cg_solution_);
	VectorRef(solution, sc->num_rows()) = cg_solution_;
	return summary;
	}

	} // namespace ceres::internal