internal/ceres/compressed_row_sparse_matrix.cc - ceres-solver - Git at Google

 // Ceres Solver - A fast non-linear least squares minimizer
 // Copyright 2010, 2011, 2012 Google Inc. All rights reserved.
 // http://code.google.com/p/ceres-solver/
 //
 // Redistribution and use in source and binary forms, with or without
 // modification, are permitted provided that the following conditions are met:
 //
 // * Redistributions of source code must retain the above copyright notice,
 //   this list of conditions and the following disclaimer.
 // * Redistributions in binary form must reproduce the above copyright notice,
 //   this list of conditions and the following disclaimer in the documentation
 //   and/or other materials provided with the distribution.
 // * Neither the name of Google Inc. nor the names of its contributors may be
 //   used to endorse or promote products derived from this software without
 //   specific prior written permission.
 //
 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 // AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 // ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 // LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 // CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 // SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 // INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 // CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 // ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 // POSSIBILITY OF SUCH DAMAGE.
 //
 // Author: sameeragarwal@google.com (Sameer Agarwal)

 #include "ceres/compressed_row_sparse_matrix.h"

 #include <algorithm>
 #include <numeric>
 #include <vector>
 #include "ceres/crs_matrix.h"
 #include "ceres/internal/port.h"
 #include "ceres/triplet_sparse_matrix.h"
 #include "glog/logging.h"

 namespace ceres {
 namespace internal {
 namespace {

 // Helper functor used by the constructor for reordering the contents
 // of a TripletSparseMatrix. This comparator assumes thay there are no
 // duplicates in the pair of arrays rows and cols, i.e., there is no
 // indices i and j (not equal to each other) s.t.
 //
 //  rows[i] == rows[j] && cols[i] == cols[j]
 //
 // If this is the case, this functor will not be a StrictWeakOrdering.
 struct RowColLessThan {
   RowColLessThan(const int* rows, const int* cols)
       : rows(rows), cols(cols) {
   }

   bool operator()(const int x, const int y) const {
     if (rows[x] == rows[y]) {
       return (cols[x] < cols[y]);
     }
     return (rows[x] < rows[y]);
   }

   const int* rows;
   const int* cols;
 };

 }  // namespace

 // This constructor gives you a semi-initialized CompressedRowSparseMatrix.
 CompressedRowSparseMatrix::CompressedRowSparseMatrix(int num_rows,
                                                      int num_cols,
                                                      int max_num_nonzeros) {
   num_rows_ = num_rows;
   num_cols_ = num_cols;
   rows_.resize(num_rows + 1, 0);
   cols_.resize(max_num_nonzeros, 0);
   values_.resize(max_num_nonzeros, 0.0);


   VLOG(1) << "# of rows: " << num_rows_
           << " # of columns: " << num_cols_
           << " max_num_nonzeros: " << cols_.size()
           << ". Allocating " << (num_rows_ + 1) * sizeof(int) +  // NOLINT
       cols_.size() * sizeof(int) +  // NOLINT
       cols_.size() * sizeof(double);  // NOLINT
 }

 CompressedRowSparseMatrix::CompressedRowSparseMatrix(
     const TripletSparseMatrix& m) {
   num_rows_ = m.num_rows();
   num_cols_ = m.num_cols();

   rows_.resize(num_rows_ + 1, 0);
   cols_.resize(m.num_nonzeros(), 0);
   values_.resize(m.max_num_nonzeros(), 0.0);

   // index is the list of indices into the TripletSparseMatrix m.
   vector<int> index(m.num_nonzeros(), 0);
   for (int i = 0; i < m.num_nonzeros(); ++i) {
     index[i] = i;
   }

   // Sort index such that the entries of m are ordered by row and ties
   // are broken by column.
   sort(index.begin(), index.end(), RowColLessThan(m.rows(), m.cols()));

   VLOG(1) << "# of rows: " << num_rows_
           << " # of columns: " << num_cols_
           << " max_num_nonzeros: " << cols_.size()
           << ". Allocating "
           << ((num_rows_ + 1) * sizeof(int) +  // NOLINT
               cols_.size() * sizeof(int) +     // NOLINT
               cols_.size() * sizeof(double));  // NOLINT

   // Copy the contents of the cols and values array in the order given
   // by index and count the number of entries in each row.
   for (int i = 0; i < m.num_nonzeros(); ++i) {
     const int idx = index[i];
     ++rows_[m.rows()[idx] + 1];
     cols_[i] = m.cols()[idx];
     values_[i] = m.values()[idx];
   }

   // Find the cumulative sum of the row counts.
   for (int i = 1; i < num_rows_ + 1; ++i) {
     rows_[i] += rows_[i - 1];
   }

   CHECK_EQ(num_nonzeros(), m.num_nonzeros());
 }

 CompressedRowSparseMatrix::CompressedRowSparseMatrix(const double* diagonal,
                                                      int num_rows) {
   CHECK_NOTNULL(diagonal);

   num_rows_ = num_rows;
   num_cols_ = num_rows;
   rows_.resize(num_rows + 1);
   cols_.resize(num_rows);
   values_.resize(num_rows);

   rows_[0] = 0;
   for (int i = 0; i < num_rows_; ++i) {
     cols_[i] = i;
     values_[i] = diagonal[i];
     rows_[i + 1] = i + 1;
   }

   CHECK_EQ(num_nonzeros(), num_rows);
 }

 CompressedRowSparseMatrix::~CompressedRowSparseMatrix() {
 }

 void CompressedRowSparseMatrix::SetZero() {
   fill(values_.begin(), values_.end(), 0);
 }

 void CompressedRowSparseMatrix::RightMultiply(const double* x,
                                               double* y) const {
   CHECK_NOTNULL(x);
   CHECK_NOTNULL(y);

   for (int r = 0; r < num_rows_; ++r) {
     for (int idx = rows_[r]; idx < rows_[r + 1]; ++idx) {
       y[r] += values_[idx] * x[cols_[idx]];
     }
   }
 }

 void CompressedRowSparseMatrix::LeftMultiply(const double* x, double* y) const {
   CHECK_NOTNULL(x);
   CHECK_NOTNULL(y);

   for (int r = 0; r < num_rows_; ++r) {
     for (int idx = rows_[r]; idx < rows_[r + 1]; ++idx) {
       y[cols_[idx]] += values_[idx] * x[r];
     }
   }
 }

 void CompressedRowSparseMatrix::SquaredColumnNorm(double* x) const {
   CHECK_NOTNULL(x);

   fill(x, x + num_cols_, 0.0);
   for (int idx = 0; idx < rows_[num_rows_]; ++idx) {
     x[cols_[idx]] += values_[idx] * values_[idx];
   }
 }

 void CompressedRowSparseMatrix::ScaleColumns(const double* scale) {
   CHECK_NOTNULL(scale);

   for (int idx = 0; idx < rows_[num_rows_]; ++idx) {
     values_[idx] *= scale[cols_[idx]];
   }
 }

 void CompressedRowSparseMatrix::ToDenseMatrix(Matrix* dense_matrix) const {
   CHECK_NOTNULL(dense_matrix);
   dense_matrix->resize(num_rows_, num_cols_);
   dense_matrix->setZero();

   for (int r = 0; r < num_rows_; ++r) {
     for (int idx = rows_[r]; idx < rows_[r + 1]; ++idx) {
       (*dense_matrix)(r, cols_[idx]) = values_[idx];
     }
   }
 }

 void CompressedRowSparseMatrix::DeleteRows(int delta_rows) {
   CHECK_GE(delta_rows, 0);
   CHECK_LE(delta_rows, num_rows_);

   num_rows_ -= delta_rows;
   rows_.resize(num_rows_ + 1);

   // Walk the list of row blocks until we reach the new number of rows
   // and the drop the rest of the row blocks.
   int num_row_blocks = 0;
   int num_rows = 0;
   while (num_row_blocks < row_blocks_.size() && num_rows < num_rows_) {
     num_rows += row_blocks_[num_row_blocks];
     ++num_row_blocks;
   }

   row_blocks_.resize(num_row_blocks);
 }

 void CompressedRowSparseMatrix::AppendRows(const CompressedRowSparseMatrix& m) {
   CHECK_EQ(m.num_cols(), num_cols_);

   CHECK(row_blocks_.size() == 0 || m.row_blocks().size() !=0)
       << "Cannot append a matrix with row blocks to one without and vice versa."
       << "This matrix has : " << row_blocks_.size() << " row blocks."
       << "The matrix being appended has: " << m.row_blocks().size()
       << " row blocks.";

   if (cols_.size() < num_nonzeros() + m.num_nonzeros()) {
     cols_.resize(num_nonzeros() + m.num_nonzeros());
     values_.resize(num_nonzeros() + m.num_nonzeros());
   }

   // Copy the contents of m into this matrix.
   copy(m.cols(), m.cols() + m.num_nonzeros(), &cols_[num_nonzeros()]);
   copy(m.values(), m.values() + m.num_nonzeros(), &values_[num_nonzeros()]);
   rows_.resize(num_rows_ + m.num_rows() + 1);
   // new_rows = [rows_, m.row() + rows_[num_rows_]]
   fill(rows_.begin() + num_rows_,
        rows_.begin() + num_rows_ + m.num_rows() + 1,
        rows_[num_rows_]);

   for (int r = 0; r < m.num_rows() + 1; ++r) {
     rows_[num_rows_ + r] += m.rows()[r];
   }

   num_rows_ += m.num_rows();
   row_blocks_.insert(row_blocks_.end(), m.row_blocks().begin(), m.row_blocks().end());
 }

 void CompressedRowSparseMatrix::ToTextFile(FILE* file) const {
   CHECK_NOTNULL(file);
   for (int r = 0; r < num_rows_; ++r) {
     for (int idx = rows_[r]; idx < rows_[r + 1]; ++idx) {
       fprintf(file,
               "% 10d % 10d %17f\n",
               r,
               cols_[idx],
               values_[idx]);
     }
   }
 }

 void CompressedRowSparseMatrix::ToCRSMatrix(CRSMatrix* matrix) const {
   matrix->num_rows = num_rows_;
   matrix->num_cols = num_cols_;
   matrix->rows = rows_;
   matrix->cols = cols_;
   matrix->values = values_;

   // Trim.
   matrix->rows.resize(matrix->num_rows + 1);
   matrix->cols.resize(matrix->rows[matrix->num_rows]);
   matrix->values.resize(matrix->rows[matrix->num_rows]);
 }

 void CompressedRowSparseMatrix::SetMaxNumNonZeros(int num_nonzeros) {
   CHECK_GE(num_nonzeros, 0);

   cols_.resize(num_nonzeros);
   values_.resize(num_nonzeros);
 }

 void CompressedRowSparseMatrix::SolveLowerTriangularInPlace(
     double* solution) const {
   for (int r = 0; r < num_rows_; ++r) {
     for (int idx = rows_[r]; idx < rows_[r + 1] - 1; ++idx) {
       solution[r] -= values_[idx] * solution[cols_[idx]];
     }
     solution[r] /=  values_[rows_[r + 1] - 1];
   }
 }

 void CompressedRowSparseMatrix::SolveLowerTriangularTransposeInPlace(
     double* solution) const {
   for (int r = num_rows_ - 1; r >= 0; --r) {
     solution[r] /= values_[rows_[r + 1] - 1];
     for (int idx = rows_[r + 1] - 2; idx >= rows_[r]; --idx) {
       solution[cols_[idx]] -= values_[idx] * solution[r];
     }
   }
 }

 CompressedRowSparseMatrix* CompressedRowSparseMatrix::CreateBlockDiagonalMatrix(
     const double* diagonal,
     const vector<int>& blocks) {
   int num_rows = 0;
   int num_nonzeros = 0;
   for (int i = 0; i < blocks.size(); ++i) {
     num_rows += blocks[i];
     num_nonzeros += blocks[i] * blocks[i];
   }

   CompressedRowSparseMatrix* matrix =
       new CompressedRowSparseMatrix(num_rows, num_rows, num_nonzeros);

   int* rows = matrix->mutable_rows();
   int* cols = matrix->mutable_cols();
   double* values = matrix->mutable_values();
   fill(values, values + num_nonzeros, 0.0);

   int idx_cursor = 0;
   int col_cursor = 0;
   for (int i = 0; i < blocks.size(); ++i) {
     const int block_size = blocks[i];
     for (int r = 0; r < block_size; ++r) {
       *(rows++) = idx_cursor;
       values[idx_cursor + r] = diagonal[col_cursor + r];
       for (int c = 0; c < block_size; ++c, ++idx_cursor) {
         *(cols++) = col_cursor + c;
       }
     }
     col_cursor += block_size;
   }
   *rows = idx_cursor;

   *matrix->mutable_row_blocks() = blocks;
   *matrix->mutable_col_blocks() = blocks;

   CHECK_EQ(idx_cursor, num_nonzeros);
   CHECK_EQ(col_cursor, num_rows);
   return matrix;
 }

 CompressedRowSparseMatrix* CompressedRowSparseMatrix::Transpose() const {
   CompressedRowSparseMatrix* transpose =
       new CompressedRowSparseMatrix(num_cols_, num_rows_, num_nonzeros());

   int* transpose_rows = transpose->mutable_rows();
   int* transpose_cols = transpose->mutable_cols();
   double* transpose_values = transpose->mutable_values();

   for (int idx = 0; idx < num_nonzeros(); ++idx) {
     ++transpose_rows[cols_[idx] + 1];
   }

   for (int i = 1; i < transpose->num_rows() + 1; ++i) {
     transpose_rows[i] += transpose_rows[i - 1];
   }

   for (int r = 0; r < num_rows(); ++r) {
     for (int idx = rows_[r]; idx < rows_[r + 1]; ++idx) {
       const int c = cols_[idx];
       const int transpose_idx = transpose_rows[c]++;
       transpose_cols[transpose_idx] = r;
       transpose_values[transpose_idx] = values_[idx];
     }
   }

   for (int i = transpose->num_rows() - 1; i > 0 ; --i) {
     transpose_rows[i] = transpose_rows[i - 1];
   }
   transpose_rows[0] = 0;

   *(transpose->mutable_row_blocks()) = col_blocks_;
   *(transpose->mutable_col_blocks()) = row_blocks_;

   return transpose;
 }

 namespace {
 // A ProductTerm is a term in the outer product of a matrix with
 // itself.
 struct ProductTerm {
   ProductTerm(const int row, const int col, const int index)
       : row(row), col(col), index(index) {
   }

   bool operator<(const ProductTerm& right) const {
     if (row == right.row) {
       if (col == right.col) {
         return index < right.index;
       }
       return col < right.col;
     }
     return row < right.row;
   }

   int row;
   int col;
   int index;
 };

 CompressedRowSparseMatrix*
 CompressAndFillProgram(const int num_rows,
                        const int num_cols,
                        const vector<ProductTerm>& product,
                        vector<int>* program) {
   CHECK_GT(product.size(), 0);

   // Count the number of unique product term, which in turn is the
   // number of non-zeros in the outer product.
   int num_nonzeros = 1;
   for (int i = 1; i < product.size(); ++i) {
     if (product[i].row != product[i - 1].row ||
         product[i].col != product[i - 1].col) {
       ++num_nonzeros;
     }
   }

   CompressedRowSparseMatrix* matrix =
       new CompressedRowSparseMatrix(num_rows, num_cols, num_nonzeros);

   int* crsm_rows = matrix->mutable_rows();
   std::fill(crsm_rows, crsm_rows + num_rows + 1, 0);
   int* crsm_cols = matrix->mutable_cols();
   std::fill(crsm_cols, crsm_cols + num_nonzeros, 0);

   CHECK_NOTNULL(program)->clear();
   program->resize(product.size());

   // Iterate over the sorted product terms. This means each row is
   // filled one at a time, and we are able to assign a position in the
   // values array to each term.
   //
   // If terms repeat, i.e., they contribute to the same entry in the
   // result matrix), then they do not affect the sparsity structure of
   // the result matrix.
   int nnz = 0;
   crsm_cols[0] = product[0].col;
   crsm_rows[product[0].row + 1]++;
   (*program)[product[0].index] = nnz;
   for (int i = 1; i < product.size(); ++i) {
     const ProductTerm& previous = product[i - 1];
     const ProductTerm& current = product[i];

     // Sparsity structure is updated only if the term is not a repeat.
     if (previous.row != current.row || previous.col != current.col) {
       crsm_cols[++nnz] = current.col;
       crsm_rows[current.row + 1]++;
     }

     // All terms get assigned the position in the values array where
     // their value is accumulated.
     (*program)[current.index] = nnz;
   }

   for (int i = 1; i < num_rows + 1; ++i) {
     crsm_rows[i] += crsm_rows[i - 1];
   }

   return matrix;
 }

 }  // namespace

 CompressedRowSparseMatrix*
 CompressedRowSparseMatrix::CreateOuterProductMatrixAndProgram(
       const CompressedRowSparseMatrix& m,
       vector<int>* program) {
   CHECK_NOTNULL(program)->clear();
   CHECK_GT(m.num_nonzeros(), 0) << "Congratulations, "
                                 << "you found a bug in Ceres. Please report it.";

   vector<ProductTerm> product;
   const vector<int>& row_blocks = m.row_blocks();
   int row_block_begin = 0;
   // Iterate over row blocks
   for (int row_block = 0; row_block < row_blocks.size(); ++row_block) {
     const int row_block_end = row_block_begin + row_blocks[row_block];
     // Compute the outer product terms for just one row per row block.
     const int r = row_block_begin;
     // Compute the lower triangular part of the product.
     for (int idx1 = m.rows()[r]; idx1 < m.rows()[r + 1]; ++idx1) {
       for (int idx2 = m.rows()[r]; idx2 <= idx1; ++idx2) {
         product.push_back(ProductTerm(m.cols()[idx1], m.cols()[idx2], product.size()));
       }
     }
     row_block_begin = row_block_end;
   }
   CHECK_EQ(row_block_begin, m.num_rows());
   sort(product.begin(), product.end());
   return CompressAndFillProgram(m.num_cols(), m.num_cols(), product, program);
 }

 void CompressedRowSparseMatrix::ComputeOuterProduct(
     const CompressedRowSparseMatrix& m,
     const vector<int>& program,
     CompressedRowSparseMatrix* result) {
   result->SetZero();
   double* values = result->mutable_values();
   const vector<int>& row_blocks = m.row_blocks();

   int cursor = 0;
   int row_block_begin = 0;
   const double* m_values = m.values();
   const int* m_rows = m.rows();
   // Iterate over row blocks.
   for (int row_block = 0; row_block < row_blocks.size(); ++row_block) {
     const int row_block_end = row_block_begin + row_blocks[row_block];
     const int saved_cursor = cursor;
     for (int r = row_block_begin; r < row_block_end; ++r) {
       // Reuse the program segment for each row in this row block.
       cursor = saved_cursor;
       const int row_begin = m_rows[r];
       const int row_end = m_rows[r + 1];
       for (int idx1 = row_begin; idx1 < row_end; ++idx1) {
         const double v1 =  m_values[idx1];
         for (int idx2 = row_begin; idx2 <= idx1; ++idx2, ++cursor) {
           values[program[cursor]] += v1 * m_values[idx2];
         }
       }
     }
     row_block_begin = row_block_end;
   }

   CHECK_EQ(row_block_begin, m.num_rows());
   CHECK_EQ(cursor, program.size());
 }

 }  // namespace internal
 }  // namespace ceres
	// Ceres Solver - A fast non-linear least squares minimizer
	// Copyright 2010, 2011, 2012 Google Inc. All rights reserved.
	// http://code.google.com/p/ceres-solver/
	//
	// Redistribution and use in source and binary forms, with or without
	// modification, are permitted provided that the following conditions are met:
	//
	// * Redistributions of source code must retain the above copyright notice,
	// this list of conditions and the following disclaimer.
	// * Redistributions in binary form must reproduce the above copyright notice,
	// this list of conditions and the following disclaimer in the documentation
	// and/or other materials provided with the distribution.
	// * Neither the name of Google Inc. nor the names of its contributors may be
	// used to endorse or promote products derived from this software without
	// specific prior written permission.
	//
	// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
	// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
	// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
	// ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
	// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
	// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
	// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
	// INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
	// CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
	// ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
	// POSSIBILITY OF SUCH DAMAGE.
	//
	// Author: sameeragarwal@google.com (Sameer Agarwal)

	#include "ceres/compressed_row_sparse_matrix.h"

	#include <algorithm>
	#include <numeric>
	#include <vector>
	#include "ceres/crs_matrix.h"
	#include "ceres/internal/port.h"
	#include "ceres/triplet_sparse_matrix.h"
	#include "glog/logging.h"

	namespace ceres {
	namespace internal {
	namespace {

	// Helper functor used by the constructor for reordering the contents
	// of a TripletSparseMatrix. This comparator assumes thay there are no
	// duplicates in the pair of arrays rows and cols, i.e., there is no
	// indices i and j (not equal to each other) s.t.
	//
	// rows[i] == rows[j] && cols[i] == cols[j]
	//
	// If this is the case, this functor will not be a StrictWeakOrdering.
	struct RowColLessThan {
	RowColLessThan(const int* rows, const int* cols)
	: rows(rows), cols(cols) {
	}

	bool operator()(const int x, const int y) const {
	if (rows[x] == rows[y]) {
	return (cols[x] < cols[y]);
	}
	return (rows[x] < rows[y]);
	}

	const int* rows;
	const int* cols;
	};

	} // namespace

	// This constructor gives you a semi-initialized CompressedRowSparseMatrix.
	CompressedRowSparseMatrix::CompressedRowSparseMatrix(int num_rows,
	int num_cols,
	int max_num_nonzeros) {
	num_rows_ = num_rows;
	num_cols_ = num_cols;
	rows_.resize(num_rows + 1, 0);
	cols_.resize(max_num_nonzeros, 0);
	values_.resize(max_num_nonzeros, 0.0);


	VLOG(1) << "# of rows: " << num_rows_
	<< " # of columns: " << num_cols_
	<< " max_num_nonzeros: " << cols_.size()
	<< ". Allocating " << (num_rows_ + 1) * sizeof(int) + // NOLINT
	cols_.size() * sizeof(int) + // NOLINT
	cols_.size() * sizeof(double); // NOLINT
	}

	CompressedRowSparseMatrix::CompressedRowSparseMatrix(
	const TripletSparseMatrix& m) {
	num_rows_ = m.num_rows();
	num_cols_ = m.num_cols();

	rows_.resize(num_rows_ + 1, 0);
	cols_.resize(m.num_nonzeros(), 0);
	values_.resize(m.max_num_nonzeros(), 0.0);

	// index is the list of indices into the TripletSparseMatrix m.
	vector<int> index(m.num_nonzeros(), 0);
	for (int i = 0; i < m.num_nonzeros(); ++i) {
	index[i] = i;
	}

	// Sort index such that the entries of m are ordered by row and ties
	// are broken by column.
	sort(index.begin(), index.end(), RowColLessThan(m.rows(), m.cols()));

	VLOG(1) << "# of rows: " << num_rows_
	<< " # of columns: " << num_cols_
	<< " max_num_nonzeros: " << cols_.size()
	<< ". Allocating "
	<< ((num_rows_ + 1) * sizeof(int) + // NOLINT
	cols_.size() * sizeof(int) + // NOLINT
	cols_.size() * sizeof(double)); // NOLINT

	// Copy the contents of the cols and values array in the order given
	// by index and count the number of entries in each row.
	for (int i = 0; i < m.num_nonzeros(); ++i) {
	const int idx = index[i];
	++rows_[m.rows()[idx] + 1];
	cols_[i] = m.cols()[idx];
	values_[i] = m.values()[idx];
	}

	// Find the cumulative sum of the row counts.
	for (int i = 1; i < num_rows_ + 1; ++i) {
	rows_[i] += rows_[i - 1];
	}

	CHECK_EQ(num_nonzeros(), m.num_nonzeros());
	}

	CompressedRowSparseMatrix::CompressedRowSparseMatrix(const double* diagonal,
	int num_rows) {
	CHECK_NOTNULL(diagonal);

	num_rows_ = num_rows;
	num_cols_ = num_rows;
	rows_.resize(num_rows + 1);
	cols_.resize(num_rows);
	values_.resize(num_rows);

	rows_[0] = 0;
	for (int i = 0; i < num_rows_; ++i) {
	cols_[i] = i;
	values_[i] = diagonal[i];
	rows_[i + 1] = i + 1;
	}

	CHECK_EQ(num_nonzeros(), num_rows);
	}

	CompressedRowSparseMatrix::~CompressedRowSparseMatrix() {
	}

	void CompressedRowSparseMatrix::SetZero() {
	fill(values_.begin(), values_.end(), 0);
	}

	void CompressedRowSparseMatrix::RightMultiply(const double* x,
	double* y) const {
	CHECK_NOTNULL(x);
	CHECK_NOTNULL(y);

	for (int r = 0; r < num_rows_; ++r) {
	for (int idx = rows_[r]; idx < rows_[r + 1]; ++idx) {
	y[r] += values_[idx] * x[cols_[idx]];
	}
	}
	}

	void CompressedRowSparseMatrix::LeftMultiply(const double* x, double* y) const {
	CHECK_NOTNULL(x);
	CHECK_NOTNULL(y);

	for (int r = 0; r < num_rows_; ++r) {
	for (int idx = rows_[r]; idx < rows_[r + 1]; ++idx) {
	y[cols_[idx]] += values_[idx] * x[r];
	}
	}
	}

	void CompressedRowSparseMatrix::SquaredColumnNorm(double* x) const {
	CHECK_NOTNULL(x);

	fill(x, x + num_cols_, 0.0);
	for (int idx = 0; idx < rows_[num_rows_]; ++idx) {
	x[cols_[idx]] += values_[idx] * values_[idx];
	}
	}

	void CompressedRowSparseMatrix::ScaleColumns(const double* scale) {
	CHECK_NOTNULL(scale);

	for (int idx = 0; idx < rows_[num_rows_]; ++idx) {
	values_[idx] *= scale[cols_[idx]];
	}
	}

	void CompressedRowSparseMatrix::ToDenseMatrix(Matrix* dense_matrix) const {
	CHECK_NOTNULL(dense_matrix);
	dense_matrix->resize(num_rows_, num_cols_);
	dense_matrix->setZero();

	for (int r = 0; r < num_rows_; ++r) {
	for (int idx = rows_[r]; idx < rows_[r + 1]; ++idx) {
	(*dense_matrix)(r, cols_[idx]) = values_[idx];
	}
	}
	}

	void CompressedRowSparseMatrix::DeleteRows(int delta_rows) {
	CHECK_GE(delta_rows, 0);
	CHECK_LE(delta_rows, num_rows_);

	num_rows_ -= delta_rows;
	rows_.resize(num_rows_ + 1);

	// Walk the list of row blocks until we reach the new number of rows
	// and the drop the rest of the row blocks.
	int num_row_blocks = 0;
	int num_rows = 0;
	while (num_row_blocks < row_blocks_.size() && num_rows < num_rows_) {
	num_rows += row_blocks_[num_row_blocks];
	++num_row_blocks;
	}

	row_blocks_.resize(num_row_blocks);
	}

	void CompressedRowSparseMatrix::AppendRows(const CompressedRowSparseMatrix& m) {
	CHECK_EQ(m.num_cols(), num_cols_);

	CHECK(row_blocks_.size() == 0 \|\| m.row_blocks().size() !=0)
	<< "Cannot append a matrix with row blocks to one without and vice versa."
	<< "This matrix has : " << row_blocks_.size() << " row blocks."
	<< "The matrix being appended has: " << m.row_blocks().size()
	<< " row blocks.";

	if (cols_.size() < num_nonzeros() + m.num_nonzeros()) {
	cols_.resize(num_nonzeros() + m.num_nonzeros());
	values_.resize(num_nonzeros() + m.num_nonzeros());
	}

	// Copy the contents of m into this matrix.
	copy(m.cols(), m.cols() + m.num_nonzeros(), &cols_[num_nonzeros()]);
	copy(m.values(), m.values() + m.num_nonzeros(), &values_[num_nonzeros()]);
	rows_.resize(num_rows_ + m.num_rows() + 1);
	// new_rows = [rows_, m.row() + rows_[num_rows_]]
	fill(rows_.begin() + num_rows_,
	rows_.begin() + num_rows_ + m.num_rows() + 1,
	rows_[num_rows_]);

	for (int r = 0; r < m.num_rows() + 1; ++r) {
	rows_[num_rows_ + r] += m.rows()[r];
	}

	num_rows_ += m.num_rows();
	row_blocks_.insert(row_blocks_.end(), m.row_blocks().begin(), m.row_blocks().end());
	}

	void CompressedRowSparseMatrix::ToTextFile(FILE* file) const {
	CHECK_NOTNULL(file);
	for (int r = 0; r < num_rows_; ++r) {
	for (int idx = rows_[r]; idx < rows_[r + 1]; ++idx) {
	fprintf(file,
	"% 10d % 10d %17f\n",
	r,
	cols_[idx],
	values_[idx]);
	}
	}
	}

	void CompressedRowSparseMatrix::ToCRSMatrix(CRSMatrix* matrix) const {
	matrix->num_rows = num_rows_;
	matrix->num_cols = num_cols_;
	matrix->rows = rows_;
	matrix->cols = cols_;
	matrix->values = values_;

	// Trim.
	matrix->rows.resize(matrix->num_rows + 1);
	matrix->cols.resize(matrix->rows[matrix->num_rows]);
	matrix->values.resize(matrix->rows[matrix->num_rows]);
	}

	void CompressedRowSparseMatrix::SetMaxNumNonZeros(int num_nonzeros) {
	CHECK_GE(num_nonzeros, 0);

	cols_.resize(num_nonzeros);
	values_.resize(num_nonzeros);
	}

	void CompressedRowSparseMatrix::SolveLowerTriangularInPlace(
	double* solution) const {
	for (int r = 0; r < num_rows_; ++r) {
	for (int idx = rows_[r]; idx < rows_[r + 1] - 1; ++idx) {
	solution[r] -= values_[idx] * solution[cols_[idx]];
	}
	solution[r] /= values_[rows_[r + 1] - 1];
	}
	}

	void CompressedRowSparseMatrix::SolveLowerTriangularTransposeInPlace(
	double* solution) const {
	for (int r = num_rows_ - 1; r >= 0; --r) {
	solution[r] /= values_[rows_[r + 1] - 1];
	for (int idx = rows_[r + 1] - 2; idx >= rows_[r]; --idx) {
	solution[cols_[idx]] -= values_[idx] * solution[r];
	}
	}
	}

	CompressedRowSparseMatrix* CompressedRowSparseMatrix::CreateBlockDiagonalMatrix(
	const double* diagonal,
	const vector<int>& blocks) {
	int num_rows = 0;
	int num_nonzeros = 0;
	for (int i = 0; i < blocks.size(); ++i) {
	num_rows += blocks[i];
	num_nonzeros += blocks[i] * blocks[i];
	}

	CompressedRowSparseMatrix* matrix =
	new CompressedRowSparseMatrix(num_rows, num_rows, num_nonzeros);

	int* rows = matrix->mutable_rows();
	int* cols = matrix->mutable_cols();
	double* values = matrix->mutable_values();
	fill(values, values + num_nonzeros, 0.0);

	int idx_cursor = 0;
	int col_cursor = 0;
	for (int i = 0; i < blocks.size(); ++i) {
	const int block_size = blocks[i];
	for (int r = 0; r < block_size; ++r) {
	*(rows++) = idx_cursor;
	values[idx_cursor + r] = diagonal[col_cursor + r];
	for (int c = 0; c < block_size; ++c, ++idx_cursor) {
	*(cols++) = col_cursor + c;
	}
	}
	col_cursor += block_size;
	}
	*rows = idx_cursor;

	*matrix->mutable_row_blocks() = blocks;
	*matrix->mutable_col_blocks() = blocks;

	CHECK_EQ(idx_cursor, num_nonzeros);
	CHECK_EQ(col_cursor, num_rows);
	return matrix;
	}

	CompressedRowSparseMatrix* CompressedRowSparseMatrix::Transpose() const {
	CompressedRowSparseMatrix* transpose =
	new CompressedRowSparseMatrix(num_cols_, num_rows_, num_nonzeros());

	int* transpose_rows = transpose->mutable_rows();
	int* transpose_cols = transpose->mutable_cols();
	double* transpose_values = transpose->mutable_values();

	for (int idx = 0; idx < num_nonzeros(); ++idx) {
	++transpose_rows[cols_[idx] + 1];
	}

	for (int i = 1; i < transpose->num_rows() + 1; ++i) {
	transpose_rows[i] += transpose_rows[i - 1];
	}

	for (int r = 0; r < num_rows(); ++r) {
	for (int idx = rows_[r]; idx < rows_[r + 1]; ++idx) {
	const int c = cols_[idx];
	const int transpose_idx = transpose_rows[c]++;
	transpose_cols[transpose_idx] = r;
	transpose_values[transpose_idx] = values_[idx];
	}
	}

	for (int i = transpose->num_rows() - 1; i > 0 ; --i) {
	transpose_rows[i] = transpose_rows[i - 1];
	}
	transpose_rows[0] = 0;

	*(transpose->mutable_row_blocks()) = col_blocks_;
	*(transpose->mutable_col_blocks()) = row_blocks_;

	return transpose;
	}

	namespace {
	// A ProductTerm is a term in the outer product of a matrix with
	// itself.
	struct ProductTerm {
	ProductTerm(const int row, const int col, const int index)
	: row(row), col(col), index(index) {
	}

	bool operator<(const ProductTerm& right) const {
	if (row == right.row) {
	if (col == right.col) {
	return index < right.index;
	}
	return col < right.col;
	}
	return row < right.row;
	}

	int row;
	int col;
	int index;
	};

	CompressedRowSparseMatrix*
	CompressAndFillProgram(const int num_rows,
	const int num_cols,
	const vector<ProductTerm>& product,
	vector<int>* program) {
	CHECK_GT(product.size(), 0);

	// Count the number of unique product term, which in turn is the
	// number of non-zeros in the outer product.
	int num_nonzeros = 1;
	for (int i = 1; i < product.size(); ++i) {
	if (product[i].row != product[i - 1].row \|\|
	product[i].col != product[i - 1].col) {
	++num_nonzeros;
	}
	}

	CompressedRowSparseMatrix* matrix =
	new CompressedRowSparseMatrix(num_rows, num_cols, num_nonzeros);

	int* crsm_rows = matrix->mutable_rows();
	std::fill(crsm_rows, crsm_rows + num_rows + 1, 0);
	int* crsm_cols = matrix->mutable_cols();
	std::fill(crsm_cols, crsm_cols + num_nonzeros, 0);

	CHECK_NOTNULL(program)->clear();
	program->resize(product.size());

	// Iterate over the sorted product terms. This means each row is
	// filled one at a time, and we are able to assign a position in the
	// values array to each term.
	//
	// If terms repeat, i.e., they contribute to the same entry in the
	// result matrix), then they do not affect the sparsity structure of
	// the result matrix.
	int nnz = 0;
	crsm_cols[0] = product[0].col;
	crsm_rows[product[0].row + 1]++;
	(*program)[product[0].index] = nnz;
	for (int i = 1; i < product.size(); ++i) {
	const ProductTerm& previous = product[i - 1];
	const ProductTerm& current = product[i];

	// Sparsity structure is updated only if the term is not a repeat.
	if (previous.row != current.row \|\| previous.col != current.col) {
	crsm_cols[++nnz] = current.col;
	crsm_rows[current.row + 1]++;
	}

	// All terms get assigned the position in the values array where
	// their value is accumulated.
	(*program)[current.index] = nnz;
	}

	for (int i = 1; i < num_rows + 1; ++i) {
	crsm_rows[i] += crsm_rows[i - 1];
	}

	return matrix;
	}

	} // namespace

	CompressedRowSparseMatrix*
	CompressedRowSparseMatrix::CreateOuterProductMatrixAndProgram(
	const CompressedRowSparseMatrix& m,
	vector<int>* program) {
	CHECK_NOTNULL(program)->clear();
	CHECK_GT(m.num_nonzeros(), 0) << "Congratulations, "
	<< "you found a bug in Ceres. Please report it.";

	vector<ProductTerm> product;
	const vector<int>& row_blocks = m.row_blocks();
	int row_block_begin = 0;
	// Iterate over row blocks
	for (int row_block = 0; row_block < row_blocks.size(); ++row_block) {
	const int row_block_end = row_block_begin + row_blocks[row_block];
	// Compute the outer product terms for just one row per row block.
	const int r = row_block_begin;
	// Compute the lower triangular part of the product.
	for (int idx1 = m.rows()[r]; idx1 < m.rows()[r + 1]; ++idx1) {
	for (int idx2 = m.rows()[r]; idx2 <= idx1; ++idx2) {
	product.push_back(ProductTerm(m.cols()[idx1], m.cols()[idx2], product.size()));
	}
	}
	row_block_begin = row_block_end;
	}
	CHECK_EQ(row_block_begin, m.num_rows());
	sort(product.begin(), product.end());
	return CompressAndFillProgram(m.num_cols(), m.num_cols(), product, program);
	}

	void CompressedRowSparseMatrix::ComputeOuterProduct(
	const CompressedRowSparseMatrix& m,
	const vector<int>& program,
	CompressedRowSparseMatrix* result) {
	result->SetZero();
	double* values = result->mutable_values();
	const vector<int>& row_blocks = m.row_blocks();

	int cursor = 0;
	int row_block_begin = 0;
	const double* m_values = m.values();
	const int* m_rows = m.rows();
	// Iterate over row blocks.
	for (int row_block = 0; row_block < row_blocks.size(); ++row_block) {
	const int row_block_end = row_block_begin + row_blocks[row_block];
	const int saved_cursor = cursor;
	for (int r = row_block_begin; r < row_block_end; ++r) {
	// Reuse the program segment for each row in this row block.
	cursor = saved_cursor;
	const int row_begin = m_rows[r];
	const int row_end = m_rows[r + 1];
	for (int idx1 = row_begin; idx1 < row_end; ++idx1) {
	const double v1 = m_values[idx1];
	for (int idx2 = row_begin; idx2 <= idx1; ++idx2, ++cursor) {
	values[program[cursor]] += v1 * m_values[idx2];
	}
	}
	}
	row_block_begin = row_block_end;
	}

	CHECK_EQ(row_block_begin, m.num_rows());
	CHECK_EQ(cursor, program.size());
	}

	} // namespace internal
	} // namespace ceres