|  | // Ceres Solver - A fast non-linear least squares minimizer | 
|  | // Copyright 2023 Google Inc. All rights reserved. | 
|  | // http://ceres-solver.org/ | 
|  | // | 
|  | // Redistribution and use in source and binary forms, with or without | 
|  | // modification, are permitted provided that the following conditions are met: | 
|  | // | 
|  | // * Redistributions of source code must retain the above copyright notice, | 
|  | //   this list of conditions and the following disclaimer. | 
|  | // * Redistributions in binary form must reproduce the above copyright notice, | 
|  | //   this list of conditions and the following disclaimer in the documentation | 
|  | //   and/or other materials provided with the distribution. | 
|  | // * Neither the name of Google Inc. nor the names of its contributors may be | 
|  | //   used to endorse or promote products derived from this software without | 
|  | //   specific prior written permission. | 
|  | // | 
|  | // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | 
|  | // AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | 
|  | // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | 
|  | // ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE | 
|  | // LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR | 
|  | // CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF | 
|  | // SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS | 
|  | // INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN | 
|  | // CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) | 
|  | // ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE | 
|  | // POSSIBILITY OF SUCH DAMAGE. | 
|  | // | 
|  | // Author: joydeepb@cs.utexas.edu (Joydeep Biswas) | 
|  |  | 
#include "ceres/cuda_vector.h"

#include <cmath>
#include <limits>
#include <string>
#include <utility>

#include "ceres/internal/config.h"
#include "ceres/internal/eigen.h"
#include "glog/logging.h"
#include "gtest/gtest.h"
|  |  | 
|  | namespace ceres { | 
|  | namespace internal { | 
|  |  | 
|  | #ifndef CERES_NO_CUDA | 
|  |  | 
|  | TEST(CudaVector, Creation) { | 
|  | ContextImpl context; | 
|  | std::string message; | 
|  | CHECK(context.InitCuda(&message)) << "InitCuda() failed because: " << message; | 
|  | CudaVector x(&context, 1000); | 
|  | EXPECT_EQ(x.num_rows(), 1000); | 
|  | EXPECT_NE(x.data(), nullptr); | 
|  | } | 
|  |  | 
|  | TEST(CudaVector, CopyVector) { | 
|  | Vector x(3); | 
|  | x << 1, 2, 3; | 
|  | ContextImpl context; | 
|  | std::string message; | 
|  | CHECK(context.InitCuda(&message)) << "InitCuda() failed because: " << message; | 
|  | CudaVector y(&context, 10); | 
|  | y.CopyFromCpu(x); | 
|  | EXPECT_EQ(y.num_rows(), 3); | 
|  |  | 
|  | Vector z(3); | 
|  | z << 0, 0, 0; | 
|  | y.CopyTo(&z); | 
|  | EXPECT_EQ(x, z); | 
|  | } | 
|  |  | 
|  | TEST(CudaVector, Move) { | 
|  | ContextImpl context; | 
|  | std::string message; | 
|  | CHECK(context.InitCuda(&message)) << "InitCuda() failed because: " << message; | 
|  | CudaVector y(&context, 10); | 
|  | const auto y_data = y.data(); | 
|  | const auto y_descr = y.descr(); | 
|  | EXPECT_EQ(y.num_rows(), 10); | 
|  | CudaVector z(std::move(y)); | 
|  | EXPECT_EQ(y.data(), nullptr); | 
|  | EXPECT_EQ(y.descr(), nullptr); | 
|  | EXPECT_EQ(y.num_rows(), 0); | 
|  |  | 
|  | EXPECT_EQ(z.data(), y_data); | 
|  | EXPECT_EQ(z.descr(), y_descr); | 
|  | } | 
|  |  | 
|  | TEST(CudaVector, DeepCopy) { | 
|  | Vector x(3); | 
|  | x << 1, 2, 3; | 
|  | ContextImpl context; | 
|  | std::string message; | 
|  | CHECK(context.InitCuda(&message)) << "InitCuda() failed because: " << message; | 
|  | CudaVector x_gpu(&context, 3); | 
|  | x_gpu.CopyFromCpu(x); | 
|  |  | 
|  | CudaVector y_gpu(&context, 3); | 
|  | y_gpu.SetZero(); | 
|  | EXPECT_EQ(y_gpu.Norm(), 0.0); | 
|  |  | 
|  | y_gpu = x_gpu; | 
|  | Vector y(3); | 
|  | y << 0, 0, 0; | 
|  | y_gpu.CopyTo(&y); | 
|  | EXPECT_EQ(x, y); | 
|  | } | 
|  |  | 
|  | TEST(CudaVector, Dot) { | 
|  | Vector x(3); | 
|  | Vector y(3); | 
|  | x << 1, 2, 3; | 
|  | y << 100, 10, 1; | 
|  | ContextImpl context; | 
|  | std::string message; | 
|  | CHECK(context.InitCuda(&message)) << "InitCuda() failed because: " << message; | 
|  | CudaVector x_gpu(&context, 10); | 
|  | CudaVector y_gpu(&context, 10); | 
|  | x_gpu.CopyFromCpu(x); | 
|  | y_gpu.CopyFromCpu(y); | 
|  |  | 
|  | EXPECT_EQ(x_gpu.Dot(y_gpu), 123.0); | 
|  | EXPECT_EQ(Dot(x_gpu, y_gpu), 123.0); | 
|  | } | 
|  |  | 
|  | TEST(CudaVector, Norm) { | 
|  | Vector x(3); | 
|  | x << 1, 2, 3; | 
|  | ContextImpl context; | 
|  | std::string message; | 
|  | CHECK(context.InitCuda(&message)) << "InitCuda() failed because: " << message; | 
|  | CudaVector x_gpu(&context, 10); | 
|  | x_gpu.CopyFromCpu(x); | 
|  |  | 
|  | EXPECT_NEAR(x_gpu.Norm(), | 
|  | sqrt(1.0 + 4.0 + 9.0), | 
|  | std::numeric_limits<double>::epsilon()); | 
|  |  | 
|  | EXPECT_NEAR(Norm(x_gpu), | 
|  | sqrt(1.0 + 4.0 + 9.0), | 
|  | std::numeric_limits<double>::epsilon()); | 
|  | } | 
|  |  | 
|  | TEST(CudaVector, SetZero) { | 
|  | Vector x(4); | 
|  | x << 1, 1, 1, 1; | 
|  | ContextImpl context; | 
|  | std::string message; | 
|  | CHECK(context.InitCuda(&message)) << "InitCuda() failed because: " << message; | 
|  | CudaVector x_gpu(&context, 10); | 
|  | x_gpu.CopyFromCpu(x); | 
|  |  | 
|  | EXPECT_NEAR(x_gpu.Norm(), 2.0, std::numeric_limits<double>::epsilon()); | 
|  |  | 
|  | x_gpu.SetZero(); | 
|  | EXPECT_NEAR(x_gpu.Norm(), 0.0, std::numeric_limits<double>::epsilon()); | 
|  |  | 
|  | x_gpu.CopyFromCpu(x); | 
|  | EXPECT_NEAR(x_gpu.Norm(), 2.0, std::numeric_limits<double>::epsilon()); | 
|  | SetZero(x_gpu); | 
|  | EXPECT_NEAR(x_gpu.Norm(), 0.0, std::numeric_limits<double>::epsilon()); | 
|  | } | 
|  |  | 
|  | TEST(CudaVector, Resize) { | 
|  | ContextImpl context; | 
|  | std::string message; | 
|  | CHECK(context.InitCuda(&message)) << "InitCuda() failed because: " << message; | 
|  | CudaVector x_gpu(&context, 10); | 
|  | EXPECT_EQ(x_gpu.num_rows(), 10); | 
|  | x_gpu.Resize(4); | 
|  | EXPECT_EQ(x_gpu.num_rows(), 4); | 
|  | } | 
|  |  | 
|  | TEST(CudaVector, Axpy) { | 
|  | Vector x(4); | 
|  | Vector y(4); | 
|  | x << 1, 1, 1, 1; | 
|  | y << 100, 10, 1, 0; | 
|  | ContextImpl context; | 
|  | std::string message; | 
|  | CHECK(context.InitCuda(&message)) << "InitCuda() failed because: " << message; | 
|  | CudaVector x_gpu(&context, 4); | 
|  | CudaVector y_gpu(&context, 4); | 
|  | x_gpu.CopyFromCpu(x); | 
|  | y_gpu.CopyFromCpu(y); | 
|  |  | 
|  | x_gpu.Axpby(2.0, y_gpu, 1.0); | 
|  | Vector result; | 
|  | Vector expected(4); | 
|  | expected << 201, 21, 3, 1; | 
|  | x_gpu.CopyTo(&result); | 
|  | EXPECT_EQ(result, expected); | 
|  | } | 
|  |  | 
|  | TEST(CudaVector, AxpbyBEquals1) { | 
|  | Vector x(4); | 
|  | Vector y(4); | 
|  | x << 1, 1, 1, 1; | 
|  | y << 100, 10, 1, 0; | 
|  | ContextImpl context; | 
|  | std::string message; | 
|  | CHECK(context.InitCuda(&message)) << "InitCuda() failed because: " << message; | 
|  | CudaVector x_gpu(&context, 4); | 
|  | CudaVector y_gpu(&context, 4); | 
|  | x_gpu.CopyFromCpu(x); | 
|  | y_gpu.CopyFromCpu(y); | 
|  |  | 
|  | x_gpu.Axpby(2.0, y_gpu, 1.0); | 
|  | Vector result; | 
|  | Vector expected(4); | 
|  | expected << 201, 21, 3, 1; | 
|  | x_gpu.CopyTo(&result); | 
|  | EXPECT_EQ(result, expected); | 
|  | } | 
|  |  | 
|  | TEST(CudaVector, AxpbyMemberFunctionBNotEqual1) { | 
|  | Vector x(4); | 
|  | Vector y(4); | 
|  | x << 1, 1, 1, 1; | 
|  | y << 100, 10, 1, 0; | 
|  | ContextImpl context; | 
|  | std::string message; | 
|  | CHECK(context.InitCuda(&message)) << "InitCuda() failed because: " << message; | 
|  | CudaVector x_gpu(&context, 4); | 
|  | CudaVector y_gpu(&context, 4); | 
|  | x_gpu.CopyFromCpu(x); | 
|  | y_gpu.CopyFromCpu(y); | 
|  |  | 
|  | x_gpu.Axpby(2.0, y_gpu, 3.0); | 
|  | Vector result; | 
|  | Vector expected(4); | 
|  | expected << 203, 23, 5, 3; | 
|  | x_gpu.CopyTo(&result); | 
|  | EXPECT_EQ(result, expected); | 
|  | } | 
|  |  | 
|  | TEST(CudaVector, AxpbyMemberFunctionBEqual1) { | 
|  | Vector x(4); | 
|  | Vector y(4); | 
|  | x << 1, 1, 1, 1; | 
|  | y << 100, 10, 1, 0; | 
|  | ContextImpl context; | 
|  | std::string message; | 
|  | CHECK(context.InitCuda(&message)) << "InitCuda() failed because: " << message; | 
|  | CudaVector x_gpu(&context, 4); | 
|  | CudaVector y_gpu(&context, 4); | 
|  | x_gpu.CopyFromCpu(x); | 
|  | y_gpu.CopyFromCpu(y); | 
|  |  | 
|  | x_gpu.Axpby(2.0, y_gpu, 1.0); | 
|  | Vector result; | 
|  | Vector expected(4); | 
|  | expected << 201, 21, 3, 1; | 
|  | x_gpu.CopyTo(&result); | 
|  | EXPECT_EQ(result, expected); | 
|  | } | 
|  |  | 
|  | TEST(CudaVector, AxpbyMemberXAliasesY) { | 
|  | Vector x(4); | 
|  | x << 100, 10, 1, 0; | 
|  | ContextImpl context; | 
|  | std::string message; | 
|  | CHECK(context.InitCuda(&message)) << "InitCuda() failed because: " << message; | 
|  | CudaVector x_gpu(&context, 4); | 
|  | CudaVector y_gpu(&context, 4); | 
|  | x_gpu.CopyFromCpu(x); | 
|  | y_gpu.SetZero(); | 
|  |  | 
|  | x_gpu.Axpby(2.0, x_gpu, 1.0); | 
|  | Vector result; | 
|  | Vector expected(4); | 
|  | expected << 300, 30, 3, 0; | 
|  | x_gpu.CopyTo(&result); | 
|  | EXPECT_EQ(result, expected); | 
|  | } | 
|  |  | 
|  | TEST(CudaVector, AxpbyNonMemberMethodNoAliases) { | 
|  | Vector x(4); | 
|  | Vector y(4); | 
|  | x << 1, 1, 1, 1; | 
|  | y << 100, 10, 1, 0; | 
|  | ContextImpl context; | 
|  | std::string message; | 
|  | CHECK(context.InitCuda(&message)) << "InitCuda() failed because: " << message; | 
|  | CudaVector x_gpu(&context, 4); | 
|  | CudaVector y_gpu(&context, 4); | 
|  | CudaVector z_gpu(&context, 4); | 
|  | x_gpu.CopyFromCpu(x); | 
|  | y_gpu.CopyFromCpu(y); | 
|  | z_gpu.Resize(4); | 
|  | z_gpu.SetZero(); | 
|  |  | 
|  | Axpby(2.0, x_gpu, 3.0, y_gpu, z_gpu); | 
|  | Vector result; | 
|  | Vector expected(4); | 
|  | expected << 302, 32, 5, 2; | 
|  | z_gpu.CopyTo(&result); | 
|  | EXPECT_EQ(result, expected); | 
|  | } | 
|  |  | 
|  | TEST(CudaVector, AxpbyNonMemberMethodXAliasesY) { | 
|  | Vector x(4); | 
|  | x << 100, 10, 1, 0; | 
|  | ContextImpl context; | 
|  | std::string message; | 
|  | CHECK(context.InitCuda(&message)) << "InitCuda() failed because: " << message; | 
|  | CudaVector x_gpu(&context, 4); | 
|  | CudaVector z_gpu(&context, 4); | 
|  | x_gpu.CopyFromCpu(x); | 
|  | z_gpu.SetZero(); | 
|  |  | 
|  | Axpby(2.0, x_gpu, 3.0, x_gpu, z_gpu); | 
|  | Vector result; | 
|  | Vector expected(4); | 
|  | expected << 500, 50, 5, 0; | 
|  | z_gpu.CopyTo(&result); | 
|  | EXPECT_EQ(result, expected); | 
|  | } | 
|  |  | 
|  | TEST(CudaVector, AxpbyNonMemberMethodXAliasesZ) { | 
|  | Vector x(4); | 
|  | Vector y(4); | 
|  | x << 1, 1, 1, 1; | 
|  | y << 100, 10, 1, 0; | 
|  | ContextImpl context; | 
|  | std::string message; | 
|  | CHECK(context.InitCuda(&message)) << "InitCuda() failed because: " << message; | 
|  | CudaVector x_gpu(&context, 10); | 
|  | CudaVector y_gpu(&context, 10); | 
|  | x_gpu.CopyFromCpu(x); | 
|  | y_gpu.CopyFromCpu(y); | 
|  |  | 
|  | Axpby(2.0, x_gpu, 3.0, y_gpu, x_gpu); | 
|  | Vector result; | 
|  | Vector expected(4); | 
|  | expected << 302, 32, 5, 2; | 
|  | x_gpu.CopyTo(&result); | 
|  | EXPECT_EQ(result, expected); | 
|  | } | 
|  |  | 
|  | TEST(CudaVector, AxpbyNonMemberMethodYAliasesZ) { | 
|  | Vector x(4); | 
|  | Vector y(4); | 
|  | x << 1, 1, 1, 1; | 
|  | y << 100, 10, 1, 0; | 
|  | ContextImpl context; | 
|  | std::string message; | 
|  | CHECK(context.InitCuda(&message)) << "InitCuda() failed because: " << message; | 
|  | CudaVector x_gpu(&context, 4); | 
|  | CudaVector y_gpu(&context, 4); | 
|  | x_gpu.CopyFromCpu(x); | 
|  | y_gpu.CopyFromCpu(y); | 
|  |  | 
|  | Axpby(2.0, x_gpu, 3.0, y_gpu, y_gpu); | 
|  | Vector result; | 
|  | Vector expected(4); | 
|  | expected << 302, 32, 5, 2; | 
|  | y_gpu.CopyTo(&result); | 
|  | EXPECT_EQ(result, expected); | 
|  | } | 
|  |  | 
|  | TEST(CudaVector, AxpbyNonMemberMethodXAliasesYAliasesZ) { | 
|  | Vector x(4); | 
|  | x << 100, 10, 1, 0; | 
|  | ContextImpl context; | 
|  | std::string message; | 
|  | CHECK(context.InitCuda(&message)) << "InitCuda() failed because: " << message; | 
|  | CudaVector x_gpu(&context, 10); | 
|  | x_gpu.CopyFromCpu(x); | 
|  |  | 
|  | Axpby(2.0, x_gpu, 3.0, x_gpu, x_gpu); | 
|  | Vector result; | 
|  | Vector expected(4); | 
|  | expected << 500, 50, 5, 0; | 
|  | x_gpu.CopyTo(&result); | 
|  | EXPECT_EQ(result, expected); | 
|  | } | 
|  |  | 
|  | TEST(CudaVector, DtDxpy) { | 
|  | Vector x(4); | 
|  | Vector y(4); | 
|  | Vector D(4); | 
|  | x << 1, 2, 3, 4; | 
|  | y << 100, 10, 1, 0; | 
|  | D << 4, 3, 2, 1; | 
|  | ContextImpl context; | 
|  | std::string message; | 
|  | CHECK(context.InitCuda(&message)) << "InitCuda() failed because: " << message; | 
|  | CudaVector x_gpu(&context, 4); | 
|  | CudaVector y_gpu(&context, 4); | 
|  | CudaVector D_gpu(&context, 4); | 
|  | x_gpu.CopyFromCpu(x); | 
|  | y_gpu.CopyFromCpu(y); | 
|  | D_gpu.CopyFromCpu(D); | 
|  |  | 
|  | y_gpu.DtDxpy(D_gpu, x_gpu); | 
|  | Vector result; | 
|  | Vector expected(4); | 
|  | expected << 116, 28, 13, 4; | 
|  | y_gpu.CopyTo(&result); | 
|  | EXPECT_EQ(result, expected); | 
|  | } | 
|  |  | 
|  | TEST(CudaVector, Scale) { | 
|  | Vector x(4); | 
|  | x << 1, 2, 3, 4; | 
|  | ContextImpl context; | 
|  | std::string message; | 
|  | CHECK(context.InitCuda(&message)) << "InitCuda() failed because: " << message; | 
|  | CudaVector x_gpu(&context, 4); | 
|  | x_gpu.CopyFromCpu(x); | 
|  |  | 
|  | x_gpu.Scale(-3.0); | 
|  |  | 
|  | Vector result; | 
|  | Vector expected(4); | 
|  | expected << -3.0, -6.0, -9.0, -12.0; | 
|  | x_gpu.CopyTo(&result); | 
|  | EXPECT_EQ(result, expected); | 
|  | } | 
|  |  | 
|  | #endif  // CERES_NO_CUDA | 
|  |  | 
|  | }  // namespace internal | 
|  | }  // namespace ceres |