From acdf85f87d46333e406304b721e97eff0e197396 Mon Sep 17 00:00:00 2001 From: Matt Peddie Date: Thu, 20 Mar 2025 17:29:33 +1000 Subject: [PATCH 1/6] WIP: dense conjugate-gradient solver for dense problems --- BUILD.bazel | 3 + include/albatross/CGGP | 19 ++ .../src/models/conjugate_gradient_gp.hpp | 214 ++++++++++++++++++ tests/test_cg_gp.cc | 47 ++++ 4 files changed, 283 insertions(+) create mode 100644 include/albatross/CGGP create mode 100644 include/albatross/src/models/conjugate_gradient_gp.hpp create mode 100644 tests/test_cg_gp.cc diff --git a/BUILD.bazel b/BUILD.bazel index 80a2538a..ee752997 100644 --- a/BUILD.bazel +++ b/BUILD.bazel @@ -21,6 +21,7 @@ filegroup( cc_library( name = "albatross", hdrs = [ + "include/albatross/CGGP", "include/albatross/Common", "include/albatross/Core", "include/albatross/CovarianceFunctions", @@ -125,6 +126,7 @@ cc_library( "include/albatross/src/linalg/qr_utils.hpp", "include/albatross/src/linalg/spqr_utils.hpp", "include/albatross/src/models/conditional_gaussian.hpp", + "include/albatross/src/models/conjugate_gradient_gp.hpp", "include/albatross/src/models/gp.hpp", "include/albatross/src/models/least_squares.hpp", "include/albatross/src/models/null_model.hpp", @@ -200,6 +202,7 @@ swift_cc_test( "tests/test_block_utils.cc", "tests/test_call_trace.cc", "tests/test_callers.cc", + "tests/test_cg_gp.cc", "tests/test_chi_squared_versus_gsl.cc", "tests/test_compression.cc", "tests/test_concatenate.cc", diff --git a/include/albatross/CGGP b/include/albatross/CGGP new file mode 100644 index 00000000..80a115e3 --- /dev/null +++ b/include/albatross/CGGP @@ -0,0 +1,19 @@ +/* + * Copyright (C) 2025 Swift Navigation Inc. + * Contact: Swift Navigation + * + * This source is subject to the license found in the file 'LICENSE' which must + * be distributed together with this source. All other rights reserved. + * + * THIS CODE AND INFORMATION IS PROVIDED "AS IS" WITHOUT WARRANTY OF ANY KIND, + * EITHER EXPRESSED OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE IMPLIED + * WARRANTIES OF MERCHANTABILITY AND/OR FITNESS FOR A PARTICULAR PURPOSE. + */ + +#ifndef ALBATROSS_CG_GP_H +#define ALBATROSS_CG_GP_H + +#include "GP" +#include + +#endif // ALBATROSS_CG_GP_H diff --git a/include/albatross/src/models/conjugate_gradient_gp.hpp b/include/albatross/src/models/conjugate_gradient_gp.hpp new file mode 100644 index 00000000..19e71e08 --- /dev/null +++ b/include/albatross/src/models/conjugate_gradient_gp.hpp @@ -0,0 +1,214 @@ +/* + * Copyright (C) 2025 Swift Navigation Inc. + * Contact: Swift Navigation + * + * This source is subject to the license found in the file 'LICENSE' which must + * be distributed together with this source. All other rights reserved. + * + * THIS CODE AND INFORMATION IS PROVIDED "AS IS" WITHOUT WARRANTY OF ANY KIND, + * EITHER EXPRESSED OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE IMPLIED + * WARRANTIES OF MERCHANTABILITY AND/OR FITNESS FOR A PARTICULAR PURPOSE. + */ + +namespace albatross { + +template +struct ConjugateGradientGPFit {}; + +template +struct Fit> { + std::vector train_features; + // We have to store this; the solver only takes a reference to it + // and doesn't own it. + Eigen::MatrixXd K_ff; + using SolverType = + Eigen::ConjugateGradient; + // Pretty annoying that you can't copy an Eigen solver object. + // Maybe this is a bad idea for now, but seemingly Albatross + // requires you to be able to copy these. 
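+  // N.B. because copies share this pointer, a copied Fit keeps its
+  // own K_ff but its solver still references the *source* object's
+  // K_ff, so copies are only safe to use while the original is
+  // alive. A sketch of a hypothetical deep-copying alternative (not
+  // part of this patch), at the cost of redoing compute() per copy:
+  //
+  //   Fit(const Fit &other)
+  //       : train_features{other.train_features}, K_ff{other.K_ff},
+  //         solver{std::make_shared<SolverType>(K_ff)},
+  //         information{other.information} {}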
+ std::shared_ptr solver; + Eigen::VectorXd information; + + Fit(const std::vector &train_features_, Eigen::MatrixXd &&K_ff_, + const MarginalDistribution &targets_) + : train_features{train_features_}, K_ff{std::move(K_ff_)}, + // N.B. we give the CG solver a reference to our local member + // matrix. + solver{std::make_shared(K_ff)}, + information{solver->solve(targets_.mean)} {} + + bool operator==(const Fit &other) { + return std::tie(train_features, K_ff, information) == + std::tie(other.train_features, other.K_ff, other.information); + } +}; + +template +inline JointDistribution cg_gp_joint_prediction( + const Eigen::MatrixXd &cross_cov, const Eigen::MatrixXd &prior_cov, + const Eigen::VectorXd &information, const CGSolver &solver) { + return JointDistribution(gp_mean_prediction(cross_cov, information), + prior_cov - + cross_cov.transpose() * solver.solve(cross_cov)); +} + +template +inline MarginalDistribution cg_gp_marginal_prediction( + const Eigen::MatrixXd &cross_cov, const Eigen::VectorXd &prior_variance, + const Eigen::VectorXd &information, const CGSolver &solver) { + return MarginalDistribution( + gp_mean_prediction(cross_cov, information), + prior_variance - + (cross_cov.transpose() * solver.solve(cross_cov)).diagonal()); +} + +template +class ConjugateGradientGaussianProcessRegression + : public GaussianProcessBase> { +public: + using Base = GaussianProcessBase>; + + using Base::covariance_function_; + using Base::mean_function_; + + ConjugateGradientGaussianProcessRegression() : Base() {}; + + template + ConjugateGradientGaussianProcessRegression(Cov &&covariance_function) + : Base(std::forward(covariance_function)) { + static_assert( + std::is_same, CovFunc>::value, + "Please construct this with the same covariance it's declared for."); + } + + template + ConjugateGradientGaussianProcessRegression(Cov &&covariance_function, + const std::string &model_name) + : Base(std::forward(covariance_function), model_name) { + static_assert( + std::is_same, CovFunc>::value, + "Please construct this with the same covariance it's declared for."); + } + + template + ConjugateGradientGaussianProcessRegression(Cov &&covariance_function, + Mean &&mean_function, + const std::string &model_name) + : Base(std::forward(covariance_function), + std::forward(mean_function), model_name) { + static_assert(std::is_same, CovFunc>::value && + std::is_same, MeanFunc>::value, + "Please construct this with the same covariance and mean " + "it's declared for."); + } + + template < + typename FeatureType, + std::enable_if_t< + has_call_operator::value, int> = 0> + Fit> + _fit_impl(const std::vector &features, + const MarginalDistribution &targets) const { + Eigen::MatrixXd K_ff = + covariance_function_(features, Base::threads_.get()); + MarginalDistribution zero_mean_targets(targets); + K_ff += targets.covariance; + mean_function_.remove_from(features, &zero_mean_targets.mean); + return Fit>{ + features, std::move(K_ff), std::move(zero_mean_targets)}; + } + + template < + typename FeatureType, typename FitFeatureType, + std::enable_if_t< + has_call_operator::value && + has_call_operator::value, + int> = 0> + JointDistribution _predict_impl( + const std::vector &features, + const Fit> &cg_gp_fit, + PredictTypeIdentity &&) const { + const auto cross_cov = + covariance_function_(cg_gp_fit.train_features, features); + Eigen::MatrixXd prior_cov{covariance_function_(features)}; + auto pred = cg_gp_joint_prediction( + cross_cov, prior_cov, cg_gp_fit.information, *cg_gp_fit.solver); + 
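+    // For reference, with v = K_ff^-1 y computed at fit time and
+    // C = K(train, test) = cross_cov, the call above evaluates the
+    // standard GP posterior
+    //   mean = C^T v,
+    //   cov  = K_** - C^T K_ff^-1 C,
+    // where K_ff^-1 C is applied iteratively by the CG solver rather
+    // than through a dense factorisation of K_ff.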
mean_function_.add_to(features, &pred.mean); + return pred; + } + + template < + typename FeatureType, typename FitFeatureType, + std::enable_if_t< + has_call_operator::value && + has_call_operator::value, + int> = 0> + MarginalDistribution _predict_impl( + const std::vector &features, + const Fit> + &cg_gp_fit, + PredictTypeIdentity &&) const { + const auto cross_cov = + covariance_function_(cg_gp_fit.train_features, features); + Eigen::VectorXd prior_variance(Eigen::VectorXd::NullaryExpr( + cast::to_index(features.size()), [this, &features](Eigen::Index i) { + const auto &f = features[cast::to_size(i)]; + return covariance_function_(f, f); + })); + auto pred = cg_gp_marginal_prediction( + cross_cov, prior_variance, cg_gp_fit.information, *cg_gp_fit.solver); + mean_function_.add_to(features, &pred.mean); + return pred; + } + + template < + typename FeatureType, typename FitFeatureType, + std::enable_if_t< + has_call_operator::value && + has_call_operator::value, + int> = 0> + Eigen::VectorXd _predict_impl( + const std::vector &features, + const Fit> + &cg_gp_fit, + PredictTypeIdentity &&) const { + const auto cross_cov = + covariance_function_(cg_gp_fit.train_features, features); + auto pred = gp_mean_prediction(cross_cov, cg_gp_fit.information); + mean_function_.add_to(features, &pred); + return pred; + } +}; + +// TODO(@peddie): this is known not to have any effect for stationary +// kernels, but IncompleteCholesky assumes a `twistedBy` (sparse +// self-adjoint view) member, so this is all we can do for the moment. +using AlbatrossCGDefaultPreconditioner = Eigen::DiagonalPreconditioner; + +template +auto cg_gp_from_covariance(CovFunc &&covariance_function, + const std::string &model_name, + Preconditioner && = Preconditioner{}) { + return ConjugateGradientGaussianProcessRegression< + typename std::decay::type, decltype(ZeroMean()), Preconditioner>( + std::forward(covariance_function), model_name); +} + +template +auto cg_gp_from_mean_and_covariance(CovFunc &&covariance_function, + MeanFunc &&mean_function, + const std::string &model_name, + Preconditioner && = Preconditioner{}) { + return ConjugateGradientGaussianProcessRegression< + typename std::decay::type, typename std::decay::type, + Preconditioner>(std::forward(covariance_function), + std::forward(mean_function), model_name); +} + +} // namespace albatross \ No newline at end of file diff --git a/tests/test_cg_gp.cc b/tests/test_cg_gp.cc new file mode 100644 index 00000000..5135088b --- /dev/null +++ b/tests/test_cg_gp.cc @@ -0,0 +1,47 @@ +/* + * Copyright (C) 2025 Swift Navigation Inc. + * Contact: Swift Navigation + * + * This source is subject to the license found in the file 'LICENSE' which must + * be distributed together with this source. All other rights reserved. + * + * THIS CODE AND INFORMATION IS PROVIDED "AS IS" WITHOUT WARRANTY OF ANY KIND, + * EITHER EXPRESSED OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE IMPLIED + * WARRANTIES OF MERCHANTABILITY AND/OR FITNESS FOR A PARTICULAR PURPOSE. 
+ */ + +#include + +#include "test_models.h" +#include + +#include + +namespace albatross { + +TEST(TestConjugateGradientGP, TestMean) { + using CovFunc = SquaredExponential; + + CovFunc covariance(1, 1); + auto dataset = make_toy_linear_data(); + auto direct = gp_from_covariance(covariance, "direct"); + auto cg = cg_gp_from_covariance(covariance, "cg"); + + auto direct_fit = direct.fit(dataset); + auto cg_fit = cg.fit(dataset); + + auto test_features = linspace(0.01, 9.9, 11); + + auto direct_pred = direct_fit.predict_with_measurement_noise(test_features).joint(); + auto cg_pred = cg_fit.predict_with_measurement_noise(test_features).joint(); + + double mean_error = (direct_pred.mean - cg_pred.mean).norm(); + EXPECT_LT(mean_error, 1.e-9); + + double cov_distance = + albatross::distance::wasserstein_2(direct_pred, cg_pred); + + EXPECT_LT(cov_distance, 1.e-9); +} + +} // namespace albatross \ No newline at end of file From c4b51f75fc4a198924d298fc52c9201deaa8cc93 Mon Sep 17 00:00:00 2001 From: Matt Peddie Date: Fri, 21 Mar 2025 13:31:55 +1000 Subject: [PATCH 2/6] Options handling and performance comparisons --- .../src/models/conjugate_gradient_gp.hpp | 204 ++++++++++++++---- tests/test_cg_gp.cc | 125 ++++++++++- 2 files changed, 284 insertions(+), 45 deletions(-) diff --git a/include/albatross/src/models/conjugate_gradient_gp.hpp b/include/albatross/src/models/conjugate_gradient_gp.hpp index 19e71e08..afc7ee76 100644 --- a/include/albatross/src/models/conjugate_gradient_gp.hpp +++ b/include/albatross/src/models/conjugate_gradient_gp.hpp @@ -15,6 +15,59 @@ namespace albatross { template struct ConjugateGradientGPFit {}; +struct IterativeSolverOptions { + // Negative values for these will be ignored. + static constexpr const Eigen::Index cDefaultMaxIterations{-1}; + Eigen::Index max_iterations{cDefaultMaxIterations}; + static constexpr const double cDefaultTolerance{-1}; + double tolerance{cDefaultTolerance}; + + IterativeSolverOptions() {} + + IterativeSolverOptions(Eigen::Index iterations, double tol) + : max_iterations{iterations}, tolerance{tol} {} + + template + explicit IterativeSolverOptions(SolverType &&solver) + : max_iterations{solver.maxIterations()}, tolerance{solver.tolerance()} {} + + template + void configure_solver(SolverType &solver) const { + if (tolerance > 0) { + solver.setTolerance(tolerance); + } + + if (max_iterations > 0) { + solver.setMaxIterations(max_iterations); + } + } +}; + +struct IterativeSolverState { + Eigen::ComputationInfo info; + Eigen::Index iterations; + double error; + + IterativeSolverState() = delete; + + template + explicit IterativeSolverState(SolverType &&solver) + : info{solver.info()}, + iterations{solver.iterations()}, error{solver.error()} {} +}; + +namespace detail { + +template +std::shared_ptr> +make_shared_solver_with_options(const Eigen::MatrixXd &m, + const IterativeSolverOptions &options) { + auto solver = std::make_shared>(m); + options.configure_solver(*solver); + return solver; +} +} // namespace detail + template struct Fit> { std::vector train_features; @@ -29,13 +82,43 @@ struct Fit> { std::shared_ptr solver; Eigen::VectorXd information; + IterativeSolverOptions get_options() const { + return IterativeSolverOptions{*solver}; + } + + IterativeSolverState get_solver_state() const { + return IterativeSolverState{*solver}; + } + + void set_options(const IterativeSolverOptions &options) { + options.configure_solver(*solver); + } + Fit(const std::vector &train_features_, Eigen::MatrixXd &&K_ff_, const MarginalDistribution &targets_) : 
train_features{train_features_}, K_ff{std::move(K_ff_)}, // N.B. we give the CG solver a reference to our local member // matrix. - solver{std::make_shared(K_ff)}, - information{solver->solve(targets_.mean)} {} + solver{std::make_shared(K_ff)}, information{solver->solve( + targets_.mean)} { + if (solver->info() != Eigen::Success) { + information.setConstant(std::numeric_limits::quiet_NaN()); + } + } + + Fit(const std::vector &train_features_, Eigen::MatrixXd &&K_ff_, + const MarginalDistribution &targets_, + const IterativeSolverOptions &options) + : train_features{train_features_}, K_ff{std::move(K_ff_)}, + // N.B. we give the CG solver a reference to our local member + // matrix. + solver{ + detail::make_shared_solver_with_options(K_ff, options)}, + information{solver->solve(targets_.mean)} { + if (solver->info() != Eigen::Success) { + information.setConstant(std::numeric_limits::quiet_NaN()); + } + } bool operator==(const Fit &other) { return std::tie(train_features, K_ff, information) == @@ -47,19 +130,30 @@ template inline JointDistribution cg_gp_joint_prediction( const Eigen::MatrixXd &cross_cov, const Eigen::MatrixXd &prior_cov, const Eigen::VectorXd &information, const CGSolver &solver) { - return JointDistribution(gp_mean_prediction(cross_cov, information), - prior_cov - - cross_cov.transpose() * solver.solve(cross_cov)); + JointDistribution ret(gp_mean_prediction(cross_cov, information), + prior_cov - + cross_cov.transpose() * solver.solve(cross_cov)); + if (solver.info() != Eigen::Success) { + ret.covariance.setConstant(std::numeric_limits::quiet_NaN()); + } + + return ret; } template inline MarginalDistribution cg_gp_marginal_prediction( const Eigen::MatrixXd &cross_cov, const Eigen::VectorXd &prior_variance, const Eigen::VectorXd &information, const CGSolver &solver) { - return MarginalDistribution( + MarginalDistribution ret( gp_mean_prediction(cross_cov, information), prior_variance - (cross_cov.transpose() * solver.solve(cross_cov)).diagonal()); + if (solver.info() != Eigen::Success) { + ret.covariance.diagonal().setConstant( + std::numeric_limits::quiet_NaN()); + } + + return ret; } template @@ -75,36 +169,52 @@ class ConjugateGradientGaussianProcessRegression using Base::covariance_function_; using Base::mean_function_; - ConjugateGradientGaussianProcessRegression() : Base() {}; + ConjugateGradientGaussianProcessRegression() : Base(){}; - template + template , CovFunc>::value, + int> = 0> ConjugateGradientGaussianProcessRegression(Cov &&covariance_function) - : Base(std::forward(covariance_function)) { - static_assert( - std::is_same, CovFunc>::value, - "Please construct this with the same covariance it's declared for."); - } + : Base(std::forward(covariance_function)) {} - template + template , CovFunc>::value, + int> = 0> ConjugateGradientGaussianProcessRegression(Cov &&covariance_function, const std::string &model_name) - : Base(std::forward(covariance_function), model_name) { - static_assert( - std::is_same, CovFunc>::value, - "Please construct this with the same covariance it's declared for."); - } + : Base(std::forward(covariance_function), model_name) {} + + template , CovFunc>::value, + int> = 0> + ConjugateGradientGaussianProcessRegression( + Cov &&covariance_function, const std::string &model_name, + const IterativeSolverOptions &options) + : Base(std::forward(covariance_function), model_name), + options_{options} {} - template + template < + typename Cov, typename Mean, + std::enable_if_t, CovFunc>::value && + std::is_same, MeanFunc>::value, + int> = 0> 
ConjugateGradientGaussianProcessRegression(Cov &&covariance_function, Mean &&mean_function, const std::string &model_name) : Base(std::forward(covariance_function), - std::forward(mean_function), model_name) { - static_assert(std::is_same, CovFunc>::value && - std::is_same, MeanFunc>::value, - "Please construct this with the same covariance and mean " - "it's declared for."); - } + std::forward(mean_function), model_name) {} + + template < + typename Cov, typename Mean, + std::enable_if_t, CovFunc>::value && + std::is_same, MeanFunc>::value, + int> = 0> + ConjugateGradientGaussianProcessRegression( + Cov &&covariance_function, Mean &&mean_function, + const std::string &model_name, const IterativeSolverOptions &options) + : Base(std::forward(covariance_function), + std::forward(mean_function), model_name), + options_{options} {} template < typename FeatureType, @@ -113,13 +223,16 @@ class ConjugateGradientGaussianProcessRegression Fit> _fit_impl(const std::vector &features, const MarginalDistribution &targets) const { - Eigen::MatrixXd K_ff = - covariance_function_(features, Base::threads_.get()); + Eigen::MatrixXd K_ff = covariance_function_(features, Base::threads_.get()); MarginalDistribution zero_mean_targets(targets); K_ff += targets.covariance; mean_function_.remove_from(features, &zero_mean_targets.mean); + // Clamp this so that we never try to iterate more than the + // theoretical max of CG + auto options = options_; + options.max_iterations = std::min(options_.max_iterations, K_ff.rows()); return Fit>{ - features, std::move(K_ff), std::move(zero_mean_targets)}; + features, std::move(K_ff), std::move(zero_mean_targets), options}; } template < @@ -130,7 +243,8 @@ class ConjugateGradientGaussianProcessRegression int> = 0> JointDistribution _predict_impl( const std::vector &features, - const Fit> &cg_gp_fit, + const Fit> + &cg_gp_fit, PredictTypeIdentity &&) const { const auto cross_cov = covariance_function_(cg_gp_fit.train_features, features); @@ -182,6 +296,15 @@ class ConjugateGradientGaussianProcessRegression mean_function_.add_to(features, &pred); return pred; } + + IterativeSolverOptions get_options() const { return options_; } + + void set_options(const IterativeSolverOptions &options) { + options_ = options; + } + +private: + IterativeSolverOptions options_{}; }; // TODO(@peddie): this is known not to have any effect for stationary @@ -191,24 +314,27 @@ using AlbatrossCGDefaultPreconditioner = Eigen::DiagonalPreconditioner; template -auto cg_gp_from_covariance(CovFunc &&covariance_function, - const std::string &model_name, - Preconditioner && = Preconditioner{}) { +auto cg_gp_from_covariance( + CovFunc &&covariance_function, const std::string &model_name, + const IterativeSolverOptions &options = IterativeSolverOptions{}, + Preconditioner && = Preconditioner{}) { return ConjugateGradientGaussianProcessRegression< typename std::decay::type, decltype(ZeroMean()), Preconditioner>( - std::forward(covariance_function), model_name); + std::forward(covariance_function), model_name, options); } template -auto cg_gp_from_mean_and_covariance(CovFunc &&covariance_function, - MeanFunc &&mean_function, - const std::string &model_name, - Preconditioner && = Preconditioner{}) { +auto cg_gp_from_mean_and_covariance( + CovFunc &&covariance_function, MeanFunc &&mean_function, + const std::string &model_name, + const IterativeSolverOptions &options = IterativeSolverOptions{}, + Preconditioner && = Preconditioner{}) { return ConjugateGradientGaussianProcessRegression< typename std::decay::type, 
typename std::decay::type, Preconditioner>(std::forward(covariance_function), - std::forward(mean_function), model_name); + std::forward(mean_function), model_name, + options); } } // namespace albatross \ No newline at end of file diff --git a/tests/test_cg_gp.cc b/tests/test_cg_gp.cc index 5135088b..dea90a74 100644 --- a/tests/test_cg_gp.cc +++ b/tests/test_cg_gp.cc @@ -19,29 +19,142 @@ namespace albatross { +std::ostream &operator<<(std::ostream &os, Eigen::ComputationInfo info) { + switch (info) { + case Eigen::Success: + os << "Success"; + break; + case Eigen::NumericalIssue: + os << "NumericalIssue"; + break; + case Eigen::NoConvergence: + os << "NoConvergence"; + break; + case Eigen::InvalidInput: + os << "InvalidInput"; + break; + default: + os << ""; + }; + return os; +} + +namespace { +template +void describe_fit(const FitType &fit, std::ostream &os = std::cout) { + const auto options = fit.get_options(); + const auto state = fit.get_solver_state(); + os << " Status: " << state.info << std::endl; + os << " Tolerance: " << options.tolerance << std::endl; + os << " Error: " << state.error << std::endl; + os << "Max iterations: " << options.max_iterations << std::endl; + os << " Iterations: " << state.iterations << std::endl; +} +} // namespace + TEST(TestConjugateGradientGP, TestMean) { using CovFunc = SquaredExponential; CovFunc covariance(1, 1); - auto dataset = make_toy_linear_data(); + auto dataset = make_toy_linear_data(5, 1, 1.e-3, 5000); auto direct = gp_from_covariance(covariance, "direct"); auto cg = cg_gp_from_covariance(covariance, "cg"); + auto begin = std::chrono::steady_clock::now(); auto direct_fit = direct.fit(dataset); + std::cout << "direct fit: " + << std::chrono::duration_cast( + std::chrono::steady_clock::now() - begin) + .count() / + 1.e9 + << std::endl; + begin = std::chrono::steady_clock::now(); auto cg_fit = cg.fit(dataset); + std::cout << "cg fit: " + << std::chrono::duration_cast( + std::chrono::steady_clock::now() - begin) + .count() / + 1.e9 + << std::endl; + + describe_fit(cg_fit.get_fit()); + auto test_features = linspace(0.01, 9.9, 100); - auto test_features = linspace(0.01, 9.9, 11); + begin = std::chrono::steady_clock::now(); + auto direct_pred = + direct_fit.predict_with_measurement_noise(test_features).joint(); + std::cout << "direct predict: " + << std::chrono::duration_cast( + std::chrono::steady_clock::now() - begin) + .count() / + 1.e9 + << std::endl; - auto direct_pred = direct_fit.predict_with_measurement_noise(test_features).joint(); + begin = std::chrono::steady_clock::now(); auto cg_pred = cg_fit.predict_with_measurement_noise(test_features).joint(); + std::cout << "cg predict: " + << std::chrono::duration_cast( + std::chrono::steady_clock::now() - begin) + .count() / + 1.e9 + << std::endl; + describe_fit(cg_fit.get_fit()); + + EXPECT_TRUE(cg_pred.mean.array().isFinite().all()); + EXPECT_TRUE(cg_pred.covariance.array().isFinite().all()); double mean_error = (direct_pred.mean - cg_pred.mean).norm(); EXPECT_LT(mean_error, 1.e-9); - double cov_distance = - albatross::distance::wasserstein_2(direct_pred, cg_pred); + double cov_error = (direct_pred.covariance - cg_pred.covariance).norm(); + EXPECT_LT(cov_error, 1.e-9); + + begin = std::chrono::steady_clock::now(); + auto direct_marginal = + direct_fit.predict_with_measurement_noise(test_features).marginal(); + std::cout << "direct marginal: " + << std::chrono::duration_cast( + std::chrono::steady_clock::now() - begin) + .count() / + 1.e9 + << std::endl; + + begin = 
std::chrono::steady_clock::now(); + auto cg_marginal = + cg_fit.predict_with_measurement_noise(test_features).marginal(); + std::cout << "cg marginal: " + << std::chrono::duration_cast( + std::chrono::steady_clock::now() - begin) + .count() / + 1.e9 + << std::endl; + describe_fit(cg_fit.get_fit()); + double marginal_error = (direct_marginal.covariance.diagonal() - + cg_marginal.covariance.diagonal()) + .norm(); + EXPECT_LT(marginal_error, 1.e-9); + + begin = std::chrono::steady_clock::now(); + auto direct_mean = + direct_fit.predict_with_measurement_noise(test_features).mean(); + std::cout << "direct mean: " + << std::chrono::duration_cast( + std::chrono::steady_clock::now() - begin) + .count() / + 1.e9 + << std::endl; - EXPECT_LT(cov_distance, 1.e-9); + begin = std::chrono::steady_clock::now(); + auto cg_mean = cg_fit.predict_with_measurement_noise(test_features).mean(); + std::cout << "cg mean: " + << std::chrono::duration_cast( + std::chrono::steady_clock::now() - begin) + .count() / + 1.e9 + << std::endl; + describe_fit(cg_fit.get_fit()); + double mean_predict_error = (direct_mean - cg_mean).norm(); + EXPECT_LT(mean_predict_error, 1.e-9); } } // namespace albatross \ No newline at end of file From 0f2d8d03bdb41a427410fac034db41e9c9f59b66 Mon Sep 17 00:00:00 2001 From: Matt Peddie Date: Tue, 1 Apr 2025 11:16:28 +1000 Subject: [PATCH 3/6] WIP: partial Cholesky preconditioner --- BUILD.bazel | 4 + include/albatross/CGGP | 1 + .../albatross/src/eigen/partial_cholesky.hpp | 258 ++++++++++++++++++ tests/test_partial_cholesky.cc | 72 +++++ 4 files changed, 335 insertions(+) create mode 100644 include/albatross/src/eigen/partial_cholesky.hpp create mode 100644 tests/test_partial_cholesky.cc diff --git a/BUILD.bazel b/BUILD.bazel index ee752997..51361082 100644 --- a/BUILD.bazel +++ b/BUILD.bazel @@ -2,6 +2,8 @@ load("@rules_swiftnav//cc:defs.bzl", "UNIT", "swift_cc_test", "swift_cc_test_lib load("//:copts.bzl", "COPTS") load("@hedron_compile_commands//:refresh_compile_commands.bzl", "refresh_compile_commands") +subpackages(include = ["examples/**"]) + refresh_compile_commands( name = "gen_compile_commands", visibility = ["//visibility:public"], @@ -100,6 +102,7 @@ cc_library( "include/albatross/src/details/traits.hpp", "include/albatross/src/details/typecast.hpp", "include/albatross/src/details/unused.hpp", + "include/albatross/src/eigen/partial_cholesky.hpp", "include/albatross/src/eigen/serializable_ldlt.hpp", "include/albatross/src/eigen/serializable_spqr.hpp", "include/albatross/src/evaluation/cross_validation.hpp", @@ -232,6 +235,7 @@ swift_cc_test( "tests/test_models.cc", "tests/test_models.h", "tests/test_parameter_handling_mixin.cc", + "tests/test_partial_cholesky.cc", "tests/test_prediction.cc", "tests/test_radial.cc", "tests/test_random_utils.cc", diff --git a/include/albatross/CGGP b/include/albatross/CGGP index 80a115e3..f84f897a 100644 --- a/include/albatross/CGGP +++ b/include/albatross/CGGP @@ -14,6 +14,7 @@ #define ALBATROSS_CG_GP_H #include "GP" +#include #include #endif // ALBATROSS_CG_GP_H diff --git a/include/albatross/src/eigen/partial_cholesky.hpp b/include/albatross/src/eigen/partial_cholesky.hpp new file mode 100644 index 00000000..af6795fb --- /dev/null +++ b/include/albatross/src/eigen/partial_cholesky.hpp @@ -0,0 +1,258 @@ +/* + * Copyright (C) 2025 Swift Navigation Inc. + * Contact: Swift Navigation + * + * This source is subject to the license found in the file 'LICENSE' which must + * be distributed together with this source. All other rights reserved. 
+ * + * THIS CODE AND INFORMATION IS PROVIDED "AS IS" WITHOUT WARRANTY OF ANY KIND, + * EITHER EXPRESSED OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE IMPLIED + * WARRANTIES OF MERCHANTABILITY AND/OR FITNESS FOR A PARTICULAR PURPOSE. + */ + +namespace Eigen { + +template class PartialCholesky { +public: + using MatrixType = Matrix; + using StorageIndex = typename MatrixType::StorageIndex; + using RealScalar = typename NumTraits::Real; + + using PermutationType = PermutationMatrix; + + static constexpr const Index cDefaultOrder = 22; + + static constexpr const double cDefaultNugget = 1.e-5; + + PartialCholesky() {} + + explicit PartialCholesky(const MatrixType &A) + : m_rows{A.rows()}, m_cols{A.cols()} { + compute(A); + } + + PartialCholesky(const MatrixType &A, Index order, RealScalar nugget) + : m_rows{A.rows()}, m_cols{A.cols()}, m_order{order}, m_nugget{nugget} { + compute(A); + } + + inline Index order() const { return m_order; } + + PartialCholesky &setOrder(Index order) { + m_order = order; + return *this; + } + + inline double nugget() const { return m_nugget; } + + PartialCholesky &setNugget(double nugget) { + m_nugget = nugget; + return *this; + } + + PartialCholesky &compute(const MatrixType &A) { + // This computes a low-rank pivoted Cholesky decomposition. + // Unlike the normal dense LDLT and friends, we do not want to + // copy the potentially quite large A. Unlike the CG solver, we + // do not want to retain any reference to A's data once we have + // finished this function. + m_rows = A.rows(); + m_cols = A.cols(); + PermutationType transpositions(rows()); + transpositions.setIdentity(); + const Index max_rank = std::min(order(), rows()); + MatrixType L{MatrixType::Zero(rows(), max_rank)}; + + // A's diagonal; needs to keep getting pivoted, shifted and + // searched at each step + VectorXd diag{A.diagonal()}; + + // debug + MatrixType Ashadow{A}; + MatrixXd Lshadow{L}; + PermutationType Pshadow{rows()}; + Pshadow.setIdentity(); + + // Accumulated L column; also gets pivoted and shifted as we + // update, and contains the corrections to all columns of A below + // k. + VectorXd L_accum{VectorXd::Zero(rows())}; + + for (Index k = 0; k < max_rank; ++k) { + Index max_index; + diag.tail(max_rank - k).maxCoeff(&max_index); + max_index += k; + + if (max_index != k) { + std::cout << "Swapping '" << max_index << "' (" << diag(max_index) + << ") with '" << k << "' (" << diag(k) << ")" << std::endl; + transpositions.applyTranspositionOnTheRight(k, max_index); + std::swap(diag(k), diag(max_index)); + L.row(k).swap(L.row(max_index)); + std::swap(L_accum(k), L_accum(max_index)); + } + + std::cout << "P:\n" << Eigen::MatrixXi(transpositions) << std::endl; + + Index max_index_shadow; + Ashadow.diagonal().tail(max_rank - k).maxCoeff(&max_index_shadow); + max_index_shadow += k; + + if (max_index_shadow != k) { + std::cout << "Shadow: swapping '" << max_index_shadow << "' (" + << Ashadow.diagonal()(max_index_shadow) << ") with '" << k + << "' (" << Ashadow.diagonal()(k) << ")" << std::endl; + Lshadow.row(k).swap(Lshadow.row(max_index_shadow)); + Pshadow.applyTranspositionOnTheRight(k, max_index_shadow); + PermutationType t{rows()}; + t.setIdentity(); + t.applyTranspositionOnTheRight(k, max_index_shadow); + Ashadow = t.transpose() * Ashadow * t; + } + + std::cout << "Pshadow:\n" << Eigen::MatrixXi(Pshadow) << std::endl; + + if (diag(k) <= 0.) { + m_info = InvalidInput; + std::cerr << "Invalid value '" << diag(k) + << "' in pivoted cholesky decomp!" 
<< std::endl; + return *this; + } + + std::cout << "L:\n" << L << "\n"; + std::cout << "L_s:\n" << Lshadow << "\n"; + std::cout << "A_s:\n" << Ashadow << "\n"; + // std::cout << "L_accum: " << L_accum.transpose() << "\n"; + std::cout << " diag: " << diag.transpose() << '\n'; + + const RealScalar alpha = std::sqrt(diag(k)); + + L(k, k) = alpha; + Lshadow(k, k) = std::sqrt(Ashadow.diagonal()(k)); + + std::cout << "alpha: " << alpha << std::endl; + std::cout << "shadow alpha: " << Lshadow(k, k) << std::endl; + + const Index tail_size = rows() - k - 1; + std::cout << "tail_size: " << tail_size << std::endl; + + if (tail_size < 1) { + break; + } + // Everything below here should be ordered appropriately -- we + // pivot `diag` and `L_accum` and the rows of `L` every time we do an + // update + const VectorXd Acol = + ((transpositions.transpose() * A.col(transpositions.indices()(k)))) + .tail(tail_size); + const VectorXd Acol_shadow = Ashadow.col(k).tail(tail_size); + std::cout << " Acol: " << Acol.transpose() << std::endl; + std::cout << "Acol_s: " << Acol_shadow.transpose() << std::endl; + std::cout << " diff: " << (Acol - Acol_shadow).transpose() << std::endl; + + VectorXd b = Acol; + // if (k > 0) { + // b -= L.col(k - 1).tail(tail_size) * L(k, k - 1); + // } + for (Index i = 0; i < k; ++i) { + std::cout << "delta b(" << i + << "): " << L.col(i).tail(tail_size).transpose() << " * " + << L(k, i) << " = " + << L.col(i).tail(tail_size).transpose() * L(k, i) + << std::endl; + b -= L.col(i).tail(tail_size) * L(k, i); + } // + L_accum.tail(tail_size); + std::cout << " b: " << b.transpose() << std::endl; + + L.col(k).tail(tail_size) = b / alpha; + diag.tail(tail_size) -= + L.col(k).tail(tail_size).array().square().matrix(); + L_accum.tail(tail_size) -= Acol * Acol(0) / (alpha * alpha); + + Lshadow.col(k).tail(tail_size) = + Acol_shadow / std::sqrt(Ashadow.diagonal()(k)); + std::cout << "shadow bb^t / alpha:\n" + << 1 / (alpha * alpha) * Acol_shadow * Acol_shadow.transpose() + << std::endl; + Ashadow.bottomRightCorner(tail_size, tail_size) -= + 1 / (alpha * alpha) * Acol_shadow * Acol_shadow.transpose(); + + std::cout << "L:\n" << L << "\n"; + std::cout << "L_s:\n" << Lshadow << "\n"; + std::cout << "A_s:\n" << Ashadow << "\n"; + // std::cout << "L_accum: " << L_accum.transpose() << "\n"; + std::cout << " diag: " << diag.transpose() << '\n'; + std::cout << "========" << std::endl; + } + + m_transpositions = transpositions; + // std::cout << MatrixXi(m_transpositions) << std::endl; + + m_L = L; + // std::cout << L << std::endl; + + std::cout << MatrixXd(transpositions * L * L.transpose() * + transpositions.transpose()) + << std::endl; + + std::cout << MatrixXd(Pshadow * Lshadow * Lshadow.transpose() * + Pshadow.transpose()) + << std::endl; + + m_decomp = LDLT(MatrixXd::Identity(L.cols(), L.cols()) + + 1 / (m_nugget * m_nugget) * L.transpose() * L); + + m_info = Success; + return *this; + } + + MatrixXd matrixL() const { + assert(finished() && + "Please don't call this on an uninitialised decomposition!"); + + return m_L; + } + + PermutationType permutationsP() const { + assert(finished() && + "Please don't call this on an uninitialised decomposition!"); + + return m_transpositions; + } + + template + Matrix solve(const Rhs &b) const { + assert(finished() && + "Please don't call this on an unintialised decomposition!"); + const double n2 = m_nugget * m_nugget; + std::cout << 1 / n2 * b << std::endl; + std::cout << m_decomp.solve(m_L.transpose() * b) << std::endl; + Matrix ret = + 1 / n2 * b - + 1 / 
(n2 * n2) * + (m_transpositions * m_L * + m_decomp.solve(m_L.transpose() * m_transpositions.transpose() * b)); + return ret; + } + + inline bool finished() const { + return rows() > 0 && cols() > 0 & info() == Success; + } + + inline Index rows() const { return m_rows; } + inline Index cols() const { return m_cols; } + + ComputationInfo info() const { return m_info; } + +private: + StorageIndex m_rows{0}; + StorageIndex m_cols{0}; + Index m_order{cDefaultOrder}; + RealScalar m_nugget{cDefaultNugget}; + ComputationInfo m_info{Success}; + MatrixType m_L{}; + LDLT m_decomp{}; + PermutationType m_transpositions{}; +}; + +} // namespace Eigen \ No newline at end of file diff --git a/tests/test_partial_cholesky.cc b/tests/test_partial_cholesky.cc new file mode 100644 index 00000000..0f9e3eac --- /dev/null +++ b/tests/test_partial_cholesky.cc @@ -0,0 +1,72 @@ +/* + * Copyright (C) 2025 Swift Navigation Inc. + * Contact: Swift Navigation + * + * This source is subject to the license found in the file 'LICENSE' which must + * be distributed together with this source. All other rights reserved. + * + * THIS CODE AND INFORMATION IS PROVIDED "AS IS" WITHOUT WARRANTY OF ANY KIND, + * EITHER EXPRESSED OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE IMPLIED + * WARRANTIES OF MERCHANTABILITY AND/OR FITNESS FOR A PARTICULAR PURPOSE. + */ + +#include + +#include "test_models.h" +#include + +#include + +namespace albatross { + +TEST(PartialCholesky, Construct) { + Eigen::PartialCholesky p; + EXPECT_EQ(Eigen::Success, p.info()); +} + +static constexpr Eigen::Index cExampleSize = 4; + +TEST(PartialCholesky, Compute) { + Eigen::PartialCholesky p; + EXPECT_EQ(Eigen::Success, p.info()); + + std::default_random_engine gen{22}; + const auto m = random_covariance_matrix(cExampleSize, gen); + + p.compute(m); + std::cout << "A:\n" << m << std::endl; + + ASSERT_EQ(Eigen::Success, p.info()); + + Eigen::MatrixXd L = p.matrixL(); + Eigen::PartialCholesky::PermutationType P = p.permutationsP(); + + Eigen::MatrixXd m_reconstructed{P * L * L.transpose() * P.transpose()}; + EXPECT_LT((m_reconstructed - m).norm(), 1.e-9) << m_reconstructed - m; +} + +TEST(PartialCholesky, Solve) { + Eigen::PartialCholesky p; + ASSERT_EQ(Eigen::Success, p.info()); + + std::default_random_engine gen{22}; + const auto m = random_covariance_matrix(cExampleSize, gen); + std::cout << m << std::endl; + const Eigen::VectorXd b{Eigen::VectorXd::NullaryExpr(cExampleSize, [&gen]() { + return std::normal_distribution(0, 1)(gen); + })}; + + p.compute(m); + + const Eigen::VectorXd x_llt = m.ldlt().solve(b); + std::cout << "x_llt: " << x_llt.transpose() << std::endl; + + ASSERT_EQ(Eigen::Success, p.info()); + + const Eigen::VectorXd x = p.solve(b); + EXPECT_EQ(Eigen::Success, p.info()); + std::cout << " x: " << x.transpose() << std::endl; + EXPECT_LT((x - x_llt).norm(), p.nugget()); +} + +} // namespace albatross \ No newline at end of file From f07c48a2e003ce48aceb6dfb5f2d2e24185f16f7 Mon Sep 17 00:00:00 2001 From: Matt Peddie Date: Wed, 2 Apr 2025 15:20:51 +1000 Subject: [PATCH 4/6] Mad hacking --- .../albatross/src/eigen/partial_cholesky.hpp | 221 ++++++----- tests/test_cg_gp.cc | 4 +- tests/test_partial_cholesky.cc | 344 +++++++++++++++++- 3 files changed, 434 insertions(+), 135 deletions(-) diff --git a/include/albatross/src/eigen/partial_cholesky.hpp b/include/albatross/src/eigen/partial_cholesky.hpp index af6795fb..e24b7f62 100644 --- a/include/albatross/src/eigen/partial_cholesky.hpp +++ b/include/albatross/src/eigen/partial_cholesky.hpp @@ -12,6 +12,20 
@@ namespace Eigen { +// A pivoted, partial Cholesky decomposition. +// +// This is meant for use as a preconditioner for symmetric, +// positive-definite problems. The algorithm is described in: +// +// On the Low-rank Approximation by the Pivoted Cholesky Decomposition +// H. Harbrecht, M. Peters and R. Schneider +// http://www.dfg-spp1324.de/download/preprints/preprint076.pdf +// +// In this implementation, we make the natural choice to avoid storing +// a copy of the input matrix; we only copy its diagonal for use +// during the decomposition. The L matrix already stores the sequence +// of updates to each relevant column of A, so these updates are +// applied on demand as each pivot column is selected. template class PartialCholesky { public: using MatrixType = Matrix; @@ -22,7 +36,7 @@ template class PartialCholesky { static constexpr const Index cDefaultOrder = 22; - static constexpr const double cDefaultNugget = 1.e-5; + static constexpr const double cDefaultNugget = 1.e-3; PartialCholesky() {} @@ -31,6 +45,11 @@ template class PartialCholesky { compute(A); } + explicit PartialCholesky(Index order) : m_order{order} {} + + PartialCholesky(Index order, RealScalar nugget) + : m_order{order}, m_nugget{nugget} {} + PartialCholesky(const MatrixType &A, Index order, RealScalar nugget) : m_rows{A.rows()}, m_cols{A.cols()}, m_order{order}, m_nugget{nugget} { compute(A); @@ -50,12 +69,11 @@ template class PartialCholesky { return *this; } + // Unlike the normal dense LDLT and friends, we do not want to + // copy the potentially quite large A. Unlike the CG solver, we + // do not want to retain any reference to A's data once we have + // finished this function. PartialCholesky &compute(const MatrixType &A) { - // This computes a low-rank pivoted Cholesky decomposition. - // Unlike the normal dense LDLT and friends, we do not want to - // copy the potentially quite large A. Unlike the CG solver, we - // do not want to retain any reference to A's data once we have - // finished this function. m_rows = A.rows(); m_cols = A.cols(); PermutationType transpositions(rows()); @@ -64,141 +82,98 @@ template class PartialCholesky { MatrixType L{MatrixType::Zero(rows(), max_rank)}; // A's diagonal; needs to keep getting pivoted, shifted and - // searched at each step + // searched at each step. We track this separately from the rest + // of A because we have to search each time, and for the relevant + // off-diagonal columns of A, we only apply the relevant updates + // we strictly need. VectorXd diag{A.diagonal()}; - // debug - MatrixType Ashadow{A}; - MatrixXd Lshadow{L}; - PermutationType Pshadow{rows()}; - Pshadow.setIdentity(); + const auto calc_error = [&diag](Index k) { + return diag.tail(diag.size() - k).array().sum(); + }; - // Accumulated L column; also gets pivoted and shifted as we - // update, and contains the corrections to all columns of A below - // k. 
- VectorXd L_accum{VectorXd::Zero(rows())}; + RealScalar error = calc_error(0); for (Index k = 0; k < max_rank; ++k) { Index max_index; - diag.tail(max_rank - k).maxCoeff(&max_index); + diag.tail(diag.size() - k).maxCoeff(&max_index); max_index += k; + // std::cout << "step " << k << ": found max element " << diag(max_index) + // << " at position " << max_index - k << " in " + // << diag.tail(diag.size() - k).transpose() << std::endl; if (max_index != k) { - std::cout << "Swapping '" << max_index << "' (" << diag(max_index) - << ") with '" << k << "' (" << diag(k) << ")" << std::endl; transpositions.applyTranspositionOnTheRight(k, max_index); std::swap(diag(k), diag(max_index)); L.row(k).swap(L.row(max_index)); - std::swap(L_accum(k), L_accum(max_index)); - } - - std::cout << "P:\n" << Eigen::MatrixXi(transpositions) << std::endl; - - Index max_index_shadow; - Ashadow.diagonal().tail(max_rank - k).maxCoeff(&max_index_shadow); - max_index_shadow += k; - - if (max_index_shadow != k) { - std::cout << "Shadow: swapping '" << max_index_shadow << "' (" - << Ashadow.diagonal()(max_index_shadow) << ") with '" << k - << "' (" << Ashadow.diagonal()(k) << ")" << std::endl; - Lshadow.row(k).swap(Lshadow.row(max_index_shadow)); - Pshadow.applyTranspositionOnTheRight(k, max_index_shadow); - PermutationType t{rows()}; - t.setIdentity(); - t.applyTranspositionOnTheRight(k, max_index_shadow); - Ashadow = t.transpose() * Ashadow * t; + // std::cout << max_index << " <-> " << k << std::endl; } - std::cout << "Pshadow:\n" << Eigen::MatrixXi(Pshadow) << std::endl; - if (diag(k) <= 0.) { m_info = InvalidInput; - std::cerr << "Invalid value '" << diag(k) - << "' in pivoted cholesky decomp!" << std::endl; return *this; } - std::cout << "L:\n" << L << "\n"; - std::cout << "L_s:\n" << Lshadow << "\n"; - std::cout << "A_s:\n" << Ashadow << "\n"; - // std::cout << "L_accum: " << L_accum.transpose() << "\n"; - std::cout << " diag: " << diag.transpose() << '\n'; - const RealScalar alpha = std::sqrt(diag(k)); L(k, k) = alpha; - Lshadow(k, k) = std::sqrt(Ashadow.diagonal()(k)); - - std::cout << "alpha: " << alpha << std::endl; - std::cout << "shadow alpha: " << Lshadow(k, k) << std::endl; const Index tail_size = rows() - k - 1; - std::cout << "tail_size: " << tail_size << std::endl; - if (tail_size < 1) { break; } + // Everything below here should be ordered appropriately -- we - // pivot `diag` and `L_accum` and the rows of `L` every time we do an - // update - const VectorXd Acol = + // pivot `diag` and the rows of `L` every time we do an update + VectorXd b = ((transpositions.transpose() * A.col(transpositions.indices()(k)))) .tail(tail_size); - const VectorXd Acol_shadow = Ashadow.col(k).tail(tail_size); - std::cout << " Acol: " << Acol.transpose() << std::endl; - std::cout << "Acol_s: " << Acol_shadow.transpose() << std::endl; - std::cout << " diff: " << (Acol - Acol_shadow).transpose() << std::endl; - - VectorXd b = Acol; - // if (k > 0) { - // b -= L.col(k - 1).tail(tail_size) * L(k, k - 1); - // } + + // I couldn't find this derived anywhere -- basically what + // happens here is that for the lower-right submatrix below + // diagonal element k of the pivoted input matrix, we have to + // update it with b_i b_i^t / a_i = l_i l_i^t where a_i = + // alpha_i^2 = diagonal element k, _for each preceding pivot + // column i_ below the current one. Of course we are modifying + // the whole input matrix in place, and we only care about the + // relevant column below the pivot we just chose. 
The + // successive updates to this column A_k,k+1:n are l_i * l_i[k] + // -- the columns of the bottom-left submatrix of L below k, + // each column scaled by the element just above it (in row k) + // respectively. for (Index i = 0; i < k; ++i) { - std::cout << "delta b(" << i - << "): " << L.col(i).tail(tail_size).transpose() << " * " - << L(k, i) << " = " - << L.col(i).tail(tail_size).transpose() * L(k, i) - << std::endl; b -= L.col(i).tail(tail_size) * L(k, i); - } // + L_accum.tail(tail_size); - std::cout << " b: " << b.transpose() << std::endl; + } L.col(k).tail(tail_size) = b / alpha; diag.tail(tail_size) -= L.col(k).tail(tail_size).array().square().matrix(); - L_accum.tail(tail_size) -= Acol * Acol(0) / (alpha * alpha); - - Lshadow.col(k).tail(tail_size) = - Acol_shadow / std::sqrt(Ashadow.diagonal()(k)); - std::cout << "shadow bb^t / alpha:\n" - << 1 / (alpha * alpha) * Acol_shadow * Acol_shadow.transpose() - << std::endl; - Ashadow.bottomRightCorner(tail_size, tail_size) -= - 1 / (alpha * alpha) * Acol_shadow * Acol_shadow.transpose(); - - std::cout << "L:\n" << L << "\n"; - std::cout << "L_s:\n" << Lshadow << "\n"; - std::cout << "A_s:\n" << Ashadow << "\n"; - // std::cout << "L_accum: " << L_accum.transpose() << "\n"; - std::cout << " diag: " << diag.transpose() << '\n'; - std::cout << "========" << std::endl; + + for (Index i = 0; i < k; ++i) { + assert(L(i, i) >= L(i + 1, i + 1) && "failure in ordering invariant!"); + } + + assert(calc_error(k + 1) < error && "failure in convergence criterion!"); + error = calc_error(k + 1); + + // std::cout << "step " << k + // << ": error = " << diag.tail(diag.size() - k).array().sum() + // << std::endl; } - m_transpositions = transpositions; - // std::cout << MatrixXi(m_transpositions) << std::endl; + m_error = diag.tail(diag.size() - max_rank).array().sum(); - m_L = L; - // std::cout << L << std::endl; + m_nugget = std::sqrt(A.diagonal().minCoeff()); - std::cout << MatrixXd(transpositions * L * L.transpose() * - transpositions.transpose()) - << std::endl; + m_transpositions = transpositions; - std::cout << MatrixXd(Pshadow * Lshadow * Lshadow.transpose() * - Pshadow.transpose()) - << std::endl; + m_L = L; + // We decompose before returning to save time on repeated solves. + // + // Arguably we could pre-apply the outer terms of Woodbury, but + // computing that full matrix would significantly increase our + // storage requirements in the typical case where k << n. 
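+  // For reference, the identity behind solve() below (a sketch via
+  // the usual Woodbury formula): with nugget s and the pivoted
+  // low-rank factor P L L^T P^T,
+  //   (s^2 I + P L L^T P^T)^-1
+  //     = s^-2 I - s^-4 P L (I + s^-2 L^T L)^-1 L^T P^T,
+  // so the only dense factorisation required is of the small
+  // (k x k) matrix I + s^-2 L^T L formed here.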
m_decomp = LDLT(MatrixXd::Identity(L.cols(), L.cols()) + 1 / (m_nugget * m_nugget) * L.transpose() * L); @@ -206,49 +181,61 @@ template class PartialCholesky { return *this; } + template + Matrix solve(const Rhs &b) const { + assert(finished() && + "Please don't call 'solve()' on an unintialised decomposition!"); + const double n2 = m_nugget * m_nugget; + Matrix ret = + 1 / n2 * b - 1 / (n2 * n2) * + (m_transpositions * m_L * + m_decomp.solve(m_L.transpose() * + m_transpositions.transpose() * b)); + return ret; + } + MatrixXd matrixL() const { assert(finished() && - "Please don't call this on an uninitialised decomposition!"); + "Please don't call 'matrixL()' on an uninitialised decomposition!"); return m_L; } PermutationType permutationsP() const { - assert(finished() && - "Please don't call this on an uninitialised decomposition!"); + assert(finished() && "Please don't call 'permutationsP()' on an " + "uninitialised decomposition!"); return m_transpositions; } - template - Matrix solve(const Rhs &b) const { - assert(finished() && - "Please don't call this on an unintialised decomposition!"); - const double n2 = m_nugget * m_nugget; - std::cout << 1 / n2 * b << std::endl; - std::cout << m_decomp.solve(m_L.transpose() * b) << std::endl; - Matrix ret = - 1 / n2 * b - - 1 / (n2 * n2) * - (m_transpositions * m_L * - m_decomp.solve(m_L.transpose() * m_transpositions.transpose() * b)); - return ret; - } - inline bool finished() const { return rows() > 0 && cols() > 0 & info() == Success; } + inline MatrixType reconstructedMatrix() const { + assert(finished() && "Please don't call 'reconstructedMatrix()' on an " + "unintialised decomposition!"); + return MatrixType(permutationsP() * matrixL() * matrixL().transpose() * + permutationsP().transpose()); + } + inline Index rows() const { return m_rows; } inline Index cols() const { return m_cols; } ComputationInfo info() const { return m_info; } + RealScalar error() const { + assert(finished() && + "Please don't call 'error()' on an unintialised decomposition!"); + return m_error; + } + private: StorageIndex m_rows{0}; StorageIndex m_cols{0}; Index m_order{cDefaultOrder}; RealScalar m_nugget{cDefaultNugget}; + RealScalar m_error{0}; ComputationInfo m_info{Success}; MatrixType m_L{}; LDLT m_decomp{}; diff --git a/tests/test_cg_gp.cc b/tests/test_cg_gp.cc index dea90a74..9c15c45b 100644 --- a/tests/test_cg_gp.cc +++ b/tests/test_cg_gp.cc @@ -58,7 +58,9 @@ TEST(TestConjugateGradientGP, TestMean) { CovFunc covariance(1, 1); auto dataset = make_toy_linear_data(5, 1, 1.e-3, 5000); auto direct = gp_from_covariance(covariance, "direct"); - auto cg = cg_gp_from_covariance(covariance, "cg"); + auto cg = cg_gp_from_covariance(covariance, "cg", IterativeSolverOptions{}, + Eigen::PartialCholesky{20, 1.e-3}); + // auto cg = cg_gp_from_covariance(covariance, "cg"); auto begin = std::chrono::steady_clock::now(); auto direct_fit = direct.fit(dataset); diff --git a/tests/test_partial_cholesky.cc b/tests/test_partial_cholesky.cc index 0f9e3eac..44b9feb7 100644 --- a/tests/test_partial_cholesky.cc +++ b/tests/test_partial_cholesky.cc @@ -24,49 +24,359 @@ TEST(PartialCholesky, Construct) { EXPECT_EQ(Eigen::Success, p.info()); } -static constexpr Eigen::Index cExampleSize = 4; +static constexpr const std::size_t cDefaultSeed = 22; +static constexpr const Eigen::Index cExampleSize = 10; + +static std::gamma_distribution cEigenvalueDistribution(2, 2); TEST(PartialCholesky, Compute) { Eigen::PartialCholesky p; - EXPECT_EQ(Eigen::Success, p.info()); + 
ASSERT_EQ(Eigen::Success, p.info()); - std::default_random_engine gen{22}; - const auto m = random_covariance_matrix(cExampleSize, gen); + std::default_random_engine gen{cDefaultSeed}; + const auto m = + random_covariance_matrix(cExampleSize, cEigenvalueDistribution, gen); p.compute(m); - std::cout << "A:\n" << m << std::endl; ASSERT_EQ(Eigen::Success, p.info()); - Eigen::MatrixXd L = p.matrixL(); - Eigen::PartialCholesky::PermutationType P = p.permutationsP(); - - Eigen::MatrixXd m_reconstructed{P * L * L.transpose() * P.transpose()}; - EXPECT_LT((m_reconstructed - m).norm(), 1.e-9) << m_reconstructed - m; + EXPECT_LT((p.reconstructedMatrix() - m).norm(), 1.e-9) + << p.reconstructedMatrix() - m; } TEST(PartialCholesky, Solve) { Eigen::PartialCholesky p; ASSERT_EQ(Eigen::Success, p.info()); - std::default_random_engine gen{22}; - const auto m = random_covariance_matrix(cExampleSize, gen); - std::cout << m << std::endl; + std::default_random_engine gen{cDefaultSeed}; + const auto m = + random_covariance_matrix(cExampleSize, cEigenvalueDistribution, gen); const Eigen::VectorXd b{Eigen::VectorXd::NullaryExpr(cExampleSize, [&gen]() { return std::normal_distribution(0, 1)(gen); })}; p.compute(m); + ASSERT_EQ(Eigen::Success, p.info()); + + const Eigen::VectorXd x = p.solve(b); + ASSERT_EQ(Eigen::Success, p.info()); const Eigen::VectorXd x_llt = m.ldlt().solve(b); - std::cout << "x_llt: " << x_llt.transpose() << std::endl; + EXPECT_LT((x - x_llt).norm(), p.nugget()); +} +TEST(PartialCholesky, SolveMatrix) { + Eigen::PartialCholesky p; + ASSERT_EQ(Eigen::Success, p.info()); + + std::default_random_engine gen{cDefaultSeed}; + const auto m = + random_covariance_matrix(cExampleSize, cEigenvalueDistribution, gen); + const Eigen::MatrixXd b{ + Eigen::MatrixXd::NullaryExpr(cExampleSize, cExampleSize, [&gen]() { + return std::normal_distribution(0, 1)(gen); + })}; + + p.compute(m); ASSERT_EQ(Eigen::Success, p.info()); + const Eigen::MatrixXd x = p.solve(b); + ASSERT_EQ(Eigen::Success, p.info()); + + const Eigen::MatrixXd x_llt = m.ldlt().solve(b); + EXPECT_LT((x - x_llt).norm(), 10 * p.nugget()); +} + +static constexpr const std::size_t cNumRandomExamples = 222; +static constexpr const std::size_t cMaxDecompositionOrder = 30; + +TEST(PartialCholesky, RandomCompleteProblems) { + std::default_random_engine gen{cDefaultSeed}; + std::uniform_int_distribution decomp_order_dist( + 1, cMaxDecompositionOrder); + + for (std::size_t i = 0; i < cNumRandomExamples; ++i) { + const Eigen::Index decomp_order{decomp_order_dist(gen)}; + // Generate matrices small enough that we always do a complete + // Cholesky factorisation. 
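+    // (With problem_size <= decomp_order the pivoted factorisation
+    // runs to completion, so P L L^T P^T should reproduce A up to
+    // roundoff and solve() should agree with a dense LDLT -- which
+    // is exactly what the expectations below check.)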
+ std::uniform_int_distribution problem_size_dist(1, + decomp_order); + const Eigen::Index problem_size{problem_size_dist(gen)}; + const auto m = + random_covariance_matrix(problem_size, cEigenvalueDistribution, gen); + const Eigen::VectorXd b{ + Eigen::VectorXd::NullaryExpr(problem_size, [&gen]() { + return std::normal_distribution(0, 1)(gen); + })}; + + Eigen::PartialCholesky p; + ASSERT_EQ(Eigen::Success, p.info()); + p.setOrder(decomp_order); + + p.compute(m); + ASSERT_EQ(Eigen::Success, p.info()); + + EXPECT_LT((p.reconstructedMatrix() - m).norm(), 1.e-9) + << p.reconstructedMatrix() - m << "\neigs:\n" + << Eigen::SelfAdjointEigenSolver(m) + .eigenvalues() + .transpose(); + + const Eigen::VectorXd x = p.solve(b); + ASSERT_EQ(Eigen::Success, p.info()); + + const Eigen::VectorXd x_llt = m.ldlt().solve(b); + // A cleverer implementation would derive the nugget size from the + // eigenvalues of the original covariance rather than add a fudge + // factor. + EXPECT_LT((x - x_llt).norm(), p.nugget() * 10) + << "\neigs:\n" + << Eigen::SelfAdjointEigenSolver(m) + .eigenvalues() + .transpose(); + } +} + +namespace { + +Eigen::VectorXd spd_eigs(const Eigen::MatrixXd &m) { + return Eigen::SelfAdjointEigenSolver(m).eigenvalues(); +} + +double condition_number(const Eigen::MatrixXd &m) { + Eigen::VectorXd eigs{spd_eigs(m)}; + return eigs.array().abs().maxCoeff() / eigs.array().abs().minCoeff(); +} + +} // namespace + +TEST(PartialCholesky, IncreasingRank) { + std::default_random_engine gen{cDefaultSeed}; + const Eigen::MatrixXd m = + random_covariance_matrix(cExampleSize, cEigenvalueDistribution, gen); + const Eigen::VectorXd b{Eigen::VectorXd::NullaryExpr(cExampleSize, [&gen]() { + return std::normal_distribution(0, 1)(gen); + })}; + + std::vector> decomps(cExampleSize); + + decomps[0].setOrder(1); + // decomps[0].setNugget(std::sqrt(m.diagonal().minCoeff())); + decomps[0].compute(m); + + const auto triangle = [](Eigen::Index index, + const auto &a) -> Eigen::MatrixXd { + return a.matrixL() + .topLeftCorner(index, index) + .template triangularView(); + }; + + const auto triangle_compare = + [&decomps, &triangle](Eigen::Index index) -> Eigen::MatrixXd { + return triangle(index, decomps[index - 1]) - + triangle(index, decomps[index]); + }; + + const auto bottom_left = [](Eigen::Index index, + const auto &a) -> Eigen::MatrixXd { + return (a.permutationsP() * a.matrixL()) + .bottomLeftCorner(a.cols() - index, index); + }; + + const auto ordered_bottom_left_compare = + [&decomps, &bottom_left](Eigen::Index index) -> Eigen::MatrixXd { + return bottom_left(index, decomps[index - 1]) - + bottom_left(index, decomps[index]); + }; + + const auto reconstruction_error = [&m](const auto &a) -> Eigen::MatrixXd { + return a.reconstructedMatrix() - m; + }; + + const auto preconditioned_condition = [&m](const auto &a) { + return condition_number(a.solve(m)); + }; + + const auto preconditioned_eigs = [&m](const auto &a) { + return spd_eigs(a.solve(m)); + }; + + for (Eigen::Index k = 1; k < cExampleSize; ++k) { + const Eigen::Index rank = k + 1; + decomps[k].setOrder(rank); + // decomps[k].setNugget(std::sqrt(m.diagonal().minCoeff())); + decomps[k].compute(m); + ASSERT_EQ(decomps[k].info(), Eigen::Success); + // The top left triangle should be the same between successive + // low-rank approximations + EXPECT_LT(triangle_compare(k).norm(), 1.e-9) + << "k = " << k << "; " << triangle(k, decomps[k - 1]) << "\n" + << triangle(k, decomps[k]); + // The bottom left block below the top triangle corresponds to the + // pivot 
TEST(PartialCholesky, IncreasingRank) {
  std::default_random_engine gen{cDefaultSeed};
  const Eigen::MatrixXd m =
      random_covariance_matrix(cExampleSize, cEigenvalueDistribution, gen);
  const Eigen::VectorXd b{Eigen::VectorXd::NullaryExpr(cExampleSize, [&gen]() {
    return std::normal_distribution<double>(0, 1)(gen);
  })};

  std::vector<Eigen::PartialCholesky<Eigen::MatrixXd>> decomps(cExampleSize);

  decomps[0].setOrder(1);
  // decomps[0].setNugget(std::sqrt(m.diagonal().minCoeff()));
  decomps[0].compute(m);

  const auto triangle = [](Eigen::Index index,
                           const auto &a) -> Eigen::MatrixXd {
    return a.matrixL()
        .topLeftCorner(index, index)
        .template triangularView<Eigen::Lower>();
  };

  const auto triangle_compare =
      [&decomps, &triangle](Eigen::Index index) -> Eigen::MatrixXd {
    return triangle(index, decomps[index - 1]) -
           triangle(index, decomps[index]);
  };

  const auto bottom_left = [](Eigen::Index index,
                              const auto &a) -> Eigen::MatrixXd {
    return (a.permutationsP() * a.matrixL())
        .bottomLeftCorner(a.cols() - index, index);
  };

  const auto ordered_bottom_left_compare =
      [&decomps, &bottom_left](Eigen::Index index) -> Eigen::MatrixXd {
    return bottom_left(index, decomps[index - 1]) -
           bottom_left(index, decomps[index]);
  };

  const auto reconstruction_error = [&m](const auto &a) -> Eigen::MatrixXd {
    return a.reconstructedMatrix() - m;
  };

  const auto preconditioned_condition = [&m](const auto &a) {
    return condition_number(a.solve(m));
  };

  const auto preconditioned_eigs = [&m](const auto &a) {
    return spd_eigs(a.solve(m));
  };

  for (Eigen::Index k = 1; k < cExampleSize; ++k) {
    const Eigen::Index rank = k + 1;
    decomps[k].setOrder(rank);
    // decomps[k].setNugget(std::sqrt(m.diagonal().minCoeff()));
    decomps[k].compute(m);
    ASSERT_EQ(decomps[k].info(), Eigen::Success);
    // The top left triangle should be the same between successive
    // low-rank approximations (see the pivoted-Cholesky sketch after
    // this test)
    EXPECT_LT(triangle_compare(k).norm(), 1.e-9)
        << "k = " << k << "; " << triangle(k, decomps[k - 1]) << "\n"
        << triangle(k, decomps[k]);
    // The bottom left block below the top triangle corresponds to the
    // pivot / non-pivot cross-correlation block and should be the
    // same up to a permutation.
    EXPECT_LT(ordered_bottom_left_compare(k).norm(), 1.e-9)
        << "k = " << k << "; " << bottom_left(k, decomps[k - 1]) << "\n"
        << bottom_left(k, decomps[k]);
    // The trace of the leftover Schur complement (the error()
    // statistic) should decrease with increasing approximation rank
    EXPECT_LT(decomps[k].error(), decomps[k - 1].error()) << "k = " << k;
    // The reconstructed matrix should get closer and closer to the
    // true matrix as we increase the approximation rank
    EXPECT_LT(reconstruction_error(decomps[k]).norm(),
              reconstruction_error(decomps[k - 1]).norm())
        << "k = " << k;
    // The whole point of this decomposition is that preconditioning
    // by it should improve the condition number of the original
    // problem
    EXPECT_LT(preconditioned_condition(decomps[k]),
              preconditioned_condition(decomps[k - 1]))
        << "k = " << k << "\n m eigs: " << spd_eigs(m).transpose()
        << "\n mhat eigs: "
        << spd_eigs(decomps[k].reconstructedMatrix()).transpose()
        << "\n k eigs: " << preconditioned_eigs(decomps[k]).transpose()
        << "\nk - 1 eigs: " << preconditioned_eigs(decomps[k - 1]).transpose();
  }
}
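// Why the nesting assertions above hold: a pivoted partial Cholesky greedily
// picks the largest remaining diagonal entry, appends one column to the
// factor, and downdates the residual, so the first k columns do not depend
// on the total order requested. A minimal sketch of that loop in plain Eigen
// (assumes <cmath> and an SPD input with positive remaining diagonal; this
// mirrors the idea, not necessarily albatross's exact implementation):
namespace {

// Returns an n x order factor L with A approximately equal to L * L^T.
Eigen::MatrixXd pivoted_partial_cholesky_sketch(Eigen::MatrixXd a,
                                                Eigen::Index order) {
  Eigen::MatrixXd l = Eigen::MatrixXd::Zero(a.rows(), order);
  for (Eigen::Index k = 0; k < order; ++k) {
    Eigen::Index pivot;
    a.diagonal().maxCoeff(&pivot);         // greedy: largest residual pivot
    l.col(k) = a.col(pivot) / std::sqrt(a(pivot, pivot));
    a -= l.col(k) * l.col(k).transpose();  // Schur complement downdate
  }
  return l;
}

} // namespace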
TEST(PartialCholesky, Approximate) {
  std::default_random_engine gen{cDefaultSeed};
  const Eigen::MatrixXd m =
      random_covariance_matrix(cExampleSize, cEigenvalueDistribution, gen);
  const Eigen::VectorXd b{Eigen::VectorXd::NullaryExpr(cExampleSize, [&gen]() {
    return std::normal_distribution<double>(0, 1)(gen);
  })};

  Eigen::PartialCholesky<Eigen::MatrixXd> p;
  ASSERT_EQ(Eigen::Success, p.info());
  p.setOrder(2);
  p.compute(m);
  ASSERT_EQ(Eigen::Success, p.info());
  const Eigen::MatrixXd L{p.matrixL()};
  for (Eigen::Index i = 1; i < L.cols(); ++i) {
    EXPECT_LT(L(i, i), L(i - 1, i - 1)) << L.diagonal().transpose();
  }
  const Eigen::VectorXd x = p.solve(b);
-  EXPECT_EQ(Eigen::Success, p.info());
-  std::cout << " x: " << x.transpose() << std::endl;
-  EXPECT_LT((x - x_llt).norm(), p.nugget());
+  ASSERT_EQ(Eigen::Success, p.info());
+  Eigen::MatrixXd preconditioned{p.solve(m)};
+  Eigen::SelfAdjointEigenSolver<Eigen::MatrixXd> preeigs(preconditioned);
+  std::cout << "A:\n" << m << std::endl;
+  std::cout << "reconstructed:\n" << p.reconstructedMatrix() << std::endl;
+  std::cout << "error: " << p.error() << std::endl;
+  std::cout << "diff:\n" << m - p.reconstructedMatrix() << std::endl;
+  std::cout << "L:\n" << p.matrixL() << std::endl;
+  std::cout << "P:\n" << Eigen::MatrixXi(p.permutationsP()) << std::endl;
+  std::cout << m * x - b << std::endl;
+  std::cout << m * (p.reconstructedMatrix().ldlt().solve(b)) - b << std::endl;
+  std::cout << "Aapprox^-1 A:\n" << preconditioned << std::endl;
+  Eigen::SelfAdjointEigenSolver<Eigen::MatrixXd> eigs(m);
+  std::cout << "A eigs: " << eigs.eigenvalues().transpose() << std::endl;
+  std::cout << "Aapprox^-1 A eigs: " << preeigs.eigenvalues().transpose()
+            << std::endl;
+  Eigen::PartialCholesky<Eigen::MatrixXd> p3;
+  p3.setOrder(3);
+  p3.compute(m);
+  std::cout << "L:\n" << p3.matrixL() << std::endl;
+  std::cout << "P:\n" << Eigen::MatrixXi(p3.permutationsP()) << std::endl;
}
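// The two tests below plug Eigen::PartialCholesky into the third template
// slot of Eigen::ConjugateGradient. For reference, the interface Eigen's
// iterative solvers expect of a preconditioner, modelled on Eigen 3.4's own
// IdentityPreconditioner (the class name here is hypothetical; this sketch
// just passes residuals through unchanged):
namespace {

class IdentityPreconditionerSketch {
public:
  IdentityPreconditionerSketch() {}
  template <typename MatrixType>
  explicit IdentityPreconditionerSketch(const MatrixType &) {}
  template <typename MatrixType>
  IdentityPreconditionerSketch &analyzePattern(const MatrixType &) {
    return *this;
  }
  template <typename MatrixType>
  IdentityPreconditionerSketch &factorize(const MatrixType &) {
    return *this;
  }
  template <typename MatrixType>
  IdentityPreconditionerSketch &compute(const MatrixType &) {
    return *this;
  }
  // Apply M^{-1} to the residual; the identity is a no-op.
  template <typename Rhs> const Rhs &solve(const Rhs &b) const { return b; }
  Eigen::ComputationInfo info() const { return Eigen::Success; }
};

} // namespace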
TEST(PartialCholesky, Precondition) {
  std::default_random_engine gen{cDefaultSeed};
  const auto m =
      random_covariance_matrix(cExampleSize, cEigenvalueDistribution, gen);
  const Eigen::VectorXd b{Eigen::VectorXd::NullaryExpr(cExampleSize, [&gen]() {
    return std::normal_distribution<double>(0, 1)(gen);
  })};

  Eigen::ConjugateGradient<Eigen::MatrixXd, Eigen::Lower | Eigen::Upper,
                           Eigen::PartialCholesky<Eigen::MatrixXd>>
      solver(m);
  solver.preconditioner().setOrder(cExampleSize / 4);

  const Eigen::VectorXd x = solver.solve(b);
  EXPECT_EQ(solver.info(), Eigen::Success);
  EXPECT_LT((m * x - b).norm(), 1.e-9);

  Eigen::ConjugateGradient<Eigen::MatrixXd, Eigen::Lower | Eigen::Upper>
      solver0(m);

  const Eigen::VectorXd x0 = solver0.solve(b);
  EXPECT_EQ(solver0.info(), Eigen::Success);
  EXPECT_LT(solver.iterations(), solver0.iterations());
}
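// A caution on the "Geom mean" statistics printed at the end of the next
// test: they accumulate arithmetic sums of per-problem ratios and then raise
// the sum to a fractional power, which is not a geometric mean. A
// conventional formulation averages logs instead. Minimal sketch, assuming
// <cmath> and <vector> and a non-empty input; `geometric_mean` is a
// hypothetical helper, not library API:
namespace {

double geometric_mean(const std::vector<double> &ratios) {
  double log_sum = 0;
  for (const double r : ratios) {
    log_sum += std::log(r);
  }
  return std::exp(log_sum / static_cast<double>(ratios.size()));
}

} // namespace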
static constexpr const Eigen::Index cMaxProblemSize = 200;

TEST(PartialCholesky, PreconditionRandomProblems) {
  std::default_random_engine gen{cDefaultSeed};
  std::uniform_int_distribution<Eigen::Index> problem_size_dist(
      cMaxProblemSize / 10, cMaxProblemSize);
  std::size_t fail = 0;
  std::size_t condfail = 0;
  double reduction = 0;
  double dcond = 0;
  for (std::size_t i = 0; i < cNumRandomExamples; ++i) {
    const Eigen::Index problem_size{problem_size_dist(gen)};
    const auto m = random_covariance_matrix(problem_size, gen);
    const Eigen::VectorXd b{
        Eigen::VectorXd::NullaryExpr(problem_size, [&gen]() {
          return std::normal_distribution<double>(0, 1)(gen);
        })};

    Eigen::ConjugateGradient<Eigen::MatrixXd, Eigen::Lower | Eigen::Upper,
                             Eigen::PartialCholesky<Eigen::MatrixXd>>
        solver(m);
    EXPECT_EQ(solver.info(), Eigen::Success)
        << "Preconditioned solver failed to decompose";
    solver.preconditioner().setOrder(
        std::max(problem_size / 20, Eigen::Index{10}));

    const Eigen::VectorXd x = solver.solve(b);
    EXPECT_EQ(solver.info(), Eigen::Success)
        << "Preconditioned solver failed to solve";
    EXPECT_LT((m * x - b).norm(), 1.e-9);

    Eigen::ConjugateGradient<Eigen::MatrixXd, Eigen::Lower | Eigen::Upper>
        solver0(m);
    EXPECT_EQ(solver0.info(), Eigen::Success)
        << "Default solver failed to decompose";
    const Eigen::VectorXd x0 = solver0.solve(b);
    EXPECT_EQ(solver0.info(), Eigen::Success)
        << "Default solver failed to solve";
    const auto cond0 = condition_number(m);
    EXPECT_LE(solver.iterations(), solver0.iterations())
        << "Problem size: " << problem_size << "; cond " << cond0;

    const auto condp = condition_number(solver.preconditioner().solve(m));

    EXPECT_LE(condp, cond0)
        << "Problem size: " << problem_size
        << "; cond: " << std::setprecision(5) << cond0
        << "; preconditioned: " << condp << "; damage: " << condp / cond0;

    // std::cout << i << ": cond " << cond0 << " -> " << condp << " = "
    //           << condp / cond0 << std::endl;
    if (solver.iterations() > solver0.iterations()) {
      fail++;
    }
    if (condp > cond0) {
      condfail++;
    }
    dcond += condp / cond0;
    reduction += static_cast<double>(solver.iterations()) /
                 static_cast<double>(solver0.iterations());
  }

  std::cout << "More iterations on " << fail << " of " << cNumRandomExamples << " problems."
            << std::endl;
  std::cout << "Worse conditioning on " << condfail << " of "
            << cNumRandomExamples << " problems." << std::endl;
  reduction =
      std::pow(reduction, 1 / static_cast<double>(cNumRandomExamples - fail));
  std::cout << "Geom mean iteration reduction: " << reduction << std::endl;
  dcond = std::pow(dcond, 1 / static_cast<double>(cNumRandomExamples));
  std::cout << "Geom mean condition reduction: " << dcond << std::endl;
}

} // namespace albatross
\ No newline at end of file

From 1cc1b934932e2e4a64dfcc4229f217f5323a79a0 Mon Sep 17 00:00:00 2001
From: Matt Peddie
Date: Thu, 24 Apr 2025 13:59:40 +1000
Subject: [PATCH 5/6] More work on partial cholesky

---
 .../albatross/src/eigen/partial_cholesky.hpp |  45 ++++-
 tests/test_partial_cholesky.cc               | 189 ++++++++++++------
 2 files changed, 162 insertions(+), 72 deletions(-)

diff --git a/include/albatross/src/eigen/partial_cholesky.hpp b/include/albatross/src/eigen/partial_cholesky.hpp
index e24b7f62..8b2750ab 100644
--- a/include/albatross/src/eigen/partial_cholesky.hpp
+++ b/include/albatross/src/eigen/partial_cholesky.hpp
@@ -36,7 +36,7 @@ template <typename MatrixType> class PartialCholesky {
 
   static constexpr const Index cDefaultOrder = 22;
-  static constexpr const double cDefaultNugget = 1.e-3;
+  static constexpr const double cDefaultNugget = 1.e-2;
 
   PartialCholesky() {}
 
@@ -163,7 +163,7 @@ template <typename MatrixType> class PartialCholesky {
 
     m_error = diag.tail(diag.size() - max_rank).array().sum();
 
-    m_nugget = std::sqrt(A.diagonal().minCoeff());
+    // m_nugget = std::sqrt(A.diagonal().minCoeff());
 
     m_transpositions = transpositions;
 
@@ -177,6 +177,21 @@ template <typename MatrixType> class PartialCholesky {
     m_decomp = LDLT<MatrixXd>(MatrixXd::Identity(L.cols(), L.cols()) +
                               1 / (m_nugget * m_nugget) * L.transpose() * L);
 
+    MatrixXd Ltall(L.rows() + max_rank, L.cols());
+    Ltall.topRows(L.rows()) = transpositions * L;
+    Ltall.bottomRows(max_rank) =
+        MatrixXd::Identity(max_rank, max_rank) * m_nugget;
+
+    // std::cout << "Ltall (" << Ltall.rows() << "x" << Ltall.cols() << "):\n"
+    //           << Ltall << std::endl;
+    m_qr = HouseholderQR<MatrixXd>(Ltall);
+    MatrixXd thin_Q =
+        m_qr.householderQ() * MatrixXd::Identity(m_qr.rows(), m_L.cols());
+    // std::cout << "thin_Q (" << thin_Q.rows() << "x" << thin_Q.cols()
+    //           << "):\n" << thin_Q << std::endl;
+    m_Q = thin_Q.topRows(rows());
+    // std::cout << "m_Q (" << m_Q.rows() << "x" << m_Q.cols() << "):\n"
+    //           << m_Q << std::endl;
+
     m_info = Success;
     return *this;
   }
@@ -186,14 +201,30 @@ template <typename MatrixType> class PartialCholesky {
     assert(finished() &&
            "Please don't call 'solve()' on an uninitialised decomposition!");
     const double n2 = m_nugget * m_nugget;
+
+    // std::cout << "Q^T b:\n" << MatrixXd(m_Q.transpose() * b) << std::endl;
+    // std::cout << "Q Q^T b:\n" << MatrixXd(m_Q * (m_Q.transpose() * b))
+    //           << std::endl;
+    // std::cout << "b - Q Q^T b:\n"
+    //           << MatrixXd(b - m_Q * (m_Q.transpose() * b)) << std::endl;
+
     Matrix ret =
-        1 / n2 * b - 1 / (n2 * n2) *
-        (m_transpositions * m_L *
-         m_decomp.solve(m_L.transpose() *
-                        m_transpositions.transpose() * b));
+        1 / n2 * (b - m_Q * (m_Q.transpose() * b));
+    // Matrix ret =
+    //     1 / n2 *
+    //     (b - (m_transpositions * m_L *
+    //           m_decomp.solve(m_L.transpose() * m_transpositions.transpose() *
+    //                          b / n2)));
     return ret;
   }
 
+  LDLT<MatrixXd> direct_solve() const {
+    assert(finished() && "Please don't call 'direct_solve()' on an "
+                         "uninitialised decomposition!");
+    return LDLT<MatrixXd>(permutationsP() * matrixL() * matrixL().transpose() *
+                              permutationsP().transpose() +
+                          MatrixXd::Identity(rows(), cols()) * nugget() *
+                              nugget());
+  }
+
   MatrixXd matrixL() const {
     assert(finished() &&
            "Please don't call 'matrixL()' on an uninitialised decomposition!");
@@ -239,6 +270,8 @@ template <typename MatrixType> class PartialCholesky {
   ComputationInfo m_info{Success};
   MatrixType m_L{};
   LDLT<MatrixXd> m_decomp{};
+  MatrixXd m_Q{};
+  HouseholderQR<MatrixXd> m_qr{};
   PermutationType m_transpositions{};
 };
 
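// A note on the QR-based solve() in the hunk above: with preconditioner
// matrix M = P L L^T P^T + s^2 I and the tall factor T = [P L; s I] = Q R,
// the top block Q1 of the thin Q satisfies
// Q1 Q1^T = P L (L^T L + s^2 I)^{-1} L^T P^T, so by the Woodbury identity
// M^{-1} b = (b - Q1 (Q1^T b)) / s^2. A self-contained check of that
// identity in plain Eigen (assumes <Eigen/Dense>; all names are local to
// this sketch, not library API):
namespace {

inline Eigen::VectorXd woodbury_apply(const Eigen::MatrixXd &pl, double s,
                                      const Eigen::VectorXd &b) {
  const Eigen::Index n = pl.rows();
  const Eigen::Index k = pl.cols();
  Eigen::MatrixXd tall(n + k, k);
  tall.topRows(n) = pl;
  tall.bottomRows(k) = s * Eigen::MatrixXd::Identity(k, k);
  const Eigen::HouseholderQR<Eigen::MatrixXd> qr(tall);
  const Eigen::MatrixXd q1 =
      (qr.householderQ() * Eigen::MatrixXd::Identity(n + k, k)).topRows(n);
  // Agrees with (pl * pl.transpose() + s * s * I).ldlt().solve(b).
  return (b - q1 * (q1.transpose() * b)) / (s * s);
}

} // namespace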
diff --git a/tests/test_partial_cholesky.cc b/tests/test_partial_cholesky.cc
index 44b9feb7..91da86ea 100644
--- a/tests/test_partial_cholesky.cc
+++ b/tests/test_partial_cholesky.cc
@@ -45,6 +45,16 @@ TEST(PartialCholesky, Compute) {
       << p.reconstructedMatrix() - m;
 }
 
+namespace {
+
+Eigen::MatrixXd add_diagonal(const Eigen::MatrixXd &A, double sigma) {
+  return A +
+         Eigen::MatrixXd(
+             Eigen::VectorXd::Constant(A.rows(), sigma * sigma).asDiagonal());
+}
+
+} // namespace
+
 TEST(PartialCholesky, Solve) {
   Eigen::PartialCholesky<Eigen::MatrixXd> p;
   ASSERT_EQ(Eigen::Success, p.info());
@@ -62,7 +72,7 @@ TEST(PartialCholesky, Solve) {
   const Eigen::VectorXd x = p.solve(b);
   ASSERT_EQ(Eigen::Success, p.info());
 
-  const Eigen::VectorXd x_llt = m.ldlt().solve(b);
+  const Eigen::VectorXd x_llt = add_diagonal(m, p.nugget()).ldlt().solve(b);
   EXPECT_LT((x - x_llt).norm(), p.nugget());
 }
 
@@ -84,8 +94,8 @@ TEST(PartialCholesky, SolveMatrix) {
   const Eigen::MatrixXd x = p.solve(b);
   ASSERT_EQ(Eigen::Success, p.info());
 
-  const Eigen::MatrixXd x_llt = m.ldlt().solve(b);
-  EXPECT_LT((x - x_llt).norm(), 10 * p.nugget());
+  const Eigen::MatrixXd x_llt = add_diagonal(m, p.nugget()).ldlt().solve(b);
+  EXPECT_LT((x - x_llt).norm(), 1.e-9);
 }
 
 static constexpr const std::size_t cNumRandomExamples = 222;
@@ -126,11 +136,16 @@ TEST(PartialCholesky, RandomCompleteProblems) {
   const Eigen::VectorXd x = p.solve(b);
   ASSERT_EQ(Eigen::Success, p.info());
 
-  const Eigen::VectorXd x_llt = m.ldlt().solve(b);
+  const Eigen::VectorXd x_llt =
+      (m + Eigen::MatrixXd(
+               Eigen::VectorXd::Constant(m.rows(), p.nugget() * p.nugget())
+                   .asDiagonal()))
+          .ldlt()
+          .solve(b);
   // A cleverer implementation would derive the nugget size from the
   // eigenvalues of the original covariance rather than add a fudge
   // factor.
-  EXPECT_LT((x - x_llt).norm(), p.nugget() * 10)
+  EXPECT_LT((x - x_llt).norm(), 1.e-8)
       << "\neigs:\n"
       << Eigen::SelfAdjointEigenSolver<Eigen::MatrixXd>(m)
              .eigenvalues()
             .transpose();
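// A sketch of the "cleverer implementation" the comment in the hunk above
// asks for: derive the nugget from the part of the spectrum a rank-limited
// factor discards, e.g. the root of the mean discarded eigenvalue.
// Illustrative only; `nugget_from_spectrum` is a hypothetical helper, and it
// relies on Eigen returning eigenvalues in increasing order (assumes
// <algorithm> and <cmath>):
namespace {

double nugget_from_spectrum(const Eigen::MatrixXd &a, Eigen::Index order) {
  const Eigen::VectorXd eigs =
      Eigen::SelfAdjointEigenSolver<Eigen::MatrixXd>(a).eigenvalues();
  const Eigen::Index discarded = std::max(a.rows() - order, Eigen::Index{1});
  // eigs.head(discarded) holds the smallest eigenvalues, i.e. the energy a
  // rank-'order' approximation cannot capture.
  return std::sqrt(eigs.head(discarded).mean());
}

} // namespace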
<< "\nk - 1 eigs: " << preconditioned_eigs(decomps[k - + // 1]).transpose(); + // if (k == 2) { + // std::cout << "k = 2, rank 3. precond(m_diag):\n" + // << decomps[k].solve(m_diag) << std::endl; + // } } } -TEST(PartialCholesky, Approximate) { - std::default_random_engine gen{cDefaultSeed}; - const Eigen::MatrixXd m = - random_covariance_matrix(cExampleSize, cEigenvalueDistribution, gen); - const Eigen::VectorXd b{Eigen::VectorXd::NullaryExpr(cExampleSize, [&gen]() { - return std::normal_distribution(0, 1)(gen); - })}; - - Eigen::PartialCholesky p; - ASSERT_EQ(Eigen::Success, p.info()); - p.setOrder(2); - p.compute(m); - ASSERT_EQ(Eigen::Success, p.info()); - const Eigen::MatrixXd L{p.matrixL()}; - for (Eigen::Index i = 1; i < L.cols(); ++i) { - EXPECT_LT(L(i, i), L(i - 1, i - 1)) << L.diagonal().transpose(); - } - const Eigen::VectorXd x = p.solve(b); - ASSERT_EQ(Eigen::Success, p.info()); - Eigen::MatrixXd preconditioned{p.solve(m)}; - Eigen::SelfAdjointEigenSolver preeigs(preconditioned); - std::cout << "A:\n" << m << std::endl; - std::cout << "reconstructed:\n" << p.reconstructedMatrix() << std::endl; - std::cout << "error: " << p.error() << std::endl; - std::cout << "diff:\n" << m - p.reconstructedMatrix() << std::endl; - std::cout << "L:\n" << p.matrixL() << std::endl; - std::cout << "P:\n" << Eigen::MatrixXi(p.permutationsP()) << std::endl; - std::cout << m * x - b << std::endl; - std::cout << m * (p.reconstructedMatrix().ldlt().solve(b)) - b << std::endl; - std::cout << "Aapprox^-1 A:\n" << preconditioned << std::endl; - Eigen::SelfAdjointEigenSolver eigs(m); - std::cout << "A eigs: " << eigs.eigenvalues().transpose() << std::endl; - std::cout << "Aapprox^-1 A eigs: " << preeigs.eigenvalues().transpose() - << std::endl; - Eigen::PartialCholesky p3; - p3.setOrder(3); - p3.compute(m); - std::cout << "L:\n" << p3.matrixL() << std::endl; - std::cout << "P:\n" << Eigen::MatrixXi(p3.permutationsP()) << std::endl; -} +// TEST(PartialCholesky, Approximate) { +// std::default_random_engine gen{cDefaultSeed}; +// const Eigen::MatrixXd m = +// random_covariance_matrix(cExampleSize, cEigenvalueDistribution, gen); +// const Eigen::VectorXd b{Eigen::VectorXd::NullaryExpr(cExampleSize, [&gen]() +// { +// return std::normal_distribution(0, 1)(gen); +// })}; + +// Eigen::PartialCholesky p; +// ASSERT_EQ(Eigen::Success, p.info()); +// p.setOrder(2); +// p.compute(m); +// ASSERT_EQ(Eigen::Success, p.info()); +// const Eigen::MatrixXd L{p.matrixL()}; +// for (Eigen::Index i = 1; i < L.cols(); ++i) { +// EXPECT_LT(L(i, i), L(i - 1, i - 1)) << L.diagonal().transpose(); +// } +// const Eigen::VectorXd x = p.solve(b); +// ASSERT_EQ(Eigen::Success, p.info()); +// Eigen::MatrixXd preconditioned{p.solve(m)}; +// Eigen::SelfAdjointEigenSolver preeigs(preconditioned); +// std::cout << "A:\n" << m << std::endl; +// std::cout << "reconstructed:\n" << p.reconstructedMatrix() << std::endl; +// std::cout << "error: " << p.error() << std::endl; +// std::cout << "diff:\n" << m - p.reconstructedMatrix() << std::endl; +// std::cout << "L:\n" << p.matrixL() << std::endl; +// std::cout << "P:\n" << Eigen::MatrixXi(p.permutationsP()) << std::endl; +// std::cout << m * x - b << std::endl; +// std::cout << m * (p.reconstructedMatrix().ldlt().solve(b)) - b << +// std::endl; std::cout << "Aapprox^-1 A:\n" << preconditioned << std::endl; +// Eigen::SelfAdjointEigenSolver eigs(m); +// std::cout << "A eigs: " << eigs.eigenvalues().transpose() << std::endl; +// std::cout << "Aapprox^-1 A eigs: " << 
 TEST(PartialCholesky, Precondition) {
   std::default_random_engine gen{cDefaultSeed};
@@ -305,17 +360,19 @@ TEST(PartialCholesky, Precondition) {
   EXPECT_LT(solver.iterations(), solver0.iterations());
 }
 
-static constexpr const Eigen::Index cMaxProblemSize = 200;
+static constexpr const std::size_t cNumRandomProblems = 20;
+static constexpr const Eigen::Index cMinProblemSize = 100;
+static constexpr const Eigen::Index cMaxProblemSize = 300;
 
 TEST(PartialCholesky, PreconditionRandomProblems) {
   std::default_random_engine gen{cDefaultSeed};
   std::uniform_int_distribution<Eigen::Index> problem_size_dist(
-      cMaxProblemSize / 10, cMaxProblemSize);
+      cMinProblemSize, cMaxProblemSize);
   std::size_t fail = 0;
   std::size_t condfail = 0;
   double reduction = 0;
   double dcond = 0;
-  for (std::size_t i = 0; i < cNumRandomExamples; ++i) {
+  for (std::size_t i = 0; i < cNumRandomProblems; ++i) {
     const Eigen::Index problem_size{problem_size_dist(gen)};
     const auto m = random_covariance_matrix(problem_size, gen);
     const Eigen::VectorXd b{
@@ -329,7 +386,7 @@ TEST(PartialCholesky, PreconditionRandomProblems) {
     EXPECT_EQ(solver.info(), Eigen::Success)
         << "Preconditioned solver failed to decompose";
     solver.preconditioner().setOrder(
-        std::max(problem_size / 20, Eigen::Index{10}));
+        std::max(problem_size / 20, Eigen::Index{20}));
 
     const Eigen::VectorXd x = solver.solve(b);
     EXPECT_EQ(solver.info(), Eigen::Success)
@@ -368,14 +425,14 @@ TEST(PartialCholesky, PreconditionRandomProblems) {
       static_cast<double>(solver0.iterations());
   }
 
-  std::cout << "More iterations on " << fail << " of " << cNumRandomExamples << " problems."
-            << std::endl;
+  std::cout << "More iterations on " << fail << " of " << cNumRandomProblems
+            << " problems." << std::endl;
   std::cout << "Worse conditioning on " << condfail << " of "
-            << cNumRandomExamples << " problems." << std::endl;
-  reduction =
-      std::pow(reduction, 1 / static_cast<double>(cNumRandomExamples - fail));
+            << cNumRandomProblems << " problems." << std::endl;
+  reduction = std::pow(reduction,
+                       2 / static_cast<double>(cNumRandomProblems - fail + 1));
   std::cout << "Geom mean iteration reduction: " << reduction << std::endl;
-  dcond = std::pow(dcond, 1 / static_cast<double>(cNumRandomExamples));
+  dcond = std::pow(dcond, 2 / static_cast<double>(cNumRandomProblems + 1));
   std::cout << "Geom mean condition reduction: " << dcond << std::endl;
 }
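// Context for the final patch below: squared-exponential Gram matrices
// become numerically low-rank, and therefore severely ill-conditioned, as
// the length-scale grows relative to the data spacing, which is plausibly
// why the CG GP test shortens the length-scale and raises the noise floor.
// A standalone illustration in plain Eigen (all names local to this sketch):
#include <Eigen/Dense>
#include <cmath>
#include <iostream>

int main() {
  const int n = 200;
  const double length_scale = 0.5;  // try 5.0 to watch conditioning blow up
  const Eigen::VectorXd xs = Eigen::VectorXd::LinSpaced(n, 0., 5.);
  Eigen::MatrixXd k(n, n);
  for (int i = 0; i < n; ++i) {
    for (int j = 0; j < n; ++j) {
      const double d = (xs[i] - xs[j]) / length_scale;
      k(i, j) = std::exp(-0.5 * d * d);  // squared-exponential kernel
    }
  }
  const Eigen::VectorXd eigs =
      Eigen::SelfAdjointEigenSolver<Eigen::MatrixXd>(k).eigenvalues();
  std::cout << "condition estimate: "
            << eigs.cwiseAbs().maxCoeff() / eigs.cwiseAbs().minCoeff()
            << std::endl;
  return 0;
}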

From cfa0a67226abf00b5e323b3c7c5eb072957e40df Mon Sep 17 00:00:00 2001
From: Matt Peddie
Date: Thu, 24 Apr 2025 14:02:25 +1000
Subject: [PATCH 6/6] Test changes to CG GP

---
 tests/test_cg_gp.cc | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/tests/test_cg_gp.cc b/tests/test_cg_gp.cc
index 9c15c45b..ba1cd68a 100644
--- a/tests/test_cg_gp.cc
+++ b/tests/test_cg_gp.cc
@@ -55,12 +55,12 @@ void describe_fit(const FitType &fit, std::ostream &os = std::cout) {
 
 TEST(TestConjugateGradientGP, TestMean) {
   using CovFunc = SquaredExponential<EuclideanDistance>;
-  CovFunc covariance(1, 1);
-  auto dataset = make_toy_linear_data(5, 1, 1.e-3, 5000);
+  CovFunc covariance(0.5, 1);
+  auto dataset = make_toy_linear_data(5, 0.01, 1.e-2, 4000);
   auto direct = gp_from_covariance(covariance, "direct");
-  auto cg = cg_gp_from_covariance(covariance, "cg", IterativeSolverOptions{},
-                                  Eigen::PartialCholesky<Eigen::MatrixXd>{20, 1.e-3});
-  // auto cg = cg_gp_from_covariance(covariance, "cg");
+  // auto cg = cg_gp_from_covariance(covariance, "cg", IterativeSolverOptions{},
+  //                                 Eigen::PartialCholesky<Eigen::MatrixXd>{100, 1.e-1});
+  auto cg = cg_gp_from_covariance(covariance, "cg");
 
   auto begin = std::chrono::steady_clock::now();
   auto direct_fit = direct.fit(dataset);