Compute noise_variance_ in PCA implementation

Previously, `noise_vars` was an output parameter passed to the CUDA PCA implementation, but it was never computed. This adds support for computing `noise_vars` in the CUDA code, and tests that the results are valid by comparing them to the scikit-learn implementation. The previous code always produced a `noise_variance_` of 0, which caused downstream issues when interpreting results after converting a cuML estimator to its sklearn equivalent (e.g. a broken `score_samples`).
rapidsai · Jan 17, 2025 · c4939b6 · c4939b6
1 parent f29293f
commit c4939b6
Show file tree

Hide file tree

Showing 3 changed files with 51 additions and 9 deletions.
diff --git a/cpp/src/pca/pca.cuh b/cpp/src/pca/pca.cuh
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2018-2024, NVIDIA CORPORATION.
+ * Copyright (c) 2018-2025, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -41,6 +41,7 @@ void truncCompExpVars(const raft::handle_t& handle,
                       math_t* components,
                       math_t* explained_var,
                       math_t* explained_var_ratio,
+                      math_t* noise_vars,
                       const paramsTSVDTemplate<enum_solver>& prms,
                       cudaStream_t stream)
 {
@@ -67,6 +68,20 @@ void truncCompExpVars(const raft::handle_t& handle,
                                 prms.n_components,
                                 std::size_t(1),
                                 stream);
+
+  // Compute the scalar noise_vars defined as (pseudocode)
+  // (n_components < min(n_cols, n_rows)) ? explained_var_all[n_components:].mean() : 0
+  if (prms.n_components < prms.n_cols && prms.n_components < prms.n_rows) {
+    raft::stats::mean(noise_vars,
+                      explained_var_all.data() + prms.n_components,
+                      std::size_t{1},
+                      prms.n_cols - prms.n_components,
+                      false,
+                      true,
+                      stream);
+  } else {
+    raft::matrix::setValue(noise_vars, noise_vars, math_t{0}, 1, stream);
+  }
 }
 
 /**
@@ -116,7 +131,7 @@ void pcaFit(const raft::handle_t& handle,
   raft::stats::cov(
     handle, cov.data(), input, mu, prms.n_cols, prms.n_rows, true, false, true, stream);
   truncCompExpVars(
-    handle, cov.data(), components, explained_var, explained_var_ratio, prms, stream);
+    handle, cov.data(), components, explained_var, explained_var_ratio, noise_vars, prms, stream);
 
   math_t scalar = (prms.n_rows - 1);
   raft::matrix::seqRoot(explained_var, singular_vals, scalar, n_components, stream, true);

diff --git a/cpp/src/pca/pca_mg.cu b/cpp/src/pca/pca_mg.cu
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2019-2024, NVIDIA CORPORATION.
+ * Copyright (c) 2019-2025, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -69,7 +69,7 @@ void fit_impl(raft::handle_t& handle,
   Stats::opg::cov(handle, cov, input_data, input_desc, mu_data, true, streams, n_streams);
 
   ML::truncCompExpVars<T, mg_solver>(
-    handle, cov.ptr, components, explained_var, explained_var_ratio, prms, streams[0]);
+    handle, cov.ptr, components, explained_var, explained_var_ratio, noise_vars, prms, streams[0]);
 
   T scalar = (prms.n_rows - 1);
   raft::matrix::seqRoot(explained_var, singular_vals, scalar, prms.n_components, streams[0], true);
@@ -128,9 +128,6 @@ void fit_impl(raft::handle_t& handle,
              streams,
              n_streams,
              verbose);
-    for (std::uint32_t i = 0; i < n_streams; i++) {
-      handle.sync_stream(streams[i]);
-    }
   } else if (prms.algorithm == mg_solver::QR) {
     const raft::handle_t& h = handle;
     cudaStream_t stream     = h.get_stream();
@@ -194,6 +191,20 @@ void fit_impl(raft::handle_t& handle,
                                   std::size_t(1),
                                   stream);
 
+    // Compute the scalar noise_vars defined as (pseudocode)
+    // (n_components < min(n_cols, n_rows)) ? explained_var_all[n_components:].mean() : 0
+    if (prms.n_components < prms.n_cols && prms.n_components < prms.n_rows) {
+      raft::stats::mean(noise_vars,
+                        explained_var_all.data() + prms.n_components,
+                        std::size_t{1},
+                        prms.n_cols - prms.n_components,
+                        false,
+                        true,
+                        stream);
+    } else {
+      raft::matrix::setValue(noise_vars, noise_vars, T{0}, 1, stream);
+    }
+
     raft::linalg::transpose(vMatrix.data(), prms.n_cols, stream);
     raft::matrix::truncZeroOrigin(
       vMatrix.data(), prms.n_cols, components, prms.n_components, prms.n_cols, stream);

diff --git a/python/cuml/cuml/tests/test_pca.py b/python/cuml/cuml/tests/test_pca.py
@@ -1,4 +1,4 @@
-# Copyright (c) 2019-2023, NVIDIA CORPORATION.
+# Copyright (c) 2019-2025, NVIDIA CORPORATION.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
@@ -72,13 +72,13 @@ def test_pca_fit(datatype, input_type, name, use_handle):
         "components_",
         "explained_variance_",
         "explained_variance_ratio_",
+        "noise_variance_",
     ]:
         with_sign = False if attr in ["components_"] else True
         print(attr)
         print(getattr(cupca, attr))
         print(getattr(skpca, attr))
         cuml_res = getattr(cupca, attr)
-
         skl_res = getattr(skpca, attr)
         assert array_equal(cuml_res, skl_res, 1e-3, with_sign=with_sign)
 
@@ -304,6 +304,22 @@ def test_sparse_pca_inputs(nrows, ncols, whiten, return_sparse, cupy_input):
         assert array_equal(i_sparse, X.todense(), 1e-1, with_sign=True)
 
 
+@pytest.mark.parametrize(
+    "n_samples, n_features",
+    [
+        pytest.param(9, 20, id="n_samples <= n_components"),
+        pytest.param(20, 10, id="n_features <= n_components"),
+    ],
+)
+def test_noise_variance_zero(n_samples, n_features):
+    X, _ = make_blobs(
+        n_samples=n_samples, n_features=n_features, random_state=0
+    )
+    cupca = cuPCA(n_components=10)
+    cupca.fit(X)
+    assert cupca.noise_variance_.item() == 0
+
+
 def test_exceptions():
     with pytest.raises(NotFittedError):
         X = cp.random.random((10, 10))