Performance: significant speedup and memory usage improvement for PCA().run() #5352
base: develop
```diff
@@ -238,6 +238,11 @@ class PCA(AnalysisBase):
        manually iterate through ``self._trajectory``, which would
        incorrectly handle cases where the ``frame`` argument
        was passed.
+    .. versionchanged:: 2.11.0
+       Covariance matrix is now computed via BLAS matrix multiply instead of
+       per-frame outer product accumulation, and uses symmetric
+       eigendecomposition (``eigh``) instead of general ``eig``, resulting
+       in significant performance improvements for large systems.
     """

     _analysis_algorithm_is_parallelizable = False
```
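For context on the first change described in the versionchanged note: summing one outer product per frame and taking a single matrix product over the stacked frames compute the same covariance sum, so the rewrite only changes *how* the result is obtained. A standalone sketch (variable names here are illustrative, not from the patch):

```python
import numpy as np

rng = np.random.default_rng(0)
n_frames, n_dim = 50, 30
# mean-free "coordinates": one flattened frame per row
frames = rng.standard_normal((n_frames, n_dim))

# old approach: accumulate one outer product per frame
cov_loop = np.zeros((n_dim, n_dim))
for x in frames:
    cov_loop += np.outer(x, x)

# new approach: a single BLAS-backed matrix multiply over all frames
cov_blas = frames.T @ frames

# sum_i x_i x_i^T == X^T X, so both paths agree
assert np.allclose(cov_loop, cov_blas)
```

The speedup comes from replacing `n_frames` rank-1 updates (each memory-bound over an `n_dim × n_dim` array) with one level-3 BLAS call.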
```diff
@@ -290,6 +295,7 @@ def _prepare(self):
         )
         n_dim = self._n_atoms * 3
         self.cov = np.zeros((n_dim, n_dim))
+        self._frame_data = np.empty((self.n_frames, n_dim))
         self._ref_atom_positions = self._reference.positions
         self._ref_cog = self._reference.center_of_geometry()
         self._ref_atom_positions -= self._ref_cog
```
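The new `_frame_data` buffer allocated in `_prepare` scales with trajectory length, not just system size. A back-of-envelope estimate (system and trajectory sizes here are hypothetical; `np.empty` defaults to float64, i.e. 8 bytes per value):

```python
# hypothetical sizes for illustration only
n_atoms = 1_000
n_frames = 100_000

n_dim = n_atoms * 3                 # flattened xyz coordinates per frame
buffer_bytes = n_frames * n_dim * 8  # float64 = 8 bytes per element

# the per-frame buffer grows linearly with trajectory length
print(f"{buffer_bytes / 1e9:.1f} GB")  # prints "2.4 GB"
```

This linear growth is the memory concern raised in the review comments.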
|
```diff
@@ -329,14 +335,18 @@ def _single_frame(self):
         else:
             x = self._atoms.positions.ravel()
         x -= self._xmean
-        self.cov += np.dot(x[:, np.newaxis], x[:, np.newaxis].T)
```
Member

One reason for building the covariance matrix incrementally is that it ensures bounds on memory usage. In your approach, memory consumption grows linearly with trajectory length because you are copying coordinates into memory, so a longer trajectory will eventually exhaust it. The test trajectory is very short; real trajectories are easily 1,000–100,000 times longer. If there really is an advantage to multiplying huge matrices, then perhaps a batched approach is a good middle ground.
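The batched middle ground suggested above could look roughly like this. This is a sketch, not code from the PR; `batched_covariance_sum`, its signature, and the batch size are invented for illustration:

```python
import numpy as np

def batched_covariance_sum(frames_iter, n_dim, batch_size=256):
    """Accumulate X.T @ X in fixed-size batches so memory stays bounded.

    frames_iter yields flattened, mean-free coordinate arrays of length n_dim.
    Peak extra memory is batch_size * n_dim floats, independent of
    trajectory length.
    """
    cov = np.zeros((n_dim, n_dim))
    batch = np.empty((batch_size, n_dim))
    filled = 0
    for x in frames_iter:
        batch[filled] = x
        filled += 1
        if filled == batch_size:
            cov += batch.T @ batch  # one BLAS call per batch
            filled = 0
    if filled:  # flush the final partial batch
        cov += batch[:filled].T @ batch[:filled]
    return cov

# cross-check against the single big matrix product
rng = np.random.default_rng(1)
frames = rng.standard_normal((100, 12))
expected = frames.T @ frames
result = batched_covariance_sum(iter(frames), 12, batch_size=32)
assert np.allclose(result, expected)
```

This keeps most of the level-3 BLAS benefit while capping memory at one batch of frames, at the cost of slightly more bookkeeping in `_single_frame`.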
Member

Some manual benchmarking:

```python
import numpy as np
import MDAnalysis as mda
from MDAnalysis.tests import datafiles as data

u = mda.Universe(data.PSF, data.DCD)
x = u.atoms.positions.ravel()
```

shows that replacing the `np.dot` call with `np.outer` is faster:

```
>>> %timeit np.dot(x[:, np.newaxis], x[:, np.newaxis].T)
61.4 ms ± 466 μs per loop (mean ± std. dev. of 7 runs, 10 loops each)
>>> %timeit np.outer(x, x)
35.4 ms ± 249 μs per loop (mean ± std. dev. of 7 runs, 10 loops each)
```

However, the addition update is actually slow:

```
%%timeit cov = np.zeros((len(x), len(x))); xx = np.outer(x, x)
...: cov += xx
...:
97.5 ms ± 3.08 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)
```

so it makes sense to do the addition as part of the matrix multiplication. Batching is probably the way to go (but that makes streaming more difficult).
```diff
+        self._frame_data[self._frame_index] = x

     def _conclude(self):
+        self.cov = self._frame_data.T @ self._frame_data
         self.cov /= self.n_frames - 1
-        e_vals, e_vects = np.linalg.eig(self.cov)
-        sort_idx = np.argsort(e_vals)[::-1]
-        self._variance = e_vals[sort_idx]
-        self._p_components = e_vects[:, sort_idx]
+        del self._frame_data
+        # covariance matrix is symmetric and real-valued by
+        # construction, so we can use faster eigh
+        eigenvals, eigenvects = np.linalg.eigh(self.cov)
+        # eigh returns ascending order; reverse for descending
+        self._variance = eigenvals[::-1]
+        self._p_components = eigenvects[:, ::-1]
         self._calculated = True
         self.n_components = self._n_components
```
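As a quick standalone check that switching from `eig` to `eigh` plus the `[::-1]` reversal preserves the descending-variance ordering (a sketch on a synthetic symmetric matrix, not PR code):

```python
import numpy as np

rng = np.random.default_rng(2)
A = rng.standard_normal((6, 6))
cov = A @ A.T  # symmetric positive semi-definite, like a covariance matrix

# general solver: no ordering guarantee, so an explicit descending sort
# is needed (and the result dtype may be complex for a general matrix)
e_vals, e_vects = np.linalg.eig(cov)
order = np.argsort(e_vals.real)[::-1]

# symmetric solver: real output, eigenvalues guaranteed ascending
eigenvals, eigenvects = np.linalg.eigh(cov)

# same spectrum in descending order once eigh's output is reversed
assert np.allclose(e_vals.real[order], eigenvals[::-1])
```

Eigenvectors are only defined up to sign, so only the eigenvalues are compared here; `eigh` is both faster on symmetric input and avoids the spurious complex dtype `eig` can return.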
Technically we can remove this, but I wasn't sure if anyone out there would expect it to be accessible from `_prepare` onwards. No strong feelings either way: it's relatively cheap to initialize and maximizes backwards compatibility, but future readers might be confused by it.