Change the default value of n_replicates_filter_ratio_thresh to 0.2.

We don't want the stability definition to depend too much on the ratio n_replicates_after_filtering/n_replicates. Previously we used a threshold of 0.5. That made sense, since 'stable' arguably means that at least the majority (i.e., > 50%) of the solutions are equivalently good. However, I observed that mvNMF solutions can be quite unstable, because we only tune lambda_tilde for one of the mvNMF runs. That results in a relatively lower ratio of n_replicates_after_filtering/n_replicates, so I'm lowering the threshold to 0.2 here.
parklab · Jul 19, 2021 · caf9254 · caf9254 · Hu-JIN · Jul 19, 2021
1 parent 46efc98
commit caf9254
Showing 1 changed file with 5 additions and 5 deletions.
diff --git a/musical/denovo.py b/musical/denovo.py
@@ -240,7 +240,7 @@ def _gather_results(X, Ws, Hs=None, method='cluster_by_matching', n_components=N
 def _select_n_components(n_components_all, samplewise_reconstruction_errors_all, sil_score_all,
                          n_replicates, n_replicates_after_filtering_all,
                          pthresh=0.05, sil_score_mean_thresh=0.8, sil_score_min_thresh=0.2,
-                         n_replicates_filter_ratio_thresh=0.5,
+                         n_replicates_filter_ratio_thresh=0.2,
                          method='algorithm1'):
     """Select the best n_components based on reconstruction error and stability.
 
@@ -714,7 +714,7 @@ def fit(self, eng=None):
             pthresh=self.pthresh,
             sil_score_mean_thresh=0.8,
             sil_score_min_thresh=0.2,
-            n_replicates_filter_ratio_thresh=0.5,
+            n_replicates_filter_ratio_thresh=0.2,
             method='algorithm1'
         )
         self.W = self.W_all[self.n_components]
@@ -735,7 +735,7 @@ def fit(self, eng=None):
             pthresh=self.pthresh,
             sil_score_mean_thresh=0.8,
             sil_score_min_thresh=0.2,
-            n_replicates_filter_ratio_thresh=0.5,
+            n_replicates_filter_ratio_thresh=0.2,
             method='algorithm1.1'
         )
 
@@ -748,7 +748,7 @@ def fit(self, eng=None):
             pthresh=self.pthresh,
             sil_score_mean_thresh=0.8,
             sil_score_min_thresh=0.2,
-            n_replicates_filter_ratio_thresh=0.5,
+            n_replicates_filter_ratio_thresh=0.2,
             method='algorithm2'
         )
 
@@ -761,7 +761,7 @@ def fit(self, eng=None):
             pthresh=self.pthresh,
             sil_score_mean_thresh=0.8,
             sil_score_min_thresh=0.2,
-            n_replicates_filter_ratio_thresh=0.5,
+            n_replicates_filter_ratio_thresh=0.2,
             method='algorithm2.1'
         )