In [1]:
import pandas as pd
import numpy as np
from os.path import join

from umap import UMAP

In [2]:
# load data 
df  = pd.read_parquet("../bldb/clean/csv/bldb_dset.parquet")
sbl = df[df.bla_class.str.contains("class_a|class_c|class_d")]
mbl = df[df.bla_class.str.contains("class_b1|class_b2|class_b3")]

esm1b_sbl     = np.array([np.array(x) for x in sbl["esm1b"]])
esm2_650m_sbl = np.array([np.array(x) for x in sbl["esm2_650m"]])
esm2_3b_sbl   = np.array([np.array(x) for x in sbl["esm2_3b"]])
carp_sbl      = np.array([np.array(x) for x in sbl["carp"]])
t5xlu50_sbl   = np.array([np.array(x) for x in sbl["t5xlu50"]])

esm1b_mbl     = np.array([np.array(x) for x in mbl["esm1b"]])
esm2_650m_mbl = np.array([np.array(x) for x in mbl["esm2_650m"]])
esm2_3b_mbl   = np.array([np.array(x) for x in mbl["esm2_3b"]])
carp_mbl      = np.array([np.array(x) for x in mbl["carp"]])
t5xlu50_mbl   = np.array([np.array(x) for x in mbl["t5xlu50"]])

In [6]:
# a fx to run umap
def run_umap(array, n_neighbors, dim1, dim2, dataset, csv_name):

    print(f"#################################################################")
    print(f"      Running UMAP with n_neighbors = {n_neighbors} | dataset = {dataset}")
    print(f"#################################################################\n")
    
    umap = UMAP(
        n_components=2,
        n_neighbors=n_neighbors,
        metric="cosine",
        random_state=42,
        verbose=True,
        init="spectral",
        spread=0.2, 
        min_dist=0.2,
        n_epochs=2000,
        n_jobs=-1
    )

    umap_representation = umap.fit_transform(array)
    dim1 = dim1
    dim2 = dim2

    df_umap = pd.DataFrame(umap_representation, columns=[dim1, dim2])
    df_umap.to_csv(csv_name, index=False)
    
    print(f"Input embedding dimention: {len(array[0])}")
    print(f"Data points: {len(array)}")
    print(f"Results saved at: {csv_name}\n")

models = ["esm1b","esm2_650m", "esm2_3b", "carp", "t5xlu50"]
nn = [30, 50, 100, 200, 300, 400, 500, 600, 700, 800, 900, 1000]

# SBL 

In [4]:
sbl[["seq_id"]].to_csv("../bldb/lowdim/umap/sbl_ids.csv", index=False)

In [7]:
sbl_arrays = {
    "esm1b"    : esm1b_sbl,
    "esm2_650m": esm2_650m_sbl,
    "esm2_3b"  : esm2_3b_sbl,
    "carp"     : carp_sbl,
    "t5xlu50"  : t5xlu50_sbl
}

# iterate over data to create input labels 
for model in models:
    for n in nn:
        name1 = "umap1_" + model
        name2 = "umap2_" + model
        csv = "../bldb/lowdim/umap/umap_sbl_" + model + "_" + str(n) + ".csv"

        # get the dataset based on the model name 
        input_embeddings = sbl_arrays[model]

        # logs
        print(f"#################################################################")
        print(f"                            {model}                              ")

        # Run the function
        run_umap(array=input_embeddings, n_neighbors=n, dim1=name1, dim2=name2, dataset="SBL", csv_name=csv)

#################################################################
                            esm1b                              
#################################################################
      Running UMAP with n_neighbors = 30 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=30, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 14:21:31 2024 Construct fuzzy simplicial set
Thu Apr 18 14:21:31 2024 Finding Nearest Neighbors
Thu Apr 18 14:21:31 2024 Building RP forest with 13 trees


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 14:21:32 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 14:21:38 2024 Finished Nearest Neighbor Search
Thu Apr 18 14:21:39 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 14:23:30 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm1b_30.csv

#################################################################
                            esm1b                              
#################################################################
      Running UMAP with n_neighbors = 50 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=50, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 14:23:30 2024 Construct fuzzy simplicial set
Thu Apr 18 

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 14:23:31 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 14:23:38 2024 Finished Nearest Neighbor Search
Thu Apr 18 14:23:38 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 14:25:47 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm1b_50.csv

#################################################################
                            esm1b                              
#################################################################
      Running UMAP with n_neighbors = 100 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=100, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 14:25:47 2024 Construct fuzzy simplicial set
Thu Apr 1

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 14:25:48 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 14:26:14 2024 Finished Nearest Neighbor Search
Thu Apr 18 14:26:15 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 14:28:56 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm1b_100.csv

#################################################################
                            esm1b                              
#################################################################
      Running UMAP with n_neighbors = 200 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=200, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 14:28:56 2024 Construct fuzzy simplicial set
Thu Apr 

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 14:28:57 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 14:29:37 2024 Finished Nearest Neighbor Search
Thu Apr 18 14:29:38 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 14:32:57 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm1b_200.csv

#################################################################
                            esm1b                              
#################################################################
      Running UMAP with n_neighbors = 300 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=300, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 14:32:57 2024 Construct fuzzy simplicial set
Thu Apr 

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 14:32:58 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 14:33:42 2024 Finished Nearest Neighbor Search
Thu Apr 18 14:33:44 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 14:37:29 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm1b_300.csv

#################################################################
                            esm1b                              
#################################################################
      Running UMAP with n_neighbors = 400 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=400, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 14:37:29 2024 Construct fuzzy simplicial set
Thu Apr 

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 14:37:29 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 14:38:17 2024 Finished Nearest Neighbor Search
Thu Apr 18 14:38:20 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 14:42:23 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm1b_400.csv

#################################################################
                            esm1b                              
#################################################################
      Running UMAP with n_neighbors = 500 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=500, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 14:42:24 2024 Construct fuzzy simplicial set
Thu Apr 

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 14:42:24 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 14:43:17 2024 Finished Nearest Neighbor Search
Thu Apr 18 14:43:21 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 14:47:35 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm1b_500.csv

#################################################################
                            esm1b                              
#################################################################
      Running UMAP with n_neighbors = 600 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=600, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 14:47:36 2024 Construct fuzzy simplicial set
Thu Apr 

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 14:47:36 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 14:48:51 2024 Finished Nearest Neighbor Search
Thu Apr 18 14:48:55 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 14:53:22 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm1b_600.csv

#################################################################
                            esm1b                              
#################################################################
      Running UMAP with n_neighbors = 700 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=700, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 14:53:22 2024 Construct fuzzy simplicial set
Thu Apr 

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 14:53:23 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 14:54:45 2024 Finished Nearest Neighbor Search
Thu Apr 18 14:54:50 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 14:59:29 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm1b_700.csv

#################################################################
                            esm1b                              
#################################################################
      Running UMAP with n_neighbors = 800 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=800, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 14:59:29 2024 Construct fuzzy simplicial set
Thu Apr 

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 14:59:30 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 15:01:00 2024 Finished Nearest Neighbor Search
Thu Apr 18 15:01:06 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 15:05:51 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm1b_800.csv

#################################################################
                            esm1b                              
#################################################################
      Running UMAP with n_neighbors = 900 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=900, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 15:05:51 2024 Construct fuzzy simplicial set
Thu Apr 

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 15:05:52 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 15:07:32 2024 Finished Nearest Neighbor Search
Thu Apr 18 15:07:38 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 15:12:30 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm1b_900.csv

#################################################################
                            esm1b                              
#################################################################
      Running UMAP with n_neighbors = 1000 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=1000, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 15:12:30 2024 Construct fuzzy simplicial set
Thu Ap

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 15:12:31 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 15:14:20 2024 Finished Nearest Neighbor Search
Thu Apr 18 15:14:28 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 15:19:29 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm1b_1000.csv

#################################################################
                            esm2_650m                              
#################################################################
      Running UMAP with n_neighbors = 30 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=30, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 15:19:29 2024 Construct fuzzy simplicial set
Thu A

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 15:19:29 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 15:19:32 2024 Finished Nearest Neighbor Search
Thu Apr 18 15:19:32 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 15:21:22 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm2_650m_30.csv

#################################################################
                            esm2_650m                              
#################################################################
      Running UMAP with n_neighbors = 50 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=50, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 15:21:22 2024 Construct fuzzy simplicial set
Thu

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 15:21:23 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 15:21:29 2024 Finished Nearest Neighbor Search
Thu Apr 18 15:21:29 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 15:23:38 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm2_650m_50.csv

#################################################################
                            esm2_650m                              
#################################################################
      Running UMAP with n_neighbors = 100 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=100, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 15:23:38 2024 Construct fuzzy simplicial set
T

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 15:23:39 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 15:24:01 2024 Finished Nearest Neighbor Search
Thu Apr 18 15:24:02 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 15:26:41 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm2_650m_100.csv

#################################################################
                            esm2_650m                              
#################################################################
      Running UMAP with n_neighbors = 200 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=200, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 15:26:41 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 15:26:42 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 15:27:17 2024 Finished Nearest Neighbor Search
Thu Apr 18 15:27:18 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 15:30:36 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm2_650m_200.csv

#################################################################
                            esm2_650m                              
#################################################################
      Running UMAP with n_neighbors = 300 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=300, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 15:30:36 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 15:30:37 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 15:31:16 2024 Finished Nearest Neighbor Search
Thu Apr 18 15:31:18 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 15:35:01 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm2_650m_300.csv

#################################################################
                            esm2_650m                              
#################################################################
      Running UMAP with n_neighbors = 400 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=400, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 15:35:02 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 15:35:02 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 15:35:45 2024 Finished Nearest Neighbor Search
Thu Apr 18 15:35:48 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 15:39:47 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm2_650m_400.csv

#################################################################
                            esm2_650m                              
#################################################################
      Running UMAP with n_neighbors = 500 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=500, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 15:39:47 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 15:39:47 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 15:40:52 2024 Finished Nearest Neighbor Search
Thu Apr 18 15:40:55 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 15:45:09 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm2_650m_500.csv

#################################################################
                            esm2_650m                              
#################################################################
      Running UMAP with n_neighbors = 600 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=600, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 15:45:10 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 15:45:10 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 15:46:22 2024 Finished Nearest Neighbor Search
Thu Apr 18 15:46:26 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 15:50:52 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm2_650m_600.csv

#################################################################
                            esm2_650m                              
#################################################################
      Running UMAP with n_neighbors = 700 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=700, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 15:50:52 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 15:50:52 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 15:52:13 2024 Finished Nearest Neighbor Search
Thu Apr 18 15:52:18 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 15:56:52 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm2_650m_700.csv

#################################################################
                            esm2_650m                              
#################################################################
      Running UMAP with n_neighbors = 800 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=800, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 15:56:53 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 15:56:53 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 15:58:21 2024 Finished Nearest Neighbor Search
Thu Apr 18 15:58:27 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 16:03:10 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm2_650m_800.csv

#################################################################
                            esm2_650m                              
#################################################################
      Running UMAP with n_neighbors = 900 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=900, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 16:03:10 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 16:03:10 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 16:04:47 2024 Finished Nearest Neighbor Search
Thu Apr 18 16:04:53 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 16:09:45 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm2_650m_900.csv

#################################################################
                            esm2_650m                              
#################################################################
      Running UMAP with n_neighbors = 1000 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=1000, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 16:09:45 2024 Construct fuzzy simplicial se

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 16:09:45 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 16:11:31 2024 Finished Nearest Neighbor Search
Thu Apr 18 16:11:39 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 16:16:36 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm2_650m_1000.csv

#################################################################
                            esm2_3b                              
#################################################################
      Running UMAP with n_neighbors = 30 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=30, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 16:16:37 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 16:16:37 2024 Finding Nearest Neighbors
Thu Apr 18 16:16:37 2024 Building RP forest with 13 trees
Thu Apr 18 16:16:38 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 16:16:41 2024 Finished Nearest Neighbor Search
Thu Apr 18 16:16:42 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 16:18:39 2024 Finished embedding
Input embedding dimention: 2560
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm2_3b_30.csv

#################################################################
                            esm2_3b                              
#################################################################
      Running UMAP with n_neighbors = 50 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=50, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 16:18:39 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 16:18:39 2024 Finding Nearest Neighbors
Thu Apr 18 16:18:39 2024 Building RP forest with 13 trees
Thu Apr 18 16:18:40 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	Stopping threshold met -- exiting after 2 iterations
Thu Apr 18 16:18:50 2024 Finished Nearest Neighbor Search
Thu Apr 18 16:18:50 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 16:21:05 2024 Finished embedding
Input embedding dimention: 2560
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm2_3b_50.csv

#################################################################
                            esm2_3b                              
#################################################################
      Running UMAP with n_neighbors = 100 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=100, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 16:21:05 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 16:21:05 2024 Finding Nearest Neighbors
Thu Apr 18 16:21:05 2024 Building RP forest with 13 trees
Thu Apr 18 16:21:06 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 16:21:39 2024 Finished Nearest Neighbor Search
Thu Apr 18 16:21:40 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 16:24:23 2024 Finished embedding
Input embedding dimention: 2560
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm2_3b_100.csv

#################################################################
                            esm2_3b                              
#################################################################
      Running UMAP with n_neighbors = 200 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=200, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 16:24:23 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 16:24:23 2024 Finding Nearest Neighbors
Thu Apr 18 16:24:23 2024 Building RP forest with 13 trees
Thu Apr 18 16:24:24 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 16:25:10 2024 Finished Nearest Neighbor Search
Thu Apr 18 16:25:12 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 16:28:32 2024 Finished embedding
Input embedding dimention: 2560
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm2_3b_200.csv

#################################################################
                            esm2_3b                              
#################################################################
      Running UMAP with n_neighbors = 300 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=300, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 16:28:32 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 16:28:32 2024 Finding Nearest Neighbors
Thu Apr 18 16:28:32 2024 Building RP forest with 13 trees
Thu Apr 18 16:28:33 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 16:29:27 2024 Finished Nearest Neighbor Search
Thu Apr 18 16:29:29 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 16:33:14 2024 Finished embedding
Input embedding dimention: 2560
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm2_3b_300.csv

#################################################################
                            esm2_3b                              
#################################################################
      Running UMAP with n_neighbors = 400 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=400, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 16:33:15 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 16:33:15 2024 Finding Nearest Neighbors
Thu Apr 18 16:33:15 2024 Building RP forest with 13 trees
Thu Apr 18 16:33:15 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 16:34:17 2024 Finished Nearest Neighbor Search
Thu Apr 18 16:34:20 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 16:38:21 2024 Finished embedding
Input embedding dimention: 2560
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm2_3b_400.csv

#################################################################
                            esm2_3b                              
#################################################################
      Running UMAP with n_neighbors = 500 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=500, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 16:38:22 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 16:38:22 2024 Finding Nearest Neighbors
Thu Apr 18 16:38:22 2024 Building RP forest with 13 trees
Thu Apr 18 16:38:23 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 16:39:32 2024 Finished Nearest Neighbor Search
Thu Apr 18 16:39:35 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 16:43:53 2024 Finished embedding
Input embedding dimention: 2560
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm2_3b_500.csv

#################################################################
                            esm2_3b                              
#################################################################
      Running UMAP with n_neighbors = 600 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=600, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 16:43:54 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 16:43:54 2024 Finding Nearest Neighbors
Thu Apr 18 16:43:54 2024 Building RP forest with 13 trees
Thu Apr 18 16:43:54 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 16:45:34 2024 Finished Nearest Neighbor Search
Thu Apr 18 16:45:38 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 16:50:04 2024 Finished embedding
Input embedding dimention: 2560
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm2_3b_600.csv

#################################################################
                            esm2_3b                              
#################################################################
      Running UMAP with n_neighbors = 700 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=700, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 16:50:04 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 16:50:04 2024 Finding Nearest Neighbors
Thu Apr 18 16:50:04 2024 Building RP forest with 13 trees
Thu Apr 18 16:50:05 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 16:51:55 2024 Finished Nearest Neighbor Search
Thu Apr 18 16:52:00 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 16:56:37 2024 Finished embedding
Input embedding dimention: 2560
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm2_3b_700.csv

#################################################################
                            esm2_3b                              
#################################################################
      Running UMAP with n_neighbors = 800 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=800, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 16:56:38 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 16:56:38 2024 Finding Nearest Neighbors
Thu Apr 18 16:56:38 2024 Building RP forest with 13 trees
Thu Apr 18 16:56:39 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 16:58:37 2024 Finished Nearest Neighbor Search
Thu Apr 18 16:58:43 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 17:03:25 2024 Finished embedding
Input embedding dimention: 2560
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm2_3b_800.csv

#################################################################
                            esm2_3b                              
#################################################################
      Running UMAP with n_neighbors = 900 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=900, random_state=42, spread=0.2, verbose=True)


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 17:03:26 2024 Construct fuzzy simplicial set
Thu Apr 18 17:03:26 2024 Finding Nearest Neighbors
Thu Apr 18 17:03:26 2024 Building RP forest with 13 trees
Thu Apr 18 17:03:27 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 17:05:34 2024 Finished Nearest Neighbor Search
Thu Apr 18 17:05:41 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 17:10:33 2024 Finished embedding
Input embedding dimention: 2560
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm2_3b_900.csv

#################################################################
                            esm2_3b                              
#################################################################
      Running UMAP with n_neighbors = 1000 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=1000, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 17:10:33 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 17:10:34 2024 Finding Nearest Neighbors
Thu Apr 18 17:10:34 2024 Building RP forest with 13 trees
Thu Apr 18 17:10:34 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 17:12:53 2024 Finished Nearest Neighbor Search
Thu Apr 18 17:13:01 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 17:17:58 2024 Finished embedding
Input embedding dimention: 2560
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_esm2_3b_1000.csv

#################################################################
                            carp                              
#################################################################
      Running UMAP with n_neighbors = 30 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=30, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 17:17:58 2024 Construct fuzzy simplicial set
Thu Apr 

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 17:17:59 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 17:18:01 2024 Finished Nearest Neighbor Search
Thu Apr 18 17:18:01 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 17:19:51 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_carp_30.csv

#################################################################
                            carp                              
#################################################################
      Running UMAP with n_neighbors = 50 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=50, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 17:19:51 2024 Construct fuzzy simplicial set
Thu Apr 18 17

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 17:19:52 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 17:19:57 2024 Finished Nearest Neighbor Search
Thu Apr 18 17:19:58 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 17:22:06 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_carp_50.csv

#################################################################
                            carp                              
#################################################################
      Running UMAP with n_neighbors = 100 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=100, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 17:22:06 2024 Construct fuzzy simplicial set
Thu Apr 18 

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 17:22:07 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 17:22:27 2024 Finished Nearest Neighbor Search
Thu Apr 18 17:22:28 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 17:25:07 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_carp_100.csv

#################################################################
                            carp                              
#################################################################
      Running UMAP with n_neighbors = 200 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=200, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 17:25:07 2024 Construct fuzzy simplicial set
Thu Apr 18

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 17:25:08 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 17:25:40 2024 Finished Nearest Neighbor Search
Thu Apr 18 17:25:42 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 17:28:58 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_carp_200.csv

#################################################################
                            carp                              
#################################################################
      Running UMAP with n_neighbors = 300 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=300, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 17:28:59 2024 Construct fuzzy simplicial set
Thu Apr 18

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 17:28:59 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 17:29:35 2024 Finished Nearest Neighbor Search
Thu Apr 18 17:29:37 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 17:33:21 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_carp_300.csv

#################################################################
                            carp                              
#################################################################
      Running UMAP with n_neighbors = 400 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=400, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 17:33:22 2024 Construct fuzzy simplicial set
Thu Apr 18

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 17:33:22 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 17:34:02 2024 Finished Nearest Neighbor Search
Thu Apr 18 17:34:05 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 17:38:11 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_carp_400.csv

#################################################################
                            carp                              
#################################################################
      Running UMAP with n_neighbors = 500 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=500, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 17:38:11 2024 Construct fuzzy simplicial set
Thu Apr 18

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 17:38:11 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 17:39:12 2024 Finished Nearest Neighbor Search
Thu Apr 18 17:39:16 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 17:43:40 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_carp_500.csv

#################################################################
                            carp                              
#################################################################
      Running UMAP with n_neighbors = 600 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=600, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 17:43:40 2024 Construct fuzzy simplicial set
Thu Apr 18

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 17:43:40 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 17:44:55 2024 Finished Nearest Neighbor Search
Thu Apr 18 17:44:59 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 17:49:43 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_carp_600.csv

#################################################################
                            carp                              
#################################################################
      Running UMAP with n_neighbors = 700 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=700, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 17:49:43 2024 Construct fuzzy simplicial set
Thu Apr 18

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 17:49:44 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 17:51:03 2024 Finished Nearest Neighbor Search
Thu Apr 18 17:51:08 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 17:55:52 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_carp_700.csv

#################################################################
                            carp                              
#################################################################
      Running UMAP with n_neighbors = 800 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=800, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 17:55:53 2024 Construct fuzzy simplicial set
Thu Apr 18

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 17:55:53 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 17:57:20 2024 Finished Nearest Neighbor Search
Thu Apr 18 17:57:26 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 18:02:15 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_carp_800.csv

#################################################################
                            carp                              
#################################################################
      Running UMAP with n_neighbors = 900 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=900, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 18:02:15 2024 Construct fuzzy simplicial set
Thu Apr 18

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 18:02:15 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 18:03:51 2024 Finished Nearest Neighbor Search
Thu Apr 18 18:03:58 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 18:08:56 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_carp_900.csv

#################################################################
                            carp                              
#################################################################
      Running UMAP with n_neighbors = 1000 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=1000, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 18:08:57 2024 Construct fuzzy simplicial set
Thu Apr 

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 18:08:57 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 18:10:38 2024 Finished Nearest Neighbor Search
Thu Apr 18 18:10:46 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 18:15:48 2024 Finished embedding
Input embedding dimention: 1280
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_carp_1000.csv

#################################################################
                            t5xlu50                              
#################################################################
      Running UMAP with n_neighbors = 30 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=30, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 18:15:48 2024 Construct fuzzy simplicial set
Thu Apr 

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 18:15:49 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 18:15:51 2024 Finished Nearest Neighbor Search
Thu Apr 18 18:15:51 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 18:17:49 2024 Finished embedding
Input embedding dimention: 1024
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_t5xlu50_30.csv

#################################################################
                            t5xlu50                              
#################################################################
      Running UMAP with n_neighbors = 50 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=50, random_state=42, spread=0.2, verbose=True)


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 18:17:50 2024 Construct fuzzy simplicial set
Thu Apr 18 18:17:50 2024 Finding Nearest Neighbors
Thu Apr 18 18:17:50 2024 Building RP forest with 13 trees
Thu Apr 18 18:17:50 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 18:17:55 2024 Finished Nearest Neighbor Search
Thu Apr 18 18:17:56 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 18:20:06 2024 Finished embedding
Input embedding dimention: 1024
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_t5xlu50_50.csv

#################################################################
                            t5xlu50                              
#################################################################
      Running UMAP with n_neighbors = 100 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=100, random_state=42, spread=0.2, verbose=True)


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 18:20:07 2024 Construct fuzzy simplicial set
Thu Apr 18 18:20:07 2024 Finding Nearest Neighbors
Thu Apr 18 18:20:07 2024 Building RP forest with 13 trees
Thu Apr 18 18:20:07 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 18:20:25 2024 Finished Nearest Neighbor Search
Thu Apr 18 18:20:26 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 18:23:08 2024 Finished embedding
Input embedding dimention: 1024
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_t5xlu50_100.csv

#################################################################
                            t5xlu50                              
#################################################################
      Running UMAP with n_neighbors = 200 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=200, random_state=42, spread=0.2, verbose=True)


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 18:23:08 2024 Construct fuzzy simplicial set
Thu Apr 18 18:23:08 2024 Finding Nearest Neighbors
Thu Apr 18 18:23:08 2024 Building RP forest with 13 trees
Thu Apr 18 18:23:09 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 18:23:38 2024 Finished Nearest Neighbor Search
Thu Apr 18 18:23:39 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 18:27:01 2024 Finished embedding
Input embedding dimention: 1024
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_t5xlu50_200.csv

#################################################################
                            t5xlu50                              
#################################################################
      Running UMAP with n_neighbors = 300 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=300, random_state=42, spread=0.2, verbose=True)


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 18:27:01 2024 Construct fuzzy simplicial set
Thu Apr 18 18:27:01 2024 Finding Nearest Neighbors
Thu Apr 18 18:27:01 2024 Building RP forest with 13 trees
Thu Apr 18 18:27:02 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 18:27:35 2024 Finished Nearest Neighbor Search
Thu Apr 18 18:27:37 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 18:31:24 2024 Finished embedding
Input embedding dimention: 1024
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_t5xlu50_300.csv

#################################################################
                            t5xlu50                              
#################################################################
      Running UMAP with n_neighbors = 400 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=400, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 18:31:25 2024 Construct fuzzy simplicial set
Thu 

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 18:31:25 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	Stopping threshold met -- exiting after 3 iterations
Thu Apr 18 18:32:03 2024 Finished Nearest Neighbor Search
Thu Apr 18 18:32:05 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 18:36:09 2024 Finished embedding
Input embedding dimention: 1024
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_t5xlu50_400.csv

#################################################################
                            t5xlu50                              
#################################################################
      Running UMAP with n_neighbors = 500 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=500, random_state=42, spread=0.2, verbose=True)


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 18:36:09 2024 Construct fuzzy simplicial set
Thu Apr 18 18:36:09 2024 Finding Nearest Neighbors
Thu Apr 18 18:36:09 2024 Building RP forest with 13 trees
Thu Apr 18 18:36:10 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 18:37:05 2024 Finished Nearest Neighbor Search
Thu Apr 18 18:37:08 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 18:41:29 2024 Finished embedding
Input embedding dimention: 1024
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_t5xlu50_500.csv

#################################################################
                            t5xlu50                              
#################################################################
      Running UMAP with n_neighbors = 600 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=600, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 18:41:30 2024 Construct fuzzy simplicial set
Thu 

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 18:41:30 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 18:42:31 2024 Finished Nearest Neighbor Search
Thu Apr 18 18:42:35 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 18:47:04 2024 Finished embedding
Input embedding dimention: 1024
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_t5xlu50_600.csv

#################################################################
                            t5xlu50                              
#################################################################
      Running UMAP with n_neighbors = 700 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=700, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 18:47:04 2024 Construct fuzzy simplicial set
Thu 

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 18:47:05 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 18:48:18 2024 Finished Nearest Neighbor Search
Thu Apr 18 18:48:23 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 18:53:04 2024 Finished embedding
Input embedding dimention: 1024
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_t5xlu50_700.csv

#################################################################
                            t5xlu50                              
#################################################################
      Running UMAP with n_neighbors = 800 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=800, random_state=42, spread=0.2, verbose=True)


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 18:53:04 2024 Construct fuzzy simplicial set
Thu Apr 18 18:53:04 2024 Finding Nearest Neighbors
Thu Apr 18 18:53:04 2024 Building RP forest with 13 trees
Thu Apr 18 18:53:04 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 18:54:22 2024 Finished Nearest Neighbor Search
Thu Apr 18 18:54:28 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 18:59:18 2024 Finished embedding
Input embedding dimention: 1024
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_t5xlu50_800.csv

#################################################################
                            t5xlu50                              
#################################################################
      Running UMAP with n_neighbors = 900 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=900, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 18:59:19 2024 Construct fuzzy simplicial set
Thu 

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 18:59:19 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 19:00:46 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:00:52 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:05:48 2024 Finished embedding
Input embedding dimention: 1024
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_t5xlu50_900.csv

#################################################################
                            t5xlu50                              
#################################################################
      Running UMAP with n_neighbors = 1000 | dataset = SBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=1000, random_state=42, spread=0.2, verbose=True)


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:05:48 2024 Construct fuzzy simplicial set
Thu Apr 18 19:05:48 2024 Finding Nearest Neighbors
Thu Apr 18 19:05:48 2024 Building RP forest with 13 trees
Thu Apr 18 19:05:48 2024 NN descent for 15 iterations
	 1  /  15
	 2  /  15
	 3  /  15
	 4  /  15
	Stopping threshold met -- exiting after 4 iterations
Thu Apr 18 19:07:23 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:07:31 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:12:35 2024 Finished embedding
Input embedding dimention: 1024
Data points: 25961
Results saved at: ../bldb/lowdim/umap/umap_sbl_t5xlu50_1000.csv



# MBL

In [8]:
mbl[["seq_id"]].to_csv("../bldb/lowdim/umap/mbl_ids.csv", index=False)

In [9]:
mbl_arrays = {
    "esm1b"    : esm1b_mbl,
    "esm2_650m": esm2_650m_mbl,
    "esm2_3b"  : esm2_3b_mbl,
    "carp"     : carp_mbl,
    "t5xlu50"  : t5xlu50_mbl
}

# iterate over data to create input labels 
for model in models:
    for n in nn:
        name1 = "umap1_" + model
        name2 = "umap2_" + model
        csv = "../bldb/lowdim/umap/umap_mbl_" + model + "_" + str(n) + ".csv"

        # get the dataset based on the model name 
        input_embeddings = mbl_arrays[model]

        # logs
        print(f"#################################################################")
        print(f"                            {model}                              ")

        # Run the function
        run_umap(array=input_embeddings, n_neighbors=n, dim1=name1, dim2=name2, dataset="MBL", csv_name=csv)

#################################################################
                            esm1b                              
#################################################################
      Running UMAP with n_neighbors = 30 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=30, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:12:36 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:12:48 2024 Finding Nearest Neighbors
Thu Apr 18 19:12:49 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:12:49 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:13:03 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm1b_30.csv

#################################################################
                            esm1b                              
#################################################################
      Running UMAP with n_neighbors = 50 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=50, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:13:03 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:13:15 2024 Finding Nearest Neighbors
Thu Apr 18 19:13:15 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:13:15 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:13:32 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm1b_50.csv

#################################################################
                            esm1b                              
#################################################################
      Running UMAP with n_neighbors = 100 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=100, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:13:33 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:13:44 2024 Finding Nearest Neighbors
Thu Apr 18 19:13:44 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:13:44 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:14:05 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm1b_100.csv

#################################################################
                            esm1b                              
#################################################################
      Running UMAP with n_neighbors = 200 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=200, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:14:06 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:14:17 2024 Finding Nearest Neighbors
Thu Apr 18 19:14:17 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:14:18 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:14:43 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm1b_200.csv

#################################################################
                            esm1b                              
#################################################################
      Running UMAP with n_neighbors = 300 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=300, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:14:43 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:14:55 2024 Finding Nearest Neighbors
Thu Apr 18 19:14:55 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:14:55 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:15:25 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm1b_300.csv

#################################################################
                            esm1b                              
#################################################################
      Running UMAP with n_neighbors = 400 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=400, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:15:25 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:15:36 2024 Finding Nearest Neighbors
Thu Apr 18 19:15:36 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:15:37 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:16:08 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm1b_400.csv

#################################################################
                            esm1b                              
#################################################################
      Running UMAP with n_neighbors = 500 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=500, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:16:08 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:16:20 2024 Finding Nearest Neighbors
Thu Apr 18 19:16:20 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:16:21 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:16:54 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm1b_500.csv

#################################################################
                            esm1b                              
#################################################################
      Running UMAP with n_neighbors = 600 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=600, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:16:54 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:17:05 2024 Finding Nearest Neighbors
Thu Apr 18 19:17:06 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:17:06 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:17:41 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm1b_600.csv

#################################################################
                            esm1b                              
#################################################################
      Running UMAP with n_neighbors = 700 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=700, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:17:41 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:17:53 2024 Finding Nearest Neighbors
Thu Apr 18 19:17:53 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:17:54 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:18:30 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm1b_700.csv

#################################################################
                            esm1b                              
#################################################################
      Running UMAP with n_neighbors = 800 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=800, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:18:30 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:18:41 2024 Finding Nearest Neighbors
Thu Apr 18 19:18:41 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:18:42 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:19:19 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm1b_800.csv

#################################################################
                            esm1b                              
#################################################################
      Running UMAP with n_neighbors = 900 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=900, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:19:20 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:19:31 2024 Finding Nearest Neighbors
Thu Apr 18 19:19:31 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:19:32 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:20:10 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm1b_900.csv

#################################################################
                            esm1b                              
#################################################################
      Running UMAP with n_neighbors = 1000 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=1000, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:20:10 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:20:21 2024 Finding Nearest Neighbors
Thu Apr 18 19:20:21 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:20:22 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:21:01 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm1b_1000.csv

#################################################################
                            esm2_650m                              
#################################################################
      Running UMAP with n_neighbors = 30 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=30, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:21:01 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:21:12 2024 Finding Nearest Neighbors
Thu Apr 18 19:21:12 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:21:12 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:21:27 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm2_650m_30.csv

#################################################################
                            esm2_650m                              
#################################################################
      Running UMAP with n_neighbors = 50 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=50, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:21:27 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:21:39 2024 Finding Nearest Neighbors
Thu Apr 18 19:21:39 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:21:39 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:21:56 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm2_650m_50.csv

#################################################################
                            esm2_650m                              
#################################################################
      Running UMAP with n_neighbors = 100 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=100, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:21:56 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:22:08 2024 Finding Nearest Neighbors
Thu Apr 18 19:22:08 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:22:08 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:22:29 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm2_650m_100.csv

#################################################################
                            esm2_650m                              
#################################################################
      Running UMAP with n_neighbors = 200 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=200, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:22:29 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:22:41 2024 Finding Nearest Neighbors
Thu Apr 18 19:22:41 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:22:41 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:23:07 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm2_650m_200.csv

#################################################################
                            esm2_650m                              
#################################################################
      Running UMAP with n_neighbors = 300 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=300, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:23:07 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:23:19 2024 Finding Nearest Neighbors
Thu Apr 18 19:23:19 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:23:19 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:23:48 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm2_650m_300.csv

#################################################################
                            esm2_650m                              
#################################################################
      Running UMAP with n_neighbors = 400 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=400, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:23:48 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:24:00 2024 Finding Nearest Neighbors
Thu Apr 18 19:24:00 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:24:00 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:24:32 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm2_650m_400.csv

#################################################################
                            esm2_650m                              
#################################################################
      Running UMAP with n_neighbors = 500 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=500, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:24:32 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:24:44 2024 Finding Nearest Neighbors
Thu Apr 18 19:24:44 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:24:44 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:25:17 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm2_650m_500.csv

#################################################################
                            esm2_650m                              
#################################################################
      Running UMAP with n_neighbors = 600 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=600, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:25:18 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:25:30 2024 Finding Nearest Neighbors
Thu Apr 18 19:25:30 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:25:30 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:26:05 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm2_650m_600.csv

#################################################################
                            esm2_650m                              
#################################################################
      Running UMAP with n_neighbors = 700 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=700, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:26:05 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:26:17 2024 Finding Nearest Neighbors
Thu Apr 18 19:26:17 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:26:17 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:26:53 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm2_650m_700.csv

#################################################################
                            esm2_650m                              
#################################################################
      Running UMAP with n_neighbors = 800 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=800, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:26:53 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:27:05 2024 Finding Nearest Neighbors
Thu Apr 18 19:27:05 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:27:06 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:27:43 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm2_650m_800.csv

#################################################################
                            esm2_650m                              
#################################################################
      Running UMAP with n_neighbors = 900 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=900, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:27:43 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:27:54 2024 Finding Nearest Neighbors
Thu Apr 18 19:27:55 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:27:55 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:28:33 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm2_650m_900.csv

#################################################################
                            esm2_650m                              
#################################################################
      Running UMAP with n_neighbors = 1000 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=1000, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:28:33 2024 Construct fuzzy simplicial set

  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:28:45 2024 Finding Nearest Neighbors
Thu Apr 18 19:28:45 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:28:46 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:29:24 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm2_650m_1000.csv

#################################################################
                            esm2_3b                              
#################################################################
      Running UMAP with n_neighbors = 30 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=30, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:29:24 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:29:43 2024 Finding Nearest Neighbors
Thu Apr 18 19:29:43 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:29:43 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:29:58 2024 Finished embedding
Input embedding dimention: 2560
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm2_3b_30.csv

#################################################################
                            esm2_3b                              
#################################################################
      Running UMAP with n_neighbors = 50 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=50, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:29:58 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:30:16 2024 Finding Nearest Neighbors
Thu Apr 18 19:30:16 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:30:16 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:30:33 2024 Finished embedding
Input embedding dimention: 2560
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm2_3b_50.csv

#################################################################
                            esm2_3b                              
#################################################################
      Running UMAP with n_neighbors = 100 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=100, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:30:34 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:30:53 2024 Finding Nearest Neighbors
Thu Apr 18 19:30:53 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:30:53 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:31:14 2024 Finished embedding
Input embedding dimention: 2560
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm2_3b_100.csv

#################################################################
                            esm2_3b                              
#################################################################
      Running UMAP with n_neighbors = 200 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=200, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:31:14 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:31:33 2024 Finding Nearest Neighbors
Thu Apr 18 19:31:33 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:31:33 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:31:59 2024 Finished embedding
Input embedding dimention: 2560
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm2_3b_200.csv

#################################################################
                            esm2_3b                              
#################################################################
      Running UMAP with n_neighbors = 300 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=300, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:31:59 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:32:18 2024 Finding Nearest Neighbors
Thu Apr 18 19:32:18 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:32:19 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:32:47 2024 Finished embedding
Input embedding dimention: 2560
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm2_3b_300.csv

#################################################################
                            esm2_3b                              
#################################################################
      Running UMAP with n_neighbors = 400 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=400, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:32:47 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:33:06 2024 Finding Nearest Neighbors
Thu Apr 18 19:33:06 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:33:07 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:33:38 2024 Finished embedding
Input embedding dimention: 2560
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm2_3b_400.csv

#################################################################
                            esm2_3b                              
#################################################################
      Running UMAP with n_neighbors = 500 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=500, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:33:38 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:33:57 2024 Finding Nearest Neighbors
Thu Apr 18 19:33:57 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:33:58 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:34:30 2024 Finished embedding
Input embedding dimention: 2560
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm2_3b_500.csv

#################################################################
                            esm2_3b                              
#################################################################
      Running UMAP with n_neighbors = 600 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=600, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:34:30 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:34:50 2024 Finding Nearest Neighbors
Thu Apr 18 19:34:50 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:34:50 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:35:24 2024 Finished embedding
Input embedding dimention: 2560
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm2_3b_600.csv

#################################################################
                            esm2_3b                              
#################################################################
      Running UMAP with n_neighbors = 700 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=700, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:35:24 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:35:43 2024 Finding Nearest Neighbors
Thu Apr 18 19:35:43 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:35:44 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:36:19 2024 Finished embedding
Input embedding dimention: 2560
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm2_3b_700.csv

#################################################################
                            esm2_3b                              
#################################################################
      Running UMAP with n_neighbors = 800 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=800, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:36:19 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:36:39 2024 Finding Nearest Neighbors
Thu Apr 18 19:36:39 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:36:40 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:37:16 2024 Finished embedding
Input embedding dimention: 2560
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm2_3b_800.csv

#################################################################
                            esm2_3b                              
#################################################################
      Running UMAP with n_neighbors = 900 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=900, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:37:17 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:37:36 2024 Finding Nearest Neighbors
Thu Apr 18 19:37:36 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:37:37 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:38:14 2024 Finished embedding
Input embedding dimention: 2560
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm2_3b_900.csv

#################################################################
                            esm2_3b                              
#################################################################
      Running UMAP with n_neighbors = 1000 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=1000, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:38:14 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:38:33 2024 Finding Nearest Neighbors
Thu Apr 18 19:38:33 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:38:34 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:39:12 2024 Finished embedding
Input embedding dimention: 2560
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_esm2_3b_1000.csv

#################################################################
                            carp                              
#################################################################
      Running UMAP with n_neighbors = 30 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=30, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:39:12 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:39:24 2024 Finding Nearest Neighbors
Thu Apr 18 19:39:24 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:39:24 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:39:40 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_carp_30.csv

#################################################################
                            carp                              
#################################################################
      Running UMAP with n_neighbors = 50 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=50, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:39:40 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:39:51 2024 Finding Nearest Neighbors
Thu Apr 18 19:39:51 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:39:51 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:40:09 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_carp_50.csv

#################################################################
                            carp                              
#################################################################
      Running UMAP with n_neighbors = 100 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=100, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:40:09 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:40:21 2024 Finding Nearest Neighbors
Thu Apr 18 19:40:21 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:40:21 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:40:43 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_carp_100.csv

#################################################################
                            carp                              
#################################################################
      Running UMAP with n_neighbors = 200 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=200, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:40:43 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:40:55 2024 Finding Nearest Neighbors
Thu Apr 18 19:40:55 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:40:55 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:41:21 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_carp_200.csv

#################################################################
                            carp                              
#################################################################
      Running UMAP with n_neighbors = 300 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=300, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:41:21 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:41:33 2024 Finding Nearest Neighbors
Thu Apr 18 19:41:33 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:41:34 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:42:03 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_carp_300.csv

#################################################################
                            carp                              
#################################################################
      Running UMAP with n_neighbors = 400 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=400, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:42:03 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:42:15 2024 Finding Nearest Neighbors
Thu Apr 18 19:42:15 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:42:15 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:42:47 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_carp_400.csv

#################################################################
                            carp                              
#################################################################
      Running UMAP with n_neighbors = 500 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=500, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:42:47 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:42:59 2024 Finding Nearest Neighbors
Thu Apr 18 19:42:59 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:43:00 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:43:33 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_carp_500.csv

#################################################################
                            carp                              
#################################################################
      Running UMAP with n_neighbors = 600 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=600, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:43:33 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:43:45 2024 Finding Nearest Neighbors
Thu Apr 18 19:43:45 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:43:45 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:44:19 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_carp_600.csv

#################################################################
                            carp                              
#################################################################
      Running UMAP with n_neighbors = 700 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=700, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:44:19 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:44:31 2024 Finding Nearest Neighbors
Thu Apr 18 19:44:31 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:44:32 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:45:07 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_carp_700.csv

#################################################################
                            carp                              
#################################################################
      Running UMAP with n_neighbors = 800 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=800, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:45:07 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:45:19 2024 Finding Nearest Neighbors
Thu Apr 18 19:45:19 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:45:20 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:45:56 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_carp_800.csv

#################################################################
                            carp                              
#################################################################
      Running UMAP with n_neighbors = 900 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=900, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:45:56 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:46:08 2024 Finding Nearest Neighbors
Thu Apr 18 19:46:08 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:46:08 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:46:46 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_carp_900.csv

#################################################################
                            carp                              
#################################################################
      Running UMAP with n_neighbors = 1000 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=1000, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:46:46 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:46:58 2024 Finding Nearest Neighbors
Thu Apr 18 19:46:58 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:46:59 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:47:36 2024 Finished embedding
Input embedding dimention: 1280
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_carp_1000.csv

#################################################################
                            t5xlu50                              
#################################################################
      Running UMAP with n_neighbors = 30 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=30, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:47:36 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:47:47 2024 Finding Nearest Neighbors
Thu Apr 18 19:47:47 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:47:47 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:48:01 2024 Finished embedding
Input embedding dimention: 1024
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_t5xlu50_30.csv

#################################################################
                            t5xlu50                              
#################################################################
      Running UMAP with n_neighbors = 50 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=50, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:48:01 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:48:12 2024 Finding Nearest Neighbors
Thu Apr 18 19:48:12 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:48:12 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:48:29 2024 Finished embedding
Input embedding dimention: 1024
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_t5xlu50_50.csv

#################################################################
                            t5xlu50                              
#################################################################
      Running UMAP with n_neighbors = 100 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=100, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:48:30 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:48:40 2024 Finding Nearest Neighbors
Thu Apr 18 19:48:40 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:48:40 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:49:02 2024 Finished embedding
Input embedding dimention: 1024
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_t5xlu50_100.csv

#################################################################
                            t5xlu50                              
#################################################################
      Running UMAP with n_neighbors = 200 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=200, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:49:02 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:49:12 2024 Finding Nearest Neighbors
Thu Apr 18 19:49:12 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:49:12 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:49:39 2024 Finished embedding
Input embedding dimention: 1024
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_t5xlu50_200.csv

#################################################################
                            t5xlu50                              
#################################################################
      Running UMAP with n_neighbors = 300 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=300, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:49:39 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:49:49 2024 Finding Nearest Neighbors
Thu Apr 18 19:49:49 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:49:50 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:50:19 2024 Finished embedding
Input embedding dimention: 1024
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_t5xlu50_300.csv

#################################################################
                            t5xlu50                              
#################################################################
      Running UMAP with n_neighbors = 400 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=400, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:50:19 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:50:29 2024 Finding Nearest Neighbors
Thu Apr 18 19:50:30 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:50:30 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:51:02 2024 Finished embedding
Input embedding dimention: 1024
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_t5xlu50_400.csv

#################################################################
                            t5xlu50                              
#################################################################
      Running UMAP with n_neighbors = 500 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=500, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:51:02 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:51:13 2024 Finding Nearest Neighbors
Thu Apr 18 19:51:13 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:51:13 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:51:47 2024 Finished embedding
Input embedding dimention: 1024
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_t5xlu50_500.csv

#################################################################
                            t5xlu50                              
#################################################################
      Running UMAP with n_neighbors = 600 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=600, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:51:47 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:51:57 2024 Finding Nearest Neighbors
Thu Apr 18 19:51:57 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:51:58 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:52:33 2024 Finished embedding
Input embedding dimention: 1024
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_t5xlu50_600.csv

#################################################################
                            t5xlu50                              
#################################################################
      Running UMAP with n_neighbors = 700 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=700, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:52:33 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:52:44 2024 Finding Nearest Neighbors
Thu Apr 18 19:52:44 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:52:44 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:53:21 2024 Finished embedding
Input embedding dimention: 1024
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_t5xlu50_700.csv

#################################################################
                            t5xlu50                              
#################################################################
      Running UMAP with n_neighbors = 800 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=800, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:53:21 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:53:31 2024 Finding Nearest Neighbors
Thu Apr 18 19:53:31 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:53:32 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:54:10 2024 Finished embedding
Input embedding dimention: 1024
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_t5xlu50_800.csv

#################################################################
                            t5xlu50                              
#################################################################
      Running UMAP with n_neighbors = 900 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=900, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:54:11 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:54:21 2024 Finding Nearest Neighbors
Thu Apr 18 19:54:21 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:54:22 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:55:01 2024 Finished embedding
Input embedding dimention: 1024
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_t5xlu50_900.csv

#################################################################
                            t5xlu50                              
#################################################################
      Running UMAP with n_neighbors = 1000 | dataset = MBL
#################################################################

UMAP(angular_rp_forest=True, metric='cosine', min_dist=0.2, n_epochs=2000, n_neighbors=1000, random_state=42, spread=0.2, verbose=True)
Thu Apr 18 19:55:01 2024 Construct fuzzy simplicial set


  warn(f"n_jobs value {self.n_jobs} overridden to 1 by setting random_state. Use no seed for parallelism.")


Thu Apr 18 19:55:11 2024 Finding Nearest Neighbors
Thu Apr 18 19:55:11 2024 Finished Nearest Neighbor Search
Thu Apr 18 19:55:12 2024 Construct embedding


Epochs completed:   0%|            0/2000 [00:00]

	completed  0  /  2000 epochs
	completed  200  /  2000 epochs
	completed  400  /  2000 epochs
	completed  600  /  2000 epochs
	completed  800  /  2000 epochs
	completed  1000  /  2000 epochs
	completed  1200  /  2000 epochs
	completed  1400  /  2000 epochs
	completed  1600  /  2000 epochs
	completed  1800  /  2000 epochs
Thu Apr 18 19:55:52 2024 Finished embedding
Input embedding dimention: 1024
Data points: 3468
Results saved at: ../bldb/lowdim/umap/umap_mbl_t5xlu50_1000.csv



# parse

Due to an error in the above code, where I forget to put the nn value in the columns, I need to run this code to rename the umap dims to add the nn value 


```bash 
for file in *.csv; do
    number=$(echo "$file" | grep -oP '\d+(?=.csv)')
    sed -i "1 s/,/_$number,/; 1 s/$/_$number/" "$file"; done
```

## mbl

In [4]:
cols = [0, 1]

In [5]:
path = "../bldb/lowdim/umap/"
mbl_id = mbl[["seq_id"]]

In [10]:
ids_mbl = pd.read_csv(join(path,"mbl_ids.csv"))

df30   = pd.read_csv(join(path,"umap_mbl_esm1b_30.csv"), usecols=cols)
df50   = pd.read_csv(join(path,"umap_mbl_esm1b_50.csv"), usecols=cols)
df100  = pd.read_csv(join(path,"umap_mbl_esm1b_100.csv"), usecols=cols)
df200  = pd.read_csv(join(path,"umap_mbl_esm1b_200.csv"), usecols=cols)
df300  = pd.read_csv(join(path,"umap_mbl_esm1b_300.csv"), usecols=cols)
df400  = pd.read_csv(join(path,"umap_mbl_esm1b_400.csv"), usecols=cols)
df500  = pd.read_csv(join(path,"umap_mbl_esm1b_500.csv"), usecols=cols)
df600  = pd.read_csv(join(path,"umap_mbl_esm1b_600.csv"), usecols=cols)
df700  = pd.read_csv(join(path,"umap_mbl_esm1b_700.csv"), usecols=cols)
df800  = pd.read_csv(join(path,"umap_mbl_esm1b_800.csv"), usecols=cols)
df900  = pd.read_csv(join(path,"umap_mbl_esm1b_900.csv"), usecols=cols)
df1000 = pd.read_csv(join(path,"umap_mbl_esm1b_1000.csv"), usecols=cols)

df = pd.concat([ids_mbl, df30, df50, df100, df200, df300, df400, df500, df600, df700, df800, df900, df1000], axis=1)
df.columns = df.columns.str.lower()
print(f"data size = {len(df)}")
df.columns

data size = 3468


Index(['seq_id', 'umap1_esm1b_30', 'umap2_esm1b_30', 'umap1_esm1b_50',
       'umap2_esm1b_50', 'umap1_esm1b_100', 'umap2_esm1b_100',
       'umap1_esm1b_200', 'umap2_esm1b_200', 'umap1_esm1b_300',
       'umap2_esm1b_300', 'umap1_esm1b_400', 'umap2_esm1b_400',
       'umap1_esm1b_500', 'umap2_esm1b_500', 'umap1_esm1b_600',
       'umap2_esm1b_600', 'umap1_esm1b_700', 'umap2_esm1b_700',
       'umap1_esm1b_800', 'umap2_esm1b_800', 'umap1_esm1b_900',
       'umap2_esm1b_900', 'umap1_esm1b_1000', 'umap2_esm1b_1000'],
      dtype='object')

In [13]:
df.to_csv("../bldb/lowdim/umap/merge/umap_mbl_esm1b.csv", index=False)

In [14]:
df30   = pd.read_csv(join(path,"umap_mbl_esm2_3b_30.csv"), usecols=cols)
df50   = pd.read_csv(join(path,"umap_mbl_esm2_3b_50.csv"), usecols=cols)
df100  = pd.read_csv(join(path,"umap_mbl_esm2_3b_100.csv"), usecols=cols)
df200  = pd.read_csv(join(path,"umap_mbl_esm2_3b_200.csv"), usecols=cols)
df300  = pd.read_csv(join(path,"umap_mbl_esm2_3b_300.csv"), usecols=cols)
df400  = pd.read_csv(join(path,"umap_mbl_esm2_3b_400.csv"), usecols=cols)
df500  = pd.read_csv(join(path,"umap_mbl_esm2_3b_500.csv"), usecols=cols)
df600  = pd.read_csv(join(path,"umap_mbl_esm2_3b_600.csv"), usecols=cols)
df700  = pd.read_csv(join(path,"umap_mbl_esm2_3b_700.csv"), usecols=cols)
df800  = pd.read_csv(join(path,"umap_mbl_esm2_3b_800.csv"), usecols=cols)
df900  = pd.read_csv(join(path,"umap_mbl_esm2_3b_900.csv"), usecols=cols)
df1000 = pd.read_csv(join(path,"umap_mbl_esm2_3b_1000.csv"), usecols=cols)

df = pd.concat([ids_mbl, df30, df50, df100, df200, df300, df400, df500, df600, df700, df800, df900, df1000], axis=1)
df.columns = df.columns.str.lower()
print(f"data size = {len(df)}")
df.columns

data size = 3468


Index(['seq_id', 'umap1_esm2_3b_30', 'umap2_esm2_3b_30', 'umap1_esm2_3b_50',
       'umap2_esm2_3b_50', 'umap1_esm2_3b_100', 'umap2_esm2_3b_100',
       'umap1_esm2_3b_200', 'umap2_esm2_3b_200', 'umap1_esm2_3b_300',
       'umap2_esm2_3b_300', 'umap1_esm2_3b_400', 'umap2_esm2_3b_400',
       'umap1_esm2_3b_500', 'umap2_esm2_3b_500', 'umap1_esm2_3b_600',
       'umap2_esm2_3b_600', 'umap1_esm2_3b_700', 'umap2_esm2_3b_700',
       'umap1_esm2_3b_800', 'umap2_esm2_3b_800', 'umap1_esm2_3b_900',
       'umap2_esm2_3b_900', 'umap1_esm2_3b_1000', 'umap2_esm2_3b_1000'],
      dtype='object')

In [15]:
df.to_csv("../bldb/lowdim/umap/merge/umap_mbl_esm2_3b.csv", index=False)

In [16]:
df30   = pd.read_csv(join(path,"umap_mbl_esm2_650m_30.csv"), usecols=cols)
df50   = pd.read_csv(join(path,"umap_mbl_esm2_650m_50.csv"), usecols=cols)
df100  = pd.read_csv(join(path,"umap_mbl_esm2_650m_100.csv"), usecols=cols)
df200  = pd.read_csv(join(path,"umap_mbl_esm2_650m_200.csv"), usecols=cols)
df300  = pd.read_csv(join(path,"umap_mbl_esm2_650m_300.csv"), usecols=cols)
df400  = pd.read_csv(join(path,"umap_mbl_esm2_650m_400.csv"), usecols=cols)
df500  = pd.read_csv(join(path,"umap_mbl_esm2_650m_500.csv"), usecols=cols)
df600  = pd.read_csv(join(path,"umap_mbl_esm2_650m_600.csv"), usecols=cols)
df700  = pd.read_csv(join(path,"umap_mbl_esm2_650m_700.csv"), usecols=cols)
df800  = pd.read_csv(join(path,"umap_mbl_esm2_650m_800.csv"), usecols=cols)
df900  = pd.read_csv(join(path,"umap_mbl_esm2_650m_900.csv"), usecols=cols)
df1000 = pd.read_csv(join(path,"umap_mbl_esm2_650m_1000.csv"), usecols=cols)

df = pd.concat([ids_mbl, df30, df50, df100, df200, df300, df400, df500, df600, df700, df800, df900, df1000], axis=1)
df.columns = df.columns.str.lower()
print(f"data size = {len(df)}")
df.columns

data size = 3468


Index(['seq_id', 'umap1_esm2_650m_30', 'umap2_esm2_650m_30',
       'umap1_esm2_650m_50', 'umap2_esm2_650m_50', 'umap1_esm2_650m_100',
       'umap2_esm2_650m_100', 'umap1_esm2_650m_200', 'umap2_esm2_650m_200',
       'umap1_esm2_650m_300', 'umap2_esm2_650m_300', 'umap1_esm2_650m_400',
       'umap2_esm2_650m_400', 'umap1_esm2_650m_500', 'umap2_esm2_650m_500',
       'umap1_esm2_650m_600', 'umap2_esm2_650m_600', 'umap1_esm2_650m_700',
       'umap2_esm2_650m_700', 'umap1_esm2_650m_800', 'umap2_esm2_650m_800',
       'umap1_esm2_650m_900', 'umap2_esm2_650m_900', 'umap1_esm2_650m_1000',
       'umap2_esm2_650m_1000'],
      dtype='object')

In [17]:
df.to_csv("../bldb/lowdim/umap/merge/umap_mbl_esm2_650m.csv", index=False)

In [18]:
df30   = pd.read_csv(join(path,"umap_mbl_carp_30.csv"), usecols=cols)
df50   = pd.read_csv(join(path,"umap_mbl_carp_50.csv"), usecols=cols)
df100  = pd.read_csv(join(path,"umap_mbl_carp_100.csv"), usecols=cols)
df200  = pd.read_csv(join(path,"umap_mbl_carp_200.csv"), usecols=cols)
df300  = pd.read_csv(join(path,"umap_mbl_carp_300.csv"), usecols=cols)
df400  = pd.read_csv(join(path,"umap_mbl_carp_400.csv"), usecols=cols)
df500  = pd.read_csv(join(path,"umap_mbl_carp_500.csv"), usecols=cols)
df600  = pd.read_csv(join(path,"umap_mbl_carp_600.csv"), usecols=cols)
df700  = pd.read_csv(join(path,"umap_mbl_carp_700.csv"), usecols=cols)
df800  = pd.read_csv(join(path,"umap_mbl_carp_800.csv"), usecols=cols)
df900  = pd.read_csv(join(path,"umap_mbl_carp_900.csv"), usecols=cols)
df1000 = pd.read_csv(join(path,"umap_mbl_carp_1000.csv"), usecols=cols)

df = pd.concat([ids_mbl, df30, df50, df100, df200, df300, df400, df500, df600, df700, df800, df900, df1000], axis=1)
df.columns = df.columns.str.lower()
print(f"data size = {len(df)}")
df.columns

data size = 3468


Index(['seq_id', 'umap1_carp_30', 'umap2_carp_30', 'umap1_carp_50',
       'umap2_carp_50', 'umap1_carp_100', 'umap2_carp_100', 'umap1_carp_200',
       'umap2_carp_200', 'umap1_carp_300', 'umap2_carp_300', 'umap1_carp_400',
       'umap2_carp_400', 'umap1_carp_500', 'umap2_carp_500', 'umap1_carp_600',
       'umap2_carp_600', 'umap1_carp_700', 'umap2_carp_700', 'umap1_carp_800',
       'umap2_carp_800', 'umap1_carp_900', 'umap2_carp_900', 'umap1_carp_1000',
       'umap2_carp_1000'],
      dtype='object')

In [19]:
df.to_csv("../bldb/lowdim/umap/merge/umap_mbl_carp.csv", index=False)

In [20]:
df30   = pd.read_csv(join(path,"umap_mbl_t5xlu50_30.csv"), usecols=cols)
df50   = pd.read_csv(join(path,"umap_mbl_t5xlu50_50.csv"), usecols=cols)
df100  = pd.read_csv(join(path,"umap_mbl_t5xlu50_100.csv"), usecols=cols)
df200  = pd.read_csv(join(path,"umap_mbl_t5xlu50_200.csv"), usecols=cols)
df300  = pd.read_csv(join(path,"umap_mbl_t5xlu50_300.csv"), usecols=cols)
df400  = pd.read_csv(join(path,"umap_mbl_t5xlu50_400.csv"), usecols=cols)
df500  = pd.read_csv(join(path,"umap_mbl_t5xlu50_500.csv"), usecols=cols)
df600  = pd.read_csv(join(path,"umap_mbl_t5xlu50_600.csv"), usecols=cols)
df700  = pd.read_csv(join(path,"umap_mbl_t5xlu50_700.csv"), usecols=cols)
df800  = pd.read_csv(join(path,"umap_mbl_t5xlu50_800.csv"), usecols=cols)
df900  = pd.read_csv(join(path,"umap_mbl_t5xlu50_900.csv"), usecols=cols)
df1000 = pd.read_csv(join(path,"umap_mbl_t5xlu50_1000.csv"), usecols=cols)

df = pd.concat([ids_mbl, df30, df50, df100, df200, df300, df400, df500, df600, df700, df800, df900, df1000], axis=1)
df.columns = df.columns.str.lower()
print(f"data size = {len(df)}")
df.columns

data size = 3468


Index(['seq_id', 'umap1_t5xlu50_30', 'umap2_t5xlu50_30', 'umap1_t5xlu50_50',
       'umap2_t5xlu50_50', 'umap1_t5xlu50_100', 'umap2_t5xlu50_100',
       'umap1_t5xlu50_200', 'umap2_t5xlu50_200', 'umap1_t5xlu50_300',
       'umap2_t5xlu50_300', 'umap1_t5xlu50_400', 'umap2_t5xlu50_400',
       'umap1_t5xlu50_500', 'umap2_t5xlu50_500', 'umap1_t5xlu50_600',
       'umap2_t5xlu50_600', 'umap1_t5xlu50_700', 'umap2_t5xlu50_700',
       'umap1_t5xlu50_800', 'umap2_t5xlu50_800', 'umap1_t5xlu50_900',
       'umap2_t5xlu50_900', 'umap1_t5xlu50_1000', 'umap2_t5xlu50_1000'],
      dtype='object')

In [21]:
df.to_csv("../bldb/lowdim/umap/merge/umap_mbl_t5xlu50.csv", index=False)

## sbl

In [3]:
sbl_id = sbl[["seq_id"]]

In [22]:
ids_sbl = pd.read_csv(join(path,"sbl_ids.csv"))

df30   = pd.read_csv(join(path,"umap_sbl_esm1b_30.csv"), usecols=cols)
df50   = pd.read_csv(join(path,"umap_sbl_esm1b_50.csv"), usecols=cols)
df100  = pd.read_csv(join(path,"umap_sbl_esm1b_100.csv"), usecols=cols)
df200  = pd.read_csv(join(path,"umap_sbl_esm1b_200.csv"), usecols=cols)
df300  = pd.read_csv(join(path,"umap_sbl_esm1b_300.csv"), usecols=cols)
df400  = pd.read_csv(join(path,"umap_sbl_esm1b_400.csv"), usecols=cols)
df500  = pd.read_csv(join(path,"umap_sbl_esm1b_500.csv"), usecols=cols)
df600  = pd.read_csv(join(path,"umap_sbl_esm1b_600.csv"), usecols=cols)
df700  = pd.read_csv(join(path,"umap_sbl_esm1b_700.csv"), usecols=cols)
df800  = pd.read_csv(join(path,"umap_sbl_esm1b_800.csv"), usecols=cols)
df900  = pd.read_csv(join(path,"umap_sbl_esm1b_900.csv"), usecols=cols)
df1000 = pd.read_csv(join(path,"umap_sbl_esm1b_1000.csv"), usecols=cols)

df = pd.concat([ids_sbl, df30, df50, df100, df200, df300, df400, df500, df600, df700, df800, df900, df1000], axis=1)
df.columns = df.columns.str.lower()
print(f"data size = {len(df)}")
df.columns

data size = 25961


Index(['seq_id', 'umap1_esm1b_30', 'umap2_esm1b_30', 'umap1_esm1b_50',
       'umap2_esm1b_50', 'umap1_esm1b_100', 'umap2_esm1b_100',
       'umap1_esm1b_200', 'umap2_esm1b_200', 'umap1_esm1b_300',
       'umap2_esm1b_300', 'umap1_esm1b_400', 'umap2_esm1b_400',
       'umap1_esm1b_500', 'umap2_esm1b_500', 'umap1_esm1b_600',
       'umap2_esm1b_600', 'umap1_esm1b_700', 'umap2_esm1b_700',
       'umap1_esm1b_800', 'umap2_esm1b_800', 'umap1_esm1b_900',
       'umap2_esm1b_900', 'umap1_esm1b_1000', 'umap2_esm1b_1000'],
      dtype='object')

In [23]:
df.to_csv("../bldb/lowdim/umap/merge/umap_sbl_esm1b.csv", index=False)

In [24]:
df30   = pd.read_csv(join(path,"umap_sbl_esm2_3b_30.csv"), usecols=cols)
df50   = pd.read_csv(join(path,"umap_sbl_esm2_3b_50.csv"), usecols=cols)
df100  = pd.read_csv(join(path,"umap_sbl_esm2_3b_100.csv"), usecols=cols)
df200  = pd.read_csv(join(path,"umap_sbl_esm2_3b_200.csv"), usecols=cols)
df300  = pd.read_csv(join(path,"umap_sbl_esm2_3b_300.csv"), usecols=cols)
df400  = pd.read_csv(join(path,"umap_sbl_esm2_3b_400.csv"), usecols=cols)
df500  = pd.read_csv(join(path,"umap_sbl_esm2_3b_500.csv"), usecols=cols)
df600  = pd.read_csv(join(path,"umap_sbl_esm2_3b_600.csv"), usecols=cols)
df700  = pd.read_csv(join(path,"umap_sbl_esm2_3b_700.csv"), usecols=cols)
df800  = pd.read_csv(join(path,"umap_sbl_esm2_3b_800.csv"), usecols=cols)
df900  = pd.read_csv(join(path,"umap_sbl_esm2_3b_900.csv"), usecols=cols)
df1000 = pd.read_csv(join(path,"umap_sbl_esm2_3b_1000.csv"), usecols=cols)

df = pd.concat([ids_sbl, df30, df50, df100, df200, df300, df400, df500, df600, df700, df800, df900, df1000], axis=1)
df.columns = df.columns.str.lower()
print(f"data size = {len(df)}")
df.columns

data size = 25961


Index(['seq_id', 'umap1_esm2_3b_30', 'umap2_esm2_3b_30', 'umap1_esm2_3b_50',
       'umap2_esm2_3b_50', 'umap1_esm2_3b_100', 'umap2_esm2_3b_100',
       'umap1_esm2_3b_200', 'umap2_esm2_3b_200', 'umap1_esm2_3b_300',
       'umap2_esm2_3b_300', 'umap1_esm2_3b_400', 'umap2_esm2_3b_400',
       'umap1_esm2_3b_500', 'umap2_esm2_3b_500', 'umap1_esm2_3b_600',
       'umap2_esm2_3b_600', 'umap1_esm2_3b_700', 'umap2_esm2_3b_700',
       'umap1_esm2_3b_800', 'umap2_esm2_3b_800', 'umap1_esm2_3b_900',
       'umap2_esm2_3b_900', 'umap1_esm2_3b_1000', 'umap2_esm2_3b_1000'],
      dtype='object')

In [25]:
df.to_csv("../bldb/lowdim/umap/merge/umap_sbl_esm2_3b.csv", index=False)

In [26]:
df30   = pd.read_csv(join(path,"umap_sbl_esm2_650m_30.csv"), usecols=cols)
df50   = pd.read_csv(join(path,"umap_sbl_esm2_650m_50.csv"), usecols=cols)
df100  = pd.read_csv(join(path,"umap_sbl_esm2_650m_100.csv"), usecols=cols)
df200  = pd.read_csv(join(path,"umap_sbl_esm2_650m_200.csv"), usecols=cols)
df300  = pd.read_csv(join(path,"umap_sbl_esm2_650m_300.csv"), usecols=cols)
df400  = pd.read_csv(join(path,"umap_sbl_esm2_650m_400.csv"), usecols=cols)
df500  = pd.read_csv(join(path,"umap_sbl_esm2_650m_500.csv"), usecols=cols)
df600  = pd.read_csv(join(path,"umap_sbl_esm2_650m_600.csv"), usecols=cols)
df700  = pd.read_csv(join(path,"umap_sbl_esm2_650m_700.csv"), usecols=cols)
df800  = pd.read_csv(join(path,"umap_sbl_esm2_650m_800.csv"), usecols=cols)
df900  = pd.read_csv(join(path,"umap_sbl_esm2_650m_900.csv"), usecols=cols)
df1000 = pd.read_csv(join(path,"umap_sbl_esm2_650m_1000.csv"), usecols=cols)

df = pd.concat([ids_sbl, df30, df50, df100, df200, df300, df400, df500, df600, df700, df800, df900, df1000], axis=1)
df.columns = df.columns.str.lower()
print(f"data size = {len(df)}")
df.columns

data size = 25961


Index(['seq_id', 'umap1_esm2_650m_30', 'umap2_esm2_650m_30',
       'umap1_esm2_650m_50', 'umap2_esm2_650m_50', 'umap1_esm2_650m_100',
       'umap2_esm2_650m_100', 'umap1_esm2_650m_200', 'umap2_esm2_650m_200',
       'umap1_esm2_650m_300', 'umap2_esm2_650m_300', 'umap1_esm2_650m_400',
       'umap2_esm2_650m_400', 'umap1_esm2_650m_500', 'umap2_esm2_650m_500',
       'umap1_esm2_650m_600', 'umap2_esm2_650m_600', 'umap1_esm2_650m_700',
       'umap2_esm2_650m_700', 'umap1_esm2_650m_800', 'umap2_esm2_650m_800',
       'umap1_esm2_650m_900', 'umap2_esm2_650m_900', 'umap1_esm2_650m_1000',
       'umap2_esm2_650m_1000'],
      dtype='object')

In [27]:
df.to_csv("../bldb/lowdim/umap/merge/umap_sbl_esm2_650m.csv", index=False)

In [28]:
df30   = pd.read_csv(join(path,"umap_sbl_carp_30.csv"), usecols=cols)
df50   = pd.read_csv(join(path,"umap_sbl_carp_50.csv"), usecols=cols)
df100  = pd.read_csv(join(path,"umap_sbl_carp_100.csv"), usecols=cols)
df200  = pd.read_csv(join(path,"umap_sbl_carp_200.csv"), usecols=cols)
df300  = pd.read_csv(join(path,"umap_sbl_carp_300.csv"), usecols=cols)
df400  = pd.read_csv(join(path,"umap_sbl_carp_400.csv"), usecols=cols)
df500  = pd.read_csv(join(path,"umap_sbl_carp_500.csv"), usecols=cols)
df600  = pd.read_csv(join(path,"umap_sbl_carp_600.csv"), usecols=cols)
df700  = pd.read_csv(join(path,"umap_sbl_carp_700.csv"), usecols=cols)
df800  = pd.read_csv(join(path,"umap_sbl_carp_800.csv"), usecols=cols)
df900  = pd.read_csv(join(path,"umap_sbl_carp_900.csv"), usecols=cols)
df1000 = pd.read_csv(join(path,"umap_sbl_carp_1000.csv"), usecols=cols)

df = pd.concat([ids_sbl, df30, df50, df100, df200, df300, df400, df500, df600, df700, df800, df900, df1000], axis=1)
df.columns = df.columns.str.lower()
print(f"data size = {len(df)}")
df.columns

data size = 25961


Index(['seq_id', 'umap1_carp_30', 'umap2_carp_30', 'umap1_carp_50',
       'umap2_carp_50', 'umap1_carp_100', 'umap2_carp_100', 'umap1_carp_200',
       'umap2_carp_200', 'umap1_carp_300', 'umap2_carp_300', 'umap1_carp_400',
       'umap2_carp_400', 'umap1_carp_500', 'umap2_carp_500', 'umap1_carp_600',
       'umap2_carp_600', 'umap1_carp_700', 'umap2_carp_700', 'umap1_carp_800',
       'umap2_carp_800', 'umap1_carp_900', 'umap2_carp_900', 'umap1_carp_1000',
       'umap2_carp_1000'],
      dtype='object')

In [29]:
df.to_csv("../bldb/lowdim/umap/merge/umap_sbl_carp.csv", index=False)

In [30]:
df30   = pd.read_csv(join(path,"umap_sbl_t5xlu50_30.csv"), usecols=cols)
df50   = pd.read_csv(join(path,"umap_sbl_t5xlu50_50.csv"), usecols=cols)
df100  = pd.read_csv(join(path,"umap_sbl_t5xlu50_100.csv"), usecols=cols)
df200  = pd.read_csv(join(path,"umap_sbl_t5xlu50_200.csv"), usecols=cols)
df300  = pd.read_csv(join(path,"umap_sbl_t5xlu50_300.csv"), usecols=cols)
df400  = pd.read_csv(join(path,"umap_sbl_t5xlu50_400.csv"), usecols=cols)
df500  = pd.read_csv(join(path,"umap_sbl_t5xlu50_500.csv"), usecols=cols)
df600  = pd.read_csv(join(path,"umap_sbl_t5xlu50_600.csv"), usecols=cols)
df700  = pd.read_csv(join(path,"umap_sbl_t5xlu50_700.csv"), usecols=cols)
df800  = pd.read_csv(join(path,"umap_sbl_t5xlu50_800.csv"), usecols=cols)
df900  = pd.read_csv(join(path,"umap_sbl_t5xlu50_900.csv"), usecols=cols)
df1000 = pd.read_csv(join(path,"umap_sbl_t5xlu50_1000.csv"), usecols=cols)

df = pd.concat([ids_sbl, df30, df50, df100, df200, df300, df400, df500, df600, df700, df800, df900, df1000], axis=1)
df.columns = df.columns.str.lower()
print(f"data size = {len(df)}")
df.columns

data size = 25961


Index(['seq_id', 'umap1_t5xlu50_30', 'umap2_t5xlu50_30', 'umap1_t5xlu50_50',
       'umap2_t5xlu50_50', 'umap1_t5xlu50_100', 'umap2_t5xlu50_100',
       'umap1_t5xlu50_200', 'umap2_t5xlu50_200', 'umap1_t5xlu50_300',
       'umap2_t5xlu50_300', 'umap1_t5xlu50_400', 'umap2_t5xlu50_400',
       'umap1_t5xlu50_500', 'umap2_t5xlu50_500', 'umap1_t5xlu50_600',
       'umap2_t5xlu50_600', 'umap1_t5xlu50_700', 'umap2_t5xlu50_700',
       'umap1_t5xlu50_800', 'umap2_t5xlu50_800', 'umap1_t5xlu50_900',
       'umap2_t5xlu50_900', 'umap1_t5xlu50_1000', 'umap2_t5xlu50_1000'],
      dtype='object')

In [31]:
df.to_csv("../bldb/lowdim/umap/merge/umap_sbl_t5xlu50.csv", index=False)

# merge all

In [34]:
ls ../bldb/lowdim/umap/merge/ -1

[0m[01;32mumap_mbl_carp_3b.csv[0m*
[01;32mumap_mbl_esm1b.csv[0m*
[01;32mumap_mbl_esm2_3b.csv[0m*
[01;32mumap_mbl_esm2_650m_3b.csv[0m*
[01;32mumap_mbl_t5xlu50.csv[0m*
[01;32mumap_sbl_carp.csv[0m*
[01;32mumap_sbl_esm1b.csv[0m*
[01;32mumap_sbl_esm2_3b.csv[0m*
[01;32mumap_sbl_esm2_650m.csv[0m*
[01;32mumap_sbl_t5xlu50.csv[0m*


In [38]:
# load umap  
mbl_carp      = pd.read_csv("../bldb/lowdim/umap/merge/umap_mbl_carp.csv")
mbl_esm1b     = pd.read_csv("../bldb/lowdim/umap/merge/umap_mbl_esm1b.csv")
mbl_esm2_3b   = pd.read_csv("../bldb/lowdim/umap/merge/umap_mbl_esm2_3b.csv")
mbl_esm2_650m = pd.read_csv("../bldb/lowdim/umap/merge/umap_mbl_esm2_650m.csv")
mbl_t5        = pd.read_csv("../bldb/lowdim/umap/merge/umap_mbl_t5xlu50.csv")

sbl_carp      = pd.read_csv("../bldb/lowdim/umap/merge/umap_sbl_carp.csv")
sbl_esm1b     = pd.read_csv("../bldb/lowdim/umap/merge/umap_sbl_esm1b.csv")
sbl_esm2_3b   = pd.read_csv("../bldb/lowdim/umap/merge/umap_sbl_esm2_3b.csv")
sbl_esm2_650m = pd.read_csv("../bldb/lowdim/umap/merge/umap_sbl_esm2_650m.csv")
sbl_t5        = pd.read_csv("../bldb/lowdim/umap/merge/umap_sbl_t5xlu50.csv")

# merge
umap_sbl = pd.merge(sbl_esm1b, sbl_esm2_3b, on="seq_id",how="inner")
umap_sbl = umap_sbl.merge(sbl_esm2_650m, on="seq_id",how="inner")
umap_sbl = umap_sbl.merge(sbl_carp, on="seq_id",how="inner")
umap_sbl = umap_sbl.merge(sbl_t5, on="seq_id",how="inner")
umap_sbl.to_parquet("../bldb/lowdim/umap/merge/umap_sbl_all_models.parquet", index=False)

umap_mbl = pd.merge(mbl_carp, mbl_esm1b, on="seq_id",how="inner")
umap_mbl = umap_mbl.merge(mbl_esm2_3b, on="seq_id",how="inner")
umap_mbl = umap_mbl.merge(mbl_esm2_650m, on="seq_id",how="inner")
umap_mbl = umap_mbl.merge(mbl_t5, on="seq_id",how="inner")
umap_mbl.to_parquet("../bldb/lowdim/umap/merge/umap_mbl_all_models.parquet", index=False)