Reads the S phase genes from a tab-separated text file.

In [None]:
import pandas as pd

# Load the cell-cycle gene table into `data`. `read_table` treats its input
# as tab-delimited by default, so no explicit separator is passed.
data = pd.read_table('cell_cycle_genes_reactome_extended.txt')

Reads the G2/M phase genes from the `g2m_phase_genes` dataset of the processed HDF5 file (`processed_h5ad.h5`).

In [None]:
import h5py

# Open the file read-only; the context manager closes the handle on exit.
with h5py.File('processed_h5ad.h5', mode='r') as h5_file:
    # The `[:]` slice reads the dataset's contents while the file is still
    # open, so `g2m_genes` stays usable after the `with` block ends.
    # NOTE(review): assumes a 'g2m_phase_genes' dataset exists at the file
    # root -- a missing key would raise here; confirm against the file.
    g2m_genes = h5_file['g2m_phase_genes'][:]

Performs a two-component PCA on the `S_phase` and `G2M_phase` columns of the loaded table.

In [None]:
from sklearn.decomposition import PCA

# Columns of `data` that feed the decomposition.
# NOTE(review): assumes both columns exist in `data` and are numeric -- confirm.
phase_columns = ['S_phase', 'G2M_phase']

# Fit a two-component PCA and keep the projected coordinates in `results`;
# the fitted estimator remains available as `pca`.
pca = PCA(n_components=2)
results = pca.fit_transform(data[phase_columns])

Visualizes PCA results as a box plot.

In [None]:
import matplotlib.pyplot as plt

# Box plot of the PCA projection: matplotlib draws one box per column of a
# 2-D input, i.e. one box per principal component.
fig, ax = plt.subplots()
ax.boxplot(results)

# Without explicit labels the boxes are only numbered 1..n; name them after
# the component they represent so the figure can be read on its own.
ax.set_xticklabels([f'PC{i + 1}' for i in range(results.shape[1])])
ax.set_xlabel('Principal component')
ax.set_ylabel('Projected value')
ax.set_title('PCA Results')
plt.show()

Projects the PCA results into a UMAP embedding for further dimensionality reduction.

In [None]:
# FIXME(review): scikit-learn's `sklearn.manifold` module does not appear to
# export a `UMAP` class, so this import is expected to raise ImportError on a
# fresh kernel. UMAP is distributed separately as the `umap-learn` package
# (`from umap import UMAP`); switching requires adding that dependency --
# confirm it is available in the notebook environment before changing.
from sklearn.manifold import UMAP

# Default-constructed estimator: no seed is passed here, so the embedding is
# presumably not reproducible between runs -- consider fixing a random state.
# NOTE(review): if the import is changed to the `umap` package, the variable
# name `umap` would collide with that module name; consider renaming it then.
umap = UMAP()
# Fit on the PCA projection (`results`) and keep the embedded coordinates.
umap_results = umap.fit_transform(results)

Visualizes the mean of each UMAP component as a bar chart.

In [None]:
# Mean embedding value along each UMAP component (one value per column).
component_means = umap_results.mean(axis=0)

# Derive one label per component from the data. The previous hard-coded
# three labels did not match the number of components, and the means were
# wrapped in an extra list, so the bar call failed with a shape mismatch.
component_labels = [f'UMAP{i + 1}' for i in range(len(component_means))]

fig, ax = plt.subplots()
ax.bar(component_labels, component_means)
ax.set_xlabel('UMAP component')
ax.set_ylabel('Mean embedding value')
ax.set_title('UMAP Results')
plt.show()