In [None]:
import os
import sys
import yaml

# Location of the project configuration. The directory and file name are kept
# separate so either one can be changed independently.
config_file = "project_config_508469.yaml"
config_path = "/home/jgi_user/configs"
config_fname = os.path.join(config_path, config_file)

# Decode explicitly as UTF-8 so parsing does not depend on the locale's
# default encoding. safe_load is used, so no arbitrary Python objects are
# constructed from the YAML content.
with open(config_fname, 'r', encoding="utf-8") as file:
    config = yaml.safe_load(file)
print(f"Using config file: {config_fname}")

#sys.path.insert(0, "/home/jgi_user/tools")
import tools.objects as objs

In [None]:
# Initialize the project from the parsed YAML configuration (`config`)
project = objs.Project(config)

In [None]:
# Create datasets (which hold raw data and metadata); both are attached to the same project.
# NOTE(review): TX/MX presumably stand for transcriptomics/metabolomics, and
# clear_dataset_dir=False presumably keeps any existing dataset directory
# contents -- confirm against tools.objects.
tx_dataset = objs.TX(project, clear_dataset_dir=False)
mx_dataset = objs.MX(project, clear_dataset_dir=False)

In [None]:
# Build the analysis object: a collection of the TX and MX datasets plus the
# methods used to integrate them.
# NOTE(review): clear_analysis_dir=False presumably preserves output from
# earlier runs -- confirm against tools.objects.
analysis = objs.Analysis(
    project,
    datasets=[tx_dataset, mx_dataset],
    clear_analysis_dir=False,
)

In [None]:
# Fetch raw metadata and then raw data for each dataset (TX first, then MX).
# Results come from disk, from cache, or are generated from source.
for dataset in (tx_dataset, mx_dataset):
    dataset.get_raw_metadata(overwrite=False)
    dataset.get_raw_data(overwrite=False)

In [None]:
# Link analysis datasets by finding corresponding samples and metadata.
# Metadata is linked first, then the data.
# NOTE(review): overwrite=False presumably reuses previously saved results
# instead of recomputing them -- confirm against tools.objects.
analysis.link_metadata(overwrite=False)
analysis.link_data(overwrite=False)

In [None]:
# Filter out rare features from analysis datasets, based on minimum observed
# value or proportion of missing values across samples.
# NOTE(review): no thresholds are passed here; they presumably come from the
# project config -- confirm.
analysis.filter_all_datasets(overwrite=False)

In [None]:
# Filter out features from analysis datasets that were not impacted by
# experimentation, based on low variance across samples.
# NOTE(review): the variance cutoff is not passed here; presumably it is read
# from the project config -- confirm.
analysis.devariance_all_datasets(overwrite=False)

In [None]:
# Scale features in all analysis datasets to a shared, normalized distribution.
# NOTE(review): the scaling method is not chosen here; presumably it is set in
# the project config -- confirm.
analysis.scale_all_datasets(overwrite=False)

In [None]:
# Filter out features from analysis datasets based on low within-replicate
# reproducibility.
# NOTE(review): this runs after scaling in this notebook; whether the test
# depends on scaled values is not visible here -- confirm before reordering.
analysis.replicability_test_all_datasets(overwrite=False)

In [None]:
# Perform dataset integration of the linked metadata and data.
# Metadata is integrated first, then the data.
analysis.integrate_metadata(overwrite=False)
analysis.integrate_data(overwrite=False)

In [None]:
# Calculate correlated features.
# NOTE(review): no correlation parameters are passed in this call (only
# overwrite=False); any custom settings presumably come from the project
# config -- confirm.
analysis.calculate_correlated_features(overwrite=False)

In [None]:
# Subset features for network analysis.
# NOTE(review): the subsetting criteria are not passed here; presumably they
# are defined in the project config -- confirm.
analysis.subset_features_before_network_analysis(overwrite=False)

In [None]:
# Plot the correlation network.
# NOTE(review): overwrite=False presumably keeps an existing plot/output
# rather than regenerating it -- confirm against tools.objects.
analysis.plot_correlation_network(overwrite=False)