# Example
## Import necessary libraries

In [3]:
import pandas as pd
from rmsd_calculation import process_all_natives
from correlations import calculate_correlations , create_correlation_matrix
from visualizations import plot_correlation_matrix, plot_metrics_vs_cgRMSD
from scores_comparisons import concat_files

## Define the atom combinations you want to analyze

In [4]:
# Atom-name groups to analyze. Each whitespace-separated string below becomes
# one inner list of atom names (one "combination"); edit the strings to change
# which atoms are grouped together.
ATOM_COMBINATIONS = [
    atom_group.split()
    for atom_group in (
        "P",
        "O1' O2' O3'",
        "C1' C2' C3'",
        "C4' C5'",
    )
]

## cgRMSD calculations

In [None]:
# Data directories (placeholders -- replace them with your own locations).
# Judging by the names: native structures, predicted structures, and score
# files, in that order.
natives_dir, preds_dir, scores_dir = (
    "/path/to/NATIVE/",
    "/path/to/PREDS/",
    "/path/to/SCORES/",
)

# Run the coarse-grained RMSD (cgRMSD) calculation over every native structure
# and its predictions, once per atom combination in ATOM_COMBINATIONS.
process_all_natives(
    natives_dir,
    preds_dir,
    scores_dir,
    ATOM_COMBINATIONS,
)

## Correlations

In [None]:
# Files that will receive the correlation results, one per method.
corr_spearman = "./corr_spearman.csv"  # Spearman results
corr_pearson = "./corr_pearson.csv"  # Pearson results

# Correlate cgRMSD with the other metrics found in scores_dir (e.g. RMSD,
# TM-score), first with Spearman and then with Pearson.
for _method, _corr_file in (
    ("spearman", corr_spearman),
    ("pearson", corr_pearson),
):
    calculate_correlations(scores_dir, _corr_file, method=_method)

## Create correlation matrix

In [None]:
# Destination files for the correlation matrices (Spearman, then Pearson).
mtx_spearman, mtx_pearson = "./mtx_spearman.csv", "./mtx_pearson.csv"

# Turn each correlation results file into a correlation matrix that summarizes
# the coefficients between the metrics across all predictions.
for _corr_in, _mtx_out in zip(
    (corr_spearman, corr_pearson),
    (mtx_spearman, mtx_pearson),
):
    create_correlation_matrix(_corr_in, _mtx_out)

  

## Visualize the correlation matrix

In [None]:
# Image files for the correlation-matrix heatmaps (Spearman, then Pearson).
plot_mtx_spearman, plot_mtx_pearson = (
    "./plot_mtx_spearman.png",
    "./plot_mtx_pearson.png",
)

# Render each correlation matrix as a heatmap showing how the metrics
# (e.g. RMSD, cgRMSD) relate to one another.
plot_correlation_matrix(
    mtx_spearman,
    plot_mtx_spearman,
)
plot_correlation_matrix(
    mtx_pearson,
    plot_mtx_pearson,
)

## Score comparison

In [None]:
# Single CSV that will hold the scores (e.g. RMSD, cgRMSD) gathered from
# scores_dir for all native structures and their predictions.
all_scores_file = "./all_scores_file.csv"

# Merge the per-structure score files into that one CSV.
concat_files(
    scores_dir,
    all_scores_file,
)

## Visualize the score comparison plots

In [None]:
# Folder that receives the score-comparison plots (current directory here).
output_folder_plots = "./"

# Plot cgRMSD against the other metrics from the concatenated scores file, so
# the metrics and the tools that produced the predictions can be compared.
plot_metrics_vs_cgRMSD(
    all_scores_file,
    output_folder_plots,
)