# R2, NRC, and IQS

In [None]:
import pandas as pd

# Location of the combined results table to analyse.
# Swap this path for the NRC or IQS file to load a different metric.
results_csv = 'combined_R2_results.csv'

# Read the whole table into a pandas DataFrame.
df = pd.read_csv(results_csv)

# Sanity check: print the leading rows so the columns can be eyeballed.
preview = df.head()
print(preview)

In [None]:
import seaborn as sns
import matplotlib.pyplot as plt

import warnings

# Plot R² per MAF bin for each Tool/Coverage combination found in `df` and
# save the figure to R2_Distribution.png.
# NOTE: the y column ('R2'), the title, the axis label and the output file
# name are all hard-coded for R²; adjust them together when plotting a
# different metric.

# Apply the seaborn theme first so the figure and its axes are both created
# under the same rc settings, then open the figure.
sns.set(style="whitegrid")
plt.figure(figsize=(10, 6))

# MAF bin labels in ascending order; this order becomes the x-axis order.
maf_bins = [
    '0-0.05', '0.05-0.1', '0.1-0.15', '0.15-0.2',
    '0.2-0.25', '0.25-0.3', '0.3-0.35', '0.35-0.4',
    '0.4-0.45', '0.45-0.5',
]

# pd.Categorical silently turns every label that is not listed in
# `categories` into NaN, so a typo or a differently formatted bin would
# quietly go missing from the plot. Report such labels instead of hiding them.
unexpected_bins = set(df['MAF'].dropna().unique()) - set(maf_bins)
if unexpected_bins:
    warnings.warn(
        "MAF labels not in the expected bins will be treated as missing: "
        + ", ".join(sorted(map(str, unexpected_bins)))
    )

# Convert MAF to an ordered categorical so the bins keep their numeric order
# on the x-axis rather than whatever order they appear in the data.
df['MAF'] = pd.Categorical(df['MAF'], categories=maf_bins, ordered=True)

# One line per Tool (colour) and Coverage (marker); solid lines throughout.
sns.lineplot(
    data=df,
    x='MAF',
    y='R2',
    hue='Tool',
    style='Coverage',
    markers=True,
    dashes=False,
)

# Title and axis labels.
plt.title("R² - GLIMPSE2, QUILT v1.0.5 and STITCH v1.7.2", fontsize=16)
plt.xlabel("Minor Allele Frequency (MAF)", fontsize=12)
plt.ylabel("R²", fontsize=12)

# The bin labels are long; rotate them so they do not overlap.
plt.xticks(rotation=45)

# Tighten the layout before saving so the rotated labels are not clipped,
# and save before show() because show() may leave an empty current figure.
plt.tight_layout()
plt.savefig("R2_Distribution.png", dpi=300)
plt.show()