In [2]:
import pandas as pd
import matplotlib.pyplot as plt
%matplotlib inline
import numpy as np
import seaborn as sns
from scipy import stats

In [3]:
# Names of the runs handled by this notebook. Every name listed here has a
# matching key in tick_label_dict, which is what make_tick_labels looks up.
runs = [
    "run-no-ambig",
    "run-with-ambig-orig",
    "run-general-ambig",
    "run-no-ambig-0.05-expand",
    "run-with-ambig-0.05-expand-orig",
    "run-general-ambig-0.05-expand",
    "run-no-ambig-0.2-expand",
    "run-with-ambig-0.2-expand",
    "run-general-ambig-0.2-expand",
    "run-water-refine",
    "run-with-ambig",
    "run-with-ambig-0.05-expand",
    "run-cg-with-lig",
    "run-cg-water",
]

# Four-character structure identifiers; the same 14 IDs for which
# make_secondary_df reads a "<ID>_stride.csv" file.
succes_list = [
    "3J95",
    "3J96",
    "5GRS",
    "5HNY",
    "5WCB",
    "6ACG",
    "6AHF",
    "6IRF",
    "6N1Q",
    "6N7G",
    "6N8Z",
    "6R7I",
    "6UBY",
    "6UC0",
]

# Maps a run name to the text shown for it as a tick label. Runs listed in
# `runs` map to the numbers "1".."14"; the remaining entries carry
# descriptive labels.
tick_label_dict = {
    "run-no-ambig": "1",
    "run-with-ambig-orig": "2",
    "run-general-ambig": "3",
    "run-no-ambig-0.05-expand": "4",
    "run-with-ambig-0.05-expand-orig": "5",
    "run-general-ambig-0.05-expand": "6",
    "run-no-ambig-0.2-expand": "7",
    "run-with-ambig-0.2-expand": "8",
    "run-general-ambig-0.2-expand": "9",
    "run-cg": "coarse grained",
    "run-cg2": "coarse grained 2",
    "run-cg-with-lig": "13",
    "run-water-refine": "10",
    "run-no-ambig-0.05-expand-EM": "it1 no restraints 0.05 expand EM",
    "run-with-ambig-0.05-expand-EM": "it1 with restraints 0.05 expand EM",
    "run-general-ambig-0.05-expand-EM": "it1 general restraints 0.05 expand EM",
    "run-cg-water": "14",
    "run-general-ambig-EM": "it1 gr + EM",
    "run-with-ambig": "11",
    "run-with-ambig-0.05-expand": "12",
}

def make_tick_labels(runs):
    """Translate run names into their tick labels.

    Each entry of ``runs`` is looked up in the module-level
    ``tick_label_dict``; the labels are returned as a list in the same
    order as the input. A name that is not a key of the dictionary raises
    ``KeyError``.
    """
    return [tick_label_dict[name] for name in runs]

In [11]:
def get_ref_secondary():
    """Load the reference-structure table.

    Reads ``analysis/refrence-stride.csv`` (path relative to the current
    working directory), using the file's first column as the index, and
    returns the resulting DataFrame.
    """
    # NOTE(review): the file name is spelled "refrence"; kept exactly as-is,
    # confirm it matches the file on disk before renaming anything.
    return pd.read_csv("analysis/refrence-stride.csv", index_col=0)

# Structure IDs loaded when the caller does not pass its own selection.
# Same IDs, in the same order, as the notebook's `succes_list`.
_DEFAULT_STRIDE_STRUCTURES = (
    "3J95", "3J96", "5GRS", "5HNY", "5WCB", "6ACG", "6AHF",
    "6IRF", "6N1Q", "6N7G", "6N8Z", "6R7I", "6UBY", "6UC0",
)


def make_secondary_df(run, structures=None):
    """Load the per-structure stride CSV tables of one run.

    For every structure ID the file
    ``analysis/analysis_<run>/<ID>_stride.csv`` is read (path relative to
    the current working directory) with its ``structure`` column as the
    index.

    Parameters
    ----------
    run : str
        Run name without the ``analysis_`` prefix, e.g. ``"run-no-ambig"``.
    structures : iterable of str, optional
        Structure IDs to load. Defaults to the 14 IDs the notebook has
        always loaded, so existing calls behave exactly as before.

    Returns
    -------
    list of pandas.DataFrame
        One DataFrame per structure ID, in the order of ``structures``.

    Raises
    ------
    FileNotFoundError
        If one of the expected CSV files does not exist.
    """
    if structures is None:
        structures = _DEFAULT_STRIDE_STRUCTURES

    run_dir = "analysis_{}".format(run)
    # One read per structure replaces the former 14 copy-pasted statements.
    return [
        pd.read_csv(
            "analysis/{}/{}_stride.csv".format(run_dir, pdb_id),
            index_col="structure",
        )
        for pdb_id in structures
    ]

In [88]:
# Reference table returned by get_ref_secondary() (a single DataFrame).
ref_df = get_ref_secondary()
# NOTE: despite its name, stride_df is a list of DataFrames (one per
# structure), loaded here for the first entry of `runs`.
stride_df = make_secondary_df(runs[0])


In [94]:
# Express every reference value as a fraction of that row's "All" column.
ref = ref_df.div(ref_df["All"], axis=0)
for df in stride_df:
    # The first four characters of a row label are the structure ID; the
    # reference table is keyed by "<ID>.pdb". Read the ID from the first row
    # (not the second) so a frame holding a single row works too.
    struct = "{}.pdb".format(df.index[0][:4])
    # Keep columns 1..5 by position, then normalise each row by its "All" value.
    df = df.iloc[:, 1:6]
    df = df.div(df["All"], axis=0)
    # Difference between the run's fractions and the reference fractions,
    # scaled by 100.
    print(df.sub(ref.loc[struct]).mul(100))

                 Helix     Sheet      Turn      Coil  All
structure                                                
3J95_39w.pdb -0.215392 -0.949546  0.795457  0.369482  0.0
3J95_2w.pdb  -0.124853 -1.075116  0.672306  0.527663  0.0
3J95_36w.pdb -0.280659 -0.633595  0.421614  0.492641  0.0
3J95_10w.pdb -0.338843 -0.621853  0.030104  0.930592  0.0
                 Helix     Sheet      Turn      Coil  All
structure                                                
3J96_10w.pdb -0.724642 -0.853350  1.122981  0.455011  0.0
3J96_41w.pdb -0.684946 -0.432509  0.515346  0.602109  0.0
3J96_29w.pdb -0.600948 -1.261595  1.708524  0.154018  0.0
3J96_30w.pdb -0.612432 -0.374608  0.519769  0.467271  0.0
                 Helix     Sheet      Turn      Coil  All
structure                                                
5GRS_46w.pdb  4.038884 -2.069202  1.595834 -3.565515  0.0
5GRS_26w.pdb  3.541071 -1.961140  1.798046 -3.377977  0.0
5GRS_45w.pdb  3.908957 -2.736882  2.710204 -3.882279  0.0
5GRS_42w.pdb  