# Notebook for testing and playing with TrajectoryDistances and TrajectoryDihedrals

In [1]:
import sbmlcore
import pandas as pd

In [2]:
# Small example table: one mutation per row, together with the segid it belongs to.
# N.B. each mutation string must include the offset.
b = {
    "segid": ["A", "A", "A", "B", "C", "C"],
    "mutation": ["I3D", "S4K", "Q5V", "R6D", "S450F", "D435F"],
}
df = pd.DataFrame(b)
df.columns

Index(['segid', 'mutation'], dtype='object')

In [3]:
# Build the "max RFP" distance feature from three trajectory files (runs 1-3).
# The trajectory paths are generated from the run number so that every path
# carries the same "./tests/" prefix.
a = sbmlcore.TrajectoryDistances(
    "./tests/rpob-5uh6-3-warm.gro.gz",
    [
        f"./tests/rpob-5uh6-3-md-{run}-50ns-dt10ns-nojump.xtc"
        for run in (1, 2, 3)
    ],
    "./tests/5uh6.pdb",
    "resname RFP",
    "max RFP",  # matches the feature column header in the table displayed below
    distance_type="max",  # presumably the per-residue maximum -- confirm in sbmlcore
    offsets={"A": 0, "B": 0, "C": -6},
    percentile_exclusion=True,
)
# Display the per-residue table held by the object.
a.return_dist_df()

[70.78370348 69.76235741 71.14507483 72.00016103 73.06823486 69.6177079
 74.16008073]
[71.85908283 70.49513922 71.77006758 72.98890875 71.52597925 71.17361911
 74.75063523]
[75.43100858 73.68251463 74.79722268 76.22656107 74.08990704 74.45799378
 78.39320796]
[75.37050484 72.19567691 73.06146799 74.44602501 73.2602862  72.5325066
 77.73912516]
[74.03663109 70.32327815 70.95108609 71.39838507 71.53749609 70.08382141
 75.96488957]
[70.65129477 66.77504434 67.60916973 67.86798694 67.94321466 66.58620213
 72.18475193]
[70.36511564 67.12947785 67.90064186 68.26085979 66.50708925 67.36691641
 71.88348674]
[68.09878992 65.02247637 65.7201429  66.50995735 64.17697566 64.47869046
 69.8842795 ]
[67.98232331 64.89110628 65.95635853 66.93129565 64.69056117 64.74782481
 70.21200412]
[65.72602626 62.74941196 63.63726494 64.86233896 62.33027132 62.6218343
 68.30373807]
[64.64007979 62.0916357  63.77379911 64.74328075 62.0306399  61.55627607
 67.02268145]
[63.3990498  60.57161249 64.76607145 63.243076

Unnamed: 0,segid,resid,max RFP,amino_acid
0,A,3,74.160081,I
1,A,4,74.750635,S
2,A,5,78.393208,Q
3,A,6,77.739125,R
4,A,7,75.964890,P
...,...,...,...,...
3238,F,524,54.412016,R
3239,F,525,50.833875,D
3240,F,526,50.095013,Y
3241,F,527,49.678343,L


In [4]:
# Add the feature held by `a` to the mutation table and display the result.
# NOTE: `df` is rebound here, so re-running this cell feeds the already
# augmented table back into add_feature.
df = a.add_feature(df)
df

Unnamed: 0,segid,resid,mutation,max RFP
0,A,3,I3D,74.160081
1,A,4,S4K,74.750635
2,A,5,Q5V,78.393208
3,B,6,R6D,57.32006
4,C,450,S450F,13.887488
5,C,435,D435F,9.464016


In [5]:
# Build the "mean RFP" distance feature from three trajectory files (runs 1-3).
t = sbmlcore.TrajectoryDistances(
    "./tests/rpob-5uh6-3-warm.gro.gz",
    [
        f"./tests/rpob-5uh6-3-md-{run}-50ns-dt10ns-nojump.xtc"
        for run in (1, 2, 3)
    ],
    "./tests/5uh6.pdb",
    "resname RFP",
    "mean RFP",  # matches the feature column header in the table displayed below
    distance_type="mean",
    offsets={"A": 0, "B": 0, "C": -6},
    percentile_exclusion=True,
)
# Display the per-residue table held by the object.
t.return_dist_df()

Unnamed: 0,segid,resid,mean RFP,amino_acid
0,A,3,71.505331,I
1,A,4,72.080490,S
2,A,5,75.296917,Q
3,A,6,74.086513,R
4,A,7,72.042227,P
...,...,...,...,...
3238,F,524,51.972716,R
3239,F,525,48.804352,D
3240,F,526,48.449548,Y
3241,F,527,48.072856,L


In [6]:
# Add the feature held by `t` to the mutation table and display the result.
# NOTE: `df` is rebound here, so re-running this cell feeds the already
# augmented table back into add_feature.
df = t.add_feature(df)
df

Unnamed: 0,segid,resid,mutation,max RFP,mean RFP
0,A,3,I3D,74.160081,71.505331
1,A,4,S4K,74.750635,72.08049
2,A,5,Q5V,78.393208,75.296917
3,B,6,R6D,57.32006,53.441465
4,C,450,S450F,13.887488,11.852404
5,C,435,D435F,9.464016,8.732147


In [7]:
# Save the current table to CSV. The same path is written again later in this
# notebook, so this copy is overwritten when that later cell runs.
df.to_csv('./tests/5uh6_added_traj_distances.csv')

In [9]:
# Build the "median RFP" distance feature and add it to the mutation table.
# NOTE(review): only runs 1 and 2 are loaded here, whereas the max/mean cells
# earlier in this notebook load three trajectories -- confirm this is intentional.
p = sbmlcore.TrajectoryDistances(
    "./tests/rpob-5uh6-3-warm.gro.gz",
    [
        f"./tests/rpob-5uh6-3-md-{run}-50ns-dt10ns-nojump.xtc"
        for run in (1, 2)
    ],
    "./tests/5uh6.pdb",
    "resname RFP",
    "median RFP",  # matches the new column header in the table displayed below
    distance_type="median",
    offsets={"A": 0, "B": 0, "C": -6},
    percentile_exclusion=True,
)
# `df` is rebound to the augmented table, then displayed.
df = p.add_feature(df)
df

Unnamed: 0,segid,resid,mutation,max RFP,mean RFP,median RFP
0,A,3,I3D,72.000161,70.661801,70.783703
1,A,4,S4K,71.859083,71.364778,71.525979
2,A,5,Q5V,75.431009,74.491729,74.457994
3,B,6,R6D,54.469711,52.361124,51.797465
4,C,450,S450F,13.887488,12.229636,11.714328
5,C,435,D435F,9.464016,8.713272,9.211318


In [10]:
# Build the "min RFP" distance feature and add it to the mutation table.
# `p` is rebound here, replacing any object previously stored under that name.
# NOTE(review): only runs 1 and 2 are loaded here, whereas the max/mean cells
# earlier in this notebook load three trajectories -- confirm this is intentional.
p = sbmlcore.TrajectoryDistances(
    "./tests/rpob-5uh6-3-warm.gro.gz",
    [
        f"./tests/rpob-5uh6-3-md-{run}-50ns-dt10ns-nojump.xtc"
        for run in (1, 2)
    ],
    "./tests/5uh6.pdb",
    "resname RFP",
    "min RFP",  # matches the new column header in the table displayed below
    distance_type="min",
    offsets={"A": 0, "B": 0, "C": -6},
    percentile_exclusion=True,
)
# `df` is rebound to the augmented table, then displayed.
df = p.add_feature(df)
df


Unnamed: 0,segid,resid,mutation,max RFP,mean RFP,median RFP,min RFP
0,A,3,I3D,72.000161,70.661801,70.783703,69.617708
1,A,4,S4K,71.859083,71.364778,71.525979,70.495139
2,A,5,Q5V,75.431009,74.491729,74.457994,73.682515
3,B,6,R6D,54.469711,52.361124,51.797465,51.712725
4,C,450,S450F,13.887488,12.229636,11.714328,11.534613
5,C,435,D435F,9.464016,8.713272,9.211318,6.590122


In [12]:
# Save the current table to CSV. This is the same path written by an earlier
# cell in this notebook, so that earlier file is replaced.
df.to_csv('./tests/5uh6_added_traj_distances.csv')

In [1]:
import sbmlcore

In [2]:
# Build a TrajectoryDihedrals object for the "phi" angle from a single trajectory.
a = sbmlcore.TrajectoryDihedrals(
    "./tests/rpob-5uh6-3-warm.gro.gz",
    ["./tests/rpob-5uh6-3-md-1-50ns-dt10ns-nojump.xtc"],
    "./tests/5uh6.pdb",
    "phi",
    "phi",  # matches the angle column header in the printed table below
    angle_type="mean",
)
# A bare name as the last expression shows the object's repr, not a DataFrame.
a

3243
     segid  resid         phi amino_acid
0        A      3    0.000000          I
1        A      4 -100.615114          S
2        A      5  -93.045569          Q
3        A      6 -123.129162          R
4        A      7  -74.361088          P
...    ...    ...         ...        ...
3238     F    524  -68.691273          R
3239     F    525  -69.960553          D
3240     F    526  -73.462857          Y
3241     F    527 -101.204409          L
3242     F    528 -120.899890          D

[3243 rows x 4 columns]


<sbmlcore.TrajectoryDihedrals.TrajectoryDihedrals at 0x15080eb30>

In [7]:
# Build a TrajectoryDihedrals object for the "phi" angle with angle_type="max",
# using a single trajectory.
a = sbmlcore.TrajectoryDihedrals(
    "./tests/rpob-5uh6-3-warm.gro.gz",
    ["./tests/rpob-5uh6-3-md-1-50ns-dt10ns-nojump.xtc"],
    "./tests/5uh6.pdb",
    "phi",
    "phi",  # matches the angle column header in the printed table below
    angle_type="max",
)
# A bare name as the last expression shows the object's repr, not a DataFrame.
a

3243
     segid  resid        phi amino_acid
0        A      3   0.000000          I
1        A      4 -60.717763          S
2        A      5 -64.512299          Q
3        A      6 -71.359612          R
4        A      7 -51.986569          P
...    ...    ...        ...        ...
3238     F    524 -57.800060          R
3239     F    525 -59.504043          D
3240     F    526 -57.018843          Y
3241     F    527 -88.824621          L
3242     F    528 -76.059116          D

[3243 rows x 4 columns]


<sbmlcore.TrajectoryDihedrals.TrajectoryDihedrals at 0x2803dbe80>

In [2]:
# Build a TrajectoryDihedrals object for the "omega" angle from a single trajectory.
a = sbmlcore.TrajectoryDihedrals(
    "./tests/rpob-5uh6-3-warm.gro.gz",
    ["./tests/rpob-5uh6-3-md-1-50ns-dt10ns-nojump.xtc"],
    "./tests/5uh6.pdb",
    "omega",
    "omega",  # matches the angle column header in the table displayed below
    angle_type="mean",
)
# Display the per-residue angle table held by the object.
a.return_angle_df()

3243
     segid  resid       omega amino_acid
0        A      3  -56.279256          I
1        A      4  -53.908477          S
2        A      5  -56.855710          Q
3        A      6   55.698738          R
4        A      7   59.849977          P
...    ...    ...         ...        ...
3238     F    524  -60.014965          R
3239     F    525  174.896806          D
3240     F    526 -171.369486          Y
3241     F    527    3.189095          L
3242     F    528   87.519737          D

[3243 rows x 4 columns]


Unnamed: 0,segid,resid,omega,amino_acid
0,A,3,-56.279256,I
1,A,4,-53.908477,S
2,A,5,-56.855710,Q
3,A,6,55.698738,R
4,A,7,59.849977,P
...,...,...,...,...
3238,F,524,-60.014965,R
3239,F,525,174.896806,D
3240,F,526,-171.369486,Y
3241,F,527,3.189095,L


In [1]:
import sbmlcore

In [2]:
# Build a TrajectoryDihedrals object for the "phi" angle from a single trajectory,
# this time also passing add_bonds, per-segid offsets and percentile_exclusion.
a = sbmlcore.TrajectoryDihedrals(
    "./tests/rpob-5uh6-3-warm.gro.gz",
    ["./tests/rpob-5uh6-3-md-1-50ns-dt10ns-nojump.xtc"],
    "./tests/5uh6.pdb",
    "phi",
    "phi",  # matches the angle column header in the table displayed below
    angle_type="mean",
    add_bonds=True,
    offsets={"A": 0, "B": 0, "C": -6},
    percentile_exclusion=True,
)
# Display the per-residue angle table held by the object.
a.return_angle_df()

(3243, 6)
(3243, 6)
4
4
[[   0.            0.            0.            0.        ]
 [-107.18091898 -101.54740077  -97.29903725  -85.70734004]
 [-102.75659101  -91.38323483  -83.37468626  -87.73925586]
 ...
 [ -81.8968086   -74.09517636  -76.95795224  -67.58047774]
 [-102.55454468 -111.1412427   -98.94747099  -94.25880243]
 [-121.76174434 -141.48849942 -122.74544862 -109.75704746]]


Unnamed: 0,segid,resid,phi,amino_acid
0,A,3,0.000000,I
1,A,4,-97.933674,S
2,A,5,-91.313442,Q
3,A,6,-128.500821,R
4,A,7,-76.573812,P
...,...,...,...,...
3238,F,524,-67.139100,R
3239,F,525,-71.194813,D
3240,F,526,-75.132604,Y
3241,F,527,-101.725515,L
