## **SETD2 with SAM, analysis**

## **Import modules**

In [1]:
# Standard-library modules needed to locate the project code before it can be imported.
import os
import sys

# Absolute locations of the group data and of the SimFound_v2 source tree.
# NOTE(review): these are machine-specific absolute paths; adjust them when running elsewhere.
data_path=os.path.abspath('/media/dataHog/hca/SETD2') # Where your group data is
base_path=os.path.abspath('/media/dataHog/hca/SimFound_v2/source/') # Where your source code is (SFv2)

# Extend the module search path. This must run before the project imports below;
# presumably Protocols, main, tools, etc. live under base_path -- confirm.
sys.path.append(base_path)
sys.path.append(data_path)

# importlib is used in later cells to reload project modules (importlib.reload).
import importlib

# Silence all warnings globally. The filter is installed before the project
# modules are imported, so warnings raised during their import are hidden too.
import warnings
warnings.filterwarnings('ignore')
import Protocols as P

# Project modules (not standard library); they resolve through the sys.path entries added above.
import main
import tools
import Trajectory
import MSM
import Featurize as F
import Discretize


# Star import of the simtk unit names; a later cell uses `picoseconds`,
# which presumably comes from here -- confirm.
from simtk.unit import *

## **Define Project**

In [2]:
# Pick up any edits made to the project modules since the kernel imported them.
importlib.reload(Trajectory)
importlib.reload(main)

# Directory layout of the project.
# data_path comes from os.path.abspath and therefore has no trailing separator,
# so paths are built with os.path.join rather than string concatenation.
# (The previous `workdir+'inputs/structures/'` produced '<workdir>inputs/structures/',
# i.e. a sibling directory next to the working directory instead of a folder inside it.)
workdir=data_path
results=os.path.join(workdir, 'results')
inputs=os.path.join(workdir, 'inputs', 'structures', '')  # trailing '' keeps the final separator

# Hand the directories to the project's file handler.
# NOTE(review): presumably this creates missing folders and `_new=False` reuses an
# existing workdir -- confirm against tools.Functions.fileHandler.
workdir=tools.Functions.fileHandler([workdir], _new=False)
tools.Functions.fileHandler([results, inputs])


# Systems to analyse. Alternative protein set kept for reference:
#protein=['WT', 'R167Q', 'I602G']
protein=['setd2_open']

ligand=['SAM']
parameters=['310K']
timestep=20*picoseconds

# Build the project description; one system is defined for each
# protein/ligand/parameter/replica combination (see the cell output).
project=main.Project(title='SETD2-SAM',
                     hierarchy=('protein', 'ligand', 'parameter'),
                     workdir=workdir,
                     parameter=parameters,
                     replicas=25,
                     protein=protein,
                     ligand=ligand,
                     results=results,
                     topology='SETD2.pdb',
                     timestep=timestep,
                     initial_replica=1)


# Systems consumed by the analysis cells further down.
project_systems=project.setSystems()

Converted parameter "temperature" (in K) into scalar: 310.0 K
System defined: ('setd2_open', 'SAM', '310K', '1'), ID: 310.0 K
System defined: ('setd2_open', 'SAM', '310K', '2'), ID: 310.0 K
System defined: ('setd2_open', 'SAM', '310K', '3'), ID: 310.0 K
System defined: ('setd2_open', 'SAM', '310K', '4'), ID: 310.0 K
System defined: ('setd2_open', 'SAM', '310K', '5'), ID: 310.0 K
System defined: ('setd2_open', 'SAM', '310K', '6'), ID: 310.0 K
System defined: ('setd2_open', 'SAM', '310K', '7'), ID: 310.0 K
System defined: ('setd2_open', 'SAM', '310K', '8'), ID: 310.0 K
System defined: ('setd2_open', 'SAM', '310K', '9'), ID: 310.0 K
System defined: ('setd2_open', 'SAM', '310K', '10'), ID: 310.0 K
System defined: ('setd2_open', 'SAM', '310K', '11'), ID: 310.0 K
System defined: ('setd2_open', 'SAM', '310K', '12'), ID: 310.0 K
System defined: ('setd2_open', 'SAM', '310K', '13'), ID: 310.0 K
System defined: ('setd2_open', 'SAM', '310K', '14'), ID: 310.0 K
System defined: ('setd2_open', 'SAM',

## **Markov State Models**


In [None]:
# Pick up any edits made to the MSM module since the kernel imported it.
importlib.reload(MSM)
import numpy as np

# Catalogue of every region selection defined for this protein.
# A tuple value holds a pair of selections (used for the pairwise 'loopIN_SETcd' entry).
all_protein_regions = {'loop_IN' : 'resid 240 to 255',
                       'post_SET_domain' : 'resid 220 to 240',
                       'combined' : 'resid 220 to 254',
                       'loopIN_SETcd' : ('resid 248 and sidechain', 'resid 136 to 147 and sidechain'),
                       'SETcd_helix' : 'resid 136 to 147'}

# Regions actually analysed in this run. Previously the full dictionary was
# assigned and then silently overwritten by a second, smaller literal; the
# selection is now explicit, so edit this tuple to change which regions are processed.
selected_regions = ('loopIN_SETcd', 'SETcd_helix')
protein_regions = {name: all_protein_regions[name] for name in selected_regions}

# Lag times scanned by the VAMP evaluation.
# NOTE(review): presumably expressed in trajectory frames (multiples of `timestep`) -- confirm.
vamp_lags=[1, 2, 10, 50, 100, 200, 500, 1000]

features_to_extract=['torsions', 'positions', 'min_dist', 'contacts']
#input_regular='resid 241 to 253'

# One result per region name, keyed like protein_regions.
kinetic_models={}
kinetics=MSM.MSM(project_systems, results=results, timestep=timestep, stride=1)

for name, region in protein_regions.items():
    # NOTE(review): dim=0.9 is presumably a fraction of retained variance rather
    # than a fixed number of dimensions -- confirm against MSM.MSM.calculate.
    kinetic_models[name]=kinetics.calculate(region,
                                            method='VAMP',
                                            evaluate='dimensions',
                                            features=features_to_extract,
                                            ft_name=name,
                                            lags=vamp_lags,
                                            dim=0.9)


Results will be stored under:  /media/dataHog/hca/SETD2/results
Extracting feature:  torsions
Extracting feature:  positions
Extracting feature:  min_dist
