# Introduction: Landmarks

In [1]:
import deltascope as ds
import deltascope.alignment as ut

import numpy as np
import pandas as pd
import matplotlib.pyplot as plt

from sklearn.preprocessing import normalize
from scipy.optimize import minimize

import os
import tqdm
import json
import time

# Import raw data
The user needs to specify the directories containing the data of interest. Each sample type is a key in the `data` dictionary, and its value is a dictionary with a `path` entry giving the directory that holds that sample type's data and a `channels` entry listing the channels of interest.

In [2]:
# --------------------------------
# -------- User input ------------
# --------------------------------

# One entry per sample type (the key). Each entry records:
#   'path'     - directory holding that sample type's data
#   'channels' - channels present in that directory that are of interest
data = {
    'wt': dict(
        path='./data/Output_wt03-09-21-29/',
        channels=['AT', 'ZRF'],
    ),
    'you-too': dict(
        path='./data/Output_yot03-09-23-21/',
        channels=['AT', 'ZRF'],
    ),
}

We'll generate a list of pairs of sample types (stypes) and channels for ease of use.

In [3]:
# Flatten the configuration into (sample type, channel) tuples, preserving the
# order in which sample types and their channels are listed in `data`
data_pairs = [
    (stype, channel)
    for stype, entry in data.items()
    for channel in entry['channels']
]

We can now read in all datafiles specified by the `data` dictionary above.

In [4]:
# Read every configured channel of every sample type; the loaded data is
# indexed as D[sample type][channel]
D = {
    stype: {
        channel: ds.read_psi_to_dict(entry['path'], channel)
        for channel in entry['channels']
    }
    for stype, entry in data.items()
}

100%|██████████| 64/64 [00:44<00:00,  1.42it/s]
100%|██████████| 64/64 [00:35<00:00,  1.52s/it]
100%|██████████| 69/69 [00:14<00:00,  4.77it/s]
100%|██████████| 69/69 [00:23<00:00,  1.78it/s]


# Calculate landmark bins
Based on the analysis above, we can select the optimal value of alpha bins.

In [5]:
# --------------------------------
# -------- User input ------------
# --------------------------------

# Bin number (must be an integer), chosen from the results above
anum = 25

# Percentiles at which landmarks will be calculated
percbins = [50]

Calculate landmark bins based on the user input parameters above and the control sample (here the `AT` channel of the `wt` sample type).

In [6]:
# Theta step in radians (pi/4), handed to lm.calc_bins when the bins are built
theta_step = np.pi / 4

In [7]:
# Create the landmark calculator for the chosen percentiles, then derive its
# alpha and theta bins from the control data D['wt']['AT']
lm = ds.landmarks(percbins=percbins, rnull=np.nan)
lm.calc_bins(D['wt']['AT'], anum, theta_step)

# Print each set of bins under its own heading for inspection
for heading, bin_values in (('Alpha bins', lm.acbins), ('Theta bins', lm.tbins)):
    print(heading)
    print(bin_values)

Alpha bins
[-81.64435845 -74.84066191 -68.03696537 -61.23326883 -54.4295723
 -47.62587576 -40.82217922 -34.01848269 -27.21478615 -20.41108961
 -13.60739307  -6.80369654   0.           6.80369654  13.60739307
  20.41108961  27.21478615  34.01848269  40.82217922  47.62587576
  54.4295723   61.23326883  68.03696537  74.84066191  81.64435845]
Theta bins
[-3.14159265 -2.35619449 -1.57079633 -0.78539816  0.          0.78539816
  1.57079633  2.35619449  3.14159265]


# Calculate landmarks

In [8]:
# Table of landmarks; it starts empty and is replaced by the value returned
# from lm.calc_perc for every sample processed below
lmdf = pd.DataFrame()

# Loop through each pair of stype and channels
for s, c in tqdm.tqdm(data_pairs):
    print(s, c)
    # Label passed to calc_perc for every sample of this pair, e.g. 'wt-AT'
    pair_label = '-'.join([s, c])
    # Calculate landmarks for each sample with this data pair; the running
    # table is passed in and the returned table replaces it
    for k, df in tqdm.tqdm(D[s][c].items()):
        lmdf = lm.calc_perc(df, k, pair_label, lmdf)

# Set timestamp (month-day-hour-minute, local time) used to prefix the
# output file names
tstamp = time.strftime("%m-%d-%H-%M", time.localtime())

# Save completed landmarks to a csv file
lmdf.to_csv(tstamp + '_landmarks.csv')
print('Landmarks saved to csv')

# Save landmark bins to json file.
# The bins are converted with np.asarray(...).tolist() rather than list():
# list() over a NumPy array keeps NumPy scalar objects, which the json module
# can only serialise when they happen to subclass a native Python type,
# whereas tolist() always yields plain Python numbers.
bins = {
    'acbins': np.asarray(lm.acbins).tolist(),
    'tbins': np.asarray(lm.tbins).tolist(),
}
with open(tstamp + '_landmarks_bins.json', 'w') as outfile:
    json.dump(bins, outfile)
print('Bins saved to json')

  0%|          | 0/4 [00:00<?, ?it/s]

wt AT



  0%|          | 0/31 [00:00<?, ?it/s]
  3%|▎         | 1/31 [00:00<00:18,  1.59it/s]
  6%|▋         | 2/31 [00:01<00:18,  1.54it/s]
 10%|▉         | 3/31 [00:01<00:18,  1.54it/s]
 13%|█▎        | 4/31 [00:02<00:17,  1.57it/s]
 16%|█▌        | 5/31 [00:03<00:16,  1.55it/s]
 19%|█▉        | 6/31 [00:03<00:16,  1.55it/s]
 23%|██▎       | 7/31 [00:04<00:16,  1.42it/s]
 26%|██▌       | 8/31 [00:05<00:15,  1.44it/s]
 29%|██▉       | 9/31 [00:06<00:15,  1.42it/s]
 32%|███▏      | 10/31 [00:06<00:14,  1.48it/s]
 35%|███▌      | 11/31 [00:07<00:13,  1.48it/s]
 39%|███▊      | 12/31 [00:08<00:12,  1.51it/s]
 42%|████▏     | 13/31 [00:08<00:12,  1.43it/s]
 45%|████▌     | 14/31 [00:09<00:11,  1.48it/s]
 48%|████▊     | 15/31 [00:10<00:10,  1.47it/s]
 52%|█████▏    | 16/31 [00:11<00:11,  1.35it/s]
 55%|█████▍    | 17/31 [00:11<00:10,  1.37it/s]
 58%|█████▊    | 18/31 [00:12<00:09,  1.40it/s]
 61%|██████▏   | 19/31 [00:13<00:08,  1.41it/s]
 65%|██████▍   | 20/31 [00:13<00:07,  1.43it/s]
 68%|████

wt ZRF



  0%|          | 0/31 [00:00<?, ?it/s]
  3%|▎         | 1/31 [00:00<00:23,  1.29it/s]
  6%|▋         | 2/31 [00:01<00:21,  1.33it/s]
 10%|▉         | 3/31 [00:02<00:20,  1.35it/s]
 13%|█▎        | 4/31 [00:02<00:19,  1.42it/s]
 16%|█▌        | 5/31 [00:03<00:17,  1.45it/s]
 19%|█▉        | 6/31 [00:04<00:17,  1.45it/s]
 23%|██▎       | 7/31 [00:04<00:16,  1.47it/s]
 26%|██▌       | 8/31 [00:05<00:15,  1.52it/s]
 29%|██▉       | 9/31 [00:06<00:14,  1.52it/s]
 32%|███▏      | 10/31 [00:06<00:13,  1.57it/s]
 35%|███▌      | 11/31 [00:07<00:12,  1.62it/s]
 39%|███▊      | 12/31 [00:07<00:11,  1.60it/s]
 42%|████▏     | 13/31 [00:08<00:11,  1.63it/s]
 45%|████▌     | 14/31 [00:09<00:10,  1.62it/s]
 48%|████▊     | 15/31 [00:09<00:09,  1.65it/s]
 52%|█████▏    | 16/31 [00:10<00:09,  1.61it/s]
 55%|█████▍    | 17/31 [00:10<00:08,  1.58it/s]
 58%|█████▊    | 18/31 [00:11<00:08,  1.58it/s]
 61%|██████▏   | 19/31 [00:12<00:07,  1.51it/s]
 65%|██████▍   | 20/31 [00:13<00:07,  1.52it/s]
 68%|████

you-too AT



  0%|          | 0/34 [00:00<?, ?it/s]
  3%|▎         | 1/34 [00:00<00:17,  1.91it/s]
  6%|▌         | 2/34 [00:01<00:16,  1.92it/s]
  9%|▉         | 3/34 [00:01<00:16,  1.93it/s]
 12%|█▏        | 4/34 [00:02<00:15,  1.95it/s]
 15%|█▍        | 5/34 [00:02<00:15,  1.91it/s]
 18%|█▊        | 6/34 [00:03<00:14,  1.93it/s]
 21%|██        | 7/34 [00:03<00:14,  1.84it/s]
 24%|██▎       | 8/34 [00:04<00:14,  1.77it/s]
 26%|██▋       | 9/34 [00:04<00:13,  1.84it/s]
 29%|██▉       | 10/34 [00:05<00:12,  1.87it/s]
 32%|███▏      | 11/34 [00:05<00:12,  1.89it/s]
 35%|███▌      | 12/34 [00:06<00:11,  1.88it/s]
 38%|███▊      | 13/34 [00:06<00:11,  1.85it/s]
 41%|████      | 14/34 [00:07<00:10,  1.83it/s]
 44%|████▍     | 15/34 [00:08<00:10,  1.78it/s]
 47%|████▋     | 16/34 [00:08<00:09,  1.81it/s]
 50%|█████     | 17/34 [00:09<00:09,  1.84it/s]
 53%|█████▎    | 18/34 [00:09<00:08,  1.84it/s]
 56%|█████▌    | 19/34 [00:10<00:08,  1.83it/s]
 59%|█████▉    | 20/34 [00:10<00:07,  1.82it/s]
 62%|████

you-too ZRF



  0%|          | 0/34 [00:00<?, ?it/s]
  3%|▎         | 1/34 [00:00<00:19,  1.72it/s]
  6%|▌         | 2/34 [00:01<00:18,  1.77it/s]
  9%|▉         | 3/34 [00:01<00:17,  1.76it/s]
 12%|█▏        | 4/34 [00:02<00:17,  1.75it/s]
 15%|█▍        | 5/34 [00:02<00:17,  1.68it/s]
 18%|█▊        | 6/34 [00:03<00:17,  1.64it/s]
 21%|██        | 7/34 [00:04<00:16,  1.62it/s]
 24%|██▎       | 8/34 [00:04<00:16,  1.62it/s]
 26%|██▋       | 9/34 [00:05<00:14,  1.69it/s]
 29%|██▉       | 10/34 [00:06<00:14,  1.62it/s]
 32%|███▏      | 11/34 [00:06<00:14,  1.60it/s]
 35%|███▌      | 12/34 [00:07<00:13,  1.67it/s]
 38%|███▊      | 13/34 [00:07<00:12,  1.74it/s]
 41%|████      | 14/34 [00:08<00:11,  1.76it/s]
 44%|████▍     | 15/34 [00:08<00:10,  1.73it/s]
 47%|████▋     | 16/34 [00:09<00:10,  1.75it/s]
 50%|█████     | 17/34 [00:09<00:09,  1.79it/s]
 53%|█████▎    | 18/34 [00:10<00:08,  1.85it/s]
 56%|█████▌    | 19/34 [00:10<00:08,  1.86it/s]
 59%|█████▉    | 20/34 [00:11<00:07,  1.86it/s]
 62%|████

Landmarks saved to csv
Bins saved to json
