This script loads mouse behavioral data (from the `biasedChoiceWorld` protocol and, separately, from the last three training sessions) only for mice that pass a given (stricter) training criterion. For the `biasedChoiceWorld` protocol, only sessions with a training status of `trained_1b` or `ready4ephysrig` are collected.
The data are slightly reformatted and saved as `.csv` files.

In [1]:
import datajoint as dj
dj.config['database.host'] = 'datajoint.internationalbrainlab.org'

from ibl_pipeline import subject, acquisition, action, behavior, reference, data
from ibl_pipeline.analyses.behavior import PsychResults, SessionTrainingStatus
from ibl_pipeline.utils import psychofit as psy
from ibl_pipeline.analyses import behavior as behavior_analysis

import numpy as np
import matplotlib.pyplot as plt
import pandas as pd

Connecting lacerbi@datajoint.internationalbrainlab.org:3306


In [2]:
import os
# Directory that becomes the working directory for the rest of the script;
# the CSV files written further down use relative filenames, so they end up here.
myPath = r"C:\Users\Luigi\Documents\GitHub\ibl-changepoint\data" # Write here your data path
os.chdir(myPath)

In [3]:
# Build the list of mice that satisfy the training criterion (stringent: trained_1b).
# For comparison, see the query used in the behavioral paper:
# https://github.com/int-brain-lab/paper-behavior/blob/master/paper_behavior_functions.py

# Subjects of the brain-wide project, joined with their lab information
project_subjects = (subject.Subject * subject.SubjectLab * reference.Lab * subject.SubjectProject
                    & 'subject_project = "ibl_neuropixel_brainwide_01"')

# Sessions carrying the criterion training status.
# Alternative criteria, kept for reference:
#   'training_status="trained_1a" OR training_status="trained_1b"'
#   'training_status="trained_1b" OR training_status="ready4ephysrig"'
criterion_sessions = ((acquisition.Session * behavior_analysis.SessionTrainingStatus())
                      & 'training_status="trained_1b"')

# date_trained is the earliest date among the criterion sessions
subj_query = project_subjects.aggr(
    criterion_sessions,
    'subject_nickname', 'sex', 'subject_birth_date', 'institution',
    date_trained='min(date(session_start_time))')

# Keep only mice whose date_trained falls before the cutoff
subjects = subj_query & 'date_trained < "2019-09-30"'

mice_names = sorted(subjects.fetch('subject_nickname'))
print(mice_names)

['CSHL_002', 'CSHL_003', 'CSHL_005', 'CSHL_008', 'CSHL_010', 'CSHL_014', 'CSHL_015', 'CSH_ZAD_001', 'CSH_ZAD_003', 'CSH_ZAD_004', 'CSH_ZAD_006', 'CSH_ZAD_007', 'CSH_ZAD_010', 'DY_001', 'DY_006', 'DY_007', 'IBL-T1', 'IBL-T2', 'IBL-T4', 'IBL_001', 'IBL_002', 'KS002', 'KS003', 'KS004', 'KS005', 'KS014', 'KS015', 'KS016', 'KS017', 'KS019', 'NYU-01', 'NYU-02', 'NYU-06', 'SWC_009', 'SWC_013', 'SWC_014', 'ZM_1084', 'ZM_1085', 'ZM_1086', 'ZM_1087', 'ZM_1091', 'ZM_1092', 'ZM_1097', 'ZM_1098', 'ZM_1367', 'ZM_1371', 'ZM_1372', 'ZM_1743', 'ZM_1745', 'ZM_1746', 'ZM_1747', 'ibl_witten_03', 'ibl_witten_04', 'ibl_witten_05', 'ibl_witten_06', 'ibl_witten_12', 'ibl_witten_14', 'ibl_witten_15', 'ibl_witten_16']


In [4]:
# Sessions joined with their training status; both selections below share
# this join and the same session date cutoff.
sessions_with_status = acquisition.Session * behavior_analysis.SessionTrainingStatus
before_cutoff = 'session_start_time < "2019-09-30"'

# Training-protocol sessions (any training status)
sess_train = sessions_with_status & 'task_protocol LIKE "%training%"' & before_cutoff

# Biased-protocol sessions, restricted to the two accepted training statuses
sess_stable = (sessions_with_status
               & 'task_protocol LIKE "%biased%"'
               & before_cutoff
               & 'training_status="trained_1b" OR training_status="ready4ephysrig"')

# Filled by the export loop with the nicknames of the mice that were saved
stable_mice_names = []

# A mouse must have performed at least this number of sessions
MinSessionNumber = 4

def get_mouse_data(df, position_deg=35.):
    """Reformat a table of fetched trials into the per-trial layout saved to CSV.

    Parameters
    ----------
    df : pandas.DataFrame
        One row per trial, with the columns ``trial_id``,
        ``trial_stim_prob_left``, ``trial_stim_contrast_left``,
        ``trial_stim_contrast_right``, ``trial_response_choice``,
        ``trial_feedback_type``, ``trial_response_time`` and
        ``trial_stim_on_time``. Rows must be ordered by session and then by
        trial, because sessions are numbered by counting the rows whose
        ``trial_id`` equals 1.
    position_deg : float, optional
        Absolute stimulus position in degrees (stimuli appear at
        +/- ``position_deg``). Defaults to 35.

    Returns
    -------
    pandas.DataFrame
        Same index as ``df``, with the columns ``trial_num``, ``session_num``,
        ``stim_probability_left``, ``contrast``, ``position``,
        ``response_choice`` (1 for 'CCW', -1 for 'CW', 0 for 'No Go'; any
        other label becomes NaN), ``trial_correct`` (1.0 when the feedback
        type is 1, else 0.0) and ``reaction_time``. An empty ``df`` gives an
        empty table with these columns.
    """
    columns = ['trial_num', 'session_num', 'stim_probability_left', 'contrast',
               'position', 'response_choice', 'trial_correct', 'reaction_time']

    # An empty frame may carry no columns at all (e.g. when it was built from
    # an empty list of records), so the lookups below would raise KeyError.
    if df.empty:
        return pd.DataFrame(columns=columns)

    choice_codes = {'CCW': 1, 'CW': -1, 'No Go': 0}

    # Positive when the right-hand contrast is larger, negative when the left is
    signed_contrast = df['trial_stim_contrast_right'] - df['trial_stim_contrast_left']

    datamat = pd.DataFrame(index=df.index)
    datamat['trial_num'] = df['trial_id']
    # Every row with trial_id == 1 starts a new session
    datamat['session_num'] = (df['trial_id'] == 1).cumsum()
    datamat['stim_probability_left'] = df['trial_stim_prob_left']
    datamat['contrast'] = np.abs(signed_contrast)
    datamat['position'] = np.sign(signed_contrast) * position_deg
    datamat['response_choice'] = df['trial_response_choice'].map(choice_codes)
    datamat['trial_correct'] = (df['trial_feedback_type'] == 1).astype(float)
    datamat['reaction_time'] = df['trial_response_time'] - df['trial_stim_on_time'] # double-check

    # Zero-contrast trials have no signed contrast to read the side from, so the
    # side is inferred from the outcome: the chosen side when the trial was
    # correct, the opposite side otherwise ('No Go' trials therefore stay at 0).
    zero_contrast = signed_contrast == 0
    outcome_sign = np.where(datamat['trial_correct'] == 1, 1.0, -1.0)
    inferred_position = datamat['response_choice'] * outcome_sign * position_deg
    datamat.loc[zero_contrast, 'position'] = inferred_position[zero_contrast]

    return datamat

In [6]:
# For every selected mouse: export its biased-block trials and, if it has
# enough such sessions, also the trials of its last three training sessions.
nickname_proj = subject.Subject.proj('subject_nickname')
lab_proj = subject.SubjectLab.proj('lab_name')
trial_order = 'subject_nickname, session_start_time, trial_id'

for mouse_nickname in mice_names:

    mouse_subject = {'subject_nickname': mouse_nickname}

    # Trials of this mouse in the stable sessions with biased blocks
    stable_sessions = sess_stable.proj('session_uuid', 'task_protocol', 'session_start_time', 'training_status')
    behavior_stable = (behavior.TrialSet.Trial & (subject.Subject & mouse_subject)) \
        * stable_sessions * nickname_proj * lab_proj
    df = pd.DataFrame(behavior_stable.fetch(order_by=trial_order, as_dict=True))

    # Skip mice that never performed a stable session with biased blocks
    if len(df) == 0:
        continue

    datamat = get_mouse_data(df)

    # Skip mice that have not performed the minimum number of sessions
    if not np.max(datamat['session_num']) >= MinSessionNumber:
        continue

    # Should add 'N' to mice names that start with numbers?

    # Write the biased-block trials to <nickname>.csv
    filename = f'{mouse_nickname}.csv'
    datamat.to_csv(filename, index=False)
    stable_mice_names.append(mouse_nickname)

    # Trials of this mouse in the training-protocol sessions
    train_sessions = sess_train.proj('session_uuid', 'task_protocol', 'session_start_time')
    behavior_train = (behavior.TrialSet.Trial & (subject.Subject & mouse_subject)) \
        * train_sessions * nickname_proj * lab_proj
    df_train = pd.DataFrame(behavior_train.fetch(order_by=trial_order, as_dict=True))

    # Keep only the three highest session numbers, i.e. the last three sessions
    datamat_train = get_mouse_data(df_train)
    Nlast = np.max(datamat_train['session_num']) - 3
    is_last_session = datamat_train['session_num'] > Nlast
    datamat_final = datamat_train[is_last_session]

    # Write the end-of-training trials to <nickname>_endtrain.csv
    filename = f'{mouse_nickname}_endtrain.csv'
    datamat_final.to_csv(filename, index=False)


print(stable_mice_names)

['CSHL_002', 'CSHL_003', 'CSHL_005', 'CSHL_008', 'CSHL_010', 'CSHL_014', 'CSHL_015', 'CSH_ZAD_001', 'CSH_ZAD_003', 'CSH_ZAD_004', 'CSH_ZAD_006', 'CSH_ZAD_007', 'CSH_ZAD_010', 'DY_001', 'DY_007', 'IBL-T1', 'IBL-T2', 'IBL-T4', 'IBL_001', 'IBL_002', 'KS002', 'KS003', 'KS004', 'KS005', 'KS014', 'KS015', 'KS016', 'KS017', 'NYU-01', 'NYU-02', 'NYU-06', 'SWC_013', 'ZM_1084', 'ZM_1085', 'ZM_1086', 'ZM_1087', 'ZM_1091', 'ZM_1092', 'ZM_1097', 'ZM_1098', 'ZM_1367', 'ZM_1371', 'ZM_1372', 'ZM_1743', 'ZM_1745', 'ZM_1746', 'ibl_witten_04', 'ibl_witten_05', 'ibl_witten_06', 'ibl_witten_12', 'ibl_witten_14', 'ibl_witten_15', 'ibl_witten_16']


In [7]:
# Number of mice whose biased-block data were written to a CSV file
len(stable_mice_names)

53