In [1]:
# Standard libraries
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
from ipywidgets import IntProgress
from IPython.display import display
from scipy.stats import mannwhitneyu, wilcoxon

# Append base directory
# Find the repository root by looking for `rootname` in the notebook's working
# directory and put it on sys.path, presumably so the project imports below
# (e.g. `lib.*`) resolve.
import os,sys,inspect
rootname = "pub-2020-exploratory-analysis"
# Use the kernel's working directory instead of inspect.getfile(currentframe()).
# On older IPython both resolve to the same directory, but ipykernel >= 6 compiles
# cells from temporary files, so the inspect-based path no longer contains rootname.
thispath = os.path.abspath(os.getcwd())
if rootname not in thispath:
    raise ValueError(
        "Working directory %r is not inside %r; start the notebook from within the repository"
        % (thispath, rootname)
    )
rootpath = os.path.join(thispath[:thispath.index(rootname)], rootname)
if rootpath not in sys.path:  # re-running this cell must not stack duplicate entries
    sys.path.append(rootpath)
print("Appended root directory", rootpath)

from mesostat.utils.qt_helper import gui_fnames, gui_fpath
from mesostat.metric.metric import MetricCalculator
from mesostat.utils.hdf5_io import DataStorage

from lib.sych.data_fc_db_raw import DataFCDatabase
import lib.analysis.bulk_metrics as bulk_metrics

%load_ext autoreload
%autoreload 2

Appended root directory /media/aleksejs/DataHDD/work/codes/comp-neuro/analysis-mesoscopic/pub-2020-exploratory-analysis


In [2]:
# Settings dict handed to DataFCDatabase in the next cell.
# 'root_path_data' currently points at the working directory.
# Alternatives that were used before (kept for reference):
#   '/media/alyosha/Data/TE_data/yarodata/sych_preprocessed'
#   gui_fpath('h5path', './')   # presumably an interactive path picker — confirm
params = {'root_path_data': './'}

In [3]:
# Build the data-access object from the `params` dict defined above.
# The recorded output shows it prints "Searching for data files" when constructed.
dataDB = DataFCDatabase(params)

Searching for data files


In [4]:
# Results store passed to every metric/plot call below.
# NOTE(review): the file name is relative, so it is presumably resolved against
# the kernel's working directory — confirm.
ds = DataStorage('sych_result_bulk_metrics.h5')

In [5]:
# Metric calculator shared by all metric_mouse_bulk* calls below.
# NOTE(review): serial=True presumably disables parallel execution — confirm.
mc = MetricCalculator(serial=True, verbose=False)

# 1. Bulk Metrics vs Time

* Avg over mice
* All-region-all-types
* Expert vs Naive
* GO/NOGO/MISS/FA

# Mean

In [None]:
# Compute the 'mean' metric with target 'time'. The dataset listing near the end of
# the notebook shows the resulting entries in `ds` (names like mean_time_bn_session_*).
# NOTE(review): 's' is an opaque positional argument here — verify its meaning
# against metric_mouse_bulk.
bulk_metrics.metric_mouse_bulk(dataDB, mc, ds, 'mean', 's', 'time', verbose=False)

In [None]:
# Plot the 'mean' metric against 'time'; presumably reads the results that the
# previous cell stored in `ds` — confirm.
bulk_metrics.plot_metric_bulk(dataDB, ds, 'mean', 'time', verbose=False)

# Variance

**TODO**
* Plot trial variance relative to temporal variance
* Plot mean with variance together

### Pros/Cons of Baseline Normalization
* DFF-Trial
    - Pos: Removes a dynamic baseline that changes on the timescale of trials.
    - Pos: Under the assumption of a signal-free pre-trial interval, baseline removal enhances the relative change in significant activity during the trial.
    - Neg: In the presence of correlation between the pre-trial interval and the trial signal, this procedure destroys information about the trial.

* DFF-Session vs ZScore-Session
    - Both linear transforms
    - The mean is more meaningful for DFF if the pre-trial interval is at least somewhat stable
    - Va

In [None]:
# Compute the 'varmean' metric with target 'time', using the same argument pattern
# as the 'mean' cell above; results presumably go into `ds` — confirm.
bulk_metrics.metric_mouse_bulk(dataDB, mc, ds, 'varmean', 's', 'time', verbose=False)

In [None]:
# Plot 'varmean' against 'time'. ylim=[0,None] sets only the lower bound;
# presumably None leaves the upper bound automatic — confirm.
bulk_metrics.plot_metric_bulk(dataDB, ds, 'varmean', 'time', ylim=[0,None], verbose=False)

### Test variance across channels for interesting interval

* Average signal over texture presentation interval
* Compute variance over trials for each channel
* Compare channels

In [None]:
# Compute 'varmean' with target 'channel', restricted by cropTime=(3, 3.5).
# NOTE(review): cropTime is presumably the texture-presentation interval in seconds
# mentioned in the markdown above — confirm units.
# NOTE(review): trialTypeNames=[] and perfNames=[] presumably switch off the split by
# trial type and by naive/expert; 'p' replaces the 's' used for 'time' — verify both.
bulk_metrics.metric_mouse_bulk(dataDB, mc, ds, 'varmean', 'p', 'channel', cropTime=(3, 3.5), trialTypeNames=[], perfNames=[], verbose=False)

In [None]:
# Plot 'varmean' per 'channel' on a log y-axis.
# NOTE(review): ylim=[0.005,2] is hard-coded with no stated rationale — presumably
# tuned by eye for this dataset; revisit if the data change.
bulk_metrics.plot_metric_bulk(dataDB, ds, 'varmean', 'channel', yscale='log', ylim=[0.005,2], verbose=False)

# Effective Rank

### ByTime

In [None]:
# Compute the "rank_effective" metric with target 'time', using the same argument
# pattern as the 'mean' and 'varmean' time cells; results presumably go into `ds`.
bulk_metrics.metric_mouse_bulk(dataDB, mc, ds, "rank_effective", 's', 'time', verbose=False)

In [None]:
# Plot 'rank_effective' against 'time' with the y-axis starting at 1.
# The trailing comment records an alternative fixed range, [1,48].
# NOTE(review): 48 is presumably the channel count — confirm. This is the only
# plot_metric_bulk call with verbose=True.
bulk_metrics.plot_metric_bulk(dataDB, ds, 'rank_effective', 'time', ylim=[1, None], verbose=True) # ylim=[1,48]

### BySession

In [None]:
# Compute "rank_effective" per session via the *_vs_session variant.
# NOTE(review): the fifth positional argument is an empty string where the per-time
# cells pass 's' — presumably "no target dimension"; verify.
# trialTypeNames=[] presumably means no split by trial type — confirm.
bulk_metrics.metric_mouse_bulk_vs_session(dataDB, mc, ds, "rank_effective", '', trialTypeNames=[], verbose=False)

In [None]:
# Plot 'rank_effective' per session; presumably reads what the previous cell stored
# in `ds`. trialTypeNames=[] matches the compute call above.
bulk_metrics.plot_metric_bulk_vs_session(dataDB, ds, 'rank_effective', trialTypeNames=[], ylim=[1,None], verbose=False)

# Total Correlation

In [None]:
# NOTE(review): the recorded verbose output of plot_TC lists dataset names starting
# with avg_entropy_time-channel_* and avg_entropy_time_*. These are presumably produced
# by the two disabled calls below, so they may need re-enabling on a fresh storage
# file — confirm.
# bulk_metrics.metric_mouse_bulk(dataDB, mc, ds, "avg_entropy", 'sp', 'time-channel', verbose=False)
# bulk_metrics.metric_mouse_bulk(dataDB, mc, ds, "avg_entropy", 's', 'time', verbose=False)

# Compute the "avg_TC" metric with target 'time'. The recorded output is an
# IntProgress widget labelled 'time' with max=180.
bulk_metrics.metric_mouse_bulk(dataDB, mc, ds, "avg_TC", 's', 'time', verbose=False)

IntProgress(value=0, description='time', max=180)

In [8]:
# Plot total correlation. With verbose=True the recorded output prints pairs of
# dataset names (avg_entropy_time-channel_* and avg_entropy_time_*).
# NOTE(review): presumably those are the inputs it combines — confirm in plot_TC.
bulk_metrics.plot_TC(dataDB, ds, ylim=None, yscale=None, verbose=True)

avg_entropy_time-channel_bn_session_All_All avg_entropy_time_bn_session_All_All
avg_entropy_time-channel_bn_session_All_iGO avg_entropy_time_bn_session_All_iGO
avg_entropy_time-channel_bn_session_All_iNOGO avg_entropy_time_bn_session_All_iNOGO
avg_entropy_time-channel_bn_session_All_iFA avg_entropy_time_bn_session_All_iFA
avg_entropy_time-channel_bn_session_All_iMISS avg_entropy_time_bn_session_All_iMISS
avg_entropy_time-channel_bn_session_naive_All avg_entropy_time_bn_session_naive_All
avg_entropy_time-channel_bn_session_naive_iGO avg_entropy_time_bn_session_naive_iGO
avg_entropy_time-channel_bn_session_naive_iNOGO avg_entropy_time_bn_session_naive_iNOGO
avg_entropy_time-channel_bn_session_naive_iFA avg_entropy_time_bn_session_naive_iFA
avg_entropy_time-channel_bn_session_naive_iMISS avg_entropy_time_bn_session_naive_iMISS
avg_entropy_time-channel_bn_session_expert_All avg_entropy_time_bn_session_expert_All
avg_entropy_time-channel_bn_session_expert_iGO avg_entropy_time_bn_session_exp

### Cleaning up

In [6]:
# Show every stored dataset sorted by its 'datetime' column. The pandas row/column
# display limits are lifted only inside this `with` block, so the full table renders.
with pd.option_context('display.max_rows', None, 'display.max_columns', None):
    display(ds.list_dsets_pd().sort_values(by='datetime'))

Unnamed: 0,datetime,dset,metric,mousename,name,shape,target_dim
0,2020-12-02 14:18:35,dset0,mean,mvg_7,mean_time_bn_session_All_All,"(160,)","(timesteps,)"
1,2020-12-02 14:18:36,dset1,mean,mvg_7,mean_time_bn_session_All_iGO,"(160,)","(timesteps,)"
112,2020-12-02 14:18:36,dset2,mean,mvg_7,mean_time_bn_session_All_iNOGO,"(160,)","(timesteps,)"
334,2020-12-02 14:18:36,dset4,mean,mvg_7,mean_time_bn_session_All_iMISS,"(160,)","(timesteps,)"
223,2020-12-02 14:18:36,dset3,mean,mvg_7,mean_time_bn_session_All_iFA,"(160,)","(timesteps,)"
556,2020-12-02 14:18:37,dset6,mean,mvg_7,mean_time_bn_session_naive_iGO,"(160,)","(timesteps,)"
445,2020-12-02 14:18:37,dset5,mean,mvg_7,mean_time_bn_session_naive_All,"(160,)","(timesteps,)"
24,2020-12-02 14:18:38,dset12,mean,mvg_7,mean_time_bn_session_expert_iNOGO,"(160,)","(timesteps,)"
889,2020-12-02 14:18:38,dset9,mean,mvg_7,mean_time_bn_session_naive_iMISS,"(160,)","(timesteps,)"
13,2020-12-02 14:18:38,dset11,mean,mvg_7,mean_time_bn_session_expert_iGO,"(160,)","(timesteps,)"


In [None]:
# DESTRUCTIVE: deletes datasets from `ds` whose metric is "rank_effective".
# NOTE(review): the direction of the `timestr` filter (older than vs newer than the
# given timestamp) is not visible from here — confirm before running.
# NOTE(review): under "Run All" this cell executes after the compute cells above;
# consider guarding it so results are not removed unintentionally.
ds.delete_by_query(queryDict={"metric" : "rank_effective"}, timestr="2020-11-20 18:00:00")