# statistical analysis of metrics

Leanne Friedrich 10/08/21

## initialization

In [2]:
# Enable IPython's autoreload extension; mode 2 reloads all imported modules
# before each cell runs, so edits to the project modules are picked up
# without restarting the kernel.
%load_ext autoreload
%autoreload 2
# Flag handed to logs.openLog in the import cell and overwritten with its
# return value there.
LOGGERDEFINED = False

In [3]:
import os
import sys
# Add the parent directory to the module search path before the project
# imports below (presumably where the `py` package lives -- confirm).
sys.path.append("../")
from py.config import cfg
import py.logs as logs
import py.metrics as me
# NOTE(review): wildcard import -- the names it brings in are not visible here.
from printVals import *
from plainIm import plainIm
import matplotlib.pyplot as plt
import metricPlots as mp
import regression as rg
import matplotlib.cm as cm
# Open the log and store the returned value back into LOGGERDEFINED.
# NOTE(review): the log name passed here is 'vidSummaries.ipynb'; confirm it
# matches this notebook's actual filename.
LOGGERDEFINED = logs.openLog('vidSummaries.ipynb', LOGGERDEFINED, level='DEBUG', exportLog=False)

## analyzing data

In [9]:
# Load the stills summary table. The call returns two values; the second (u)
# is not used in the visible cells (presumably a units lookup -- confirm).
# With diag=True the independent/dependent column lists appear to be printed
# (see the cell output).
ss,u = me.importStillsSummary(diag=True)
# Load the segments summary from 'segmentsSummary.csv' without diagnostics.
seg, useg = me.importStillsSummary(file='segmentsSummary.csv', diag=False)
# Left-join seg's horiz_segments onto ss by folder. The suffixes only apply to
# overlapping column names: if ss already has a horiz_segments column, the one
# from seg is named horiz_segments_manual, which the regression-table cell
# relies on. NOTE(review): if ss has no horiz_segments column, no suffix is
# added and 'horiz_segments_manual' will not exist.
ss = ss.merge(seg[['folder', 'horiz_segments']], on='folder', suffixes=['', '_manual'], how='left')

Independents: ['folder', 'bn', 'date', 'sigma', 'di', 'do', 'fluFile', 'calibFile', 'viscRatio', 'vRatio', 'ReRatio', 'rGrav', 'dEst', 'hDragP', 'vDragP', 'int_CaInv', 'int_Re', 'pressureCh0', 'ink_shortname', 'ink_days', 'ink_rheModifier', 'ink_surfactant', 'ink_dye', 'ink_var', 'ink_val', 'ink_base', 'ink_type', 'ink_tau0', 'ink_eta0', 'ink_density', 'ink_v', 'ink_rate', 'ink_visc0', 'ink_CaInv', 'ink_Re', 'ink_WeInv', 'ink_OhInv', 'ink_dPR', 'ink_dnormInv', 'ink_Bm', 'sup_shortname', 'sup_days', 'sup_rheModifier', 'sup_surfactant', 'sup_dye', 'sup_var', 'sup_val', 'sup_base', 'sup_type', 'sup_tau0', 'sup_eta0', 'sup_density', 'sup_v', 'sup_rate', 'sup_visc0', 'sup_CaInv', 'sup_Re', 'sup_WeInv', 'sup_OhInv', 'sup_dPR', 'sup_dnormInv', 'sup_Bm', 'sup_Ca', 'ink_Ca', 'sweepType', 'sup_dnorm', 'ink_dnorm', 'sup_We', 'ink_We', 'sup_Oh', 'ink_Oh', 'int_Ca']

Dependents: ['xs_aspect', 'xs_xshift', 'xs_yshift', 'xs_area', 'xs_areaN', 'xs_wN', 'xs_hN', 'xs_roughness', 'vert_wN', 'vert_hN', 'v

In [5]:
# Load the video summary table from 'videoSummary.csv' using the same importer
# as the stills data; with diag=True the independent/dependent column lists
# appear to be printed (see the cell output). uv is the second return value
# and is not used in the visible cells.
vs,uv = me.importStillsSummary(file='videoSummary.csv', diag=True)

Independents: ['folder', 'bn', 'date', 'sigma', 'di', 'do', 'fluFile', 'calibFile', 'viscRatio', 'vRatio', 'ReRatio', 'rGrav', 'dEst', 'hDragP', 'vDragP', 'int_CaInv', 'int_Re', 'pressureCh0', 'ink_shortname', 'ink_days', 'ink_rheModifier', 'ink_surfactant', 'ink_dye', 'ink_var', 'ink_val', 'ink_base', 'ink_type', 'ink_tau0', 'ink_eta0', 'ink_density', 'ink_v', 'ink_rate', 'ink_visc0', 'ink_CaInv', 'ink_Re', 'ink_WeInv', 'ink_OhInv', 'ink_dPR', 'ink_dnormInv', 'ink_Bm', 'sup_shortname', 'sup_days', 'sup_rheModifier', 'sup_surfactant', 'sup_dye', 'sup_var', 'sup_val', 'sup_base', 'sup_type', 'sup_tau0', 'sup_eta0', 'sup_density', 'sup_v', 'sup_rate', 'sup_visc0', 'sup_CaInv', 'sup_Re', 'sup_WeInv', 'sup_OhInv', 'sup_dPR', 'sup_dnormInv', 'sup_Bm', 'sup_Ca', 'ink_Ca', 'sweepType', 'sup_dnorm', 'ink_dnorm', 'sup_We', 'ink_We', 'sup_Oh', 'ink_Oh', 'int_Ca']

Dependents: ['projectionN', 'projShiftN', 'vertDispBotN', 'vertDispTopN', 'vertDispMidN']


## regression tables

In [10]:
# Regression table for the cross-section aspect ratio, with printing and
# export both enabled.
xsregs = mp.regressionTable(
    ss,
    'xs_aspect',
    nickname='cross-section aspect ratio',
    printOut=True,
    export=True,
)

# Vertical-line metrics as (column, nickname) pairs; every table in this group
# is built with logy=False.
varlist = [
    ('vert_meanTN', 'normalized vertical line thickness'),
    ('vert_hN', 'normalized vertical line length'),
    ('vert_stdevTN', 'normalized vertical line thickness variation'),
]
vertregs = [
    mp.regressionTable(ss, column, nickname=label, logy=False, export=True, printOut=True)
    for column, label in varlist
]

# Horizontal-line metrics as (column, nickname, logy) triples. varlist is
# rebound here, so after this cell it holds the horizontal list.
varlist = [
    ('horiz_totlenN', 'normalized horizontal line total length', False),
    ('horiz_maxlenN', 'normalized horizontal line max segment length', False),
    ('horiz_segments_manual', 'number of horizontal line segments', False),
    ('horiz_roughness', 'horizontal line roughness', False),
]
horizregs = [
    mp.regressionTable(ss, column, nickname=label, export=True, printOut=True, logy=useLogY)
    for column, label, useLogY in varlist
]

\begin{table}
\centering
\caption[Linear regressions for cross-section aspect ratio at nonzero surface tension]{Table of linear regressions of log-scaled variables and Spearman rank correlations for \textbf{cross-section aspect ratio} at non-zero surface tension. For example, ${Re}_{ink}$ indicates a regression fit to $h/w = 10^c*Re_{ink}^b$. A Spearman rank correlation coefficient of -1 or 1 indicates a strong correlation. Variables are defined in table \ref{tab:variableDefs}.}
\label{tab:xs_aspectRegNonZero}
\begin{tabular}{llrrll}
                                  variables &       $r^2$ &     b &     c & spearman coeff &     spearman p \\
                                  $\bm{Ca}$ & $\bm{0.33}$ &  0.10 &  0.10 &    $\bm{0.67}$ & $\bm{1.1e-27}$ \\
                                 $Ca_{ink}$ &        0.04 &  0.05 &  0.14 &           0.25 &        3.3e-04 \\
                            $\bm{Ca_{sup}}$ & $\bm{0.26}$ &  0.10 &  0.10 &    $\bm{0.61}$ & $\bm{3.9e-22}$ \\
                

In [8]:
# Regression table for the normalized bottom position from the video summary,
# printed but not exported. The result is not assigned, so the notebook
# displays the returned value (a list of tables, per the cell output).
# NOTE(review): the printed caption still describes a fit to
# "h/w = 10^c*Re_{ink}^b" and "log-scaled variables" even though this call is
# for bottom position with logy=False; the caption text comes from
# metricPlots and may need adjusting there.
mp.regressionTable(vs, 'vertDispBotN', nickname='bottom position', export=False, printOut=True, logy=False)

\begin{table}
\centering
\caption[Linear regressions for bottom position at nonzero surface tension]{Table of linear regressions of log-scaled variables and Spearman rank correlations for \textbf{bottom position} at non-zero surface tension. For example, ${Re}_{ink}$ indicates a regression fit to $h/w = 10^c*Re_{ink}^b$. A Spearman rank correlation coefficient of -1 or 1 indicates a strong correlation. Variables are defined in table \ref{tab:variableDefs}.}
\label{tab:vertDispBotNRegNonZero}
\begin{tabular}{llrrll}
                              variables & $r^2$ &     b &     c & spearman coeff & spearman p \\
                                   $Ca$ &  0.00 & -0.02 &  0.39 &           0.02 &    8.1e-01 \\
                             $Ca_{ink}$ &  0.09 & -0.35 &  0.24 &          -0.26 &    1.5e-04 \\
                             $Ca_{sup}$ &  0.00 &  0.06 &  0.37 &           0.13 &    7.3e-02 \\
                     $Ca_{ink}Ca_{sup}$ &  0.02 & -0.09 &  0.36 &          -0.05 &    4.7e-

[                                 variables $r^2$         b     c  \
 0                                     $Ca$  0.00 -2.02e-02  0.39   
 1                               $Ca_{ink}$  0.09 -3.50e-01  0.24   
 2                               $Ca_{sup}$  0.00  5.98e-02  0.37   
 3                       $Ca_{ink}Ca_{sup}$  0.02 -9.06e-02  0.36   
 4                      $Ca_{ink}/Ca_{sup}$  0.06 -1.66e-01  0.28   
 0                             $d_{PR,ink}$  0.07  2.47e-01  0.06   
 1                             $d_{PR,sup}$  0.02 -6.62e-02  0.46   
 2                   $d_{PR,ink}d_{PR,sup}$  0.00  1.95e-03  0.38   
 3                  $d_{PR,ink}/d_{PR,sup}$  0.05  8.45e-02  0.37   
 0                     $d_{Est}/d_{PR,ink}$  0.10 -2.88e-01 -0.06   
 1                     $d_{Est}/d_{PR,sup}$  0.01  5.27e-02  0.46   
 2   $d_{Est}/d_{PR,ink}d_{Est}/d_{PR,sup}$  0.00 -2.81e-02  0.30   
 3  $d_{Est}/d_{PR,ink}/d_{Est}/d_{PR,sup}$  0.05 -8.45e-02  0.37   
 0                               $