Download the Bar Crawl: Detecting Heavy Drinking dataset used in this notebook from: https://archive.ics.uci.edu/dataset/515/bar+crawl+detecting+heavy+drinking

In [1]:
from tigertail import TimeFrame, TimeSeries, EventSeries
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt

In [6]:
# get the TAC (transdermal alcohol content) data for subject SA0297

SA0297_TAC_path = '../data/bar-crawl-detecting-heavy-drinking/clean_tac/SA0297_clean_TAC.csv'
SA0297_TAC_df = pd.read_csv(SA0297_TAC_path).set_index('timestamp')
# SA0297_TAC_df.index.name = None
SA0297_TAC_df

Unnamed: 0_level_0,TAC_Reading
timestamp,Unnamed: 1_level_1
1493716723,-0.010229
1493718546,-0.002512
1493718863,0.003249
1493719179,0.005404
1493719495,0.003377
1493719811,-0.001451
1493720127,-0.005816
1493720443,-0.006248
1493720759,-0.001631
1493721075,0.005332


In [8]:
CC6740_TAC_path = '../data/bar-crawl-detecting-heavy-drinking/clean_tac/CC6740_clean_TAC.csv'
CC6740_TAC_df = pd.read_csv(CC6740_TAC_path).set_index('timestamp')
# SA0297_TAC_df.index.name = None
CC6740_TAC_df

Unnamed: 0_level_0,TAC_Reading
timestamp,Unnamed: 1_level_1
1493723434,0.003947
1493725257,0.000898
1493725585,-0.000894
1493725900,-0.001021
1493726214,-0.000139
1493726528,0.000598
1493726843,0.000457
1493727157,-0.000335
1493727471,-0.000855
1493727785,-0.000387


In [11]:
TAC_df = pd.concat([SA0297_TAC_df, CC6740_TAC_df], axis=1, keys=['SA0297', 'CC6740'])
TAC_df

Unnamed: 0_level_0,SA0297,CC6740
Unnamed: 0_level_1,TAC_Reading,TAC_Reading
timestamp,Unnamed: 1_level_2,Unnamed: 2_level_2
1493716723,-0.010229,
1493718546,-0.002512,
1493718863,0.003249,
1493719179,0.005404,
1493719495,0.003377,
...,...,...
1493802423,,0.028566
1493804265,,0.018062
1493806093,,0.009171
1493807921,,0.005121


In [7]:
accelerometer_path = '../data/bar-crawl-detecting-heavy-drinking/all_accelerometer_data_pids_13.csv'
accelerometer_df = pd.read_csv(accelerometer_path).set_index('time')
accelerometer_df

Unnamed: 0_level_0,pid,x,y,z
time,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
0,JB3156,0.000000,0.000000,0.000000
0,CC6740,0.000000,0.000000,0.000000
1493733882409,SA0297,0.075800,0.027300,-0.010200
1493733882455,SA0297,-0.035900,0.079400,0.003700
1493733882500,SA0297,-0.242700,-0.086100,-0.016300
...,...,...,...,...
1493829248196,CC6740,-0.133956,0.124726,-0.010736
1493829248220,CC6740,-0.100764,0.180872,0.046449
1493829248245,CC6740,-0.131853,0.195934,0.181088
1493829248270,CC6740,-0.149704,0.194482,0.202393


In [12]:
SA0297_mask = accelerometer_df['pid'] == 'SA0297'
SA0297_accelerometer_df = pd.DataFrame(accelerometer_df[SA0297_mask])
SA0297_accelerometer_df

Unnamed: 0_level_0,pid,x,y,z
time,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
1493733882409,SA0297,0.0758,0.0273,-0.0102
1493733882455,SA0297,-0.0359,0.0794,0.0037
1493733882500,SA0297,-0.2427,-0.0861,-0.0163
1493733883945,SA0297,-0.2888,0.0514,-0.0145
1493733883953,SA0297,-0.0413,-0.0184,-0.0105
...,...,...,...,...
1493824735596,SA0297,-0.0107,0.0801,0.0840
1493824735641,SA0297,0.0132,0.0835,0.0493
1493824735686,SA0297,0.0480,-0.0071,0.1374
1493824735731,SA0297,0.0597,-0.0426,-0.1090


In [16]:
SA0297_accelerometer_df = SA0297_accelerometer_df.loc[~SA0297_accelerometer_df.index.duplicated(keep='first')]
SA0297_accelerometer_df

Unnamed: 0_level_0,pid,x,y,z
time,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
1493733882409,SA0297,0.0758,0.0273,-0.0102
1493733882455,SA0297,-0.0359,0.0794,0.0037
1493733882500,SA0297,-0.2427,-0.0861,-0.0163
1493733883945,SA0297,-0.2888,0.0514,-0.0145
1493733883953,SA0297,-0.0413,-0.0184,-0.0105
...,...,...,...,...
1493824735596,SA0297,-0.0107,0.0801,0.0840
1493824735641,SA0297,0.0132,0.0835,0.0493
1493824735686,SA0297,0.0480,-0.0071,0.1374
1493824735731,SA0297,0.0597,-0.0426,-0.1090


In [18]:
SA0297_df = pd.concat([SA0297_accelerometer_df, SA0297_TAC_df], axis=1)
SA0297_df

Unnamed: 0,pid,x,y,z,TAC_Reading
1493733882409,SA0297,0.0758,0.0273,-0.0102,
1493733882455,SA0297,-0.0359,0.0794,0.0037,
1493733882500,SA0297,-0.2427,-0.0861,-0.0163,
1493733883945,SA0297,-0.2888,0.0514,-0.0145,
1493733883953,SA0297,-0.0413,-0.0184,-0.0105,
...,...,...,...,...,...
1493798799,,,,,0.008145
1493800622,,,,,0.010223
1493802445,,,,,0.006509
1493804271,,,,,-0.004768


In [9]:
SA0297_ts = TimeSeries(SA0297_TAC_df, agg_func=np.mean)
CC6740_ts = TimeSeries(CC6740_TAC_df, agg_func=np.mean)

