<a href="https://colab.research.google.com/github/eudemo-studio/eudemo-portfolio/blob/master/visible_data_wrangling.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

**Section 1:** Import required packages into Python environment & connect to Google Drive 🐍

In [None]:
# Import numpy and pandas packages
import numpy as np
import pandas as pd

# Import library for connecting Google Colab to Google Drive
from google.colab import drive

# Connect Google Colab to Google Drive (eudemo.co).
# Every data path read or written later in this notebook lives under
# /content/drive/MyDrive, so this mount must succeed before those cells run.
drive.mount("/content/drive")

**Section 2:** Import HR & RR .txt datasets from Google Drive into Python environment ⬇️

In [None]:
# Folder on the mounted Drive that holds the raw .txt exports.
# Defined once so that relocating the project only requires editing this line.
RAW_DATA_DIR = "/content/drive/MyDrive/A1. Projects & Collaborations/015. Visible/workflow-python/raw_data"


def _read_recording(file_name):
    """Read one semicolon-separated .txt recording from RAW_DATA_DIR.

    Parameters
    ----------
    file_name : str
        Name of the file (including the .txt extension) inside RAW_DATA_DIR.
        Names are used verbatim, so capitalisation must match the file on Drive.

    Returns
    -------
    pandas.DataFrame
        The recording as parsed by ``pd.read_csv(..., sep=";")``.
    """
    return pd.read_csv(RAW_DATA_DIR + "/" + file_name, sep=";")


# Import Heart Rate (HR) .txt files (with semicolon separators)
# Heart Rate (HR) measured in Beats Per Minute (BPM)
HS_1204_HR_morning        = _read_recording("HS 12-04 HR morning.txt")
HS_1204_HR_evening        = _read_recording("HS 12-04 HR evening.txt")
HS_1304_HR_morning        = _read_recording("HS 13-04 HR Morning.txt")
HS_1304_HR_afternoon      = _read_recording("HS 13-04 HR Afternoon.txt")
HS_1304_HR_evening        = _read_recording("HS 13-04 HR Evening.txt")
HS_1404_HR_early_morning  = _read_recording("HS 14-04 HR Early Morning.txt")
HS_1404_HR_morning        = _read_recording("HS 14-04 HR Morning.txt")

# Import RR Interval (RR) .txt files (with semicolon separators)
# RR Interval (RR) measured in Milliseconds (ms)
HS_1204_RR_morning        = _read_recording("HS 12-04 RR morning.txt")
HS_1204_RR_evening        = _read_recording("HS 12-04 RR evening.txt")
HS_1304_RR_morning        = _read_recording("HS 13-04 RR Morning.txt")
HS_1304_RR_afternoon      = _read_recording("HS 13-04 RR Afternoon.txt")
HS_1304_RR_evening        = _read_recording("HS 13-04 RR Evening.txt")
HS_1404_RR_early_morning  = _read_recording("HS 14-04 RR Early Morning.txt")
HS_1404_RR_morning        = _read_recording("HS 14-04 RR Morning.txt")

**Section 3:** Bind the datasets together to form consolidated HR & RR dataframes 🤝

In [None]:
# Bind together datasets by rows, to form 'hr_df' & 'rr_df'.
# Each file was read with its own default 0..n-1 row index, so a plain concat
# would repeat index labels across recordings; ignore_index=True renumbers the
# combined rows so every row gets a unique label.
hr_df = pd.concat(
    [
        HS_1204_HR_morning,
        HS_1204_HR_evening,
        HS_1304_HR_morning,
        HS_1304_HR_afternoon,
        HS_1304_HR_evening,
        HS_1404_HR_early_morning,
        HS_1404_HR_morning,
    ],
    ignore_index=True,
)
rr_df = pd.concat(
    [
        HS_1204_RR_morning,
        HS_1204_RR_evening,
        HS_1304_RR_morning,
        HS_1304_RR_afternoon,
        HS_1304_RR_evening,
        HS_1404_RR_early_morning,
        HS_1404_RR_morning,
    ],
    ignore_index=True,
)

**Section 4:** Format the new dataframes - rename column headers & convert the timestamp column to datetime 🧹

In [None]:
# Tidy each frame in a single chain:
#   1. rename the headers so they contain no capitals or spaces
#   2. parse the 'date_time' strings into datetime values
hr_df = (
    hr_df
    .rename(columns={'Phone timestamp': 'date_time', 'HR [bpm]': 'hr_bpm'})
    .assign(date_time=lambda frame: pd.to_datetime(frame['date_time']))
)
rr_df = (
    rr_df
    .rename(columns={'Phone timestamp': 'date_time', 'RR-interval [ms]': 'rr_interval_ms'})
    .assign(date_time=lambda frame: pd.to_datetime(frame['date_time']))
)

**Section 5:** Export tidied dataframes to CSV 🚢

In [None]:
# Destination files inside the 'tidy_data' folder on the mounted Drive
hr_csv_path = "/content/drive/MyDrive/A1. Projects & Collaborations/015. Visible/workflow-python/tidy_data/hr.csv"
rr_csv_path = "/content/drive/MyDrive/A1. Projects & Collaborations/015. Visible/workflow-python/tidy_data/rr.csv"

# Write each tidied frame out as CSV. to_csv is left on its defaults, so the
# row index is written as an unnamed first column.
hr_df.to_csv(hr_csv_path)
rr_df.to_csv(rr_csv_path)