# Turbidity Data Merging
Merge all labeled turbidity data into a single file.

In [1]:
import pandas as pd

In [2]:
# Locations of the three labeled turbidity CSV files (SKP, FPT and PP).
turb_SKP_path = '../Data/labeled_data/ground_truths/turb/turb_skp/julian_time/turb_SKP_0k-300k_labeled.csv'
turb_FPT_path = '../Data/labeled_data/ground_truths/turb/turb_fpt/julian_time/turb_FPT_0k-300k_labeled.csv'
turb_PP_path = '../Data/labeled_data/ground_truths/turb/turb_pp/julian_time/turb_pp_0k-300k_labeled.csv'

# Read each file and index it by its 'timestamp_of_peak' column so that rows
# from the different files can later be matched on that timestamp.
skp = pd.read_csv(turb_SKP_path).set_index('timestamp_of_peak')
fpt = pd.read_csv(turb_FPT_path).set_index('timestamp_of_peak')
pp = pd.read_csv(turb_PP_path).set_index('timestamp_of_peak')

In [3]:
# Peak precedence, highest first: when the same timestamp appears in more
# than one frame, the row from the earlier-listed frame is the one kept.
TOP, SECOND, THIRD = skp, pp, fpt

In [5]:
# Stack the frames in precedence order, then order rows by the
# 'timestamp_of_peak' index. The sort must be stable so that rows sharing a
# timestamp stay in precedence order (TOP before SECOND before THIRD).
df = (
    pd.concat([TOP, SECOND, THIRD])
    .sort_index(kind='stable')
)

# For each timestamp keep only the first (highest-precedence) row.
is_repeat = df.index.duplicated(keep='first')
df = df.loc[~is_repeat]

# Collapse every value matching the pattern into the single label "NAP".
# NOTE(review): the pattern is unanchored and is applied to every column, so
# it looks like any string containing a capital 'N' is rewritten from that
# 'N' onward -- confirm that only the intended label values can match.
final = df.replace(regex=True, to_replace='N(.*)', value="NAP")

In [6]:
# Write the merged frame (index included) to a single CSV file.
filename = '../Data/labeled_data/ground_truths/turb/turb_all_julian_0k-300k.csv'
final.to_csv(path_or_buf=filename)