import numpy as np
import pandas as pd
import csv
import os
import glob
import datetime

# Load every raw CSV in ../data/ and stack them into one DataFrame.
#
# The merged result is written back into ../data/ at the end of this script,
# so that file has to be excluded here; otherwise a second run would read the
# script's own output as if it were another raw input file.
output_name = "JOISS_dataset.csv"

# Sort the paths so the row order of the merged frame is reproducible
# (glob returns files in arbitrary, filesystem-dependent order).
file_list = sorted(
    path
    for path in glob.glob("../data/*.csv")
    if os.path.basename(path) != output_name
)

# Fail with a clear message instead of pandas' "No objects to concatenate".
if not file_list:
    raise FileNotFoundError("No input CSV files found in ../data/")

# Each file is EUC-KR encoded; the first 26 lines are skipped before the
# header row (presumably a metadata preamble - confirm against a raw file).
list_of_dataframes = [
    pd.read_csv(filename, encoding='euc-kr', skiprows=26)
    for filename in file_list
]

# ignore_index=True gives the merged frame one unique running row index
# rather than repeating each file's own 0..n-1 labels.
merged_df = pd.concat(list_of_dataframes, ignore_index=True)

# Parse the raw timestamp strings into datetimes, replacing the column in
# place. errors='raise' makes any value that does not match the format abort
# the script instead of silently becoming NaT.
timestamp_col = 'yyyy-mm-dd hh:mm:ss'
merged_df[timestamp_col] = pd.to_datetime(
    merged_df[timestamp_col],
    format='%Y-%m-%d %H:%M:%S',
    errors='raise',
)

# Split the timestamp into separate date and time-of-day text columns.
# NOTE(review): the column is labelled 'mon/day/yr' but the values are
# formatted with dashes (mm-dd-yyyy) - confirm this is what the consumer of
# the output file expects.
timestamps = merged_df[timestamp_col]
merged_df['mon/day/yr'] = timestamps.dt.strftime('%m-%d-%Y')
merged_df['hh:mm'] = timestamps.dt.strftime('%H:%M')

# Total PCBs: the seven individual 폴리염화바이페닐 (polychlorinated biphenyl)
# columns added together, left to right. Plain Series addition is used, so a
# missing value in any one column makes the total for that row missing too.
pcb_columns = [
    '폴리염화바이페닐-28[μg/kg]',
    '폴리염화바이페닐-52[μg/kg]',
    '폴리염화바이페닐-101[μg/kg]',
    '폴리염화바이페닐-118[μg/kg]',
    '폴리염화바이페닐-138[μg/kg]',
    '폴리염화바이페닐-153[μg/kg]',
    '폴리염화바이페닐-180[μg/kg]',
]
pcb_total = merged_df[pcb_columns[0]]
for pcb_column in pcb_columns[1:]:
    pcb_total = pcb_total + merged_df[pcb_column]
merged_df['PCBs[μg/kg]'] = pcb_total

# Map the source column headers (mostly Korean) to the English labels used in
# the output file. Only the labels change; no values are converted.
# NOTE(review): a few target labels carry a different unit from the source
# column (e.g. dissolved oxygen mg/L -> 'DO[ml/l]', salinity permille ->
# 'PSU') - confirm that relabelling without conversion is intended.
column_labels = {
    # Sample identification and position in the water column
    "project_name": "Cruise",
    "station": "Station",
    "bot.depth[m]": "Bot. Depth [m]",
    "수심(m)": "Depth [m]",
    # Physical and general water-quality measurements
    "수온[℃]": "Temperature [℃]",
    "염분[‰]": "Salinity [PSU]",
    "용존산소[mg/L]": "DO[ml/l]",
    "클로로필-a[mg/m3]": "Chl.a[mg/m3]",
    "수소이온농도[무단위]": "pH",
    "총질소[wt.%]": "TN",
    "총인[mg/L]": "TP",
    # Metals
    "구리[μg/kg]": "Cu[μg/kg]",
    "납[μg/kg]": "Pb[μg/kg]",
    "아연[μg/kg]": "Zn[μg/kg]",
    "카드뮴[μg/kg]": "Cd[μg/kg]",
    "6가크롬[μg/kg]": "Cr6+[μg/kg]",
    "비소[μg/kg]": "As[μg/kg]",
    # Remaining bulk parameters
    "부유물질 농도[mg/L]": "SS[mg/L]",
    "화학적산소요구량[mg/L]": "COD[mg/L]",
    "총유기탄소[mg/L]": "TOC[mg/L]",
    "총수은[mg/L]": "Hg[mg/L]",
    "투명도[m]": "Transparency[m]",
}

# Rename in place; source headers that are absent from merged_df are ignored.
merged_df.rename(columns=column_labels, inplace=True)

# Columns required by the output layout that this script never fills from the
# raw files. Appending them through reindex creates each one as an all-NaN
# column.
placeholder_columns = [
    'DO saturation(%)', 'NO3-[μmol/kg]', 'SiO4-[μmol/kg]', 'Type',
    'NH4+[μmol/kg]', 'DIC[μmol/kg]', 'Sigma-t [kg/m3]', 'PAR[μE/ cm2s1]',
    'Potential', 'NO2-[μmol/kg]', 'POC', 'Fluorescence[mg/m3]',
    'PO4-[μmol/kg]', 'Alk[μmol/kg]', 'ISUS nitrate[μmol/kg]',
    'DO titration[μmol/kg]', 'TEP', 'PON', 'DO[μmol/kg]', 'Cond[S/m]',
]
df = merged_df.reindex(columns=list(merged_df.columns) + placeholder_columns)

# Final column order of the exported file. Selecting by this list raises
# KeyError if any listed column is missing from the frame.
output_columns = [
    'Cruise', 'Station', 'Type', 'mon/day/yr', 'hh:mm',
    'Longitude [degrees_east]', 'Latitude [degrees_south]',
    'Bot. Depth [m]', 'Depth [m]', 'Temperature [℃]', 'Salinity [PSU]',
    'Potential', 'Sigma-t [kg/m3]',
    'DO[μmol/kg]', 'DO[ml/l]', 'DO saturation(%)', 'DO titration[μmol/kg]',
    'Fluorescence[mg/m3]', 'PAR[μE/ cm2s1]', 'Cond[S/m]', 'Chl.a[mg/m3]',
    'DIC[μmol/kg]', 'Alk[μmol/kg]', 'pH', 'TEP',
    'PO4-[μmol/kg]', 'NH4+[μmol/kg]', 'NO2-[μmol/kg]', 'NO3-[μmol/kg]',
    'SiO4-[μmol/kg]', 'TN', 'TP', 'ISUS nitrate[μmol/kg]', 'POC', 'PON',
    'PCBs[μg/kg]', 'Cu[μg/kg]', 'Pb[μg/kg]', 'Zn[μg/kg]', 'Cd[μg/kg]',
    'Cr6+[μg/kg]', 'As[μg/kg]',
    'SS[mg/L]', 'COD[mg/L]', 'TOC[mg/L]', 'Hg[mg/L]', 'Transparency[m]',
]
JOISS_dataset = df[output_columns]

# Replace every missing value, including the all-NaN placeholder columns,
# with 0 before export.
# NOTE(review): after this step a missing measurement is indistinguishable
# from a measured 0 - confirm that is acceptable for the output's consumers.
df = JOISS_dataset.fillna(0)

# Write the result as EUC-KR; the row index is written as the first column.
df.to_csv("../data/JOISS_dataset.csv", encoding='euc-kr')