# Read Hydrography Master (June 2018) file

This R notebook reads (and cleans up) the Hydrography Master (June 2018) file that is provided at  
  
http://imars.marine.usf.edu/cariaco  

This .csv file is a collection of monthly sampled data from the CARIACO Ocean Time Series Station.

In [1]:
# Read only the first line of the raw file; it holds the column names.
# `as.is = TRUE` keeps the names as plain character strings.
# TRUE/FALSE are spelled out because T and F are ordinary variables that
# can be reassigned, whereas TRUE and FALSE are reserved words.
file <- "../../DataFiles_Raw/Master_Hydrography_June2018.csv"
header <- read.csv(file, header = FALSE, nrows = 1, as.is = TRUE)

# Skip the first five lines of the file (the header line and the empty
# rows below it) and read everything after them as unnamed data columns.
data <- read.csv(file, skip = 5, header = FALSE)

# Use the values of the header line as column names. `header` is a one-row
# data frame, so it is converted to a character vector explicitly.
colnames(data) <- as.character(header)

# clean up dataframe

In [2]:
# every cell equal to -9999 is replaced by NA
data <- replace(data, data == -9999, NA)

# drop the empty columns: the first one and columns 49 and 50
data <- data[, -c(1, 49, 50)]

# drop rows without a cruise number (these rows are full of NAs)
missing_cruise <- is.na(data$Cruise)
data <- data[!missing_cruise, ]

# convert date/time

In [3]:
# keep the original date text in its own column before it is overwritten
data$DateString <- data$Date

# parse the "YYYY/MM/DD" text into a POSIXlt date-time object
parsed_dates <- as.POSIXlt(data$DateString, format = "%Y/%m/%d")

# day of the year, taken from the POSIXlt `yday` component
# NOTE: `yday` is zero-based (1 January is 0, 31 December is 364 or 365)
data$yday <- parsed_dates$yday

# replace the text column with the parsed dates
data$Date <- parsed_dates

# the cleaned file is saved as a csv in the folder "DataFiles_Processed"

In [4]:
# Save the cleaned data frame as a CSV file.
# Row names are written as the first (unnamed) column, which is the
# write.csv default.
cleaned_file <- "../../DataFiles_Processed/Master_Hydrography_June2018_Cleaned.csv"
write.csv(data, file = cleaned_file)