# Sea Surface Temperature Time-Series Analysis

Info: Sea surface temperature (SST) measured in degrees Celsius, from 2 sources: Reynolds Optimum Interpolation Sea Surface Temperature (ROISST) and Hadley Centre Sea Ice and Sea Surface Temperature (HadISST).

Insight: As surface water warms, the stratification, or layering, becomes even more pronounced, suppressing mixing even further. As a result, nutrient transfer from deeper water to surface waters declines, and so does phytoplankton productivity.

In [1]:
import pandas as pd

#### Reading & Cleaning datasets

In [6]:
# Load the point A ROI2sst CSV on its own and show it as the cell output.
# The path is relative, so it is resolved against the kernel's working directory.
roi_point_a_csv = 'Documents/GitHub/CommunicatingDataScience/Nauplius data (raw)/point A/dataRSST_ROI2sst.csv'
df = pd.read_csv(roi_point_a_csv)
df

FileNotFoundError: [Errno 2] No such file or directory: 'Documents/GitHub/CommunicatingDataScience/Nauplius data (raw)/point A/dataRSST_ROI2sst.csv'

In [5]:
# Build a nested mapping: geo-point -> {'sst_roi': DataFrame, 'sst_had': DataFrame}.
# Every point folder holds one ROI CSV and one HAD CSV with the same file names,
# so the paths are generated from a single template instead of being typed six
# times (the hand-written version had a stray './/' in one of them).
# Paths are relative: run the notebook from the folder containing 'Nauplius data (raw)'.
sst_files = {'sst_roi': 'dataRSST_ROI2sst.csv',
             'sst_had': 'dataRSST_HadISST.csv'}
geopoint = {point: {key: pd.read_csv(f'./Nauplius data (raw)/point {point}/{filename}')
                    for key, filename in sst_files.items()}
            for point in ('A', 'B', 'C')}

# Cleaning all datasets (in place, so the frames stored in `geopoint` are updated)
for point in geopoint:
    # Accessing dataframes
    df_roi = geopoint[point]['sst_roi']
    df_had = geopoint[point]['sst_had']
    # Dropping the last column, which is expected to be an empty unnamed NaN column.
    # NOTE(review): the drop is unconditional - confirm every raw CSV really ends
    # with such a column, otherwise real data is removed here.
    df_roi.drop(columns=df_roi.columns[-1], inplace=True)
    df_had.drop(columns=df_had.columns[-1], inplace=True)
    # Renaming the sea surface temp column to a short label; rename() silently
    # leaves the frame unchanged if the raw header does not match exactly.
    df_roi.rename(columns={'TEMP= Reynolds OI-SST-v2 Temperature (C)': 'Reynolds Temp (C)'}, inplace=True)
    df_had.rename(columns={'HSST= HadISST Temperature (C)': 'Hadley Temp (C)'}, inplace=True)

# Display 2 random datasets as a sanity check of the cleaning
display(geopoint['B']['sst_had'], geopoint['C']['sst_roi'])

FileNotFoundError: [Errno 2] No such file or directory: './Nauplius data (raw)/point A/dataRSST_ROI2sst.csv'

#### Comparison of all datasets: 1 graph per geopoint (A,B,C) and 2 lineplots per graph (ROI, HAD)

In [None]:
import plotly.graph_objs as go

# Draw one figure per geo-point (A, B, C) with the ROI and HAD series overlaid.
for point in geopoint:
    df_roi = geopoint[point]['sst_roi']
    df_had = geopoint[point]['sst_had']
    # One line trace per source. The y columns are the short names assigned by
    # the rename step of the cleaning loop ('Reynolds Temp (C)' previously had
    # an extra ')' here, which raised KeyError).
    trace1 = go.Scatter(x=df_roi['DATE-YMD'], y=df_roi['Reynolds Temp (C)'], mode='lines', name='ROI')
    trace2 = go.Scatter(x=df_had['DATE-YMD'], y=df_had['Hadley Temp (C)'], mode='lines', name='HAD')
    # Layout: the title now names the quantity actually plotted (sea surface
    # temperature, matching the y-axis) rather than chlorophyll-A.
    layout = go.Layout(title=f'Sea Surface Temperature Time Series on Point {point}',
                       xaxis=dict(title='Date', dtick='M12'),  # a tick every 12 months
                       yaxis=dict(title='Sea Surface Temperature (C)', dtick=2),  # a tick every 2 units
                       height=800, width=1200,
                       template='plotly_dark')
    # Create the figure from both traces and render it
    fig = go.Figure(data=[trace1, trace2], layout=layout)
    fig.show()