In [None]:
from features import features
import numpy as np
from utils.ops import load_ml_image, load_sb_image
import matplotlib.pyplot as plt
import plotly.graph_objects as go


In [None]:
# Load the array stored at the path registered for the 'ArDS' feature.
# Later cells slice the result along three axes and call .max()/.flatten() on it.
ards_path = features['ArDS']['path_to_file']
df_data = load_ml_image(ards_path)

In [None]:
# One log-scaled histogram per year, stacked vertically.
# NOTE(review): assumes the last axis of df_data holds 24 consecutive slices
# per year, starting with 2017 — confirm against the data source.
year_0 = 2017
n_years = 7
steps_per_year = 24

# The global maximum does not change inside the loop; compute it once so that
# every panel shares the same bin range without re-scanning the full array.
value_max = df_data.max()

f, ax = plt.subplots(n_years, figsize=(10, 20))
for i in range(n_years):
    year = year_0 + i
    data = df_data[:, :, i * steps_per_year:(i + 1) * steps_per_year]
    ax[i].hist(data.flatten(), bins=30, log=True, rwidth=0.95, range=[0, value_max])
    ax[i].set_title(f'{year}')
f.tight_layout()
# plt.show() works on every backend; Figure.show() emits a warning on the
# non-GUI inline backend that notebooks use by default.
plt.show()
    

In [None]:
# Density histograms of the Train / Validation / Test slices, one panel each.
# Each entry maps a subset name to the [start, stop) bounds used on the last
# axis of df_data.
subsets = {
    'Train': [0, 72],
    'Validation': [72, 120],
    'Test': [120, 168]
}

# Shared bin range for all panels; computed once instead of once per subset.
value_max = df_data.max()

f, ax = plt.subplots(len(subsets), figsize=(8, 8))
for i, (key, (start, stop)) in enumerate(subsets.items()):
    data = df_data[:, :, start:stop]
    ax[i].hist(data.flatten(), bins=30, log=True, rwidth=0.95, range=[0, value_max], density=True)
    # The y axis is log-scaled, so a lower limit of 0 is invalid and Matplotlib
    # ignores it with a warning. Cap only the upper limit instead.
    ax[i].set_ylim(top=1)
    ax[i].set_title(f'{key}')
f.tight_layout()
# plt.show() works on every backend; Figure.show() warns on non-GUI backends.
plt.show()

In [None]:
# Overlay the density histograms of the three subsets on a single axis.
# Each entry maps a subset name to the [start, stop) bounds used on the last
# axis of df_data.
subsets = {
    'Train': [0, 72],
    'Validation': [72, 120],
    'Test': [120, 168]
}

# Derive the slices from `subsets` so the bounds are defined in one place only.
train_data = df_data[:, :, slice(*subsets['Train'])]
val_data = df_data[:, :, slice(*subsets['Validation'])]
test_data = df_data[:, :, slice(*subsets['Test'])]

# Shared bin range for all three histograms; computed once.
value_max = df_data.max()

f = plt.figure(figsize=(8, 4))
# (legend label, values, bar colour) — drawn in this order.
for subset_label, subset_values, subset_color in (
    ('Train', train_data, 'blue'),
    ('Validation', val_data, 'green'),
    ('Test', test_data, 'orange'),
):
    plt.hist(
        subset_values.flatten(),
        bins=30,
        log=True,
        rwidth=0.9,
        range=[0, value_max],
        density=True,
        alpha=0.6,
        label=subset_label,
        ec='black',
        color=subset_color,
    )
plt.legend(loc='upper right')
f.tight_layout()
# plt.show() works on every backend; Figure.show() warns on non-GUI backends.
plt.show()

In [None]:
# Interactive histogram (percent per bin, log y axis) of the three subsets.
train_data = df_data[:, :, 0:72]
val_data = df_data[:, :, 72:120]
test_data = df_data[:, :, 120:168]

# All traces share the same binning: from 0 to the global maximum, with a bin
# width of 1/30 of that maximum. The maximum is computed once here rather
# than twice per trace.
value_max = df_data.max()
bin_size = value_max / 30.

fig = go.Figure()
# (legend name, values, bar colour) — one histogram trace per subset.
for trace_name, subset_values, trace_color in (
    ('Train', train_data, 'blue'),
    ('Validation', val_data, 'red'),
    ('Test', test_data, 'green'),
):
    fig.add_trace(go.Histogram(
        x=subset_values.flatten(),
        histnorm='percent',
        name=trace_name,  # name used in legend and hover labels
        xbins=dict(start=0, end=value_max, size=bin_size),
        marker_color=trace_color,
        opacity=0.75
    ))
fig.update_yaxes(type="log")
fig.update_layout(
    title="Cells Samples Histograms",
    title_x=0.5,
    xaxis_title="Deforestation Area (Km2)",
    yaxis_title="Percent",
    legend_title="Subset"
)
fig.show()


In [None]:
# Interactive histogram (raw counts per bin, log y axis) of the three subsets.
train_data = df_data[:, :, 0:72]
val_data = df_data[:, :, 72:120]
test_data = df_data[:, :, 120:168]

# All traces share the same binning: from 0 to the global maximum, with a bin
# width of 1/30 of that maximum. The maximum is computed once here rather
# than twice per trace.
value_max = df_data.max()
bin_size = value_max / 30.

fig = go.Figure()
# (legend name, values, bar colour) — one histogram trace per subset.
for trace_name, subset_values, trace_color in (
    ('Train', train_data, 'blue'),
    ('Validation', val_data, 'red'),
    ('Test', test_data, 'green'),
):
    fig.add_trace(go.Histogram(
        x=subset_values.flatten(),
        name=trace_name,  # name used in legend and hover labels
        xbins=dict(start=0, end=value_max, size=bin_size),
        marker_color=trace_color,
        opacity=0.75
    ))
fig.update_yaxes(type="log")
fig.update_layout(
    title="Cells Samples Histograms",
    title_x=0.5,
    xaxis_title="Deforestation Area (Km2)",
    yaxis_title="Count",
    legend_title="Subset"
)
fig.show()


In [None]:
# Percent histogram of the three subsets, binned on [0, 1] in steps of 0.05
# and displayed with the x axis limited to that same interval.
train_data = df_data[:, :, 0:72]
val_data = df_data[:, :, 72:120]
test_data = df_data[:, :, 120:168]

fig = go.Figure()
# (legend name, values, bar colour) — traces are added in this order.
trace_specs = (
    ('Train', train_data, 'blue'),
    ('Validation', val_data, 'red'),
    ('Test', test_data, 'green'),
)
for trace_name, subset_values, trace_color in trace_specs:
    histogram = go.Histogram(
        x=subset_values.flatten(),
        histnorm='percent',
        name=trace_name,  # shown in the legend and in hover labels
        xbins=dict(start=0, end=1, size=0.05),
        marker_color=trace_color,
        opacity=0.75
    )
    fig.add_trace(histogram)

fig.update_yaxes(type="log")
fig.update_xaxes(range=[0, 1])
fig.update_layout(
    title="Cells Samples Histograms",
    title_x=0.5,
    xaxis_title="Deforestation Area (Km2)",
    yaxis_title="Percent",
    legend_title="Subset"
)
fig.show()


In [None]:
# Re-zoom the x axis of the current `fig` to the window [1.5, 4.5]. The call is
# the last expression of the cell, so its return value is what the notebook renders.
# NOTE(review): on a top-to-bottom run `fig` is the figure built in the preceding
# cell, whose bins only cover [0, 1] — confirm this window targets the intended figure.
x_window = [1.5, 4.5]
fig.update_xaxes(range=x_window)