In [1]:
import pint
import xarray as xr
from dask.distributed import Client
from seapopym.configuration.no_transport.parameter import ForcingParameters
from seapopym.configuration.parameters.parameter_forcing import ForcingUnit
from seapopym.standard.units import StandardUnitsLabels

from seapopym_optimization import (
    FunctionalGroupOptimizeNoTransport,
    GeneticAlgorithm,
    GeneticAlgorithmParameters,
    NoTransportCostFunction,
    Observation,
    Parameter,
    constraint,
)

Load forcing.


In [2]:
# Simulation window applied to both forcing datasets.
time_start, time_end = "1998-01-01", "2022-01-01"
time_window = slice(time_start, time_end)

# Forcing dataset holding "T": set its units attribute from the seapopym standard
# labels, clip to the window, then load the values into memory.
data = xr.open_dataset("../1_data_processing/1_1_Forcing/all_stations_cmems.zarr", engine="zarr")
data["T"].attrs["units"] = StandardUnitsLabels.temperature.units
data = data.sel(time=time_window).load()

# CAFE dataset: clip to the window, drop time steps that contain only missing
# values, interpolate linearly onto a daily time axis, then load into memory.
cafe_npp = (
    xr.open_dataset("../1_data_processing/1_1_Forcing/all_stations_cafe.zarr", engine="zarr")
    .sel(time=time_window)
    .dropna("time", how="all")
    .resample(time="D")
    .interpolate("linear")
    .load()
)

In [3]:
# Inspect the forcing dataset (it holds the "T" variable used as temperature forcing).
data

In [4]:
# Inspect the daily-interpolated dataset (it holds the "CAFE" variable used as primary production).
cafe_npp

Load observations.

First, the observations are multiplied by the average epipelagic layer depth (150 m) so that biomass is expressed per square metre (m⁻²) rather than per cubic metre (m⁻³).


In [5]:
def update_layer(data: xr.Dataset, epipelagic_size) -> xr.Dataset:
    """Scale observations by the epipelagic layer size and relabel the layer coordinate.

    The input is unit-quantified through the ``pint`` accessor, multiplied by
    ``epipelagic_size``, and its ``layer`` coordinate is replaced by the single
    value ``1`` while keeping the coordinate's attributes.

    Parameters
    ----------
    data
        Observations as returned by ``xr.open_dataset``; must have a ``layer``
        coordinate. NOTE(review): replacing the coordinate with ``[1]`` assumes
        the ``layer`` dimension has exactly one element -- confirm for new inputs.
    epipelagic_size
        Factor the quantified data is multiplied by (callers in this notebook
        pass a pint quantity in metres).

    Returns
    -------
    xr.Dataset
        The scaled observations with ``layer == [1]``.
    """
    scaled = data.pint.quantify() * epipelagic_size
    # Read the attributes only now (after quantify/multiply) so that exactly what
    # the scaled object carries is re-attached once the coordinate is replaced.
    layer_attrs = scaled["layer"].attrs
    scaled = scaled.assign_coords({"layer": [1]})
    scaled["layer"].attrs = layer_attrs
    return scaled


# Layer size the observations are multiplied by: 150 metres as a pint quantity.
epipelagic_size = 150 * pint.application_registry("meter")

# Each station follows the same pipeline: open the zarr store, scale it with
# update_layer, then wrap the result in an Observation.
obs_bats = Observation(
    update_layer(
        xr.open_dataset("../1_data_processing/1_1_Forcing/Bats_obs.zarr", engine="zarr"),
        epipelagic_size,
    )
)

obs_hot = Observation(
    update_layer(
        xr.open_dataset("../1_data_processing/1_1_Forcing/Hot_obs.zarr", engine="zarr"),
        epipelagic_size,
    )
)

obs_papa = Observation(
    update_layer(
        xr.open_dataset("../1_data_processing/1_1_Forcing/Papa_obs.zarr", engine="zarr"),
        epipelagic_size,
    )
)

# Order matters downstream: the cost function receives the stations in this order.
observations = [obs_bats, obs_hot, obs_papa]

Create structure for SeapoPym simulation.


In [6]:
# Both forcing fields are declared with the same resolution and timestep.
# NOTE(review): units of these two values are not visible here (presumably
# degrees and days) -- confirm against ForcingUnit.
shared_forcing_kwargs = {"resolution": 1 / 12, "timestep": 1}

forcing_parameters = ForcingParameters(
    temperature=ForcingUnit(forcing=data["T"], **shared_forcing_kwargs),
    primary_production=ForcingUnit(forcing=cafe_npp["CAFE"], **shared_forcing_kwargs),
)

|	CAFE unit is milligram / day / meter ** 2, it will be converted to kilogram / day / meter ** 2.
[0m


Setup the cost function.


In [7]:
def _build_functional_group(name, day_layer, night_layer):
    """Return a functional group whose five parameters are named ``<name>_<field>``.

    Every group built here shares the same numeric pairs for each parameter.
    NOTE(review): the two numbers passed to ``Parameter`` are presumably the
    lower and upper search bounds -- confirm against seapopym_optimization.
    """
    return FunctionalGroupOptimizeNoTransport(
        name=name,
        day_layer=day_layer,
        night_layer=night_layer,
        tr_rate=Parameter(f"{name}_tr_rate", -1, 0),
        tr_max=Parameter(f"{name}_tr_max", 0, 50),
        inv_lambda_rate=Parameter(f"{name}_inv_lambda_rate", 0, 1),
        inv_lambda_max=Parameter(f"{name}_inv_lambda_max", 0, 100),
        energy_coefficient=Parameter(f"{name}_energy_coefficient", 0.05, 0.8),
    )


# Two groups that differ only by name and day layer; both use night layer 1.
functional_groups = [
    _build_functional_group("D1N1", day_layer=1, night_layer=1),
    _build_functional_group("D2N1", day_layer=2, night_layer=1),
]

In [8]:
# Tie together the functional groups to optimize, the forcing fields and the
# three station observations into a single cost function object.
cost_function = NoTransportCostFunction(
    functional_groups=functional_groups,
    forcing_parameters=forcing_parameters,
    observations=observations,
)

Set the genetic algorithm meta parameters.


In [9]:
# The same weight is used for each of the three cost values.
# NOTE(review): presumably one weight per observation (three stations), with the
# negative sign selecting minimization -- confirm against GeneticAlgorithmParameters.
equal_weight = -(1 / 3)

# NGEN=10 and POP_SIZE=100 match the recorded logbook (generations 0-9, 100
# evaluations at generation 0). CXPB / MUTPB / INDPB / ETA are presumably the
# crossover, mutation, per-gene mutation probabilities and crowding factor --
# TODO confirm.
genetic_algo_parameters = GeneticAlgorithmParameters(
    ETA=1,
    INDPB=0.1,
    CXPB=0.5,
    MUTPB=0.2,
    NGEN=10,
    POP_SIZE=100,
    cost_function_weight=(equal_weight,) * 3,
    hall_of_fame_size=300,
)

Add a constraint that limits the sum of the energy transfer coefficients to 100%.


In [10]:
# Names of the energy-coefficient parameters of both functional groups; they
# must match the names given to the corresponding Parameter objects.
energy_coefficient_names = [f"{group}_energy_coefficient" for group in ("D1N1", "D2N1")]

# Constraint applied to those parameters with bounds 0 and 1 (per the notebook
# text, this caps the total energy transfer at 100%).
constraint_energy = constraint.ConstraintNoTransportEnergyCoefficient(
    parameters_name=energy_coefficient_names,
    min_energy_coef_value=0,
    max_energy_coef_value=1,
)

Finally, create the genetic algorithm.


In [11]:
# Start a Dask client with default settings (in the recorded run this created a
# LocalCluster with 4 workers). The client is never closed in this notebook.
client = Client()
# Assemble the optimizer from the cost function, the GA meta-parameters, the
# energy-coefficient constraint and the Dask client.
genetic_algo = GeneticAlgorithm(
    cost_function=cost_function,
    parameter_genetic_algorithm=genetic_algo_parameters,
    constraint=[constraint_energy],
    client=client,
)

And watch the magic on the Dask dashboard:


In [12]:
# Display the Dask client attached to the optimizer; its repr includes the dashboard link.
genetic_algo.client

0,1
Connection method: Cluster object,Cluster type: distributed.LocalCluster
Dashboard: http://127.0.0.1:8787/status,

0,1
Dashboard: http://127.0.0.1:8787/status,Workers: 4
Total threads: 8,Total memory: 16.00 GiB
Status: running,Using processes: True

0,1
Comm: tcp://127.0.0.1:51557,Workers: 4
Dashboard: http://127.0.0.1:8787/status,Total threads: 8
Started: Just now,Total memory: 16.00 GiB

0,1
Comm: tcp://127.0.0.1:51570,Total threads: 2
Dashboard: http://127.0.0.1:51572/status,Memory: 4.00 GiB
Nanny: tcp://127.0.0.1:51560,
Local directory: /var/folders/36/grrgsqjd14j4tf6cf5ty4ykh0000gn/T/dask-scratch-space/worker-epe32n4l,Local directory: /var/folders/36/grrgsqjd14j4tf6cf5ty4ykh0000gn/T/dask-scratch-space/worker-epe32n4l

0,1
Comm: tcp://127.0.0.1:51569,Total threads: 2
Dashboard: http://127.0.0.1:51571/status,Memory: 4.00 GiB
Nanny: tcp://127.0.0.1:51562,
Local directory: /var/folders/36/grrgsqjd14j4tf6cf5ty4ykh0000gn/T/dask-scratch-space/worker-pnsbx81p,Local directory: /var/folders/36/grrgsqjd14j4tf6cf5ty4ykh0000gn/T/dask-scratch-space/worker-pnsbx81p

0,1
Comm: tcp://127.0.0.1:51568,Total threads: 2
Dashboard: http://127.0.0.1:51573/status,Memory: 4.00 GiB
Nanny: tcp://127.0.0.1:51564,
Local directory: /var/folders/36/grrgsqjd14j4tf6cf5ty4ykh0000gn/T/dask-scratch-space/worker-_qw2kptt,Local directory: /var/folders/36/grrgsqjd14j4tf6cf5ty4ykh0000gn/T/dask-scratch-space/worker-_qw2kptt

0,1
Comm: tcp://127.0.0.1:51577,Total threads: 2
Dashboard: http://127.0.0.1:51578/status,Memory: 4.00 GiB
Nanny: tcp://127.0.0.1:51566,
Local directory: /var/folders/36/grrgsqjd14j4tf6cf5ty4ykh0000gn/T/dask-scratch-space/worker-ee3rg8jf,Local directory: /var/folders/36/grrgsqjd14j4tf6cf5ty4ykh0000gn/T/dask-scratch-space/worker-ee3rg8jf


And execute the process.


In [13]:
# Run the optimization. The returned object exposes the logbook and the plotting
# helpers (box_plot, parallel_coordinates) used in the following cells.
viewer = genetic_algo.optimize()

[38;21m2024-10-16 21:48:20,059 :: Seapodym ::  DEBUG ::
|	Direct computation for global_mask_from_nan.
[0m
[38;21m2024-10-16 21:48:20,062 :: Seapodym ::  DEBUG ::
|	Direct computation for global_mask_from_nan.
[0m
[38;21m2024-10-16 21:48:20,063 :: Seapodym ::  DEBUG ::
|	Direct computation for global_mask_from_nan.
[0m
[38;21m2024-10-16 21:48:20,065 :: Seapodym ::  DEBUG ::
|	Direct computation for mask_by_fgroup.
[0m
[38;21m2024-10-16 21:48:20,065 :: Seapodym ::  DEBUG ::
|	Direct computation for mask_by_fgroup.
[0m
[38;21m2024-10-16 21:48:20,066 :: Seapodym ::  DEBUG ::
|	Direct computation for mask_by_fgroup.
[0m
[38;21m2024-10-16 21:48:20,067 :: Seapodym ::  DEBUG ::
|	Direct computation for global_mask_from_nan.
[0m
[38;21m2024-10-16 21:48:20,071 :: Seapodym ::  DEBUG ::
|	Direct computation for mask_by_fgroup.
[0m
[38;21m2024-10-16 21:48:20,075 :: Seapodym ::  DEBUG ::
|	Direct computation for _wrapper_mesh_day_lengths.
[0m
[38;21m2024-10-16 21:48:20,078 :: Sea

In [14]:
# Per-generation statistics of the run (evaluations, avg/std/min/max, valid/invalid counts).
viewer.logbook

Unnamed: 0,gen,nevals,avg,std,min,max,nvalide,ninvalide
0,0,100,1.8e-05,3.1e-05,1.332802e-07,0.000323,192,108
1,1,68,1.6e-05,2.8e-05,1.252992e-07,0.000315,276,24
2,2,59,1.4e-05,1.9e-05,1.252992e-07,4.2e-05,285,15
3,3,71,1.4e-05,1.9e-05,1.252992e-07,4.2e-05,285,15
4,4,62,1.4e-05,1.9e-05,1.252992e-07,4.2e-05,294,6
5,5,82,1.4e-05,1.9e-05,1.252992e-07,4.2e-05,297,3
6,6,63,1.5e-05,1.9e-05,1.212027e-07,5e-05,300,0
7,7,64,1.4e-05,1.9e-05,1.212027e-07,4.2e-05,285,15
8,8,55,1.4e-05,1.9e-05,1.212027e-07,4.2e-05,288,12
9,9,64,1.4e-05,1.9e-05,1.208507e-07,4.2e-05,288,12


Finally, here are the results:


In [15]:
# Box plot of the optimization result.
# NOTE(review): the meaning of the argument 4 is not visible in this notebook -- confirm.
viewer.box_plot(4)

In [16]:
# Parallel-coordinates plot of the optimization result (presumably one axis per optimized parameter -- confirm).
viewer.parallel_coordinates()