In [1]:
import yaml
import xarray as xr
import os
from src.download_copernicus_data import download_copernicus_data

# Load the download configuration that the cells below pass around as `config`.
# An explicit encoding keeps parsing independent of the platform's default locale.
with open('download_config.yaml', 'r', encoding='utf-8') as file:
    config = yaml.safe_load(file)

# yaml.safe_load returns None for an empty document; later cells call
# `config.get(...)`, so fail here with a clear message instead of an
# AttributeError further down the notebook.
if not isinstance(config, dict):
    raise ValueError(
        "download_config.yaml must contain a top-level mapping, "
        f"got {type(config).__name__}"
    )

  from .autonotebook import tqdm as notebook_tqdm
INFO - 2025-12-05T15:44:12Z - Checking if credentials are valid.
INFO:copernicusmarine:Checking if credentials are valid.
INFO - 2025-12-05T15:44:13Z - Valid credentials from input username and password.
INFO:copernicusmarine:Valid credentials from input username and password.


In [2]:
# Build the bathymetry file from the GEBCO grid.
# The GEBCO file has 'elevation' (m), positive up.
gebco = xr.open_dataset('rawdata/GEBCO_15_Oct_2025/gebco_2025_n68.0_s61.0_w-30.0_e-10.0.nc')

# 1) Convert to positive depth (ocean depth in meters); land becomes negative
#    after the sign flip and is clipped to 0.
deptho = (-gebco['elevation']).clip(min=0)

# 2) Mask land and very shallow water: only cells deeper than min_depth_m are kept,
#    everything else (including the 0-valued land cells) is replaced by the
#    `where` fill value.
min_depth_m = 10
deptho = deptho.where(deptho > min_depth_m)

# 3) Rename coords to match your model dataset expectations
deptho = deptho.rename({'lat': 'latitude', 'lon': 'longitude'})

# 4) Save as the bathy file your pipeline expects.
#    The target directory comes from config['directories']['data_dir'], with a
#    fallback when either key is absent.
bathy_savedir = config.get('directories', {}).get('data_dir', 'rawdata/copernicus')
# exist_ok=True replaces the separate existence check, so there is no window
# between checking and creating the directory.
os.makedirs(bathy_savedir, exist_ok=True)

xr.Dataset({'deptho': deptho}).to_netcdf(os.path.join(bathy_savedir, 'bathy.nc'))

### Physical datasets:

In [None]:
# Variables to request, keyed by the Copernicus dataset ID they are read from.
phy_my_variables = ["thetao", "uo", "vo", "so"]
dataset_phy_my = {"cmems_mod_glo_phy_my_0.083deg_P1D-m": phy_my_variables}

# Run the project download helper with the shared config; the result file
# name is given by output_file_name.
download_copernicus_data(
    config,
    datasets=dataset_phy_my,
    output_file_name='phy_features_my.nc',
)

INFO:download_copernicus_data:Downloading data from 2010-01-01 to 2025-08-31
INFO:download_copernicus_data:Dataset cmems_mod_glo_phy_my_0.083deg_P1D-m not downloaded, downloading...


Downloading cmems_mod_glo_phy_my_0.083deg_P1D-m... with variables ['thetao', 'uo', 'vo', 'so']


INFO - 2025-10-16T16:00:49Z - Selected dataset version: "202311"
INFO:copernicusmarine:Selected dataset version: "202311"
INFO - 2025-10-16T16:00:49Z - Selected dataset part: "default"
INFO:copernicusmarine:Selected dataset part: "default"
INFO - 2025-10-16T16:00:51Z - Starting download. Please wait...
INFO:copernicusmarine:Starting download. Please wait...
100%|██████████| 7956/7956 [40:20<00:00,  3.29it/s]
INFO - 2025-10-16T16:41:13Z - Successfully downloaded to temporary_download_dir/cmems_mod_glo_phy_my_0.083deg_P1D-m_lat61_68_lon-30_-10_depths_2010-01-01_2025-08-31.nc
INFO:copernicusmarine:Successfully downloaded to temporary_download_dir/cmems_mod_glo_phy_my_0.083deg_P1D-m_lat61_68_lon-30_-10_depths_2010-01-01_2025-08-31.nc
INFO:download_copernicus_data:Merging files...


Merged dataset saved to temporary_download_dir/copernicus_data.nc
Checking first day to adjust target depths...
Adjusting 871 problematic points...
Processing variables to extract bottom layers...
Saving bottom features to datafiles/phy_features_my.nc


INFO:download_copernicus_data:Bottom features saved to datafiles/phy_features_my.nc
INFO:download_copernicus_data:Temporary directory temporary_download_dir deleted.




In [5]:
# Variables to request, keyed by the Copernicus dataset ID they are read from.
phy_myint_variables = ["thetao", "uo", "vo", "so"]
dataset_phy_myint = {"cmems_mod_glo_phy_myint_0.083deg_P1D-m": phy_myint_variables}

# Run the project download helper with the shared config; the result file
# name is given by output_file_name.
download_copernicus_data(
    config,
    datasets=dataset_phy_myint,
    output_file_name='phy_features_myint.nc',
)

INFO:download_copernicus_data:Downloading data from 2010-01-01 to 2025-08-31
INFO:download_copernicus_data:Dataset cmems_mod_glo_phy_myint_0.083deg_P1D-m not downloaded, downloading...


Downloading cmems_mod_glo_phy_myint_0.083deg_P1D-m... with variables ['thetao', 'uo', 'vo', 'so']


INFO - 2025-10-16T16:54:04Z - Selected dataset version: "202311"
INFO:copernicusmarine:Selected dataset version: "202311"
INFO - 2025-10-16T16:54:04Z - Selected dataset part: "default"
INFO:copernicusmarine:Selected dataset part: "default"
INFO - 2025-10-16T16:54:07Z - Starting download. Please wait...
INFO:copernicusmarine:Starting download. Please wait...
100%|██████████| 668/668 [06:18<00:00,  1.76it/s]
INFO - 2025-10-16T17:00:25Z - Successfully downloaded to temporary_download_dir/cmems_mod_glo_phy_myint_0.083deg_P1D-m_lat61_68_lon-30_-10_depths_2010-01-01_2025-08-31.nc
INFO:copernicusmarine:Successfully downloaded to temporary_download_dir/cmems_mod_glo_phy_myint_0.083deg_P1D-m_lat61_68_lon-30_-10_depths_2010-01-01_2025-08-31.nc
INFO:download_copernicus_data:Merging files...


Merged dataset saved to temporary_download_dir/copernicus_data.nc
Checking first day to adjust target depths...
Adjusting 871 problematic points...
Processing variables to extract bottom layers...
Saving bottom features to datafiles/phy_features_myint.nc


INFO:download_copernicus_data:Bottom features saved to datafiles/phy_features_myint.nc
INFO:download_copernicus_data:Temporary directory temporary_download_dir deleted.


### Bio datasets:

In [None]:
# Variables to request, keyed by the Copernicus dataset ID they are read from.
bio_my_variables = ["chl", "no3", "nppv", "o2", "po4", "si"]
dataset_bio_my = {"cmems_mod_glo_bgc_my_0.25deg_P1D-m": bio_my_variables}

# Run the project download helper with the shared config; the result file
# name is given by output_file_name.
download_copernicus_data(
    config,
    datasets=dataset_bio_my,
    output_file_name='bio_features_my.nc',
)

INFO:download_copernicus_data:Downloading data from 2010-01-01 to 2025-08-31
INFO:download_copernicus_data:Dataset cmems_mod_glo_bgc_my_0.25deg_P1D-m not downloaded, downloading...


Downloading cmems_mod_glo_bgc_my_0.25deg_P1D-m... with variables ['chl', 'no3', 'nppv', 'o2', 'po4', 'si']


INFO - 2025-10-16T18:01:10Z - Selected dataset version: "202406"
INFO:copernicusmarine:Selected dataset version: "202406"
INFO - 2025-10-16T18:01:10Z - Selected dataset part: "default"
INFO:copernicusmarine:Selected dataset part: "default"
INFO - 2025-10-16T18:01:12Z - Starting download. Please wait...
INFO:copernicusmarine:Starting download. Please wait...
100%|██████████| 2934/2934 [18:08<00:00,  2.69it/s]
INFO - 2025-10-16T18:19:21Z - Successfully downloaded to temporary_download_dir/cmems_mod_glo_bgc_my_0.25deg_P1D-m_lat61_68_lon-30_-10_depths_2010-01-01_2025-08-31.nc
INFO:copernicusmarine:Successfully downloaded to temporary_download_dir/cmems_mod_glo_bgc_my_0.25deg_P1D-m_lat61_68_lon-30_-10_depths_2010-01-01_2025-08-31.nc
INFO:download_copernicus_data:Merging files...


Merged dataset saved to temporary_download_dir/copernicus_data.nc
Checking first day to adjust target depths...
Adjusting 115 problematic points...
Processing variables to extract bottom layers...
Saving bottom features to datafiles/bio_features_my.nc


INFO:download_copernicus_data:Bottom features saved to datafiles/bio_features_my.nc
INFO:download_copernicus_data:Temporary directory temporary_download_dir deleted.




In [3]:
# Variables to request, keyed by the Copernicus dataset ID they are read from.
bio_myint_variables = ["chl", "no3", "nppv", "o2", "po4", "si"]
dataset_bio_myint = {"cmems_mod_glo_bgc_myint_0.25deg_P1D-m": bio_myint_variables}

# Run the project download helper with the shared config; the result file
# name is given by output_file_name.
download_copernicus_data(
    config,
    datasets=dataset_bio_myint,
    output_file_name='bio_features_myint.nc',
)

INFO:download_copernicus_data:Downloading data from 2010-01-01 to 2025-08-31
INFO:download_copernicus_data:Dataset cmems_mod_glo_bgc_myint_0.25deg_P1D-m not downloaded, downloading...


Downloading cmems_mod_glo_bgc_myint_0.25deg_P1D-m... with variables ['chl', 'no3', 'nppv', 'o2', 'po4', 'si']


INFO - 2025-10-16T18:30:24Z - Selected dataset version: "202406"
INFO:copernicusmarine:Selected dataset version: "202406"
INFO - 2025-10-16T18:30:24Z - Selected dataset part: "default"
INFO:copernicusmarine:Selected dataset part: "default"
INFO - 2025-10-16T18:30:26Z - Starting download. Please wait...
INFO:copernicusmarine:Starting download. Please wait...
100%|██████████| 390/390 [02:20<00:00,  2.77it/s]
INFO - 2025-10-16T18:32:47Z - Successfully downloaded to temporary_download_dir/cmems_mod_glo_bgc_myint_0.25deg_P1D-m_lat61_68_lon-30_-10_depths_2010-01-01_2025-08-31.nc
INFO:copernicusmarine:Successfully downloaded to temporary_download_dir/cmems_mod_glo_bgc_myint_0.25deg_P1D-m_lat61_68_lon-30_-10_depths_2010-01-01_2025-08-31.nc
INFO:download_copernicus_data:Merging files...


Merged dataset saved to temporary_download_dir/copernicus_data.nc
Checking first day to adjust target depths...
Adjusting 115 problematic points...
Processing variables to extract bottom layers...
Saving bottom features to datafiles/bio_features_myint.nc


INFO:download_copernicus_data:Bottom features saved to datafiles/bio_features_myint.nc
INFO:download_copernicus_data:Temporary directory temporary_download_dir deleted.


In [7]:
# NOTE(review): leftover scratch cell containing only commented-out code; it
# executes nothing. The path below ('../GEBCO_15_Oct_2025/...') differs from the
# 'rawdata/GEBCO_15_Oct_2025/...' path used when building the bathymetry file,
# so confirm which location is current before re-enabling, or delete this cell.
# bb = xr.open_dataset('../GEBCO_15_Oct_2025/gebco_2025_n68.0_s61.0_w-30.0_e-10.0.nc')
# print(bb)