In [114]:
using Pkg
Pkg.activate("../")
using HTTP
using JSON
using JSON3
using Dates
using OrderedCollections
include("./DIVAndFairEase.jl")
token = ENV["beaconAPItoken"];

[32m[1m  Activating[22m[39m project at `~/Projects/DIVAnd-FAIR-EASE`


In [59]:
datadir = "../data/"
footprintdir = "../Footprint"
mkpath.([datadir, footprintdir])

2-element Vector{String}:
 "../data"
 "../Footprint"

In [3]:
const beacon_services = OrderedDict(
    "Euro-Argo" => "https://beacon-argo.maris.nl",
    "CORA Profile" => "https://beacon-cora-pr.maris.nl",
    "CORA Timeseries" => "https://beacon-cora-ts.maris.nl",
    "EMODnet Chemistry" => "https://beacon-emod-chem.maris.nl",
    "World Ocean Database" => "https://beacon-wod.maris.nl",
    "SeaDataNet CDI TS" => "https://beacon-cdi-ts.maris.nl",
    "CMEMS BGC" => "https://beacon-cmems.maris.nl",
);

In [69]:
datasource = "CMEMS BGC"
domain = [12., 18., 43., 46.]
parameter1 = "TEMP"
if datasource == "World Ocean Database"
    parameter1 = "Temperature"
elseif datasource == "SeaDataNet CDI TS"
    parameter1 = "ITS-90 water temperature"
end
parameter2 = "TEMP"
datestart = Dates.Date(2010, 1, 1)
dateend = Dates.Date(2020, 1, 1)
minlon = domain[1]
maxlon = domain[2]
minlat = domain[3]
maxlat = domain[4]
mindepth = 0.
maxdepth = 10.
dateref = Dates.Date(1950, 1, 1) #Days since 1950
mintemporal = (datestart - dateref).value #Days since 1950
maxtemporal = (dateend - dateref).value #Days since 1950
regionname = "BlackSea"

@info("$(datestart) → $(dateend)")

[36m[1m[ [22m[39m[36m[1mInfo: [22m[39m2010-01-01 → 2020-01-01


In [61]:
beaconURL = beacon_services[datasource]
footprintURL = joinpath(beaconURL, "api/datasets/footprint")
datasource_name = replace(datasource, " " => "_")
footprintfile = joinpath(footprintdir, "Footprint_$(datasource_name).json")
@info("Footprint endpoint: $(footprintURL)")
@info("Footprint file: $(footprintfile)")

[36m[1m[ [22m[39m[36m[1mInfo: [22m[39mFootprint endpoint: https://beacon-cmems.maris.nl/api/datasets/footprint
[36m[1m[ [22m[39m[36m[1mInfo: [22m[39mFootprint file: ../Footprint/Footprint_CMEMS_BGC.json


In [116]:
DIVAndFairEase.varbyunits(footprintfile, ["degree_Celsius", "degrees_C"])

8-element Vector{Any}:
 "PHTX"
 "TEMP_DOXY"
 "TEMP_ADJUSTED_ERROR"
 "TEMP_ADJUSTED"
 "POTENTIAL_TEMP"
 "TEMP_ERROR"
 "TEMP"
 "TEMP_CNDC"

In [62]:
if isfile(footprintfile)
    @info("Footprint file already downloaded")
else
    @info("Writing Footprint file")
    open(footprintfile, "w") do io
        r = HTTP.request("GET", footprintURL, 
            ["Authorization" => "Bearer $(token)"],
            response_stream=io)
        @info(r.status)
    end
end

[36m[1m[ [22m[39m[36m[1mInfo: [22m[39mWriting Footprint file
[36m[1m[ [22m[39m[36m[1mInfo: [22m[39m200


In [63]:
# Note 1: the JSON file is 193M, just to get the list of variables?

In [64]:
data = JSON.parsefile(footprintfile);
attributes = data["unique_column_attributes"]
params = sort(collect(keys(attributes)));
parameter1 in params

true

varbyunits (generic function with 2 methods)

In [109]:
varlist = varbyunits(data)

8-element Vector{Any}:
 "PHTX"
 "TEMP_DOXY"
 "TEMP_ADJUSTED_ERROR"
 "TEMP_ADJUSTED"
 "POTENTIAL_TEMP"
 "TEMP_ERROR"
 "TEMP"
 "TEMP_CNDC"

In [70]:
query = DIVAndFairEase.prepare_query_new(datasource, parameter1, parameter2, datestart, dateend, 
    mindepth, maxdepth, minlon, maxlon, minlat, maxlat)

[36m[1m[ [22m[39m[36m[1mInfo: [22m[39mWorking with CMEMS BGC dataset


"{\"query_parameters\":[{\"column_name\":\"TEMP\",\"alias\":\"TEMP\"},{\"column_name\":\"TEMP\",\"column_attribute\":\"scale_factor\",\"alias\":\"scale_factor\"},{\"column_name\":\"JULD\",\"alias\":\"TIME\"},{\"column_name\":\"DEPH\",\"alias\":\"DEPTH\"},{\"column_name\":\"LONGITUDE\",\"alias\":\"LONGITUDE\"},{\"colum"[93m[1m ⋯ 33 bytes ⋯ [22m[39m"UDE\"}],\"filters\":[{\"for_query_parameter\":\"TIME\",\"min\":21915,\"max\":25567},{\"for_query_parameter\":\"DEPTH\",\"min\":0.0,\"max\":10.0},{\"for_query_parameter\":\"LONGITUDE\",\"min\":12.0,\"max\":18.0},{\"for_query_parameter\":\"LATITUDE\",\"min\":43.0,\"max\":46.0}],\"output\":{\"format\":\"netcdf\"}}"

In [71]:
# Note 2: cannot work with such a long list of parameters!!

In [72]:
filename = joinpath(datadir, "$(datasource_name)_$(replace(parameter1, " "=>"_"))_$(regionname)_$(Dates.format(datestart, "yyyymmdd"))-$(Dates.format(dateend, "yyyymmdd"))_$(Int(mindepth))-$(Int(maxdepth))m.nc");
filename

"../data/CMEMS_BGC_TEMP_BlackSea_20100101-20200101_0-10m.nc"

In [73]:
@info("Data will be written in file:\n$(filename)")

if isfile(filename)
    @info("File already downloaded")
    rm(filename)
end
@time open(filename, "w") do io
    r = HTTP.request("POST", joinpath(beaconURL, "api/query"), 
        ["Content-type"=> "application/json",
         "Authorization" => "Bearer $(token)"
        ],
        query, 
        response_stream=io);
    @info(r.status)
end

@info("NetCDF file size: $(round(filesize(filename)/1000^2, digits=1))M")

[36m[1m┌ [22m[39m[36m[1mInfo: [22m[39mData will be written in file:
[36m[1m└ [22m[39m../data/CMEMS_BGC_TEMP_BlackSea_20100101-20200101_0-10m.nc


  1.514356 seconds (24.29 k allocations: 1.267 MiB, 2 lock conflicts, 1.86% compilation time)


[36m[1m[ [22m[39m[36m[1mInfo: [22m[39m204
[36m[1m[ [22m[39m[36m[1mInfo: [22m[39mNetCDF file size: 0.0M


In [44]:
query

"{\"query_parameters\":[{\"column_name\":\"TEMP\",\"alias\":\"TEMP\"},{\"column_name\":\"JULD\",\"alias\":\"TIME\"},{\"column_name\":\"DEPH\",\"alias\":\"DEPTH\"},{\"column_name\":\"LONGITUDE\",\"alias\":\"LONGITUDE\"},{\"column_name\":\"LATITUDE\",\"alias\":\"LATITUDE\"}],\"filters\":[{\"for_query_parameter\":\"TIME\",\"min\":21915,\"max\":22645},{\"for_query_parameter\":\"DEPTH\",\"min\":0.0,\"max\":10.0},{\"for_query_parameter\":\"LONGITUDE\",\"min\":12.0,\"max\":18.0},{\"for_query_parameter\":\"LATITUDE\",\"min\":43.0,\"max\":46.0},{\"for_query_parameter\":\"TEMP\",\"min\":-2.0,\"max\":30.0}],\"output\":{\"format\":\"netcdf\"}}"