In [1]:
# Enable IPython's autoreload extension in mode 2, so that imported modules are
# reloaded before each cell executes and edits to the thor package are picked up
# without restarting the kernel.
%load_ext autoreload
%autoreload 2
import time
import multiprocessing
from pathlib import Path
import shutil
import numpy as np
import thor.data as data
import thor.data.dispatch as dispatch
import thor.grid as grid
import thor.option as option
import thor.track as track
import thor.analyze as analyze
import thor.parallel as parallel
import thor.visualize as visualize
import thor.log as log

# File name of this notebook.
# NOTE(review): not referenced by any cell visible here - confirm it is still needed.
notebook_name = "gridrad_demo.ipynb"


## You are using the Python ARM Radar Toolkit (Py-ART), an open source
## library for working with weather radar data. Py-ART is partly
## supported by the U.S. Department of Energy as part of the Atmospheric
## Radiation Measurement (ARM) Climate Research Facility, an Office of
## Science user facility.
##
## If you use this software to prepare a publication, please cite:
##
##     JJ Helmus and SM Collis, JORS 2016, doi: 10.5334/jors.119



In [2]:
# Root directory below which all outputs of this notebook are saved
base_local = Path.home() / "THOR_output"

# Choose the event to process: index 0 picks the first of the event
# directories returned for the selected year.
year = 2010
event_directories = data.gridrad.get_event_directories(
    year, base_local=base_local
)
event_directory = event_directories[0]
start, end, event_start = data.gridrad.get_event_times(event_directory)
# To work on a shorter window instead, override the event times here, e.g.
# start = "2010-01-21T00:30:00"
# end = "2010-01-21T01:30:00"

# Break the start-end window into time intervals; each interval is later
# submitted as its own task to the process pool.
period = parallel.get_period(start, end)
intervals = parallel.get_time_intervals(start, end, period=period)

# Output directory for this event, named after the event start date with the
# dashes stripped.
output_parent = base_local / f"runs/gridrad_severe/gridrad_{event_start.replace('-', '')}"

# Last expression of the cell: display the event start date as a sanity check
event_start

'2010-01-20'

In [3]:
# To discard the output of a previous run first, uncomment both lines below:
# if output_parent.exists():
#     shutil.rmtree(output_parent)
options_directory = output_parent / "options"

# --- Dataset options -------------------------------------------------------
# One GridRad Severe dataset and two ERA5 datasets, all sharing the event's
# start and end times.
times_dict = {"start": start, "end": end}
gridrad_dict = {"event_start": event_start}
gridrad_options = data.option.GridRadSevereOptions(**times_dict, **gridrad_dict)

era5_dict = {"latitude_range": [27, 39], "longitude_range": [-102, -89]}
era5_pl_options = data.option.ERA5Options(**times_dict, **era5_dict)
# The second ERA5 dataset reuses the same ranges with data_format switched to
# "single-levels"; era5_dict is modified in place and keeps that key afterwards.
era5_dict["data_format"] = "single-levels"
era5_sl_options = data.option.ERA5Options(**times_dict, **era5_dict)

data_options = data.option.DataOptions(
    datasets=[
        gridrad_options,
        era5_pl_options,
        era5_sl_options,
    ]
)
data_options.to_yaml(options_directory / "data.yml")
# Rebind gridrad_options to the instance held by data_options
gridrad_options = data_options.dataset_by_name("gridrad")

# --- Grid options ----------------------------------------------------------
# Create, check and save the grid options
grid_options = grid.create_options(
    name="geographic",
    regrid=False,
    altitude_spacing=None,
    geographic_spacing=None,
)
grid.check_options(grid_options)
grid.save_grid_options(grid_options, options_directory=options_directory)

# --- Track options ---------------------------------------------------------
# Start from the defaults for gridrad, then adjust the tracking settings of the
# first object at hierarchy level 1.
track_options = option.default_track_options(dataset="gridrad")
tracking_settings = track_options.levels[1].objects[0].tracking
tracking_settings.global_flow_margin = 70
# NOTE(review): the remark that used to sit here said that, because the grids
# are so large, a distinct global flow box is now used for each object - yet
# the flag is set to False. Confirm which of the two is intended.
tracking_settings.unique_global_flow = False
# If testing, remove the profile and tag attributes
# track_options.levels[1].objects[0].attributes["mcs"].pop("profile")
# track_options.levels[1].objects[0].attributes["mcs"].pop("tag")
track_options.to_yaml(options_directory / "track.yml")

# --- Visualize options -----------------------------------------------------
# Runtime figures are switched off (None). To enable them, use instead:
# visualize_options = {
#     obj: visualize.option.runtime_options(obj, save=True, style="presentation")
#     for obj in ["mcs"]
# }
visualize_options = None

2024-11-05 17:56:56,649 - thor.data.option - INFO - Generating era5 filepaths.
2024-11-05 17:56:56,652 - thor.data.option - INFO - Generating era5 filepaths.
2024-11-05 17:56:56,654 - thor.data.option - INFO - Generating era5 filepaths.




In [6]:
# Load the memory_profiler IPython extension, which provides memory-profiling
# magics such as %memit.
# NOTE(review): no cell visible here uses those magics - if the extension is
# still wanted, consider loading it in the first cell with the other setup.
%load_ext memory_profiler

In [9]:
# Scratch arithmetic: 760 divided by 24.
# NOTE(review): what the two numbers stand for is not stated and the result is
# not used by any visible cell - label it or remove the cell.
760/24

31.666666666666668

In [7]:
# Track the whole event with a single direct call, writing straight to
# output_parent (the pool-based cell further down submits one task per interval
# instead).
# NOTE(review): the saved output of this cell ends in a KeyboardInterrupt, so
# the run shown was stopped by hand.
times = data.utils.generate_times(data_options.dataset_by_name("gridrad"))
# Copies of the option objects are passed rather than the originals
args = [
    times,
    data_options.model_copy(),
    grid_options.copy(),
    track_options.model_copy(),
    visualize_options,
]
track.simultaneous_track(*args, output_directory=output_parent)

2024-11-04 17:33:05,142 - thor.track - INFO - Beginning thor run. Saving output to /home/ewan/THOR_output/runs/gridrad_severe/gridrad_20100120.
2024-11-04 17:33:05,144 - thor.track - INFO - Beginning simultaneous tracking.
2024-11-04 17:33:12,309 - thor.track - INFO - Processing 2010-01-20T18:00:00.
2024-11-04 17:33:12,312 - thor.data.gridrad - INFO - Updating gridrad dataset for 2010-01-20T18:00:00.
2024-11-04 17:33:12,313 - thor.data.gridrad - INFO - Converting gridrad data from nexrad_3d_v4_2_20100120T180000Z.nc
2024-11-04 17:33:13,536 - thor.track - INFO - Processing hierarchy level 0.
2024-11-04 17:33:13,537 - thor.track - INFO - Tracking convective.
2024-11-04 17:33:29,496 - thor.track - INFO - Tracking middle.
2024-11-04 17:33:29,562 - thor.track - INFO - Tracking anvil.
2024-11-04 17:33:29,614 - thor.track - INFO - Processing hierarchy level 1.
2024-11-04 17:33:29,617 - thor.track - INFO - Tracking mcs.
2024-11-04 17:33:29,807 - thor.match.match - INFO - Matching mcs objects.
2

KeyboardInterrupt: 

In [4]:
# Number of worker processes. Fixed at 4 here; the alternatives below scale
# with the machine but need `import os`, which the imports cell does not do.
# num_processes = int(0.75 * os.cpu_count())
# num_processes = os.cpu_count()
num_processes = 4
kwargs = {"initializer": parallel.initialize_process, "processes": num_processes}

# Workers are created with the "spawn" start method
spawn_context = multiprocessing.get_context("spawn")
with log.logging_listener(), spawn_context.Pool(**kwargs) as pool:
    results = []
    for i, time_interval in enumerate(intervals):
        # One-second pause before each submission.
        # NOTE(review): presumably staggers worker start-up - confirm and document.
        time.sleep(1)
        # Every task receives its own copies of the option objects
        args = (
            i,
            time_interval,
            data_options.model_copy(),
            grid_options.copy(),
            track_options.model_copy(),
            visualize_options,
            output_parent,
            "gridrad",
        )
        results.append(pool.apply_async(parallel.track_interval, args))
    # Stop accepting tasks, wait for all workers to finish, then inspect the
    # collected async results.
    pool.close()
    pool.join()
    parallel.check_results(results)


## You are using the Python ARM Radar Toolkit (Py-ART), an open source
## library for working with weather radar data. Py-ART is partly
## supported by the U.S. Department of Energy as part of the Atmospheric
## Radiation Measurement (ARM) Climate Research Facility, an Office of
## Science user facility.
##
## If you use this software to prepare a publication, please cite:
##
##     JJ Helmus and SM Collis, JORS 2016, doi: 10.5334/jors.119


## You are using the Python ARM Radar Toolkit (Py-ART), an open source
## library for working with weather radar data. Py-ART is partly
## supported by the U.S. Department of Energy as part of the Atmospheric
## Radiation Measurement (ARM) Climate Research Facility, an Office of
## Science user facility.
##
## If you use this software to prepare a publication, please cite:
##
##     JJ Helmus and SM Collis, JORS 2016, doi: 10.5334/jors.119


## You are using the Python ARM Radar Toolkit (Py-ART), an open source
## library for working with weather 

2024-11-01 20:47:28,306 - thor.track - INFO - Beginning thor run. Saving output to /home/ewan/THOR_output/runs/dev/gridrad_20100120/interval_0.
2024-11-01 20:47:28,307 - thor.track - INFO - Beginning simultaneous tracking.
2024-11-01 20:47:28,357 - thor.track - INFO - Beginning thor run. Saving output to /home/ewan/THOR_output/runs/dev/gridrad_20100120/interval_1.
2024-11-01 20:47:28,358 - thor.track - INFO - Beginning simultaneous tracking.
2024-11-01 20:47:28,405 - thor.track - INFO - Beginning thor run. Saving output to /home/ewan/THOR_output/runs/dev/gridrad_20100120/interval_2.
2024-11-01 20:47:28,406 - thor.track - INFO - Beginning simultaneous tracking.
2024-11-01 20:47:28,419 - thor.track - INFO - Processing 2010-01-20T18:00:00.
2024-11-01 20:47:28,420 - thor.data.gridrad - INFO - Updating gridrad dataset for 2010-01-20T18:00:00.
2024-11-01 20:47:28,420 - thor.data.gridrad - INFO - Converting gridrad data from nexrad_3d_v4_2_20100120T180000Z.nc
2024-11-01 20:47:28,484 - thor.tr

In [5]:
# Stitch the outputs of the individual interval runs under output_parent
# together; the saved log reports record, attribute and mask files being stitched.
# NOTE(review): cleanup=False presumably leaves the per-interval output in
# place afterwards - confirm.
parallel.stitch_run(output_parent, intervals, cleanup=False)

2024-11-01 20:51:44,913 - thor.parallel - INFO - Stitching all attribute, mask and record files.
2024-11-01 20:51:44,941 - thor.data.option - INFO - Assigning default era5 pressure levels.
2024-11-01 20:51:53,701 - thor.parallel - INFO - Stitching record files.
2024-11-01 20:51:53,787 - thor.parallel - INFO - Stitching attribute files.
2024-11-01 20:51:56,677 - thor.parallel - INFO - Stitching mask files.


In [6]:
# Post-process the MCS output saved under output_parent.
analysis_options = analyze.mcs.analysis_options()
# NOTE(review): the effect of profile_dataset=None is not visible here - confirm.
analyze.mcs.process_velocities(output_parent, profile_dataset=None)
# Last expression of the cell, so its return value is displayed: in the saved
# output this is a table of boolean flags indexed by time and universal_id.
analyze.mcs.quality_control(output_parent, analysis_options)
# Classification step, currently disabled:
# analyze.mcs.classify_all(output_parent)

2024-11-01 20:52:04,602 - thor.data.option - INFO - Assigning default era5 pressure levels.
2024-11-01 20:52:04,771 - thor.data.option - INFO - Assigning default era5 pressure levels.


Unnamed: 0_level_0,Unnamed: 1_level_0,convective_contained,anvil_contained,velocity,area,offset,major_axis,axis_ratio,duration,parents
time,universal_id,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1
2010-01-20 18:00:00,1,True,False,True,True,True,True,True,True,False
2010-01-20 18:00:00,2,True,False,True,True,True,True,False,False,False
2010-01-20 18:10:00,1,True,False,True,True,True,True,True,True,False
2010-01-20 18:10:00,2,False,False,True,True,False,True,False,False,False
2010-01-20 18:20:00,1,True,False,True,True,True,True,False,True,False
...,...,...,...,...,...,...,...,...,...,...
2010-01-21 03:10:00,15,True,True,True,True,True,True,True,True,True
2010-01-21 03:10:00,31,True,True,True,True,True,True,False,True,False
2010-01-21 03:10:00,36,False,False,True,True,False,True,True,True,True
2010-01-21 03:20:00,15,True,True,True,True,True,True,True,True,True


In [5]:
# Figure set for this event, named after the event start date without dashes
figure_name = f"mcs_gridrad_{event_start.replace('-', '')}"
figure_options = visualize.option.horizontal_attribute_options(
    figure_name,
    style="presentation",
    attributes=["velocity", "offset"],
)

# The event window as numpy datetimes
start_time, end_time = np.datetime64(start), np.datetime64(end)
args = [output_parent, start_time, end_time, figure_options]
# Figures are generated without parallelism (parallel_figure is False).
# NOTE(review): the units of dt are not visible here, and num_processes
# presumably only matters when parallel_figure is True - confirm both.
args_dict = {
    "parallel_figure": False,
    "dt": 7200,
    "by_date": False,
    "num_processes": 4,
}
visualize.attribute.mcs_series(*args, **args_dict)

2024-11-05 18:01:44,413 - thor.visualize.attribute - INFO - Visualizing MCS at time 2010-01-20T18:00:00.000000000.
2024-11-05 18:01:47,243 - thor.visualize.attribute - INFO - Saving mcs_gridrad_20100120 figure for 2010-01-20T18:00:00.000000000.
2024-11-05 18:01:49,038 - thor.visualize.attribute - INFO - Visualizing MCS at time 2010-01-20T18:10:00.000000000.
2024-11-05 18:01:51,636 - thor.visualize.attribute - INFO - Saving mcs_gridrad_20100120 figure for 2010-01-20T18:10:00.000000000.
2024-11-05 18:01:53,356 - thor.visualize.attribute - INFO - Visualizing MCS at time 2010-01-20T18:20:00.000000000.
2024-11-05 18:01:56,097 - thor.visualize.attribute - INFO - Saving mcs_gridrad_20100120 figure for 2010-01-20T18:20:00.000000000.
2024-11-05 18:01:58,031 - thor.visualize.attribute - INFO - Visualizing MCS at time 2010-01-20T18:30:00.000000000.
2024-11-05 18:02:01,137 - thor.visualize.attribute - INFO - Saving mcs_gridrad_20100120 figure for 2010-01-20T18:30:00.000000000.
2024-11-05 18:02:02,