In [3]:
# Core numerical / plotting / table libraries.
import numpy as np
import matplotlib.pyplot as plt
import pandas as pd
import astropy.units as u
# Render figures inline, using the "retina" figure format.
%matplotlib inline
%config InlineBackend.figure_format = "retina"
# Global matplotlib defaults: saved-figure DPI, font size, serif font family.
from matplotlib import rcParams
rcParams['savefig.dpi'] = 550
rcParams['font.size'] = 20
plt.rc('font', family='serif')
import lsdb
from tqdm import tqdm
import dask
# Point Dask's temporary directory at the SSD scratch area (the worker
# "Local directory" entries in the client summary further down live under it).
dask.config.set({"temporary-directory" :'/epyc/ssd/users/atzanida/tmp'})
# NOTE(review): presumably selects Snappy compression for dataframe shuffles;
# confirm this key name is the one the installed Dask version reads.
dask.config.set({"dataframe.shuffle-compression": 'Snappy'})

<dask.config.set at 0x7f75b46503a0>

In [6]:
# Enable autoreload (mode 2) so edits to imported .py files are picked up
# without restarting the kernel.
%load_ext autoreload
%autoreload 2

# Custom functions and tools.
# The relative path below is added to the import search path first; the
# modules imported afterwards are presumably resolved from it — verify.
import sys
sys.path.insert(1, '../../../dipper')

import tools as my_tools
import dipper as dip_pipeline
import models as dip_models
from evaluate import evaluate as evaluate
from evaluate import evaluate_updated
from gpmcmc import model_gp
from evaluate import half_eval as half_eval

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload


In [7]:
import tape as tape_v

In [8]:
# Display the installed TAPE version so the run can be tied to a release.
tape_v.__version__

'0.3.5'

In [9]:
%%time
gaia = lsdb.read_hipscat("/data3/epyc/data3/hipscat/catalogs/gaia_dr3/gaia", 
                        columns=['ra', 'dec', 'parallax', 'parallax_over_error', 
                                'bp_rp', 'solution_id', 
                                'source_id', 
                                'pmra', 'pmra_error', 
                                'pmdec', 'pmdec_error', 
                                'parallax_error', 
                                'phot_g_mean_mag', 
                                'l', 'b', 'non_single_star', 
                                'classprob_dsc_combmod_galaxy', 
                                'classprob_dsc_combmod_star', 
                                 'in_qso_candidates'])

# load ZTF object table
ztf = lsdb.read_hipscat("/epyc/data3/hipscat/catalogs/ztf_axs/ztf_dr14")

# Load ZTF DR14 sources
ztf_sources = lsdb.read_hipscat("/epyc/data3/hipscat/catalogs/ztf_axs/ztf_source")
# change to ztf_zource

CPU times: user 42.5 s, sys: 4.88 s, total: 47.4 s
Wall time: 49.2 s


In [10]:
from distributed import Client

# Local Dask cluster: 20 workers, one thread each, 45GB memory limit per worker.
client = Client(
    memory_limit='45GB',
    threads_per_worker=1,
    n_workers=20,
)

In [11]:
# Display the cluster summary (dashboard address, worker count, memory).
client

0,1
Connection method: Cluster object,Cluster type: distributed.LocalCluster
Dashboard: http://127.0.0.1:8787/status,

0,1
Dashboard: http://127.0.0.1:8787/status,Workers: 20
Total threads: 20,Total memory: 838.19 GiB
Status: running,Using processes: True

0,1
Comm: tcp://127.0.0.1:35113,Workers: 20
Dashboard: http://127.0.0.1:8787/status,Total threads: 20
Started: Just now,Total memory: 838.19 GiB

0,1
Comm: tcp://127.0.0.1:45317,Total threads: 1
Dashboard: http://127.0.0.1:42390/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:44107,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-f4awuxts,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-f4awuxts

0,1
Comm: tcp://127.0.0.1:42883,Total threads: 1
Dashboard: http://127.0.0.1:44728/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:45644,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-3c0u0p_q,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-3c0u0p_q

0,1
Comm: tcp://127.0.0.1:44815,Total threads: 1
Dashboard: http://127.0.0.1:44968/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:37733,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-mub5gom0,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-mub5gom0

0,1
Comm: tcp://127.0.0.1:44664,Total threads: 1
Dashboard: http://127.0.0.1:44959/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:43541,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-1r53udrc,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-1r53udrc

0,1
Comm: tcp://127.0.0.1:41199,Total threads: 1
Dashboard: http://127.0.0.1:39957/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:39359,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-y0phvmu1,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-y0phvmu1

0,1
Comm: tcp://127.0.0.1:41282,Total threads: 1
Dashboard: http://127.0.0.1:37731/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:34467,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-xs2ya2bh,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-xs2ya2bh

0,1
Comm: tcp://127.0.0.1:39635,Total threads: 1
Dashboard: http://127.0.0.1:38335/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:33784,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-zbzfffjo,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-zbzfffjo

0,1
Comm: tcp://127.0.0.1:42289,Total threads: 1
Dashboard: http://127.0.0.1:35631/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:34111,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-vmdl54as,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-vmdl54as

0,1
Comm: tcp://127.0.0.1:43268,Total threads: 1
Dashboard: http://127.0.0.1:42416/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:43661,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-oovshad3,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-oovshad3

0,1
Comm: tcp://127.0.0.1:41110,Total threads: 1
Dashboard: http://127.0.0.1:37453/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:33357,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-62atptl0,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-62atptl0

0,1
Comm: tcp://127.0.0.1:44024,Total threads: 1
Dashboard: http://127.0.0.1:38515/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:36770,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-hw7z8wbd,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-hw7z8wbd

0,1
Comm: tcp://127.0.0.1:37151,Total threads: 1
Dashboard: http://127.0.0.1:39666/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:42084,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-_8mljlga,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-_8mljlga

0,1
Comm: tcp://127.0.0.1:33310,Total threads: 1
Dashboard: http://127.0.0.1:32892/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:36634,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-a6sp329v,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-a6sp329v

0,1
Comm: tcp://127.0.0.1:34565,Total threads: 1
Dashboard: http://127.0.0.1:41287/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:45375,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-ck2t3fz6,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-ck2t3fz6

0,1
Comm: tcp://127.0.0.1:36151,Total threads: 1
Dashboard: http://127.0.0.1:33977/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:45123,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-5_u2wsyd,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-5_u2wsyd

0,1
Comm: tcp://127.0.0.1:40779,Total threads: 1
Dashboard: http://127.0.0.1:39273/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:42994,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-aadyd0zx,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-aadyd0zx

0,1
Comm: tcp://127.0.0.1:44836,Total threads: 1
Dashboard: http://127.0.0.1:36279/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:33063,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-77of3mjj,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-77of3mjj

0,1
Comm: tcp://127.0.0.1:42858,Total threads: 1
Dashboard: http://127.0.0.1:42414/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:46397,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-pjizq9tg,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-pjizq9tg

0,1
Comm: tcp://127.0.0.1:36974,Total threads: 1
Dashboard: http://127.0.0.1:41245/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:42189,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-yr431_e1,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-yr431_e1

0,1
Comm: tcp://127.0.0.1:44259,Total threads: 1
Dashboard: http://127.0.0.1:44880/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:38663,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-xgqt7ul8,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-xgqt7ul8


In [23]:
import dask.dataframe as dd
from tape import Ensemble, ColumnMapper
# Turn off pandas' chained-assignment warning for this session.
pd.options.mode.chained_assignment = None

# Initialize an Ensemble, handing it the existing Dask client.
ens = Ensemble(client=client)

In [24]:
# Show the Dask client/cluster details as reported through the Ensemble.
ens.client_info()

0,1
Connection method: Cluster object,Cluster type: distributed.LocalCluster
Dashboard: http://127.0.0.1:8787/status,

0,1
Dashboard: http://127.0.0.1:8787/status,Workers: 20
Total threads: 20,Total memory: 838.19 GiB
Status: running,Using processes: True

0,1
Comm: tcp://127.0.0.1:35113,Workers: 20
Dashboard: http://127.0.0.1:8787/status,Total threads: 20
Started: 4 minutes ago,Total memory: 838.19 GiB

0,1
Comm: tcp://127.0.0.1:45317,Total threads: 1
Dashboard: http://127.0.0.1:42390/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:44107,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-f4awuxts,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-f4awuxts

0,1
Comm: tcp://127.0.0.1:42883,Total threads: 1
Dashboard: http://127.0.0.1:44728/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:45644,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-3c0u0p_q,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-3c0u0p_q

0,1
Comm: tcp://127.0.0.1:44815,Total threads: 1
Dashboard: http://127.0.0.1:44968/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:37733,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-mub5gom0,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-mub5gom0

0,1
Comm: tcp://127.0.0.1:44664,Total threads: 1
Dashboard: http://127.0.0.1:44959/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:43541,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-1r53udrc,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-1r53udrc

0,1
Comm: tcp://127.0.0.1:41199,Total threads: 1
Dashboard: http://127.0.0.1:39957/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:39359,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-y0phvmu1,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-y0phvmu1

0,1
Comm: tcp://127.0.0.1:41282,Total threads: 1
Dashboard: http://127.0.0.1:37731/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:34467,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-xs2ya2bh,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-xs2ya2bh

0,1
Comm: tcp://127.0.0.1:39635,Total threads: 1
Dashboard: http://127.0.0.1:38335/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:33784,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-zbzfffjo,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-zbzfffjo

0,1
Comm: tcp://127.0.0.1:42289,Total threads: 1
Dashboard: http://127.0.0.1:35631/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:34111,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-vmdl54as,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-vmdl54as

0,1
Comm: tcp://127.0.0.1:43268,Total threads: 1
Dashboard: http://127.0.0.1:42416/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:43661,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-oovshad3,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-oovshad3

0,1
Comm: tcp://127.0.0.1:41110,Total threads: 1
Dashboard: http://127.0.0.1:37453/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:33357,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-62atptl0,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-62atptl0

0,1
Comm: tcp://127.0.0.1:44024,Total threads: 1
Dashboard: http://127.0.0.1:38515/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:36770,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-hw7z8wbd,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-hw7z8wbd

0,1
Comm: tcp://127.0.0.1:37151,Total threads: 1
Dashboard: http://127.0.0.1:39666/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:42084,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-_8mljlga,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-_8mljlga

0,1
Comm: tcp://127.0.0.1:33310,Total threads: 1
Dashboard: http://127.0.0.1:32892/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:36634,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-a6sp329v,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-a6sp329v

0,1
Comm: tcp://127.0.0.1:34565,Total threads: 1
Dashboard: http://127.0.0.1:41287/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:45375,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-ck2t3fz6,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-ck2t3fz6

0,1
Comm: tcp://127.0.0.1:36151,Total threads: 1
Dashboard: http://127.0.0.1:33977/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:45123,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-5_u2wsyd,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-5_u2wsyd

0,1
Comm: tcp://127.0.0.1:40779,Total threads: 1
Dashboard: http://127.0.0.1:39273/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:42994,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-aadyd0zx,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-aadyd0zx

0,1
Comm: tcp://127.0.0.1:44836,Total threads: 1
Dashboard: http://127.0.0.1:36279/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:33063,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-77of3mjj,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-77of3mjj

0,1
Comm: tcp://127.0.0.1:42858,Total threads: 1
Dashboard: http://127.0.0.1:42414/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:46397,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-pjizq9tg,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-pjizq9tg

0,1
Comm: tcp://127.0.0.1:36974,Total threads: 1
Dashboard: http://127.0.0.1:41245/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:42189,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-yr431_e1,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-yr431_e1

0,1
Comm: tcp://127.0.0.1:44259,Total threads: 1
Dashboard: http://127.0.0.1:44880/status,Memory: 41.91 GiB
Nanny: tcp://127.0.0.1:38663,
Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-xgqt7ul8,Local directory: /epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-xgqt7ul8


In [14]:
%%time
# Open the HiPSCat catalog stored at this path; it is used further down as
# the left side of the source join and as the Ensemble's object table.
fgk_object = lsdb.read_hipscat("/nvme/users/atzanida/tmp/sample_final_starhorse_hips")

CPU times: user 62.1 ms, sys: 29.3 ms, total: 91.3 ms
Wall time: 75.1 ms


In [15]:
%%time
_sources = fgk_object.join(
    ztf_sources, left_on="ps1_objid_ztf_dr14", right_on="ps1_objid")

CPU times: user 1min 52s, sys: 11.6 s, total: 2min 4s
Wall time: 1min 59s


In [25]:
# ColumnMapper establishes which source-table columns map to time-series
# quantities. The joined source table carries the ZTF columns with a
# `_ztf_source` suffix (these are the names the `ens.batch` call in this
# notebook uses), so the mapper names the suffixed columns rather than the
# bare 'mjd' / 'mag' / 'magerr' / 'band'.
colmap = ColumnMapper(
        id_col='_hipscat_index',
        time_col='mjd_ztf_source',
        flux_col='mag_ztf_source',
        err_col='magerr_ztf_source',
        band_col='band_ztf_source',
      )

# Load the joined sources and the object sample into the Ensemble from their
# underlying Dask dataframes.
ens.from_dask_dataframe(
    source_frame=_sources._ddf,
    object_frame=fgk_object._ddf,
    column_mapper=colmap,
    sync_tables=False, # Avoid doing an initial sync
    sorted=True, # If the input data is already sorted by the chosen index
    sort=False,
)

<tape.ensemble.Ensemble at 0x7f7125029b10>

In [26]:
# feature evaluation 
column_names = ['Nphot',
    'biweight_scale',
    'frac_above_2_sigma', # in deviation
    'Ndips',
    'rate',
    'chi2dof',
    'skew', 
    'kurtosis',
    'mad',
    'stetson_i',
    'stetson_j',
    'stetson_k',
    'invNeumann',    
    'best_dip_power',
    'best_dip_time_loc',
    'best_dip_start',
    'best_dip_end',
    'best_dip_dt',
    'best_dip_ndet',
    'lc_score']

# Define DataFrame with loc and scale as meta
my_meta = pd.DataFrame(columns=column_names, dtype=float)

In [27]:
%%time
# apply calc_biweight function
calc_ = ens.batch(
    evaluate_updated,
    'mjd_ztf_source', 'mag_ztf_source', 
    'magerr_ztf_source', 'catflags_ztf_source',
    'band_ztf_source',
    meta=my_meta,
    use_map=True)

Using generated label, result_1, for a batch result.
CPU times: user 559 ms, sys: 11.9 ms, total: 571 ms
Wall time: 562 ms


In [28]:
%%time
# Join the batch result onto the object table, then push the joined table
# back into the ensemble.
ens.object.join(calc_).update_ensemble()

CPU times: user 19.8 s, sys: 1.11 s, total: 21 s
Wall time: 20.5 s


<tape.ensemble.Ensemble at 0x7f7125029b10>

In [None]:
%%time
# NOTE(review): the log output recorded under this cell shows Dask workers
# dying ("Worker process died unexpectedly") and closed worker streams while
# this compute ran; the cause is not visible from the notebook itself.
full_table = ens.object.compute() # full table compute



2024-04-08 14:19:52,459 - distributed.nanny - ERROR - Worker process died unexpectedly
2024-04-08 14:25:31,624 - distributed.nanny - ERROR - Worker process died unexpectedly
2024-04-08 14:34:26,671 - distributed.worker - ERROR - Worker stream died during communication: tcp://127.0.0.1:41282
Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 225, in read
    frames_nosplit_nbytes_bin = await stream.read_bytes(fmt_size)
tornado.iostream.StreamClosedError: Stream is closed

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2059, in gather_dep
    response = await get_data_from_worker(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2863, in get_data_f

2024-04-08 14:35:04,584 - distributed.worker - ERROR - failed during get data with tcp://127.0.0.1:41282 -> tcp://127.0.0.1:44836
Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 225, in read
    frames_nosplit_nbytes_bin = await stream.read_bytes(fmt_size)
tornado.iostream.StreamClosedError: Stream is closed

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 1783, in get_data
    response = await comm.read(deserializers=serializers)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 236, in read
    convert_stream_closed_error(self, e)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py"

2024-04-08 14:44:08,948 - distributed.nanny - ERROR - Worker process died unexpectedly
2024-04-08 14:45:19,377 - distributed.worker - ERROR - Worker stream died during communication: tcp://127.0.0.1:44259
Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 225, in read
    frames_nosplit_nbytes_bin = await stream.read_bytes(fmt_size)
tornado.iostream.StreamClosedError: Stream is closed

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2059, in gather_dep
    response = await get_data_from_worker(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2863, in get_data_from_worker
    response = await send_recv(
  File "/epyc/users/atzanida/anaconda3/envs/

2024-04-08 14:45:23,271 - distributed.worker - ERROR - Worker stream died during communication: tcp://127.0.0.1:44259
Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 225, in read
    frames_nosplit_nbytes_bin = await stream.read_bytes(fmt_size)
tornado.iostream.StreamClosedError: Stream is closed

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2059, in gather_dep
    response = await get_data_from_worker(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2863, in get_data_from_worker
    response = await send_recv(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/core.py", line 1154, in send_re

2024-04-08 14:45:44,276 - distributed.worker - ERROR - failed during get data with tcp://127.0.0.1:39635 -> tcp://127.0.0.1:44664
Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 225, in read
    frames_nosplit_nbytes_bin = await stream.read_bytes(fmt_size)
tornado.iostream.StreamClosedError: Stream is closed

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 1783, in get_data
    response = await comm.read(deserializers=serializers)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 236, in read
    convert_stream_closed_error(self, e)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py"

2024-04-08 14:53:47,127 - distributed.worker - ERROR - failed during get data with tcp://127.0.0.1:40779 -> tcp://127.0.0.1:44664
Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 297, in write
    raise StreamClosedError()
tornado.iostream.StreamClosedError: Stream is closed

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 1782, in get_data
    compressed = await comm.write(msg, serializers=serializers)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 307, in write
    convert_stream_closed_error(self, e)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 142, in convert_strea

2024-04-08 15:08:40,103 - distributed.worker - ERROR - failed during get data with tcp://127.0.0.1:36974 -> tcp://127.0.0.1:45317
Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 225, in read
    frames_nosplit_nbytes_bin = await stream.read_bytes(fmt_size)
tornado.iostream.StreamClosedError: Stream is closed

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 1783, in get_data
    response = await comm.read(deserializers=serializers)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 236, in read
    convert_stream_closed_error(self, e)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py"

2024-04-08 15:10:45,749 - distributed.nanny - ERROR - Worker process died unexpectedly
2024-04-08 15:13:45,683 - distributed.worker - ERROR - Worker stream died during communication: tcp://127.0.0.1:42858
Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 225, in read
    frames_nosplit_nbytes_bin = await stream.read_bytes(fmt_size)
tornado.iostream.StreamClosedError: Stream is closed

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2059, in gather_dep
    response = await get_data_from_worker(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2863, in get_data_from_worker
    response = await send_recv(
  File "/epyc/users/atzanida/anaconda3/envs/









































































































































































































































































































































































































































































































































In [30]:
%%time
# Preview the batch result: up to 250 rows drawn from 25 partitions.
calc_.head(250, npartitions=25)

CPU times: user 2min 38s, sys: 14.3 s, total: 2min 52s
Wall time: 3min 29s


Unnamed: 0_level_0,Nphot,biweight_scale,frac_above_2_sigma,Ndips,rate,chi2dof,skew,kurtosis,mad,stetson_i,stetson_j,stetson_k,invNeumann,best_dip_power,best_dip_time_loc,best_dip_start,best_dip_end,best_dip_dt,best_dip_ndet,lc_score
_hipscat_index,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1
12482248704,266.0,0.024350,0.022556,0.0,0.0,1.004714,-0.010657,2.038177,0.015356,7.684048,19.657562,0.759092,0.460740,,,,,,,
116614234112,267.0,0.013218,0.026217,0.0,0.0,1.009678,-0.166459,0.700273,0.007980,34.753979,24.324205,0.764841,0.648049,,,,,,,
751493447680,267.0,0.029874,0.026217,0.0,0.0,1.000762,0.299815,1.643119,0.019567,-5.506576,-10.058016,0.766275,0.566931,,,,,,,
1131799379968,267.0,0.013656,0.022472,0.0,0.0,1.010237,-0.466583,0.798873,0.008295,-1.530876,3.779188,0.779306,0.553092,,,,,,,
1702816120832,267.0,0.014682,0.007491,0.0,0.0,1.012217,-0.781895,1.713557,0.009386,12.276953,14.363346,0.745565,0.498455,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
121534249172992,270.0,0.013829,0.029630,0.0,0.0,1.003574,-0.561682,3.306758,0.007973,-14.357451,-10.085254,0.706450,0.484659,,,,,,,
171481615040512,268.0,0.014494,0.022388,0.0,0.0,1.001083,-0.272640,2.635552,0.009290,18.918163,13.820829,0.738790,0.390555,,,,,,,
102827275845632,270.0,0.024209,0.018519,0.0,0.0,1.007710,-0.031022,3.598324,0.015493,31.517174,26.901697,0.737921,0.519599,,,,,,,
212441862504448,270.0,0.014518,0.033333,0.0,0.0,1.000517,0.082009,1.123886,0.008527,21.903553,24.520405,0.743447,0.532657,,,,,,,


In [50]:
# previous working example as of April 4th 
%%time
calc_.head(1_000, npartitions=10)

CPU times: user 21 s, sys: 8.35 s, total: 29.4 s
Wall time: 33.2 s


Unnamed: 0_level_0,Nphot,biweight_scale,frac_above_2_sigma,Ndips,rate,chi2dof,skew,kurtosis,mad,stetson_i,stetson_j,stetson_k,invNeumann,best_dip_power,best_dip_time_loc,best_dip_start,best_dip_end,best_dip_dt,best_dip_ndet,lc_score
_hipscat_index,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1
213961119105024,269.0,0.015609,0.018587,0.0,0.000000,1.003911,0.289721,0.743892,0.010347,95.148529,64.077812,0.794315,0.692493,,,,,,,
572198062391296,268.0,0.014040,0.018657,0.0,0.000000,1.005126,-0.240236,0.024645,0.008913,23.233597,13.197321,0.779318,0.510219,,,,,,,
471620435050496,217.0,0.013079,0.027650,0.0,0.000000,1.003753,0.198554,2.049891,0.008455,43.642849,35.884365,0.743563,0.602470,,,,,,,
497394970001408,163.0,0.013869,0.000000,0.0,0.000000,1.012015,-4.228230,34.592444,0.008417,111.317398,54.295994,0.606832,0.501397,,,,,,,
778339828629504,216.0,0.012959,0.032407,0.0,0.000000,1.000068,-0.114340,0.443450,0.008190,19.119101,20.018957,0.783205,0.582066,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
30574627545677824,247.0,0.012867,0.032389,0.0,0.000000,1.014547,0.613241,1.640722,0.007657,66.591125,40.524063,0.746860,0.775567,,,,,,,
30828687658057728,248.0,0.012120,0.016129,0.0,0.000000,1.004207,-0.329987,0.652126,0.007340,27.404694,21.355305,0.769521,0.558814,,,,,,,
31221926558957568,250.0,0.014558,0.012000,1.0,0.000662,1.000003,0.657509,4.212327,0.009738,36.517708,24.180901,0.755607,0.422658,,,,,,,
31352022284369920,247.0,0.015255,0.048583,0.0,0.000000,1.027639,0.624323,0.141673,0.009372,87.349014,46.941055,0.784883,0.568002,,,,,,,


In [None]:
%%time
# Same join-and-update step as the earlier cell in this notebook, kept as a
# record of the earlier run.
ens.object.join(calc_).update_ensemble()

# previous working example as of April 4th

In [None]:
%%time
# NOTE(review): the log recorded under this cell (dated 2024-04-05) also shows
# worker communication errors during the compute — confirm whether this run
# actually completed.
full_table = ens.object.compute() # full table compute
# previous working example as of April 4th

2024-04-05 17:17:42,886 - distributed.worker - ERROR - Failed to communicate with scheduler during heartbeat.
Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 225, in read
    frames_nosplit_nbytes_bin = await stream.read_bytes(fmt_size)
tornado.iostream.StreamClosedError: Stream is closed

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 1252, in heartbeat
    response = await retry_operation(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/utils_comm.py", line 455, in retry_operation
    return await retry(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/utils_comm.py", line 434, in retry
    return await cor

2024-04-05 17:46:45,719 - distributed.worker - ERROR - Worker stream died during communication: tcp://127.0.0.1:45341
Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/tornado/iostream.py", line 861, in _read_to_buffer
    bytes_read = self.read_from_fd(buf)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/tornado/iostream.py", line 1116, in read_from_fd
    return self.socket.recv_into(buf, len(buf))
ConnectionResetError: [Errno 104] Connection reset by peer

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2059, in gather_dep
    response = await get_data_from_worker(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2863, in get_data_fro

2024-04-05 17:46:46,457 - distributed.worker - ERROR - Worker stream died during communication: tcp://127.0.0.1:45341
Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 230, in read
    buffer = await read_bytes_rw(stream, buffer_nbytes)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 366, in read_bytes_rw
    actual = await stream.read_into(chunk)  # type: ignore[arg-type]
tornado.iostream.StreamClosedError: Stream is closed

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2059, in gather_dep
    response = await get_data_from_worker(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py"

2024-04-05 17:48:39,548 - distributed.worker - ERROR - Worker stream died during communication: tcp://127.0.0.1:36932
Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 230, in read
    buffer = await read_bytes_rw(stream, buffer_nbytes)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 366, in read_bytes_rw
    actual = await stream.read_into(chunk)  # type: ignore[arg-type]
tornado.iostream.StreamClosedError: Stream is closed

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2059, in gather_dep
    response = await get_data_from_worker(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py"

2024-04-05 17:49:47,740 - distributed.worker - ERROR - Worker stream died during communication: tcp://127.0.0.1:36932
Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 546, in connect
    stream = await self.client.connect(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/tornado/tcpclient.py", line 279, in connect
    af, addr, stream = await connector.start(connect_timeout=timeout)
asyncio.exceptions.CancelledError

During handling of the above exception, another exception occurred:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/asyncio/tasks.py", line 456, in wait_for
    return fut.result()
asyncio.exceptions.CancelledError

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_dem



2024-04-05 18:02:09,872 - distributed.worker - ERROR - Worker stream died during communication: tcp://127.0.0.1:39323
Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 230, in read
    buffer = await read_bytes_rw(stream, buffer_nbytes)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 366, in read_bytes_rw
    actual = await stream.read_into(chunk)  # type: ignore[arg-type]
tornado.iostream.StreamClosedError: Stream is closed

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2059, in gather_dep
    response = await get_data_from_worker(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py"

2024-04-05 18:02:10,590 - distributed.worker - ERROR - Worker stream died during communication: tcp://127.0.0.1:39323
Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 230, in read
    buffer = await read_bytes_rw(stream, buffer_nbytes)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 366, in read_bytes_rw
    actual = await stream.read_into(chunk)  # type: ignore[arg-type]
tornado.iostream.StreamClosedError: Stream is closed

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2059, in gather_dep
    response = await get_data_from_worker(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py"

2024-04-05 18:02:32,526 - distributed.worker - ERROR - Worker stream died during communication: tcp://127.0.0.1:33087
Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 230, in read
    buffer = await read_bytes_rw(stream, buffer_nbytes)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 366, in read_bytes_rw
    actual = await stream.read_into(chunk)  # type: ignore[arg-type]
tornado.iostream.StreamClosedError: Stream is closed

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2059, in gather_dep
    response = await get_data_from_worker(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py"

2024-04-05 18:02:34,589 - distributed.diskutils - ERROR - Failed to remove '/epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-vd0xx98p/storage' (failed in <built-in function rmdir>): [Errno 2] No such file or directory: 'storage'
2024-04-05 18:02:34,589 - distributed.diskutils - ERROR - Failed to remove '/epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-vd0xx98p' (failed in <built-in function rmdir>): [Errno 2] No such file or directory: '/epyc/ssd/users/atzanida/tmp/dask-scratch-space/worker-vd0xx98p'
  next(self.gen)
2024-04-05 18:02:38,288 - distributed.worker - ERROR - Worker stream died during communication: tcp://127.0.0.1:39323
Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 227, in read
    frames_nosplit = await read_bytes_rw(stream, frames_nosplit_nbytes)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp

2024-04-05 18:02:47,260 - distributed.worker - ERROR - Worker stream died during communication: tcp://127.0.0.1:39323
ConnectionRefusedError: [Errno 111] Connection refused

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/core.py", line 342, in connect
    comm = await wait_for(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/utils.py", line 1940, in wait_for
    return await asyncio.wait_for(fut, timeout)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/asyncio/tasks.py", line 445, in wait_for
    return fut.result()
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 559, in connect
    convert_stream_closed_error(self, e)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/li

2024-04-05 18:05:56,957 - distributed.worker - ERROR - Worker stream died during communication: tcp://127.0.0.1:33083
Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 230, in read
    buffer = await read_bytes_rw(stream, buffer_nbytes)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 366, in read_bytes_rw
    actual = await stream.read_into(chunk)  # type: ignore[arg-type]
tornado.iostream.StreamClosedError: Stream is closed

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2059, in gather_dep
    response = await get_data_from_worker(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py"

2024-04-05 18:06:00,794 - distributed.worker - ERROR - Worker stream died during communication: tcp://127.0.0.1:33083
Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 227, in read
    frames_nosplit = await read_bytes_rw(stream, frames_nosplit_nbytes)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 366, in read_bytes_rw
    actual = await stream.read_into(chunk)  # type: ignore[arg-type]
tornado.iostream.StreamClosedError: Stream is closed

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2059, in gather_dep
    response = await get_data_from_worker(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distri

2024-04-05 18:08:42,079 - distributed.worker - ERROR - Worker stream died during communication: tcp://127.0.0.1:34567
Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/tornado/iostream.py", line 861, in _read_to_buffer
    bytes_read = self.read_from_fd(buf)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/tornado/iostream.py", line 1116, in read_from_fd
    return self.socket.recv_into(buf, len(buf))
ConnectionResetError: [Errno 104] Connection reset by peer

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2059, in gather_dep
    response = await get_data_from_worker(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2863, in get_data_fro

2024-04-05 18:08:42,279 - distributed.worker - ERROR - Worker stream died during communication: tcp://127.0.0.1:34567
Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 227, in read
    frames_nosplit = await read_bytes_rw(stream, frames_nosplit_nbytes)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 366, in read_bytes_rw
    actual = await stream.read_into(chunk)  # type: ignore[arg-type]
tornado.iostream.StreamClosedError: Stream is closed

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2059, in gather_dep
    response = await get_data_from_worker(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distri

2024-04-05 18:11:06,379 - distributed.worker - ERROR - Worker stream died during communication: tcp://127.0.0.1:40864
Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/tornado/iostream.py", line 861, in _read_to_buffer
    bytes_read = self.read_from_fd(buf)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/tornado/iostream.py", line 1116, in read_from_fd
    return self.socket.recv_into(buf, len(buf))
ConnectionResetError: [Errno 104] Connection reset by peer

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2059, in gather_dep
    response = await get_data_from_worker(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2863, in get_data_fro

2024-04-05 18:11:06,898 - distributed.worker - ERROR - Worker stream died during communication: tcp://127.0.0.1:40864
Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 230, in read
    buffer = await read_bytes_rw(stream, buffer_nbytes)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 366, in read_bytes_rw
    actual = await stream.read_into(chunk)  # type: ignore[arg-type]
tornado.iostream.StreamClosedError: Stream is closed

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2059, in gather_dep
    response = await get_data_from_worker(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py"

2024-04-05 18:11:49,107 - distributed.worker - ERROR - Worker stream died during communication: tcp://127.0.0.1:40864
ConnectionRefusedError: [Errno 111] Connection refused

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/core.py", line 342, in connect
    comm = await wait_for(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/utils.py", line 1940, in wait_for
    return await asyncio.wait_for(fut, timeout)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/asyncio/tasks.py", line 445, in wait_for
    return fut.result()
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 559, in connect
    convert_stream_closed_error(self, e)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/li

2024-04-05 18:13:20,158 - distributed.worker - ERROR - Worker stream died during communication: tcp://127.0.0.1:44539
Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 230, in read
    buffer = await read_bytes_rw(stream, buffer_nbytes)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 366, in read_bytes_rw
    actual = await stream.read_into(chunk)  # type: ignore[arg-type]
tornado.iostream.StreamClosedError: Stream is closed

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2059, in gather_dep
    response = await get_data_from_worker(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py"

2024-04-05 18:13:21,084 - distributed.worker - ERROR - Worker stream died during communication: tcp://127.0.0.1:44539
Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 227, in read
    frames_nosplit = await read_bytes_rw(stream, frames_nosplit_nbytes)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 366, in read_bytes_rw
    actual = await stream.read_into(chunk)  # type: ignore[arg-type]
tornado.iostream.StreamClosedError: Stream is closed

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2059, in gather_dep
    response = await get_data_from_worker(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distri

2024-04-05 18:13:34,956 - distributed.worker - ERROR - Worker stream died during communication: tcp://127.0.0.1:44539
Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 297, in write
    raise StreamClosedError()
tornado.iostream.StreamClosedError: Stream is closed

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2059, in gather_dep
    response = await get_data_from_worker(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2863, in get_data_from_worker
    response = await send_recv(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/core.py", line 1152, in send_recv
    await comm.write(msg, serial



2024-04-05 18:26:04,055 - distributed.worker - ERROR - Worker stream died during communication: tcp://127.0.0.1:37917
Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 230, in read
    buffer = await read_bytes_rw(stream, buffer_nbytes)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 366, in read_bytes_rw
    actual = await stream.read_into(chunk)  # type: ignore[arg-type]
tornado.iostream.StreamClosedError: Stream is closed

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2059, in gather_dep
    response = await get_data_from_worker(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py"

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 230, in read
    buffer = await read_bytes_rw(stream, buffer_nbytes)
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/comm/tcp.py", line 366, in read_bytes_rw
    actual = await stream.read_into(chunk)  # type: ignore[arg-type]
tornado.iostream.StreamClosedError: Stream is closed

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2059, in gather_dep
    response = await get_data_from_worker(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_demo_true/lib/python3.10/site-packages/distributed/worker.py", line 2863, in get_data_from_worker
    response = await send_recv(
  File "/epyc/users/atzanida/anaconda3/envs/lsdb_

