# Imports

In [None]:
import numpy as np
import pandas as pd
import zarr
import dask
from dask import delayed
import distributed
from distributed import Client, LocalCluster, progress
from dask_jobqueue import SLURMCluster
import streamz
import holoviews as hv
from holoviews.streams import Stream, param
from holoviews.operation.datashader import regrid
from bokeh.models.tools import HoverTool
import matplotlib.pyplot as plt
import qgrid
import ipywidgets as widgets
from tqdm import tnrange, tqdm, tqdm_notebook
import warnings
from functools import partial
from cytoolz import *
from operator import getitem
import nd2reader
from importlib import reload
import traceback
import hvplot.pandas
import param
import parambokeh
from traitlets import All
import cachetools
from collections import namedtuple, defaultdict
from collections.abc import Mapping, Sequence
import skimage.morphology
import scipy
from glob import glob

IDX = pd.IndexSlice

In [None]:
%load_ext autoreload
%autoreload 2

In [None]:
# from processing import *
# from trench_detection import *
# from trench_segmentation import *
# from trench_segmentation.watershed import *
# from util import *
# from ui import *
import common, trench_detection, util
import ui, diagnostics, metadata
import workflow, image, geometry
import trench_detection.hough, trench_detection.core
import trench_segmentation.watershed

In [None]:
%load_ext line_profiler
hv.extension("bokeh")
%matplotlib inline
tqdm.monitor_interval = 0

# Restore data

In [None]:
%store -r trench_points trench_diag

# Config

In [None]:
# Start a dask-jobqueue SLURM cluster and attach a distributed client to it.
# Jobs are requested on the "short" queue with a 30-minute walltime, 8GB of
# memory, cores=1 and processes=1. Each job exports PYTHONPATH, presumably so
# that the project modules are importable on the workers.
cluster = SLURMCluster(
    queue="short",
    walltime="00:30:00",
    # job_extra=['-p transfer'],
    # job_extra=['--cores-per-socket=8'],
    # interface='ib0',
    memory="8GB",
    local_directory="/tmp",
    cores=1,
    processes=1,
    # diagnostics_port=('127.0.0.1', 8787),
    env_extra=['export PYTHONPATH="/home/jqs1/projects/matriarch"'],
)
client = Client(cluster)

In [None]:
# Set the layout width of one nested child of the cluster widget to 200px, then
# display the cluster.
# NOTE(review): this indexes into the private `_widget()` tree by position, so it
# presumably breaks if the widget layout changes -- confirm after upgrades.
cluster._widget().children[1].children[1].children[0].children[0].layout.width = "200px"
cluster

In [None]:
# Stop all jobs currently listed in `cluster.running_jobs`.
cluster.stop_jobs(cluster.running_jobs.keys())

In [None]:
# client = Client()

# Loading data

In [None]:
# nd2_filenames = ['/n/scratch2/jqs1/fidelity/all/180405_txnerr.nd2', '/n/scratch2/jqs1/fidelity/all/180405_txnerr001.nd2']
# nd2_filenames = ['/n/scratch2/jqs1/fidelity/all/180405_txnerr002.nd2']#, '/n/scratch2/jqs1/fidelity/all/TrErr002_Exp.nd2']
# nd2_filenames = ['/n/scratch2/jqs1/fidelity/all/TrErr002_Exp.nd2']
# nd2_filenames = ['/n/scratch2/jqs1/fidelity/all/180405_txnerr.nd2', '/n/scratch2/jqs1/fidelity/all/180405_txnerr001.nd2',
#                 '/n/scratch2/jqs1/fidelity/all/180405_txnerr002.nd2', '/n/scratch2/jqs1/fidelity/all/TrErr002_Exp.nd2']
# nd2_filenames = ['/home/jqs1/scratch/fidelity/180518_triplegrowthcurve/PHASE_GC001.nd2', '/home/jqs1/scratch/fidelity/180518_triplegrowthcurve/PHASE_GC002.nd2']
# Build the input list from every file matching the two patterns below.
nd2_filenames = glob("/n/scratch2/jqs1/fidelity/all/180405_*.nd2") + glob(
    "/n/scratch2/jqs1/fidelity/all/TrErr*.nd2"
)

In [None]:
# NOTE(review): this assignment rebinds `metadata`, which the import cell also
# binds to a project module (`import ui, diagnostics, metadata`); from here on
# the name refers to the value returned by get_nd2_frame_list.
all_frames, metadata, parsed_metadata = workflow.get_nd2_frame_list(nd2_filenames)
# Computed once here and passed to get_trench_bboxes / get_trench_stacks later on.
image_limits = workflow.get_filename_image_limits(metadata)

# Reload

In [None]:
def do_reload():
    """Reload the project modules that are being edited, in the current process.

    The notebook calls this both locally and on every worker (through
    ``client.run``), so all imports are done inside the function to keep it
    self-contained wherever it executes.

    Toggle the commented ``reload(...)`` lines to choose which modules are
    refreshed. Returns ``None``.
    """
    from importlib import reload

    import util
    import trench_detection
    import diagnostics
    import workflow
    import image

    # `import trench_detection` only binds the package; the `hough` attribute
    # exists only once the submodule itself has been imported in this process.
    # Import it explicitly so the reload below cannot fail with AttributeError
    # in a process (e.g. a fresh worker) that has not loaded it yet.
    import trench_detection.hough

    # reload(util)
    reload(trench_detection.hough)
    # reload(diagnostics)
    # reload(workflow)
    # reload(image)


# Reload on the workers through the client first, then in this notebook's kernel.
client.run(do_reload)
do_reload()

# Finding trenches

In [None]:
# Select the frames used for trench detection: third index level in ["MCHERRY"]
# and fourth index level equal to 0 (presumably channel and t -- TODO confirm
# the index level order of all_frames).
frames_to_process = all_frames.loc[IDX[:, :, ["MCHERRY"], 0], :]

In [None]:
len(frames_to_process)

## Debugging corrupted ND2

In [None]:
# Submit one frame-loading task per selected frame, keyed by the frame's index
# tuple, so that frames that fail to load can be identified by future status.
blah = {
    idx: client.submit(workflow.get_nd2_frame, **idx._asdict())
    for idx, row in util.iter_index(frames_to_process)
}

In [None]:
client.cancel(blah)

In [None]:
# Load one failing frame directly in this process (not through the client).
# NOTE: `bad` is assigned in the next cell; run that cell first.
workflow.get_nd2_frame(**util.get_one(bad)._asdict())

In [None]:
# Index keys of the tasks whose future ended in "error" status.
bad = [k for k, v in blah.items() if v.status == "error"]

In [None]:
progress(blah)

## Run trench finding

In [None]:
%%time
# Wrap the Hough-based trench finder with the diagnostics wrapper.
# NOTE(review): presumably ignore_exceptions=True makes the wrapper return the
# error instead of raising -- confirm in diagnostics.wrap_diagnostics.
find_trenches_diag = diagnostics.wrap_diagnostics(
    trench_detection.hough.find_trenches, ignore_exceptions=True, pandas=True
)
# One task chain per frame: the inner task loads the frame, the outer task runs
# the wrapped trench finder on the loaded frame.
trench_info_futures = {
    idx: client.submit(
        find_trenches_diag, client.submit(workflow.get_nd2_frame, **idx._asdict())
    )
    for idx, row in util.iter_index(frames_to_process)
}

In [None]:
client.cancel(trench_info_futures)

In [None]:
def as_completed(obj, with_results=True):
    """Iterate over a mapping of futures in completion order, keeping the keys.

    Parameters
    ----------
    obj : Mapping
        Maps user-facing keys to futures. Any other type is rejected.
    with_results : bool
        Forwarded to ``distributed.as_completed``. When true, each yielded
        item is ``(key, future, result)``; otherwise ``(key, future)``.

    Raises
    ------
    NotImplementedError
        If ``obj`` is not a ``Mapping``. Because this is a generator, the error
        is raised on the first iteration step rather than at call time.
    """
    if not isinstance(obj, Mapping):
        raise NotImplementedError

    # Translate each future's dask key back to the key used in `obj`.
    label_by_dask_key = {fut.key: label for label, fut in obj.items()}
    finished = distributed.as_completed(obj.values(), with_results=with_results)

    for item in finished:
        if with_results:
            fut, value = item
            yield label_by_dask_key[fut.key], fut, value
        else:
            yield label_by_dask_key[item.key], item

In [None]:
# Collect results in completion order; each future is cancelled right after its
# result has been copied into trench_info.
trench_info = {}
for key, fut, res in as_completed(trench_info_futures):
    trench_info[key] = res
    client.cancel(fut)

In [None]:
progress(trench_info_futures)

In [None]:
%%time
# Alternative to the loop above: gather through util.apply_map_futures.
# NOTE(review): the meaning of `predicate` is defined in util (not visible here);
# this call tests status == "error" while the bbox gather further down tests
# status == "finished" -- confirm which one is intended.
trench_info = util.apply_map_futures(
    client.gather, trench_info_futures, predicate=lambda x: x.status == "error"
)

In [None]:
%%time
%store trench_info

In [None]:
len(trench_info)

In [None]:
# NOTE: `errs` is assigned in the next cell; run that cell first.
len(errs)

In [None]:
# Keep only the entries whose third element is not None (presumably the error
# captured by the diagnostics wrapper -- compare the points/diag/err unzip below).
errs = {k: v[2] for k, v in trench_info.items() if v[2] is not None}
errs

In [None]:
%%time
trench_points, trench_diag, trench_err = workflow.unzip_trench_info(trench_info)

In [None]:
len(trench_points)

In [None]:
%%time
%store trench_points
%store trench_diag

## Analysis

In [None]:
# Flag frames whose detected angle exceeds 2 in absolute value
# (units not visible here -- TODO confirm).
# NOTE: bad_angle is only counted; the filtering below uses bad_pitch alone.
bad_angle = trench_diag["find_trench_lines.hough_2.angle"].abs() > 2
bad_angle.sum()

In [None]:
# Flag frames whose detected pitch differs from 24 by more than 1.
bad_pitch = (trench_diag["find_trench_lines.hough_2.peak_func.pitch"] - 24).abs() > 1
bad_pitch.sum()

In [None]:
selected = trench_diag[bad_pitch]  # trench_diag[bad_angle | bad_period]

In [None]:
# Push the flagged frames into the frame browser.
# NOTE: `frame_stream` is created in the "Trench finding QA" section further
# down; run that cell first.
frame_stream.event(_df=selected.index.to_frame(index=False))

In [None]:
%%time
# Drop the trench points that belong to frames flagged by bad_pitch.
trench_points_good = trench_points[~util.multi_join(trench_points.index, bad_pitch)]

In [None]:
# Number of retained trench points and the retained fraction.
(len(trench_points_good), len(trench_points_good) / len(trench_points))

In [None]:
%%time
# One bounding-box task per (filename, position, t) group of trench points.
trench_bbox_futures = []
for _, trenches in trench_points_good.groupby(["filename", "position", "t"]):
    trench_bbox_futures.append(
        client.submit(workflow.get_trench_bboxes, trenches, image_limits)
    )

In [None]:
%%time
trench_bbox_results = util.apply_map_futures(
    client.gather, trench_bbox_futures, predicate=lambda x: x.status == "finished"
)
# Stack the per-group results row-wise, then attach them column-wise to the
# retained trench points.
trench_bboxes = pd.concat(
    [trench_points_good, pd.concat(trench_bbox_results, axis=0)], axis=1
)

In [None]:
%%time
%store trench_bboxes

In [None]:
%store -r trench_bboxes

In [None]:
# Take the rows of one "t" group (element [1] of the (key, group) pair).
trench_bboxes_t0 = util.get_one(trench_bboxes.groupby("t"))[1]
# trench_bboxes_t0.index = trench_points_good_t0.index.droplevel('t')

# Trench finding QA

In [None]:
# NOTE: rebinds `selected`, which the Analysis section set to the flagged frames.
selected = all_frames

In [None]:
# Define a stream class from the index columns of `selected` and instantiate it;
# the widgets below are all driven by this one stream instance.
FrameStream = ui.DataframeStream.define(
    "FrameStream", selected.index.to_frame(index=False)
)
frame_stream = FrameStream()

box = ui.dataframe_browser(frame_stream)
frame_stream.event()
box

In [None]:
ui.image_viewer(frame_stream)

In [None]:
ui.show_frame_info(trench_diag, frame_stream)

In [None]:
g = ui.show_grid(selected, stream=frame_stream)
g

In [None]:
# Load the frame currently selected in the stream, in this process.
frame = workflow.get_nd2_frame(**dict(frame_stream.get_param_values()))

In [None]:
# Re-run trench finding with exceptions propagated (ignore_exceptions=False).
# NOTE(review): `frame_rot` is not assigned anywhere in the visible notebook; the
# cell above assigns `frame` -- confirm which name is intended.
tp, diag, _ = diagnostics.wrap_diagnostics(
    trench_detection.hough.find_trenches, ignore_exceptions=False
)(frame_rot)

In [None]:
ui.show_plot_browser(diag)

# Segmentation

In [None]:
trench_bboxes.head()

In [None]:
trench_bboxes[("info", "hough_value")].plot.hist(bins=100)

In [None]:
# Restrict to a subset of trenches on the "MCHERRY" rows; the slice `:10` and the
# scalar 0 apply to the second and fourth index levels (presumably position and
# t -- TODO confirm the level order of trench_bboxes).
selected_trenches_segmarker = trench_bboxes.loc[IDX[:, :10, ["MCHERRY"], 0, :, :], :]
# Index of the first "t" group with the "t" level dropped.
selected_trenches_index = next(iter(selected_trenches_segmarker.groupby("t")))[
    1
].index.droplevel("t")

In [None]:
len(trench_bboxes) / len(selected_trenches_segmarker)

In [None]:
# Same rows relabelled from "MCHERRY" to "YFP" on the "channel" index level.
selected_trenches_reporter = selected_trenches_segmarker.rename(
    index={"MCHERRY": "YFP"}, level="channel", copy=False
)

In [None]:
selected_trenches_all = pd.concat(
    [selected_trenches_segmarker, selected_trenches_reporter]
).sort_index()

In [None]:
# Scatter all_frames once (broadcast=True) and pass the resulting future to the
# tasks below instead of the dataframe itself.
[all_frames_future] = client.scatter([all_frames], broadcast=True)

In [None]:
# One stack-extraction task per (filename, position) group.
frame_stacks_futures = {}
for frame_idx, trenches in util.iter_index(
    selected_trenches_all.groupby(["filename", "position"])
):
    frame_stacks_futures[frame_idx] = client.submit(
        workflow.get_trench_stacks, trenches, all_frames_future, image_limits
    )

In [None]:
client.cancel(frame_stacks_futures)

In [None]:
# NOTE(review): predicate semantics live in util.apply_map_futures (not visible
# here); other cells pass status == "finished" -- confirm which is intended.
util.apply_map_futures(
    client.gather, frame_stacks_futures, predicate=lambda x: x.status == "error"
)

In [None]:
def do_segment_trench(img_stack):
    """Segment each image of a stack and return the masks as a compressed zarr array.

    Every element obtained by iterating ``img_stack`` is passed to
    ``trench_segmentation.watershed.segment_trench``; the results are stacked
    with ``np.stack`` and wrapped in a ``zarr.array`` compressed with Blosc
    (zstd, level 5, no shuffle).

    Imports are done inside the function so it is self-contained when it is
    submitted to a worker.
    """
    import trench_segmentation.watershed
    from numcodecs import Blosc

    masks = []
    for img in img_stack:
        masks.append(trench_segmentation.watershed.segment_trench(img))
    stacked = np.stack(masks)

    compressor = Blosc(cname="zstd", clevel=5, shuffle=Blosc.NOSHUFFLE, blocksize=0)
    return zarr.array(stacked, compressor=compressor)

In [None]:
# def map_trenchwise(func, frame_stacks, trenches):
#     results = {}
#     for trench_idx, _ in util.iter_index(trenches):
#         results[trench_idx] = func(frame_stacks[trench_idx])
#     return results


def map_trenchwise(func, frame_stacks, trenches, channels=None):
    """Apply ``func`` to the stack of every trench listed in ``trenches``.

    Parameters
    ----------
    func : callable
        Called once per trench. Its first argument is
        ``frame_stacks[trench_idx]``; when ``channels`` is given, one extra
        positional argument is appended per channel.
    frame_stacks : mapping
        Indexed by the trench index tuples yielded by ``util.iter_index``.
    trenches
        Passed to ``util.iter_index`` to enumerate the trench indices.
    channels : iterable or None
        For each entry, the stack stored under
        ``trench_idx._replace(channel=entry)`` is passed to ``func`` as well.

    Returns
    -------
    dict
        Maps each trench index to the value returned by ``func``.
    """
    per_trench = {}
    for trench_idx, _ in util.iter_index(trenches):
        stacks = [frame_stacks[trench_idx]]
        if channels is not None:
            for channel in channels:
                stacks.append(frame_stacks[trench_idx._replace(channel=channel)])
        per_trench[trench_idx] = func(*stacks)
    return per_trench

In [None]:
# One segmentation task per (filename, position) group: map_trenchwise applies
# do_segment_trench to each selected trench of that group's stack future.
frame_segs_futures = {}
for frame_idx, trenches in util.iter_index(
    selected_trenches_index.to_series().groupby(["filename", "position"])
):
    frame_segs_futures[frame_idx] = client.submit(
        partial(map_trenchwise, do_segment_trench),
        frame_stacks_futures[frame_idx],
        trenches,
    )
# frame_segs_futures = valmap(partial(client.submit, partial(valmap, do_segment_trench)), frame_stacks_futures)

In [None]:
client.cancel(frame_segs_futures)

In [None]:
def compute_regionprops(seg_stack, reporter_stack):
    """Run ``skimage.measure.regionprops`` on each pair of entries of two stacks.

    For every index ``t`` in ``range(seg_stack.shape[0])``, ``seg_stack[t]`` and
    ``reporter_stack[t]`` are passed as the first and second positional
    arguments of ``regionprops``.

    Returns a list with one ``regionprops`` result per index.
    """
    import skimage.measure

    n_entries = seg_stack.shape[0]
    return [
        skimage.measure.regionprops(seg_stack[t], reporter_stack[t])
        for t in range(n_entries)
    ]

In [None]:
# Scratch cells: pull one result of each kind back to the notebook for inspection.
_frame_stacks = util.get_one(frame_stacks_futures).result()

In [None]:
# Same stack extraction run locally for one hard-coded (filename, position) pair.
_frame_stacks2 = workflow.get_trench_stacks(
    selected_trenches_all.xs(
        ("/n/scratch2/jqs1/fidelity/all/180405_txnerr.nd2", 0), drop_level=False
    ),
    all_frames,
    image_limits,
)

In [None]:
_key = util.get_one(_frame_stacks.keys())
_key

In [None]:
_seg_masks = util.get_one(frame_segs_futures).result()

In [None]:
util.get_one(_seg_masks.keys())

In [None]:
# Region properties of one trench: its masks measured against the stack stored
# under the same key (the trailing comment shows the YFP variant).
_rps = compute_regionprops(
    _seg_masks[_key], _frame_stacks[_key]
)  # , _frame_stacks[_key._replace(channel='YFP')])

In [None]:
# First region of the first entry.
_rp0 = _rps[0][0]

In [None]:
# Display the region object; append an attribute name (e.g. through tab
# completion) to inspect a specific property.
_rp0

In [None]:
# NOTE(review): map_trenchwise takes (func, frame_stacks, trenches, channels=None);
# this call supplies no `trenches` argument, and `_frame` is not assigned
# anywhere in the visible notebook -- looks like an unfinished experiment.
partial(map_trenchwise, compute_regionprops, channels=["YFP"])(_frame)

In [None]:
# One regionprops task per (filename, position) group.
# NOTE(review): map_trenchwise passes frame_stacks[trench_idx] as the first
# argument, so compute_regionprops receives the image stack from
# frame_stacks_futures as `seg_stack`, not the masks held in frame_segs_futures
# -- confirm this is intended.
frame_regionprops_futures = {}
for frame_idx, trenches in util.iter_index(
    selected_trenches_index.to_series().groupby(["filename", "position"])
):
    frame_regionprops_futures[frame_idx] = client.submit(
        partial(map_trenchwise, compute_regionprops, channels=["YFP"]),
        frame_stacks_futures[frame_idx],
        trenches,
    )

In [None]:
client.cancel(frame_regionprops_futures)

In [None]:
# NOTE(review): this gather tests status == "error" while the one in the next
# cell tests status == "finished"; predicate semantics are defined in
# util.apply_map_futures (not visible here) -- confirm which is intended.
frame_regionprops = util.apply_map_futures(
    client.gather, frame_regionprops_futures, predicate=lambda x: x.status == "error"
)

In [None]:
frame_segs = util.apply_map_futures(
    client.gather, frame_segs_futures, predicate=lambda x: x.status == "finished"
)

In [None]:
# NOTE(review): `pysize` is not imported in the visible import cell.
pysize.get_size(frame_segs)

In [None]:
len(frame_segs)

In [None]:
%%time
%store frame_segs

In [None]:
a = util.get_one(util.get_one(frame_segs))

In [None]:
plt.imshow(a[0])

In [None]:
# NOTE(review): `pysize` is not imported in the visible import cell.
pysize.get_size(frame_segs)

In [None]:
# `trenches` here is whatever the most recently run loop left bound to that name.
trenches.head()

In [None]:
# TODO: old version
# frame_segs_futures = valmap(partial(client.submit, partial(valmap, do_segment_trench)), frame_stacks_futures)

In [None]:
# UNUSED: how to add another channel to trench stacks
# selected_trenches_yfp = selected_trenches.rename(index={'MCHERRY': 'YFP'}, level='channel', copy=False)
# frame_stacks_yfp_futures = {}
# for frame_idx, trenches in util.iter_index(selected_trenches_yfp.groupby(['filename', 'position'])):
#     frame_stacks_yfp_futures[frame_idx] = client.submit(merge,
#                                                        [frame_stacks_futures[frame_idx],
#                                                         client.submit(workflow.get_trench_stacks,
#                                                                       trenches,
#                                                                       all_frames_future,
#                                                                       image_limits)])

In [None]:
# given a dataframe of segmentation frames and a dataframe of readout frames, return regionprops objects (cheaper to serialize than dataframes?)

In [None]:
client.cancel(frame_segs_futures)

In [None]:
client.gather(util.get_one(frame_segs_futures))

In [None]:
# NOTE: `Blosc` is only imported in a later cell (`from numcodecs import Blosc`);
# run that cell first.
zarr.array(
    a, compressor=Blosc(cname="zstd", clevel=5, shuffle=Blosc.NOSHUFFLE, blocksize=0)
)

In [None]:
# hhh

In [None]:
# NOTE(review): `trench_stack_futures` is not assigned anywhere in the visible
# notebook; the dict built in the Segmentation section is named
# `frame_stacks_futures` -- confirm which name is intended.
frame0_stacks = client.gather(util.get_one(trench_stack_futures))

In [None]:
img_stack = util.get_one(frame0_stacks)

In [None]:
# Segment every image of the stack locally and stack the results.
a = np.stack([trench_segmentation.watershed.segment_trench(img) for img in img_stack])

In [None]:
a.shape

In [None]:
from numcodecs import Blosc

In [None]:
# hhh

In [None]:
%%time
# Same bbox gather and concat as in the Analysis section.
trench_bbox_results = util.apply_map_futures(
    client.gather, trench_bbox_futures, predicate=lambda x: x.status == "finished"
)
trench_bboxes = pd.concat(
    [trench_points_good, pd.concat(trench_bbox_results, axis=0)], axis=1
)

In [None]:
%%time
# Extract stacks locally, without going through the client.
# NOTE(review): `selected_trenches` is not assigned anywhere in the visible
# notebook (only selected_trenches_segmarker/_reporter/_all/_index are).
trench_stacks = workflow.get_trench_stacks(
    selected_trenches, all_frames, workflow.get_filename_image_limits(metadata)
)

In [None]:
%%time
# Segment each image through the diagnostics wrapper and transpose the
# per-image 3-tuples into three parallel tuples.
segs, seg_diags, seg_errs = zip(
    *[
        diagnostics.wrap_diagnostics(trench_segmentation.watershed.segment_trench)(img)
        for img in img_stack
    ]
)

# Old

In [None]:
# NOTE(review): `get_trenches`, `root_group`, `pos`, `diag_pos` and `tree` are not
# defined in the visible notebook; presumably they came from the star-imports
# that are now commented out near the top -- confirm before running.
get_trenches(root_group["raw"][str(pos)][1, 30], diagnostics=diag_pos[pos])

In [None]:
diag = tree()
_ = get_trenches(root_group["raw"][str(pos)][0, 1], diagnostics=diag)

In [None]:
def f(img_stack):
    """Segment each entry along axis 0 of ``img_stack`` and return a zarr array.

    ``segment_trench`` is called with ``diagnostics=None`` for every index in
    ``range(img_stack.shape[0])``; the results are stacked along a new leading
    axis and stored with ``DEFAULT_FRAME_COMPRESSOR``.
    """
    n_entries = img_stack.shape[0]
    masks = []
    for t in range(n_entries):
        masks.append(segment_trench(img_stack[t], diagnostics=None))
    stacked = np.stack(masks, axis=0)
    return zarr.array(stacked, compressor=DEFAULT_FRAME_COMPRESSOR)


# Apply the segmentation `f` defined in this cell through the older positionwise
# helper, for positions range(1) and channel_slice=1.
# NOTE(review): `positionwise_trenchwise_map`, `root_group` and
# `trench_points_pos` are not defined in the visible notebook.
trench_seg_masks = positionwise_trenchwise_map(
    root_group["raw"],
    trench_points_pos,
    f,
    channel_slice=1,
    preload=True,
    time_slice=slice(None),
    positions=range(1),
)

In [None]:
def f(img_stack):
    """Return the 95th percentile over axes 1 and 2 as a pandas Series.

    The Series holds one value per entry along axis 0 of ``img_stack``.
    """
    percentile_per_entry = np.percentile(img_stack, 95, axis=(1, 2))
    return pd.Series(percentile_per_entry)
    # Alternative statistic: pd.Series(np.max(img_stack, axis=(1,2)))


# Apply the percentile `f` defined in this cell through the older positionwise
# helper, for positions range(100) and channel_slice=2.
# NOTE(review): `positionwise_trenchwise_map`, `root_group` and
# `trench_points_pos` are not defined in the visible notebook.
trench_traces_all = positionwise_trenchwise_map(
    root_group["raw"],
    trench_points_pos,
    f,
    channel_slice=2,
    preload=True,
    time_slice=slice(None),
    positions=range(100),
)