# Dask imaging demonstration

This notebook explores the use of dask for parallelisation. We work through the steps of imaging, ending up with a major/minor cycle algorithm using dask.

In [None]:
%matplotlib inline

import os
import sys

from dask import delayed

sys.path.append(os.path.join('..', '..'))

results_dir = './results'
os.makedirs(results_dir, exist_ok=True)

from matplotlib import pylab

pylab.rcParams['figure.figsize'] = (12.0, 12.0)
pylab.rcParams['image.cmap'] = 'rainbow'

import numpy

from astropy.coordinates import SkyCoord
from astropy import units as u
from astropy.wcs.utils import pixel_to_skycoord

from matplotlib import pyplot as plt

from arl.data.polarisation import PolarisationFrame
from arl.data.parameters import get_parameter
from arl.visibility.operations import create_visibility, create_visibility_from_rows, copy_visibility
from arl.skycomponent.operations import create_skycomponent
from arl.image.deconvolution import deconvolve_cube
from arl.image.operations import show_image, export_image_to_fits
from arl.image.iterators import raster_iter
from arl.visibility.iterators import vis_timeslice_iter, vis_timeslice_iter
from arl.util.testing_support import create_named_configuration
from arl.fourier_transforms.ftprocessor import predict_2d, invert_2d, create_image_from_visibility, \
    predict_skycomponent_visibility, residual_image, invert_timeslice_single, invert_timeslice_single, \
    predict_timeslice_single, predict_timeslice_single,advise_wide_field

import logging

log = logging.getLogger()
log.setLevel(logging.DEBUG)
log.addHandler(logging.StreamHandler(sys.stdout))

We create the visibility. 

This just makes the uvw, time, antenna1, antenna2, and weight columns in a table.

In [None]:
# Array layout: the named configuration 'LOWBD2-CORE'.
lowcore = create_named_configuration('LOWBD2-CORE')

# 13 evenly spaced samples from -3 to +3, scaled by pi/12
# (presumably hour angles in hours converted to radians -- confirm against create_visibility).
times = numpy.linspace(-3, +3, 13) * (numpy.pi / 12.0)

# One frequency channel and its bandwidth (presumably in Hz -- confirm).
frequency = numpy.array([1e8])
channel_bandwidth = numpy.array([1e7])
reffrequency = numpy.max(frequency)

# Phase centre of the observation.
phasecentre = SkyCoord(ra=+15.0 * u.deg, dec=-45.0 * u.deg, frame='icrs', equinox=2000.0)

# Visibility set for a single Stokes I polarisation with unit weights.
vt = create_visibility(
    lowcore,
    times,
    frequency,
    channel_bandwidth=channel_bandwidth,
    weight=1.0,
    phasecentre=phasecentre,
    polarisation_frame=PolarisationFrame("stokesI"),
)

Advise on wide field parameters. This returns a dictionary with all the input and calculated variables.

In [None]:
# Keep the advice in a variable; nothing else in the visible notebook reads it back.
advice = advise_wide_field(vt)

Create a grid of components and predict each in turn, using the full phase term including w.

In [None]:
# Image geometry, defined once so the model image, the parameter dictionary and the
# component grid below cannot drift apart when one of the values is edited.
npixel = 512
cellsize = 0.001
facets = 4
flux = numpy.array([[100.0]])

params = {'npixel': npixel,
          'cellsize': cellsize,
          'spectral_mode': 'channel',
          'channel_bandwidth': 5e7,
          'reffrequency': 1e8,
          'kernel': 'calculated',
          'facets': facets}

# Template image; its WCS is used to turn pixel positions into sky coordinates.
model = create_image_from_visibility(vt, npixel=npixel, cellsize=cellsize, npol=1)

# One component per facet-sized cell of a 4 x 4 grid.
spacing_pixels = npixel // facets
log.info('Spacing in pixels = %s', spacing_pixels)
# Same spacing scaled by 180/pi (degrees, assuming cellsize is in radians -- confirm).
spacing = 180.0 * cellsize * spacing_pixels / numpy.pi
# Grid offsets from the image centre, in units of spacing_pixels.
centers = -1.5, -0.5, +0.5, +1.5
comps = list()
for iy in centers:
    for ix in centers:
        pra = int(round(npixel // 2 + ix * spacing_pixels - 1))
        pdec = int(round(npixel // 2 + iy * spacing_pixels - 1))
        sc = pixel_to_skycoord(pra, pdec, model.wcs)
        log.info("Component at (%f, %f) %s", pra, pdec, sc)
        comps.append(create_skycomponent(flux=flux, frequency=frequency, direction=sc,
                                         polarisation_frame=PolarisationFrame("stokesI")))

# NOTE(review): this rebinds vt from its own previous value, so re-running the cell predicts
# into an already-predicted visibility; presumably re-run from the visibility cell to start clean.
vt = predict_skycomponent_visibility(vt, comps)

Define a Dask-enabled invert that looks like invert_2d but takes two additional arguments: the function that inverts a single chunk, and an iterator. The iterator splits the visibility into chunks, and the single-chunk invert is then called on each chunk.

In [None]:
# Delayed construction of the model image; reuses the notebook's npixel/cellsize so the
# graph's image geometry always matches the one used to place the components.
model_graph = delayed(create_image_from_visibility)(vt, npixel=npixel, cellsize=cellsize, npol=1)

def invert_graph(vt, model_graph, dopsf=False, normalize=True, invert_single=invert_2d, iterator=vis_timeslice_iter, 
                **kwargs):
    """Build a dask graph that inverts a visibility chunk by chunk and sums the results.

    The visibility is split eagerly (at graph-construction time) using ``iterator``; one
    delayed ``invert_single`` task is created per chunk, and a final delayed task adds
    the per-chunk images and weights together.

    :param vt: Visibility to be inverted
    :param model_graph: Model image (or a delayed object producing it) handed to ``invert_single``
    :param dopsf: Forwarded unchanged to ``invert_single``
    :param normalize: If true, divide the accumulated image by the accumulated sum of weights
    :param invert_single: Function called per chunk as
        ``invert_single(vis, model, dopsf=..., normalize=False, **kwargs)``; it must return a
        sequence whose element 0 has a ``data`` array and whose element 1 is the sum of weights
    :param iterator: Called as ``iterator(vt, **kwargs)``; each item is passed to
        ``create_visibility_from_rows`` to select one chunk
    :param kwargs: Forwarded to both ``iterator`` and ``invert_single``
    :returns: Delayed object that evaluates to the tuple ``(image, sumwt)``
    """

    def accumulate_results(results, normalize=normalize):
        """Sum the per-chunk (image, sumwt) pairs and optionally normalise the image.

        :raises ValueError: if ``results`` is empty
        """
        import copy

        if not results:
            raise ValueError("invert_graph: the iterator produced no visibility chunks to invert")

        # Accumulate into copies: writing into the first chunk's own image/weights would
        # mutate the output of another task in the graph.
        acc = copy.deepcopy(results[0][0])
        sumwt = copy.deepcopy(results[0][1])
        for result in results[1:]:
            acc.data += result[0].data
            sumwt += result[1]

        if normalize:
            acc.data /= float(sumwt)

        return acc, sumwt

    results = list()

    for rows in iterator(vt, **kwargs):
        # The chunk is cut out and copied now; only the invert itself is deferred.
        v = copy_visibility(create_visibility_from_rows(vt, rows))
        # Per-chunk normalisation is always off; it is applied once, after summation.
        result = delayed(invert_single, pure=True)(v, model_graph, dopsf=dopsf, normalize=False, **kwargs)
        results.append(result)

    return delayed(accumulate_results, pure=True)(results, normalize)

In [None]:
# Build (without computing) the dirty-image graph for timeslice imaging and draw it.
# The delayed model_graph is passed, matching the other invert_graph calls in this notebook.
dirty_timeslice_graph = invert_graph(vt, model_graph, dopsf=False, invert_single=invert_timeslice_single,
                                     iterator=vis_timeslice_iter, normalize=False, timeslice=10.0, context='')
dirty_timeslice_graph.visualize()

We will need a deconvolve graph

In [None]:
def deconvolve_graph(dirty_graph, psf_graph, model_graph, **kwargs):
    """Build a delayed task that deconvolves a dirty image and adds the result to a model.

    :param dirty_graph: Delayed object; its element 0 is used as the dirty image
    :param psf_graph: Delayed object; its element 0 is used as the PSF
    :param model_graph: Model image (or delayed object producing it) whose data is added
        to the deconvolution output
    :param kwargs: Forwarded to ``deconvolve_cube``
    :returns: Delayed object that evaluates to the updated model image
    """
    def deconvolve_model_only(dirty, psf, model, **kwargs):
        # Only the first element returned by deconvolve_cube is kept.
        deconvolved = deconvolve_cube(dirty, psf, **kwargs)
        updated = deconvolved[0]
        # Added in place to the object deconvolve_cube returned.
        updated.data += model.data
        return updated

    dirty_image = dirty_graph[0]
    psf_image = psf_graph[0]
    task = delayed(deconvolve_model_only, pure=True)
    return task(dirty_image, psf_image, model_graph, **kwargs)

In [None]:
# Un-normalised PSF and dirty-image graphs; the two calls differ only in dopsf.
psf_graph = invert_graph(
    vt, model_graph,
    dopsf=True,
    invert_single=invert_timeslice_single,
    iterator=vis_timeslice_iter,
    normalize=False,
    timeslice=10.0)
dirty_graph = invert_graph(
    vt, model_graph,
    dopsf=False,
    invert_single=invert_timeslice_single,
    iterator=vis_timeslice_iter,
    normalize=False,
    timeslice=10.0)

In [None]:
# Chain the dirty-image and PSF graphs into a deconvolution task, then draw the combined graph.
clean_model_graph = deconvolve_graph(
    dirty_graph, psf_graph, model_graph,
    niter=1000, algorithm='hogbom', gain=0.1)
clean_model_graph.visualize()

Now we can compute the deconvolution. As the graph shows, the dirty image and psf will be computed and then the deconvolution will occur.

In [None]:
# Execute the whole graph (inverts for dirty image and PSF, then the deconvolution).
clean_model = clean_model_graph.compute()

In [None]:
# Show the text form of the computed clean model.
print(clean_model)

Next we will need a graph to calculate residuals. For this we have added a new function in ftprocessor that 
calculates residuals per visibility chunk. This works for timeslicing and wslicing but not for faceting.

In [None]:
# Display the delayed model-image object itself; this does not compute it.
model_graph

In [None]:
def residual_graph(vis, model_graph, iterator=vis_timeslice_iter, **kwargs):
    """Build a dask graph that computes the normalised residual image chunk by chunk.

    The visibility is split eagerly (at graph-construction time) using ``iterator``; one
    delayed ``residual_image`` task is created per chunk, and a final delayed task sums
    the per-chunk residual images and weights and divides the image by the total weight.

    :param vis: Visibility to compute residuals for
    :param model_graph: Model image (or a delayed object producing it) handed to ``residual_image``
    :param iterator: Called as ``iterator(vis, **kwargs)``; each item is passed to
        ``create_visibility_from_rows`` to select one chunk
    :param kwargs: Forwarded to both ``iterator`` and ``residual_image``
    :returns: Delayed object that evaluates to the tuple ``(residual image, sumwt)``
    """

    def accumulate_results(results):
        """Sum element 1 (image) and element 2 (sumwt) of every chunk result, then normalise.

        :raises ValueError: if ``results`` is empty
        """
        import copy

        if not results:
            raise ValueError("residual_graph: the iterator produced no visibility chunks")

        # Accumulate into copies: writing into the first chunk's own image/weights would
        # mutate the output of another task in the graph.
        acc = copy.deepcopy(results[0][1])
        sumwt = copy.deepcopy(results[0][2])
        for result in results[1:]:
            acc.data += result[1].data
            sumwt += result[2]

        acc.data /= float(sumwt)
        return acc, sumwt

    results = list()

    for rows in iterator(vis, **kwargs):
        # The chunk is cut out and copied now; only residual_image itself is deferred.
        visslice = copy_visibility(create_visibility_from_rows(vis, rows))
        # Each per-chunk result is a tuple: resid vis, resid image, sumwt
        result = delayed(residual_image, pure=True)(visslice, model_graph, normalize=False, **kwargs)
        results.append(result)

    # The graph evaluates to (residual image, sumwt); the per-chunk residual
    # visibilities (element 0 of each result) are not carried forward.
    return delayed(accumulate_results, pure=True)(results)

In [None]:
# Residual graph using the timeslice predict/invert pair; the two *_residual keywords
# travel through **kwargs to residual_image. Draw the graph without computing it.
residual_timeslice_graph = residual_graph(
    vt,
    model_graph,
    predict_residual=predict_timeslice_single,
    invert_residual=invert_timeslice_single,
    iterator=vis_timeslice_iter,
)
residual_timeslice_graph.visualize()

In [None]:
# Execute the residual graph; it evaluates to the (image, sum of weights) pair unpacked here.
residual, sumwt = residual_timeslice_graph.compute()

Finally we make a graph version of solve_image

In [None]:
def solve_image_graph(vis, 
                      model_graph,  
                      residual_graph=residual_graph, 
                      invert_graph=invert_graph,
                      deconvolve_graph=deconvolve_graph, **kwargs):
    """Build a dask graph for a major/minor cycle deconvolution.

    The PSF graph is built once. Each major cycle then builds a residual graph for the
    current model and a deconvolution graph that produces the next model.

    :param vis: Visibility to be imaged
    :param model_graph: Initial model image (or delayed object producing it)
    :param residual_graph: Graph builder called as ``residual_graph(vis, model, **kwargs)``
    :param invert_graph: Graph builder called as ``invert_graph(vis, model, dopsf=True, **kwargs)``
    :param deconvolve_graph: Graph builder called as
        ``deconvolve_graph(residual, psf, model, **kwargs)``
    :param kwargs: Forwarded unchanged to all three graph builders. ``nmajor`` (default 3)
        is additionally read here as the number of major cycles
    :returns: Delayed object for the model after the last major cycle; ``model_graph``
        itself if ``nmajor`` is 0 or less
    """
    # nmajor is read but left in kwargs, so the graph builders still receive it.
    nmajor = int(kwargs.get('nmajor', 3))

    psf_graph = invert_graph(vis, model_graph, dopsf=True, **kwargs)

    current_model_graph = model_graph
    for _ in range(nmajor):
        # Major cycle: residual for the current model, then deconvolve to update the model.
        res_graph = residual_graph(vis, current_model_graph, **kwargs)
        current_model_graph = deconvolve_graph(res_graph, psf_graph, current_model_graph, **kwargs)

    return current_model_graph

Now we can create the graph that will do the deconvolution

In [None]:
# Fresh delayed model image, using the notebook's npixel/cellsize rather than repeated literals.
model_graph = delayed(create_image_from_visibility)(vt, npixel=npixel, cellsize=cellsize, npol=1)

# invert_graph is passed under the parameter name solve_image_graph declares, so it is
# bound to that parameter rather than falling into **kwargs.
solution_graph = solve_image_graph(vt, model_graph=model_graph, invert_graph=invert_graph,
                                   invert_residual=invert_timeslice_single,
                                   predict_residual=predict_timeslice_single,
                                   iterator=vis_timeslice_iter, algorithm='hogbom',
                                   niter=1000, fractional_threshold=0.1,
                                   threshold=1.0, nmajor=3, gain=0.1)
solution_graph.visualize()

In [None]:
# Execute the full major/minor cycle graph; rebinds clean_model from the earlier single deconvolution.
clean_model = solution_graph.compute()