In [1]:
from sx_multi import DataSource
from sx_multi import Analysis
from sx_multi import Accumulator
from sx_multi import DaskExecutor

import matplotlib.pyplot as plt

from servicex import ServiceXDataset
from sx_multi import FuncAdlDataset
from coffea import hist, processor


In [2]:
# Dataset identifier strings to process; each one is wrapped in a ServiceXDataset below.
dids = [
    'mc15_13TeV:mc15_13TeV.361106.PowhegPythia8EvtGen_AZNLOCTEQ6L1_Zee.merge.DAOD_STDM3.e3601_s2576_s2132_r6630_r6264_p2363_tid05630052_00',
]

# One ServiceX dataset per identifier, all using the 'xaod' backend type.
datasets = [ServiceXDataset(did, backend_type='xaod') for did in dids]

In [3]:
# Per-event electron query, step by step:
#   1. take the "Electrons" collection of each event;
#   2. keep electrons with pt()/1000.0 > 30.0 (presumably MeV -> GeV; confirm units);
#   3. keep electrons with |eta| < 2.5;
#   4. keep only events in which exactly two electrons survive both cuts;
#   5. for the surviving electrons emit pt, eta, phi and m (pt and m scaled by 1/1000);
#   6. request the result as tree 'mytree' in 'data.root' with columns
#      ElePt, EleEta, ElePhi, EleM (the names read back in the analysis code).
leptons_per_event_query = FuncAdlDataset() \
        .Select(lambda e: e.Electrons("Electrons")) \
        .Select(lambda eles: eles.Where(lambda e: e.pt()/1000.0 > 30.0)) \
        .Select(lambda eles: eles.Where(lambda e: abs(e.eta()) < 2.5)) \
        .Where(lambda eles: len(eles) == 2) \
        .Select(lambda ls: (ls.Select(lambda e: e.pt()/1000.0), ls.Select(lambda e: e.eta()), ls.Select(lambda e: e.phi()), ls.Select(lambda e: e.m()/1000.0))) \
        .AsROOTTTree('data.root', 'mytree', ('ElePt', 'EleEta', 'ElePhi', 'EleM'))

In [4]:
# Bundle the query with the datasets it should run over; no extra metadata is attached.
datasource = DataSource(
    query=leptons_per_event_query,
    metadata={},
    datasets=datasets,
)

In [5]:
class Z_EEAnalysis(Analysis):
    """Di-electron invariant-mass analysis.

    Accumulated outputs:
        "mass": histogram of the two-electron invariant mass (60 bins over
            60-120, labelled in GeV), categorised by dataset name.
        "sumw": per-dataset running count of the events passed to `process`.
    """

    def __init__(self):
        """Declare every accumulator that `process` writes into."""
        self.accumulator = Accumulator({
            "mass": hist.Hist(
                "Events",
                hist.Cat("dataset", "Dataset"),
                hist.Bin("mass", "$Z_{ee}$ [GeV]", 60, 60, 120),
            ),
            # `process` increments output["sumw"][dataset]; without this entry
            # that lookup has nothing to land on.
            "sumw": processor.defaultdict_accumulator(float),
        })

    @staticmethod
    def process(output, events):
        """Fill the accumulators from one chunk of events.

        Args:
            output: accumulator mapping holding the "mass" and "sumw" entries.
            events: event chunk exposing the ElePt, EleEta, ElePhi and EleM
                columns plus a `metadata['dataset']` name.

        Returns:
            The same `output` object, updated in place.
        """
        # Imported inside the function rather than at notebook level; presumably
        # so it resolves wherever this static method runs -- confirm.
        import awkward1 as ak

        dataset = events.metadata['dataset']
        electrons = ak.zip({
            "pt": events.ElePt,
            "eta": events.EleEta,
            "phi": events.ElePhi,
            "mass": events.EleM,
            # NOTE(review): charge is filled from the mass column; the query
            # returns no charge branch, so this looks like a placeholder --
            # confirm before using `charge` downstream.
            "charge": events.EleM,
        }, with_name="PtEtaPhiMCandidate")

        # Form the invariant mass from events with exactly two electrons.
        # The mask is applied once and the selection reused for both legs.
        two_electrons = electrons[ak.num(electrons) == 2]
        diele = two_electrons[:, 0] + two_electrons[:, 1]

        output["sumw"][dataset] += len(events)
        output["mass"].fill(
            dataset=dataset,
            mass=diele.mass,
        )

        return output





In [6]:
# Address handed to DaskExecutor as `client_addr`
# (presumably a locally running Dask scheduler -- confirm).
DASK_CLIENT_ADDR = "127.0.0.1:8080"

analysis = Z_EEAnalysis()
executor = DaskExecutor(client_addr=DASK_CLIENT_ADDR)


In [7]:
# Select matplotlib's interactive widget backend (ipympl) for the figures drawn below.
%matplotlib widget
async def plot_stream(accumulator_stream):
    """Plot the 'mass' histogram of every partial result as it arrives.

    Args:
        accumulator_stream: async iterable yielding accumulator mappings that
            each contain a 'mass' histogram.

    Returns:
        The last item received from the stream, or None if the stream
        yielded nothing.
    """
    # Pre-bind the loop variable so an empty stream returns None instead of
    # raising UnboundLocalError at the return statement.
    coffea_info = None
    async for coffea_info in accumulator_stream:
        # Need to ask coffea folks how to animate this!
        hist.plot1d(coffea_info['mass'])
        plt.show()
    return coffea_info

await plot_stream(executor.execute(analysis, datasource))


+-------------+---------------+---------------+---------------+
| Package     | client        | scheduler     | workers       |
+-------------+---------------+---------------+---------------+
| blosc       | None          | 1.9.2         | 1.9.2         |
| distributed | 2.30.1        | 2.30.0        | 2.30.1        |
| lz4         | 3.1.0         | 3.1.0         | 3.1.1         |
| numpy       | 1.19.3        | 1.18.1        | 1.18.1        |
| python      | 3.7.6.final.0 | 3.8.0.final.0 | 3.7.0.final.0 |
| tornado     | 6.1           | 6.0.4         | 6.1           |
+-------------+---------------+---------------+---------------+


HBox(children=(HTML(value='mc15_13TeV:mc15_13TeV.361106.PowhegPythia8EvtGen_AZNLOCTEQ6L1_Zee.merge.DAOD_STDM3.…

HBox(children=(HTML(value='        Downloaded'), FloatProgress(value=0.0, layout=Layout(flex='2'), max=9000000…

{'mass': <Hist (dataset,mass) instance at 0x139179610>, 'sumw': defaultdict_accumulator(<class 'float'>, {'mc15x': 24000.0})}


Canvas(toolbar=Toolbar(toolitems=[('Home', 'Reset original view', 'home', 'home'), ('Back', 'Back to previous …

{'mass': <Hist (dataset,mass) instance at 0x139229f90>, 'sumw': defaultdict_accumulator(<class 'float'>, {'mc15x': 45000.0})}
{'mass': <Hist (dataset,mass) instance at 0x13926fe50>, 'sumw': defaultdict_accumulator(<class 'float'>, {'mc15x': 50000.0})}
{'mass': <Hist (dataset,mass) instance at 0x13926fe90>, 'sumw': defaultdict_accumulator(<class 'float'>, {'mc15x': 50000.0})}
{'mass': <Hist (dataset,mass) instance at 0x1392d9e10>, 'sumw': defaultdict_accumulator(<class 'float'>, {'mc15x': 50000.0})}
{'mass': <Hist (dataset,mass) instance at 0x139329750>, 'sumw': defaultdict_accumulator(<class 'float'>, {'mc15x': 125000.0})}
{'mass': <Hist (dataset,mass) instance at 0x139376b10>, 'sumw': defaultdict_accumulator(<class 'float'>, {'mc15x': 149800.0})}
{'mass': <Hist (dataset,mass) instance at 0x1393c7950>, 'sumw': defaultdict_accumulator(<class 'float'>, {'mc15x': 150000.0})}
{'mass': <Hist (dataset,mass) instance at 0x1392d3810>, 'sumw': defaultdict_accumulator(<class 'float'>, {'mc15x': 

{'mass': <Hist (dataset,mass) instance at 0x138eac550>,
 'sumw': defaultdict_accumulator(float, {'mc15x': 1993800.0})}