In [1]:
%load_ext autoreload
%autoreload 2
import numpy as np
import matplotlib.pyplot as plt
import awkward as ak
import sys
sys.path.append("../../../analysisTools/")
from analysisTools import Analyzer
from analysisTools import loadSchema
import analysisTools as tools
import analysisSubroutines as routines
import importlib
import coffea.util as util
import time
import json
import os
import glob

## Some Information

### Input files to be analyzed

**Coffea can be run on either *unskimmed ntuples* or *skimmed ntuples*.**

- ***unskimmed ntuples***: we use AOD samples for the analysis, so we run the [ntuplizer+miniAOD] from [AODSkimmer](https://github.com/kyungminparkdrums/iDMe/tree/main/AODSkimmer) in condor jobs, saving useful branches that will be used in the analysis. 

- ***skimmed ntuples***: produced from the *unskimmed ntuples* above by applying some basic preselections with `RDataFrame` in condor jobs, using the scripts in [python_analysis/condor/](https://github.com/kyungminparkdrums/iDMe/tree/main/python_analysis/condor#condor-jobs-for-skimmer-that-applies-preselections-to-the-ntuples).

Note:
- In the FNAL LPC EOS `lpcmetx/iDMe/` area, both unskimmed and skimmed ntuples are available.
- You can also produce your own, following the README in `AODSkimmer/` (for unskimmed ntuples) and `python_analysis/condor/` (for skimmed ntuples). 

### Configs
The coffea analyzer requires config files for the cuts, histograms, and samples. Check out the README for each of these; there you'll find information on how to add/edit cuts, histograms, etc.
- [cut config](https://github.com/kyungminparkdrums/iDMe/tree/main/python_analysis/configs#cut-configs-cut_configs)
- [histo config](https://github.com/kyungminparkdrums/iDMe/tree/main/python_analysis/configs#histo-configs-histo_configs)
- [sample config](https://github.com/kyungminparkdrums/iDMe/tree/main/python_analysis/configs#sample-configs-sample_configs)

## Run coffea on skimmed ntuples

In [2]:
# Histogram config (relative path); handed to Analyzer in the run cells below.
histos_config = "../../../configs/histo_configs/SR_studies.py"
# Cut config (relative path); handed to Analyzer in the run cells below.
cuts_config = "./cut_configs/BDTv1_ctau-1.py"

In [3]:
# Create the top-level output directory. exist_ok=True makes re-running this
# cell a no-op and avoids the check-then-create race of isdir() + mkdir().
os.makedirs('coffea', exist_ok=True)

In [4]:
# Directory that receives the .coffea files saved by the run cells below.
outdir = "./coffea/skimmed/"
# makedirs creates any missing parent ('coffea') as well, so this cell works
# on its own, and exist_ok=True keeps it safe to re-run.
os.makedirs(outdir, exist_ok=True)

### Signal

In [5]:
# Sample config (JSON) for the signal samples; passed to Analyzer in the next cell.
# NOTE(review): the background configs are globbed from
# ../../../configs/sample_configs/, while this file sits one directory up —
# confirm this location is intended.
sample_config = "../skimmed_sig_v2_egamma_hadd_ntuples_2018_aEM_ctau-1.json"

In [6]:
# Build the analyzer for the signal sample config.
# max_samples=-1: run over all samples in the config.
analyzer = Analyzer(sample_config, histos_config, cuts_config, max_samples=-1)

# Time only the processing step.
t1 = time.time()
out = analyzer.process(execr='futures')
t2 = time.time()

print("Runtime: {:.2f} minutes".format((t2-t1)/60))
# outdir already ends with a separator; os.path.join avoids the doubled '/'
# that string concatenation would put into the saved path.
util.save(out, os.path.join(outdir, "signal_SR_BDTv1_ctau-1_5to50_skimmed.coffea"))

# Drop the references to the output and the analyzer once the file is written.
del out, analyzer

Output()

Output()

Pass: 71/178
Pass: 202/652
Pass: 234/700
Pass: 950/2694
Pass: 791/1863
Pass: 843/2372
Pass: 618/1879
Pass: 586/1442
Pass: 513/1530
Pass: 421/1183
Pass: 434/1373


Runtime: 0.88 minutes


### Background

In [5]:
# Collect every skimmed background sample config. glob returns its matches in
# arbitrary order, so sort them to get a reproducible processing order.
bkg_configs = sorted(glob.glob("../../../configs/sample_configs/skimmed_bkg*.json"))

print(bkg_configs)

['../../../configs/sample_configs/skimmed_bkg_2018_DY.json', '../../../configs/sample_configs/skimmed_bkg_2018_Diboson.json', '../../../configs/sample_configs/skimmed_bkg_2018_QCD_TuneCP5_PSWeights.json', '../../../configs/sample_configs/skimmed_bkg_2018_TTJetsDiLept.json', '../../../configs/sample_configs/skimmed_bkg_2018_Top.json', '../../../configs/sample_configs/skimmed_bkg_2018_Triboson.json', '../../../configs/sample_configs/skimmed_bkg_2018_WJets.json', '../../../configs/sample_configs/skimmed_bkg_2018_ZJets.json']


In [6]:
for bkg in bkg_configs:
    # Derive the process label from the config file name,
    # e.g. ".../skimmed_bkg_2018_DY.json" -> "bkg_2018_DY".
    process = os.path.splitext(os.path.basename(bkg))[0].split('skimmed_')[-1]

    # Test the label rather than the full path, so a directory name containing
    # the same string cannot trigger the skip by accident.
    if 'TTJetsDiLept' in process:
        # Ntuples for this sample are currently not available; say so
        # explicitly instead of leaving a bare process name in the output.
        print(f"{process}: skipped (ntuples currently not available)")
        continue

    print(process)

    # NOTE(review): the signal cell passes max_samples=-1 explicitly, while
    # here the Analyzer default is used — confirm the default also means
    # "all samples".
    analyzer = Analyzer(bkg, histos_config, cuts_config)

    # Time only the processing step.
    t1 = time.time()
    out = analyzer.process(execr='futures')
    t2 = time.time()

    print("Runtime: {:.2f} minutes".format((t2-t1)/60))
    # outdir already ends with a separator; os.path.join avoids the doubled '/'.
    util.save(out, os.path.join(outdir, f"{process}_SR_BDTv1_ctau-1_5to50_skimmed.coffea"))
    # Drop the references before moving on to the next sample.
    del out, analyzer

bkg_2018_DY


Output()

Output()

Pass: 1/3
Pass: 0/1
Pass: 0/2
Pass: 0/1
Pass: 0/2
Pass: 0/1
Pass: 0/3
Pass: 0/1
Pass: 0/3
Pass: 0/3


Runtime: 0.92 minutes
bkg_2018_Diboson


Output()

Output()

Pass: 0/325
Pass: 0/213
Pass: 0/184
Pass: 0/215
Pass: 0/238
Pass: 2/238
Pass: 0/70
Pass: 0/245


Runtime: 0.78 minutes
bkg_2018_QCD_TuneCP5_PSWeights


Output()

Output()

Pass: 0/1
Pass: 0/3
Pass: 0/3
Pass: 0/3
Pass: 0/5
Pass: 0/2
Pass: 0/3
Pass: 0/7
Pass: 0/6
Pass: 0/2
Pass: 0/4
Pass: 0/5
Pass: 0/5
Pass: 0/4
Pass: 0/5
Pass: 0/2
Pass: 0/2
Pass: 0/6
Pass: 0/1
Pass: 0/1
Pass: 0/2
Pass: 0/1
Pass: 0/5
Pass: 0/6
Pass: 0/1
Pass: 0/1
Pass: 0/1
Pass: 0/1
Pass: 0/1
Pass: 0/1
Pass: 0/1
Pass: 0/1
Pass: 0/18
Pass: 0/4
Pass: 0/19
Pass: 0/7
Pass: 0/17
Pass: 0/3
Pass: 0/10
Pass: 0/13
Pass: 0/2
Pass: 0/3
Pass: 0/2
Pass: 0/6
Pass: 0/6
Pass: 0/6Pass: 0/19
Pass: 0/1
Pass: 0/1
Pass: 0/14
Pass: 0/22
Pass: 0/29
Pass: 0/10


Runtime: 3.44 minutes
bkg_2018_TTJetsDiLept
bkg_2018_Top


Output()

Output()

Pass: 0/30
Pass: 0/63
Pass: 1/63
Pass: 0/49
Pass: 0/75
Pass: 0/18
Pass: 0/68
Pass: 0/15
Pass: 0/17
Pass: 0/12
Pass: 0/17
Pass: 0/79
Pass: 1/67
Pass: 0/94
Pass: 0/64
Pass: 0/57
Pass: 0/18
Pass: 0/17
Pass: 0/51
Pass: 0/73
Pass: 0/90
Pass: 0/73
Pass: 0/76
Pass: 0/62
Pass: 0/78
Pass: 0/37
Pass: 0/68
Pass: 0/22
Pass: 0/58
Pass: 0/30
Pass: 0/37
Pass: 0/46
Pass: 0/48
Pass: 0/151
Pass: 0/148
Pass: 0/130
Pass: 0/159
Pass: 0/17
Pass: 0/35
Pass: 0/21
Pass: 0/13
Pass: 0/80
Pass: 0/15
Pass: 0/107
Pass: 0/134
Pass: 1/143
Pass: 1/137
Pass: 0/37
Pass: 1/16
Pass: 0/10
Pass: 0/22
Pass: 0/22
Pass: 0/69
Pass: 0/119
Pass: 0/163
Pass: 0/101
Pass: 0/13
Pass: 0/53
Pass: 0/17
Pass: 1/116
Pass: 1/25
Pass: 0/23
Pass: 0/22
Pass: 0/22
Pass: 0/35
Pass: 0/107
Pass: 0/93
Pass: 0/100
Pass: 0/69
Pass: 0/20
Pass: 0/112
Pass: 0/23
Pass: 0/17
Pass: 0/21
Pass: 0/27
Pass: 1/70
Pass: 1/108
Pass: 0/86
Pass: 1/94
Pass: 0/57
Pass: 0/29
Pass: 0/29Pass: 0/16

Pass: 0/29
Pass: 0/24
Pass: 0/19
Pass: 0/21
Pass: 1/79
Pass: 0/64
Pass:

Runtime: 6.46 minutes
bkg_2018_Triboson


Output()

Output()

Pass: 0/58
Pass: 0/79
Pass: 0/30


Runtime: 0.61 minutes
bkg_2018_WJets


Output()

Output()

Pass: 0/154
Pass: 0/738
Pass: 0/1856
Pass: 1/1618
Pass: 0/537
Pass: 0/593
Pass: 0/593
Pass: 4/518
Pass: 0/552
Pass: 0/555
Pass: 4/571
Pass: 0/202
Pass: 1/321
Pass: 1/333
Pass: 5/1187
Pass: 5/2536
Pass: 8/2558
Pass: 3/824
Pass: 4/773
Pass: 4/761
Pass: 3/746
Pass: 1/813
Pass: 2/790
Pass: 8/3085
Pass: 17/5006
Pass: 24/6236
Pass: 5/1959
Pass: 1/785
Pass: 24/6174
Pass: 1/809
Pass: 1/813
Pass: 3/767
Pass: 8/3283
Pass: 1/914
Pass: 0/697
Pass: 19/6278
Pass: 19/6065
Pass: 1/805
Pass: 2/1023
Pass: 3/1958
Pass: 0/955
Pass: 1/964


Runtime: 4.54 minutes
bkg_2018_ZJets


Output()

Output()

Pass: 0/186
Pass: 6/1124
Pass: 3/1045
Pass: 2/810
Pass: 2/424
Pass: 2/795
Pass: 1/543
Pass: 0/6850
Pass: 13/6921
Pass: 23/11573
Pass: 21/11146
Pass: 0/48
Pass: 17/8968
Pass: 15/5308
Pass: 8/5466
Pass: 0/1746
Pass: 5/5360
Pass: 3/5401
Pass: 0/2500
Pass: 5/8080
Pass: 3/7189
Pass: 5/6944


Runtime: 3.36 minutes
