In [None]:
import logging
from pathlib import Path

import pandas as pd
import numpy as np

import matplotlib.pyplot as plt
import mplhep as hep
from matplotlib import colors

from boostedhh import utils, hh_vars
from bbtautau.bbtautau_vars import HLT_dict, HLT_list

# Grab the "boostedhh.utils" logger and lower its threshold to DEBUG so that
# DEBUG-level records emitted under that name are no longer filtered out.
logger = logging.getLogger(name="boostedhh.utils")
logger.setLevel(level=logging.DEBUG)

In [2]:
# Load IPython's autoreload extension and switch it to mode 2, so that imported
# modules are re-imported automatically before each cell executes and edits made
# to them on disk are picked up without restarting the kernel.
%load_ext autoreload
%autoreload 2

In [3]:
# Data-taking year and skimmer output tags used when building the samples.
year = "2022"
data_samples_tag = "24Nov18Data_v12_private_signal"
signal_samples_tag = "24Nov9UpdateTriggers_v12_private_signal"

# Base directory, three levels above the working directory
# (presumably the repository root — TODO confirm).
MAIN_DIR = Path("../../../")

# Output directory for the plots of this study; created, together with any
# missing parents, if it does not exist yet.
plot_dir = MAIN_DIR / "plots" / "SensitivityStudy" / "24Nov20"
plot_dir.mkdir(exist_ok=True, parents=True)

In [14]:
# Directory holding the skimmer outputs; each samples tag is a sub-directory of it.
base_dir = Path("/ceph/cms/store/user/rkansal/bbtautau/skimmer/")

# Samples to load, keyed by a short name. The two data entries read from the data
# tag and differ only in their selector and label; the signal entry reads from the
# signal tag and takes its selector from hh_vars.bbtt_sigs.
samples = dict(
    jetmet=utils.Sample(
        label="JetMET",
        selector="JetHT|JetMET",
        path=base_dir / data_samples_tag,
        year=year,
        isData=True,
    ),
    tau=utils.Sample(
        label="Tau",
        selector="Tau_Run",
        path=base_dir / data_samples_tag,
        year=year,
        isData=True,
    ),
    bbtt=utils.Sample(
        label=r"HHbb$\tau\tau$",
        selector=hh_vars.bbtt_sigs["bbtt"],
        path=base_dir / signal_samples_tag,
        year=year,
        isData=False,
    ),
)

In [None]:
# Threshold applied to the 'ak8FatJetPt' columns with index '0' and '1'.
pt_cut = 250
# msd_cut = 40

# Selection handed to utils.load_sample: a list of groups of (column, op, value)
# conditions. NOTE(review): this looks like the parquet-style DNF filter layout
# (AND inside a group, OR between groups) — confirm against utils.load_sample.
# Additional conditions that are currently disabled:
#   ("('ak8FatJetMsd', '0')", ">=", msd_cut)
#   ("('ak8FatJetMsd', '1')", ">=", msd_cut)
#   ("('ak8FatJetPNetXbb', '0')", ">=", 0.8)
filters = [[(f"('ak8FatJetPt', '{jet_idx}')", ">=", pt_cut) for jet_idx in range(2)]]

# Cutflow table with one row per sample key; columns get added by add_to_cutflow.
cutflow = pd.DataFrame(index=list(samples))

# Loaded events for every sample, keyed the same way as `samples`.
events_dict = {
    name: utils.load_sample(sample_cfg, filters) for name, sample_cfg in samples.items()
}

# Record the "Preselection" entry using the "finalWeight" column, then show the table.
utils.add_to_cutflow(events_dict, "Preselection", "finalWeight", cutflow)
print("\n", cutflow)

INFO:boostedhh.utils:Loading ['JetHT_Run2022C', 'JetMET_Run2022D', 'JetMET_Run2022C']
DEBUG:boostedhh.utils:Loading JetHT_Run2022C
INFO:boostedhh.utils:Loaded JetHT_Run2022C                                    : 3427511 entries
DEBUG:boostedhh.utils:Loading JetMET_Run2022D
INFO:boostedhh.utils:Loaded JetMET_Run2022D                                   : 17356652 entries
DEBUG:boostedhh.utils:Loading JetMET_Run2022C
INFO:boostedhh.utils:Loaded JetMET_Run2022C                                   : 29279007 entries
INFO:boostedhh.utils:Loading ['Tau_Run2022C', 'Tau_Run2022D']
DEBUG:boostedhh.utils:Loading Tau_Run2022C
INFO:boostedhh.utils:Loaded Tau_Run2022C                                      : 2148530 entries
DEBUG:boostedhh.utils:Loading Tau_Run2022D
INFO:boostedhh.utils:Loaded Tau_Run2022D                                      : 1312497 entries
INFO:boostedhh.utils:Loading ['GluGlutoHHto2B2Tau_kl-1p00_kt-1p00_c2-0p00_LHEweights_TuneCP5_13p6TeV_powheg-pythia8']
DEBUG:boostedhh.utils:Loading


         Preselection
jetmet  5.006317e+07
tau     3.461027e+06
bbtt    1.081920e+04
