# Data/MC yields

## 8 TeV

In [1]:
#imports
%cd '/home/naodell/work/CMS/amumu'
%matplotlib notebook

import os, sys
from timeit import default_timer as timer

import numpy as np
import pandas as pd
import matplotlib.pyplot as plt

import nllfitter.plot_tools as pt

from IPython.display import display

/home/naodell/work/CMS/amumu


In [2]:
# Configuration and data retrieval for the 2012 inputs.
# Dataset names handed to the DataManager, grouped by name prefix.
datasets = [
    # muon_2012* entries
    'muon_2012A', 'muon_2012B', 'muon_2012C', 'muon_2012D',
    # ttbar_* entries
    'ttbar_lep', 'ttbar_semilep',
    # z*jets entries, two mass-range suffixes each
    'zjets_m-50', 'zjets_m-10to50',
    'z1jets_m-50', 'z1jets_m-10to50',
    'z2jets_m-50', 'z2jets_m-10to50',
    'z3jets_m-50', 'z3jets_m-10to50',
    'z4jets_m-50', 'z4jets_m-10to50',
    # t_* / tbar_* entries
    't_s', 't_t', 't_tw',
    'tbar_s', 'tbar_t', 'tbar_tw',
    # ww / wz / zz entries
    'ww', 'wz_2l2q', 'wz_3lnu', 'zz_2l2q', 'zz_2l2nu',
    # the three entries that the yield cells list under `exclude`
    'bprime_xb', 'bprime_xbxb_semilep', 'fcnc',
]

# Baseline cut expression: both leptons with pt > 25 and |eta| < 2.1, unequal
# lepton charge values (lepton1_q != lepton2_q), and 12 < dilepton_mass < 70.
# The backslash continuations keep this a single string literal, so the
# indentation of the continued lines is part of the string value.
preselection = '(lepton1_pt > 25 and abs(lepton1_eta) < 2.1 \
                and lepton2_pt > 25 and abs(lepton2_eta) < 2.1 \
                and lepton1_q != lepton2_q and 12 < dilepton_mass < 70)'

# NOTE(review): `scale` is presumably the normalisation (luminosity) applied to
# simulation -- confirm meaning and units against pt.DataManager.
data_manager = pt.DataManager(
    input_dir='data/flatuples/mumu_2012',
    dataset_names=datasets,
    selection='mumu',
    period=2012,
    scale=19.8e3,
    cuts=preselection
)

Loading dataframes: 100%|███████████████| 30.0/30.0 [00:15<00:00, 8.59it/s]


### 1b1f 

In [7]:
# Cut flow for the 1b1f category: each entry of `conditions` becomes one
# column of the yield table shown below the cell.
dataset_names = [
    't', 'diboson', 'ttbar', 'zjets',
    'bprime_xb', 'fcnc', 'bprime_xbxb_semilep',
    'data',
]
conditions = ['preselection', 'n_bjets == 1', 'n_fwdjets > 0', 'n_jets == 0']

# The three names passed as `exclude` still get their own rows in the output.
# NOTE(review): presumably `exclude` keeps them out of the summed "background"
# row -- confirm against DataManager.print_yields.
table = data_manager.print_yields(
    dataset_names,
    exclude=['bprime_xb', 'fcnc', 'bprime_xbxb_semilep'],
    conditions=conditions
)
table

Unnamed: 0,preselection,n_bjets == 1,n_fwdjets > 0,n_jets == 0
t,$593.8 \pm 17.2$,$237.3 \pm 10.9$,$33.6 \pm 4.0$,$18.4 \pm 3.0$
Diboson,$1530.5 \pm 11.6$,$30.0 \pm 1.2$,$4.1 \pm 0.4$,$1.7 \pm 0.3$
$\sf t\bar{t}$,$6568.7 \pm 18.1$,$3029.6 \pm 12.2$,$575.6 \pm 5.3$,$138.9 \pm 2.6$
Z+jets,$162338.4 \pm 546.6$,$1205.5 \pm 25.4$,$123.6 \pm 8.1$,$73.7 \pm 6.4$
$\sf B’\rightarrow Xb$,$202.2 \pm 2.7$,$76.5 \pm 1.7$,$26.1 \pm 1.0$,$19.2 \pm 0.8$
$\sf t\rightarrow hc$,$185.8 \pm 2.6$,$59.6 \pm 1.5$,$7.4 \pm 0.5$,$2.8 \pm 0.3$
$\sf B’B’\rightarrow XbXb$,$240.0 \pm 2.0$,$108.1 \pm 1.4$,$28.3 \pm 0.7$,$1.1 \pm 0.1$
Data,$180310$,$4613$,$718$,$0$
background,$171031.4 \pm 547.3$,$4502.5 \pm 30.2$,$736.9 \pm 10.5$,$232.7 \pm 7.5$


### 1b1c 

In [None]:
# Cut flow for the 1b1c category. Reuses `dataset_names` as defined in the
# 1b1f cell above, so that cell has to be run first.
conditions = [
    'preselection',
    'n_bjets >= 1',
    'n_jets + n_bjets == 2',
    'n_fwdjets == 0',
    'met_mag < 40',
    'four_body_delta_phi > 2.5',
]
table = data_manager.print_yields(
    dataset_names,
    exclude=['bprime_xb', 'fcnc', 'bprime_xbxb_semilep'],
    conditions=conditions
)
table

### combined

In [10]:
# Yields for the union of the two categories: the second condition is the
# logical OR of the 1b1f requirements (n_bjets == 1, n_jets == 0,
# n_fwdjets > 0) and the 1b1c requirements (n_bjets >= 1,
# n_jets + n_bjets == 2, n_fwdjets == 0, met_mag < 40,
# four_body_delta_phi > 2.5).
# The continued lines of the literal are left exactly as they were because
# their leading whitespace is part of the string value.
conditions = [
    'preselection',
    '((n_bjets == 1 and n_jets == 0 and n_fwdjets > 0) \
                  or (n_bjets >= 1 and n_jets + n_bjets == 2 \
                  and n_fwdjets == 0 and met_mag < 40 and \
                  four_body_delta_phi > 2.5))'
]
table = data_manager.print_yields(
    dataset_names,
    exclude=['bprime_xb', 'fcnc', 'bprime_xbxb_semilep'],
    conditions=conditions,
    mc_scale=True
)

# Replace the column labels (otherwise the raw condition strings) with short names.
table.columns = ['preselection', '1b1f+1b1c']
table

Unnamed: 0,preselection,1b1f+1b1c
t,$593.8 \pm 17.2$,$32.9 \pm 4.0$
Diboson,$1530.5 \pm 11.6$,$8.1 \pm 0.5$
$\sf t\bar{t}$,$6568.7 \pm 18.1$,$437.4 \pm 4.6$
Z+jets,$162338.4 \pm 546.6$,$315.2 \pm 12.0$
$\sf B’\rightarrow Xb$,$202.2 \pm 2.7$,$41.5 \pm 1.2$
$\sf t\rightarrow hc$,$185.8 \pm 2.6$,$27.2 \pm 1.0$
$\sf B’B’\rightarrow XbXb$,$240.0 \pm 2.0$,$12.7 \pm 0.5$
Data,$180310$,$623$
background,$171031.4 \pm 547.3$,$793.7 \pm 13.5$


## 13 TeV

In [None]:
# 13 TeV (2016) configuration and data retrieval.
# NOTE: this cell rebinds `datasets`, `data_manager` and `dataset_names`,
# replacing the 2012 objects created earlier in the notebook.
datasets = [
    'muon_2016B', 'muon_2016C', 'muon_2016D',
    'ttjets',
    't_t', 't_tw',
    'tbar_t', 'tbar_tw',
    'zjets_m-50', 'zjets_m-10to50',
]

# Blind the signal region: keep only dilepton_mass below 24 or above 34.
signal_mask = '(dilepton_mass < 24 or dilepton_mass > 34)'

# `preselection` is not defined in this cell; it is the string built in the
# 2012 configuration cell, which therefore has to be run first.
data_manager = pt.DataManager(
    input_dir='data/flatuples/mumu_2016',
    dataset_names=datasets,
    selection='mumu',
    period=2016,
    scale=12e3,
    cuts=preselection + ' and ' + signal_mask
)

# Names requested from print_yields in the 13 TeV cut-flow cells below.
dataset_names = ['t', 'ttbar', 'zjets', 'data']

### 1b1f

In [None]:
# Cut flow for the 13 TeV 1b1f category.
conditions = ['preselection', 'n_bjets == 1', 'n_fwdjets > 0', 'n_jets == 0']

# Pass `conditions` by keyword, as the 8 TeV cells do. Those cells call
# print_yields with `exclude=` ahead of `conditions=`, so a positional second
# argument is not guaranteed to land on the `conditions` parameter.
table_string = data_manager.print_yields(dataset_names, conditions=conditions)

# TODO: the result currently has to be printed and pasted by hand into the
# following markdown cell; need to find a way around this.
#print table_string

| | t | $\sf t\bar{t}$ | Z+jets | Data | background | 
|-|-|-|-|-|-|
| preselection  | 1050.8 $\pm$ 20.7 | 10957.2 $\pm$ 52.6 | 145884.8 $\pm$ 739.6 | 176538  | 157892.7 $\pm$ 741.8 | 
| n_bjets == 1  | 342.8 $\pm$ 11.9 | 4605.7 $\pm$ 34.1 | 1830.6 $\pm$ 86.0 | 5985  | 6779.2 $\pm$ 93.3 | 
| n_fwdjets > 0  | 67.9 $\pm$ 5.3 | 1598.5 $\pm$ 20.1 | 339.1 $\pm$ 37.2 | 1285  | 2005.5 $\pm$ 42.6 | 
| n_jets == 0  | 28.2 $\pm$ 3.5 | 284.7 $\pm$ 8.5 | 173.3 $\pm$ 25.8 | 348  | 486.2 $\pm$ 27.4 | 

### 1b1c

In [None]:
# Cut flow for the 13 TeV 1b1c category.
conditions = [
    'preselection',
    'n_bjets == 1',
    'n_jets == 1',
    'n_fwdjets == 0',
    'met_mag < 40',
    'four_body_delta_phi > 2.5',
]

# Pass `conditions` by keyword, as the 8 TeV cells do. Those cells call
# print_yields with `exclude=` ahead of `conditions=`, so a positional second
# argument is not guaranteed to land on the `conditions` parameter.
table_string = data_manager.print_yields(dataset_names, conditions=conditions)

# TODO: the result currently has to be printed and pasted by hand into the
# following markdown cell; need to find a way around this.
#print table_string

| | t | $\sf t\bar{t}$ | Z+jets | Data | background | 
|-|-|-|-|-|-|
| preselection  | 1050.8 $\pm$ 20.7 | 10957.2 $\pm$ 52.6 | 145884.8 $\pm$ 739.6 | 176538  | 157892.7 $\pm$ 741.8 | 
| n_bjets == 1  | 342.8 $\pm$ 11.9 | 4605.7 $\pm$ 34.1 | 1830.6 $\pm$ 86.0 | 5985  | 6779.2 $\pm$ 93.3 | 
| n_jets == 1  | 108.4 $\pm$ 6.7 | 1700.7 $\pm$ 20.7 | 619.6 $\pm$ 50.2 | 2441  | 2428.7 $\pm$ 54.7 | 
| n_fwdjets == 0  | 85.2 $\pm$ 5.9 | 1079.9 $\pm$ 16.5 | 509.7 $\pm$ 45.2 | 1937  | 1674.7 $\pm$ 48.5 | 
| met_mag < 40  | 22.5 $\pm$ 3.0 | 268.8 $\pm$ 8.2 | 408.4 $\pm$ 40.7 | 650  | 699.7 $\pm$ 41.6 | 
| four_body_delta_phi > 2.5  | 19.9 $\pm$ 2.9 | 208.0 $\pm$ 7.2 | 359.0 $\pm$ 38.6 | 524  | 587.0 $\pm$ 39.4 | 

