In [None]:
%load_ext autoreload
%autoreload 2

import uproot
import awkward as ak

import matplotlib.pylab as plt
import numpy as np

import time

from hist import Hist

import babar_analysis_tools as bat

from analysis_variables import *

import myPIDselector

import pandas as pd
import seaborn as sns

import ROOT
import pdf_definitions as pdfs

In [None]:
# Default-constructed (empty) 1D float histogram; the following cell draws it on a canvas.
h = ROOT.TH1F()

In [None]:

# Draw the empty histogram `h` on a fresh default canvas and repaint it.
c1 = ROOT.TCanvas()
c1.cd()  # select c1 before drawing so h.Draw() targets this canvas
h.Draw()

c1.Update()

#c1.Show()

# rf202

In [None]:
# Declare observable x
x = ROOT.RooRealVar("x", "x", 0, 10)

# Create two Gaussian PDFs sig1(x, mean, sigma1) and sig2(x, mean, sigma2).
# Both share the same mean and differ only in their width; the three shape
# parameters are created with a value only (no range).
mean = ROOT.RooRealVar("mean", "mean of gaussians", 5)
sigma1 = ROOT.RooRealVar("sigma1", "width of gaussians", 0.5)
sigma2 = ROOT.RooRealVar("sigma2", "width of gaussians", 1)

sig1 = ROOT.RooGaussian("sig1", "Signal component 1", x, mean, sigma1)
sig2 = ROOT.RooGaussian("sig2", "Signal component 2", x, mean, sigma2)

# Build Chebychev polynomial p.d.f.
# Both coefficients are limited to [0, 1], so their starting values have to
# lie inside that interval. a1 used to start at -0.2, i.e. outside its own
# declared range; it now starts at 0.2.
a0 = ROOT.RooRealVar("a0", "a0", 0.5, 0., 1.)
a1 = ROOT.RooRealVar("a1", "a1", 0.2, 0., 1.)
bkg = ROOT.RooChebychev("bkg", "Background", x, ROOT.RooArgList(a0, a1))

# Sum the signal components into a composite signal p.d.f.
# sig = sig1frac * sig1 + (1 - sig1frac) * sig2
sig1frac = ROOT.RooRealVar(
    "sig1frac", "fraction of component 1 in signal", 0.8, 0., 1.)
sig = ROOT.RooAddPdf(
    "sig", "Signal", ROOT.RooArgList(sig1, sig2), ROOT.RooArgList(sig1frac))



In [None]:
# Method 1: build the extended model directly as nbkg*bkg + nsig*sig.
# One yield per component makes the RooAddPdf extended.
nsig = ROOT.RooRealVar("nsig", "number of signal events", 500, 0., 10000)
nbkg = ROOT.RooRealVar("nbkg", "number of background events", 500, 0, 10000)

_model_components = ROOT.RooArgList(bkg, sig)
_model_yields = ROOT.RooArgList(nbkg, nsig)
model = ROOT.RooAddPdf("model", "(g1+g2)+a", _model_components, _model_yields)

# Toy study: generate a sample in x from the model (no event count is passed
# to generate()), then fit the same model back to it.
data = model.generate(ROOT.RooArgSet(x))
model.fitTo(data)

# Frame with the data and the fitted model. Every curve below is normalised
# with RelativeExpected, i.e. to the expected yield of the extended model.
xframe = x.frame(ROOT.RooFit.Title("extended ML fit example"))
data.plotOn(xframe)
model.plotOn(
    xframe,
    ROOT.RooFit.Normalization(1.0, ROOT.RooAbsReal.RelativeExpected),
)

# Background component only, dashed.
ras_bkg = ROOT.RooArgSet(bkg)
model.plotOn(
    xframe,
    ROOT.RooFit.Components(ras_bkg),
    ROOT.RooFit.LineStyle(ROOT.kDashed),
    ROOT.RooFit.Normalization(1.0, ROOT.RooAbsReal.RelativeExpected),
)

# Background plus the sig2 Gaussian, dotted.
ras_bkg_sig2 = ROOT.RooArgSet(bkg, sig2)
model.plotOn(
    xframe,
    ROOT.RooFit.Components(ras_bkg_sig2),
    ROOT.RooFit.LineStyle(ROOT.kDotted),
    ROOT.RooFit.Normalization(1.0, ROOT.RooAbsReal.RelativeExpected),
)


In [None]:
# Print structure of composite p.d.f.
model.Print("t")


# Method 2 - Construct extended components first
# ---------------------------------------------------------------------

# Associate nsig/nbkg as the expected number of events with sig/bkg
esig = ROOT.RooExtendPdf("esig", "extended signal p.d.f", sig, nsig)
ebkg = ROOT.RooExtendPdf("ebkg", "extended background p.d.f", bkg, nbkg)

# Sum extended components without coefs
# -------------------------------------------------------------------------

# Construct sum of two extended p.d.f. (no coefficients required)
# NOTE(review): model2 is only constructed in this cell; it is not fitted or plotted here.
model2 = ROOT.RooAddPdf("model2", "(g1+g2)+a", ROOT.RooArgList(ebkg, esig))

# Draw the frame on the canvas.
# xframe is the frame that was filled with `data` and `model` (Method 1), not with model2.
c = ROOT.TCanvas("rf202_extendedmlfit", "rf202_extendedmlfit", 600, 600)
ROOT.gPad.SetLeftMargin(0.15)
xframe.GetYaxis().SetTitleOffset(1.4)
xframe.Draw()

c.Update()

# Writes the figure into the current working directory.
c.SaveAs("rf202_extendedmlfit.png")


# From ChatGPT

In [None]:
# Rebind `c` to a new canvas named "testingfits" (default size; the trailing comment keeps an older argument list).
c = ROOT.TCanvas("testingfits", "testingfits")#"fit", "fit", 600, 600)

In [None]:
#df = pd.read_parquet('mes_deltae_background_AFTER_FINAL_CUTS.parquet')
#df

In [None]:
# Fit window: x spans [mes_lo, mes_hi], y spans [deltae_lo, deltae_hi].
mes_lo, mes_hi = 5.2, 5.3
deltae_lo, deltae_hi = -0.2, 0.2

# From here on x and y are the observables returned by pdfs.build_xy;
# they replace the x of the rf202 example above.
x, y = pdfs.build_xy([[mes_lo, mes_hi], [deltae_lo, deltae_hi]])

# Named ranges registered on both observables:
#   region -> ((x low, x high), (y low, y high))
_named_regions = {
    "FULL":   ((mes_lo, mes_hi), (deltae_lo, deltae_hi)),
    "SIGNAL": ((5.25, mes_hi), (-0.10, 0.1)),
    # Sideband 1: upper y band over the full x window
    "SB1":    ((mes_lo, mes_hi), (0.075, deltae_hi)),
    # Sideband 2: lower y band over the full x window
    "SB2":    ((mes_lo, mes_hi), (deltae_lo, -0.075)),
    # Sideband 3: central y band, x below 5.27
    "SB3":    ((mes_lo, 5.27), (-0.075, 0.075)),
}
for _region, (_x_window, _y_window) in _named_regions.items():
    x.setRange(_region, *_x_window)
    y.setRange(_region, *_y_window)



In [None]:
# Hand-built 1D model in x (the pdfs.tot_PDF route is used further down).
# Each helper returns (list of parameters, pdf).
pars_bkg, bkg_pdf = pdfs.argus_in_x(x)
pars_sig, sig_pdf = pdfs.crystal_barrel_x(x)

# The signal yield is not a free parameter of its own; it is the product
# conv_factor_fit * branching_fraction.
conv_factor_fit = ROOT.RooRealVar(
    "conv_factor_fit", "Conversion factor (fit)", 10)
branching_fraction = ROOT.RooRealVar(
    "branching_fraction", "Branching fraction", 1)

nbkg = ROOT.RooRealVar("nbkg", "# bkg events,", 10)
nsig = ROOT.RooFormulaVar(
    "nsig",
    "conv_factor_fit*branching_fraction",
    ROOT.RooArgList(conv_factor_fit, branching_fraction),
)

# Extended sum: nsig * sig_pdf + nbkg * bkg_pdf.
total = ROOT.RooAddPdf(
    "total",
    "sig_pdf + bkg_pdf",
    ROOT.RooArgList(sig_pdf, bkg_pdf),
    ROOT.RooArgList(nsig, nbkg),
)

# Flat list of everything that parametrises the model: yields first, then
# the signal-shape and background-shape parameters.
pars = [nbkg, nsig, *pars_sig, *pars_bkg]


In [None]:
# Toy truth used for generation: nsig = 4 * branching_fraction, nbkg = 9.
conv_factor_fit.setVal(4)
nbkg.setVal(9)

# Generate a toy sample in x from the model, then release the two yield
# parameters so the fit can move them.
data = total.generate(ROOT.RooArgSet(x))
for _floating in (conv_factor_fit, nbkg):
    _floating.setConstant(False)

# Fit model to data, ML term automatically included.
# The one-call alternative that is currently disabled:
#   result = total.fitTo(data, ROOT.RooFit.Extended(ROOT.kTRUE),
#                        ROOT.RooFit.Save(ROOT.kTRUE),
#                        ROOT.RooFit.Strategy(2),
#                        ROOT.RooFit.PrintLevel(-1))

# Explicit extended NLL wrapped in a formula. The wrapper is where an extra
# constraint term (e.g. "nll + log_gc") would be added; here it is just the NLL.
nll = ROOT.RooNLLVar(
    "nll", "nll", total, data, ROOT.RooFit.Extended(ROOT.kTRUE))
fit_func = ROOT.RooFormulaVar("fit_func", "nll", ROOT.RooArgList(nll))

# Minimise with MIGRAD, then compute the error matrix with HESSE.
m = ROOT.RooMinimizer(fit_func)
m.setVerbose(ROOT.kFALSE)
m.migrad()
m.hesse()

result = m.save()
result.Print("v")



In [None]:
# Verbose dump of the saved fit result `result` (same call as at the end of the fit cell).
result.Print('v')

In [None]:
# Drop the current Python binding of `c` before creating a new canvas under the
# same ROOT name. NOTE(review): this raises NameError if `c` has not been defined yet.
del c
c = ROOT.TCanvas("testingfits", "testingfits", 600, 300)#"fit", "fit", 600, 600)
# Plot data and PDF overlaid, expected number of events for p.d.f projection normalization
# rather than observed number of events (==data.numEntries())
xframe = x.frame(ROOT.RooFit.Title("extended ML fit example"), ROOT.RooFit.Bins(25))
data.plotOn(xframe)
total.plotOn(xframe, ROOT.RooFit.Normalization(
    1.0, ROOT.RooAbsReal.RelativeExpected))

# Overlay the background component of the model with a dashed line
ras_bkg = ROOT.RooArgSet(bkg_pdf)
total.plotOn(
    xframe, ROOT.RooFit.Components(ras_bkg), ROOT.RooFit.LineStyle(
        ROOT.kDashed), ROOT.RooFit.Normalization(
            1.0, ROOT.RooAbsReal.RelativeExpected))

# Overlay the signal component of the model with a dotted line
ras_sig = ROOT.RooArgSet(sig_pdf)
total.plotOn(
    xframe, ROOT.RooFit.Components(ras_sig), ROOT.RooFit.LineStyle(
        ROOT.kDotted), ROOT.RooFit.Normalization(
            1.0, ROOT.RooAbsReal.RelativeExpected))

# Draw the frame on the canvas

ROOT.gPad.SetLeftMargin(0.15)
xframe.GetYaxis().SetTitleOffset(1.4)
xframe.Draw()



#c.Update()
#ROOT.gPad
# Show the canvas as the cell output.
c.Draw()
#ROOT.gPad.Draw()
#ROOT.gPad.Update()
#c.Draw()

#c.SaveAs("testfit.png")


In [None]:
def read_file_return_dataset(df, x, y, region_definitions=None, dim=2, max_events=1e9, index=0):
    """Fill a RooDataSet in (x, y) from two columns of a DataFrame.

    For every row, ``df['BpostFitMes']`` is written into ``x`` and
    ``df['BpostFitDeltaE']`` into ``y``. The row is added to the dataset only
    if both values, as read back from the variables, lie strictly inside the
    selection window.

    Parameters
    ----------
    df : pandas.DataFrame
        Must provide the columns ``BpostFitMes`` and ``BpostFitDeltaE``.
    x, y : RooRealVar-like
        Observables of the dataset. They are modified in place (``setVal``).
    region_definitions : mapping, optional
        ``region_definitions['fitting MES']`` and
        ``region_definitions['fitting DeltaE']`` give the ``(low, high)``
        window for x and y. If omitted, the windows default to the ranges
        declared on ``x`` and ``y`` themselves (``getMin()`` / ``getMax()``);
        previously the ``None`` default raised a ``TypeError``.
    dim : int
        Unused; kept so existing callers keep working.
    max_events : number
        Stop once this many rows have been accepted.
    index : int
        Suffix of the dataset name, ``dataset_<index>``.

    Returns
    -------
    The filled ``ROOT.RooDataSet``.
    """
    name = f"dataset_{index}"
    ds = ROOT.RooDataSet(name, name, ROOT.RooArgSet(x, y))

    if region_definitions is None:
        # No explicit window given: accept whatever lies inside the ranges
        # the observables were declared with.
        x_lo, x_hi = x.getMin(), x.getMax()
        y_lo, y_hi = y.getMin(), y.getMax()
    else:
        # mES ranges
        x_lo = region_definitions['fitting MES'][0]
        x_hi = region_definitions['fitting MES'][1]
        # DeltaE ranges
        y_lo = region_definitions['fitting DeltaE'][0]
        y_hi = region_definitions['fitting DeltaE'][1]

    print("Data ranges...")
    print(x_lo, x_hi)
    print(y_lo, y_hi)

    mes, deltae = df['BpostFitMes'].values, df['BpostFitDeltaE'].values

    nevents = 0
    for m, de in zip(mes, deltae):
        x.setVal(m)
        y.setVal(de)

        if nevents >= max_events:
            break

        # Compare what the variables actually hold (not the raw column
        # values). Events outside the window are skipped; the original
        # note says the fit won't converge without this check.
        if x_lo < x.getVal() < x_hi and y_lo < y.getVal() < y_hi:
            ds.add(ROOT.RooArgSet(x, y))
            nevents += 1

    return ds


In [None]:
# Earlier input files, kept for reference:
#df_sp = pd.read_parquet("DATAFRAME_SP.parquet")
#df_col = pd.read_parquet("DATAFRAME_COL.parquet")

# Inputs are read relative to the current working directory.
# NOTE(review): only df_sp is used by the selection cells below; df_col is loaded but not referenced there.
df_sp = pd.read_parquet("DATAFRAME_SP_BNC_ALL.parquet")
df_col = pd.read_parquet("DATAFRAME_COL_BNC_ALL.parquet")

In [None]:
# Row selection: not used in either training sample, passes cut_2..cut_4,
# |DeltaE| < 0.05 and classifier output proba > 0.97.
_delta_e = df_sp['BpostFitDeltaE']
mask = (
    (df_sp['used_in_bkg_train'] == False)
    & (df_sp['used_in_sig_train'] == False)
    & (df_sp['cut_2'] == True)
    & (df_sp['cut_3'] == True)
    & (df_sp['cut_4'] == True)
    & (_delta_e < 0.05)
    & (_delta_e > -0.05)
    & (df_sp['proba'] > 0.97)
)

# Every selected row with spmode '998' ...
mask_sp = (df_sp['spmode'] == '998')
df_tmp1 = df_sp[mask & mask_sp]

# ... plus 4 randomly drawn selected rows with spmode '-999'.
# NOTE(review): the draw is unseeded, so each run picks different rows.
mask_sp = (df_sp['spmode'] == '-999')
df_tmp2 = df_sp[mask & mask_sp].sample(n=4)

df_tmp = pd.concat([df_tmp1, df_tmp2])

# region_definitions is not defined in this notebook itself; presumably it
# comes from the star import of analysis_variables - TODO confirm.
ds = read_file_return_dataset(df_tmp, x, y, region_definitions=region_definitions)

In [None]:
# Verbose summary of the (x, y) dataset built in the previous cell.
ds.Print("v")

In [None]:
# Reduce the (x, y) dataset with x only; ds_x is what the 1D fits below use.
ds_x = ds.reduce(x)

ds_x.Print("v")

In [None]:
# Displayed as the cell output; the same quantity is later used as the starting value of nbkg.
ds_x.sumEntries()

In [None]:
# Hand-built extended model in x, fitted to the selected events in ds_x.
# Each helper returns (list of parameters, pdf).
pars_bkg, bkg_pdf = pdfs.argus_in_x(x)
pars_sig, sig_pdf = pdfs.crystal_barrel_x(x)

# The signal yield is the product conv_factor_fit * branching_fraction, so the
# fit moves the conversion factor rather than a yield parameter.
conv_factor_fit = ROOT.RooRealVar("conv_factor_fit", "Conversion factor (fit)", 10)
branching_fraction = ROOT.RooRealVar("branching_fraction", "Branching fraction", 1)

nbkg = ROOT.RooRealVar("nbkg", "# bkg events,", 10)
nsig = ROOT.RooFormulaVar(
    "nsig", "conv_factor_fit*branching_fraction",
    ROOT.RooArgList(conv_factor_fit, branching_fraction))

total = ROOT.RooAddPdf(
    "total", "sig_pdf + bkg_pdf",
    ROOT.RooArgList(sig_pdf, bkg_pdf), ROOT.RooArgList(nsig, nbkg))

pars = [nbkg, nsig]
pars += pars_sig
pars += pars_bkg

# Starting point: essentially no signal, all events assigned to background.
conv_factor_fit.setVal(0.1)
nbkg.setVal(ds_x.sumEntries())
conv_factor_fit.setConstant(False)
nbkg.setConstant(False)

# Extended NLL wrapped in a formula (the place where a constraint term such as
# "nll + log_gc" would be added), minimised with MIGRAD followed by HESSE.
nll = ROOT.RooNLLVar("nll", "nll", total, ds_x, ROOT.RooFit.Extended(ROOT.kTRUE))
fit_func = ROOT.RooFormulaVar("fit_func", "nll", ROOT.RooArgList(nll))

m = ROOT.RooMinimizer(fit_func)
m.setVerbose(ROOT.kFALSE)
m.migrad()
m.hesse()
result = m.save()

result.Print("v")


xframe2 = x.frame(Title="Gaussian pdf with data")  # RooPlot

# The canvas gets its own ROOT name. Reusing "testingfits" here makes ROOT
# delete the canvas of that name that `c` still refers to. The naming follows
# the "testingfits4" canvas used for c4.
c2 = ROOT.TCanvas("testingfits2", "testingfits2", 600, 300)

ds.plotOn(xframe2)

# Full model, normalised to the expected number of events.
total.plotOn(xframe2, ROOT.RooFit.Normalization(
    1.0, ROOT.RooAbsReal.RelativeExpected))

# Overlay the background component of the model with a dashed line
ras_bkg = ROOT.RooArgSet(bkg_pdf)
total.plotOn(
    xframe2, ROOT.RooFit.Components(ras_bkg), ROOT.RooFit.LineStyle(
        ROOT.kDashed), ROOT.RooFit.Normalization(
            1.0, ROOT.RooAbsReal.RelativeExpected))

# Overlay the signal component of the model with a dotted line
ras_sig = ROOT.RooArgSet(sig_pdf)
total.plotOn(
    xframe2, ROOT.RooFit.Components(ras_sig), ROOT.RooFit.LineStyle(
        ROOT.kDotted), ROOT.RooFit.Normalization(
            1.0, ROOT.RooAbsReal.RelativeExpected))

xframe2.Draw()
c2.Draw()

# Full fit maybe?

In [None]:
# Build the model through pdfs.tot_PDF instead of by hand. The helper hands
# back (parameters, auxiliary functions, total pdf).
dum_pars, sub_funcs_list, total = pdfs.tot_PDF(x, ds_x)#, use_double_cb, workspace)

# Keep the parameters in a plain Python list.
mypars = list(dum_pars)

total.Print("v")

In [None]:
# Name -> object lookups, so parameters and auxiliary functions can be
# addressed by their RooFit name (GetName()) in the cells below.
pars_d = {par.GetName(): par for par in mypars}
sub_funcs = {func.GetName(): func for func in sub_funcs_list}


In [None]:
# List the names of all parameters known to pars_d.
for p in pars_d:
    print(f"{p} ---------------------")

In [None]:
# Re-read the same two parquet files that were loaded earlier in the notebook,
# so this section starts from fresh frames.
df_sp = pd.read_parquet("DATAFRAME_SP_BNC_ALL.parquet")
df_col = pd.read_parquet("DATAFRAME_COL_BNC_ALL.parquet")

In [None]:
# Row selection: not used in either training sample, passes cut_2..cut_4,
# |DeltaE| < 0.05 and classifier output proba > 0.90.
_delta_e = df_sp['BpostFitDeltaE']
mask = (
    (df_sp['used_in_bkg_train'] == False)
    & (df_sp['used_in_sig_train'] == False)
    & (df_sp['cut_2'] == True)
    & (df_sp['cut_3'] == True)
    & (df_sp['cut_4'] == True)
    & (_delta_e < 0.05)
    & (_delta_e > -0.05)
    & (df_sp['proba'] > 0.90)
)

# Every selected row with spmode '998' ...
mask_sp = (df_sp['spmode'] == '998')
df_tmp1 = df_sp[mask & mask_sp]

# ... plus 5 randomly drawn selected rows with spmode '-999'.
# NOTE(review): the draw is unseeded, so each run picks different rows.
mask_sp = (df_sp['spmode'] == '-999')
df_tmp2 = df_sp[mask & mask_sp].sample(n=5)

df_tmp = pd.concat([df_tmp1, df_tmp2])

# region_definitions is not defined in this notebook itself; presumably it
# comes from the star import of analysis_variables - TODO confirm.
ds = read_file_return_dataset(df_tmp, x, y, region_definitions=region_definitions)

# 1D (x only) version of the dataset, used by the fit.
ds_x = ds.reduce(x)
ds_x.Print("v")

In [None]:
# Full signal + background fit of the pdfs.tot_PDF model to ds_x.
dum_pars, sub_funcs_list, total = pdfs.tot_PDF(x, ds_x)#, use_double_cb, workspace)
mypars = list(dum_pars)
total.Print("v")

# Name -> object lookups for parameters and auxiliary functions.
pars_d = {par.GetName(): par for par in mypars}
sub_funcs = {func.GetName(): func for func in sub_funcs_list}

# Fit configuration: (parameter name, starting value, held constant?).
# Only nbkg and conv_factor_fit are left floating.
_fit_setup = [
    # Background
    ("nbkg", ds_x.sumEntries(), False),
    ("argpar", -23.5, True),
    ("cutoff", 5.29, True),
    # Signal
    ("nCB", 1.0, True),
    ("conv_factor_calc", 13., True),    # alternative tried before: 43.
    ("conv_factor_fit", 13., False),    # alternative tried before: 43.
    ("conv_factor_err", 500, True),
    ("branching_fraction", 12.2, True), # alternative tried before: 0.58
    ("meanCB", 5.279, True),
    ("sigmaCB", 0.0028, True),
    ("alphaCB", 2.000, True),
]
for _par_name, _start, _is_const in _fit_setup:
    pars_d[_par_name].setVal(_start)
    pars_d[_par_name].setConstant(_is_const)

total.Print("v")

# Objective: extended NLL plus the log_gc term taken from pars_d.
nll = ROOT.RooNLLVar(
    "nll", "nll", total, ds_x, ROOT.RooFit.Extended(ROOT.kTRUE))
fit_func = ROOT.RooFormulaVar(
    "fit_func", "nll + log_gc", ROOT.RooArgList(nll, pars_d["log_gc"]))

# MIGRAD for the minimum, HESSE for the error matrix.
m = ROOT.RooMinimizer(fit_func)
m.setVerbose(ROOT.kFALSE)
m.migrad()
m.hesse()

fit_results = m.save()
fit_results.Print("v")

# Cross-check: the product computed by hand next to the value of the nsig object.
mynsig = pars_d["conv_factor_fit"].getVal() * pars_d["branching_fraction"].getVal()
print(f"mynsig: {mynsig}    nsig: {pars_d['nsig'].getVal()}")



In [None]:
# Print the saved fit result again, followed by the hand-computed signal yield
# (conv_factor_fit * branching_fraction) next to the value of pars_d['nsig'].
fit_results.Print("v")
print()
mynsig = pars_d["conv_factor_fit"].getVal() * pars_d["branching_fraction"].getVal()
print(f"mynsig: {mynsig}    nsig: {pars_d['nsig'].getVal()}")


In [None]:
# Plot the fitted tot_PDF model on top of the data it was fitted to.
c4 = ROOT.TCanvas("testingfits4", "testingfits4", 600, 300)

# Plot data and PDF overlaid, expected number of events for p.d.f projection normalization
# rather than observed number of events (==data.numEntries())
xframe4 = x.frame(ROOT.RooFit.Title("extended ML fit example"), ROOT.RooFit.Bins(25))
ds_x.plotOn(xframe4)
total.plotOn(xframe4, ROOT.RooFit.Normalization(
    1.0, ROOT.RooAbsReal.RelativeExpected))

# The components are taken from sub_funcs, i.e. from the functions returned
# together with the current `total` by pdfs.tot_PDF. The notebook-level
# bkg_pdf / sig_pdf names belong to the earlier hand-built model and are
# different objects, so they must not be used to select components here.

# Overlay the background component of the model with a dashed line
ras_bkg = ROOT.RooArgSet(sub_funcs["bkg_pdf"])
total.plotOn(
    xframe4, ROOT.RooFit.Components(ras_bkg), ROOT.RooFit.LineStyle(
        ROOT.kDashed), ROOT.RooFit.Normalization(
            1.0, ROOT.RooAbsReal.RelativeExpected))

# Overlay the signal component of the model with a dotted line
ras_sig = ROOT.RooArgSet(sub_funcs["sig_pdf"])
total.plotOn(
    xframe4, ROOT.RooFit.Components(ras_sig), ROOT.RooFit.LineStyle(
        ROOT.kDotted), ROOT.RooFit.Normalization(
            1.0, ROOT.RooAbsReal.RelativeExpected))

# Draw the frame on the canvas
ROOT.gPad.SetLeftMargin(0.15)
xframe4.GetYaxis().SetTitleOffset(1.4)
xframe4.Draw()

c4.Draw()


## Background

In [None]:
# Re-read the same two parquet files once more for the background-only study.
df_sp = pd.read_parquet("DATAFRAME_SP_BNC_ALL.parquet")
df_col = pd.read_parquet("DATAFRAME_COL_BNC_ALL.parquet")

In [None]:
#df_sp

In [None]:
# Row selection: not used in either training sample, passes cut_2..cut_4,
# |DeltaE| < 0.05 and classifier output proba > 0.97.
_delta_e = df_sp['BpostFitDeltaE']
mask = (
    (df_sp['used_in_bkg_train'] == False)
    & (df_sp['used_in_sig_train'] == False)
    & (df_sp['cut_2'] == True)
    & (df_sp['cut_3'] == True)
    & (df_sp['cut_4'] == True)
    & (_delta_e < 0.05)
    & (_delta_e > -0.05)
    & (df_sp['proba'] > 0.97)
)

# Background-only study: keep the selected spmode '998' rows and do not mix
# in any '-999' rows this time.
mask_sp = (df_sp['spmode'] == '998')
df_tmp1 = df_sp[mask & mask_sp]
df_tmp = df_tmp1

# region_definitions is not defined in this notebook itself; presumably it
# comes from the star import of analysis_variables - TODO confirm.
ds = read_file_return_dataset(df_tmp, x, y, region_definitions=region_definitions)

# 1D (x only) version of the dataset, used by the fit.
ds_x = ds.reduce(x)
ds_x.Print("v")

In [None]:
#df_tmp

In [None]:

# Background-only fit: float the background yield, keep the shape fixed.
for _par_name, _start, _is_const in (
    ("nbkg", ds_x.sumEntries(), False),
    ("argpar", -23.5, True),
    ("cutoff", 5.29, True),
):
    pars_d[_par_name].setVal(_start)
    pars_d[_par_name].setConstant(_is_const)

# Extended background-only pdf: the bkg_pdf component with nbkg as its yield.
total = ROOT.RooExtendPdf(
    "fit_func",
    "Extended function for background",
    sub_funcs["bkg_pdf"],
    pars_d["nbkg"],
)
total.Print("v")

# Objective: extended NLL plus the log_gc term taken from pars_d.
nll = ROOT.RooNLLVar(
    "nll", "nll", total, ds_x, ROOT.RooFit.Extended(ROOT.kTRUE))
fit_func = ROOT.RooFormulaVar(
    "fit_func", "nll + log_gc", ROOT.RooArgList(nll, pars_d["log_gc"]))

# MIGRAD for the minimum, HESSE for the error matrix.
m = ROOT.RooMinimizer(fit_func)
m.setVerbose(ROOT.kFALSE)
m.migrad()
m.hesse()

fit_results = m.save()
fit_results.Print("v")


In [None]:
# Plot the background-only fit on top of the background sample.
xframe2 = x.frame(ROOT.RooFit.Title("Gaussian pdf with data"),   ROOT.RooFit.Bins(20))  # RooPlot

# The canvas gets its own ROOT name. Reusing "testingfits" makes ROOT delete
# whichever other canvas currently carries that name. The naming follows the
# "testingfits4" canvas used for c4.
c2 = ROOT.TCanvas("testingfits2", "testingfits2", 600, 300)

ds_x.plotOn(xframe2)

total.plotOn(xframe2, ROOT.RooFit.Normalization(1.0, ROOT.RooAbsReal.RelativeExpected))

# Overlay the background component with a dashed line.
# `total` was built from sub_funcs["bkg_pdf"], so the component is selected
# through the same object. The notebook-level bkg_pdf name belongs to the
# earlier hand-built model and is a different object.
ras_bkg = ROOT.RooArgSet(sub_funcs["bkg_pdf"])
total.plotOn(
    xframe2, ROOT.RooFit.Components(ras_bkg), ROOT.RooFit.LineStyle(
        ROOT.kDashed), ROOT.RooFit.Normalization(
            1.0, ROOT.RooAbsReal.RelativeExpected))

# No signal overlay here: this model has no signal component.

xframe2.Draw()
c2.Draw()

# Signal

In [None]:
# Signal only: extended pdf built from the sig_pdf component with nsig as its yield.
# NOTE(review): the RooFit name "fit_func" is also the name given to the RooFormulaVar
# objective in the fit cells - consider a distinct name to keep printouts unambiguous.
total = ROOT.RooExtendPdf("fit_func", "Extended function for signal", sub_funcs["sig_pdf"], pars_d["nsig"])


total.Print("v")

In [None]:
# Row selection: not used in either training sample, passes cut_2..cut_4,
# |DeltaE| < 0.05 and classifier output proba > 0.90.
_delta_e = df_sp['BpostFitDeltaE']
mask = (
    (df_sp['used_in_bkg_train'] == False)
    & (df_sp['used_in_sig_train'] == False)
    & (df_sp['cut_2'] == True)
    & (df_sp['cut_3'] == True)
    & (df_sp['cut_4'] == True)
    & (_delta_e < 0.05)
    & (_delta_e > -0.05)
    & (df_sp['proba'] > 0.90)
)

# Signal-only study: keep all selected spmode '-999' rows (no sub-sampling).
mask_sp = (df_sp['spmode'] == '-999')
df_tmp1 = df_sp[mask & mask_sp]
df_tmp = df_tmp1

# region_definitions is not defined in this notebook itself; presumably it
# comes from the star import of analysis_variables - TODO confirm.
ds = read_file_return_dataset(df_tmp, x, y, region_definitions=region_definitions)

# 1D (x only) version of the dataset, used by the fit.
ds_x = ds.reduce(x)
ds_x.Print("v")

In [None]:
# Show which parameter names are available in pars_d before configuring the signal fit.
pars_d.keys()

In [None]:
# Create the NLL for the fit
# (`total` is the signal-only extended pdf, ds_x the signal-only sample.)
nll = ROOT.RooNLLVar("nll","nll", total, ds_x, ROOT.RooFit.Extended(ROOT.kTRUE))

# Objective: extended NLL plus the log_gc term taken from pars_d.
fit_func = ROOT.RooFormulaVar("fit_func","nll + log_gc", ROOT.RooArgList(nll,pars_d["log_gc"]))

# NOTE(review): the minimizer is constructed here, before the parameters below are
# (re)configured; the statement order is kept exactly as it was - confirm that the
# constant/floating changes made afterwards are picked up by migrad().
m = ROOT.RooMinimizer(fit_func)

m.setVerbose(ROOT.kFALSE)
# Raise the call/iteration limits for this fit.
m.setMaxFunctionCalls(10000)
m.setMaxIterations(10000)

print(f"nevents: {ds_x.sumEntries()}")

# Signal-shape and yield configuration. Unlike the full fit, meanCB, sigmaCB and
# alphaCB are released here (setConstant(False)); nCB stays fixed.
pars_d["nCB"].setVal(1.0)
pars_d["nCB"].setConstant(True)

#pars_d["conv_factor_calc"].setVal(43.)
pars_d["conv_factor_calc"].setVal(13.)
pars_d["conv_factor_calc"].setConstant(True)

#pars_d["conv_factor_fit"].setVal(43.)
pars_d["conv_factor_fit"].setVal(13.)
pars_d["conv_factor_fit"].setConstant(False)

pars_d["conv_factor_err"].setVal(500)
pars_d["conv_factor_err"].setConstant(True)

#pars_d["branching_fraction"].setVal(0.58)
pars_d["branching_fraction"].setVal(12.2)
pars_d["branching_fraction"].setConstant(True)

pars_d["meanCB"].setVal(5.279)
pars_d["meanCB"].setConstant(False)

pars_d["sigmaCB"].setVal(0.0028)
pars_d["sigmaCB"].setConstant(False)

pars_d["alphaCB"].setVal(2.000)
pars_d["alphaCB"].setConstant(False)


m.migrad()

# Snapshot of the result directly after MIGRAD ...
print("After migrad")
fit_results = m.save()
fit_results.Print("v")

# ... and again after HESSE has recomputed the error matrix.
m.hesse()
fit_results = m.save()
fit_results.Print("v")

# Cross-check: the product computed by hand next to the value of the nsig object.
mynsig = pars_d["conv_factor_fit"].getVal() * pars_d["branching_fraction"].getVal()
print(f"mynsig: {mynsig}    nsig: {pars_d['nsig'].getVal()}")


fit_results.Print("v")


In [None]:
# NOTE(review): `nsig` is the notebook-level RooFormulaVar created in an earlier cell,
# whereas pars_d["nsig"] is looked up from the parameter dictionary - TODO confirm that
# printing two possibly different objects side by side is intended.
nsig.Print("v")

print(pars_d["nsig"].evaluate())



In [None]:
# Plot the signal-only fit on top of the signal sample.
xframe3 = x.frame(ROOT.RooFit.Title("Signal"),   ROOT.RooFit.Bins(20))  # RooPlot

# The canvas gets its own ROOT name. Reusing "testingfits" makes ROOT delete
# whichever other canvas currently carries that name. The naming follows the
# "testingfits4" canvas used for c4.
c3 = ROOT.TCanvas("testingfits3", "testingfits3", 600, 300)

ds_x.plotOn(xframe3)

total.plotOn(xframe3, ROOT.RooFit.Normalization(1.0, ROOT.RooAbsReal.RelativeExpected))

# No background overlay here: this model has no background component.

# Overlay the signal component with a dotted line.
# `total` was built from sub_funcs["sig_pdf"], so the component is selected
# through the same object. The notebook-level sig_pdf name belongs to the
# earlier hand-built model and is a different object.
ras_sig = ROOT.RooArgSet(sub_funcs["sig_pdf"])
total.plotOn(
    xframe3, ROOT.RooFit.Components(ras_sig), ROOT.RooFit.LineStyle(
        ROOT.kDotted), ROOT.RooFit.Normalization(
            1.0, ROOT.RooAbsReal.RelativeExpected))

xframe3.Draw()
c3.Draw()