-
Notifications
You must be signed in to change notification settings - Fork 1.3k
/
Copy pathdf015_LazyDataSource.C
55 lines (47 loc) · 2.12 KB
/
df015_LazyDataSource.C
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
/// \file
/// \ingroup tutorial_dataframe
/// \notebook -draw
/// Use the lazy RDataFrame data source to concatenate computation graphs.
///
/// This tutorial illustrates how to take advantage of a *lazy data source*
/// creating a data frame from columns of one or multiple parent dataframe(s),
/// delaying the creation of the columns to the actual usage of the daughter
/// data frame.
/// Dataset Reference:
/// McCauley, T. (2014). Dimuon event information derived from the Run2010B
/// public Mu dataset. CERN Open Data Portal.
/// DOI: [10.7483/OPENDATA.CMS.CB8H.MFFA](http://opendata.cern.ch/record/700).
/// From the ROOT website: https://root.cern/files/tutorials/tdf014_CsvDataSource_MuRun2010B.csv
///
/// \macro_code
/// \macro_image
///
/// \date February 2018
/// \author Danilo Piparo (CERN)
int df015_LazyDataSource()
{
using namespace ROOT::RDF;
// Let's first create a RDF that will read from the CSV file.
// See the tutorial (https://root.cern/doc/master/df014__CSVDataSource_8C.html) on CSV data sources for more details!
auto fileNameUrl = "http://root.cern/files/tutorials/df014_CsvDataSource_MuRun2010B.csv";
auto fileName = "CsvDataSource_MuRun2010B.csv";
if(gSystem->AccessPathName(fileName))
TFile::Cp(fileNameUrl, fileName);
auto csv_rdf = FromCSV(fileName);
// Now we take out two columns: px and py of the first muon in the muon pair
std::string px1Name = "px1";
auto px1 = csv_rdf.Take<double>(px1Name);
std::string py1Name = "py1";
auto py1 = csv_rdf.Take<double>(py1Name);
// Now we create a new dataframe built on top of the columns above. Note that up to now, no event loop
// has been carried out!
auto df = MakeLazyDataFrame(std::make_pair(px1Name, px1), std::make_pair(py1Name, py1));
// We build a histogram of the transverse momentum of the muons.
auto ptFormula = [](double px, double py) { return sqrt(px * px + py * py); };
auto pt_h = df.Define("pt", ptFormula, {"px1", "py1"})
.Histo1D<double>({"pt", "Muon p_{T};p_{T} [GeV/c];", 128, 0, 128}, "pt");
auto can = new TCanvas();
can->SetLogy();
pt_h->DrawCopy();
return 0;
}