In [1]:
import plot

In [2]:
import numpy as np
import math
%matplotlib inline
import matplotlib.pyplot as plt
from graph_data import GraphDataset
import energyflow as ef
import torch
import torch.nn as nn
import os.path as osp
from torch_geometric.data import Data, DataLoader, DataListLoader, Batch
from torch.utils.data import random_split
from scipy.stats import iqr

In [3]:
# Notebook-wide matplotlib defaults: small square serif figures at 120 dpi.
plt.rcParams.update({
    'figure.figsize': (4,4),
    'figure.dpi': 120,
    'font.family': 'serif',
})

In [4]:
# Build the LHCO variant of the graph dataset (lhco=True) and keep a random
# 100-item subset for the comparisons below; the remainder is discarded.
# NOTE(review): the root is an absolute, machine-specific path — confirm it
# exists wherever this notebook is run.
gdata = GraphDataset(root='/energyflowvol/datasets/', n_jets=100, n_events_merge=1, lhco=True)
# Seed the split explicitly so the selected subset (and every histogram and
# statistic derived from it) is identical on each Restart & Run All.
_, lhco_data = random_split(
    gdata,
    [len(gdata)-100, 100],
    generator=torch.Generator().manual_seed(0),
)

In [5]:
# Build the default (QG) variant of the graph dataset and keep a random
# 100-item subset for the comparisons below; the remainder is discarded.
# Note that this rebinds `gdata`, replacing whatever it referred to before.
gdata = GraphDataset(root='~/.energyflow/datasets', n_jets=100, n_events_merge=1)
# Seed the split explicitly so the selected subset (and every histogram and
# statistic derived from it) is identical on each Restart & Run All.
_, qg_data = random_split(
    gdata,
    [len(gdata)-100, 100],
    generator=torch.Generator().manual_seed(0),
)

Processing...
Loading QG Dataset
Downloading QG_jets.npz from https://www.dropbox.com/s/fclsl7pukcpobsb/QG_jets.npz?dl=1 to /home/jovyan/.energyflow/datasets/raw/datasets
Generated: 0/10000
Generated: 500/10000
Generated: 1000/10000
Generated: 1500/10000
Generated: 2000/10000
Generated: 2500/10000
Generated: 3000/10000
Generated: 3500/10000
Generated: 4000/10000
Generated: 4500/10000
Generated: 5000/10000
Generated: 5500/10000
Generated: 6000/10000
Generated: 6500/10000
Generated: 7000/10000
Generated: 7500/10000
Generated: 8000/10000
Generated: 8500/10000
Generated: 9000/10000
Generated: 9500/10000
Done!


In [6]:
# Pull the x inputs and y outputs of the LHCO subset via the local `plot` helpers.
lhco_x, lhco_y = plot.get_x_input(lhco_data), plot.get_y_output(lhco_data)

In [None]:
# Pull the x inputs and y outputs of the QG subset via the local `plot` helpers.
qg_x, qg_y = plot.get_x_input(qg_data), plot.get_y_output(qg_data)

In [None]:
def plot_feature_comparison(lhco_feat, qg_feat, bins, xlabel, header):
    """Overlay LHCO and QG histograms of one quantity and print LHCO statistics.

    Args:
        lhco_feat: torch tensor of LHCO values; must support ``.numpy()``.
        qg_feat: torch tensor of QG values, histogrammed with the same bins.
        bins: bin edges shared by both histograms.
        xlabel: label placed on the x axis.
        header: text printed on the line(s) above the statistics.

    Returns:
        The ``(fig, ax)`` pair of the newly created 5x5 figure.
    """
    fig, ax = plt.subplots(figsize =(5, 5))
    ax.hist(lhco_feat.numpy(), label='lhco', bins=bins, alpha=0.5)
    ax.hist(qg_feat.numpy(), label='qg', bins=bins, alpha=0.5)
    ax.legend()
    ax.set_xlabel(xlabel)
    # Summary statistics are reported for the LHCO sample only.
    print(f'{header}\nmin: {min(lhco_feat)}\nmax: {max(lhco_feat)}\navg: {torch.mean(lhco_feat)}\nmed: {torch.median(lhco_feat)}\niqr: {iqr(lhco_feat)}')
    return fig, ax


# One row per figure: (LHCO values, QG values, shared bin edges, axis label).
# NOTE(review): `[k][0]` is read here as "entry 0 of feature k" because the
# labels are pt/eta/phi for k = 0/1/2 — confirm against plot.get_x_input.
comparisons = [
    (lhco_x[0][0], qg_x[0][0], np.linspace(0,0.2,31), 'pt'),
    (lhco_x[1][0], qg_x[1][0], np.linspace(-0.4,0.4,31), 'eta'),
    (lhco_x[2][0], qg_x[2][0], np.linspace(-0.4,0.4,31), 'phi'),
    (lhco_y, qg_y, np.linspace(0,12,100), 'emd'),
]

# The loop deliberately rebinds lhco_feat / qg_feat / bins / fig / ax so the
# notebook namespace ends up exactly as it did with the unrolled version.
for idx, (lhco_feat, qg_feat, bins, xlabel) in enumerate(comparisons):
    # Every statistics block after the first is separated by a blank line.
    header = xlabel.upper() if idx == 0 else '\n' + xlabel.upper()
    fig, ax = plot_feature_comparison(lhco_feat, qg_feat, bins, xlabel, header)