In [1]:
import os, re, glob, numpy as np, torch, torch.nn as nn, torch.optim as optim
from torchvision import models, transforms
from torch.utils.data import DataLoader, Dataset
from tqdm import tqdm

In [2]:
def compute_global_image_stats(chunk_paths, sample_fraction=0.1, rng=None):
    """Estimate the per-channel mean and standard deviation over all chunks.

    Each chunk is an ``.npz`` archive whose ``'X_jets'`` array is reshaped to
    ``(-1, 3)``, i.e. the last axis is treated as three channels (the original
    comment gives the layout as ``(N, H, W, 3)``).

    Args:
        chunk_paths: Iterable of paths to ``.npz`` files.
        sample_fraction: Fraction of images drawn (without replacement) from
            each chunk. Values >= 1.0 use every image. At least one image is
            always drawn from a non-empty chunk.
        rng: Optional random source exposing ``choice(a, size, replace=...)``
            (e.g. ``np.random.default_rng(seed)``). When ``None`` the global
            ``np.random`` state is used, as before.

    Returns:
        ``(mean, std)`` as two Python lists of three floats each.

    Raises:
        ValueError: If no pixels were accumulated (no chunks, or only empty ones).
    """
    sum_pixels = np.zeros(3, dtype=np.float64)
    sum_sq_pixels = np.zeros(3, dtype=np.float64)
    total_pixels = 0
    chooser = np.random if rng is None else rng
    for chunk in chunk_paths:
        # NpzFile keeps a file handle open; the context manager closes it even
        # if reading fails. The array itself is fully loaded on key access.
        with np.load(chunk) as data:
            images = data['X_jets']
        N = images.shape[0]
        if N == 0:
            # Nothing to sample from; choice() would raise on an empty population.
            continue
        if sample_fraction < 1.0:
            sample_size = max(1, int(N * sample_fraction))
            idx = chooser.choice(N, sample_size, replace=False)
            images = images[idx]
        # Accumulate in float64 so the running sums do not lose precision.
        pixels = images.reshape(-1, 3).astype(np.float64)
        sum_pixels += pixels.sum(axis=0)
        sum_sq_pixels += np.square(pixels).sum(axis=0)
        total_pixels += pixels.shape[0]
        del images, pixels
    if total_pixels == 0:
        raise ValueError("compute_global_image_stats: no pixels found in chunk_paths")
    mean = sum_pixels / total_pixels
    # E[x^2] - E[x]^2 can come out slightly negative through cancellation when
    # a channel is (almost) constant; clamp so sqrt never yields NaN.
    variance = np.maximum(sum_sq_pixels / total_pixels - mean**2, 0.0)
    std = np.sqrt(variance)
    return mean.tolist(), std.tolist()


In [3]:
class JetImageDataset(Dataset):
    """Map-style dataset pairing indexable images with indexable labels.

    ``images`` and ``labels`` are stored as given and indexed with the same
    ``idx``. If ``transform`` is truthy it is applied to the image only; the
    label is returned untouched.
    """

    def __init__(self, images, labels, transform=None):
        self.images, self.labels, self.transform = images, labels, transform

    def __len__(self):
        # The dataset length is defined by the image container alone.
        return len(self.images)

    def __getitem__(self, idx):
        sample, target = self.images[idx], self.labels[idx]
        if not self.transform:
            return sample, target
        return self.transform(sample), target

In [4]:
def compute_physics_features_tensor(x, eps=1e-6):
    """Reduce a batch of 3-channel images to three scalar features per sample.

    Channels 0, 1 and 2 of ``x`` (shape ``(B, 3, H, W)``) are referred to as
    ecal, hcal and tracks. For every sample the spatial mean of each of the
    following maps is returned, in this column order:

    0. ``ecal / (hcal + eps)``
    1. ``tracks``
    2. ``ecal - hcal``

    Returns:
        Tensor of shape ``(B, 3)``.
    """
    spatial_dims = [2, 3]
    # Slice with a width-1 range so the channel axis survives the reduction.
    ecal, hcal, tracks = (x[:, c:c + 1, :, :] for c in range(3))
    per_sample = (
        (ecal / (hcal + eps)).mean(dim=spatial_dims),
        tracks.mean(dim=spatial_dims),
        (ecal - hcal).mean(dim=spatial_dims),
    )
    return torch.cat(per_sample, dim=1)

In [5]:
class ChannelWiseConvBranch(nn.Module):
    """Three parallel conv -> ReLU -> global-average-pool paths.

    The paths use kernel sizes 1, 3 and 5 with paddings 0, 1 and 2, so each
    convolution keeps the spatial size of its input. Every path is pooled to
    1x1, flattened, and the three results are concatenated.

    Args:
        in_channels: Number of channels of the input tensor.
        out_channels: Number of filters in each of the three convolutions.
    """

    def __init__(self, in_channels=1, out_channels=8):
        super().__init__()
        # (kernel_size, padding) for each path, in registration order.
        scales = ((1, 0), (3, 1), (5, 2))
        self.convs = nn.ModuleList([
            nn.Sequential(
                nn.Conv2d(in_channels, out_channels, kernel_size=k, padding=p),
                nn.ReLU(),
                nn.AdaptiveAvgPool2d((1, 1)),
            )
            for k, p in scales
        ])

    def forward(self, x):
        """Return the concatenated pooled features, shape (B, out_channels*3)."""
        pooled = []
        for path in self.convs:
            feat = path(x)
            pooled.append(feat.view(feat.size(0), -1))
        return torch.cat(pooled, dim=1)


In [6]:
class FeaturePyramidBranch(nn.Module):
    """Multi-kernel feature extractor: 1x1, 3x3 and 5x5 convolutions in parallel.

    Each convolution is followed by ReLU and an adaptive average pool to 1x1.
    Padding is chosen as ``kernel_size // 2`` (0, 1, 2), which leaves the
    spatial size unchanged before pooling.

    Args:
        in_channels: Number of channels of the input tensor.
        out_channels: Number of filters produced by each convolution.
    """

    def __init__(self, in_channels, out_channels):
        super().__init__()
        self.convs = nn.ModuleList(
            [self._pooled_conv(in_channels, out_channels, k) for k in (1, 3, 5)]
        )

    @staticmethod
    def _pooled_conv(in_channels, out_channels, kernel_size):
        # One pyramid level: same-size convolution, ReLU, global average pool.
        return nn.Sequential(
            nn.Conv2d(in_channels, out_channels,
                      kernel_size=kernel_size, padding=kernel_size // 2),
            nn.ReLU(),
            nn.AdaptiveAvgPool2d((1, 1)),
        )

    def forward(self, x):
        """Return the concatenated pooled features, shape (B, out_channels*3)."""
        def _flatten(t):
            return t.view(t.size(0), -1)

        return torch.cat([_flatten(level(x)) for level in self.convs], dim=1)

In [7]:
class ResNet18PhysicsModel(nn.Module):
    """ResNet-18 backbone fused with four small auxiliary feature branches.

    Branches, all fed the same input batch ``x`` (B, 3, H, W):

    * ``backbone``       - torchvision ResNet-18 (default weights) with its
                           final ``fc`` replaced by ``nn.Identity``.
    * ``physics_fc``     - 2-layer MLP on ``compute_physics_features_tensor(x)``.
    * ``channel_branch`` - one shared ``ChannelWiseConvBranch`` applied to each
                           of the three channels separately.
    * ``joint_conv``     - ``FeaturePyramidBranch`` on the full 3-channel input.
    * ``fpn_branch``     - a second ``FeaturePyramidBranch`` built with the same
                           arguments and fed the same input as ``joint_conv``.

    The concatenated features pass through ``fusion_fc`` to produce logits.

    Args:
        num_classes: Size of the logit vector.
    """

    def __init__(self, num_classes=2):
        super().__init__()
        resnet = models.resnet18(weights=models.ResNet18_Weights.DEFAULT)
        in_features = resnet.fc.in_features
        resnet.fc = nn.Identity()  # expose pooled backbone features directly
        self.backbone = resnet

        # Physics branch: 3 hand-crafted scalars -> 16-d embedding.
        self.physics_fc = nn.Sequential(
            nn.Linear(3, 16),
            nn.ReLU(),
            nn.Linear(16, 16),
            nn.ReLU(),
        )

        # One set of weights, reused for every input channel in forward().
        self.channel_branch = ChannelWiseConvBranch(in_channels=1, out_channels=8)

        # Two pyramid branches over the full 3-channel input.
        self.joint_conv = FeaturePyramidBranch(in_channels=3, out_channels=8)
        self.fpn_branch = FeaturePyramidBranch(in_channels=3, out_channels=8)

        # Widths of the pieces concatenated in forward(), in order:
        # backbone, physics (16), channel-wise (3 channels * 24), joint (24), fpn (24).
        fusion_dim = sum((in_features, 16, 3 * 24, 24, 24))
        self.fusion_fc = nn.Sequential(
            nn.Linear(fusion_dim, 512),
            nn.ReLU(),
            nn.Linear(512, num_classes),
        )

    def forward(self, x):
        """Return ``(backbone_feat, logits)`` for a batch ``x`` of shape (B, 3, H, W)."""
        backbone_feat = self.backbone(x)                                 # (B, in_features)
        phys_out = self.physics_fc(compute_physics_features_tensor(x))   # (B, 16)

        # Run the shared single-channel branch on channel 0, 1, 2 in turn.
        channel_feats = torch.cat(
            [self.channel_branch(x[:, i:i + 1, :, :]) for i in range(3)],
            dim=1,
        )                                                                # (B, 72)

        joint_feat = self.joint_conv(x)                                  # (B, 24)
        fpn_feat = self.fpn_branch(x)                                    # (B, 24)

        fused = torch.cat(
            (backbone_feat, phys_out, channel_feats, joint_feat, fpn_feat),
            dim=1,
        )
        return backbone_feat, self.fusion_fc(fused)

In [8]:
def save_checkpoint(model, optimizer, epoch, checkpoint_dir, model_name):
    """Write model and optimizer state for ``epoch`` to ``checkpoint_dir``.

    The directory is created if missing. The file is named
    ``{model_name}_epoch_{epoch}.pth`` and holds a dict with the keys
    ``'epoch'``, ``'model_state'`` and ``'optimizer_state'``.
    """
    os.makedirs(checkpoint_dir, exist_ok=True)
    filename = f"{model_name}_epoch_{epoch}.pth"
    ckpt_path = os.path.join(checkpoint_dir, filename)
    payload = {
        'epoch': epoch,
        'model_state': model.state_dict(),
        'optimizer_state': optimizer.state_dict(),
    }
    torch.save(payload, ckpt_path)
    print(f"Checkpoint saved: {ckpt_path}")

def load_checkpoint(model, optimizer, checkpoint_dir, model_name):
    """Restore the highest-numbered checkpoint for ``model_name``, if any.

    Looks in ``checkpoint_dir`` for files named
    ``{model_name}_epoch_<digits>.pth``, picks the one with the largest epoch
    number, and loads its ``'model_state'`` / ``'optimizer_state'`` entries into
    ``model`` and ``optimizer`` in place.

    Args:
        model: Module whose ``load_state_dict`` receives the saved weights.
        optimizer: Optimizer whose ``load_state_dict`` receives the saved state.
        checkpoint_dir: Directory to search.
        model_name: File-name prefix identifying the model.

    Returns:
        The ``'epoch'`` value stored in the checkpoint, or 0 when no matching
        checkpoint file exists.
    """
    # Escape glob metacharacters so unusual directory/model names are matched literally.
    pattern = os.path.join(glob.escape(checkpoint_dir),
                           f"{glob.escape(model_name)}_epoch_*.pth")
    # Parse the epoch from the file name only: a directory such as
    # ".../epoch_3_runs/" must not be mistaken for the epoch number, and files
    # like "<name>_epoch_final.pth" are ignored instead of crashing.
    name_re = re.compile(re.escape(model_name) + r"_epoch_(\d+)\.pth")
    candidates = []
    for path in glob.glob(pattern):
        match = name_re.fullmatch(os.path.basename(path))
        if match:
            candidates.append((int(match.group(1)), path))
    if not candidates:
        print(f"No checkpoint found for {model_name}.")
        return 0
    _, latest = max(candidates, key=lambda item: item[0])
    # Load onto CPU first so a checkpoint written on a GPU machine can still be
    # restored on a CPU-only host; load_state_dict copies the values into the
    # existing parameters / optimizer state on whatever device they live on.
    ckpt = torch.load(latest, map_location="cpu")
    model.load_state_dict(ckpt['model_state'])
    optimizer.load_state_dict(ckpt['optimizer_state'])
    start_epoch = ckpt['epoch']
    print(f"Loaded {model_name} from {latest} at epoch {start_epoch}")
    return start_epoch



In [9]:
def train_model(model, device, chunk_paths, epochs=5, batch_size=32, checkpoint_dir="ckpt_resnet18", resume=False):
    """Train ``model`` chunk by chunk and checkpoint after every epoch.

    Each epoch iterates over ``chunk_paths`` in the given order. Every chunk is
    an ``.npz`` archive providing ``'X_jets'`` (images) and ``'y'`` (labels);
    it is loaded, wrapped in a shuffled ``DataLoader`` and trained on with Adam
    (lr=1e-4) and cross-entropy loss. The model is expected to return a pair
    whose second element is the logits.

    Args:
        model: Network to train; moved to ``device``.
        device: Target device for the model and batches.
        chunk_paths: Paths of the ``.npz`` chunks.
        epochs: Last epoch number to run (epochs are numbered from 1).
        batch_size: Mini-batch size.
        checkpoint_dir: Directory for ``save_checkpoint`` / ``load_checkpoint``.
        resume: If true, restore the latest checkpoint and continue after it.

    Returns:
        The trained model (the same object, on ``device``).
    """
    model = model.to(device)
    optimizer = optim.Adam(model.parameters(), lr=1e-4)
    model_name = model.__class__.__name__
    start_epoch = 0
    if resume:
        start_epoch = load_checkpoint(model, optimizer, checkpoint_dir, model_name)

    # NOTE(review): the normalisation statistics come from a fresh random 10%
    # sample on every call, so a resumed run may normalise with slightly
    # different values than the run that wrote the checkpoint.
    global_mean, global_std = compute_global_image_stats(chunk_paths, sample_fraction=0.1)
    print("Global image stats (mean, std):", global_mean, global_std)
    transform = transforms.Compose([
        transforms.ToTensor(),
        transforms.Resize((224,224)),
        transforms.Normalize(mean=global_mean, std=global_std)
    ])
    criterion = nn.CrossEntropyLoss()

    for epoch in range(start_epoch+1, epochs+1):
        print(f"\nEpoch {epoch}/{epochs}")
        # Nothing below switches the model to eval mode, so once per epoch suffices.
        model.train()
        for chunk in tqdm(chunk_paths, desc="Chunks"):
            print(f"\nTraining on chunk: {chunk}")
            # Close the archive as soon as both arrays are in memory, even on error.
            with np.load(chunk) as data:
                images = data['X_jets']
                labels = data['y']
            dataset = JetImageDataset(images, labels, transform=transform)
            if len(dataset) == 0:
                # An empty chunk would otherwise fail in the shuffling sampler
                # or when averaging the loss over zero batches.
                print("Chunk is empty; skipping.")
                del images, labels, dataset
                continue
            dataloader = DataLoader(dataset, batch_size=batch_size, shuffle=True)
            chunk_loss = 0.0  # sum of batch losses for this chunk only
            for imgs, labs in tqdm(dataloader, desc="Training Batches", leave=False):
                imgs = imgs.to(device, dtype=torch.float)
                labs = labs.to(device).long()
                optimizer.zero_grad()
                _, logits = model(imgs)
                loss = criterion(logits, labs)
                loss.backward()
                optimizer.step()
                chunk_loss += loss.item()
            print(f"Chunk loss: {chunk_loss/len(dataloader):.4f}")
            # Drop the chunk's arrays before the next one is loaded.
            del images, labels, dataset, dataloader
        save_checkpoint(model, optimizer, epoch, checkpoint_dir, model_name)
    return model

In [10]:
if __name__ == '__main__':
    # Entry point: choose a device, gather the chunk archives in numeric order,
    # then build the model and train it, resuming from a checkpoint if one exists.
    if torch.cuda.is_available():
        device = 'cuda'
    else:
        device = 'cpu'
    data_dir = "/kaggle/input/genie-extracted-dataset"

    # Keep only .npz files and order them by the integer that follows "chunk_"
    # in the file name (plain string sorting would put 100000 before 20000).
    all_files = list(filter(lambda name: name.endswith(".npz"), os.listdir(data_dir)))
    sorted_files = sorted(
        all_files,
        key=lambda name: int(re.search(r'chunk_(\d+)_', name).group(1)),
    )
    chunk_paths = list(map(lambda name: os.path.join(data_dir, name), sorted_files))

    model = ResNet18PhysicsModel(num_classes=2)
    trained_model = train_model(
        model,
        device,
        chunk_paths,
        epochs=5,
        batch_size=32,
        checkpoint_dir="ckpt_resnet18",
        resume=True,
    )

Downloading: "https://download.pytorch.org/models/resnet18-f37072fd.pth" to /root/.cache/torch/hub/checkpoints/resnet18-f37072fd.pth
100%|██████████| 44.7M/44.7M [00:00<00:00, 225MB/s]


No checkpoint found for ResNet18PhysicsModel.
Global image stats (mean, std): [7.939842705511931e-05, 5.1207733091916395e-05, 3.08033035513073e-05] [0.005480030499975712, 0.0021517315103955137, 0.0005202014984099218]

Epoch 1/5


Chunks:   0%|          | 0/14 [00:00<?, ?it/s]


Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_0_10000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:01<05:51,  1.13s/it][A
Training Batches:   1%|          | 2/313 [00:01<02:54,  1.79it/s][A
Training Batches:   1%|          | 3/313 [00:01<01:55,  2.68it/s][A
Training Batches:   1%|▏         | 4/313 [00:01<01:27,  3.54it/s][A
Training Batches:   2%|▏         | 5/313 [00:01<01:09,  4.40it/s][A
Training Batches:   2%|▏         | 6/313 [00:01<01:00,  5.08it/s][A
Training Batches:   2%|▏         | 7/313 [00:01<00:54,  5.66it/s][A
Training Batches:   3%|▎         | 8/313 [00:02<00:49,  6.19it/s][A
Training Batches:   3%|▎         | 9/313 [00:02<00:45,  6.62it/s][A
Training Batches:   3%|▎         | 10/313 [00:02<00:43,  6.94it/s][A
Training Batches:   4%|▎         | 11/313 [00:02<00:42,  7.19it/s][A
Training Batches:   4%|▍         | 12/313 [00:02<00:40,  7.34it/s][A
Training Batches:   4%|▍         | 13/313 [00:02<00:40,  7.48it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5845

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_10000_20000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:47,  6.50it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:46,  6.70it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:44,  6.97it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.26it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:42,  7.25it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:41,  7.42it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:40,  7.53it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:40,  7.60it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:39,  7.65it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.46it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.55it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.61it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.66it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5763

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_20000_30000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:47,  6.58it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:44,  7.02it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:42,  7.28it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:41,  7.43it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.51it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:41,  7.48it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:40,  7.58it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:40,  7.62it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:39,  7.66it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:39,  7.68it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:39,  7.63it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.57it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.64it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5754

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_30000_40000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:48,  6.42it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:45,  6.85it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:42,  7.22it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:41,  7.44it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:40,  7.55it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:40,  7.62it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:40,  7.55it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:40,  7.51it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:42,  7.17it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:41,  7.24it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.39it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:40,  7.40it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:40,  7.50it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5679

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_40000_50000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:47,  6.60it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:44,  6.97it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:43,  7.18it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.25it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.38it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:40,  7.51it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:40,  7.59it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:39,  7.65it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:39,  7.69it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:39,  7.72it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:39,  7.74it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.66it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:38,  7.70it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5632

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_50000_60000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:43,  7.10it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:43,  7.10it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:42,  7.25it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:41,  7.43it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.43it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:40,  7.52it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:41,  7.40it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:40,  7.51it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:40,  7.59it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:39,  7.64it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:39,  7.56it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.63it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.67it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5599

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_60000_70000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:51,  6.08it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:48,  6.43it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:46,  6.72it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:44,  6.89it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:42,  7.18it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:41,  7.38it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:41,  7.40it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:40,  7.51it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:41,  7.28it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.41it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.42it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:40,  7.43it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.52it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5522

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_70000_80000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:48,  6.47it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:44,  6.93it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:42,  7.23it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.22it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.38it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:41,  7.40it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:41,  7.29it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:41,  7.40it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:42,  7.09it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:42,  7.14it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:41,  7.30it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:40,  7.43it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.53it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5597

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_80000_90000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:44,  6.95it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:45,  6.85it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:42,  7.22it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:41,  7.37it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:42,  7.26it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:41,  7.41it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:40,  7.52it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:40,  7.58it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:39,  7.61it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.50it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:39,  7.55it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.60it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.53it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5601

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_90000_100000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:49,  6.35it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:46,  6.71it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:43,  7.10it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.32it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.48it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:42,  7.15it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:42,  7.21it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:41,  7.35it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:40,  7.47it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.54it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.44it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:40,  7.40it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:40,  7.37it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5561

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_100000_110000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:46,  6.69it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:45,  6.82it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:43,  7.05it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:43,  7.18it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:42,  7.26it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:41,  7.39it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:41,  7.40it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:40,  7.48it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:40,  7.55it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:39,  7.59it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:39,  7.65it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.67it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.63it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5615

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_110000_120000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:45,  6.90it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:44,  6.95it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:43,  7.10it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.33it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:42,  7.21it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:43,  7.14it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:44,  6.91it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:43,  7.03it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:43,  6.93it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:42,  7.14it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:41,  7.30it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:40,  7.42it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:40,  7.41it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5597

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_120000_130000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:48,  6.48it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:45,  6.89it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:43,  7.20it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.36it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.49it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:40,  7.55it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:40,  7.61it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:39,  7.63it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:39,  7.64it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:39,  7.66it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:39,  7.67it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.68it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.69it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5632

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_130000_139306.npz



Training Batches:   0%|          | 0/291 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/291 [00:00<00:44,  6.54it/s][A
Training Batches:   1%|          | 2/291 [00:00<00:44,  6.53it/s][A
Training Batches:   1%|          | 3/291 [00:00<00:42,  6.85it/s][A
Training Batches:   1%|▏         | 4/291 [00:00<00:41,  6.98it/s][A
Training Batches:   2%|▏         | 5/291 [00:00<00:40,  7.09it/s][A
Training Batches:   2%|▏         | 6/291 [00:00<00:39,  7.27it/s][A
Training Batches:   2%|▏         | 7/291 [00:00<00:38,  7.40it/s][A
Training Batches:   3%|▎         | 8/291 [00:01<00:37,  7.47it/s][A
Training Batches:   3%|▎         | 9/291 [00:01<00:37,  7.46it/s][A
Training Batches:   3%|▎         | 10/291 [00:01<00:37,  7.54it/s][A
Training Batches:   4%|▍         | 11/291 [00:01<00:38,  7.25it/s][A
Training Batches:   4%|▍         | 12/291 [00:01<00:37,  7.39it/s][A
Training Batches:   4%|▍         | 13/291 [00:01<00:37,  7.49it/s][A
Training Batches:   5%|▍         | 14

Chunk loss: 0.5614
Checkpoint saved: ckpt_resnet18/ResNet18PhysicsModel_epoch_1.pth

Epoch 2/5


Chunks:   0%|          | 0/14 [00:00<?, ?it/s]


Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_0_10000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:44,  7.07it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:44,  7.05it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:45,  6.89it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.19it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:43,  7.10it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:42,  7.29it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:41,  7.41it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:40,  7.50it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:40,  7.55it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.57it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.52it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.57it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:40,  7.49it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5511

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_10000_20000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:47,  6.51it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:44,  6.94it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:42,  7.28it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:41,  7.45it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:40,  7.53it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:43,  7.12it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:42,  7.27it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:41,  7.41it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:40,  7.50it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:39,  7.58it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.45it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:40,  7.51it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:40,  7.42it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5558

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_20000_30000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:44,  6.98it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:45,  6.84it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:44,  7.04it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:43,  7.17it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.37it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:41,  7.33it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:42,  7.20it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:42,  7.25it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:41,  7.40it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:41,  7.34it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:41,  7.35it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:40,  7.44it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.52it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5564

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_30000_40000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:49,  6.32it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:47,  6.53it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:45,  6.74it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:45,  6.84it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:44,  6.92it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:44,  6.94it/s][A
Training Batches:   2%|▏         | 7/313 [00:01<00:44,  6.94it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:43,  7.09it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:42,  7.12it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:41,  7.27it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:41,  7.19it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:41,  7.33it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:40,  7.42it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5529

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_40000_50000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:42,  7.36it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:44,  7.04it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:44,  7.00it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.24it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.39it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:41,  7.33it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:43,  7.10it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:42,  7.19it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:41,  7.25it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:41,  7.30it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.42it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:40,  7.50it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:41,  7.22it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5516

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_50000_60000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:48,  6.48it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:45,  6.79it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:43,  7.19it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:41,  7.36it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.49it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:43,  7.11it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:41,  7.29it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:41,  7.41it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:40,  7.49it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.43it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:41,  7.32it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:40,  7.41it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:40,  7.50it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5500

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_60000_70000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:42,  7.32it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:44,  6.97it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:44,  6.96it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:43,  7.08it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:42,  7.31it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:41,  7.41it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:41,  7.33it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:42,  7.25it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:41,  7.38it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:41,  7.31it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:41,  7.33it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:40,  7.45it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.51it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5400

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_70000_80000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:44,  6.99it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:43,  7.12it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:42,  7.25it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:41,  7.40it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.33it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:41,  7.46it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:41,  7.32it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:41,  7.32it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:40,  7.45it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.51it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.47it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:40,  7.35it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:41,  7.23it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5532

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_80000_90000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:42,  7.32it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:45,  6.79it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:43,  7.05it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.27it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.43it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:40,  7.50it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:42,  7.22it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:41,  7.27it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:41,  7.31it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.39it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.48it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.55it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:40,  7.42it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5541

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_90000_100000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:44,  7.00it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:43,  7.09it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:42,  7.30it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.34it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.38it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:44,  6.95it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:43,  7.10it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:41,  7.29it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:41,  7.41it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:42,  7.14it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:41,  7.20it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:40,  7.36it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:40,  7.45it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5460

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_100000_110000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:48,  6.48it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:47,  6.60it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:43,  7.06it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.25it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.42it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:42,  7.30it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:42,  7.21it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:41,  7.35it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:40,  7.47it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.53it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:39,  7.58it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:40,  7.51it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:40,  7.47it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5508

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_110000_120000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:44,  6.97it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:44,  7.06it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:42,  7.33it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:41,  7.46it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.47it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:40,  7.53it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:40,  7.48it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:40,  7.54it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:40,  7.43it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.52it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.52it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:40,  7.51it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.57it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5522

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_120000_130000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:42,  7.34it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:45,  6.90it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:43,  7.10it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.20it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.38it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:41,  7.36it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:42,  7.13it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:42,  7.18it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:41,  7.31it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.43it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.51it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:40,  7.47it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.55it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5535

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_130000_139306.npz



Training Batches:   0%|          | 0/291 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/291 [00:00<00:41,  7.06it/s][A
Training Batches:   1%|          | 2/291 [00:00<00:40,  7.07it/s][A
Training Batches:   1%|          | 3/291 [00:00<00:40,  7.09it/s][A
Training Batches:   1%|▏         | 4/291 [00:00<00:39,  7.32it/s][A
Training Batches:   2%|▏         | 5/291 [00:00<00:38,  7.46it/s][A
Training Batches:   2%|▏         | 6/291 [00:00<00:40,  7.07it/s][A
Training Batches:   2%|▏         | 7/291 [00:00<00:39,  7.27it/s][A
Training Batches:   3%|▎         | 8/291 [00:01<00:38,  7.38it/s][A
Training Batches:   3%|▎         | 9/291 [00:01<00:38,  7.39it/s][A
Training Batches:   3%|▎         | 10/291 [00:01<00:37,  7.49it/s][A
Training Batches:   4%|▍         | 11/291 [00:01<00:38,  7.25it/s][A
Training Batches:   4%|▍         | 12/291 [00:01<00:37,  7.37it/s][A
Training Batches:   4%|▍         | 13/291 [00:01<00:37,  7.36it/s][A
Training Batches:   5%|▍         | 14

Chunk loss: 0.5523
Checkpoint saved: ckpt_resnet18/ResNet18PhysicsModel_epoch_2.pth

Epoch 3/5


Chunks:   0%|          | 0/14 [00:00<?, ?it/s]


Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_0_10000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:39,  7.85it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:40,  7.77it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:40,  7.74it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:40,  7.62it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:40,  7.52it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:40,  7.57it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:40,  7.64it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:40,  7.57it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:40,  7.52it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.55it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.51it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.57it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.62it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5400

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_10000_20000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:47,  6.54it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:44,  6.97it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:42,  7.25it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:41,  7.42it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.41it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:41,  7.41it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:42,  7.28it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:41,  7.42it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:41,  7.31it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:41,  7.32it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.46it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:40,  7.44it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.51it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5519

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_20000_30000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:45,  6.79it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:44,  7.04it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:43,  7.13it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:43,  7.08it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:43,  7.06it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:43,  7.14it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:42,  7.18it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:42,  7.20it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:42,  7.23it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:42,  7.17it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:42,  7.11it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:41,  7.18it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:40,  7.32it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5465

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_30000_40000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:49,  6.28it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:46,  6.73it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:43,  7.15it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.35it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.47it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:40,  7.56it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:40,  7.50it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:40,  7.56it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:41,  7.33it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:41,  7.35it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.48it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.55it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.59it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5460

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_40000_50000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:42,  7.38it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:41,  7.46it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:41,  7.46it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.35it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.48it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:40,  7.54it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:40,  7.51it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:40,  7.48it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:41,  7.34it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:41,  7.35it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.46it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:40,  7.43it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:40,  7.44it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5461

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_50000_60000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:48,  6.44it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:44,  6.93it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:42,  7.27it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.32it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:42,  7.25it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:42,  7.30it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:42,  7.19it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:41,  7.35it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:40,  7.46it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.51it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:39,  7.58it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.63it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:41,  7.30it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5422

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_60000_70000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:43,  7.23it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:44,  6.94it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:43,  7.12it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.34it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.49it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:40,  7.51it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:43,  6.99it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:42,  7.19it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:41,  7.33it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.44it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.39it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:40,  7.40it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:40,  7.48it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5370

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_70000_80000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:46,  6.74it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:44,  6.94it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:43,  7.19it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.22it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:42,  7.28it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:41,  7.42it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:40,  7.50it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:42,  7.10it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:41,  7.27it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:41,  7.39it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.46it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:40,  7.52it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:40,  7.42it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5456

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_80000_90000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:44,  6.96it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:46,  6.75it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:44,  7.00it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.24it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.37it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:41,  7.49it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:42,  7.12it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:42,  7.17it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:41,  7.32it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.41it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.41it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:40,  7.36it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:40,  7.45it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5459

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_90000_100000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:47,  6.51it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:45,  6.77it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:44,  6.97it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.22it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:42,  7.28it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:41,  7.32it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:42,  7.23it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:42,  7.23it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:42,  7.21it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:41,  7.36it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.47it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.56it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:41,  7.26it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5374

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_100000_110000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:45,  6.80it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:44,  6.99it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:42,  7.33it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:41,  7.50it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:40,  7.58it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:40,  7.64it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:40,  7.49it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:40,  7.45it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:40,  7.43it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.51it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:39,  7.57it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:41,  7.26it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:40,  7.40it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5479

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_110000_120000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:49,  6.33it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:48,  6.47it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:45,  6.77it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:44,  6.94it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:43,  7.06it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:43,  7.11it/s][A
Training Batches:   2%|▏         | 7/313 [00:01<00:43,  7.08it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:42,  7.18it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:43,  7.06it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:41,  7.25it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.37it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:40,  7.48it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.57it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5430

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_120000_130000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:42,  7.34it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:44,  6.96it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:43,  7.13it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.31it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.35it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:41,  7.47it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:40,  7.55it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:40,  7.62it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:40,  7.55it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:39,  7.59it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:39,  7.62it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:41,  7.32it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:40,  7.45it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5480

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_130000_139306.npz



Training Batches:   0%|          | 0/291 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/291 [00:00<00:45,  6.34it/s][A
Training Batches:   1%|          | 2/291 [00:00<00:44,  6.49it/s][A
Training Batches:   1%|          | 3/291 [00:00<00:42,  6.70it/s][A
Training Batches:   1%|▏         | 4/291 [00:00<00:42,  6.80it/s][A
Training Batches:   2%|▏         | 5/291 [00:00<00:41,  6.81it/s][A
Training Batches:   2%|▏         | 6/291 [00:00<00:41,  6.89it/s][A
Training Batches:   2%|▏         | 7/291 [00:01<00:42,  6.75it/s][A
Training Batches:   3%|▎         | 8/291 [00:01<00:41,  6.83it/s][A
Training Batches:   3%|▎         | 9/291 [00:01<00:41,  6.76it/s][A
Training Batches:   3%|▎         | 10/291 [00:01<00:41,  6.83it/s][A
Training Batches:   4%|▍         | 11/291 [00:01<00:42,  6.52it/s][A
Training Batches:   4%|▍         | 12/291 [00:01<00:41,  6.64it/s][A
Training Batches:   4%|▍         | 13/291 [00:01<00:41,  6.63it/s][A
Training Batches:   5%|▍         | 14

Chunk loss: 0.5447
Checkpoint saved: ckpt_resnet18/ResNet18PhysicsModel_epoch_3.pth

Epoch 4/5


Chunks:   0%|          | 0/14 [00:00<?, ?it/s]


Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_0_10000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:40,  7.79it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:40,  7.61it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:40,  7.67it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:40,  7.69it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:39,  7.72it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:39,  7.72it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:39,  7.73it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:39,  7.65it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:40,  7.59it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:39,  7.61it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.51it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.57it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.63it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5368

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_10000_20000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:42,  7.27it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:44,  6.98it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:44,  6.99it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:43,  7.12it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:42,  7.33it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:41,  7.45it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:40,  7.54it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:40,  7.51it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:40,  7.47it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.44it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.53it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.60it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.62it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5433

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_20000_30000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:42,  7.32it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:46,  6.74it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:44,  7.00it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:43,  7.16it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:42,  7.22it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:41,  7.40it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:42,  7.26it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:41,  7.40it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:40,  7.50it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.54it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:39,  7.58it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.55it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.59it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5375

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_30000_40000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:44,  6.97it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:46,  6.71it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:43,  7.13it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.32it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.46it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:40,  7.54it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:40,  7.61it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:39,  7.63it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:40,  7.57it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.47it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.54it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.59it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.63it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5372

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_40000_50000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:51,  6.08it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:49,  6.31it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:47,  6.56it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:46,  6.72it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:45,  6.79it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:44,  6.86it/s][A
Training Batches:   2%|▏         | 7/313 [00:01<00:44,  6.89it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:44,  6.93it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:43,  6.94it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:43,  6.95it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:42,  7.06it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:42,  7.14it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:41,  7.18it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5336

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_50000_60000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:45,  6.81it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:45,  6.83it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:43,  7.19it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:41,  7.37it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.46it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:40,  7.52it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:40,  7.58it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:40,  7.62it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:39,  7.65it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:39,  7.65it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:39,  7.66it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.68it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.69it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5322

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_60000_70000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:51,  6.10it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:49,  6.26it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:46,  6.69it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:44,  7.02it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:42,  7.24it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:42,  7.27it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:41,  7.40it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:41,  7.40it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:40,  7.48it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.54it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:39,  7.60it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.53it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:40,  7.48it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5219

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_70000_80000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:45,  6.91it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:43,  7.12it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:42,  7.35it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:41,  7.47it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:40,  7.55it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:40,  7.60it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:40,  7.63it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:39,  7.63it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:39,  7.65it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.57it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.51it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.56it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:40,  7.46it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5369

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_80000_90000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:46,  6.72it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:45,  6.85it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:44,  7.00it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.26it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.40it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:41,  7.49it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:40,  7.55it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:40,  7.50it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:40,  7.45it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.41it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.39it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:42,  7.07it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:42,  6.99it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5373

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_90000_100000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:45,  6.86it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:43,  7.10it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:42,  7.30it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.28it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:42,  7.21it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:41,  7.38it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:40,  7.49it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:40,  7.57it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:39,  7.61it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:39,  7.66it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:39,  7.68it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.71it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:38,  7.71it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5230

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_100000_110000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:46,  6.70it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:44,  6.92it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:43,  7.10it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.29it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.43it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:40,  7.52it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:40,  7.47it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:40,  7.54it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:41,  7.41it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.40it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.47it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:40,  7.52it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:40,  7.45it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5327

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_110000_120000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:49,  6.33it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:47,  6.56it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:46,  6.72it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:44,  6.91it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:44,  6.94it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:43,  7.02it/s][A
Training Batches:   2%|▏         | 7/313 [00:01<00:43,  7.07it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:43,  7.05it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:43,  7.02it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:42,  7.09it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:42,  7.12it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:42,  7.08it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:42,  7.03it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5316

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_120000_130000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:47,  6.61it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:44,  6.96it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:43,  7.14it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.36it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.47it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:40,  7.55it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:40,  7.60it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:39,  7.64it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:39,  7.66it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:39,  7.68it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:39,  7.68it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.58it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.61it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5335

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_130000_139306.npz



Training Batches:   0%|          | 0/291 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/291 [00:00<00:42,  6.83it/s][A
Training Batches:   1%|          | 2/291 [00:00<00:41,  7.02it/s][A
Training Batches:   1%|          | 3/291 [00:00<00:39,  7.22it/s][A
Training Batches:   1%|▏         | 4/291 [00:00<00:38,  7.37it/s][A
Training Batches:   2%|▏         | 5/291 [00:00<00:38,  7.44it/s][A
Training Batches:   2%|▏         | 6/291 [00:00<00:37,  7.51it/s][A
Training Batches:   2%|▏         | 7/291 [00:00<00:37,  7.49it/s][A
Training Batches:   3%|▎         | 8/291 [00:01<00:37,  7.54it/s][A
Training Batches:   3%|▎         | 9/291 [00:01<00:37,  7.57it/s][A
Training Batches:   3%|▎         | 10/291 [00:01<00:36,  7.61it/s][A
Training Batches:   4%|▍         | 11/291 [00:01<00:37,  7.54it/s][A
Training Batches:   4%|▍         | 12/291 [00:01<00:37,  7.50it/s][A
Training Batches:   4%|▍         | 13/291 [00:01<00:37,  7.38it/s][A
Training Batches:   5%|▍         | 14

Chunk loss: 0.5343
Checkpoint saved: ckpt_resnet18/ResNet18PhysicsModel_epoch_4.pth

Epoch 5/5


Chunks:   0%|          | 0/14 [00:00<?, ?it/s]


Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_0_10000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:39,  7.84it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:40,  7.61it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:40,  7.68it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:40,  7.69it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:39,  7.73it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:39,  7.72it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:39,  7.73it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:39,  7.74it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:39,  7.74it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:39,  7.74it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:38,  7.75it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:38,  7.74it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.69it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5223

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_10000_20000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:48,  6.38it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:44,  6.93it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:42,  7.27it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:41,  7.43it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:40,  7.54it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:42,  7.22it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:42,  7.15it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:41,  7.31it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:40,  7.44it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.50it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.55it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.59it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.63it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5315

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_20000_30000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:47,  6.61it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:47,  6.55it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:46,  6.71it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:44,  6.89it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:44,  6.92it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:44,  6.94it/s][A
Training Batches:   2%|▏         | 7/313 [00:01<00:43,  6.97it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:43,  7.04it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:44,  6.90it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:43,  6.99it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:42,  7.05it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:42,  7.10it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:42,  7.04it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5256

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_30000_40000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:49,  6.26it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:46,  6.75it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:43,  7.09it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.26it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.39it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:41,  7.46it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:40,  7.51it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:40,  7.55it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:40,  7.58it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:39,  7.59it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:39,  7.60it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.60it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.60it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5218

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_40000_50000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:47,  6.55it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:45,  6.81it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:43,  7.15it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.30it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.43it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:41,  7.48it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:40,  7.55it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:40,  7.58it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:39,  7.61it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:39,  7.64it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:39,  7.66it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.67it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.68it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5180

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_50000_60000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:45,  6.81it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:44,  6.93it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:42,  7.23it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:41,  7.36it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.48it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:40,  7.56it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:40,  7.52it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:42,  7.25it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:42,  7.12it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:42,  7.08it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:42,  7.03it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:42,  7.05it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:42,  7.06it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5150

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_60000_70000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:45,  6.90it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:45,  6.87it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:43,  7.20it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.24it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.40it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:41,  7.46it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:41,  7.44it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:41,  7.41it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:40,  7.49it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.55it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:39,  7.59it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.57it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.58it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5080

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_70000_80000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:49,  6.26it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:49,  6.26it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:47,  6.51it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:45,  6.79it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:44,  6.94it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:44,  6.97it/s][A
Training Batches:   2%|▏         | 7/313 [00:01<00:43,  6.97it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:43,  7.06it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:43,  7.06it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:42,  7.12it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:42,  7.09it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:42,  7.07it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:42,  7.14it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5221

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_80000_90000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:45,  6.91it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:45,  6.85it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:43,  7.07it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:43,  7.17it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:42,  7.22it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:41,  7.38it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:40,  7.48it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:40,  7.54it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:40,  7.59it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:39,  7.61it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.53it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:40,  7.48it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.54it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5210

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_90000_100000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:47,  6.60it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:46,  6.76it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:44,  6.99it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:43,  7.11it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:42,  7.30it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:41,  7.44it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:40,  7.50it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:40,  7.55it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:40,  7.47it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.50it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.55it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:40,  7.50it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:40,  7.44it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5003

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_100000_110000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:44,  7.01it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:44,  7.00it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:42,  7.30it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:42,  7.29it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:42,  7.29it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:42,  7.30it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:41,  7.30it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:41,  7.41it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:40,  7.48it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.52it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:39,  7.57it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.58it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.61it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5135

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_110000_120000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:46,  6.78it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:45,  6.83it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:43,  7.18it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:41,  7.36it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:41,  7.49it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:41,  7.46it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:41,  7.44it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:41,  7.40it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:40,  7.48it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:40,  7.42it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:40,  7.50it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:39,  7.54it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:39,  7.58it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5152

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_120000_130000.npz



Training Batches:   0%|          | 0/313 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/313 [00:00<00:44,  6.94it/s][A
Training Batches:   1%|          | 2/313 [00:00<00:46,  6.75it/s][A
Training Batches:   1%|          | 3/313 [00:00<00:43,  7.14it/s][A
Training Batches:   1%|▏         | 4/313 [00:00<00:43,  7.17it/s][A
Training Batches:   2%|▏         | 5/313 [00:00<00:42,  7.20it/s][A
Training Batches:   2%|▏         | 6/313 [00:00<00:42,  7.23it/s][A
Training Batches:   2%|▏         | 7/313 [00:00<00:42,  7.22it/s][A
Training Batches:   3%|▎         | 8/313 [00:01<00:42,  7.25it/s][A
Training Batches:   3%|▎         | 9/313 [00:01<00:41,  7.26it/s][A
Training Batches:   3%|▎         | 10/313 [00:01<00:41,  7.26it/s][A
Training Batches:   4%|▎         | 11/313 [00:01<00:41,  7.28it/s][A
Training Batches:   4%|▍         | 12/313 [00:01<00:41,  7.29it/s][A
Training Batches:   4%|▍         | 13/313 [00:01<00:41,  7.29it/s][A
Training Batches:   4%|▍         | 14

Chunk loss: 0.5129

Training on chunk: /kaggle/input/genie-extracted-dataset/chunk_130000_139306.npz



Training Batches:   0%|          | 0/291 [00:00<?, ?it/s][A
Training Batches:   0%|          | 1/291 [00:00<00:41,  6.91it/s][A
Training Batches:   1%|          | 2/291 [00:00<00:44,  6.54it/s][A
Training Batches:   1%|          | 3/291 [00:00<00:41,  6.90it/s][A
Training Batches:   1%|▏         | 4/291 [00:00<00:39,  7.18it/s][A
Training Batches:   2%|▏         | 5/291 [00:00<00:39,  7.27it/s][A
Training Batches:   2%|▏         | 6/291 [00:00<00:38,  7.43it/s][A
Training Batches:   2%|▏         | 7/291 [00:00<00:37,  7.53it/s][A
Training Batches:   3%|▎         | 8/291 [00:01<00:37,  7.50it/s][A
Training Batches:   3%|▎         | 9/291 [00:01<00:37,  7.47it/s][A
Training Batches:   3%|▎         | 10/291 [00:01<00:37,  7.52it/s][A
Training Batches:   4%|▍         | 11/291 [00:01<00:37,  7.48it/s][A
Training Batches:   4%|▍         | 12/291 [00:01<00:37,  7.44it/s][A
Training Batches:   4%|▍         | 13/291 [00:01<00:37,  7.50it/s][A
Training Batches:   5%|▍         | 14

Chunk loss: 0.5093
Checkpoint saved: ckpt_resnet18/ResNet18PhysicsModel_epoch_5.pth
