In [2]:
import torch
import matplotlib.pyplot as plt
import sys
from neuralop.models import FNO
from neuralop.data.datasets import load_darcy_flow_small
from neuralop.utils import count_model_params
from neuralop.training import AdamW
from neuralop.training.incremental import IncrementalFNOTrainer
from neuralop.data.transforms.data_processors import IncrementalDataProcessor
from neuralop import LpLoss, H1Loss



In [3]:
# Load the small Darcy-flow dataset: 100 training samples served in batches
# of 16, plus test sets at resolutions 16 and 32 (100 and 50 samples
# requested respectively, each served in batches of 32).
darcy_options = dict(
    n_train=100,
    batch_size=16,
    test_resolutions=[16, 32],
    n_tests=[100, 50],
    test_batch_sizes=[32, 32],
)
train_loader, test_loaders, output_encoder = load_darcy_flow_small(**darcy_options)

Loading test db for resolution 16 with 100 samples 
Loading test db for resolution 32 with 50 samples 


  data = torch.load(
  data = torch.load(Path(root_dir).joinpath(f"{dataset_name}_test_{res}.pt").as_posix())


In [4]:
# Run on the GPU when CUDA is usable; otherwise fall back to the CPU.
if torch.cuda.is_available():
    device = torch.device("cuda")
else:
    device = torch.device("cpu")


In [5]:
# Switch for incremental training. When enabled the model starts from (2, 2)
# modes; when disabled it starts directly from (16, 16), which is the
# max_n_modes value the model is built with.
incremental = True
starting_modes = (2, 2) if incremental else (16, 16)

In [6]:
# Build the FNO with max_n_modes=(16, 16) while n_modes begins at
# `starting_modes`, and place it on the selected device in the same statement.
model = FNO(
    in_channels=1,
    out_channels=1,
    hidden_channels=32,
    n_modes=starting_modes,
    max_n_modes=(16, 16),
).to(device)

# Parameter count; printed later together with the optimizer and scheduler.
n_params = count_model_params(model)

In [7]:
# AdamW over all model parameters, with a cosine-annealed learning rate.
# NOTE(review): T_max=30 while the trainer is configured with n_epochs=20 -
# confirm that this mismatch is intended.
optimizer = AdamW(model.parameters(), lr=8e-3, weight_decay=1e-4)
scheduler = torch.optim.lr_scheduler.CosineAnnealingLR(optimizer, T_max=30)


# Incremental resolution is driven by an IncrementalDataProcessor: once it is
# passed to the trainer, the trainer updates the input resolution automatically.
# Arguments used here:
#   subsampling_rates  - the list of subsampling rates to step through
#   dataset_resolution - the resolution of the input data
#   dataset_indices    - indices to slice in order to regularize the input
#                        resolution (presumably the spatial tensor dims - confirm)
#   epoch_gap          - number of epochs to wait before increasing the resolution
#   verbose            - if True, print the resolution changes
# The upstream description also lists an incremental_res_gap parameter; it is
# not passed here.
# The processor is moved to `device` in the same statement that builds it.
data_transform = IncrementalDataProcessor(
    in_normalizer=None,
    out_normalizer=None,
    subsampling_rates=[2, 1],
    dataset_resolution=16,
    dataset_indices=[2, 3],
    epoch_gap=10,
    verbose=True,
    device=device,
).to(device)

Original Incre Res: change index to 0
Original Incre Res: change sub to 2
Original Incre Res: change res to 8


In [8]:
# Losses over 2-D fields: H1 drives training; H1 and L2 (p=2) are both
# reported at evaluation time.
h1loss = H1Loss(d=2)
l2loss = LpLoss(d=2, p=2)
train_loss = h1loss
eval_losses = {"h1": h1loss, "l2": l2loss}

# Print a summary of the run configuration.
for banner, value in (
    ("\n### N PARAMS ###\n", n_params),
    ("\n### OPTIMIZER ###\n", optimizer),
    ("\n### SCHEDULER ###\n", scheduler),
):
    print(banner, value)

# NOTE(review): the Train/Test lines are emitted after the
# "INCREMENTAL RESOLUTION + GRADIENT EXPLAINED" banner, so they show up under
# that heading rather than under "LOSSES". The order is kept as it was.
print("\n### LOSSES ###")
print("\n### INCREMENTAL RESOLUTION + GRADIENT EXPLAINED ###")
print(f"\n * Train: {train_loss}")
print(f"\n * Test: {eval_losses}")

# Flush stdout explicitly after the summary has been printed.
sys.stdout.flush()



### N PARAMS ###
 2110305

### OPTIMIZER ###
 AdamW (
Parameter Group 0
    betas: (0.9, 0.999)
    correct_bias: True
    eps: 1e-06
    initial_lr: 0.008
    lr: 0.008
    weight_decay: 0.0001
)

### SCHEDULER ###
 <torch.optim.lr_scheduler.CosineAnnealingLR object at 0x17f3db3d0>

### LOSSES ###

### INCREMENTAL RESOLUTION + GRADIENT EXPLAINED ###

 * Train: <neuralop.losses.data_losses.H1Loss object at 0x30e756b90>

 * Test: {'h1': <neuralop.losses.data_losses.H1Loss object at 0x30e756b90>, 'l2': <neuralop.losses.data_losses.LpLoss object at 0x30e756790>}


In [9]:
# Finally pass all of these to the Trainer
trainer = IncrementalFNOTrainer(
    model=model,
    n_epochs=20,
    data_processor=data_transform,
    device=device,
    verbose=True,
    incremental_loss_gap=False,
    incremental_grad=True,
    incremental_grad_eps=0.9999,
    incremental_loss_eps = 0.001,
    incremental_buffer=5,
    incremental_max_iter=1,
    incremental_grad_max_iter=2,
)

In [10]:
# Run training with H1 as the training loss and H1/L2 as evaluation losses,
# without a regularizer. The call is deliberately left as the cell's final
# bare expression so that the metrics dict it returns is shown as cell output.
trainer.train(
    train_loader,
    test_loaders,
    optimizer,
    scheduler,
    training_loss=train_loss,
    eval_losses=eval_losses,
    regularizer=False,
)

Training on 100 samples
Testing on [50, 50] samples         on resolutions [16, 32].
Raw outputs of shape torch.Size([16, 1, 8, 8])
[0] time=0.45, avg_loss=0.9192, train_err=13.1311
Eval: 16_h1=0.8140, 16_l2=0.6733, 32_h1=0.8277, 32_l2=0.6690
[1] time=0.35, avg_loss=0.7500, train_err=10.7146
Eval: 16_h1=1.0020, 16_l2=0.7634, 32_h1=1.2701, 32_l2=0.7752
[2] time=0.47, avg_loss=0.7208, train_err=10.2966
Eval: 16_h1=0.7426, 16_l2=0.6054, 32_h1=0.7700, 32_l2=0.6042
[3] time=0.32, avg_loss=0.6472, train_err=9.2463
Eval: 16_h1=0.6685, 16_l2=0.5072, 32_h1=0.8018, 32_l2=0.5303
[4] time=0.41, avg_loss=0.5322, train_err=7.6031
Eval: 16_h1=0.5952, 16_l2=0.4429, 32_h1=0.6902, 32_l2=0.4543
[5] time=0.36, avg_loss=0.4750, train_err=6.7855
Eval: 16_h1=0.5811, 16_l2=0.4052, 32_h1=0.7404, 32_l2=0.4333
[6] time=0.41, avg_loss=0.4208, train_err=6.0111
Eval: 16_h1=0.5013, 16_l2=0.3480, 32_h1=0.6514, 32_l2=0.3799
[7] time=0.30, avg_loss=0.3558, train_err=5.0835
Eval: 16_h1=0.4797, 16_l2=0.3328, 32_h1=0.6421

{'train_err': 3.6664573465074812,
 'avg_loss': 0.2566520142555237,
 'avg_lasso_loss': None,
 'epoch_train_time': 0.7043747089919634,
 '16_h1': tensor(0.2886),
 '16_l2': tensor(0.2240),
 '32_h1': tensor(0.3765),
 '32_l2': tensor(0.2401)}