In [1]:
from xno.models import XNO




In [2]:
import torch
import matplotlib.pyplot as plt
import sys
from neuralop.models import FNO
from neuralop.data.datasets import load_darcy_flow_small
from neuralop.utils import count_model_params
from neuralop.training import AdamW
# from neuralop.training.incremental import IncrementalFNOTrainer
from xno.training.incremental import IncrementalFNOTrainer
from neuralop.data.transforms.data_processors import IncrementalDataProcessor
from neuralop import LpLoss, H1Loss

In [3]:
# Load the small Darcy-flow dataset: one training loader plus one test loader
# per requested resolution (16 and 32).
train_loader, test_loaders, output_encoder = load_darcy_flow_small(
    # training split
    n_train=100,
    batch_size=16,
    # test splits, one entry per resolution
    test_resolutions=[16, 32],
    n_tests=[100, 50],
    test_batch_sizes=[32, 32],
)

Loading test db for resolution 16 with 100 samples 
Loading test db for resolution 32 with 50 samples 


  data = torch.load(
  data = torch.load(Path(root_dir).joinpath(f"{dataset_name}_test_{res}.pt").as_posix())


In [4]:
# Prefer the GPU when PyTorch can see one; otherwise run on the CPU.
device = torch.device("cuda") if torch.cuda.is_available() else torch.device("cpu")


In [5]:
# Switch between incremental training (start from few modes) and a fixed,
# full-size mode count.
incremental = True
starting_modes = (2, 2) if incremental else (16, 16)

In [6]:
# Build the operator model, move it to the selected device and count its
# parameters for the summary printed later.
model = XNO(
    max_n_modes=(16, 16),
    # Use the mode count chosen by the `incremental` switch instead of a
    # hard-coded (2, 2); previously flipping `incremental` had no effect on
    # the model. With incremental=True this is still (2, 2).
    n_modes=starting_modes,
    hidden_channels=32,
    in_channels=1,
    out_channels=1,
    transformation="fno",
)
model = model.to(device)
n_params = count_model_params(model)

In [7]:
# Optimizer over all model parameters, paired with a cosine learning-rate schedule.
optimizer = AdamW(
    model.parameters(),
    lr=8e-3,
    weight_decay=1e-4,
)
# NOTE(review): T_max=30 is larger than the n_epochs=20 passed to the trainer
# below, so the cosine schedule would not reach its minimum — confirm intended.
scheduler = torch.optim.lr_scheduler.CosineAnnealingLR(
    optimizer,
    T_max=30,
)


In [8]:
# Data processor for incremental-resolution training, without input/output
# normalizers. With verbose=True it prints its resolution changes (see the
# cell output below).
data_transform = IncrementalDataProcessor(
    # no normalization on either side
    in_normalizer=None,
    out_normalizer=None,
    # resolution schedule
    dataset_resolution=16,
    subsampling_rates=[2, 1],
    dataset_indices=[2, 3],
    epoch_gap=10,
    # runtime options
    device=device,
    verbose=True,
).to(device)

Original Incre Res: change index to 0
Original Incre Res: change sub to 2
Original Incre Res: change res to 8


In [9]:
# Loss objects: H1 is used for training; both H1 and L2 are reported at evaluation.
h1loss = H1Loss(d=2)
l2loss = LpLoss(d=2, p=2)
train_loss = h1loss
eval_losses = {"h1": h1loss, "l2": l2loss}

# Print a summary of the run configuration.
print("\n### N PARAMS ###\n", n_params)
print("\n### OPTIMIZER ###\n", optimizer)
print("\n### SCHEDULER ###\n", scheduler)
print("\n### LOSSES ###")
print("\n### INCREMENTAL RESOLUTION + GRADIENT EXPLAINED ###")
print(f"\n * Train: {train_loss}")
# Flush on the last print so the summary appears before training output starts.
print(f"\n * Test: {eval_losses}", flush=True)


### N PARAMS ###
 2110305

### OPTIMIZER ###
 AdamW (
Parameter Group 0
    betas: (0.9, 0.999)
    correct_bias: True
    eps: 1e-06
    initial_lr: 0.008
    lr: 0.008
    weight_decay: 0.0001
)

### SCHEDULER ###
 <torch.optim.lr_scheduler.CosineAnnealingLR object at 0x16778c250>

### LOSSES ###

### INCREMENTAL RESOLUTION + GRADIENT EXPLAINED ###

 * Train: <neuralop.losses.data_losses.H1Loss object at 0x16a2bfc90>

 * Test: {'h1': <neuralop.losses.data_losses.H1Loss object at 0x16a2bfc90>, 'l2': <neuralop.losses.data_losses.LpLoss object at 0x16a2bf690>}


In [10]:
# Assemble the incremental trainer from the model and data processor built above.
trainer = IncrementalFNOTrainer(
    model=model,
    data_processor=data_transform,
    device=device,
    n_epochs=20,
    verbose=True,
    # gradient-based incremental settings (enabled)
    incremental_grad=True,
    incremental_grad_eps=0.9999,
    incremental_grad_max_iter=2,
    incremental_buffer=5,
    # loss-gap-based incremental settings (disabled)
    incremental_loss_gap=False,
    incremental_loss_eps=0.001,
    incremental_max_iter=1,
)

In [11]:
# Run training: H1 loss for optimization, H1 and L2 for evaluation, no regularizer.
trainer.train(
    train_loader,
    test_loaders,
    optimizer,
    scheduler,
    training_loss=train_loss,
    eval_losses=eval_losses,
    regularizer=False,
)

Training on 100 samples
Testing on [50, 50] samples         on resolutions [16, 32].
> /Users/sina/Documents/GitHub_Local/XNO/xno/layers/spectral_convolution_fourier.py(470)forward()
    468 
    469         import pdb; pdb.set_trace()
--> 470         out_fft[slices_x] = self._contract(x[slices_x], weight, separable=self.separable)
    471 
    472         if self.resolution_scaling_factor is not None and output_shape 

In [None]:
# NOTE(review): unexecuted scratch cell, unrelated to the training workflow
# above; consider deleting it before sharing the notebook.
x = "SINA"
x.lower()

In [None]:
# NOTE(review): unexecuted scratch cell. These look like tensor shapes jotted
# down while debugging (the first has zero-sized trailing dims) — confirm and
# remove if no longer needed.
torch.Size([1, 1, 0, 0])
torch.Size([32, 32, 16, 1])