In [None]:
import timm
import gc
import wandb
from fastai.vision.all import *
from fastai.callback.wandb import *
from utils.core import *

# Root of the Oxford-IIIT Pet dataset on this machine (absolute path; adjust when running elsewhere).
path = Path('/root/.fastai/data/oxford-iiit-pet')
# NOTE(review): presumably makes printed paths display relative to the dataset root — confirm.
Path.BASE_PATH = path

# Table describing the image sample to train on; get_dls() feeds it to ImageDataLoaders.from_df.
df = pd.read_csv('pets_sample.csv')

# W&B sweep definition: Bayesian search that minimises the logged `error_rate`.
# Entries with a single `value` are held constant; entries with `min`/`max` or
# `values` are the dimensions actually searched.
sweep_cfg = {
    'metric': {'name': 'error_rate', 'goal': 'minimize'},
    'method': 'bayes',
    'parameters': {
        # --- fixed settings -------------------------------------------------
        # Total epoch budget; trainer() spends `pre_epoch` of them before
        # unfreezing and the remainder afterwards. (This key used to be
        # defined twice in the literal; only one definition is kept.)
        'epochs': {'value': 15},
        # Size given to the item-level Resize.
        'pre_size': {'value': 160},
        # Size given to the batch-level aug_transforms.
        'post_size': {'value': 112},
        # Batch size before / after unfreezing.
        'pre_bs': {'value': 256},
        'post_bs': {'value': 192},

        # --- searched settings ----------------------------------------------
        # Peak learning rate for the first fit_one_cycle call.
        'pre_lr': {'min': 1e-3, 'max': 1e-2},
        # Number of epochs trained before unfreezing.
        'pre_epoch': {'values': [1, 2, 3, 5]},
        # Upper learning rate for the second fit_one_cycle call.
        'post_lr': {'min': 1e-3, 'max': 5e-3},
        # Divisor giving the lower learning rate: post_lr / post_div.
        'post_div': {'min': 50, 'max': 300},
    },
}

def get_dls(item_tfms=Resize(160),
            batch_tfms=aug_transforms(size=112),
            valid_pct=.4,
            bs=64):
    """Build image DataLoaders from the module-level `df`, with files under `path/'images'`.

    Args:
        item_tfms: item-level transform(s); defaults to `Resize(160)`.
        batch_tfms: batch-level transform(s); defaults to `aug_transforms(size=112)`.
        valid_pct: fraction of rows held out for validation.
        bs: batch size.

    Returns:
        The object produced by `ImageDataLoaders.from_df`.

    Note:
        The two transform defaults are created once, when this `def` is
        executed, so every call that relies on them receives the same objects.
        Pass fresh transforms explicitly if that sharing is not wanted.
    """
    # `from_df` derives its random train/valid split from `valid_pct` and
    # `seed`. A separate `splitter=RandomSplitter(seed=42)` keyword is not one
    # of its splitting inputs, so it is not passed: the split is fully
    # described by the two arguments below.
    return ImageDataLoaders.from_df(df, path/'images',
                                    valid_pct=valid_pct,
                                    seed=42,
                                    item_tfms=item_tfms,
                                    batch_tfms=batch_tfms,
                                    bs=bs)

def get_learn():
    """Return a vision learner for the module-level `arch`, tracking `error_rate`.

    Data comes from `get_dls()` called with all of its defaults.
    """
    default_dls = get_dls()
    return vision_learner(default_dls, arch, metrics=error_rate)

# Architecture name handed to vision_learner by get_learn() and trainer().
arch = 'convnext_tiny_in22k'

def trainer():
    """Run one sweep trial: train, unfreeze, train again, then release memory.

    All hyperparameters are read from `wandb.config` after `wandb.init`:
      * `pre_size`, `post_size`: sizes for the item Resize and batch augmentations.
      * `pre_bs`, `pre_epoch`, `pre_lr`: batch size, epoch count and peak
        learning rate for the first `fit_one_cycle` call.
      * `post_bs`, `post_lr`, `post_div`: batch size and learning-rate pair
        `(post_lr / post_div, post_lr)` for the second call, run after
        `learn.unfreeze()`.
      * `epochs`: total epoch budget; the second call gets `epochs - pre_epoch`.

    Metrics are reported through `WandbCallback`. Nothing is returned.
    """
    wandb.init(reinit=True)
    cfg = wandb.config

    learn = None
    dls = None
    try:
        dls = get_dls(item_tfms=Resize(cfg.pre_size),
                      batch_tfms=aug_transforms(size=cfg.post_size),
                      bs=cfg.pre_bs)
        # Use the loaders built from the sweep config. Calling get_dls() with
        # no arguments here would silently train the first phase with the
        # default batch size and sizes instead of the swept ones.
        learn = vision_learner(dls, arch,
                               cbs=[WandbCallback()],
                               metrics=error_rate)
        learn.fit_one_cycle(cfg.pre_epoch, lr_max=cfg.pre_lr)

        learn.unfreeze()
        # Same transforms, but rebuilt loaders with the post-unfreeze batch size.
        learn.dls = get_dls(item_tfms=Resize(cfg.pre_size),
                            batch_tfms=aug_transforms(size=cfg.post_size),
                            bs=cfg.post_bs)
        learn.fit_one_cycle(cfg.epochs - cfg.pre_epoch,
                            lr_max=(cfg.post_lr/cfg.post_div, cfg.post_lr))
    finally:
        # Drop references and flush the CUDA cache even when a trial fails, so
        # the next trial started by the agent does not inherit this one's memory.
        learn = None
        dls = None
        gc.collect()
        torch.cuda.empty_cache()
        gc.collect()

In [None]:
# Register the sweep described by sweep_cfg with W&B and keep its id for the agent.
# No project is passed here; the sweep URL printed for this cell is under "uncategorized".
sweep_id = wandb.sweep(sweep_cfg)

Create sweep with ID: eqtzlnpa
Sweep URL: https://wandb.ai/mark_b2/uncategorized/sweeps/eqtzlnpa


In [None]:
# Number of sweep trials this agent is asked to run.
count = 30

# Launch the agent: trainer() is invoked for each configuration handed out for sweep_id.
wandb.agent(sweep_id, function=trainer, count=count)

[34m[1mwandb[0m: Agent Starting Run: ue0t4e25 with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 142
[34m[1mwandb[0m: 	post_lr: 0.003599811738647518
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 2
[34m[1mwandb[0m: 	pre_lr: 0.005953066444339557
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,2.17772,1.235804,0.29684,00:21
1,1.335288,0.614822,0.181716,00:19


epoch,train_loss,valid_loss,error_rate,time
0,0.582611,0.521495,0.147855,00:32
1,0.528809,0.480726,0.139955,00:34
2,0.510912,0.450453,0.143341,00:32
3,0.46945,0.461765,0.143341,00:34
4,0.434231,0.441519,0.133183,00:32
5,0.397621,0.412497,0.124153,00:34
6,0.361418,0.454141,0.126411,00:33
7,0.325793,0.433878,0.11851,00:34
8,0.30329,0.437319,0.121896,00:33
9,0.281267,0.436678,0.130925,00:34


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▃▃▄▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▄▂▂▂▂▂▁▁▁▁▂▁▁▁
lr_0,▁▃▆███▇▆▅▄▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▃▆███▇▆▅▄▃▂▁▁▁▂▃▄▅▅▅▅▅▅▅▅▄▄▄▃▃▃▂▂▂▁▁▁▁▁
mom_0,█▇▃▁▁▁▂▃▄▅▆▇███▇▅▄▂▁▁▁▁▁▂▂▃▃▄▄▅▅▆▆▇▇████
mom_1,█▇▃▁▁▁▂▃▄▅▆▇███▇▅▄▂▁▁▁▁▁▂▂▃▃▄▄▅▅▆▆▇▇████
raw_loss,█▆▄▃▂▂▃▂▂▂▂▂▁▂▂▂▁▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.11738
lr_0,0.0
lr_1,0.0
mom_0,0.94993
mom_1,0.94993
raw_loss,0.11394
sqr_mom_0,0.99


[34m[1mwandb[0m: Agent Starting Run: 8com4bdy with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 124
[34m[1mwandb[0m: 	post_lr: 0.002003432307784184
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 5
[34m[1mwandb[0m: 	pre_lr: 0.0068666864040531385
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,2.397966,0.833584,0.22912,00:19
1,1.465582,0.746616,0.214447,00:19
2,1.111381,0.513342,0.172686,00:20
3,0.821673,0.507054,0.151242,00:19
4,0.632917,0.482132,0.145598,00:20


epoch,train_loss,valid_loss,error_rate,time
0,0.270486,0.461019,0.143341,00:32
1,0.27375,0.432991,0.142212,00:33
2,0.256579,0.437333,0.126411,00:33
3,0.246045,0.432042,0.123025,00:33
4,0.234093,0.432162,0.125282,00:33
5,0.218807,0.400259,0.126411,00:33
6,0.203766,0.402335,0.117381,00:33
7,0.191093,0.410897,0.11851,00:33
8,0.175586,0.414402,0.121896,00:34
9,0.167851,0.414887,0.120767,00:34


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃▃▃▃▄▄▄▅▅▅▆▆▆▇▇▇██
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▇▄▃▃▃▃▂▁▁▂▁▁▁▁
lr_0,▁▂▃▅▆█████▇▇▆▆▅▅▄▄▃▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▂▃▅▆█████▇▇▆▆▅▅▄▄▃▃▂▂▁▁▁▁▂▂▃▃▃▃▃▂▂▂▂▁▁▁
mom_0,█▇▆▄▃▁▁▁▁▁▂▂▃▃▄▄▅▅▆▇▇▇████▆▃▁▁▁▂▃▃▄▅▆▇██
mom_1,█▇▆▄▃▁▁▁▁▁▂▂▃▃▄▄▅▅▆▇▇▇████▆▃▁▁▁▂▃▃▄▅▆▇██
raw_loss,█▆▅▃▂▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.12077
lr_0,0.0
lr_1,0.0
mom_0,0.94988
mom_1,0.94988
raw_loss,0.11108
sqr_mom_0,0.99


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: huyub6yk with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 155
[34m[1mwandb[0m: 	post_lr: 0.003400996082835743
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 2
[34m[1mwandb[0m: 	pre_lr: 0.006197069664059922
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,2.084426,0.842091,0.215576,00:19
1,1.286467,0.56224,0.168172,00:19


epoch,train_loss,valid_loss,error_rate,time
0,0.6045,0.490483,0.147856,00:32
1,0.566612,0.441342,0.138826,00:34
2,0.518596,0.438406,0.134311,00:33
3,0.475245,0.435579,0.130926,00:33
4,0.441266,0.468858,0.143341,00:32
5,0.400058,0.438878,0.136569,00:34
6,0.364602,0.409831,0.124153,00:33
7,0.333965,0.399876,0.119639,00:34
8,0.302359,0.396745,0.121896,00:33
9,0.276099,0.404945,0.125282,00:34


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▃▃▄▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▅▃▂▂▂▃▂▁▁▁▁▁▁▁
lr_0,▁▃▆███▇▆▅▄▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▃▆███▇▆▅▄▃▂▁▁▁▂▂▃▄▅▅▅▅▅▄▄▄▄▃▃▃▃▂▂▂▁▁▁▁▁
mom_0,█▇▃▁▁▁▂▃▄▅▆▇███▇▅▄▂▁▁▁▁▁▂▂▃▃▄▄▅▅▆▆▇▇████
mom_1,█▇▃▁▁▁▂▃▄▅▆▇███▇▅▄▂▁▁▁▁▁▂▂▃▃▄▄▅▅▆▆▇▇████
raw_loss,█▇▄▃▃▂▃▂▂▂▂▂▂▂▂▂▂▂▁▂▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.12415
lr_0,0.0
lr_1,0.0
mom_0,0.94993
mom_1,0.94993
raw_loss,0.11107
sqr_mom_0,0.99


[34m[1mwandb[0m: Agent Starting Run: 43tf9co8 with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 186
[34m[1mwandb[0m: 	post_lr: 0.0012084244303314855
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 1
[34m[1mwandb[0m: 	pre_lr: 0.0034467599443813684
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,2.149378,0.84742,0.269752,00:19


epoch,train_loss,valid_loss,error_rate,time
0,1.051669,0.712124,0.235892,00:32
1,0.967457,0.582604,0.196388,00:33
2,0.901173,0.547134,0.176072,00:33
3,0.831682,0.472861,0.145598,00:33
4,0.754191,0.452431,0.148984,00:33
5,0.685761,0.429108,0.143341,00:33
6,0.637912,0.416003,0.133183,00:33
7,0.589108,0.414752,0.128668,00:33
8,0.544974,0.42914,0.142212,00:34
9,0.503717,0.418864,0.138826,00:33


VBox(children=(Label(value='0.792 MB of 0.792 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▅▆▆▆▆▆▇▇▇▇▇███
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▆▄▃▂▂▂▁▁▂▂▁▁▁▁
lr_0,▁▄██▆▄▃▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▄██▆▄▃▁▁▁▂▂▂▃▃▃▃▃▃▃▃▃▃▃▃▃▂▂▂▂▂▂▂▁▁▁▁▁▁▁
mom_0,█▆▁▁▃▅▆███▇▅▄▃▂▁▁▁▁▁▂▂▂▂▃▃▄▄▅▅▆▆▆▇▇▇████
mom_1,█▆▁▁▃▅▆███▇▅▄▃▂▁▁▁▁▁▂▂▂▂▃▃▄▄▅▅▆▆▆▇▇▇████
raw_loss,█▇▄▃▃▂▂▃▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.13093
lr_0,0.0
lr_1,0.0
mom_0,0.94994
mom_1,0.94994
raw_loss,0.28283
sqr_mom_0,0.99


[34m[1mwandb[0m: Agent Starting Run: yi8nm4nv with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 258
[34m[1mwandb[0m: 	post_lr: 0.003824958738122875
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 1
[34m[1mwandb[0m: 	pre_lr: 0.00121240170606479
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,2.782294,0.984042,0.323928,00:20


epoch,train_loss,valid_loss,error_rate,time
0,1.348972,0.732977,0.23702,00:33
1,1.194288,0.575599,0.174944,00:33
2,1.029995,0.573749,0.171558,00:34
3,0.900952,0.568701,0.179458,00:33
4,0.790445,0.505459,0.156885,00:33
5,0.704066,0.493014,0.141084,00:33
6,0.630956,0.475191,0.148984,00:34
7,0.566988,0.441504,0.137697,00:33
8,0.50886,0.441628,0.143341,00:34
9,0.458423,0.41935,0.13544,00:33


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▅▆▆▆▆▆▇▇▇▇▇███
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▅▃▃▃▂▂▂▁▂▁▁▁▁▁
lr_0,▁▄██▆▄▃▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▂▃▃▃▂▂▁▁▂▃▄▅▆▇█████▇▇▇▇▆▆▅▅▄▄▃▃▃▂▂▂▁▁▁▁
mom_0,█▆▁▁▃▅▆███▇▅▄▃▂▁▁▁▁▁▂▂▂▂▃▃▄▄▅▅▆▆▆▇▇▇████
mom_1,█▆▁▁▃▅▆███▇▅▄▃▂▁▁▁▁▁▂▂▂▂▃▃▄▄▅▅▆▆▆▇▇▇████
raw_loss,▇█▆▄▃▃▃▃▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.13093
lr_0,0.0
lr_1,0.0
mom_0,0.94994
mom_1,0.94994
raw_loss,0.14933
sqr_mom_0,0.99


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 9t9b4nyu with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 130
[34m[1mwandb[0m: 	post_lr: 0.003501266480924779
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 2
[34m[1mwandb[0m: 	pre_lr: 0.003658979201231808
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,2.326228,0.815761,0.22912,00:19
1,1.419945,0.560383,0.179458,00:19


epoch,train_loss,valid_loss,error_rate,time
0,0.690405,0.470045,0.142212,00:32
1,0.618581,0.446282,0.146727,00:34
2,0.58244,0.47988,0.159142,00:33
3,0.538173,0.53751,0.168172,00:34
4,0.490013,0.456427,0.154628,00:32
5,0.448247,0.400459,0.123025,00:34
6,0.405381,0.420909,0.125282,00:33
7,0.372415,0.421325,0.132054,00:34
8,0.334816,0.383081,0.121896,00:32
9,0.304944,0.37085,0.116253,00:34


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▃▃▄▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▅▃▃▄▄▄▂▂▂▂▁▁▁▁
lr_0,▁▃▆███▇▆▅▄▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▃▆███▇▆▅▄▃▂▁▁▁▂▄▅▇████▇▇▇▆▆▅▅▄▄▃▃▂▂▁▁▁▁
mom_0,█▇▃▁▁▁▂▃▄▅▆▇███▇▅▄▂▁▁▁▁▁▂▂▃▃▄▄▅▅▆▆▇▇████
mom_1,█▇▃▁▁▁▂▃▄▅▆▇███▇▅▄▂▁▁▁▁▁▂▂▃▃▄▄▅▅▆▆▇▇████
raw_loss,██▄▃▃▃▂▂▂▂▂▂▂▁▂▂▂▂▁▂▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.11738
lr_0,0.0
lr_1,0.0
mom_0,0.94993
mom_1,0.94993
raw_loss,0.14498
sqr_mom_0,0.99


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: v3d4qlry with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 287
[34m[1mwandb[0m: 	post_lr: 0.004788432780392347
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 3
[34m[1mwandb[0m: 	pre_lr: 0.0013228319674035798
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,3.14417,0.950282,0.320542,00:20
1,1.90219,0.589652,0.199774,00:19
2,1.345357,0.52755,0.167043,00:19


epoch,train_loss,valid_loss,error_rate,time
0,0.698349,0.485296,0.147856,00:34
1,0.670701,0.547167,0.17833,00:32
2,0.637045,0.494433,0.150113,00:34
3,0.580854,0.563814,0.154628,00:33
4,0.543937,0.457302,0.136569,00:34
5,0.490216,0.487159,0.144469,00:32
6,0.444615,0.509974,0.138826,00:34
7,0.410669,0.461174,0.136569,00:32
8,0.372316,0.443881,0.141083,00:34
9,0.34042,0.427191,0.138826,00:33


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇██
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▃▂▁▃▂▂▁▁▁▁▁▁▁▁
lr_0,▁▂▄▇███▇▇▆▆▅▄▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▁▂▃▃▃▃▃▃▂▂▂▂▂▁▁▁▁▁▂▄▆▇████▇▇▆▅▅▄▃▃▂▂▁▁▁
mom_0,█▇▅▂▁▁▁▂▂▃▃▄▅▆▇▇████▆▃▂▁▁▁▁▂▂▃▄▄▅▆▆▇▇███
mom_1,█▇▅▂▁▁▁▂▂▃▃▄▅▆▇▇████▆▃▂▁▁▁▁▂▂▃▄▄▅▆▆▇▇███
raw_loss,██▇▄▃▃▃▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.13544
lr_0,0.0
lr_1,0.0
mom_0,0.94992
mom_1,0.94992
raw_loss,0.11935
sqr_mom_0,0.99


[34m[1mwandb[0m: Agent Starting Run: td272lfs with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 126
[34m[1mwandb[0m: 	post_lr: 0.003587295254683906
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 3
[34m[1mwandb[0m: 	pre_lr: 0.0033813688479561103
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,2.562408,0.837786,0.241535,00:20
1,1.547051,0.580658,0.190745,00:19
2,1.104766,0.506475,0.162528,00:20


epoch,train_loss,valid_loss,error_rate,time
0,0.448328,0.493916,0.159142,00:34
1,0.468744,0.461377,0.145598,00:33
2,0.427296,0.479468,0.144469,00:35
3,0.390661,0.506558,0.147856,00:33
4,0.354919,0.429439,0.141084,00:33
5,0.332366,0.452907,0.134312,00:32
6,0.310313,0.484796,0.151241,00:34
7,0.288443,0.452299,0.138826,00:32
8,0.269713,0.425541,0.124153,00:33
9,0.248628,0.418213,0.121896,00:32


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇██
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▅▄▃▃▃▃▂▂▃▂▁▁▁▁
lr_0,▁▂▄▇███▇▇▆▆▅▄▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▂▄▇▇█▇▇▇▆▅▄▄▃▂▂▁▁▁▂▄▆▇████▇▇▆▅▅▄▃▃▂▂▁▁▁
mom_0,█▇▅▂▁▁▁▂▂▃▃▄▅▆▇▇████▆▃▂▁▁▁▁▂▂▃▄▄▅▆▆▇▇███
mom_1,█▇▅▂▁▁▁▂▂▃▃▄▅▆▇▇████▆▃▂▁▁▁▁▂▂▃▄▄▅▆▆▇▇███
raw_loss,██▅▃▃▂▂▂▃▂▂▂▂▂▂▂▂▁▁▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.11738
lr_0,0.0
lr_1,0.0
mom_0,0.94992
mom_1,0.94992
raw_loss,0.13791
sqr_mom_0,0.99


[34m[1mwandb[0m: Agent Starting Run: p1eacgwh with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 138
[34m[1mwandb[0m: 	post_lr: 0.0034955001640792687
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 3
[34m[1mwandb[0m: 	pre_lr: 0.003001901170682759
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,2.632253,0.734553,0.214447,00:19
1,1.541019,0.535822,0.1614,00:19
2,1.106514,0.468172,0.155756,00:19


epoch,train_loss,valid_loss,error_rate,time
0,0.578427,0.453573,0.147856,00:33
1,0.522061,0.461707,0.147856,00:33
2,0.474826,0.432214,0.133183,00:33
3,0.441368,0.444765,0.137697,00:32
4,0.418523,0.454446,0.137698,00:33
5,0.392423,0.47694,0.146727,00:33
6,0.362539,0.436759,0.146727,00:33
7,0.328382,0.428695,0.141084,00:32
8,0.298259,0.443005,0.13544,00:35
9,0.272708,0.434441,0.130926,00:33


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇██
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▄▃▂▂▁▂▂▂▂▂▁▁▁▁
lr_0,▁▂▄▇███▇▇▆▆▅▄▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▂▄▆▇▇▇▇▆▅▅▄▃▃▂▂▁▁▁▂▄▆▇████▇▇▆▅▅▄▃▃▂▂▁▁▁
mom_0,█▇▅▂▁▁▁▂▂▃▃▄▅▆▇▇████▆▃▂▁▁▁▁▂▂▃▄▄▅▆▆▇▇███
mom_1,█▇▅▂▁▁▁▂▂▃▃▄▅▆▇▇████▆▃▂▁▁▁▁▂▂▃▄▄▅▆▆▇▇███
raw_loss,██▅▄▃▂▃▂▂▂▂▁▂▂▁▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.13205
lr_0,0.0
lr_1,0.0
mom_0,0.94992
mom_1,0.94992
raw_loss,0.15636
sqr_mom_0,0.99


[34m[1mwandb[0m: Agent Starting Run: 81h6oay3 with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 69
[34m[1mwandb[0m: 	post_lr: 0.0025340396295877067
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 5
[34m[1mwandb[0m: 	pre_lr: 0.007686799891943015
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,2.383051,0.854751,0.231377,00:19
1,1.514319,0.828415,0.251693,00:20
2,1.096589,0.585221,0.1614,00:20
3,0.817414,0.454033,0.137698,00:19
4,0.645934,0.44901,0.129797,00:19


epoch,train_loss,valid_loss,error_rate,time
0,0.302487,0.416906,0.121896,00:32
1,0.288271,0.407838,0.126411,00:33
2,0.265111,0.422208,0.136569,00:33
3,0.240113,0.411726,0.126411,00:33
4,0.218281,0.435338,0.13544,00:33
5,0.202749,0.446755,0.134312,00:33
6,0.192129,0.422532,0.121896,00:34
7,0.178232,0.417544,0.11851,00:33
8,0.164369,0.412968,0.117381,00:33
9,0.155178,0.411373,0.117381,00:33


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃▃▃▃▄▄▄▅▅▅▆▆▆▇▇▇██
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,▇█▃▂▂▁▁▂▁▂▂▁▁▁▁
lr_0,▁▂▃▅▆█████▇▇▆▆▅▅▄▄▃▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▂▃▅▆█████▇▇▆▆▅▅▄▄▃▃▂▂▁▁▁▁▂▃▃▃▃▃▃▃▂▂▂▁▁▁
mom_0,█▇▆▄▃▁▁▁▁▁▂▂▃▃▄▄▅▅▆▇▇▇████▆▃▁▁▁▂▃▃▄▅▆▇██
mom_1,█▇▆▄▃▁▁▁▁▁▂▂▃▃▄▄▅▅▆▇▇▇████▆▃▁▁▁▂▃▃▄▅▆▇██
raw_loss,█▆▄▃▃▂▂▂▂▂▂▂▂▂▁▂▁▁▂▁▁▁▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.11738
lr_0,0.0
lr_1,0.0
mom_0,0.94988
mom_1,0.94988
raw_loss,0.06792
sqr_mom_0,0.99


[34m[1mwandb[0m: Agent Starting Run: au5ethdm with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 130
[34m[1mwandb[0m: 	post_lr: 0.0039904652371596586
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 5
[34m[1mwandb[0m: 	pre_lr: 0.008189877948369496
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,2.332395,1.17042,0.291196,00:20
1,1.481106,0.693923,0.205418,00:19
2,1.114305,0.561515,0.158014,00:19
3,0.804627,0.450331,0.142212,00:20
4,0.625933,0.435756,0.142212,00:20


epoch,train_loss,valid_loss,error_rate,time
0,0.323571,0.415457,0.129797,00:33
1,0.301156,0.431286,0.128668,00:33
2,0.2723,0.463507,0.153499,00:33
3,0.25527,0.434237,0.125282,00:33
4,0.237609,0.497321,0.143341,00:33
5,0.217559,0.435075,0.124153,00:32
6,0.203603,0.42199,0.12754,00:34
7,0.190767,0.412594,0.123025,00:33
8,0.17644,0.412727,0.116253,00:33
9,0.163157,0.410259,0.117381,00:33


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃▃▃▃▄▄▄▅▅▅▆▆▆▇▇▇██
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▅▃▂▂▂▁▂▁▂▁▁▁▁▁
lr_0,▁▂▃▅▆█████▇▇▆▆▅▅▄▄▃▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▂▃▅▆█████▇▇▆▆▅▅▄▄▃▂▂▂▁▁▁▁▂▃▄▄▄▄▄▃▃▂▂▁▁▁
mom_0,█▇▆▄▃▁▁▁▁▁▂▂▃▃▄▄▅▅▆▇▇▇████▆▃▁▁▁▂▃▃▄▅▆▇██
mom_1,█▇▆▄▃▁▁▁▁▁▂▂▃▃▄▄▅▅▆▇▇▇████▆▃▁▁▁▂▃▃▄▅▆▇██
raw_loss,█▆▄▃▂▃▂▂▃▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.11738
lr_0,0.0
lr_1,0.0
mom_0,0.94988
mom_1,0.94988
raw_loss,0.11966
sqr_mom_0,0.99


[34m[1mwandb[0m: Agent Starting Run: kf0t2izu with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 132
[34m[1mwandb[0m: 	post_lr: 0.004467565792299251
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 3
[34m[1mwandb[0m: 	pre_lr: 0.007015047168113523
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,2.168519,0.787125,0.208804,00:20
1,1.338106,0.671849,0.204289,00:20
2,0.94831,0.474272,0.141084,00:20


epoch,train_loss,valid_loss,error_rate,time
0,0.464539,0.437945,0.138826,00:33
1,0.414806,0.41271,0.142212,00:33
2,0.38152,0.426968,0.138826,00:36
3,0.353234,0.506418,0.148984,00:33
4,0.338942,0.516808,0.148984,00:34
5,0.313766,0.470527,0.141084,00:35
6,0.286498,0.465518,0.13544,00:36
7,0.263331,0.467181,0.132054,00:34
8,0.243003,0.431571,0.120767,00:33
9,0.225154,0.417244,0.113995,00:33


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇██
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,██▃▃▃▃▄▄▃▃▂▁▁▁▁
lr_0,▁▂▄▇███▇▇▆▆▅▄▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▂▄▇███▇▇▆▆▅▄▃▂▂▁▁▁▁▃▄▅▅▅▅▅▅▅▄▄▃▃▂▂▂▁▁▁▁
mom_0,█▇▅▂▁▁▁▂▂▃▃▄▅▆▇▇████▆▃▂▁▁▁▁▂▂▃▄▄▅▆▆▇▇███
mom_1,█▇▅▂▁▁▁▂▂▃▃▄▅▆▇▇████▆▃▂▁▁▁▁▂▂▃▄▄▅▆▆▇▇███
raw_loss,█▇▄▃▃▂▂▂▂▂▂▂▂▂▂▂▂▂▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.11512
lr_0,0.0
lr_1,0.0
mom_0,0.94992
mom_1,0.94992
raw_loss,0.11166
sqr_mom_0,0.99


[34m[1mwandb[0m: Agent Starting Run: 3hvhp3ym with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 173
[34m[1mwandb[0m: 	post_lr: 0.0015112958851122992
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 2
[34m[1mwandb[0m: 	pre_lr: 0.008184473119240773
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,2.107058,0.970963,0.247178,00:20
1,1.368828,0.613855,0.19526,00:19


epoch,train_loss,valid_loss,error_rate,time
0,0.639103,0.574777,0.180587,00:32
1,0.610664,0.532427,0.167043,00:33
2,0.559732,0.509613,0.164786,00:33
3,0.51513,0.467468,0.155756,00:33
4,0.474509,0.456886,0.139955,00:33
5,0.44168,0.441778,0.14447,00:34
6,0.412166,0.412644,0.12754,00:33
7,0.387395,0.413294,0.129797,00:37
8,0.358232,0.408659,0.124153,00:35
9,0.337805,0.410938,0.124153,00:35


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▃▃▄▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▅▄▄▃▃▂▂▁▁▁▁▁▁▁
lr_0,▁▃▆███▇▆▅▄▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▃▆███▇▆▅▄▃▂▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁
mom_0,█▇▃▁▁▁▂▃▄▅▆▇███▇▅▄▂▁▁▁▁▁▂▂▃▃▄▄▅▅▆▆▇▇████
mom_1,█▇▃▁▁▁▂▃▄▅▆▇███▇▅▄▂▁▁▁▁▁▂▂▃▃▄▄▅▅▆▆▇▇████
raw_loss,█▆▄▃▂▃▃▂▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.1219
lr_0,0.0
lr_1,0.0
mom_0,0.94993
mom_1,0.94993
raw_loss,0.20895
sqr_mom_0,0.99


[34m[1mwandb[0m: Agent Starting Run: e66jviqd with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 81
[34m[1mwandb[0m: 	post_lr: 0.0010236798188908308
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 2
[34m[1mwandb[0m: 	pre_lr: 0.008735506879459766
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,2.083353,0.994506,0.225734,00:19
1,1.317363,0.641394,0.17833,00:19


epoch,train_loss,valid_loss,error_rate,time
0,0.689335,0.590286,0.163657,00:33
1,0.648251,0.492912,0.153499,00:35
2,0.594386,0.439799,0.142212,00:35
3,0.547851,0.422894,0.148984,00:36
4,0.507379,0.423431,0.145598,00:32
5,0.473888,0.39673,0.13544,00:34
6,0.435845,0.37951,0.134312,00:33
7,0.407873,0.371379,0.12754,00:35
8,0.384903,0.3726,0.125282,00:35
9,0.364568,0.369822,0.121896,00:36


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▃▃▄▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▅▄▃▃▃▃▂▂▂▁▁▁▁▁
lr_0,▁▃▆███▇▆▅▄▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▃▆███▇▆▅▄▃▂▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁
mom_0,█▇▃▁▁▁▂▃▄▅▆▇███▇▅▄▂▁▁▁▁▁▂▂▃▃▄▄▅▅▆▆▇▇████
mom_1,█▇▃▁▁▁▂▃▄▅▆▇███▇▅▄▂▁▁▁▁▁▂▂▃▃▄▄▅▅▆▆▇▇████
raw_loss,█▆▃▂▂▃▃▂▂▂▂▂▂▂▂▂▂▂▁▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.11851
lr_0,0.0
lr_1,0.0
mom_0,0.94993
mom_1,0.94993
raw_loss,0.20204
sqr_mom_0,0.99


[34m[1mwandb[0m: Agent Starting Run: 9cjjqbfj with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 81
[34m[1mwandb[0m: 	post_lr: 0.002523710684067091
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 1
[34m[1mwandb[0m: 	pre_lr: 0.003200195141813191
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,2.223339,0.847811,0.267494,00:20


epoch,train_loss,valid_loss,error_rate,time
0,0.974247,0.632088,0.20316,00:34
1,0.890583,0.549706,0.168172,00:34
2,0.805847,0.507929,0.160271,00:34
3,0.714285,0.469939,0.142212,00:33
4,0.633801,0.446418,0.136569,00:34
5,0.564793,0.442334,0.136569,00:33
6,0.511307,0.404928,0.128668,00:33
7,0.458429,0.389142,0.126411,00:34
8,0.417775,0.402057,0.127539,00:34
9,0.379768,0.397244,0.125282,00:33


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▅▆▆▆▆▆▇▇▇▇▇███
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▅▃▃▂▂▂▁▁▁▁▁▁▁▁
lr_0,▁▄██▆▄▃▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▄██▆▄▃▁▁▁▂▃▄▅▆▆▇▆▆▆▆▆▆▅▅▅▄▄▄▃▃▃▂▂▂▁▁▁▁▁
mom_0,█▆▁▁▃▅▆███▇▅▄▃▂▁▁▁▁▁▂▂▂▂▃▃▄▄▅▅▆▆▆▇▇▇████
mom_1,█▆▁▁▃▅▆███▇▅▄▃▂▁▁▁▁▁▂▂▂▂▃▃▄▄▅▅▆▆▆▇▇▇████
raw_loss,██▅▃▃▃▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.11964
lr_0,0.0
lr_1,0.0
mom_0,0.94994
mom_1,0.94994
raw_loss,0.17897
sqr_mom_0,0.99


[34m[1mwandb[0m: Agent Starting Run: 2ej1vpnc with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 191
[34m[1mwandb[0m: 	post_lr: 0.004455571284633971
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 3
[34m[1mwandb[0m: 	pre_lr: 0.0029666999877714616
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,2.646176,0.762773,0.208804,00:20
1,1.534201,0.528379,0.176072,00:19
2,1.081072,0.50199,0.162528,00:20


epoch,train_loss,valid_loss,error_rate,time
0,0.503312,0.440839,0.146727,00:33
1,0.483618,0.4481,0.145598,00:33
2,0.451274,0.470136,0.148984,00:33
3,0.426776,0.500527,0.146727,00:33
4,0.395996,0.488451,0.151242,00:33
5,0.361424,0.461218,0.141084,00:33
6,0.338905,0.446973,0.129797,00:33
7,0.313188,0.45042,0.127539,00:33
8,0.291364,0.465599,0.126411,00:33
9,0.271814,0.467761,0.134311,00:33


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇██
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▅▄▃▃▃▃▃▂▁▁▁▂▁▁
lr_0,▁▂▄▇███▇▇▆▆▅▄▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▂▃▅▅▆▅▅▅▄▄▃▃▂▂▁▁▁▁▂▄▆▇████▇▇▆▅▅▄▃▃▂▂▁▁▁
mom_0,█▇▅▂▁▁▁▂▂▃▃▄▅▆▇▇████▆▃▂▁▁▁▁▂▂▃▄▄▅▆▆▇▇███
mom_1,█▇▅▂▁▁▁▂▂▃▃▄▅▆▇▇████▆▃▂▁▁▁▁▂▂▃▄▄▅▆▆▇▇███
raw_loss,██▅▃▃▃▂▂▂▂▂▂▂▁▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.13093
lr_0,0.0
lr_1,0.0
mom_0,0.94992
mom_1,0.94992
raw_loss,0.09103
sqr_mom_0,0.99


[34m[1mwandb[0m: Agent Starting Run: 451qwzms with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 76
[34m[1mwandb[0m: 	post_lr: 0.0027006625386848124
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 2
[34m[1mwandb[0m: 	pre_lr: 0.003746141169832658
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,2.367069,0.746705,0.239278,00:20
1,1.439292,0.577544,0.188488,00:20


epoch,train_loss,valid_loss,error_rate,time
0,0.634081,0.507914,0.163657,00:32
1,0.600396,0.471824,0.146727,00:34
2,0.528556,0.46552,0.154628,00:33
3,0.481625,0.450475,0.144469,00:34
4,0.445858,0.442038,0.142212,00:33
5,0.406687,0.420026,0.142212,00:34
6,0.363821,0.462228,0.143341,00:33
7,0.333004,0.426473,0.126411,00:33
8,0.302575,0.390546,0.119639,00:33
9,0.277664,0.384006,0.116253,00:34


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▃▃▄▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▅▄▃▃▃▃▃▃▂▁▁▁▁▁
lr_0,▁▃▆███▇▆▅▄▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▃▆███▇▆▅▄▃▂▁▁▁▂▃▄▅▆▆▆▆▆▆▅▅▅▄▄▃▃▃▂▂▂▁▁▁▁
mom_0,█▇▃▁▁▁▂▃▄▅▆▇███▇▅▄▂▁▁▁▁▁▂▂▃▃▄▄▅▅▆▆▇▇████
mom_1,█▇▃▁▁▁▂▃▄▅▆▇███▇▅▄▂▁▁▁▁▁▂▂▃▃▄▄▅▅▆▆▇▇████
raw_loss,█▇▅▃▃▂▂▂▂▂▂▂▁▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.114
lr_0,0.0
lr_1,0.0
mom_0,0.94993
mom_1,0.94993
raw_loss,0.14247
sqr_mom_0,0.99


[34m[1mwandb[0m: Agent Starting Run: 1zrjftk0 with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 144
[34m[1mwandb[0m: 	post_lr: 0.002376118889493601
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 3
[34m[1mwandb[0m: 	pre_lr: 0.0016276775005191382
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,3.039384,0.802005,0.249436,00:20
1,1.76446,0.504079,0.1614,00:19
2,1.262444,0.489636,0.153499,00:19


epoch,train_loss,valid_loss,error_rate,time
0,0.656223,0.468509,0.145598,00:34
1,0.648477,0.483663,0.15237,00:33
2,0.592987,0.475368,0.147856,00:34
3,0.543069,0.49583,0.167043,00:33
4,0.496596,0.446144,0.134311,00:34
5,0.455387,0.455743,0.142212,00:32
6,0.418401,0.438576,0.130925,00:34
7,0.382351,0.408487,0.113995,00:33
8,0.35299,0.401242,0.120767,00:34
9,0.327598,0.398446,0.120767,00:33


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇██
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▃▃▃▃▃▄▂▂▂▁▁▁▁▁
lr_0,▁▂▄▇███▇▇▆▆▅▄▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▂▃▅▆▆▆▅▅▄▄▃▃▃▂▁▁▁▁▂▄▆▇████▇▇▆▅▅▄▃▃▂▂▁▁▁
mom_0,█▇▅▂▁▁▁▂▂▃▃▄▅▆▇▇████▆▃▂▁▁▁▁▂▂▃▄▄▅▆▆▇▇███
mom_1,█▇▅▂▁▁▁▂▂▃▃▄▅▆▇▇████▆▃▂▁▁▁▁▂▂▃▄▄▅▆▆▇▇███
raw_loss,█▇▇▄▃▃▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▁▁▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.12302
lr_0,0.0
lr_1,0.0
mom_0,0.94992
mom_1,0.94992
raw_loss,0.16313
sqr_mom_0,0.99


[34m[1mwandb[0m: Agent Starting Run: 0m5jid31 with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 216
[34m[1mwandb[0m: 	post_lr: 0.002065075879538552
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 2
[34m[1mwandb[0m: 	pre_lr: 0.003174990843821578
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,2.355474,0.796755,0.225734,00:20
1,1.437724,0.578062,0.185102,00:19


epoch,train_loss,valid_loss,error_rate,time
0,0.706041,0.504443,0.151242,00:33
1,0.647407,0.468833,0.151241,00:34
2,0.601124,0.47132,0.151242,00:33
3,0.556135,0.458107,0.14447,00:34
4,0.517073,0.432069,0.136569,00:32
5,0.482797,0.401132,0.134311,00:34
6,0.43935,0.402155,0.123025,00:33
7,0.403766,0.413007,0.125282,00:35
8,0.369893,0.414629,0.126411,00:33
9,0.341558,0.408035,0.130926,00:35


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▃▃▄▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▅▃▃▃▂▂▂▁▁▁▂▂▂▂
lr_0,▁▃▆███▇▆▅▄▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▃▆███▇▆▅▄▃▂▁▁▁▂▃▄▅▅▆▆▅▅▅▅▅▄▄▄▃▃▂▂▂▂▁▁▁▁
mom_0,█▇▃▁▁▁▂▃▄▅▆▇███▇▅▄▂▁▁▁▁▁▂▂▃▃▄▄▅▅▆▆▇▇████
mom_1,█▇▃▁▁▁▂▃▄▅▆▇███▇▅▄▂▁▁▁▁▁▂▂▃▃▄▄▅▅▆▆▇▇████
raw_loss,█▇▄▄▂▃▃▂▂▃▂▂▂▁▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.13093
lr_0,0.0
lr_1,0.0
mom_0,0.94993
mom_1,0.94993
raw_loss,0.15933
sqr_mom_0,0.99


[34m[1mwandb[0m: Agent Starting Run: ffc46vcn with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 58
[34m[1mwandb[0m: 	post_lr: 0.00286638116411079
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 1
[34m[1mwandb[0m: 	pre_lr: 0.006022541509607214
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,2.093721,0.885581,0.25395,00:20


epoch,train_loss,valid_loss,error_rate,time
0,0.966566,0.660203,0.205418,00:33
1,0.842556,0.616933,0.207675,00:34
2,0.765586,0.507888,0.150113,00:34
3,0.679582,0.466386,0.150113,00:34
4,0.592968,0.431342,0.125282,00:34
5,0.523338,0.441271,0.13544,00:33
6,0.467139,0.40874,0.123025,00:34
7,0.42014,0.435092,0.136569,00:34
8,0.378222,0.453344,0.138826,00:36
9,0.340776,0.413093,0.126411,00:33


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▅▆▆▆▆▆▇▇▇▇▇███
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▆▆▃▃▂▂▁▂▂▂▁▁▁▁
lr_0,▁▄██▆▄▃▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▄██▆▄▃▁▁▁▂▂▃▄▄▄▄▄▄▄▄▄▄▄▃▃▃▃▃▂▂▂▂▂▁▁▁▁▁▁
mom_0,█▆▁▁▃▅▆███▇▅▄▃▂▁▁▁▁▁▂▂▂▂▃▃▄▄▅▅▆▆▆▇▇▇████
mom_1,█▆▁▁▃▅▆███▇▅▄▃▂▁▁▁▁▁▂▂▂▂▃▃▄▄▅▅▆▆▆▇▇▇████
raw_loss,██▄▃▃▃▂▃▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.114
lr_0,0.0
lr_1,0.0
mom_0,0.94994
mom_1,0.94994
raw_loss,0.1335
sqr_mom_0,0.99


[34m[1mwandb[0m: Agent Starting Run: tp0b6hgc with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 114
[34m[1mwandb[0m: 	post_lr: 0.0015858161442347338
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 3
[34m[1mwandb[0m: 	pre_lr: 0.0028229823154292608
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,2.709452,0.845659,0.282167,00:19
1,1.606764,0.574973,0.179458,00:19
2,1.135308,0.496721,0.151242,00:20


epoch,train_loss,valid_loss,error_rate,time
0,0.549196,0.47468,0.147856,00:33
1,0.502948,0.453826,0.139955,00:33
2,0.479748,0.432084,0.145598,00:33
3,0.450134,0.434541,0.13544,00:33
4,0.417833,0.433617,0.13544,00:33
5,0.384932,0.427796,0.145598,00:33
6,0.358816,0.423249,0.137698,00:34
7,0.337678,0.423052,0.133183,00:33
8,0.311308,0.422253,0.13544,00:34
9,0.290924,0.410793,0.129797,00:34


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇██
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▃▂▂▂▂▁▁▂▂▁▁▁▁▁
lr_0,▁▂▄▇███▇▇▆▆▅▄▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▂▄▇███▇▇▆▆▅▄▃▂▂▁▁▁▁▂▄▄▅▅▅▅▄▄▄▃▃▃▂▂▂▁▁▁▁
mom_0,█▇▅▂▁▁▁▂▂▃▃▄▅▆▇▇████▆▃▂▁▁▁▁▂▂▃▄▄▅▆▆▇▇███
mom_1,█▇▅▂▁▁▁▂▂▃▃▄▅▆▇▇████▆▃▂▁▁▁▁▂▂▃▄▄▅▆▆▇▇███
raw_loss,██▅▃▃▂▂▂▂▂▁▂▁▁▂▂▂▂▁▂▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.12641
lr_0,0.0
lr_1,0.0
mom_0,0.94992
mom_1,0.94992
raw_loss,0.22411
sqr_mom_0,0.99


[34m[1mwandb[0m: Agent Starting Run: euak0gor with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 204
[34m[1mwandb[0m: 	post_lr: 0.00441352764663755
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 3
[34m[1mwandb[0m: 	pre_lr: 0.003788434247017028
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,2.528401,0.79699,0.234763,00:20
1,1.497056,0.547241,0.180587,00:20
2,1.079141,0.503614,0.159142,00:20


epoch,train_loss,valid_loss,error_rate,time
0,0.536978,0.465534,0.154628,00:33
1,0.488248,0.464268,0.148984,00:33
2,0.445465,0.464427,0.148984,00:33
3,0.435671,0.441287,0.139955,00:33
4,0.40988,0.482951,0.145598,00:33
5,0.37909,0.496436,0.145598,00:34
6,0.353878,0.480914,0.138826,00:34
7,0.331267,0.466356,0.137698,00:34
8,0.301833,0.451254,0.138826,00:34
9,0.277653,0.439015,0.129797,00:35


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇██
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▄▃▃▂▂▂▂▂▂▂▂▁▁▁
lr_0,▁▂▄▇███▇▇▆▆▅▄▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▂▄▆▇▇▇▇▆▅▅▄▃▃▂▂▁▁▁▂▄▆▇████▇▇▆▅▅▄▃▃▂▂▁▁▁
mom_0,█▇▅▂▁▁▁▂▂▃▃▄▅▆▇▇████▆▃▂▁▁▁▁▂▂▃▄▄▅▆▆▇▇███
mom_1,█▇▅▂▁▁▁▂▂▃▃▄▅▆▇▇████▆▃▂▁▁▁▁▂▂▃▄▄▅▆▆▇▇███
raw_loss,█▇▅▃▃▃▂▂▂▂▂▂▁▂▂▂▂▂▁▂▁▂▁▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.13093
lr_0,0.0
lr_1,0.0
mom_0,0.94992
mom_1,0.94992
raw_loss,0.15744
sqr_mom_0,0.99


[34m[1mwandb[0m: Agent Starting Run: 37p1jww9 with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 75
[34m[1mwandb[0m: 	post_lr: 0.002119172275097908
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 2
[34m[1mwandb[0m: 	pre_lr: 0.001896224995186232
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,2.711061,0.726806,0.233634,00:20
1,1.646406,0.607147,0.194131,00:19


epoch,train_loss,valid_loss,error_rate,time
0,0.77019,0.543648,0.160271,00:33
1,0.726816,0.494431,0.158014,00:34
2,0.679798,0.459306,0.153499,00:33
3,0.627472,0.505749,0.156885,00:34
4,0.57015,0.453655,0.134311,00:33
5,0.526811,0.436477,0.12754,00:34
6,0.476705,0.430584,0.125282,00:33
7,0.430411,0.455985,0.138826,00:34
8,0.394864,0.414766,0.128668,00:33
9,0.362069,0.395216,0.123025,00:34


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▃▃▄▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▆▄▃▃▃▂▂▁▂▂▁▁▁▁
lr_0,▁▃▆███▇▆▅▄▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▂▅▇▇▇▆▅▄▃▃▂▁▁▁▂▄▅▇█████▇▇▆▆▅▅▄▄▃▃▂▂▁▁▁▁
mom_0,█▇▃▁▁▁▂▃▄▅▆▇███▇▅▄▂▁▁▁▁▁▂▂▃▃▄▄▅▅▆▆▇▇████
mom_1,█▇▃▁▁▁▂▃▄▅▆▇███▇▅▄▂▁▁▁▁▁▂▂▃▃▄▄▅▅▆▆▇▇████
raw_loss,█▇▅▅▃▃▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.11851
lr_0,0.0
lr_1,0.0
mom_0,0.94993
mom_1,0.94993
raw_loss,0.14491
sqr_mom_0,0.99


[34m[1mwandb[0m: Agent Starting Run: txm7nlv3 with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 121
[34m[1mwandb[0m: 	post_lr: 0.003866361245280322
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 1
[34m[1mwandb[0m: 	pre_lr: 0.007574758941115778
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,1.907859,0.792807,0.259594,00:20


epoch,train_loss,valid_loss,error_rate,time
0,0.8105,0.575347,0.173815,00:33
1,0.785528,0.511758,0.163657,00:34
2,0.711367,0.468342,0.153499,00:33
3,0.634053,0.441719,0.129797,00:33
4,0.577077,0.433488,0.143341,00:34
5,0.521618,0.445402,0.137698,00:33
6,0.462475,0.443481,0.125282,00:33
7,0.418392,0.459982,0.132054,00:33
8,0.374688,0.425061,0.123025,00:34
9,0.343629,0.395278,0.111738,00:33


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▅▆▆▆▆▆▇▇▇▇▇███
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▄▃▃▂▂▂▂▂▂▁▁▁▁▁
lr_0,▁▄██▆▄▃▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▄██▆▄▃▁▁▁▂▂▃▄▄▄▅▅▄▄▄▄▄▄▄▃▃▃▃▂▂▂▂▂▁▁▁▁▁▁
mom_0,█▆▁▁▃▅▆███▇▅▄▃▂▁▁▁▁▁▂▂▂▂▃▃▄▄▅▅▆▆▆▇▇▇████
mom_1,█▆▁▁▃▅▆███▇▅▄▃▂▁▁▁▁▁▂▂▂▂▃▃▄▄▅▅▆▆▆▇▇▇████
raw_loss,█▇▃▂▃▃▂▂▂▂▂▂▂▂▂▁▁▁▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.114
lr_0,0.0
lr_1,0.0
mom_0,0.94994
mom_1,0.94994
raw_loss,0.16884
sqr_mom_0,0.99


[34m[1mwandb[0m: Agent Starting Run: 9kqwwiw2 with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 93
[34m[1mwandb[0m: 	post_lr: 0.004993904912057072
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 3
[34m[1mwandb[0m: 	pre_lr: 0.0012364234024738838
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,3.280355,0.829543,0.274266,00:20
1,1.942633,0.583619,0.182844,00:19
2,1.38001,0.562801,0.185102,00:20


epoch,train_loss,valid_loss,error_rate,time
0,0.784078,0.517356,0.170429,00:33
1,0.733051,0.555895,0.177201,00:34
2,0.666121,0.702821,0.193002,00:33
3,0.609626,0.51245,0.147856,00:34
4,0.557913,0.534781,0.147856,00:33
5,0.503293,0.443101,0.142212,00:34
6,0.454567,0.432827,0.124153,00:33
7,0.40131,0.448134,0.133183,00:33
8,0.357396,0.430597,0.126411,00:33
9,0.321032,0.410759,0.123025,00:33


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇██
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▄▄▃▄▄▂▂▂▁▂▁▁▁▁
lr_0,▁▂▄▇███▇▇▆▆▅▄▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▁▂▂▃▃▃▃▂▂▂▂▂▂▁▁▁▁▁▂▄▆▇████▇▇▆▅▅▄▃▃▂▂▁▁▁
mom_0,█▇▅▂▁▁▁▂▂▃▃▄▅▆▇▇████▆▃▂▁▁▁▁▂▂▃▄▄▅▆▆▇▇███
mom_1,█▇▅▂▁▁▁▂▂▃▃▄▅▆▇▇████▆▃▂▁▁▁▁▂▂▃▄▄▅▆▆▇▇███
raw_loss,██▇▅▄▃▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.12077
lr_0,0.0
lr_1,0.0
mom_0,0.94992
mom_1,0.94992
raw_loss,0.14641
sqr_mom_0,0.99


[34m[1mwandb[0m: Agent Starting Run: fzgb3teo with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 113
[34m[1mwandb[0m: 	post_lr: 0.004170825171404025
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 1
[34m[1mwandb[0m: 	pre_lr: 0.007219448340499741
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,1.863111,0.743862,0.215576,00:20


epoch,train_loss,valid_loss,error_rate,time
0,0.770526,0.593609,0.176072,00:33
1,0.727496,0.521757,0.163657,00:32
2,0.64168,0.498954,0.155756,00:34
3,0.583597,0.465466,0.147856,00:32
4,0.51777,0.496495,0.146727,00:34
5,0.461696,0.456537,0.139955,00:32
6,0.418269,0.453959,0.129797,00:34
7,0.374369,0.442918,0.128668,00:32
8,0.339197,0.416775,0.127539,00:35
9,0.307469,0.423915,0.128668,00:33


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▅▆▆▆▆▆▇▇▇▇▇███
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▅▄▃▃▃▂▂▁▁▁▁▁▁▁
lr_0,▁▄██▆▄▃▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▄██▆▄▃▁▁▁▂▃▃▄▅▅▅▅▅▅▅▅▄▄▄▄▃▃▃▃▂▂▂▂▂▁▁▁▁▁
mom_0,█▆▁▁▃▅▆███▇▅▄▃▂▁▁▁▁▁▂▂▂▂▃▃▄▄▅▅▆▆▆▇▇▇████
mom_1,█▆▁▁▃▅▆███▇▅▄▃▂▁▁▁▁▁▂▂▂▂▃▃▄▄▅▅▆▆▆▇▇▇████
raw_loss,█▆▄▃▃▃▃▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.12302
lr_0,0.0
lr_1,0.0
mom_0,0.94994
mom_1,0.94994
raw_loss,0.10262
sqr_mom_0,0.99


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: z45c23xy with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 242
[34m[1mwandb[0m: 	post_lr: 0.0015301411349877543
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 3
[34m[1mwandb[0m: 	pre_lr: 0.003810046627323762
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,2.613433,0.891885,0.227991,00:20
1,1.559145,0.511072,0.155756,00:20
2,1.097026,0.476964,0.159142,00:20


epoch,train_loss,valid_loss,error_rate,time
0,0.496173,0.45466,0.141084,00:34
1,0.488701,0.464463,0.155756,00:33
2,0.462235,0.434931,0.138826,00:34
3,0.42481,0.442002,0.141084,00:33
4,0.395487,0.445084,0.141084,00:34
5,0.376808,0.421332,0.126411,00:33
6,0.359737,0.394038,0.11851,00:34
7,0.336487,0.394586,0.126411,00:33
8,0.310111,0.386399,0.125282,00:34
9,0.292856,0.380668,0.126411,00:33


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇██
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▃▄▂▃▂▂▂▂▁▂▁▂▂▂
lr_0,▁▂▄▇███▇▇▆▆▅▄▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▂▄▇███▇▇▆▆▅▄▃▂▂▁▁▁▁▂▃▃▄▄▄▄▃▃▃▃▃▂▂▂▂▁▁▁▁
mom_0,█▇▅▂▁▁▁▂▂▃▃▄▅▆▇▇████▆▃▂▁▁▁▁▂▂▃▄▄▅▆▆▇▇███
mom_1,█▇▅▂▁▁▁▂▂▃▃▄▅▆▇▇████▆▃▂▁▁▁▁▂▂▃▄▄▅▆▆▇▇███
raw_loss,█▇▅▃▃▃▂▂▂▂▂▂▂▂▂▂▂▂▁▂▁▂▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.12754
lr_0,0.0
lr_1,0.0
mom_0,0.94992
mom_1,0.94992
raw_loss,0.15622
sqr_mom_0,0.99


[34m[1mwandb[0m: Agent Starting Run: vvr3vvfj with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 87
[34m[1mwandb[0m: 	post_lr: 0.003145195985342452
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 2
[34m[1mwandb[0m: 	pre_lr: 0.006058120473842693
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,2.166092,0.929688,0.242664,00:20
1,1.342996,0.633664,0.191874,00:20


epoch,train_loss,valid_loss,error_rate,time
0,0.597313,0.552557,0.171558,00:33
1,0.536123,0.476428,0.155756,00:33
2,0.501848,0.491234,0.167043,00:32
3,0.44709,0.445618,0.130925,00:34
4,0.403592,0.505218,0.150113,00:32
5,0.366551,0.454515,0.139955,00:34
6,0.337356,0.455639,0.133183,00:33
7,0.307309,0.474597,0.130926,00:34
8,0.286565,0.473902,0.133183,00:32
9,0.268086,0.457059,0.128668,00:34


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▃▃▄▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▅▄▃▃▁▂▂▁▁▁▁▁▁▁
lr_0,▁▃▆███▇▆▅▄▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▃▆███▇▆▅▄▃▂▁▁▁▂▂▃▄▅▅▅▅▄▄▄▄▄▃▃▃▂▂▂▂▁▁▁▁▁
mom_0,█▇▃▁▁▁▂▃▄▅▆▇███▇▅▄▂▁▁▁▁▁▂▂▃▃▄▄▅▅▆▆▇▇████
mom_1,█▇▃▁▁▁▂▃▄▅▆▇███▇▅▄▂▁▁▁▁▁▂▂▃▃▄▄▅▅▆▆▇▇████
raw_loss,█▇▄▃▃▂▂▂▂▂▂▂▂▂▂▂▁▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.12867
lr_0,0.0
lr_1,0.0
mom_0,0.94993
mom_1,0.94993
raw_loss,0.12147
sqr_mom_0,0.99


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: zg8ojbpa with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 115
[34m[1mwandb[0m: 	post_lr: 0.004265173328753435
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 1
[34m[1mwandb[0m: 	pre_lr: 0.004350440762895012
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,2.029744,0.720836,0.222348,00:20


epoch,train_loss,valid_loss,error_rate,time
0,0.877542,0.582264,0.190745,00:33
1,0.788519,0.512372,0.164786,00:33
2,0.715588,0.513954,0.1614,00:34
3,0.649857,0.516532,0.168172,00:33
4,0.588594,0.479949,0.13544,00:33
5,0.533706,0.468188,0.138826,00:34
6,0.480093,0.421401,0.126411,00:33
7,0.426805,0.409918,0.126411,00:33
8,0.379601,0.438588,0.134311,00:33
9,0.343178,0.416726,0.130925,00:33


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▅▆▆▆▆▆▇▇▇▇▇███
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▆▄▄▅▂▃▂▂▂▂▂▁▁▁
lr_0,▁▄██▆▄▃▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▄██▆▄▃▁▁▂▃▄▅▆▇█████▇▇▇▆▆▆▅▅▄▄▃▃▃▂▂▂▁▁▁▁
mom_0,█▆▁▁▃▅▆███▇▅▄▃▂▁▁▁▁▁▂▂▂▂▃▃▄▄▅▅▆▆▆▇▇▇████
mom_1,█▆▁▁▃▅▆███▇▅▄▃▂▁▁▁▁▁▂▂▂▂▃▃▄▄▅▅▆▆▆▇▇▇████
raw_loss,█▇▄▄▂▄▂▃▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.114
lr_0,0.0
lr_1,0.0
mom_0,0.94994
mom_1,0.94994
raw_loss,0.14863
sqr_mom_0,0.99


[34m[1mwandb[0m: Agent Starting Run: pqkmgjmt with config:
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	post_bs: 192
[34m[1mwandb[0m: 	post_div: 135
[34m[1mwandb[0m: 	post_lr: 0.004001199618020564
[34m[1mwandb[0m: 	post_size: 112
[34m[1mwandb[0m: 	pre_bs: 256
[34m[1mwandb[0m: 	pre_epoch: 1
[34m[1mwandb[0m: 	pre_lr: 0.007228602031791233
[34m[1mwandb[0m: 	pre_size: 160


epoch,train_loss,valid_loss,error_rate,time
0,1.959322,0.778843,0.233634,00:21


epoch,train_loss,valid_loss,error_rate,time
0,0.96902,0.600597,0.189616,00:33
1,0.846157,0.587739,0.185102,00:33
2,0.746293,0.483106,0.147856,00:34
3,0.644586,0.435058,0.130925,00:32
4,0.565848,0.455207,0.148984,00:35
5,0.513629,0.485187,0.150113,00:32
6,0.465281,0.442363,0.128668,00:35
7,0.425259,0.429632,0.136569,00:33
8,0.384475,0.440533,0.132054,00:35
9,0.349705,0.426685,0.133183,00:33


VBox(children=(Label(value='0.801 MB of 0.801 MB uploaded (0.780 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▅▆▆▆▆▆▇▇▇▇▇███
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,█▅▅▂▁▂▃▁▂▁▁▁▁▁▁
lr_0,▁▄██▆▄▃▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr_1,▁▄██▆▄▃▁▁▁▂▃▃▄▄▅▅▅▅▅▅▄▄▄▄▄▃▃▃▃▂▂▂▂▂▁▁▁▁▁
mom_0,█▆▁▁▃▅▆███▇▅▄▃▂▁▁▁▁▁▂▂▂▂▃▃▄▄▅▅▆▆▆▇▇▇████
mom_1,█▆▁▁▃▅▆███▇▅▄▃▂▁▁▁▁▁▂▂▂▂▃▃▄▄▅▅▆▆▆▇▇▇████
raw_loss,█▆▃▄▂▂▃▃▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,15.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.12754
lr_0,0.0
lr_1,0.0
mom_0,0.94994
mom_1,0.94994
raw_loss,0.11285
sqr_mom_0,0.99


In [None]:
# Load the logged results table and rank its rows two ways, lowest value first:
# once by the `valid` column and once by the `error` column.
# (To look at a single stage only, filter first, e.g. `.loc[res_df.stage == 0]`.)
res_df = pd.read_csv('results.csv')
by_valid, by_error = (
    res_df.sort_values(metric_col, ascending=True)
    for metric_col in ('valid', 'error')
)

In [None]:
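# Disabled scratch code: drop the rows of a results table whose `div` is positive.
# NOTE(review): at the top of this notebook `df` is the pets sample frame that
# get_dls() reads; if this is re-enabled it should presumably target `res_df`.
# df.drop(df.loc[df['div'] > 0].index, inplace=True)
# df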

In [None]:
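# Disabled scratch code: write the table back to 'results.csv'.
# NOTE(review): at the top of this notebook `df` is the pets sample frame, so
# running this as-is would overwrite the results log with it; confirm which
# frame is meant (presumably `res_df`) before re-enabling.
# df.to_csv('results.csv', index=False)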

In [None]:
# Display the first rows of `by_error`, i.e. the logged runs with the lowest `error`.
by_error.head()

Unnamed: 0,time,arch,lr,pct_start,stage,train,valid,error,div,epochs
39,1660069611,convnext_tiny_in22k,0.004,0.25,1,0.30763,0.366548,0.113995,100.0,10.0
33,1660066989,convnext_tiny_in22k,0.003,0.25,1,0.33098,0.387178,0.115124,100.0,10.0
48,1660072787,convnext_tiny_in22k,0.005,0.25,1,0.338065,0.397917,0.116253,150.0,10.0
43,1660071105,convnext_tiny_in22k,0.004,0.25,1,0.302869,0.394233,0.11851,70.0,10.0
41,1660070416,convnext_tiny_in22k,0.002,0.25,1,0.349489,0.405622,0.11851,70.0,10.0


In [None]:
# Display the first rows of `by_valid`, i.e. the logged runs with the lowest `valid` loss.
by_valid.head()

Unnamed: 0,time,arch,lr,pct_start,stage,train,valid,error,div,epochs
39,1660069611,convnext_tiny_in22k,0.004,0.25,1,0.30763,0.366548,0.113995,100.0,10.0
45,1660071771,convnext_tiny_in22k,0.002,0.25,1,0.354501,0.377165,0.121896,150.0,10.0
26,1660064069,convnext_tiny_in22k,0.002,0.25,1,0.310325,0.384408,0.126411,30.0,10.0
33,1660066989,convnext_tiny_in22k,0.003,0.25,1,0.33098,0.387178,0.115124,100.0,10.0
43,1660071105,convnext_tiny_in22k,0.004,0.25,1,0.302869,0.394233,0.11851,70.0,10.0


In [None]:
# Two-stage training run with hand-picked hyperparameters.
# NOTE(review): lr 4e-3 with a 100x smaller first-group rate appears to mirror the
# best row of the results table shown above (lr=0.004, div=100) - confirm.

# Stage 0: build a fresh learner on batch-size-256 loaders and fit 3 epochs.
learn = vision_learner(get_dls(bs=256), arch, metrics=error_rate)
learn.fit_one_cycle(3, lr_max=4e-3)
# Stage 1: unfreeze, swap in batch-size-192 loaders, and fit 10 more epochs.
learn.unfreeze()
learn.dls = get_dls(bs=192)
# The tuple passes two max learning rates; presumably one per parameter group
# (the W&B logs in this notebook report two groups, lr_0 and lr_1).
learn.fit_one_cycle(10, lr_max=(4e-5,4e-3))

epoch,train_loss,valid_loss,error_rate,time
0,3.751748,1.341895,0.358916,00:22
1,2.282366,0.82227,0.213318,00:20
2,1.714996,0.66243,0.182844,00:20


epoch,train_loss,valid_loss,error_rate,time
0,0.651146,0.534959,0.168172,00:33
1,0.617035,0.497863,0.153499,00:31
2,0.581459,0.521263,0.167043,00:33
3,0.547468,0.517798,0.151242,00:31
4,0.502452,0.529413,0.164786,00:32
5,0.454631,0.457125,0.146727,00:31
6,0.406428,0.451517,0.139955,00:32
7,0.364492,0.432912,0.132054,00:31
8,0.333013,0.423094,0.134312,00:33
9,0.301152,0.418233,0.133183,00:31


In [None]:
# Fine-tune a previously exported stage-0 learner for 3 epochs while logging
# the run to Weights & Biases.
#
# `sweep_cfg` is a sweep definition (top-level keys 'metric', 'method',
# 'parameters'), not a flat run config. Passing it straight to wandb.init()
# means `wandb.config.post_bs` is only defined when a sweep agent injects it.
# Flatten the fixed ('value') parameters into a plain dict so the cell also
# works as a standalone run.
run_cfg = {
    name: spec['value']
    for name, spec in sweep_cfg['parameters'].items()
    if 'value' in spec
}
wandb.init(project='fastbook', config=run_cfg)
arch = 'convnext_tiny_in22k'
learn = load_learner(arch+'_160_112_3_003_stage0.pth')
learn.unfreeze()
learn.dls = get_dls(bs=wandb.config.post_bs)
learn.add_cb(WandbCallback())
learn.fit_one_cycle(3, lr_max=(4e-5,4e-3))
# Close the run here so its summary is flushed with this cell instead of being
# left open until some later wandb.init() call.
wandb.finish()

VBox(children=(Label(value='0.790 MB of 0.790 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▃▃▃▄▄▅▅▆▆▆▇▇██
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
error_rate,▄█▁
lr_0,▁▂▄▆███▇▇▆▅▅▄▃▂▂▁▁
lr_1,▁▂▄▆███▇▇▆▅▅▄▃▂▂▁▁
mom_0,█▇▅▃▁▁▁▂▂▃▃▄▅▆▇▇██
mom_1,█▇▅▃▁▁▁▂▂▃▃▄▅▆▇▇██
raw_loss,▄▆▄▅▄█▂▄▆▆▂▃▃▃▂▃▂▁
sqr_mom_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,3.0
eps_0,1e-05
eps_1,1e-05
error_rate,0.17156
lr_0,0.0
lr_1,5e-05
mom_0,0.94865
mom_1,0.94865
raw_loss,0.40105
sqr_mom_0,0.99


epoch,train_loss,valid_loss,error_rate,time
0,0.747064,0.691519,0.207675,00:33
1,0.720227,0.570864,0.163657,00:33
2,0.661863,0.49888,0.160271,00:33


In [None]:
# Two-stage training run at a lower learning rate than the 4e-3 run above.

# Stage 0: build a fresh learner on batch-size-256 loaders and fit 3 epochs.
learn = vision_learner(get_dls(bs=256), arch, metrics=error_rate)
learn.fit_one_cycle(3, lr_max=2e-3)
# Stage 1: unfreeze, swap in new loaders, and fit 10 more epochs.
learn.unfreeze()
# NOTE(review): bs=196 here, while the other stage-1 cells and the sweep's
# `post_bs` use 192 - possibly a typo; confirm before comparing results.
learn.dls = get_dls(bs=196)
# The tuple passes two max learning rates; presumably one per parameter group.
learn.fit_one_cycle(10, lr_max=(1e-5,1e-3))

epoch,train_loss,valid_loss,error_rate,time
0,4.250829,1.531392,0.472912,00:22
1,2.739581,0.792751,0.242664,00:20
2,2.056829,0.678373,0.21219,00:20


epoch,train_loss,valid_loss,error_rate,time
0,0.849209,0.612101,0.193002,00:33
1,0.816864,0.533736,0.180587,00:31
2,0.75614,0.495051,0.147856,00:33
3,0.697693,0.457725,0.14447,00:31
4,0.647301,0.448462,0.150113,00:33
5,0.60042,0.461592,0.146727,00:31
6,0.552283,0.451783,0.14447,00:33
7,0.518473,0.429279,0.141084,00:31
8,0.490142,0.422684,0.137698,00:33
9,0.471561,0.421018,0.138826,00:31


In [None]:
# Learning-rate scan for the first training stage: five log-spaced peak rates
# between 1e-3 and 10**-1.5, each tried on a freshly built learner for 6 epochs.
# Values are converted to plain Python floats before being printed and used.
for lr in map(float, np.logspace(-3, -1.5, 5)):
    learn = vision_learner(get_dls(bs=256), arch, metrics=error_rate)
    print(lr)
    # pct_start=.99 is passed through to fit_one_cycle unchanged.
    learn.fit_one_cycle(6, lr_max=lr, pct_start=.99)

In [None]:
# Build a stage-0 checkpoint: fit a fresh learner for 6 epochs at lr_max=.006
# and export it so later cells can reload it with load_learner().
learn = vision_learner(get_dls(bs=256), arch, metrics=error_rate)
learn.fit_one_cycle(6, lr_max=.006)
# Re-root the learner at the current directory; presumably this makes export()
# write next to the notebook, where later cells load the file by relative name.
learn.path = Path('.')
# NOTE(review): the file name says "convnext_nano" and "005", but the only `arch`
# values visible in this notebook are 'convnext_tiny_in22k' and lr_max is .006.
# The name is kept because later cells load it verbatim - confirm it is intended.
learn.export('convnext_nano_160_112_005_stage0.pth')

In [None]:
# Grid search over the fine-tuning schedule, starting every trial from the same
# exported stage-0 checkpoint:
#   dev - divisor between the highest and lowest layer-group learning rate
#         (five log-spaced values from 10 to 1000, as plain Python floats)
#   lr  - peak learning rate of the last layer group
for dev in map(float, np.logspace(1, 3, 5)):
    for lr in [1e-3, 2e-3]:
        learn = load_learner('convnext_nano_160_112_005_stage0.pth')
        # The checkpoint was exported straight after the stage-0 fit, without
        # unfreeze(). Unfreeze here (as the W&B fine-tune cell does after
        # load_learner) so the lr/dev rate actually trains the earlier layers.
        learn.unfreeze()
        learn.dls = get_dls(bs=256)
        print(lr, dev)
        learn.fit_one_cycle(16, lr_max=slice(lr/dev,lr))

In [None]:
# Single fine-tuning run from the exported stage-0 checkpoint: 16 epochs with
# two max learning rates (1e-5 and 1e-3).
learn = load_learner('convnext_nano_160_112_005_stage0.pth')
# The checkpoint was exported straight after the stage-0 fit, without
# unfreeze(). Unfreeze here (as the W&B fine-tune cell does after load_learner)
# so the smaller learning rate actually trains the earlier layers.
learn.unfreeze()
learn.dls = get_dls(bs=256)
learn.fit_one_cycle(16, lr_max=(1e-5,1e-3))

In [None]:
# Repeat of the divisor / learning-rate grid search, starting every trial from
# the same exported stage-0 checkpoint:
#   dev - divisor between the highest and lowest layer-group learning rate
#         (five log-spaced values from 10 to 1000, as plain Python floats)
#   lr  - peak learning rate of the last layer group
for dev in map(float, np.logspace(1, 3, 5)):
    for lr in [1e-3, 2e-3]:
        learn = load_learner('convnext_nano_160_112_005_stage0.pth')
        # The checkpoint was exported straight after the stage-0 fit, without
        # unfreeze(). Unfreeze here (as the W&B fine-tune cell does after
        # load_learner) so the lr/dev rate actually trains the earlier layers.
        learn.unfreeze()
        learn.dls = get_dls(bs=256)
        print(lr, dev)
        learn.fit_one_cycle(16, lr_max=slice(lr/dev,lr))