In [2]:
%load_ext autoreload
%autoreload 2

%matplotlib inline

In [3]:
#export
from exp.nb_03 import *

# DataBunch/ Learner

In [4]:
# Load the train/validation tensors and wrap each split in a `Dataset`.
# NOTE(review): `get_data`, `Dataset` and `F` are not defined in this notebook; presumably they
# arrive through the `exp.nb_03` star import -- confirm.
x_train, y_train, x_valid, y_valid = get_data()
train_ds, valid_ds = Dataset(x_train, y_train), Dataset(x_valid, y_valid)
nh, bs = 50, 64  # nh: presumably the hidden-layer width (matches get_model's default); bs: batch size passed to DataLoader
c = y_train.max().item() + 1  # largest label + 1; equals the number of classes assuming labels run 0..max
loss_func = F.cross_entropy

In [5]:
# loss, acc = fit(5, learn)

In [6]:
class DataBunch():
    """Bundle a training and a validation dataloader together with an optional class count `c`."""
    def __init__(self, train_dl, valid_dl, c=None):
        self.train_dl = train_dl
        self.valid_dl = valid_dl
        self.c = c

    @property
    def train_ds(self):
        """The `dataset` attribute of the training dataloader."""
        return self.train_dl.dataset

    @property
    def valid_ds(self):
        """The `dataset` attribute of the validation dataloader."""
        return self.valid_dl.dataset

In [7]:
# Shuffle only the training batches; validation batches keep the dataset order.
train_dl = DataLoader(train_ds, batch_size=bs, shuffle=True)
valid_dl = DataLoader(valid_ds, batch_size=bs, shuffle=False)

In [8]:
len(train_dl), len(valid_dl)

(938, 157)

In [9]:
data = DataBunch(train_dl, valid_dl, c)

In [10]:
data.train_dl

<torch.utils.data.dataloader.DataLoader at 0x7f5a01da13d0>

In [11]:
data.train_ds[0][0].shape

torch.Size([784])

In [12]:
c, data.c

(10, 10)

In [13]:
def get_model(data, lr=0.1, nh=50):
    """Build a one-hidden-layer classifier sized for `data`, plus an Adam optimizer for it.

    data: object exposing `train_ds.x` (its `shape[1]` is used as the input width)
          and `c` (used as the output width).
    lr:   learning rate handed to `optim.Adam`.
    nh:   hidden-layer width.
    Returns the tuple `(model, optimizer)`.
    """
    m = data.train_ds.x.shape[1]
    # Size the output layer from the databunch itself rather than from a notebook-level
    # global `c`, so the function works for whichever `data` it is given.
    model = nn.Sequential(nn.Linear(m,nh), nn.ReLU(), nn.Linear(nh,data.c))
    return model, optim.Adam(model.parameters(), lr=lr)

In [14]:
data.train_ds.x.shape[1]

784

In [15]:
class Learner():
    """Plain container holding a model, its optimizer, a loss function and the data."""
    def __init__(self, model, opt, loss_func, data):
        self.model = model
        self.opt = opt
        self.loss_func = loss_func
        self.data = data

In [16]:
def fit(epochs, learn):
    """Train `learn.model` for `epochs` epochs, running a validation pass after each one.

    After every epoch the validation loss and accuracy, averaged over the number of
    validation batches, are printed; the pair from the last epoch is returned.
    """
    for _ in range(epochs):
        # ---- training pass ----
        learn.model.train()
        for inputs, targets in learn.data.train_dl:
            batch_loss = learn.loss_func(learn.model(inputs), targets)
            batch_loss.backward()
            learn.opt.step()
            learn.opt.zero_grad()

        # ---- validation pass (no gradients needed) ----
        learn.model.eval()
        tot_loss, tot_acc = 0., 0.
        with torch.no_grad():
            for inputs, targets in learn.data.valid_dl:
                out = learn.model(inputs)
                tot_loss += learn.loss_func(out, targets)
                tot_acc += accuracy(out, targets)

        nv = len(learn.data.valid_dl)
        avg_loss, avg_acc = tot_loss / nv, tot_acc / nv
        print(avg_loss, avg_acc)

    return avg_loss, avg_acc

In [17]:
learn = Learner(*get_model(data), loss_func, data)

In [18]:
loss, acc = fit(1, learn)

tensor(0.2899) tensor(0.9164)


# CallbackHandler

In [19]:
def fit(epochs, learn, cb):
    """Run the training loop for `epochs` epochs, letting the callback handler `cb` steer it.

    epochs: number of epochs to attempt.
    learn:  learner handed to `cb.begin_fit`; its `data.train_dl` / `data.valid_dl` are iterated.
    cb:     handler whose hooks return truthy to continue:
            - `begin_fit` falsy   -> nothing runs at all (not even `after_fit`);
            - `begin_epoch` falsy -> that epoch is skipped;
            - `begin_validate` falsy -> validation is skipped for that epoch;
            - `do_stop()` truthy or `after_epoch` falsy -> the epoch loop ends early.
    Returns None.
    """
    if not cb.begin_fit(learn): return
    for epoch in range(epochs):
        if not cb.begin_epoch(epoch): continue
        all_batches(learn.data.train_dl, cb)

        if cb.begin_validate():
            with torch.no_grad(): all_batches(learn.data.valid_dl, cb)
        if cb.do_stop() or not cb.after_epoch(): break
    # Must sit outside the loop: it then runs exactly once per fit, including after an
    # early `break` or when every epoch was skipped.
    cb.after_fit()
            
def all_batches(dl, cb):
    """Send every `(xb, yb)` pair from `dl` through `one_batch`, ending early once `cb.do_stop()` is truthy."""
    for batch in dl:
        xb, yb = batch
        one_batch(xb, yb, cb)
        if cb.do_stop(): break

def one_batch(xb, yb, cb):
    """Process a single batch, consulting the handler `cb` before each stage.

    Each hook must return truthy for the following stage to run: `begin_batch` gates the
    forward pass, `after_loss` gates the backward pass, `after_backward` gates the
    optimizer step and `after_step` gates zeroing the gradients.
    """
    proceed = cb.begin_batch(xb, yb)
    if proceed:
        loss = cb.learn.loss_func(cb.learn.model(xb), yb)
        if cb.after_loss(loss):
            loss.backward()
            if cb.after_backward():
                cb.learn.opt.step()
            if cb.after_step():
                cb.learn.opt.zero_grad()

In [20]:
class Callback():
    """Base callback for the `fit(epochs, learn, cb)` loop.

    Every hook returns True; the hooks that receive arguments also store them on the instance.
    """
    def begin_fit(self, learn):
        """Remember the learner."""
        self.learn = learn
        return True

    def after_fit(self): return True

    def begin_epoch(self, epoch):
        """Remember the current epoch index."""
        self.epoch = epoch
        return True

    def after_epoch(self): return True

    def begin_validate(self): return True

    def begin_batch(self, xb, yb):
        """Remember the current batch."""
        self.xb, self.yb = xb, yb
        return True

    def after_loss(self, loss):
        """Remember the loss of the current batch."""
        self.loss = loss
        return True

    def after_backward(self): return True

    def after_step(self): return True

In [21]:
class CallbackHandler():
    """Fan each training-loop event out to a list of callbacks.

    Every hook and-chains the callbacks' return values from left to right, so as soon as
    the running result is falsy the remaining callbacks are not called for that event.
    The handler also tracks `in_train` and switches the model between train and eval mode.
    """
    def __init__(self, cbs=None):
        self.cbs = cbs or []

    def _chain(self, hook, res, *args):
        """And-chain `hook(*args)` over the callbacks, starting from the value `res`."""
        for cb in self.cbs: res = res and getattr(cb, hook)(*args)
        return res

    def begin_fit(self, learn):
        self.learn, self.in_train = learn, True
        learn.stop = False
        return self._chain('begin_fit', True, learn)

    def after_fit(self):
        # Starts from `not in_train`, so the callbacks are only consulted outside training mode.
        return self._chain('after_fit', not self.in_train)

    def begin_epoch(self, epoch):
        self.learn.model.train()
        self.in_train = True
        return self._chain('begin_epoch', True, epoch)

    def begin_validate(self):
        self.learn.model.eval()
        self.in_train = False
        return self._chain('begin_validate', True)

    def after_epoch(self): return self._chain('after_epoch', True)

    def begin_batch(self, xb, yb): return self._chain('begin_batch', True, xb, yb)

    def after_loss(self, loss):
        # Starts from `in_train`: during validation the result is falsy, so `one_batch` skips backward.
        return self._chain('after_loss', self.in_train, loss)

    def after_backward(self): return self._chain('after_backward', True)

    def after_step(self): return self._chain('after_step', True)

    def do_stop(self):
        """Return the learner's `stop` flag and reset it to False."""
        try: return self.learn.stop
        finally: self.learn.stop = False

In [22]:
class TestCallback(Callback):
    """Demo callback: counts `after_step` events, prints the count and requests a stop from the 10th on."""
    def begin_fit(self, learn):
        super().begin_fit(learn)
        self.n_iters = 0
        return True

    def after_step(self):
        count = self.n_iters + 1
        self.n_iters = count
        print(count)
        # The stop flag lives on the learner; the handler's `do_stop()` reads and resets it.
        if count >= 10: self.learn.stop = True
        return True

In [23]:
fit(1, learn, cb=CallbackHandler([TestCallback()]))

1
2
3
4
5
6
7
8
9
10


# Runner

In [24]:
import re

# Pre-compiled patterns used by `camel2snake`.
_camel_re1 = re.compile('(.)([A-Z][a-z]+)')
_camel_re2 = re.compile('([a-z0-9])([A-Z])')

def camel2snake(name):
    """Convert a CamelCase identifier to snake_case, e.g. 'TrainEval' -> 'train_eval'."""
    # Pass 1: insert '_' before a capital letter that is followed by lowercase letters.
    partially_split = _camel_re1.sub(r'\1_\2', name)
    # Pass 2: insert '_' between a lowercase letter or digit and a capital, then lowercase everything.
    fully_split = _camel_re2.sub(r'\1_\2', partially_split)
    return fully_split.lower()

In [49]:
def listify(o):
    """Coerce `o` to a list.

    None -> []; a list is returned unchanged (same object); a string is wrapped as a single
    element; any other iterable is expanded with `list()`; everything else is wrapped as `[o]`.
    """
    if o is None: return []
    if isinstance(o, list): return o
    # Strings are iterable but must stay whole rather than being split into characters.
    expandable = isinstance(o, Iterable) and not isinstance(o, str)
    return list(o) if expandable else [o]

In [73]:
class Callback():
    """Base class for callbacks driven by a runner.

    Attribute *reads* that fail on the callback itself are forwarded to the attached runner
    (`self.run`), so a callback can write `self.n_iter` for `self.run.n_iter`. Attribute
    *writes* are not forwarded: assign through `self.run.<attr>` to change runner state.

    `_order` is the sort key the runner uses when deciding the call order of callbacks.
    """
    _order = 0
    def set_runner(self, run):
        """Attach the runner that missing attributes are read from."""
        self.run = run
    def __getattr__(self, k):
        # `__getattr__` only runs when normal lookup fails. If `run` itself is what is missing
        # (no runner attached yet), delegating would look up `self.run` again and recurse
        # until RecursionError; raise a plain AttributeError so getattr()/hasattr() behave.
        if k == 'run': raise AttributeError("'run' is not set; call set_runner() first")
        return getattr(self.run, k)
    @property
    def name(self):
        """snake_case class name with a trailing 'Callback' removed ('callback' if nothing is left)."""
        name = re.sub(r'Callback$', '', self.__class__.__name__)
        return camel2snake(name or 'callback')

In [74]:
class TrainEvalCallback(Callback):
    """Main callback: maintains the runner's progress counters and its train/eval mode."""
    def begin_fit(self):
        runner = self.run
        runner.n_epochs, runner.n_iter = 0., 0

    def after_batch(self):
        if self.in_train:
            runner = self.run
            # `iters` is len(dl), i.e. the number of batches, so every training batch
            # advances the fractional epoch counter by 1/iters.
            runner.n_epochs += 1./self.iters
            runner.n_iter += 1

    def begin_epoch(self):
        runner = self.run
        runner.n_epochs = self.epoch
        self.model.train()
        runner.in_train = True

    def begin_validate(self):
        self.model.eval()
        self.run.in_train = False

In [75]:
TrainEvalCallback().__class__, TrainEvalCallback().__class__.__name__

(__main__.TrainEvalCallback, 'TrainEvalCallback')

In [76]:
TrainEvalCallback().name

'train_eval'

In [89]:
class TestCallback(Callback):
    """Demo callback that stops the runner once `n_iter` has reached 10."""
    _order = 1
    def begin_batch(self):
        if self.n_iter >= 10:
            # Write through `self.run`: a bare `self.stop = True` would only create an attribute
            # on this callback, while `Runner.all_batches` checks the runner's own `stop` flag.
            self.run.stop = True
            # A truthy return makes `Runner.one_batch` skip the current batch; the batch loop
            # then breaks at its next `if self.stop` check.
            return True

In [90]:
class Runner():
    """Training-loop driver that announces every stage of `fit` to a list of callbacks.

    Calling the runner with an event name (e.g. `self('begin_batch')`) invokes the method of
    that name on each callback that has one, in ascending `_order`. As soon as one callback
    returns a truthy value the call returns True, which the loop treats as "skip / stop
    this stage"; otherwise it returns False.
    """
    def __init__(self, cbs=None, cb_funcs=None):
        """
        cbs:      callback instance or list of instances.
        cb_funcs: zero-argument factory or list of factories; each created callback is also
                  set as an attribute of the runner under its `name`.
        A `TrainEvalCallback` is always placed first in `self.cbs`.
        """
        # Copy: `listify` hands a list argument back as-is, and appending the `cb_funcs`
        # callbacks to it would silently mutate the caller's list.
        cbs = list(listify(cbs))
        for cbf in listify(cb_funcs):
            cb = cbf()
            setattr(self, cb.name, cb)
            cbs.append(cb)
        self.stop, self.cbs = False, [TrainEvalCallback()] + cbs

    # Convenience accessors into the learner that is attached for the duration of `fit`.
    @property
    def opt(self): return self.learn.opt
    @property
    def model(self): return self.learn.model
    @property
    def loss_func(self): return self.learn.loss_func
    @property
    def data(self): return self.learn.data

    def one_batch(self, xb, yb):
        """Forward, loss, backward, step and zero-grad for one batch; any truthy event ends the batch early."""
        self.xb, self.yb = xb, yb
        if self('begin_batch'): return
        self.pred = self.model(self.xb)
        if self('after_pred'): return
        self.loss = self.loss_func(self.pred, self.yb)
        # Outside training (validation) the batch ends here: no backward pass, no optimizer step.
        if self('after_loss') or not self.in_train: return
        self.loss.backward()
        if self('after_backward'): return
        self.opt.step()
        if self('after_step'): return
        self.opt.zero_grad()

    def all_batches(self, dl):
        """Run `one_batch` over `dl` until it is exhausted or `self.stop` is set; then clear `stop`."""
        self.iters = len(dl)
        for xb, yb in dl:
            if self.stop: break
            self.one_batch(xb, yb)
            self('after_batch')
        self.stop = False

    def fit(self, epochs, learn):
        """Train `learn` for up to `epochs` epochs.

        `after_fit` is always fired and `self.learn` is reset to None afterwards, even if an
        exception is raised or a callback cancels the fit.
        """
        self.epochs, self.learn = epochs, learn

        try:
            for cb in self.cbs: cb.set_runner(self)
            if self('begin_fit'): return
            for epoch in range(epochs):
                self.epoch = epoch
                if not self('begin_epoch'): self.all_batches(self.data.train_dl)

                with torch.no_grad():
                    if not self('begin_validate'): self.all_batches(self.data.valid_dl)
                if self('after_epoch'): break

        finally:
            self('after_fit')
            self.learn = None

    def __call__(self, cb_name):
        """Fire event `cb_name` on the callbacks in `_order`; True if any of them returned truthy."""
        for cb in sorted(self.cbs, key=lambda x: x._order):
            f = getattr(cb, cb_name, None)
            if f and f(): return True
        return False

In [91]:
learn = Learner(*get_model(data), loss_func, data)

In [92]:
run = Runner()

In [93]:
%time run.fit(1, learn)

CPU times: user 8.1 s, sys: 306 ms, total: 8.4 s
Wall time: 2.1 s


In [94]:
run.learn == None

True

In [95]:
accuracy(learn.model(x_valid), y_valid)

tensor(0.9221)

In [96]:
learn = Learner(*get_model(data), loss_func, data)

In [97]:
run = Runner(cbs=[TestCallback()])

In [98]:
%time run.fit(1, learn)

CPU times: user 1.35 s, sys: 40 ms, total: 1.39 s
Wall time: 689 ms


In [99]:
accuracy(learn.model(x_valid), y_valid)

tensor(0.2660)

In [43]:
class AvgStats():
    """Running totals of the loss and of each metric for one phase (train or valid).

    Every batch contributes its loss and metric values multiplied by the batch size, and
    `avg_stats` divides the totals by the number of samples seen.

    metrics:  a metric callable or list of them, each called as `m(run.pred, run.yb)`.
    in_train: True for the training phase; only used to label the `repr`.
    """
    def __init__(self, metrics, in_train):
        self.metrics, self.in_train = listify(metrics), in_train
        # Start from zeroed totals so `repr()` and `count` work before the first `reset()`.
        self.reset()

    def reset(self):
        """Zero the loss total, the sample count and every metric total."""
        self.tot_loss, self.count = 0., 0
        self.tot_mets = [0.] * len(self.metrics)

    @property
    def all_stats(self):
        """`[total loss as a Python number] + metric totals`."""
        # `tot_loss` is a plain float right after `reset()`; after `accumulate` it is whatever
        # `run.loss * bn` produced (a tensor in this notebook), which is unwrapped with `.item()`.
        loss = self.tot_loss.item() if hasattr(self.tot_loss, 'item') else self.tot_loss
        return [loss] + self.tot_mets
    @property
    def avg_stats(self):
        """Per-sample averages of `all_stats`."""
        return [o / self.count for o in self.all_stats]

    def __repr__(self):
        # Nothing accumulated yet: show an empty string rather than dividing by zero.
        if not self.count: return ''
        return f'{"train" if self.in_train else "valid"}: {self.avg_stats}'

    def accumulate(self, run):
        """Add the current batch of `run` (reads `xb`, `yb`, `pred`, `loss`) to the totals."""
        bn = run.xb.shape[0]
        self.tot_loss += run.loss * bn
        self.count += bn
        for i, m in enumerate(self.metrics):
            self.tot_mets[i] += m(run.pred, run.yb) * bn

In [44]:
class AvgStatsCallback(Callback):
    """Collect loss/metric averages separately for training and validation and print both after each epoch."""
    def __init__(self, metrics):
        self.train_stats = AvgStats(metrics, True)
        self.valid_stats = AvgStats(metrics, False)

    def begin_epoch(self):
        # Fresh totals for the new epoch.
        for stats in (self.train_stats, self.valid_stats): stats.reset()

    def after_loss(self):
        # Route the batch to the accumulator of the phase the runner is currently in.
        if self.in_train: stats = self.train_stats
        else:             stats = self.valid_stats
        with torch.no_grad(): stats.accumulate(self.run)

    def after_epoch(self):
        for stats in (self.train_stats, self.valid_stats): print(stats)

In [45]:
learn = Learner(*get_model(data), loss_func, data)

In [50]:
stats = AvgStatsCallback([accuracy])

In [51]:
run = Runner(cbs=stats)

In [52]:
run.fit(3, learn)

train: [0.37213893229166667, tensor(0.8868)]
valid: [0.299082373046875, tensor(0.9064)]
train: [0.25218958333333336, tensor(0.9265)]
valid: [0.224819775390625, tensor(0.9331)]
train: [0.23099016927083332, tensor(0.9322)]
valid: [0.24141611328125, tensor(0.9321)]


In [60]:
learn = Learner(*get_model(data), loss_func, data)

In [61]:
from functools import partial

In [65]:
acc_cbf = partial(AvgStatsCallback, accuracy)

In [68]:
acc_cbf()

<__main__.AvgStatsCallback at 0x7f5a027ebe20>

In [66]:
acc_cbf().name

'avg_stats'

In [56]:
run = Runner(cb_funcs=acc_cbf)

In [57]:
run.fit(3, learn)

train: [0.36030413411458334, tensor(0.8889)]
valid: [0.277065673828125, tensor(0.9191)]
train: [0.23399440104166666, tensor(0.9315)]
valid: [0.2279352783203125, tensor(0.9354)]
train: [0.21418986002604168, tensor(0.9358)]
valid: [0.2210769775390625, tensor(0.9350)]


In [71]:
run.avg_stats.valid_stats

valid: [0.2210769775390625, tensor(0.9350)]

In [72]:
run.avg_stats.valid_stats.avg_stats

[0.2210769775390625, tensor(0.9350)]