In [None]:
#default_exp TrainModels

In [None]:
#export
#hide
import os

import sys
sys.path.append("..")

from hephaestus.DatasetConstruction import *
from hephaestus.HephaestusModel import *

# TrainModels

> Scripts for training models with various parameters.

In [None]:
#export
#hide
# Root folder that holds every trained model. This is a relative path:
# the "models" folder inside the parent directory.
MODEL_BASE_DIR = os.path.join(os.pardir, "models")

In [None]:
#export
#hide
# Name of the sub-folder of MODEL_BASE_DIR used for models trained with the
# default parameters.
DEFAULT_PARAMS_DIR = "default_params"

# Shared prefix of every default-parameter model directory (private helper value).
_DEFAULT_PARAMS_ROOT = os.path.join(MODEL_BASE_DIR, DEFAULT_PARAMS_DIR)

# Directory of each default-parameter model, one per model variant.
MODEL_DEFAULT_CONTROL = os.path.join(_DEFAULT_PARAMS_ROOT, "control")
MODEL_DEFAULT_BASIC = os.path.join(_DEFAULT_PARAMS_ROOT, "basic_ops")
MODEL_DEFAULT_STRICT = os.path.join(_DEFAULT_PARAMS_ROOT, "strict_ops")
MODEL_DEFAULT_LOOSE = os.path.join(_DEFAULT_PARAMS_ROOT, "loose_ops")

## Default parameters

These models are trained with the default parameters, which match the configuration of [Tufano et al.'s](https://arxiv.org/pdf/1812.08693.pdf) highest-performing model as closely as possible. Refer to `HephaestusModel.train` for more information on what the default parameters are.

### Model paths

| Variable name           | Value                                   |
| :---------------------- | :-------------------------------------- |
| `MODEL_DEFAULT_CONTROL` | `"../models/default_params/control"`    |
| `MODEL_DEFAULT_BASIC`   | `"../models/default_params/basic_ops"`  |
| `MODEL_DEFAULT_STRICT`  | `"../models/default_params/strict_ops"` |
| `MODEL_DEFAULT_LOOSE`   | `"../models/default_params/loose_ops"`  |

### Models

**Control -- train only on AbstractMethods (no EditOperations):**

In [None]:
#collapse_output
# Control model: built on the MODEL_DEFAULT_CONTROL directory and trained with
# only the four corpus paths below (no other arguments are passed to train()).
# Per the log output of this cell, the vocab files and checkpoints are written
# under ../models/default_params/control/.
modelDefaultControl = HephaestusModel(MODEL_DEFAULT_CONTROL)
modelDefaultControl.train(
    DATA_SMALL_METHODS_TRAIN_BUGGY,  # training source  (train_buggy.txt in the log)
    DATA_SMALL_METHODS_TRAIN_FIXED,  # training target  (train_fixed.txt in the log)
    DATA_SMALL_METHODS_VALID_BUGGY,  # validation source (valid_buggy.txt in the log)
    DATA_SMALL_METHODS_VALID_FIXED   # validation target (valid_fixed.txt in the log)
)

[2021-04-23 00:53:06,526 INFO] Counter vocab from -1 samples.
[2021-04-23 00:53:06,526 INFO] n_sample=-1: Build vocab on full datasets.
[2021-04-23 00:53:06,530 INFO] corpus_1's transforms: TransformPipe()
[2021-04-23 00:53:06,530 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/abstract_methods/train_fixed.txt, align=None)...
[2021-04-23 00:53:07,131 INFO] Counters src:429
[2021-04-23 00:53:07,131 INFO] Counters tgt:423
[2021-04-23 00:53:07,607 INFO] Parsed 2 corpora from -data.
[2021-04-23 00:53:07,607 INFO] Get special vocabs from Transforms: {'src': set(), 'tgt': set()}.
[2021-04-23 00:53:07,607 INFO] Loading vocab from text file...
[2021-04-23 00:53:07,607 INFO] Loading src vocabulary from ../models/default_params/control/save_data.vocab.src
[2021-04-23 00:53:07,608 INFO] Loaded src vocab has 429 tokens.
[2021-04-23 00:53:07,608 INFO] Loading tgt vocabulary from ../models/default_params/control/save_data.vocab.tgt
[2021-04-23 00:53:07,610 

[2021-04-23 00:59:22,383 INFO] Step 1850/50000; acc:  69.72; ppl:  3.33; xent: 1.20; lr: 0.00010; 10012/9420 tok/s;    374 sec
[2021-04-23 00:59:32,488 INFO] Step 1900/50000; acc:  70.28; ppl:  3.26; xent: 1.18; lr: 0.00010; 9877/9349 tok/s;    384 sec
[2021-04-23 00:59:42,801 INFO] Step 1950/50000; acc:  70.21; ppl:  3.26; xent: 1.18; lr: 0.00010; 10059/9415 tok/s;    394 sec
[2021-04-23 00:59:52,819 INFO] Step 2000/50000; acc:  71.12; ppl:  3.14; xent: 1.14; lr: 0.00010; 10085/9574 tok/s;    404 sec
[2021-04-23 01:00:03,041 INFO] Step 2050/50000; acc:  71.07; ppl:  3.15; xent: 1.15; lr: 0.00010; 10184/9492 tok/s;    414 sec
[2021-04-23 01:00:12,853 INFO] Step 2100/50000; acc:  72.13; ppl:  3.03; xent: 1.11; lr: 0.00010; 10058/9505 tok/s;    424 sec
[2021-04-23 01:00:22,949 INFO] Step 2150/50000; acc:  71.92; ppl:  3.01; xent: 1.10; lr: 0.00010; 10107/9544 tok/s;    434 sec
[2021-04-23 01:00:28,201 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/sm

[2021-04-23 01:09:27,726 INFO] Step 4850/50000; acc:  86.70; ppl:  1.78; xent: 0.57; lr: 0.00010; 9971/9447 tok/s;    979 sec
[2021-04-23 01:09:37,983 INFO] Step 4900/50000; acc:  86.83; ppl:  1.76; xent: 0.57; lr: 0.00010; 10151/9559 tok/s;    989 sec
[2021-04-23 01:09:47,855 INFO] Step 4950/50000; acc:  86.82; ppl:  1.75; xent: 0.56; lr: 0.00010; 10199/9634 tok/s;    999 sec
[2021-04-23 01:09:57,949 INFO] Step 5000/50000; acc:  87.12; ppl:  1.73; xent: 0.55; lr: 0.00010; 10121/9487 tok/s;   1009 sec
[2021-04-23 01:09:57,949 INFO] valid's transforms: TransformPipe()
[2021-04-23 01:09:57,952 INFO] Loading ParallelCorpus(../data/small/abstract_methods/valid_buggy.txt, ../data/small/abstract_methods/valid_fixed.txt, align=None)...
[2021-04-23 01:10:07,594 INFO] Validation perplexity: 1.65393
[2021-04-23 01:10:07,594 INFO] Validation accuracy: 88.5469
[2021-04-23 01:10:07,596 INFO] Saving checkpoint ../models/default_params/control/model_step_5000.pt
[2021-04-23 01:10:18,329 INFO] Step 50

[2021-04-23 01:19:03,014 INFO] Step 7650/50000; acc:  90.92; ppl:  1.49; xent: 0.40; lr: 0.00010; 10231/9577 tok/s;   1554 sec
[2021-04-23 01:19:12,968 INFO] Step 7700/50000; acc:  90.51; ppl:  1.51; xent: 0.41; lr: 0.00010; 9940/9449 tok/s;   1564 sec
[2021-04-23 01:19:23,125 INFO] Step 7750/50000; acc:  90.86; ppl:  1.50; xent: 0.41; lr: 0.00010; 10112/9551 tok/s;   1574 sec
[2021-04-23 01:19:33,245 INFO] Step 7800/50000; acc:  90.87; ppl:  1.50; xent: 0.40; lr: 0.00010; 10017/9427 tok/s;   1584 sec
[2021-04-23 01:19:43,185 INFO] Step 7850/50000; acc:  90.74; ppl:  1.50; xent: 0.40; lr: 0.00010; 10128/9600 tok/s;   1594 sec
[2021-04-23 01:19:53,360 INFO] Step 7900/50000; acc:  90.88; ppl:  1.49; xent: 0.40; lr: 0.00010; 10228/9543 tok/s;   1605 sec
[2021-04-23 01:20:03,310 INFO] Step 7950/50000; acc:  91.12; ppl:  1.48; xent: 0.39; lr: 0.00010; 9963/9382 tok/s;   1614 sec
[2021-04-23 01:20:13,510 INFO] Step 8000/50000; acc:  90.77; ppl:  1.50; xent: 0.41; lr: 0.00010; 10147/9537 tok/

[2021-04-23 01:28:48,110 INFO] Step 10500/50000; acc:  92.22; ppl:  1.41; xent: 0.35; lr: 0.00010; 10136/9573 tok/s;   2139 sec
[2021-04-23 01:28:58,302 INFO] Step 10550/50000; acc:  92.34; ppl:  1.40; xent: 0.34; lr: 0.00010; 10021/9429 tok/s;   2149 sec
[2021-04-23 01:29:08,372 INFO] Step 10600/50000; acc:  91.97; ppl:  1.42; xent: 0.35; lr: 0.00010; 10093/9498 tok/s;   2160 sec
[2021-04-23 01:29:18,580 INFO] Step 10650/50000; acc:  92.07; ppl:  1.42; xent: 0.35; lr: 0.00010; 10049/9471 tok/s;   2170 sec
[2021-04-23 01:29:28,796 INFO] Step 10700/50000; acc:  91.99; ppl:  1.42; xent: 0.35; lr: 0.00010; 9865/9354 tok/s;   2180 sec
[2021-04-23 01:29:38,827 INFO] Step 10750/50000; acc:  92.13; ppl:  1.41; xent: 0.35; lr: 0.00010; 10226/9673 tok/s;   2190 sec
[2021-04-23 01:29:48,833 INFO] Step 10800/50000; acc:  92.30; ppl:  1.41; xent: 0.34; lr: 0.00010; 10187/9544 tok/s;   2200 sec
[2021-04-23 01:29:59,118 INFO] Step 10850/50000; acc:  92.41; ppl:  1.40; xent: 0.34; lr: 0.00010; 10053/

[2021-04-23 01:38:43,268 INFO] Step 13450/50000; acc:  92.94; ppl:  1.36; xent: 0.31; lr: 0.00010; 10001/9464 tok/s;   2734 sec
[2021-04-23 01:38:53,468 INFO] Step 13500/50000; acc:  92.75; ppl:  1.37; xent: 0.31; lr: 0.00010; 10179/9536 tok/s;   2745 sec
[2021-04-23 01:39:03,581 INFO] Step 13550/50000; acc:  92.64; ppl:  1.37; xent: 0.32; lr: 0.00010; 9887/9386 tok/s;   2755 sec
[2021-04-23 01:39:13,833 INFO] Step 13600/50000; acc:  92.75; ppl:  1.37; xent: 0.31; lr: 0.00010; 10130/9502 tok/s;   2765 sec
[2021-04-23 01:39:23,763 INFO] Step 13650/50000; acc:  92.69; ppl:  1.38; xent: 0.32; lr: 0.00010; 9991/9497 tok/s;   2775 sec
[2021-04-23 01:39:33,926 INFO] Step 13700/50000; acc:  92.90; ppl:  1.36; xent: 0.31; lr: 0.00010; 10270/9635 tok/s;   2785 sec
[2021-04-23 01:39:43,936 INFO] Step 13750/50000; acc:  92.74; ppl:  1.36; xent: 0.31; lr: 0.00010; 10026/9434 tok/s;   2795 sec
[2021-04-23 01:39:53,903 INFO] Step 13800/50000; acc:  92.80; ppl:  1.37; xent: 0.31; lr: 0.00010; 10171/9

[2021-04-23 01:48:18,300 INFO] Step 16250/50000; acc:  93.08; ppl:  1.35; xent: 0.30; lr: 0.00010; 10085/9523 tok/s;   3309 sec
[2021-04-23 01:48:28,264 INFO] Step 16300/50000; acc:  92.99; ppl:  1.35; xent: 0.30; lr: 0.00010; 10040/9527 tok/s;   3319 sec
[2021-04-23 01:48:38,560 INFO] Step 16350/50000; acc:  93.20; ppl:  1.34; xent: 0.29; lr: 0.00010; 10079/9493 tok/s;   3330 sec
[2021-04-23 01:48:48,727 INFO] Step 16400/50000; acc:  93.27; ppl:  1.33; xent: 0.29; lr: 0.00010; 10066/9499 tok/s;   3340 sec
[2021-04-23 01:48:59,103 INFO] Step 16450/50000; acc:  93.03; ppl:  1.34; xent: 0.30; lr: 0.00010; 10011/9391 tok/s;   3350 sec
[2021-04-23 01:49:08,979 INFO] Step 16500/50000; acc:  92.99; ppl:  1.35; xent: 0.30; lr: 0.00010; 9989/9472 tok/s;   3360 sec
[2021-04-23 01:49:19,230 INFO] Step 16550/50000; acc:  93.26; ppl:  1.33; xent: 0.29; lr: 0.00010; 10031/9461 tok/s;   3370 sec
[2021-04-23 01:49:29,151 INFO] Step 16600/50000; acc:  93.20; ppl:  1.34; xent: 0.29; lr: 0.00010; 10258/

[2021-04-23 01:58:13,352 INFO] Step 19200/50000; acc:  93.38; ppl:  1.32; xent: 0.28; lr: 0.00010; 10144/9565 tok/s;   3905 sec
[2021-04-23 01:58:23,313 INFO] Step 19250/50000; acc:  93.46; ppl:  1.32; xent: 0.28; lr: 0.00010; 9971/9491 tok/s;   3914 sec
[2021-04-23 01:58:33,717 INFO] Step 19300/50000; acc:  93.59; ppl:  1.32; xent: 0.27; lr: 0.00010; 10113/9489 tok/s;   3925 sec
[2021-04-23 01:58:43,767 INFO] Step 19350/50000; acc:  93.32; ppl:  1.32; xent: 0.28; lr: 0.00010; 10056/9506 tok/s;   3935 sec
[2021-04-23 01:58:53,968 INFO] Step 19400/50000; acc:  93.32; ppl:  1.33; xent: 0.28; lr: 0.00010; 9906/9342 tok/s;   3945 sec
[2021-04-23 01:59:04,257 INFO] Step 19450/50000; acc:  93.46; ppl:  1.32; xent: 0.27; lr: 0.00010; 10010/9393 tok/s;   3955 sec
[2021-04-23 01:59:14,224 INFO] Step 19500/50000; acc:  93.39; ppl:  1.32; xent: 0.28; lr: 0.00010; 10069/9552 tok/s;   3965 sec
[2021-04-23 01:59:24,342 INFO] Step 19550/50000; acc:  93.51; ppl:  1.31; xent: 0.27; lr: 0.00010; 10218/9

[2021-04-23 02:07:48,334 INFO] Step 22000/50000; acc:  93.47; ppl:  1.31; xent: 0.27; lr: 0.00010; 10121/9632 tok/s;   4479 sec
[2021-04-23 02:07:58,585 INFO] Step 22050/50000; acc:  93.56; ppl:  1.31; xent: 0.27; lr: 0.00010; 10110/9505 tok/s;   4490 sec
[2021-04-23 02:08:08,415 INFO] Step 22100/50000; acc:  93.50; ppl:  1.31; xent: 0.27; lr: 0.00010; 10040/9561 tok/s;   4500 sec
[2021-04-23 02:08:18,625 INFO] Step 22150/50000; acc:  93.68; ppl:  1.30; xent: 0.27; lr: 0.00010; 9986/9454 tok/s;   4510 sec
[2021-04-23 02:08:28,853 INFO] Step 22200/50000; acc:  93.76; ppl:  1.30; xent: 0.26; lr: 0.00010; 10054/9483 tok/s;   4520 sec
[2021-04-23 02:08:38,888 INFO] Step 22250/50000; acc:  93.64; ppl:  1.30; xent: 0.26; lr: 0.00010; 10090/9532 tok/s;   4530 sec
[2021-04-23 02:08:49,254 INFO] Step 22300/50000; acc:  93.57; ppl:  1.30; xent: 0.27; lr: 0.00010; 9981/9353 tok/s;   4540 sec
[2021-04-23 02:08:59,276 INFO] Step 22350/50000; acc:  93.70; ppl:  1.30; xent: 0.26; lr: 0.00010; 9978/94

[2021-04-23 02:18:39,489 INFO] Step 25000/50000; acc:  93.82; ppl:  1.29; xent: 0.25; lr: 0.00010; 10144/9573 tok/s;   5131 sec
[2021-04-23 02:18:39,491 INFO] Loading ParallelCorpus(../data/small/abstract_methods/valid_buggy.txt, ../data/small/abstract_methods/valid_fixed.txt, align=None)...
[2021-04-23 02:18:49,130 INFO] Validation perplexity: 1.33406
[2021-04-23 02:18:49,130 INFO] Validation accuracy: 93.46
[2021-04-23 02:18:49,133 INFO] Saving checkpoint ../models/default_params/control/model_step_25000.pt
[2021-04-23 02:18:59,853 INFO] Step 25050/50000; acc:  93.92; ppl:  1.29; xent: 0.25; lr: 0.00010; 4991/4708 tok/s;   5151 sec
[2021-04-23 02:19:09,927 INFO] Step 25100/50000; acc:  93.82; ppl:  1.29; xent: 0.26; lr: 0.00010; 10007/9509 tok/s;   5161 sec
[2021-04-23 02:19:20,194 INFO] Step 25150/50000; acc:  94.13; ppl:  1.28; xent: 0.24; lr: 0.00010; 10209/9586 tok/s;   5171 sec
[2021-04-23 02:19:30,326 INFO] Step 25200/50000; acc:  93.61; ppl:  1.29; xent: 0.26; lr: 0.00010; 998

[2021-04-23 02:29:56,062 INFO] Step 27850/50000; acc:  93.88; ppl:  1.28; xent: 0.25; lr: 0.00010; 10117/9606 tok/s;   5807 sec
[2021-04-23 02:30:06,188 INFO] Step 27900/50000; acc:  94.00; ppl:  1.27; xent: 0.24; lr: 0.00010; 10184/9598 tok/s;   5817 sec
[2021-04-23 02:30:16,207 INFO] Step 27950/50000; acc:  93.92; ppl:  1.28; xent: 0.25; lr: 0.00010; 9935/9486 tok/s;   5827 sec
[2021-04-23 02:30:26,317 INFO] Step 28000/50000; acc:  94.14; ppl:  1.27; xent: 0.24; lr: 0.00010; 10201/9580 tok/s;   5837 sec
[2021-04-23 02:30:36,488 INFO] Step 28050/50000; acc:  94.14; ppl:  1.27; xent: 0.24; lr: 0.00010; 9958/9434 tok/s;   5848 sec
[2021-04-23 02:30:46,759 INFO] Step 28100/50000; acc:  94.05; ppl:  1.27; xent: 0.24; lr: 0.00010; 10149/9511 tok/s;   5858 sec
[2021-04-23 02:30:56,773 INFO] Step 28150/50000; acc:  93.98; ppl:  1.28; xent: 0.24; lr: 0.00010; 10015/9495 tok/s;   5868 sec
[2021-04-23 02:31:07,045 INFO] Step 28200/50000; acc:  94.09; ppl:  1.27; xent: 0.24; lr: 0.00010; 9944/93

[2021-04-23 02:39:31,093 INFO] Step 30650/50000; acc:  94.18; ppl:  1.26; xent: 0.23; lr: 0.00010; 10121/9547 tok/s;   6382 sec
[2021-04-23 02:39:41,192 INFO] Step 30700/50000; acc:  94.23; ppl:  1.27; xent: 0.24; lr: 0.00010; 10012/9388 tok/s;   6392 sec
[2021-04-23 02:39:51,151 INFO] Step 30750/50000; acc:  94.13; ppl:  1.26; xent: 0.23; lr: 0.00010; 10293/9758 tok/s;   6402 sec
[2021-04-23 02:40:01,279 INFO] Step 30800/50000; acc:  94.08; ppl:  1.27; xent: 0.24; lr: 0.00010; 9921/9420 tok/s;   6412 sec
[2021-04-23 02:40:11,548 INFO] Step 30850/50000; acc:  94.21; ppl:  1.26; xent: 0.23; lr: 0.00010; 10080/9499 tok/s;   6423 sec
[2021-04-23 02:40:21,362 INFO] Step 30900/50000; acc:  93.98; ppl:  1.27; xent: 0.24; lr: 0.00010; 10021/9520 tok/s;   6433 sec
[2021-04-23 02:40:31,705 INFO] Step 30950/50000; acc:  94.44; ppl:  1.25; xent: 0.22; lr: 0.00010; 10051/9478 tok/s;   6443 sec
[2021-04-23 02:40:41,791 INFO] Step 31000/50000; acc:  94.30; ppl:  1.26; xent: 0.23; lr: 0.00010; 10146/

[2021-04-23 02:49:25,887 INFO] Step 33600/50000; acc:  94.50; ppl:  1.25; xent: 0.22; lr: 0.00010; 10173/9568 tok/s;   6977 sec
[2021-04-23 02:49:35,747 INFO] Step 33650/50000; acc:  94.29; ppl:  1.25; xent: 0.23; lr: 0.00010; 10051/9525 tok/s;   6987 sec
[2021-04-23 02:49:45,892 INFO] Step 33700/50000; acc:  94.37; ppl:  1.25; xent: 0.22; lr: 0.00010; 10226/9702 tok/s;   6997 sec
[2021-04-23 02:49:55,893 INFO] Step 33750/50000; acc:  94.27; ppl:  1.26; xent: 0.23; lr: 0.00010; 9999/9436 tok/s;   7007 sec
[2021-04-23 02:50:05,930 INFO] Step 33800/50000; acc:  94.37; ppl:  1.25; xent: 0.22; lr: 0.00010; 10104/9605 tok/s;   7017 sec
[2021-04-23 02:50:16,165 INFO] Step 33850/50000; acc:  94.44; ppl:  1.25; xent: 0.22; lr: 0.00010; 10054/9492 tok/s;   7027 sec
[2021-04-23 02:50:26,275 INFO] Step 33900/50000; acc:  94.51; ppl:  1.24; xent: 0.22; lr: 0.00010; 10048/9491 tok/s;   7037 sec
[2021-04-23 02:50:36,567 INFO] Step 33950/50000; acc:  94.27; ppl:  1.25; xent: 0.22; lr: 0.00010; 10059/

[2021-04-23 02:59:11,104 INFO] Step 36450/50000; acc:  94.51; ppl:  1.24; xent: 0.22; lr: 0.00010; 10127/9504 tok/s;   7562 sec
[2021-04-23 02:59:20,998 INFO] Step 36500/50000; acc:  94.55; ppl:  1.24; xent: 0.21; lr: 0.00010; 10017/9455 tok/s;   7572 sec
[2021-04-23 02:59:31,240 INFO] Step 36550/50000; acc:  94.57; ppl:  1.24; xent: 0.22; lr: 0.00010; 10057/9473 tok/s;   7582 sec
[2021-04-23 02:59:41,079 INFO] Step 36600/50000; acc:  94.45; ppl:  1.24; xent: 0.22; lr: 0.00010; 10210/9761 tok/s;   7592 sec
[2021-04-23 02:59:51,186 INFO] Step 36650/50000; acc:  94.51; ppl:  1.24; xent: 0.22; lr: 0.00010; 9934/9335 tok/s;   7602 sec
[2021-04-23 03:00:01,338 INFO] Step 36700/50000; acc:  94.59; ppl:  1.24; xent: 0.21; lr: 0.00010; 10156/9614 tok/s;   7613 sec
[2021-04-23 03:00:11,338 INFO] Step 36750/50000; acc:  94.50; ppl:  1.24; xent: 0.22; lr: 0.00010; 9978/9478 tok/s;   7623 sec
[2021-04-23 03:00:21,628 INFO] Step 36800/50000; acc:  94.70; ppl:  1.23; xent: 0.21; lr: 0.00010; 10169/9

[2021-04-23 03:09:05,825 INFO] Step 39400/50000; acc:  94.69; ppl:  1.23; xent: 0.21; lr: 0.00010; 10162/9582 tok/s;   8157 sec
[2021-04-23 03:09:15,926 INFO] Step 39450/50000; acc:  94.81; ppl:  1.23; xent: 0.20; lr: 0.00010; 10151/9552 tok/s;   8167 sec
[2021-04-23 03:09:25,825 INFO] Step 39500/50000; acc:  94.60; ppl:  1.23; xent: 0.21; lr: 0.00010; 10066/9555 tok/s;   8177 sec
[2021-04-23 03:09:35,984 INFO] Step 39550/50000; acc:  94.66; ppl:  1.23; xent: 0.21; lr: 0.00010; 10135/9554 tok/s;   8187 sec
[2021-04-23 03:09:46,014 INFO] Step 39600/50000; acc:  94.63; ppl:  1.23; xent: 0.21; lr: 0.00010; 10054/9571 tok/s;   8197 sec
[2021-04-23 03:09:56,170 INFO] Step 39650/50000; acc:  94.83; ppl:  1.22; xent: 0.20; lr: 0.00010; 10129/9516 tok/s;   8207 sec
[2021-04-23 03:10:06,203 INFO] Step 39700/50000; acc:  94.72; ppl:  1.23; xent: 0.21; lr: 0.00010; 9970/9520 tok/s;   8217 sec
[2021-04-23 03:10:16,359 INFO] Step 39750/50000; acc:  94.79; ppl:  1.22; xent: 0.20; lr: 0.00010; 10217/

[2021-04-23 03:18:55,454 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/abstract_methods/train_fixed.txt, align=None)...
[2021-04-23 03:19:01,020 INFO] Step 42300/50000; acc:  94.85; ppl:  1.22; xent: 0.20; lr: 0.00010; 10189/9555 tok/s;   8752 sec
[2021-04-23 03:19:11,065 INFO] Step 42350/50000; acc:  94.86; ppl:  1.22; xent: 0.20; lr: 0.00010; 9986/9503 tok/s;   8762 sec
[2021-04-23 03:19:21,092 INFO] Step 42400/50000; acc:  94.92; ppl:  1.21; xent: 0.19; lr: 0.00010; 10269/9616 tok/s;   8772 sec
[2021-04-23 03:19:30,913 INFO] Step 42450/50000; acc:  94.63; ppl:  1.23; xent: 0.21; lr: 0.00010; 10064/9622 tok/s;   8782 sec
[2021-04-23 03:19:41,135 INFO] Step 42500/50000; acc:  94.88; ppl:  1.22; xent: 0.20; lr: 0.00010; 10184/9585 tok/s;   8792 sec
[2021-04-23 03:19:51,034 INFO] Step 42550/50000; acc:  94.82; ppl:  1.22; xent: 0.20; lr: 0.00010; 10068/9513 tok/s;   8802 sec
[2021-04-23 03:20:01,193 INFO] Step 42600/50000; acc:  94.84; ppl:  

[2021-04-23 03:28:36,612 INFO] Step 45100/50000; acc:  95.10; ppl:  1.20; xent: 0.18; lr: 0.00010; 10058/9468 tok/s;   9328 sec
[2021-04-23 03:28:46,695 INFO] Step 45150/50000; acc:  95.08; ppl:  1.21; xent: 0.19; lr: 0.00010; 10170/9474 tok/s;   9338 sec
[2021-04-23 03:28:56,711 INFO] Step 45200/50000; acc:  94.82; ppl:  1.21; xent: 0.19; lr: 0.00010; 10082/9572 tok/s;   9348 sec
[2021-04-23 03:28:59,946 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/abstract_methods/train_fixed.txt, align=None)...
[2021-04-23 03:29:06,975 INFO] Step 45250/50000; acc:  95.09; ppl:  1.21; xent: 0.19; lr: 0.00010; 10109/9481 tok/s;   9358 sec
[2021-04-23 03:29:16,806 INFO] Step 45300/50000; acc:  95.07; ppl:  1.21; xent: 0.19; lr: 0.00010; 10088/9570 tok/s;   9368 sec
[2021-04-23 03:29:26,841 INFO] Step 45350/50000; acc:  94.98; ppl:  1.21; xent: 0.19; lr: 0.00010; 10181/9636 tok/s;   9378 sec
[2021-04-23 03:29:36,850 INFO] Step 45400/50000; acc:  94.96; ppl: 

[2021-04-23 03:38:31,726 INFO] Step 48050/50000; acc:  95.07; ppl:  1.20; xent: 0.19; lr: 0.00010; 10059/9472 tok/s;   9923 sec
[2021-04-23 03:38:41,956 INFO] Step 48100/50000; acc:  95.16; ppl:  1.20; xent: 0.18; lr: 0.00010; 10130/9543 tok/s;   9933 sec
[2021-04-23 03:38:47,544 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/abstract_methods/train_fixed.txt, align=None)...
[2021-04-23 03:38:51,929 INFO] Step 48150/50000; acc:  95.17; ppl:  1.20; xent: 0.18; lr: 0.00010; 10070/9503 tok/s;   9943 sec
[2021-04-23 03:39:02,128 INFO] Step 48200/50000; acc:  95.15; ppl:  1.20; xent: 0.18; lr: 0.00010; 10061/9436 tok/s;   9953 sec
[2021-04-23 03:39:12,065 INFO] Step 48250/50000; acc:  95.12; ppl:  1.20; xent: 0.18; lr: 0.00010; 10221/9679 tok/s;   9963 sec
[2021-04-23 03:39:22,095 INFO] Step 48300/50000; acc:  95.11; ppl:  1.20; xent: 0.19; lr: 0.00010; 9957/9476 tok/s;   9973 sec
[2021-04-23 03:39:32,315 INFO] Step 48350/50000; acc:  95.16; ppl:  

**Train on basic condensed EditOperations:**

In [None]:
#collapse_output
# Basic-ops model: built on the MODEL_DEFAULT_BASIC directory and trained with
# only the four corpus paths below (no other arguments are passed to train()).
# The source side is the same buggy abstract methods as the control model; the
# target side is the basic edit-operations corpus. Per the log output of this
# cell, the vocab files and checkpoints are written under
# ../models/default_params/basic_ops/.
modelBasicDefault = HephaestusModel(MODEL_DEFAULT_BASIC)
modelBasicDefault.train(
    DATA_SMALL_METHODS_TRAIN_BUGGY,  # training source  (abstract_methods/train_buggy.txt in the log)
    DATA_SMALL_OPS_BASIC_TRAIN,      # training target  (edit_ops/basic/train.txt in the log)
    DATA_SMALL_METHODS_VALID_BUGGY,  # validation source (abstract_methods/valid_buggy.txt in the log)
    DATA_SMALL_OPS_BASIC_VALID       # validation target (edit_ops/basic/valid.txt in the log)
)

[2021-04-24 05:10:12,077 INFO] Counter vocab from -1 samples.
[2021-04-24 05:10:12,077 INFO] n_sample=-1: Build vocab on full datasets.
[2021-04-24 05:10:12,088 INFO] corpus_1's transforms: TransformPipe()
[2021-04-24 05:10:12,089 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/edit_ops/basic/train.txt, align=None)...
[2021-04-24 05:10:13,192 INFO] Counters src:429
[2021-04-24 05:10:13,192 INFO] Counters tgt:438
[2021-04-24 05:10:13,907 INFO] Parsed 2 corpora from -data.
[2021-04-24 05:10:13,907 INFO] Get special vocabs from Transforms: {'src': set(), 'tgt': set()}.
[2021-04-24 05:10:13,907 INFO] Loading vocab from text file...
[2021-04-24 05:10:13,907 INFO] Loading src vocabulary from ../models/default_params/basic_ops/save_data.vocab.src
[2021-04-24 05:10:13,908 INFO] Loaded src vocab has 429 tokens.
[2021-04-24 05:10:13,909 INFO] Loading tgt vocabulary from ../models/default_params/basic_ops/save_data.vocab.tgt
[2021-04-24 05:10:13,910 INFO

[2021-04-24 05:22:37,414 INFO] Step 1900/50000; acc:  85.29; ppl:  1.83; xent: 0.60; lr: 0.00010; 5059/6408 tok/s;    741 sec
[2021-04-24 05:22:57,874 INFO] Step 1950/50000; acc:  84.69; ppl:  1.88; xent: 0.63; lr: 0.00010; 4959/6286 tok/s;    761 sec
[2021-04-24 05:23:17,063 INFO] Step 2000/50000; acc:  84.85; ppl:  1.86; xent: 0.62; lr: 0.00010; 5267/6449 tok/s;    781 sec
[2021-04-24 05:23:36,754 INFO] Step 2050/50000; acc:  85.41; ppl:  1.82; xent: 0.60; lr: 0.00010; 5263/6546 tok/s;    800 sec
[2021-04-24 05:23:55,492 INFO] Step 2100/50000; acc:  85.45; ppl:  1.82; xent: 0.60; lr: 0.00010; 5365/6768 tok/s;    819 sec
[2021-04-24 05:24:14,977 INFO] Step 2150/50000; acc:  85.71; ppl:  1.80; xent: 0.59; lr: 0.00010; 5160/6605 tok/s;    839 sec
[2021-04-24 05:24:25,049 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/edit_ops/basic/train.txt, align=None)...
[2021-04-24 05:24:34,273 INFO] Step 2200/50000; acc:  85.66; ppl:  1.80; xent: 0.59; lr

[2021-04-24 05:42:27,921 INFO] Step 4950/50000; acc:  87.71; ppl:  1.64; xent: 0.50; lr: 0.00010; 5289/6523 tok/s;   1931 sec
[2021-04-24 05:42:47,201 INFO] Step 5000/50000; acc:  88.29; ppl:  1.61; xent: 0.48; lr: 0.00010; 5235/6669 tok/s;   1951 sec
[2021-04-24 05:42:47,202 INFO] valid's transforms: TransformPipe()
[2021-04-24 05:42:47,203 INFO] Loading ParallelCorpus(../data/small/abstract_methods/valid_buggy.txt, ../data/small/edit_ops/basic/valid.txt, align=None)...
[2021-04-24 05:43:15,422 INFO] Validation perplexity: 1.59687
[2021-04-24 05:43:15,422 INFO] Validation accuracy: 88.4028
[2021-04-24 05:43:15,426 INFO] Saving checkpoint ../models/default_params/basic_ops/model_step_5000.pt
[2021-04-24 05:43:34,970 INFO] Step 5050/50000; acc:  88.22; ppl:  1.62; xent: 0.48; lr: 0.00010; 2129/2692 tok/s;   1999 sec
[2021-04-24 05:43:49,406 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/edit_ops/basic/train.txt, align=None)...
[2021-04-24 05:4

[2021-04-24 06:01:27,227 INFO] Step 7800/50000; acc:  88.83; ppl:  1.56; xent: 0.45; lr: 0.00010; 5081/6388 tok/s;   3071 sec
[2021-04-24 06:01:46,887 INFO] Step 7850/50000; acc:  88.77; ppl:  1.56; xent: 0.45; lr: 0.00010; 5181/6400 tok/s;   3090 sec
[2021-04-24 06:02:06,141 INFO] Step 7900/50000; acc:  89.24; ppl:  1.54; xent: 0.43; lr: 0.00010; 5339/6685 tok/s;   3110 sec
[2021-04-24 06:02:25,230 INFO] Step 7950/50000; acc:  89.15; ppl:  1.54; xent: 0.43; lr: 0.00010; 5216/6648 tok/s;   3129 sec
[2021-04-24 06:02:44,591 INFO] Step 8000/50000; acc:  89.08; ppl:  1.54; xent: 0.43; lr: 0.00010; 5262/6637 tok/s;   3148 sec
[2021-04-24 06:02:44,604 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/edit_ops/basic/train.txt, align=None)...
[2021-04-24 06:03:03,747 INFO] Step 8050/50000; acc:  89.07; ppl:  1.55; xent: 0.44; lr: 0.00010; 5259/6648 tok/s;   3167 sec
[2021-04-24 06:03:23,493 INFO] Step 8100/50000; acc:  89.08; ppl:  1.55; xent: 0.44; lr

[2021-04-24 06:20:27,299 INFO] Step 10650/50000; acc:  89.48; ppl:  1.51; xent: 0.41; lr: 0.00010; 5172/6406 tok/s;   4211 sec
[2021-04-24 06:20:47,435 INFO] Step 10700/50000; acc:  89.62; ppl:  1.50; xent: 0.41; lr: 0.00010; 5070/6561 tok/s;   4231 sec
[2021-04-24 06:21:06,774 INFO] Step 10750/50000; acc:  89.14; ppl:  1.53; xent: 0.43; lr: 0.00010; 5194/6380 tok/s;   4250 sec
[2021-04-24 06:21:25,738 INFO] Step 10800/50000; acc:  89.68; ppl:  1.50; xent: 0.40; lr: 0.00010; 5382/6672 tok/s;   4269 sec
[2021-04-24 06:21:45,367 INFO] Step 10850/50000; acc:  90.01; ppl:  1.49; xent: 0.40; lr: 0.00010; 5238/6670 tok/s;   4289 sec
[2021-04-24 06:22:04,548 INFO] Step 10900/50000; acc:  89.40; ppl:  1.51; xent: 0.42; lr: 0.00010; 5236/6560 tok/s;   4308 sec
[2021-04-24 06:22:09,328 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/edit_ops/basic/train.txt, align=None)...
[2021-04-24 06:22:24,060 INFO] Step 10950/50000; acc:  89.74; ppl:  1.50; xent: 0

[2021-04-24 06:39:58,279 INFO] Step 13650/50000; acc:  89.78; ppl:  1.49; xent: 0.40; lr: 0.00010; 5129/6504 tok/s;   5382 sec
[2021-04-24 06:40:18,090 INFO] Step 13700/50000; acc:  89.92; ppl:  1.48; xent: 0.39; lr: 0.00010; 5275/6484 tok/s;   5402 sec
[2021-04-24 06:40:36,980 INFO] Step 13750/50000; acc:  90.10; ppl:  1.47; xent: 0.38; lr: 0.00010; 5331/6680 tok/s;   5421 sec
[2021-04-24 06:40:55,973 INFO] Step 13800/50000; acc:  90.12; ppl:  1.47; xent: 0.39; lr: 0.00010; 5276/6733 tok/s;   5440 sec
[2021-04-24 06:41:15,124 INFO] Step 13850/50000; acc:  89.81; ppl:  1.48; xent: 0.39; lr: 0.00010; 5365/6682 tok/s;   5459 sec
[2021-04-24 06:41:17,503 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/edit_ops/basic/train.txt, align=None)...
[2021-04-24 06:41:34,718 INFO] Step 13900/50000; acc:  90.14; ppl:  1.47; xent: 0.39; lr: 0.00010; 5211/6618 tok/s;   5478 sec
[2021-04-24 06:41:53,964 INFO] Step 13950/50000; acc:  89.70; ppl:  1.49; xent: 0

[2021-04-24 06:58:59,059 INFO] Step 16500/50000; acc:  90.40; ppl:  1.44; xent: 0.37; lr: 0.00010; 5031/6461 tok/s;   6523 sec
[2021-04-24 06:59:18,487 INFO] Step 16550/50000; acc:  90.03; ppl:  1.47; xent: 0.38; lr: 0.00010; 5218/6463 tok/s;   6542 sec
[2021-04-24 06:59:37,662 INFO] Step 16600/50000; acc:  89.91; ppl:  1.47; xent: 0.39; lr: 0.00010; 5370/6587 tok/s;   6561 sec
[2021-04-24 06:59:57,037 INFO] Step 16650/50000; acc:  90.44; ppl:  1.44; xent: 0.37; lr: 0.00010; 5258/6515 tok/s;   6581 sec
[2021-04-24 07:00:15,759 INFO] Step 16700/50000; acc:  90.60; ppl:  1.44; xent: 0.37; lr: 0.00010; 5436/7046 tok/s;   6599 sec
[2021-04-24 07:00:35,052 INFO] Step 16750/50000; acc:  90.01; ppl:  1.46; xent: 0.38; lr: 0.00010; 5181/6536 tok/s;   6619 sec
[2021-04-24 07:00:41,945 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/edit_ops/basic/train.txt, align=None)...
[2021-04-24 07:00:54,807 INFO] Step 16800/50000; acc:  90.29; ppl:  1.45; xent: 0

[2021-04-24 07:18:29,687 INFO] Step 19500/50000; acc:  90.31; ppl:  1.44; xent: 0.37; lr: 0.00010; 5283/6520 tok/s;   7693 sec
[2021-04-24 07:18:49,367 INFO] Step 19550/50000; acc:  90.45; ppl:  1.44; xent: 0.36; lr: 0.00010; 5146/6453 tok/s;   7713 sec
[2021-04-24 07:19:07,990 INFO] Step 19600/50000; acc:  90.67; ppl:  1.43; xent: 0.36; lr: 0.00010; 5442/6885 tok/s;   7732 sec
[2021-04-24 07:19:27,479 INFO] Step 19650/50000; acc:  90.64; ppl:  1.43; xent: 0.36; lr: 0.00010; 5249/6599 tok/s;   7751 sec
[2021-04-24 07:19:38,880 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/edit_ops/basic/train.txt, align=None)...
[2021-04-24 07:19:46,648 INFO] Step 19700/50000; acc:  90.39; ppl:  1.44; xent: 0.37; lr: 0.00010; 5278/6704 tok/s;   7770 sec
[2021-04-24 07:20:06,201 INFO] Step 19750/50000; acc:  90.58; ppl:  1.44; xent: 0.36; lr: 0.00010; 5204/6522 tok/s;   7790 sec
[2021-04-24 07:20:24,745 INFO] Step 19800/50000; acc:  90.20; ppl:  1.45; xent: 0

[2021-04-24 07:37:28,198 INFO] Step 22350/50000; acc:  90.66; ppl:  1.42; xent: 0.35; lr: 0.00010; 5140/6658 tok/s;   8832 sec
[2021-04-24 07:37:47,434 INFO] Step 22400/50000; acc:  90.57; ppl:  1.43; xent: 0.36; lr: 0.00010; 5292/6470 tok/s;   8851 sec
[2021-04-24 07:38:07,115 INFO] Step 22450/50000; acc:  90.60; ppl:  1.43; xent: 0.35; lr: 0.00010; 5145/6404 tok/s;   8871 sec
[2021-04-24 07:38:26,480 INFO] Step 22500/50000; acc:  91.12; ppl:  1.41; xent: 0.34; lr: 0.00010; 5411/6814 tok/s;   8890 sec
[2021-04-24 07:38:45,941 INFO] Step 22550/50000; acc:  90.86; ppl:  1.41; xent: 0.35; lr: 0.00010; 5120/6526 tok/s;   8909 sec
[2021-04-24 07:39:01,912 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/edit_ops/basic/train.txt, align=None)...
[2021-04-24 07:39:05,194 INFO] Step 22600/50000; acc:  90.80; ppl:  1.41; xent: 0.35; lr: 0.00010; 5233/6545 tok/s;   8929 sec
[2021-04-24 07:39:24,368 INFO] Step 22650/50000; acc:  90.58; ppl:  1.43; xent: 0

[2021-04-24 07:56:28,681 INFO] Step 25200/50000; acc:  90.82; ppl:  1.41; xent: 0.35; lr: 0.00010; 5160/6563 tok/s;   9972 sec
[2021-04-24 07:56:48,362 INFO] Step 25250/50000; acc:  91.12; ppl:  1.40; xent: 0.33; lr: 0.00010; 5242/6587 tok/s;   9992 sec
[2021-04-24 07:57:08,230 INFO] Step 25300/50000; acc:  90.84; ppl:  1.41; xent: 0.34; lr: 0.00010; 5072/6478 tok/s;  10012 sec
[2021-04-24 07:57:28,095 INFO] Step 25350/50000; acc:  90.69; ppl:  1.42; xent: 0.35; lr: 0.00010; 5099/6272 tok/s;  10032 sec
[2021-04-24 07:57:47,329 INFO] Step 25400/50000; acc:  91.05; ppl:  1.40; xent: 0.34; lr: 0.00010; 5380/6584 tok/s;  10051 sec
[2021-04-24 07:58:06,655 INFO] Step 25450/50000; acc:  91.29; ppl:  1.39; xent: 0.33; lr: 0.00010; 5228/6651 tok/s;  10070 sec
[2021-04-24 07:58:25,875 INFO] Step 25500/50000; acc:  90.86; ppl:  1.41; xent: 0.34; lr: 0.00010; 5302/6659 tok/s;  10089 sec
[2021-04-24 07:58:27,437 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/s

[2021-04-24 08:16:00,312 INFO] Step 28200/50000; acc:  91.34; ppl:  1.38; xent: 0.32; lr: 0.00010; 5024/6586 tok/s;  11144 sec
[2021-04-24 08:16:19,931 INFO] Step 28250/50000; acc:  90.80; ppl:  1.41; xent: 0.34; lr: 0.00010; 5207/6341 tok/s;  11163 sec
[2021-04-24 08:16:39,020 INFO] Step 28300/50000; acc:  91.30; ppl:  1.38; xent: 0.33; lr: 0.00010; 5367/6595 tok/s;  11183 sec
[2021-04-24 08:16:58,266 INFO] Step 28350/50000; acc:  91.42; ppl:  1.38; xent: 0.32; lr: 0.00010; 5238/6653 tok/s;  11202 sec
[2021-04-24 08:17:17,627 INFO] Step 28400/50000; acc:  91.14; ppl:  1.39; xent: 0.33; lr: 0.00010; 5198/6627 tok/s;  11221 sec
[2021-04-24 08:17:23,904 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/edit_ops/basic/train.txt, align=None)...
[2021-04-24 08:17:37,103 INFO] Step 28450/50000; acc:  91.27; ppl:  1.38; xent: 0.32; lr: 0.00010; 5325/6740 tok/s;  11241 sec
[2021-04-24 08:17:56,153 INFO] Step 28500/50000; acc:  91.10; ppl:  1.40; xent: 0

[2021-04-24 08:35:01,295 INFO] Step 31050/50000; acc:  91.33; ppl:  1.38; xent: 0.32; lr: 0.00010; 5025/6334 tok/s;  12285 sec
[2021-04-24 08:35:20,772 INFO] Step 31100/50000; acc:  91.47; ppl:  1.37; xent: 0.31; lr: 0.00010; 5250/6617 tok/s;  12304 sec
[2021-04-24 08:35:40,269 INFO] Step 31150/50000; acc:  91.27; ppl:  1.38; xent: 0.32; lr: 0.00010; 5145/6594 tok/s;  12324 sec
[2021-04-24 08:35:59,448 INFO] Step 31200/50000; acc:  91.14; ppl:  1.39; xent: 0.33; lr: 0.00010; 5312/6494 tok/s;  12343 sec
[2021-04-24 08:36:18,462 INFO] Step 31250/50000; acc:  91.45; ppl:  1.37; xent: 0.32; lr: 0.00010; 5322/6622 tok/s;  12362 sec
[2021-04-24 08:36:38,305 INFO] Step 31300/50000; acc:  91.78; ppl:  1.36; xent: 0.31; lr: 0.00010; 5223/6746 tok/s;  12382 sec
[2021-04-24 08:36:56,683 INFO] Step 31350/50000; acc:  91.01; ppl:  1.39; xent: 0.33; lr: 0.00010; 5482/6741 tok/s;  12400 sec
[2021-04-24 08:37:00,674 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/s

[2021-04-24 08:54:31,905 INFO] Step 34050/50000; acc:  91.43; ppl:  1.37; xent: 0.31; lr: 0.00010; 5246/6504 tok/s;  13455 sec
[2021-04-24 08:54:51,259 INFO] Step 34100/50000; acc:  91.35; ppl:  1.37; xent: 0.32; lr: 0.00010; 5218/6464 tok/s;  13475 sec
[2021-04-24 08:55:10,410 INFO] Step 34150/50000; acc:  91.70; ppl:  1.36; xent: 0.31; lr: 0.00010; 5301/6581 tok/s;  13494 sec
[2021-04-24 08:55:29,178 INFO] Step 34200/50000; acc:  91.63; ppl:  1.36; xent: 0.31; lr: 0.00010; 5464/6975 tok/s;  13513 sec
[2021-04-24 08:55:48,591 INFO] Step 34250/50000; acc:  91.60; ppl:  1.36; xent: 0.31; lr: 0.00010; 5206/6554 tok/s;  13532 sec
[2021-04-24 08:55:56,889 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/edit_ops/basic/train.txt, align=None)...
[2021-04-24 08:56:08,157 INFO] Step 34300/50000; acc:  91.58; ppl:  1.36; xent: 0.31; lr: 0.00010; 5226/6589 tok/s;  13552 sec
[2021-04-24 08:56:27,358 INFO] Step 34350/50000; acc:  91.65; ppl:  1.36; xent: 0

[2021-04-24 09:13:31,752 INFO] Step 36900/50000; acc:  91.87; ppl:  1.35; xent: 0.30; lr: 0.00010; 5115/6438 tok/s;  14595 sec
[2021-04-24 09:13:51,859 INFO] Step 36950/50000; acc:  91.59; ppl:  1.36; xent: 0.31; lr: 0.00010; 5030/6323 tok/s;  14615 sec
[2021-04-24 09:14:11,717 INFO] Step 37000/50000; acc:  91.79; ppl:  1.35; xent: 0.30; lr: 0.00010; 5060/6322 tok/s;  14635 sec
[2021-04-24 09:14:31,501 INFO] Step 37050/50000; acc:  91.69; ppl:  1.35; xent: 0.30; lr: 0.00010; 5211/6402 tok/s;  14655 sec
[2021-04-24 09:14:50,252 INFO] Step 37100/50000; acc:  91.79; ppl:  1.35; xent: 0.30; lr: 0.00010; 5436/6840 tok/s;  14674 sec
[2021-04-24 09:15:09,634 INFO] Step 37150/50000; acc:  91.81; ppl:  1.35; xent: 0.30; lr: 0.00010; 5163/6615 tok/s;  14693 sec
[2021-04-24 09:15:22,673 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/edit_ops/basic/train.txt, align=None)...
[2021-04-24 09:15:28,963 INFO] Step 37200/50000; acc:  91.74; ppl:  1.35; xent: 0

[2021-04-24 09:33:02,224 INFO] Step 39900/50000; acc:  91.81; ppl:  1.35; xent: 0.30; lr: 0.00010; 5176/6444 tok/s;  15766 sec
[2021-04-24 09:33:21,995 INFO] Step 39950/50000; acc:  91.80; ppl:  1.34; xent: 0.30; lr: 0.00010; 5095/6378 tok/s;  15786 sec
[2021-04-24 09:33:40,987 INFO] Step 40000/50000; acc:  92.18; ppl:  1.33; xent: 0.29; lr: 0.00010; 5406/6696 tok/s;  15805 sec
[2021-04-24 09:33:40,988 INFO] Loading ParallelCorpus(../data/small/abstract_methods/valid_buggy.txt, ../data/small/edit_ops/basic/valid.txt, align=None)...
[2021-04-24 09:34:09,213 INFO] Validation perplexity: 1.45077
[2021-04-24 09:34:09,213 INFO] Validation accuracy: 90.4812
[2021-04-24 09:34:09,217 INFO] Saving checkpoint ../models/default_params/basic_ops/model_step_40000.pt
[2021-04-24 09:34:28,609 INFO] Step 40050/50000; acc:  92.05; ppl:  1.33; xent: 0.29; lr: 0.00010; 2092/2693 tok/s;  15852 sec
[2021-04-24 09:34:46,410 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data

[2021-04-24 09:52:01,424 INFO] Step 42750/50000; acc:  92.18; ppl:  1.32; xent: 0.28; lr: 0.00010; 5101/6374 tok/s;  16905 sec
[2021-04-24 09:52:21,302 INFO] Step 42800/50000; acc:  92.18; ppl:  1.33; xent: 0.29; lr: 0.00010; 5103/6590 tok/s;  16925 sec
[2021-04-24 09:52:41,090 INFO] Step 42850/50000; acc:  91.98; ppl:  1.33; xent: 0.29; lr: 0.00010; 5206/6404 tok/s;  16945 sec
[2021-04-24 09:53:00,217 INFO] Step 42900/50000; acc:  92.30; ppl:  1.32; xent: 0.28; lr: 0.00010; 5306/6473 tok/s;  16964 sec
[2021-04-24 09:53:19,519 INFO] Step 42950/50000; acc:  92.35; ppl:  1.32; xent: 0.28; lr: 0.00010; 5225/6747 tok/s;  16983 sec
[2021-04-24 09:53:38,706 INFO] Step 43000/50000; acc:  91.93; ppl:  1.34; xent: 0.29; lr: 0.00010; 5334/6596 tok/s;  17002 sec
[2021-04-24 09:53:41,843 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/edit_ops/basic/train.txt, align=None)...
[2021-04-24 09:53:57,956 INFO] Step 43050/50000; acc:  92.32; ppl:  1.32; xent: 0

[2021-04-24 10:11:02,618 INFO] Step 45600/50000; acc:  92.18; ppl:  1.32; xent: 0.28; lr: 0.00010; 5296/6534 tok/s;  18046 sec
[2021-04-24 10:11:22,211 INFO] Step 45650/50000; acc:  92.13; ppl:  1.33; xent: 0.28; lr: 0.00010; 5151/6426 tok/s;  18066 sec
[2021-04-24 10:11:42,229 INFO] Step 45700/50000; acc:  92.58; ppl:  1.31; xent: 0.27; lr: 0.00010; 5225/6674 tok/s;  18086 sec
[2021-04-24 10:12:01,843 INFO] Step 45750/50000; acc:  92.14; ppl:  1.33; xent: 0.28; lr: 0.00010; 5106/6348 tok/s;  18105 sec
[2021-04-24 10:12:21,062 INFO] Step 45800/50000; acc:  92.27; ppl:  1.32; xent: 0.28; lr: 0.00010; 5259/6497 tok/s;  18125 sec
[2021-04-24 10:12:40,310 INFO] Step 45850/50000; acc:  92.55; ppl:  1.31; xent: 0.27; lr: 0.00010; 5337/6756 tok/s;  18144 sec
[2021-04-24 10:12:59,581 INFO] Step 45900/50000; acc:  92.38; ppl:  1.32; xent: 0.28; lr: 0.00010; 5254/6647 tok/s;  18163 sec
[2021-04-24 10:13:07,326 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/s

[2021-04-24 10:30:35,675 INFO] Step 48600/50000; acc:  92.62; ppl:  1.30; xent: 0.26; lr: 0.00010; 5238/6640 tok/s;  19219 sec
[2021-04-24 10:30:55,322 INFO] Step 48650/50000; acc:  92.42; ppl:  1.31; xent: 0.27; lr: 0.00010; 5166/6535 tok/s;  19239 sec
[2021-04-24 10:31:14,539 INFO] Step 48700/50000; acc:  92.29; ppl:  1.32; xent: 0.28; lr: 0.00010; 5319/6435 tok/s;  19258 sec
[2021-04-24 10:31:33,753 INFO] Step 48750/50000; acc:  92.59; ppl:  1.30; xent: 0.26; lr: 0.00010; 5247/6582 tok/s;  19277 sec
[2021-04-24 10:31:52,920 INFO] Step 48800/50000; acc:  92.65; ppl:  1.30; xent: 0.26; lr: 0.00010; 5275/6851 tok/s;  19296 sec
[2021-04-24 10:32:11,597 INFO] Step 48850/50000; acc:  92.24; ppl:  1.32; xent: 0.27; lr: 0.00010; 5405/6736 tok/s;  19315 sec
[2021-04-24 10:32:17,055 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/edit_ops/basic/train.txt, align=None)...
[2021-04-24 10:32:31,410 INFO] Step 48900/50000; acc:  92.70; ppl:  1.30; xent: 0

**Train on strictly condensed EditOperations:**

In [None]:
#collapse_output
# Train the default-parameter model on buggy abstract methods paired with
# strictly condensed EditOperations. Results are written under MODEL_DEFAULT_STRICT.
modelStrictDefault = HephaestusModel(MODEL_DEFAULT_STRICT)
modelStrictDefault.train(
    DATA_SMALL_METHODS_TRAIN_BUGGY, DATA_SMALL_OPS_STRICT_TRAIN,  # training pair
    DATA_SMALL_METHODS_VALID_BUGGY, DATA_SMALL_OPS_STRICT_VALID,  # validation pair
)

[2021-04-23 03:45:17,313 INFO] Counter vocab from -1 samples.
[2021-04-23 03:45:17,313 INFO] n_sample=-1: Build vocab on full datasets.
[2021-04-23 03:45:17,318 INFO] corpus_1's transforms: TransformPipe()
[2021-04-23 03:45:17,319 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/edit_ops/strict/train.txt, align=None)...
[2021-04-23 03:45:17,920 INFO] Counters src:429
[2021-04-23 03:45:17,920 INFO] Counters tgt:444
[2021-04-23 03:45:18,564 INFO] Parsed 2 corpora from -data.
[2021-04-23 03:45:18,565 INFO] Get special vocabs from Transforms: {'src': set(), 'tgt': set()}.
[2021-04-23 03:45:18,565 INFO] Loading vocab from text file...
[2021-04-23 03:45:18,565 INFO] Loading src vocabulary from ../models/default_params/strict_ops/save_data.vocab.src
[2021-04-23 03:45:18,567 INFO] Loaded src vocab has 429 tokens.
[2021-04-23 03:45:18,567 INFO] Loading tgt vocabulary from ../models/default_params/strict_ops/save_data.vocab.tgt
[2021-04-23 03:45:18,568 I

[2021-04-23 03:52:08,024 INFO] Step 1900/50000; acc:  56.11; ppl:  5.11; xent: 1.63; lr: 0.00010; 9788/4148 tok/s;    408 sec
[2021-04-23 03:52:19,121 INFO] Step 1950/50000; acc:  55.95; ppl:  5.18; xent: 1.64; lr: 0.00010; 9302/3894 tok/s;    419 sec
[2021-04-23 03:52:29,881 INFO] Step 2000/50000; acc:  56.06; ppl:  5.17; xent: 1.64; lr: 0.00010; 9250/3934 tok/s;    430 sec
[2021-04-23 03:52:41,251 INFO] Step 2050/50000; acc:  56.11; ppl:  5.06; xent: 1.62; lr: 0.00010; 9155/3756 tok/s;    442 sec
[2021-04-23 03:52:51,510 INFO] Step 2100/50000; acc:  56.82; ppl:  4.98; xent: 1.61; lr: 0.00010; 9957/4141 tok/s;    452 sec
[2021-04-23 03:53:02,186 INFO] Step 2150/50000; acc:  56.79; ppl:  4.91; xent: 1.59; lr: 0.00010; 9294/4016 tok/s;    462 sec
[2021-04-23 03:53:07,741 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/edit_ops/strict/train.txt, align=None)...
[2021-04-23 03:53:12,894 INFO] Step 2200/50000; acc:  57.12; ppl:  4.90; xent: 1.59; l

[2021-04-23 04:02:54,459 INFO] Step 4900/50000; acc:  62.25; ppl:  4.01; xent: 1.39; lr: 0.00010; 9762/4141 tok/s;   1055 sec
[2021-04-23 04:03:05,566 INFO] Step 4950/50000; acc:  62.60; ppl:  3.90; xent: 1.36; lr: 0.00010; 9305/3848 tok/s;   1066 sec
[2021-04-23 04:03:16,174 INFO] Step 5000/50000; acc:  62.59; ppl:  3.91; xent: 1.36; lr: 0.00010; 9673/4016 tok/s;   1076 sec
[2021-04-23 04:03:16,175 INFO] valid's transforms: TransformPipe()
[2021-04-23 04:03:16,184 INFO] Loading ParallelCorpus(../data/small/abstract_methods/valid_buggy.txt, ../data/small/edit_ops/strict/valid.txt, align=None)...
[2021-04-23 04:03:24,945 INFO] Validation perplexity: 3.72794
[2021-04-23 04:03:24,945 INFO] Validation accuracy: 64.0765
[2021-04-23 04:03:24,947 INFO] Saving checkpoint ../models/default_params/strict_ops/model_step_5000.pt
[2021-04-23 04:03:35,899 INFO] Step 5050/50000; acc:  62.76; ppl:  3.89; xent: 1.36; lr: 0.00010; 5136/2156 tok/s;   1096 sec
[2021-04-23 04:03:43,733 INFO] Loading Parall

[2021-04-23 04:13:17,213 INFO] Step 7750/50000; acc:  64.87; ppl:  3.51; xent: 1.26; lr: 0.00010; 9287/3980 tok/s;   1678 sec
[2021-04-23 04:13:28,015 INFO] Step 7800/50000; acc:  64.57; ppl:  3.60; xent: 1.28; lr: 0.00010; 9491/3986 tok/s;   1688 sec
[2021-04-23 04:13:38,815 INFO] Step 7850/50000; acc:  64.88; ppl:  3.55; xent: 1.27; lr: 0.00010; 9389/3935 tok/s;   1699 sec
[2021-04-23 04:13:50,201 INFO] Step 7900/50000; acc:  64.92; ppl:  3.52; xent: 1.26; lr: 0.00010; 9254/3806 tok/s;   1710 sec
[2021-04-23 04:14:00,111 INFO] Step 7950/50000; acc:  65.53; ppl:  3.42; xent: 1.23; lr: 0.00010; 9714/4170 tok/s;   1720 sec
[2021-04-23 04:14:11,010 INFO] Step 8000/50000; acc:  65.01; ppl:  3.53; xent: 1.26; lr: 0.00010; 9552/3966 tok/s;   1731 sec
[2021-04-23 04:14:11,018 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/edit_ops/strict/train.txt, align=None)...
[2021-04-23 04:14:21,925 INFO] Step 8050/50000; acc:  65.31; ppl:  3.47; xent: 1.24; l

[2021-04-23 04:23:40,757 INFO] Step 10600/50000; acc:  66.32; ppl:  3.29; xent: 1.19; lr: 0.00010; 9498/3971 tok/s;   2301 sec
[2021-04-23 04:23:51,700 INFO] Step 10650/50000; acc:  66.41; ppl:  3.31; xent: 1.20; lr: 0.00010; 9374/3900 tok/s;   2312 sec
[2021-04-23 04:24:02,137 INFO] Step 10700/50000; acc:  66.74; ppl:  3.27; xent: 1.19; lr: 0.00010; 9578/4119 tok/s;   2322 sec
[2021-04-23 04:24:12,885 INFO] Step 10750/50000; acc:  66.36; ppl:  3.37; xent: 1.21; lr: 0.00010; 9508/3985 tok/s;   2333 sec
[2021-04-23 04:24:23,770 INFO] Step 10800/50000; acc:  66.96; ppl:  3.21; xent: 1.17; lr: 0.00010; 9236/3874 tok/s;   2344 sec
[2021-04-23 04:24:34,115 INFO] Step 10850/50000; acc:  66.84; ppl:  3.28; xent: 1.19; lr: 0.00010; 9984/4075 tok/s;   2354 sec
[2021-04-23 04:24:44,900 INFO] Step 10900/50000; acc:  66.87; ppl:  3.25; xent: 1.18; lr: 0.00010; 9460/4002 tok/s;   2365 sec
[2021-04-23 04:24:47,355 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/s

[2021-04-23 04:34:27,759 INFO] Step 13600/50000; acc:  67.94; ppl:  3.11; xent: 1.13; lr: 0.00010; 10014/4061 tok/s;   2948 sec
[2021-04-23 04:34:38,224 INFO] Step 13650/50000; acc:  67.98; ppl:  3.12; xent: 1.14; lr: 0.00010; 9556/4093 tok/s;   2959 sec
[2021-04-23 04:34:49,500 INFO] Step 13700/50000; acc:  67.93; ppl:  3.11; xent: 1.13; lr: 0.00010; 9003/3780 tok/s;   2970 sec
[2021-04-23 04:34:59,991 INFO] Step 13750/50000; acc:  68.09; ppl:  3.08; xent: 1.12; lr: 0.00010; 9809/4021 tok/s;   2980 sec
[2021-04-23 04:35:10,599 INFO] Step 13800/50000; acc:  67.90; ppl:  3.11; xent: 1.13; lr: 0.00010; 9610/3995 tok/s;   2991 sec
[2021-04-23 04:35:21,227 INFO] Step 13850/50000; acc:  67.73; ppl:  3.12; xent: 1.14; lr: 0.00010; 9643/4091 tok/s;   3002 sec
[2021-04-23 04:35:22,363 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/edit_ops/strict/train.txt, align=None)...
[2021-04-23 04:35:31,654 INFO] Step 13900/50000; acc:  68.56; ppl:  3.04; xent:

[2021-04-23 04:44:51,286 INFO] Step 16450/50000; acc:  68.43; ppl:  3.02; xent: 1.11; lr: 0.00010; 8984/3762 tok/s;   3572 sec
[2021-04-23 04:45:02,080 INFO] Step 16500/50000; acc:  68.70; ppl:  2.98; xent: 1.09; lr: 0.00010; 9475/3919 tok/s;   3582 sec
[2021-04-23 04:45:12,499 INFO] Step 16550/50000; acc:  69.01; ppl:  2.97; xent: 1.09; lr: 0.00010; 9582/4110 tok/s;   3593 sec
[2021-04-23 04:45:23,845 INFO] Step 16600/50000; acc:  68.60; ppl:  3.00; xent: 1.10; lr: 0.00010; 9062/3801 tok/s;   3604 sec
[2021-04-23 04:45:34,544 INFO] Step 16650/50000; acc:  69.26; ppl:  2.95; xent: 1.08; lr: 0.00010; 9483/3912 tok/s;   3615 sec
[2021-04-23 04:45:44,982 INFO] Step 16700/50000; acc:  68.72; ppl:  2.99; xent: 1.10; lr: 0.00010; 9987/4143 tok/s;   3625 sec
[2021-04-23 04:45:55,460 INFO] Step 16750/50000; acc:  69.23; ppl:  2.93; xent: 1.08; lr: 0.00010; 9254/4068 tok/s;   3636 sec
[2021-04-23 04:45:59,323 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/s

[2021-04-23 04:55:36,947 INFO] Step 19450/50000; acc:  69.56; ppl:  2.88; xent: 1.06; lr: 0.00010; 9358/3914 tok/s;   4217 sec
[2021-04-23 04:55:47,654 INFO] Step 19500/50000; acc:  69.77; ppl:  2.88; xent: 1.06; lr: 0.00010; 9291/4016 tok/s;   4228 sec
[2021-04-23 04:55:58,565 INFO] Step 19550/50000; acc:  70.09; ppl:  2.84; xent: 1.04; lr: 0.00010; 9446/3859 tok/s;   4239 sec
[2021-04-23 04:56:08,756 INFO] Step 19600/50000; acc:  70.12; ppl:  2.84; xent: 1.04; lr: 0.00010; 9773/4158 tok/s;   4249 sec
[2021-04-23 04:56:19,660 INFO] Step 19650/50000; acc:  69.75; ppl:  2.87; xent: 1.05; lr: 0.00010; 9440/3952 tok/s;   4260 sec
[2021-04-23 04:56:26,110 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/edit_ops/strict/train.txt, align=None)...
[2021-04-23 04:56:30,590 INFO] Step 19700/50000; acc:  69.53; ppl:  2.89; xent: 1.06; lr: 0.00010; 9414/3947 tok/s;   4271 sec
[2021-04-23 04:56:41,186 INFO] Step 19750/50000; acc:  70.05; ppl:  2.85; xent: 

[2021-04-23 05:06:00,720 INFO] Step 22300/50000; acc:  70.04; ppl:  2.82; xent: 1.04; lr: 0.00010; 9645/3975 tok/s;   4841 sec
[2021-04-23 05:06:11,423 INFO] Step 22350/50000; acc:  70.65; ppl:  2.74; xent: 1.01; lr: 0.00010; 9097/3958 tok/s;   4852 sec
[2021-04-23 05:06:22,015 INFO] Step 22400/50000; acc:  70.41; ppl:  2.83; xent: 1.04; lr: 0.00010; 9806/4018 tok/s;   4862 sec
[2021-04-23 05:06:32,534 INFO] Step 22450/50000; acc:  70.73; ppl:  2.74; xent: 1.01; lr: 0.00010; 9580/4063 tok/s;   4873 sec
[2021-04-23 05:06:43,353 INFO] Step 22500/50000; acc:  70.49; ppl:  2.77; xent: 1.02; lr: 0.00010; 9412/3935 tok/s;   4884 sec
[2021-04-23 05:06:53,805 INFO] Step 22550/50000; acc:  70.58; ppl:  2.79; xent: 1.02; lr: 0.00010; 9737/4045 tok/s;   4894 sec
[2021-04-23 05:07:02,746 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/edit_ops/strict/train.txt, align=None)...
[2021-04-23 05:07:04,632 INFO] Step 22600/50000; acc:  70.50; ppl:  2.79; xent: 

[2021-04-23 05:16:24,465 INFO] Step 25150/50000; acc:  70.52; ppl:  2.75; xent: 1.01; lr: 0.00010; 9008/3706 tok/s;   5465 sec
[2021-04-23 05:16:34,969 INFO] Step 25200/50000; acc:  71.12; ppl:  2.67; xent: 0.98; lr: 0.00010; 9499/4019 tok/s;   5475 sec
[2021-04-23 05:16:46,007 INFO] Step 25250/50000; acc:  71.02; ppl:  2.72; xent: 1.00; lr: 0.00010; 9383/3907 tok/s;   5486 sec
[2021-04-23 05:16:56,772 INFO] Step 25300/50000; acc:  70.98; ppl:  2.74; xent: 1.01; lr: 0.00010; 9522/3967 tok/s;   5497 sec
[2021-04-23 05:17:07,362 INFO] Step 25350/50000; acc:  71.14; ppl:  2.70; xent: 0.99; lr: 0.00010; 9421/4029 tok/s;   5508 sec
[2021-04-23 05:17:18,776 INFO] Step 25400/50000; acc:  71.35; ppl:  2.68; xent: 0.99; lr: 0.00010; 9057/3775 tok/s;   5519 sec
[2021-04-23 05:17:29,076 INFO] Step 25450/50000; acc:  71.59; ppl:  2.67; xent: 0.98; lr: 0.00010; 9758/4010 tok/s;   5529 sec
[2021-04-23 05:17:39,909 INFO] Step 25500/50000; acc:  71.23; ppl:  2.72; xent: 1.00; lr: 0.00010; 9650/4029 to

[2021-04-23 05:27:10,657 INFO] Step 28150/50000; acc:  71.56; ppl:  2.65; xent: 0.97; lr: 0.00010; 9391/3861 tok/s;   6111 sec
[2021-04-23 05:27:21,207 INFO] Step 28200/50000; acc:  71.65; ppl:  2.65; xent: 0.97; lr: 0.00010; 9715/4118 tok/s;   6121 sec
[2021-04-23 05:27:32,056 INFO] Step 28250/50000; acc:  71.85; ppl:  2.65; xent: 0.97; lr: 0.00010; 9389/3953 tok/s;   6132 sec
[2021-04-23 05:27:42,990 INFO] Step 28300/50000; acc:  72.33; ppl:  2.57; xent: 0.94; lr: 0.00010; 9181/3866 tok/s;   6143 sec
[2021-04-23 05:27:53,267 INFO] Step 28350/50000; acc:  71.94; ppl:  2.62; xent: 0.96; lr: 0.00010; 9982/4072 tok/s;   6154 sec
[2021-04-23 05:28:03,998 INFO] Step 28400/50000; acc:  72.14; ppl:  2.60; xent: 0.96; lr: 0.00010; 9236/3991 tok/s;   6164 sec
[2021-04-23 05:28:07,520 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/edit_ops/strict/train.txt, align=None)...
[2021-04-23 05:28:14,859 INFO] Step 28450/50000; acc:  71.49; ppl:  2.65; xent: 

[2021-04-23 05:37:33,623 INFO] Step 31000/50000; acc:  72.17; ppl:  2.57; xent: 0.94; lr: 0.00010; 9123/3794 tok/s;   6734 sec
[2021-04-23 05:37:44,600 INFO] Step 31050/50000; acc:  72.39; ppl:  2.56; xent: 0.94; lr: 0.00010; 9213/3891 tok/s;   6745 sec
[2021-04-23 05:37:55,185 INFO] Step 31100/50000; acc:  72.16; ppl:  2.58; xent: 0.95; lr: 0.00010; 9904/4033 tok/s;   6755 sec
[2021-04-23 05:38:05,375 INFO] Step 31150/50000; acc:  73.14; ppl:  2.51; xent: 0.92; lr: 0.00010; 9534/4189 tok/s;   6766 sec
[2021-04-23 05:38:16,696 INFO] Step 31200/50000; acc:  72.18; ppl:  2.58; xent: 0.95; lr: 0.00010; 9186/3751 tok/s;   6777 sec
[2021-04-23 05:38:27,321 INFO] Step 31250/50000; acc:  72.84; ppl:  2.51; xent: 0.92; lr: 0.00010; 9471/4012 tok/s;   6788 sec
[2021-04-23 05:38:37,689 INFO] Step 31300/50000; acc:  72.63; ppl:  2.55; xent: 0.93; lr: 0.00010; 9715/4076 tok/s;   6798 sec
[2021-04-23 05:38:48,630 INFO] Step 31350/50000; acc:  72.36; ppl:  2.56; xent: 0.94; lr: 0.00010; 9415/3949 to

[2021-04-23 05:48:19,190 INFO] Step 34000/50000; acc:  73.47; ppl:  2.46; xent: 0.90; lr: 0.00010; 9381/3978 tok/s;   7379 sec
[2021-04-23 05:48:30,098 INFO] Step 34050/50000; acc:  72.87; ppl:  2.51; xent: 0.92; lr: 0.00010; 9505/3945 tok/s;   7390 sec
[2021-04-23 05:48:41,421 INFO] Step 34100/50000; acc:  73.22; ppl:  2.50; xent: 0.91; lr: 0.00010; 9066/3777 tok/s;   7402 sec
[2021-04-23 05:48:52,068 INFO] Step 34150/50000; acc:  73.45; ppl:  2.46; xent: 0.90; lr: 0.00010; 9402/3951 tok/s;   7412 sec
[2021-04-23 05:49:02,361 INFO] Step 34200/50000; acc:  73.28; ppl:  2.48; xent: 0.91; lr: 0.00010; 9934/4166 tok/s;   7423 sec
[2021-04-23 05:49:13,022 INFO] Step 34250/50000; acc:  72.86; ppl:  2.50; xent: 0.91; lr: 0.00010; 9455/4025 tok/s;   7433 sec
[2021-04-23 05:49:17,714 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/edit_ops/strict/train.txt, align=None)...
[2021-04-23 05:49:23,972 INFO] Step 34300/50000; acc:  72.91; ppl:  2.49; xent: 

[2021-04-23 05:58:43,044 INFO] Step 36850/50000; acc:  73.91; ppl:  2.42; xent: 0.88; lr: 0.00010; 8891/3812 tok/s;   8003 sec
[2021-04-23 05:58:53,416 INFO] Step 36900/50000; acc:  73.81; ppl:  2.42; xent: 0.88; lr: 0.00010; 9691/4061 tok/s;   8014 sec
[2021-04-23 05:59:04,391 INFO] Step 36950/50000; acc:  73.81; ppl:  2.43; xent: 0.89; lr: 0.00010; 9432/3899 tok/s;   8025 sec
[2021-04-23 05:59:15,254 INFO] Step 37000/50000; acc:  73.57; ppl:  2.46; xent: 0.90; lr: 0.00010; 9387/3975 tok/s;   8036 sec
[2021-04-23 05:59:26,443 INFO] Step 37050/50000; acc:  73.75; ppl:  2.41; xent: 0.88; lr: 0.00010; 9196/3800 tok/s;   8047 sec
[2021-04-23 05:59:36,527 INFO] Step 37100/50000; acc:  74.16; ppl:  2.40; xent: 0.88; lr: 0.00010; 9875/4206 tok/s;   8057 sec
[2021-04-23 05:59:46,943 INFO] Step 37150/50000; acc:  73.70; ppl:  2.42; xent: 0.88; lr: 0.00010; 9797/4064 tok/s;   8067 sec
[2021-04-23 05:59:54,477 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/s

[2021-04-23 06:09:28,490 INFO] Step 39850/50000; acc:  74.29; ppl:  2.36; xent: 0.86; lr: 0.00010; 9667/4029 tok/s;   8649 sec
[2021-04-23 06:09:39,418 INFO] Step 39900/50000; acc:  74.09; ppl:  2.39; xent: 0.87; lr: 0.00010; 9586/3937 tok/s;   8660 sec
[2021-04-23 06:09:50,084 INFO] Step 39950/50000; acc:  75.00; ppl:  2.31; xent: 0.84; lr: 0.00010; 9148/3980 tok/s;   8670 sec
[2021-04-23 06:10:01,210 INFO] Step 40000/50000; acc:  73.99; ppl:  2.39; xent: 0.87; lr: 0.00010; 9416/3846 tok/s;   8681 sec
[2021-04-23 06:10:01,216 INFO] Loading ParallelCorpus(../data/small/abstract_methods/valid_buggy.txt, ../data/small/edit_ops/strict/valid.txt, align=None)...
[2021-04-23 06:10:09,972 INFO] Validation perplexity: 2.95224
[2021-04-23 06:10:09,972 INFO] Validation accuracy: 70.235
[2021-04-23 06:10:09,974 INFO] Saving checkpoint ../models/default_params/strict_ops/model_step_40000.pt
[2021-04-23 06:10:20,694 INFO] Step 40050/50000; acc:  74.65; ppl:  2.35; xent: 0.85; lr: 0.00010; 5082/2165

[2021-04-23 06:19:51,326 INFO] Step 42700/50000; acc:  74.97; ppl:  2.29; xent: 0.83; lr: 0.00010; 9341/3971 tok/s;   9272 sec
[2021-04-23 06:20:02,370 INFO] Step 42750/50000; acc:  74.78; ppl:  2.32; xent: 0.84; lr: 0.00010; 9290/3880 tok/s;   9283 sec
[2021-04-23 06:20:13,013 INFO] Step 42800/50000; acc:  75.01; ppl:  2.29; xent: 0.83; lr: 0.00010; 9392/4031 tok/s;   9293 sec
[2021-04-23 06:20:23,855 INFO] Step 42850/50000; acc:  74.44; ppl:  2.34; xent: 0.85; lr: 0.00010; 9539/3951 tok/s;   9304 sec
[2021-04-23 06:20:35,176 INFO] Step 42900/50000; acc:  75.04; ppl:  2.30; xent: 0.83; lr: 0.00010; 9118/3759 tok/s;   9315 sec
[2021-04-23 06:20:45,274 INFO] Step 42950/50000; acc:  75.35; ppl:  2.28; xent: 0.83; lr: 0.00010; 9833/4127 tok/s;   9326 sec
[2021-04-23 06:20:55,946 INFO] Step 43000/50000; acc:  74.82; ppl:  2.31; xent: 0.84; lr: 0.00010; 9582/4055 tok/s;   9336 sec
[2021-04-23 06:20:57,732 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/s

[2021-04-23 06:30:14,389 INFO] Step 45550/50000; acc:  76.09; ppl:  2.20; xent: 0.79; lr: 0.00010; 9694/4038 tok/s;   9895 sec
[2021-04-23 06:30:25,965 INFO] Step 45600/50000; acc:  75.36; ppl:  2.27; xent: 0.82; lr: 0.00010; 8992/3737 tok/s;   9906 sec
[2021-04-23 06:30:36,682 INFO] Step 45650/50000; acc:  75.60; ppl:  2.25; xent: 0.81; lr: 0.00010; 9379/3948 tok/s;   9917 sec
[2021-04-23 06:30:47,115 INFO] Step 45700/50000; acc:  75.47; ppl:  2.25; xent: 0.81; lr: 0.00010; 9731/4102 tok/s;   9927 sec
[2021-04-23 06:30:57,911 INFO] Step 45750/50000; acc:  75.58; ppl:  2.26; xent: 0.81; lr: 0.00010; 9488/3965 tok/s;   9938 sec
[2021-04-23 06:31:09,278 INFO] Step 45800/50000; acc:  75.75; ppl:  2.24; xent: 0.81; lr: 0.00010; 9042/3753 tok/s;   9950 sec
[2021-04-23 06:31:19,657 INFO] Step 45850/50000; acc:  75.63; ppl:  2.25; xent: 0.81; lr: 0.00010; 9854/4078 tok/s;   9960 sec
[2021-04-23 06:31:30,249 INFO] Step 45900/50000; acc:  76.03; ppl:  2.23; xent: 0.80; lr: 0.00010; 9376/4028 to

[2021-04-23 06:41:01,690 INFO] Step 48550/50000; acc:  76.49; ppl:  2.18; xent: 0.78; lr: 0.00010; 9084/3933 tok/s;  10542 sec
[2021-04-23 06:41:12,120 INFO] Step 48600/50000; acc:  76.22; ppl:  2.19; xent: 0.79; lr: 0.00010; 9828/4054 tok/s;  10552 sec
[2021-04-23 06:41:22,883 INFO] Step 48650/50000; acc:  76.13; ppl:  2.21; xent: 0.79; lr: 0.00010; 9396/3973 tok/s;  10563 sec
[2021-04-23 06:41:34,132 INFO] Step 48700/50000; acc:  75.79; ppl:  2.23; xent: 0.80; lr: 0.00010; 9311/3838 tok/s;  10574 sec
[2021-04-23 06:41:44,491 INFO] Step 48750/50000; acc:  76.76; ppl:  2.13; xent: 0.76; lr: 0.00010; 9424/4032 tok/s;  10585 sec
[2021-04-23 06:41:54,900 INFO] Step 48800/50000; acc:  76.00; ppl:  2.22; xent: 0.80; lr: 0.00010; 9918/4114 tok/s;  10595 sec
[2021-04-23 06:42:05,786 INFO] Step 48850/50000; acc:  76.14; ppl:  2.20; xent: 0.79; lr: 0.00010; 9226/3969 tok/s;  10606 sec
[2021-04-23 06:42:08,748 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/s

**Train on loosely condensed EditOperations:**

In [None]:
#collapse_output
# Train the default-parameter model on buggy abstract methods paired with
# loosely condensed EditOperations. The first two arguments are the training
# files and the last two are the validation files; results are written under
# MODEL_DEFAULT_LOOSE.
modelLooseDefault = HephaestusModel(MODEL_DEFAULT_LOOSE)
modelLooseDefault.train(
    DATA_SMALL_METHODS_TRAIN_BUGGY,
    DATA_SMALL_OPS_LOOSE_TRAIN,
    DATA_SMALL_METHODS_VALID_BUGGY,
    DATA_SMALL_OPS_LOOSE_VALID
)

[2021-04-23 06:46:23,510 INFO] Counter vocab from -1 samples.
[2021-04-23 06:46:23,511 INFO] n_sample=-1: Build vocab on full datasets.
[2021-04-23 06:46:23,515 INFO] corpus_1's transforms: TransformPipe()
[2021-04-23 06:46:23,516 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/edit_ops/loose/train.txt, align=None)...
[2021-04-23 06:46:24,117 INFO] Counters src:429
[2021-04-23 06:46:24,117 INFO] Counters tgt:444
[2021-04-23 06:46:24,782 INFO] Parsed 2 corpora from -data.
[2021-04-23 06:46:24,782 INFO] Get special vocabs from Transforms: {'src': set(), 'tgt': set()}.
[2021-04-23 06:46:24,782 INFO] Loading vocab from text file...
[2021-04-23 06:46:24,782 INFO] Loading src vocabulary from ../models/default_params/loose_ops/save_data.vocab.src
[2021-04-23 06:46:24,784 INFO] Loaded src vocab has 429 tokens.
[2021-04-23 06:46:24,784 INFO] Loading tgt vocabulary from ../models/default_params/loose_ops/save_data.vocab.tgt
[2021-04-23 06:46:24,786 INFO

[2021-04-23 06:52:20,648 INFO] Step 1850/50000; acc:  55.07; ppl:  5.43; xent: 1.69; lr: 0.00010; 9922/3967 tok/s;    355 sec
[2021-04-23 06:52:29,839 INFO] Step 1900/50000; acc:  55.28; ppl:  5.33; xent: 1.67; lr: 0.00010; 11123/4289 tok/s;    364 sec
[2021-04-23 06:52:39,507 INFO] Step 1950/50000; acc:  55.14; ppl:  5.39; xent: 1.68; lr: 0.00010; 10527/4248 tok/s;    374 sec
[2021-04-23 06:52:49,174 INFO] Step 2000/50000; acc:  55.41; ppl:  5.36; xent: 1.68; lr: 0.00010; 10523/4105 tok/s;    383 sec
[2021-04-23 06:52:58,847 INFO] Step 2050/50000; acc:  55.69; ppl:  5.25; xent: 1.66; lr: 0.00010; 10554/4141 tok/s;    393 sec
[2021-04-23 06:53:07,746 INFO] Step 2100/50000; acc:  55.64; ppl:  5.20; xent: 1.65; lr: 0.00010; 11287/4451 tok/s;    402 sec
[2021-04-23 06:53:17,469 INFO] Step 2150/50000; acc:  56.18; ppl:  5.13; xent: 1.63; lr: 0.00010; 10682/4213 tok/s;    412 sec
[2021-04-23 06:53:22,391 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/sm

[2021-04-23 07:01:53,980 INFO] Step 4850/50000; acc:  61.41; ppl:  4.08; xent: 1.41; lr: 0.00010; 10602/4207 tok/s;    928 sec
[2021-04-23 07:02:03,591 INFO] Step 4900/50000; acc:  61.07; ppl:  4.18; xent: 1.43; lr: 0.00010; 10753/4194 tok/s;    938 sec
[2021-04-23 07:02:13,326 INFO] Step 4950/50000; acc:  61.57; ppl:  4.10; xent: 1.41; lr: 0.00010; 10445/4092 tok/s;    947 sec
[2021-04-23 07:02:22,248 INFO] Step 5000/50000; acc:  61.97; ppl:  4.05; xent: 1.40; lr: 0.00010; 11393/4507 tok/s;    956 sec
[2021-04-23 07:02:22,248 INFO] valid's transforms: TransformPipe()
[2021-04-23 07:02:22,251 INFO] Loading ParallelCorpus(../data/small/abstract_methods/valid_buggy.txt, ../data/small/edit_ops/loose/valid.txt, align=None)...
[2021-04-23 07:02:30,167 INFO] Validation perplexity: 3.87977
[2021-04-23 07:02:30,168 INFO] Validation accuracy: 63.3767
[2021-04-23 07:02:30,170 INFO] Saving checkpoint ../models/default_params/loose_ops/model_step_5000.pt
[2021-04-23 07:02:39,852 INFO] Step 5050/50

[2021-04-23 07:11:07,172 INFO] Step 7700/50000; acc:  64.36; ppl:  3.65; xent: 1.30; lr: 0.00010; 10691/4238 tok/s;   1481 sec
[2021-04-23 07:11:17,045 INFO] Step 7750/50000; acc:  63.65; ppl:  3.69; xent: 1.31; lr: 0.00010; 10589/4092 tok/s;   1491 sec
[2021-04-23 07:11:26,356 INFO] Step 7800/50000; acc:  63.75; ppl:  3.72; xent: 1.31; lr: 0.00010; 10606/4333 tok/s;   1500 sec
[2021-04-23 07:11:36,165 INFO] Step 7850/50000; acc:  63.93; ppl:  3.71; xent: 1.31; lr: 0.00010; 10616/4073 tok/s;   1510 sec
[2021-04-23 07:11:45,529 INFO] Step 7900/50000; acc:  64.35; ppl:  3.64; xent: 1.29; lr: 0.00010; 10772/4299 tok/s;   1520 sec
[2021-04-23 07:11:54,399 INFO] Step 7950/50000; acc:  64.58; ppl:  3.57; xent: 1.27; lr: 0.00010; 11372/4449 tok/s;   1528 sec
[2021-04-23 07:12:04,079 INFO] Step 8000/50000; acc:  64.26; ppl:  3.65; xent: 1.30; lr: 0.00010; 10542/4196 tok/s;   1538 sec
[2021-04-23 07:12:04,087 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/s

[2021-04-23 07:20:20,742 INFO] Step 10550/50000; acc:  65.54; ppl:  3.44; xent: 1.24; lr: 0.00010; 10854/4114 tok/s;   2035 sec
[2021-04-23 07:20:30,456 INFO] Step 10600/50000; acc:  65.34; ppl:  3.44; xent: 1.24; lr: 0.00010; 10414/4153 tok/s;   2045 sec
[2021-04-23 07:20:40,216 INFO] Step 10650/50000; acc:  65.66; ppl:  3.41; xent: 1.23; lr: 0.00010; 10379/4147 tok/s;   2054 sec
[2021-04-23 07:20:49,670 INFO] Step 10700/50000; acc:  65.14; ppl:  3.48; xent: 1.25; lr: 0.00010; 10897/4274 tok/s;   2064 sec
[2021-04-23 07:20:59,104 INFO] Step 10750/50000; acc:  65.79; ppl:  3.46; xent: 1.24; lr: 0.00010; 10682/4240 tok/s;   2073 sec
[2021-04-23 07:21:08,768 INFO] Step 10800/50000; acc:  65.94; ppl:  3.38; xent: 1.22; lr: 0.00010; 10631/4122 tok/s;   2083 sec
[2021-04-23 07:21:17,518 INFO] Step 10850/50000; acc:  65.91; ppl:  3.39; xent: 1.22; lr: 0.00010; 11575/4522 tok/s;   2092 sec
[2021-04-23 07:21:26,842 INFO] Step 10900/50000; acc:  65.98; ppl:  3.38; xent: 1.22; lr: 0.00010; 10749

[2021-04-23 07:29:56,305 INFO] Step 13550/50000; acc:  66.67; ppl:  3.28; xent: 1.19; lr: 0.00010; 10291/4057 tok/s;   2610 sec
[2021-04-23 07:30:05,512 INFO] Step 13600/50000; acc:  67.01; ppl:  3.24; xent: 1.18; lr: 0.00010; 11112/4419 tok/s;   2620 sec
[2021-04-23 07:30:14,781 INFO] Step 13650/50000; acc:  67.02; ppl:  3.25; xent: 1.18; lr: 0.00010; 10800/4317 tok/s;   2629 sec
[2021-04-23 07:30:24,744 INFO] Step 13700/50000; acc:  66.72; ppl:  3.28; xent: 1.19; lr: 0.00010; 10410/4051 tok/s;   2639 sec
[2021-04-23 07:30:33,613 INFO] Step 13750/50000; acc:  67.02; ppl:  3.23; xent: 1.17; lr: 0.00010; 11431/4439 tok/s;   2648 sec
[2021-04-23 07:30:42,679 INFO] Step 13800/50000; acc:  67.23; ppl:  3.21; xent: 1.17; lr: 0.00010; 11118/4428 tok/s;   2657 sec
[2021-04-23 07:30:52,290 INFO] Step 13850/50000; acc:  67.42; ppl:  3.20; xent: 1.16; lr: 0.00010; 10520/4246 tok/s;   2666 sec
[2021-04-23 07:30:53,478 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ..

[2021-04-23 07:39:09,709 INFO] Step 16400/50000; acc:  67.69; ppl:  3.13; xent: 1.14; lr: 0.00010; 10248/3947 tok/s;   3164 sec
[2021-04-23 07:39:19,727 INFO] Step 16450/50000; acc:  67.86; ppl:  3.11; xent: 1.14; lr: 0.00010; 10168/4031 tok/s;   3174 sec
[2021-04-23 07:39:29,109 INFO] Step 16500/50000; acc:  68.07; ppl:  3.10; xent: 1.13; lr: 0.00010; 10699/4228 tok/s;   3183 sec
[2021-04-23 07:39:38,955 INFO] Step 16550/50000; acc:  67.39; ppl:  3.15; xent: 1.15; lr: 0.00010; 10624/4137 tok/s;   3193 sec
[2021-04-23 07:39:48,022 INFO] Step 16600/50000; acc:  68.46; ppl:  3.08; xent: 1.12; lr: 0.00010; 10912/4377 tok/s;   3202 sec
[2021-04-23 07:39:57,570 INFO] Step 16650/50000; acc:  67.32; ppl:  3.17; xent: 1.15; lr: 0.00010; 10919/4176 tok/s;   3212 sec
[2021-04-23 07:40:06,583 INFO] Step 16700/50000; acc:  68.14; ppl:  3.07; xent: 1.12; lr: 0.00010; 11078/4478 tok/s;   3221 sec
[2021-04-23 07:40:16,078 INFO] Step 16750/50000; acc:  68.35; ppl:  3.06; xent: 1.12; lr: 0.00010; 10663

[2021-04-23 07:48:43,671 INFO] Step 19400/50000; acc:  69.14; ppl:  2.97; xent: 1.09; lr: 0.00010; 10995/4288 tok/s;   3738 sec
[2021-04-23 07:48:53,136 INFO] Step 19450/50000; acc:  68.64; ppl:  3.01; xent: 1.10; lr: 0.00010; 10747/4294 tok/s;   3747 sec
[2021-04-23 07:49:02,739 INFO] Step 19500/50000; acc:  68.37; ppl:  3.03; xent: 1.11; lr: 0.00010; 10671/4138 tok/s;   3757 sec
[2021-04-23 07:49:12,473 INFO] Step 19550/50000; acc:  69.14; ppl:  2.97; xent: 1.09; lr: 0.00010; 10445/4156 tok/s;   3767 sec
[2021-04-23 07:49:21,344 INFO] Step 19600/50000; acc:  68.80; ppl:  3.01; xent: 1.10; lr: 0.00010; 11494/4478 tok/s;   3775 sec
[2021-04-23 07:49:30,883 INFO] Step 19650/50000; acc:  69.09; ppl:  2.97; xent: 1.09; lr: 0.00010; 10563/4226 tok/s;   3785 sec
[2021-04-23 07:49:36,765 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../data/small/edit_ops/loose/train.txt, align=None)...
[2021-04-23 07:49:40,533 INFO] Step 19700/50000; acc:  69.02; ppl:  2.99; x

[2021-04-23 07:57:58,068 INFO] Step 22250/50000; acc:  68.83; ppl:  2.96; xent: 1.09; lr: 0.00010; 9971/3874 tok/s;   4292 sec
[2021-04-23 07:58:07,528 INFO] Step 22300/50000; acc:  69.78; ppl:  2.86; xent: 1.05; lr: 0.00010; 10612/4217 tok/s;   4302 sec
[2021-04-23 07:58:16,970 INFO] Step 22350/50000; acc:  69.40; ppl:  2.90; xent: 1.06; lr: 0.00010; 10773/4251 tok/s;   4311 sec
[2021-04-23 07:58:26,490 INFO] Step 22400/50000; acc:  69.29; ppl:  2.94; xent: 1.08; lr: 0.00010; 10706/4227 tok/s;   4321 sec
[2021-04-23 07:58:36,067 INFO] Step 22450/50000; acc:  69.81; ppl:  2.87; xent: 1.06; lr: 0.00010; 10525/4131 tok/s;   4330 sec
[2021-04-23 07:58:45,281 INFO] Step 22500/50000; acc:  69.37; ppl:  2.91; xent: 1.07; lr: 0.00010; 11293/4398 tok/s;   4339 sec
[2021-04-23 07:58:54,368 INFO] Step 22550/50000; acc:  69.72; ppl:  2.87; xent: 1.06; lr: 0.00010; 11040/4401 tok/s;   4348 sec
[2021-04-23 07:59:02,468 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ../

[2021-04-23 08:07:11,585 INFO] Step 25100/50000; acc:  70.02; ppl:  2.84; xent: 1.04; lr: 0.00010; 10565/4156 tok/s;   4846 sec
[2021-04-23 08:07:21,313 INFO] Step 25150/50000; acc:  69.82; ppl:  2.85; xent: 1.05; lr: 0.00010; 10605/4058 tok/s;   4855 sec
[2021-04-23 08:07:30,981 INFO] Step 25200/50000; acc:  70.13; ppl:  2.81; xent: 1.03; lr: 0.00010; 10539/4194 tok/s;   4865 sec
[2021-04-23 08:07:40,643 INFO] Step 25250/50000; acc:  70.34; ppl:  2.80; xent: 1.03; lr: 0.00010; 10513/4146 tok/s;   4875 sec
[2021-04-23 08:07:49,962 INFO] Step 25300/50000; acc:  70.04; ppl:  2.85; xent: 1.05; lr: 0.00010; 10807/4293 tok/s;   4884 sec
[2021-04-23 08:07:59,717 INFO] Step 25350/50000; acc:  69.97; ppl:  2.85; xent: 1.05; lr: 0.00010; 10724/4164 tok/s;   4894 sec
[2021-04-23 08:08:09,217 INFO] Step 25400/50000; acc:  70.46; ppl:  2.77; xent: 1.02; lr: 0.00010; 10465/4217 tok/s;   4903 sec
[2021-04-23 08:08:18,179 INFO] Step 25450/50000; acc:  70.07; ppl:  2.82; xent: 1.04; lr: 0.00010; 11536

[2021-04-23 08:16:45,820 INFO] Step 28100/50000; acc:  70.50; ppl:  2.78; xent: 1.02; lr: 0.00010; 10298/4053 tok/s;   5420 sec
[2021-04-23 08:16:55,524 INFO] Step 28150/50000; acc:  70.87; ppl:  2.75; xent: 1.01; lr: 0.00010; 10452/4127 tok/s;   5430 sec
[2021-04-23 08:17:04,904 INFO] Step 28200/50000; acc:  70.70; ppl:  2.73; xent: 1.00; lr: 0.00010; 10825/4315 tok/s;   5439 sec
[2021-04-23 08:17:14,342 INFO] Step 28250/50000; acc:  70.67; ppl:  2.75; xent: 1.01; lr: 0.00010; 10665/4212 tok/s;   5448 sec
[2021-04-23 08:17:24,155 INFO] Step 28300/50000; acc:  70.93; ppl:  2.73; xent: 1.00; lr: 0.00010; 10530/4082 tok/s;   5458 sec
[2021-04-23 08:17:32,916 INFO] Step 28350/50000; acc:  71.12; ppl:  2.72; xent: 1.00; lr: 0.00010; 11548/4538 tok/s;   5467 sec
[2021-04-23 08:17:42,446 INFO] Step 28400/50000; acc:  70.94; ppl:  2.73; xent: 1.01; lr: 0.00010; 10630/4203 tok/s;   5477 sec
[2021-04-23 08:17:45,417 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ..

[2021-04-23 08:25:59,287 INFO] Step 30950/50000; acc:  71.23; ppl:  2.70; xent: 0.99; lr: 0.00010; 11185/4255 tok/s;   5973 sec
[2021-04-23 08:26:09,264 INFO] Step 31000/50000; acc:  71.69; ppl:  2.65; xent: 0.97; lr: 0.00010; 9992/4005 tok/s;   5983 sec
[2021-04-23 08:26:19,246 INFO] Step 31050/50000; acc:  71.17; ppl:  2.69; xent: 0.99; lr: 0.00010; 10402/4021 tok/s;   5993 sec
[2021-04-23 08:26:28,437 INFO] Step 31100/50000; acc:  71.77; ppl:  2.64; xent: 0.97; lr: 0.00010; 10919/4420 tok/s;   6002 sec
[2021-04-23 08:26:37,892 INFO] Step 31150/50000; acc:  71.63; ppl:  2.67; xent: 0.98; lr: 0.00010; 10751/4247 tok/s;   6012 sec
[2021-04-23 08:26:47,602 INFO] Step 31200/50000; acc:  71.49; ppl:  2.66; xent: 0.98; lr: 0.00010; 10509/4131 tok/s;   6022 sec
[2021-04-23 08:26:56,689 INFO] Step 31250/50000; acc:  71.63; ppl:  2.64; xent: 0.97; lr: 0.00010; 11094/4358 tok/s;   6031 sec
[2021-04-23 08:27:05,922 INFO] Step 31300/50000; acc:  71.50; ppl:  2.66; xent: 0.98; lr: 0.00010; 11131/

[2021-04-23 08:35:33,575 INFO] Step 33950/50000; acc:  72.07; ppl:  2.59; xent: 0.95; lr: 0.00010; 10007/4022 tok/s;   6548 sec
[2021-04-23 08:35:42,793 INFO] Step 34000/50000; acc:  72.32; ppl:  2.59; xent: 0.95; lr: 0.00010; 11012/4272 tok/s;   6557 sec
[2021-04-23 08:35:52,542 INFO] Step 34050/50000; acc:  72.09; ppl:  2.58; xent: 0.95; lr: 0.00010; 10432/4188 tok/s;   6567 sec
[2021-04-23 08:36:01,949 INFO] Step 34100/50000; acc:  72.62; ppl:  2.56; xent: 0.94; lr: 0.00010; 10712/4182 tok/s;   6576 sec
[2021-04-23 08:36:11,817 INFO] Step 34150/50000; acc:  71.60; ppl:  2.64; xent: 0.97; lr: 0.00010; 10628/4130 tok/s;   6586 sec
[2021-04-23 08:36:20,613 INFO] Step 34200/50000; acc:  72.58; ppl:  2.55; xent: 0.94; lr: 0.00010; 11208/4507 tok/s;   6595 sec
[2021-04-23 08:36:30,198 INFO] Step 34250/50000; acc:  72.43; ppl:  2.58; xent: 0.95; lr: 0.00010; 10781/4244 tok/s;   6604 sec
[2021-04-23 08:36:34,368 INFO] Loading ParallelCorpus(../data/small/abstract_methods/train_buggy.txt, ..

[2021-04-23 08:44:46,800 INFO] Step 36800/50000; acc:  72.43; ppl:  2.53; xent: 0.93; lr: 0.00010; 10694/4149 tok/s;   7101 sec
[2021-04-23 08:44:57,007 INFO] Step 36850/50000; acc:  72.63; ppl:  2.53; xent: 0.93; lr: 0.00010; 9913/3999 tok/s;   7111 sec
[2021-04-23 08:45:06,364 INFO] Step 36900/50000; acc:  72.90; ppl:  2.51; xent: 0.92; lr: 0.00010; 10972/4257 tok/s;   7120 sec
[2021-04-23 08:45:15,901 INFO] Step 36950/50000; acc:  72.84; ppl:  2.54; xent: 0.93; lr: 0.00010; 10685/4226 tok/s;   7130 sec
[2021-04-23 08:45:25,471 INFO] Step 37000/50000; acc:  73.16; ppl:  2.50; xent: 0.92; lr: 0.00010; 10552/4172 tok/s;   7140 sec
[2021-04-23 08:45:35,191 INFO] Step 37050/50000; acc:  72.93; ppl:  2.51; xent: 0.92; lr: 0.00010; 10445/4119 tok/s;   7149 sec
[2021-04-23 08:45:44,038 INFO] Step 37100/50000; acc:  72.81; ppl:  2.53; xent: 0.93; lr: 0.00010; 11634/4469 tok/s;   7158 sec
[2021-04-23 08:45:53,193 INFO] Step 37150/50000; acc:  72.91; ppl:  2.51; xent: 0.92; lr: 0.00010; 10973/

[2021-04-23 08:54:20,798 INFO] Step 39800/50000; acc:  73.86; ppl:  2.43; xent: 0.89; lr: 0.00010; 10315/4182 tok/s;   7675 sec
[2021-04-23 08:54:30,281 INFO] Step 39850/50000; acc:  73.39; ppl:  2.48; xent: 0.91; lr: 0.00010; 10941/4219 tok/s;   7684 sec
[2021-04-23 08:54:39,729 INFO] Step 39900/50000; acc:  73.38; ppl:  2.47; xent: 0.90; lr: 0.00010; 10622/4260 tok/s;   7694 sec
[2021-04-23 08:54:49,508 INFO] Step 39950/50000; acc:  73.67; ppl:  2.43; xent: 0.89; lr: 0.00010; 10432/4079 tok/s;   7704 sec
[2021-04-23 08:54:58,830 INFO] Step 40000/50000; acc:  73.45; ppl:  2.45; xent: 0.90; lr: 0.00010; 11031/4327 tok/s;   7713 sec
[2021-04-23 08:54:58,834 INFO] Loading ParallelCorpus(../data/small/abstract_methods/valid_buggy.txt, ../data/small/edit_ops/loose/valid.txt, align=None)...
[2021-04-23 08:55:06,735 INFO] Validation perplexity: 3.04471
[2021-04-23 08:55:06,735 INFO] Validation accuracy: 69.3141
[2021-04-23 08:55:06,737 INFO] Saving checkpoint ../models/default_params/loose_o

[2021-04-23 09:03:34,023 INFO] Step 42650/50000; acc:  73.74; ppl:  2.41; xent: 0.88; lr: 0.00010; 10637/4072 tok/s;   8228 sec
[2021-04-23 09:03:43,739 INFO] Step 42700/50000; acc:  73.82; ppl:  2.41; xent: 0.88; lr: 0.00010; 10563/4174 tok/s;   8238 sec
[2021-04-23 09:03:53,363 INFO] Step 42750/50000; acc:  74.03; ppl:  2.40; xent: 0.88; lr: 0.00010; 10519/4183 tok/s;   8247 sec
[2021-04-23 09:04:03,010 INFO] Step 42800/50000; acc:  73.92; ppl:  2.41; xent: 0.88; lr: 0.00010; 10591/4206 tok/s;   8257 sec
[2021-04-23 09:04:12,461 INFO] Step 42850/50000; acc:  74.02; ppl:  2.40; xent: 0.88; lr: 0.00010; 10730/4227 tok/s;   8267 sec
[2021-04-23 09:04:22,102 INFO] Step 42900/50000; acc:  74.02; ppl:  2.38; xent: 0.87; lr: 0.00010; 10512/4157 tok/s;   8276 sec
[2021-04-23 09:04:31,014 INFO] Step 42950/50000; acc:  73.99; ppl:  2.41; xent: 0.88; lr: 0.00010; 11686/4428 tok/s;   8285 sec
[2021-04-23 09:04:40,220 INFO] Step 43000/50000; acc:  74.28; ppl:  2.37; xent: 0.86; lr: 0.00010; 10683

[2021-04-23 09:12:48,039 INFO] Step 45500/50000; acc:  74.60; ppl:  2.34; xent: 0.85; lr: 0.00010; 10857/4342 tok/s;   8782 sec
[2021-04-23 09:12:57,503 INFO] Step 45550/50000; acc:  74.39; ppl:  2.35; xent: 0.85; lr: 0.00010; 10935/4212 tok/s;   8792 sec
[2021-04-23 09:13:07,419 INFO] Step 45600/50000; acc:  74.53; ppl:  2.35; xent: 0.85; lr: 0.00010; 10306/4080 tok/s;   8801 sec
[2021-04-23 09:13:17,091 INFO] Step 45650/50000; acc:  74.81; ppl:  2.34; xent: 0.85; lr: 0.00010; 10395/4125 tok/s;   8811 sec
[2021-04-23 09:13:26,541 INFO] Step 45700/50000; acc:  74.57; ppl:  2.35; xent: 0.85; lr: 0.00010; 10974/4296 tok/s;   8821 sec
[2021-04-23 09:13:36,050 INFO] Step 45750/50000; acc:  74.66; ppl:  2.34; xent: 0.85; lr: 0.00010; 10611/4225 tok/s;   8830 sec
[2021-04-23 09:13:45,700 INFO] Step 45800/50000; acc:  74.77; ppl:  2.33; xent: 0.85; lr: 0.00010; 10532/4105 tok/s;   8840 sec
[2021-04-23 09:13:54,605 INFO] Step 45850/50000; acc:  74.76; ppl:  2.34; xent: 0.85; lr: 0.00010; 11357

[2021-04-23 09:22:22,721 INFO] Step 48500/50000; acc:  75.06; ppl:  2.28; xent: 0.83; lr: 0.00010; 10360/4062 tok/s;   9357 sec
[2021-04-23 09:22:32,794 INFO] Step 48550/50000; acc:  74.82; ppl:  2.32; xent: 0.84; lr: 0.00010; 10396/4023 tok/s;   9367 sec
[2021-04-23 09:22:42,164 INFO] Step 48600/50000; acc:  75.80; ppl:  2.25; xent: 0.81; lr: 0.00010; 10535/4307 tok/s;   9376 sec
[2021-04-23 09:22:51,770 INFO] Step 48650/50000; acc:  75.09; ppl:  2.30; xent: 0.83; lr: 0.00010; 10812/4143 tok/s;   9386 sec
[2021-04-23 09:23:01,244 INFO] Step 48700/50000; acc:  75.34; ppl:  2.27; xent: 0.82; lr: 0.00010; 10579/4268 tok/s;   9395 sec
[2021-04-23 09:23:10,472 INFO] Step 48750/50000; acc:  75.08; ppl:  2.27; xent: 0.82; lr: 0.00010; 11070/4288 tok/s;   9405 sec
[2021-04-23 09:23:19,697 INFO] Step 48800/50000; acc:  75.25; ppl:  2.27; xent: 0.82; lr: 0.00010; 10979/4360 tok/s;   9414 sec
[2021-04-23 09:23:29,215 INFO] Step 48850/50000; acc:  75.25; ppl:  2.27; xent: 0.82; lr: 0.00010; 10550