In [None]:
import torch
import torch
import torch.nn as nn
import torch.nn.functional as F
from torch.utils.data import Dataset,DataLoader
import re 
import json


class trafficSet(Dataset):
    """Map-style dataset of action sequences paired with a scalar reward.

    The JSON file at ``path`` must hold a list of records. Each record needs an
    ``'actions'`` entry (a sequence of action-name strings) and a
    ``'robustness'`` entry whose first element is used as the reward.

    Args:
        path: Path of the JSON file to load.
        train: When ``g_flag`` is ``False``, ``True`` selects the first 80% of
            the records and anything else selects the remaining records.
        g_flag: When it is anything other than ``False`` the split is skipped
            and every record is exposed.

    Attributes set here:
        actions / rewards: every record in the file, unsplit.
        data / target: the records of the selected split; these are what
            ``__len__`` and ``__getitem__`` serve.
        actions_list: sorted distinct action names followed by the two special
            tokens ``','`` (pad) and ``'.'`` (bos/eos).
        actions_to_index: action name -> position in ``actions_list`` (the
            special tokens are not included in this mapping).
        actions_category / actions_dict / actions_index / actions_indexes:
            grouping of the action names by "category", i.e. the name with all
            digits after its first four characters removed.
        pad_index / bos_index: vocabulary positions of ``','`` and ``'.'``.
        max_len: length of the first record's action list plus one.

    Note:
        ``__getitem__`` uses ``np`` (numpy), which must be importable in the
        module namespace by the time items are fetched.
    """

    def __init__(self, path, train, g_flag=False):
        with open(path, 'r') as f:
            testset = json.load(f)

        actions_set = set()
        self.actions = []
        self.rewards = []
        self.data = []
        self.target = []
        for tset in testset:
            self.actions.append(tset['actions'])
            self.rewards.append(tset['robustness'][0])
            actions_set.update(tset['actions'])

        if g_flag is False:
            # Deterministic 80/20 split by position in the file.
            split = int(len(self.actions) * 0.8)
            if train is True:
                self.data = self.actions[:split]
                self.target = self.rewards[:split]
            else:
                self.data = self.actions[split:]
                self.target = self.rewards[split:]
        else:
            self.data = self.actions
            self.target = self.rewards

        self.max_len = len(self.actions[0]) + 1

        # Vocabulary: sorted distinct action names, indexed by position.
        self.actions_list = sorted(actions_set)
        self.actions_to_index = {
            action: i for i, action in enumerate(self.actions_list)
        }

        # Group actions by category and remember the vocabulary index at which
        # each category is first seen.
        self.actions_category = []
        self.actions_dict = {}
        self.actions_index = []
        for i, action in enumerate(self.actions_list):
            current_action = action[:4] + re.sub(r'[0-9]+', '', action[4:])
            if current_action not in self.actions_dict:
                self.actions_category.append(current_action)
                self.actions_index.append(i)
                self.actions_dict[current_action] = [action]
            else:
                self.actions_dict[current_action].append(action)

        # category -> [first index of this category, first index of the next
        # category]; the last category ends at the number of real actions.
        ends = self.actions_index[1:] + [len(self.actions_list)]
        self.actions_indexes = {
            category: [start, end]
            for category, start, end in zip(
                self.actions_category, self.actions_index, ends
            )
        }

        self.actions_list = self.actions_list + [',', '.']  # bos,eos(.) and pad(,) tokens
        vocab_size = len(self.actions_list)
        self.actions_indexes[','] = [vocab_size - 2, vocab_size - 1]  # pad_index(,)
        self.actions_indexes['.'] = [vocab_size - 1, vocab_size]  # bos_index and eos_index(.)
        self.pad_index = vocab_size - 2
        self.bos_index = vocab_size - 1

    def __getitem__(self, index):
        """Return ``(LongTensor of action indices, exp(reward))`` for one item.

        The item is taken from the selected split (``self.data`` /
        ``self.target``) so that it matches what ``__len__`` reports; indexing
        the unsplit lists would make the ``train=False`` dataset return the
        leading training records instead of the held-out ones.
        """
        actions_idx = [self.actions_to_index[name] for name in self.data[index]]
        action = torch.LongTensor(actions_idx)
        reward = np.exp(self.target[index])
        return action, reward

    def __len__(self):
        """Number of records in the selected split."""
        return len(self.data)

In [None]:
# NOTE(review): `MLP` is defined in a later cell of this notebook, so running
# this cell on a fresh kernel raises NameError until that cell has been run.
model = MLP(
    num_tokens=154,
    num_outputs=1,
    num_hid=1024,
    num_layers=4,  # TODO: add these as hyperparameters?
    max_len=38,
    dropout=0.1,
)


In [None]:
import torch
import torch.nn as nn

def Embedding(num_embeddings, embedding_dim, padding_idx=None):
    """Build an ``nn.Embedding`` with scaled-normal initial weights.

    Weights are drawn from a normal distribution with mean 0 and standard
    deviation ``embedding_dim ** -0.5``. When ``padding_idx`` is given, the
    corresponding row is then set to zero.

    Args:
        num_embeddings: Number of rows in the embedding table.
        embedding_dim: Size of each embedding vector.
        padding_idx: Optional row index to zero out (also forwarded to
            ``nn.Embedding``).

    Returns:
        The initialised ``nn.Embedding`` module.
    """
    layer = nn.Embedding(num_embeddings, embedding_dim, padding_idx=padding_idx)
    scale = embedding_dim ** -0.5
    nn.init.normal_(layer.weight, mean=0, std=scale)
    if padding_idx is None:
        return layer
    nn.init.constant_(layer.weight[padding_idx], 0)
    return layer
    
class MLP(nn.Module):
    """Feed-forward regressor over a fixed-length sequence of token indices.

    Each token is embedded into a ``num_tokens``-dimensional vector, the
    embeddings of one sequence are concatenated, and the result goes through
    an input projection, ``num_layers`` blocks of Dropout -> ReLU -> Linear,
    and a final linear output layer.

    Args:
        num_tokens: Vocabulary size; also used as the embedding width.
        num_outputs: Width of the output layer.
        num_hid: Width of every hidden layer.
        num_layers: Number of Dropout/ReLU/Linear blocks.
        max_len: Sequence length the input projection is sized for.
        dropout: Dropout probability used in every block.
        partition_init: Accepted but not used by this class.
    """

    def __init__(self, num_tokens, num_outputs, num_hid,
                 num_layers, max_len=60, dropout=0.1,
                 partition_init=150.0,):
        super().__init__()
        self.input = nn.Linear(num_tokens * max_len, num_hid)
        blocks = []
        for _ in range(num_layers):
            blocks.extend([
                nn.Dropout(dropout),
                nn.ReLU(),
                nn.Linear(num_hid, num_hid),
            ])
        self.hidden = nn.Sequential(*blocks)
        self.output = nn.Linear(num_hid, num_outputs)
        self.max_len = max_len
        self.num_tokens = num_tokens
        self.emb = Embedding(self.num_tokens, self.num_tokens)

    def forward(self, x, return_all=False, lens=None):
        """Run the network and return the outputs flattened to one dimension.

        Args:
            x: Integer index tensor; after embedding, everything past the
                first dimension is flattened, so each row must contain
                ``max_len`` tokens to match the input projection.
            return_all: Accepted but not used.
            lens: Accepted but not used.
        """
        embedded = self.emb(x)
        # Concatenate the per-token embeddings of each sequence.
        flat = embedded.reshape(embedded.size(0), -1)
        features = self.hidden(self.input(flat))
        return self.output(features).reshape(-1)



In [None]:
from sklearn.metrics import mean_absolute_error
import torch
import os
import shutil
import time
import numpy as np
def save_ckpt(state, is_best, model_save_dir):
    """Write ``state`` as the current checkpoint and optionally as the best.

    File names come from the module-level ``args`` (``current_w`` and
    ``best_w``) and are placed inside ``model_save_dir``.

    Args:
        state: Object passed to ``torch.save``.
        is_best: When truthy, the freshly written checkpoint is also copied
            over the best-weights file.
        model_save_dir: Directory that receives the checkpoint files.
    """
    latest_path = os.path.join(model_save_dir, args.current_w)
    best_path = os.path.join(model_save_dir, args.best_w)
    torch.save(state, latest_path)
    if is_best:
        shutil.copyfile(latest_path, best_path)

def cal_mean_error(y_true, y_pred):
    """Mean absolute error between two tensors, computed via scikit-learn.

    Both tensors are flattened, moved to the CPU, detached, and converted to
    float NumPy arrays before being handed to ``mean_absolute_error``.
    """
    true_np, pred_np = (
        tensor.view(-1).cpu().detach().numpy().astype(float)
        for tensor in (y_true, y_pred)
    )
    return mean_absolute_error(true_np, pred_np)

def mkdirs(path):
    """Create directory ``path`` (and any missing parents) if it is absent.

    Uses ``exist_ok=True`` instead of a separate existence check, so the call
    stays safe when another process creates the directory in between.

    Raises:
        FileExistsError: If ``path`` already exists but is not a directory.
    """
    os.makedirs(path, exist_ok=True)

# adjust learning rate 
def adjust_learning_rate(optimizer, lr):
    """Set ``lr`` on every parameter group of ``optimizer`` and return it."""
    for group in optimizer.param_groups:
        group.update(lr=lr)
    return lr

class AttrDict(dict):
    """A ``dict`` whose keys can also be read and written as attributes."""

    def __init__(self, *args, **kwargs):
        """Accept the same arguments as ``dict``."""
        super(AttrDict, self).__init__(*args, **kwargs)
        # Alias the instance namespace to the dict itself, so `d.key` and
        # `d['key']` refer to the same storage.
        self.__dict__ = self
  # vocab = ["0", "1", "2", "3", "4", "5", "6", "7", "8", '9', '.', ',']    
# Notebook-wide training configuration, read by save_ckpt() and train().
args = AttrDict(
    resume=False,  # currently not read by train()
    ckpt='model/',  # root directory under which train() creates its run directory
    batch_size=128,
    model_name="proxy",
    stage_epoch=[32, 64, 128, 256],  # epochs after which lr is divided by lr_decay
    lr=0.01,
    max_epoch=256,
    current_w='current_w.pth',  # saved current weight path
    best_w='best_w.pth',  # saved best weight path
    lr_decay=10,
)
def print_time_cost(since):
    """Return the time elapsed since ``since`` formatted as ``'<m>m<s>s\\n'``.

    Args:
        since: A start timestamp as returned by ``time.time()``.

    Returns:
        The elapsed wall-clock time, rounded to the nearest second and split
        into minutes and seconds. Nothing is printed despite the name.
    """
    # Round the total first and split afterwards; formatting the floored
    # minutes and the rounded seconds independently turned e.g. 59.7 s into
    # "0m60s" instead of "1m0s".
    total_seconds = round(time.time() - since)
    minutes, seconds = divmod(total_seconds, 60)
    return '{:d}m{:d}s\n'.format(minutes, seconds)

In [None]:
import torch, time, os, shutil
import numpy as np
import pandas as pd
#from tensorboard_logger import Logger
from torch import nn, optim
from torch.utils.data import DataLoader
import os

# Expose only GPU 0 to CUDA.
# NOTE(review): this presumably has to run before CUDA is first initialised in
# this kernel to have any effect — confirm.
os.environ["CUDA_VISIBLE_DEVICES"] = "0"

# Use the GPU when one is available, otherwise fall back to the CPU.
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

# Seed torch's random number generators with a fixed value.
torch.manual_seed(41)
torch.cuda.manual_seed(41)

def train_epoch(model, optimizer, criterion, train_dataloader, show_interval=10):
    """Run one optimisation pass over ``train_dataloader``.

    Args:
        model: Network to train; put into training mode here.
        optimizer: Optimizer stepped once per batch.
        criterion: Loss called as ``criterion(output, target)`` on float32
            tensors.
        train_dataloader: Iterable yielding ``(inputs, target)`` batches.
        show_interval: A progress line is printed every this many batches.

    Returns:
        ``(mean loss, mean error)`` averaged over the batches. The second
        value (labelled "mse" in the log line) is whatever ``cal_mean_error``
        returns, which in this notebook is the mean absolute error.
    """
    model.train()
    print("start_training")
    loss_total, err_total, it_count = 0, 0, 0
    for batch_inputs, batch_target in train_dataloader:
        batch_inputs = batch_inputs.to(device)
        batch_target = batch_target.to(device)
        # Reset gradients accumulated by the previous batch.
        optimizer.zero_grad()
        prediction = model(batch_inputs).to(torch.float32)
        batch_target = batch_target.to(torch.float32)
        loss = criterion(prediction, batch_target)
        loss.backward()
        optimizer.step()

        it_count += 1
        batch_loss = loss.item()
        batch_err = cal_mean_error(batch_target, prediction)
        loss_total += batch_loss
        err_total += batch_err
        if it_count % show_interval == 0:
            print("%d,loss:%.3e mse:%.3f" % (it_count, batch_loss, batch_err))
    return loss_total / it_count, err_total / it_count


def val_epoch(model, criterion, val_dataloader, threshold=0.5):
    """Evaluate ``model`` on ``val_dataloader`` without updating it.

    Args:
        model: Network to evaluate; put into eval mode here.
        criterion: Loss called as ``criterion(output, target)``.
        val_dataloader: Iterable yielding ``(inputs, target)`` batches.
        threshold: Accepted but not used.

    Returns:
        ``(mean loss, mean error)`` averaged over the batches, where the error
        is whatever ``cal_mean_error`` returns (mean absolute error in this
        notebook).
    """
    model.eval()
    mse_meter, loss_meter, it_count = 0, 0, 0
    with torch.no_grad():
        for inputs, target in val_dataloader:
            inputs = inputs.to(device)
            target = target.to(device)
            output = model(inputs)
            # Cast both sides to float32 exactly as train_epoch does, so the
            # criterion never receives mismatched dtypes and the train and
            # validation losses are computed at the same precision.
            output = output.to(torch.float32)
            target = target.to(torch.float32)
            loss = criterion(output, target)
            loss_meter += loss.item()
            it_count += 1
            mse = cal_mean_error(target, output)
            mse_meter += mse
    return loss_meter / it_count, mse_meter / it_count


def train(args):
    """Train the MLP reward proxy and checkpoint it after every epoch.

    Builds the model and the train/validation ``trafficSet`` loaders, then
    trains for ``args.max_epoch`` epochs with Adam and MSE loss. After each
    epoch the current weights are saved, and they are additionally saved as
    the best weights whenever the validation error improves. After every epoch
    listed in ``args.stage_epoch`` the learning rate is divided by
    ``args.lr_decay`` and the best weights so far are reloaded.

    Args:
        args: Configuration object providing ``batch_size``, ``lr``, ``ckpt``,
            ``model_name``, ``max_epoch``, ``stage_epoch``, ``lr_decay`` and
            ``best_w`` (``save_ckpt`` additionally reads ``current_w`` from the
            module-level ``args``).

    Note:
        Resuming from a checkpoint (``args.resume``) is not implemented here.
    """
    # get model
    model = MLP(num_tokens=154,
                num_outputs=1,
                num_hid=1024,
                num_layers=4,  # TODO: add these as hyperparameters?
                dropout=0.1,
                max_len=38)
    model = model.to(device)
    print(model)
    # data
    train_dataset = trafficSet(path="a_testset_for_double_direction.json", train=True)
    train_dataloader = DataLoader(train_dataset, batch_size=args.batch_size, shuffle=True, num_workers=6)
    val_dataset = trafficSet(path="a_testset_for_double_direction.json", train=False)
    val_dataloader = DataLoader(val_dataset, batch_size=args.batch_size, num_workers=4)
    print("train_datasize", len(train_dataset), "val_datasize", len(val_dataset))
    # optimizer and loss
    optimizer = optim.Adam(model.parameters(), lr=args.lr)
    criterion = nn.MSELoss()
    # model save dir
    model_save_dir = '%s/%s_%s' % (args.ckpt, args.model_name, time.strftime("%Y%m%d%H%M"))
    mkdirs(model_save_dir)
    # Lowest validation error seen so far. Lower is better, so start at +inf
    # and track the minimum; starting at -1 and tracking the maximum kept the
    # worst epoch as "best" and let almost every epoch overwrite best_w.
    best_mse = float('inf')
    lr = args.lr
    start_epoch = 1
    stage = 1
    # =========>start training<=========
    for epoch in range(start_epoch, args.max_epoch + 1):
        since = time.time()
        train_loss, train_mse = train_epoch(model, optimizer, criterion, train_dataloader, show_interval=100)
        val_loss, val_mse = val_epoch(model, criterion, val_dataloader)
        print('#epoch:%02d stage:%d train_loss:%.3e train_mse:%.3f  val_loss:%0.3e val_mse:%.3f time:%s\n'
              % (epoch, stage, train_loss, train_mse, val_loss, val_mse, print_time_cost(since)))
        state = {"state_dict": model.state_dict(), "epoch": epoch, "loss": val_loss, 'mse': val_mse, 'lr': lr,
                 'stage': stage}
        is_best = val_mse < best_mse
        save_ckpt(state, is_best, model_save_dir)
        best_mse = min(best_mse, val_mse)
        print(best_mse)
        if epoch in args.stage_epoch:
            # Enter the next stage: decay the learning rate and continue from
            # the best checkpoint seen so far.
            stage += 1
            lr /= args.lr_decay
            best_w = os.path.join(model_save_dir, args.best_w)
            model.load_state_dict(torch.load(best_w)['state_dict'])
            print("*" * 10, "step into stage%02d lr %.3ef" % (stage, lr))
            adjust_learning_rate(optimizer, lr)

# Start training with the notebook-level configuration defined in `args`.
train(args)

MLP(
  (input): Linear(in_features=5852, out_features=1024, bias=True)
  (hidden): Sequential(
    (0): Dropout(p=0.1, inplace=False)
    (1): ReLU()
    (2): Linear(in_features=1024, out_features=1024, bias=True)
    (3): Dropout(p=0.1, inplace=False)
    (4): ReLU()
    (5): Linear(in_features=1024, out_features=1024, bias=True)
    (6): Dropout(p=0.1, inplace=False)
    (7): ReLU()
    (8): Linear(in_features=1024, out_features=1024, bias=True)
    (9): Dropout(p=0.1, inplace=False)
    (10): ReLU()
    (11): Linear(in_features=1024, out_features=1024, bias=True)
  )
  (output): Linear(in_features=1024, out_features=1, bias=True)
  (emb): Embedding(154, 154)
)


  cpuset_checked))


train_datasize 3900 val_datasize 975
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:01 stage:1 train_loss:3.042e+06 train_mse:322.124  val_loss:5.327e+01 val_mse:0.458 time:0m9s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:02 stage:1 train_loss:3.364e+03 train_mse:1.900  val_loss:1.547e-01 val_mse:0.332 time:0m9s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:03 stage:1 train_loss:1.844e-01 train_mse:0.303  val_loss:7.865e-02 val_mse:0.238 time:0m10s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:04 stage:1 train_loss:1.685e-01 train_mse:0.290  val_loss:7.560e-02 val_mse:0.233 time:0m9s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:05 stage:1 train_loss:1.271e-01 train_mse:0.273  val_loss:7.119e-02 val_mse:0.226 time:0m9s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:06 stage:1 train_loss:1.268e-01 train_mse:0.277  val_loss:7.414e-02 val_mse:0.231 time:0m9s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:07 stage:1 train_loss:1.311e-01 train_mse:0.264  val_loss:8.062e-02 val_mse:0.241 time:0m9s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:08 stage:1 train_loss:3.756e-01 train_mse:0.269  val_loss:9.158e-02 val_mse:0.257 time:0m9s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:09 stage:1 train_loss:1.307e-01 train_mse:0.255  val_loss:7.147e-02 val_mse:0.227 time:0m9s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:10 stage:1 train_loss:1.471e-01 train_mse:0.259  val_loss:7.956e-02 val_mse:0.240 time:0m9s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:11 stage:1 train_loss:1.065e-01 train_mse:0.255  val_loss:7.638e-02 val_mse:0.235 time:0m9s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:12 stage:1 train_loss:9.078e-02 train_mse:0.245  val_loss:7.160e-02 val_mse:0.227 time:0m9s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:13 stage:1 train_loss:1.179e-01 train_mse:0.251  val_loss:7.188e-02 val_mse:0.227 time:0m9s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:14 stage:1 train_loss:1.023e-01 train_mse:0.249  val_loss:7.366e-02 val_mse:0.230 time:0m9s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:15 stage:1 train_loss:8.556e-02 train_mse:0.244  val_loss:7.524e-02 val_mse:0.233 time:0m9s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:16 stage:1 train_loss:8.337e-02 train_mse:0.240  val_loss:7.750e-02 val_mse:0.236 time:0m9s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:17 stage:1 train_loss:8.440e-02 train_mse:0.239  val_loss:7.158e-02 val_mse:0.227 time:0m10s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:18 stage:1 train_loss:8.900e-02 train_mse:0.244  val_loss:7.244e-02 val_mse:0.229 time:0m9s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:19 stage:1 train_loss:8.107e-02 train_mse:0.241  val_loss:7.549e-02 val_mse:0.233 time:0m9s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:20 stage:1 train_loss:7.813e-02 train_mse:0.237  val_loss:7.376e-02 val_mse:0.231 time:0m9s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:21 stage:1 train_loss:8.009e-02 train_mse:0.236  val_loss:7.926e-02 val_mse:0.239 time:0m10s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:22 stage:1 train_loss:1.381e-01 train_mse:0.245  val_loss:7.219e-02 val_mse:0.229 time:0m11s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:23 stage:1 train_loss:8.159e-02 train_mse:0.241  val_loss:7.487e-02 val_mse:0.232 time:0m12s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:24 stage:1 train_loss:7.750e-02 train_mse:0.235  val_loss:7.331e-02 val_mse:0.230 time:0m13s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:25 stage:1 train_loss:7.617e-02 train_mse:0.234  val_loss:7.068e-02 val_mse:0.226 time:0m13s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:26 stage:1 train_loss:7.606e-02 train_mse:0.234  val_loss:7.224e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:27 stage:1 train_loss:7.442e-02 train_mse:0.233  val_loss:7.195e-02 val_mse:0.228 time:0m15s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:28 stage:1 train_loss:7.540e-02 train_mse:0.233  val_loss:7.083e-02 val_mse:0.226 time:0m15s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:29 stage:1 train_loss:7.476e-02 train_mse:0.233  val_loss:7.084e-02 val_mse:0.226 time:0m16s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:30 stage:1 train_loss:7.384e-02 train_mse:0.232  val_loss:7.077e-02 val_mse:0.226 time:0m16s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:31 stage:1 train_loss:7.500e-02 train_mse:0.233  val_loss:7.148e-02 val_mse:0.227 time:0m16s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:32 stage:1 train_loss:7.296e-02 train_mse:0.230  val_loss:7.146e-02 val_mse:0.227 time:0m16s


0.4575966253904035
********** step into stage02 lr 1.000e-03f
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:33 stage:2 train_loss:6.561e+01 train_mse:0.483  val_loss:4.238e-01 val_mse:0.294 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:34 stage:2 train_loss:1.630e+01 train_mse:0.467  val_loss:7.281e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:35 stage:2 train_loss:1.591e-01 train_mse:0.313  val_loss:7.205e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:36 stage:2 train_loss:1.121e-01 train_mse:0.273  val_loss:7.278e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:37 stage:2 train_loss:9.427e-02 train_mse:0.254  val_loss:7.520e-02 val_mse:0.233 time:0m13s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:38 stage:2 train_loss:8.562e-02 train_mse:0.245  val_loss:7.338e-02 val_mse:0.230 time:0m13s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:39 stage:2 train_loss:8.102e-02 train_mse:0.239  val_loss:7.546e-02 val_mse:0.233 time:0m13s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:40 stage:2 train_loss:8.065e-02 train_mse:0.239  val_loss:7.303e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:41 stage:2 train_loss:7.825e-02 train_mse:0.236  val_loss:7.161e-02 val_mse:0.227 time:0m13s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:42 stage:2 train_loss:7.756e-02 train_mse:0.236  val_loss:7.090e-02 val_mse:0.226 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:43 stage:2 train_loss:7.929e-02 train_mse:0.238  val_loss:7.157e-02 val_mse:0.227 time:0m13s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:44 stage:2 train_loss:7.613e-02 train_mse:0.234  val_loss:7.347e-02 val_mse:0.230 time:0m13s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:45 stage:2 train_loss:7.542e-02 train_mse:0.234  val_loss:7.106e-02 val_mse:0.226 time:0m13s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:46 stage:2 train_loss:7.646e-02 train_mse:0.235  val_loss:7.845e-02 val_mse:0.238 time:0m13s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:47 stage:2 train_loss:7.794e-02 train_mse:0.237  val_loss:7.404e-02 val_mse:0.231 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:48 stage:2 train_loss:7.558e-02 train_mse:0.236  val_loss:7.297e-02 val_mse:0.230 time:0m13s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:49 stage:2 train_loss:7.504e-02 train_mse:0.233  val_loss:7.362e-02 val_mse:0.230 time:0m13s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:50 stage:2 train_loss:7.613e-02 train_mse:0.235  val_loss:7.471e-02 val_mse:0.232 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:51 stage:2 train_loss:7.455e-02 train_mse:0.233  val_loss:7.180e-02 val_mse:0.228 time:0m13s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:52 stage:2 train_loss:7.538e-02 train_mse:0.234  val_loss:7.514e-02 val_mse:0.233 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:53 stage:2 train_loss:7.431e-02 train_mse:0.232  val_loss:7.639e-02 val_mse:0.235 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:54 stage:2 train_loss:7.594e-02 train_mse:0.232  val_loss:7.166e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:55 stage:2 train_loss:7.332e-02 train_mse:0.231  val_loss:7.298e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:56 stage:2 train_loss:7.514e-02 train_mse:0.234  val_loss:7.637e-02 val_mse:0.235 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:57 stage:2 train_loss:7.386e-02 train_mse:0.232  val_loss:7.485e-02 val_mse:0.233 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:58 stage:2 train_loss:7.481e-02 train_mse:0.233  val_loss:7.378e-02 val_mse:0.231 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:59 stage:2 train_loss:7.436e-02 train_mse:0.233  val_loss:7.017e-02 val_mse:0.225 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:60 stage:2 train_loss:7.373e-02 train_mse:0.232  val_loss:7.450e-02 val_mse:0.232 time:0m15s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:61 stage:2 train_loss:7.461e-02 train_mse:0.233  val_loss:7.068e-02 val_mse:0.226 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:62 stage:2 train_loss:7.377e-02 train_mse:0.232  val_loss:7.232e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:63 stage:2 train_loss:7.456e-02 train_mse:0.233  val_loss:6.961e-02 val_mse:0.225 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:64 stage:2 train_loss:7.559e-02 train_mse:0.236  val_loss:7.214e-02 val_mse:0.228 time:0m14s


0.4575966253904035
********** step into stage03 lr 1.000e-04f
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:65 stage:3 train_loss:2.887e+02 train_mse:0.548  val_loss:7.172e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:66 stage:3 train_loss:1.213e-01 train_mse:0.265  val_loss:7.197e-02 val_mse:0.229 time:0m13s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:67 stage:3 train_loss:1.066e-01 train_mse:0.261  val_loss:7.245e-02 val_mse:0.229 time:0m13s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:68 stage:3 train_loss:1.314e-01 train_mse:0.265  val_loss:7.253e-02 val_mse:0.229 time:0m13s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:69 stage:3 train_loss:3.536e-01 train_mse:0.268  val_loss:7.284e-02 val_mse:0.230 time:0m13s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:70 stage:3 train_loss:1.596e-01 train_mse:0.267  val_loss:7.310e-02 val_mse:0.230 time:0m13s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:71 stage:3 train_loss:1.083e-01 train_mse:0.265  val_loss:7.342e-02 val_mse:0.231 time:0m13s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:72 stage:3 train_loss:1.009e-01 train_mse:0.259  val_loss:7.294e-02 val_mse:0.230 time:0m13s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:73 stage:3 train_loss:9.824e-02 train_mse:0.258  val_loss:7.313e-02 val_mse:0.230 time:0m13s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:74 stage:3 train_loss:1.232e-01 train_mse:0.254  val_loss:7.295e-02 val_mse:0.230 time:0m13s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:75 stage:3 train_loss:9.967e-02 train_mse:0.261  val_loss:7.295e-02 val_mse:0.230 time:0m13s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:76 stage:3 train_loss:1.155e-01 train_mse:0.253  val_loss:7.293e-02 val_mse:0.230 time:0m13s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:77 stage:3 train_loss:9.601e-02 train_mse:0.256  val_loss:7.293e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:78 stage:3 train_loss:1.009e-01 train_mse:0.256  val_loss:7.284e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:79 stage:3 train_loss:9.541e-02 train_mse:0.255  val_loss:7.310e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:80 stage:3 train_loss:1.415e-01 train_mse:0.254  val_loss:7.292e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:81 stage:3 train_loss:9.731e-02 train_mse:0.255  val_loss:7.298e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:82 stage:3 train_loss:9.219e-02 train_mse:0.253  val_loss:7.310e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:83 stage:3 train_loss:9.087e-02 train_mse:0.250  val_loss:7.287e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:84 stage:3 train_loss:9.133e-02 train_mse:0.251  val_loss:7.319e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:85 stage:3 train_loss:9.129e-02 train_mse:0.251  val_loss:7.290e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:86 stage:3 train_loss:8.773e-02 train_mse:0.247  val_loss:7.256e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:87 stage:3 train_loss:9.316e-02 train_mse:0.251  val_loss:7.254e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:88 stage:3 train_loss:9.315e-02 train_mse:0.248  val_loss:7.280e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:89 stage:3 train_loss:8.652e-02 train_mse:0.246  val_loss:7.274e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:90 stage:3 train_loss:8.777e-02 train_mse:0.247  val_loss:7.250e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:91 stage:3 train_loss:8.732e-02 train_mse:0.247  val_loss:7.246e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:92 stage:3 train_loss:8.764e-02 train_mse:0.247  val_loss:7.222e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:93 stage:3 train_loss:8.700e-02 train_mse:0.247  val_loss:7.193e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:94 stage:3 train_loss:8.600e-02 train_mse:0.246  val_loss:7.199e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:95 stage:3 train_loss:1.137e-01 train_mse:0.248  val_loss:7.170e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:96 stage:3 train_loss:8.365e-02 train_mse:0.242  val_loss:7.157e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:97 stage:3 train_loss:8.532e-02 train_mse:0.245  val_loss:7.184e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:98 stage:3 train_loss:8.357e-02 train_mse:0.242  val_loss:7.196e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:99 stage:3 train_loss:8.364e-02 train_mse:0.243  val_loss:7.188e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:100 stage:3 train_loss:8.329e-02 train_mse:0.242  val_loss:7.184e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:101 stage:3 train_loss:8.221e-02 train_mse:0.242  val_loss:7.162e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:102 stage:3 train_loss:8.293e-02 train_mse:0.243  val_loss:7.177e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:103 stage:3 train_loss:8.232e-02 train_mse:0.242  val_loss:7.163e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:104 stage:3 train_loss:8.365e-02 train_mse:0.242  val_loss:7.160e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:105 stage:3 train_loss:8.068e-02 train_mse:0.240  val_loss:7.119e-02 val_mse:0.227 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:106 stage:3 train_loss:8.186e-02 train_mse:0.242  val_loss:7.026e-02 val_mse:0.225 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:107 stage:3 train_loss:8.042e-02 train_mse:0.239  val_loss:6.980e-02 val_mse:0.225 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:108 stage:3 train_loss:7.944e-02 train_mse:0.237  val_loss:6.800e-02 val_mse:0.222 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:109 stage:3 train_loss:7.937e-02 train_mse:0.237  val_loss:6.623e-02 val_mse:0.219 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:110 stage:3 train_loss:7.919e-02 train_mse:0.235  val_loss:6.537e-02 val_mse:0.218 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:111 stage:3 train_loss:7.698e-02 train_mse:0.234  val_loss:6.304e-02 val_mse:0.214 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:112 stage:3 train_loss:7.693e-02 train_mse:0.234  val_loss:6.263e-02 val_mse:0.213 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:113 stage:3 train_loss:4.940e+00 train_mse:0.268  val_loss:6.050e-02 val_mse:0.212 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:114 stage:3 train_loss:7.814e-02 train_mse:0.234  val_loss:6.179e-02 val_mse:0.211 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:115 stage:3 train_loss:7.622e-02 train_mse:0.233  val_loss:6.157e-02 val_mse:0.211 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:116 stage:3 train_loss:7.572e-02 train_mse:0.231  val_loss:6.159e-02 val_mse:0.211 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:117 stage:3 train_loss:7.295e-02 train_mse:0.228  val_loss:6.085e-02 val_mse:0.210 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:118 stage:3 train_loss:7.438e-02 train_mse:0.229  val_loss:6.151e-02 val_mse:0.211 time:0m15s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:119 stage:3 train_loss:7.384e-02 train_mse:0.230  val_loss:6.135e-02 val_mse:0.211 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:120 stage:3 train_loss:7.377e-02 train_mse:0.230  val_loss:6.148e-02 val_mse:0.211 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:121 stage:3 train_loss:7.348e-02 train_mse:0.229  val_loss:6.033e-02 val_mse:0.210 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:122 stage:3 train_loss:7.532e-02 train_mse:0.231  val_loss:6.012e-02 val_mse:0.209 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:123 stage:3 train_loss:7.487e-02 train_mse:0.231  val_loss:6.036e-02 val_mse:0.209 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:124 stage:3 train_loss:7.478e-02 train_mse:0.232  val_loss:5.930e-02 val_mse:0.208 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:125 stage:3 train_loss:7.135e-02 train_mse:0.225  val_loss:5.926e-02 val_mse:0.208 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:126 stage:3 train_loss:7.273e-02 train_mse:0.226  val_loss:5.841e-02 val_mse:0.206 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:127 stage:3 train_loss:7.280e-02 train_mse:0.228  val_loss:5.842e-02 val_mse:0.206 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:128 stage:3 train_loss:7.200e-02 train_mse:0.226  val_loss:5.789e-02 val_mse:0.205 time:0m14s


0.4575966253904035
********** step into stage04 lr 1.000e-05f
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:129 stage:4 train_loss:4.398e+02 train_mse:0.824  val_loss:7.186e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:130 stage:4 train_loss:2.015e-01 train_mse:0.274  val_loss:7.181e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:131 stage:4 train_loss:6.875e-01 train_mse:0.293  val_loss:7.196e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:132 stage:4 train_loss:3.433e-01 train_mse:0.277  val_loss:7.215e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:133 stage:4 train_loss:1.774e-01 train_mse:0.275  val_loss:7.233e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:134 stage:4 train_loss:5.097e-01 train_mse:0.282  val_loss:7.242e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:135 stage:4 train_loss:1.923e-01 train_mse:0.277  val_loss:7.246e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:136 stage:4 train_loss:1.986e-01 train_mse:0.277  val_loss:7.250e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:137 stage:4 train_loss:1.241e-01 train_mse:0.268  val_loss:7.266e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:138 stage:4 train_loss:6.528e+01 train_mse:0.390  val_loss:7.248e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:139 stage:4 train_loss:1.385e-01 train_mse:0.269  val_loss:7.252e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:140 stage:4 train_loss:1.189e+00 train_mse:0.283  val_loss:7.259e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:141 stage:4 train_loss:7.707e+00 train_mse:0.341  val_loss:7.264e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:142 stage:4 train_loss:1.107e-01 train_mse:0.262  val_loss:7.253e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:143 stage:4 train_loss:1.061e-01 train_mse:0.264  val_loss:7.264e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:144 stage:4 train_loss:1.484e-01 train_mse:0.264  val_loss:7.268e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:145 stage:4 train_loss:1.427e-01 train_mse:0.269  val_loss:7.272e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:146 stage:4 train_loss:1.062e-01 train_mse:0.261  val_loss:7.278e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:147 stage:4 train_loss:1.291e-01 train_mse:0.263  val_loss:7.287e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:148 stage:4 train_loss:1.203e-01 train_mse:0.263  val_loss:7.304e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:149 stage:4 train_loss:1.468e-01 train_mse:0.263  val_loss:7.310e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:150 stage:4 train_loss:1.091e-01 train_mse:0.264  val_loss:7.305e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:151 stage:4 train_loss:1.569e-01 train_mse:0.273  val_loss:7.307e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:152 stage:4 train_loss:2.032e-01 train_mse:0.272  val_loss:7.308e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:153 stage:4 train_loss:1.375e-01 train_mse:0.263  val_loss:7.327e-02 val_mse:0.231 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:154 stage:4 train_loss:5.813e-01 train_mse:0.279  val_loss:7.328e-02 val_mse:0.231 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:155 stage:4 train_loss:2.853e-01 train_mse:0.273  val_loss:7.318e-02 val_mse:0.231 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:156 stage:4 train_loss:5.039e-01 train_mse:0.269  val_loss:7.320e-02 val_mse:0.231 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:157 stage:4 train_loss:1.524e-01 train_mse:0.266  val_loss:7.311e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:158 stage:4 train_loss:1.038e-01 train_mse:0.259  val_loss:7.324e-02 val_mse:0.231 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:159 stage:4 train_loss:1.397e-01 train_mse:0.269  val_loss:7.324e-02 val_mse:0.231 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:160 stage:4 train_loss:1.186e-01 train_mse:0.262  val_loss:7.313e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:161 stage:4 train_loss:1.655e-01 train_mse:0.267  val_loss:7.320e-02 val_mse:0.231 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:162 stage:4 train_loss:1.309e-01 train_mse:0.265  val_loss:7.317e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:163 stage:4 train_loss:9.942e-02 train_mse:0.259  val_loss:7.321e-02 val_mse:0.231 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:164 stage:4 train_loss:1.172e-01 train_mse:0.260  val_loss:7.323e-02 val_mse:0.231 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:165 stage:4 train_loss:1.233e-01 train_mse:0.258  val_loss:7.330e-02 val_mse:0.231 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:166 stage:4 train_loss:1.214e-01 train_mse:0.264  val_loss:7.344e-02 val_mse:0.231 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:167 stage:4 train_loss:1.926e-01 train_mse:0.268  val_loss:7.330e-02 val_mse:0.231 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:168 stage:4 train_loss:1.935e-01 train_mse:0.268  val_loss:7.337e-02 val_mse:0.231 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:169 stage:4 train_loss:1.170e-01 train_mse:0.260  val_loss:7.341e-02 val_mse:0.231 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:170 stage:4 train_loss:1.014e-01 train_mse:0.258  val_loss:7.339e-02 val_mse:0.231 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:171 stage:4 train_loss:5.061e-01 train_mse:0.274  val_loss:7.318e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:172 stage:4 train_loss:1.390e-01 train_mse:0.265  val_loss:7.307e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:173 stage:4 train_loss:1.070e-01 train_mse:0.258  val_loss:7.302e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:174 stage:4 train_loss:4.548e+00 train_mse:0.295  val_loss:7.299e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:175 stage:4 train_loss:6.689e+01 train_mse:0.391  val_loss:7.275e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:176 stage:4 train_loss:1.108e-01 train_mse:0.254  val_loss:7.278e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:177 stage:4 train_loss:3.209e-01 train_mse:0.265  val_loss:7.287e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:178 stage:4 train_loss:9.842e-02 train_mse:0.258  val_loss:7.306e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:179 stage:4 train_loss:1.081e-01 train_mse:0.256  val_loss:7.315e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:180 stage:4 train_loss:1.001e-01 train_mse:0.255  val_loss:7.324e-02 val_mse:0.231 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:181 stage:4 train_loss:1.042e-01 train_mse:0.259  val_loss:7.329e-02 val_mse:0.231 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:182 stage:4 train_loss:1.181e-01 train_mse:0.259  val_loss:7.311e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:183 stage:4 train_loss:1.206e-01 train_mse:0.257  val_loss:7.305e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:184 stage:4 train_loss:1.386e-01 train_mse:0.257  val_loss:7.304e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:185 stage:4 train_loss:1.086e-01 train_mse:0.258  val_loss:7.334e-02 val_mse:0.231 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:186 stage:4 train_loss:1.696e-01 train_mse:0.268  val_loss:7.329e-02 val_mse:0.231 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:187 stage:4 train_loss:1.200e-01 train_mse:0.258  val_loss:7.312e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:188 stage:4 train_loss:1.164e-01 train_mse:0.258  val_loss:7.314e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:189 stage:4 train_loss:1.035e-01 train_mse:0.254  val_loss:7.304e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:190 stage:4 train_loss:1.072e-01 train_mse:0.258  val_loss:7.316e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:191 stage:4 train_loss:1.013e-01 train_mse:0.258  val_loss:7.316e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:192 stage:4 train_loss:9.243e-02 train_mse:0.250  val_loss:7.315e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:193 stage:4 train_loss:1.138e-01 train_mse:0.257  val_loss:7.314e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:194 stage:4 train_loss:1.162e-01 train_mse:0.257  val_loss:7.307e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:195 stage:4 train_loss:1.210e-01 train_mse:0.259  val_loss:7.307e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:196 stage:4 train_loss:1.055e-01 train_mse:0.252  val_loss:7.315e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:197 stage:4 train_loss:1.917e-01 train_mse:0.258  val_loss:7.318e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:198 stage:4 train_loss:1.037e-01 train_mse:0.256  val_loss:7.323e-02 val_mse:0.231 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:199 stage:4 train_loss:1.140e-01 train_mse:0.255  val_loss:7.318e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:200 stage:4 train_loss:1.135e-01 train_mse:0.255  val_loss:7.303e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:201 stage:4 train_loss:4.566e-01 train_mse:0.262  val_loss:7.295e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:202 stage:4 train_loss:6.042e-01 train_mse:0.269  val_loss:7.294e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:203 stage:4 train_loss:9.426e-02 train_mse:0.253  val_loss:7.300e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:204 stage:4 train_loss:1.460e-01 train_mse:0.254  val_loss:7.309e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:205 stage:4 train_loss:9.456e-02 train_mse:0.252  val_loss:7.307e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:206 stage:4 train_loss:9.053e-02 train_mse:0.251  val_loss:7.315e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:207 stage:4 train_loss:1.073e-01 train_mse:0.253  val_loss:7.311e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:208 stage:4 train_loss:9.728e-02 train_mse:0.253  val_loss:7.316e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:209 stage:4 train_loss:1.203e-01 train_mse:0.257  val_loss:7.302e-02 val_mse:0.230 time:0m15s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:210 stage:4 train_loss:1.014e-01 train_mse:0.253  val_loss:7.277e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:211 stage:4 train_loss:9.368e-02 train_mse:0.252  val_loss:7.291e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:212 stage:4 train_loss:9.910e-02 train_mse:0.253  val_loss:7.291e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:213 stage:4 train_loss:4.523e-01 train_mse:0.267  val_loss:7.291e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:214 stage:4 train_loss:1.167e-01 train_mse:0.254  val_loss:7.293e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:215 stage:4 train_loss:1.151e-01 train_mse:0.253  val_loss:7.306e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:216 stage:4 train_loss:2.644e-01 train_mse:0.257  val_loss:7.294e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:217 stage:4 train_loss:9.673e-02 train_mse:0.254  val_loss:7.283e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:218 stage:4 train_loss:1.090e-01 train_mse:0.256  val_loss:7.268e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:219 stage:4 train_loss:9.435e-02 train_mse:0.252  val_loss:7.254e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:220 stage:4 train_loss:1.039e-01 train_mse:0.254  val_loss:7.258e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:221 stage:4 train_loss:9.998e-02 train_mse:0.253  val_loss:7.264e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:222 stage:4 train_loss:9.815e-02 train_mse:0.252  val_loss:7.278e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:223 stage:4 train_loss:2.041e-01 train_mse:0.258  val_loss:7.271e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:224 stage:4 train_loss:9.174e-02 train_mse:0.250  val_loss:7.262e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:225 stage:4 train_loss:1.837e-01 train_mse:0.258  val_loss:7.272e-02 val_mse:0.230 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:226 stage:4 train_loss:9.439e-02 train_mse:0.253  val_loss:7.258e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:227 stage:4 train_loss:9.539e-02 train_mse:0.251  val_loss:7.245e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:228 stage:4 train_loss:6.372e-01 train_mse:0.263  val_loss:7.238e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:229 stage:4 train_loss:1.056e-01 train_mse:0.250  val_loss:7.253e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:230 stage:4 train_loss:1.063e-01 train_mse:0.253  val_loss:7.248e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:231 stage:4 train_loss:9.486e-02 train_mse:0.250  val_loss:7.233e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:232 stage:4 train_loss:1.038e-01 train_mse:0.251  val_loss:7.228e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:233 stage:4 train_loss:9.115e-02 train_mse:0.252  val_loss:7.228e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:234 stage:4 train_loss:1.448e-01 train_mse:0.251  val_loss:7.236e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:235 stage:4 train_loss:9.766e-02 train_mse:0.248  val_loss:7.216e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:236 stage:4 train_loss:1.013e-01 train_mse:0.248  val_loss:7.217e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:237 stage:4 train_loss:9.063e-02 train_mse:0.249  val_loss:7.217e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:238 stage:4 train_loss:2.408e-01 train_mse:0.257  val_loss:7.214e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:239 stage:4 train_loss:9.353e-02 train_mse:0.248  val_loss:7.219e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:240 stage:4 train_loss:9.048e-02 train_mse:0.247  val_loss:7.232e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:241 stage:4 train_loss:8.906e-02 train_mse:0.245  val_loss:7.226e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:242 stage:4 train_loss:9.959e-02 train_mse:0.250  val_loss:7.224e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:243 stage:4 train_loss:9.233e-02 train_mse:0.248  val_loss:7.220e-02 val_mse:0.229 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:244 stage:4 train_loss:9.470e-02 train_mse:0.247  val_loss:7.210e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:245 stage:4 train_loss:8.640e-02 train_mse:0.247  val_loss:7.193e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:246 stage:4 train_loss:8.904e-02 train_mse:0.248  val_loss:7.188e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:247 stage:4 train_loss:9.070e-02 train_mse:0.245  val_loss:7.192e-02 val_mse:0.228 time:0m15s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:248 stage:4 train_loss:9.678e-02 train_mse:0.249  val_loss:7.190e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:249 stage:4 train_loss:9.205e-02 train_mse:0.247  val_loss:7.199e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:250 stage:4 train_loss:8.898e-02 train_mse:0.248  val_loss:7.183e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:251 stage:4 train_loss:2.504e+00 train_mse:0.271  val_loss:7.177e-02 val_mse:0.228 time:0m15s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:252 stage:4 train_loss:9.110e-02 train_mse:0.245  val_loss:7.176e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:253 stage:4 train_loss:8.697e-02 train_mse:0.244  val_loss:7.176e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:254 stage:4 train_loss:8.558e-02 train_mse:0.246  val_loss:7.174e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:255 stage:4 train_loss:2.108e-01 train_mse:0.259  val_loss:7.184e-02 val_mse:0.228 time:0m14s


0.4575966253904035
start_training


  cpuset_checked))
  cpuset_checked))


#epoch:256 stage:4 train_loss:4.532e-01 train_mse:0.259  val_loss:7.177e-02 val_mse:0.228 time:0m14s


0.4575966253904035
********** step into stage05 lr 1.000e-06f


In [None]:
# Sanity check of the training split: build the dataset and its loader, then
# print the shape of every input batch the loader yields.
import os  # cell-local import: only needed to size the DataLoader worker pool

train_dataset = trafficSet(path = "a_testset_for_double_direction.json",train=True)

# Requesting more workers than the process has CPUs makes PyTorch emit the
# "This DataLoader will create N worker processes in total ..." UserWarning
# (its tail, "cpuset_checked))", is what this cell's saved output shows) and,
# per that warning, can slow loading down or even freeze it. Cap the original
# request of 6 at the usable CPU count, preferring the affinity mask where the
# platform exposes it, as PyTorch's own check does.
if hasattr(os, "sched_getaffinity"):
  usable_cpus = len(os.sched_getaffinity(0))
else:
  usable_cpus = os.cpu_count() or 1
train_num_workers = min(6, max(1, usable_cpus))

train_dataloader = DataLoader(train_dataset, batch_size=args.batch_size, shuffle=True, num_workers=train_num_workers)
# x is the input batch, y the matching targets; only the input shape is shown.
for x,y in train_dataloader:
  print(x.shape)

  cpuset_checked))


torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([128, 38])
torch.Size([60, 38])


In [None]:
# Rebuild the proxy MLP, restore its weights from a saved checkpoint and score
# it on the validation split (trafficSet with train=False).
import os  # cell-local import: only needed to size the DataLoader worker pool

# NOTE(review): num_tokens=154 and max_len=38 are hard-coded. 38 matches the
# batch width printed by the training-loader cell; presumably both should be
# derived from the dataset -- confirm before changing.
model1 =  MLP(num_tokens=154,
                                num_outputs=1,
                                num_hid=1024,
                                num_layers=4, # TODO: add these as hyperparameters?
                                dropout=0.1,
                                max_len=38)
# torch.load unpickles the file, so only point it at checkpoints you trust.
# map_location='cpu' loads the tensors onto the CPU.
# NOTE(review): absolute Colab path; consider a configurable model directory.
model1.load_state_dict(
    torch.load("/content/model/proxy_202206280904/current_w.pth",map_location='cpu')['state_dict']
)
val_dataset = trafficSet(path = "a_testset_for_double_direction.json",train=False)
criterion = nn.MSELoss()

# Requesting more workers than the process has CPUs makes PyTorch emit the
# "This DataLoader will create N worker processes in total ..." UserWarning
# (its tail, "cpuset_checked))", is what this cell's saved output shows) and,
# per that warning, can slow loading down or even freeze it. Cap the original
# request of 4 at the usable CPU count, preferring the affinity mask where the
# platform exposes it, as PyTorch's own check does.
if hasattr(os, "sched_getaffinity"):
  usable_cpus = len(os.sched_getaffinity(0))
else:
  usable_cpus = os.cpu_count() or 1
val_num_workers = min(4, max(1, usable_cpus))

val_dataloader = DataLoader(val_dataset, batch_size=args.batch_size, num_workers=val_num_workers)

# val_epoch returns two values, unpacked here as (val_loss, val_mse).
val_loss, val_mse = val_epoch(model1, criterion, val_dataloader)

  cpuset_checked))


In [None]:
# Display the first value returned by val_epoch for the train=False split.
val_loss

0.07176542143914345

In [None]:
# Display the second value returned by val_epoch for the train=False split.
val_mse

0.22795962596799946