In [1]:
import os
from collections import Counter

import numpy as np
import pandas as pd
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim
import torch.utils.data as data
from tqdm import tqdm

import utility.Data_loader as D
from utility.Custom import CustomDataset
from utility.Model import Mcslt

In [2]:
%%time
if __name__ == '__main__':
    # Experiment driver: trains the Mcslt classifier TOTAL times (one torch
    # seed per run) on a single fixed 80/20 split of the loaded data, records
    # the best test-accuracy epoch of every run, and writes the collected
    # results plus one set of model weights under 'res/'.

    # NOTE(review): 'D:virus/...' has no separator after the drive letter; on
    # Windows that is resolved relative to the current directory of drive D:.
    # Confirm this is intended rather than 'D:/virus/...'.
    read_path = 'D:virus/image/4gram_768/'

    # Not used anywhere in this cell; kept in case a later cell refers to it.
    temp = [[], []]

    Loader = D.File_loader()
    data_a, label_a = Loader.read_files(read_path, interp=False)

    # Order the samples by label and flatten each one into a single row.
    # The row count is taken from the data instead of a hard-coded 10736 so
    # the cell keeps working when the number of files changes.
    idx = np.argsort(label_a)
    sorted_data = data_a[idx].reshape(len(idx), -1)
    sorted_label = sorted(label_a)

    # ---- hyper-parameters -------------------------------------------------
    BATCH_SIZE = 64
    TOTAL = 30                   # number of independent training runs
    EPOCH = 500                  # epochs per run
    NUM_CLASS = 9
    LR = 0.0001
    SEED = list(range(TOTAL))    # run i is seeded with SEED[i]
    Num_Nodes = 768

    CUDA_N = 'cuda:1'
    # The device does not change between runs, so resolve it once.
    device = torch.device(CUDA_N if torch.cuda.is_available() else 'cpu')

    # ---- fixed train / test split -----------------------------------------
    full_dataset = CustomDataset(sorted_data, sorted_label)
    train_size = int(0.8 * len(full_dataset))
    test_size = len(full_dataset) - train_size

    # Seeding right before random_split makes the split identical on every
    # execution of the cell and for every run below.
    torch.manual_seed(10)
    train_dataset, test_dataset = data.random_split(full_dataset, [train_size, test_size])
    # NOTE(review): shuffle=False means the training batches are visited in
    # the same order every epoch; confirm this is deliberate.
    train_loader = data.DataLoader(train_dataset, batch_size=BATCH_SIZE, shuffle=False)
    test_loader = data.DataLoader(test_dataset, batch_size=BATCH_SIZE, shuffle=False)

    # Per-run results, one entry per run, taken at that run's best epoch.
    loss_total = []
    acc_total = []
    pred_total = []
    true_total = []

    # Weights of the best (run, epoch) seen so far across *all* runs. The
    # original cell saved whatever `net` held after the final epoch of the
    # final run, which does not correspond to any of the reported numbers.
    best_overall_acc = float('-inf')
    best_overall_state = None

    for i in tqdm(range(TOTAL)):

        torch.manual_seed(SEED[i])
        net = Mcslt(Num_Nodes, NUM_CLASS)
        net.to(device)
        print(net)

        # dim=1 is the class axis of the (batch, class) logits; leaving it
        # implicit is deprecated and emits a warning on every call.
        softmax = nn.Softmax(dim=1)
        criterion = nn.CrossEntropyLoss()
        optimizer = optim.SGD(net.parameters(), lr=LR, momentum=0.1)

        # Per-epoch history of the current run.
        loss_list = []
        train_acc_list = []
        test_acc_list = []

        pred_temp = []
        true_temp = []

        for epoch in range(EPOCH):
            # ---- training pass ----
            net.train()
            running_loss = 0     # sum (not mean) of the batch losses
            total = train_size
            correct = 0

            for step, images_labels in enumerate(train_loader):
                inputs, labels = images_labels
                inputs = inputs.float().to(device)
                labels = labels.long().to(device)

                outputs = net(inputs)
                loss = criterion(outputs, labels)

                optimizer.zero_grad()
                loss.backward()
                optimizer.step()
                running_loss += loss.item()

                # Training accuracy uses the logits computed before this
                # batch's optimizer step.
                pred = outputs.argmax(dim=1)
                correct += (pred == labels).sum().item()

            train_acc = correct / total
            loss_list.append(running_loss)
            train_acc_list.append(train_acc)
            print('{}th- epoch: {}, train_loss = {}, train_acc = {}'.format(i+1, epoch, running_loss, train_acc))

            # ---- evaluation pass ----
            with torch.no_grad():
                net.eval()
                correct = 0
                total = test_size
                pt, tt = [], []

                for step_t, images_labels_t in enumerate(test_loader):
                    inputs_t, labels_t = images_labels_t
                    inputs_t = inputs_t.float().to(device)
                    labels_t = labels_t.long().to(device)

                    outputs_t = net(inputs_t)
                    outputs_t = softmax(outputs_t)

                    # test accuracy
                    pred_t = outputs_t.argmax(dim=1)

                    pt.append(pred_t)
                    tt.append(labels_t)

                    correct += (pred_t == labels_t).sum().item()

                # Keep this epoch's full prediction / label vectors so the
                # best epoch can be looked up once the run has finished.
                pred_temp.append(torch.cat(pt))
                true_temp.append(torch.cat(tt))

                test_acc = correct / total
                test_acc_list.append(test_acc)

                # Strict '>' keeps the first occurrence of the maximum, the
                # same tie-breaking np.argmax applies below.
                if test_acc > best_overall_acc:
                    best_overall_acc = test_acc
                    # clone(): state_dict() tensors share storage with the
                    # live parameters and would otherwise keep changing.
                    best_overall_state = {
                        name: tensor.detach().cpu().clone()
                        for name, tensor in net.state_dict().items()
                    }

                print('test Acc {}:'.format(test_acc))

        # NOTE(review): the best epoch is chosen by test accuracy, so the test
        # split doubles as a model-selection set and the reported numbers are
        # optimistic. Consider a separate validation split.
        best_result_index = np.argmax(np.array(test_acc_list))
        loss_total.append(loss_list[best_result_index])
        acc_total.append(test_acc_list[best_result_index])
        pred_total.append(pred_temp[best_result_index].tolist())
        true_total.append(true_temp[best_result_index].tolist())

    file_name = 'res/Mcslt_4gram'
    # Create the output directory up front so hours of training are not lost
    # to a missing 'res/' folder.
    os.makedirs(os.path.dirname(file_name), exist_ok=True)

    # Save the weights that produced the best test accuracy over all runs;
    # fall back to the live model only if no evaluation ever ran.
    state_to_save = best_overall_state if best_overall_state is not None else net.state_dict()
    torch.save(state_to_save, file_name + '.pth')

    loss_DF = pd.DataFrame(loss_total)
    loss_DF.to_csv(file_name+" loss.csv")

    acc_DF = pd.DataFrame(acc_total)
    acc_DF.to_csv(file_name +" acc.csv")

    pred_DF = pd.DataFrame(pred_total)
    pred_DF.to_csv(file_name +" pred.csv")

    true_DF = pd.DataFrame(true_total)
    true_DF.to_csv(file_name +" true.csv")

100%|███████████████████████████████████████████████████████████████████| 10736/10736 [00:02<00:00, 4835.43it/s]
  0%|                                                                                    | 0/30 [00:00<?, ?it/s]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
1th- epoch: 0, train_loss = 152.95249550044537, train_acc = 0.7392873777363763




test Acc 0.8310055865921788:
1th- epoch: 1, train_loss = 53.89130235463381, train_acc = 0.8913600372612949
test Acc 0.8966480446927374:
1th- epoch: 2, train_loss = 37.86744794994593, train_acc = 0.9233814625058221
test Acc 0.9199255121042831:
1th- epoch: 3, train_loss = 29.80711743235588, train_acc = 0.9371215649743828
test Acc 0.9278398510242085:
1th- epoch: 4, train_loss = 24.71362467110157, train_acc = 0.9493479273404751
test Acc 0.9334264432029795:
1th- epoch: 5, train_loss = 21.14100305363536, train_acc = 0.9569166278528178
test Acc 0.9394785847299814:
1th- epoch: 6, train_loss = 18.458827279508114, train_acc = 0.9630880298090359
test Acc 0.9436685288640596:
1th- epoch: 7, train_loss = 16.37180996313691, train_acc = 0.9689101071262226
test Acc 0.9450651769087524:
1th- epoch: 8, train_loss = 14.702631890773773, train_acc = 0.971821145784816
test Acc 0.9492551210428305:
1th- epoch: 9, train_loss = 13.332399712875485, train_acc = 0.9741499767116907
test Acc 0.9539106145251397:
1th- e

test Acc 0.9748603351955307:
1th- epoch: 151, train_loss = 1.368846389115788, train_acc = 0.9974382859804378
test Acc 0.9748603351955307:
1th- epoch: 152, train_loss = 1.365379884839058, train_acc = 0.9974382859804378
test Acc 0.9748603351955307:
1th- epoch: 153, train_loss = 1.3611929366597906, train_acc = 0.9974382859804378
test Acc 0.9748603351955307:
1th- epoch: 154, train_loss = 1.3573722405126318, train_acc = 0.9974382859804378
test Acc 0.9748603351955307:
1th- epoch: 155, train_loss = 1.35332613310311, train_acc = 0.9974382859804378
test Acc 0.9748603351955307:
1th- epoch: 156, train_loss = 1.349892637343146, train_acc = 0.9974382859804378
test Acc 0.9748603351955307:
1th- epoch: 157, train_loss = 1.346063214004971, train_acc = 0.9974382859804378
test Acc 0.9748603351955307:
1th- epoch: 158, train_loss = 1.3424196913838387, train_acc = 0.9974382859804378
test Acc 0.9748603351955307:
1th- epoch: 159, train_loss = 1.3385665664682165, train_acc = 0.9974382859804378
test Acc 0.97486

1th- epoch: 299, train_loss = 1.064030094712507, train_acc = 0.9976711690731253
test Acc 0.9762569832402235:
1th- epoch: 300, train_loss = 1.062970593571663, train_acc = 0.9976711690731253
test Acc 0.9762569832402235:
1th- epoch: 301, train_loss = 1.0616804647142999, train_acc = 0.9976711690731253
test Acc 0.9762569832402235:
1th- epoch: 302, train_loss = 1.0608106379513629, train_acc = 0.9976711690731253
test Acc 0.9762569832402235:
1th- epoch: 303, train_loss = 1.0597335982020013, train_acc = 0.9976711690731253
test Acc 0.9762569832402235:
1th- epoch: 304, train_loss = 1.0586116425693035, train_acc = 0.9976711690731253
test Acc 0.9762569832402235:
1th- epoch: 305, train_loss = 1.0580903043155558, train_acc = 0.9976711690731253
test Acc 0.9762569832402235:
1th- epoch: 306, train_loss = 1.0569809141452424, train_acc = 0.9976711690731253
test Acc 0.9762569832402235:
1th- epoch: 307, train_loss = 1.0556661213631742, train_acc = 0.9976711690731253
test Acc 0.9762569832402235:
1th- epoch: 

1th- epoch: 447, train_loss = 0.9537316113710403, train_acc = 0.9977876106194691
test Acc 0.9776536312849162:
1th- epoch: 448, train_loss = 0.9532016081211623, train_acc = 0.9977876106194691
test Acc 0.9776536312849162:
1th- epoch: 449, train_loss = 0.95269675552845, train_acc = 0.9977876106194691
test Acc 0.9776536312849162:
1th- epoch: 450, train_loss = 0.9522973621787969, train_acc = 0.9977876106194691
test Acc 0.9776536312849162:
1th- epoch: 451, train_loss = 0.9515115581452847, train_acc = 0.9977876106194691
test Acc 0.9776536312849162:
1th- epoch: 452, train_loss = 0.9511744988558348, train_acc = 0.9977876106194691
test Acc 0.9776536312849162:
1th- epoch: 453, train_loss = 0.9504037822189275, train_acc = 0.9977876106194691
test Acc 0.9776536312849162:
1th- epoch: 454, train_loss = 0.9501762303116266, train_acc = 0.9977876106194691
test Acc 0.9776536312849162:
1th- epoch: 455, train_loss = 0.9495669106545392, train_acc = 0.9977876106194691
test Acc 0.9776536312849162:
1th- epoch: 

  3%|██▍                                                                      | 1/30 [09:25<4:33:28, 565.81s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
2th- epoch: 0, train_loss = 154.08877535909414, train_acc = 0.7343968327899395
test Acc 0.8389199255121043:
2th- epoch: 1, train_loss = 54.000666469335556, train_acc = 0.884257102934327
test Acc 0.8919925512104283:
2th- epoch: 2, train_loss = 38.284685630351305, train_acc = 0.9189566837447601
test Acc 0.9157355679702048:
2th- epoch: 3, train_loss = 30.541963724419475, train_acc = 0.9354913833255706
test Acc 0.9287709497206704:
2th- epoch: 4, train_loss = 25.61072311922908, train_acc = 0.9437587331159758
test Acc 0.9371508379888268:
2th- epoch: 5, train_loss = 22.09210024960339, train_acc = 0.9523754075454122
te

2th- epoch: 147, train_loss = 1.4901005912106484, train_acc = 0.9973218444340941
test Acc 0.9748603351955307:
2th- epoch: 148, train_loss = 1.4859596739988774, train_acc = 0.9973218444340941
test Acc 0.9748603351955307:
2th- epoch: 149, train_loss = 1.4809331789147109, train_acc = 0.9973218444340941
test Acc 0.9748603351955307:
2th- epoch: 150, train_loss = 1.4764103456400335, train_acc = 0.9973218444340941
test Acc 0.9748603351955307:
2th- epoch: 151, train_loss = 1.4718612676952034, train_acc = 0.9973218444340941
test Acc 0.9748603351955307:
2th- epoch: 152, train_loss = 1.4670769344083965, train_acc = 0.9973218444340941
test Acc 0.9748603351955307:
2th- epoch: 153, train_loss = 1.4622629745863378, train_acc = 0.9973218444340941
test Acc 0.9748603351955307:
2th- epoch: 154, train_loss = 1.458091346314177, train_acc = 0.9973218444340941
test Acc 0.9748603351955307:
2th- epoch: 155, train_loss = 1.452907921280712, train_acc = 0.9973218444340941
test Acc 0.9748603351955307:
2th- epoch: 

2th- epoch: 295, train_loss = 1.1332801307435147, train_acc = 0.9976711690731253
test Acc 0.9781191806331471:
2th- epoch: 296, train_loss = 1.1323615008150227, train_acc = 0.9976711690731253
test Acc 0.9781191806331471:
2th- epoch: 297, train_loss = 1.1308012561057694, train_acc = 0.9976711690731253
test Acc 0.9781191806331471:
2th- epoch: 298, train_loss = 1.1298066930030473, train_acc = 0.9976711690731253
test Acc 0.9781191806331471:
2th- epoch: 299, train_loss = 1.1283519423450343, train_acc = 0.9976711690731253
test Acc 0.9781191806331471:
2th- epoch: 300, train_loss = 1.127551740675699, train_acc = 0.9976711690731253
test Acc 0.9781191806331471:
2th- epoch: 301, train_loss = 1.1262489004875533, train_acc = 0.9976711690731253
test Acc 0.9781191806331471:
2th- epoch: 302, train_loss = 1.1249637734144926, train_acc = 0.9976711690731253
test Acc 0.9781191806331471:
2th- epoch: 303, train_loss = 1.1234685089439154, train_acc = 0.9976711690731253
test Acc 0.9781191806331471:
2th- epoch:

2th- epoch: 445, train_loss = 1.002491298422683, train_acc = 0.9977876106194691
test Acc 0.979050279329609:
2th- epoch: 446, train_loss = 1.00245468999492, train_acc = 0.9977876106194691
test Acc 0.9795158286778398:
2th- epoch: 447, train_loss = 1.0018565698410384, train_acc = 0.9977876106194691
test Acc 0.9795158286778398:
2th- epoch: 448, train_loss = 1.0010332849924453, train_acc = 0.9977876106194691
test Acc 0.9795158286778398:
2th- epoch: 449, train_loss = 1.0008353597368114, train_acc = 0.9977876106194691
test Acc 0.9795158286778398:
2th- epoch: 450, train_loss = 1.0000697312061675, train_acc = 0.9977876106194691
test Acc 0.9795158286778398:
2th- epoch: 451, train_loss = 0.9994704549317248, train_acc = 0.9977876106194691
test Acc 0.9795158286778398:
2th- epoch: 452, train_loss = 0.9993129707872868, train_acc = 0.9977876106194691
test Acc 0.9795158286778398:
2th- epoch: 453, train_loss = 0.9983291539247148, train_acc = 0.9977876106194691
test Acc 0.9795158286778398:
2th- epoch: 45

  7%|████▊                                                                    | 2/30 [19:26<4:28:56, 576.31s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
3th- epoch: 0, train_loss = 123.17900551855564, train_acc = 0.765836050302748
test Acc 0.8654562383612663:
3th- epoch: 1, train_loss = 48.73801824450493, train_acc = 0.895668374476013
test Acc 0.9143389199255121:
3th- epoch: 2, train_loss = 35.17724047601223, train_acc = 0.9253609687936656
test Acc 0.9245810055865922:
3th- epoch: 3, train_loss = 28.33591763302684, train_acc = 0.9415463437354448
test Acc 0.9334264432029795:
3th- epoch: 4, train_loss = 23.950195588171482, train_acc = 0.9507452258965999
test Acc 0.9413407821229051:
3th- epoch: 5, train_loss = 20.844478575512767, train_acc = 0.9587796925943176
test

3th- epoch: 147, train_loss = 1.4876832652371377, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
3th- epoch: 148, train_loss = 1.4830412678420544, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
3th- epoch: 149, train_loss = 1.4778119511902332, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
3th- epoch: 150, train_loss = 1.4728173215407878, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
3th- epoch: 151, train_loss = 1.4692124377470464, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
3th- epoch: 152, train_loss = 1.463656086474657, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
3th- epoch: 153, train_loss = 1.4598353567998856, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
3th- epoch: 154, train_loss = 1.45487134414725, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
3th- epoch: 155, train_loss = 1.4507416635751724, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
3th- epoch: 156, train

3th- epoch: 297, train_loss = 1.1212139179115184, train_acc = 0.9976711690731253
test Acc 0.979050279329609:
3th- epoch: 298, train_loss = 1.1198465749621391, train_acc = 0.9976711690731253
test Acc 0.979050279329609:
3th- epoch: 299, train_loss = 1.1182581645553, train_acc = 0.9976711690731253
test Acc 0.979050279329609:
3th- epoch: 300, train_loss = 1.117754717648495, train_acc = 0.9976711690731253
test Acc 0.979050279329609:
3th- epoch: 301, train_loss = 1.116240366070997, train_acc = 0.9976711690731253
test Acc 0.979050279329609:
3th- epoch: 302, train_loss = 1.115282962739002, train_acc = 0.9976711690731253
test Acc 0.979050279329609:
3th- epoch: 303, train_loss = 1.1135982908308506, train_acc = 0.9976711690731253
test Acc 0.979050279329609:
3th- epoch: 304, train_loss = 1.1124266274273396, train_acc = 0.9976711690731253
test Acc 0.979050279329609:
3th- epoch: 305, train_loss = 1.11134484159993, train_acc = 0.9976711690731253
test Acc 0.979050279329609:
3th- epoch: 306, train_loss

3th- epoch: 446, train_loss = 0.995318283647066, train_acc = 0.9976711690731253
test Acc 0.9795158286778398:
3th- epoch: 447, train_loss = 0.9947852355835494, train_acc = 0.9976711690731253
test Acc 0.9795158286778398:
3th- epoch: 448, train_loss = 0.994014206022257, train_acc = 0.9976711690731253
test Acc 0.9795158286778398:
3th- epoch: 449, train_loss = 0.9937700206937734, train_acc = 0.9976711690731253
test Acc 0.9795158286778398:
3th- epoch: 450, train_loss = 0.9927196465432644, train_acc = 0.9976711690731253
test Acc 0.9795158286778398:
3th- epoch: 451, train_loss = 0.9925276873109397, train_acc = 0.9976711690731253
test Acc 0.9795158286778398:
3th- epoch: 452, train_loss = 0.9918291407229844, train_acc = 0.9976711690731253
test Acc 0.9795158286778398:
3th- epoch: 453, train_loss = 0.9913220877351705, train_acc = 0.9976711690731253
test Acc 0.9795158286778398:
3th- epoch: 454, train_loss = 0.9904582922754344, train_acc = 0.9976711690731253
test Acc 0.9795158286778398:
3th- epoch: 

 10%|███████▎                                                                 | 3/30 [29:24<4:22:18, 582.91s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
4th- epoch: 0, train_loss = 147.49719558656216, train_acc = 0.7502328830926874
test Acc 0.8547486033519553:
4th- epoch: 1, train_loss = 55.71110089123249, train_acc = 0.8878667908709827
test Acc 0.8947858472998138:
4th- epoch: 2, train_loss = 40.02158988267183, train_acc = 0.9175593851886353
test Acc 0.9129422718808193:
4th- epoch: 3, train_loss = 31.796170972287655, train_acc = 0.9337447601304145
test Acc 0.9213221601489758:
4th- epoch: 4, train_loss = 26.57037415355444, train_acc = 0.945388914764788
test Acc 0.9278398510242085:
4th- epoch: 5, train_loss = 22.898487240076065, train_acc = 0.9526082906380997
tes

test Acc 0.9771880819366853:
4th- epoch: 147, train_loss = 1.5069506367435679, train_acc = 0.9976711690731253
test Acc 0.9771880819366853:
4th- epoch: 148, train_loss = 1.5021513676038012, train_acc = 0.9976711690731253
test Acc 0.9771880819366853:
4th- epoch: 149, train_loss = 1.4972094086697325, train_acc = 0.9976711690731253
test Acc 0.9771880819366853:
4th- epoch: 150, train_loss = 1.4921583185205236, train_acc = 0.9976711690731253
test Acc 0.9771880819366853:
4th- epoch: 151, train_loss = 1.487641990184784, train_acc = 0.9976711690731253
test Acc 0.9776536312849162:
4th- epoch: 152, train_loss = 1.4830655058613047, train_acc = 0.9976711690731253
test Acc 0.9771880819366853:
4th- epoch: 153, train_loss = 1.4782175148138776, train_acc = 0.9976711690731253
test Acc 0.9771880819366853:
4th- epoch: 154, train_loss = 1.4739153943955898, train_acc = 0.9976711690731253
test Acc 0.9771880819366853:
4th- epoch: 155, train_loss = 1.4699126580962911, train_acc = 0.9976711690731253
test Acc 0.

4th- epoch: 296, train_loss = 1.1369840527477209, train_acc = 0.9980204937121565
test Acc 0.979050279329609:
4th- epoch: 297, train_loss = 1.1359189748764038, train_acc = 0.9980204937121565
test Acc 0.979050279329609:
4th- epoch: 298, train_loss = 1.134335229784483, train_acc = 0.9980204937121565
test Acc 0.979050279329609:
4th- epoch: 299, train_loss = 1.1334302152099553, train_acc = 0.9980204937121565
test Acc 0.979050279329609:
4th- epoch: 300, train_loss = 1.1321919833717402, train_acc = 0.9980204937121565
test Acc 0.979050279329609:
4th- epoch: 301, train_loss = 1.130595007300144, train_acc = 0.9980204937121565
test Acc 0.979050279329609:
4th- epoch: 302, train_loss = 1.1299029129149858, train_acc = 0.9980204937121565
test Acc 0.979050279329609:
4th- epoch: 303, train_loss = 1.128212379902834, train_acc = 0.9980204937121565
test Acc 0.979050279329609:
4th- epoch: 304, train_loss = 1.1273093186318874, train_acc = 0.9980204937121565
test Acc 0.979050279329609:
4th- epoch: 305, train

4th- epoch: 445, train_loss = 1.007431839898345, train_acc = 0.9981369352585002
test Acc 0.9799813780260708:
4th- epoch: 446, train_loss = 1.0061978946177987, train_acc = 0.9981369352585002
test Acc 0.9799813780260708:
4th- epoch: 447, train_loss = 1.0064678614289733, train_acc = 0.9981369352585002
test Acc 0.9799813780260708:
4th- epoch: 448, train_loss = 1.005401940390584, train_acc = 0.9981369352585002
test Acc 0.9799813780260708:
4th- epoch: 449, train_loss = 1.0052430381329032, train_acc = 0.9981369352585002
test Acc 0.9799813780260708:
4th- epoch: 450, train_loss = 1.0044450287969084, train_acc = 0.9981369352585002
test Acc 0.9799813780260708:
4th- epoch: 451, train_loss = 1.003870299711707, train_acc = 0.9981369352585002
test Acc 0.9799813780260708:
4th- epoch: 452, train_loss = 1.0038677801640006, train_acc = 0.9981369352585002
test Acc 0.9799813780260708:
4th- epoch: 453, train_loss = 1.0027519750146894, train_acc = 0.9981369352585002
test Acc 0.9799813780260708:
4th- epoch: 4

 13%|█████████▋                                                               | 4/30 [39:24<4:14:44, 587.87s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
5th- epoch: 0, train_loss = 138.70187711715698, train_acc = 0.7395202608290639
test Acc 0.8505586592178771:
5th- epoch: 1, train_loss = 51.63381112366915, train_acc = 0.8914764788076386
test Acc 0.9031657355679702:
5th- epoch: 2, train_loss = 36.8081136867404, train_acc = 0.9232650209594784
test Acc 0.9245810055865922:
5th- epoch: 3, train_loss = 29.473633747547865, train_acc = 0.9386353050768514
test Acc 0.9338919925512105:
5th- epoch: 4, train_loss = 24.857946317642927, train_acc = 0.9479506287843502
test Acc 0.9385474860335196:
5th- epoch: 5, train_loss = 21.57964688912034, train_acc = 0.9563344201210993
tes

5th- epoch: 147, train_loss = 1.4506375116761774, train_acc = 0.9972054028877504
test Acc 0.9776536312849162:
5th- epoch: 148, train_loss = 1.445879136910662, train_acc = 0.9972054028877504
test Acc 0.9776536312849162:
5th- epoch: 149, train_loss = 1.4413319460581988, train_acc = 0.9970889613414066
test Acc 0.9776536312849162:
5th- epoch: 150, train_loss = 1.4368453368078917, train_acc = 0.9972054028877504
test Acc 0.9776536312849162:
5th- epoch: 151, train_loss = 1.4321783112827688, train_acc = 0.9972054028877504
test Acc 0.9776536312849162:
5th- epoch: 152, train_loss = 1.4276916680391878, train_acc = 0.9972054028877504
test Acc 0.9776536312849162:
5th- epoch: 153, train_loss = 1.4233582869637758, train_acc = 0.9972054028877504
test Acc 0.9776536312849162:
5th- epoch: 154, train_loss = 1.4189039536286145, train_acc = 0.9972054028877504
test Acc 0.9776536312849162:
5th- epoch: 155, train_loss = 1.4144825593102723, train_acc = 0.9972054028877504
test Acc 0.9776536312849162:
5th- epoch:

5th- epoch: 295, train_loss = 1.096132454171311, train_acc = 0.9975547275267815
test Acc 0.9795158286778398:
5th- epoch: 296, train_loss = 1.0949525758624077, train_acc = 0.9975547275267815
test Acc 0.9795158286778398:
5th- epoch: 297, train_loss = 1.0939288244699128, train_acc = 0.9975547275267815
test Acc 0.9795158286778398:
5th- epoch: 298, train_loss = 1.0926783972536214, train_acc = 0.9975547275267815
test Acc 0.9795158286778398:
5th- epoch: 299, train_loss = 1.0915734029258601, train_acc = 0.9975547275267815
test Acc 0.9795158286778398:
5th- epoch: 300, train_loss = 1.0904840373550542, train_acc = 0.9975547275267815
test Acc 0.9795158286778398:
5th- epoch: 301, train_loss = 1.0897144197369926, train_acc = 0.9975547275267815
test Acc 0.9795158286778398:
5th- epoch: 302, train_loss = 1.0881486025755294, train_acc = 0.9975547275267815
test Acc 0.9795158286778398:
5th- epoch: 303, train_loss = 1.0866456596995704, train_acc = 0.9975547275267815
test Acc 0.9795158286778398:
5th- epoch:

5th- epoch: 443, train_loss = 0.9735722430050373, train_acc = 0.9977876106194691
test Acc 0.9799813780260708:
5th- epoch: 444, train_loss = 0.9728127159178257, train_acc = 0.9977876106194691
test Acc 0.9799813780260708:
5th- epoch: 445, train_loss = 0.9723043330013752, train_acc = 0.9977876106194691
test Acc 0.9799813780260708:
5th- epoch: 446, train_loss = 0.9713116809725761, train_acc = 0.9977876106194691
test Acc 0.9799813780260708:
5th- epoch: 447, train_loss = 0.9715440105646849, train_acc = 0.9977876106194691
test Acc 0.9799813780260708:
5th- epoch: 448, train_loss = 0.9704683988238685, train_acc = 0.9977876106194691
test Acc 0.9799813780260708:
5th- epoch: 449, train_loss = 0.9698152666096576, train_acc = 0.9979040521658128
test Acc 0.9799813780260708:
5th- epoch: 450, train_loss = 0.9689186910691205, train_acc = 0.9979040521658128
test Acc 0.9799813780260708:
5th- epoch: 451, train_loss = 0.9685013654234353, train_acc = 0.9979040521658128
test Acc 0.9799813780260708:
5th- epoch

 17%|████████████▏                                                            | 5/30 [49:26<4:06:42, 592.08s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
6th- epoch: 0, train_loss = 145.12541434168816, train_acc = 0.7401024685607824
test Acc 0.8445065176908753:
6th- epoch: 1, train_loss = 53.523081820458174, train_acc = 0.8876339077782953
test Acc 0.8929236499068901:
6th- epoch: 2, train_loss = 37.701557744294405, train_acc = 0.9193060083837913
test Acc 0.9110800744878957:
6th- epoch: 3, train_loss = 29.71613502688706, train_acc = 0.9350256171401956
test Acc 0.9236499068901304:
6th- epoch: 4, train_loss = 24.695085471495986, train_acc = 0.9487657196087564
test Acc 0.9324953445065177:
6th- epoch: 5, train_loss = 21.212551033124328, train_acc = 0.956450861667443
t

6th- epoch: 147, train_loss = 1.4017912931740284, train_acc = 0.9981369352585002
test Acc 0.9739292364990689:
6th- epoch: 148, train_loss = 1.3975938471267, train_acc = 0.9981369352585002
test Acc 0.9739292364990689:
6th- epoch: 149, train_loss = 1.3931218571960926, train_acc = 0.9981369352585002
test Acc 0.9739292364990689:
6th- epoch: 150, train_loss = 1.389257891685702, train_acc = 0.9981369352585002
test Acc 0.9739292364990689:
6th- epoch: 151, train_loss = 1.3851356406812556, train_acc = 0.9981369352585002
test Acc 0.9739292364990689:
6th- epoch: 152, train_loss = 1.3813892069156282, train_acc = 0.9981369352585002
test Acc 0.9739292364990689:
6th- epoch: 153, train_loss = 1.3773728187079541, train_acc = 0.9981369352585002
test Acc 0.9743947858472998:
6th- epoch: 154, train_loss = 1.3734300844371319, train_acc = 0.9981369352585002
test Acc 0.9743947858472998:
6th- epoch: 155, train_loss = 1.3697755237226374, train_acc = 0.9981369352585002
test Acc 0.9743947858472998:
6th- epoch: 15

6th- epoch: 295, train_loss = 1.0953670268354472, train_acc = 0.9981369352585002
test Acc 0.9757914338919925:
6th- epoch: 296, train_loss = 1.0943967774510384, train_acc = 0.9981369352585002
test Acc 0.9757914338919925:
6th- epoch: 297, train_loss = 1.0933005089464132, train_acc = 0.9981369352585002
test Acc 0.9762569832402235:
6th- epoch: 298, train_loss = 1.0922819500265177, train_acc = 0.9981369352585002
test Acc 0.9757914338919925:
6th- epoch: 299, train_loss = 1.0911235846579075, train_acc = 0.9981369352585002
test Acc 0.9757914338919925:
6th- epoch: 300, train_loss = 1.0903192485275213, train_acc = 0.9981369352585002
test Acc 0.9757914338919925:
6th- epoch: 301, train_loss = 1.0891324716212694, train_acc = 0.9981369352585002
test Acc 0.9767225325884544:
6th- epoch: 302, train_loss = 1.088162654399639, train_acc = 0.9981369352585002
test Acc 0.9762569832402235:
6th- epoch: 303, train_loss = 1.087102960795164, train_acc = 0.9981369352585002
test Acc 0.9762569832402235:
6th- epoch: 

6th- epoch: 443, train_loss = 0.9835333861410618, train_acc = 0.9981369352585002
test Acc 0.9771880819366853:
6th- epoch: 444, train_loss = 0.983184405908105, train_acc = 0.9981369352585002
test Acc 0.9776536312849162:
6th- epoch: 445, train_loss = 0.9826679254620103, train_acc = 0.9981369352585002
test Acc 0.9771880819366853:
6th- epoch: 446, train_loss = 0.981956506773713, train_acc = 0.9981369352585002
test Acc 0.9776536312849162:
6th- epoch: 447, train_loss = 0.9815739206969738, train_acc = 0.9981369352585002
test Acc 0.9776536312849162:
6th- epoch: 448, train_loss = 0.9806800559163094, train_acc = 0.9981369352585002
test Acc 0.9776536312849162:
6th- epoch: 449, train_loss = 0.9803753085434437, train_acc = 0.9981369352585002
test Acc 0.9776536312849162:
6th- epoch: 450, train_loss = 0.9795751633791951, train_acc = 0.9981369352585002
test Acc 0.9776536312849162:
6th- epoch: 451, train_loss = 0.9794602480978938, train_acc = 0.9981369352585002
test Acc 0.9776536312849162:
6th- epoch: 

 20%|██████████████▌                                                          | 6/30 [59:28<3:58:05, 595.22s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
7th- epoch: 0, train_loss = 130.6896826326847, train_acc = 0.7472054028877504
test Acc 0.8691806331471136:
7th- epoch: 1, train_loss = 53.300356052815914, train_acc = 0.8874010246856078
test Acc 0.909217877094972:
7th- epoch: 2, train_loss = 37.77710651233792, train_acc = 0.9208197484862599
test Acc 0.930633147113594:
7th- epoch: 3, train_loss = 29.93952849879861, train_acc = 0.9385188635305077
test Acc 0.9376163873370578:
7th- epoch: 4, train_loss = 25.08260739967227, train_acc = 0.9492314857941313
test Acc 0.9464618249534451:
7th- epoch: 5, train_loss = 21.709920037537813, train_acc = 0.9581974848625989
test 

7th- epoch: 147, train_loss = 1.510573111474514, train_acc = 0.9972054028877504
test Acc 0.9799813780260708:
7th- epoch: 148, train_loss = 1.5055828405311331, train_acc = 0.9972054028877504
test Acc 0.9799813780260708:
7th- epoch: 149, train_loss = 1.5008986989269033, train_acc = 0.9972054028877504
test Acc 0.9799813780260708:
7th- epoch: 150, train_loss = 1.4962416788330302, train_acc = 0.9972054028877504
test Acc 0.9799813780260708:
7th- epoch: 151, train_loss = 1.4912759339204058, train_acc = 0.9972054028877504
test Acc 0.9799813780260708:
7th- epoch: 152, train_loss = 1.4869877422461286, train_acc = 0.9972054028877504
test Acc 0.9799813780260708:
7th- epoch: 153, train_loss = 1.482096552848816, train_acc = 0.9972054028877504
test Acc 0.9804469273743017:
7th- epoch: 154, train_loss = 1.477939359843731, train_acc = 0.9972054028877504
test Acc 0.9804469273743017:
7th- epoch: 155, train_loss = 1.4732552418718114, train_acc = 0.9972054028877504
test Acc 0.9804469273743017:
7th- epoch: 1

test Acc 0.9809124767225326:
7th- epoch: 296, train_loss = 1.1454719143803231, train_acc = 0.9979040521658128
test Acc 0.9809124767225326:
7th- epoch: 297, train_loss = 1.1442581477458589, train_acc = 0.9979040521658128
test Acc 0.9809124767225326:
7th- epoch: 298, train_loss = 1.1428947212989442, train_acc = 0.9979040521658128
test Acc 0.9809124767225326:
7th- epoch: 299, train_loss = 1.141693014651537, train_acc = 0.9979040521658128
test Acc 0.9809124767225326:
7th- epoch: 300, train_loss = 1.1395873266155832, train_acc = 0.9979040521658128
test Acc 0.9809124767225326:
7th- epoch: 301, train_loss = 1.1386179749970324, train_acc = 0.9979040521658128
test Acc 0.9809124767225326:
7th- epoch: 302, train_loss = 1.137072067707777, train_acc = 0.9979040521658128
test Acc 0.9809124767225326:
7th- epoch: 303, train_loss = 1.1361490090494044, train_acc = 0.9979040521658128
test Acc 0.9809124767225326:
7th- epoch: 304, train_loss = 1.1344769683782943, train_acc = 0.9979040521658128
test Acc 0.9

7th- epoch: 444, train_loss = 1.013663181423908, train_acc = 0.9979040521658128
test Acc 0.9818435754189944:
7th- epoch: 445, train_loss = 1.01259826371097, train_acc = 0.9979040521658128
test Acc 0.9818435754189944:
7th- epoch: 446, train_loss = 1.0122396163642406, train_acc = 0.9977876106194691
test Acc 0.9818435754189944:
7th- epoch: 447, train_loss = 1.011437720299, train_acc = 0.9977876106194691
test Acc 0.9818435754189944:
7th- epoch: 448, train_loss = 1.0107593213615473, train_acc = 0.9979040521658128
test Acc 0.9818435754189944:
7th- epoch: 449, train_loss = 1.0104109980165958, train_acc = 0.9977876106194691
test Acc 0.9818435754189944:
7th- epoch: 450, train_loss = 1.0095544196665287, train_acc = 0.9977876106194691
test Acc 0.9818435754189944:
7th- epoch: 451, train_loss = 1.0090011445281561, train_acc = 0.9979040521658128
test Acc 0.9818435754189944:
7th- epoch: 452, train_loss = 1.0082944383320864, train_acc = 0.9977876106194691
test Acc 0.9818435754189944:
7th- epoch: 453, 

 23%|████████████████▌                                                      | 7/30 [1:09:31<3:49:00, 597.42s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
8th- epoch: 0, train_loss = 139.13524037599564, train_acc = 0.7424312994876572
test Acc 0.8645251396648045:
8th- epoch: 1, train_loss = 53.41073361411691, train_acc = 0.8872845831392641
test Acc 0.9068901303538175:
8th- epoch: 2, train_loss = 38.439810164272785, train_acc = 0.9184909175593852
test Acc 0.9283054003724395:
8th- epoch: 3, train_loss = 30.718181427568197, train_acc = 0.9373544480670704
test Acc 0.9380819366852886:
8th- epoch: 4, train_loss = 25.766608955338597, train_acc = 0.9471355379599441
test Acc 0.9422718808193669:
8th- epoch: 5, train_loss = 22.255240177735686, train_acc = 0.9547042384722869


test Acc 0.9776536312849162:
8th- epoch: 147, train_loss = 1.457721425802447, train_acc = 0.9977876106194691
test Acc 0.9781191806331471:
8th- epoch: 148, train_loss = 1.4525516275316477, train_acc = 0.9977876106194691
test Acc 0.9781191806331471:
8th- epoch: 149, train_loss = 1.447779467329383, train_acc = 0.9977876106194691
test Acc 0.9781191806331471:
8th- epoch: 150, train_loss = 1.4433828108012676, train_acc = 0.9977876106194691
test Acc 0.9781191806331471:
8th- epoch: 151, train_loss = 1.438342514098622, train_acc = 0.9977876106194691
test Acc 0.9781191806331471:
8th- epoch: 152, train_loss = 1.4338463047752157, train_acc = 0.9977876106194691
test Acc 0.9781191806331471:
8th- epoch: 153, train_loss = 1.4294695189455524, train_acc = 0.9977876106194691
test Acc 0.9781191806331471:
8th- epoch: 154, train_loss = 1.4254361341008916, train_acc = 0.9977876106194691
test Acc 0.9781191806331471:
8th- epoch: 155, train_loss = 1.420253217802383, train_acc = 0.9979040521658128
test Acc 0.978

8th- epoch: 296, train_loss = 1.1012403449858539, train_acc = 0.9979040521658128
test Acc 0.978584729981378:
8th- epoch: 297, train_loss = 1.1001245751976967, train_acc = 0.9979040521658128
test Acc 0.979050279329609:
8th- epoch: 298, train_loss = 1.0991483951802365, train_acc = 0.9979040521658128
test Acc 0.978584729981378:
8th- epoch: 299, train_loss = 1.097308750555385, train_acc = 0.9979040521658128
test Acc 0.979050279329609:
8th- epoch: 300, train_loss = 1.0967159159481525, train_acc = 0.9979040521658128
test Acc 0.979050279329609:
8th- epoch: 301, train_loss = 1.0955212122644298, train_acc = 0.9979040521658128
test Acc 0.979050279329609:
8th- epoch: 302, train_loss = 1.0947031316463836, train_acc = 0.9979040521658128
test Acc 0.979050279329609:
8th- epoch: 303, train_loss = 1.0934013270889409, train_acc = 0.9979040521658128
test Acc 0.979050279329609:
8th- epoch: 304, train_loss = 1.0921919091488235, train_acc = 0.9979040521658128
test Acc 0.979050279329609:
8th- epoch: 305, tra

8th- epoch: 446, train_loss = 0.97237273430801, train_acc = 0.9980204937121565
test Acc 0.979050279329609:
8th- epoch: 447, train_loss = 0.9723350082931574, train_acc = 0.9980204937121565
test Acc 0.979050279329609:
8th- epoch: 448, train_loss = 0.9714453481137753, train_acc = 0.9980204937121565
test Acc 0.979050279329609:
8th- epoch: 449, train_loss = 0.9708541346190032, train_acc = 0.9980204937121565
test Acc 0.979050279329609:
8th- epoch: 450, train_loss = 0.9705657052400056, train_acc = 0.9980204937121565
test Acc 0.979050279329609:
8th- epoch: 451, train_loss = 0.9696929256024305, train_acc = 0.9980204937121565
test Acc 0.979050279329609:
8th- epoch: 452, train_loss = 0.9693793927726801, train_acc = 0.9980204937121565
test Acc 0.979050279329609:
8th- epoch: 453, train_loss = 0.9683564715087414, train_acc = 0.9980204937121565
test Acc 0.979050279329609:
8th- epoch: 454, train_loss = 0.9681377162632998, train_acc = 0.9980204937121565
test Acc 0.979050279329609:
8th- epoch: 455, trai

 27%|██████████████████▉                                                    | 8/30 [1:19:33<3:39:36, 598.91s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
9th- epoch: 0, train_loss = 132.65721866488457, train_acc = 0.7550069864927806
test Acc 0.8417132216014898:
9th- epoch: 1, train_loss = 52.31398078799248, train_acc = 0.8953190498369819
test Acc 0.9031657355679702:
9th- epoch: 2, train_loss = 37.59956260770559, train_acc = 0.926059618071728
test Acc 0.9259776536312849:
9th- epoch: 3, train_loss = 29.97028935328126, train_acc = 0.9411970190964136
test Acc 0.9357541899441341:
9th- epoch: 4, train_loss = 25.07636795192957, train_acc = 0.9509781089892874
test Acc 0.9422718808193669:
9th- epoch: 5, train_loss = 21.62777128443122, train_acc = 0.9568001863064741
test 

9th- epoch: 147, train_loss = 1.424071278423071, train_acc = 0.9972054028877504
test Acc 0.973463687150838:
9th- epoch: 148, train_loss = 1.4196828504791483, train_acc = 0.9973218444340941
test Acc 0.973463687150838:
9th- epoch: 149, train_loss = 1.4149613231420517, train_acc = 0.9973218444340941
test Acc 0.973463687150838:
9th- epoch: 150, train_loss = 1.4107260294258595, train_acc = 0.9973218444340941
test Acc 0.973463687150838:
9th- epoch: 151, train_loss = 1.4064013982424513, train_acc = 0.9973218444340941
test Acc 0.973463687150838:
9th- epoch: 152, train_loss = 1.4019899740815163, train_acc = 0.9973218444340941
test Acc 0.973463687150838:
9th- epoch: 153, train_loss = 1.3981061415979639, train_acc = 0.9973218444340941
test Acc 0.973463687150838:
9th- epoch: 154, train_loss = 1.3934234715998173, train_acc = 0.9973218444340941
test Acc 0.973463687150838:
9th- epoch: 155, train_loss = 1.389848466962576, train_acc = 0.9973218444340941
test Acc 0.973463687150838:
9th- epoch: 156, trai

9th- epoch: 296, train_loss = 1.082230652391445, train_acc = 0.9976711690731253
test Acc 0.9757914338919925:
9th- epoch: 297, train_loss = 1.081392265856266, train_acc = 0.9976711690731253
test Acc 0.9757914338919925:
9th- epoch: 298, train_loss = 1.0799535363912582, train_acc = 0.9976711690731253
test Acc 0.9757914338919925:
9th- epoch: 299, train_loss = 1.0790334616904147, train_acc = 0.9976711690731253
test Acc 0.9757914338919925:
9th- epoch: 300, train_loss = 1.0778583970968612, train_acc = 0.9976711690731253
test Acc 0.9757914338919925:
9th- epoch: 301, train_loss = 1.0765917114913464, train_acc = 0.9976711690731253
test Acc 0.9757914338919925:
9th- epoch: 302, train_loss = 1.0756999514997005, train_acc = 0.9976711690731253
test Acc 0.9757914338919925:
9th- epoch: 303, train_loss = 1.074462780088652, train_acc = 0.9976711690731253
test Acc 0.9762569832402235:
9th- epoch: 304, train_loss = 1.0734060530667193, train_acc = 0.9976711690731253
test Acc 0.9762569832402235:
9th- epoch: 3

9th- epoch: 444, train_loss = 0.962063405662775, train_acc = 0.9977876106194691
test Acc 0.9776536312849162:
9th- epoch: 445, train_loss = 0.9617877168057021, train_acc = 0.9977876106194691
test Acc 0.9776536312849162:
9th- epoch: 446, train_loss = 0.9616364079120103, train_acc = 0.9977876106194691
test Acc 0.9776536312849162:
9th- epoch: 447, train_loss = 0.9606853561999742, train_acc = 0.9977876106194691
test Acc 0.9776536312849162:
9th- epoch: 448, train_loss = 0.9602133147418499, train_acc = 0.9977876106194691
test Acc 0.9776536312849162:
9th- epoch: 449, train_loss = 0.959479139506584, train_acc = 0.9977876106194691
test Acc 0.9776536312849162:
9th- epoch: 450, train_loss = 0.9597858985362109, train_acc = 0.9977876106194691
test Acc 0.9776536312849162:
9th- epoch: 451, train_loss = 0.9588262513279915, train_acc = 0.9977876106194691
test Acc 0.9776536312849162:
9th- epoch: 452, train_loss = 0.9584518087503966, train_acc = 0.9977876106194691
test Acc 0.9776536312849162:
9th- epoch: 

 30%|█████████████████████▎                                                 | 9/30 [1:29:35<3:29:54, 599.75s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
10th- epoch: 0, train_loss = 144.76702085137367, train_acc = 0.7488355845365626
test Acc 0.8472998137802608:
10th- epoch: 1, train_loss = 55.605603531003, train_acc = 0.8887983232417327
test Acc 0.8878026070763501:
10th- epoch: 2, train_loss = 39.45965737849474, train_acc = 0.9207033069399162
test Acc 0.909683426443203:
10th- epoch: 3, train_loss = 31.150475934147835, train_acc = 0.9367722403353517
test Acc 0.9250465549348231:
10th- epoch: 4, train_loss = 25.972970850765705, train_acc = 0.9460875640428504
test Acc 0.9343575418994413:
10th- epoch: 5, train_loss = 22.383294969797134, train_acc = 0.955752212389380

10th- epoch: 145, train_loss = 1.443713710992597, train_acc = 0.9973218444340941
test Acc 0.9725325884543762:
10th- epoch: 146, train_loss = 1.4390854351222515, train_acc = 0.9973218444340941
test Acc 0.9725325884543762:
10th- epoch: 147, train_loss = 1.4348467104136944, train_acc = 0.9973218444340941
test Acc 0.972998137802607:
10th- epoch: 148, train_loss = 1.4303906025597826, train_acc = 0.9973218444340941
test Acc 0.972998137802607:
10th- epoch: 149, train_loss = 1.426138355047442, train_acc = 0.9973218444340941
test Acc 0.972998137802607:
10th- epoch: 150, train_loss = 1.4222035048296675, train_acc = 0.9973218444340941
test Acc 0.972998137802607:
10th- epoch: 151, train_loss = 1.4179262655088678, train_acc = 0.9973218444340941
test Acc 0.972998137802607:
10th- epoch: 152, train_loss = 1.4137486839899793, train_acc = 0.9973218444340941
test Acc 0.972998137802607:
10th- epoch: 153, train_loss = 1.4100199131062254, train_acc = 0.9973218444340941
test Acc 0.972998137802607:
10th- epoc

10th- epoch: 293, train_loss = 1.1091866567730904, train_acc = 0.9976711690731253
test Acc 0.9725325884543762:
10th- epoch: 294, train_loss = 1.10754680755781, train_acc = 0.9976711690731253
test Acc 0.9725325884543762:
10th- epoch: 295, train_loss = 1.1065675057470798, train_acc = 0.9976711690731253
test Acc 0.9725325884543762:
10th- epoch: 296, train_loss = 1.1048610706930049, train_acc = 0.9976711690731253
test Acc 0.9725325884543762:
10th- epoch: 297, train_loss = 1.1041828629677184, train_acc = 0.9976711690731253
test Acc 0.9725325884543762:
10th- epoch: 298, train_loss = 1.102978394657839, train_acc = 0.9976711690731253
test Acc 0.9725325884543762:
10th- epoch: 299, train_loss = 1.1017867836053483, train_acc = 0.9976711690731253
test Acc 0.9725325884543762:
10th- epoch: 300, train_loss = 1.1008804142475128, train_acc = 0.9976711690731253
test Acc 0.9725325884543762:
10th- epoch: 301, train_loss = 1.0995674940641038, train_acc = 0.9976711690731253
test Acc 0.9725325884543762:
10th

10th- epoch: 441, train_loss = 0.9920995458960533, train_acc = 0.9976711690731253
test Acc 0.9739292364990689:
10th- epoch: 442, train_loss = 0.9914227873086929, train_acc = 0.9977876106194691
test Acc 0.9739292364990689:
10th- epoch: 443, train_loss = 0.9906331822276115, train_acc = 0.9976711690731253
test Acc 0.9739292364990689:
10th- epoch: 444, train_loss = 0.9902342719433364, train_acc = 0.9977876106194691
test Acc 0.9739292364990689:
10th- epoch: 445, train_loss = 0.9895072045328561, train_acc = 0.9977876106194691
test Acc 0.9739292364990689:
10th- epoch: 446, train_loss = 0.9892958005366381, train_acc = 0.9977876106194691
test Acc 0.9739292364990689:
10th- epoch: 447, train_loss = 0.9886054011585657, train_acc = 0.9977876106194691
test Acc 0.973463687150838:
10th- epoch: 448, train_loss = 0.9880277551710606, train_acc = 0.9977876106194691
test Acc 0.9739292364990689:
10th- epoch: 449, train_loss = 0.9877637326717377, train_acc = 0.9977876106194691
test Acc 0.973463687150838:
10t

 33%|███████████████████████▎                                              | 10/30 [1:39:37<3:20:10, 600.53s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
11th- epoch: 0, train_loss = 126.04840872436762, train_acc = 0.7611783884489987
test Acc 0.8621973929236499:
11th- epoch: 1, train_loss = 52.50549767538905, train_acc = 0.891243595714951
test Acc 0.9050279329608939:
11th- epoch: 2, train_loss = 37.70993671193719, train_acc = 0.9241965533302282
test Acc 0.9217877094972067:
11th- epoch: 3, train_loss = 30.092312321066856, train_acc = 0.9373544480670704
test Acc 0.9273743016759777:
11th- epoch: 4, train_loss = 25.137697216123343, train_acc = 0.9477177456916628
test Acc 0.9343575418994413:
11th- epoch: 5, train_loss = 21.60839789547026, train_acc = 0.95493712156497

11th- epoch: 145, train_loss = 1.45642449951265, train_acc = 0.9975547275267815
test Acc 0.9767225325884544:
11th- epoch: 146, train_loss = 1.4516100771725178, train_acc = 0.9975547275267815
test Acc 0.9767225325884544:
11th- epoch: 147, train_loss = 1.446702758432366, train_acc = 0.9975547275267815
test Acc 0.9767225325884544:
11th- epoch: 148, train_loss = 1.4418469741940498, train_acc = 0.9975547275267815
test Acc 0.9771880819366853:
11th- epoch: 149, train_loss = 1.4383937617531046, train_acc = 0.9975547275267815
test Acc 0.9771880819366853:
11th- epoch: 150, train_loss = 1.4325105609605089, train_acc = 0.9975547275267815
test Acc 0.9771880819366853:
11th- epoch: 151, train_loss = 1.4291678642621264, train_acc = 0.9975547275267815
test Acc 0.9771880819366853:
11th- epoch: 152, train_loss = 1.4243440827121958, train_acc = 0.9975547275267815
test Acc 0.9771880819366853:
11th- epoch: 153, train_loss = 1.4202794581651688, train_acc = 0.9975547275267815
test Acc 0.9771880819366853:
11th

11th- epoch: 293, train_loss = 1.0968148683314212, train_acc = 0.9977876106194691
test Acc 0.9795158286778398:
11th- epoch: 294, train_loss = 1.0946879659895785, train_acc = 0.9977876106194691
test Acc 0.9795158286778398:
11th- epoch: 295, train_loss = 1.0937812837655656, train_acc = 0.9977876106194691
test Acc 0.9795158286778398:
11th- epoch: 296, train_loss = 1.0922860304708593, train_acc = 0.9977876106194691
test Acc 0.9795158286778398:
11th- epoch: 297, train_loss = 1.0914266954059713, train_acc = 0.9977876106194691
test Acc 0.9795158286778398:
11th- epoch: 298, train_loss = 1.089524497569073, train_acc = 0.9977876106194691
test Acc 0.9795158286778398:
11th- epoch: 299, train_loss = 1.088732064992655, train_acc = 0.9977876106194691
test Acc 0.9795158286778398:
11th- epoch: 300, train_loss = 1.08755162358284, train_acc = 0.9977876106194691
test Acc 0.9795158286778398:
11th- epoch: 301, train_loss = 1.0861142563517205, train_acc = 0.9977876106194691
test Acc 0.9795158286778398:
11th-

11th- epoch: 441, train_loss = 0.9743265906872693, train_acc = 0.9979040521658128
test Acc 0.9795158286778398:
11th- epoch: 442, train_loss = 0.9742079699935857, train_acc = 0.9979040521658128
test Acc 0.9795158286778398:
11th- epoch: 443, train_loss = 0.9732802497746889, train_acc = 0.9979040521658128
test Acc 0.9795158286778398:
11th- epoch: 444, train_loss = 0.9728618413209915, train_acc = 0.9979040521658128
test Acc 0.9795158286778398:
11th- epoch: 445, train_loss = 0.9725408045051154, train_acc = 0.9979040521658128
test Acc 0.9795158286778398:
11th- epoch: 446, train_loss = 0.9714135726389941, train_acc = 0.9979040521658128
test Acc 0.9795158286778398:
11th- epoch: 447, train_loss = 0.9713083915412426, train_acc = 0.9979040521658128
test Acc 0.9795158286778398:
11th- epoch: 448, train_loss = 0.9705820977687836, train_acc = 0.9979040521658128
test Acc 0.9795158286778398:
11th- epoch: 449, train_loss = 0.9702125912008341, train_acc = 0.9979040521658128
test Acc 0.9795158286778398:
1

 37%|█████████████████████████▋                                            | 11/30 [1:49:38<3:10:09, 600.48s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
12th- epoch: 0, train_loss = 142.62350638210773, train_acc = 0.7424312994876572
test Acc 0.866852886405959:
12th- epoch: 1, train_loss = 54.574624706059694, train_acc = 0.8875174662319516
test Acc 0.9124767225325885:
12th- epoch: 2, train_loss = 39.04006975889206, train_acc = 0.9210526315789473
test Acc 0.9278398510242085:
12th- epoch: 3, train_loss = 30.96744266524911, train_acc = 0.9374708896134141
test Acc 0.9343575418994413:
12th- epoch: 4, train_loss = 25.77957373484969, train_acc = 0.9476013041453191
test Acc 0.9432029795158287:
12th- epoch: 5, train_loss = 22.120889184996486, train_acc = 0.95505356311131

12th- epoch: 145, train_loss = 1.4298054116079584, train_acc = 0.9974382859804378
test Acc 0.9743947858472998:
12th- epoch: 146, train_loss = 1.4250788515200838, train_acc = 0.9974382859804378
test Acc 0.9739292364990689:
12th- epoch: 147, train_loss = 1.4208575723459944, train_acc = 0.9974382859804378
test Acc 0.9739292364990689:
12th- epoch: 148, train_loss = 1.4161471935221925, train_acc = 0.9974382859804378
test Acc 0.9743947858472998:
12th- epoch: 149, train_loss = 1.4121306216111407, train_acc = 0.9974382859804378
test Acc 0.9748603351955307:
12th- epoch: 150, train_loss = 1.4079345539212227, train_acc = 0.9974382859804378
test Acc 0.9743947858472998:
12th- epoch: 151, train_loss = 1.40396998077631, train_acc = 0.9974382859804378
test Acc 0.9748603351955307:
12th- epoch: 152, train_loss = 1.3996988447615877, train_acc = 0.9974382859804378
test Acc 0.9748603351955307:
12th- epoch: 153, train_loss = 1.395395594299771, train_acc = 0.9974382859804378
test Acc 0.9743947858472998:
12th

12th- epoch: 292, train_loss = 1.0995155908167362, train_acc = 0.9976711690731253
test Acc 0.9767225325884544:
12th- epoch: 293, train_loss = 1.0985834772291128, train_acc = 0.9976711690731253
test Acc 0.9767225325884544:
12th- epoch: 294, train_loss = 1.0967870814201888, train_acc = 0.9976711690731253
test Acc 0.9767225325884544:
12th- epoch: 295, train_loss = 1.0962023536267225, train_acc = 0.9976711690731253
test Acc 0.9767225325884544:
12th- epoch: 296, train_loss = 1.0954775214195251, train_acc = 0.9976711690731253
test Acc 0.9767225325884544:
12th- epoch: 297, train_loss = 1.093880428612465, train_acc = 0.9976711690731253
test Acc 0.9767225325884544:
12th- epoch: 298, train_loss = 1.0925065515039023, train_acc = 0.9976711690731253
test Acc 0.9767225325884544:
12th- epoch: 299, train_loss = 1.0918510742485523, train_acc = 0.9976711690731253
test Acc 0.9767225325884544:
12th- epoch: 300, train_loss = 1.0906362272799015, train_acc = 0.9976711690731253
test Acc 0.9767225325884544:
12

12th- epoch: 439, train_loss = 0.9806532984075602, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
12th- epoch: 440, train_loss = 0.9800699812622042, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
12th- epoch: 441, train_loss = 0.9793836871831445, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
12th- epoch: 442, train_loss = 0.9790785287768813, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
12th- epoch: 443, train_loss = 0.978467100605485, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
12th- epoch: 444, train_loss = 0.9779487860650988, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
12th- epoch: 445, train_loss = 0.9770718378276797, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
12th- epoch: 446, train_loss = 0.9766528519539861, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
12th- epoch: 447, train_loss = 0.9759190914483042, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
12

 40%|████████████████████████████                                          | 12/30 [1:59:37<3:00:02, 600.16s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
13th- epoch: 0, train_loss = 130.44992643594742, train_acc = 0.7555891942244993
test Acc 0.8561452513966481:
13th- epoch: 1, train_loss = 49.66384865343571, train_acc = 0.8986958546809501
test Acc 0.9082867783985102:
13th- epoch: 2, train_loss = 35.365323424339294, train_acc = 0.9273404750815091
test Acc 0.9269087523277467:
13th- epoch: 3, train_loss = 28.274416513741016, train_acc = 0.9425943176525384
test Acc 0.9343575418994413:
13th- epoch: 4, train_loss = 23.80209792405367, train_acc = 0.9533069399161621
test Acc 0.9399441340782123:
13th- epoch: 5, train_loss = 20.643781404942274, train_acc = 0.957498835584

13th- epoch: 145, train_loss = 1.4895572116365656, train_acc = 0.9973218444340941
test Acc 0.9776536312849162:
13th- epoch: 146, train_loss = 1.4847296638181433, train_acc = 0.9973218444340941
test Acc 0.9776536312849162:
13th- epoch: 147, train_loss = 1.479332355200313, train_acc = 0.9973218444340941
test Acc 0.9776536312849162:
13th- epoch: 148, train_loss = 1.47494590037968, train_acc = 0.9973218444340941
test Acc 0.9776536312849162:
13th- epoch: 149, train_loss = 1.4701636160025373, train_acc = 0.9973218444340941
test Acc 0.9776536312849162:
13th- epoch: 150, train_loss = 1.4653213880956173, train_acc = 0.9974382859804378
test Acc 0.9776536312849162:
13th- epoch: 151, train_loss = 1.4615546464920044, train_acc = 0.9974382859804378
test Acc 0.9776536312849162:
13th- epoch: 152, train_loss = 1.4563944712281227, train_acc = 0.9974382859804378
test Acc 0.9776536312849162:
13th- epoch: 153, train_loss = 1.4521812945604324, train_acc = 0.9974382859804378
test Acc 0.9776536312849162:
13th

test Acc 0.978584729981378:
13th- epoch: 293, train_loss = 1.1291997954249382, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
13th- epoch: 294, train_loss = 1.1277924900059588, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
13th- epoch: 295, train_loss = 1.1262277203495614, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
13th- epoch: 296, train_loss = 1.1253553107380867, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
13th- epoch: 297, train_loss = 1.1238552468712442, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
13th- epoch: 298, train_loss = 1.1230694763362408, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
13th- epoch: 299, train_loss = 1.1218513486091979, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
13th- epoch: 300, train_loss = 1.120525514066685, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
13th- epoch: 301, train_loss = 1.119424528151285, train_acc = 0.9974382859804378
test Acc 0.9

test Acc 0.9795158286778398:
13th- epoch: 441, train_loss = 1.001886816084152, train_acc = 0.9976711690731253
test Acc 0.9795158286778398:
13th- epoch: 442, train_loss = 1.001552085072035, train_acc = 0.9976711690731253
test Acc 0.9795158286778398:
13th- epoch: 443, train_loss = 1.000484367221361, train_acc = 0.9976711690731253
test Acc 0.9795158286778398:
13th- epoch: 444, train_loss = 1.0003945814969484, train_acc = 0.9976711690731253
test Acc 0.9795158286778398:
13th- epoch: 445, train_loss = 0.9997962974011898, train_acc = 0.9976711690731253
test Acc 0.9795158286778398:
13th- epoch: 446, train_loss = 0.9994441643357277, train_acc = 0.9976711690731253
test Acc 0.9795158286778398:
13th- epoch: 447, train_loss = 0.9984567066130694, train_acc = 0.9976711690731253
test Acc 0.9795158286778398:
13th- epoch: 448, train_loss = 0.9979333107767161, train_acc = 0.9976711690731253
test Acc 0.9795158286778398:
13th- epoch: 449, train_loss = 0.9973688920435961, train_acc = 0.9976711690731253
test

 43%|██████████████████████████████▎                                       | 13/30 [2:09:37<2:50:01, 600.11s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
14th- epoch: 0, train_loss = 135.53779469430447, train_acc = 0.7558220773171868
test Acc 0.8608007448789572:
14th- epoch: 1, train_loss = 53.070725195109844, train_acc = 0.8846064275733582
test Acc 0.8980446927374302:
14th- epoch: 2, train_loss = 38.02295248955488, train_acc = 0.9193060083837913
test Acc 0.9162011173184358:
14th- epoch: 3, train_loss = 30.308994226157665, train_acc = 0.9363064741499767
test Acc 0.9273743016759777:
14th- epoch: 4, train_loss = 25.425975371152163, train_acc = 0.9485328365160689
test Acc 0.9348230912476723:
14th- epoch: 5, train_loss = 21.98725873604417, train_acc = 0.955519329296

14th- epoch: 145, train_loss = 1.4710750604281202, train_acc = 0.9972054028877504
test Acc 0.9743947858472998:
14th- epoch: 146, train_loss = 1.4662146344780922, train_acc = 0.9972054028877504
test Acc 0.9743947858472998:
14th- epoch: 147, train_loss = 1.4614148611435667, train_acc = 0.9972054028877504
test Acc 0.9743947858472998:
14th- epoch: 148, train_loss = 1.4566672568907961, train_acc = 0.9972054028877504
test Acc 0.9743947858472998:
14th- epoch: 149, train_loss = 1.451966897933744, train_acc = 0.9972054028877504
test Acc 0.9743947858472998:
14th- epoch: 150, train_loss = 1.4475983729353175, train_acc = 0.9972054028877504
test Acc 0.9743947858472998:
14th- epoch: 151, train_loss = 1.442785949795507, train_acc = 0.9973218444340941
test Acc 0.9743947858472998:
14th- epoch: 152, train_loss = 1.4382406758377329, train_acc = 0.9972054028877504
test Acc 0.9743947858472998:
14th- epoch: 153, train_loss = 1.4339882420608774, train_acc = 0.9972054028877504
test Acc 0.9743947858472998:
14t

14th- epoch: 292, train_loss = 1.1092473777825944, train_acc = 0.9981369352585002
test Acc 0.9757914338919925:
14th- epoch: 293, train_loss = 1.1085247099399567, train_acc = 0.9981369352585002
test Acc 0.9757914338919925:
14th- epoch: 294, train_loss = 1.1071146242320538, train_acc = 0.9981369352585002
test Acc 0.9757914338919925:
14th- epoch: 295, train_loss = 1.1056007432634942, train_acc = 0.9981369352585002
test Acc 0.9757914338919925:
14th- epoch: 296, train_loss = 1.1048896896536462, train_acc = 0.9981369352585002
test Acc 0.9757914338919925:
14th- epoch: 297, train_loss = 1.1035382499103434, train_acc = 0.9981369352585002
test Acc 0.9757914338919925:
14th- epoch: 298, train_loss = 1.1022262945771217, train_acc = 0.9981369352585002
test Acc 0.9757914338919925:
14th- epoch: 299, train_loss = 1.1014073652331717, train_acc = 0.9981369352585002
test Acc 0.9757914338919925:
14th- epoch: 300, train_loss = 1.0998823928530328, train_acc = 0.9981369352585002
test Acc 0.9757914338919925:
1

14th- epoch: 439, train_loss = 0.9873271211981773, train_acc = 0.9982533768048439
test Acc 0.9762569832402235:
14th- epoch: 440, train_loss = 0.9863648911414202, train_acc = 0.9982533768048439
test Acc 0.9762569832402235:
14th- epoch: 441, train_loss = 0.9861909002065659, train_acc = 0.9982533768048439
test Acc 0.9762569832402235:
14th- epoch: 442, train_loss = 0.9852617345750332, train_acc = 0.9982533768048439
test Acc 0.9762569832402235:
14th- epoch: 443, train_loss = 0.985284898430109, train_acc = 0.9982533768048439
test Acc 0.9762569832402235:
14th- epoch: 444, train_loss = 0.9845427088439465, train_acc = 0.9982533768048439
test Acc 0.9762569832402235:
14th- epoch: 445, train_loss = 0.9839812939462718, train_acc = 0.9982533768048439
test Acc 0.9762569832402235:
14th- epoch: 446, train_loss = 0.983008303999668, train_acc = 0.9982533768048439
test Acc 0.9762569832402235:
14th- epoch: 447, train_loss = 0.9827634779212531, train_acc = 0.9982533768048439
test Acc 0.9762569832402235:
14t

 47%|████████████████████████████████▋                                     | 14/30 [2:19:37<2:40:01, 600.09s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
15th- epoch: 0, train_loss = 141.84736455976963, train_acc = 0.7536096879366558
test Acc 0.8556797020484171:
15th- epoch: 1, train_loss = 49.80940514802933, train_acc = 0.8971821145784816
test Acc 0.9115456238361266:
15th- epoch: 2, train_loss = 35.64134393632412, train_acc = 0.9283884489986027
test Acc 0.9236499068901304:
15th- epoch: 3, train_loss = 28.37890825420618, train_acc = 0.9437587331159758
test Acc 0.9329608938547486:
15th- epoch: 4, train_loss = 23.78404115140438, train_acc = 0.9541220307405682
test Acc 0.9385474860335196:
15th- epoch: 5, train_loss = 20.597284607589245, train_acc = 0.96204005589194

15th- epoch: 146, train_loss = 1.4012237936258316, train_acc = 0.9975547275267815
test Acc 0.979050279329609:
15th- epoch: 147, train_loss = 1.3969546022126451, train_acc = 0.9975547275267815
test Acc 0.979050279329609:
15th- epoch: 148, train_loss = 1.3934669172158465, train_acc = 0.9975547275267815
test Acc 0.979050279329609:
15th- epoch: 149, train_loss = 1.3886352615663782, train_acc = 0.9975547275267815
test Acc 0.979050279329609:
15th- epoch: 150, train_loss = 1.384520192979835, train_acc = 0.9975547275267815
test Acc 0.979050279329609:
15th- epoch: 151, train_loss = 1.3804009357700124, train_acc = 0.9975547275267815
test Acc 0.979050279329609:
15th- epoch: 152, train_loss = 1.3765324540436268, train_acc = 0.9975547275267815
test Acc 0.979050279329609:
15th- epoch: 153, train_loss = 1.3726445647189394, train_acc = 0.9975547275267815
test Acc 0.979050279329609:
15th- epoch: 154, train_loss = 1.3686390966176987, train_acc = 0.9975547275267815
test Acc 0.979050279329609:
15th- epoch

15th- epoch: 294, train_loss = 1.0918039915559348, train_acc = 0.9977876106194691
test Acc 0.978584729981378:
15th- epoch: 295, train_loss = 1.0908868374826852, train_acc = 0.9977876106194691
test Acc 0.979050279329609:
15th- epoch: 296, train_loss = 1.090025182813406, train_acc = 0.9977876106194691
test Acc 0.979050279329609:
15th- epoch: 297, train_loss = 1.0888788228330668, train_acc = 0.9977876106194691
test Acc 0.978584729981378:
15th- epoch: 298, train_loss = 1.087767827004427, train_acc = 0.9977876106194691
test Acc 0.979050279329609:
15th- epoch: 299, train_loss = 1.0864663856627885, train_acc = 0.9977876106194691
test Acc 0.979050279329609:
15th- epoch: 300, train_loss = 1.0857542070152704, train_acc = 0.9977876106194691
test Acc 0.979050279329609:
15th- epoch: 301, train_loss = 1.0848266743123531, train_acc = 0.9977876106194691
test Acc 0.979050279329609:
15th- epoch: 302, train_loss = 1.0834789760410786, train_acc = 0.9977876106194691
test Acc 0.979050279329609:
15th- epoch:

test Acc 0.9795158286778398:
15th- epoch: 442, train_loss = 0.9820314297976438, train_acc = 0.9980204937121565
test Acc 0.9795158286778398:
15th- epoch: 443, train_loss = 0.9818070145847742, train_acc = 0.9980204937121565
test Acc 0.9795158286778398:
15th- epoch: 444, train_loss = 0.9808936193585396, train_acc = 0.9980204937121565
test Acc 0.9795158286778398:
15th- epoch: 445, train_loss = 0.9804880196752492, train_acc = 0.9980204937121565
test Acc 0.9795158286778398:
15th- epoch: 446, train_loss = 0.9802265303733293, train_acc = 0.9980204937121565
test Acc 0.9795158286778398:
15th- epoch: 447, train_loss = 0.9799481282534543, train_acc = 0.9980204937121565
test Acc 0.9795158286778398:
15th- epoch: 448, train_loss = 0.9790754889545497, train_acc = 0.9980204937121565
test Acc 0.9795158286778398:
15th- epoch: 449, train_loss = 0.9783231044712011, train_acc = 0.9980204937121565
test Acc 0.9795158286778398:
15th- epoch: 450, train_loss = 0.9780043164792005, train_acc = 0.9980204937121565
t

 50%|███████████████████████████████████                                   | 15/30 [2:29:37<2:30:01, 600.08s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
16th- epoch: 0, train_loss = 142.13731163740158, train_acc = 0.7412668840242198
test Acc 0.8296089385474861:
16th- epoch: 1, train_loss = 52.15036651492119, train_acc = 0.88996273870517
test Acc 0.8985102420856611:
16th- epoch: 2, train_loss = 36.70214994251728, train_acc = 0.9247787610619469
test Acc 0.9180633147113594:
16th- epoch: 3, train_loss = 29.112062893807888, train_acc = 0.941895668374476
test Acc 0.9287709497206704:
16th- epoch: 4, train_loss = 24.302316550165415, train_acc = 0.952491849091756
test Acc 0.9371508379888268:
16th- epoch: 5, train_loss = 20.88670487329364, train_acc = 0.9598276665114113


16th- epoch: 146, train_loss = 1.4566572034964338, train_acc = 0.9974382859804378
test Acc 0.9799813780260708:
16th- epoch: 147, train_loss = 1.451566199422814, train_acc = 0.9974382859804378
test Acc 0.9804469273743017:
16th- epoch: 148, train_loss = 1.447786202072166, train_acc = 0.9974382859804378
test Acc 0.9799813780260708:
16th- epoch: 149, train_loss = 1.44279269000981, train_acc = 0.9974382859804378
test Acc 0.9799813780260708:
16th- epoch: 150, train_loss = 1.4386416139313951, train_acc = 0.9974382859804378
test Acc 0.9799813780260708:
16th- epoch: 151, train_loss = 1.4347680347273126, train_acc = 0.9974382859804378
test Acc 0.9799813780260708:
16th- epoch: 152, train_loss = 1.430306389927864, train_acc = 0.9974382859804378
test Acc 0.9799813780260708:
16th- epoch: 153, train_loss = 1.4264239309122786, train_acc = 0.9974382859804378
test Acc 0.9799813780260708:
16th- epoch: 154, train_loss = 1.4220508424332365, train_acc = 0.9974382859804378
test Acc 0.9799813780260708:
16th- 

16th- epoch: 293, train_loss = 1.1155948738451116, train_acc = 0.9976711690731253
test Acc 0.9809124767225326:
16th- epoch: 294, train_loss = 1.1141384827787988, train_acc = 0.9976711690731253
test Acc 0.9809124767225326:
16th- epoch: 295, train_loss = 1.1133116260170937, train_acc = 0.9976711690731253
test Acc 0.9809124767225326:
16th- epoch: 296, train_loss = 1.1120346250827424, train_acc = 0.9976711690731253
test Acc 0.9809124767225326:
16th- epoch: 297, train_loss = 1.110697594762314, train_acc = 0.9976711690731253
test Acc 0.9809124767225326:
16th- epoch: 298, train_loss = 1.1095225301687606, train_acc = 0.9976711690731253
test Acc 0.9809124767225326:
16th- epoch: 299, train_loss = 1.1083785382215865, train_acc = 0.9976711690731253
test Acc 0.9809124767225326:
16th- epoch: 300, train_loss = 1.1070594415068626, train_acc = 0.9976711690731253
test Acc 0.9809124767225326:
16th- epoch: 301, train_loss = 1.1059383861720562, train_acc = 0.9976711690731253
test Acc 0.9809124767225326:
16

16th- epoch: 440, train_loss = 0.9916626438498497, train_acc = 0.9979040521658128
test Acc 0.9809124767225326:
16th- epoch: 441, train_loss = 0.9910759242775384, train_acc = 0.9979040521658128
test Acc 0.9809124767225326:
16th- epoch: 442, train_loss = 0.9907238172891084, train_acc = 0.9979040521658128
test Acc 0.9809124767225326:
16th- epoch: 443, train_loss = 0.9895817326905672, train_acc = 0.9979040521658128
test Acc 0.9809124767225326:
16th- epoch: 444, train_loss = 0.9897616840898991, train_acc = 0.9979040521658128
test Acc 0.9809124767225326:
16th- epoch: 445, train_loss = 0.9884455725550652, train_acc = 0.9979040521658128
test Acc 0.9813780260707635:
16th- epoch: 446, train_loss = 0.9886908444168512, train_acc = 0.9979040521658128
test Acc 0.9809124767225326:
16th- epoch: 447, train_loss = 0.9874693925085012, train_acc = 0.9979040521658128
test Acc 0.9813780260707635:
16th- epoch: 448, train_loss = 0.9871984322962817, train_acc = 0.9979040521658128
test Acc 0.9809124767225326:
1

 53%|█████████████████████████████████████▎                                | 16/30 [2:39:38<2:20:03, 600.25s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
17th- epoch: 0, train_loss = 147.36077573895454, train_acc = 0.7384722869119702
test Acc 0.8663873370577281:
17th- epoch: 1, train_loss = 51.17999942600727, train_acc = 0.8997438285980438
test Acc 0.909217877094972:
17th- epoch: 2, train_loss = 37.34969172626734, train_acc = 0.9295528644620401
test Acc 0.9287709497206704:
17th- epoch: 3, train_loss = 30.291147138923407, train_acc = 0.9425943176525384
test Acc 0.9329608938547486:
17th- epoch: 4, train_loss = 25.684368815273046, train_acc = 0.9496972519795063
test Acc 0.9385474860335196:
17th- epoch: 5, train_loss = 22.33663908019662, train_acc = 0.95668374476013

17th- epoch: 145, train_loss = 1.4539598425617442, train_acc = 0.9974382859804378
test Acc 0.9720670391061452:
17th- epoch: 146, train_loss = 1.449788780300878, train_acc = 0.9974382859804378
test Acc 0.9725325884543762:
17th- epoch: 147, train_loss = 1.444997377693653, train_acc = 0.9974382859804378
test Acc 0.9725325884543762:
17th- epoch: 148, train_loss = 1.4408920196583495, train_acc = 0.9974382859804378
test Acc 0.9725325884543762:
17th- epoch: 149, train_loss = 1.4364155879011378, train_acc = 0.9974382859804378
test Acc 0.9725325884543762:
17th- epoch: 150, train_loss = 1.4318275587866083, train_acc = 0.9974382859804378
test Acc 0.9725325884543762:
17th- epoch: 151, train_loss = 1.4278025664389133, train_acc = 0.9974382859804378
test Acc 0.9725325884543762:
17th- epoch: 152, train_loss = 1.4229197651147842, train_acc = 0.9974382859804378
test Acc 0.9725325884543762:
17th- epoch: 153, train_loss = 1.4192449748516083, train_acc = 0.9974382859804378
test Acc 0.9725325884543762:
17t

17th- epoch: 293, train_loss = 1.1119885903899558, train_acc = 0.9977876106194691
test Acc 0.9739292364990689:
17th- epoch: 294, train_loss = 1.1101815489237197, train_acc = 0.9977876106194691
test Acc 0.9739292364990689:
17th- epoch: 295, train_loss = 1.1094365653698333, train_acc = 0.9977876106194691
test Acc 0.9739292364990689:
17th- epoch: 296, train_loss = 1.1078423038125038, train_acc = 0.9977876106194691
test Acc 0.9739292364990689:
17th- epoch: 297, train_loss = 1.1073267459869385, train_acc = 0.9977876106194691
test Acc 0.9739292364990689:
17th- epoch: 298, train_loss = 1.1057713094050996, train_acc = 0.9977876106194691
test Acc 0.9739292364990689:
17th- epoch: 299, train_loss = 1.1044079710845836, train_acc = 0.9977876106194691
test Acc 0.9739292364990689:
17th- epoch: 300, train_loss = 1.103281207382679, train_acc = 0.9977876106194691
test Acc 0.9739292364990689:
17th- epoch: 301, train_loss = 1.1022359803318977, train_acc = 0.9977876106194691
test Acc 0.9739292364990689:
17

test Acc 0.9743947858472998:
17th- epoch: 441, train_loss = 0.9864240114984568, train_acc = 0.9980204937121565
test Acc 0.9743947858472998:
17th- epoch: 442, train_loss = 0.9859202528896276, train_acc = 0.9980204937121565
test Acc 0.9743947858472998:
17th- epoch: 443, train_loss = 0.9856771677732468, train_acc = 0.9980204937121565
test Acc 0.9743947858472998:
17th- epoch: 444, train_loss = 0.9848437743785325, train_acc = 0.9980204937121565
test Acc 0.9743947858472998:
17th- epoch: 445, train_loss = 0.9842038340866566, train_acc = 0.9980204937121565
test Acc 0.9743947858472998:
17th- epoch: 446, train_loss = 0.9839763529598713, train_acc = 0.9980204937121565
test Acc 0.9743947858472998:
17th- epoch: 447, train_loss = 0.9834485277533531, train_acc = 0.9980204937121565
test Acc 0.9743947858472998:
17th- epoch: 448, train_loss = 0.98246274763369, train_acc = 0.9980204937121565
test Acc 0.9743947858472998:
17th- epoch: 449, train_loss = 0.9821715404686984, train_acc = 0.9980204937121565
tes

 57%|███████████████████████████████████████▋                              | 17/30 [2:49:38<2:10:01, 600.09s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
18th- epoch: 0, train_loss = 138.0338877737522, train_acc = 0.7496506753609687
test Acc 0.8733705772811918:
18th- epoch: 1, train_loss = 50.93073916435242, train_acc = 0.898346530041919
test Acc 0.9138733705772812:
18th- epoch: 2, train_loss = 36.79111433029175, train_acc = 0.9275733581741965
test Acc 0.9320297951582868:
18th- epoch: 3, train_loss = 29.70471628382802, train_acc = 0.9432929669306008
test Acc 0.9399441340782123:
18th- epoch: 4, train_loss = 25.20223729684949, train_acc = 0.952026082906381
test Acc 0.9422718808193669:
18th- epoch: 5, train_loss = 21.963475976139307, train_acc = 0.9583139264089428


18th- epoch: 145, train_loss = 1.4479262202512473, train_acc = 0.9973218444340941
test Acc 0.9748603351955307:
18th- epoch: 146, train_loss = 1.4439545541536063, train_acc = 0.9973218444340941
test Acc 0.9753258845437617:
18th- epoch: 147, train_loss = 1.438608781201765, train_acc = 0.9973218444340941
test Acc 0.9753258845437617:
18th- epoch: 148, train_loss = 1.43427356146276, train_acc = 0.9973218444340941
test Acc 0.9753258845437617:
18th- epoch: 149, train_loss = 1.429594113258645, train_acc = 0.9973218444340941
test Acc 0.9753258845437617:
18th- epoch: 150, train_loss = 1.4250810083467513, train_acc = 0.9973218444340941
test Acc 0.9753258845437617:
18th- epoch: 151, train_loss = 1.4211916320491582, train_acc = 0.9973218444340941
test Acc 0.9753258845437617:
18th- epoch: 152, train_loss = 1.4159652888774872, train_acc = 0.9973218444340941
test Acc 0.9753258845437617:
18th- epoch: 153, train_loss = 1.412040740950033, train_acc = 0.9973218444340941
test Acc 0.9753258845437617:
18th- 

test Acc 0.9781191806331471:
18th- epoch: 293, train_loss = 1.0954696666449308, train_acc = 0.9976711690731253
test Acc 0.9781191806331471:
18th- epoch: 294, train_loss = 1.0944824293255806, train_acc = 0.9976711690731253
test Acc 0.9781191806331471:
18th- epoch: 295, train_loss = 1.0930639834841713, train_acc = 0.9976711690731253
test Acc 0.9781191806331471:
18th- epoch: 296, train_loss = 1.0919290067395195, train_acc = 0.9976711690731253
test Acc 0.9781191806331471:
18th- epoch: 297, train_loss = 1.0910976914456114, train_acc = 0.9976711690731253
test Acc 0.9781191806331471:
18th- epoch: 298, train_loss = 1.0896669210633263, train_acc = 0.9976711690731253
test Acc 0.9781191806331471:
18th- epoch: 299, train_loss = 1.0887082094559446, train_acc = 0.9976711690731253
test Acc 0.9781191806331471:
18th- epoch: 300, train_loss = 1.0871905690291896, train_acc = 0.9976711690731253
test Acc 0.9781191806331471:
18th- epoch: 301, train_loss = 1.0863637682050467, train_acc = 0.9976711690731253
t

18th- epoch: 441, train_loss = 0.9748515256796964, train_acc = 0.9977876106194691
test Acc 0.979050279329609:
18th- epoch: 442, train_loss = 0.9748686458915472, train_acc = 0.9977876106194691
test Acc 0.979050279329609:
18th- epoch: 443, train_loss = 0.9741341726039536, train_acc = 0.9977876106194691
test Acc 0.979050279329609:
18th- epoch: 444, train_loss = 0.9734705084119923, train_acc = 0.9977876106194691
test Acc 0.979050279329609:
18th- epoch: 445, train_loss = 0.9728185199201107, train_acc = 0.9977876106194691
test Acc 0.979050279329609:
18th- epoch: 446, train_loss = 0.9724850964848883, train_acc = 0.9977876106194691
test Acc 0.979050279329609:
18th- epoch: 447, train_loss = 0.9720311351120472, train_acc = 0.9977876106194691
test Acc 0.979050279329609:
18th- epoch: 448, train_loss = 0.9717135752434842, train_acc = 0.9977876106194691
test Acc 0.979050279329609:
18th- epoch: 449, train_loss = 0.9706979356706142, train_acc = 0.9977876106194691
test Acc 0.979050279329609:
18th- epoc

 60%|██████████████████████████████████████████                            | 18/30 [2:59:37<1:59:59, 599.96s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
19th- epoch: 0, train_loss = 154.41929411888123, train_acc = 0.7421984163949698
test Acc 0.8594040968342644:
19th- epoch: 1, train_loss = 54.103476859629154, train_acc = 0.887750349324639
test Acc 0.9064245810055865:
19th- epoch: 2, train_loss = 38.298537861555815, train_acc = 0.9217512808570097
test Acc 0.9194599627560521:
19th- epoch: 3, train_loss = 30.390397552400827, train_acc = 0.9388681881695389
test Acc 0.9245810055865922:
19th- epoch: 4, train_loss = 25.392121233046055, train_acc = 0.9487657196087564
test Acc 0.9320297951582868:
19th- epoch: 5, train_loss = 21.855698246508837, train_acc = 0.95505356311

19th- epoch: 145, train_loss = 1.4249654370360076, train_acc = 0.9977876106194691
test Acc 0.9757914338919925:
19th- epoch: 146, train_loss = 1.41999226633925, train_acc = 0.9977876106194691
test Acc 0.9757914338919925:
19th- epoch: 147, train_loss = 1.4150900482200086, train_acc = 0.9977876106194691
test Acc 0.9753258845437617:
19th- epoch: 148, train_loss = 1.4105034969979897, train_acc = 0.9977876106194691
test Acc 0.9757914338919925:
19th- epoch: 149, train_loss = 1.4057483794167638, train_acc = 0.9977876106194691
test Acc 0.9753258845437617:
19th- epoch: 150, train_loss = 1.401657447568141, train_acc = 0.9977876106194691
test Acc 0.9753258845437617:
19th- epoch: 151, train_loss = 1.39759448741097, train_acc = 0.9977876106194691
test Acc 0.9753258845437617:
19th- epoch: 152, train_loss = 1.3930360312806442, train_acc = 0.9977876106194691
test Acc 0.9753258845437617:
19th- epoch: 153, train_loss = 1.3886806648224592, train_acc = 0.9977876106194691
test Acc 0.9753258845437617:
19th- 

test Acc 0.9762569832402235:
19th- epoch: 293, train_loss = 1.0820538314874284, train_acc = 0.9980204937121565
test Acc 0.9762569832402235:
19th- epoch: 294, train_loss = 1.0808279781485908, train_acc = 0.9980204937121565
test Acc 0.9762569832402235:
19th- epoch: 295, train_loss = 1.0800423715263605, train_acc = 0.9980204937121565
test Acc 0.9762569832402235:
19th- epoch: 296, train_loss = 1.078603449568618, train_acc = 0.9980204937121565
test Acc 0.9762569832402235:
19th- epoch: 297, train_loss = 1.0774760681088082, train_acc = 0.9980204937121565
test Acc 0.9762569832402235:
19th- epoch: 298, train_loss = 1.0770071651786566, train_acc = 0.9980204937121565
test Acc 0.9762569832402235:
19th- epoch: 299, train_loss = 1.0753041474963538, train_acc = 0.9980204937121565
test Acc 0.9762569832402235:
19th- epoch: 300, train_loss = 1.0742385045741685, train_acc = 0.9980204937121565
test Acc 0.9762569832402235:
19th- epoch: 301, train_loss = 1.0730606454308145, train_acc = 0.9980204937121565
te

test Acc 0.9776536312849162:
19th- epoch: 440, train_loss = 0.9629550824465696, train_acc = 0.9982533768048439
test Acc 0.9776536312849162:
19th- epoch: 441, train_loss = 0.9621215499937534, train_acc = 0.9982533768048439
test Acc 0.9776536312849162:
19th- epoch: 442, train_loss = 0.9620629772543907, train_acc = 0.9982533768048439
test Acc 0.9776536312849162:
19th- epoch: 443, train_loss = 0.9613397419452667, train_acc = 0.9982533768048439
test Acc 0.9776536312849162:
19th- epoch: 444, train_loss = 0.9603311158716679, train_acc = 0.9982533768048439
test Acc 0.9776536312849162:
19th- epoch: 445, train_loss = 0.9601052142679691, train_acc = 0.9982533768048439
test Acc 0.9776536312849162:
19th- epoch: 446, train_loss = 0.9596799705177546, train_acc = 0.9982533768048439
test Acc 0.9776536312849162:
19th- epoch: 447, train_loss = 0.9591852370649576, train_acc = 0.9982533768048439
test Acc 0.9776536312849162:
19th- epoch: 448, train_loss = 0.9584433330746833, train_acc = 0.9982533768048439
t

 63%|████████████████████████████████████████████▎                         | 19/30 [3:09:37<1:49:59, 599.92s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
20th- epoch: 0, train_loss = 139.0960905700922, train_acc = 0.7444108057755007
test Acc 0.8594040968342644:
20th- epoch: 1, train_loss = 50.42718705534935, train_acc = 0.8940381928272008
test Acc 0.9068901303538175:
20th- epoch: 2, train_loss = 36.04918462783098, train_acc = 0.9251280857009782
test Acc 0.9245810055865922:
20th- epoch: 3, train_loss = 28.755334101617336, train_acc = 0.9411970190964136
test Acc 0.9343575418994413:
20th- epoch: 4, train_loss = 24.141942873597145, train_acc = 0.9513274336283186
test Acc 0.9390130353817505:
20th- epoch: 5, train_loss = 20.82873029075563, train_acc = 0.95691662785281

20th- epoch: 145, train_loss = 1.3690402073552832, train_acc = 0.9974382859804378
test Acc 0.9720670391061452:
20th- epoch: 146, train_loss = 1.364698844612576, train_acc = 0.9974382859804378
test Acc 0.9720670391061452:
20th- epoch: 147, train_loss = 1.3607186103472486, train_acc = 0.9975547275267815
test Acc 0.9720670391061452:
20th- epoch: 148, train_loss = 1.357049866230227, train_acc = 0.9975547275267815
test Acc 0.9720670391061452:
20th- epoch: 149, train_loss = 1.3531254641711712, train_acc = 0.9976711690731253
test Acc 0.9720670391061452:
20th- epoch: 150, train_loss = 1.3495085363974795, train_acc = 0.9976711690731253
test Acc 0.9720670391061452:
20th- epoch: 151, train_loss = 1.345418356359005, train_acc = 0.9976711690731253
test Acc 0.9720670391061452:
20th- epoch: 152, train_loss = 1.3418825169210322, train_acc = 0.9976711690731253
test Acc 0.9720670391061452:
20th- epoch: 153, train_loss = 1.3380998484790325, train_acc = 0.9976711690731253
test Acc 0.9720670391061452:
20th

test Acc 0.9739292364990689:
20th- epoch: 293, train_loss = 1.0680933395924512, train_acc = 0.9976711690731253
test Acc 0.9739292364990689:
20th- epoch: 294, train_loss = 1.0672130485472735, train_acc = 0.9976711690731253
test Acc 0.9739292364990689:
20th- epoch: 295, train_loss = 1.0662863080797251, train_acc = 0.9976711690731253
test Acc 0.9739292364990689:
20th- epoch: 296, train_loss = 1.064713679254055, train_acc = 0.9976711690731253
test Acc 0.9739292364990689:
20th- epoch: 297, train_loss = 1.0643441130814608, train_acc = 0.9976711690731253
test Acc 0.9739292364990689:
20th- epoch: 298, train_loss = 1.062871627509594, train_acc = 0.9977876106194691
test Acc 0.9739292364990689:
20th- epoch: 299, train_loss = 1.0620792657136917, train_acc = 0.9976711690731253
test Acc 0.9739292364990689:
20th- epoch: 300, train_loss = 1.0610614717006683, train_acc = 0.9977876106194691
test Acc 0.9739292364990689:
20th- epoch: 301, train_loss = 1.0601429268717766, train_acc = 0.9976711690731253
tes

20th- epoch: 440, train_loss = 0.9621901834907476, train_acc = 0.9977876106194691
test Acc 0.9757914338919925:
20th- epoch: 441, train_loss = 0.9617266965506133, train_acc = 0.9977876106194691
test Acc 0.9757914338919925:
20th- epoch: 442, train_loss = 0.9612552151083946, train_acc = 0.9977876106194691
test Acc 0.9757914338919925:
20th- epoch: 443, train_loss = 0.960816470294958, train_acc = 0.9977876106194691
test Acc 0.9757914338919925:
20th- epoch: 444, train_loss = 0.9602003221807536, train_acc = 0.9977876106194691
test Acc 0.9757914338919925:
20th- epoch: 445, train_loss = 0.9597580010595266, train_acc = 0.9977876106194691
test Acc 0.9757914338919925:
20th- epoch: 446, train_loss = 0.9594306821527425, train_acc = 0.9977876106194691
test Acc 0.9757914338919925:
20th- epoch: 447, train_loss = 0.9586804360151291, train_acc = 0.9977876106194691
test Acc 0.9757914338919925:
20th- epoch: 448, train_loss = 0.9580078708531801, train_acc = 0.9977876106194691
test Acc 0.9757914338919925:
20

 67%|██████████████████████████████████████████████▋                       | 20/30 [3:19:39<1:40:06, 600.66s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
21th- epoch: 0, train_loss = 151.2073800712824, train_acc = 0.746040987424313
test Acc 0.8491620111731844:
21th- epoch: 1, train_loss = 52.821558855473995, train_acc = 0.8922915696320447
test Acc 0.8915270018621974:
21th- epoch: 2, train_loss = 37.00347354263067, train_acc = 0.9219841639496973
test Acc 0.9143389199255121:
21th- epoch: 3, train_loss = 28.931000776588917, train_acc = 0.9397997205402888
test Acc 0.9269087523277467:
21th- epoch: 4, train_loss = 23.892789099365473, train_acc = 0.9508616674429436
test Acc 0.9376163873370578:
21th- epoch: 5, train_loss = 20.404083512723446, train_acc = 0.9599441080577

21th- epoch: 145, train_loss = 1.414896097034216, train_acc = 0.9974382859804378
test Acc 0.9739292364990689:
21th- epoch: 146, train_loss = 1.4106894793221727, train_acc = 0.9974382859804378
test Acc 0.9743947858472998:
21th- epoch: 147, train_loss = 1.4066680260002613, train_acc = 0.9974382859804378
test Acc 0.9743947858472998:
21th- epoch: 148, train_loss = 1.4025000283727422, train_acc = 0.9974382859804378
test Acc 0.9743947858472998:
21th- epoch: 149, train_loss = 1.398763862787746, train_acc = 0.9974382859804378
test Acc 0.9743947858472998:
21th- epoch: 150, train_loss = 1.394769104779698, train_acc = 0.9974382859804378
test Acc 0.9743947858472998:
21th- epoch: 151, train_loss = 1.390905705629848, train_acc = 0.9974382859804378
test Acc 0.9743947858472998:
21th- epoch: 152, train_loss = 1.3872278617927805, train_acc = 0.9974382859804378
test Acc 0.9743947858472998:
21th- epoch: 153, train_loss = 1.3834039295325056, train_acc = 0.9974382859804378
test Acc 0.9743947858472998:
21th-

21th- epoch: 292, train_loss = 1.101468951732386, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
21th- epoch: 293, train_loss = 1.1001742866938002, train_acc = 0.9977876106194691
test Acc 0.9776536312849162:
21th- epoch: 294, train_loss = 1.0994886097614653, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
21th- epoch: 295, train_loss = 1.0980615317821503, train_acc = 0.9977876106194691
test Acc 0.9776536312849162:
21th- epoch: 296, train_loss = 1.0970965710585006, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
21th- epoch: 297, train_loss = 1.0961088587646373, train_acc = 0.9977876106194691
test Acc 0.9776536312849162:
21th- epoch: 298, train_loss = 1.0951191646163352, train_acc = 0.9977876106194691
test Acc 0.9776536312849162:
21th- epoch: 299, train_loss = 1.0936464977567084, train_acc = 0.9977876106194691
test Acc 0.9776536312849162:
21th- epoch: 300, train_loss = 1.0929687495226972, train_acc = 0.9977876106194691
test Acc 0.9776536312849162:
21

test Acc 0.978584729981378:
21th- epoch: 440, train_loss = 0.9878347578051034, train_acc = 0.9977876106194691
test Acc 0.978584729981378:
21th- epoch: 441, train_loss = 0.9875482705829199, train_acc = 0.9977876106194691
test Acc 0.978584729981378:
21th- epoch: 442, train_loss = 0.9867951845226344, train_acc = 0.9977876106194691
test Acc 0.978584729981378:
21th- epoch: 443, train_loss = 0.9862753910419997, train_acc = 0.9977876106194691
test Acc 0.978584729981378:
21th- epoch: 444, train_loss = 0.9856714618799742, train_acc = 0.9977876106194691
test Acc 0.978584729981378:
21th- epoch: 445, train_loss = 0.9852723181247711, train_acc = 0.9977876106194691
test Acc 0.978584729981378:
21th- epoch: 446, train_loss = 0.9848325637576636, train_acc = 0.9977876106194691
test Acc 0.978584729981378:
21th- epoch: 447, train_loss = 0.9841130264103413, train_acc = 0.9977876106194691
test Acc 0.978584729981378:
21th- epoch: 448, train_loss = 0.9834767232241575, train_acc = 0.9977876106194691
test Acc 0

 70%|█████████████████████████████████████████████████                     | 21/30 [3:29:41<1:30:07, 600.82s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
22th- epoch: 0, train_loss = 150.62694111466408, train_acc = 0.7406846762925011
test Acc 0.8524208566108007:
22th- epoch: 1, train_loss = 52.46190697699785, train_acc = 0.8891476478807638
test Acc 0.9008379888268156:
22th- epoch: 2, train_loss = 37.91224742680788, train_acc = 0.9211690731252911
test Acc 0.9185288640595903:
22th- epoch: 3, train_loss = 30.38081346079707, train_acc = 0.9382859804378202
test Acc 0.930633147113594:
22th- epoch: 4, train_loss = 25.520402040332556, train_acc = 0.9474848625989754
test Acc 0.9338919925512105:
22th- epoch: 5, train_loss = 22.053122183308005, train_acc = 0.95423847228691

22th- epoch: 145, train_loss = 1.5245683888206258, train_acc = 0.9972054028877504
test Acc 0.972998137802607:
22th- epoch: 146, train_loss = 1.5194985704729334, train_acc = 0.9972054028877504
test Acc 0.972998137802607:
22th- epoch: 147, train_loss = 1.513648796826601, train_acc = 0.9972054028877504
test Acc 0.972998137802607:
22th- epoch: 148, train_loss = 1.5088731398573145, train_acc = 0.9972054028877504
test Acc 0.972998137802607:
22th- epoch: 149, train_loss = 1.5036072445800528, train_acc = 0.9972054028877504
test Acc 0.972998137802607:
22th- epoch: 150, train_loss = 1.4990628212690353, train_acc = 0.9972054028877504
test Acc 0.972998137802607:
22th- epoch: 151, train_loss = 1.493479692726396, train_acc = 0.9972054028877504
test Acc 0.972998137802607:
22th- epoch: 152, train_loss = 1.4886840233812109, train_acc = 0.9972054028877504
test Acc 0.972998137802607:
22th- epoch: 153, train_loss = 1.4842254346003756, train_acc = 0.9972054028877504
test Acc 0.972998137802607:
22th- epoch:

test Acc 0.9767225325884544:
22th- epoch: 293, train_loss = 1.1322847467963584, train_acc = 0.9975547275267815
test Acc 0.9767225325884544:
22th- epoch: 294, train_loss = 1.1309599938686006, train_acc = 0.9975547275267815
test Acc 0.9767225325884544:
22th- epoch: 295, train_loss = 1.1296901665627956, train_acc = 0.9975547275267815
test Acc 0.9767225325884544:
22th- epoch: 296, train_loss = 1.1285665680770762, train_acc = 0.9975547275267815
test Acc 0.9767225325884544:
22th- epoch: 297, train_loss = 1.1273659753496759, train_acc = 0.9975547275267815
test Acc 0.9767225325884544:
22th- epoch: 298, train_loss = 1.1258088573813438, train_acc = 0.9975547275267815
test Acc 0.9767225325884544:
22th- epoch: 299, train_loss = 1.12455677613616, train_acc = 0.9975547275267815
test Acc 0.9767225325884544:
22th- epoch: 300, train_loss = 1.1236757089500315, train_acc = 0.9975547275267815
test Acc 0.9767225325884544:
22th- epoch: 301, train_loss = 1.1222174664144404, train_acc = 0.9975547275267815
tes

test Acc 0.9776536312849162:
22th- epoch: 440, train_loss = 0.9965743906795979, train_acc = 0.9979040521658128
test Acc 0.9776536312849162:
22th- epoch: 441, train_loss = 0.9971306547522545, train_acc = 0.9979040521658128
test Acc 0.9776536312849162:
22th- epoch: 442, train_loss = 0.9962879208324011, train_acc = 0.9979040521658128
test Acc 0.9776536312849162:
22th- epoch: 443, train_loss = 0.9959526844322681, train_acc = 0.9979040521658128
test Acc 0.9776536312849162:
22th- epoch: 444, train_loss = 0.9949744492769241, train_acc = 0.9979040521658128
test Acc 0.9776536312849162:
22th- epoch: 445, train_loss = 0.9947947511973325, train_acc = 0.9979040521658128
test Acc 0.9776536312849162:
22th- epoch: 446, train_loss = 0.9942580051720142, train_acc = 0.9979040521658128
test Acc 0.9776536312849162:
22th- epoch: 447, train_loss = 0.9931066557765007, train_acc = 0.9979040521658128
test Acc 0.9776536312849162:
22th- epoch: 448, train_loss = 0.9925658864376601, train_acc = 0.9979040521658128
t

 73%|███████████████████████████████████████████████████▎                  | 22/30 [3:39:41<1:20:06, 600.77s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
23th- epoch: 0, train_loss = 130.92466051876545, train_acc = 0.7559385188635305
test Acc 0.8594040968342644:
23th- epoch: 1, train_loss = 52.00387782603502, train_acc = 0.8885654401490451
test Acc 0.9120111731843575:
23th- epoch: 2, train_loss = 36.46412738785148, train_acc = 0.922100605496041
test Acc 0.9301675977653632:
23th- epoch: 3, train_loss = 28.844684537500143, train_acc = 0.9406148113646949
test Acc 0.9385474860335196:
23th- epoch: 4, train_loss = 24.081856675446033, train_acc = 0.9517931998136935
test Acc 0.9455307262569832:
23th- epoch: 5, train_loss = 20.70738466270268, train_acc = 0.95831392640894

23th- epoch: 145, train_loss = 1.4107412049779668, train_acc = 0.9974382859804378
test Acc 0.9757914338919925:
23th- epoch: 146, train_loss = 1.4067776141455397, train_acc = 0.9974382859804378
test Acc 0.9757914338919925:
23th- epoch: 147, train_loss = 1.4022476188838482, train_acc = 0.9974382859804378
test Acc 0.9757914338919925:
23th- epoch: 148, train_loss = 1.3986002864548936, train_acc = 0.9974382859804378
test Acc 0.9757914338919925:
23th- epoch: 149, train_loss = 1.3942041397094727, train_acc = 0.9974382859804378
test Acc 0.9757914338919925:
23th- epoch: 150, train_loss = 1.3900413376977667, train_acc = 0.9974382859804378
test Acc 0.9757914338919925:
23th- epoch: 151, train_loss = 1.3864316990366206, train_acc = 0.9974382859804378
test Acc 0.9757914338919925:
23th- epoch: 152, train_loss = 1.3827213397016749, train_acc = 0.9974382859804378
test Acc 0.9757914338919925:
23th- epoch: 153, train_loss = 1.3787891753017902, train_acc = 0.9974382859804378
test Acc 0.9757914338919925:
2

test Acc 0.9767225325884544:
23th- epoch: 293, train_loss = 1.0933547367458232, train_acc = 0.9975547275267815
test Acc 0.9767225325884544:
23th- epoch: 294, train_loss = 1.0919759621028788, train_acc = 0.9975547275267815
test Acc 0.9767225325884544:
23th- epoch: 295, train_loss = 1.090857621282339, train_acc = 0.9975547275267815
test Acc 0.9767225325884544:
23th- epoch: 296, train_loss = 1.089747837453615, train_acc = 0.9975547275267815
test Acc 0.9767225325884544:
23th- epoch: 297, train_loss = 1.0888849559123628, train_acc = 0.9975547275267815
test Acc 0.9767225325884544:
23th- epoch: 298, train_loss = 1.0877879385952838, train_acc = 0.9975547275267815
test Acc 0.9767225325884544:
23th- epoch: 299, train_loss = 1.0867054015398026, train_acc = 0.9975547275267815
test Acc 0.9767225325884544:
23th- epoch: 300, train_loss = 1.0855670757591724, train_acc = 0.9975547275267815
test Acc 0.9767225325884544:
23th- epoch: 301, train_loss = 1.0844190890784375, train_acc = 0.9975547275267815
tes

23th- epoch: 440, train_loss = 0.9804797222313937, train_acc = 0.9976711690731253
test Acc 0.9776536312849162:
23th- epoch: 441, train_loss = 0.9799542290566023, train_acc = 0.9976711690731253
test Acc 0.9776536312849162:
23th- epoch: 442, train_loss = 0.9793183716537897, train_acc = 0.9976711690731253
test Acc 0.9776536312849162:
23th- epoch: 443, train_loss = 0.9786872963013593, train_acc = 0.9976711690731253
test Acc 0.9776536312849162:
23th- epoch: 444, train_loss = 0.9781234090623911, train_acc = 0.9976711690731253
test Acc 0.9776536312849162:
23th- epoch: 445, train_loss = 0.9777428793313447, train_acc = 0.9976711690731253
test Acc 0.9776536312849162:
23th- epoch: 446, train_loss = 0.9770359123649541, train_acc = 0.9976711690731253
test Acc 0.9776536312849162:
23th- epoch: 447, train_loss = 0.9766338008048479, train_acc = 0.9976711690731253
test Acc 0.9776536312849162:
23th- epoch: 448, train_loss = 0.9761228039860725, train_acc = 0.9976711690731253
test Acc 0.9776536312849162:
2

 77%|█████████████████████████████████████████████████████▋                | 23/30 [3:49:43<1:10:07, 601.07s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
24th- epoch: 0, train_loss = 160.1572159677744, train_acc = 0.7409175593851887
test Acc 0.8482309124767226:
24th- epoch: 1, train_loss = 52.09315092116594, train_acc = 0.8950861667442943
test Acc 0.8999068901303539:
24th- epoch: 2, train_loss = 37.083602357655764, train_acc = 0.9227992547741034
test Acc 0.9166666666666666:
24th- epoch: 3, train_loss = 29.413713928312063, train_acc = 0.9372380065207266
test Acc 0.9273743016759777:
24th- epoch: 4, train_loss = 24.54266452603042, train_acc = 0.9473684210526315
test Acc 0.9329608938547486:
24th- epoch: 5, train_loss = 21.10725255124271, train_acc = 0.95447135537959

24th- epoch: 145, train_loss = 1.4188661413500085, train_acc = 0.9973218444340941
test Acc 0.972998137802607:
24th- epoch: 146, train_loss = 1.4138009498128667, train_acc = 0.9972054028877504
test Acc 0.972998137802607:
24th- epoch: 147, train_loss = 1.4096063300967216, train_acc = 0.9973218444340941
test Acc 0.972998137802607:
24th- epoch: 148, train_loss = 1.4063040912151337, train_acc = 0.9973218444340941
test Acc 0.972998137802607:
24th- epoch: 149, train_loss = 1.4021635738899931, train_acc = 0.9973218444340941
test Acc 0.972998137802607:
24th- epoch: 150, train_loss = 1.3980302748968825, train_acc = 0.9973218444340941
test Acc 0.972998137802607:
24th- epoch: 151, train_loss = 1.3943688794970512, train_acc = 0.9973218444340941
test Acc 0.972998137802607:
24th- epoch: 152, train_loss = 1.3903510893578641, train_acc = 0.9973218444340941
test Acc 0.972998137802607:
24th- epoch: 153, train_loss = 1.3862728203530423, train_acc = 0.9973218444340941
test Acc 0.972998137802607:
24th- epoc

test Acc 0.9739292364990689:
24th- epoch: 293, train_loss = 1.1000720846059266, train_acc = 0.9975547275267815
test Acc 0.9739292364990689:
24th- epoch: 294, train_loss = 1.0980119183659554, train_acc = 0.9975547275267815
test Acc 0.9739292364990689:
24th- epoch: 295, train_loss = 1.097194084286457, train_acc = 0.9975547275267815
test Acc 0.9739292364990689:
24th- epoch: 296, train_loss = 1.0960659248230513, train_acc = 0.9975547275267815
test Acc 0.9739292364990689:
24th- epoch: 297, train_loss = 1.0951832669379655, train_acc = 0.9975547275267815
test Acc 0.9739292364990689:
24th- epoch: 298, train_loss = 1.094283423066372, train_acc = 0.9975547275267815
test Acc 0.9739292364990689:
24th- epoch: 299, train_loss = 1.0929009777901229, train_acc = 0.9975547275267815
test Acc 0.9739292364990689:
24th- epoch: 300, train_loss = 1.0916980504989624, train_acc = 0.9975547275267815
test Acc 0.9739292364990689:
24th- epoch: 301, train_loss = 1.0908000568451826, train_acc = 0.9975547275267815
tes

test Acc 0.9743947858472998:
24th- epoch: 440, train_loss = 0.9845476684422465, train_acc = 0.9976711690731253
test Acc 0.9748603351955307:
24th- epoch: 441, train_loss = 0.9847762510180473, train_acc = 0.9976711690731253
test Acc 0.9748603351955307:
24th- epoch: 442, train_loss = 0.9839429967105389, train_acc = 0.9976711690731253
test Acc 0.9748603351955307:
24th- epoch: 443, train_loss = 0.9837293488235446, train_acc = 0.9976711690731253
test Acc 0.9748603351955307:
24th- epoch: 444, train_loss = 0.9831015008239774, train_acc = 0.9976711690731253
test Acc 0.9748603351955307:
24th- epoch: 445, train_loss = 0.982260562479496, train_acc = 0.9976711690731253
test Acc 0.9748603351955307:
24th- epoch: 446, train_loss = 0.9821548871695995, train_acc = 0.9976711690731253
test Acc 0.9748603351955307:
24th- epoch: 447, train_loss = 0.9814676567912102, train_acc = 0.9976711690731253
test Acc 0.9748603351955307:
24th- epoch: 448, train_loss = 0.9809590006916551, train_acc = 0.9976711690731253
te

 80%|████████████████████████████████████████████████████████              | 24/30 [3:59:43<1:00:04, 600.68s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
25th- epoch: 0, train_loss = 141.9878898859024, train_acc = 0.7441779226828132
test Acc 0.8547486033519553:
25th- epoch: 1, train_loss = 49.54516392946243, train_acc = 0.8991616208663251
test Acc 0.9073556797020484:
25th- epoch: 2, train_loss = 34.69954644329846, train_acc = 0.9276897997205403
test Acc 0.925512104283054:
25th- epoch: 3, train_loss = 27.48380015604198, train_acc = 0.9443409408476945
test Acc 0.9329608938547486:
25th- epoch: 4, train_loss = 22.972137494012713, train_acc = 0.9544713553795995
test Acc 0.9371508379888268:
25th- epoch: 5, train_loss = 19.86863180808723, train_acc = 0.9613414066138798

25th- epoch: 145, train_loss = 1.4551874758908525, train_acc = 0.9970889613414066
test Acc 0.9781191806331471:
25th- epoch: 146, train_loss = 1.4505336011061445, train_acc = 0.9970889613414066
test Acc 0.9781191806331471:
25th- epoch: 147, train_loss = 1.4462691707303748, train_acc = 0.9969725197950629
test Acc 0.9781191806331471:
25th- epoch: 148, train_loss = 1.4419331885874271, train_acc = 0.9970889613414066
test Acc 0.9781191806331471:
25th- epoch: 149, train_loss = 1.4372128831455484, train_acc = 0.9970889613414066
test Acc 0.9781191806331471:
25th- epoch: 150, train_loss = 1.4333633681526408, train_acc = 0.9970889613414066
test Acc 0.9781191806331471:
25th- epoch: 151, train_loss = 1.4292178563773632, train_acc = 0.9970889613414066
test Acc 0.9781191806331471:
25th- epoch: 152, train_loss = 1.4252022728323936, train_acc = 0.9970889613414066
test Acc 0.9781191806331471:
25th- epoch: 153, train_loss = 1.4211666671326384, train_acc = 0.9970889613414066
test Acc 0.9781191806331471:
2

25th- epoch: 293, train_loss = 1.1225304491817951, train_acc = 0.9974382859804378
test Acc 0.9795158286778398:
25th- epoch: 294, train_loss = 1.120969581126701, train_acc = 0.9974382859804378
test Acc 0.9795158286778398:
25th- epoch: 295, train_loss = 1.1202059797942638, train_acc = 0.9974382859804378
test Acc 0.9795158286778398:
25th- epoch: 296, train_loss = 1.1191479675471783, train_acc = 0.9974382859804378
test Acc 0.9795158286778398:
25th- epoch: 297, train_loss = 1.1178525015711784, train_acc = 0.9974382859804378
test Acc 0.9795158286778398:
25th- epoch: 298, train_loss = 1.1165724036400206, train_acc = 0.9974382859804378
test Acc 0.9795158286778398:
25th- epoch: 299, train_loss = 1.1153358754818328, train_acc = 0.9974382859804378
test Acc 0.9799813780260708:
25th- epoch: 300, train_loss = 1.1141334722633474, train_acc = 0.9974382859804378
test Acc 0.9795158286778398:
25th- epoch: 301, train_loss = 1.1133006140589714, train_acc = 0.9974382859804378
test Acc 0.9799813780260708:
25

25th- epoch: 440, train_loss = 0.9991913537087385, train_acc = 0.9977876106194691
test Acc 0.9809124767225326:
25th- epoch: 441, train_loss = 0.9984465017914772, train_acc = 0.9977876106194691
test Acc 0.9809124767225326:
25th- epoch: 442, train_loss = 0.9975329289736692, train_acc = 0.9977876106194691
test Acc 0.9809124767225326:
25th- epoch: 443, train_loss = 0.9973500383493956, train_acc = 0.9977876106194691
test Acc 0.9809124767225326:
25th- epoch: 444, train_loss = 0.9972385428845882, train_acc = 0.9977876106194691
test Acc 0.9809124767225326:
25th- epoch: 445, train_loss = 0.9960107555089053, train_acc = 0.9977876106194691
test Acc 0.9809124767225326:
25th- epoch: 446, train_loss = 0.9954282070102636, train_acc = 0.9977876106194691
test Acc 0.9809124767225326:
25th- epoch: 447, train_loss = 0.9951831301150378, train_acc = 0.9977876106194691
test Acc 0.9809124767225326:
25th- epoch: 448, train_loss = 0.9942487055959646, train_acc = 0.9977876106194691
test Acc 0.9809124767225326:
2

 83%|████████████████████████████████████████████████████████████            | 25/30 [4:09:43<50:01, 600.40s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
26th- epoch: 0, train_loss = 138.4163089543581, train_acc = 0.7509315323707498
test Acc 0.8421787709497207:
26th- epoch: 1, train_loss = 51.692580722272396, train_acc = 0.8910107126222636
test Acc 0.9013035381750466:
26th- epoch: 2, train_loss = 36.779625091701746, train_acc = 0.922100605496041
test Acc 0.9222532588454376:
26th- epoch: 3, train_loss = 29.004756432026625, train_acc = 0.9386353050768514
test Acc 0.9301675977653632:
26th- epoch: 4, train_loss = 24.08485385030508, train_acc = 0.9494643688868188
test Acc 0.936219739292365:
26th- epoch: 5, train_loss = 20.68077564239502, train_acc = 0.958313926408942

26th- epoch: 145, train_loss = 1.4441966377198696, train_acc = 0.9973218444340941
test Acc 0.9757914338919925:
26th- epoch: 146, train_loss = 1.44079662731383, train_acc = 0.9973218444340941
test Acc 0.9757914338919925:
26th- epoch: 147, train_loss = 1.4358698800206184, train_acc = 0.9973218444340941
test Acc 0.9757914338919925:
26th- epoch: 148, train_loss = 1.4314529933035374, train_acc = 0.9973218444340941
test Acc 0.9757914338919925:
26th- epoch: 149, train_loss = 1.4275353215634823, train_acc = 0.9973218444340941
test Acc 0.9757914338919925:
26th- epoch: 150, train_loss = 1.42246188595891, train_acc = 0.9973218444340941
test Acc 0.9757914338919925:
26th- epoch: 151, train_loss = 1.418952283798717, train_acc = 0.9973218444340941
test Acc 0.9757914338919925:
26th- epoch: 152, train_loss = 1.4135207161307335, train_acc = 0.9973218444340941
test Acc 0.9757914338919925:
26th- epoch: 153, train_loss = 1.410341185866855, train_acc = 0.9973218444340941
test Acc 0.9757914338919925:
26th- e

26th- epoch: 293, train_loss = 1.0998593631084077, train_acc = 0.9976711690731253
test Acc 0.979050279329609:
26th- epoch: 294, train_loss = 1.099124291271437, train_acc = 0.9976711690731253
test Acc 0.979050279329609:
26th- epoch: 295, train_loss = 1.0973355050082318, train_acc = 0.9976711690731253
test Acc 0.979050279329609:
26th- epoch: 296, train_loss = 1.0964521678979509, train_acc = 0.9976711690731253
test Acc 0.979050279329609:
26th- epoch: 297, train_loss = 1.0955682669882663, train_acc = 0.9976711690731253
test Acc 0.979050279329609:
26th- epoch: 298, train_loss = 1.0944557711482048, train_acc = 0.9976711690731253
test Acc 0.979050279329609:
26th- epoch: 299, train_loss = 1.0931497253477573, train_acc = 0.9976711690731253
test Acc 0.979050279329609:
26th- epoch: 300, train_loss = 1.0916846108739264, train_acc = 0.9976711690731253
test Acc 0.979050279329609:
26th- epoch: 301, train_loss = 1.0905886441469193, train_acc = 0.9976711690731253
test Acc 0.979050279329609:
26th- epoch

26th- epoch: 441, train_loss = 0.9776960512099322, train_acc = 0.9977876106194691
test Acc 0.979050279329609:
26th- epoch: 442, train_loss = 0.9768615017237607, train_acc = 0.9977876106194691
test Acc 0.979050279329609:
26th- epoch: 443, train_loss = 0.9763317021133844, train_acc = 0.9977876106194691
test Acc 0.979050279329609:
26th- epoch: 444, train_loss = 0.9761243276298046, train_acc = 0.9977876106194691
test Acc 0.979050279329609:
26th- epoch: 445, train_loss = 0.9754908519389573, train_acc = 0.9977876106194691
test Acc 0.979050279329609:
26th- epoch: 446, train_loss = 0.9749528206884861, train_acc = 0.9977876106194691
test Acc 0.9795158286778398:
26th- epoch: 447, train_loss = 0.9741504217090551, train_acc = 0.9977876106194691
test Acc 0.979050279329609:
26th- epoch: 448, train_loss = 0.9733954133989755, train_acc = 0.9977876106194691
test Acc 0.979050279329609:
26th- epoch: 449, train_loss = 0.973843472689623, train_acc = 0.9977876106194691
test Acc 0.9795158286778398:
26th- epo

 87%|██████████████████████████████████████████████████████████████▍         | 26/30 [4:19:44<40:03, 600.79s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
27th- epoch: 0, train_loss = 127.63400320708752, train_acc = 0.7519795062878435
test Acc 0.8431098696461825:
27th- epoch: 1, train_loss = 49.06055061519146, train_acc = 0.8945039590125757
test Acc 0.9008379888268156:
27th- epoch: 2, train_loss = 34.75550312548876, train_acc = 0.9271075919888216
test Acc 0.9194599627560521:
27th- epoch: 3, train_loss = 27.78252149000764, train_acc = 0.9448067070330693
test Acc 0.9301675977653632:
27th- epoch: 4, train_loss = 23.45552946999669, train_acc = 0.9531904983698184
test Acc 0.9366852886405959:
27th- epoch: 5, train_loss = 20.412003841251135, train_acc = 0.96064275733581

27th- epoch: 146, train_loss = 1.4499823835212737, train_acc = 0.9976711690731253
test Acc 0.9757914338919925:
27th- epoch: 147, train_loss = 1.444950881646946, train_acc = 0.9976711690731253
test Acc 0.9757914338919925:
27th- epoch: 148, train_loss = 1.440449558198452, train_acc = 0.9976711690731253
test Acc 0.9757914338919925:
27th- epoch: 149, train_loss = 1.4355911177117378, train_acc = 0.9976711690731253
test Acc 0.9757914338919925:
27th- epoch: 150, train_loss = 1.4309095956850797, train_acc = 0.9976711690731253
test Acc 0.9762569832402235:
27th- epoch: 151, train_loss = 1.4263096663635224, train_acc = 0.9976711690731253
test Acc 0.9767225325884544:
27th- epoch: 152, train_loss = 1.4221625856589526, train_acc = 0.9976711690731253
test Acc 0.9767225325884544:
27th- epoch: 153, train_loss = 1.4179247438441962, train_acc = 0.9976711690731253
test Acc 0.9767225325884544:
27th- epoch: 154, train_loss = 1.4132576771080494, train_acc = 0.9976711690731253
test Acc 0.9767225325884544:
27t

test Acc 0.9771880819366853:
27th- epoch: 294, train_loss = 1.1019575546379201, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
27th- epoch: 295, train_loss = 1.1008231590385549, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
27th- epoch: 296, train_loss = 1.0992581670288928, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
27th- epoch: 297, train_loss = 1.0984510891139507, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
27th- epoch: 298, train_loss = 1.097268931567669, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
27th- epoch: 299, train_loss = 1.095982450991869, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
27th- epoch: 300, train_loss = 1.09526402130723, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
27th- epoch: 301, train_loss = 1.093748273968231, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
27th- epoch: 302, train_loss = 1.092998078733217, train_acc = 0.9977876106194691
test Ac

test Acc 0.9781191806331471:
27th- epoch: 368, train_loss = 1.0329158802633174, train_acc = 0.9979040521658128
test Acc 0.9781191806331471:
27th- epoch: 369, train_loss = 1.0316967529361136, train_acc = 0.9979040521658128
test Acc 0.9781191806331471:
27th- epoch: 370, train_loss = 1.031333768100012, train_acc = 0.9979040521658128
test Acc 0.9781191806331471:
27th- epoch: 371, train_loss = 1.0302147567272186, train_acc = 0.9979040521658128
test Acc 0.9781191806331471:
27th- epoch: 372, train_loss = 1.0296954587101936, train_acc = 0.9979040521658128
test Acc 0.9781191806331471:
27th- epoch: 373, train_loss = 1.0291566401720047, train_acc = 0.9979040521658128
test Acc 0.9781191806331471:
27th- epoch: 374, train_loss = 1.0277661966974847, train_acc = 0.9979040521658128
test Acc 0.9781191806331471:
27th- epoch: 375, train_loss = 1.027509284496773, train_acc = 0.9979040521658128
test Acc 0.9781191806331471:
27th- epoch: 376, train_loss = 1.0267633497714996, train_acc = 0.9979040521658128
tes

 90%|████████████████████████████████████████████████████████████████▊       | 27/30 [4:29:46<30:03, 601.00s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
28th- epoch: 0, train_loss = 139.79587899148464, train_acc = 0.7501164415463437
test Acc 0.851024208566108:
28th- epoch: 1, train_loss = 49.30814127624035, train_acc = 0.8985794131346064
test Acc 0.904096834264432:
28th- epoch: 2, train_loss = 35.19730290398002, train_acc = 0.9262925011644154
test Acc 0.9245810055865922:
28th- epoch: 3, train_loss = 28.117874965071678, train_acc = 0.9403819282720075
test Acc 0.9380819366852886:
28th- epoch: 4, train_loss = 23.63491563498974, train_acc = 0.9491150442477876
test Acc 0.9459962756052142:
28th- epoch: 5, train_loss = 20.447700323536992, train_acc = 0.957033069399161

test Acc 0.9776536312849162:
28th- epoch: 146, train_loss = 1.397525998414494, train_acc = 0.9974382859804378
test Acc 0.9776536312849162:
28th- epoch: 147, train_loss = 1.3928875109413639, train_acc = 0.9974382859804378
test Acc 0.9776536312849162:
28th- epoch: 148, train_loss = 1.388578256010078, train_acc = 0.9974382859804378
test Acc 0.9776536312849162:
28th- epoch: 149, train_loss = 1.3847234236309305, train_acc = 0.9974382859804378
test Acc 0.9776536312849162:
28th- epoch: 150, train_loss = 1.380238275974989, train_acc = 0.9974382859804378
test Acc 0.9776536312849162:
28th- epoch: 151, train_loss = 1.3766513312002644, train_acc = 0.9974382859804378
test Acc 0.9776536312849162:
28th- epoch: 152, train_loss = 1.372276110574603, train_acc = 0.9975547275267815
test Acc 0.9776536312849162:
28th- epoch: 153, train_loss = 1.3679332683095708, train_acc = 0.9975547275267815
test Acc 0.9776536312849162:
28th- epoch: 154, train_loss = 1.3640666293213144, train_acc = 0.9975547275267815
test 

28th- epoch: 293, train_loss = 1.0777189638465643, train_acc = 0.9976711690731253
test Acc 0.978584729981378:
28th- epoch: 294, train_loss = 1.0768040257389657, train_acc = 0.9976711690731253
test Acc 0.978584729981378:
28th- epoch: 295, train_loss = 1.0753281693905592, train_acc = 0.9976711690731253
test Acc 0.978584729981378:
28th- epoch: 296, train_loss = 1.0742623656988144, train_acc = 0.9976711690731253
test Acc 0.978584729981378:
28th- epoch: 297, train_loss = 1.0734476900543086, train_acc = 0.9976711690731253
test Acc 0.978584729981378:
28th- epoch: 298, train_loss = 1.072229536890518, train_acc = 0.9976711690731253
test Acc 0.978584729981378:
28th- epoch: 299, train_loss = 1.0715106036514044, train_acc = 0.9976711690731253
test Acc 0.978584729981378:
28th- epoch: 300, train_loss = 1.0704056930844672, train_acc = 0.9976711690731253
test Acc 0.978584729981378:
28th- epoch: 301, train_loss = 1.0693802281166427, train_acc = 0.9976711690731253
test Acc 0.978584729981378:
28th- epoch

28th- epoch: 441, train_loss = 0.9657401225122157, train_acc = 0.9979040521658128
test Acc 0.979050279329609:
28th- epoch: 442, train_loss = 0.9646005742251873, train_acc = 0.9979040521658128
test Acc 0.979050279329609:
28th- epoch: 443, train_loss = 0.9641133540717419, train_acc = 0.9979040521658128
test Acc 0.979050279329609:
28th- epoch: 444, train_loss = 0.9634688409569208, train_acc = 0.9979040521658128
test Acc 0.979050279329609:
28th- epoch: 445, train_loss = 0.9633409834059421, train_acc = 0.9979040521658128
test Acc 0.979050279329609:
28th- epoch: 446, train_loss = 0.9625078725221101, train_acc = 0.9979040521658128
test Acc 0.979050279329609:
28th- epoch: 447, train_loss = 0.9622702716442291, train_acc = 0.9979040521658128
test Acc 0.979050279329609:
28th- epoch: 448, train_loss = 0.9615666183235589, train_acc = 0.9979040521658128
test Acc 0.979050279329609:
28th- epoch: 449, train_loss = 0.9614044930785894, train_acc = 0.9979040521658128
test Acc 0.979050279329609:
28th- epoc

 93%|███████████████████████████████████████████████████████████████████▏    | 28/30 [4:38:36<19:19, 579.78s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
29th- epoch: 0, train_loss = 149.6169278025627, train_acc = 0.7310200279459711
test Acc 0.8659217877094972:
29th- epoch: 1, train_loss = 53.62474758177996, train_acc = 0.8886818816953889
test Acc 0.9115456238361266:
29th- epoch: 2, train_loss = 37.865694642066956, train_acc = 0.9243129948765719
test Acc 0.9269087523277467:
29th- epoch: 3, train_loss = 29.903529573231936, train_acc = 0.9392175128085701
test Acc 0.9320297951582868:
29th- epoch: 4, train_loss = 24.807492550462484, train_acc = 0.9492314857941313
test Acc 0.9366852886405959:
29th- epoch: 5, train_loss = 21.231363020837307, train_acc = 0.955985095482

29th- epoch: 145, train_loss = 1.4309655638644472, train_acc = 0.9975547275267815
test Acc 0.9739292364990689:
29th- epoch: 146, train_loss = 1.4260651431977749, train_acc = 0.9975547275267815
test Acc 0.9739292364990689:
29th- epoch: 147, train_loss = 1.4217095276108012, train_acc = 0.9975547275267815
test Acc 0.9739292364990689:
29th- epoch: 148, train_loss = 1.4176114773144946, train_acc = 0.9975547275267815
test Acc 0.9739292364990689:
29th- epoch: 149, train_loss = 1.4127171263098717, train_acc = 0.9975547275267815
test Acc 0.9739292364990689:
29th- epoch: 150, train_loss = 1.4089895226061344, train_acc = 0.9975547275267815
test Acc 0.9739292364990689:
29th- epoch: 151, train_loss = 1.4042449332773685, train_acc = 0.9975547275267815
test Acc 0.9739292364990689:
29th- epoch: 152, train_loss = 1.4010741909733042, train_acc = 0.9975547275267815
test Acc 0.9739292364990689:
29th- epoch: 153, train_loss = 1.3961929505458102, train_acc = 0.9975547275267815
test Acc 0.9739292364990689:
2

test Acc 0.9757914338919925:
29th- epoch: 293, train_loss = 1.0964647941291332, train_acc = 0.9976711690731253
test Acc 0.9757914338919925:
29th- epoch: 294, train_loss = 1.0949915833771229, train_acc = 0.9976711690731253
test Acc 0.9757914338919925:
29th- epoch: 295, train_loss = 1.0940611970727332, train_acc = 0.9976711690731253
test Acc 0.9757914338919925:
29th- epoch: 296, train_loss = 1.0927251254324801, train_acc = 0.9976711690731253
test Acc 0.9757914338919925:
29th- epoch: 297, train_loss = 1.0918204064364545, train_acc = 0.9976711690731253
test Acc 0.9757914338919925:
29th- epoch: 298, train_loss = 1.0904386204783805, train_acc = 0.9976711690731253
test Acc 0.9757914338919925:
29th- epoch: 299, train_loss = 1.0891955618862994, train_acc = 0.9976711690731253
test Acc 0.9757914338919925:
29th- epoch: 300, train_loss = 1.0887512427871116, train_acc = 0.9976711690731253
test Acc 0.9762569832402235:
29th- epoch: 301, train_loss = 1.0871735562686808, train_acc = 0.9976711690731253
t

test Acc 0.9776536312849162:
29th- epoch: 440, train_loss = 0.980447302252287, train_acc = 0.9979040521658128
test Acc 0.9776536312849162:
29th- epoch: 441, train_loss = 0.9796858665940817, train_acc = 0.9979040521658128
test Acc 0.9776536312849162:
29th- epoch: 442, train_loss = 0.9796094285848085, train_acc = 0.9979040521658128
test Acc 0.9776536312849162:
29th- epoch: 443, train_loss = 0.978645416587824, train_acc = 0.9979040521658128
test Acc 0.9776536312849162:
29th- epoch: 444, train_loss = 0.9781287871301174, train_acc = 0.9979040521658128
test Acc 0.9776536312849162:
29th- epoch: 445, train_loss = 0.9776122123003006, train_acc = 0.9979040521658128
test Acc 0.9776536312849162:
29th- epoch: 446, train_loss = 0.9769382079539355, train_acc = 0.9979040521658128
test Acc 0.9776536312849162:
29th- epoch: 447, train_loss = 0.9765566711721476, train_acc = 0.9979040521658128
test Acc 0.9776536312849162:
29th- epoch: 448, train_loss = 0.976061542838579, train_acc = 0.9979040521658128
test

 97%|█████████████████████████████████████████████████████████████████████▌  | 29/30 [4:47:11<09:20, 560.39s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
30th- epoch: 0, train_loss = 147.08830343186855, train_acc = 0.7186772240335352
test Acc 0.8314711359404097:
30th- epoch: 1, train_loss = 53.687663190066814, train_acc = 0.8821611551001397
test Acc 0.8910614525139665:
30th- epoch: 2, train_loss = 37.45364032685757, train_acc = 0.9175593851886353
test Acc 0.9078212290502793:
30th- epoch: 3, train_loss = 29.51941943541169, train_acc = 0.935724266418258
test Acc 0.9180633147113594:
30th- epoch: 4, train_loss = 24.622521802783012, train_acc = 0.9495808104331626
test Acc 0.9236499068901304:
30th- epoch: 5, train_loss = 21.18886574730277, train_acc = 0.95726595249184

30th- epoch: 145, train_loss = 1.4488460744032636, train_acc = 0.9975547275267815
test Acc 0.9688081936685289:
30th- epoch: 146, train_loss = 1.4433293665060773, train_acc = 0.9975547275267815
test Acc 0.9688081936685289:
30th- epoch: 147, train_loss = 1.43972811603453, train_acc = 0.9975547275267815
test Acc 0.9688081936685289:
30th- epoch: 148, train_loss = 1.4341695780167356, train_acc = 0.9975547275267815
test Acc 0.9688081936685289:
30th- epoch: 149, train_loss = 1.4306511817267165, train_acc = 0.9975547275267815
test Acc 0.9688081936685289:
30th- epoch: 150, train_loss = 1.4249473871896043, train_acc = 0.9975547275267815
test Acc 0.9688081936685289:
30th- epoch: 151, train_loss = 1.4215142155298963, train_acc = 0.9975547275267815
test Acc 0.9692737430167597:
30th- epoch: 152, train_loss = 1.4169955365359783, train_acc = 0.9975547275267815
test Acc 0.9692737430167597:
30th- epoch: 153, train_loss = 1.413151760934852, train_acc = 0.9975547275267815
test Acc 0.9692737430167597:
30th

test Acc 0.9739292364990689:
30th- epoch: 293, train_loss = 1.0954562040860765, train_acc = 0.9976711690731253
test Acc 0.973463687150838:
30th- epoch: 294, train_loss = 1.0941663831472397, train_acc = 0.9976711690731253
test Acc 0.9739292364990689:
30th- epoch: 295, train_loss = 1.0932078796322457, train_acc = 0.9976711690731253
test Acc 0.973463687150838:
30th- epoch: 296, train_loss = 1.0917700144345872, train_acc = 0.9976711690731253
test Acc 0.9739292364990689:
30th- epoch: 297, train_loss = 1.0906028126482852, train_acc = 0.9976711690731253
test Acc 0.973463687150838:
30th- epoch: 298, train_loss = 1.0898746575112455, train_acc = 0.9976711690731253
test Acc 0.9739292364990689:
30th- epoch: 299, train_loss = 1.0883434377610683, train_acc = 0.9976711690731253
test Acc 0.973463687150838:
30th- epoch: 300, train_loss = 1.087391899258364, train_acc = 0.9976711690731253
test Acc 0.9739292364990689:
30th- epoch: 301, train_loss = 1.0860384342377074, train_acc = 0.9976711690731253
test A

30th- epoch: 440, train_loss = 0.9746304353175219, train_acc = 0.9980204937121565
test Acc 0.9743947858472998:
30th- epoch: 441, train_loss = 0.9742308109998703, train_acc = 0.9980204937121565
test Acc 0.9743947858472998:
30th- epoch: 442, train_loss = 0.9734907945094164, train_acc = 0.9980204937121565
test Acc 0.9743947858472998:
30th- epoch: 443, train_loss = 0.9730826119484846, train_acc = 0.9980204937121565
test Acc 0.9743947858472998:
30th- epoch: 444, train_loss = 0.9725885403749999, train_acc = 0.9980204937121565
test Acc 0.9743947858472998:
30th- epoch: 445, train_loss = 0.9718371480703354, train_acc = 0.9980204937121565
test Acc 0.9743947858472998:
30th- epoch: 446, train_loss = 0.9716024920344353, train_acc = 0.9980204937121565
test Acc 0.9743947858472998:
30th- epoch: 447, train_loss = 0.9706860283913556, train_acc = 0.9980204937121565
test Acc 0.9743947858472998:
30th- epoch: 448, train_loss = 0.97054217880941, train_acc = 0.9980204937121565
test Acc 0.9743947858472998:
30t

100%|████████████████████████████████████████████████████████████████████████| 30/30 [4:55:46<00:00, 546.65s/it]


Wall time: 4h 55min 48s
