In [1]:
import os
from collections import Counter

import numpy as np
import pandas as pd
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim
import torch.utils.data as data
from tqdm import tqdm

import utility.Data_loader as D
from utility.Custom import CustomDataset
from utility.Model import Mcslt

In [2]:
%%time
def _train_one_epoch(net, loader, criterion, optimizer, device):
    """Run one optimisation pass over ``loader``.

    Parameters
    ----------
    net : the model being trained (put into train mode here).
    loader : iterable yielding ``(inputs, labels)`` batches.
    criterion : loss callable applied to ``(outputs, labels)``.
    optimizer : optimiser stepping ``net``'s parameters.
    device : torch device the batches are moved to.

    Returns
    -------
    (running_loss, correct) : the sum of the per-batch loss values and the
        number of samples whose arg-max prediction equals the label.
    """
    net.train()
    running_loss = 0
    correct = 0

    for inputs, labels in loader:
        inputs = inputs.type(torch.FloatTensor).to(device)
        labels = labels.type(torch.LongTensor).to(device)

        outputs = net(inputs)
        loss = criterion(outputs, labels)

        optimizer.zero_grad()
        loss.backward()
        optimizer.step()
        running_loss += loss.item()

        # Predictions are taken from the outputs computed before this step's update.
        _, pred = torch.max(outputs, dim=1)
        correct += (pred == labels).sum().item()

    return running_loss, correct


def _evaluate(net, loader, softmax, device):
    """Score ``net`` on ``loader`` without tracking gradients.

    Returns
    -------
    (correct, preds, trues) : the number of correct predictions, and the
        concatenated predicted / true label tensors in loader order.
    """
    net.eval()
    correct = 0
    preds, trues = [], []

    with torch.no_grad():
        for inputs, labels in loader:
            inputs = inputs.type(torch.FloatTensor).to(device)
            labels = labels.type(torch.LongTensor).to(device)

            outputs = softmax(net(inputs))
            _, pred = torch.max(outputs, dim=1)

            preds.append(pred)
            trues.append(labels)
            correct += (pred == labels).sum().item()

    return correct, torch.cat(preds), torch.cat(trues)


if __name__ == '__main__':
    # NOTE(review): there is no separator after the drive letter ('D:virus'), so on
    # Windows this is presumably resolved relative to the current directory of
    # drive D: rather than its root -- confirm that is intended.
    read_path = 'D:virus/image/3gram_768/'

    Loader = D.File_loader()
    data_a, label_a = Loader.read_files(read_path, interp = False)

    # Order the samples by label and flatten each sample to a 1-D feature vector.
    # The row count is taken from the loaded data instead of being hard-coded.
    idx = np.argsort(label_a)
    sorted_data = data_a[idx].reshape(len(idx), -1)
    sorted_label = sorted(label_a)

    # ---- configuration -------------------------------------------------------
    BATCH_SIZE = 64
    TOTAL = 30                   # number of independent runs (one seed each)
    EPOCH = 500
    NUM_CLASS = 9
    LR = 0.0001
    SEED = list(range(TOTAL))
    Num_Nodes = 768

    CUDA_N = 'cuda:1'

    # NOTE(review): the data path says '3gram_768' but the output name says
    # '4gram' -- confirm which one is correct.
    file_name = 'res/Mcslt_4gram'
    # Create the output directory up front so that a missing folder fails (or is
    # fixed) now rather than after every run has finished training.
    os.makedirs(os.path.dirname(file_name), exist_ok=True)

    # ---- train / test split --------------------------------------------------
    full_dataset = CustomDataset(sorted_data, sorted_label)
    train_size = int(0.8 * len(full_dataset))
    test_size = len(full_dataset) - train_size

    # Fixed seed: every run below shares the same 80/20 split.
    torch.manual_seed(10)
    train_dataset, test_dataset = data.random_split(full_dataset, [train_size, test_size])
    # NOTE(review): shuffle=False means the training batches are identical in
    # every epoch; kept as in the original so results stay comparable.
    train_loader = data.DataLoader(train_dataset, batch_size=BATCH_SIZE, shuffle = False)
    test_loader = data.DataLoader(test_dataset, batch_size=BATCH_SIZE, shuffle=False)

    # Loop-invariant objects, built once instead of once per run.
    device = torch.device(CUDA_N if torch.cuda.is_available() else 'cpu')
    # dim=1 is the same axis the arg-max below is taken over; stating it
    # explicitly avoids the implicit-dimension deprecation warning.
    softmax = nn.Softmax(dim=1)

    # One entry per run, each taken at that run's best-test-accuracy epoch.
    loss_total = []
    acc_total = []
    pred_total = []
    true_total = []

    for i in tqdm(range(TOTAL)):
        # Seed before building the model so each run has its own initialisation.
        torch.manual_seed(SEED[i])
        net = Mcslt(Num_Nodes, NUM_CLASS)
        net.to(device)
        print(net)

        criterion = nn.CrossEntropyLoss()
        optimizer = optim.SGD(net.parameters(), lr=LR, momentum = 0.1)

        loss_list = []
        train_acc_list = []
        test_acc_list = []

        pred_temp = []
        true_temp = []

        for epoch in range(EPOCH):
            running_loss, correct = _train_one_epoch(net, train_loader, criterion, optimizer, device)

            train_acc = correct/train_size
            loss_list.append(running_loss)
            train_acc_list.append(train_acc)
            print('{}th- epoch: {}, train_loss = {}, train_acc = {}'.format(i+1, epoch, running_loss, train_acc))

            correct_t, pred_t, true_t = _evaluate(net, test_loader, softmax, device)
            pred_temp.append(pred_t)
            true_temp.append(true_t)

            test_acc = correct_t/test_size
            test_acc_list.append(test_acc)

            print('test Acc {}:'.format(test_acc))

        # First epoch with the highest test accuracy in this run.
        # NOTE(review): the epoch is selected on the same test split it is scored
        # on, so the recorded accuracy is an optimistic estimate.
        best_result_index = np.argmax(np.array(test_acc_list))
        loss_total.append(loss_list[best_result_index])
        acc_total.append(test_acc_list[best_result_index])
        pred_total.append(pred_temp[best_result_index].tolist())
        true_total.append(true_temp[best_result_index].tolist())

    # NOTE(review): `net` here is the model of the last run after its final
    # epoch, not the best-epoch model whose metrics are written below.
    torch.save(net.state_dict(), file_name +'.pth')

    loss_DF = pd.DataFrame(loss_total)
    loss_DF.to_csv(file_name+" loss.csv")

    acc_DF = pd.DataFrame(acc_total)
    acc_DF.to_csv(file_name +" acc.csv")

    pred_DF = pd.DataFrame(pred_total)
    pred_DF.to_csv(file_name +" pred.csv")

    true_DF = pd.DataFrame(true_total)
    true_DF.to_csv(file_name +" true.csv")

100%|███████████████████████████████████████████████████████████████████| 10736/10736 [00:02<00:00, 4763.59it/s]
  0%|                                                                                    | 0/30 [00:00<?, ?it/s]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
1th- epoch: 0, train_loss = 131.19023767113686, train_acc = 0.760130414531905




test Acc 0.8608007448789572:
1th- epoch: 1, train_loss = 43.96203000098467, train_acc = 0.9084769445738239
test Acc 0.9073556797020484:
1th- epoch: 2, train_loss = 30.780783776193857, train_acc = 0.9363064741499767
test Acc 0.9278398510242085:
1th- epoch: 3, train_loss = 24.49717727303505, train_acc = 0.9496972519795063
test Acc 0.9390130353817505:
1th- epoch: 4, train_loss = 20.67032276839018, train_acc = 0.9579646017699115
test Acc 0.9455307262569832:
1th- epoch: 5, train_loss = 18.01358439028263, train_acc = 0.9640195621797858
test Acc 0.9492551210428305:
1th- epoch: 6, train_loss = 16.034080408513546, train_acc = 0.9684443409408477
test Acc 0.9557728119180633:
1th- epoch: 7, train_loss = 14.477960899472237, train_acc = 0.9725197950628784
test Acc 0.9599627560521415:
1th- epoch: 8, train_loss = 13.21421879157424, train_acc = 0.9755472752678156
test Acc 0.962756052141527:
1th- epoch: 9, train_loss = 12.1604408249259, train_acc = 0.9777596646483465
test Acc 0.9632216014897579:
1th- ep

test Acc 0.9771880819366853:
1th- epoch: 151, train_loss = 1.461849891813472, train_acc = 0.9973218444340941
test Acc 0.9771880819366853:
1th- epoch: 152, train_loss = 1.4573826019186527, train_acc = 0.9973218444340941
test Acc 0.9771880819366853:
1th- epoch: 153, train_loss = 1.452127878786996, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
1th- epoch: 154, train_loss = 1.4486100052017719, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
1th- epoch: 155, train_loss = 1.4433887489140034, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
1th- epoch: 156, train_loss = 1.4386854618787766, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
1th- epoch: 157, train_loss = 1.4344406698364764, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
1th- epoch: 158, train_loss = 1.429922852665186, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
1th- epoch: 159, train_loss = 1.425363017944619, train_acc = 0.9974382859804378
test Acc 0.977

1th- epoch: 299, train_loss = 1.0993738385732286, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
1th- epoch: 300, train_loss = 1.0976678009028547, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
1th- epoch: 301, train_loss = 1.0970545944874175, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
1th- epoch: 302, train_loss = 1.09541504830122, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
1th- epoch: 303, train_loss = 1.0940415325458162, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
1th- epoch: 304, train_loss = 1.093199696391821, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
1th- epoch: 305, train_loss = 1.0922170976991765, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
1th- epoch: 306, train_loss = 1.0907739351387136, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
1th- epoch: 307, train_loss = 1.0885031993384473, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
1th- epoch: 3

1th- epoch: 448, train_loss = 0.9587208988668863, train_acc = 0.9976711690731253
test Acc 0.978584729981378:
1th- epoch: 449, train_loss = 0.9581796328129712, train_acc = 0.9976711690731253
test Acc 0.978584729981378:
1th- epoch: 450, train_loss = 0.9575887694954872, train_acc = 0.9976711690731253
test Acc 0.978584729981378:
1th- epoch: 451, train_loss = 0.9568447470664978, train_acc = 0.9976711690731253
test Acc 0.978584729981378:
1th- epoch: 452, train_loss = 0.9565671434102114, train_acc = 0.9976711690731253
test Acc 0.978584729981378:
1th- epoch: 453, train_loss = 0.9557495042681694, train_acc = 0.9976711690731253
test Acc 0.978584729981378:
1th- epoch: 454, train_loss = 0.9550516419112682, train_acc = 0.9976711690731253
test Acc 0.978584729981378:
1th- epoch: 455, train_loss = 0.9542646917107049, train_acc = 0.9976711690731253
test Acc 0.978584729981378:
1th- epoch: 456, train_loss = 0.9537219479680061, train_acc = 0.9976711690731253
test Acc 0.978584729981378:
1th- epoch: 457, tr

  3%|██▍                                                                      | 1/30 [09:26<4:34:01, 566.95s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
2th- epoch: 0, train_loss = 125.51846661418676, train_acc = 0.7744527247321844
test Acc 0.8761638733705773:
2th- epoch: 1, train_loss = 44.91896792128682, train_acc = 0.9137168141592921
test Acc 0.9287709497206704:
2th- epoch: 2, train_loss = 32.517977014184, train_acc = 0.9370051234280391
test Acc 0.946927374301676:
2th- epoch: 3, train_loss = 26.131156489253044, train_acc = 0.94981369352585
test Acc 0.9515828677839852:
2th- epoch: 4, train_loss = 22.00563778169453, train_acc = 0.9572659524918491
test Acc 0.9534450651769087:
2th- epoch: 5, train_loss = 19.030975544825196, train_acc = 0.9637866790870983
test Ac

test Acc 0.9809124767225326:
2th- epoch: 147, train_loss = 1.487912799580954, train_acc = 0.9973218444340941
test Acc 0.9809124767225326:
2th- epoch: 148, train_loss = 1.483100907295011, train_acc = 0.9973218444340941
test Acc 0.9809124767225326:
2th- epoch: 149, train_loss = 1.4786177979549393, train_acc = 0.9973218444340941
test Acc 0.9809124767225326:
2th- epoch: 150, train_loss = 1.472826718701981, train_acc = 0.9973218444340941
test Acc 0.9809124767225326:
2th- epoch: 151, train_loss = 1.4681722335517406, train_acc = 0.9973218444340941
test Acc 0.9809124767225326:
2th- epoch: 152, train_loss = 1.4633274240186438, train_acc = 0.9973218444340941
test Acc 0.9809124767225326:
2th- epoch: 153, train_loss = 1.4585439339280128, train_acc = 0.9973218444340941
test Acc 0.9809124767225326:
2th- epoch: 154, train_loss = 1.4537580019095913, train_acc = 0.9973218444340941
test Acc 0.9809124767225326:
2th- epoch: 155, train_loss = 1.4494574269047007, train_acc = 0.9973218444340941
test Acc 0.98

2th- epoch: 295, train_loss = 1.10111254703952, train_acc = 0.9975547275267815
test Acc 0.9809124767225326:
2th- epoch: 296, train_loss = 1.100040068209637, train_acc = 0.9975547275267815
test Acc 0.9809124767225326:
2th- epoch: 297, train_loss = 1.099079616367817, train_acc = 0.9975547275267815
test Acc 0.9809124767225326:
2th- epoch: 298, train_loss = 1.0971110655809753, train_acc = 0.9975547275267815
test Acc 0.9809124767225326:
2th- epoch: 299, train_loss = 1.0965108759701252, train_acc = 0.9975547275267815
test Acc 0.9809124767225326:
2th- epoch: 300, train_loss = 1.094932743057143, train_acc = 0.9975547275267815
test Acc 0.9809124767225326:
2th- epoch: 301, train_loss = 1.093194657296408, train_acc = 0.9975547275267815
test Acc 0.9809124767225326:
2th- epoch: 302, train_loss = 1.0922771717305295, train_acc = 0.9975547275267815
test Acc 0.9809124767225326:
2th- epoch: 303, train_loss = 1.090904688462615, train_acc = 0.9975547275267815
test Acc 0.9809124767225326:
2th- epoch: 304, 

test Acc 0.9809124767225326:
2th- epoch: 370, train_loss = 1.0175798498094082, train_acc = 0.9976711690731253
test Acc 0.9809124767225326:
2th- epoch: 371, train_loss = 1.0160741402360145, train_acc = 0.9976711690731253
test Acc 0.9809124767225326:
2th- epoch: 372, train_loss = 1.0156870329228695, train_acc = 0.9976711690731253
test Acc 0.9809124767225326:
2th- epoch: 373, train_loss = 1.0143951301870402, train_acc = 0.9976711690731253
test Acc 0.9809124767225326:
2th- epoch: 374, train_loss = 1.0132105884549674, train_acc = 0.9976711690731253
test Acc 0.9809124767225326:
2th- epoch: 375, train_loss = 1.0130238812416792, train_acc = 0.9976711690731253
test Acc 0.9809124767225326:
2th- epoch: 376, train_loss = 1.0117312303336803, train_acc = 0.9976711690731253
test Acc 0.9809124767225326:
2th- epoch: 377, train_loss = 1.0109714083373547, train_acc = 0.9976711690731253
test Acc 0.9809124767225326:
2th- epoch: 378, train_loss = 1.0101498340663966, train_acc = 0.9976711690731253
test Acc 0

  7%|████▊                                                                    | 2/30 [19:25<4:28:59, 576.40s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
3th- epoch: 0, train_loss = 119.46971649676561, train_acc = 0.7706101537028411
test Acc 0.8747672253258846:
3th- epoch: 1, train_loss = 43.75456079095602, train_acc = 0.9110386585933862
test Acc 0.9106145251396648:
3th- epoch: 2, train_loss = 31.91010744869709, train_acc = 0.9349091755938519
test Acc 0.9259776536312849:
3th- epoch: 3, train_loss = 25.69590152800083, train_acc = 0.9457382394038193
test Acc 0.9394785847299814:
3th- epoch: 4, train_loss = 21.596347901970148, train_acc = 0.9543549138332557
test Acc 0.9436685288640596:
3th- epoch: 5, train_loss = 18.67721415311098, train_acc = 0.9618071727992548
tes

3th- epoch: 147, train_loss = 1.5180489482590929, train_acc = 0.9973218444340941
test Acc 0.9795158286778398:
3th- epoch: 148, train_loss = 1.5127525416901335, train_acc = 0.9973218444340941
test Acc 0.9795158286778398:
3th- epoch: 149, train_loss = 1.5074668899178505, train_acc = 0.9973218444340941
test Acc 0.9795158286778398:
3th- epoch: 150, train_loss = 1.5022411743411794, train_acc = 0.9973218444340941
test Acc 0.9795158286778398:
3th- epoch: 151, train_loss = 1.4978771470487118, train_acc = 0.9973218444340941
test Acc 0.9795158286778398:
3th- epoch: 152, train_loss = 1.4924706431338564, train_acc = 0.9973218444340941
test Acc 0.9795158286778398:
3th- epoch: 153, train_loss = 1.4886355685302988, train_acc = 0.9973218444340941
test Acc 0.9795158286778398:
3th- epoch: 154, train_loss = 1.4825722947716713, train_acc = 0.9973218444340941
test Acc 0.9795158286778398:
3th- epoch: 155, train_loss = 1.4789129184791818, train_acc = 0.9973218444340941
test Acc 0.9795158286778398:
3th- epoch

3th- epoch: 295, train_loss = 1.1231861089763697, train_acc = 0.9974382859804378
test Acc 0.9823091247672253:
3th- epoch: 296, train_loss = 1.1222776249051094, train_acc = 0.9974382859804378
test Acc 0.9823091247672253:
3th- epoch: 297, train_loss = 1.120208709180588, train_acc = 0.9973218444340941
test Acc 0.9823091247672253:
3th- epoch: 298, train_loss = 1.120110278337961, train_acc = 0.9974382859804378
test Acc 0.9823091247672253:
3th- epoch: 299, train_loss = 1.1178648968634661, train_acc = 0.9974382859804378
test Acc 0.9823091247672253:
3th- epoch: 300, train_loss = 1.1162026934325695, train_acc = 0.9974382859804378
test Acc 0.9823091247672253:
3th- epoch: 301, train_loss = 1.115136024862295, train_acc = 0.9974382859804378
test Acc 0.9827746741154563:
3th- epoch: 302, train_loss = 1.1138508146104869, train_acc = 0.9974382859804378
test Acc 0.9827746741154563:
3th- epoch: 303, train_loss = 1.112479748815531, train_acc = 0.9974382859804378
test Acc 0.9827746741154563:
3th- epoch: 30

3th- epoch: 443, train_loss = 0.9718640881328611, train_acc = 0.9975547275267815
test Acc 0.9823091247672253:
3th- epoch: 444, train_loss = 0.9709956087172031, train_acc = 0.9975547275267815
test Acc 0.9823091247672253:
3th- epoch: 445, train_loss = 0.9713909377605887, train_acc = 0.9975547275267815
test Acc 0.9823091247672253:
3th- epoch: 446, train_loss = 0.970090489834547, train_acc = 0.9975547275267815
test Acc 0.9823091247672253:
3th- epoch: 447, train_loss = 0.9695296324789524, train_acc = 0.9975547275267815
test Acc 0.9823091247672253:
3th- epoch: 448, train_loss = 0.9686901730747195, train_acc = 0.9975547275267815
test Acc 0.9823091247672253:
3th- epoch: 449, train_loss = 0.9674152284860611, train_acc = 0.9975547275267815
test Acc 0.9823091247672253:
3th- epoch: 450, train_loss = 0.9664823263883591, train_acc = 0.9975547275267815
test Acc 0.9823091247672253:
3th- epoch: 451, train_loss = 0.9662686809897423, train_acc = 0.9975547275267815
test Acc 0.9823091247672253:
3th- epoch:

 10%|███████▎                                                                 | 3/30 [29:24<4:22:30, 583.35s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
4th- epoch: 0, train_loss = 132.0282479673624, train_acc = 0.766301816488123
test Acc 0.8649906890130353:
4th- epoch: 1, train_loss = 45.407737493515015, train_acc = 0.9063809967396367
test Acc 0.9115456238361266:
4th- epoch: 2, train_loss = 32.735219053924084, train_acc = 0.9318816953889147
test Acc 0.9283054003724395:
4th- epoch: 3, train_loss = 26.47483091056347, train_acc = 0.9459711224965067
test Acc 0.9338919925512105:
4th- epoch: 4, train_loss = 22.551902689039707, train_acc = 0.9550535631113182
test Acc 0.9371508379888268:
4th- epoch: 5, train_loss = 19.818847365677357, train_acc = 0.9600605496040987
te

4th- epoch: 147, train_loss = 1.6425629269797355, train_acc = 0.9975547275267815
test Acc 0.9748603351955307:
4th- epoch: 148, train_loss = 1.6362687747459859, train_acc = 0.9975547275267815
test Acc 0.9748603351955307:
4th- epoch: 149, train_loss = 1.6300528210122138, train_acc = 0.9975547275267815
test Acc 0.9753258845437617:
4th- epoch: 150, train_loss = 1.6241581018548459, train_acc = 0.9975547275267815
test Acc 0.9753258845437617:
4th- epoch: 151, train_loss = 1.6180002067703754, train_acc = 0.9975547275267815
test Acc 0.9753258845437617:
4th- epoch: 152, train_loss = 1.611750055104494, train_acc = 0.9975547275267815
test Acc 0.9753258845437617:
4th- epoch: 153, train_loss = 1.6059732895810157, train_acc = 0.9975547275267815
test Acc 0.9753258845437617:
4th- epoch: 154, train_loss = 1.600037505151704, train_acc = 0.9975547275267815
test Acc 0.9753258845437617:
4th- epoch: 155, train_loss = 1.5939322251360863, train_acc = 0.9975547275267815
test Acc 0.9753258845437617:
4th- epoch: 

4th- epoch: 295, train_loss = 1.1689189647440799, train_acc = 0.9977876106194691
test Acc 0.9781191806331471:
4th- epoch: 296, train_loss = 1.1664185698027723, train_acc = 0.9977876106194691
test Acc 0.9781191806331471:
4th- epoch: 297, train_loss = 1.1653962594573386, train_acc = 0.9977876106194691
test Acc 0.9781191806331471:
4th- epoch: 298, train_loss = 1.1638178589637391, train_acc = 0.9977876106194691
test Acc 0.9781191806331471:
4th- epoch: 299, train_loss = 1.1619459477369674, train_acc = 0.9977876106194691
test Acc 0.9781191806331471:
4th- epoch: 300, train_loss = 1.160173210024368, train_acc = 0.9977876106194691
test Acc 0.9781191806331471:
4th- epoch: 301, train_loss = 1.158909862220753, train_acc = 0.9977876106194691
test Acc 0.9781191806331471:
4th- epoch: 302, train_loss = 1.1568304039537907, train_acc = 0.9977876106194691
test Acc 0.9781191806331471:
4th- epoch: 303, train_loss = 1.155631959438324, train_acc = 0.9977876106194691
test Acc 0.9781191806331471:
4th- epoch: 3

test Acc 0.9795158286778398:
4th- epoch: 445, train_loss = 1.0005488879978657, train_acc = 0.9979040521658128
test Acc 0.9795158286778398:
4th- epoch: 446, train_loss = 0.9996634560229722, train_acc = 0.9979040521658128
test Acc 0.9795158286778398:
4th- epoch: 447, train_loss = 0.9989920891821384, train_acc = 0.9979040521658128
test Acc 0.9795158286778398:
4th- epoch: 448, train_loss = 0.9987231107952539, train_acc = 0.9979040521658128
test Acc 0.9795158286778398:
4th- epoch: 449, train_loss = 0.9972934847173747, train_acc = 0.9979040521658128
test Acc 0.9795158286778398:
4th- epoch: 450, train_loss = 0.9970836937427521, train_acc = 0.9979040521658128
test Acc 0.9795158286778398:
4th- epoch: 451, train_loss = 0.995519890129799, train_acc = 0.9980204937121565
test Acc 0.9795158286778398:
4th- epoch: 452, train_loss = 0.9954028291103896, train_acc = 0.9979040521658128
test Acc 0.9799813780260708:
4th- epoch: 453, train_loss = 0.9947239682078362, train_acc = 0.9979040521658128
test Acc 0.

 13%|█████████▋                                                               | 4/30 [39:25<4:14:57, 588.38s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
5th- epoch: 0, train_loss = 120.55677610635757, train_acc = 0.7828365160689333
test Acc 0.8901303538175046:
5th- epoch: 1, train_loss = 45.66316147148609, train_acc = 0.9098742431299488
test Acc 0.930633147113594:
5th- epoch: 2, train_loss = 33.25825983658433, train_acc = 0.9364229156963204
test Acc 0.9432029795158287:
5th- epoch: 3, train_loss = 26.978147331625223, train_acc = 0.946786213320913
test Acc 0.9478584729981379:
5th- epoch: 4, train_loss = 22.876254690811038, train_acc = 0.9540055891942245
test Acc 0.9548417132216015:
5th- epoch: 5, train_loss = 19.890782237052917, train_acc = 0.9597112249650676
tes

5th- epoch: 147, train_loss = 1.5116535763954744, train_acc = 0.9972054028877504
test Acc 0.9804469273743017:
5th- epoch: 148, train_loss = 1.5071857917355374, train_acc = 0.9972054028877504
test Acc 0.9804469273743017:
5th- epoch: 149, train_loss = 1.502219513640739, train_acc = 0.9972054028877504
test Acc 0.9804469273743017:
5th- epoch: 150, train_loss = 1.496840976178646, train_acc = 0.9972054028877504
test Acc 0.9804469273743017:
5th- epoch: 151, train_loss = 1.4922748301178217, train_acc = 0.9972054028877504
test Acc 0.9804469273743017:
5th- epoch: 152, train_loss = 1.4876926908036694, train_acc = 0.9972054028877504
test Acc 0.9804469273743017:
5th- epoch: 153, train_loss = 1.4832032913109288, train_acc = 0.9972054028877504
test Acc 0.9804469273743017:
5th- epoch: 154, train_loss = 1.478418285609223, train_acc = 0.9972054028877504
test Acc 0.9804469273743017:
5th- epoch: 155, train_loss = 1.4737028687959537, train_acc = 0.9972054028877504
test Acc 0.9804469273743017:
5th- epoch: 1

test Acc 0.9813780260707635:
5th- epoch: 222, train_loss = 1.2572603880544193, train_acc = 0.9970889613414066
test Acc 0.9813780260707635:
5th- epoch: 223, train_loss = 1.2551434173365124, train_acc = 0.9970889613414066
test Acc 0.9813780260707635:
5th- epoch: 224, train_loss = 1.2539149979129434, train_acc = 0.9970889613414066
test Acc 0.9813780260707635:
5th- epoch: 225, train_loss = 1.2507347312639467, train_acc = 0.9970889613414066
test Acc 0.9813780260707635:
5th- epoch: 226, train_loss = 1.2484599354793318, train_acc = 0.9970889613414066
test Acc 0.9813780260707635:
5th- epoch: 227, train_loss = 1.2460043877363205, train_acc = 0.9970889613414066
test Acc 0.9813780260707635:
5th- epoch: 228, train_loss = 1.24354271433549, train_acc = 0.9970889613414066
test Acc 0.9813780260707635:
5th- epoch: 229, train_loss = 1.2416538776014931, train_acc = 0.9970889613414066
test Acc 0.9813780260707635:
5th- epoch: 230, train_loss = 1.239103616506327, train_acc = 0.9970889613414066
test Acc 0.98

5th- epoch: 370, train_loss = 1.0412256438285112, train_acc = 0.9973218444340941
test Acc 0.9809124767225326:
5th- epoch: 371, train_loss = 1.039876138791442, train_acc = 0.9973218444340941
test Acc 0.9809124767225326:
5th- epoch: 372, train_loss = 1.039012599736452, train_acc = 0.9973218444340941
test Acc 0.9809124767225326:
5th- epoch: 373, train_loss = 1.0381059050559998, train_acc = 0.9973218444340941
test Acc 0.9809124767225326:
5th- epoch: 374, train_loss = 1.0375091824680567, train_acc = 0.9973218444340941
test Acc 0.9809124767225326:
5th- epoch: 375, train_loss = 1.036661963298684, train_acc = 0.9973218444340941
test Acc 0.9809124767225326:
5th- epoch: 376, train_loss = 1.0355917209235486, train_acc = 0.9973218444340941
test Acc 0.9809124767225326:
5th- epoch: 377, train_loss = 1.0343724756094161, train_acc = 0.9973218444340941
test Acc 0.9809124767225326:
5th- epoch: 378, train_loss = 1.0337021270242985, train_acc = 0.9973218444340941
test Acc 0.9809124767225326:
5th- epoch: 3

 17%|████████████▏                                                            | 5/30 [49:26<4:06:44, 592.16s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
6th- epoch: 0, train_loss = 137.3917533159256, train_acc = 0.7617605961807172
test Acc 0.8677839851024208:
6th- epoch: 1, train_loss = 44.395061656832695, train_acc = 0.9110386585933862
test Acc 0.9068901303538175:
6th- epoch: 2, train_loss = 31.72097035497427, train_acc = 0.9381695388914765
test Acc 0.9287709497206704:
6th- epoch: 3, train_loss = 25.49173191189766, train_acc = 0.9486492780624126
test Acc 0.9399441340782123:
6th- epoch: 4, train_loss = 21.56215450912714, train_acc = 0.955519329296693
test Acc 0.9473929236499069:
6th- epoch: 5, train_loss = 18.77768489345908, train_acc = 0.9613414066138798
test 

test Acc 0.9837057728119181:
6th- epoch: 147, train_loss = 1.540387307642959, train_acc = 0.9973218444340941
test Acc 0.9837057728119181:
6th- epoch: 148, train_loss = 1.535784162580967, train_acc = 0.9973218444340941
test Acc 0.9837057728119181:
6th- epoch: 149, train_loss = 1.530431634397246, train_acc = 0.9973218444340941
test Acc 0.9837057728119181:
6th- epoch: 150, train_loss = 1.5259656546404585, train_acc = 0.9973218444340941
test Acc 0.9837057728119181:
6th- epoch: 151, train_loss = 1.520800276310183, train_acc = 0.9973218444340941
test Acc 0.9837057728119181:
6th- epoch: 152, train_loss = 1.51568803191185, train_acc = 0.9973218444340941
test Acc 0.9837057728119181:
6th- epoch: 153, train_loss = 1.511133585125208, train_acc = 0.9973218444340941
test Acc 0.9837057728119181:
6th- epoch: 154, train_loss = 1.5063350523123518, train_acc = 0.9973218444340941
test Acc 0.9837057728119181:
6th- epoch: 155, train_loss = 1.5018850540509447, train_acc = 0.9973218444340941
test Acc 0.983705

test Acc 0.9846368715083799:
6th- epoch: 296, train_loss = 1.1404526121914387, train_acc = 0.9976711690731253
test Acc 0.9846368715083799:
6th- epoch: 297, train_loss = 1.138512123376131, train_acc = 0.9976711690731253
test Acc 0.9846368715083799:
6th- epoch: 298, train_loss = 1.1377410925924778, train_acc = 0.9976711690731253
test Acc 0.9846368715083799:
6th- epoch: 299, train_loss = 1.1358772056992166, train_acc = 0.9976711690731253
test Acc 0.9846368715083799:
6th- epoch: 300, train_loss = 1.1340477739577182, train_acc = 0.9976711690731253
test Acc 0.9846368715083799:
6th- epoch: 301, train_loss = 1.1334104153211229, train_acc = 0.9976711690731253
test Acc 0.9846368715083799:
6th- epoch: 302, train_loss = 1.1316519665415399, train_acc = 0.9976711690731253
test Acc 0.9846368715083799:
6th- epoch: 303, train_loss = 1.1304403890972026, train_acc = 0.9976711690731253
test Acc 0.9846368715083799:
6th- epoch: 304, train_loss = 1.1291432802681811, train_acc = 0.9976711690731253
test Acc 0.

6th- epoch: 445, train_loss = 0.9845953447220381, train_acc = 0.9980204937121565
test Acc 0.9837057728119181:
6th- epoch: 446, train_loss = 0.9845053789613303, train_acc = 0.9980204937121565
test Acc 0.9837057728119181:
6th- epoch: 447, train_loss = 0.9834746060369071, train_acc = 0.9980204937121565
test Acc 0.9837057728119181:
6th- epoch: 448, train_loss = 0.9829739468696062, train_acc = 0.9980204937121565
test Acc 0.9837057728119181:
6th- epoch: 449, train_loss = 0.9815093713405076, train_acc = 0.9980204937121565
test Acc 0.9837057728119181:
6th- epoch: 450, train_loss = 0.9816835038363934, train_acc = 0.9980204937121565
test Acc 0.9837057728119181:
6th- epoch: 451, train_loss = 0.9809615686535835, train_acc = 0.9980204937121565
test Acc 0.9837057728119181:
6th- epoch: 452, train_loss = 0.9796949736773968, train_acc = 0.9980204937121565
test Acc 0.9837057728119181:
6th- epoch: 453, train_loss = 0.9792502112686634, train_acc = 0.9980204937121565
test Acc 0.9837057728119181:
6th- epoch

 20%|██████████████▌                                                          | 6/30 [59:28<3:58:06, 595.26s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
7th- epoch: 0, train_loss = 116.58521346747875, train_acc = 0.7792268281322776
test Acc 0.8640595903165735:
7th- epoch: 1, train_loss = 43.69835852086544, train_acc = 0.9153469958081043
test Acc 0.9031657355679702:
7th- epoch: 2, train_loss = 31.73815283179283, train_acc = 0.9373544480670704
test Acc 0.925512104283054:
7th- epoch: 3, train_loss = 25.724874954670668, train_acc = 0.948067070330694
test Acc 0.9338919925512105:
7th- epoch: 4, train_loss = 21.860715355724096, train_acc = 0.9568001863064741
test Acc 0.9418063314711359:
7th- epoch: 5, train_loss = 19.114923752844334, train_acc = 0.9614578481602236
tes

7th- epoch: 147, train_loss = 1.5550116946687922, train_acc = 0.9970889613414066
test Acc 0.9799813780260708:
7th- epoch: 148, train_loss = 1.5497002148767933, train_acc = 0.9970889613414066
test Acc 0.9799813780260708:
7th- epoch: 149, train_loss = 1.544545085518621, train_acc = 0.9970889613414066
test Acc 0.9799813780260708:
7th- epoch: 150, train_loss = 1.5387955643236637, train_acc = 0.9970889613414066
test Acc 0.9799813780260708:
7th- epoch: 151, train_loss = 1.5337493028491735, train_acc = 0.9970889613414066
test Acc 0.9799813780260708:
7th- epoch: 152, train_loss = 1.52871833241079, train_acc = 0.9970889613414066
test Acc 0.9799813780260708:
7th- epoch: 153, train_loss = 1.5235524444142357, train_acc = 0.9972054028877504
test Acc 0.9799813780260708:
7th- epoch: 154, train_loss = 1.5186912877252325, train_acc = 0.9972054028877504
test Acc 0.9799813780260708:
7th- epoch: 155, train_loss = 1.5137978723505512, train_acc = 0.9970889613414066
test Acc 0.9799813780260708:
7th- epoch: 1

7th- epoch: 295, train_loss = 1.1469134303624742, train_acc = 0.9975547275267815
test Acc 0.9804469273743017:
7th- epoch: 296, train_loss = 1.144993242516648, train_acc = 0.9975547275267815
test Acc 0.9804469273743017:
7th- epoch: 297, train_loss = 1.1436302736401558, train_acc = 0.9975547275267815
test Acc 0.9804469273743017:
7th- epoch: 298, train_loss = 1.1421953700482845, train_acc = 0.9975547275267815
test Acc 0.9804469273743017:
7th- epoch: 299, train_loss = 1.1412982549518347, train_acc = 0.9975547275267815
test Acc 0.9799813780260708:
7th- epoch: 300, train_loss = 1.139384986832738, train_acc = 0.9975547275267815
test Acc 0.9804469273743017:
7th- epoch: 301, train_loss = 1.1377281099557877, train_acc = 0.9975547275267815
test Acc 0.9799813780260708:
7th- epoch: 302, train_loss = 1.1364050302654505, train_acc = 0.9975547275267815
test Acc 0.9804469273743017:
7th- epoch: 303, train_loss = 1.1357719544321299, train_acc = 0.9975547275267815
test Acc 0.9799813780260708:
7th- epoch: 

7th- epoch: 443, train_loss = 0.995130897819763, train_acc = 0.9976711690731253
test Acc 0.9804469273743017:
7th- epoch: 444, train_loss = 0.9945893312396947, train_acc = 0.9976711690731253
test Acc 0.9804469273743017:
7th- epoch: 445, train_loss = 0.9937426410615444, train_acc = 0.9976711690731253
test Acc 0.9804469273743017:
7th- epoch: 446, train_loss = 0.9926066882908344, train_acc = 0.9976711690731253
test Acc 0.9804469273743017:
7th- epoch: 447, train_loss = 0.9921171540918294, train_acc = 0.9976711690731253
test Acc 0.9799813780260708:
7th- epoch: 448, train_loss = 0.9916330873966217, train_acc = 0.9976711690731253
test Acc 0.9799813780260708:
7th- epoch: 449, train_loss = 0.990760109067196, train_acc = 0.9976711690731253
test Acc 0.9804469273743017:
7th- epoch: 450, train_loss = 0.990170419216156, train_acc = 0.9976711690731253
test Acc 0.9804469273743017:
7th- epoch: 451, train_loss = 0.9892978419957217, train_acc = 0.9976711690731253
test Acc 0.9799813780260708:
7th- epoch: 4

 23%|████████████████▌                                                      | 7/30 [1:09:30<3:49:00, 597.40s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
8th- epoch: 0, train_loss = 124.84038951992989, train_acc = 0.7748020493712157
test Acc 0.8719739292364991:
8th- epoch: 1, train_loss = 45.046216666698456, train_acc = 0.9094084769445738
test Acc 0.9152700186219739:
8th- epoch: 2, train_loss = 32.58322702720761, train_acc = 0.9350256171401956
test Acc 0.9283054003724395:
8th- epoch: 3, train_loss = 26.379041235893965, train_acc = 0.9487657196087564
test Acc 0.936219739292365:
8th- epoch: 4, train_loss = 22.445093885064125, train_acc = 0.955985095482068
test Acc 0.9394785847299814:
8th- epoch: 5, train_loss = 19.68724923208356, train_acc = 0.9632044713553796
tes

test Acc 0.9767225325884544:
8th- epoch: 147, train_loss = 1.5332045510876924, train_acc = 0.9970889613414066
test Acc 0.9767225325884544:
8th- epoch: 148, train_loss = 1.5276825150940567, train_acc = 0.9970889613414066
test Acc 0.9767225325884544:
8th- epoch: 149, train_loss = 1.5222638335544616, train_acc = 0.9970889613414066
test Acc 0.9767225325884544:
8th- epoch: 150, train_loss = 1.5177340728696436, train_acc = 0.9970889613414066
test Acc 0.9767225325884544:
8th- epoch: 151, train_loss = 1.512447243789211, train_acc = 0.9970889613414066
test Acc 0.9767225325884544:
8th- epoch: 152, train_loss = 1.507624718011357, train_acc = 0.9970889613414066
test Acc 0.9767225325884544:
8th- epoch: 153, train_loss = 1.502605739980936, train_acc = 0.9970889613414066
test Acc 0.9767225325884544:
8th- epoch: 154, train_loss = 1.4977565376320854, train_acc = 0.9970889613414066
test Acc 0.9767225325884544:
8th- epoch: 155, train_loss = 1.4936082946369424, train_acc = 0.9970889613414066
test Acc 0.97

8th- epoch: 295, train_loss = 1.1447055502794683, train_acc = 0.9976711690731253
test Acc 0.9771880819366853:
8th- epoch: 296, train_loss = 1.142617895558942, train_acc = 0.9976711690731253
test Acc 0.9771880819366853:
8th- epoch: 297, train_loss = 1.1410697055980563, train_acc = 0.9976711690731253
test Acc 0.9771880819366853:
8th- epoch: 298, train_loss = 1.1395544344559312, train_acc = 0.9976711690731253
test Acc 0.9771880819366853:
8th- epoch: 299, train_loss = 1.1382589644636028, train_acc = 0.9976711690731253
test Acc 0.9771880819366853:
8th- epoch: 300, train_loss = 1.1377139004762284, train_acc = 0.9976711690731253
test Acc 0.9771880819366853:
8th- epoch: 301, train_loss = 1.1355569924344309, train_acc = 0.9976711690731253
test Acc 0.9771880819366853:
8th- epoch: 302, train_loss = 1.1339731633779593, train_acc = 0.9976711690731253
test Acc 0.9771880819366853:
8th- epoch: 303, train_loss = 1.1330771284992807, train_acc = 0.9976711690731253
test Acc 0.9771880819366853:
8th- epoch:

8th- epoch: 443, train_loss = 0.9981163768097758, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
8th- epoch: 444, train_loss = 0.9963118002342526, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
8th- epoch: 445, train_loss = 0.9962806062249001, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
8th- epoch: 446, train_loss = 0.9951154372247402, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
8th- epoch: 447, train_loss = 0.9946034019812942, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
8th- epoch: 448, train_loss = 0.9939277718367521, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
8th- epoch: 449, train_loss = 0.9935151130484883, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
8th- epoch: 450, train_loss = 0.99194104471826, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
8th- epoch: 451, train_loss = 0.9922349012049381, train_acc = 0.9977876106194691
test Acc 0.9771880819366853:
8th- epoch: 

 27%|██████████████████▉                                                    | 8/30 [1:19:32<3:39:27, 598.54s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
9th- epoch: 0, train_loss = 124.46605522930622, train_acc = 0.7624592454587797
test Acc 0.8733705772811918:
9th- epoch: 1, train_loss = 44.577378414571285, train_acc = 0.9118537494177923
test Acc 0.9162011173184358:
9th- epoch: 2, train_loss = 32.38711951673031, train_acc = 0.9386353050768514
test Acc 0.9348230912476723:
9th- epoch: 3, train_loss = 26.2661728002131, train_acc = 0.9501630181648812
test Acc 0.9455307262569832:
9th- epoch: 4, train_loss = 22.34255894087255, train_acc = 0.9558686539357243
test Acc 0.9492551210428305:
9th- epoch: 5, train_loss = 19.528276009485126, train_acc = 0.9614578481602236
tes

9th- epoch: 147, train_loss = 1.5053991489112377, train_acc = 0.9972054028877504
test Acc 0.9804469273743017:
9th- epoch: 148, train_loss = 1.5011304741492495, train_acc = 0.9972054028877504
test Acc 0.9804469273743017:
9th- epoch: 149, train_loss = 1.4964932227740064, train_acc = 0.9972054028877504
test Acc 0.9804469273743017:
9th- epoch: 150, train_loss = 1.4924353323876858, train_acc = 0.9972054028877504
test Acc 0.9804469273743017:
9th- epoch: 151, train_loss = 1.487904561101459, train_acc = 0.9972054028877504
test Acc 0.9804469273743017:
9th- epoch: 152, train_loss = 1.4833816947648302, train_acc = 0.9972054028877504
test Acc 0.9809124767225326:
9th- epoch: 153, train_loss = 1.4791512874653563, train_acc = 0.9972054028877504
test Acc 0.9809124767225326:
9th- epoch: 154, train_loss = 1.4750253682723269, train_acc = 0.9972054028877504
test Acc 0.9809124767225326:
9th- epoch: 155, train_loss = 1.4704010114073753, train_acc = 0.9972054028877504
test Acc 0.9809124767225326:
9th- epoch:

test Acc 0.9813780260707635:
9th- epoch: 296, train_loss = 1.1423275185225066, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
9th- epoch: 297, train_loss = 1.1404941578803118, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
9th- epoch: 298, train_loss = 1.1395179728569929, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
9th- epoch: 299, train_loss = 1.137210233748192, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
9th- epoch: 300, train_loss = 1.1365772845747415, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
9th- epoch: 301, train_loss = 1.135952460259432, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
9th- epoch: 302, train_loss = 1.1336418154241983, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
9th- epoch: 303, train_loss = 1.1327551504073199, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
9th- epoch: 304, train_loss = 1.1310968498291913, train_acc = 0.9973218444340941
test Acc 0.9

9th- epoch: 444, train_loss = 0.9956749330012826, train_acc = 0.9974382859804378
test Acc 0.9827746741154563:
9th- epoch: 445, train_loss = 0.9953843553812476, train_acc = 0.9974382859804378
test Acc 0.9827746741154563:
9th- epoch: 446, train_loss = 0.9942541569471359, train_acc = 0.9974382859804378
test Acc 0.9827746741154563:
9th- epoch: 447, train_loss = 0.9937723974435357, train_acc = 0.9974382859804378
test Acc 0.9827746741154563:
9th- epoch: 448, train_loss = 0.992881428450346, train_acc = 0.9974382859804378
test Acc 0.9827746741154563:
9th- epoch: 449, train_loss = 0.9919777723698644, train_acc = 0.9974382859804378
test Acc 0.9827746741154563:
9th- epoch: 450, train_loss = 0.9923651901335688, train_acc = 0.9974382859804378
test Acc 0.9827746741154563:
9th- epoch: 451, train_loss = 0.9912487541587325, train_acc = 0.9974382859804378
test Acc 0.9827746741154563:
9th- epoch: 452, train_loss = 0.9903742944152327, train_acc = 0.9974382859804378
test Acc 0.9827746741154563:
9th- epoch:

 30%|█████████████████████▎                                                 | 9/30 [1:29:32<3:29:43, 599.21s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
10th- epoch: 0, train_loss = 129.98318174481392, train_acc = 0.7706101537028411
test Acc 0.88268156424581:
10th- epoch: 1, train_loss = 42.20667303353548, train_acc = 0.9153469958081043
test Acc 0.9241154562383612:
10th- epoch: 2, train_loss = 30.88708208873868, train_acc = 0.9420121099208197
test Acc 0.9357541899441341:
10th- epoch: 3, train_loss = 25.17395945265889, train_acc = 0.9512109920819748
test Acc 0.9432029795158287:
10th- epoch: 4, train_loss = 21.47044638544321, train_acc = 0.9572659524918491
test Acc 0.9515828677839852:
10th- epoch: 5, train_loss = 18.809588346630335, train_acc = 0.9630880298090359

10th- epoch: 146, train_loss = 1.5217109012883157, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
10th- epoch: 147, train_loss = 1.5161171555519104, train_acc = 0.9974382859804378
test Acc 0.9804469273743017:
10th- epoch: 148, train_loss = 1.5106922325212508, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
10th- epoch: 149, train_loss = 1.5048814564943314, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
10th- epoch: 150, train_loss = 1.4997709307353944, train_acc = 0.9974382859804378
test Acc 0.9804469273743017:
10th- epoch: 151, train_loss = 1.4945253592450172, train_acc = 0.9974382859804378
test Acc 0.9804469273743017:
10th- epoch: 152, train_loss = 1.4896274183411151, train_acc = 0.9974382859804378
test Acc 0.9804469273743017:
10th- epoch: 153, train_loss = 1.4843153145629913, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
10th- epoch: 154, train_loss = 1.4796044763643295, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
1

10th- epoch: 293, train_loss = 1.1191360999946482, train_acc = 0.9974382859804378
test Acc 0.9823091247672253:
10th- epoch: 294, train_loss = 1.117806640744675, train_acc = 0.9974382859804378
test Acc 0.9823091247672253:
10th- epoch: 295, train_loss = 1.1159077249467373, train_acc = 0.9974382859804378
test Acc 0.9823091247672253:
10th- epoch: 296, train_loss = 1.1137818644638173, train_acc = 0.9974382859804378
test Acc 0.9823091247672253:
10th- epoch: 297, train_loss = 1.113015465438366, train_acc = 0.9974382859804378
test Acc 0.9823091247672253:
10th- epoch: 298, train_loss = 1.1120287254452705, train_acc = 0.9974382859804378
test Acc 0.9823091247672253:
10th- epoch: 299, train_loss = 1.1105277240276337, train_acc = 0.9974382859804378
test Acc 0.9823091247672253:
10th- epoch: 300, train_loss = 1.1090664826333523, train_acc = 0.9974382859804378
test Acc 0.9823091247672253:
10th- epoch: 301, train_loss = 1.1077298745512962, train_acc = 0.9974382859804378
test Acc 0.9823091247672253:
10t

10th- epoch: 440, train_loss = 0.9742522425949574, train_acc = 0.9975547275267815
test Acc 0.9813780260707635:
10th- epoch: 441, train_loss = 0.9727211606805213, train_acc = 0.9975547275267815
test Acc 0.9813780260707635:
10th- epoch: 442, train_loss = 0.9727393413777463, train_acc = 0.9975547275267815
test Acc 0.9813780260707635:
10th- epoch: 443, train_loss = 0.9715255250339396, train_acc = 0.9975547275267815
test Acc 0.9813780260707635:
10th- epoch: 444, train_loss = 0.9710085627739318, train_acc = 0.9975547275267815
test Acc 0.9813780260707635:
10th- epoch: 445, train_loss = 0.9706318626995198, train_acc = 0.9975547275267815
test Acc 0.9813780260707635:
10th- epoch: 446, train_loss = 0.9700878386502154, train_acc = 0.9975547275267815
test Acc 0.9813780260707635:
10th- epoch: 447, train_loss = 0.9686894938349724, train_acc = 0.9975547275267815
test Acc 0.9813780260707635:
10th- epoch: 448, train_loss = 0.9686368592083454, train_acc = 0.9975547275267815
test Acc 0.9813780260707635:
1

 33%|███████████████████████▎                                              | 10/30 [1:39:30<3:19:34, 598.74s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
11th- epoch: 0, train_loss = 116.08354974538088, train_acc = 0.7735211923614346
test Acc 0.87243947858473:
11th- epoch: 1, train_loss = 45.43683683872223, train_acc = 0.905798789007918
test Acc 0.909683426443203:
11th- epoch: 2, train_loss = 32.18170055747032, train_acc = 0.9314159292035398
test Acc 0.9241154562383612:
11th- epoch: 3, train_loss = 25.45407424867153, train_acc = 0.9432929669306008
test Acc 0.9348230912476723:
11th- epoch: 4, train_loss = 21.190470848232508, train_acc = 0.9542384722869119
test Acc 0.9418063314711359:
11th- epoch: 5, train_loss = 18.288129083812237, train_acc = 0.9598276665114113


11th- epoch: 146, train_loss = 1.5313376064877957, train_acc = 0.9970889613414066
test Acc 0.9771880819366853:
11th- epoch: 147, train_loss = 1.5268585681915283, train_acc = 0.9970889613414066
test Acc 0.9776536312849162:
11th- epoch: 148, train_loss = 1.521308058174327, train_acc = 0.9970889613414066
test Acc 0.9776536312849162:
11th- epoch: 149, train_loss = 1.5167378846090287, train_acc = 0.9970889613414066
test Acc 0.9776536312849162:
11th- epoch: 150, train_loss = 1.5115491386968642, train_acc = 0.9970889613414066
test Acc 0.9776536312849162:
11th- epoch: 151, train_loss = 1.5070372931659222, train_acc = 0.9970889613414066
test Acc 0.9776536312849162:
11th- epoch: 152, train_loss = 1.502131012501195, train_acc = 0.9970889613414066
test Acc 0.9776536312849162:
11th- epoch: 153, train_loss = 1.4974979311227798, train_acc = 0.9970889613414066
test Acc 0.9776536312849162:
11th- epoch: 154, train_loss = 1.4927655197679996, train_acc = 0.9970889613414066
test Acc 0.9776536312849162:
11t

test Acc 0.9776536312849162:
11th- epoch: 294, train_loss = 1.1376741913263686, train_acc = 0.9970889613414066
test Acc 0.9776536312849162:
11th- epoch: 295, train_loss = 1.1361291433568113, train_acc = 0.9970889613414066
test Acc 0.9776536312849162:
11th- epoch: 296, train_loss = 1.1345575277809985, train_acc = 0.9970889613414066
test Acc 0.9776536312849162:
11th- epoch: 297, train_loss = 1.1341680635814555, train_acc = 0.9970889613414066
test Acc 0.9776536312849162:
11th- epoch: 298, train_loss = 1.132237157493364, train_acc = 0.9970889613414066
test Acc 0.9776536312849162:
11th- epoch: 299, train_loss = 1.130894597619772, train_acc = 0.9970889613414066
test Acc 0.9776536312849162:
11th- epoch: 300, train_loss = 1.128915208100807, train_acc = 0.9970889613414066
test Acc 0.9776536312849162:
11th- epoch: 301, train_loss = 1.128024107485544, train_acc = 0.9970889613414066
test Acc 0.9776536312849162:
11th- epoch: 302, train_loss = 1.1267249013180844, train_acc = 0.9970889613414066
test 

test Acc 0.9776536312849162:
11th- epoch: 368, train_loss = 1.0490705805714242, train_acc = 0.9972054028877504
test Acc 0.9776536312849162:
11th- epoch: 369, train_loss = 1.047900925099384, train_acc = 0.9972054028877504
test Acc 0.9776536312849162:
11th- epoch: 370, train_loss = 1.0471853365306742, train_acc = 0.9972054028877504
test Acc 0.9776536312849162:
11th- epoch: 371, train_loss = 1.045552792667877, train_acc = 0.9972054028877504
test Acc 0.9776536312849162:
11th- epoch: 372, train_loss = 1.0452379721100442, train_acc = 0.9972054028877504
test Acc 0.9776536312849162:
11th- epoch: 373, train_loss = 1.0436295072431676, train_acc = 0.9972054028877504
test Acc 0.9776536312849162:
11th- epoch: 374, train_loss = 1.0429055604035966, train_acc = 0.9972054028877504
test Acc 0.9776536312849162:
11th- epoch: 375, train_loss = 1.0421574314241298, train_acc = 0.9972054028877504
test Acc 0.9776536312849162:
11th- epoch: 376, train_loss = 1.0407302342355251, train_acc = 0.9972054028877504
tes

 37%|█████████████████████████▋                                            | 11/30 [1:49:29<3:09:35, 598.70s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
12th- epoch: 0, train_loss = 128.7874104976654, train_acc = 0.7685142058686539
test Acc 0.8691806331471136:
12th- epoch: 1, train_loss = 43.30498591810465, train_acc = 0.9061481136469492
test Acc 0.9073556797020484:
12th- epoch: 2, train_loss = 31.07407159730792, train_acc = 0.9323474615742897
test Acc 0.9292364990689013:
12th- epoch: 3, train_loss = 25.206489384174347, train_acc = 0.945854680950163
test Acc 0.9357541899441341:
12th- epoch: 4, train_loss = 21.505670428276062, train_acc = 0.955985095482068
test Acc 0.9413407821229051:
12th- epoch: 5, train_loss = 18.85269165970385, train_acc = 0.9608756404285049

12th- epoch: 145, train_loss = 1.5959025224437937, train_acc = 0.9969725197950629
test Acc 0.9748603351955307:
12th- epoch: 146, train_loss = 1.5896528909215704, train_acc = 0.9969725197950629
test Acc 0.9748603351955307:
12th- epoch: 147, train_loss = 1.5845670414855704, train_acc = 0.9969725197950629
test Acc 0.9748603351955307:
12th- epoch: 148, train_loss = 1.5784171981504187, train_acc = 0.9969725197950629
test Acc 0.9748603351955307:
12th- epoch: 149, train_loss = 1.572647655964829, train_acc = 0.9968560782487191
test Acc 0.9748603351955307:
12th- epoch: 150, train_loss = 1.5671529608080164, train_acc = 0.9968560782487191
test Acc 0.9748603351955307:
12th- epoch: 151, train_loss = 1.5612160650780424, train_acc = 0.9969725197950629
test Acc 0.9748603351955307:
12th- epoch: 152, train_loss = 1.5559454299509525, train_acc = 0.9969725197950629
test Acc 0.9748603351955307:
12th- epoch: 153, train_loss = 1.5509436912834644, train_acc = 0.9969725197950629
test Acc 0.9748603351955307:
12

12th- epoch: 292, train_loss = 1.155977226793766, train_acc = 0.9974382859804378
test Acc 0.9762569832402235:
12th- epoch: 293, train_loss = 1.1539480748178903, train_acc = 0.9974382859804378
test Acc 0.9762569832402235:
12th- epoch: 294, train_loss = 1.1525027553143445, train_acc = 0.9974382859804378
test Acc 0.9762569832402235:
12th- epoch: 295, train_loss = 1.1505305307509843, train_acc = 0.9974382859804378
test Acc 0.9762569832402235:
12th- epoch: 296, train_loss = 1.1493821491894778, train_acc = 0.9974382859804378
test Acc 0.9762569832402235:
12th- epoch: 297, train_loss = 1.1478216188552324, train_acc = 0.9974382859804378
test Acc 0.9762569832402235:
12th- epoch: 298, train_loss = 1.1464150746760424, train_acc = 0.9974382859804378
test Acc 0.9762569832402235:
12th- epoch: 299, train_loss = 1.1446694744226988, train_acc = 0.9974382859804378
test Acc 0.9762569832402235:
12th- epoch: 300, train_loss = 1.1432122377154883, train_acc = 0.9974382859804378
test Acc 0.9762569832402235:
12

test Acc 0.9781191806331471:
12th- epoch: 440, train_loss = 0.993607897311449, train_acc = 0.9974382859804378
test Acc 0.9781191806331471:
12th- epoch: 441, train_loss = 0.9923699274659157, train_acc = 0.9974382859804378
test Acc 0.9781191806331471:
12th- epoch: 442, train_loss = 0.9920802600681782, train_acc = 0.9974382859804378
test Acc 0.9781191806331471:
12th- epoch: 443, train_loss = 0.9915941345243482, train_acc = 0.9974382859804378
test Acc 0.9781191806331471:
12th- epoch: 444, train_loss = 0.9904482550919056, train_acc = 0.9974382859804378
test Acc 0.9781191806331471:
12th- epoch: 445, train_loss = 0.9897538187651662, train_acc = 0.9974382859804378
test Acc 0.9781191806331471:
12th- epoch: 446, train_loss = 0.9891448567359475, train_acc = 0.9974382859804378
test Acc 0.9781191806331471:
12th- epoch: 447, train_loss = 0.9885800816118717, train_acc = 0.9974382859804378
test Acc 0.9781191806331471:
12th- epoch: 448, train_loss = 0.987176138907671, train_acc = 0.9974382859804378
tes

 40%|████████████████████████████                                          | 12/30 [1:59:28<2:59:37, 598.75s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
13th- epoch: 0, train_loss = 108.92297939956188, train_acc = 0.7805076851420587
test Acc 0.8691806331471136:
13th- epoch: 1, train_loss = 40.389610439538956, train_acc = 0.9158127619934793
test Acc 0.9068901303538175:
13th- epoch: 2, train_loss = 29.37217888981104, train_acc = 0.94014904517932
test Acc 0.9278398510242085:
13th- epoch: 3, train_loss = 23.99834307655692, train_acc = 0.952491849091756
test Acc 0.9380819366852886:
13th- epoch: 4, train_loss = 20.61295384913683, train_acc = 0.9613414066138798
test Acc 0.9441340782122905:
13th- epoch: 5, train_loss = 18.212854601442814, train_acc = 0.966115510013973


13th- epoch: 145, train_loss = 1.5844788948306814, train_acc = 0.9969725197950629
test Acc 0.9771880819366853:
13th- epoch: 146, train_loss = 1.5789760574698448, train_acc = 0.9969725197950629
test Acc 0.9771880819366853:
13th- epoch: 147, train_loss = 1.5731544382870197, train_acc = 0.9969725197950629
test Acc 0.9771880819366853:
13th- epoch: 148, train_loss = 1.5676388057181612, train_acc = 0.9969725197950629
test Acc 0.9771880819366853:
13th- epoch: 149, train_loss = 1.5617284575710073, train_acc = 0.9969725197950629
test Acc 0.9771880819366853:
13th- epoch: 150, train_loss = 1.5565433166921139, train_acc = 0.9969725197950629
test Acc 0.9771880819366853:
13th- epoch: 151, train_loss = 1.5507009712746367, train_acc = 0.9969725197950629
test Acc 0.9771880819366853:
13th- epoch: 152, train_loss = 1.545859932899475, train_acc = 0.9969725197950629
test Acc 0.9771880819366853:
13th- epoch: 153, train_loss = 1.5403962507843971, train_acc = 0.9969725197950629
test Acc 0.9771880819366853:
13

13th- epoch: 292, train_loss = 1.1553907406632788, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
13th- epoch: 293, train_loss = 1.1536223205621354, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
13th- epoch: 294, train_loss = 1.1521571427583694, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
13th- epoch: 295, train_loss = 1.1506712337140925, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
13th- epoch: 296, train_loss = 1.1487716932897456, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
13th- epoch: 297, train_loss = 1.1474685830180533, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
13th- epoch: 298, train_loss = 1.146177978545893, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
13th- epoch: 299, train_loss = 1.1443348589236848, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
13th- epoch: 300, train_loss = 1.1428366489708424, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
13

test Acc 0.9776536312849162:
13th- epoch: 440, train_loss = 0.9952123438415583, train_acc = 0.9974382859804378
test Acc 0.9776536312849162:
13th- epoch: 441, train_loss = 0.9948104421200696, train_acc = 0.9974382859804378
test Acc 0.9776536312849162:
13th- epoch: 442, train_loss = 0.9936769815685693, train_acc = 0.9974382859804378
test Acc 0.9776536312849162:
13th- epoch: 443, train_loss = 0.9928094359638635, train_acc = 0.9974382859804378
test Acc 0.9776536312849162:
13th- epoch: 444, train_loss = 0.9926367253065109, train_acc = 0.9974382859804378
test Acc 0.9776536312849162:
13th- epoch: 445, train_loss = 0.9917144812643528, train_acc = 0.9974382859804378
test Acc 0.9776536312849162:
13th- epoch: 446, train_loss = 0.9908435357210692, train_acc = 0.9974382859804378
test Acc 0.9776536312849162:
13th- epoch: 447, train_loss = 0.9897334910929203, train_acc = 0.9974382859804378
test Acc 0.9776536312849162:
13th- epoch: 448, train_loss = 0.9895234940049704, train_acc = 0.9974382859804378
t

 43%|██████████████████████████████▎                                       | 13/30 [2:09:27<2:49:42, 598.99s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
14th- epoch: 0, train_loss = 131.23634496331215, train_acc = 0.7652538425710294
test Acc 0.8594040968342644:
14th- epoch: 1, train_loss = 42.364793978631496, train_acc = 0.9092920353982301
test Acc 0.9157355679702048:
14th- epoch: 2, train_loss = 30.22188837081194, train_acc = 0.9371215649743828
test Acc 0.9315642458100558:
14th- epoch: 3, train_loss = 24.338241264224052, train_acc = 0.9507452258965999
test Acc 0.9441340782122905:
14th- epoch: 4, train_loss = 20.639132395386696, train_acc = 0.9579646017699115
test Acc 0.9478584729981379:
14th- epoch: 5, train_loss = 17.95643488690257, train_acc = 0.962505822077

14th- epoch: 145, train_loss = 1.6415602192282677, train_acc = 0.9975547275267815
test Acc 0.9771880819366853:
14th- epoch: 146, train_loss = 1.6359527023741975, train_acc = 0.9975547275267815
test Acc 0.9771880819366853:
14th- epoch: 147, train_loss = 1.6294344825437292, train_acc = 0.9976711690731253
test Acc 0.9771880819366853:
14th- epoch: 148, train_loss = 1.6241572486469522, train_acc = 0.9976711690731253
test Acc 0.9771880819366853:
14th- epoch: 149, train_loss = 1.6177516641328111, train_acc = 0.9976711690731253
test Acc 0.9771880819366853:
14th- epoch: 150, train_loss = 1.6121016269316897, train_acc = 0.9976711690731253
test Acc 0.9771880819366853:
14th- epoch: 151, train_loss = 1.6065725249936804, train_acc = 0.9976711690731253
test Acc 0.9771880819366853:
14th- epoch: 152, train_loss = 1.6011579036712646, train_acc = 0.9976711690731253
test Acc 0.9771880819366853:
14th- epoch: 153, train_loss = 1.5954249961068854, train_acc = 0.9976711690731253
test Acc 0.9771880819366853:
1

14th- epoch: 292, train_loss = 1.1829645931720734, train_acc = 0.9977876106194691
test Acc 0.9781191806331471:
14th- epoch: 293, train_loss = 1.181592758744955, train_acc = 0.9977876106194691
test Acc 0.9781191806331471:
14th- epoch: 294, train_loss = 1.179673397273291, train_acc = 0.9977876106194691
test Acc 0.9781191806331471:
14th- epoch: 295, train_loss = 1.1783541962504387, train_acc = 0.9977876106194691
test Acc 0.9781191806331471:
14th- epoch: 296, train_loss = 1.1769226889009587, train_acc = 0.9977876106194691
test Acc 0.9781191806331471:
14th- epoch: 297, train_loss = 1.1749358561937697, train_acc = 0.9977876106194691
test Acc 0.9781191806331471:
14th- epoch: 298, train_loss = 1.1735576465725899, train_acc = 0.9977876106194691
test Acc 0.9781191806331471:
14th- epoch: 299, train_loss = 1.172037957876455, train_acc = 0.9977876106194691
test Acc 0.9781191806331471:
14th- epoch: 300, train_loss = 1.170341829478275, train_acc = 0.9977876106194691
test Acc 0.9781191806331471:
14th-

14th- epoch: 440, train_loss = 1.0164442608656827, train_acc = 0.9979040521658128
test Acc 0.9795158286778398:
14th- epoch: 441, train_loss = 1.0149309436383191, train_acc = 0.9979040521658128
test Acc 0.9795158286778398:
14th- epoch: 442, train_loss = 1.0144816065730993, train_acc = 0.9979040521658128
test Acc 0.9795158286778398:
14th- epoch: 443, train_loss = 1.0138240829110146, train_acc = 0.9979040521658128
test Acc 0.9795158286778398:
14th- epoch: 444, train_loss = 1.0126566824910697, train_acc = 0.9979040521658128
test Acc 0.9795158286778398:
14th- epoch: 445, train_loss = 1.0120658961532172, train_acc = 0.9979040521658128
test Acc 0.9795158286778398:
14th- epoch: 446, train_loss = 1.0109598698618356, train_acc = 0.9979040521658128
test Acc 0.9795158286778398:
14th- epoch: 447, train_loss = 1.0108211636543274, train_acc = 0.9979040521658128
test Acc 0.9795158286778398:
14th- epoch: 448, train_loss = 1.0096729596552905, train_acc = 0.9979040521658128
test Acc 0.9795158286778398:
1

 47%|████████████████████████████████▋                                     | 14/30 [2:19:26<2:39:44, 599.03s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
15th- epoch: 0, train_loss = 127.47455484420061, train_acc = 0.778178854215184
test Acc 0.8794227188081937:
15th- epoch: 1, train_loss = 44.195656921714544, train_acc = 0.9101071262226362
test Acc 0.9213221601489758:
15th- epoch: 2, train_loss = 31.501319527626038, train_acc = 0.9358407079646017
test Acc 0.9338919925512105:
15th- epoch: 3, train_loss = 25.172774486243725, train_acc = 0.9496972519795063
test Acc 0.9408752327746741:
15th- epoch: 4, train_loss = 21.25533981062472, train_acc = 0.9577317186772241
test Acc 0.9459962756052142:
15th- epoch: 5, train_loss = 18.544415282085538, train_acc = 0.962971588262

15th- epoch: 146, train_loss = 1.5704411529004574, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
15th- epoch: 147, train_loss = 1.564682848751545, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
15th- epoch: 148, train_loss = 1.5602754863793962, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
15th- epoch: 149, train_loss = 1.5554269713466056, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
15th- epoch: 150, train_loss = 1.549962607503403, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
15th- epoch: 151, train_loss = 1.5453662537038326, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
15th- epoch: 152, train_loss = 1.54094797372818, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
15th- epoch: 153, train_loss = 1.535481158643961, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
15th- epoch: 154, train_loss = 1.531936610757839, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
15th- e

15th- epoch: 294, train_loss = 1.1706697406771127, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
15th- epoch: 295, train_loss = 1.1688834950327873, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
15th- epoch: 296, train_loss = 1.1681394862680463, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
15th- epoch: 297, train_loss = 1.166274480521679, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
15th- epoch: 298, train_loss = 1.1650251398532419, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
15th- epoch: 299, train_loss = 1.1631912887096405, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
15th- epoch: 300, train_loss = 1.1625528571457835, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
15th- epoch: 301, train_loss = 1.1605699732899666, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
15th- epoch: 302, train_loss = 1.1590584379882785, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
15

15th- epoch: 441, train_loss = 1.015742248542665, train_acc = 0.9976711690731253
test Acc 0.9813780260707635:
15th- epoch: 442, train_loss = 1.0154926764444099, train_acc = 0.9976711690731253
test Acc 0.9813780260707635:
15th- epoch: 443, train_loss = 1.0149461564942612, train_acc = 0.9976711690731253
test Acc 0.9813780260707635:
15th- epoch: 444, train_loss = 1.013702737785934, train_acc = 0.9976711690731253
test Acc 0.9813780260707635:
15th- epoch: 445, train_loss = 1.0134281391874538, train_acc = 0.9976711690731253
test Acc 0.9813780260707635:
15th- epoch: 446, train_loss = 1.0125953083261265, train_acc = 0.9976711690731253
test Acc 0.9813780260707635:
15th- epoch: 447, train_loss = 1.0115924651399837, train_acc = 0.9976711690731253
test Acc 0.9813780260707635:
15th- epoch: 448, train_loss = 1.010551551975368, train_acc = 0.9976711690731253
test Acc 0.9813780260707635:
15th- epoch: 449, train_loss = 1.0110094683841453, train_acc = 0.9976711690731253
test Acc 0.9813780260707635:
15th

 50%|███████████████████████████████████                                   | 15/30 [2:29:26<2:29:47, 599.18s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
16th- epoch: 0, train_loss = 126.53203892707825, train_acc = 0.7633907778295296
test Acc 0.8770949720670391:
16th- epoch: 1, train_loss = 43.34786815196276, train_acc = 0.9113879832324173
test Acc 0.9129422718808193:
16th- epoch: 2, train_loss = 31.128815229982138, train_acc = 0.9386353050768514
test Acc 0.9297020484171322:
16th- epoch: 3, train_loss = 25.101302661001682, train_acc = 0.9509781089892874
test Acc 0.9436685288640596:
16th- epoch: 4, train_loss = 21.303765315562487, train_acc = 0.9587796925943176
test Acc 0.9506517690875232:
16th- epoch: 5, train_loss = 18.627039212733507, train_acc = 0.96343735444

16th- epoch: 145, train_loss = 1.5369437547633424, train_acc = 0.9972054028877504
test Acc 0.9776536312849162:
16th- epoch: 146, train_loss = 1.5315838605165482, train_acc = 0.9972054028877504
test Acc 0.9776536312849162:
16th- epoch: 147, train_loss = 1.52669398766011, train_acc = 0.9972054028877504
test Acc 0.9776536312849162:
16th- epoch: 148, train_loss = 1.5209107244154438, train_acc = 0.9972054028877504
test Acc 0.9776536312849162:
16th- epoch: 149, train_loss = 1.5160065429518, train_acc = 0.9972054028877504
test Acc 0.9776536312849162:
16th- epoch: 150, train_loss = 1.5105823893100023, train_acc = 0.9972054028877504
test Acc 0.9776536312849162:
16th- epoch: 151, train_loss = 1.505395925254561, train_acc = 0.9972054028877504
test Acc 0.9776536312849162:
16th- epoch: 152, train_loss = 1.5003123419592157, train_acc = 0.9972054028877504
test Acc 0.9776536312849162:
16th- epoch: 153, train_loss = 1.4945966834202409, train_acc = 0.9972054028877504
test Acc 0.9776536312849162:
16th- e

16th- epoch: 293, train_loss = 1.1241378380800597, train_acc = 0.9974382859804378
test Acc 0.9781191806331471:
16th- epoch: 294, train_loss = 1.1228476439719088, train_acc = 0.9974382859804378
test Acc 0.9776536312849162:
16th- epoch: 295, train_loss = 1.1217579450458288, train_acc = 0.9974382859804378
test Acc 0.9781191806331471:
16th- epoch: 296, train_loss = 1.1203181675518863, train_acc = 0.9974382859804378
test Acc 0.9781191806331471:
16th- epoch: 297, train_loss = 1.1182552054524422, train_acc = 0.9974382859804378
test Acc 0.9776536312849162:
16th- epoch: 298, train_loss = 1.1168269726331346, train_acc = 0.9974382859804378
test Acc 0.9781191806331471:
16th- epoch: 299, train_loss = 1.1154573056846857, train_acc = 0.9974382859804378
test Acc 0.9781191806331471:
16th- epoch: 300, train_loss = 1.1141225583851337, train_acc = 0.9974382859804378
test Acc 0.9781191806331471:
16th- epoch: 301, train_loss = 1.1138184436713345, train_acc = 0.9974382859804378
test Acc 0.9781191806331471:
1

16th- epoch: 440, train_loss = 0.9751678550092038, train_acc = 0.9975547275267815
test Acc 0.9776536312849162:
16th- epoch: 441, train_loss = 0.9751182440668344, train_acc = 0.9975547275267815
test Acc 0.9776536312849162:
16th- epoch: 442, train_loss = 0.9738943794218358, train_acc = 0.9975547275267815
test Acc 0.9776536312849162:
16th- epoch: 443, train_loss = 0.9731061744096223, train_acc = 0.9975547275267815
test Acc 0.9776536312849162:
16th- epoch: 444, train_loss = 0.9725883460196201, train_acc = 0.9975547275267815
test Acc 0.9776536312849162:
16th- epoch: 445, train_loss = 0.9717762277869042, train_acc = 0.9975547275267815
test Acc 0.9776536312849162:
16th- epoch: 446, train_loss = 0.9701319870946463, train_acc = 0.9975547275267815
test Acc 0.9776536312849162:
16th- epoch: 447, train_loss = 0.9700790401548147, train_acc = 0.9975547275267815
test Acc 0.9771880819366853:
16th- epoch: 448, train_loss = 0.9692693749966566, train_acc = 0.9975547275267815
test Acc 0.9771880819366853:
1

 53%|█████████████████████████████████████▎                                | 16/30 [2:39:23<2:19:41, 598.69s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
17th- epoch: 0, train_loss = 114.40539652109146, train_acc = 0.7887750349324639
test Acc 0.8696461824953445:
17th- epoch: 1, train_loss = 43.87324829399586, train_acc = 0.9089427107591989
test Acc 0.9194599627560521:
17th- epoch: 2, train_loss = 31.612607523798943, train_acc = 0.9365393572426641
test Acc 0.931098696461825:
17th- epoch: 3, train_loss = 25.25949202850461, train_acc = 0.9470190964136004
test Acc 0.9390130353817505:
17th- epoch: 4, train_loss = 21.158839901909232, train_acc = 0.9554028877503493
test Acc 0.9422718808193669:
17th- epoch: 5, train_loss = 18.32203887589276, train_acc = 0.96145784816022

17th- epoch: 146, train_loss = 1.5387059536296874, train_acc = 0.9969725197950629
test Acc 0.9771880819366853:
17th- epoch: 147, train_loss = 1.5338269744534045, train_acc = 0.9969725197950629
test Acc 0.9776536312849162:
17th- epoch: 148, train_loss = 1.5282730776816607, train_acc = 0.9969725197950629
test Acc 0.9776536312849162:
17th- epoch: 149, train_loss = 1.5231091224122792, train_acc = 0.9969725197950629
test Acc 0.9776536312849162:
17th- epoch: 150, train_loss = 1.5178906694054604, train_acc = 0.9969725197950629
test Acc 0.9776536312849162:
17th- epoch: 151, train_loss = 1.5129271186888218, train_acc = 0.9969725197950629
test Acc 0.9776536312849162:
17th- epoch: 152, train_loss = 1.5074541978538036, train_acc = 0.9969725197950629
test Acc 0.9776536312849162:
17th- epoch: 153, train_loss = 1.503076716675423, train_acc = 0.9969725197950629
test Acc 0.9776536312849162:
17th- epoch: 154, train_loss = 1.4974065590649843, train_acc = 0.9969725197950629
test Acc 0.9776536312849162:
17

17th- epoch: 294, train_loss = 1.1280643318896182, train_acc = 0.9972054028877504
test Acc 0.9781191806331471:
17th- epoch: 295, train_loss = 1.127035714685917, train_acc = 0.9972054028877504
test Acc 0.9781191806331471:
17th- epoch: 296, train_loss = 1.1253476304118522, train_acc = 0.9972054028877504
test Acc 0.9781191806331471:
17th- epoch: 297, train_loss = 1.1240893540089019, train_acc = 0.9972054028877504
test Acc 0.9781191806331471:
17th- epoch: 298, train_loss = 1.1221339876647107, train_acc = 0.9972054028877504
test Acc 0.9781191806331471:
17th- epoch: 299, train_loss = 1.120490641624201, train_acc = 0.9972054028877504
test Acc 0.9781191806331471:
17th- epoch: 300, train_loss = 1.1194450557231903, train_acc = 0.9972054028877504
test Acc 0.9781191806331471:
17th- epoch: 301, train_loss = 1.1177475092117675, train_acc = 0.9972054028877504
test Acc 0.9781191806331471:
17th- epoch: 302, train_loss = 1.1167524109478109, train_acc = 0.9972054028877504
test Acc 0.9781191806331471:
17t

17th- epoch: 442, train_loss = 0.9771646695735399, train_acc = 0.9973218444340941
test Acc 0.9781191806331471:
17th- epoch: 443, train_loss = 0.9766312974097673, train_acc = 0.9973218444340941
test Acc 0.9781191806331471:
17th- epoch: 444, train_loss = 0.9763335722091142, train_acc = 0.9973218444340941
test Acc 0.978584729981378:
17th- epoch: 445, train_loss = 0.9753889391722623, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
17th- epoch: 446, train_loss = 0.9745545561017934, train_acc = 0.9973218444340941
test Acc 0.9781191806331471:
17th- epoch: 447, train_loss = 0.9736353854241315, train_acc = 0.9973218444340941
test Acc 0.9781191806331471:
17th- epoch: 448, train_loss = 0.9732190234062728, train_acc = 0.9974382859804378
test Acc 0.9781191806331471:
17th- epoch: 449, train_loss = 0.9722178354859352, train_acc = 0.9974382859804378
test Acc 0.9781191806331471:
17th- epoch: 450, train_loss = 0.9720549868943635, train_acc = 0.9974382859804378
test Acc 0.9781191806331471:
17t

 57%|███████████████████████████████████████▋                              | 17/30 [2:49:23<2:09:45, 598.88s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
18th- epoch: 0, train_loss = 114.45541493594646, train_acc = 0.7782952957615277
test Acc 0.8919925512104283:
18th- epoch: 1, train_loss = 44.26167467236519, train_acc = 0.9094084769445738
test Acc 0.9236499068901304:
18th- epoch: 2, train_loss = 32.07041832059622, train_acc = 0.9335118770377271
test Acc 0.9320297951582868:
18th- epoch: 3, train_loss = 26.002422146499157, train_acc = 0.9459711224965067
test Acc 0.9376163873370578:
18th- epoch: 4, train_loss = 22.08591390401125, train_acc = 0.9554028877503493
test Acc 0.9427374301675978:
18th- epoch: 5, train_loss = 19.235760431736708, train_acc = 0.9616907312529

18th- epoch: 145, train_loss = 1.5695761168608442, train_acc = 0.9970889613414066
test Acc 0.9781191806331471:
18th- epoch: 146, train_loss = 1.5636711729457602, train_acc = 0.9970889613414066
test Acc 0.9781191806331471:
18th- epoch: 147, train_loss = 1.5581247558584437, train_acc = 0.9970889613414066
test Acc 0.9781191806331471:
18th- epoch: 148, train_loss = 1.5527813894441351, train_acc = 0.9970889613414066
test Acc 0.9781191806331471:
18th- epoch: 149, train_loss = 1.547506413073279, train_acc = 0.9970889613414066
test Acc 0.9781191806331471:
18th- epoch: 150, train_loss = 1.542655477882363, train_acc = 0.9969725197950629
test Acc 0.9781191806331471:
18th- epoch: 151, train_loss = 1.5368550767889246, train_acc = 0.9969725197950629
test Acc 0.9781191806331471:
18th- epoch: 152, train_loss = 1.5312280046055093, train_acc = 0.9970889613414066
test Acc 0.9781191806331471:
18th- epoch: 153, train_loss = 1.5266831616172567, train_acc = 0.9970889613414066
test Acc 0.9781191806331471:
18t

test Acc 0.9813780260707635:
18th- epoch: 293, train_loss = 1.141101115674246, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
18th- epoch: 294, train_loss = 1.1393364680116065, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
18th- epoch: 295, train_loss = 1.1378508235211484, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
18th- epoch: 296, train_loss = 1.1363596506416798, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
18th- epoch: 297, train_loss = 1.1346702724695206, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
18th- epoch: 298, train_loss = 1.1326524739270099, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
18th- epoch: 299, train_loss = 1.132029237865936, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
18th- epoch: 300, train_loss = 1.129818458110094, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
18th- epoch: 301, train_loss = 1.128423682122957, train_acc = 0.9973218444340941
test 

18th- epoch: 440, train_loss = 0.9841280865075532, train_acc = 0.9974382859804378
test Acc 0.9818435754189944:
18th- epoch: 441, train_loss = 0.983550414443016, train_acc = 0.9974382859804378
test Acc 0.9818435754189944:
18th- epoch: 442, train_loss = 0.9829999369976576, train_acc = 0.9974382859804378
test Acc 0.9818435754189944:
18th- epoch: 443, train_loss = 0.9828201197087765, train_acc = 0.9974382859804378
test Acc 0.9818435754189944:
18th- epoch: 444, train_loss = 0.9809852453472558, train_acc = 0.9974382859804378
test Acc 0.9818435754189944:
18th- epoch: 445, train_loss = 0.9808145612478256, train_acc = 0.9974382859804378
test Acc 0.9818435754189944:
18th- epoch: 446, train_loss = 0.9798801305296365, train_acc = 0.9974382859804378
test Acc 0.9818435754189944:
18th- epoch: 447, train_loss = 0.9792983370425645, train_acc = 0.9974382859804378
test Acc 0.9818435754189944:
18th- epoch: 448, train_loss = 0.97850633165217, train_acc = 0.9974382859804378
test Acc 0.9818435754189944:
18th

 60%|██████████████████████████████████████████                            | 18/30 [2:59:22<1:59:47, 598.95s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
19th- epoch: 0, train_loss = 137.81563758850098, train_acc = 0.7649045179319981
test Acc 0.8435754189944135:
19th- epoch: 1, train_loss = 45.36756218969822, train_acc = 0.9077782952957615
test Acc 0.8868715083798883:
19th- epoch: 2, train_loss = 33.248519118875265, train_acc = 0.9346762925011645
test Acc 0.914804469273743:
19th- epoch: 3, train_loss = 27.022679667919874, train_acc = 0.9485328365160689
test Acc 0.9315642458100558:
19th- epoch: 4, train_loss = 23.01511850208044, train_acc = 0.9561015370284117
test Acc 0.9422718808193669:
19th- epoch: 5, train_loss = 20.135420406237245, train_acc = 0.9604098742431

test Acc 0.9823091247672253:
19th- epoch: 146, train_loss = 1.5414646279532462, train_acc = 0.9974382859804378
test Acc 0.9823091247672253:
19th- epoch: 147, train_loss = 1.536464219680056, train_acc = 0.9974382859804378
test Acc 0.9823091247672253:
19th- epoch: 148, train_loss = 1.5319612396415323, train_acc = 0.9974382859804378
test Acc 0.9823091247672253:
19th- epoch: 149, train_loss = 1.5262379811611027, train_acc = 0.9974382859804378
test Acc 0.9823091247672253:
19th- epoch: 150, train_loss = 1.5215948021505028, train_acc = 0.9974382859804378
test Acc 0.9823091247672253:
19th- epoch: 151, train_loss = 1.5163898898754269, train_acc = 0.9974382859804378
test Acc 0.9823091247672253:
19th- epoch: 152, train_loss = 1.5119648359250277, train_acc = 0.9974382859804378
test Acc 0.9823091247672253:
19th- epoch: 153, train_loss = 1.5067537734284997, train_acc = 0.9974382859804378
test Acc 0.9823091247672253:
19th- epoch: 154, train_loss = 1.5024538745637983, train_acc = 0.9974382859804378
te

test Acc 0.9832402234636871:
19th- epoch: 220, train_loss = 1.2844461239874363, train_acc = 0.9974382859804378
test Acc 0.9832402234636871:
19th- epoch: 221, train_loss = 1.2815198065945879, train_acc = 0.9974382859804378
test Acc 0.9832402234636871:
19th- epoch: 222, train_loss = 1.2796669671079144, train_acc = 0.9974382859804378
test Acc 0.9832402234636871:
19th- epoch: 223, train_loss = 1.2770974524319172, train_acc = 0.9974382859804378
test Acc 0.9832402234636871:
19th- epoch: 224, train_loss = 1.2744972854852676, train_acc = 0.9974382859804378
test Acc 0.9832402234636871:
19th- epoch: 225, train_loss = 1.2719718907028437, train_acc = 0.9974382859804378
test Acc 0.9832402234636871:
19th- epoch: 226, train_loss = 1.2701398668577895, train_acc = 0.9974382859804378
test Acc 0.9832402234636871:
19th- epoch: 227, train_loss = 1.2672723165014759, train_acc = 0.9974382859804378
test Acc 0.9832402234636871:
19th- epoch: 228, train_loss = 1.2657101905206218, train_acc = 0.9974382859804378
t

test Acc 0.9832402234636871:
19th- epoch: 367, train_loss = 1.0550396361504681, train_acc = 0.9977876106194691
test Acc 0.9832402234636871:
19th- epoch: 368, train_loss = 1.0533997646416537, train_acc = 0.9977876106194691
test Acc 0.9832402234636871:
19th- epoch: 369, train_loss = 1.0522582003031857, train_acc = 0.9977876106194691
test Acc 0.9832402234636871:
19th- epoch: 370, train_loss = 1.0511880572885275, train_acc = 0.9977876106194691
test Acc 0.9832402234636871:
19th- epoch: 371, train_loss = 1.050571583211422, train_acc = 0.9977876106194691
test Acc 0.9832402234636871:
19th- epoch: 372, train_loss = 1.0488683612202294, train_acc = 0.9977876106194691
test Acc 0.9832402234636871:
19th- epoch: 373, train_loss = 1.0481557585299015, train_acc = 0.9977876106194691
test Acc 0.9832402234636871:
19th- epoch: 374, train_loss = 1.046973502903711, train_acc = 0.9977876106194691
test Acc 0.9832402234636871:
19th- epoch: 375, train_loss = 1.046483501791954, train_acc = 0.9977876106194691
test

 63%|████████████████████████████████████████████▎                         | 19/30 [3:09:20<1:49:47, 598.86s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
20th- epoch: 0, train_loss = 115.24945767223835, train_acc = 0.7869119701909641
test Acc 0.8873370577281192:
20th- epoch: 1, train_loss = 40.71963457763195, train_acc = 0.9224499301350721
test Acc 0.9297020484171322:
20th- epoch: 2, train_loss = 29.916068241000175, train_acc = 0.9435258500232883
test Acc 0.9408752327746741:
20th- epoch: 3, train_loss = 24.512979693710804, train_acc = 0.9535398230088495
test Acc 0.9487895716945997:
20th- epoch: 4, train_loss = 20.972793359309435, train_acc = 0.9592454587796926
test Acc 0.957169459962756:
20th- epoch: 5, train_loss = 18.40068293735385, train_acc = 0.9634373544480

20th- epoch: 146, train_loss = 1.4721976656001061, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
20th- epoch: 147, train_loss = 1.4673811569809914, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
20th- epoch: 148, train_loss = 1.4625722442287952, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
20th- epoch: 149, train_loss = 1.4577567242085934, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
20th- epoch: 150, train_loss = 1.4533293310087174, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
20th- epoch: 151, train_loss = 1.4481996446847916, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
20th- epoch: 152, train_loss = 1.4438216488342732, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
20th- epoch: 153, train_loss = 1.438998925150372, train_acc = 0.9973218444340941
test Acc 0.9809124767225326:
20th- epoch: 154, train_loss = 1.4351504556834698, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
20

20th- epoch: 293, train_loss = 1.1030412974650972, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
20th- epoch: 294, train_loss = 1.1015741862356663, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
20th- epoch: 295, train_loss = 1.100625158578623, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
20th- epoch: 296, train_loss = 1.0990572609007359, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
20th- epoch: 297, train_loss = 1.0981341153383255, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
20th- epoch: 298, train_loss = 1.0961745877866633, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
20th- epoch: 299, train_loss = 1.095047913491726, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
20th- epoch: 300, train_loss = 1.093832179903984, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
20th- epoch: 301, train_loss = 1.0926806690986268, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
20th

20th- epoch: 367, train_loss = 1.021250817924738, train_acc = 0.9974382859804378
test Acc 0.9804469273743017:
20th- epoch: 368, train_loss = 1.0204770900309086, train_acc = 0.9974382859804378
test Acc 0.9804469273743017:
20th- epoch: 369, train_loss = 1.0198153667151928, train_acc = 0.9974382859804378
test Acc 0.9804469273743017:
20th- epoch: 370, train_loss = 1.0189218285377137, train_acc = 0.9974382859804378
test Acc 0.9804469273743017:
20th- epoch: 371, train_loss = 1.017832839221228, train_acc = 0.9974382859804378
test Acc 0.9804469273743017:
20th- epoch: 372, train_loss = 1.0166849456727505, train_acc = 0.9974382859804378
test Acc 0.9804469273743017:
20th- epoch: 373, train_loss = 1.0163638927042484, train_acc = 0.9974382859804378
test Acc 0.9804469273743017:
20th- epoch: 374, train_loss = 1.015044103085529, train_acc = 0.9974382859804378
test Acc 0.9804469273743017:
20th- epoch: 375, train_loss = 1.0147899563307874, train_acc = 0.9974382859804378
test Acc 0.9804469273743017:
20th

 67%|██████████████████████████████████████████████▋                       | 20/30 [3:19:20<1:39:50, 599.06s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
21th- epoch: 0, train_loss = 139.0367359444499, train_acc = 0.7524452724732185
test Acc 0.8794227188081937:
21th- epoch: 1, train_loss = 44.29526772350073, train_acc = 0.9105728924080112
test Acc 0.9180633147113594:
21th- epoch: 2, train_loss = 31.85752570256591, train_acc = 0.9381695388914765
test Acc 0.9269087523277467:
21th- epoch: 3, train_loss = 25.609631817787886, train_acc = 0.9493479273404751
test Acc 0.9366852886405959:
21th- epoch: 4, train_loss = 21.668907333165407, train_acc = 0.9577317186772241
test Acc 0.9432029795158287:
21th- epoch: 5, train_loss = 18.82619269937277, train_acc = 0.96320447135537

21th- epoch: 145, train_loss = 1.5437512969365343, train_acc = 0.9970889613414066
test Acc 0.9818435754189944:
21th- epoch: 146, train_loss = 1.5383742563426495, train_acc = 0.9970889613414066
test Acc 0.9818435754189944:
21th- epoch: 147, train_loss = 1.5335645253071561, train_acc = 0.9970889613414066
test Acc 0.9818435754189944:
21th- epoch: 148, train_loss = 1.5272890975465998, train_acc = 0.9970889613414066
test Acc 0.9818435754189944:
21th- epoch: 149, train_loss = 1.5228893905878067, train_acc = 0.9970889613414066
test Acc 0.9818435754189944:
21th- epoch: 150, train_loss = 1.517749579041265, train_acc = 0.9970889613414066
test Acc 0.9818435754189944:
21th- epoch: 151, train_loss = 1.5128928931662813, train_acc = 0.9970889613414066
test Acc 0.9818435754189944:
21th- epoch: 152, train_loss = 1.5082593919942155, train_acc = 0.9970889613414066
test Acc 0.9818435754189944:
21th- epoch: 153, train_loss = 1.5030267536640167, train_acc = 0.9970889613414066
test Acc 0.9818435754189944:
21

21th- epoch: 219, train_loss = 1.2777752950787544, train_acc = 0.9973218444340941
test Acc 0.9818435754189944:
21th- epoch: 220, train_loss = 1.275747346400749, train_acc = 0.9973218444340941
test Acc 0.9818435754189944:
21th- epoch: 221, train_loss = 1.273087517649401, train_acc = 0.9973218444340941
test Acc 0.9818435754189944:
21th- epoch: 222, train_loss = 1.2709169052541256, train_acc = 0.9973218444340941
test Acc 0.9818435754189944:
21th- epoch: 223, train_loss = 1.2688736828858964, train_acc = 0.9973218444340941
test Acc 0.9818435754189944:
21th- epoch: 224, train_loss = 1.2660465960507281, train_acc = 0.9973218444340941
test Acc 0.9818435754189944:
21th- epoch: 225, train_loss = 1.2639687334303744, train_acc = 0.9973218444340941
test Acc 0.9818435754189944:
21th- epoch: 226, train_loss = 1.2614648279850371, train_acc = 0.9973218444340941
test Acc 0.9818435754189944:
21th- epoch: 227, train_loss = 1.2598201123182662, train_acc = 0.9973218444340941
test Acc 0.9818435754189944:
21t

test Acc 0.9818435754189944:
21th- epoch: 367, train_loss = 1.04861076301313, train_acc = 0.9973218444340941
test Acc 0.9818435754189944:
21th- epoch: 368, train_loss = 1.048180670797592, train_acc = 0.9973218444340941
test Acc 0.9818435754189944:
21th- epoch: 369, train_loss = 1.0470978766679764, train_acc = 0.9973218444340941
test Acc 0.9818435754189944:
21th- epoch: 370, train_loss = 1.0457127963600215, train_acc = 0.9973218444340941
test Acc 0.9818435754189944:
21th- epoch: 371, train_loss = 1.0446343955991324, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
21th- epoch: 372, train_loss = 1.0444553308188915, train_acc = 0.9973218444340941
test Acc 0.9818435754189944:
21th- epoch: 373, train_loss = 1.0429761645791586, train_acc = 0.9973218444340941
test Acc 0.9818435754189944:
21th- epoch: 374, train_loss = 1.0422206012008246, train_acc = 0.9973218444340941
test Acc 0.9818435754189944:
21th- epoch: 375, train_loss = 1.040926376968855, train_acc = 0.9973218444340941
test 

 70%|█████████████████████████████████████████████████                     | 21/30 [3:29:20<1:29:55, 599.45s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
22th- epoch: 0, train_loss = 139.52416820824146, train_acc = 0.7582673497904052
test Acc 0.8710428305400373:
22th- epoch: 1, train_loss = 46.42191171646118, train_acc = 0.904052165812762
test Acc 0.9129422718808193:
22th- epoch: 2, train_loss = 33.00591354072094, train_acc = 0.9329296693060084
test Acc 0.9259776536312849:
22th- epoch: 3, train_loss = 26.503715604543686, train_acc = 0.9451560316721006
test Acc 0.9366852886405959:
22th- epoch: 4, train_loss = 22.432009052485228, train_acc = 0.9536562645551933
test Acc 0.9450651769087524:
22th- epoch: 5, train_loss = 19.57628185302019, train_acc = 0.96122496506753

22th- epoch: 146, train_loss = 1.6234012295026332, train_acc = 0.9972054028877504
test Acc 0.9757914338919925:
22th- epoch: 147, train_loss = 1.6171724896412343, train_acc = 0.9972054028877504
test Acc 0.9762569832402235:
22th- epoch: 148, train_loss = 1.6110930442810059, train_acc = 0.9972054028877504
test Acc 0.9757914338919925:
22th- epoch: 149, train_loss = 1.6053552452940494, train_acc = 0.9972054028877504
test Acc 0.9762569832402235:
22th- epoch: 150, train_loss = 1.5995257075410336, train_acc = 0.9972054028877504
test Acc 0.9762569832402235:
22th- epoch: 151, train_loss = 1.5941373507957906, train_acc = 0.9972054028877504
test Acc 0.9762569832402235:
22th- epoch: 152, train_loss = 1.5881411533337086, train_acc = 0.9972054028877504
test Acc 0.9757914338919925:
22th- epoch: 153, train_loss = 1.5820312935393304, train_acc = 0.9972054028877504
test Acc 0.9757914338919925:
22th- epoch: 154, train_loss = 1.577406057389453, train_acc = 0.9972054028877504
test Acc 0.9757914338919925:
22

test Acc 0.9776536312849162:
22th- epoch: 294, train_loss = 1.1688553392887115, train_acc = 0.9973218444340941
test Acc 0.9776536312849162:
22th- epoch: 295, train_loss = 1.1672530720825307, train_acc = 0.9973218444340941
test Acc 0.9776536312849162:
22th- epoch: 296, train_loss = 1.1653773399884813, train_acc = 0.9973218444340941
test Acc 0.9776536312849162:
22th- epoch: 297, train_loss = 1.1638780261273496, train_acc = 0.9973218444340941
test Acc 0.9776536312849162:
22th- epoch: 298, train_loss = 1.1624545330996625, train_acc = 0.9973218444340941
test Acc 0.9776536312849162:
22th- epoch: 299, train_loss = 1.1609785370528698, train_acc = 0.9973218444340941
test Acc 0.9776536312849162:
22th- epoch: 300, train_loss = 1.1593738198280334, train_acc = 0.9973218444340941
test Acc 0.9776536312849162:
22th- epoch: 301, train_loss = 1.159057229757309, train_acc = 0.9973218444340941
test Acc 0.9776536312849162:
22th- epoch: 302, train_loss = 1.1564142939751036, train_acc = 0.9973218444340941
te

22th- epoch: 442, train_loss = 1.0063363760709763, train_acc = 0.9973218444340941
test Acc 0.978584729981378:
22th- epoch: 443, train_loss = 1.0048061596753541, train_acc = 0.9973218444340941
test Acc 0.978584729981378:
22th- epoch: 444, train_loss = 1.0047062461671885, train_acc = 0.9973218444340941
test Acc 0.978584729981378:
22th- epoch: 445, train_loss = 1.0028232298791409, train_acc = 0.9973218444340941
test Acc 0.978584729981378:
22th- epoch: 446, train_loss = 1.0031251510081347, train_acc = 0.9973218444340941
test Acc 0.978584729981378:
22th- epoch: 447, train_loss = 1.0018576507864054, train_acc = 0.9973218444340941
test Acc 0.978584729981378:
22th- epoch: 448, train_loss = 1.0016488606634084, train_acc = 0.9973218444340941
test Acc 0.978584729981378:
22th- epoch: 449, train_loss = 0.9999815411865711, train_acc = 0.9973218444340941
test Acc 0.978584729981378:
22th- epoch: 450, train_loss = 1.0002166479825974, train_acc = 0.9973218444340941
test Acc 0.978584729981378:
22th- epoc

 73%|███████████████████████████████████████████████████▎                  | 22/30 [3:39:20<1:19:57, 599.63s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
23th- epoch: 0, train_loss = 126.42875200510025, train_acc = 0.7682813227759665
test Acc 0.8822160148975792:
23th- epoch: 1, train_loss = 45.097257524728775, train_acc = 0.9095249184909175
test Acc 0.9241154562383612:
23th- epoch: 2, train_loss = 32.96508913487196, train_acc = 0.9344434094084769
test Acc 0.9385474860335196:
23th- epoch: 3, train_loss = 26.755202628672123, train_acc = 0.9474848625989754
test Acc 0.9450651769087524:
23th- epoch: 4, train_loss = 22.81513339281082, train_acc = 0.9556357708430367
test Acc 0.9483240223463687:
23th- epoch: 5, train_loss = 19.990813095122576, train_acc = 0.961224965067

23th- epoch: 145, train_loss = 1.540206165285781, train_acc = 0.9972054028877504
test Acc 0.9809124767225326:
23th- epoch: 146, train_loss = 1.5350743632297963, train_acc = 0.9972054028877504
test Acc 0.9809124767225326:
23th- epoch: 147, train_loss = 1.529136101482436, train_acc = 0.9972054028877504
test Acc 0.9809124767225326:
23th- epoch: 148, train_loss = 1.5238012063782662, train_acc = 0.9972054028877504
test Acc 0.9809124767225326:
23th- epoch: 149, train_loss = 1.5191912837326527, train_acc = 0.9972054028877504
test Acc 0.9809124767225326:
23th- epoch: 150, train_loss = 1.5135752235073596, train_acc = 0.9972054028877504
test Acc 0.9809124767225326:
23th- epoch: 151, train_loss = 1.5088286934187636, train_acc = 0.9972054028877504
test Acc 0.9809124767225326:
23th- epoch: 152, train_loss = 1.5040850093355402, train_acc = 0.9972054028877504
test Acc 0.9809124767225326:
23th- epoch: 153, train_loss = 1.498827355564572, train_acc = 0.9972054028877504
test Acc 0.9809124767225326:
23th

test Acc 0.9813780260707635:
23th- epoch: 293, train_loss = 1.149513565003872, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
23th- epoch: 294, train_loss = 1.14854009822011, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
23th- epoch: 295, train_loss = 1.1466181625728495, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
23th- epoch: 296, train_loss = 1.145414188504219, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
23th- epoch: 297, train_loss = 1.1433092790539376, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
23th- epoch: 298, train_loss = 1.1422566597466357, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
23th- epoch: 299, train_loss = 1.1406195312738419, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
23th- epoch: 300, train_loss = 1.1396560805733316, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
23th- epoch: 301, train_loss = 1.1375092305243015, train_acc = 0.9973218444340941
test 

test Acc 0.9813780260707635:
23th- epoch: 367, train_loss = 1.0618472062051296, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
23th- epoch: 368, train_loss = 1.0621744468808174, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
23th- epoch: 369, train_loss = 1.0609476591343991, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
23th- epoch: 370, train_loss = 1.0596975634689443, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
23th- epoch: 371, train_loss = 1.0589581218664534, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
23th- epoch: 372, train_loss = 1.0575446474249475, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
23th- epoch: 373, train_loss = 1.0572012973134406, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
23th- epoch: 374, train_loss = 1.0557775770430453, train_acc = 0.9973218444340941
test Acc 0.9813780260707635:
23th- epoch: 375, train_loss = 1.0552113850717433, train_acc = 0.9973218444340941
t

 77%|█████████████████████████████████████████████████████▋                | 23/30 [3:49:21<1:09:59, 599.96s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
24th- epoch: 0, train_loss = 137.42208197712898, train_acc = 0.7686306474149976
test Acc 0.8850093109869647:
24th- epoch: 1, train_loss = 45.073923259973526, train_acc = 0.9106893339543549
test Acc 0.9152700186219739:
24th- epoch: 2, train_loss = 32.72907539829612, train_acc = 0.9345598509548206
test Acc 0.9287709497206704:
24th- epoch: 3, train_loss = 26.363103833049536, train_acc = 0.9452724732184443
test Acc 0.9418063314711359:
24th- epoch: 4, train_loss = 22.300114516168833, train_acc = 0.9540055891942245
test Acc 0.9473929236499069:
24th- epoch: 5, train_loss = 19.41576362401247, train_acc = 0.960526315789

24th- epoch: 146, train_loss = 1.5492344623198733, train_acc = 0.9973218444340941
test Acc 0.9757914338919925:
24th- epoch: 147, train_loss = 1.54324008023832, train_acc = 0.9973218444340941
test Acc 0.9757914338919925:
24th- epoch: 148, train_loss = 1.5378291172673926, train_acc = 0.9973218444340941
test Acc 0.9757914338919925:
24th- epoch: 149, train_loss = 1.5316209271550179, train_acc = 0.9973218444340941
test Acc 0.9757914338919925:
24th- epoch: 150, train_loss = 1.526660112082027, train_acc = 0.9973218444340941
test Acc 0.9757914338919925:
24th- epoch: 151, train_loss = 1.5204169489443302, train_acc = 0.9973218444340941
test Acc 0.9762569832402235:
24th- epoch: 152, train_loss = 1.5152099380502477, train_acc = 0.9973218444340941
test Acc 0.9762569832402235:
24th- epoch: 153, train_loss = 1.5094624845078215, train_acc = 0.9973218444340941
test Acc 0.9762569832402235:
24th- epoch: 154, train_loss = 1.5044082142412663, train_acc = 0.9973218444340941
test Acc 0.9762569832402235:
24th

24th- epoch: 293, train_loss = 1.123718739807373, train_acc = 0.9973218444340941
test Acc 0.9762569832402235:
24th- epoch: 294, train_loss = 1.122300195187563, train_acc = 0.9973218444340941
test Acc 0.9762569832402235:
24th- epoch: 295, train_loss = 1.1207364474830683, train_acc = 0.9973218444340941
test Acc 0.9762569832402235:
24th- epoch: 296, train_loss = 1.1193802542984486, train_acc = 0.9973218444340941
test Acc 0.9762569832402235:
24th- epoch: 297, train_loss = 1.11789140602923, train_acc = 0.9973218444340941
test Acc 0.9762569832402235:
24th- epoch: 298, train_loss = 1.1164186944661196, train_acc = 0.9973218444340941
test Acc 0.9762569832402235:
24th- epoch: 299, train_loss = 1.1150457163748797, train_acc = 0.9973218444340941
test Acc 0.9762569832402235:
24th- epoch: 300, train_loss = 1.1130405118165072, train_acc = 0.9974382859804378
test Acc 0.9762569832402235:
24th- epoch: 301, train_loss = 1.1112248239514884, train_acc = 0.9974382859804378
test Acc 0.9762569832402235:
24th-

24th- epoch: 367, train_loss = 1.0324612843396608, train_acc = 0.9976711690731253
test Acc 0.9757914338919925:
24th- epoch: 368, train_loss = 1.0315739065408707, train_acc = 0.9976711690731253
test Acc 0.9762569832402235:
24th- epoch: 369, train_loss = 1.0300854345259722, train_acc = 0.9976711690731253
test Acc 0.9757914338919925:
24th- epoch: 370, train_loss = 1.029012775659794, train_acc = 0.9976711690731253
test Acc 0.9762569832402235:
24th- epoch: 371, train_loss = 1.0286954802868422, train_acc = 0.9976711690731253
test Acc 0.9762569832402235:
24th- epoch: 372, train_loss = 1.0270163491368294, train_acc = 0.9976711690731253
test Acc 0.9762569832402235:
24th- epoch: 373, train_loss = 1.0261609330773354, train_acc = 0.9976711690731253
test Acc 0.9757914338919925:
24th- epoch: 374, train_loss = 1.0258701319398824, train_acc = 0.9976711690731253
test Acc 0.9762569832402235:
24th- epoch: 375, train_loss = 1.0244514929654542, train_acc = 0.9976711690731253
test Acc 0.9762569832402235:
24

 80%|████████████████████████████████████████████████████████              | 24/30 [3:59:21<1:00:00, 600.04s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
25th- epoch: 0, train_loss = 138.33161522448063, train_acc = 0.7538425710293433
test Acc 0.8701117318435754:
25th- epoch: 1, train_loss = 42.922269247472286, train_acc = 0.907545412203074
test Acc 0.9227188081936686:
25th- epoch: 2, train_loss = 30.127762608230114, train_acc = 0.935724266418258
test Acc 0.9418063314711359:
25th- epoch: 3, train_loss = 24.030582323670387, train_acc = 0.9491150442477876
test Acc 0.9483240223463687:
25th- epoch: 4, train_loss = 20.26810473576188, train_acc = 0.9572659524918491
test Acc 0.9534450651769087:
25th- epoch: 5, train_loss = 17.64822068065405, train_acc = 0.96413600372612

25th- epoch: 146, train_loss = 1.5098048573127016, train_acc = 0.9974382859804378
test Acc 0.9795158286778398:
25th- epoch: 147, train_loss = 1.5052157193422318, train_acc = 0.9974382859804378
test Acc 0.9795158286778398:
25th- epoch: 148, train_loss = 1.5002997206756845, train_acc = 0.9974382859804378
test Acc 0.9804469273743017:
25th- epoch: 149, train_loss = 1.4952170526375994, train_acc = 0.9974382859804378
test Acc 0.9799813780260708:
25th- epoch: 150, train_loss = 1.4907836044440046, train_acc = 0.9974382859804378
test Acc 0.9804469273743017:
25th- epoch: 151, train_loss = 1.4859527312219143, train_acc = 0.9974382859804378
test Acc 0.9804469273743017:
25th- epoch: 152, train_loss = 1.4813822557916865, train_acc = 0.9974382859804378
test Acc 0.9804469273743017:
25th- epoch: 153, train_loss = 1.4763168841600418, train_acc = 0.9974382859804378
test Acc 0.9799813780260708:
25th- epoch: 154, train_loss = 1.4716570638120174, train_acc = 0.9974382859804378
test Acc 0.9799813780260708:
2

25th- epoch: 220, train_loss = 1.2570204213261604, train_acc = 0.9973218444340941
test Acc 0.9804469273743017:
25th- epoch: 221, train_loss = 1.2545391581952572, train_acc = 0.9973218444340941
test Acc 0.9804469273743017:
25th- epoch: 222, train_loss = 1.2533486361498944, train_acc = 0.9973218444340941
test Acc 0.9804469273743017:
25th- epoch: 223, train_loss = 1.25100614503026, train_acc = 0.9972054028877504
test Acc 0.9804469273743017:
25th- epoch: 224, train_loss = 1.2486477333004586, train_acc = 0.9973218444340941
test Acc 0.9804469273743017:
25th- epoch: 225, train_loss = 1.2464118587668054, train_acc = 0.9973218444340941
test Acc 0.9804469273743017:
25th- epoch: 226, train_loss = 1.2435251213610172, train_acc = 0.9973218444340941
test Acc 0.9804469273743017:
25th- epoch: 227, train_loss = 1.241251161962282, train_acc = 0.9973218444340941
test Acc 0.9804469273743017:
25th- epoch: 228, train_loss = 1.239927377551794, train_acc = 0.9973218444340941
test Acc 0.9809124767225326:
25th-

test Acc 0.9809124767225326:
25th- epoch: 368, train_loss = 1.0401655261812266, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
25th- epoch: 369, train_loss = 1.0401201459171716, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
25th- epoch: 370, train_loss = 1.0387915236351546, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
25th- epoch: 371, train_loss = 1.0377385740575846, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
25th- epoch: 372, train_loss = 1.0371138701739255, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
25th- epoch: 373, train_loss = 1.036096140742302, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
25th- epoch: 374, train_loss = 1.034454744309187, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
25th- epoch: 375, train_loss = 1.0348518043756485, train_acc = 0.9974382859804378
test Acc 0.9809124767225326:
25th- epoch: 376, train_loss = 1.0326810727419797, train_acc = 0.9974382859804378
tes

 83%|████████████████████████████████████████████████████████████            | 25/30 [4:09:21<49:59, 599.99s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
26th- epoch: 0, train_loss = 117.53440274298191, train_acc = 0.7986725663716814
test Acc 0.8822160148975792:
26th- epoch: 1, train_loss = 41.28352787345648, train_acc = 0.9214019562179786
test Acc 0.9194599627560521:
26th- epoch: 2, train_loss = 30.401863306760788, train_acc = 0.9402654867256637
test Acc 0.9338919925512105:
26th- epoch: 3, train_loss = 24.629316225647926, train_acc = 0.9507452258965999
test Acc 0.9427374301675978:
26th- epoch: 4, train_loss = 20.80338730290532, train_acc = 0.9588961341406614
test Acc 0.9483240223463687:
26th- epoch: 5, train_loss = 18.049234628677368, train_acc = 0.964601769911

26th- epoch: 146, train_loss = 1.474029072909616, train_acc = 0.9970889613414066
test Acc 0.978584729981378:
26th- epoch: 147, train_loss = 1.4696301569929346, train_acc = 0.9970889613414066
test Acc 0.978584729981378:
26th- epoch: 148, train_loss = 1.465147795737721, train_acc = 0.9970889613414066
test Acc 0.978584729981378:
26th- epoch: 149, train_loss = 1.460497229010798, train_acc = 0.9970889613414066
test Acc 0.978584729981378:
26th- epoch: 150, train_loss = 1.4563804218778387, train_acc = 0.9970889613414066
test Acc 0.9781191806331471:
26th- epoch: 151, train_loss = 1.4520923495292664, train_acc = 0.9970889613414066
test Acc 0.978584729981378:
26th- epoch: 152, train_loss = 1.4475133419036865, train_acc = 0.9970889613414066
test Acc 0.9781191806331471:
26th- epoch: 153, train_loss = 1.4432771106949076, train_acc = 0.9970889613414066
test Acc 0.978584729981378:
26th- epoch: 154, train_loss = 1.439251055358909, train_acc = 0.9970889613414066
test Acc 0.978584729981378:
26th- epoch:

26th- epoch: 294, train_loss = 1.1150908296112902, train_acc = 0.9973218444340941
test Acc 0.9795158286778398:
26th- epoch: 295, train_loss = 1.1134378065471537, train_acc = 0.9973218444340941
test Acc 0.9795158286778398:
26th- epoch: 296, train_loss = 1.112073142081499, train_acc = 0.9973218444340941
test Acc 0.9795158286778398:
26th- epoch: 297, train_loss = 1.1109363946015947, train_acc = 0.9973218444340941
test Acc 0.9795158286778398:
26th- epoch: 298, train_loss = 1.1095160891418345, train_acc = 0.9973218444340941
test Acc 0.9795158286778398:
26th- epoch: 299, train_loss = 1.1081283055245876, train_acc = 0.9973218444340941
test Acc 0.9795158286778398:
26th- epoch: 300, train_loss = 1.106923212588299, train_acc = 0.9973218444340941
test Acc 0.9795158286778398:
26th- epoch: 301, train_loss = 1.1057651415467262, train_acc = 0.9973218444340941
test Acc 0.9795158286778398:
26th- epoch: 302, train_loss = 1.1045555832679383, train_acc = 0.9973218444340941
test Acc 0.9795158286778398:
26t

26th- epoch: 441, train_loss = 0.9769663065671921, train_acc = 0.9974382859804378
test Acc 0.9795158286778398:
26th- epoch: 442, train_loss = 0.9767102648911532, train_acc = 0.9974382859804378
test Acc 0.9795158286778398:
26th- epoch: 443, train_loss = 0.9759055425820407, train_acc = 0.9974382859804378
test Acc 0.9795158286778398:
26th- epoch: 444, train_loss = 0.974983461201191, train_acc = 0.9974382859804378
test Acc 0.9795158286778398:
26th- epoch: 445, train_loss = 0.9747690769436304, train_acc = 0.9974382859804378
test Acc 0.9795158286778398:
26th- epoch: 446, train_loss = 0.9738850519061089, train_acc = 0.9974382859804378
test Acc 0.9795158286778398:
26th- epoch: 447, train_loss = 0.9730054500105325, train_acc = 0.9974382859804378
test Acc 0.9795158286778398:
26th- epoch: 448, train_loss = 0.972576587140793, train_acc = 0.9974382859804378
test Acc 0.9795158286778398:
26th- epoch: 449, train_loss = 0.9718788651225623, train_acc = 0.9974382859804378
test Acc 0.9795158286778398:
26t

 87%|██████████████████████████████████████████████████████████████▍         | 26/30 [4:19:21<40:00, 600.04s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
27th- epoch: 0, train_loss = 120.01467788219452, train_acc = 0.7812063344201211
test Acc 0.86731843575419:
27th- epoch: 1, train_loss = 43.486647963523865, train_acc = 0.9126688402421984
test Acc 0.909683426443203:
27th- epoch: 2, train_loss = 31.42276230081916, train_acc = 0.9382859804378202
test Acc 0.9283054003724395:
27th- epoch: 3, train_loss = 25.287669137120247, train_acc = 0.9491150442477876
test Acc 0.9390130353817505:
27th- epoch: 4, train_loss = 21.402035631239414, train_acc = 0.9570330693991617
test Acc 0.9450651769087524:
27th- epoch: 5, train_loss = 18.646835807710886, train_acc = 0.96238938053097

27th- epoch: 145, train_loss = 1.4979132569860667, train_acc = 0.9972054028877504
test Acc 0.9795158286778398:
27th- epoch: 146, train_loss = 1.4923815820366144, train_acc = 0.9972054028877504
test Acc 0.9795158286778398:
27th- epoch: 147, train_loss = 1.487522494746372, train_acc = 0.9972054028877504
test Acc 0.9795158286778398:
27th- epoch: 148, train_loss = 1.4829026882071048, train_acc = 0.9973218444340941
test Acc 0.9795158286778398:
27th- epoch: 149, train_loss = 1.477587535395287, train_acc = 0.9973218444340941
test Acc 0.9795158286778398:
27th- epoch: 150, train_loss = 1.4732680296292529, train_acc = 0.9973218444340941
test Acc 0.9795158286778398:
27th- epoch: 151, train_loss = 1.468651640578173, train_acc = 0.9973218444340941
test Acc 0.9795158286778398:
27th- epoch: 152, train_loss = 1.4635423409054056, train_acc = 0.9973218444340941
test Acc 0.9795158286778398:
27th- epoch: 153, train_loss = 1.459710213006474, train_acc = 0.9973218444340941
test Acc 0.9795158286778398:
27th-

test Acc 0.9795158286778398:
27th- epoch: 293, train_loss = 1.1157637722790241, train_acc = 0.9973218444340941
test Acc 0.9795158286778398:
27th- epoch: 294, train_loss = 1.1142721797223203, train_acc = 0.9973218444340941
test Acc 0.9795158286778398:
27th- epoch: 295, train_loss = 1.1123787226970308, train_acc = 0.9973218444340941
test Acc 0.9795158286778398:
27th- epoch: 296, train_loss = 1.1116937473416328, train_acc = 0.9973218444340941
test Acc 0.9799813780260708:
27th- epoch: 297, train_loss = 1.110567172348965, train_acc = 0.9973218444340941
test Acc 0.9799813780260708:
27th- epoch: 298, train_loss = 1.108452149957884, train_acc = 0.9973218444340941
test Acc 0.9799813780260708:
27th- epoch: 299, train_loss = 1.107162928848993, train_acc = 0.9973218444340941
test Acc 0.9799813780260708:
27th- epoch: 300, train_loss = 1.1062324084341526, train_acc = 0.9973218444340941
test Acc 0.9799813780260708:
27th- epoch: 301, train_loss = 1.1046915091574192, train_acc = 0.9973218444340941
test

test Acc 0.9809124767225326:
27th- epoch: 440, train_loss = 0.9747134471836034, train_acc = 0.9973218444340941
test Acc 0.9804469273743017:
27th- epoch: 441, train_loss = 0.9733957412245218, train_acc = 0.9973218444340941
test Acc 0.9809124767225326:
27th- epoch: 442, train_loss = 0.973397991299862, train_acc = 0.9973218444340941
test Acc 0.9809124767225326:
27th- epoch: 443, train_loss = 0.9727197749016341, train_acc = 0.9973218444340941
test Acc 0.9804469273743017:
27th- epoch: 444, train_loss = 0.9718932794930879, train_acc = 0.9973218444340941
test Acc 0.9804469273743017:
27th- epoch: 445, train_loss = 0.9713353179395199, train_acc = 0.9973218444340941
test Acc 0.9809124767225326:
27th- epoch: 446, train_loss = 0.9701818401517812, train_acc = 0.9973218444340941
test Acc 0.9804469273743017:
27th- epoch: 447, train_loss = 0.9703519642353058, train_acc = 0.9973218444340941
test Acc 0.9809124767225326:
27th- epoch: 448, train_loss = 0.9689968029560987, train_acc = 0.9973218444340941
te

 90%|████████████████████████████████████████████████████████████████▊       | 27/30 [4:29:20<29:58, 599.49s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
28th- epoch: 0, train_loss = 123.47101902961731, train_acc = 0.7782952957615277
test Acc 0.8631284916201117:
28th- epoch: 1, train_loss = 43.898209907114506, train_acc = 0.9108057755006986
test Acc 0.9110800744878957:
28th- epoch: 2, train_loss = 32.08491016179323, train_acc = 0.9351420586865393
test Acc 0.9292364990689013:
28th- epoch: 3, train_loss = 26.10694331675768, train_acc = 0.9479506287843502
test Acc 0.9352886405959032:
28th- epoch: 4, train_loss = 22.23122033290565, train_acc = 0.955985095482068
test Acc 0.9394785847299814:
28th- epoch: 5, train_loss = 19.455635583028197, train_acc = 0.96075919888216

28th- epoch: 145, train_loss = 1.5419040335109457, train_acc = 0.9969725197950629
test Acc 0.9776536312849162:
28th- epoch: 146, train_loss = 1.5371391406515613, train_acc = 0.9969725197950629
test Acc 0.9776536312849162:
28th- epoch: 147, train_loss = 1.5315421937266365, train_acc = 0.9969725197950629
test Acc 0.9776536312849162:
28th- epoch: 148, train_loss = 1.5265132244676352, train_acc = 0.9969725197950629
test Acc 0.9776536312849162:
28th- epoch: 149, train_loss = 1.5219339666655287, train_acc = 0.9969725197950629
test Acc 0.9776536312849162:
28th- epoch: 150, train_loss = 1.5178879337618127, train_acc = 0.9969725197950629
test Acc 0.9776536312849162:
28th- epoch: 151, train_loss = 1.5121434709290043, train_acc = 0.9969725197950629
test Acc 0.9776536312849162:
28th- epoch: 152, train_loss = 1.5086986651876941, train_acc = 0.9970889613414066
test Acc 0.9776536312849162:
28th- epoch: 153, train_loss = 1.5035695662954822, train_acc = 0.9969725197950629
test Acc 0.9776536312849162:
2

28th- epoch: 293, train_loss = 1.1462262024288066, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
28th- epoch: 294, train_loss = 1.1445267188246362, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
28th- epoch: 295, train_loss = 1.1430235877633095, train_acc = 0.9973218444340941
test Acc 0.978584729981378:
28th- epoch: 296, train_loss = 1.141221794008743, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
28th- epoch: 297, train_loss = 1.1401268243789673, train_acc = 0.9973218444340941
test Acc 0.978584729981378:
28th- epoch: 298, train_loss = 1.1393849961459637, train_acc = 0.9973218444340941
test Acc 0.978584729981378:
28th- epoch: 299, train_loss = 1.1378368201549165, train_acc = 0.9973218444340941
test Acc 0.978584729981378:
28th- epoch: 300, train_loss = 1.1355124625260942, train_acc = 0.9973218444340941
test Acc 0.978584729981378:
28th- epoch: 301, train_loss = 1.134385820478201, train_acc = 0.9973218444340941
test Acc 0.978584729981378:
28th- epoch:

28th- epoch: 441, train_loss = 0.9894275541009847, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
28th- epoch: 442, train_loss = 0.988519156962866, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
28th- epoch: 443, train_loss = 0.9879535399377346, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
28th- epoch: 444, train_loss = 0.9871546886861324, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
28th- epoch: 445, train_loss = 0.9866179650125559, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
28th- epoch: 446, train_loss = 0.9856634587049484, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
28th- epoch: 447, train_loss = 0.9852564409375191, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
28th- epoch: 448, train_loss = 0.9842071744205896, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
28th- epoch: 449, train_loss = 0.9839968457818031, train_acc = 0.9974382859804378
test Acc 0.978584729981378:
28th- epoch

 93%|███████████████████████████████████████████████████████████████████▏    | 28/30 [4:38:13<19:19, 579.54s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
29th- epoch: 0, train_loss = 124.39278297126293, train_acc = 0.7633907778295296
test Acc 0.8649906890130353:
29th- epoch: 1, train_loss = 41.68598657846451, train_acc = 0.9151141127154169
test Acc 0.9129422718808193:
29th- epoch: 2, train_loss = 30.06034354865551, train_acc = 0.9380530973451328
test Acc 0.9352886405959032:
29th- epoch: 3, train_loss = 24.272865671664476, train_acc = 0.9485328365160689
test Acc 0.9464618249534451:
29th- epoch: 4, train_loss = 20.51719507202506, train_acc = 0.9563344201210993
test Acc 0.9501862197392924:
29th- epoch: 5, train_loss = 17.85262414626777, train_acc = 0.96087564042850

29th- epoch: 145, train_loss = 1.5105675620725378, train_acc = 0.9974382859804378
test Acc 0.9781191806331471:
29th- epoch: 146, train_loss = 1.5058959648013115, train_acc = 0.9974382859804378
test Acc 0.9781191806331471:
29th- epoch: 147, train_loss = 1.5009861724684015, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
29th- epoch: 148, train_loss = 1.4959180740406737, train_acc = 0.9974382859804378
test Acc 0.9781191806331471:
29th- epoch: 149, train_loss = 1.4911636946490034, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
29th- epoch: 150, train_loss = 1.4866319857537746, train_acc = 0.9974382859804378
test Acc 0.9781191806331471:
29th- epoch: 151, train_loss = 1.4814726511249319, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
29th- epoch: 152, train_loss = 1.4775034511694685, train_acc = 0.9974382859804378
test Acc 0.9781191806331471:
29th- epoch: 153, train_loss = 1.4724133176496252, train_acc = 0.9974382859804378
test Acc 0.9771880819366853:
2

29th- epoch: 293, train_loss = 1.1303534917533398, train_acc = 0.9975547275267815
test Acc 0.979050279329609:
29th- epoch: 294, train_loss = 1.1290164031088352, train_acc = 0.9975547275267815
test Acc 0.979050279329609:
29th- epoch: 295, train_loss = 1.1279140946571715, train_acc = 0.9975547275267815
test Acc 0.979050279329609:
29th- epoch: 296, train_loss = 1.126618891954422, train_acc = 0.9975547275267815
test Acc 0.979050279329609:
29th- epoch: 297, train_loss = 1.1252710695262067, train_acc = 0.9975547275267815
test Acc 0.979050279329609:
29th- epoch: 298, train_loss = 1.123453814536333, train_acc = 0.9975547275267815
test Acc 0.979050279329609:
29th- epoch: 299, train_loss = 1.1219585959916003, train_acc = 0.9975547275267815
test Acc 0.979050279329609:
29th- epoch: 300, train_loss = 1.1201411460642703, train_acc = 0.9975547275267815
test Acc 0.979050279329609:
29th- epoch: 301, train_loss = 1.1186983709339984, train_acc = 0.9975547275267815
test Acc 0.979050279329609:
29th- epoch:

29th- epoch: 441, train_loss = 0.9826067102549132, train_acc = 0.9976711690731253
test Acc 0.9795158286778398:
29th- epoch: 442, train_loss = 0.9817592588660773, train_acc = 0.9976711690731253
test Acc 0.9795158286778398:
29th- epoch: 443, train_loss = 0.9812135882675648, train_acc = 0.9976711690731253
test Acc 0.9795158286778398:
29th- epoch: 444, train_loss = 0.9807729820313398, train_acc = 0.9977876106194691
test Acc 0.9795158286778398:
29th- epoch: 445, train_loss = 0.9800400212407112, train_acc = 0.9977876106194691
test Acc 0.9795158286778398:
29th- epoch: 446, train_loss = 0.9792225124838296, train_acc = 0.9977876106194691
test Acc 0.9795158286778398:
29th- epoch: 447, train_loss = 0.9783533426525537, train_acc = 0.9976711690731253
test Acc 0.9795158286778398:
29th- epoch: 448, train_loss = 0.9778978700342122, train_acc = 0.9977876106194691
test Acc 0.9795158286778398:
29th- epoch: 449, train_loss = 0.9772547992470209, train_acc = 0.9977876106194691
test Acc 0.9795158286778398:
2

 97%|█████████████████████████████████████████████████████████████████████▌  | 29/30 [4:46:48<09:20, 560.18s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
30th- epoch: 0, train_loss = 113.69584788382053, train_acc = 0.7729389846297159
test Acc 0.8631284916201117:
30th- epoch: 1, train_loss = 44.04290430247784, train_acc = 0.9076618537494178
test Acc 0.9115456238361266:
30th- epoch: 2, train_loss = 32.305283308029175, train_acc = 0.9331625523986958
test Acc 0.9273743016759777:
30th- epoch: 3, train_loss = 26.40425281971693, train_acc = 0.9442244993013508
test Acc 0.9376163873370578:
30th- epoch: 4, train_loss = 22.59037795290351, train_acc = 0.9531904983698184
test Acc 0.9455307262569832:
30th- epoch: 5, train_loss = 19.901660047471523, train_acc = 0.9601769911504

30th- epoch: 145, train_loss = 1.6859120812732726, train_acc = 0.9972054028877504
test Acc 0.979050279329609:
30th- epoch: 146, train_loss = 1.6795437771361321, train_acc = 0.9972054028877504
test Acc 0.979050279329609:
30th- epoch: 147, train_loss = 1.672990445047617, train_acc = 0.9972054028877504
test Acc 0.979050279329609:
30th- epoch: 148, train_loss = 1.667089828522876, train_acc = 0.9972054028877504
test Acc 0.979050279329609:
30th- epoch: 149, train_loss = 1.660900266142562, train_acc = 0.9972054028877504
test Acc 0.979050279329609:
30th- epoch: 150, train_loss = 1.6553485665936023, train_acc = 0.9973218444340941
test Acc 0.979050279329609:
30th- epoch: 151, train_loss = 1.6500129513442516, train_acc = 0.9973218444340941
test Acc 0.979050279329609:
30th- epoch: 152, train_loss = 1.6446180827915668, train_acc = 0.9973218444340941
test Acc 0.979050279329609:
30th- epoch: 153, train_loss = 1.6386900593061, train_acc = 0.9973218444340941
test Acc 0.979050279329609:
30th- epoch: 154

test Acc 0.9799813780260708:
30th- epoch: 293, train_loss = 1.229230533062946, train_acc = 0.9974382859804378
test Acc 0.9799813780260708:
30th- epoch: 294, train_loss = 1.2278116096858867, train_acc = 0.9974382859804378
test Acc 0.9799813780260708:
30th- epoch: 295, train_loss = 1.226123172789812, train_acc = 0.9974382859804378
test Acc 0.9799813780260708:
30th- epoch: 296, train_loss = 1.2244715367560275, train_acc = 0.9974382859804378
test Acc 0.9804469273743017:
30th- epoch: 297, train_loss = 1.222823987423908, train_acc = 0.9974382859804378
test Acc 0.9804469273743017:
30th- epoch: 298, train_loss = 1.2210462081129663, train_acc = 0.9974382859804378
test Acc 0.9804469273743017:
30th- epoch: 299, train_loss = 1.2199715388123877, train_acc = 0.9974382859804378
test Acc 0.9804469273743017:
30th- epoch: 300, train_loss = 1.218146726489067, train_acc = 0.9974382859804378
test Acc 0.9804469273743017:
30th- epoch: 301, train_loss = 1.2165484887664206, train_acc = 0.9974382859804378
test 

30th- epoch: 440, train_loss = 1.0538547411561012, train_acc = 0.9976711690731253
test Acc 0.9799813780260708:
30th- epoch: 441, train_loss = 1.0531300939619541, train_acc = 0.9976711690731253
test Acc 0.9799813780260708:
30th- epoch: 442, train_loss = 1.0526515779201873, train_acc = 0.9976711690731253
test Acc 0.9799813780260708:
30th- epoch: 443, train_loss = 1.0512943863868713, train_acc = 0.9976711690731253
test Acc 0.9799813780260708:
30th- epoch: 444, train_loss = 1.050635240972042, train_acc = 0.9976711690731253
test Acc 0.9799813780260708:
30th- epoch: 445, train_loss = 1.0494477525353432, train_acc = 0.9976711690731253
test Acc 0.9799813780260708:
30th- epoch: 446, train_loss = 1.0491261171700899, train_acc = 0.9976711690731253
test Acc 0.9799813780260708:
30th- epoch: 447, train_loss = 1.0479557067155838, train_acc = 0.9976711690731253
test Acc 0.9799813780260708:
30th- epoch: 448, train_loss = 1.0474299217166845, train_acc = 0.9976711690731253
test Acc 0.9799813780260708:
30

100%|████████████████████████████████████████████████████████████████████████| 30/30 [4:55:22<00:00, 546.44s/it]


Wall time: 4h 55min 25s
