In [1]:
import os
from collections import Counter

import numpy as np
import pandas as pd

import torch
import torch.nn as nn
import torch.optim as optim
import torch.nn.functional as F
import torch.utils.data as data

from tqdm import tqdm

import utility.Data_loader as D
from utility.Model import Mcslt
from utility.Custom import CustomDataset

In [2]:
%%time
if __name__ == '__main__':
    # Train the Mcslt classifier TOTAL times (one seed per run) on a fixed
    # 80/20 split, evaluate after every epoch, and record for each run the
    # epoch with the highest test accuracy. Results are written as CSV files
    # plus one model checkpoint under the `file_name` prefix.

    # ---------------------------------------------------------------- config
    # NOTE(review): 'D:virus/...' has no slash after the drive letter; on
    # Windows that is resolved relative to the current directory of drive D:.
    # Confirm this is intended rather than 'D:/virus/...'.
    read_path = 'D:virus/image/2gram_768/'
    file_name = 'res/Mcslt_2gram'      # prefix of every artefact written below

    BATCH_SIZE = 64
    TOTAL = 30                         # number of independent training runs
    EPOCH = 500
    NUM_CLASS = 9
    LR = 0.0001
    SEED = list(range(TOTAL))          # one torch seed per run
    Num_Nodes = 768                    # first argument passed to Mcslt

    CUDA_N = 'cuda:0'

    # Create the output directory up front so a multi-hour run cannot fail at
    # the very end just because 'res/' does not exist yet.
    os.makedirs(os.path.dirname(file_name) or '.', exist_ok=True)

    # ------------------------------------------------------------------ data
    Loader = D.File_loader()
    data_a, label_a = Loader.read_files(read_path, interp = False)

    # Order the samples by label. `sorted(label_a)` yields the same label
    # sequence as indexing the labels with `idx`, so rows and labels stay aligned.
    idx = np.argsort(label_a)

    # Flatten every sample into a single row. The row count comes from the
    # loaded labels instead of a hard-coded dataset size.
    sorted_data = data_a[idx].reshape(len(idx), -1)
    sorted_label = sorted(label_a)

    # 80/20 train/test split with a fixed seed, shared by all runs.
    full_dataset = CustomDataset(sorted_data, sorted_label)
    train_size = int(0.8 * len(full_dataset))
    test_size = len(full_dataset) - train_size

    torch.manual_seed(10)
    train_dataset, test_dataset = data.random_split(full_dataset, [train_size, test_size])
    # NOTE(review): the training loader is not reshuffled between epochs
    # (shuffle=False); batches keep the fixed order produced by random_split.
    train_loader = data.DataLoader(train_dataset, batch_size=BATCH_SIZE, shuffle = False)
    test_loader = data.DataLoader(test_dataset, batch_size=BATCH_SIZE, shuffle=False)

    # ------------------------------------------------------------- training
    # Per-run summaries, one entry per run, taken at that run's best epoch.
    loss_total = []
    acc_total = []
    pred_total = []
    true_total = []

    # Loop-invariant objects: created once instead of once per run.
    device = torch.device(CUDA_N if torch.cuda.is_available() else 'cpu')
    criterion = nn.CrossEntropyLoss()

    # Weights of the best-scoring (run, epoch) seen so far. This is what gets
    # saved, so the checkpoint corresponds to a reported result rather than to
    # whatever the last run happened to end on.
    best_overall_acc = -1.0
    best_overall_state = None

    for i in tqdm(range(TOTAL)):

        torch.manual_seed(SEED[i])
        net = Mcslt(Num_Nodes, NUM_CLASS)
        net.to(device)
        print(net)

        optimizer = optim.SGD(net.parameters(), lr=LR, momentum = 0.1)

        loss_list = []        # summed batch losses, one entry per epoch
        train_acc_list = []
        test_acc_list = []

        pred_temp = []        # test predictions, one tensor per epoch
        true_temp = []        # matching ground-truth labels

        for epoch in range(EPOCH):
            # ---- train for one epoch
            net.train()
            running_loss = 0
            correct = 0

            for inputs, labels in train_loader:
                inputs = inputs.to(device=device, dtype=torch.float32)
                labels = labels.to(device=device, dtype=torch.long)

                outputs = net(inputs)
                loss = criterion(outputs, labels)

                optimizer.zero_grad()
                loss.backward()
                optimizer.step()
                running_loss += loss.item()

                _, pred = torch.max(outputs, dim=1)
                correct += (pred == labels).sum().item()

            train_acc = correct/train_size
            loss_list.append(running_loss)
            train_acc_list.append(train_acc)
            print('{}th- epoch: {}, train_loss = {}, train_acc = {}'.format(i+1, epoch, running_loss, train_acc))

            # ---- evaluate on the held-out split
            net.eval()
            with torch.no_grad():
                correct = 0
                pt, tt = [], []

                for inputs_t, labels_t in test_loader:
                    inputs_t = inputs_t.to(device=device, dtype=torch.float32)
                    labels_t = labels_t.to(device=device, dtype=torch.long)

                    outputs_t = net(inputs_t)

                    # The arg-max of the logits equals the arg-max of their
                    # softmax, so no softmax is applied (same as the training
                    # accuracy above).
                    _, pred_t = torch.max(outputs_t, dim = 1)

                    pt.append(pred_t)
                    tt.append(labels_t)

                    correct += (pred_t == labels_t).sum().item()

                pred_temp.append(torch.cat(pt))
                true_temp.append(torch.cat(tt))

                test_acc = correct/test_size
                test_acc_list.append(test_acc)

                print('test Acc {}:'.format(test_acc))

            # Snapshot the weights whenever a new overall best is reached.
            # Strict '>' keeps the earliest epoch on ties, like np.argmax below.
            if test_acc > best_overall_acc:
                best_overall_acc = test_acc
                best_overall_state = {
                    key: value.detach().to('cpu', copy=True)
                    for key, value in net.state_dict().items()
                }

        # NOTE(review): the best epoch is chosen using test accuracy, so the
        # reported numbers are optimistic; a separate validation split would
        # be needed for an unbiased estimate.
        best_result_index = np.argmax(np.array(test_acc_list))
        loss_total.append(loss_list[best_result_index])
        acc_total.append(test_acc_list[best_result_index])
        pred_total.append(pred_temp[best_result_index].tolist())
        true_total.append(true_temp[best_result_index].tolist())

    # --------------------------------------------------------------- saving
    if best_overall_state is not None:
        torch.save(best_overall_state, file_name +'.pth')

    loss_DF = pd.DataFrame(loss_total)
    loss_DF.to_csv(file_name+" loss.csv")

    acc_DF = pd.DataFrame(acc_total)
    acc_DF.to_csv(file_name +" acc.csv")

    pred_DF = pd.DataFrame(pred_total)
    pred_DF.to_csv(file_name +" pred.csv")

    true_DF = pd.DataFrame(true_total)
    true_DF.to_csv(file_name +" true.csv")

100%|███████████████████████████████████████████████████████████████████| 10736/10736 [00:02<00:00, 5099.10it/s]
  0%|                                                                                    | 0/30 [00:00<?, ?it/s]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
1th- epoch: 0, train_loss = 100.64926259219646, train_acc = 0.8105496040987424




test Acc 0.8999068901303539:
1th- epoch: 1, train_loss = 40.10758416354656, train_acc = 0.9222170470423847
test Acc 0.9231843575418994:
1th- epoch: 2, train_loss = 31.26131097227335, train_acc = 0.9377037727061015
test Acc 0.9329608938547486:
1th- epoch: 3, train_loss = 26.368512220680714, train_acc = 0.9451560316721006
test Acc 0.936219739292365:
1th- epoch: 4, train_loss = 23.120950762182474, train_acc = 0.950279459711225
test Acc 0.9404096834264432:
1th- epoch: 5, train_loss = 20.70344428345561, train_acc = 0.9552864462040056
test Acc 0.9441340782122905:
1th- epoch: 6, train_loss = 18.813547898083925, train_acc = 0.959944108057755
test Acc 0.9497206703910615:
1th- epoch: 7, train_loss = 17.302119944244623, train_acc = 0.9619236143455985
test Acc 0.9511173184357542:
1th- epoch: 8, train_loss = 16.06968630477786, train_acc = 0.9646017699115044
test Acc 0.952048417132216:
1th- epoch: 9, train_loss = 15.03093471005559, train_acc = 0.9673963670237541
test Acc 0.952513966480447:
1th- epoc

1th- epoch: 151, train_loss = 2.579667004523799, train_acc = 0.9941779226828132
test Acc 0.9716014897579144:
1th- epoch: 152, train_loss = 2.570378166856244, train_acc = 0.994294364229157
test Acc 0.9716014897579144:
1th- epoch: 153, train_loss = 2.5630102567374706, train_acc = 0.994294364229157
test Acc 0.9716014897579144:
1th- epoch: 154, train_loss = 2.5530360031407326, train_acc = 0.994294364229157
test Acc 0.9716014897579144:
1th- epoch: 155, train_loss = 2.5430710203945637, train_acc = 0.994294364229157
test Acc 0.9716014897579144:
1th- epoch: 156, train_loss = 2.536312371492386, train_acc = 0.994294364229157
test Acc 0.9716014897579144:
1th- epoch: 157, train_loss = 2.525679439306259, train_acc = 0.9944108057755007
test Acc 0.9716014897579144:
1th- epoch: 158, train_loss = 2.51732137799263, train_acc = 0.9944108057755007
test Acc 0.9716014897579144:
1th- epoch: 159, train_loss = 2.509898503543809, train_acc = 0.9944108057755007
test Acc 0.9716014897579144:
1th- epoch: 160, train

test Acc 0.9739292364990689:
1th- epoch: 301, train_loss = 1.8908066438743845, train_acc = 0.9956916627852818
test Acc 0.9739292364990689:
1th- epoch: 302, train_loss = 1.8886181712150574, train_acc = 0.9956916627852818
test Acc 0.9739292364990689:
1th- epoch: 303, train_loss = 1.886801078915596, train_acc = 0.9956916627852818
test Acc 0.9739292364990689:
1th- epoch: 304, train_loss = 1.88388194644358, train_acc = 0.9956916627852818
test Acc 0.9739292364990689:
1th- epoch: 305, train_loss = 1.8816215271363035, train_acc = 0.995575221238938
test Acc 0.9739292364990689:
1th- epoch: 306, train_loss = 1.8791263438761234, train_acc = 0.9956916627852818
test Acc 0.9739292364990689:
1th- epoch: 307, train_loss = 1.8772499164333567, train_acc = 0.9953423381462506
test Acc 0.973463687150838:
1th- epoch: 308, train_loss = 1.8753956457367167, train_acc = 0.9954587796925943
test Acc 0.9739292364990689:
1th- epoch: 309, train_loss = 1.8739522099494934, train_acc = 0.9956916627852818
test Acc 0.9734

1th- epoch: 450, train_loss = 1.678173144639004, train_acc = 0.995575221238938
test Acc 0.9739292364990689:
1th- epoch: 451, train_loss = 1.6770221181213856, train_acc = 0.995575221238938
test Acc 0.9739292364990689:
1th- epoch: 452, train_loss = 1.6769587409798987, train_acc = 0.995575221238938
test Acc 0.9739292364990689:
1th- epoch: 453, train_loss = 1.675762988626957, train_acc = 0.995575221238938
test Acc 0.9739292364990689:
1th- epoch: 454, train_loss = 1.6746910462970845, train_acc = 0.995575221238938
test Acc 0.9743947858472998:
1th- epoch: 455, train_loss = 1.6738162748515606, train_acc = 0.995575221238938
test Acc 0.9743947858472998:
1th- epoch: 456, train_loss = 1.6722636384074576, train_acc = 0.995575221238938
test Acc 0.9743947858472998:
1th- epoch: 457, train_loss = 1.6719343637232669, train_acc = 0.995575221238938
test Acc 0.9739292364990689:
1th- epoch: 458, train_loss = 1.6720405059750192, train_acc = 0.995575221238938
test Acc 0.9743947858472998:
1th- epoch: 459, trai

  3%|██▍                                                                      | 1/30 [09:02<4:22:25, 542.95s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
2th- epoch: 0, train_loss = 126.18775202333927, train_acc = 0.7848160223567769
test Acc 0.8868715083798883:
2th- epoch: 1, train_loss = 42.39623365551233, train_acc = 0.911504424778761
test Acc 0.9208566108007449:
2th- epoch: 2, train_loss = 31.537923127412796, train_acc = 0.9372380065207266
test Acc 0.9404096834264432:
2th- epoch: 3, train_loss = 26.486054215580225, train_acc = 0.9479506287843502
test Acc 0.9445996275605214:
2th- epoch: 4, train_loss = 23.343022897839546, train_acc = 0.9537727061015371
test Acc 0.946927374301676:
2th- epoch: 5, train_loss = 21.062164559960365, train_acc = 0.9572659524918491
te

2th- epoch: 147, train_loss = 2.739899759646505, train_acc = 0.993828598043782
test Acc 0.9776536312849162:
2th- epoch: 148, train_loss = 2.729697351809591, train_acc = 0.993828598043782
test Acc 0.9776536312849162:
2th- epoch: 149, train_loss = 2.720919918268919, train_acc = 0.993828598043782
test Acc 0.9776536312849162:
2th- epoch: 150, train_loss = 2.7107685045339167, train_acc = 0.993828598043782
test Acc 0.9776536312849162:
2th- epoch: 151, train_loss = 2.6994971721433103, train_acc = 0.9939450395901258
test Acc 0.9776536312849162:
2th- epoch: 152, train_loss = 2.6886944212019444, train_acc = 0.9939450395901258
test Acc 0.9776536312849162:
2th- epoch: 153, train_loss = 2.680717434734106, train_acc = 0.9939450395901258
test Acc 0.9776536312849162:
2th- epoch: 154, train_loss = 2.6687365076504648, train_acc = 0.9939450395901258
test Acc 0.9776536312849162:
2th- epoch: 155, train_loss = 2.6588625186122954, train_acc = 0.9939450395901258
test Acc 0.9776536312849162:
2th- epoch: 156, t

2th- epoch: 296, train_loss = 1.964274536818266, train_acc = 0.9956916627852818
test Acc 0.9799813780260708:
2th- epoch: 297, train_loss = 1.9618368732044473, train_acc = 0.9956916627852818
test Acc 0.9795158286778398:
2th- epoch: 298, train_loss = 1.9592991782119498, train_acc = 0.9956916627852818
test Acc 0.9799813780260708:
2th- epoch: 299, train_loss = 1.9585992991924286, train_acc = 0.9956916627852818
test Acc 0.9795158286778398:
2th- epoch: 300, train_loss = 1.955085443914868, train_acc = 0.9956916627852818
test Acc 0.9795158286778398:
2th- epoch: 301, train_loss = 1.951599775464274, train_acc = 0.9956916627852818
test Acc 0.9799813780260708:
2th- epoch: 302, train_loss = 1.9496955896029249, train_acc = 0.9956916627852818
test Acc 0.9799813780260708:
2th- epoch: 303, train_loss = 1.9494723515817896, train_acc = 0.9956916627852818
test Acc 0.9795158286778398:
2th- epoch: 304, train_loss = 1.9460352584719658, train_acc = 0.9956916627852818
test Acc 0.9799813780260708:
2th- epoch: 3

2th- epoch: 446, train_loss = 1.725196170329582, train_acc = 0.995575221238938
test Acc 0.9795158286778398:
2th- epoch: 447, train_loss = 1.7246351018548012, train_acc = 0.995575221238938
test Acc 0.9795158286778398:
2th- epoch: 448, train_loss = 1.7236758954823017, train_acc = 0.995575221238938
test Acc 0.9795158286778398:
2th- epoch: 449, train_loss = 1.7226150880451314, train_acc = 0.995575221238938
test Acc 0.9795158286778398:
2th- epoch: 450, train_loss = 1.723723292350769, train_acc = 0.995575221238938
test Acc 0.9795158286778398:
2th- epoch: 451, train_loss = 1.720322284847498, train_acc = 0.995575221238938
test Acc 0.9795158286778398:
2th- epoch: 452, train_loss = 1.718739962845575, train_acc = 0.995575221238938
test Acc 0.9795158286778398:
2th- epoch: 453, train_loss = 1.7187363554839976, train_acc = 0.995575221238938
test Acc 0.9795158286778398:
2th- epoch: 454, train_loss = 1.7177907638251781, train_acc = 0.995575221238938
test Acc 0.9795158286778398:
2th- epoch: 455, train_

  7%|████▊                                                                    | 2/30 [18:05<4:13:18, 542.80s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
3th- epoch: 0, train_loss = 103.90057855844498, train_acc = 0.7863297624592455
test Acc 0.8556797020484171:
3th- epoch: 1, train_loss = 40.09911388158798, train_acc = 0.9112715416860736
test Acc 0.9134078212290503:
3th- epoch: 2, train_loss = 30.716049134731293, train_acc = 0.9358407079646017
test Acc 0.9264432029795159:
3th- epoch: 3, train_loss = 26.072980005294085, train_acc = 0.9448067070330693
test Acc 0.9338919925512105:
3th- epoch: 4, train_loss = 23.093431018292904, train_acc = 0.9508616674429436
test Acc 0.9385474860335196:
3th- epoch: 5, train_loss = 20.90156902000308, train_acc = 0.9551700046576619
t

3th- epoch: 147, train_loss = 2.744730909820646, train_acc = 0.9934792734047508
test Acc 0.973463687150838:
3th- epoch: 148, train_loss = 2.7343355431221426, train_acc = 0.9935957149510946
test Acc 0.9739292364990689:
3th- epoch: 149, train_loss = 2.723738618195057, train_acc = 0.9935957149510946
test Acc 0.9739292364990689:
3th- epoch: 150, train_loss = 2.712595332413912, train_acc = 0.9935957149510946
test Acc 0.9739292364990689:
3th- epoch: 151, train_loss = 2.702894315123558, train_acc = 0.9935957149510946
test Acc 0.9739292364990689:
3th- epoch: 152, train_loss = 2.6926326144021004, train_acc = 0.9937121564974383
test Acc 0.9748603351955307:
3th- epoch: 153, train_loss = 2.682493343949318, train_acc = 0.9937121564974383
test Acc 0.9743947858472998:
3th- epoch: 154, train_loss = 2.671792224049568, train_acc = 0.993828598043782
test Acc 0.9743947858472998:
3th- epoch: 155, train_loss = 2.6621475976426154, train_acc = 0.993828598043782
test Acc 0.9748603351955307:
3th- epoch: 156, tr

3th- epoch: 296, train_loss = 1.9483303390443325, train_acc = 0.9952258965999069
test Acc 0.978584729981378:
3th- epoch: 297, train_loss = 1.9455139277270064, train_acc = 0.9952258965999069
test Acc 0.978584729981378:
3th- epoch: 298, train_loss = 1.9426177702844143, train_acc = 0.9952258965999069
test Acc 0.978584729981378:
3th- epoch: 299, train_loss = 1.9400896144798025, train_acc = 0.9952258965999069
test Acc 0.978584729981378:
3th- epoch: 300, train_loss = 1.9378649294376373, train_acc = 0.9952258965999069
test Acc 0.978584729981378:
3th- epoch: 301, train_loss = 1.9361879924545065, train_acc = 0.9952258965999069
test Acc 0.978584729981378:
3th- epoch: 302, train_loss = 1.9333227388560772, train_acc = 0.9952258965999069
test Acc 0.978584729981378:
3th- epoch: 303, train_loss = 1.931398638873361, train_acc = 0.9952258965999069
test Acc 0.978584729981378:
3th- epoch: 304, train_loss = 1.9284613778581843, train_acc = 0.9952258965999069
test Acc 0.978584729981378:
3th- epoch: 305, tra

3th- epoch: 446, train_loss = 1.7022982984781265, train_acc = 0.995575221238938
test Acc 0.9795158286778398:
3th- epoch: 447, train_loss = 1.701097181707155, train_acc = 0.995575221238938
test Acc 0.9795158286778398:
3th- epoch: 448, train_loss = 1.700685425370466, train_acc = 0.995575221238938
test Acc 0.9795158286778398:
3th- epoch: 449, train_loss = 1.6997139267623425, train_acc = 0.995575221238938
test Acc 0.979050279329609:
3th- epoch: 450, train_loss = 1.6984996696119197, train_acc = 0.995575221238938
test Acc 0.9795158286778398:
3th- epoch: 451, train_loss = 1.6974153990740888, train_acc = 0.995575221238938
test Acc 0.9795158286778398:
3th- epoch: 452, train_loss = 1.69664017111063, train_acc = 0.995575221238938
test Acc 0.9795158286778398:
3th- epoch: 453, train_loss = 1.6962973127956502, train_acc = 0.995575221238938
test Acc 0.9795158286778398:
3th- epoch: 454, train_loss = 1.6939474108512513, train_acc = 0.995575221238938
test Acc 0.9795158286778398:
3th- epoch: 455, train_l

 10%|███████▎                                                                 | 3/30 [27:07<4:04:06, 542.45s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
4th- epoch: 0, train_loss = 108.69461387395859, train_acc = 0.8022822543083372
test Acc 0.8915270018621974:
4th- epoch: 1, train_loss = 37.936294339597225, train_acc = 0.9190731252911039
test Acc 0.9278398510242085:
4th- epoch: 2, train_loss = 28.93476329743862, train_acc = 0.9377037727061015
test Acc 0.9380819366852886:
4th- epoch: 3, train_loss = 24.6188601590693, train_acc = 0.9474848625989754
test Acc 0.9464618249534451:
4th- epoch: 4, train_loss = 21.867646768689156, train_acc = 0.9529576152771309
test Acc 0.9497206703910615:
4th- epoch: 5, train_loss = 19.90212193503976, train_acc = 0.9588961341406614
tes

4th- epoch: 147, train_loss = 2.7803934342227876, train_acc = 0.993828598043782
test Acc 0.973463687150838:
4th- epoch: 148, train_loss = 2.7691004150547087, train_acc = 0.993828598043782
test Acc 0.973463687150838:
4th- epoch: 149, train_loss = 2.759299848228693, train_acc = 0.993828598043782
test Acc 0.973463687150838:
4th- epoch: 150, train_loss = 2.7476092143915594, train_acc = 0.993828598043782
test Acc 0.973463687150838:
4th- epoch: 151, train_loss = 2.7379025034606457, train_acc = 0.993828598043782
test Acc 0.973463687150838:
4th- epoch: 152, train_loss = 2.7257131836377084, train_acc = 0.993828598043782
test Acc 0.973463687150838:
4th- epoch: 153, train_loss = 2.716121416538954, train_acc = 0.993828598043782
test Acc 0.973463687150838:
4th- epoch: 154, train_loss = 2.704548928886652, train_acc = 0.993828598043782
test Acc 0.9725325884543762:
4th- epoch: 155, train_loss = 2.6943310759961605, train_acc = 0.9939450395901258
test Acc 0.9725325884543762:
4th- epoch: 156, train_loss 

test Acc 0.9781191806331471:
4th- epoch: 297, train_loss = 1.9287972748279572, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
4th- epoch: 298, train_loss = 1.9250955544412136, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
4th- epoch: 299, train_loss = 1.9242188967764378, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
4th- epoch: 300, train_loss = 1.9214249290525913, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
4th- epoch: 301, train_loss = 1.9182080775499344, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
4th- epoch: 302, train_loss = 1.917110102949664, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
4th- epoch: 303, train_loss = 1.9131154380738735, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
4th- epoch: 304, train_loss = 1.9113187391776592, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
4th- epoch: 305, train_loss = 1.9079881173092872, train_acc = 0.995575221238938
test Acc 0.978119180

4th- epoch: 447, train_loss = 1.686644925386645, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
4th- epoch: 448, train_loss = 1.6872798912227154, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
4th- epoch: 449, train_loss = 1.685946960002184, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
4th- epoch: 450, train_loss = 1.6856360906967893, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
4th- epoch: 451, train_loss = 1.6825755214085802, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
4th- epoch: 452, train_loss = 1.6829926209757105, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
4th- epoch: 453, train_loss = 1.681390006095171, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
4th- epoch: 454, train_loss = 1.6814259676029906, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
4th- epoch: 455, train_loss = 1.6802539465716109, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
4th- epoch: 456, train

 13%|█████████▋                                                               | 4/30 [36:10<3:55:13, 542.82s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
5th- epoch: 0, train_loss = 111.08853866159916, train_acc = 0.7887750349324639
test Acc 0.8864059590316573:
5th- epoch: 1, train_loss = 43.164893604815006, train_acc = 0.9153469958081043
test Acc 0.9120111731843575:
5th- epoch: 2, train_loss = 33.53804633021355, train_acc = 0.9337447601304145
test Acc 0.9287709497206704:
5th- epoch: 3, train_loss = 28.47831581532955, train_acc = 0.9446902654867256
test Acc 0.9352886405959032:
5th- epoch: 4, train_loss = 25.15022163465619, train_acc = 0.9503959012575687
test Acc 0.9441340782122905:
5th- epoch: 5, train_loss = 22.705197729170322, train_acc = 0.9538891476478808
te

5th- epoch: 147, train_loss = 2.733631164766848, train_acc = 0.9937121564974383
test Acc 0.9781191806331471:
5th- epoch: 148, train_loss = 2.723349410109222, train_acc = 0.9937121564974383
test Acc 0.9781191806331471:
5th- epoch: 149, train_loss = 2.71131921838969, train_acc = 0.993828598043782
test Acc 0.9781191806331471:
5th- epoch: 150, train_loss = 2.6999787618406117, train_acc = 0.993828598043782
test Acc 0.9781191806331471:
5th- epoch: 151, train_loss = 2.6888323253951967, train_acc = 0.993828598043782
test Acc 0.9776536312849162:
5th- epoch: 152, train_loss = 2.678727388381958, train_acc = 0.993828598043782
test Acc 0.9781191806331471:
5th- epoch: 153, train_loss = 2.6675725704990327, train_acc = 0.993828598043782
test Acc 0.9781191806331471:
5th- epoch: 154, train_loss = 2.6570355109870434, train_acc = 0.993828598043782
test Acc 0.9776536312849162:
5th- epoch: 155, train_loss = 2.646723189856857, train_acc = 0.993828598043782
test Acc 0.9776536312849162:
5th- epoch: 156, train_

5th- epoch: 296, train_loss = 1.9186757799470797, train_acc = 0.9951094550535631
test Acc 0.9823091247672253:
5th- epoch: 297, train_loss = 1.9154581278562546, train_acc = 0.9951094550535631
test Acc 0.9823091247672253:
5th- epoch: 298, train_loss = 1.9144289181567729, train_acc = 0.9951094550535631
test Acc 0.9823091247672253:
5th- epoch: 299, train_loss = 1.9107960660476238, train_acc = 0.9951094550535631
test Acc 0.9823091247672253:
5th- epoch: 300, train_loss = 1.9086367993149906, train_acc = 0.9951094550535631
test Acc 0.9823091247672253:
5th- epoch: 301, train_loss = 1.9064212157391012, train_acc = 0.9951094550535631
test Acc 0.9823091247672253:
5th- epoch: 302, train_loss = 1.9042659573024139, train_acc = 0.9951094550535631
test Acc 0.9823091247672253:
5th- epoch: 303, train_loss = 1.9011948665138334, train_acc = 0.9951094550535631
test Acc 0.9823091247672253:
5th- epoch: 304, train_loss = 1.8995119790779427, train_acc = 0.9951094550535631
test Acc 0.9823091247672253:
5th- epoch

5th- epoch: 444, train_loss = 1.6905880580306984, train_acc = 0.9952258965999069
test Acc 0.9823091247672253:
5th- epoch: 445, train_loss = 1.6896765607525595, train_acc = 0.9952258965999069
test Acc 0.9823091247672253:
5th- epoch: 446, train_loss = 1.6886983723961748, train_acc = 0.9952258965999069
test Acc 0.9823091247672253:
5th- epoch: 447, train_loss = 1.6873051653965376, train_acc = 0.9952258965999069
test Acc 0.9823091247672253:
5th- epoch: 448, train_loss = 1.6866076323203743, train_acc = 0.9952258965999069
test Acc 0.9823091247672253:
5th- epoch: 449, train_loss = 1.6854580896906555, train_acc = 0.9952258965999069
test Acc 0.9823091247672253:
5th- epoch: 450, train_loss = 1.684595960949082, train_acc = 0.9952258965999069
test Acc 0.9823091247672253:
5th- epoch: 451, train_loss = 1.6844033773522824, train_acc = 0.9952258965999069
test Acc 0.9823091247672253:
5th- epoch: 452, train_loss = 1.6831779765780084, train_acc = 0.9952258965999069
test Acc 0.9823091247672253:
5th- epoch:

 17%|████████████▏                                                            | 5/30 [45:13<3:46:11, 542.86s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
6th- epoch: 0, train_loss = 110.49510361254215, train_acc = 0.793549138332557
test Acc 0.8854748603351955:
6th- epoch: 1, train_loss = 41.37627271562815, train_acc = 0.9160456450861667
test Acc 0.9194599627560521:
6th- epoch: 2, train_loss = 31.609285980463028, train_acc = 0.9387517466231952
test Acc 0.9329608938547486:
6th- epoch: 3, train_loss = 26.680094815790653, train_acc = 0.9473684210526315
test Acc 0.9348230912476723:
6th- epoch: 4, train_loss = 23.41655270010233, train_acc = 0.9537727061015371
test Acc 0.9404096834264432:
6th- epoch: 5, train_loss = 21.0295033082366, train_acc = 0.9574988355845365
test

6th- epoch: 147, train_loss = 2.5726446558255702, train_acc = 0.9946436888681882
test Acc 0.9748603351955307:
6th- epoch: 148, train_loss = 2.561396097065881, train_acc = 0.9946436888681882
test Acc 0.9748603351955307:
6th- epoch: 149, train_loss = 2.552033982006833, train_acc = 0.9946436888681882
test Acc 0.9767225325884544:
6th- epoch: 150, train_loss = 2.5427662928123027, train_acc = 0.9946436888681882
test Acc 0.9767225325884544:
6th- epoch: 151, train_loss = 2.5341797929722816, train_acc = 0.9946436888681882
test Acc 0.9767225325884544:
6th- epoch: 152, train_loss = 2.524400881258771, train_acc = 0.9946436888681882
test Acc 0.9767225325884544:
6th- epoch: 153, train_loss = 2.515693099470809, train_acc = 0.9946436888681882
test Acc 0.9767225325884544:
6th- epoch: 154, train_loss = 2.5068524528760463, train_acc = 0.9946436888681882
test Acc 0.9771880819366853:
6th- epoch: 155, train_loss = 2.4996917832177132, train_acc = 0.9946436888681882
test Acc 0.9767225325884544:
6th- epoch: 15

test Acc 0.9776536312849162:
6th- epoch: 297, train_loss = 1.860914833843708, train_acc = 0.996040987424313
test Acc 0.9776536312849162:
6th- epoch: 298, train_loss = 1.8611738085746765, train_acc = 0.9961574289706567
test Acc 0.9776536312849162:
6th- epoch: 299, train_loss = 1.8578851483762264, train_acc = 0.996040987424313
test Acc 0.9776536312849162:
6th- epoch: 300, train_loss = 1.8555068919667974, train_acc = 0.996040987424313
test Acc 0.9776536312849162:
6th- epoch: 301, train_loss = 1.8538959237048402, train_acc = 0.996040987424313
test Acc 0.9776536312849162:
6th- epoch: 302, train_loss = 1.8515888713300228, train_acc = 0.996040987424313
test Acc 0.9776536312849162:
6th- epoch: 303, train_loss = 1.848785058944486, train_acc = 0.9961574289706567
test Acc 0.9776536312849162:
6th- epoch: 304, train_loss = 1.8484608245780692, train_acc = 0.996040987424313
test Acc 0.9776536312849162:
6th- epoch: 305, train_loss = 1.8448515856871381, train_acc = 0.996040987424313
test Acc 0.97765363

6th- epoch: 447, train_loss = 1.6538528501987457, train_acc = 0.996040987424313
test Acc 0.9776536312849162:
6th- epoch: 448, train_loss = 1.6534072533249855, train_acc = 0.996040987424313
test Acc 0.9776536312849162:
6th- epoch: 449, train_loss = 1.6536318150465377, train_acc = 0.996040987424313
test Acc 0.9776536312849162:
6th- epoch: 450, train_loss = 1.651420985639561, train_acc = 0.996040987424313
test Acc 0.9776536312849162:
6th- epoch: 451, train_loss = 1.6509560297126882, train_acc = 0.996040987424313
test Acc 0.9776536312849162:
6th- epoch: 452, train_loss = 1.6501392896170728, train_acc = 0.996040987424313
test Acc 0.9776536312849162:
6th- epoch: 453, train_loss = 1.6488796534831636, train_acc = 0.996040987424313
test Acc 0.9776536312849162:
6th- epoch: 454, train_loss = 1.6464172179694287, train_acc = 0.996040987424313
test Acc 0.9776536312849162:
6th- epoch: 455, train_loss = 1.6467168641393073, train_acc = 0.996040987424313
test Acc 0.9776536312849162:
6th- epoch: 456, tra

 20%|██████████████▌                                                          | 6/30 [54:20<3:37:34, 543.93s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
7th- epoch: 0, train_loss = 93.45585179328918, train_acc = 0.8068234746157429
test Acc 0.8924581005586593:
7th- epoch: 1, train_loss = 42.215537786483765, train_acc = 0.916394969725198
test Acc 0.9203910614525139:
7th- epoch: 2, train_loss = 32.90927780047059, train_acc = 0.9353749417792269
test Acc 0.9334264432029795:
7th- epoch: 3, train_loss = 27.691766619682312, train_acc = 0.9431765253842571
test Acc 0.9366852886405959:
7th- epoch: 4, train_loss = 24.16898050904274, train_acc = 0.9485328365160689
test Acc 0.9408752327746741:
7th- epoch: 5, train_loss = 21.545543808490038, train_acc = 0.9537727061015371
tes

7th- epoch: 147, train_loss = 2.6706477417610586, train_acc = 0.9941779226828132
test Acc 0.9757914338919925:
7th- epoch: 148, train_loss = 2.6605110689997673, train_acc = 0.994294364229157
test Acc 0.9757914338919925:
7th- epoch: 149, train_loss = 2.6493682130239904, train_acc = 0.994294364229157
test Acc 0.9757914338919925:
7th- epoch: 150, train_loss = 2.6403405778110027, train_acc = 0.994294364229157
test Acc 0.9757914338919925:
7th- epoch: 151, train_loss = 2.6283983602188528, train_acc = 0.994294364229157
test Acc 0.9757914338919925:
7th- epoch: 152, train_loss = 2.6189227998256683, train_acc = 0.994294364229157
test Acc 0.9757914338919925:
7th- epoch: 153, train_loss = 2.6097083589993417, train_acc = 0.994294364229157
test Acc 0.9757914338919925:
7th- epoch: 154, train_loss = 2.5997114828787744, train_acc = 0.994294364229157
test Acc 0.9762569832402235:
7th- epoch: 155, train_loss = 2.591264678630978, train_acc = 0.994294364229157
test Acc 0.9762569832402235:
7th- epoch: 156, tr

7th- epoch: 297, train_loss = 1.8986890513915569, train_acc = 0.9954587796925943
test Acc 0.979050279329609:
7th- epoch: 298, train_loss = 1.8957477423828095, train_acc = 0.995575221238938
test Acc 0.979050279329609:
7th- epoch: 299, train_loss = 1.8939904372673482, train_acc = 0.995575221238938
test Acc 0.979050279329609:
7th- epoch: 300, train_loss = 1.8903544929344207, train_acc = 0.995575221238938
test Acc 0.979050279329609:
7th- epoch: 301, train_loss = 1.8892978292424232, train_acc = 0.995575221238938
test Acc 0.979050279329609:
7th- epoch: 302, train_loss = 1.8867381513118744, train_acc = 0.995575221238938
test Acc 0.979050279329609:
7th- epoch: 303, train_loss = 1.8839505303185433, train_acc = 0.995575221238938
test Acc 0.979050279329609:
7th- epoch: 304, train_loss = 1.881395872682333, train_acc = 0.995575221238938
test Acc 0.979050279329609:
7th- epoch: 305, train_loss = 1.879461983917281, train_acc = 0.995575221238938
test Acc 0.979050279329609:
7th- epoch: 306, train_loss =

7th- epoch: 447, train_loss = 1.6710171848535538, train_acc = 0.995575221238938
test Acc 0.9799813780260708:
7th- epoch: 448, train_loss = 1.669607549905777, train_acc = 0.995575221238938
test Acc 0.9799813780260708:
7th- epoch: 449, train_loss = 1.6693653637776151, train_acc = 0.995575221238938
test Acc 0.9799813780260708:
7th- epoch: 450, train_loss = 1.668058500974439, train_acc = 0.995575221238938
test Acc 0.9799813780260708:
7th- epoch: 451, train_loss = 1.6655446328222752, train_acc = 0.995575221238938
test Acc 0.9799813780260708:
7th- epoch: 452, train_loss = 1.6662688391515985, train_acc = 0.995575221238938
test Acc 0.9799813780260708:
7th- epoch: 453, train_loss = 1.6653286591172218, train_acc = 0.995575221238938
test Acc 0.9799813780260708:
7th- epoch: 454, train_loss = 1.6644697015872225, train_acc = 0.995575221238938
test Acc 0.9799813780260708:
7th- epoch: 455, train_loss = 1.66446727886796, train_acc = 0.995575221238938
test Acc 0.9799813780260708:
7th- epoch: 456, train_

 23%|████████████████▌                                                      | 7/30 [1:03:23<3:28:26, 543.75s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
8th- epoch: 0, train_loss = 104.73707439005375, train_acc = 0.794014904517932
test Acc 0.9031657355679702:
8th- epoch: 1, train_loss = 40.19258721917868, train_acc = 0.9161620866325105
test Acc 0.9250465549348231:
8th- epoch: 2, train_loss = 31.28423283994198, train_acc = 0.9368886818816954
test Acc 0.9357541899441341:
8th- epoch: 3, train_loss = 26.535315711051226, train_acc = 0.9450395901257569
test Acc 0.9404096834264432:
8th- epoch: 4, train_loss = 23.392054785043, train_acc = 0.9500465766185375
test Acc 0.9418063314711359:
8th- epoch: 5, train_loss = 21.106871098279953, train_acc = 0.9551700046576619
test 

8th- epoch: 147, train_loss = 2.7426969911903143, train_acc = 0.993828598043782
test Acc 0.9753258845437617:
8th- epoch: 148, train_loss = 2.73202733322978, train_acc = 0.993828598043782
test Acc 0.9753258845437617:
8th- epoch: 149, train_loss = 2.721505695488304, train_acc = 0.993828598043782
test Acc 0.9753258845437617:
8th- epoch: 150, train_loss = 2.711455923039466, train_acc = 0.993828598043782
test Acc 0.9753258845437617:
8th- epoch: 151, train_loss = 2.7009590030647814, train_acc = 0.993828598043782
test Acc 0.9753258845437617:
8th- epoch: 152, train_loss = 2.6910122907720506, train_acc = 0.993828598043782
test Acc 0.9753258845437617:
8th- epoch: 153, train_loss = 2.679971367586404, train_acc = 0.993828598043782
test Acc 0.9753258845437617:
8th- epoch: 154, train_loss = 2.6706713177263737, train_acc = 0.993828598043782
test Acc 0.9757914338919925:
8th- epoch: 155, train_loss = 2.660890720319003, train_acc = 0.993828598043782
test Acc 0.9757914338919925:
8th- epoch: 156, train_lo

test Acc 0.9799813780260708:
8th- epoch: 297, train_loss = 1.9582838658243418, train_acc = 0.9952258965999069
test Acc 0.9799813780260708:
8th- epoch: 298, train_loss = 1.9573856722563505, train_acc = 0.9952258965999069
test Acc 0.9799813780260708:
8th- epoch: 299, train_loss = 1.954295014962554, train_acc = 0.9952258965999069
test Acc 0.9799813780260708:
8th- epoch: 300, train_loss = 1.9525586999952793, train_acc = 0.9952258965999069
test Acc 0.9799813780260708:
8th- epoch: 301, train_loss = 1.949568297015503, train_acc = 0.9952258965999069
test Acc 0.9799813780260708:
8th- epoch: 302, train_loss = 1.9474519200157374, train_acc = 0.9952258965999069
test Acc 0.9799813780260708:
8th- epoch: 303, train_loss = 1.9437498759943992, train_acc = 0.9952258965999069
test Acc 0.9799813780260708:
8th- epoch: 304, train_loss = 1.942150078713894, train_acc = 0.9952258965999069
test Acc 0.9799813780260708:
8th- epoch: 305, train_loss = 1.9401319392491132, train_acc = 0.9952258965999069
test Acc 0.97

8th- epoch: 445, train_loss = 1.7197730224579573, train_acc = 0.9949930135072194
test Acc 0.9809124767225326:
8th- epoch: 446, train_loss = 1.7178339045494795, train_acc = 0.9949930135072194
test Acc 0.9809124767225326:
8th- epoch: 447, train_loss = 1.7174648009240627, train_acc = 0.9949930135072194
test Acc 0.9809124767225326:
8th- epoch: 448, train_loss = 1.7153512127697468, train_acc = 0.9949930135072194
test Acc 0.9809124767225326:
8th- epoch: 449, train_loss = 1.7155224749585614, train_acc = 0.9949930135072194
test Acc 0.9809124767225326:
8th- epoch: 450, train_loss = 1.7142446072539315, train_acc = 0.9949930135072194
test Acc 0.9809124767225326:
8th- epoch: 451, train_loss = 1.7126459274441004, train_acc = 0.9949930135072194
test Acc 0.9809124767225326:
8th- epoch: 452, train_loss = 1.7121675051748753, train_acc = 0.9949930135072194
test Acc 0.9809124767225326:
8th- epoch: 453, train_loss = 1.7104446204612032, train_acc = 0.9949930135072194
test Acc 0.9809124767225326:
8th- epoch

 27%|██████████████████▉                                                    | 8/30 [1:12:27<3:19:22, 543.76s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
9th- epoch: 0, train_loss = 119.15285448729992, train_acc = 0.7678155565905915
test Acc 0.8649906890130353:
9th- epoch: 1, train_loss = 42.46607218682766, train_acc = 0.9104564508616675
test Acc 0.9152700186219739:
9th- epoch: 2, train_loss = 32.192509576678276, train_acc = 0.9326967862133209
test Acc 0.9283054003724395:
9th- epoch: 3, train_loss = 27.226513400673866, train_acc = 0.9430600838379134
test Acc 0.9357541899441341:
9th- epoch: 4, train_loss = 24.028793692588806, train_acc = 0.9494643688868188
test Acc 0.9408752327746741:
9th- epoch: 5, train_loss = 21.741251714527607, train_acc = 0.9551700046576619


9th- epoch: 147, train_loss = 2.810593380127102, train_acc = 0.9940614811364695
test Acc 0.9776536312849162:
9th- epoch: 148, train_loss = 2.79950083559379, train_acc = 0.9940614811364695
test Acc 0.9776536312849162:
9th- epoch: 149, train_loss = 2.787711217533797, train_acc = 0.9940614811364695
test Acc 0.9776536312849162:
9th- epoch: 150, train_loss = 2.7764270063489676, train_acc = 0.9940614811364695
test Acc 0.9776536312849162:
9th- epoch: 151, train_loss = 2.7634201725013554, train_acc = 0.9940614811364695
test Acc 0.9776536312849162:
9th- epoch: 152, train_loss = 2.752212563995272, train_acc = 0.9940614811364695
test Acc 0.9776536312849162:
9th- epoch: 153, train_loss = 2.7435455680824816, train_acc = 0.9941779226828132
test Acc 0.9776536312849162:
9th- epoch: 154, train_loss = 2.7314841193147004, train_acc = 0.9941779226828132
test Acc 0.9776536312849162:
9th- epoch: 155, train_loss = 2.7223116834647954, train_acc = 0.994294364229157
test Acc 0.9776536312849162:
9th- epoch: 156,

test Acc 0.9804469273743017:
9th- epoch: 297, train_loss = 1.9467100538313389, train_acc = 0.9954587796925943
test Acc 0.9804469273743017:
9th- epoch: 298, train_loss = 1.9442940999288112, train_acc = 0.9954587796925943
test Acc 0.9804469273743017:
9th- epoch: 299, train_loss = 1.9417319509666413, train_acc = 0.9954587796925943
test Acc 0.9804469273743017:
9th- epoch: 300, train_loss = 1.9385693781077862, train_acc = 0.9954587796925943
test Acc 0.9804469273743017:
9th- epoch: 301, train_loss = 1.9365805871784687, train_acc = 0.9954587796925943
test Acc 0.9804469273743017:
9th- epoch: 302, train_loss = 1.9334032621700317, train_acc = 0.9954587796925943
test Acc 0.9804469273743017:
9th- epoch: 303, train_loss = 1.9313926063477993, train_acc = 0.9954587796925943
test Acc 0.9804469273743017:
9th- epoch: 304, train_loss = 1.9285337675828487, train_acc = 0.9954587796925943
test Acc 0.9804469273743017:
9th- epoch: 305, train_loss = 1.9265826232731342, train_acc = 0.9954587796925943
test Acc 0

9th- epoch: 446, train_loss = 1.6992808716604486, train_acc = 0.995575221238938
test Acc 0.9799813780260708:
9th- epoch: 447, train_loss = 1.6982489041984081, train_acc = 0.995575221238938
test Acc 0.9799813780260708:
9th- epoch: 448, train_loss = 1.695382572710514, train_acc = 0.995575221238938
test Acc 0.9799813780260708:
9th- epoch: 449, train_loss = 1.6950025794794783, train_acc = 0.995575221238938
test Acc 0.9799813780260708:
9th- epoch: 450, train_loss = 1.6940661879489198, train_acc = 0.995575221238938
test Acc 0.9799813780260708:
9th- epoch: 451, train_loss = 1.6934296352555975, train_acc = 0.995575221238938
test Acc 0.9799813780260708:
9th- epoch: 452, train_loss = 1.6921587524702772, train_acc = 0.995575221238938
test Acc 0.9799813780260708:
9th- epoch: 453, train_loss = 1.6905798179795966, train_acc = 0.995575221238938
test Acc 0.9799813780260708:
9th- epoch: 454, train_loss = 1.6885807266226038, train_acc = 0.995575221238938
test Acc 0.9799813780260708:
9th- epoch: 455, tra

 30%|█████████████████████▎                                                 | 9/30 [1:21:32<3:10:27, 544.17s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
10th- epoch: 0, train_loss = 115.89155440032482, train_acc = 0.7826036329762459
test Acc 0.888268156424581:
10th- epoch: 1, train_loss = 42.09839668869972, train_acc = 0.9156963204471356
test Acc 0.9269087523277467:
10th- epoch: 2, train_loss = 31.975367955863476, train_acc = 0.933977643223102
test Acc 0.9371508379888268:
10th- epoch: 3, train_loss = 26.802278637886047, train_acc = 0.9442244993013508
test Acc 0.9432029795158287:
10th- epoch: 4, train_loss = 23.47108968347311, train_acc = 0.9517931998136935
test Acc 0.9464618249534451:
10th- epoch: 5, train_loss = 21.116410303860903, train_acc = 0.95586865393572

10th- epoch: 146, train_loss = 2.7304573878645897, train_acc = 0.9937121564974383
test Acc 0.9757914338919925:
10th- epoch: 147, train_loss = 2.7177151441574097, train_acc = 0.993828598043782
test Acc 0.9762569832402235:
10th- epoch: 148, train_loss = 2.7071384005248547, train_acc = 0.9937121564974383
test Acc 0.9753258845437617:
10th- epoch: 149, train_loss = 2.6974664381705225, train_acc = 0.9937121564974383
test Acc 0.9762569832402235:
10th- epoch: 150, train_loss = 2.686088731046766, train_acc = 0.9937121564974383
test Acc 0.9762569832402235:
10th- epoch: 151, train_loss = 2.676719143986702, train_acc = 0.9937121564974383
test Acc 0.9762569832402235:
10th- epoch: 152, train_loss = 2.665029080118984, train_acc = 0.9937121564974383
test Acc 0.9762569832402235:
10th- epoch: 153, train_loss = 2.654880865011364, train_acc = 0.9937121564974383
test Acc 0.9757914338919925:
10th- epoch: 154, train_loss = 2.643146345857531, train_acc = 0.993828598043782
test Acc 0.9762569832402235:
10th- ep

test Acc 0.9795158286778398:
10th- epoch: 295, train_loss = 1.9321190405171365, train_acc = 0.9956916627852818
test Acc 0.9795158286778398:
10th- epoch: 296, train_loss = 1.9291876864153892, train_acc = 0.995575221238938
test Acc 0.9795158286778398:
10th- epoch: 297, train_loss = 1.9272029536077753, train_acc = 0.9956916627852818
test Acc 0.9795158286778398:
10th- epoch: 298, train_loss = 1.9254018465289846, train_acc = 0.995575221238938
test Acc 0.9795158286778398:
10th- epoch: 299, train_loss = 1.9227713234722614, train_acc = 0.9956916627852818
test Acc 0.9795158286778398:
10th- epoch: 300, train_loss = 1.9207878274610266, train_acc = 0.9956916627852818
test Acc 0.9795158286778398:
10th- epoch: 301, train_loss = 1.918706238269806, train_acc = 0.995575221238938
test Acc 0.9795158286778398:
10th- epoch: 302, train_loss = 1.9154334949562326, train_acc = 0.9956916627852818
test Acc 0.9795158286778398:
10th- epoch: 303, train_loss = 1.9136666767299175, train_acc = 0.9956916627852818
test 

test Acc 0.9804469273743017:
10th- epoch: 443, train_loss = 1.7084277620306239, train_acc = 0.9954587796925943
test Acc 0.9804469273743017:
10th- epoch: 444, train_loss = 1.7073801085352898, train_acc = 0.9954587796925943
test Acc 0.9804469273743017:
10th- epoch: 445, train_loss = 1.7063858335604891, train_acc = 0.9954587796925943
test Acc 0.9804469273743017:
10th- epoch: 446, train_loss = 1.7060586934676394, train_acc = 0.9954587796925943
test Acc 0.9804469273743017:
10th- epoch: 447, train_loss = 1.7038697078824043, train_acc = 0.9954587796925943
test Acc 0.9804469273743017:
10th- epoch: 448, train_loss = 1.7034988068044186, train_acc = 0.9954587796925943
test Acc 0.9804469273743017:
10th- epoch: 449, train_loss = 1.703413862735033, train_acc = 0.9954587796925943
test Acc 0.9804469273743017:
10th- epoch: 450, train_loss = 1.7024077387759462, train_acc = 0.9954587796925943
test Acc 0.9804469273743017:
10th- epoch: 451, train_loss = 1.7000627579400316, train_acc = 0.9954587796925943
te

 33%|███████████████████████▎                                              | 10/30 [1:30:37<3:01:26, 544.32s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
11th- epoch: 0, train_loss = 105.91318941116333, train_acc = 0.7821378667908709
test Acc 0.8868715083798883:
11th- epoch: 1, train_loss = 43.831471629440784, train_acc = 0.912435957149511
test Acc 0.9180633147113594:
11th- epoch: 2, train_loss = 34.084251061081886, train_acc = 0.9303679552864462
test Acc 0.9334264432029795:
11th- epoch: 3, train_loss = 28.805090375244617, train_acc = 0.939683278993945
test Acc 0.9408752327746741:
11th- epoch: 4, train_loss = 25.24021750688553, train_acc = 0.9473684210526315
test Acc 0.9464618249534451:
11th- epoch: 5, train_loss = 22.66324845701456, train_acc = 0.95272473218444

test Acc 0.973463687150838:
11th- epoch: 146, train_loss = 2.7192429900169373, train_acc = 0.9949930135072194
test Acc 0.973463687150838:
11th- epoch: 147, train_loss = 2.707244584802538, train_acc = 0.9947601304145319
test Acc 0.973463687150838:
11th- epoch: 148, train_loss = 2.6956415832974017, train_acc = 0.9949930135072194
test Acc 0.973463687150838:
11th- epoch: 149, train_loss = 2.6878400780260563, train_acc = 0.9951094550535631
test Acc 0.973463687150838:
11th- epoch: 150, train_loss = 2.6771997462492436, train_acc = 0.9951094550535631
test Acc 0.973463687150838:
11th- epoch: 151, train_loss = 2.6664946030359715, train_acc = 0.9951094550535631
test Acc 0.973463687150838:
11th- epoch: 152, train_loss = 2.657055673422292, train_acc = 0.9951094550535631
test Acc 0.973463687150838:
11th- epoch: 153, train_loss = 2.6467496615368873, train_acc = 0.9949930135072194
test Acc 0.973463687150838:
11th- epoch: 154, train_loss = 2.63748657819815, train_acc = 0.9951094550535631
test Acc 0.973

11th- epoch: 294, train_loss = 1.9364739209413528, train_acc = 0.9956916627852818
test Acc 0.979050279329609:
11th- epoch: 295, train_loss = 1.9333088161656633, train_acc = 0.9956916627852818
test Acc 0.979050279329609:
11th- epoch: 296, train_loss = 1.932306615053676, train_acc = 0.9956916627852818
test Acc 0.979050279329609:
11th- epoch: 297, train_loss = 1.9292755151400343, train_acc = 0.9956916627852818
test Acc 0.979050279329609:
11th- epoch: 298, train_loss = 1.9261201148619875, train_acc = 0.9956916627852818
test Acc 0.979050279329609:
11th- epoch: 299, train_loss = 1.9225894175469875, train_acc = 0.9956916627852818
test Acc 0.979050279329609:
11th- epoch: 300, train_loss = 1.9218319592764601, train_acc = 0.9956916627852818
test Acc 0.9795158286778398:
11th- epoch: 301, train_loss = 1.918243887485005, train_acc = 0.9956916627852818
test Acc 0.9795158286778398:
11th- epoch: 302, train_loss = 1.9160424806177616, train_acc = 0.9956916627852818
test Acc 0.9795158286778398:
11th- epo

11th- epoch: 442, train_loss = 1.6963358409702778, train_acc = 0.9954587796925943
test Acc 0.978584729981378:
11th- epoch: 443, train_loss = 1.696091226011049, train_acc = 0.9954587796925943
test Acc 0.978584729981378:
11th- epoch: 444, train_loss = 1.6958427391946316, train_acc = 0.9954587796925943
test Acc 0.978584729981378:
11th- epoch: 445, train_loss = 1.6929027922451496, train_acc = 0.9954587796925943
test Acc 0.978584729981378:
11th- epoch: 446, train_loss = 1.6932292605633847, train_acc = 0.9954587796925943
test Acc 0.978584729981378:
11th- epoch: 447, train_loss = 1.692308199882973, train_acc = 0.9954587796925943
test Acc 0.978584729981378:
11th- epoch: 448, train_loss = 1.6926896857912652, train_acc = 0.9954587796925943
test Acc 0.978584729981378:
11th- epoch: 449, train_loss = 1.6917175737326033, train_acc = 0.9954587796925943
test Acc 0.978584729981378:
11th- epoch: 450, train_loss = 1.6912401740555651, train_acc = 0.9954587796925943
test Acc 0.978584729981378:
11th- epoch:

 37%|█████████████████████████▋                                            | 11/30 [1:39:40<2:52:19, 544.17s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
12th- epoch: 0, train_loss = 107.21029570698738, train_acc = 0.7962272938984629
test Acc 0.8868715083798883:
12th- epoch: 1, train_loss = 41.80223961919546, train_acc = 0.915929203539823
test Acc 0.9329608938547486:
12th- epoch: 2, train_loss = 32.58128770068288, train_acc = 0.935258500232883
test Acc 0.9432029795158287:
12th- epoch: 3, train_loss = 27.713868524879217, train_acc = 0.945388914764788
test Acc 0.946927374301676:
12th- epoch: 4, train_loss = 24.44312271475792, train_acc = 0.9514438751746623
test Acc 0.9487895716945997:
12th- epoch: 5, train_loss = 22.028920505195856, train_acc = 0.9563344201210993


12th- epoch: 146, train_loss = 2.707168899476528, train_acc = 0.993828598043782
test Acc 0.9757914338919925:
12th- epoch: 147, train_loss = 2.697041163686663, train_acc = 0.9939450395901258
test Acc 0.9757914338919925:
12th- epoch: 148, train_loss = 2.6875074305571616, train_acc = 0.993828598043782
test Acc 0.9757914338919925:
12th- epoch: 149, train_loss = 2.676521184388548, train_acc = 0.9939450395901258
test Acc 0.9757914338919925:
12th- epoch: 150, train_loss = 2.6656862013041973, train_acc = 0.9939450395901258
test Acc 0.9757914338919925:
12th- epoch: 151, train_loss = 2.655226308386773, train_acc = 0.9939450395901258
test Acc 0.9757914338919925:
12th- epoch: 152, train_loss = 2.645245846360922, train_acc = 0.9939450395901258
test Acc 0.9757914338919925:
12th- epoch: 153, train_loss = 2.635562409181148, train_acc = 0.9939450395901258
test Acc 0.9757914338919925:
12th- epoch: 154, train_loss = 2.625993942376226, train_acc = 0.9939450395901258
test Acc 0.9757914338919925:
12th- epoc

12th- epoch: 294, train_loss = 1.9484646631171927, train_acc = 0.9951094550535631
test Acc 0.9776536312849162:
12th- epoch: 295, train_loss = 1.9455721912672743, train_acc = 0.9952258965999069
test Acc 0.9776536312849162:
12th- epoch: 296, train_loss = 1.9425650052726269, train_acc = 0.9952258965999069
test Acc 0.9776536312849162:
12th- epoch: 297, train_loss = 1.9407431818544865, train_acc = 0.9952258965999069
test Acc 0.9776536312849162:
12th- epoch: 298, train_loss = 1.9382325522601604, train_acc = 0.9951094550535631
test Acc 0.9776536312849162:
12th- epoch: 299, train_loss = 1.9350974075496197, train_acc = 0.9951094550535631
test Acc 0.9781191806331471:
12th- epoch: 300, train_loss = 1.9326025123009458, train_acc = 0.9951094550535631
test Acc 0.9776536312849162:
12th- epoch: 301, train_loss = 1.9295726729324088, train_acc = 0.9951094550535631
test Acc 0.9776536312849162:
12th- epoch: 302, train_loss = 1.9272363409399986, train_acc = 0.9951094550535631
test Acc 0.9776536312849162:
1

test Acc 0.9776536312849162:
12th- epoch: 442, train_loss = 1.7128496058285236, train_acc = 0.995575221238938
test Acc 0.9776536312849162:
12th- epoch: 443, train_loss = 1.7106639854609966, train_acc = 0.995575221238938
test Acc 0.9776536312849162:
12th- epoch: 444, train_loss = 1.7114318497478962, train_acc = 0.995575221238938
test Acc 0.9776536312849162:
12th- epoch: 445, train_loss = 1.7096626262064092, train_acc = 0.995575221238938
test Acc 0.9776536312849162:
12th- epoch: 446, train_loss = 1.7086374126374722, train_acc = 0.995575221238938
test Acc 0.9776536312849162:
12th- epoch: 447, train_loss = 1.7078332875971682, train_acc = 0.995575221238938
test Acc 0.9776536312849162:
12th- epoch: 448, train_loss = 1.7062047098879702, train_acc = 0.995575221238938
test Acc 0.9776536312849162:
12th- epoch: 449, train_loss = 1.7051380798220634, train_acc = 0.995575221238938
test Acc 0.9776536312849162:
12th- epoch: 450, train_loss = 1.7044368485803716, train_acc = 0.995575221238938
test Acc 0

 40%|████████████████████████████                                          | 12/30 [1:48:42<2:43:03, 543.54s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
13th- epoch: 0, train_loss = 110.09092658758163, train_acc = 0.7831858407079646
test Acc 0.8729050279329609:
13th- epoch: 1, train_loss = 43.50572842359543, train_acc = 0.911504424778761
test Acc 0.9273743016759777:
13th- epoch: 2, train_loss = 32.57695250585675, train_acc = 0.9338612016767582
test Acc 0.9371508379888268:
13th- epoch: 3, train_loss = 27.43114423006773, train_acc = 0.9466697717745691
test Acc 0.9432029795158287:
13th- epoch: 4, train_loss = 24.160670079290867, train_acc = 0.952491849091756
test Acc 0.9459962756052142:
13th- epoch: 5, train_loss = 21.76900590956211, train_acc = 0.9563344201210993

13th- epoch: 146, train_loss = 2.7759797810576856, train_acc = 0.9940614811364695
test Acc 0.9776536312849162:
13th- epoch: 147, train_loss = 2.7647250718437135, train_acc = 0.9940614811364695
test Acc 0.9776536312849162:
13th- epoch: 148, train_loss = 2.7536980025470257, train_acc = 0.9940614811364695
test Acc 0.9776536312849162:
13th- epoch: 149, train_loss = 2.742251785006374, train_acc = 0.9940614811364695
test Acc 0.9776536312849162:
13th- epoch: 150, train_loss = 2.73132586106658, train_acc = 0.9940614811364695
test Acc 0.9776536312849162:
13th- epoch: 151, train_loss = 2.7219973169267178, train_acc = 0.9940614811364695
test Acc 0.9776536312849162:
13th- epoch: 152, train_loss = 2.7104423134587705, train_acc = 0.9940614811364695
test Acc 0.9776536312849162:
13th- epoch: 153, train_loss = 2.7006699331104755, train_acc = 0.9940614811364695
test Acc 0.9776536312849162:
13th- epoch: 154, train_loss = 2.6899529048241675, train_acc = 0.9941779226828132
test Acc 0.9776536312849162:
13th

test Acc 0.979050279329609:
13th- epoch: 295, train_loss = 1.9423936840612441, train_acc = 0.9949930135072194
test Acc 0.979050279329609:
13th- epoch: 296, train_loss = 1.9406474865972996, train_acc = 0.9953423381462506
test Acc 0.979050279329609:
13th- epoch: 297, train_loss = 1.9384002399165183, train_acc = 0.9954587796925943
test Acc 0.979050279329609:
13th- epoch: 298, train_loss = 1.936124611645937, train_acc = 0.9954587796925943
test Acc 0.979050279329609:
13th- epoch: 299, train_loss = 1.9330733206588775, train_acc = 0.9954587796925943
test Acc 0.979050279329609:
13th- epoch: 300, train_loss = 1.931103588314727, train_acc = 0.9954587796925943
test Acc 0.979050279329609:
13th- epoch: 301, train_loss = 1.9284034930169582, train_acc = 0.9954587796925943
test Acc 0.979050279329609:
13th- epoch: 302, train_loss = 1.9251621912699193, train_acc = 0.9954587796925943
test Acc 0.979050279329609:
13th- epoch: 303, train_loss = 1.9243655018508434, train_acc = 0.9954587796925943
test Acc 0.9

13th- epoch: 443, train_loss = 1.6989962483057752, train_acc = 0.9954587796925943
test Acc 0.9795158286778398:
13th- epoch: 444, train_loss = 1.6935277344891801, train_acc = 0.9954587796925943
test Acc 0.9795158286778398:
13th- epoch: 445, train_loss = 1.6960911663481966, train_acc = 0.9954587796925943
test Acc 0.9795158286778398:
13th- epoch: 446, train_loss = 1.692994687706232, train_acc = 0.9954587796925943
test Acc 0.9795158286778398:
13th- epoch: 447, train_loss = 1.694527999847196, train_acc = 0.9954587796925943
test Acc 0.9795158286778398:
13th- epoch: 448, train_loss = 1.6899212213465944, train_acc = 0.9954587796925943
test Acc 0.9795158286778398:
13th- epoch: 449, train_loss = 1.6930359365651384, train_acc = 0.9954587796925943
test Acc 0.9795158286778398:
13th- epoch: 450, train_loss = 1.6887801116099581, train_acc = 0.9954587796925943
test Acc 0.9795158286778398:
13th- epoch: 451, train_loss = 1.6896248484263197, train_acc = 0.9954587796925943
test Acc 0.9795158286778398:
13t

 43%|██████████████████████████████▎                                       | 13/30 [1:57:45<2:33:54, 543.19s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
14th- epoch: 0, train_loss = 113.30852463841438, train_acc = 0.8013507219375874
test Acc 0.9017690875232774:
14th- epoch: 1, train_loss = 42.9876928254962, train_acc = 0.9168607359105729
test Acc 0.931098696461825:
14th- epoch: 2, train_loss = 33.2076660245657, train_acc = 0.9375873311597578
test Acc 0.9380819366852886:
14th- epoch: 3, train_loss = 28.21143900230527, train_acc = 0.9466697717745691
test Acc 0.9478584729981379:
14th- epoch: 4, train_loss = 24.910916160792112, train_acc = 0.9529576152771309
test Acc 0.9492551210428305:
14th- epoch: 5, train_loss = 22.459322184324265, train_acc = 0.9573823940381928

14th- epoch: 146, train_loss = 2.7938651801086962, train_acc = 0.9946436888681882
test Acc 0.9748603351955307:
14th- epoch: 147, train_loss = 2.7817059233784676, train_acc = 0.9946436888681882
test Acc 0.9748603351955307:
14th- epoch: 148, train_loss = 2.7709019244648516, train_acc = 0.9946436888681882
test Acc 0.9748603351955307:
14th- epoch: 149, train_loss = 2.7597484812140465, train_acc = 0.9946436888681882
test Acc 0.9748603351955307:
14th- epoch: 150, train_loss = 2.746914379298687, train_acc = 0.9946436888681882
test Acc 0.9748603351955307:
14th- epoch: 151, train_loss = 2.736286237835884, train_acc = 0.9946436888681882
test Acc 0.9748603351955307:
14th- epoch: 152, train_loss = 2.7263669706881046, train_acc = 0.9946436888681882
test Acc 0.9748603351955307:
14th- epoch: 153, train_loss = 2.7135296030901372, train_acc = 0.9948765719608756
test Acc 0.9748603351955307:
14th- epoch: 154, train_loss = 2.7044337638653815, train_acc = 0.9948765719608756
test Acc 0.9748603351955307:
14t

14th- epoch: 294, train_loss = 1.9583264142274857, train_acc = 0.9954587796925943
test Acc 0.979050279329609:
14th- epoch: 295, train_loss = 1.9544083636719733, train_acc = 0.9954587796925943
test Acc 0.979050279329609:
14th- epoch: 296, train_loss = 1.9531192146241665, train_acc = 0.9954587796925943
test Acc 0.979050279329609:
14th- epoch: 297, train_loss = 1.948346097022295, train_acc = 0.9954587796925943
test Acc 0.979050279329609:
14th- epoch: 298, train_loss = 1.9471166208386421, train_acc = 0.9954587796925943
test Acc 0.979050279329609:
14th- epoch: 299, train_loss = 1.9432523536961526, train_acc = 0.9954587796925943
test Acc 0.979050279329609:
14th- epoch: 300, train_loss = 1.9427524332422763, train_acc = 0.9954587796925943
test Acc 0.979050279329609:
14th- epoch: 301, train_loss = 1.9396912194788456, train_acc = 0.9954587796925943
test Acc 0.979050279329609:
14th- epoch: 302, train_loss = 1.935838658362627, train_acc = 0.9954587796925943
test Acc 0.979050279329609:
14th- epoch:

14th- epoch: 443, train_loss = 1.7041202721884474, train_acc = 0.996040987424313
test Acc 0.979050279329609:
14th- epoch: 444, train_loss = 1.7020158605882898, train_acc = 0.996040987424313
test Acc 0.979050279329609:
14th- epoch: 445, train_loss = 1.7010691264877096, train_acc = 0.996040987424313
test Acc 0.979050279329609:
14th- epoch: 446, train_loss = 1.700185506255366, train_acc = 0.996040987424313
test Acc 0.979050279329609:
14th- epoch: 447, train_loss = 1.6993333660066128, train_acc = 0.996040987424313
test Acc 0.979050279329609:
14th- epoch: 448, train_loss = 1.698043517768383, train_acc = 0.996040987424313
test Acc 0.979050279329609:
14th- epoch: 449, train_loss = 1.6969594297697768, train_acc = 0.996040987424313
test Acc 0.979050279329609:
14th- epoch: 450, train_loss = 1.6960982432356104, train_acc = 0.996040987424313
test Acc 0.979050279329609:
14th- epoch: 451, train_loss = 1.694388127536513, train_acc = 0.996040987424313
test Acc 0.979050279329609:
14th- epoch: 452, trai

 47%|████████████████████████████████▋                                     | 14/30 [2:06:47<2:24:47, 542.94s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
15th- epoch: 0, train_loss = 120.19700223207474, train_acc = 0.78959012575687
test Acc 0.883147113594041:
15th- epoch: 1, train_loss = 42.51785994321108, train_acc = 0.9147647880763856
test Acc 0.925512104283054:
15th- epoch: 2, train_loss = 31.886488676071167, train_acc = 0.9329296693060084
test Acc 0.9376163873370578:
15th- epoch: 3, train_loss = 26.47762479633093, train_acc = 0.9421285514671635
test Acc 0.9441340782122905:
15th- epoch: 4, train_loss = 22.96200193092227, train_acc = 0.9503959012575687
test Acc 0.9478584729981379:
15th- epoch: 5, train_loss = 20.405875209718943, train_acc = 0.9568001863064741


15th- epoch: 146, train_loss = 2.539174938108772, train_acc = 0.9952258965999069
test Acc 0.9799813780260708:
15th- epoch: 147, train_loss = 2.5302457720972598, train_acc = 0.9952258965999069
test Acc 0.9799813780260708:
15th- epoch: 148, train_loss = 2.5205173254944384, train_acc = 0.9952258965999069
test Acc 0.9804469273743017:
15th- epoch: 149, train_loss = 2.5130036659538746, train_acc = 0.9953423381462506
test Acc 0.9804469273743017:
15th- epoch: 150, train_loss = 2.502740120049566, train_acc = 0.9953423381462506
test Acc 0.9804469273743017:
15th- epoch: 151, train_loss = 2.495870105922222, train_acc = 0.9953423381462506
test Acc 0.9804469273743017:
15th- epoch: 152, train_loss = 2.486542528960854, train_acc = 0.9952258965999069
test Acc 0.9804469273743017:
15th- epoch: 153, train_loss = 2.47770152753219, train_acc = 0.9952258965999069
test Acc 0.9804469273743017:
15th- epoch: 154, train_loss = 2.4701258279383183, train_acc = 0.9953423381462506
test Acc 0.9804469273743017:
15th- e

15th- epoch: 294, train_loss = 1.8834787321975455, train_acc = 0.995575221238938
test Acc 0.9818435754189944:
15th- epoch: 295, train_loss = 1.8807030072202906, train_acc = 0.995575221238938
test Acc 0.9818435754189944:
15th- epoch: 296, train_loss = 1.8795435341307893, train_acc = 0.995575221238938
test Acc 0.9818435754189944:
15th- epoch: 297, train_loss = 1.8765311116585508, train_acc = 0.995575221238938
test Acc 0.9818435754189944:
15th- epoch: 298, train_loss = 1.8744758516550064, train_acc = 0.995575221238938
test Acc 0.9818435754189944:
15th- epoch: 299, train_loss = 1.871026168228127, train_acc = 0.995575221238938
test Acc 0.9818435754189944:
15th- epoch: 300, train_loss = 1.8709773421287537, train_acc = 0.995575221238938
test Acc 0.9818435754189944:
15th- epoch: 301, train_loss = 1.8682353608310223, train_acc = 0.995575221238938
test Acc 0.9818435754189944:
15th- epoch: 302, train_loss = 1.8666547375032678, train_acc = 0.995575221238938
test Acc 0.9818435754189944:
15th- epoch

15th- epoch: 442, train_loss = 1.6762950706179254, train_acc = 0.9956916627852818
test Acc 0.9818435754189944:
15th- epoch: 443, train_loss = 1.6741253050859086, train_acc = 0.9956916627852818
test Acc 0.9818435754189944:
15th- epoch: 444, train_loss = 1.6737144167418592, train_acc = 0.9956916627852818
test Acc 0.9818435754189944:
15th- epoch: 445, train_loss = 1.6730139590799809, train_acc = 0.9956916627852818
test Acc 0.9818435754189944:
15th- epoch: 446, train_loss = 1.6742852007155307, train_acc = 0.9956916627852818
test Acc 0.9818435754189944:
15th- epoch: 447, train_loss = 1.6712586631183513, train_acc = 0.9956916627852818
test Acc 0.9818435754189944:
15th- epoch: 448, train_loss = 1.671618773310911, train_acc = 0.9956916627852818
test Acc 0.9818435754189944:
15th- epoch: 449, train_loss = 1.6691798183019273, train_acc = 0.9956916627852818
test Acc 0.9818435754189944:
15th- epoch: 450, train_loss = 1.6685086426441558, train_acc = 0.9956916627852818
test Acc 0.9818435754189944:
15

 50%|███████████████████████████████████                                   | 15/30 [2:15:49<2:15:39, 542.66s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
16th- epoch: 0, train_loss = 103.93933291733265, train_acc = 0.8021658127619935
test Acc 0.8300744878957169:
16th- epoch: 1, train_loss = 42.68801660090685, train_acc = 0.9153469958081043
test Acc 0.8896648044692738:
16th- epoch: 2, train_loss = 33.15369077771902, train_acc = 0.9343269678621332
test Acc 0.9199255121042831:
16th- epoch: 3, train_loss = 28.010819256305695, train_acc = 0.9431765253842571
test Acc 0.9320297951582868:
16th- epoch: 4, train_loss = 24.54947232082486, train_acc = 0.94981369352585
test Acc 0.9343575418994413:
16th- epoch: 5, train_loss = 21.994068637490273, train_acc = 0.956334420121099

16th- epoch: 146, train_loss = 2.6180659788660705, train_acc = 0.9945272473218444
test Acc 0.9711359404096834:
16th- epoch: 147, train_loss = 2.6085220109671354, train_acc = 0.9944108057755007
test Acc 0.9711359404096834:
16th- epoch: 148, train_loss = 2.599269190337509, train_acc = 0.9945272473218444
test Acc 0.9711359404096834:
16th- epoch: 149, train_loss = 2.5893732365220785, train_acc = 0.9945272473218444
test Acc 0.9711359404096834:
16th- epoch: 150, train_loss = 2.5802063471637666, train_acc = 0.9944108057755007
test Acc 0.9711359404096834:
16th- epoch: 151, train_loss = 2.571541449520737, train_acc = 0.9945272473218444
test Acc 0.9711359404096834:
16th- epoch: 152, train_loss = 2.562425192911178, train_acc = 0.9945272473218444
test Acc 0.9711359404096834:
16th- epoch: 153, train_loss = 2.5527996718883514, train_acc = 0.9944108057755007
test Acc 0.9711359404096834:
16th- epoch: 154, train_loss = 2.545249793212861, train_acc = 0.9945272473218444
test Acc 0.9711359404096834:
16th-

16th- epoch: 294, train_loss = 1.9125900684157386, train_acc = 0.9952258965999069
test Acc 0.9757914338919925:
16th- epoch: 295, train_loss = 1.909851118340157, train_acc = 0.9952258965999069
test Acc 0.9757914338919925:
16th- epoch: 296, train_loss = 1.908817840158008, train_acc = 0.9952258965999069
test Acc 0.9757914338919925:
16th- epoch: 297, train_loss = 1.9064653050154448, train_acc = 0.9952258965999069
test Acc 0.9757914338919925:
16th- epoch: 298, train_loss = 1.9042104365071282, train_acc = 0.9952258965999069
test Acc 0.9757914338919925:
16th- epoch: 299, train_loss = 1.9011088827392086, train_acc = 0.9952258965999069
test Acc 0.9757914338919925:
16th- epoch: 300, train_loss = 1.8991284550866112, train_acc = 0.9952258965999069
test Acc 0.9757914338919925:
16th- epoch: 301, train_loss = 1.8970970883965492, train_acc = 0.9952258965999069
test Acc 0.9757914338919925:
16th- epoch: 302, train_loss = 1.8951311396667734, train_acc = 0.9951094550535631
test Acc 0.9753258845437617:
16t

test Acc 0.9767225325884544:
16th- epoch: 442, train_loss = 1.6958835422992706, train_acc = 0.9953423381462506
test Acc 0.9767225325884544:
16th- epoch: 443, train_loss = 1.6954349192674272, train_acc = 0.9953423381462506
test Acc 0.9767225325884544:
16th- epoch: 444, train_loss = 1.694241909950506, train_acc = 0.9953423381462506
test Acc 0.9767225325884544:
16th- epoch: 445, train_loss = 1.6942059167777188, train_acc = 0.9953423381462506
test Acc 0.9767225325884544:
16th- epoch: 446, train_loss = 1.6936086937785149, train_acc = 0.9953423381462506
test Acc 0.9767225325884544:
16th- epoch: 447, train_loss = 1.6925830717082135, train_acc = 0.9953423381462506
test Acc 0.9767225325884544:
16th- epoch: 448, train_loss = 1.6909173894673586, train_acc = 0.9953423381462506
test Acc 0.9767225325884544:
16th- epoch: 449, train_loss = 1.6908176448196173, train_acc = 0.9953423381462506
test Acc 0.9767225325884544:
16th- epoch: 450, train_loss = 1.6884945177589543, train_acc = 0.9953423381462506
te

 53%|█████████████████████████████████████▎                                | 16/30 [2:24:52<2:06:37, 542.66s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
17th- epoch: 0, train_loss = 107.87365773320198, train_acc = 0.8026315789473685
test Acc 0.8654562383612663:
17th- epoch: 1, train_loss = 41.79552835971117, train_acc = 0.9177922682813228
test Acc 0.898975791433892:
17th- epoch: 2, train_loss = 31.800120443105698, train_acc = 0.9377037727061015
test Acc 0.9110800744878957:
17th- epoch: 3, train_loss = 26.607997179031372, train_acc = 0.9456217978574756
test Acc 0.925512104283054:
17th- epoch: 4, train_loss = 23.19555378332734, train_acc = 0.9508616674429436
test Acc 0.9352886405959032:
17th- epoch: 5, train_loss = 20.683591309934855, train_acc = 0.95598509548206

17th- epoch: 146, train_loss = 2.7394340720493346, train_acc = 0.994294364229157
test Acc 0.9776536312849162:
17th- epoch: 147, train_loss = 2.727941842051223, train_acc = 0.994294364229157
test Acc 0.9776536312849162:
17th- epoch: 148, train_loss = 2.7164813752751797, train_acc = 0.994294364229157
test Acc 0.9776536312849162:
17th- epoch: 149, train_loss = 2.7052566695492715, train_acc = 0.994294364229157
test Acc 0.9776536312849162:
17th- epoch: 150, train_loss = 2.695041333558038, train_acc = 0.994294364229157
test Acc 0.9776536312849162:
17th- epoch: 151, train_loss = 2.685997150838375, train_acc = 0.994294364229157
test Acc 0.9776536312849162:
17th- epoch: 152, train_loss = 2.674946417333558, train_acc = 0.994294364229157
test Acc 0.9776536312849162:
17th- epoch: 153, train_loss = 2.6631306011695415, train_acc = 0.9944108057755007
test Acc 0.9776536312849162:
17th- epoch: 154, train_loss = 2.654260865179822, train_acc = 0.994294364229157
test Acc 0.9776536312849162:
17th- epoch: 1

17th- epoch: 294, train_loss = 1.9337955067167059, train_acc = 0.9956916627852818
test Acc 0.979050279329609:
17th- epoch: 295, train_loss = 1.9309313707053661, train_acc = 0.9956916627852818
test Acc 0.979050279329609:
17th- epoch: 296, train_loss = 1.92938581854105, train_acc = 0.9956916627852818
test Acc 0.979050279329609:
17th- epoch: 297, train_loss = 1.9264258792391047, train_acc = 0.9956916627852818
test Acc 0.979050279329609:
17th- epoch: 298, train_loss = 1.9241057323524728, train_acc = 0.9956916627852818
test Acc 0.979050279329609:
17th- epoch: 299, train_loss = 1.9215584844350815, train_acc = 0.9956916627852818
test Acc 0.979050279329609:
17th- epoch: 300, train_loss = 1.9181746704271063, train_acc = 0.9956916627852818
test Acc 0.979050279329609:
17th- epoch: 301, train_loss = 1.9163521267473698, train_acc = 0.9956916627852818
test Acc 0.979050279329609:
17th- epoch: 302, train_loss = 1.9142038399586454, train_acc = 0.9956916627852818
test Acc 0.979050279329609:
17th- epoch:

17th- epoch: 442, train_loss = 1.6928775496780872, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
17th- epoch: 443, train_loss = 1.691407072066795, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
17th- epoch: 444, train_loss = 1.6905198867316358, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
17th- epoch: 445, train_loss = 1.6897721613640897, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
17th- epoch: 446, train_loss = 1.6883662070031278, train_acc = 0.9956916627852818
test Acc 0.9781191806331471:
17th- epoch: 447, train_loss = 1.6873165468568914, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
17th- epoch: 448, train_loss = 1.6868657183949836, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
17th- epoch: 449, train_loss = 1.6857951444690116, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
17th- epoch: 450, train_loss = 1.6847756157512777, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
17th- epoc

 57%|███████████████████████████████████████▋                              | 17/30 [2:33:54<1:57:33, 542.54s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
18th- epoch: 0, train_loss = 101.42842911183834, train_acc = 0.7922682813227759
test Acc 0.8854748603351955:
18th- epoch: 1, train_loss = 41.419960260391235, train_acc = 0.9145319049836982
test Acc 0.9222532588454376:
18th- epoch: 2, train_loss = 32.25364777445793, train_acc = 0.9325803446669771
test Acc 0.9390130353817505:
18th- epoch: 3, train_loss = 27.3325407654047, train_acc = 0.9428272007452259
test Acc 0.9450651769087524:
18th- epoch: 4, train_loss = 24.01680977270007, train_acc = 0.9501630181648812
test Acc 0.9492551210428305:
18th- epoch: 5, train_loss = 21.591693732887506, train_acc = 0.95365626455519

test Acc 0.973463687150838:
18th- epoch: 72, train_loss = 4.295250819995999, train_acc = 0.9914997671169073
test Acc 0.973463687150838:
18th- epoch: 73, train_loss = 4.253808477893472, train_acc = 0.9914997671169073
test Acc 0.973463687150838:
18th- epoch: 74, train_loss = 4.212777498178184, train_acc = 0.9917326502095948
test Acc 0.973463687150838:
18th- epoch: 75, train_loss = 4.175179521553218, train_acc = 0.9917326502095948
test Acc 0.973463687150838:
18th- epoch: 76, train_loss = 4.1365630105137825, train_acc = 0.9917326502095948
test Acc 0.973463687150838:
18th- epoch: 77, train_loss = 4.096885221544653, train_acc = 0.9917326502095948
test Acc 0.9739292364990689:
18th- epoch: 78, train_loss = 4.061061445157975, train_acc = 0.9919655333022822
test Acc 0.9739292364990689:
18th- epoch: 79, train_loss = 4.025885900482535, train_acc = 0.9919655333022822
test Acc 0.9739292364990689:
18th- epoch: 80, train_loss = 3.99035463668406, train_acc = 0.9919655333022822
test Acc 0.97392923649906

18th- epoch: 220, train_loss = 2.1823559310287237, train_acc = 0.9948765719608756
test Acc 0.979050279329609:
18th- epoch: 221, train_loss = 2.177961279405281, train_acc = 0.9948765719608756
test Acc 0.9795158286778398:
18th- epoch: 222, train_loss = 2.1730136293917894, train_acc = 0.9948765719608756
test Acc 0.979050279329609:
18th- epoch: 223, train_loss = 2.16832279227674, train_acc = 0.9948765719608756
test Acc 0.979050279329609:
18th- epoch: 224, train_loss = 2.1645342633128166, train_acc = 0.9948765719608756
test Acc 0.979050279329609:
18th- epoch: 225, train_loss = 2.1599502004683018, train_acc = 0.9948765719608756
test Acc 0.979050279329609:
18th- epoch: 226, train_loss = 2.1553257156629115, train_acc = 0.9948765719608756
test Acc 0.979050279329609:
18th- epoch: 227, train_loss = 2.1511114209424704, train_acc = 0.9948765719608756
test Acc 0.979050279329609:
18th- epoch: 228, train_loss = 2.146159475669265, train_acc = 0.9948765719608756
test Acc 0.979050279329609:
18th- epoch: 

18th- epoch: 368, train_loss = 1.7876598400762305, train_acc = 0.995575221238938
test Acc 0.9804469273743017:
18th- epoch: 369, train_loss = 1.7871498676249757, train_acc = 0.9956916627852818
test Acc 0.9804469273743017:
18th- epoch: 370, train_loss = 1.784590574563481, train_acc = 0.9956916627852818
test Acc 0.9799813780260708:
18th- epoch: 371, train_loss = 1.783654714585282, train_acc = 0.9956916627852818
test Acc 0.9804469273743017:
18th- epoch: 372, train_loss = 1.782126173377037, train_acc = 0.9956916627852818
test Acc 0.9799813780260708:
18th- epoch: 373, train_loss = 1.7805589586496353, train_acc = 0.9956916627852818
test Acc 0.9804469273743017:
18th- epoch: 374, train_loss = 1.7793149253120646, train_acc = 0.995575221238938
test Acc 0.9799813780260708:
18th- epoch: 375, train_loss = 1.7769508747151121, train_acc = 0.995575221238938
test Acc 0.9804469273743017:
18th- epoch: 376, train_loss = 1.776249684393406, train_acc = 0.995575221238938
test Acc 0.9799813780260708:
18th- epo

 60%|██████████████████████████████████████████                            | 18/30 [2:42:56<1:48:28, 542.36s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
19th- epoch: 0, train_loss = 117.58458161354065, train_acc = 0.7876106194690266
test Acc 0.8780260707635009:
19th- epoch: 1, train_loss = 40.73934967070818, train_acc = 0.916394969725198
test Acc 0.914804469273743:
19th- epoch: 2, train_loss = 30.69610169157386, train_acc = 0.9368886818816954
test Acc 0.9366852886405959:
19th- epoch: 3, train_loss = 25.680314112454653, train_acc = 0.9455053563111319
test Acc 0.9487895716945997:
19th- epoch: 4, train_loss = 22.459307048469782, train_acc = 0.9535398230088495
test Acc 0.952513966480447:
19th- epoch: 5, train_loss = 20.139185670763254, train_acc = 0.959245458779692

19th- epoch: 146, train_loss = 2.6319450507871807, train_acc = 0.994294364229157
test Acc 0.9739292364990689:
19th- epoch: 147, train_loss = 2.621859449893236, train_acc = 0.994294364229157
test Acc 0.9739292364990689:
19th- epoch: 148, train_loss = 2.61210198700428, train_acc = 0.994294364229157
test Acc 0.9739292364990689:
19th- epoch: 149, train_loss = 2.6016353801824152, train_acc = 0.994294364229157
test Acc 0.9739292364990689:
19th- epoch: 150, train_loss = 2.5916046504862607, train_acc = 0.994294364229157
test Acc 0.9739292364990689:
19th- epoch: 151, train_loss = 2.5814730445854366, train_acc = 0.994294364229157
test Acc 0.9739292364990689:
19th- epoch: 152, train_loss = 2.5733328387141228, train_acc = 0.994294364229157
test Acc 0.9739292364990689:
19th- epoch: 153, train_loss = 2.5628902222961187, train_acc = 0.994294364229157
test Acc 0.973463687150838:
19th- epoch: 154, train_loss = 2.5545567921362817, train_acc = 0.994294364229157
test Acc 0.9739292364990689:
19th- epoch: 1

19th- epoch: 294, train_loss = 1.8937126602977514, train_acc = 0.9956916627852818
test Acc 0.9771880819366853:
19th- epoch: 295, train_loss = 1.8913306307513267, train_acc = 0.9956916627852818
test Acc 0.9767225325884544:
19th- epoch: 296, train_loss = 1.8887189235538244, train_acc = 0.9958081043316255
test Acc 0.9771880819366853:
19th- epoch: 297, train_loss = 1.8864609103184193, train_acc = 0.9956916627852818
test Acc 0.9771880819366853:
19th- epoch: 298, train_loss = 1.8841404486447573, train_acc = 0.9956916627852818
test Acc 0.9771880819366853:
19th- epoch: 299, train_loss = 1.883016686886549, train_acc = 0.996040987424313
test Acc 0.9767225325884544:
19th- epoch: 300, train_loss = 1.8805820010602474, train_acc = 0.9956916627852818
test Acc 0.9767225325884544:
19th- epoch: 301, train_loss = 1.8788464639801532, train_acc = 0.9956916627852818
test Acc 0.9767225325884544:
19th- epoch: 302, train_loss = 1.8759446367621422, train_acc = 0.9958081043316255
test Acc 0.9767225325884544:
19t

19th- epoch: 442, train_loss = 1.6868023164570332, train_acc = 0.996040987424313
test Acc 0.9776536312849162:
19th- epoch: 443, train_loss = 1.684693654999137, train_acc = 0.996040987424313
test Acc 0.9776536312849162:
19th- epoch: 444, train_loss = 1.6862246226519346, train_acc = 0.996040987424313
test Acc 0.9776536312849162:
19th- epoch: 445, train_loss = 1.6812780313193798, train_acc = 0.996040987424313
test Acc 0.9776536312849162:
19th- epoch: 446, train_loss = 1.6842350885272026, train_acc = 0.996040987424313
test Acc 0.9776536312849162:
19th- epoch: 447, train_loss = 1.6817276161164045, train_acc = 0.996040987424313
test Acc 0.9776536312849162:
19th- epoch: 448, train_loss = 1.6806141367414966, train_acc = 0.996040987424313
test Acc 0.9776536312849162:
19th- epoch: 449, train_loss = 1.6810394786298275, train_acc = 0.996040987424313
test Acc 0.9776536312849162:
19th- epoch: 450, train_loss = 1.679436138481833, train_acc = 0.996040987424313
test Acc 0.9776536312849162:
19th- epoch:

 63%|████████████████████████████████████████████▎                         | 19/30 [2:51:59<1:39:27, 542.49s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
20th- epoch: 0, train_loss = 107.36397568881512, train_acc = 0.8013507219375874
test Acc 0.888268156424581:
20th- epoch: 1, train_loss = 42.203599989414215, train_acc = 0.917675826734979
test Acc 0.9250465549348231:
20th- epoch: 2, train_loss = 32.109659399837255, train_acc = 0.9382859804378202
test Acc 0.9366852886405959:
20th- epoch: 3, train_loss = 27.141545340418816, train_acc = 0.9466697717745691
test Acc 0.9441340782122905:
20th- epoch: 4, train_loss = 23.94090372696519, train_acc = 0.9523754075454122
test Acc 0.946927374301676:
20th- epoch: 5, train_loss = 21.569679617881775, train_acc = 0.95598509548206

20th- epoch: 145, train_loss = 2.4818897782824934, train_acc = 0.994294364229157
test Acc 0.9716014897579144:
20th- epoch: 146, train_loss = 2.471565742045641, train_acc = 0.994294364229157
test Acc 0.9716014897579144:
20th- epoch: 147, train_loss = 2.4620795238297433, train_acc = 0.994294364229157
test Acc 0.9716014897579144:
20th- epoch: 148, train_loss = 2.4544788636267185, train_acc = 0.994294364229157
test Acc 0.9716014897579144:
20th- epoch: 149, train_loss = 2.4465412236750126, train_acc = 0.994294364229157
test Acc 0.9716014897579144:
20th- epoch: 150, train_loss = 2.4376231159549206, train_acc = 0.994294364229157
test Acc 0.9720670391061452:
20th- epoch: 151, train_loss = 2.4314804561436176, train_acc = 0.994294364229157
test Acc 0.9716014897579144:
20th- epoch: 152, train_loss = 2.4215122424066067, train_acc = 0.994294364229157
test Acc 0.9716014897579144:
20th- epoch: 153, train_loss = 2.4139825317543, train_acc = 0.994294364229157
test Acc 0.9720670391061452:
20th- epoch: 1

test Acc 0.9753258845437617:
20th- epoch: 293, train_loss = 1.848820373415947, train_acc = 0.9953423381462506
test Acc 0.9753258845437617:
20th- epoch: 294, train_loss = 1.8468580655753613, train_acc = 0.9952258965999069
test Acc 0.9753258845437617:
20th- epoch: 295, train_loss = 1.8449668859830126, train_acc = 0.9952258965999069
test Acc 0.9753258845437617:
20th- epoch: 296, train_loss = 1.8434042694279924, train_acc = 0.9952258965999069
test Acc 0.9753258845437617:
20th- epoch: 297, train_loss = 1.8419874062528834, train_acc = 0.9952258965999069
test Acc 0.9753258845437617:
20th- epoch: 298, train_loss = 1.839060957194306, train_acc = 0.9952258965999069
test Acc 0.9753258845437617:
20th- epoch: 299, train_loss = 1.8374100787332281, train_acc = 0.9952258965999069
test Acc 0.9753258845437617:
20th- epoch: 300, train_loss = 1.8362320624291897, train_acc = 0.9952258965999069
test Acc 0.9753258845437617:
20th- epoch: 301, train_loss = 1.833734324784018, train_acc = 0.9952258965999069
test

test Acc 0.9767225325884544:
20th- epoch: 440, train_loss = 1.6598260464379564, train_acc = 0.9952258965999069
test Acc 0.9767225325884544:
20th- epoch: 441, train_loss = 1.6568011516937986, train_acc = 0.9952258965999069
test Acc 0.9767225325884544:
20th- epoch: 442, train_loss = 1.6583757748594508, train_acc = 0.9952258965999069
test Acc 0.9767225325884544:
20th- epoch: 443, train_loss = 1.6559127556975, train_acc = 0.9952258965999069
test Acc 0.9767225325884544:
20th- epoch: 444, train_loss = 1.6567450339207426, train_acc = 0.9952258965999069
test Acc 0.9767225325884544:
20th- epoch: 445, train_loss = 1.654987913905643, train_acc = 0.9952258965999069
test Acc 0.9767225325884544:
20th- epoch: 446, train_loss = 1.6534630171954632, train_acc = 0.9952258965999069
test Acc 0.9767225325884544:
20th- epoch: 447, train_loss = 1.6542503970558755, train_acc = 0.9952258965999069
test Acc 0.9767225325884544:
20th- epoch: 448, train_loss = 1.6529349039192311, train_acc = 0.9952258965999069
test 

 67%|██████████████████████████████████████████████▋                       | 20/30 [3:01:02<1:30:28, 542.83s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
21th- epoch: 0, train_loss = 110.43031527101994, train_acc = 0.7945971122496507
test Acc 0.8873370577281192:
21th- epoch: 1, train_loss = 41.552692510187626, train_acc = 0.9127852817885421
test Acc 0.9185288640595903:
21th- epoch: 2, train_loss = 31.026623107492924, train_acc = 0.9344434094084769
test Acc 0.9338919925512105:
21th- epoch: 3, train_loss = 25.79345501586795, train_acc = 0.9445738239403819
test Acc 0.9385474860335196:
21th- epoch: 4, train_loss = 22.493091087788343, train_acc = 0.9519096413600373
test Acc 0.9455307262569832:
21th- epoch: 5, train_loss = 20.160108730196953, train_acc = 0.95714951094

test Acc 0.9716014897579144:
21th- epoch: 72, train_loss = 4.253647996578366, train_acc = 0.9919655333022822
test Acc 0.9716014897579144:
21th- epoch: 73, train_loss = 4.214005928486586, train_acc = 0.9919655333022822
test Acc 0.9716014897579144:
21th- epoch: 74, train_loss = 4.1793333776295185, train_acc = 0.9918490917559385
test Acc 0.9716014897579144:
21th- epoch: 75, train_loss = 4.145205980632454, train_acc = 0.992081974848626
test Acc 0.9716014897579144:
21th- epoch: 76, train_loss = 4.109111322555691, train_acc = 0.9921984163949698
test Acc 0.9720670391061452:
21th- epoch: 77, train_loss = 4.077350323554128, train_acc = 0.9923148579413135
test Acc 0.9716014897579144:
21th- epoch: 78, train_loss = 4.045316537376493, train_acc = 0.9921984163949698
test Acc 0.9716014897579144:
21th- epoch: 79, train_loss = 4.012383708264679, train_acc = 0.9921984163949698
test Acc 0.9720670391061452:
21th- epoch: 80, train_loss = 3.978924347553402, train_acc = 0.9921984163949698
test Acc 0.97206703

21th- epoch: 220, train_loss = 2.1946053069550544, train_acc = 0.9946436888681882
test Acc 0.9776536312849162:
21th- epoch: 221, train_loss = 2.1892102647107095, train_acc = 0.9947601304145319
test Acc 0.9776536312849162:
21th- epoch: 222, train_loss = 2.1847094867844135, train_acc = 0.9947601304145319
test Acc 0.9776536312849162:
21th- epoch: 223, train_loss = 2.182368958950974, train_acc = 0.9947601304145319
test Acc 0.9776536312849162:
21th- epoch: 224, train_loss = 2.1751686421921477, train_acc = 0.9947601304145319
test Acc 0.9776536312849162:
21th- epoch: 225, train_loss = 2.171414560289122, train_acc = 0.9947601304145319
test Acc 0.9776536312849162:
21th- epoch: 226, train_loss = 2.167781097232364, train_acc = 0.9947601304145319
test Acc 0.9776536312849162:
21th- epoch: 227, train_loss = 2.163439535885118, train_acc = 0.9947601304145319
test Acc 0.9776536312849162:
21th- epoch: 228, train_loss = 2.159347388893366, train_acc = 0.9947601304145319
test Acc 0.9776536312849162:
21th- 

21th- epoch: 368, train_loss = 1.8036297857761383, train_acc = 0.9951094550535631
test Acc 0.979050279329609:
21th- epoch: 369, train_loss = 1.8011256257886998, train_acc = 0.9951094550535631
test Acc 0.979050279329609:
21th- epoch: 370, train_loss = 1.8003078338806517, train_acc = 0.9951094550535631
test Acc 0.979050279329609:
21th- epoch: 371, train_loss = 1.7969872181420214, train_acc = 0.9951094550535631
test Acc 0.979050279329609:
21th- epoch: 372, train_loss = 1.7965428816969506, train_acc = 0.9951094550535631
test Acc 0.979050279329609:
21th- epoch: 373, train_loss = 1.7946903457050212, train_acc = 0.9951094550535631
test Acc 0.979050279329609:
21th- epoch: 374, train_loss = 1.7934427348081954, train_acc = 0.9951094550535631
test Acc 0.979050279329609:
21th- epoch: 375, train_loss = 1.7920304710860364, train_acc = 0.9951094550535631
test Acc 0.979050279329609:
21th- epoch: 376, train_loss = 1.7910394345526583, train_acc = 0.9951094550535631
test Acc 0.979050279329609:
21th- epoc

 70%|█████████████████████████████████████████████████                     | 21/30 [3:10:06<1:21:26, 542.99s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
22th- epoch: 0, train_loss = 127.25541940331459, train_acc = 0.7833022822543083
test Acc 0.8896648044692738:
22th- epoch: 1, train_loss = 41.436591789126396, train_acc = 0.9125523986958547
test Acc 0.9264432029795159:
22th- epoch: 2, train_loss = 31.89788932353258, train_acc = 0.9330461108523521
test Acc 0.9380819366852886:
22th- epoch: 3, train_loss = 26.990378618240356, train_acc = 0.9450395901257569
test Acc 0.9450651769087524:
22th- epoch: 4, train_loss = 23.791397362947464, train_acc = 0.9527247321844434
test Acc 0.946927374301676:
22th- epoch: 5, train_loss = 21.443966504186392, train_acc = 0.956217978574

22th- epoch: 146, train_loss = 2.7528040683828294, train_acc = 0.994294364229157
test Acc 0.9739292364990689:
22th- epoch: 147, train_loss = 2.7407927089370787, train_acc = 0.994294364229157
test Acc 0.9743947858472998:
22th- epoch: 148, train_loss = 2.730351862963289, train_acc = 0.9945272473218444
test Acc 0.9743947858472998:
22th- epoch: 149, train_loss = 2.7199945971369743, train_acc = 0.9945272473218444
test Acc 0.9739292364990689:
22th- epoch: 150, train_loss = 2.709352082107216, train_acc = 0.9945272473218444
test Acc 0.9743947858472998:
22th- epoch: 151, train_loss = 2.6985366553999484, train_acc = 0.9945272473218444
test Acc 0.9743947858472998:
22th- epoch: 152, train_loss = 2.6880122958682477, train_acc = 0.9945272473218444
test Acc 0.9743947858472998:
22th- epoch: 153, train_loss = 2.6783095449209213, train_acc = 0.9945272473218444
test Acc 0.9739292364990689:
22th- epoch: 154, train_loss = 2.6679785600863397, train_acc = 0.9945272473218444
test Acc 0.9739292364990689:
22th-

22th- epoch: 294, train_loss = 1.9405000668484718, train_acc = 0.9954587796925943
test Acc 0.9767225325884544:
22th- epoch: 295, train_loss = 1.9373343139886856, train_acc = 0.9954587796925943
test Acc 0.9767225325884544:
22th- epoch: 296, train_loss = 1.9348243947606534, train_acc = 0.9954587796925943
test Acc 0.9767225325884544:
22th- epoch: 297, train_loss = 1.9320394929964095, train_acc = 0.9954587796925943
test Acc 0.9767225325884544:
22th- epoch: 298, train_loss = 1.9296163630206138, train_acc = 0.9954587796925943
test Acc 0.9767225325884544:
22th- epoch: 299, train_loss = 1.9278019380290061, train_acc = 0.9954587796925943
test Acc 0.9767225325884544:
22th- epoch: 300, train_loss = 1.9247318606358021, train_acc = 0.9954587796925943
test Acc 0.9767225325884544:
22th- epoch: 301, train_loss = 1.9219792920630425, train_acc = 0.9954587796925943
test Acc 0.9767225325884544:
22th- epoch: 302, train_loss = 1.9198753561358899, train_acc = 0.9954587796925943
test Acc 0.9767225325884544:
2

22th- epoch: 442, train_loss = 1.6946210836758837, train_acc = 0.9956916627852818
test Acc 0.9771880819366853:
22th- epoch: 443, train_loss = 1.6939850188791752, train_acc = 0.995575221238938
test Acc 0.9771880819366853:
22th- epoch: 444, train_loss = 1.693190272897482, train_acc = 0.995575221238938
test Acc 0.9771880819366853:
22th- epoch: 445, train_loss = 1.6922290349612013, train_acc = 0.9956916627852818
test Acc 0.9771880819366853:
22th- epoch: 446, train_loss = 1.6909566335380077, train_acc = 0.9956916627852818
test Acc 0.9771880819366853:
22th- epoch: 447, train_loss = 1.6896607974776998, train_acc = 0.9956916627852818
test Acc 0.9771880819366853:
22th- epoch: 448, train_loss = 1.6891521997749805, train_acc = 0.995575221238938
test Acc 0.9771880819366853:
22th- epoch: 449, train_loss = 1.6876268349587917, train_acc = 0.9956916627852818
test Acc 0.9771880819366853:
22th- epoch: 450, train_loss = 1.6870528906583786, train_acc = 0.9956916627852818
test Acc 0.9771880819366853:
22th-

 73%|███████████████████████████████████████████████████▎                  | 22/30 [3:19:08<1:12:21, 542.75s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
23th- epoch: 0, train_loss = 109.25575223565102, train_acc = 0.7898230088495575
test Acc 0.8943202979515829:
23th- epoch: 1, train_loss = 38.82944169640541, train_acc = 0.9201210992081975
test Acc 0.9324953445065177:
23th- epoch: 2, train_loss = 29.855571269989014, train_acc = 0.9384024219841639
test Acc 0.9450651769087524:
23th- epoch: 3, train_loss = 25.114335767924786, train_acc = 0.9487657196087564
test Acc 0.9487895716945997:
23th- epoch: 4, train_loss = 22.092435907572508, train_acc = 0.9537727061015371
test Acc 0.9534450651769087:
23th- epoch: 5, train_loss = 19.964155431836843, train_acc = 0.95889613414

23th- epoch: 146, train_loss = 2.5856284820474684, train_acc = 0.9946436888681882
test Acc 0.9771880819366853:
23th- epoch: 147, train_loss = 2.5763452700339258, train_acc = 0.9946436888681882
test Acc 0.9771880819366853:
23th- epoch: 148, train_loss = 2.5660915463231504, train_acc = 0.9946436888681882
test Acc 0.9771880819366853:
23th- epoch: 149, train_loss = 2.5560822202824056, train_acc = 0.9946436888681882
test Acc 0.9771880819366853:
23th- epoch: 150, train_loss = 2.5462430850602686, train_acc = 0.9946436888681882
test Acc 0.9771880819366853:
23th- epoch: 151, train_loss = 2.5365845165215433, train_acc = 0.9946436888681882
test Acc 0.9771880819366853:
23th- epoch: 152, train_loss = 2.5267711258493364, train_acc = 0.9946436888681882
test Acc 0.9771880819366853:
23th- epoch: 153, train_loss = 2.5183169059455395, train_acc = 0.9946436888681882
test Acc 0.9771880819366853:
23th- epoch: 154, train_loss = 2.5084218927659094, train_acc = 0.9946436888681882
test Acc 0.9771880819366853:
2

23th- epoch: 294, train_loss = 1.87179436290171, train_acc = 0.9956916627852818
test Acc 0.9795158286778398:
23th- epoch: 295, train_loss = 1.8696949208388105, train_acc = 0.9956916627852818
test Acc 0.9795158286778398:
23th- epoch: 296, train_loss = 1.8675157862016931, train_acc = 0.9956916627852818
test Acc 0.9795158286778398:
23th- epoch: 297, train_loss = 1.8657194724073634, train_acc = 0.9956916627852818
test Acc 0.9795158286778398:
23th- epoch: 298, train_loss = 1.8633802197873592, train_acc = 0.9956916627852818
test Acc 0.9795158286778398:
23th- epoch: 299, train_loss = 1.8613786734640598, train_acc = 0.9956916627852818
test Acc 0.9795158286778398:
23th- epoch: 300, train_loss = 1.8590337919304147, train_acc = 0.9956916627852818
test Acc 0.9795158286778398:
23th- epoch: 301, train_loss = 1.8568451404571533, train_acc = 0.9956916627852818
test Acc 0.9795158286778398:
23th- epoch: 302, train_loss = 1.854660471319221, train_acc = 0.9956916627852818
test Acc 0.9795158286778398:
23th

23th- epoch: 442, train_loss = 1.6636148926918395, train_acc = 0.995575221238938
test Acc 0.9809124767225326:
23th- epoch: 443, train_loss = 1.66292404133128, train_acc = 0.995575221238938
test Acc 0.9809124767225326:
23th- epoch: 444, train_loss = 1.6618044252390973, train_acc = 0.995575221238938
test Acc 0.9809124767225326:
23th- epoch: 445, train_loss = 1.6616344600915909, train_acc = 0.995575221238938
test Acc 0.9809124767225326:
23th- epoch: 446, train_loss = 1.6605744386906736, train_acc = 0.995575221238938
test Acc 0.9809124767225326:
23th- epoch: 447, train_loss = 1.6591839988832362, train_acc = 0.995575221238938
test Acc 0.9809124767225326:
23th- epoch: 448, train_loss = 1.6591676485841163, train_acc = 0.995575221238938
test Acc 0.9809124767225326:
23th- epoch: 449, train_loss = 1.657645344734192, train_acc = 0.995575221238938
test Acc 0.9809124767225326:
23th- epoch: 450, train_loss = 1.6569979998166673, train_acc = 0.995575221238938
test Acc 0.9809124767225326:
23th- epoch: 

 77%|█████████████████████████████████████████████████████▋                | 23/30 [3:28:12<1:03:22, 543.21s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
24th- epoch: 0, train_loss = 115.67594040930271, train_acc = 0.7980903586399627
test Acc 0.8803538175046555:
24th- epoch: 1, train_loss = 41.58495197445154, train_acc = 0.9155798789007918
test Acc 0.9264432029795159:
24th- epoch: 2, train_loss = 32.41995342820883, train_acc = 0.9351420586865393
test Acc 0.9385474860335196:
24th- epoch: 3, train_loss = 27.419733971357346, train_acc = 0.9450395901257569
test Acc 0.9422718808193669:
24th- epoch: 4, train_loss = 24.178152836859226, train_acc = 0.9513274336283186
test Acc 0.9445996275605214:
24th- epoch: 5, train_loss = 21.803983449935913, train_acc = 0.956334420121

24th- epoch: 146, train_loss = 2.6793954796157777, train_acc = 0.9944108057755007
test Acc 0.9767225325884544:
24th- epoch: 147, train_loss = 2.670158388558775, train_acc = 0.9944108057755007
test Acc 0.9767225325884544:
24th- epoch: 148, train_loss = 2.6599581777118146, train_acc = 0.9944108057755007
test Acc 0.9767225325884544:
24th- epoch: 149, train_loss = 2.6499984660185874, train_acc = 0.9944108057755007
test Acc 0.9767225325884544:
24th- epoch: 150, train_loss = 2.6400739825330675, train_acc = 0.9944108057755007
test Acc 0.9767225325884544:
24th- epoch: 151, train_loss = 2.628752063959837, train_acc = 0.994294364229157
test Acc 0.9767225325884544:
24th- epoch: 152, train_loss = 2.6208623819984496, train_acc = 0.9945272473218444
test Acc 0.9767225325884544:
24th- epoch: 153, train_loss = 2.6118332147598267, train_acc = 0.9944108057755007
test Acc 0.9767225325884544:
24th- epoch: 154, train_loss = 2.6018829247914255, train_acc = 0.9945272473218444
test Acc 0.9767225325884544:
24th

24th- epoch: 294, train_loss = 1.9393752452451736, train_acc = 0.9953423381462506
test Acc 0.9776536312849162:
24th- epoch: 295, train_loss = 1.9375120352488011, train_acc = 0.9953423381462506
test Acc 0.9776536312849162:
24th- epoch: 296, train_loss = 1.934870906174183, train_acc = 0.9954587796925943
test Acc 0.9776536312849162:
24th- epoch: 297, train_loss = 1.932315896032378, train_acc = 0.9954587796925943
test Acc 0.9776536312849162:
24th- epoch: 298, train_loss = 1.9308877040166408, train_acc = 0.9953423381462506
test Acc 0.9776536312849162:
24th- epoch: 299, train_loss = 1.9269985891878605, train_acc = 0.9953423381462506
test Acc 0.9776536312849162:
24th- epoch: 300, train_loss = 1.9261521324515343, train_acc = 0.9953423381462506
test Acc 0.9776536312849162:
24th- epoch: 301, train_loss = 1.9239712941925973, train_acc = 0.9953423381462506
test Acc 0.9776536312849162:
24th- epoch: 302, train_loss = 1.9199030336458236, train_acc = 0.9953423381462506
test Acc 0.9776536312849162:
24t

24th- epoch: 442, train_loss = 1.7199011308839545, train_acc = 0.9954587796925943
test Acc 0.9776536312849162:
24th- epoch: 443, train_loss = 1.7217865189304575, train_acc = 0.9954587796925943
test Acc 0.9776536312849162:
24th- epoch: 444, train_loss = 1.7197018414735794, train_acc = 0.9954587796925943
test Acc 0.9776536312849162:
24th- epoch: 445, train_loss = 1.7207170004257932, train_acc = 0.9954587796925943
test Acc 0.9776536312849162:
24th- epoch: 446, train_loss = 1.7175665870308876, train_acc = 0.995575221238938
test Acc 0.9776536312849162:
24th- epoch: 447, train_loss = 1.7179810479283333, train_acc = 0.9954587796925943
test Acc 0.9776536312849162:
24th- epoch: 448, train_loss = 1.7182172226021066, train_acc = 0.9954587796925943
test Acc 0.9776536312849162:
24th- epoch: 449, train_loss = 1.7145177138736472, train_acc = 0.9954587796925943
test Acc 0.9776536312849162:
24th- epoch: 450, train_loss = 1.7161248413613066, train_acc = 0.9954587796925943
test Acc 0.9776536312849162:
24

 80%|█████████████████████████████████████████████████████████▌              | 24/30 [3:37:15<54:18, 543.05s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
25th- epoch: 0, train_loss = 118.49549621343613, train_acc = 0.7829529576152772
test Acc 0.8868715083798883:
25th- epoch: 1, train_loss = 41.95682406425476, train_acc = 0.912435957149511
test Acc 0.9213221601489758:
25th- epoch: 2, train_loss = 31.697894111275673, train_acc = 0.9356078248719143
test Acc 0.9334264432029795:
25th- epoch: 3, train_loss = 26.726380087435246, train_acc = 0.944108057755007
test Acc 0.9445996275605214:
25th- epoch: 4, train_loss = 23.548087805509567, train_acc = 0.9505123428039124
test Acc 0.9455307262569832:
25th- epoch: 5, train_loss = 21.275924049317837, train_acc = 0.9562179785747

25th- epoch: 146, train_loss = 2.680503983050585, train_acc = 0.9947601304145319
test Acc 0.9799813780260708:
25th- epoch: 147, train_loss = 2.6698115677572787, train_acc = 0.9948765719608756
test Acc 0.9799813780260708:
25th- epoch: 148, train_loss = 2.6598206856288016, train_acc = 0.9948765719608756
test Acc 0.9799813780260708:
25th- epoch: 149, train_loss = 2.649536664132029, train_acc = 0.9948765719608756
test Acc 0.9799813780260708:
25th- epoch: 150, train_loss = 2.6396986418403685, train_acc = 0.9948765719608756
test Acc 0.9799813780260708:
25th- epoch: 151, train_loss = 2.6287575736641884, train_acc = 0.9949930135072194
test Acc 0.9799813780260708:
25th- epoch: 152, train_loss = 2.6176086864434183, train_acc = 0.9949930135072194
test Acc 0.9799813780260708:
25th- epoch: 153, train_loss = 2.6089953198097646, train_acc = 0.9949930135072194
test Acc 0.9799813780260708:
25th- epoch: 154, train_loss = 2.6003975444473326, train_acc = 0.9949930135072194
test Acc 0.9799813780260708:
25t

25th- epoch: 294, train_loss = 1.923717355937697, train_acc = 0.995575221238938
test Acc 0.9809124767225326:
25th- epoch: 295, train_loss = 1.9221345596015453, train_acc = 0.995575221238938
test Acc 0.9809124767225326:
25th- epoch: 296, train_loss = 1.9201545976102352, train_acc = 0.995575221238938
test Acc 0.9809124767225326:
25th- epoch: 297, train_loss = 1.916237000375986, train_acc = 0.995575221238938
test Acc 0.9809124767225326:
25th- epoch: 298, train_loss = 1.9144454872002825, train_acc = 0.995575221238938
test Acc 0.9809124767225326:
25th- epoch: 299, train_loss = 1.9135789138963446, train_acc = 0.995575221238938
test Acc 0.9809124767225326:
25th- epoch: 300, train_loss = 1.9110078947851434, train_acc = 0.995575221238938
test Acc 0.9804469273743017:
25th- epoch: 301, train_loss = 1.9099828811595216, train_acc = 0.995575221238938
test Acc 0.9809124767225326:
25th- epoch: 302, train_loss = 1.90576631820295, train_acc = 0.995575221238938
test Acc 0.9804469273743017:
25th- epoch: 3

25th- epoch: 442, train_loss = 1.69966197386384, train_acc = 0.995575221238938
test Acc 0.9813780260707635:
25th- epoch: 443, train_loss = 1.6991896380786784, train_acc = 0.995575221238938
test Acc 0.9813780260707635:
25th- epoch: 444, train_loss = 1.6972633649711497, train_acc = 0.995575221238938
test Acc 0.9813780260707635:
25th- epoch: 445, train_loss = 1.695201129943598, train_acc = 0.995575221238938
test Acc 0.9813780260707635:
25th- epoch: 446, train_loss = 1.6966169203515165, train_acc = 0.995575221238938
test Acc 0.9813780260707635:
25th- epoch: 447, train_loss = 1.6950163133442402, train_acc = 0.995575221238938
test Acc 0.9813780260707635:
25th- epoch: 448, train_loss = 1.6945678529446013, train_acc = 0.995575221238938
test Acc 0.9813780260707635:
25th- epoch: 449, train_loss = 1.6937149427831173, train_acc = 0.995575221238938
test Acc 0.9813780260707635:
25th- epoch: 450, train_loss = 1.6919883911614306, train_acc = 0.995575221238938
test Acc 0.9813780260707635:
25th- epoch: 

 83%|████████████████████████████████████████████████████████████            | 25/30 [3:46:18<45:15, 543.14s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
26th- epoch: 0, train_loss = 119.70763616263866, train_acc = 0.7822543083372148
test Acc 0.8943202979515829:
26th- epoch: 1, train_loss = 41.11606873571873, train_acc = 0.9130181648812297
test Acc 0.9269087523277467:
26th- epoch: 2, train_loss = 31.312080889940262, train_acc = 0.9350256171401956
test Acc 0.9390130353817505:
26th- epoch: 3, train_loss = 26.31152194365859, train_acc = 0.9459711224965067
test Acc 0.9441340782122905:
26th- epoch: 4, train_loss = 23.13976438343525, train_acc = 0.9544713553795995
test Acc 0.9473929236499069:
26th- epoch: 5, train_loss = 20.88550717383623, train_acc = 0.95912901723334

26th- epoch: 146, train_loss = 2.708770605735481, train_acc = 0.9948765719608756
test Acc 0.9757914338919925:
26th- epoch: 147, train_loss = 2.6975754532031715, train_acc = 0.9948765719608756
test Acc 0.9757914338919925:
26th- epoch: 148, train_loss = 2.686595858540386, train_acc = 0.9948765719608756
test Acc 0.9757914338919925:
26th- epoch: 149, train_loss = 2.6781536391936243, train_acc = 0.9948765719608756
test Acc 0.9757914338919925:
26th- epoch: 150, train_loss = 2.667184815276414, train_acc = 0.9949930135072194
test Acc 0.9757914338919925:
26th- epoch: 151, train_loss = 2.6581034823320806, train_acc = 0.9949930135072194
test Acc 0.9757914338919925:
26th- epoch: 152, train_loss = 2.647219069302082, train_acc = 0.9949930135072194
test Acc 0.9757914338919925:
26th- epoch: 153, train_loss = 2.6374504901468754, train_acc = 0.9949930135072194
test Acc 0.9757914338919925:
26th- epoch: 154, train_loss = 2.6279850411228836, train_acc = 0.9949930135072194
test Acc 0.9757914338919925:
26th-

26th- epoch: 294, train_loss = 1.9327155041974038, train_acc = 0.9954587796925943
test Acc 0.9795158286778398:
26th- epoch: 295, train_loss = 1.9299868121743202, train_acc = 0.9954587796925943
test Acc 0.9795158286778398:
26th- epoch: 296, train_loss = 1.9257904954720289, train_acc = 0.9954587796925943
test Acc 0.9795158286778398:
26th- epoch: 297, train_loss = 1.9220994014758617, train_acc = 0.9954587796925943
test Acc 0.9795158286778398:
26th- epoch: 298, train_loss = 1.9219695150386542, train_acc = 0.9954587796925943
test Acc 0.9795158286778398:
26th- epoch: 299, train_loss = 1.9180691551882774, train_acc = 0.9954587796925943
test Acc 0.9795158286778398:
26th- epoch: 300, train_loss = 1.9171248581260443, train_acc = 0.9954587796925943
test Acc 0.9795158286778398:
26th- epoch: 301, train_loss = 1.914406333817169, train_acc = 0.9954587796925943
test Acc 0.9795158286778398:
26th- epoch: 302, train_loss = 1.912570035085082, train_acc = 0.9954587796925943
test Acc 0.9795158286778398:
26t

test Acc 0.9804469273743017:
26th- epoch: 442, train_loss = 1.6993495660135522, train_acc = 0.9956916627852818
test Acc 0.9804469273743017:
26th- epoch: 443, train_loss = 1.6976574026048183, train_acc = 0.9956916627852818
test Acc 0.9804469273743017:
26th- epoch: 444, train_loss = 1.6972728198161349, train_acc = 0.9956916627852818
test Acc 0.9804469273743017:
26th- epoch: 445, train_loss = 1.696209855377674, train_acc = 0.9956916627852818
test Acc 0.9804469273743017:
26th- epoch: 446, train_loss = 1.6953512094914913, train_acc = 0.9956916627852818
test Acc 0.9804469273743017:
26th- epoch: 447, train_loss = 1.6942934915423393, train_acc = 0.9956916627852818
test Acc 0.9804469273743017:
26th- epoch: 448, train_loss = 1.6928709720959887, train_acc = 0.9956916627852818
test Acc 0.9804469273743017:
26th- epoch: 449, train_loss = 1.691748229204677, train_acc = 0.9956916627852818
test Acc 0.9804469273743017:
26th- epoch: 450, train_loss = 1.691184226423502, train_acc = 0.9956916627852818
test

 87%|██████████████████████████████████████████████████████████████▍         | 26/30 [3:55:21<36:12, 543.13s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
27th- epoch: 0, train_loss = 107.20833261311054, train_acc = 0.7902887750349324
test Acc 0.8603351955307262:
27th- epoch: 1, train_loss = 40.97393673658371, train_acc = 0.9146483465300419
test Acc 0.8952513966480447:
27th- epoch: 2, train_loss = 31.856340371072292, train_acc = 0.9338612016767582
test Acc 0.9236499068901304:
27th- epoch: 3, train_loss = 26.915815882384777, train_acc = 0.944108057755007
test Acc 0.9376163873370578:
27th- epoch: 4, train_loss = 23.58322962373495, train_acc = 0.9519096413600373
test Acc 0.9432029795158287:
27th- epoch: 5, train_loss = 21.180729515850544, train_acc = 0.9568001863064

27th- epoch: 145, train_loss = 2.7355077392421663, train_acc = 0.9941779226828132
test Acc 0.9776536312849162:
27th- epoch: 146, train_loss = 2.7238217652775347, train_acc = 0.9941779226828132
test Acc 0.9776536312849162:
27th- epoch: 147, train_loss = 2.712434289511293, train_acc = 0.9941779226828132
test Acc 0.9781191806331471:
27th- epoch: 148, train_loss = 2.7020048201084137, train_acc = 0.9941779226828132
test Acc 0.9776536312849162:
27th- epoch: 149, train_loss = 2.6904376335442066, train_acc = 0.9941779226828132
test Acc 0.9781191806331471:
27th- epoch: 150, train_loss = 2.680219101253897, train_acc = 0.9941779226828132
test Acc 0.9781191806331471:
27th- epoch: 151, train_loss = 2.669344112277031, train_acc = 0.9941779226828132
test Acc 0.9781191806331471:
27th- epoch: 152, train_loss = 2.6589065841399133, train_acc = 0.9941779226828132
test Acc 0.9781191806331471:
27th- epoch: 153, train_loss = 2.6485886748414487, train_acc = 0.9941779226828132
test Acc 0.9781191806331471:
27th

27th- epoch: 293, train_loss = 1.927121177315712, train_acc = 0.9952258965999069
test Acc 0.9809124767225326:
27th- epoch: 294, train_loss = 1.9263576393714175, train_acc = 0.9952258965999069
test Acc 0.9809124767225326:
27th- epoch: 295, train_loss = 1.9222658202052116, train_acc = 0.9952258965999069
test Acc 0.9813780260707635:
27th- epoch: 296, train_loss = 1.9206569083034992, train_acc = 0.9952258965999069
test Acc 0.9813780260707635:
27th- epoch: 297, train_loss = 1.9179661398520693, train_acc = 0.9952258965999069
test Acc 0.9813780260707635:
27th- epoch: 298, train_loss = 1.9162435246398672, train_acc = 0.9952258965999069
test Acc 0.9813780260707635:
27th- epoch: 299, train_loss = 1.9133015660336241, train_acc = 0.9952258965999069
test Acc 0.9813780260707635:
27th- epoch: 300, train_loss = 1.910936220199801, train_acc = 0.9952258965999069
test Acc 0.9813780260707635:
27th- epoch: 301, train_loss = 1.9092831885209307, train_acc = 0.9952258965999069
test Acc 0.9813780260707635:
27t

27th- epoch: 440, train_loss = 1.692229013890028, train_acc = 0.9954587796925943
test Acc 0.9809124767225326:
27th- epoch: 441, train_loss = 1.6915498289163224, train_acc = 0.9954587796925943
test Acc 0.9809124767225326:
27th- epoch: 442, train_loss = 1.6906888373196125, train_acc = 0.9954587796925943
test Acc 0.9809124767225326:
27th- epoch: 443, train_loss = 1.6895108471508138, train_acc = 0.9954587796925943
test Acc 0.9809124767225326:
27th- epoch: 444, train_loss = 1.6884255793993361, train_acc = 0.9954587796925943
test Acc 0.9809124767225326:
27th- epoch: 445, train_loss = 1.6883440564270131, train_acc = 0.9954587796925943
test Acc 0.9809124767225326:
27th- epoch: 446, train_loss = 1.6865346257691272, train_acc = 0.9954587796925943
test Acc 0.9809124767225326:
27th- epoch: 447, train_loss = 1.6853536342387088, train_acc = 0.9954587796925943
test Acc 0.9809124767225326:
27th- epoch: 448, train_loss = 1.685012357949745, train_acc = 0.9954587796925943
test Acc 0.9809124767225326:
27t

 90%|████████████████████████████████████████████████████████████████▊       | 27/30 [4:04:25<27:09, 543.28s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
28th- epoch: 0, train_loss = 106.18086077272892, train_acc = 0.7968095016301816
test Acc 0.888733705772812:
28th- epoch: 1, train_loss = 41.29218380898237, train_acc = 0.9161620866325105
test Acc 0.9269087523277467:
28th- epoch: 2, train_loss = 31.784854017198086, train_acc = 0.936655798789008
test Acc 0.9413407821229051:
28th- epoch: 3, train_loss = 26.97260106354952, train_acc = 0.945854680950163
test Acc 0.9441340782122905:
28th- epoch: 4, train_loss = 23.717313654720783, train_acc = 0.9534233814625058
test Acc 0.9497206703910615:
28th- epoch: 5, train_loss = 21.29383822903037, train_acc = 0.9572659524918491

28th- epoch: 146, train_loss = 2.51853974792175, train_acc = 0.9948765719608756
test Acc 0.9767225325884544:
28th- epoch: 147, train_loss = 2.5089298498351127, train_acc = 0.9948765719608756
test Acc 0.9762569832402235:
28th- epoch: 148, train_loss = 2.5013766835909337, train_acc = 0.9949930135072194
test Acc 0.9767225325884544:
28th- epoch: 149, train_loss = 2.4907740615308285, train_acc = 0.9949930135072194
test Acc 0.9762569832402235:
28th- epoch: 150, train_loss = 2.4835911605041474, train_acc = 0.9949930135072194
test Acc 0.9767225325884544:
28th- epoch: 151, train_loss = 2.47420393046923, train_acc = 0.9949930135072194
test Acc 0.9762569832402235:
28th- epoch: 152, train_loss = 2.4661111894529313, train_acc = 0.9949930135072194
test Acc 0.9762569832402235:
28th- epoch: 153, train_loss = 2.4570846781134605, train_acc = 0.9949930135072194
test Acc 0.9762569832402235:
28th- epoch: 154, train_loss = 2.4480806414503604, train_acc = 0.9949930135072194
test Acc 0.9762569832402235:
28th-

28th- epoch: 294, train_loss = 1.8612580312183127, train_acc = 0.9953423381462506
test Acc 0.9781191806331471:
28th- epoch: 295, train_loss = 1.8594742255518213, train_acc = 0.9953423381462506
test Acc 0.9781191806331471:
28th- epoch: 296, train_loss = 1.8577966938028112, train_acc = 0.9953423381462506
test Acc 0.9781191806331471:
28th- epoch: 297, train_loss = 1.8555823663482442, train_acc = 0.9953423381462506
test Acc 0.9781191806331471:
28th- epoch: 298, train_loss = 1.8528243725886568, train_acc = 0.9953423381462506
test Acc 0.9781191806331471:
28th- epoch: 299, train_loss = 1.8519376242766157, train_acc = 0.9953423381462506
test Acc 0.9781191806331471:
28th- epoch: 300, train_loss = 1.8491554781794548, train_acc = 0.9953423381462506
test Acc 0.9781191806331471:
28th- epoch: 301, train_loss = 1.8477118586888537, train_acc = 0.9953423381462506
test Acc 0.9781191806331471:
28th- epoch: 302, train_loss = 1.845226133824326, train_acc = 0.9953423381462506
test Acc 0.9781191806331471:
28

28th- epoch: 442, train_loss = 1.6653900097007863, train_acc = 0.9954587796925943
test Acc 0.9795158286778398:
28th- epoch: 443, train_loss = 1.663850113749504, train_acc = 0.9954587796925943
test Acc 0.9795158286778398:
28th- epoch: 444, train_loss = 1.66463241976453, train_acc = 0.9954587796925943
test Acc 0.9795158286778398:
28th- epoch: 445, train_loss = 1.6629958960111253, train_acc = 0.9954587796925943
test Acc 0.9795158286778398:
28th- epoch: 446, train_loss = 1.6617522339220159, train_acc = 0.9954587796925943
test Acc 0.9795158286778398:
28th- epoch: 447, train_loss = 1.6623459818656556, train_acc = 0.9954587796925943
test Acc 0.9795158286778398:
28th- epoch: 448, train_loss = 1.6605131861870177, train_acc = 0.9954587796925943
test Acc 0.9795158286778398:
28th- epoch: 449, train_loss = 1.6596393560175784, train_acc = 0.9954587796925943
test Acc 0.9795158286778398:
28th- epoch: 450, train_loss = 1.6587027522618882, train_acc = 0.9954587796925943
test Acc 0.9795158286778398:
28th

 93%|███████████████████████████████████████████████████████████████████▏    | 28/30 [4:13:28<18:06, 543.25s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
29th- epoch: 0, train_loss = 96.53166696429253, train_acc = 0.8082207731718677
test Acc 0.8687150837988827:
29th- epoch: 1, train_loss = 41.03782796859741, train_acc = 0.9136003726129484
test Acc 0.9199255121042831:
29th- epoch: 2, train_loss = 31.385571397840977, train_acc = 0.9330461108523521
test Acc 0.9329608938547486:
29th- epoch: 3, train_loss = 26.17290173470974, train_acc = 0.944108057755007
test Acc 0.9441340782122905:
29th- epoch: 4, train_loss = 22.803202502429485, train_acc = 0.9505123428039124
test Acc 0.9506517690875232:
29th- epoch: 5, train_loss = 20.47078873217106, train_acc = 0.955286446204005

29th- epoch: 146, train_loss = 2.658899346832186, train_acc = 0.9940614811364695
test Acc 0.9795158286778398:
29th- epoch: 147, train_loss = 2.64705423777923, train_acc = 0.9940614811364695
test Acc 0.9795158286778398:
29th- epoch: 148, train_loss = 2.6375191435217857, train_acc = 0.9940614811364695
test Acc 0.9795158286778398:
29th- epoch: 149, train_loss = 2.6275884001515806, train_acc = 0.9940614811364695
test Acc 0.9795158286778398:
29th- epoch: 150, train_loss = 2.6177622848190367, train_acc = 0.9940614811364695
test Acc 0.9795158286778398:
29th- epoch: 151, train_loss = 2.6063288375735283, train_acc = 0.9941779226828132
test Acc 0.9795158286778398:
29th- epoch: 152, train_loss = 2.597336603794247, train_acc = 0.9940614811364695
test Acc 0.9795158286778398:
29th- epoch: 153, train_loss = 2.5878924690186977, train_acc = 0.9940614811364695
test Acc 0.9795158286778398:
29th- epoch: 154, train_loss = 2.5787370554171503, train_acc = 0.9941779226828132
test Acc 0.9795158286778398:
29th-

29th- epoch: 294, train_loss = 1.9012917603831738, train_acc = 0.995575221238938
test Acc 0.9804469273743017:
29th- epoch: 295, train_loss = 1.8992707047145814, train_acc = 0.995575221238938
test Acc 0.9804469273743017:
29th- epoch: 296, train_loss = 1.8968013997655362, train_acc = 0.995575221238938
test Acc 0.9804469273743017:
29th- epoch: 297, train_loss = 1.8950994934421033, train_acc = 0.9956916627852818
test Acc 0.9804469273743017:
29th- epoch: 298, train_loss = 1.892082504928112, train_acc = 0.995575221238938
test Acc 0.9804469273743017:
29th- epoch: 299, train_loss = 1.8901670041959733, train_acc = 0.9956916627852818
test Acc 0.9804469273743017:
29th- epoch: 300, train_loss = 1.8869699637871236, train_acc = 0.995575221238938
test Acc 0.9804469273743017:
29th- epoch: 301, train_loss = 1.8852044518571347, train_acc = 0.995575221238938
test Acc 0.9804469273743017:
29th- epoch: 302, train_loss = 1.8836664259433746, train_acc = 0.995575221238938
test Acc 0.9804469273743017:
29th- epo

test Acc 0.9804469273743017:
29th- epoch: 442, train_loss = 1.6786278076469898, train_acc = 0.9958081043316255
test Acc 0.9804469273743017:
29th- epoch: 443, train_loss = 1.6775043284287676, train_acc = 0.9958081043316255
test Acc 0.9804469273743017:
29th- epoch: 444, train_loss = 1.6774528907844797, train_acc = 0.9958081043316255
test Acc 0.9804469273743017:
29th- epoch: 445, train_loss = 1.675861074239947, train_acc = 0.9958081043316255
test Acc 0.9804469273743017:
29th- epoch: 446, train_loss = 1.6757360001793131, train_acc = 0.9958081043316255
test Acc 0.9804469273743017:
29th- epoch: 447, train_loss = 1.6739940667757764, train_acc = 0.9958081043316255
test Acc 0.9804469273743017:
29th- epoch: 448, train_loss = 1.6727443374693394, train_acc = 0.9958081043316255
test Acc 0.9804469273743017:
29th- epoch: 449, train_loss = 1.67263299098704, train_acc = 0.9958081043316255
test Acc 0.9804469273743017:
29th- epoch: 450, train_loss = 1.6714618764817715, train_acc = 0.9958081043316255
test

 97%|█████████████████████████████████████████████████████████████████████▌  | 29/30 [4:22:31<09:03, 543.09s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
30th- epoch: 0, train_loss = 106.08653329312801, train_acc = 0.7812063344201211
test Acc 0.8626629422718808:
30th- epoch: 1, train_loss = 42.843772023916245, train_acc = 0.9137168141592921
test Acc 0.914804469273743:
30th- epoch: 2, train_loss = 32.90244650095701, train_acc = 0.9356078248719143
test Acc 0.9324953445065177:
30th- epoch: 3, train_loss = 27.909543372690678, train_acc = 0.9462040055891943
test Acc 0.9427374301675978:
30th- epoch: 4, train_loss = 24.643171593546867, train_acc = 0.9510945505356311
test Acc 0.946927374301676:
30th- epoch: 5, train_loss = 22.226665269583464, train_acc = 0.9550535631113

30th- epoch: 146, train_loss = 2.71965586906299, train_acc = 0.9946436888681882
test Acc 0.9748603351955307:
30th- epoch: 147, train_loss = 2.7077079652808607, train_acc = 0.9946436888681882
test Acc 0.9748603351955307:
30th- epoch: 148, train_loss = 2.697655662894249, train_acc = 0.9946436888681882
test Acc 0.9748603351955307:
30th- epoch: 149, train_loss = 2.686784863471985, train_acc = 0.9946436888681882
test Acc 0.9748603351955307:
30th- epoch: 150, train_loss = 2.6760612479411066, train_acc = 0.9946436888681882
test Acc 0.9748603351955307:
30th- epoch: 151, train_loss = 2.6664390019141138, train_acc = 0.9946436888681882
test Acc 0.9748603351955307:
30th- epoch: 152, train_loss = 2.654739574994892, train_acc = 0.9946436888681882
test Acc 0.9748603351955307:
30th- epoch: 153, train_loss = 2.6449082284234464, train_acc = 0.9946436888681882
test Acc 0.9748603351955307:
30th- epoch: 154, train_loss = 2.634452771395445, train_acc = 0.9946436888681882
test Acc 0.9748603351955307:
30th- e

30th- epoch: 294, train_loss = 1.9257286179345101, train_acc = 0.995575221238938
test Acc 0.9776536312849162:
30th- epoch: 295, train_loss = 1.9232720732688904, train_acc = 0.995575221238938
test Acc 0.9776536312849162:
30th- epoch: 296, train_loss = 1.9211627766489983, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
30th- epoch: 297, train_loss = 1.91900834441185, train_acc = 0.995575221238938
test Acc 0.9776536312849162:
30th- epoch: 298, train_loss = 1.9143013209104538, train_acc = 0.995575221238938
test Acc 0.9776536312849162:
30th- epoch: 299, train_loss = 1.911855700192973, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
30th- epoch: 300, train_loss = 1.9100323889870197, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
30th- epoch: 301, train_loss = 1.9066225301939994, train_acc = 0.995575221238938
test Acc 0.9776536312849162:
30th- epoch: 302, train_loss = 1.9053964987397194, train_acc = 0.995575221238938
test Acc 0.9781191806331471:
30th- epoch: 

30th- epoch: 443, train_loss = 1.6927770165493712, train_acc = 0.995575221238938
test Acc 0.978584729981378:
30th- epoch: 444, train_loss = 1.6926163248717785, train_acc = 0.995575221238938
test Acc 0.978584729981378:
30th- epoch: 445, train_loss = 1.6908323926618323, train_acc = 0.995575221238938
test Acc 0.978584729981378:
30th- epoch: 446, train_loss = 1.69041231891606, train_acc = 0.995575221238938
test Acc 0.978584729981378:
30th- epoch: 447, train_loss = 1.6891694279620424, train_acc = 0.995575221238938
test Acc 0.978584729981378:
30th- epoch: 448, train_loss = 1.6876070561120287, train_acc = 0.995575221238938
test Acc 0.978584729981378:
30th- epoch: 449, train_loss = 1.6874075817177072, train_acc = 0.995575221238938
test Acc 0.978584729981378:
30th- epoch: 450, train_loss = 1.6880283914506435, train_acc = 0.995575221238938
test Acc 0.978584729981378:
30th- epoch: 451, train_loss = 1.6856044493615627, train_acc = 0.995575221238938
test Acc 0.979050279329609:
30th- epoch: 452, tra

100%|████████████████████████████████████████████████████████████████████████| 30/30 [4:31:34<00:00, 543.03s/it]


Wall time: 4h 31min 36s
