In [None]:
import copy
import os
from collections import Counter

import numpy as np
import pandas as pd
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim
import torch.utils.data as data
from tqdm import tqdm

import utility.Data_loader as D
from utility.Custom import CustomDataset
from utility.Model import Mcslt

In [2]:
%%time
if __name__ == '__main__':
    # Repeated-seed training experiment.
    #
    # Loads the feature vectors and labels from `read_path`, makes one fixed
    # 80/20 train/test split, then trains a fresh `Mcslt` network TOTAL times
    # (one torch seed per run) for EPOCH epochs each.  For every run the epoch
    # with the highest test accuracy is recorded (loss, accuracy, predictions,
    # true labels) and the collected results are written to CSV files next to
    # a model checkpoint.

    # ---------------------------------------------------------------- config
    # NOTE(review): 'D:virus/...' has no slash after the drive letter, which on
    # Windows is resolved relative to the current directory of drive D: --
    # confirm this is intended.
    read_path = 'D:virus/image/1gram_768/'
    file_name = 'res/Mcslt_1gram'

    BATCH_SIZE = 64
    TOTAL = 30            # number of independent training runs
    EPOCH = 500           # epochs per run
    NUM_CLASS = 9
    LR = 0.0001
    SEED = list(range(TOTAL))   # run i is seeded with SEED[i]
    Num_Nodes = 768

    CUDA_N = 'cuda:0'
    # The device does not change between runs, so it is resolved once.
    device = torch.device(CUDA_N if torch.cuda.is_available() else 'cpu')

    # Create the output directory up front so that hours of training are not
    # lost to a missing folder when the results are finally written.
    os.makedirs(os.path.dirname(file_name), exist_ok=True)

    # Unused in this cell; kept in case a later cell still refers to it.
    temp = [[],[]]

    # ------------------------------------------------------------------ data
    Loader = D.File_loader()
    data_a, label_a = Loader.read_files(read_path, interp = False)

    # Order the samples by label and flatten each one to a 1-D feature vector.
    # The row count is taken from the data instead of being hard-coded.
    idx = np.argsort(label_a)
    sorted_data = data_a[idx].reshape(len(idx), -1)
    sorted_label = sorted(label_a)

    # creating data indices for splitting
    full_dataset = CustomDataset(sorted_data, sorted_label)
    train_size = int(0.8 * len(full_dataset))
    test_size = len(full_dataset) - train_size

    # splitting (fixed seed so every run sees the same partition)
    torch.manual_seed(10)
    train_dataset, test_dataset = data.random_split(full_dataset, [train_size, test_size])
    # NOTE(review): shuffle=False means the training batches are visited in the
    # same order every epoch; left unchanged so results stay comparable.
    train_loader = data.DataLoader(train_dataset, batch_size=BATCH_SIZE, shuffle = False)
    test_loader = data.DataLoader(test_dataset, batch_size=BATCH_SIZE, shuffle=False)

    # Stateless modules, shared by all runs.
    # dim=1 is the class axis of the (batch, NUM_CLASS) logits; passing it
    # explicitly avoids the implicit-dimension deprecation warning.
    softmax = nn.Softmax(dim=1)
    criterion = nn.CrossEntropyLoss()

    # One entry per run, taken at that run's best epoch.
    loss_total = []
    acc_total = []
    pred_total = []
    true_total = []

    # Weights of the best-scoring epoch over all runs; this is what is saved,
    # so the checkpoint corresponds to a reported result.
    best_overall_acc = -1.0
    best_overall_state = None

    # ----------------------------------------------------------------- train
    for i in tqdm(range(TOTAL)):
        torch.manual_seed(SEED[i])
        net = Mcslt(Num_Nodes, NUM_CLASS)
        net.to(device)
        print(net)

        optimizer = optim.SGD(net.parameters(), lr=LR, momentum = 0.1)

        # Per-epoch history of the current run.
        loss_list = []
        train_acc_list = []
        test_acc_list = []

        pred_temp = []
        true_temp = []

        for epoch in range(EPOCH):
            # ---- training pass
            net.train()
            running_loss = 0      # sum of the per-batch mean losses
            correct = 0

            for inputs, labels in train_loader:
                inputs = inputs.to(device=device, dtype=torch.float32)
                labels = labels.to(device=device, dtype=torch.long)

                outputs = net(inputs)
                loss = criterion(outputs, labels)

                optimizer.zero_grad()
                loss.backward()
                optimizer.step()
                running_loss += loss.item()

                _, pred = torch.max(outputs, dim=1)
                correct += (pred == labels).sum().item()

            train_acc = correct/train_size
            loss_list.append(running_loss)
            train_acc_list.append(train_acc)
            print('{}th- epoch: {}, train_loss = {}, train_acc = {}'.format(i+1, epoch, running_loss, train_acc))

            # ---- evaluation pass
            net.eval()
            with torch.no_grad():
                correct = 0
                pt, tt = [], []

                for inputs_t, labels_t in test_loader:
                    inputs_t = inputs_t.to(device=device, dtype=torch.float32)
                    labels_t = labels_t.to(device=device, dtype=torch.long)

                    outputs_t = softmax(net(inputs_t))

                    # test accuracy
                    _, pred_t = torch.max(outputs_t, dim = 1)

                    pt.append(pred_t)
                    tt.append(labels_t)

                    correct += (pred_t == labels_t).sum().item()

                pred_temp.append(torch.cat(pt))
                true_temp.append(torch.cat(tt))

                test_acc = correct/test_size
                test_acc_list.append(test_acc)

                print('test Acc {}:'.format(test_acc))

            # Strict '>' keeps the earliest epoch on ties, matching np.argmax.
            if test_acc > best_overall_acc:
                best_overall_acc = test_acc
                best_overall_state = copy.deepcopy(net.state_dict())

        # NOTE(review): the best epoch is chosen by test accuracy, so the
        # reported numbers are optimistic; a separate validation split would
        # be needed for an unbiased estimate.
        best_result_index = np.argmax(np.array(test_acc_list))
        loss_total.append(loss_list[best_result_index])
        acc_total.append(test_acc_list[best_result_index])
        pred_total.append(pred_temp[best_result_index].tolist())
        true_total.append(true_temp[best_result_index].tolist())

    # ------------------------------------------------------------------ save
    if best_overall_state is not None:
        torch.save(best_overall_state, file_name +'.pth')

    loss_DF = pd.DataFrame(loss_total)
    loss_DF.to_csv(file_name+" loss.csv")

    acc_DF = pd.DataFrame(acc_total)
    acc_DF.to_csv(file_name +" acc.csv")

    pred_DF = pd.DataFrame(pred_total)
    pred_DF.to_csv(file_name +" pred.csv")

    true_DF = pd.DataFrame(true_total)
    true_DF.to_csv(file_name +" true.csv")

100%|███████████████████████████████████████████████████████████████████| 10736/10736 [00:01<00:00, 5742.01it/s]
  0%|                                                                                    | 0/30 [00:00<?, ?it/s]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
1th- epoch: 0, train_loss = 141.51218968629837, train_acc = 0.75




test Acc 0.8635940409683427:
1th- epoch: 1, train_loss = 58.23592698574066, train_acc = 0.8813460642757336
test Acc 0.8947858472998138:
1th- epoch: 2, train_loss = 48.3622922450304, train_acc = 0.902771308802981
test Acc 0.9022346368715084:
1th- epoch: 3, train_loss = 43.494202613830566, train_acc = 0.9103400093153237
test Acc 0.9120111731843575:
1th- epoch: 4, train_loss = 40.261719420552254, train_acc = 0.9156963204471356
test Acc 0.9162011173184358:
1th- epoch: 5, train_loss = 37.85023643821478, train_acc = 0.9203539823008849
test Acc 0.9213221601489758:
1th- epoch: 6, train_loss = 35.90387463569641, train_acc = 0.9231485794131346
test Acc 0.9245810055865922:
1th- epoch: 7, train_loss = 34.435725674033165, train_acc = 0.9252445272473219
test Acc 0.9292364990689013:
1th- epoch: 8, train_loss = 33.12388176470995, train_acc = 0.9272240335351654
test Acc 0.930633147113594:
1th- epoch: 9, train_loss = 32.027555629611015, train_acc = 0.9293199813693526
test Acc 0.9315642458100558:
1th- ep

1th- epoch: 151, train_loss = 16.437374438159168, train_acc = 0.9633209129017233
test Acc 0.9464618249534451:
1th- epoch: 152, train_loss = 16.437853108160198, train_acc = 0.9635537959944108
test Acc 0.946927374301676:
1th- epoch: 153, train_loss = 16.404670022428036, train_acc = 0.9632044713553796
test Acc 0.946927374301676:
1th- epoch: 154, train_loss = 16.38467296678573, train_acc = 0.9633209129017233
test Acc 0.946927374301676:
1th- epoch: 155, train_loss = 16.361124138347805, train_acc = 0.9633209129017233
test Acc 0.946927374301676:
1th- epoch: 156, train_loss = 16.35290731769055, train_acc = 0.9633209129017233
test Acc 0.946927374301676:
1th- epoch: 157, train_loss = 16.325540277175605, train_acc = 0.9634373544480671
test Acc 0.946927374301676:
1th- epoch: 158, train_loss = 16.304023225791752, train_acc = 0.9633209129017233
test Acc 0.9473929236499069:
1th- epoch: 159, train_loss = 16.291634187102318, train_acc = 0.9633209129017233
test Acc 0.946927374301676:
1th- epoch: 160, tr

1th- epoch: 300, train_loss = 14.603662960231304, train_acc = 0.9672799254774104
test Acc 0.9483240223463687:
1th- epoch: 301, train_loss = 14.592954797204584, train_acc = 0.9672799254774104
test Acc 0.9483240223463687:
1th- epoch: 302, train_loss = 14.585573054850101, train_acc = 0.9673963670237541
test Acc 0.9483240223463687:
1th- epoch: 303, train_loss = 14.57369014620781, train_acc = 0.9673963670237541
test Acc 0.9483240223463687:
1th- epoch: 304, train_loss = 14.571775391697884, train_acc = 0.9673963670237541
test Acc 0.9483240223463687:
1th- epoch: 305, train_loss = 14.556932926177979, train_acc = 0.9672799254774104
test Acc 0.9483240223463687:
1th- epoch: 306, train_loss = 14.55694122845307, train_acc = 0.9673963670237541
test Acc 0.9483240223463687:
1th- epoch: 307, train_loss = 14.549049896653742, train_acc = 0.9675128085700978
test Acc 0.9483240223463687:
1th- epoch: 308, train_loss = 14.538993862923235, train_acc = 0.9678621332091291
test Acc 0.9483240223463687:
1th- epoch: 

test Acc 0.9487895716945997:
1th- epoch: 449, train_loss = 13.748240113258362, train_acc = 0.9699580810433163
test Acc 0.9492551210428305:
1th- epoch: 450, train_loss = 13.752988318447024, train_acc = 0.97007452258966
test Acc 0.9492551210428305:
1th- epoch: 451, train_loss = 13.743619874119759, train_acc = 0.97007452258966
test Acc 0.9492551210428305:
1th- epoch: 452, train_loss = 13.741098883096129, train_acc = 0.9699580810433163
test Acc 0.9492551210428305:
1th- epoch: 453, train_loss = 13.73489161580801, train_acc = 0.9699580810433163
test Acc 0.9492551210428305:
1th- epoch: 454, train_loss = 13.729323364794254, train_acc = 0.9699580810433163
test Acc 0.9492551210428305:
1th- epoch: 455, train_loss = 13.730227373540401, train_acc = 0.9699580810433163
test Acc 0.9492551210428305:
1th- epoch: 456, train_loss = 13.725483221467584, train_acc = 0.97007452258966
test Acc 0.9492551210428305:
1th- epoch: 457, train_loss = 13.717251867055893, train_acc = 0.97007452258966
test Acc 0.94925512

  3%|██▍                                                                      | 1/30 [09:02<4:22:03, 542.20s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
2th- epoch: 0, train_loss = 127.45502880215645, train_acc = 0.749534233814625
test Acc 0.8119180633147114:
2th- epoch: 1, train_loss = 59.21118600666523, train_acc = 0.8734280391243596
test Acc 0.8566108007448789:
2th- epoch: 2, train_loss = 49.65851204097271, train_acc = 0.8954354913833256
test Acc 0.88268156424581:
2th- epoch: 3, train_loss = 44.52341739833355, train_acc = 0.905798789007918
test Acc 0.8943202979515829:
2th- epoch: 4, train_loss = 41.05014143139124, train_acc = 0.912435957149511
test Acc 0.9082867783985102:
2th- epoch: 5, train_loss = 38.648760728538036, train_acc = 0.9174429436422916
test Acc

2th- epoch: 147, train_loss = 16.878104964271188, train_acc = 0.9634373544480671
test Acc 0.9450651769087524:
2th- epoch: 148, train_loss = 16.861504951491952, train_acc = 0.9632044713553796
test Acc 0.9450651769087524:
2th- epoch: 149, train_loss = 16.83960670232773, train_acc = 0.9634373544480671
test Acc 0.9455307262569832:
2th- epoch: 150, train_loss = 16.815933572128415, train_acc = 0.9632044713553796
test Acc 0.9455307262569832:
2th- epoch: 151, train_loss = 16.79067882709205, train_acc = 0.9633209129017233
test Acc 0.9455307262569832:
2th- epoch: 152, train_loss = 16.776182325556874, train_acc = 0.9633209129017233
test Acc 0.9455307262569832:
2th- epoch: 153, train_loss = 16.75211418233812, train_acc = 0.9634373544480671
test Acc 0.9455307262569832:
2th- epoch: 154, train_loss = 16.73311212658882, train_acc = 0.9636702375407545
test Acc 0.9459962756052142:
2th- epoch: 155, train_loss = 16.71538239903748, train_acc = 0.9634373544480671
test Acc 0.9450651769087524:
2th- epoch: 156

test Acc 0.946927374301676:
2th- epoch: 297, train_loss = 14.92519545275718, train_acc = 0.9677456916627852
test Acc 0.946927374301676:
2th- epoch: 298, train_loss = 14.917648809961975, train_acc = 0.9677456916627852
test Acc 0.946927374301676:
2th- epoch: 299, train_loss = 14.908299446105957, train_acc = 0.9677456916627852
test Acc 0.946927374301676:
2th- epoch: 300, train_loss = 14.91156666353345, train_acc = 0.9678621332091291
test Acc 0.946927374301676:
2th- epoch: 301, train_loss = 14.897472796030343, train_acc = 0.9676292501164415
test Acc 0.946927374301676:
2th- epoch: 302, train_loss = 14.887117858044803, train_acc = 0.9678621332091291
test Acc 0.946927374301676:
2th- epoch: 303, train_loss = 14.885658998973668, train_acc = 0.9678621332091291
test Acc 0.946927374301676:
2th- epoch: 304, train_loss = 14.873137908987701, train_acc = 0.9677456916627852
test Acc 0.946927374301676:
2th- epoch: 305, train_loss = 14.868231409229338, train_acc = 0.9677456916627852
test Acc 0.9469273743

2th- epoch: 445, train_loss = 14.034782508853823, train_acc = 0.969608756404285
test Acc 0.9487895716945997:
2th- epoch: 446, train_loss = 14.032862678170204, train_acc = 0.969608756404285
test Acc 0.9487895716945997:
2th- epoch: 447, train_loss = 14.032205797731876, train_acc = 0.9694923148579413
test Acc 0.9487895716945997:
2th- epoch: 448, train_loss = 14.024740878492594, train_acc = 0.969608756404285
test Acc 0.9487895716945997:
2th- epoch: 449, train_loss = 14.01280348887667, train_acc = 0.969608756404285
test Acc 0.9487895716945997:
2th- epoch: 450, train_loss = 14.01234399387613, train_acc = 0.969608756404285
test Acc 0.9487895716945997:
2th- epoch: 451, train_loss = 14.017632111907005, train_acc = 0.969608756404285
test Acc 0.9487895716945997:
2th- epoch: 452, train_loss = 14.007768007460982, train_acc = 0.969608756404285
test Acc 0.9487895716945997:
2th- epoch: 453, train_loss = 14.002687819302082, train_acc = 0.969608756404285
test Acc 0.9487895716945997:
2th- epoch: 454, tra

  7%|████▊                                                                    | 2/30 [18:04<4:13:03, 542.28s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
3th- epoch: 0, train_loss = 116.76749747991562, train_acc = 0.7554727526781556
test Acc 0.8519553072625698:
3th- epoch: 1, train_loss = 59.1044575124979, train_acc = 0.8762226362366092
test Acc 0.8854748603351955:
3th- epoch: 2, train_loss = 49.34728763997555, train_acc = 0.8952026082906381
test Acc 0.8994413407821229:
3th- epoch: 3, train_loss = 44.30472859740257, train_acc = 0.9055659059152306
test Acc 0.9064245810055865:
3th- epoch: 4, train_loss = 40.95401853322983, train_acc = 0.9113879832324173
test Acc 0.9106145251396648:
3th- epoch: 5, train_loss = 38.5804136171937, train_acc = 0.9161620866325105
test A

3th- epoch: 147, train_loss = 17.207624100148678, train_acc = 0.9615742897065673
test Acc 0.9455307262569832:
3th- epoch: 148, train_loss = 17.193420777097344, train_acc = 0.9615742897065673
test Acc 0.9455307262569832:
3th- epoch: 149, train_loss = 17.16484414227307, train_acc = 0.961690731252911
test Acc 0.9455307262569832:
3th- epoch: 150, train_loss = 17.146300675347447, train_acc = 0.9618071727992548
test Acc 0.9459962756052142:
3th- epoch: 151, train_loss = 17.11153689585626, train_acc = 0.9618071727992548
test Acc 0.9455307262569832:
3th- epoch: 152, train_loss = 17.100823648273945, train_acc = 0.9619236143455985
test Acc 0.9459962756052142:
3th- epoch: 153, train_loss = 17.074683183804154, train_acc = 0.9619236143455985
test Acc 0.9459962756052142:
3th- epoch: 154, train_loss = 17.05058477073908, train_acc = 0.9622729389846297
test Acc 0.9459962756052142:
3th- epoch: 155, train_loss = 17.039342744275928, train_acc = 0.9620400558919422
test Acc 0.9455307262569832:
3th- epoch: 15

3th- epoch: 296, train_loss = 15.153619240038097, train_acc = 0.9657661853749417
test Acc 0.9483240223463687:
3th- epoch: 297, train_loss = 15.146068987436593, train_acc = 0.9657661853749417
test Acc 0.9487895716945997:
3th- epoch: 298, train_loss = 15.135366514325142, train_acc = 0.9657661853749417
test Acc 0.9483240223463687:
3th- epoch: 299, train_loss = 15.124909073114395, train_acc = 0.9657661853749417
test Acc 0.9487895716945997:
3th- epoch: 300, train_loss = 15.116426748223603, train_acc = 0.9657661853749417
test Acc 0.9487895716945997:
3th- epoch: 301, train_loss = 15.109538336284459, train_acc = 0.9657661853749417
test Acc 0.9487895716945997:
3th- epoch: 302, train_loss = 15.103071088902652, train_acc = 0.9657661853749417
test Acc 0.9483240223463687:
3th- epoch: 303, train_loss = 15.098965686745942, train_acc = 0.9657661853749417
test Acc 0.9487895716945997:
3th- epoch: 304, train_loss = 15.086336421780288, train_acc = 0.9658826269212856
test Acc 0.9487895716945997:
3th- epoch

3th- epoch: 444, train_loss = 14.150016814470291, train_acc = 0.9692594317652539
test Acc 0.9497206703910615:
3th- epoch: 445, train_loss = 14.14616251224652, train_acc = 0.9690265486725663
test Acc 0.9497206703910615:
3th- epoch: 446, train_loss = 14.139765759464353, train_acc = 0.9691429902189101
test Acc 0.9497206703910615:
3th- epoch: 447, train_loss = 14.134732271078974, train_acc = 0.9692594317652539
test Acc 0.9497206703910615:
3th- epoch: 448, train_loss = 14.129677583929151, train_acc = 0.9692594317652539
test Acc 0.9497206703910615:
3th- epoch: 449, train_loss = 14.126035551074892, train_acc = 0.9692594317652539
test Acc 0.9497206703910615:
3th- epoch: 450, train_loss = 14.125455806497484, train_acc = 0.9693758733115976
test Acc 0.9497206703910615:
3th- epoch: 451, train_loss = 14.114192301873118, train_acc = 0.9692594317652539
test Acc 0.9497206703910615:
3th- epoch: 452, train_loss = 14.11435999488458, train_acc = 0.9692594317652539
test Acc 0.9497206703910615:
3th- epoch: 

 10%|███████▎                                                                 | 3/30 [27:07<4:04:10, 542.59s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
4th- epoch: 0, train_loss = 133.66366842389107, train_acc = 0.7392873777363763
test Acc 0.835195530726257:
4th- epoch: 1, train_loss = 61.14858815073967, train_acc = 0.8745924545877969
test Acc 0.8891992551210428:
4th- epoch: 2, train_loss = 51.14849931001663, train_acc = 0.8970656730321379
test Acc 0.9008379888268156:
4th- epoch: 3, train_loss = 45.9944751560688, train_acc = 0.9049836981835119
test Acc 0.9078212290502793:
4th- epoch: 4, train_loss = 42.66969057917595, train_acc = 0.911504424778761
test Acc 0.9124767225325885:
4th- epoch: 5, train_loss = 40.21695948392153, train_acc = 0.916394969725198
test Acc

4th- epoch: 147, train_loss = 17.199761105701327, train_acc = 0.961690731252911
test Acc 0.9459962756052142:
4th- epoch: 148, train_loss = 17.182656725868583, train_acc = 0.9619236143455985
test Acc 0.9459962756052142:
4th- epoch: 149, train_loss = 17.16750002466142, train_acc = 0.961690731252911
test Acc 0.9459962756052142:
4th- epoch: 150, train_loss = 17.13502380810678, train_acc = 0.961690731252911
test Acc 0.9459962756052142:
4th- epoch: 151, train_loss = 17.117489647120237, train_acc = 0.9618071727992548
test Acc 0.9459962756052142:
4th- epoch: 152, train_loss = 17.097417825832963, train_acc = 0.9618071727992548
test Acc 0.9459962756052142:
4th- epoch: 153, train_loss = 17.065124599263072, train_acc = 0.9618071727992548
test Acc 0.9459962756052142:
4th- epoch: 154, train_loss = 17.052919385954738, train_acc = 0.9619236143455985
test Acc 0.9459962756052142:
4th- epoch: 155, train_loss = 17.030444918200374, train_acc = 0.9620400558919422
test Acc 0.9459962756052142:
4th- epoch: 156

4th- epoch: 296, train_loss = 15.17069724202156, train_acc = 0.9666977177456917
test Acc 0.9497206703910615:
4th- epoch: 297, train_loss = 15.159249517135322, train_acc = 0.9669306008383791
test Acc 0.9497206703910615:
4th- epoch: 298, train_loss = 15.158097644336522, train_acc = 0.9666977177456917
test Acc 0.9497206703910615:
4th- epoch: 299, train_loss = 15.14405029732734, train_acc = 0.9669306008383791
test Acc 0.9497206703910615:
4th- epoch: 300, train_loss = 15.141666191630065, train_acc = 0.9669306008383791
test Acc 0.9497206703910615:
4th- epoch: 301, train_loss = 15.1302245631814, train_acc = 0.9666977177456917
test Acc 0.9497206703910615:
4th- epoch: 302, train_loss = 15.12825268227607, train_acc = 0.9668141592920354
test Acc 0.9497206703910615:
4th- epoch: 303, train_loss = 15.114187642931938, train_acc = 0.9669306008383791
test Acc 0.9497206703910615:
4th- epoch: 304, train_loss = 15.098023449070752, train_acc = 0.9669306008383791
test Acc 0.9497206703910615:
4th- epoch: 305

4th- epoch: 444, train_loss = 14.207080368883908, train_acc = 0.9691429902189101
test Acc 0.9506517690875232:
4th- epoch: 445, train_loss = 14.197924030013382, train_acc = 0.9691429902189101
test Acc 0.9506517690875232:
4th- epoch: 446, train_loss = 14.193804780952632, train_acc = 0.9691429902189101
test Acc 0.9506517690875232:
4th- epoch: 447, train_loss = 14.186047594062984, train_acc = 0.9691429902189101
test Acc 0.9506517690875232:
4th- epoch: 448, train_loss = 14.177645231131464, train_acc = 0.9690265486725663
test Acc 0.9506517690875232:
4th- epoch: 449, train_loss = 14.174020655453205, train_acc = 0.9690265486725663
test Acc 0.9506517690875232:
4th- epoch: 450, train_loss = 14.167880117893219, train_acc = 0.9691429902189101
test Acc 0.9506517690875232:
4th- epoch: 451, train_loss = 14.166562899947166, train_acc = 0.9691429902189101
test Acc 0.9506517690875232:
4th- epoch: 452, train_loss = 14.16089078783989, train_acc = 0.9691429902189101
test Acc 0.9506517690875232:
4th- epoch:

 13%|█████████▋                                                               | 4/30 [36:09<3:54:59, 542.30s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
5th- epoch: 0, train_loss = 137.19349732995033, train_acc = 0.7261294829995343
test Acc 0.8086592178770949:
5th- epoch: 1, train_loss = 60.105453476309776, train_acc = 0.8678388448998603
test Acc 0.8589385474860335:
5th- epoch: 2, train_loss = 49.83126164972782, train_acc = 0.893921751280857
test Acc 0.883147113594041:
5th- epoch: 3, train_loss = 44.522868663072586, train_acc = 0.9066138798323242
test Acc 0.9022346368715084:
5th- epoch: 4, train_loss = 41.15682389587164, train_acc = 0.9138332557056358
test Acc 0.9120111731843575:
5th- epoch: 5, train_loss = 38.684550531208515, train_acc = 0.9183744760130415
tes

5th- epoch: 147, train_loss = 16.974545545876026, train_acc = 0.9627387051700047
test Acc 0.9464618249534451:
5th- epoch: 148, train_loss = 16.943931927904487, train_acc = 0.9630880298090359
test Acc 0.9464618249534451:
5th- epoch: 149, train_loss = 16.926802469417453, train_acc = 0.9632044713553796
test Acc 0.946927374301676:
5th- epoch: 150, train_loss = 16.902023872360587, train_acc = 0.9630880298090359
test Acc 0.9464618249534451:
5th- epoch: 151, train_loss = 16.880329970270395, train_acc = 0.9633209129017233
test Acc 0.9464618249534451:
5th- epoch: 152, train_loss = 16.87053775601089, train_acc = 0.9633209129017233
test Acc 0.9464618249534451:
5th- epoch: 153, train_loss = 16.849531641229987, train_acc = 0.9634373544480671
test Acc 0.9464618249534451:
5th- epoch: 154, train_loss = 16.832564247772098, train_acc = 0.9634373544480671
test Acc 0.946927374301676:
5th- epoch: 155, train_loss = 16.797119177877903, train_acc = 0.9634373544480671
test Acc 0.946927374301676:
5th- epoch: 15

5th- epoch: 296, train_loss = 15.047016746364534, train_acc = 0.9671634839310667
test Acc 0.9483240223463687:
5th- epoch: 297, train_loss = 15.038898926228285, train_acc = 0.9672799254774104
test Acc 0.9483240223463687:
5th- epoch: 298, train_loss = 15.03156923968345, train_acc = 0.9672799254774104
test Acc 0.9483240223463687:
5th- epoch: 299, train_loss = 15.026088569313288, train_acc = 0.9672799254774104
test Acc 0.9483240223463687:
5th- epoch: 300, train_loss = 15.009218376129866, train_acc = 0.9673963670237541
test Acc 0.9483240223463687:
5th- epoch: 301, train_loss = 15.005808825604618, train_acc = 0.9672799254774104
test Acc 0.9483240223463687:
5th- epoch: 302, train_loss = 14.996310472488403, train_acc = 0.9673963670237541
test Acc 0.9483240223463687:
5th- epoch: 303, train_loss = 14.985980346798897, train_acc = 0.9672799254774104
test Acc 0.9487895716945997:
5th- epoch: 304, train_loss = 14.975183228962123, train_acc = 0.9673963670237541
test Acc 0.9483240223463687:
5th- epoch:

5th- epoch: 444, train_loss = 14.140299419406801, train_acc = 0.9691429902189101
test Acc 0.9492551210428305:
5th- epoch: 445, train_loss = 14.127679458353668, train_acc = 0.9691429902189101
test Acc 0.9492551210428305:
5th- epoch: 446, train_loss = 14.12582814693451, train_acc = 0.9691429902189101
test Acc 0.9492551210428305:
5th- epoch: 447, train_loss = 14.12855883454904, train_acc = 0.9691429902189101
test Acc 0.9492551210428305:
5th- epoch: 448, train_loss = 14.115735122468323, train_acc = 0.9691429902189101
test Acc 0.9492551210428305:
5th- epoch: 449, train_loss = 14.109738774597645, train_acc = 0.9691429902189101
test Acc 0.9492551210428305:
5th- epoch: 450, train_loss = 14.106512846890837, train_acc = 0.9691429902189101
test Acc 0.9492551210428305:
5th- epoch: 451, train_loss = 14.106723272707313, train_acc = 0.9692594317652539
test Acc 0.9492551210428305:
5th- epoch: 452, train_loss = 14.100948348641396, train_acc = 0.9693758733115976
test Acc 0.9497206703910615:
5th- epoch: 

 17%|████████████▏                                                            | 5/30 [45:14<3:46:17, 543.09s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
6th- epoch: 0, train_loss = 128.24296414852142, train_acc = 0.7494177922682813
test Acc 0.8212290502793296:
6th- epoch: 1, train_loss = 58.3861091658473, train_acc = 0.8777363763390778
test Acc 0.8682495344506518:
6th- epoch: 2, train_loss = 48.60183996707201, train_acc = 0.8948532836516069
test Acc 0.8845437616387337:
6th- epoch: 3, train_loss = 43.74584659188986, train_acc = 0.9051001397298556
test Acc 0.898975791433892:
6th- epoch: 4, train_loss = 40.56760708242655, train_acc = 0.9112715416860736
test Acc 0.9031657355679702:
6th- epoch: 5, train_loss = 38.22667954862118, train_acc = 0.915929203539823
test Ac

6th- epoch: 147, train_loss = 17.095595851540565, train_acc = 0.9623893805309734
test Acc 0.9450651769087524:
6th- epoch: 148, train_loss = 17.07233594916761, train_acc = 0.9623893805309734
test Acc 0.9450651769087524:
6th- epoch: 149, train_loss = 17.052076369524002, train_acc = 0.9626222636236609
test Acc 0.9450651769087524:
6th- epoch: 150, train_loss = 17.024069694802165, train_acc = 0.9628551467163484
test Acc 0.9450651769087524:
6th- epoch: 151, train_loss = 17.00953121483326, train_acc = 0.9628551467163484
test Acc 0.9445996275605214:
6th- epoch: 152, train_loss = 16.991106376051903, train_acc = 0.9628551467163484
test Acc 0.9450651769087524:
6th- epoch: 153, train_loss = 16.97119746170938, train_acc = 0.9628551467163484
test Acc 0.9445996275605214:
6th- epoch: 154, train_loss = 16.949003040790558, train_acc = 0.9628551467163484
test Acc 0.9445996275605214:
6th- epoch: 155, train_loss = 16.924191497266293, train_acc = 0.9629715882626921
test Acc 0.9445996275605214:
6th- epoch: 1

6th- epoch: 296, train_loss = 15.086441147141159, train_acc = 0.9662319515603167
test Acc 0.946927374301676:
6th- epoch: 297, train_loss = 15.075694997794926, train_acc = 0.9663483931066604
test Acc 0.946927374301676:
6th- epoch: 298, train_loss = 15.069817282259464, train_acc = 0.9664648346530041
test Acc 0.946927374301676:
6th- epoch: 299, train_loss = 15.049476030282676, train_acc = 0.966581276199348
test Acc 0.9464618249534451:
6th- epoch: 300, train_loss = 15.044383309781551, train_acc = 0.966581276199348
test Acc 0.946927374301676:
6th- epoch: 301, train_loss = 15.044191884808242, train_acc = 0.9663483931066604
test Acc 0.946927374301676:
6th- epoch: 302, train_loss = 15.033243256621063, train_acc = 0.9664648346530041
test Acc 0.946927374301676:
6th- epoch: 303, train_loss = 15.018927979283035, train_acc = 0.9664648346530041
test Acc 0.946927374301676:
6th- epoch: 304, train_loss = 15.017941854894161, train_acc = 0.9664648346530041
test Acc 0.946927374301676:
6th- epoch: 305, tra

test Acc 0.9478584729981379:
6th- epoch: 446, train_loss = 14.129596252925694, train_acc = 0.9693758733115976
test Acc 0.9478584729981379:
6th- epoch: 447, train_loss = 14.127021198160946, train_acc = 0.9692594317652539
test Acc 0.9478584729981379:
6th- epoch: 448, train_loss = 14.118821400217712, train_acc = 0.9693758733115976
test Acc 0.9478584729981379:
6th- epoch: 449, train_loss = 14.114262078888714, train_acc = 0.9693758733115976
test Acc 0.9483240223463687:
6th- epoch: 450, train_loss = 14.111345673911273, train_acc = 0.9693758733115976
test Acc 0.9478584729981379:
6th- epoch: 451, train_loss = 14.106897269375622, train_acc = 0.9693758733115976
test Acc 0.9478584729981379:
6th- epoch: 452, train_loss = 14.101289975456893, train_acc = 0.9693758733115976
test Acc 0.9478584729981379:
6th- epoch: 453, train_loss = 14.089052446186543, train_acc = 0.9692594317652539
test Acc 0.9478584729981379:
6th- epoch: 454, train_loss = 14.09150257986039, train_acc = 0.9693758733115976
test Acc 0.

 20%|██████████████▌                                                          | 6/30 [54:18<3:37:19, 543.31s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
7th- epoch: 0, train_loss = 124.80583634972572, train_acc = 0.7402189101071263
test Acc 0.8333333333333334:
7th- epoch: 1, train_loss = 60.4703631401062, train_acc = 0.8720307405682347
test Acc 0.8808193668528864:
7th- epoch: 2, train_loss = 50.570172891020775, train_acc = 0.8919422449930136
test Acc 0.8919925512104283:
7th- epoch: 3, train_loss = 45.45087657868862, train_acc = 0.9030041918956684
test Acc 0.9003724394785847:
7th- epoch: 4, train_loss = 41.96814885735512, train_acc = 0.9108057755006986
test Acc 0.909217877094972:
7th- epoch: 5, train_loss = 39.38542552292347, train_acc = 0.9151141127154169
test 

7th- epoch: 147, train_loss = 16.977304125204682, train_acc = 0.9620400558919422
test Acc 0.9464618249534451:
7th- epoch: 148, train_loss = 16.954186329618096, train_acc = 0.9620400558919422
test Acc 0.9459962756052142:
7th- epoch: 149, train_loss = 16.946069149300456, train_acc = 0.962156497438286
test Acc 0.9464618249534451:
7th- epoch: 150, train_loss = 16.9093430172652, train_acc = 0.9625058220773172
test Acc 0.9464618249534451:
7th- epoch: 151, train_loss = 16.89572488889098, train_acc = 0.9625058220773172
test Acc 0.946927374301676:
7th- epoch: 152, train_loss = 16.86653565056622, train_acc = 0.9623893805309734
test Acc 0.946927374301676:
7th- epoch: 153, train_loss = 16.84625561349094, train_acc = 0.9626222636236609
test Acc 0.946927374301676:
7th- epoch: 154, train_loss = 16.821884498000145, train_acc = 0.9627387051700047
test Acc 0.946927374301676:
7th- epoch: 155, train_loss = 16.80133350007236, train_acc = 0.9625058220773172
test Acc 0.946927374301676:
7th- epoch: 156, train

7th- epoch: 296, train_loss = 14.962637127377093, train_acc = 0.966115510013973
test Acc 0.9501862197392924:
7th- epoch: 297, train_loss = 14.95742618944496, train_acc = 0.9664648346530041
test Acc 0.9506517690875232:
7th- epoch: 298, train_loss = 14.938251125626266, train_acc = 0.9666977177456917
test Acc 0.9506517690875232:
7th- epoch: 299, train_loss = 14.946868129074574, train_acc = 0.9662319515603167
test Acc 0.9506517690875232:
7th- epoch: 300, train_loss = 14.924102692864835, train_acc = 0.9664648346530041
test Acc 0.9506517690875232:
7th- epoch: 301, train_loss = 14.914614199660718, train_acc = 0.966581276199348
test Acc 0.9506517690875232:
7th- epoch: 302, train_loss = 14.916640476323664, train_acc = 0.9662319515603167
test Acc 0.9506517690875232:
7th- epoch: 303, train_loss = 14.909124174155295, train_acc = 0.9666977177456917
test Acc 0.9506517690875232:
7th- epoch: 304, train_loss = 14.895127188414335, train_acc = 0.966581276199348
test Acc 0.9506517690875232:
7th- epoch: 30

7th- epoch: 444, train_loss = 14.047163107432425, train_acc = 0.9698416394969726
test Acc 0.9501862197392924:
7th- epoch: 445, train_loss = 14.04675793275237, train_acc = 0.9699580810433163
test Acc 0.9501862197392924:
7th- epoch: 446, train_loss = 14.039849866181612, train_acc = 0.9698416394969726
test Acc 0.9501862197392924:
7th- epoch: 447, train_loss = 14.030056610703468, train_acc = 0.9698416394969726
test Acc 0.9501862197392924:
7th- epoch: 448, train_loss = 14.033127567730844, train_acc = 0.9703074056823474
test Acc 0.9501862197392924:
7th- epoch: 449, train_loss = 14.022106226533651, train_acc = 0.9699580810433163
test Acc 0.9501862197392924:
7th- epoch: 450, train_loss = 14.023976225405931, train_acc = 0.9698416394969726
test Acc 0.9501862197392924:
7th- epoch: 451, train_loss = 14.01887692231685, train_acc = 0.97007452258966
test Acc 0.9501862197392924:
7th- epoch: 452, train_loss = 14.005274173803627, train_acc = 0.9699580810433163
test Acc 0.9501862197392924:
7th- epoch: 45

 23%|████████████████▌                                                      | 7/30 [1:03:24<3:28:34, 544.10s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
8th- epoch: 0, train_loss = 129.7454314827919, train_acc = 0.7437121564974383
test Acc 0.8654562383612663:
8th- epoch: 1, train_loss = 61.05909751355648, train_acc = 0.8727293898462971
test Acc 0.8961824953445066:
8th- epoch: 2, train_loss = 50.69575181603432, train_acc = 0.8948532836516069
test Acc 0.9078212290502793:
8th- epoch: 3, train_loss = 45.432965695858, train_acc = 0.9044014904517932
test Acc 0.9129422718808193:
8th- epoch: 4, train_loss = 41.936932146549225, train_acc = 0.9109222170470423
test Acc 0.9157355679702048:
8th- epoch: 5, train_loss = 39.3415162563324, train_acc = 0.9149976711690732
test Ac

8th- epoch: 147, train_loss = 17.108743665739894, train_acc = 0.9625058220773172
test Acc 0.9459962756052142:
8th- epoch: 148, train_loss = 17.07840894162655, train_acc = 0.9625058220773172
test Acc 0.9459962756052142:
8th- epoch: 149, train_loss = 17.062770884484053, train_acc = 0.9625058220773172
test Acc 0.9455307262569832:
8th- epoch: 150, train_loss = 17.04253764823079, train_acc = 0.9626222636236609
test Acc 0.9459962756052142:
8th- epoch: 151, train_loss = 17.014757746830583, train_acc = 0.9625058220773172
test Acc 0.9455307262569832:
8th- epoch: 152, train_loss = 17.00496249087155, train_acc = 0.9625058220773172
test Acc 0.9464618249534451:
8th- epoch: 153, train_loss = 16.972746713086963, train_acc = 0.9626222636236609
test Acc 0.9459962756052142:
8th- epoch: 154, train_loss = 16.953646548092365, train_acc = 0.9626222636236609
test Acc 0.946927374301676:
8th- epoch: 155, train_loss = 16.945859730243683, train_acc = 0.9626222636236609
test Acc 0.9464618249534451:
8th- epoch: 15

8th- epoch: 296, train_loss = 15.10597616713494, train_acc = 0.966115510013973
test Acc 0.9478584729981379:
8th- epoch: 297, train_loss = 15.09981144964695, train_acc = 0.966115510013973
test Acc 0.9478584729981379:
8th- epoch: 298, train_loss = 15.095208407379687, train_acc = 0.966115510013973
test Acc 0.9478584729981379:
8th- epoch: 299, train_loss = 15.086981347762048, train_acc = 0.9662319515603167
test Acc 0.9478584729981379:
8th- epoch: 300, train_loss = 15.079387459903955, train_acc = 0.966115510013973
test Acc 0.9478584729981379:
8th- epoch: 301, train_loss = 15.069807427935302, train_acc = 0.966115510013973
test Acc 0.9483240223463687:
8th- epoch: 302, train_loss = 15.05872220825404, train_acc = 0.9663483931066604
test Acc 0.9478584729981379:
8th- epoch: 303, train_loss = 15.051551279611886, train_acc = 0.9662319515603167
test Acc 0.9483240223463687:
8th- epoch: 304, train_loss = 15.039174241013825, train_acc = 0.9663483931066604
test Acc 0.9483240223463687:
8th- epoch: 305, t

8th- epoch: 445, train_loss = 14.187785630114377, train_acc = 0.9694923148579413
test Acc 0.9487895716945997:
8th- epoch: 446, train_loss = 14.180721056647599, train_acc = 0.9694923148579413
test Acc 0.9487895716945997:
8th- epoch: 447, train_loss = 14.176138932816684, train_acc = 0.9694923148579413
test Acc 0.9487895716945997:
8th- epoch: 448, train_loss = 14.173438449390233, train_acc = 0.9694923148579413
test Acc 0.9487895716945997:
8th- epoch: 449, train_loss = 14.164945280645043, train_acc = 0.969608756404285
test Acc 0.9487895716945997:
8th- epoch: 450, train_loss = 14.16275917366147, train_acc = 0.969608756404285
test Acc 0.9487895716945997:
8th- epoch: 451, train_loss = 14.158391274511814, train_acc = 0.969608756404285
test Acc 0.9487895716945997:
8th- epoch: 452, train_loss = 14.15331554505974, train_acc = 0.9693758733115976
test Acc 0.9487895716945997:
8th- epoch: 453, train_loss = 14.148718459997326, train_acc = 0.969608756404285
test Acc 0.9487895716945997:
8th- epoch: 454,

 27%|██████████████████▉                                                    | 8/30 [1:12:30<3:19:45, 544.81s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
9th- epoch: 0, train_loss = 121.51958999037743, train_acc = 0.7550069864927806
test Acc 0.8533519553072626:
9th- epoch: 1, train_loss = 59.24321077764034, train_acc = 0.8773870517000466
test Acc 0.8929236499068901:
9th- epoch: 2, train_loss = 49.301661409437656, train_acc = 0.8996273870517001
test Acc 0.9054934823091247:
9th- epoch: 3, train_loss = 44.248012624680996, train_acc = 0.91022356776898
test Acc 0.9138733705772812:
9th- epoch: 4, train_loss = 40.889715261757374, train_acc = 0.9137168141592921
test Acc 0.9171322160148976:
9th- epoch: 5, train_loss = 38.38197169452906, train_acc = 0.9190731252911039
tes

9th- epoch: 147, train_loss = 16.779008416458964, train_acc = 0.9633209129017233
test Acc 0.9455307262569832:
9th- epoch: 148, train_loss = 16.757209548726678, train_acc = 0.9633209129017233
test Acc 0.9455307262569832:
9th- epoch: 149, train_loss = 16.73463685438037, train_acc = 0.9630880298090359
test Acc 0.9455307262569832:
9th- epoch: 150, train_loss = 16.716545658186078, train_acc = 0.9633209129017233
test Acc 0.9455307262569832:
9th- epoch: 151, train_loss = 16.692022928968072, train_acc = 0.9632044713553796
test Acc 0.9455307262569832:
9th- epoch: 152, train_loss = 16.672588234767318, train_acc = 0.9634373544480671
test Acc 0.9455307262569832:
9th- epoch: 153, train_loss = 16.650452725589275, train_acc = 0.9633209129017233
test Acc 0.9455307262569832:
9th- epoch: 154, train_loss = 16.626568725332618, train_acc = 0.9634373544480671
test Acc 0.9455307262569832:
9th- epoch: 155, train_loss = 16.60512788966298, train_acc = 0.9634373544480671
test Acc 0.9455307262569832:
9th- epoch: 

test Acc 0.9473929236499069:
9th- epoch: 222, train_loss = 15.55776690505445, train_acc = 0.9659990684676293
test Acc 0.9473929236499069:
9th- epoch: 223, train_loss = 15.542839469388127, train_acc = 0.9659990684676293
test Acc 0.9473929236499069:
9th- epoch: 224, train_loss = 15.53874565474689, train_acc = 0.9657661853749417
test Acc 0.9473929236499069:
9th- epoch: 225, train_loss = 15.519497774541378, train_acc = 0.9659990684676293
test Acc 0.9473929236499069:
9th- epoch: 226, train_loss = 15.512384420260787, train_acc = 0.9659990684676293
test Acc 0.9478584729981379:
9th- epoch: 227, train_loss = 15.494974618777633, train_acc = 0.9659990684676293
test Acc 0.9473929236499069:
9th- epoch: 228, train_loss = 15.489962752908468, train_acc = 0.9659990684676293
test Acc 0.9478584729981379:
9th- epoch: 229, train_loss = 15.47536158747971, train_acc = 0.9659990684676293
test Acc 0.9478584729981379:
9th- epoch: 230, train_loss = 15.457307187840343, train_acc = 0.9659990684676293
test Acc 0.94

9th- epoch: 370, train_loss = 14.288607989437878, train_acc = 0.9687936655798789
test Acc 0.9497206703910615:
9th- epoch: 371, train_loss = 14.279566586948931, train_acc = 0.9687936655798789
test Acc 0.9497206703910615:
9th- epoch: 372, train_loss = 14.275353639386594, train_acc = 0.9686772240335352
test Acc 0.9497206703910615:
9th- epoch: 373, train_loss = 14.267533439211547, train_acc = 0.9686772240335352
test Acc 0.9497206703910615:
9th- epoch: 374, train_loss = 14.26465363893658, train_acc = 0.9689101071262226
test Acc 0.9497206703910615:
9th- epoch: 375, train_loss = 14.260802686214447, train_acc = 0.9687936655798789
test Acc 0.9497206703910615:
9th- epoch: 376, train_loss = 14.250892505981028, train_acc = 0.9687936655798789
test Acc 0.9497206703910615:
9th- epoch: 377, train_loss = 14.24510280508548, train_acc = 0.9687936655798789
test Acc 0.9497206703910615:
9th- epoch: 378, train_loss = 14.239412783645093, train_acc = 0.9686772240335352
test Acc 0.9497206703910615:
9th- epoch: 

 30%|█████████████████████▎                                                 | 9/30 [1:21:36<3:10:44, 544.97s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
10th- epoch: 0, train_loss = 128.92108803987503, train_acc = 0.746506753609688
test Acc 0.8631284916201117:
10th- epoch: 1, train_loss = 57.772426307201385, train_acc = 0.8762226362366092
test Acc 0.8947858472998138:
10th- epoch: 2, train_loss = 47.93527953326702, train_acc = 0.8992780624126688
test Acc 0.9031657355679702:
10th- epoch: 3, train_loss = 43.049539029598236, train_acc = 0.9096413600372613
test Acc 0.9078212290502793:
10th- epoch: 4, train_loss = 39.96564503014088, train_acc = 0.9149976711690732
test Acc 0.9110800744878957:
10th- epoch: 5, train_loss = 37.7461698576808, train_acc = 0.919073125291103

10th- epoch: 145, train_loss = 17.06492362357676, train_acc = 0.9630880298090359
test Acc 0.9436685288640596:
10th- epoch: 146, train_loss = 17.052377127110958, train_acc = 0.9632044713553796
test Acc 0.9432029795158287:
10th- epoch: 147, train_loss = 17.04756487905979, train_acc = 0.9633209129017233
test Acc 0.9436685288640596:
10th- epoch: 148, train_loss = 17.00769300200045, train_acc = 0.9633209129017233
test Acc 0.9432029795158287:
10th- epoch: 149, train_loss = 16.999882148578763, train_acc = 0.9633209129017233
test Acc 0.9432029795158287:
10th- epoch: 150, train_loss = 16.998640425503254, train_acc = 0.9632044713553796
test Acc 0.9436685288640596:
10th- epoch: 151, train_loss = 16.941845044493675, train_acc = 0.9634373544480671
test Acc 0.9436685288640596:
10th- epoch: 152, train_loss = 16.945328811183572, train_acc = 0.9632044713553796
test Acc 0.9441340782122905:
10th- epoch: 153, train_loss = 16.917053900659084, train_acc = 0.9636702375407545
test Acc 0.9436685288640596:
10th

10th- epoch: 293, train_loss = 15.06946720648557, train_acc = 0.966581276199348
test Acc 0.9473929236499069:
10th- epoch: 294, train_loss = 15.075576434843242, train_acc = 0.966581276199348
test Acc 0.9473929236499069:
10th- epoch: 295, train_loss = 15.063597400672734, train_acc = 0.9666977177456917
test Acc 0.9473929236499069:
10th- epoch: 296, train_loss = 15.04783172160387, train_acc = 0.966581276199348
test Acc 0.9473929236499069:
10th- epoch: 297, train_loss = 15.049453966319561, train_acc = 0.9666977177456917
test Acc 0.9473929236499069:
10th- epoch: 298, train_loss = 15.028761136345565, train_acc = 0.9666977177456917
test Acc 0.9473929236499069:
10th- epoch: 299, train_loss = 15.038362371735275, train_acc = 0.9668141592920354
test Acc 0.9473929236499069:
10th- epoch: 300, train_loss = 15.019077439792454, train_acc = 0.9666977177456917
test Acc 0.9473929236499069:
10th- epoch: 301, train_loss = 15.00457404088229, train_acc = 0.9666977177456917
test Acc 0.9473929236499069:
10th- e

test Acc 0.9473929236499069:
10th- epoch: 441, train_loss = 14.169858418405056, train_acc = 0.9690265486725663
test Acc 0.9473929236499069:
10th- epoch: 442, train_loss = 14.149388253688812, train_acc = 0.9690265486725663
test Acc 0.9473929236499069:
10th- epoch: 443, train_loss = 14.158207724802196, train_acc = 0.9690265486725663
test Acc 0.9473929236499069:
10th- epoch: 444, train_loss = 14.157701942138374, train_acc = 0.9689101071262226
test Acc 0.9473929236499069:
10th- epoch: 445, train_loss = 14.153141558170319, train_acc = 0.9689101071262226
test Acc 0.9473929236499069:
10th- epoch: 446, train_loss = 14.14605101197958, train_acc = 0.9691429902189101
test Acc 0.9473929236499069:
10th- epoch: 447, train_loss = 14.131854007951915, train_acc = 0.9691429902189101
test Acc 0.9473929236499069:
10th- epoch: 448, train_loss = 14.136824865825474, train_acc = 0.9690265486725663
test Acc 0.9473929236499069:
10th- epoch: 449, train_loss = 14.13415156584233, train_acc = 0.9691429902189101
tes

 33%|███████████████████████▎                                              | 10/30 [1:30:40<3:01:36, 544.84s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
11th- epoch: 0, train_loss = 115.28072586655617, train_acc = 0.7488355845365626
test Acc 0.8375232774674115:
11th- epoch: 1, train_loss = 61.595390886068344, train_acc = 0.8653935724266418
test Acc 0.8803538175046555:
11th- epoch: 2, train_loss = 51.308166459202766, train_acc = 0.8885654401490451
test Acc 0.8961824953445066:
11th- epoch: 3, train_loss = 45.96796381473541, train_acc = 0.900093153237075
test Acc 0.9082867783985102:
11th- epoch: 4, train_loss = 42.421362459659576, train_acc = 0.908011178388449
test Acc 0.9106145251396648:
11th- epoch: 5, train_loss = 39.89963909238577, train_acc = 0.91429902189101

11th- epoch: 145, train_loss = 17.14594973810017, train_acc = 0.9619236143455985
test Acc 0.9459962756052142:
11th- epoch: 146, train_loss = 17.125558553263545, train_acc = 0.9620400558919422
test Acc 0.9459962756052142:
11th- epoch: 147, train_loss = 17.10388650931418, train_acc = 0.962156497438286
test Acc 0.9459962756052142:
11th- epoch: 148, train_loss = 17.08491138368845, train_acc = 0.9620400558919422
test Acc 0.9459962756052142:
11th- epoch: 149, train_loss = 17.04940682835877, train_acc = 0.962156497438286
test Acc 0.9455307262569832:
11th- epoch: 150, train_loss = 17.024634942412376, train_acc = 0.9622729389846297
test Acc 0.9455307262569832:
11th- epoch: 151, train_loss = 17.00360683351755, train_acc = 0.9622729389846297
test Acc 0.9455307262569832:
11th- epoch: 152, train_loss = 16.988729417324066, train_acc = 0.9625058220773172
test Acc 0.9455307262569832:
11th- epoch: 153, train_loss = 16.970137821510434, train_acc = 0.9626222636236609
test Acc 0.9455307262569832:
11th- ep

11th- epoch: 293, train_loss = 15.090650756843388, train_acc = 0.9664648346530041
test Acc 0.9464618249534451:
11th- epoch: 294, train_loss = 15.08202548790723, train_acc = 0.9664648346530041
test Acc 0.9464618249534451:
11th- epoch: 295, train_loss = 15.06872583180666, train_acc = 0.9666977177456917
test Acc 0.9464618249534451:
11th- epoch: 296, train_loss = 15.058213852345943, train_acc = 0.966581276199348
test Acc 0.9464618249534451:
11th- epoch: 297, train_loss = 15.051987846381962, train_acc = 0.966581276199348
test Acc 0.946927374301676:
11th- epoch: 298, train_loss = 15.05711746495217, train_acc = 0.9666977177456917
test Acc 0.946927374301676:
11th- epoch: 299, train_loss = 15.042523130774498, train_acc = 0.9668141592920354
test Acc 0.9464618249534451:
11th- epoch: 300, train_loss = 15.03767551947385, train_acc = 0.966581276199348
test Acc 0.946927374301676:
11th- epoch: 301, train_loss = 15.01834350079298, train_acc = 0.9668141592920354
test Acc 0.946927374301676:
11th- epoch: 

test Acc 0.9483240223463687:
11th- epoch: 441, train_loss = 14.137011255137622, train_acc = 0.9690265486725663
test Acc 0.9483240223463687:
11th- epoch: 442, train_loss = 14.130592110566795, train_acc = 0.9691429902189101
test Acc 0.9483240223463687:
11th- epoch: 443, train_loss = 14.132968145422637, train_acc = 0.9690265486725663
test Acc 0.9483240223463687:
11th- epoch: 444, train_loss = 14.133935186080635, train_acc = 0.9690265486725663
test Acc 0.9483240223463687:
11th- epoch: 445, train_loss = 14.130808453075588, train_acc = 0.9690265486725663
test Acc 0.9483240223463687:
11th- epoch: 446, train_loss = 14.127703885547817, train_acc = 0.9691429902189101
test Acc 0.9483240223463687:
11th- epoch: 447, train_loss = 14.113116391003132, train_acc = 0.9692594317652539
test Acc 0.9483240223463687:
11th- epoch: 448, train_loss = 14.10908321570605, train_acc = 0.9690265486725663
test Acc 0.9483240223463687:
11th- epoch: 449, train_loss = 14.10837783664465, train_acc = 0.9691429902189101
tes

 37%|█████████████████████████▋                                            | 11/30 [1:39:42<2:52:16, 544.01s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
12th- epoch: 0, train_loss = 135.24134570360184, train_acc = 0.720540288775035
test Acc 0.8272811918063314:
12th- epoch: 1, train_loss = 62.9997153878212, train_acc = 0.8663251047973917
test Acc 0.8770949720670391:
12th- epoch: 2, train_loss = 51.31371168792248, train_acc = 0.8913600372612949
test Acc 0.9003724394785847:
12th- epoch: 3, train_loss = 45.642023265361786, train_acc = 0.9034699580810434
test Acc 0.9078212290502793:
12th- epoch: 4, train_loss = 42.066577434539795, train_acc = 0.9106893339543549
test Acc 0.9180633147113594:
12th- epoch: 5, train_loss = 39.395015604794025, train_acc = 0.91511411271541

12th- epoch: 145, train_loss = 17.229709416627884, train_acc = 0.9628551467163484
test Acc 0.9464618249534451:
12th- epoch: 146, train_loss = 17.217738704755902, train_acc = 0.9628551467163484
test Acc 0.9459962756052142:
12th- epoch: 147, train_loss = 17.202303010970354, train_acc = 0.9627387051700047
test Acc 0.9464618249534451:
12th- epoch: 148, train_loss = 17.169874308630824, train_acc = 0.9629715882626921
test Acc 0.9464618249534451:
12th- epoch: 149, train_loss = 17.146025344729424, train_acc = 0.9628551467163484
test Acc 0.9459962756052142:
12th- epoch: 150, train_loss = 17.120003938674927, train_acc = 0.9628551467163484
test Acc 0.9464618249534451:
12th- epoch: 151, train_loss = 17.103226287290454, train_acc = 0.9630880298090359
test Acc 0.9464618249534451:
12th- epoch: 152, train_loss = 17.08506701886654, train_acc = 0.9628551467163484
test Acc 0.9459962756052142:
12th- epoch: 153, train_loss = 17.050918390974402, train_acc = 0.9628551467163484
test Acc 0.9459962756052142:
12

12th- epoch: 293, train_loss = 15.175265991128981, train_acc = 0.9663483931066604
test Acc 0.9478584729981379:
12th- epoch: 294, train_loss = 15.179737276397645, train_acc = 0.9663483931066604
test Acc 0.9478584729981379:
12th- epoch: 295, train_loss = 15.159586392343044, train_acc = 0.9663483931066604
test Acc 0.9478584729981379:
12th- epoch: 296, train_loss = 15.158377938903868, train_acc = 0.9663483931066604
test Acc 0.9478584729981379:
12th- epoch: 297, train_loss = 15.143397034145892, train_acc = 0.9664648346530041
test Acc 0.9478584729981379:
12th- epoch: 298, train_loss = 15.141530535183847, train_acc = 0.9663483931066604
test Acc 0.9478584729981379:
12th- epoch: 299, train_loss = 15.12413448188454, train_acc = 0.9663483931066604
test Acc 0.9478584729981379:
12th- epoch: 300, train_loss = 15.131431422196329, train_acc = 0.9664648346530041
test Acc 0.9478584729981379:
12th- epoch: 301, train_loss = 15.102364521473646, train_acc = 0.9663483931066604
test Acc 0.9478584729981379:
12

12th- epoch: 440, train_loss = 14.198719386011362, train_acc = 0.9687936655798789
test Acc 0.9497206703910615:
12th- epoch: 441, train_loss = 14.196031064726412, train_acc = 0.9686772240335352
test Acc 0.9497206703910615:
12th- epoch: 442, train_loss = 14.192805618979037, train_acc = 0.9686772240335352
test Acc 0.9497206703910615:
12th- epoch: 443, train_loss = 14.185138790868223, train_acc = 0.9686772240335352
test Acc 0.9497206703910615:
12th- epoch: 444, train_loss = 14.181323205120862, train_acc = 0.9686772240335352
test Acc 0.9497206703910615:
12th- epoch: 445, train_loss = 14.178882011212409, train_acc = 0.9687936655798789
test Acc 0.9497206703910615:
12th- epoch: 446, train_loss = 14.183547589927912, train_acc = 0.9687936655798789
test Acc 0.9497206703910615:
12th- epoch: 447, train_loss = 14.178386949002743, train_acc = 0.9689101071262226
test Acc 0.9497206703910615:
12th- epoch: 448, train_loss = 14.17171041527763, train_acc = 0.9690265486725663
test Acc 0.9497206703910615:
12

 40%|████████████████████████████                                          | 12/30 [1:48:46<2:43:08, 543.83s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
13th- epoch: 0, train_loss = 117.53854861855507, train_acc = 0.7552398695854681
test Acc 0.851024208566108:
13th- epoch: 1, train_loss = 59.90960466861725, train_acc = 0.8754075454122031
test Acc 0.8687150837988827:
13th- epoch: 2, train_loss = 50.66846892237663, train_acc = 0.8952026082906381
test Acc 0.8761638733705773:
13th- epoch: 3, train_loss = 45.750662475824356, train_acc = 0.904052165812762
test Acc 0.8854748603351955:
13th- epoch: 4, train_loss = 42.34278203547001, train_acc = 0.9096413600372613
test Acc 0.8980446927374302:
13th- epoch: 5, train_loss = 39.739959962666035, train_acc = 0.914066138798323

13th- epoch: 145, train_loss = 17.176623629406095, train_acc = 0.9627387051700047
test Acc 0.9427374301675978:
13th- epoch: 146, train_loss = 17.16008897870779, train_acc = 0.9627387051700047
test Acc 0.9427374301675978:
13th- epoch: 147, train_loss = 17.134454296901822, train_acc = 0.9627387051700047
test Acc 0.9432029795158287:
13th- epoch: 148, train_loss = 17.10775432176888, train_acc = 0.9627387051700047
test Acc 0.9427374301675978:
13th- epoch: 149, train_loss = 17.088879680261016, train_acc = 0.9627387051700047
test Acc 0.9432029795158287:
13th- epoch: 150, train_loss = 17.072477035224438, train_acc = 0.9628551467163484
test Acc 0.9432029795158287:
13th- epoch: 151, train_loss = 17.038788491860032, train_acc = 0.9627387051700047
test Acc 0.9432029795158287:
13th- epoch: 152, train_loss = 17.02271924726665, train_acc = 0.9629715882626921
test Acc 0.9436685288640596:
13th- epoch: 153, train_loss = 17.008288526907563, train_acc = 0.9632044713553796
test Acc 0.9436685288640596:
13th

13th- epoch: 293, train_loss = 15.167005479335785, train_acc = 0.9663483931066604
test Acc 0.9464618249534451:
13th- epoch: 294, train_loss = 15.163597330451012, train_acc = 0.9663483931066604
test Acc 0.9464618249534451:
13th- epoch: 295, train_loss = 15.150734876282513, train_acc = 0.9664648346530041
test Acc 0.9464618249534451:
13th- epoch: 296, train_loss = 15.141268935985863, train_acc = 0.966581276199348
test Acc 0.9464618249534451:
13th- epoch: 297, train_loss = 15.131502960808575, train_acc = 0.9664648346530041
test Acc 0.9464618249534451:
13th- epoch: 298, train_loss = 15.122319434769452, train_acc = 0.9664648346530041
test Acc 0.9464618249534451:
13th- epoch: 299, train_loss = 15.115279726684093, train_acc = 0.9666977177456917
test Acc 0.9464618249534451:
13th- epoch: 300, train_loss = 15.100906322710216, train_acc = 0.9666977177456917
test Acc 0.9464618249534451:
13th- epoch: 301, train_loss = 15.097637005150318, train_acc = 0.9666977177456917
test Acc 0.9464618249534451:
13

13th- epoch: 441, train_loss = 14.211578843649477, train_acc = 0.9686772240335352
test Acc 0.9478584729981379:
13th- epoch: 442, train_loss = 14.19936173921451, train_acc = 0.9685607824871915
test Acc 0.9473929236499069:
13th- epoch: 443, train_loss = 14.200440478976816, train_acc = 0.9686772240335352
test Acc 0.9473929236499069:
13th- epoch: 444, train_loss = 14.197762513998896, train_acc = 0.9685607824871915
test Acc 0.9464618249534451:
13th- epoch: 445, train_loss = 14.19097383087501, train_acc = 0.9686772240335352
test Acc 0.9478584729981379:
13th- epoch: 446, train_loss = 14.187913993839175, train_acc = 0.9687936655798789
test Acc 0.9478584729981379:
13th- epoch: 447, train_loss = 14.182847355958074, train_acc = 0.9685607824871915
test Acc 0.9478584729981379:
13th- epoch: 448, train_loss = 14.175051229540259, train_acc = 0.9686772240335352
test Acc 0.946927374301676:
13th- epoch: 449, train_loss = 14.171367754694074, train_acc = 0.9685607824871915
test Acc 0.9473929236499069:
13th

 43%|██████████████████████████████▎                                       | 13/30 [1:57:48<2:33:58, 543.42s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
14th- epoch: 0, train_loss = 122.24854975938797, train_acc = 0.7432463903120633
test Acc 0.8258845437616388:
14th- epoch: 1, train_loss = 58.653245240449905, train_acc = 0.8752911038658593
test Acc 0.8687150837988827:
14th- epoch: 2, train_loss = 49.66527110338211, train_acc = 0.895668374476013
test Acc 0.8915270018621974:
14th- epoch: 3, train_loss = 44.666166961193085, train_acc = 0.9055659059152306
test Acc 0.8994413407821229:
14th- epoch: 4, train_loss = 41.3081961274147, train_acc = 0.911970190964136
test Acc 0.9087523277467412:
14th- epoch: 5, train_loss = 38.89223250746727, train_acc = 0.9156963204471356

14th- epoch: 145, train_loss = 17.026321286335588, train_acc = 0.9615742897065673
test Acc 0.9450651769087524:
14th- epoch: 146, train_loss = 17.007378231734037, train_acc = 0.9618071727992548
test Acc 0.9450651769087524:
14th- epoch: 147, train_loss = 16.9813129324466, train_acc = 0.961690731252911
test Acc 0.9450651769087524:
14th- epoch: 148, train_loss = 16.96913835592568, train_acc = 0.9619236143455985
test Acc 0.9450651769087524:
14th- epoch: 149, train_loss = 16.942189510911703, train_acc = 0.9619236143455985
test Acc 0.9450651769087524:
14th- epoch: 150, train_loss = 16.926392150111496, train_acc = 0.9620400558919422
test Acc 0.9450651769087524:
14th- epoch: 151, train_loss = 16.91119034588337, train_acc = 0.9619236143455985
test Acc 0.9450651769087524:
14th- epoch: 152, train_loss = 16.884683216921985, train_acc = 0.9620400558919422
test Acc 0.9450651769087524:
14th- epoch: 153, train_loss = 16.874256224371493, train_acc = 0.9620400558919422
test Acc 0.9450651769087524:
14th- 

14th- epoch: 293, train_loss = 15.143184803426266, train_acc = 0.966115510013973
test Acc 0.9478584729981379:
14th- epoch: 294, train_loss = 15.131994985044003, train_acc = 0.966581276199348
test Acc 0.9478584729981379:
14th- epoch: 295, train_loss = 15.126794303767383, train_acc = 0.966115510013973
test Acc 0.9478584729981379:
14th- epoch: 296, train_loss = 15.116991381160915, train_acc = 0.9664648346530041
test Acc 0.9478584729981379:
14th- epoch: 297, train_loss = 15.112143454141915, train_acc = 0.966115510013973
test Acc 0.9478584729981379:
14th- epoch: 298, train_loss = 15.098033818416297, train_acc = 0.966581276199348
test Acc 0.9478584729981379:
14th- epoch: 299, train_loss = 15.087751577608287, train_acc = 0.9664648346530041
test Acc 0.9478584729981379:
14th- epoch: 300, train_loss = 15.085744678974152, train_acc = 0.9666977177456917
test Acc 0.9478584729981379:
14th- epoch: 301, train_loss = 15.078492730855942, train_acc = 0.9666977177456917
test Acc 0.9478584729981379:
14th- 

14th- epoch: 441, train_loss = 14.22471001977101, train_acc = 0.9697251979506288
test Acc 0.9478584729981379:
14th- epoch: 442, train_loss = 14.218261793255806, train_acc = 0.9697251979506288
test Acc 0.9478584729981379:
14th- epoch: 443, train_loss = 14.212029899004847, train_acc = 0.9697251979506288
test Acc 0.9478584729981379:
14th- epoch: 444, train_loss = 14.208678901195526, train_acc = 0.9697251979506288
test Acc 0.9478584729981379:
14th- epoch: 445, train_loss = 14.200793117284775, train_acc = 0.9697251979506288
test Acc 0.9478584729981379:
14th- epoch: 446, train_loss = 14.200006254017353, train_acc = 0.9697251979506288
test Acc 0.9478584729981379:
14th- epoch: 447, train_loss = 14.194653084035963, train_acc = 0.9697251979506288
test Acc 0.9478584729981379:
14th- epoch: 448, train_loss = 14.19086846197024, train_acc = 0.9697251979506288
test Acc 0.9478584729981379:
14th- epoch: 449, train_loss = 14.189475653227419, train_acc = 0.9697251979506288
test Acc 0.9478584729981379:
14t

 47%|████████████████████████████████▋                                     | 14/30 [2:06:50<2:24:45, 542.87s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
15th- epoch: 0, train_loss = 117.56422618031502, train_acc = 0.7738705170004657
test Acc 0.8165735567970205:
15th- epoch: 1, train_loss = 53.4420832246542, train_acc = 0.8851886353050769
test Acc 0.8766294227188082:
15th- epoch: 2, train_loss = 44.753689125180244, train_acc = 0.904052165812762
test Acc 0.9022346368715084:
15th- epoch: 3, train_loss = 40.27193704992533, train_acc = 0.9138332557056358
test Acc 0.9138733705772812:
15th- epoch: 4, train_loss = 37.34017127752304, train_acc = 0.9204704238472287
test Acc 0.9241154562383612:
15th- epoch: 5, train_loss = 35.20771073549986, train_acc = 0.925593851886353


15th- epoch: 145, train_loss = 16.480969278141856, train_acc = 0.9635537959944108
test Acc 0.9432029795158287:
15th- epoch: 146, train_loss = 16.461873142048717, train_acc = 0.9637866790870983
test Acc 0.9432029795158287:
15th- epoch: 147, train_loss = 16.43736564554274, train_acc = 0.963903120633442
test Acc 0.9432029795158287:
15th- epoch: 148, train_loss = 16.411487573757768, train_acc = 0.9640195621797858
test Acc 0.9432029795158287:
15th- epoch: 149, train_loss = 16.398932492360473, train_acc = 0.9642524452724732
test Acc 0.9432029795158287:
15th- epoch: 150, train_loss = 16.380388075485826, train_acc = 0.9641360037261295
test Acc 0.9432029795158287:
15th- epoch: 151, train_loss = 16.363679798319936, train_acc = 0.9641360037261295
test Acc 0.9432029795158287:
15th- epoch: 152, train_loss = 16.344989638775587, train_acc = 0.9641360037261295
test Acc 0.9436685288640596:
15th- epoch: 153, train_loss = 16.332819186151028, train_acc = 0.963903120633442
test Acc 0.9432029795158287:
15th

15th- epoch: 293, train_loss = 14.686766958795488, train_acc = 0.9677456916627852
test Acc 0.946927374301676:
15th- epoch: 294, train_loss = 14.683611743152142, train_acc = 0.9677456916627852
test Acc 0.946927374301676:
15th- epoch: 295, train_loss = 14.672070864588022, train_acc = 0.9677456916627852
test Acc 0.946927374301676:
15th- epoch: 296, train_loss = 14.664515551179647, train_acc = 0.9678621332091291
test Acc 0.946927374301676:
15th- epoch: 297, train_loss = 14.659246698953211, train_acc = 0.9678621332091291
test Acc 0.946927374301676:
15th- epoch: 298, train_loss = 14.65441772621125, train_acc = 0.9678621332091291
test Acc 0.946927374301676:
15th- epoch: 299, train_loss = 14.64360545296222, train_acc = 0.9678621332091291
test Acc 0.946927374301676:
15th- epoch: 300, train_loss = 14.63565902877599, train_acc = 0.9678621332091291
test Acc 0.946927374301676:
15th- epoch: 301, train_loss = 14.626225966960192, train_acc = 0.9679785747554728
test Acc 0.946927374301676:
15th- epoch: 

15th- epoch: 441, train_loss = 13.854382428340614, train_acc = 0.9699580810433163
test Acc 0.9473929236499069:
15th- epoch: 442, train_loss = 13.862274901010096, train_acc = 0.9699580810433163
test Acc 0.9473929236499069:
15th- epoch: 443, train_loss = 13.841005627065897, train_acc = 0.9699580810433163
test Acc 0.9473929236499069:
15th- epoch: 444, train_loss = 13.837905335240066, train_acc = 0.9698416394969726
test Acc 0.9473929236499069:
15th- epoch: 445, train_loss = 13.83099774364382, train_acc = 0.97007452258966
test Acc 0.9473929236499069:
15th- epoch: 446, train_loss = 13.829939741641283, train_acc = 0.97007452258966
test Acc 0.9473929236499069:
15th- epoch: 447, train_loss = 13.82444631960243, train_acc = 0.9698416394969726
test Acc 0.9473929236499069:
15th- epoch: 448, train_loss = 13.820664721541107, train_acc = 0.97007452258966
test Acc 0.9473929236499069:
15th- epoch: 449, train_loss = 13.813918924890459, train_acc = 0.97007452258966
test Acc 0.9473929236499069:
15th- epoch

 50%|███████████████████████████████████                                   | 15/30 [2:15:52<2:15:38, 542.59s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
16th- epoch: 0, train_loss = 119.80422616004944, train_acc = 0.757918025151374
test Acc 0.8594040968342644:
16th- epoch: 1, train_loss = 57.76751586794853, train_acc = 0.8813460642757336
test Acc 0.8845437616387337:
16th- epoch: 2, train_loss = 49.15712831914425, train_acc = 0.8960176991150443
test Acc 0.8999068901303539:
16th- epoch: 3, train_loss = 44.31117305904627, train_acc = 0.9055659059152306
test Acc 0.904562383612663:
16th- epoch: 4, train_loss = 41.03763162344694, train_acc = 0.9120866325104797
test Acc 0.9124767225325885:
16th- epoch: 5, train_loss = 38.5909256413579, train_acc = 0.915929203539823
te

16th- epoch: 145, train_loss = 16.885147040709853, train_acc = 0.9615742897065673
test Acc 0.9450651769087524:
16th- epoch: 146, train_loss = 16.86186933517456, train_acc = 0.961690731252911
test Acc 0.9450651769087524:
16th- epoch: 147, train_loss = 16.843024348840117, train_acc = 0.9614578481602236
test Acc 0.9455307262569832:
16th- epoch: 148, train_loss = 16.826095620170236, train_acc = 0.961690731252911
test Acc 0.9455307262569832:
16th- epoch: 149, train_loss = 16.794677570462227, train_acc = 0.961690731252911
test Acc 0.9455307262569832:
16th- epoch: 150, train_loss = 16.778973903506994, train_acc = 0.9614578481602236
test Acc 0.9455307262569832:
16th- epoch: 151, train_loss = 16.761325618252158, train_acc = 0.961690731252911
test Acc 0.9455307262569832:
16th- epoch: 152, train_loss = 16.750682352110744, train_acc = 0.9615742897065673
test Acc 0.9455307262569832:
16th- epoch: 153, train_loss = 16.723219415172935, train_acc = 0.9615742897065673
test Acc 0.9455307262569832:
16th- 

test Acc 0.9478584729981379:
16th- epoch: 293, train_loss = 14.97449332755059, train_acc = 0.9671634839310667
test Acc 0.9478584729981379:
16th- epoch: 294, train_loss = 14.970880164764822, train_acc = 0.9672799254774104
test Acc 0.9478584729981379:
16th- epoch: 295, train_loss = 14.960427685640752, train_acc = 0.9672799254774104
test Acc 0.9478584729981379:
16th- epoch: 296, train_loss = 14.959224049933255, train_acc = 0.9671634839310667
test Acc 0.9478584729981379:
16th- epoch: 297, train_loss = 14.948863244615495, train_acc = 0.9672799254774104
test Acc 0.9483240223463687:
16th- epoch: 298, train_loss = 14.932836689986289, train_acc = 0.9673963670237541
test Acc 0.9478584729981379:
16th- epoch: 299, train_loss = 14.92943203728646, train_acc = 0.9673963670237541
test Acc 0.9478584729981379:
16th- epoch: 300, train_loss = 14.929755259305239, train_acc = 0.9675128085700978
test Acc 0.9483240223463687:
16th- epoch: 301, train_loss = 14.913889371789992, train_acc = 0.9675128085700978
tes

test Acc 0.9497206703910615:
16th- epoch: 367, train_loss = 14.462470307946205, train_acc = 0.9683278993945039
test Acc 0.9492551210428305:
16th- epoch: 368, train_loss = 14.46241291705519, train_acc = 0.9683278993945039
test Acc 0.9497206703910615:
16th- epoch: 369, train_loss = 14.452631399035454, train_acc = 0.9682114578481602
test Acc 0.9501862197392924:
16th- epoch: 370, train_loss = 14.449682153761387, train_acc = 0.9684443409408477
test Acc 0.9497206703910615:
16th- epoch: 371, train_loss = 14.444843423552811, train_acc = 0.9684443409408477
test Acc 0.9492551210428305:
16th- epoch: 372, train_loss = 14.431025079451501, train_acc = 0.9685607824871915
test Acc 0.9497206703910615:
16th- epoch: 373, train_loss = 14.433106943033636, train_acc = 0.9684443409408477
test Acc 0.9497206703910615:
16th- epoch: 374, train_loss = 14.420217965729535, train_acc = 0.9684443409408477
test Acc 0.9497206703910615:
16th- epoch: 375, train_loss = 14.417228642851114, train_acc = 0.9684443409408477
te

 53%|█████████████████████████████████████▎                                | 16/30 [2:24:53<2:06:31, 542.26s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
17th- epoch: 0, train_loss = 123.35105806589127, train_acc = 0.7469725197950629
test Acc 0.8337988826815642:
17th- epoch: 1, train_loss = 59.712867587804794, train_acc = 0.8706334420121099
test Acc 0.8943202979515829:
17th- epoch: 2, train_loss = 49.4197196662426, train_acc = 0.8959012575687005
test Acc 0.9050279329608939:
17th- epoch: 3, train_loss = 44.33423639088869, train_acc = 0.9052165812761993
test Acc 0.9110800744878957:
17th- epoch: 4, train_loss = 40.93861739337444, train_acc = 0.9111551001397299
test Acc 0.9162011173184358:
17th- epoch: 5, train_loss = 38.529023826122284, train_acc = 0.91604564508616

17th- epoch: 145, train_loss = 17.222914503887296, train_acc = 0.9619236143455985
test Acc 0.9450651769087524:
17th- epoch: 146, train_loss = 17.197084380313754, train_acc = 0.9619236143455985
test Acc 0.9450651769087524:
17th- epoch: 147, train_loss = 17.181572748348117, train_acc = 0.9619236143455985
test Acc 0.9455307262569832:
17th- epoch: 148, train_loss = 17.15967532247305, train_acc = 0.962156497438286
test Acc 0.9455307262569832:
17th- epoch: 149, train_loss = 17.140128729864955, train_acc = 0.9622729389846297
test Acc 0.9455307262569832:
17th- epoch: 150, train_loss = 17.118523193523288, train_acc = 0.9622729389846297
test Acc 0.9455307262569832:
17th- epoch: 151, train_loss = 17.098150359466672, train_acc = 0.9622729389846297
test Acc 0.9455307262569832:
17th- epoch: 152, train_loss = 17.07721335068345, train_acc = 0.9622729389846297
test Acc 0.9455307262569832:
17th- epoch: 153, train_loss = 17.05819496884942, train_acc = 0.9623893805309734
test Acc 0.9455307262569832:
17th-

17th- epoch: 293, train_loss = 15.212992310523987, train_acc = 0.9664648346530041
test Acc 0.9487895716945997:
17th- epoch: 294, train_loss = 15.203111201524734, train_acc = 0.9664648346530041
test Acc 0.9487895716945997:
17th- epoch: 295, train_loss = 15.19955523032695, train_acc = 0.9663483931066604
test Acc 0.9487895716945997:
17th- epoch: 296, train_loss = 15.187715099193156, train_acc = 0.9664648346530041
test Acc 0.9487895716945997:
17th- epoch: 297, train_loss = 15.181237093172967, train_acc = 0.9664648346530041
test Acc 0.9487895716945997:
17th- epoch: 298, train_loss = 15.17287628352642, train_acc = 0.966581276199348
test Acc 0.9487895716945997:
17th- epoch: 299, train_loss = 15.169114299118519, train_acc = 0.9664648346530041
test Acc 0.9487895716945997:
17th- epoch: 300, train_loss = 15.161694183014333, train_acc = 0.966581276199348
test Acc 0.9487895716945997:
17th- epoch: 301, train_loss = 15.154742929153144, train_acc = 0.966581276199348
test Acc 0.9487895716945997:
17th- 

test Acc 0.9492551210428305:
17th- epoch: 441, train_loss = 14.29953183233738, train_acc = 0.9691429902189101
test Acc 0.9492551210428305:
17th- epoch: 442, train_loss = 14.300118598155677, train_acc = 0.9691429902189101
test Acc 0.9492551210428305:
17th- epoch: 443, train_loss = 14.29622308164835, train_acc = 0.9691429902189101
test Acc 0.9492551210428305:
17th- epoch: 444, train_loss = 14.291083787567914, train_acc = 0.9691429902189101
test Acc 0.9492551210428305:
17th- epoch: 445, train_loss = 14.285791437141597, train_acc = 0.9691429902189101
test Acc 0.9492551210428305:
17th- epoch: 446, train_loss = 14.282711084000766, train_acc = 0.9692594317652539
test Acc 0.9497206703910615:
17th- epoch: 447, train_loss = 14.272465710528195, train_acc = 0.9691429902189101
test Acc 0.9492551210428305:
17th- epoch: 448, train_loss = 14.273824592120945, train_acc = 0.9692594317652539
test Acc 0.9492551210428305:
17th- epoch: 449, train_loss = 14.2671126909554, train_acc = 0.9692594317652539
test 

 57%|███████████████████████████████████████▋                              | 17/30 [2:33:56<1:57:32, 542.50s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
18th- epoch: 0, train_loss = 126.22205558419228, train_acc = 0.746506753609688
test Acc 0.8580074487895717:
18th- epoch: 1, train_loss = 57.62270247936249, train_acc = 0.875873311597578
test Acc 0.8957169459962756:
18th- epoch: 2, train_loss = 48.54898066818714, train_acc = 0.8949697251979506
test Acc 0.9059590316573557:
18th- epoch: 3, train_loss = 43.68787541985512, train_acc = 0.9038192827200745
test Acc 0.9115456238361266:
18th- epoch: 4, train_loss = 40.45688892155886, train_acc = 0.9116208663251048
test Acc 0.914804469273743:
18th- epoch: 5, train_loss = 38.06871249526739, train_acc = 0.9174429436422916
t

18th- epoch: 145, train_loss = 17.015915313735604, train_acc = 0.9626222636236609
test Acc 0.946927374301676:
18th- epoch: 146, train_loss = 17.005121832713485, train_acc = 0.9626222636236609
test Acc 0.9464618249534451:
18th- epoch: 147, train_loss = 16.98474551178515, train_acc = 0.9628551467163484
test Acc 0.9464618249534451:
18th- epoch: 148, train_loss = 16.95886513032019, train_acc = 0.9628551467163484
test Acc 0.9464618249534451:
18th- epoch: 149, train_loss = 16.930529575794935, train_acc = 0.9628551467163484
test Acc 0.9464618249534451:
18th- epoch: 150, train_loss = 16.90895688906312, train_acc = 0.9629715882626921
test Acc 0.946927374301676:
18th- epoch: 151, train_loss = 16.88355179876089, train_acc = 0.9629715882626921
test Acc 0.9464618249534451:
18th- epoch: 152, train_loss = 16.859851328656077, train_acc = 0.9629715882626921
test Acc 0.9464618249534451:
18th- epoch: 153, train_loss = 16.84830735437572, train_acc = 0.9629715882626921
test Acc 0.946927374301676:
18th- epo

18th- epoch: 293, train_loss = 15.044670478440821, train_acc = 0.9668141592920354
test Acc 0.9473929236499069:
18th- epoch: 294, train_loss = 15.03825334366411, train_acc = 0.9659990684676293
test Acc 0.9478584729981379:
18th- epoch: 295, train_loss = 15.023275207728148, train_acc = 0.9668141592920354
test Acc 0.9478584729981379:
18th- epoch: 296, train_loss = 15.0091054700315, train_acc = 0.9668141592920354
test Acc 0.9478584729981379:
18th- epoch: 297, train_loss = 15.019738052040339, train_acc = 0.9662319515603167
test Acc 0.9478584729981379:
18th- epoch: 298, train_loss = 15.000595617108047, train_acc = 0.9668141592920354
test Acc 0.9483240223463687:
18th- epoch: 299, train_loss = 14.989837699569762, train_acc = 0.9668141592920354
test Acc 0.9478584729981379:
18th- epoch: 300, train_loss = 14.98551105428487, train_acc = 0.9668141592920354
test Acc 0.9478584729981379:
18th- epoch: 301, train_loss = 14.974606181494892, train_acc = 0.9669306008383791
test Acc 0.9483240223463687:
18th-

18th- epoch: 440, train_loss = 14.148127841763198, train_acc = 0.9690265486725663
test Acc 0.9487895716945997:
18th- epoch: 441, train_loss = 14.13454352831468, train_acc = 0.9690265486725663
test Acc 0.9487895716945997:
18th- epoch: 442, train_loss = 14.136705715209246, train_acc = 0.9691429902189101
test Acc 0.9487895716945997:
18th- epoch: 443, train_loss = 14.126457667443901, train_acc = 0.9691429902189101
test Acc 0.9487895716945997:
18th- epoch: 444, train_loss = 14.130977562163025, train_acc = 0.9692594317652539
test Acc 0.9487895716945997:
18th- epoch: 445, train_loss = 14.12238742550835, train_acc = 0.9691429902189101
test Acc 0.9487895716945997:
18th- epoch: 446, train_loss = 14.115852528717369, train_acc = 0.9691429902189101
test Acc 0.9487895716945997:
18th- epoch: 447, train_loss = 14.101799266878515, train_acc = 0.9692594317652539
test Acc 0.9487895716945997:
18th- epoch: 448, train_loss = 14.101594539824873, train_acc = 0.9693758733115976
test Acc 0.9487895716945997:
18t

 60%|██████████████████████████████████████████                            | 18/30 [2:43:00<1:48:33, 542.81s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
19th- epoch: 0, train_loss = 130.95724514126778, train_acc = 0.7654867256637168
test Acc 0.8417132216014898:
19th- epoch: 1, train_loss = 54.34340439736843, train_acc = 0.8870517000465766
test Acc 0.8929236499068901:
19th- epoch: 2, train_loss = 46.20507165789604, train_acc = 0.901839776432231
test Acc 0.904562383612663:
19th- epoch: 3, train_loss = 41.70541572570801, train_acc = 0.9090591523055426
test Acc 0.9124767225325885:
19th- epoch: 4, train_loss = 38.74282340705395, train_acc = 0.9131346064275734
test Acc 0.9175977653631285:
19th- epoch: 5, train_loss = 36.502392411231995, train_acc = 0.918141592920354


19th- epoch: 145, train_loss = 17.006689386442304, train_acc = 0.9629715882626921
test Acc 0.9455307262569832:
19th- epoch: 146, train_loss = 16.98910623975098, train_acc = 0.9630880298090359
test Acc 0.9455307262569832:
19th- epoch: 147, train_loss = 16.968417463824153, train_acc = 0.9632044713553796
test Acc 0.9455307262569832:
19th- epoch: 148, train_loss = 16.957724129781127, train_acc = 0.9629715882626921
test Acc 0.9455307262569832:
19th- epoch: 149, train_loss = 16.935577923431993, train_acc = 0.9630880298090359
test Acc 0.9455307262569832:
19th- epoch: 150, train_loss = 16.911019971594214, train_acc = 0.9630880298090359
test Acc 0.9459962756052142:
19th- epoch: 151, train_loss = 16.896105429157615, train_acc = 0.9632044713553796
test Acc 0.9459962756052142:
19th- epoch: 152, train_loss = 16.880163004621863, train_acc = 0.9630880298090359
test Acc 0.9459962756052142:
19th- epoch: 153, train_loss = 16.859674675390124, train_acc = 0.9630880298090359
test Acc 0.9459962756052142:
19

test Acc 0.9492551210428305:
19th- epoch: 293, train_loss = 15.191284307278693, train_acc = 0.966115510013973
test Acc 0.9492551210428305:
19th- epoch: 294, train_loss = 15.18153625819832, train_acc = 0.9662319515603167
test Acc 0.9492551210428305:
19th- epoch: 295, train_loss = 15.172568685375154, train_acc = 0.9662319515603167
test Acc 0.9492551210428305:
19th- epoch: 296, train_loss = 15.168129096738994, train_acc = 0.9662319515603167
test Acc 0.9492551210428305:
19th- epoch: 297, train_loss = 15.15981720853597, train_acc = 0.9663483931066604
test Acc 0.9492551210428305:
19th- epoch: 298, train_loss = 15.154210954904556, train_acc = 0.9663483931066604
test Acc 0.9492551210428305:
19th- epoch: 299, train_loss = 15.139248449355364, train_acc = 0.9662319515603167
test Acc 0.9492551210428305:
19th- epoch: 300, train_loss = 15.130185960792005, train_acc = 0.9663483931066604
test Acc 0.9492551210428305:
19th- epoch: 301, train_loss = 15.1230677543208, train_acc = 0.9663483931066604
test A

test Acc 0.9492551210428305:
19th- epoch: 367, train_loss = 14.667027451097965, train_acc = 0.9680950163018165
test Acc 0.9492551210428305:
19th- epoch: 368, train_loss = 14.656824707053602, train_acc = 0.9680950163018165
test Acc 0.9492551210428305:
19th- epoch: 369, train_loss = 14.650346866808832, train_acc = 0.9682114578481602
test Acc 0.9492551210428305:
19th- epoch: 370, train_loss = 14.645844105631113, train_acc = 0.9682114578481602
test Acc 0.9492551210428305:
19th- epoch: 371, train_loss = 14.643723651766777, train_acc = 0.9682114578481602
test Acc 0.9492551210428305:
19th- epoch: 372, train_loss = 14.634391237981617, train_acc = 0.9682114578481602
test Acc 0.9492551210428305:
19th- epoch: 373, train_loss = 14.627238523215055, train_acc = 0.9682114578481602
test Acc 0.9492551210428305:
19th- epoch: 374, train_loss = 14.61788350623101, train_acc = 0.9682114578481602
test Acc 0.9492551210428305:
19th- epoch: 375, train_loss = 14.614925571717322, train_acc = 0.9682114578481602
te

 63%|████████████████████████████████████████████▎                         | 19/30 [2:52:02<1:39:29, 542.71s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
20th- epoch: 0, train_loss = 132.30161106586456, train_acc = 0.7481369352585002
test Acc 0.8435754189944135:
20th- epoch: 1, train_loss = 64.00464470684528, train_acc = 0.8665579878900792
test Acc 0.8817504655493482:
20th- epoch: 2, train_loss = 53.64158695936203, train_acc = 0.8856544014904518
test Acc 0.8966480446927374:
20th- epoch: 3, train_loss = 47.89222050458193, train_acc = 0.8950861667442943
test Acc 0.904562383612663:
20th- epoch: 4, train_loss = 44.07895132154226, train_acc = 0.9037028411737308
test Acc 0.9115456238361266:
20th- epoch: 5, train_loss = 41.14436190575361, train_acc = 0.9097578015836051

20th- epoch: 145, train_loss = 16.996531972661614, train_acc = 0.9632044713553796
test Acc 0.9455307262569832:
20th- epoch: 146, train_loss = 16.978619685396552, train_acc = 0.9632044713553796
test Acc 0.9455307262569832:
20th- epoch: 147, train_loss = 16.95713079907, train_acc = 0.9632044713553796
test Acc 0.9455307262569832:
20th- epoch: 148, train_loss = 16.938389813527465, train_acc = 0.9632044713553796
test Acc 0.9459962756052142:
20th- epoch: 149, train_loss = 16.918447632342577, train_acc = 0.9632044713553796
test Acc 0.9459962756052142:
20th- epoch: 150, train_loss = 16.892038950696588, train_acc = 0.9632044713553796
test Acc 0.9455307262569832:
20th- epoch: 151, train_loss = 16.873648412525654, train_acc = 0.9633209129017233
test Acc 0.9459962756052142:
20th- epoch: 152, train_loss = 16.85057575441897, train_acc = 0.9632044713553796
test Acc 0.9459962756052142:
20th- epoch: 153, train_loss = 16.838076170533895, train_acc = 0.9632044713553796
test Acc 0.9459962756052142:
20th- 

20th- epoch: 293, train_loss = 15.018155883997679, train_acc = 0.9669306008383791
test Acc 0.9487895716945997:
20th- epoch: 294, train_loss = 15.013691536150873, train_acc = 0.9669306008383791
test Acc 0.9487895716945997:
20th- epoch: 295, train_loss = 15.002440846525133, train_acc = 0.9669306008383791
test Acc 0.9492551210428305:
20th- epoch: 296, train_loss = 14.987071649171412, train_acc = 0.9669306008383791
test Acc 0.9492551210428305:
20th- epoch: 297, train_loss = 14.974180082790554, train_acc = 0.9670470423847228
test Acc 0.9492551210428305:
20th- epoch: 298, train_loss = 14.961968407034874, train_acc = 0.9670470423847228
test Acc 0.9492551210428305:
20th- epoch: 299, train_loss = 14.951524985022843, train_acc = 0.9671634839310667
test Acc 0.9497206703910615:
20th- epoch: 300, train_loss = 14.947222427465022, train_acc = 0.9670470423847228
test Acc 0.9492551210428305:
20th- epoch: 301, train_loss = 14.938237153925002, train_acc = 0.9670470423847228
test Acc 0.9487895716945997:
2

test Acc 0.9497206703910615:
20th- epoch: 441, train_loss = 14.054735090583563, train_acc = 0.969608756404285
test Acc 0.9506517690875232:
20th- epoch: 442, train_loss = 14.044214977882802, train_acc = 0.969608756404285
test Acc 0.9506517690875232:
20th- epoch: 443, train_loss = 14.04055008199066, train_acc = 0.969608756404285
test Acc 0.9501862197392924:
20th- epoch: 444, train_loss = 14.037055951543152, train_acc = 0.969608756404285
test Acc 0.9501862197392924:
20th- epoch: 445, train_loss = 14.03016175236553, train_acc = 0.969608756404285
test Acc 0.9501862197392924:
20th- epoch: 446, train_loss = 14.025108396075666, train_acc = 0.969608756404285
test Acc 0.9506517690875232:
20th- epoch: 447, train_loss = 14.022069830447435, train_acc = 0.969608756404285
test Acc 0.9501862197392924:
20th- epoch: 448, train_loss = 14.019978768192232, train_acc = 0.969608756404285
test Acc 0.9501862197392924:
20th- epoch: 449, train_loss = 14.013579304330051, train_acc = 0.969608756404285
test Acc 0.9

 67%|██████████████████████████████████████████████▋                       | 20/30 [3:01:04<1:30:23, 542.40s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
21th- epoch: 0, train_loss = 127.7598928809166, train_acc = 0.7382394038192828
test Acc 0.8594040968342644:
21th- epoch: 1, train_loss = 58.70052136480808, train_acc = 0.873660922217047
test Acc 0.8924581005586593:
21th- epoch: 2, train_loss = 49.3637013733387, train_acc = 0.8942710759198882
test Acc 0.9050279329608939:
21th- epoch: 3, train_loss = 44.39538785815239, train_acc = 0.9046343735444806
test Acc 0.9078212290502793:
21th- epoch: 4, train_loss = 41.21347515285015, train_acc = 0.9109222170470423
test Acc 0.909683426443203:
21th- epoch: 5, train_loss = 38.78637910634279, train_acc = 0.9170936190032604
te

21th- epoch: 145, train_loss = 16.82685431279242, train_acc = 0.9622729389846297
test Acc 0.9464618249534451:
21th- epoch: 146, train_loss = 16.831890942528844, train_acc = 0.9622729389846297
test Acc 0.9464618249534451:
21th- epoch: 147, train_loss = 16.787476690486073, train_acc = 0.9622729389846297
test Acc 0.946927374301676:
21th- epoch: 148, train_loss = 16.78196564130485, train_acc = 0.9622729389846297
test Acc 0.9464618249534451:
21th- epoch: 149, train_loss = 16.760724959895015, train_acc = 0.9622729389846297
test Acc 0.9464618249534451:
21th- epoch: 150, train_loss = 16.71957208402455, train_acc = 0.9625058220773172
test Acc 0.9464618249534451:
21th- epoch: 151, train_loss = 16.709359753876925, train_acc = 0.9623893805309734
test Acc 0.946927374301676:
21th- epoch: 152, train_loss = 16.687459932640195, train_acc = 0.9625058220773172
test Acc 0.9464618249534451:
21th- epoch: 153, train_loss = 16.66246755234897, train_acc = 0.9625058220773172
test Acc 0.946927374301676:
21th- ep

21th- epoch: 293, train_loss = 14.889920013956726, train_acc = 0.9670470423847228
test Acc 0.9492551210428305:
21th- epoch: 294, train_loss = 14.877917694859207, train_acc = 0.9670470423847228
test Acc 0.9492551210428305:
21th- epoch: 295, train_loss = 14.865217008627951, train_acc = 0.9670470423847228
test Acc 0.9492551210428305:
21th- epoch: 296, train_loss = 14.863484416157007, train_acc = 0.9670470423847228
test Acc 0.9492551210428305:
21th- epoch: 297, train_loss = 14.849959989078343, train_acc = 0.9670470423847228
test Acc 0.9492551210428305:
21th- epoch: 298, train_loss = 14.8423404796049, train_acc = 0.9671634839310667
test Acc 0.9487895716945997:
21th- epoch: 299, train_loss = 14.83514104411006, train_acc = 0.9671634839310667
test Acc 0.9483240223463687:
21th- epoch: 300, train_loss = 14.817682161927223, train_acc = 0.9670470423847228
test Acc 0.9492551210428305:
21th- epoch: 301, train_loss = 14.817533045075834, train_acc = 0.9671634839310667
test Acc 0.9492551210428305:
21th

test Acc 0.9487895716945997:
21th- epoch: 441, train_loss = 13.935277646873146, train_acc = 0.9698416394969726
test Acc 0.9487895716945997:
21th- epoch: 442, train_loss = 13.92812030762434, train_acc = 0.9698416394969726
test Acc 0.9487895716945997:
21th- epoch: 443, train_loss = 13.925829868763685, train_acc = 0.9697251979506288
test Acc 0.9487895716945997:
21th- epoch: 444, train_loss = 13.924685148987919, train_acc = 0.9698416394969726
test Acc 0.9487895716945997:
21th- epoch: 445, train_loss = 13.92018742626533, train_acc = 0.9698416394969726
test Acc 0.9487895716945997:
21th- epoch: 446, train_loss = 13.909833960235119, train_acc = 0.9698416394969726
test Acc 0.9487895716945997:
21th- epoch: 447, train_loss = 13.921625728253275, train_acc = 0.9698416394969726
test Acc 0.9487895716945997:
21th- epoch: 448, train_loss = 13.903665613383055, train_acc = 0.9698416394969726
test Acc 0.9487895716945997:
21th- epoch: 449, train_loss = 13.902461498975754, train_acc = 0.9698416394969726
tes

 70%|█████████████████████████████████████████████████                     | 21/30 [3:10:05<1:21:19, 542.13s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
22th- epoch: 0, train_loss = 133.22568610310555, train_acc = 0.7430135072193759
test Acc 0.8663873370577281:
22th- epoch: 1, train_loss = 56.289796844124794, train_acc = 0.881578947368421
test Acc 0.8947858472998138:
22th- epoch: 2, train_loss = 47.66492983698845, train_acc = 0.8981136469492315
test Acc 0.9054934823091247:
22th- epoch: 3, train_loss = 43.12902471423149, train_acc = 0.9076618537494178
test Acc 0.9115456238361266:
22th- epoch: 4, train_loss = 40.080603182315826, train_acc = 0.9141825803446669
test Acc 0.914804469273743:
22th- epoch: 5, train_loss = 37.85172309726477, train_acc = 0.918374476013041

22th- epoch: 145, train_loss = 16.883248263970017, train_acc = 0.961690731252911
test Acc 0.9450651769087524:
22th- epoch: 146, train_loss = 16.85499901883304, train_acc = 0.9618071727992548
test Acc 0.9445996275605214:
22th- epoch: 147, train_loss = 16.850221613422036, train_acc = 0.9619236143455985
test Acc 0.9450651769087524:
22th- epoch: 148, train_loss = 16.804639441892505, train_acc = 0.962156497438286
test Acc 0.9445996275605214:
22th- epoch: 149, train_loss = 16.769400734454393, train_acc = 0.9620400558919422
test Acc 0.9450651769087524:
22th- epoch: 150, train_loss = 16.77832391113043, train_acc = 0.9623893805309734
test Acc 0.9450651769087524:
22th- epoch: 151, train_loss = 16.75160658918321, train_acc = 0.9622729389846297
test Acc 0.9450651769087524:
22th- epoch: 152, train_loss = 16.727989392355084, train_acc = 0.962156497438286
test Acc 0.9441340782122905:
22th- epoch: 153, train_loss = 16.71132661961019, train_acc = 0.9622729389846297
test Acc 0.9445996275605214:
22th- ep

22th- epoch: 293, train_loss = 14.957335873506963, train_acc = 0.9668141592920354
test Acc 0.9478584729981379:
22th- epoch: 294, train_loss = 14.94596682395786, train_acc = 0.9668141592920354
test Acc 0.9473929236499069:
22th- epoch: 295, train_loss = 14.93087499216199, train_acc = 0.9669306008383791
test Acc 0.9478584729981379:
22th- epoch: 296, train_loss = 14.932758208364248, train_acc = 0.9670470423847228
test Acc 0.9478584729981379:
22th- epoch: 297, train_loss = 14.923568564467132, train_acc = 0.9669306008383791
test Acc 0.9478584729981379:
22th- epoch: 298, train_loss = 14.913986663334072, train_acc = 0.9670470423847228
test Acc 0.9473929236499069:
22th- epoch: 299, train_loss = 14.917296814732254, train_acc = 0.9669306008383791
test Acc 0.9473929236499069:
22th- epoch: 300, train_loss = 14.90176048874855, train_acc = 0.9671634839310667
test Acc 0.9473929236499069:
22th- epoch: 301, train_loss = 14.904123671352863, train_acc = 0.9670470423847228
test Acc 0.9478584729981379:
22th

test Acc 0.9483240223463687:
22th- epoch: 441, train_loss = 14.038272007368505, train_acc = 0.9690265486725663
test Acc 0.9478584729981379:
22th- epoch: 442, train_loss = 14.039077155292034, train_acc = 0.9692594317652539
test Acc 0.9473929236499069:
22th- epoch: 443, train_loss = 14.038365174084902, train_acc = 0.9692594317652539
test Acc 0.9483240223463687:
22th- epoch: 444, train_loss = 14.031206118874252, train_acc = 0.9692594317652539
test Acc 0.9483240223463687:
22th- epoch: 445, train_loss = 14.018884946592152, train_acc = 0.9692594317652539
test Acc 0.9473929236499069:
22th- epoch: 446, train_loss = 14.019570473581553, train_acc = 0.9691429902189101
test Acc 0.9483240223463687:
22th- epoch: 447, train_loss = 14.018724702298641, train_acc = 0.9692594317652539
test Acc 0.9478584729981379:
22th- epoch: 448, train_loss = 14.007078927010298, train_acc = 0.9692594317652539
test Acc 0.9483240223463687:
22th- epoch: 449, train_loss = 14.017195398919284, train_acc = 0.9692594317652539
t

 73%|███████████████████████████████████████████████████▎                  | 22/30 [3:19:08<1:12:17, 542.24s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
23th- epoch: 0, train_loss = 129.01631951332092, train_acc = 0.7564042850489054
test Acc 0.8342644320297952:
23th- epoch: 1, train_loss = 62.09029261767864, train_acc = 0.8699347927340475
test Acc 0.861731843575419:
23th- epoch: 2, train_loss = 52.252997785806656, train_acc = 0.8872845831392641
test Acc 0.8803538175046555:
23th- epoch: 3, train_loss = 46.992271453142166, train_acc = 0.8989287377736377
test Acc 0.8878026070763501:
23th- epoch: 4, train_loss = 43.51921145617962, train_acc = 0.9068467629250117
test Acc 0.904562383612663:
23th- epoch: 5, train_loss = 40.98732936382294, train_acc = 0.911504424778761

23th- epoch: 145, train_loss = 17.23046671040356, train_acc = 0.9614578481602236
test Acc 0.9459962756052142:
23th- epoch: 146, train_loss = 17.21131880581379, train_acc = 0.9615742897065673
test Acc 0.9464618249534451:
23th- epoch: 147, train_loss = 17.18770349957049, train_acc = 0.9615742897065673
test Acc 0.9464618249534451:
23th- epoch: 148, train_loss = 17.160665983334184, train_acc = 0.961690731252911
test Acc 0.9459962756052142:
23th- epoch: 149, train_loss = 17.135444397106767, train_acc = 0.9619236143455985
test Acc 0.9464618249534451:
23th- epoch: 150, train_loss = 17.120236299932003, train_acc = 0.9618071727992548
test Acc 0.9455307262569832:
23th- epoch: 151, train_loss = 17.09171306155622, train_acc = 0.9618071727992548
test Acc 0.9459962756052142:
23th- epoch: 152, train_loss = 17.068922959268093, train_acc = 0.9618071727992548
test Acc 0.9464618249534451:
23th- epoch: 153, train_loss = 17.056475771591067, train_acc = 0.9619236143455985
test Acc 0.9464618249534451:
23th- 

23th- epoch: 293, train_loss = 15.169652502052486, train_acc = 0.9657661853749417
test Acc 0.9487895716945997:
23th- epoch: 294, train_loss = 15.157115451991558, train_acc = 0.9657661853749417
test Acc 0.9487895716945997:
23th- epoch: 295, train_loss = 15.149116180837154, train_acc = 0.965649743828598
test Acc 0.9487895716945997:
23th- epoch: 296, train_loss = 15.138272449374199, train_acc = 0.9657661853749417
test Acc 0.9487895716945997:
23th- epoch: 297, train_loss = 15.129759755916893, train_acc = 0.9657661853749417
test Acc 0.9487895716945997:
23th- epoch: 298, train_loss = 15.122808150947094, train_acc = 0.965649743828598
test Acc 0.9487895716945997:
23th- epoch: 299, train_loss = 15.115309529006481, train_acc = 0.9657661853749417
test Acc 0.9487895716945997:
23th- epoch: 300, train_loss = 15.104643069207668, train_acc = 0.9663483931066604
test Acc 0.9487895716945997:
23th- epoch: 301, train_loss = 15.102997948415577, train_acc = 0.9658826269212856
test Acc 0.9487895716945997:
23t

test Acc 0.9492551210428305:
23th- epoch: 441, train_loss = 14.197105864994228, train_acc = 0.9690265486725663
test Acc 0.9492551210428305:
23th- epoch: 442, train_loss = 14.191013765521348, train_acc = 0.9689101071262226
test Acc 0.9492551210428305:
23th- epoch: 443, train_loss = 14.184821779839694, train_acc = 0.9690265486725663
test Acc 0.9492551210428305:
23th- epoch: 444, train_loss = 14.18379523884505, train_acc = 0.9690265486725663
test Acc 0.9492551210428305:
23th- epoch: 445, train_loss = 14.17985922563821, train_acc = 0.9689101071262226
test Acc 0.9492551210428305:
23th- epoch: 446, train_loss = 14.175763060338795, train_acc = 0.9689101071262226
test Acc 0.9492551210428305:
23th- epoch: 447, train_loss = 14.171798340976238, train_acc = 0.9690265486725663
test Acc 0.9492551210428305:
23th- epoch: 448, train_loss = 14.16432508546859, train_acc = 0.9690265486725663
test Acc 0.9492551210428305:
23th- epoch: 449, train_loss = 14.161488249897957, train_acc = 0.9689101071262226
test

 77%|█████████████████████████████████████████████████████▋                | 23/30 [3:28:10<1:03:15, 542.18s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
24th- epoch: 0, train_loss = 128.02437835931778, train_acc = 0.7661853749417792
test Acc 0.8254189944134078:
24th- epoch: 1, train_loss = 59.408789709210396, train_acc = 0.8792501164415464
test Acc 0.8729050279329609:
24th- epoch: 2, train_loss = 49.35571776330471, train_acc = 0.8970656730321379
test Acc 0.8943202979515829:
24th- epoch: 3, train_loss = 43.92164558172226, train_acc = 0.9089427107591989
test Acc 0.9022346368715084:
24th- epoch: 4, train_loss = 40.42357395589352, train_acc = 0.9136003726129484
test Acc 0.9064245810055865:
24th- epoch: 5, train_loss = 37.88589700311422, train_acc = 0.91942244993013

24th- epoch: 145, train_loss = 16.840185947716236, train_acc = 0.9629715882626921
test Acc 0.9455307262569832:
24th- epoch: 146, train_loss = 16.827311657369137, train_acc = 0.9629715882626921
test Acc 0.9455307262569832:
24th- epoch: 147, train_loss = 16.801592020317912, train_acc = 0.9630880298090359
test Acc 0.9455307262569832:
24th- epoch: 148, train_loss = 16.783351158723235, train_acc = 0.9630880298090359
test Acc 0.9455307262569832:
24th- epoch: 149, train_loss = 16.767168261110783, train_acc = 0.9633209129017233
test Acc 0.9455307262569832:
24th- epoch: 150, train_loss = 16.736208545044065, train_acc = 0.9632044713553796
test Acc 0.9455307262569832:
24th- epoch: 151, train_loss = 16.71853848360479, train_acc = 0.9632044713553796
test Acc 0.9455307262569832:
24th- epoch: 152, train_loss = 16.699306443333626, train_acc = 0.9630880298090359
test Acc 0.9455307262569832:
24th- epoch: 153, train_loss = 16.6802512165159, train_acc = 0.9634373544480671
test Acc 0.9455307262569832:
24th

24th- epoch: 293, train_loss = 14.907324461266398, train_acc = 0.9675128085700978
test Acc 0.9473929236499069:
24th- epoch: 294, train_loss = 14.887744152918458, train_acc = 0.9677456916627852
test Acc 0.9473929236499069:
24th- epoch: 295, train_loss = 14.87933961302042, train_acc = 0.9677456916627852
test Acc 0.9473929236499069:
24th- epoch: 296, train_loss = 14.869434684515, train_acc = 0.9677456916627852
test Acc 0.9473929236499069:
24th- epoch: 297, train_loss = 14.863198338076472, train_acc = 0.9679785747554728
test Acc 0.9473929236499069:
24th- epoch: 298, train_loss = 14.85276923328638, train_acc = 0.9677456916627852
test Acc 0.9473929236499069:
24th- epoch: 299, train_loss = 14.844770120456815, train_acc = 0.9679785747554728
test Acc 0.9473929236499069:
24th- epoch: 300, train_loss = 14.836976021528244, train_acc = 0.9678621332091291
test Acc 0.9473929236499069:
24th- epoch: 301, train_loss = 14.828709969297051, train_acc = 0.9679785747554728
test Acc 0.9473929236499069:
24th- 

24th- epoch: 441, train_loss = 13.97901064902544, train_acc = 0.9694923148579413
test Acc 0.9492551210428305:
24th- epoch: 442, train_loss = 13.97669215966016, train_acc = 0.969608756404285
test Acc 0.9487895716945997:
24th- epoch: 443, train_loss = 13.972521317191422, train_acc = 0.9697251979506288
test Acc 0.9492551210428305:
24th- epoch: 444, train_loss = 13.965396839194, train_acc = 0.969608756404285
test Acc 0.9487895716945997:
24th- epoch: 445, train_loss = 13.967703525908291, train_acc = 0.9697251979506288
test Acc 0.9483240223463687:
24th- epoch: 446, train_loss = 13.956009536981583, train_acc = 0.9698416394969726
test Acc 0.9492551210428305:
24th- epoch: 447, train_loss = 13.951969929039478, train_acc = 0.9698416394969726
test Acc 0.9487895716945997:
24th- epoch: 448, train_loss = 13.95081910211593, train_acc = 0.9697251979506288
test Acc 0.9487895716945997:
24th- epoch: 449, train_loss = 13.949322931468487, train_acc = 0.9698416394969726
test Acc 0.9487895716945997:
24th- epo

 80%|█████████████████████████████████████████████████████████▌              | 24/30 [3:37:14<54:16, 542.83s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
25th- epoch: 0, train_loss = 133.0015206038952, train_acc = 0.7414997671169073
test Acc 0.7625698324022346:
25th- epoch: 1, train_loss = 64.33412411808968, train_acc = 0.8678388448998603
test Acc 0.8249534450651769:
25th- epoch: 2, train_loss = 52.60006159543991, train_acc = 0.8883325570563577
test Acc 0.8542830540037244:
25th- epoch: 3, train_loss = 46.6560178399086, train_acc = 0.9041686073591058
test Acc 0.8710428305400373:
25th- epoch: 4, train_loss = 42.75709669291973, train_acc = 0.9104564508616675
test Acc 0.883147113594041:
25th- epoch: 5, train_loss = 39.96528621017933, train_acc = 0.9127852817885421
t

25th- epoch: 145, train_loss = 17.18105278722942, train_acc = 0.9623893805309734
test Acc 0.9459962756052142:
25th- epoch: 146, train_loss = 17.158523611724377, train_acc = 0.9623893805309734
test Acc 0.9459962756052142:
25th- epoch: 147, train_loss = 17.13792504183948, train_acc = 0.9625058220773172
test Acc 0.9464618249534451:
25th- epoch: 148, train_loss = 17.1194132193923, train_acc = 0.9625058220773172
test Acc 0.9464618249534451:
25th- epoch: 149, train_loss = 17.094799457117915, train_acc = 0.9626222636236609
test Acc 0.9459962756052142:
25th- epoch: 150, train_loss = 17.073767095804214, train_acc = 0.9628551467163484
test Acc 0.9459962756052142:
25th- epoch: 151, train_loss = 17.051052272319794, train_acc = 0.9627387051700047
test Acc 0.9464618249534451:
25th- epoch: 152, train_loss = 17.030630519613624, train_acc = 0.9628551467163484
test Acc 0.9459962756052142:
25th- epoch: 153, train_loss = 17.007687471807003, train_acc = 0.9626222636236609
test Acc 0.9464618249534451:
25th-

25th- epoch: 293, train_loss = 15.163169905543327, train_acc = 0.9666977177456917
test Acc 0.9487895716945997:
25th- epoch: 294, train_loss = 15.15460395347327, train_acc = 0.9666977177456917
test Acc 0.9487895716945997:
25th- epoch: 295, train_loss = 15.153939967043698, train_acc = 0.9666977177456917
test Acc 0.9487895716945997:
25th- epoch: 296, train_loss = 15.147471457719803, train_acc = 0.9666977177456917
test Acc 0.9487895716945997:
25th- epoch: 297, train_loss = 15.132303687743843, train_acc = 0.9666977177456917
test Acc 0.9487895716945997:
25th- epoch: 298, train_loss = 15.121716792695224, train_acc = 0.9666977177456917
test Acc 0.9487895716945997:
25th- epoch: 299, train_loss = 15.116993722505867, train_acc = 0.9666977177456917
test Acc 0.9487895716945997:
25th- epoch: 300, train_loss = 15.112135755829513, train_acc = 0.9666977177456917
test Acc 0.9487895716945997:
25th- epoch: 301, train_loss = 15.094787794165313, train_acc = 0.9666977177456917
test Acc 0.9492551210428305:
25

25th- epoch: 440, train_loss = 14.202606238424778, train_acc = 0.9693758733115976
test Acc 0.9487895716945997:
25th- epoch: 441, train_loss = 14.203573738690466, train_acc = 0.9693758733115976
test Acc 0.9492551210428305:
25th- epoch: 442, train_loss = 14.19686105614528, train_acc = 0.9692594317652539
test Acc 0.9492551210428305:
25th- epoch: 443, train_loss = 14.191033825278282, train_acc = 0.9693758733115976
test Acc 0.9492551210428305:
25th- epoch: 444, train_loss = 14.186140152160078, train_acc = 0.969608756404285
test Acc 0.9492551210428305:
25th- epoch: 445, train_loss = 14.184786958154291, train_acc = 0.9694923148579413
test Acc 0.9492551210428305:
25th- epoch: 446, train_loss = 14.180968304630369, train_acc = 0.9693758733115976
test Acc 0.9492551210428305:
25th- epoch: 447, train_loss = 14.172769352793694, train_acc = 0.969608756404285
test Acc 0.9492551210428305:
25th- epoch: 448, train_loss = 14.170453004539013, train_acc = 0.9694923148579413
test Acc 0.9492551210428305:
25th

 83%|████████████████████████████████████████████████████████████            | 25/30 [3:46:18<45:15, 543.10s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
26th- epoch: 0, train_loss = 115.4410684555769, train_acc = 0.7814392175128085
test Acc 0.8789571694599627:
26th- epoch: 1, train_loss = 54.94027541577816, train_acc = 0.8835584536562645
test Acc 0.9022346368715084:
26th- epoch: 2, train_loss = 47.171870470047, train_acc = 0.8990451793199814
test Acc 0.910148975791434:
26th- epoch: 3, train_loss = 42.9403131082654, train_acc = 0.9078947368421053
test Acc 0.914804469273743:
26th- epoch: 4, train_loss = 39.9950849711895, train_acc = 0.9127852817885421
test Acc 0.9189944134078212:
26th- epoch: 5, train_loss = 37.688808768987656, train_acc = 0.9175593851886353
test

26th- epoch: 145, train_loss = 16.822729004547, train_acc = 0.9628551467163484
test Acc 0.9492551210428305:
26th- epoch: 146, train_loss = 16.80719523690641, train_acc = 0.9628551467163484
test Acc 0.9497206703910615:
26th- epoch: 147, train_loss = 16.779670594260097, train_acc = 0.9629715882626921
test Acc 0.9497206703910615:
26th- epoch: 148, train_loss = 16.763100972399116, train_acc = 0.9629715882626921
test Acc 0.9492551210428305:
26th- epoch: 149, train_loss = 16.73466813750565, train_acc = 0.9629715882626921
test Acc 0.9497206703910615:
26th- epoch: 150, train_loss = 16.73246575333178, train_acc = 0.9629715882626921
test Acc 0.9497206703910615:
26th- epoch: 151, train_loss = 16.690492833033204, train_acc = 0.9633209129017233
test Acc 0.9492551210428305:
26th- epoch: 152, train_loss = 16.671286139637232, train_acc = 0.9632044713553796
test Acc 0.9497206703910615:
26th- epoch: 153, train_loss = 16.646076422184706, train_acc = 0.9632044713553796
test Acc 0.9501862197392924:
26th- e

26th- epoch: 293, train_loss = 14.896527670323849, train_acc = 0.9673963670237541
test Acc 0.9506517690875232:
26th- epoch: 294, train_loss = 14.895020487718284, train_acc = 0.9673963670237541
test Acc 0.9506517690875232:
26th- epoch: 295, train_loss = 14.88216032832861, train_acc = 0.9673963670237541
test Acc 0.9501862197392924:
26th- epoch: 296, train_loss = 14.871417619287968, train_acc = 0.9673963670237541
test Acc 0.9506517690875232:
26th- epoch: 297, train_loss = 14.86082647740841, train_acc = 0.9672799254774104
test Acc 0.9501862197392924:
26th- epoch: 298, train_loss = 14.852716187946498, train_acc = 0.9673963670237541
test Acc 0.9506517690875232:
26th- epoch: 299, train_loss = 14.84841891657561, train_acc = 0.9673963670237541
test Acc 0.9506517690875232:
26th- epoch: 300, train_loss = 14.83248911332339, train_acc = 0.9677456916627852
test Acc 0.9501862197392924:
26th- epoch: 301, train_loss = 14.843819350004196, train_acc = 0.9673963670237541
test Acc 0.9506517690875232:
26th-

26th- epoch: 440, train_loss = 14.017943538725376, train_acc = 0.9694923148579413
test Acc 0.9511173184357542:
26th- epoch: 441, train_loss = 14.01161241531372, train_acc = 0.9694923148579413
test Acc 0.9506517690875232:
26th- epoch: 442, train_loss = 14.012006225530058, train_acc = 0.9693758733115976
test Acc 0.9506517690875232:
26th- epoch: 443, train_loss = 14.005559647921473, train_acc = 0.9694923148579413
test Acc 0.9506517690875232:
26th- epoch: 444, train_loss = 13.997819758951664, train_acc = 0.9694923148579413
test Acc 0.9506517690875232:
26th- epoch: 445, train_loss = 13.99246971309185, train_acc = 0.9694923148579413
test Acc 0.9506517690875232:
26th- epoch: 446, train_loss = 13.99465499818325, train_acc = 0.9694923148579413
test Acc 0.9506517690875232:
26th- epoch: 447, train_loss = 13.985188437160105, train_acc = 0.9693758733115976
test Acc 0.9506517690875232:
26th- epoch: 448, train_loss = 13.98418084019795, train_acc = 0.9694923148579413
test Acc 0.9506517690875232:
26th-

 87%|██████████████████████████████████████████████████████████████▍         | 26/30 [3:55:22<36:13, 543.29s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
27th- epoch: 0, train_loss = 123.56497845053673, train_acc = 0.7475547275267815
test Acc 0.8305400372439479:
27th- epoch: 1, train_loss = 58.693184807896614, train_acc = 0.8735444806707033
test Acc 0.8743016759776536:
27th- epoch: 2, train_loss = 49.101226672530174, train_acc = 0.897880763856544
test Acc 0.888268156424581:
27th- epoch: 3, train_loss = 44.08827379345894, train_acc = 0.9048672566371682
test Acc 0.9008379888268156:
27th- epoch: 4, train_loss = 40.821395710110664, train_acc = 0.9104564508616675
test Acc 0.9078212290502793:
27th- epoch: 5, train_loss = 38.2874239385128, train_acc = 0.917093619003260

27th- epoch: 145, train_loss = 17.03664749674499, train_acc = 0.9632044713553796
test Acc 0.9441340782122905:
27th- epoch: 146, train_loss = 17.008239900693297, train_acc = 0.9633209129017233
test Acc 0.9441340782122905:
27th- epoch: 147, train_loss = 16.989847287535667, train_acc = 0.9632044713553796
test Acc 0.9441340782122905:
27th- epoch: 148, train_loss = 16.967597771435976, train_acc = 0.9632044713553796
test Acc 0.9441340782122905:
27th- epoch: 149, train_loss = 16.950621152296662, train_acc = 0.9632044713553796
test Acc 0.9441340782122905:
27th- epoch: 150, train_loss = 16.92517763748765, train_acc = 0.9633209129017233
test Acc 0.9441340782122905:
27th- epoch: 151, train_loss = 16.907730270177126, train_acc = 0.9635537959944108
test Acc 0.9441340782122905:
27th- epoch: 152, train_loss = 16.885187827050686, train_acc = 0.9634373544480671
test Acc 0.9436685288640596:
27th- epoch: 153, train_loss = 16.86699436791241, train_acc = 0.9636702375407545
test Acc 0.9436685288640596:
27th

test Acc 0.9445996275605214:
27th- epoch: 293, train_loss = 15.0870312852785, train_acc = 0.9662319515603167
test Acc 0.9445996275605214:
27th- epoch: 294, train_loss = 15.074506032280624, train_acc = 0.9662319515603167
test Acc 0.9445996275605214:
27th- epoch: 295, train_loss = 15.067554224282503, train_acc = 0.9662319515603167
test Acc 0.9445996275605214:
27th- epoch: 296, train_loss = 15.05779939237982, train_acc = 0.9663483931066604
test Acc 0.9445996275605214:
27th- epoch: 297, train_loss = 15.0545722739771, train_acc = 0.9663483931066604
test Acc 0.9445996275605214:
27th- epoch: 298, train_loss = 15.043615826405585, train_acc = 0.9663483931066604
test Acc 0.9445996275605214:
27th- epoch: 299, train_loss = 15.038124143145978, train_acc = 0.9662319515603167
test Acc 0.9445996275605214:
27th- epoch: 300, train_loss = 15.030191303230822, train_acc = 0.9662319515603167
test Acc 0.9445996275605214:
27th- epoch: 301, train_loss = 15.025732238776982, train_acc = 0.9663483931066604
test A

27th- epoch: 440, train_loss = 14.176395886577666, train_acc = 0.9686772240335352
test Acc 0.9464618249534451:
27th- epoch: 441, train_loss = 14.172168161720037, train_acc = 0.9686772240335352
test Acc 0.9464618249534451:
27th- epoch: 442, train_loss = 14.167292202822864, train_acc = 0.9689101071262226
test Acc 0.9464618249534451:
27th- epoch: 443, train_loss = 14.168141234666109, train_acc = 0.9686772240335352
test Acc 0.9464618249534451:
27th- epoch: 444, train_loss = 14.15663702134043, train_acc = 0.9689101071262226
test Acc 0.946927374301676:
27th- epoch: 445, train_loss = 14.150806464254856, train_acc = 0.9687936655798789
test Acc 0.946927374301676:
27th- epoch: 446, train_loss = 14.15534661244601, train_acc = 0.9686772240335352
test Acc 0.9464618249534451:
27th- epoch: 447, train_loss = 14.147148515097797, train_acc = 0.9689101071262226
test Acc 0.9464618249534451:
27th- epoch: 448, train_loss = 14.138056814670563, train_acc = 0.9687936655798789
test Acc 0.9464618249534451:
27th-

 90%|████████████████████████████████████████████████████████████████▊       | 27/30 [4:04:26<27:10, 543.54s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
28th- epoch: 0, train_loss = 124.78025555610657, train_acc = 0.7459245458779693
test Acc 0.7579143389199255:
28th- epoch: 1, train_loss = 60.91704769432545, train_acc = 0.8687703772706101
test Acc 0.8226256983240223:
28th- epoch: 2, train_loss = 50.662580251693726, train_acc = 0.8914764788076386
test Acc 0.8524208566108007:
28th- epoch: 3, train_loss = 45.74715481698513, train_acc = 0.9025384257102934
test Acc 0.86731843575419:
28th- epoch: 4, train_loss = 42.39347532391548, train_acc = 0.9085933861201677
test Acc 0.8766294227188082:
28th- epoch: 5, train_loss = 39.87271158397198, train_acc = 0.9151141127154169

28th- epoch: 145, train_loss = 16.838190527632833, train_acc = 0.9633209129017233
test Acc 0.9445996275605214:
28th- epoch: 146, train_loss = 16.808526983484626, train_acc = 0.9633209129017233
test Acc 0.9441340782122905:
28th- epoch: 147, train_loss = 16.78184320218861, train_acc = 0.9629715882626921
test Acc 0.9441340782122905:
28th- epoch: 148, train_loss = 16.763340020552278, train_acc = 0.9634373544480671
test Acc 0.9436685288640596:
28th- epoch: 149, train_loss = 16.751368021592498, train_acc = 0.9633209129017233
test Acc 0.9445996275605214:
28th- epoch: 150, train_loss = 16.7221265938133, train_acc = 0.9633209129017233
test Acc 0.9445996275605214:
28th- epoch: 151, train_loss = 16.695878328755498, train_acc = 0.9633209129017233
test Acc 0.9441340782122905:
28th- epoch: 152, train_loss = 16.663654200732708, train_acc = 0.9633209129017233
test Acc 0.9441340782122905:
28th- epoch: 153, train_loss = 16.672554487362504, train_acc = 0.9635537959944108
test Acc 0.9450651769087524:
28th

28th- epoch: 293, train_loss = 14.883060042746365, train_acc = 0.9676292501164415
test Acc 0.9473929236499069:
28th- epoch: 294, train_loss = 14.86683342140168, train_acc = 0.9677456916627852
test Acc 0.9473929236499069:
28th- epoch: 295, train_loss = 14.859060823917389, train_acc = 0.9678621332091291
test Acc 0.9473929236499069:
28th- epoch: 296, train_loss = 14.85334490146488, train_acc = 0.9678621332091291
test Acc 0.946927374301676:
28th- epoch: 297, train_loss = 14.846858111210167, train_acc = 0.9677456916627852
test Acc 0.9473929236499069:
28th- epoch: 298, train_loss = 14.833897016942501, train_acc = 0.9678621332091291
test Acc 0.9478584729981379:
28th- epoch: 299, train_loss = 14.827268860302866, train_acc = 0.9677456916627852
test Acc 0.9473929236499069:
28th- epoch: 300, train_loss = 14.828383141197264, train_acc = 0.9679785747554728
test Acc 0.9473929236499069:
28th- epoch: 301, train_loss = 14.820336206816137, train_acc = 0.9678621332091291
test Acc 0.9478584729981379:
28th

28th- epoch: 440, train_loss = 13.94974554469809, train_acc = 0.9689101071262226
test Acc 0.9483240223463687:
28th- epoch: 441, train_loss = 13.938643074594438, train_acc = 0.9689101071262226
test Acc 0.9483240223463687:
28th- epoch: 442, train_loss = 13.943784843198955, train_acc = 0.9690265486725663
test Acc 0.9483240223463687:
28th- epoch: 443, train_loss = 13.930114102549851, train_acc = 0.9689101071262226
test Acc 0.9483240223463687:
28th- epoch: 444, train_loss = 13.930719714611769, train_acc = 0.9689101071262226
test Acc 0.9483240223463687:
28th- epoch: 445, train_loss = 13.920766055583954, train_acc = 0.9689101071262226
test Acc 0.9483240223463687:
28th- epoch: 446, train_loss = 13.918188954237849, train_acc = 0.9689101071262226
test Acc 0.9483240223463687:
28th- epoch: 447, train_loss = 13.91109936311841, train_acc = 0.9689101071262226
test Acc 0.9483240223463687:
28th- epoch: 448, train_loss = 13.9107211320661, train_acc = 0.9689101071262226
test Acc 0.9483240223463687:
28th-

 93%|███████████████████████████████████████████████████████████████████▏    | 28/30 [4:13:30<18:07, 543.63s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
29th- epoch: 0, train_loss = 123.51335108280182, train_acc = 0.7425477410340009
test Acc 0.8566108007448789:
29th- epoch: 1, train_loss = 56.2576664686203, train_acc = 0.872380065207266
test Acc 0.8817504655493482:
29th- epoch: 2, train_loss = 46.97509351372719, train_acc = 0.8910107126222636
test Acc 0.904562383612663:
29th- epoch: 3, train_loss = 42.246245220303535, train_acc = 0.9030041918956684
test Acc 0.9124767225325885:
29th- epoch: 4, train_loss = 39.162872210145, train_acc = 0.9105728924080112
test Acc 0.9171322160148976:
29th- epoch: 5, train_loss = 36.93672014027834, train_acc = 0.9151141127154169
te

29th- epoch: 145, train_loss = 16.824213311076164, train_acc = 0.9627387051700047
test Acc 0.9445996275605214:
29th- epoch: 146, train_loss = 16.814102517440915, train_acc = 0.9630880298090359
test Acc 0.9445996275605214:
29th- epoch: 147, train_loss = 16.791318660601974, train_acc = 0.9628551467163484
test Acc 0.9450651769087524:
29th- epoch: 148, train_loss = 16.77997314929962, train_acc = 0.9628551467163484
test Acc 0.9450651769087524:
29th- epoch: 149, train_loss = 16.74793365597725, train_acc = 0.9632044713553796
test Acc 0.9450651769087524:
29th- epoch: 150, train_loss = 16.724954694509506, train_acc = 0.9629715882626921
test Acc 0.9445996275605214:
29th- epoch: 151, train_loss = 16.711886072531343, train_acc = 0.9632044713553796
test Acc 0.9450651769087524:
29th- epoch: 152, train_loss = 16.69285367242992, train_acc = 0.9630880298090359
test Acc 0.9450651769087524:
29th- epoch: 153, train_loss = 16.679615773260593, train_acc = 0.9632044713553796
test Acc 0.9450651769087524:
29th

29th- epoch: 293, train_loss = 14.887014160864055, train_acc = 0.9677456916627852
test Acc 0.9478584729981379:
29th- epoch: 294, train_loss = 14.877749130129814, train_acc = 0.9676292501164415
test Acc 0.9478584729981379:
29th- epoch: 295, train_loss = 14.862331330776215, train_acc = 0.9676292501164415
test Acc 0.9483240223463687:
29th- epoch: 296, train_loss = 14.872662097215652, train_acc = 0.9675128085700978
test Acc 0.9483240223463687:
29th- epoch: 297, train_loss = 14.869758442044258, train_acc = 0.9676292501164415
test Acc 0.9483240223463687:
29th- epoch: 298, train_loss = 14.85456594824791, train_acc = 0.9677456916627852
test Acc 0.9483240223463687:
29th- epoch: 299, train_loss = 14.846158869564533, train_acc = 0.9676292501164415
test Acc 0.9483240223463687:
29th- epoch: 300, train_loss = 14.842322933487594, train_acc = 0.9677456916627852
test Acc 0.9478584729981379:
29th- epoch: 301, train_loss = 14.831947204656899, train_acc = 0.9678621332091291
test Acc 0.9483240223463687:
29

29th- epoch: 441, train_loss = 13.990956015884876, train_acc = 0.969608756404285
test Acc 0.9487895716945997:
29th- epoch: 442, train_loss = 13.986311699263752, train_acc = 0.9699580810433163
test Acc 0.9487895716945997:
29th- epoch: 443, train_loss = 13.974659025669098, train_acc = 0.9699580810433163
test Acc 0.9487895716945997:
29th- epoch: 444, train_loss = 13.969361998140812, train_acc = 0.969608756404285
test Acc 0.9487895716945997:
29th- epoch: 445, train_loss = 13.96854053158313, train_acc = 0.9698416394969726
test Acc 0.9492551210428305:
29th- epoch: 446, train_loss = 13.960292977280915, train_acc = 0.969608756404285
test Acc 0.9487895716945997:
29th- epoch: 447, train_loss = 13.958616730757058, train_acc = 0.9699580810433163
test Acc 0.9492551210428305:
29th- epoch: 448, train_loss = 13.958302569575608, train_acc = 0.969608756404285
test Acc 0.9492551210428305:
29th- epoch: 449, train_loss = 13.949731692671776, train_acc = 0.9698416394969726
test Acc 0.9487895716945997:
29th- 

 97%|█████████████████████████████████████████████████████████████████████▌  | 29/30 [4:22:32<09:03, 543.32s/it]

Method7_second(
  (fc): Sequential(
    (0): Linear(in_features=768, out_features=768, bias=True)
    (1): Linear(in_features=768, out_features=512, bias=True)
    (2): Linear(in_features=512, out_features=512, bias=True)
    (3): ReLU()
    (4): Linear(in_features=512, out_features=256, bias=True)
    (5): ReLU()
    (6): Linear(in_features=256, out_features=9, bias=True)
  )
)
30th- epoch: 0, train_loss = 115.23131236433983, train_acc = 0.7553563111318118
test Acc 0.8221601489757915:
30th- epoch: 1, train_loss = 59.639636024832726, train_acc = 0.8734280391243596
test Acc 0.8649906890130353:
30th- epoch: 2, train_loss = 49.37126184999943, train_acc = 0.8969492314857941
test Acc 0.8878026070763501:
30th- epoch: 3, train_loss = 44.10238888859749, train_acc = 0.9084769445738239
test Acc 0.904562383612663:
30th- epoch: 4, train_loss = 40.790367498993874, train_acc = 0.9137168141592921
test Acc 0.9078212290502793:
30th- epoch: 5, train_loss = 38.368752144277096, train_acc = 0.9189566837447

30th- epoch: 145, train_loss = 16.83628506027162, train_acc = 0.9640195621797858
test Acc 0.9455307262569832:
30th- epoch: 146, train_loss = 16.820240246132016, train_acc = 0.9641360037261295
test Acc 0.9455307262569832:
30th- epoch: 147, train_loss = 16.79452502168715, train_acc = 0.9644853283651607
test Acc 0.9455307262569832:
30th- epoch: 148, train_loss = 16.776116451248527, train_acc = 0.9643688868188169
test Acc 0.9455307262569832:
30th- epoch: 149, train_loss = 16.76062543131411, train_acc = 0.9646017699115044
test Acc 0.9455307262569832:
30th- epoch: 150, train_loss = 16.744512287899852, train_acc = 0.9646017699115044
test Acc 0.9455307262569832:
30th- epoch: 151, train_loss = 16.726976001635194, train_acc = 0.9647182114578482
test Acc 0.9459962756052142:
30th- epoch: 152, train_loss = 16.70060585439205, train_acc = 0.9647182114578482
test Acc 0.9455307262569832:
30th- epoch: 153, train_loss = 16.676826238632202, train_acc = 0.9648346530041919
test Acc 0.9455307262569832:
30th-

30th- epoch: 293, train_loss = 14.89049682021141, train_acc = 0.9666977177456917
test Acc 0.9464618249534451:
30th- epoch: 294, train_loss = 14.885660770349205, train_acc = 0.9668141592920354
test Acc 0.9464618249534451:
30th- epoch: 295, train_loss = 14.87382484972477, train_acc = 0.9666977177456917
test Acc 0.9464618249534451:
30th- epoch: 296, train_loss = 14.86893568187952, train_acc = 0.9668141592920354
test Acc 0.9464618249534451:
30th- epoch: 297, train_loss = 14.85727196931839, train_acc = 0.9668141592920354
test Acc 0.9464618249534451:
30th- epoch: 298, train_loss = 14.850390654988587, train_acc = 0.9669306008383791
test Acc 0.9464618249534451:
30th- epoch: 299, train_loss = 14.842486071400344, train_acc = 0.9669306008383791
test Acc 0.9464618249534451:
30th- epoch: 300, train_loss = 14.835646852850914, train_acc = 0.9669306008383791
test Acc 0.9464618249534451:
30th- epoch: 301, train_loss = 14.826421312987804, train_acc = 0.9671634839310667
test Acc 0.9464618249534451:
30th-

test Acc 0.9473929236499069:
30th- epoch: 441, train_loss = 13.999066174030304, train_acc = 0.9692594317652539
test Acc 0.9473929236499069:
30th- epoch: 442, train_loss = 13.993437108583748, train_acc = 0.9692594317652539
test Acc 0.9473929236499069:
30th- epoch: 443, train_loss = 13.983579084277153, train_acc = 0.9692594317652539
test Acc 0.9473929236499069:
30th- epoch: 444, train_loss = 13.978036649525166, train_acc = 0.9694923148579413
test Acc 0.9473929236499069:
30th- epoch: 445, train_loss = 13.968836682848632, train_acc = 0.9692594317652539
test Acc 0.9473929236499069:
30th- epoch: 446, train_loss = 13.971171016804874, train_acc = 0.9692594317652539
test Acc 0.9473929236499069:
30th- epoch: 447, train_loss = 13.965251259505749, train_acc = 0.9693758733115976
test Acc 0.9473929236499069:
30th- epoch: 448, train_loss = 13.96749276900664, train_acc = 0.9693758733115976
test Acc 0.9473929236499069:
30th- epoch: 449, train_loss = 13.956205812748522, train_acc = 0.9694923148579413
te

100%|████████████████████████████████████████████████████████████████████████| 30/30 [4:31:35<00:00, 543.20s/it]


Wall time: 4h 31min 38s
