In [1]:
import torch 
import json,pickle,math
import pandas as pd
import numpy as np
import torch.nn as nn
import torchvision
import torchvision.transforms as transforms


In [2]:
# Read the full DAVIS pair table; the context manager closes the file handle
# as soon as parsing finishes (the bare open() call never closed it).
with open('../davis_all_pairs.csv','r') as csv_file:
    full_df = pd.read_csv(csv_file)

In [3]:
# Load the 3x3 grid of pre-split fold files into a dict keyed by 'fold<i><j>'.
# NOTE(review): pd.read_pickle can execute arbitrary code contained in the file;
# only load fold files that come from a trusted source.
all_9_folds={}
for i in [0,1,2]:
    for j in [0,1,2]:
        file_name = 'fold' +str(i) +str(j)
        # The context manager closes the handle even if unpickling raises.
        with open('../data/davis/DAVIS_9_FOLDS/' + file_name +'.pkl', 'rb') as fold_file:
            all_9_folds[file_name] = pd.read_pickle(fold_file)
        

In [4]:
def create_davis_test_train(test_fold_number,all_9_folds):
    """Assemble train and test DataFrames from the 3x3 grid of folds.

    Parameters
    ----------
    test_fold_number : str
        Fold id such as '2x'. Only the first character is used: every fold
        'fold<i><j>' whose first index ``i`` equals it goes to the test set,
        all other folds go to the train set. The second character is ignored.
    all_9_folds : dict
        Maps 'fold<i><j>' (i, j in 0..2) to a DataFrame.

    Returns
    -------
    (train_set, test_set) : tuple of DataFrame
        Row-wise concatenations with a fresh 0..n-1 index. Columns follow
        ``full_df.columns`` first, then any extra fold columns.
    """
    test_protein_fold_id = test_fold_number[0]

    train_frames = []
    test_frames = []
    for i in [0,1,2]:
        for j in [0,1,2]:
            df = all_9_folds['fold' + str(i) + str(j)]
            if str(i) == test_protein_fold_id:
                test_frames.append(df)
            else:
                print("train ->",i, j)
                train_frames.append(df)

    def _combine(frames):
        # One concat per split instead of growing a frame inside the loop;
        # this also avoids concatenating onto an empty placeholder frame.
        if not frames:
            return pd.DataFrame(columns=full_df.columns)
        combined = pd.concat(frames, ignore_index=True)
        # Keep the column layout the placeholder-based version produced:
        # full_df's columns first, then columns that only the folds have.
        ordered = list(full_df.columns) + [
            col for col in combined.columns if col not in full_df.columns
        ]
        return combined.reindex(columns=ordered)

    return _combine(train_frames), _combine(test_frames)


# Create train test split on these 9 folds
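## fold_number is the id of the test fold. For example, test = fold00, train = folds 11, 12, 21, 22. In this notebook only the first character (the protein fold) is used by create_davis_test_train; the second character is a placeholder ('x').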

In [5]:
# Fold id of the held-out split. create_davis_test_train reads only the first
# character; the id is also embedded in the model/result file names below.
fold_number = '2x'

In [6]:
# Build the train/test DataFrames for the selected fold id.
train, test = create_davis_test_train(test_fold_number=fold_number, all_9_folds=all_9_folds)

train -> 0 0
train -> 0 1
train -> 0 2
train -> 1 0
train -> 1 1
train -> 1 2


In [7]:
train

Unnamed: 0,SMILES,Target Sequence,Label,drug_encoding,target_encoding
0,CCC1C(=O)N(C2=CN=C(N=C2N1C3CCCC3)NC4=C(C=C(C=C...,MSDVAIVKEGWLHKRGEYIKTWRPRYFLLKNDGTFIGYKERPQDVD...,5.000000,"[C, C, C, 1, C, (, =, O, ), N, (, C, 2, =, C, ...","[M, S, D, V, A, I, V, K, E, G, W, L, H, K, R, ..."
1,CN1C2=C(C=C(C=C2)OC3=CC(=NC=C3)C4=NC=C(N4)C(F)...,MSDVAIVKEGWLHKRGEYIKTWRPRYFLLKNDGTFIGYKERPQDVD...,5.000000,"[C, N, 1, C, 2, =, C, (, C, =, C, (, C, =, C, ...","[M, S, D, V, A, I, V, K, E, G, W, L, H, K, R, ..."
2,C1CC1CONC(=O)C2=C(C(=C(C=C2)F)F)NC3=C(C=C(C=C3...,MSDVAIVKEGWLHKRGEYIKTWRPRYFLLKNDGTFIGYKERPQDVD...,5.000000,"[C, 1, C, C, 1, C, O, N, C, (, =, O, ), C, 2, ...","[M, S, D, V, A, I, V, K, E, G, W, L, H, K, R, ..."
3,CC1=CC2=C(N1)C=CC(=C2F)OC3=NC=NC4=CC(=C(C=C43)...,MSDVAIVKEGWLHKRGEYIKTWRPRYFLLKNDGTFIGYKERPQDVD...,5.000000,"[C, C, 1, =, C, C, 2, =, C, (, N, 1, ), C, =, ...","[M, S, D, V, A, I, V, K, E, G, W, L, H, K, R, ..."
4,CC1=C(C(=CC=C1)Cl)NC(=O)C2=CN=C(S2)NC3=NC(=NC(...,MSDVAIVKEGWLHKRGEYIKTWRPRYFLLKNDGTFIGYKERPQDVD...,5.000000,"[C, C, 1, =, C, (, C, (, =, C, C, =, C, 1, ), ...","[M, S, D, V, A, I, V, K, E, G, W, L, H, K, R, ..."
...,...,...,...,...,...
20055,CN1C=NC2=C1C=C(C(=C2F)NC3=C(C=C(C=C3)Br)Cl)C(=...,MPDPAAHLPFFYGSISRAEAEEHLKLAGMADGLFLLRQCLRSLGGY...,5.000000,"[C, N, 1, C, =, N, C, 2, =, C, 1, C, =, C, (, ...","[M, P, D, P, A, A, H, L, P, F, F, Y, G, S, I, ..."
20056,CC(C)S(=O)(=O)C1=CC=CC=C1NC2=NC(=NC=C2Cl)NC3=C...,MPDPAAHLPFFYGSISRAEAEEHLKLAGMADGLFLLRQCLRSLGGY...,5.795880,"[C, C, (, C, ), S, (, =, O, ), (, =, O, ), C, ...","[M, P, D, P, A, A, H, L, P, F, F, Y, G, S, I, ..."
20057,C1=CC(=CC(=C1)O)C2=NC3=C(N=C2C4=CC(=CC=C4)O)N=...,MPDPAAHLPFFYGSISRAEAEEHLKLAGMADGLFLLRQCLRSLGGY...,5.000000,"[C, 1, =, C, C, (, =, C, C, (, =, C, 1, ), O, ...","[M, P, D, P, A, A, H, L, P, F, F, Y, G, S, I, ..."
20058,CC1=CN=C(N=C1NC2=CC(=CC=C2)S(=O)(=O)NC(C)(C)C)...,MPDPAAHLPFFYGSISRAEAEEHLKLAGMADGLFLLRQCLRSLGGY...,5.420216,"[C, C, 1, =, C, N, =, C, (, N, =, C, 1, N, C, ...","[M, P, D, P, A, A, H, L, P, F, F, Y, G, S, I, ..."


In [9]:
# test

# To ensure that there are no common targets or drugs in train and test


In [10]:
test_smiles = list(test['SMILES'])
test_targets = list(test['Target Sequence'])
train_smiles = list(train['SMILES'])
train_targets = list(train['Target Sequence'])

# for i in test_smiles:
#     if i in train_smiles:
#         print("common entity present")

# Check for targets shared between train and test. A set makes each membership
# test O(1) instead of scanning the whole train list for every test row; the
# printed output is unchanged (one line per test row whose target is in train).
train_target_set = set(train_targets)
for i in test_targets:
    if i in train_target_set:
        print("common entity present")


# Creating similarity matrices for this fold

In [11]:
import rdkit
from rdkit.Chem import AllChem as Chem
from rdkit.Chem import AllChem
from rdkit.DataStructs import FingerprintSimilarity as fs
from rdkit.Chem.Fingerprints import FingerprintMols
from Bio import pairwise2

In [12]:
# Unique train entities in a deterministic order. list(set(...)) follows string
# hash order, which changes between kernel runs, so the rows/columns of the
# similarity matrices (and hence the CNN input layout) would not be reproducible.
train_targets = sorted(set(train['Target Sequence']))
train_smiles = sorted(set(train['SMILES']))

def computeLigandSimilarity(smiles):
    """Return the symmetric pairwise fingerprint-similarity matrix for ``smiles``.

    Parameters
    ----------
    smiles : sequence of str
        SMILES strings; row/column ``k`` of the result corresponds to ``smiles[k]``.

    Returns
    -------
    numpy.ndarray of shape (len(smiles), len(smiles))
        Entry (i, j) is ``fs(fp_i, fp_j)`` using rdkit's FingerprintSimilarity
        with its default metric.

    Raises
    ------
    ValueError
        If a SMILES string cannot be parsed even with sanitization disabled.
    """
    fingerprints = []
    for smile in smiles:
        mol = AllChem.MolFromSmiles(smile)
        if mol is None:
            # Retry without sanitization for molecules rdkit rejects by default.
            mol = AllChem.MolFromSmiles(smile, sanitize=False)
        if mol is None:
            raise ValueError('could not parse SMILES: {!r}'.format(smile))
        fingerprints.append(FingerprintMols.FingerprintMol(mol))

    n = len(smiles)
    sims = np.zeros((n, n))
    for i in range(n):
        fpi = fingerprints[i]
        # Fill the lower triangle (diagonal included) and mirror it.
        for j in range(i+1):
            sims[i, j] = sims[j, i] = fs(fpi, fingerprints[j])
    return sims

def computeProteinSimilarity(targets, verbose=True):
    """Return the normalized pairwise local-alignment similarity matrix.

    Entry (i, j) is ``score(s_i, s_j) / sqrt(score(s_i, s_i) * score(s_j, s_j))``
    where ``score`` is ``pairwise2.align.localxx(..., score_only=True)``.

    Parameters
    ----------
    targets : sequence of str
        Sequences; row/column ``k`` of the result corresponds to ``targets[k]``.
    verbose : bool, optional
        When True (default) the current row index is printed as progress.

    Returns
    -------
    numpy.ndarray of shape (len(targets), len(targets))
    """
    n = len(targets)

    # Self-alignment scores used as the normalization terms.
    mat_i = np.zeros(n)
    for i in range(n):
        seq = targets[i]
        mat_i[i] = pairwise2.align.localxx(seq,seq, score_only=True)

    mat = np.zeros((n,n))
    for i in range(n):
        if verbose:
            print(i)
        s1 = targets[i]
        # Walk the upper triangle only and mirror each value, instead of using
        # "entry is still 0" as the marker for pairs not yet computed.
        for j in range(i, n):
            sw_ij = pairwise2.align.localxx(s1,targets[j],score_only=True)
            normalized_score = sw_ij /math.sqrt(mat_i[i]*mat_i[j])
            mat[i][j] = mat[j][i] = normalized_score

    return mat

In [13]:
ligand_similarity_matrix = computeLigandSimilarity(train_smiles)

In [14]:
np.shape(ligand_similarity_matrix)

(68, 68)

In [15]:
print(len(train_targets))
protein_similarity_matrix = computeProteinSimilarity(train_targets)

273
0
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272


In [16]:
np.shape(protein_similarity_matrix)

(273, 273)

In [17]:
# Short aliases for the train-vs-train similarity matrices; the outer-product
# cell below indexes their rows by ligand / target position.
LSM = ligand_similarity_matrix
PSM = protein_similarity_matrix

# creating outer products for train set

In [18]:
# Position lookup tables built once. setdefault keeps the first occurrence,
# which is exactly what list.index() returned, without a linear scan per row.
train_target_pos = {}
for pos, seq in enumerate(train_targets):
    train_target_pos.setdefault(seq, pos)
train_smiles_pos = {}
for pos, smi in enumerate(train_smiles):
    train_smiles_pos.setdefault(smi, pos)

# One feature map per train row: outer product of the ligand's similarity row
# and the target's similarity row, wrapped in a list to add a channel axis.
outer_train_prods = []
for smi, seq in zip(train['SMILES'], train['Target Sequence']):
    ki=LSM[train_smiles_pos[smi]]
    kj=PSM[train_target_pos[seq]]
    ki_x_kj = np.outer(ki,kj)
    outer_train_prods.append([ki_x_kj])
outer_train_prods = np.array(outer_train_prods)
print(np.shape(outer_train_prods))

(20060, 1, 68, 273)


# Creating similarity matrices for test set

In [19]:
# Unique test entities in a deterministic order (list(set(...)) follows string
# hash order, which differs between kernel runs).
test_targets = sorted(set(test['Target Sequence']))
test_smiles = sorted(set(test['SMILES']))

In [20]:
test_PSM = np.zeros((len(test_targets), len(train_targets)))
np.shape(test_PSM)

(106, 273)

In [21]:
# Self-alignment scores of every train and test target; they are the
# normalization terms for the cross similarities filled in below.
s_train_PSM = np.zeros(len(train_targets))
s_test_PSM = np.zeros(len(test_targets))

for i, seq in enumerate(train_targets):
    s_train_PSM[i] = pairwise2.align.localxx(seq,seq, score_only=True)

for i, seq in enumerate(test_targets):
    s_test_PSM[i] = pairwise2.align.localxx(seq,seq, score_only=True)

# test_PSM[i][j] = score(test_i, train_j) / sqrt(self(train_j) * self(test_i))
for i, seq1 in enumerate(test_targets):
    print(i)
    for j, seq2 in enumerate(train_targets):
        s_ij=pairwise2.align.localxx(seq1, seq2, score_only=True)
        test_PSM[i][j] = s_ij / math.sqrt(s_train_PSM[j] * s_test_PSM[i])

0
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105


In [22]:
test_LSM = np.zeros((len(test_smiles), len(train_smiles)))
np.shape(test_LSM)

(68, 68)

In [23]:
def _fingerprint_from_smiles(smi):
    """Return the rdkit fingerprint of a SMILES string, retrying without sanitization."""
    mol = AllChem.MolFromSmiles(smi)
    if mol is None:
        mol = AllChem.MolFromSmiles(smi, sanitize=False)
    return FingerprintMols.FingerprintMol(mol)

# Fingerprint every molecule once up front; previously both molecules were
# re-parsed and re-fingerprinted for every (test, train) pair.
test_fps = [_fingerprint_from_smiles(smi) for smi in test_smiles]
train_fps = [_fingerprint_from_smiles(smi) for smi in train_smiles]

# test_LSM[i][j] = similarity between test ligand i and train ligand j.
for i in range(len(test_smiles)):
    print(i)
    for j in range(len(train_smiles)):
        test_LSM[i][j] = fs(test_fps[i], train_fps[j])

0
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67


# Creating outer products for test set

In [24]:
# Position lookup tables built once. setdefault keeps the first occurrence,
# which is exactly what list.index() returned, without a linear scan per row.
test_target_pos = {}
for pos, seq in enumerate(test_targets):
    test_target_pos.setdefault(seq, pos)
test_smiles_pos = {}
for pos, smi in enumerate(test_smiles):
    test_smiles_pos.setdefault(smi, pos)

# One feature map per test row: outer product of the ligand's test-vs-train
# similarity row and the target's test-vs-train similarity row, wrapped in a
# list to add a channel axis.
outer_test_prods = []
for smi, seq in zip(test['SMILES'], test['Target Sequence']):
    ki=test_LSM[test_smiles_pos[smi]]
    kj=test_PSM[test_target_pos[seq]]
    ki_x_kj = np.outer(ki,kj)
    outer_test_prods.append([ki_x_kj])
outer_test_prods = np.array(outer_test_prods)
print(np.shape(outer_test_prods))

(9996, 1, 68, 273)


In [25]:
# Device configuration: use the first CUDA device when available, else the CPU.
device = torch.device('cuda:0' if torch.cuda.is_available() else 'cpu')

# Hyper parameters
num_epochs = 20        # full passes over train_loader in the training loop
# num_classes = 10
batch_size = 32        # passed to both DataLoaders
learning_rate = 0.001  # passed to the Adam optimizer

In [26]:
device

device(type='cuda', index=0)

In [27]:
class custom_dataset(torch.utils.data.Dataset):
    """Dataset pairing each DataFrame row with its precomputed feature map.

    Item ``idx`` is a dict with ``'outer_product'`` (``outer_prods[idx]``) and
    ``'Label'`` (the ``'Label'`` value of row ``idx`` of the DataFrame).
    """

    def __init__(self, dataframe, outer_prods, transform=None):
        self.df = dataframe
        # Stored for callers; __getitem__ does not apply it.
        self.transform = transform
        self.outer_prods = outer_prods

    def __len__(self):
        # The DataFrame defines the number of samples.
        return len(self.df)

    def __getitem__(self, idx):
        features = self.outer_prods[idx]
        label = self.df.iloc[idx]['Label']
        return {'outer_product': features, 'Label': label}

In [28]:
train_dataset = custom_dataset(dataframe = train, outer_prods = outer_train_prods)
test_dataset = custom_dataset(dataframe = test, outer_prods = outer_test_prods)


In [29]:
# Training batches are reshuffled every epoch.
train_loader= torch.utils.data.DataLoader(train_dataset, batch_size=batch_size, shuffle=True)
# Evaluation does not need shuffling; a fixed order keeps the predictions
# returned for this loader aligned with the rows of `test`.
test_loader= torch.utils.data.DataLoader(test_dataset, batch_size=batch_size, shuffle=False)

In [30]:
# Upper bound on samples per epoch (number of batches x batch size); uses
# batch_size rather than a hard-coded 32 so it stays right if the setting changes.
print(len(train_loader)*batch_size, len(test_loader)*batch_size)

20064 10016


In [33]:
# for i in test_loader:
#     a = i['outer_product']
#     b= i['Label']
#     break
# conv1 = nn.Conv2d(1,32,5).double()
# pool = nn.MaxPool2d(2,2).double()
# conv2 = nn.Conv2d(32,18,3).double()
# fc1 = nn.Linear(18*15*66, 128).double()
# fc2 = nn.Linear(128,1).double()
# dropout = nn.Dropout(0.1).double()
# x= conv1(a)
# print(x.shape)
# x = pool(x)
# print(x.shape)
# x= conv2(x)
# print(x.shape)
# x = pool(x)
# print(x.shape)
# x = x.view(-1,18*15*66)
# print(x.shape)
# x = dropout(x)
# print(x.shape)
# x = fc1(x)
# print(x.shape)
# x = fc2(x)
# print(x.shape)

torch.Size([32, 32, 64, 269])
torch.Size([32, 32, 32, 134])
torch.Size([32, 18, 30, 132])
torch.Size([32, 18, 15, 66])
torch.Size([32, 17820])
torch.Size([32, 17820])
torch.Size([32, 128])
torch.Size([32, 1])


In [34]:
import torch.nn.functional as F

class ConvNet(nn.Module):
    """Two-layer CNN regressor over single-channel, double-precision feature maps.

    Layout: conv(1->32, 5x5) -> ReLU -> maxpool(2) -> conv(32->18, 3x3) -> ReLU
    -> maxpool(2) -> flatten -> dropout(0.1) -> fc(128) -> ReLU -> fc(1).

    Parameters
    ----------
    input_shape : tuple of int, optional
        (height, width) of the input maps. The default (68, 273) gives the
        original flattened size of 18*15*66; other values let the network be
        used when the number of train ligands/targets differs.

    Raises
    ------
    ValueError
        If ``input_shape`` is too small to survive both conv/pool stages.
    """
    def __init__(self, input_shape=(68, 273)):
        super(ConvNet, self).__init__()
        self.conv1 = nn.Conv2d(1,32, 5).double()
        # Pooling and dropout have no parameters, so no dtype cast is needed.
        self.pool1 = nn.MaxPool2d(2,2)
        self.conv2 = nn.Conv2d(32,18,3).double()
        self.pool2 = nn.MaxPool2d(2,2)

        # Spatial size after the stack: an unpadded 5x5 conv trims 4, each
        # 2x2/stride-2 pool floors the halved size, an unpadded 3x3 conv trims 2.
        height, width = input_shape
        height = ((height - 4) // 2 - 2) // 2
        width = ((width - 4) // 2 - 2) // 2
        if height < 1 or width < 1:
            raise ValueError('input_shape {!r} is too small for ConvNet'.format(input_shape))

        self.fc1 = nn.Linear(18*height*width, 128).double()
        self.fc2 = nn.Linear(128,1).double()
        self.dropout = nn.Dropout(0.1)

    def forward(self, x):
        """Map a (batch, 1, height, width) double tensor to a (batch, 1) prediction."""
        x = F.relu(self.conv1(x))
        x = self.pool1(x)
        x = F.relu(self.conv2(x))
        x = self.pool2(x)
        # Flatten to the feature count fc1 was built for.
        x = x.view(-1, self.fc1.in_features)
        x = self.dropout(x)
        x = F.relu(self.fc1(x))
        x = self.fc2(x)
        return x
    

In [35]:
model = ConvNet().to(device)

In [36]:
# Loss and optimizer
criterion = nn.MSELoss()
optimizer = torch.optim.Adam(model.parameters(), lr=learning_rate)


# Evaluation metrics

In [37]:
def rmse(y,f):
    """Root-mean-square error between ground truth ``y`` and predictions ``f``."""
    squared_error = (y - f)**2
    return math.sqrt(squared_error.mean(axis=0))
def mse(y,f):
    """Mean squared error between ground truth ``y`` and predictions ``f``."""
    squared_error = (y - f)**2
    return squared_error.mean(axis=0)
def pearson(y,f):
    """Pearson correlation coefficient between ``y`` and ``f``."""
    # Off-diagonal entry of the 2x2 correlation matrix.
    correlation_matrix = np.corrcoef(y, f)
    return correlation_matrix[0,1]
from lifelines.utils import concordance_index
def ci(y,f):
    """Concordance index of ``f`` against ``y``; forwards both arguments unchanged to lifelines' ``concordance_index``."""
    return concordance_index(y,f)

In [38]:
def predicting(model, device, test_loader):
    """Run ``model`` over ``test_loader`` and collect labels and predictions.

    Parameters
    ----------
    model : torch.nn.Module
        Called on each batch's ``'outer_product'`` tensor.
    device : torch.device
        Device the inputs are moved to before the forward pass.
    test_loader : iterable
        Yields dict batches with ``'outer_product'`` and ``'Label'`` tensors.

    Returns
    -------
    (total_labels, total_preds) : tuple of 1-D numpy.ndarray
        Flattened labels and predictions in iteration order; both are empty
        arrays when the loader yields nothing.

    Notes
    -----
    The model is put in eval mode for the pass and then restored to whatever
    mode it was in before the call (even if the forward pass raises), so an
    eval-mode model is no longer silently switched to training mode.
    """
    was_training = model.training
    model.eval()
    # Seed with an empty float64 array so the result dtype and the
    # empty-loader result match repeated concatenation onto np.array([]).
    pred_chunks = [np.array([])]
    label_chunks = [np.array([])]
    try:
        with torch.no_grad():
            for batch in test_loader:
                images = batch['outer_product'].to(device)

                # Forward pass
                outputs = model(images)
                pred_chunks.append(outputs.cpu().detach().numpy().flatten())
                # Labels are only collected, so they never need to visit the device.
                label_chunks.append(batch['Label'].cpu().detach().numpy().flatten())
    finally:
        model.train(was_training)

    # Single concatenation instead of re-copying the accumulated arrays per batch.
    total_labels = np.concatenate(label_chunks)
    total_preds = np.concatenate(pred_chunks)
    return total_labels, total_preds

# Train the model


In [39]:
model_file_name = 'best_sim-CNN-DTA_davis_fold' + fold_number +  '.model'
result_file_name = 'best_result_sim-CNNDTA_davis_fold'+fold_number + '.csv'

In [40]:
# Train the model
best_mse = 1000
best_ci = 0

total_step = len(train_loader)
for epoch in range(num_epochs):
    c=0
    for i in train_loader:
        c=c+1
        images = i['outer_product']
        labels = i['Label']
        images = images.to(device)
        labels = labels.to(device)
        
        # Forward pass
        outputs = model(images)
        loss = criterion(outputs.flatten(), labels)
        
        # Backward and optimize
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()
           
        print ('Epoch [{}/{}], Step [{}/{}], Loss: {:.4f}' 
               .format(epoch+1, num_epochs, c, total_step, loss.item()))
    
    # taking best model so far
    G,P = predicting(model, device, test_loader)
    ret = [rmse(G, P), mse(G, P), pearson(G, P), ci(G, P)]
    if ret[1] < best_mse:
        torch.save(model.state_dict(), model_file_name)
        with open(result_file_name, 'w') as f:
            f.write(','.join(map(str, ret)))
        best_epoch = epoch+1
        best_mse = ret[1]
        best_ci = ret[-1]
        best_r = ret[2]
        
        print('rmse improved at epoch ', best_epoch,
                      '; best_mse,best_ci,best_r:', best_mse, best_ci,best_r)
        
        

Epoch [1/20], Step [1/627], Loss: 30.0014
Epoch [1/20], Step [2/627], Loss: 16.1782
Epoch [1/20], Step [3/627], Loss: 2.7980
Epoch [1/20], Step [4/627], Loss: 9.9136
Epoch [1/20], Step [5/627], Loss: 6.9843
Epoch [1/20], Step [6/627], Loss: 1.5928
Epoch [1/20], Step [7/627], Loss: 1.2610
Epoch [1/20], Step [8/627], Loss: 2.5849
Epoch [1/20], Step [9/627], Loss: 3.2998
Epoch [1/20], Step [10/627], Loss: 3.5986
Epoch [1/20], Step [11/627], Loss: 2.5553
Epoch [1/20], Step [12/627], Loss: 2.5153
Epoch [1/20], Step [13/627], Loss: 0.3023
Epoch [1/20], Step [14/627], Loss: 0.9530
Epoch [1/20], Step [15/627], Loss: 1.2719
Epoch [1/20], Step [16/627], Loss: 1.8864
Epoch [1/20], Step [17/627], Loss: 1.9128
Epoch [1/20], Step [18/627], Loss: 0.9533
Epoch [1/20], Step [19/627], Loss: 0.7578
Epoch [1/20], Step [20/627], Loss: 0.5378
Epoch [1/20], Step [21/627], Loss: 2.3224
Epoch [1/20], Step [22/627], Loss: 0.7947
Epoch [1/20], Step [23/627], Loss: 0.8847
Epoch [1/20], Step [24/627], Loss: 0.5715

Epoch [1/20], Step [194/627], Loss: 0.5164
Epoch [1/20], Step [195/627], Loss: 1.4232
Epoch [1/20], Step [196/627], Loss: 1.6416
Epoch [1/20], Step [197/627], Loss: 0.8444
Epoch [1/20], Step [198/627], Loss: 0.7393
Epoch [1/20], Step [199/627], Loss: 1.1704
Epoch [1/20], Step [200/627], Loss: 0.8302
Epoch [1/20], Step [201/627], Loss: 0.4939
Epoch [1/20], Step [202/627], Loss: 1.2392
Epoch [1/20], Step [203/627], Loss: 0.6399
Epoch [1/20], Step [204/627], Loss: 1.1487
Epoch [1/20], Step [205/627], Loss: 0.4338
Epoch [1/20], Step [206/627], Loss: 1.0681
Epoch [1/20], Step [207/627], Loss: 0.8815
Epoch [1/20], Step [208/627], Loss: 1.3698
Epoch [1/20], Step [209/627], Loss: 1.0289
Epoch [1/20], Step [210/627], Loss: 0.2775
Epoch [1/20], Step [211/627], Loss: 0.7088
Epoch [1/20], Step [212/627], Loss: 1.3011
Epoch [1/20], Step [213/627], Loss: 1.3497
Epoch [1/20], Step [214/627], Loss: 0.5508
Epoch [1/20], Step [215/627], Loss: 0.3815
Epoch [1/20], Step [216/627], Loss: 0.7901
Epoch [1/20

Epoch [1/20], Step [389/627], Loss: 0.8031
Epoch [1/20], Step [390/627], Loss: 0.5064
Epoch [1/20], Step [391/627], Loss: 0.5955
Epoch [1/20], Step [392/627], Loss: 0.4107
Epoch [1/20], Step [393/627], Loss: 0.6968
Epoch [1/20], Step [394/627], Loss: 0.3888
Epoch [1/20], Step [395/627], Loss: 0.5025
Epoch [1/20], Step [396/627], Loss: 0.8515
Epoch [1/20], Step [397/627], Loss: 0.4768
Epoch [1/20], Step [398/627], Loss: 0.6356
Epoch [1/20], Step [399/627], Loss: 0.3696
Epoch [1/20], Step [400/627], Loss: 1.0992
Epoch [1/20], Step [401/627], Loss: 0.6948
Epoch [1/20], Step [402/627], Loss: 0.3229
Epoch [1/20], Step [403/627], Loss: 0.6128
Epoch [1/20], Step [404/627], Loss: 0.6784
Epoch [1/20], Step [405/627], Loss: 0.2711
Epoch [1/20], Step [406/627], Loss: 1.7379
Epoch [1/20], Step [407/627], Loss: 0.3487
Epoch [1/20], Step [408/627], Loss: 0.8574
Epoch [1/20], Step [409/627], Loss: 0.3506
Epoch [1/20], Step [410/627], Loss: 1.2906
Epoch [1/20], Step [411/627], Loss: 0.4220
Epoch [1/20

Epoch [1/20], Step [584/627], Loss: 0.4404
Epoch [1/20], Step [585/627], Loss: 0.5426
Epoch [1/20], Step [586/627], Loss: 0.7887
Epoch [1/20], Step [587/627], Loss: 0.4075
Epoch [1/20], Step [588/627], Loss: 0.6452
Epoch [1/20], Step [589/627], Loss: 0.8843
Epoch [1/20], Step [590/627], Loss: 1.2980
Epoch [1/20], Step [591/627], Loss: 0.5007
Epoch [1/20], Step [592/627], Loss: 0.3206
Epoch [1/20], Step [593/627], Loss: 0.4733
Epoch [1/20], Step [594/627], Loss: 0.6259
Epoch [1/20], Step [595/627], Loss: 0.1586
Epoch [1/20], Step [596/627], Loss: 0.4006
Epoch [1/20], Step [597/627], Loss: 0.5003
Epoch [1/20], Step [598/627], Loss: 0.7186
Epoch [1/20], Step [599/627], Loss: 0.3383
Epoch [1/20], Step [600/627], Loss: 0.6910
Epoch [1/20], Step [601/627], Loss: 0.8383
Epoch [1/20], Step [602/627], Loss: 1.1843
Epoch [1/20], Step [603/627], Loss: 0.5538
Epoch [1/20], Step [604/627], Loss: 0.6320
Epoch [1/20], Step [605/627], Loss: 0.6666
Epoch [1/20], Step [606/627], Loss: 0.3603
Epoch [1/20

Epoch [2/20], Step [150/627], Loss: 0.8469
Epoch [2/20], Step [151/627], Loss: 0.9062
Epoch [2/20], Step [152/627], Loss: 0.6838
Epoch [2/20], Step [153/627], Loss: 1.0729
Epoch [2/20], Step [154/627], Loss: 0.7749
Epoch [2/20], Step [155/627], Loss: 0.4849
Epoch [2/20], Step [156/627], Loss: 0.7034
Epoch [2/20], Step [157/627], Loss: 0.4648
Epoch [2/20], Step [158/627], Loss: 0.9522
Epoch [2/20], Step [159/627], Loss: 0.6473
Epoch [2/20], Step [160/627], Loss: 0.6090
Epoch [2/20], Step [161/627], Loss: 0.6269
Epoch [2/20], Step [162/627], Loss: 0.4552
Epoch [2/20], Step [163/627], Loss: 0.5436
Epoch [2/20], Step [164/627], Loss: 0.3717
Epoch [2/20], Step [165/627], Loss: 0.5912
Epoch [2/20], Step [166/627], Loss: 0.4000
Epoch [2/20], Step [167/627], Loss: 0.4999
Epoch [2/20], Step [168/627], Loss: 0.5706
Epoch [2/20], Step [169/627], Loss: 0.5887
Epoch [2/20], Step [170/627], Loss: 0.5142
Epoch [2/20], Step [171/627], Loss: 0.4392
Epoch [2/20], Step [172/627], Loss: 0.3884
Epoch [2/20

Epoch [2/20], Step [345/627], Loss: 0.8611
Epoch [2/20], Step [346/627], Loss: 0.3999
Epoch [2/20], Step [347/627], Loss: 0.8799
Epoch [2/20], Step [348/627], Loss: 0.3053
Epoch [2/20], Step [349/627], Loss: 1.1880
Epoch [2/20], Step [350/627], Loss: 0.7937
Epoch [2/20], Step [351/627], Loss: 0.9510
Epoch [2/20], Step [352/627], Loss: 0.2276
Epoch [2/20], Step [353/627], Loss: 1.3778
Epoch [2/20], Step [354/627], Loss: 0.7006
Epoch [2/20], Step [355/627], Loss: 1.3171
Epoch [2/20], Step [356/627], Loss: 0.4164
Epoch [2/20], Step [357/627], Loss: 0.3999
Epoch [2/20], Step [358/627], Loss: 0.6093
Epoch [2/20], Step [359/627], Loss: 1.2321
Epoch [2/20], Step [360/627], Loss: 0.4847
Epoch [2/20], Step [361/627], Loss: 0.2763
Epoch [2/20], Step [362/627], Loss: 0.2750
Epoch [2/20], Step [363/627], Loss: 0.7978
Epoch [2/20], Step [364/627], Loss: 0.5100
Epoch [2/20], Step [365/627], Loss: 0.3436
Epoch [2/20], Step [366/627], Loss: 0.2736
Epoch [2/20], Step [367/627], Loss: 0.7167
Epoch [2/20

Epoch [2/20], Step [539/627], Loss: 1.0868
Epoch [2/20], Step [540/627], Loss: 0.4035
Epoch [2/20], Step [541/627], Loss: 0.3954
Epoch [2/20], Step [542/627], Loss: 0.4419
Epoch [2/20], Step [543/627], Loss: 0.6903
Epoch [2/20], Step [544/627], Loss: 0.5848
Epoch [2/20], Step [545/627], Loss: 0.6204
Epoch [2/20], Step [546/627], Loss: 0.5992
Epoch [2/20], Step [547/627], Loss: 0.2356
Epoch [2/20], Step [548/627], Loss: 0.8683
Epoch [2/20], Step [549/627], Loss: 0.4512
Epoch [2/20], Step [550/627], Loss: 0.2433
Epoch [2/20], Step [551/627], Loss: 0.1607
Epoch [2/20], Step [552/627], Loss: 0.5406
Epoch [2/20], Step [553/627], Loss: 1.3573
Epoch [2/20], Step [554/627], Loss: 0.7162
Epoch [2/20], Step [555/627], Loss: 0.6136
Epoch [2/20], Step [556/627], Loss: 0.4427
Epoch [2/20], Step [557/627], Loss: 0.5577
Epoch [2/20], Step [558/627], Loss: 0.4770
Epoch [2/20], Step [559/627], Loss: 0.6017
Epoch [2/20], Step [560/627], Loss: 0.5490
Epoch [2/20], Step [561/627], Loss: 0.2278
Epoch [2/20

Epoch [3/20], Step [104/627], Loss: 0.2437
Epoch [3/20], Step [105/627], Loss: 0.3917
Epoch [3/20], Step [106/627], Loss: 0.4205
Epoch [3/20], Step [107/627], Loss: 0.4890
Epoch [3/20], Step [108/627], Loss: 0.2786
Epoch [3/20], Step [109/627], Loss: 1.4340
Epoch [3/20], Step [110/627], Loss: 0.7692
Epoch [3/20], Step [111/627], Loss: 0.2301
Epoch [3/20], Step [112/627], Loss: 0.6624
Epoch [3/20], Step [113/627], Loss: 0.6683
Epoch [3/20], Step [114/627], Loss: 0.5392
Epoch [3/20], Step [115/627], Loss: 0.4285
Epoch [3/20], Step [116/627], Loss: 0.7814
Epoch [3/20], Step [117/627], Loss: 1.3712
Epoch [3/20], Step [118/627], Loss: 0.2986
Epoch [3/20], Step [119/627], Loss: 0.5481
Epoch [3/20], Step [120/627], Loss: 0.8990
Epoch [3/20], Step [121/627], Loss: 0.4648
Epoch [3/20], Step [122/627], Loss: 0.5637
Epoch [3/20], Step [123/627], Loss: 0.3093
Epoch [3/20], Step [124/627], Loss: 0.3374
Epoch [3/20], Step [125/627], Loss: 2.0384
Epoch [3/20], Step [126/627], Loss: 1.1574
Epoch [3/20

Epoch [3/20], Step [299/627], Loss: 0.7449
Epoch [3/20], Step [300/627], Loss: 0.5037
Epoch [3/20], Step [301/627], Loss: 0.3018
Epoch [3/20], Step [302/627], Loss: 0.3280
Epoch [3/20], Step [303/627], Loss: 0.5604
Epoch [3/20], Step [304/627], Loss: 0.6896
Epoch [3/20], Step [305/627], Loss: 0.2902
Epoch [3/20], Step [306/627], Loss: 0.5486
Epoch [3/20], Step [307/627], Loss: 0.5618
Epoch [3/20], Step [308/627], Loss: 0.3828
Epoch [3/20], Step [309/627], Loss: 0.2516
Epoch [3/20], Step [310/627], Loss: 1.2830
Epoch [3/20], Step [311/627], Loss: 0.7900
Epoch [3/20], Step [312/627], Loss: 0.4376
Epoch [3/20], Step [313/627], Loss: 0.2989
Epoch [3/20], Step [314/627], Loss: 0.8473
Epoch [3/20], Step [315/627], Loss: 0.6899
Epoch [3/20], Step [316/627], Loss: 0.5441
Epoch [3/20], Step [317/627], Loss: 0.6382
Epoch [3/20], Step [318/627], Loss: 0.9712
Epoch [3/20], Step [319/627], Loss: 0.6712
Epoch [3/20], Step [320/627], Loss: 0.6386
Epoch [3/20], Step [321/627], Loss: 0.2939
Epoch [3/20

Epoch [3/20], Step [492/627], Loss: 0.8873
Epoch [3/20], Step [493/627], Loss: 0.7380
Epoch [3/20], Step [494/627], Loss: 0.6161
Epoch [3/20], Step [495/627], Loss: 0.4356
Epoch [3/20], Step [496/627], Loss: 0.3878
Epoch [3/20], Step [497/627], Loss: 0.2481
Epoch [3/20], Step [498/627], Loss: 1.0260
Epoch [3/20], Step [499/627], Loss: 0.3294
Epoch [3/20], Step [500/627], Loss: 0.3463
Epoch [3/20], Step [501/627], Loss: 0.3394
Epoch [3/20], Step [502/627], Loss: 0.6335
Epoch [3/20], Step [503/627], Loss: 0.2804
Epoch [3/20], Step [504/627], Loss: 0.5320
Epoch [3/20], Step [505/627], Loss: 0.2746
Epoch [3/20], Step [506/627], Loss: 0.5881
Epoch [3/20], Step [507/627], Loss: 0.6152
Epoch [3/20], Step [508/627], Loss: 0.3466
Epoch [3/20], Step [509/627], Loss: 0.7508
Epoch [3/20], Step [510/627], Loss: 0.2337
Epoch [3/20], Step [511/627], Loss: 0.6000
Epoch [3/20], Step [512/627], Loss: 0.1955
Epoch [3/20], Step [513/627], Loss: 0.2885
Epoch [3/20], Step [514/627], Loss: 0.6514
Epoch [3/20

Epoch [4/20], Step [59/627], Loss: 0.2658
Epoch [4/20], Step [60/627], Loss: 0.5525
Epoch [4/20], Step [61/627], Loss: 0.3110
Epoch [4/20], Step [62/627], Loss: 0.6341
Epoch [4/20], Step [63/627], Loss: 0.3210
Epoch [4/20], Step [64/627], Loss: 0.5411
Epoch [4/20], Step [65/627], Loss: 0.6283
Epoch [4/20], Step [66/627], Loss: 0.5637
Epoch [4/20], Step [67/627], Loss: 0.6269
Epoch [4/20], Step [68/627], Loss: 0.5810
Epoch [4/20], Step [69/627], Loss: 0.5267
Epoch [4/20], Step [70/627], Loss: 0.3497
Epoch [4/20], Step [71/627], Loss: 0.6344
Epoch [4/20], Step [72/627], Loss: 0.6504
Epoch [4/20], Step [73/627], Loss: 0.5947
Epoch [4/20], Step [74/627], Loss: 0.4288
Epoch [4/20], Step [75/627], Loss: 0.7438
Epoch [4/20], Step [76/627], Loss: 0.2963
Epoch [4/20], Step [77/627], Loss: 0.7160
Epoch [4/20], Step [78/627], Loss: 0.7581
Epoch [4/20], Step [79/627], Loss: 0.2066
Epoch [4/20], Step [80/627], Loss: 0.3452
Epoch [4/20], Step [81/627], Loss: 0.3963
Epoch [4/20], Step [82/627], Loss:

Epoch [4/20], Step [253/627], Loss: 0.6278
Epoch [4/20], Step [254/627], Loss: 0.4247
Epoch [4/20], Step [255/627], Loss: 0.5478
Epoch [4/20], Step [256/627], Loss: 0.4855
Epoch [4/20], Step [257/627], Loss: 0.3455
Epoch [4/20], Step [258/627], Loss: 0.5522
Epoch [4/20], Step [259/627], Loss: 0.5637
Epoch [4/20], Step [260/627], Loss: 1.8951
Epoch [4/20], Step [261/627], Loss: 0.2601
Epoch [4/20], Step [262/627], Loss: 0.5199
Epoch [4/20], Step [263/627], Loss: 0.4963
Epoch [4/20], Step [264/627], Loss: 0.5249
Epoch [4/20], Step [265/627], Loss: 0.4126
Epoch [4/20], Step [266/627], Loss: 0.2456
Epoch [4/20], Step [267/627], Loss: 0.3131
Epoch [4/20], Step [268/627], Loss: 0.7298
Epoch [4/20], Step [269/627], Loss: 0.8291
Epoch [4/20], Step [270/627], Loss: 0.5474
Epoch [4/20], Step [271/627], Loss: 0.4186
Epoch [4/20], Step [272/627], Loss: 0.4567
Epoch [4/20], Step [273/627], Loss: 0.5229
Epoch [4/20], Step [274/627], Loss: 0.6074
Epoch [4/20], Step [275/627], Loss: 0.5178
Epoch [4/20

Epoch [4/20], Step [444/627], Loss: 0.5704
Epoch [4/20], Step [445/627], Loss: 1.0917
Epoch [4/20], Step [446/627], Loss: 0.4541
Epoch [4/20], Step [447/627], Loss: 0.4433
Epoch [4/20], Step [448/627], Loss: 0.5653
Epoch [4/20], Step [449/627], Loss: 0.4900
Epoch [4/20], Step [450/627], Loss: 0.4626
Epoch [4/20], Step [451/627], Loss: 0.5443
Epoch [4/20], Step [452/627], Loss: 0.5241
Epoch [4/20], Step [453/627], Loss: 0.4765
Epoch [4/20], Step [454/627], Loss: 0.3731
Epoch [4/20], Step [455/627], Loss: 0.5528
Epoch [4/20], Step [456/627], Loss: 0.5906
Epoch [4/20], Step [457/627], Loss: 0.6200
Epoch [4/20], Step [458/627], Loss: 0.4659
Epoch [4/20], Step [459/627], Loss: 0.9114
Epoch [4/20], Step [460/627], Loss: 0.6809
Epoch [4/20], Step [461/627], Loss: 0.2659
Epoch [4/20], Step [462/627], Loss: 0.3659
Epoch [4/20], Step [463/627], Loss: 0.5226
Epoch [4/20], Step [464/627], Loss: 0.3471
Epoch [4/20], Step [465/627], Loss: 0.4623
Epoch [4/20], Step [466/627], Loss: 0.5831
Epoch [4/20

Epoch [5/20], Step [11/627], Loss: 0.6298
Epoch [5/20], Step [12/627], Loss: 0.1748
Epoch [5/20], Step [13/627], Loss: 1.1313
Epoch [5/20], Step [14/627], Loss: 0.6639
Epoch [5/20], Step [15/627], Loss: 0.4433
Epoch [5/20], Step [16/627], Loss: 0.3057
Epoch [5/20], Step [17/627], Loss: 0.5527
Epoch [5/20], Step [18/627], Loss: 0.9889
Epoch [5/20], Step [19/627], Loss: 0.3591
Epoch [5/20], Step [20/627], Loss: 0.4431
Epoch [5/20], Step [21/627], Loss: 0.4429
Epoch [5/20], Step [22/627], Loss: 0.1745
Epoch [5/20], Step [23/627], Loss: 0.5074
Epoch [5/20], Step [24/627], Loss: 0.8690
Epoch [5/20], Step [25/627], Loss: 0.3237
Epoch [5/20], Step [26/627], Loss: 0.4521
Epoch [5/20], Step [27/627], Loss: 0.5869
Epoch [5/20], Step [28/627], Loss: 0.7481
Epoch [5/20], Step [29/627], Loss: 0.7307
Epoch [5/20], Step [30/627], Loss: 0.7063
Epoch [5/20], Step [31/627], Loss: 0.8115
Epoch [5/20], Step [32/627], Loss: 0.2875
Epoch [5/20], Step [33/627], Loss: 0.2294
Epoch [5/20], Step [34/627], Loss:

Epoch [5/20], Step [208/627], Loss: 0.4155
Epoch [5/20], Step [209/627], Loss: 0.6641
Epoch [5/20], Step [210/627], Loss: 0.4384
Epoch [5/20], Step [211/627], Loss: 0.4604
Epoch [5/20], Step [212/627], Loss: 0.4457
Epoch [5/20], Step [213/627], Loss: 0.4792
Epoch [5/20], Step [214/627], Loss: 0.4850
Epoch [5/20], Step [215/627], Loss: 0.5370
Epoch [5/20], Step [216/627], Loss: 0.1842
Epoch [5/20], Step [217/627], Loss: 0.1698
Epoch [5/20], Step [218/627], Loss: 0.3986
Epoch [5/20], Step [219/627], Loss: 0.7036
Epoch [5/20], Step [220/627], Loss: 0.5030
Epoch [5/20], Step [221/627], Loss: 0.8277
Epoch [5/20], Step [222/627], Loss: 0.3174
Epoch [5/20], Step [223/627], Loss: 0.4461
Epoch [5/20], Step [224/627], Loss: 0.2980
Epoch [5/20], Step [225/627], Loss: 1.1775
Epoch [5/20], Step [226/627], Loss: 0.7205
Epoch [5/20], Step [227/627], Loss: 0.3766
Epoch [5/20], Step [228/627], Loss: 0.6225
Epoch [5/20], Step [229/627], Loss: 0.3400
Epoch [5/20], Step [230/627], Loss: 0.5630
Epoch [5/20

Epoch [5/20], Step [399/627], Loss: 0.4575
Epoch [5/20], Step [400/627], Loss: 0.4010
Epoch [5/20], Step [401/627], Loss: 0.4248
Epoch [5/20], Step [402/627], Loss: 0.2267
Epoch [5/20], Step [403/627], Loss: 0.5703
Epoch [5/20], Step [404/627], Loss: 0.5782
Epoch [5/20], Step [405/627], Loss: 0.2335
Epoch [5/20], Step [406/627], Loss: 0.3269
Epoch [5/20], Step [407/627], Loss: 0.7836
Epoch [5/20], Step [408/627], Loss: 0.2500
Epoch [5/20], Step [409/627], Loss: 0.5329
Epoch [5/20], Step [410/627], Loss: 0.2616
Epoch [5/20], Step [411/627], Loss: 0.7039
Epoch [5/20], Step [412/627], Loss: 0.3810
Epoch [5/20], Step [413/627], Loss: 0.2923
Epoch [5/20], Step [414/627], Loss: 0.2844
Epoch [5/20], Step [415/627], Loss: 0.6202
Epoch [5/20], Step [416/627], Loss: 0.3491
Epoch [5/20], Step [417/627], Loss: 0.4955
Epoch [5/20], Step [418/627], Loss: 0.1742
Epoch [5/20], Step [419/627], Loss: 0.3832
Epoch [5/20], Step [420/627], Loss: 0.6511
Epoch [5/20], Step [421/627], Loss: 0.2112
Epoch [5/20

Epoch [5/20], Step [591/627], Loss: 0.5183
Epoch [5/20], Step [592/627], Loss: 0.3260
Epoch [5/20], Step [593/627], Loss: 0.4908
Epoch [5/20], Step [594/627], Loss: 1.1820
Epoch [5/20], Step [595/627], Loss: 0.6712
Epoch [5/20], Step [596/627], Loss: 0.5124
Epoch [5/20], Step [597/627], Loss: 0.4351
Epoch [5/20], Step [598/627], Loss: 0.4885
Epoch [5/20], Step [599/627], Loss: 0.2679
Epoch [5/20], Step [600/627], Loss: 0.1744
Epoch [5/20], Step [601/627], Loss: 0.2745
Epoch [5/20], Step [602/627], Loss: 0.3512
Epoch [5/20], Step [603/627], Loss: 0.2008
Epoch [5/20], Step [604/627], Loss: 0.5718
Epoch [5/20], Step [605/627], Loss: 0.3323
Epoch [5/20], Step [606/627], Loss: 0.3555
Epoch [5/20], Step [607/627], Loss: 0.4375
Epoch [5/20], Step [608/627], Loss: 0.3686
Epoch [5/20], Step [609/627], Loss: 0.5431
Epoch [5/20], Step [610/627], Loss: 0.3794
Epoch [5/20], Step [611/627], Loss: 0.2973
Epoch [5/20], Step [612/627], Loss: 0.4498
Epoch [5/20], Step [613/627], Loss: 0.3469
Epoch [5/20

Epoch [6/20], Step [161/627], Loss: 0.2456
Epoch [6/20], Step [162/627], Loss: 0.2170
Epoch [6/20], Step [163/627], Loss: 0.2423
Epoch [6/20], Step [164/627], Loss: 0.4463
Epoch [6/20], Step [165/627], Loss: 0.3974
Epoch [6/20], Step [166/627], Loss: 0.1901
Epoch [6/20], Step [167/627], Loss: 0.5168
Epoch [6/20], Step [168/627], Loss: 0.3891
Epoch [6/20], Step [169/627], Loss: 0.1917
Epoch [6/20], Step [170/627], Loss: 0.6144
Epoch [6/20], Step [171/627], Loss: 0.3615
Epoch [6/20], Step [172/627], Loss: 0.3093
Epoch [6/20], Step [173/627], Loss: 0.2362
Epoch [6/20], Step [174/627], Loss: 0.3499
Epoch [6/20], Step [175/627], Loss: 0.2005
Epoch [6/20], Step [176/627], Loss: 0.2598
Epoch [6/20], Step [177/627], Loss: 0.3682
Epoch [6/20], Step [178/627], Loss: 0.2033
Epoch [6/20], Step [179/627], Loss: 0.4478
Epoch [6/20], Step [180/627], Loss: 0.1870
Epoch [6/20], Step [181/627], Loss: 0.1466
Epoch [6/20], Step [182/627], Loss: 0.3660
Epoch [6/20], Step [183/627], Loss: 0.8573
Epoch [6/20

Epoch [6/20], Step [354/627], Loss: 0.2188
Epoch [6/20], Step [355/627], Loss: 0.1635
Epoch [6/20], Step [356/627], Loss: 0.2997
Epoch [6/20], Step [357/627], Loss: 0.4629
Epoch [6/20], Step [358/627], Loss: 0.3016
Epoch [6/20], Step [359/627], Loss: 0.2977
Epoch [6/20], Step [360/627], Loss: 0.5116
Epoch [6/20], Step [361/627], Loss: 0.3895
Epoch [6/20], Step [362/627], Loss: 0.4480
Epoch [6/20], Step [363/627], Loss: 1.0248
Epoch [6/20], Step [364/627], Loss: 0.2310
Epoch [6/20], Step [365/627], Loss: 0.2509
Epoch [6/20], Step [366/627], Loss: 0.3626
Epoch [6/20], Step [367/627], Loss: 0.3808
Epoch [6/20], Step [368/627], Loss: 0.5787
Epoch [6/20], Step [369/627], Loss: 0.3950
Epoch [6/20], Step [370/627], Loss: 0.3509
Epoch [6/20], Step [371/627], Loss: 0.4477
Epoch [6/20], Step [372/627], Loss: 0.3444
Epoch [6/20], Step [373/627], Loss: 0.7319
Epoch [6/20], Step [374/627], Loss: 0.2973
Epoch [6/20], Step [375/627], Loss: 0.2917
Epoch [6/20], Step [376/627], Loss: 0.2435
Epoch [6/20

Epoch [6/20], Step [548/627], Loss: 0.7473
Epoch [6/20], Step [549/627], Loss: 0.5093
Epoch [6/20], Step [550/627], Loss: 0.9893
Epoch [6/20], Step [551/627], Loss: 0.3003
Epoch [6/20], Step [552/627], Loss: 0.2177
Epoch [6/20], Step [553/627], Loss: 0.7711
Epoch [6/20], Step [554/627], Loss: 0.4251
Epoch [6/20], Step [555/627], Loss: 0.6659
Epoch [6/20], Step [556/627], Loss: 1.1703
Epoch [6/20], Step [557/627], Loss: 0.1712
Epoch [6/20], Step [558/627], Loss: 0.6490
Epoch [6/20], Step [559/627], Loss: 0.5637
Epoch [6/20], Step [560/627], Loss: 0.4996
Epoch [6/20], Step [561/627], Loss: 0.2776
Epoch [6/20], Step [562/627], Loss: 0.6359
Epoch [6/20], Step [563/627], Loss: 0.6958
Epoch [6/20], Step [564/627], Loss: 0.3981
Epoch [6/20], Step [565/627], Loss: 0.4816
Epoch [6/20], Step [566/627], Loss: 0.1335
Epoch [6/20], Step [567/627], Loss: 0.2348
Epoch [6/20], Step [568/627], Loss: 1.0011
Epoch [6/20], Step [569/627], Loss: 0.2654
Epoch [6/20], Step [570/627], Loss: 0.3105
Epoch [6/20

Epoch [7/20], Step [118/627], Loss: 0.5570
Epoch [7/20], Step [119/627], Loss: 0.6346
Epoch [7/20], Step [120/627], Loss: 0.4557
Epoch [7/20], Step [121/627], Loss: 0.1901
Epoch [7/20], Step [122/627], Loss: 0.3621
Epoch [7/20], Step [123/627], Loss: 0.5181
Epoch [7/20], Step [124/627], Loss: 0.5804
Epoch [7/20], Step [125/627], Loss: 0.3924
Epoch [7/20], Step [126/627], Loss: 0.3258
Epoch [7/20], Step [127/627], Loss: 0.3088
Epoch [7/20], Step [128/627], Loss: 0.4725
Epoch [7/20], Step [129/627], Loss: 0.3578
Epoch [7/20], Step [130/627], Loss: 0.2447
Epoch [7/20], Step [131/627], Loss: 0.5582
Epoch [7/20], Step [132/627], Loss: 0.3184
Epoch [7/20], Step [133/627], Loss: 0.4502
Epoch [7/20], Step [134/627], Loss: 0.7174
Epoch [7/20], Step [135/627], Loss: 0.3855
Epoch [7/20], Step [136/627], Loss: 0.5818
Epoch [7/20], Step [137/627], Loss: 0.3510
Epoch [7/20], Step [138/627], Loss: 0.3838
Epoch [7/20], Step [139/627], Loss: 0.2827
Epoch [7/20], Step [140/627], Loss: 0.2648
Epoch [7/20

Epoch [7/20], Step [310/627], Loss: 0.4596
Epoch [7/20], Step [311/627], Loss: 0.3230
Epoch [7/20], Step [312/627], Loss: 0.2573
Epoch [7/20], Step [313/627], Loss: 0.5084
Epoch [7/20], Step [314/627], Loss: 0.7148
Epoch [7/20], Step [315/627], Loss: 0.2114
Epoch [7/20], Step [316/627], Loss: 0.4329
Epoch [7/20], Step [317/627], Loss: 0.0775
Epoch [7/20], Step [318/627], Loss: 0.3402
Epoch [7/20], Step [319/627], Loss: 0.2211
Epoch [7/20], Step [320/627], Loss: 0.2020
Epoch [7/20], Step [321/627], Loss: 0.4081
Epoch [7/20], Step [322/627], Loss: 0.5347
Epoch [7/20], Step [323/627], Loss: 0.2402
Epoch [7/20], Step [324/627], Loss: 0.6602
Epoch [7/20], Step [325/627], Loss: 0.1722
Epoch [7/20], Step [326/627], Loss: 0.5316
Epoch [7/20], Step [327/627], Loss: 0.3526
Epoch [7/20], Step [328/627], Loss: 0.3491
Epoch [7/20], Step [329/627], Loss: 0.5826
Epoch [7/20], Step [330/627], Loss: 0.4001
Epoch [7/20], Step [331/627], Loss: 0.1554
Epoch [7/20], Step [332/627], Loss: 0.3015
Epoch [7/20

Epoch [7/20], Step [501/627], Loss: 0.2147
Epoch [7/20], Step [502/627], Loss: 0.3145
Epoch [7/20], Step [503/627], Loss: 0.3548
Epoch [7/20], Step [504/627], Loss: 0.3688
Epoch [7/20], Step [505/627], Loss: 0.2297
Epoch [7/20], Step [506/627], Loss: 0.1613
Epoch [7/20], Step [507/627], Loss: 0.0828
Epoch [7/20], Step [508/627], Loss: 0.2763
Epoch [7/20], Step [509/627], Loss: 0.6114
Epoch [7/20], Step [510/627], Loss: 0.2164
Epoch [7/20], Step [511/627], Loss: 0.6099
Epoch [7/20], Step [512/627], Loss: 0.4431
Epoch [7/20], Step [513/627], Loss: 0.1768
Epoch [7/20], Step [514/627], Loss: 0.7380
Epoch [7/20], Step [515/627], Loss: 0.3154
Epoch [7/20], Step [516/627], Loss: 0.2706
Epoch [7/20], Step [517/627], Loss: 0.2385
Epoch [7/20], Step [518/627], Loss: 0.4223
Epoch [7/20], Step [519/627], Loss: 0.3528
Epoch [7/20], Step [520/627], Loss: 0.4121
Epoch [7/20], Step [521/627], Loss: 0.3168
Epoch [7/20], Step [522/627], Loss: 0.4405
Epoch [7/20], Step [523/627], Loss: 0.3669
Epoch [7/20

Epoch [8/20], Step [71/627], Loss: 1.0069
Epoch [8/20], Step [72/627], Loss: 0.3752
Epoch [8/20], Step [73/627], Loss: 0.2561
Epoch [8/20], Step [74/627], Loss: 0.2943
Epoch [8/20], Step [75/627], Loss: 0.3184
Epoch [8/20], Step [76/627], Loss: 0.2993
Epoch [8/20], Step [77/627], Loss: 0.5779
Epoch [8/20], Step [78/627], Loss: 0.4635
Epoch [8/20], Step [79/627], Loss: 0.2086
Epoch [8/20], Step [80/627], Loss: 0.2686
Epoch [8/20], Step [81/627], Loss: 0.3914
Epoch [8/20], Step [82/627], Loss: 0.2771
Epoch [8/20], Step [83/627], Loss: 0.3217
Epoch [8/20], Step [84/627], Loss: 0.6913
Epoch [8/20], Step [85/627], Loss: 0.3668
Epoch [8/20], Step [86/627], Loss: 0.3059
Epoch [8/20], Step [87/627], Loss: 0.7298
Epoch [8/20], Step [88/627], Loss: 0.2810
Epoch [8/20], Step [89/627], Loss: 0.2831
Epoch [8/20], Step [90/627], Loss: 0.3708
Epoch [8/20], Step [91/627], Loss: 0.1582
Epoch [8/20], Step [92/627], Loss: 0.5314
Epoch [8/20], Step [93/627], Loss: 0.4655
Epoch [8/20], Step [94/627], Loss:

Epoch [8/20], Step [266/627], Loss: 0.5895
Epoch [8/20], Step [267/627], Loss: 0.1871
Epoch [8/20], Step [268/627], Loss: 0.6760
Epoch [8/20], Step [269/627], Loss: 0.2499
Epoch [8/20], Step [270/627], Loss: 0.3974
Epoch [8/20], Step [271/627], Loss: 0.5448
Epoch [8/20], Step [272/627], Loss: 0.5701
Epoch [8/20], Step [273/627], Loss: 0.2614
Epoch [8/20], Step [274/627], Loss: 0.2439
Epoch [8/20], Step [275/627], Loss: 0.2744
Epoch [8/20], Step [276/627], Loss: 0.2362
Epoch [8/20], Step [277/627], Loss: 0.4469
Epoch [8/20], Step [278/627], Loss: 0.1177
Epoch [8/20], Step [279/627], Loss: 0.1402
Epoch [8/20], Step [280/627], Loss: 0.2556
Epoch [8/20], Step [281/627], Loss: 0.6253
Epoch [8/20], Step [282/627], Loss: 0.3454
Epoch [8/20], Step [283/627], Loss: 0.4331
Epoch [8/20], Step [284/627], Loss: 0.4598
Epoch [8/20], Step [285/627], Loss: 0.2738
Epoch [8/20], Step [286/627], Loss: 0.3425
Epoch [8/20], Step [287/627], Loss: 0.3955
Epoch [8/20], Step [288/627], Loss: 0.1699
Epoch [8/20

Epoch [8/20], Step [460/627], Loss: 0.0931
Epoch [8/20], Step [461/627], Loss: 0.2555
Epoch [8/20], Step [462/627], Loss: 0.4336
Epoch [8/20], Step [463/627], Loss: 0.3364
Epoch [8/20], Step [464/627], Loss: 0.2187
Epoch [8/20], Step [465/627], Loss: 0.2052
Epoch [8/20], Step [466/627], Loss: 0.1699
Epoch [8/20], Step [467/627], Loss: 0.5583
Epoch [8/20], Step [468/627], Loss: 0.4838
Epoch [8/20], Step [469/627], Loss: 0.1214
Epoch [8/20], Step [470/627], Loss: 0.2311
Epoch [8/20], Step [471/627], Loss: 0.3904
Epoch [8/20], Step [472/627], Loss: 0.4848
Epoch [8/20], Step [473/627], Loss: 0.4220
Epoch [8/20], Step [474/627], Loss: 0.3700
Epoch [8/20], Step [475/627], Loss: 0.2936
Epoch [8/20], Step [476/627], Loss: 0.4721
Epoch [8/20], Step [477/627], Loss: 0.6474
Epoch [8/20], Step [478/627], Loss: 0.2360
Epoch [8/20], Step [479/627], Loss: 0.2426
Epoch [8/20], Step [480/627], Loss: 0.8190
Epoch [8/20], Step [481/627], Loss: 0.4165
Epoch [8/20], Step [482/627], Loss: 0.7010
Epoch [8/20

Epoch [9/20], Step [26/627], Loss: 0.2374
Epoch [9/20], Step [27/627], Loss: 0.1531
Epoch [9/20], Step [28/627], Loss: 0.5401
Epoch [9/20], Step [29/627], Loss: 0.3271
Epoch [9/20], Step [30/627], Loss: 0.3718
Epoch [9/20], Step [31/627], Loss: 0.2798
Epoch [9/20], Step [32/627], Loss: 0.5872
Epoch [9/20], Step [33/627], Loss: 0.2332
Epoch [9/20], Step [34/627], Loss: 0.3003
Epoch [9/20], Step [35/627], Loss: 0.4456
Epoch [9/20], Step [36/627], Loss: 0.4663
Epoch [9/20], Step [37/627], Loss: 0.3052
Epoch [9/20], Step [38/627], Loss: 0.1279
Epoch [9/20], Step [39/627], Loss: 0.5879
Epoch [9/20], Step [40/627], Loss: 0.1714
Epoch [9/20], Step [41/627], Loss: 0.3262
Epoch [9/20], Step [42/627], Loss: 0.3995
Epoch [9/20], Step [43/627], Loss: 0.2448
Epoch [9/20], Step [44/627], Loss: 0.3414
Epoch [9/20], Step [45/627], Loss: 0.6931
Epoch [9/20], Step [46/627], Loss: 0.2284
Epoch [9/20], Step [47/627], Loss: 0.2363
Epoch [9/20], Step [48/627], Loss: 0.4656
Epoch [9/20], Step [49/627], Loss:

Epoch [9/20], Step [221/627], Loss: 0.1427
Epoch [9/20], Step [222/627], Loss: 0.2960
Epoch [9/20], Step [223/627], Loss: 0.1030
Epoch [9/20], Step [224/627], Loss: 0.2407
Epoch [9/20], Step [225/627], Loss: 0.4007
Epoch [9/20], Step [226/627], Loss: 0.3045
Epoch [9/20], Step [227/627], Loss: 0.2429
Epoch [9/20], Step [228/627], Loss: 0.2325
Epoch [9/20], Step [229/627], Loss: 0.2552
Epoch [9/20], Step [230/627], Loss: 0.2633
Epoch [9/20], Step [231/627], Loss: 0.6985
Epoch [9/20], Step [232/627], Loss: 0.3228
Epoch [9/20], Step [233/627], Loss: 0.2327
Epoch [9/20], Step [234/627], Loss: 0.2735
Epoch [9/20], Step [235/627], Loss: 0.3814
Epoch [9/20], Step [236/627], Loss: 0.1747
Epoch [9/20], Step [237/627], Loss: 0.1290
Epoch [9/20], Step [238/627], Loss: 0.2140
Epoch [9/20], Step [239/627], Loss: 0.2565
Epoch [9/20], Step [240/627], Loss: 0.5465
Epoch [9/20], Step [241/627], Loss: 0.2253
Epoch [9/20], Step [242/627], Loss: 0.5804
Epoch [9/20], Step [243/627], Loss: 0.1820
Epoch [9/20

Epoch [9/20], Step [416/627], Loss: 0.3742
Epoch [9/20], Step [417/627], Loss: 0.2648
Epoch [9/20], Step [418/627], Loss: 0.3385
Epoch [9/20], Step [419/627], Loss: 0.3913
Epoch [9/20], Step [420/627], Loss: 0.1470
Epoch [9/20], Step [421/627], Loss: 0.3300
Epoch [9/20], Step [422/627], Loss: 0.5047
Epoch [9/20], Step [423/627], Loss: 0.2586
Epoch [9/20], Step [424/627], Loss: 0.1581
Epoch [9/20], Step [425/627], Loss: 0.2959
Epoch [9/20], Step [426/627], Loss: 0.1992
Epoch [9/20], Step [427/627], Loss: 0.2574
Epoch [9/20], Step [428/627], Loss: 0.2170
Epoch [9/20], Step [429/627], Loss: 0.1675
Epoch [9/20], Step [430/627], Loss: 0.1922
Epoch [9/20], Step [431/627], Loss: 0.4412
Epoch [9/20], Step [432/627], Loss: 0.1488
Epoch [9/20], Step [433/627], Loss: 0.1499
Epoch [9/20], Step [434/627], Loss: 0.4144
Epoch [9/20], Step [435/627], Loss: 0.0585
Epoch [9/20], Step [436/627], Loss: 0.4167
Epoch [9/20], Step [437/627], Loss: 0.4469
Epoch [9/20], Step [438/627], Loss: 0.5916
Epoch [9/20

Epoch [9/20], Step [609/627], Loss: 0.4957
Epoch [9/20], Step [610/627], Loss: 0.5726
Epoch [9/20], Step [611/627], Loss: 0.1117
Epoch [9/20], Step [612/627], Loss: 0.3517
Epoch [9/20], Step [613/627], Loss: 0.6813
Epoch [9/20], Step [614/627], Loss: 0.3143
Epoch [9/20], Step [615/627], Loss: 0.5424
Epoch [9/20], Step [616/627], Loss: 0.2933
Epoch [9/20], Step [617/627], Loss: 0.2071
Epoch [9/20], Step [618/627], Loss: 0.4487
Epoch [9/20], Step [619/627], Loss: 0.6347
Epoch [9/20], Step [620/627], Loss: 0.3132
Epoch [9/20], Step [621/627], Loss: 0.2757
Epoch [9/20], Step [622/627], Loss: 0.1453
Epoch [9/20], Step [623/627], Loss: 0.5431
Epoch [9/20], Step [624/627], Loss: 0.3414
Epoch [9/20], Step [625/627], Loss: 0.0953
Epoch [9/20], Step [626/627], Loss: 0.2314
Epoch [9/20], Step [627/627], Loss: 0.1291
Epoch [10/20], Step [1/627], Loss: 0.1579
Epoch [10/20], Step [2/627], Loss: 0.1692
Epoch [10/20], Step [3/627], Loss: 0.3562
Epoch [10/20], Step [4/627], Loss: 0.1632
Epoch [10/20], 

Epoch [10/20], Step [176/627], Loss: 0.1869
Epoch [10/20], Step [177/627], Loss: 0.1680
Epoch [10/20], Step [178/627], Loss: 0.5333
Epoch [10/20], Step [179/627], Loss: 0.1778
Epoch [10/20], Step [180/627], Loss: 0.3209
Epoch [10/20], Step [181/627], Loss: 0.3379
Epoch [10/20], Step [182/627], Loss: 0.2098
Epoch [10/20], Step [183/627], Loss: 0.4689
Epoch [10/20], Step [184/627], Loss: 0.2320
Epoch [10/20], Step [185/627], Loss: 0.3177
Epoch [10/20], Step [186/627], Loss: 0.5139
Epoch [10/20], Step [187/627], Loss: 0.3979
Epoch [10/20], Step [188/627], Loss: 0.0929
Epoch [10/20], Step [189/627], Loss: 0.1724
Epoch [10/20], Step [190/627], Loss: 0.3499
Epoch [10/20], Step [191/627], Loss: 0.1554
Epoch [10/20], Step [192/627], Loss: 0.2614
Epoch [10/20], Step [193/627], Loss: 0.4745
Epoch [10/20], Step [194/627], Loss: 0.4297
Epoch [10/20], Step [195/627], Loss: 0.1964
Epoch [10/20], Step [196/627], Loss: 0.1078
Epoch [10/20], Step [197/627], Loss: 0.2038
Epoch [10/20], Step [198/627], L

Epoch [10/20], Step [363/627], Loss: 0.5888
Epoch [10/20], Step [364/627], Loss: 0.4023
Epoch [10/20], Step [365/627], Loss: 0.1721
Epoch [10/20], Step [366/627], Loss: 0.3996
Epoch [10/20], Step [367/627], Loss: 0.2067
Epoch [10/20], Step [368/627], Loss: 0.3394
Epoch [10/20], Step [369/627], Loss: 0.1837
Epoch [10/20], Step [370/627], Loss: 0.3704
Epoch [10/20], Step [371/627], Loss: 0.2445
Epoch [10/20], Step [372/627], Loss: 0.3307
Epoch [10/20], Step [373/627], Loss: 0.7555
Epoch [10/20], Step [374/627], Loss: 0.5009
Epoch [10/20], Step [375/627], Loss: 0.2065
Epoch [10/20], Step [376/627], Loss: 0.2346
Epoch [10/20], Step [377/627], Loss: 0.1350
Epoch [10/20], Step [378/627], Loss: 0.5032
Epoch [10/20], Step [379/627], Loss: 0.6063
Epoch [10/20], Step [380/627], Loss: 0.3060
Epoch [10/20], Step [381/627], Loss: 0.1724
Epoch [10/20], Step [382/627], Loss: 0.1548
Epoch [10/20], Step [383/627], Loss: 0.5774
Epoch [10/20], Step [384/627], Loss: 0.5772
Epoch [10/20], Step [385/627], L

Epoch [10/20], Step [554/627], Loss: 0.2834
Epoch [10/20], Step [555/627], Loss: 0.1637
Epoch [10/20], Step [556/627], Loss: 0.4046
Epoch [10/20], Step [557/627], Loss: 0.3567
Epoch [10/20], Step [558/627], Loss: 0.5463
Epoch [10/20], Step [559/627], Loss: 0.2461
Epoch [10/20], Step [560/627], Loss: 0.7203
Epoch [10/20], Step [561/627], Loss: 0.3419
Epoch [10/20], Step [562/627], Loss: 0.1810
Epoch [10/20], Step [563/627], Loss: 0.1745
Epoch [10/20], Step [564/627], Loss: 0.1883
Epoch [10/20], Step [565/627], Loss: 0.3159
Epoch [10/20], Step [566/627], Loss: 0.3533
Epoch [10/20], Step [567/627], Loss: 0.1919
Epoch [10/20], Step [568/627], Loss: 0.5138
Epoch [10/20], Step [569/627], Loss: 0.1621
Epoch [10/20], Step [570/627], Loss: 0.3112
Epoch [10/20], Step [571/627], Loss: 0.3516
Epoch [10/20], Step [572/627], Loss: 0.3625
Epoch [10/20], Step [573/627], Loss: 0.3060
Epoch [10/20], Step [574/627], Loss: 0.2854
Epoch [10/20], Step [575/627], Loss: 0.5781
Epoch [10/20], Step [576/627], L

Epoch [11/20], Step [116/627], Loss: 0.3083
Epoch [11/20], Step [117/627], Loss: 0.2485
Epoch [11/20], Step [118/627], Loss: 0.3613
Epoch [11/20], Step [119/627], Loss: 0.8630
Epoch [11/20], Step [120/627], Loss: 0.3709
Epoch [11/20], Step [121/627], Loss: 0.1675
Epoch [11/20], Step [122/627], Loss: 0.5597
Epoch [11/20], Step [123/627], Loss: 0.3473
Epoch [11/20], Step [124/627], Loss: 0.3610
Epoch [11/20], Step [125/627], Loss: 0.4707
Epoch [11/20], Step [126/627], Loss: 0.5535
Epoch [11/20], Step [127/627], Loss: 0.3669
Epoch [11/20], Step [128/627], Loss: 0.6910
Epoch [11/20], Step [129/627], Loss: 0.2598
Epoch [11/20], Step [130/627], Loss: 0.1418
Epoch [11/20], Step [131/627], Loss: 0.1384
Epoch [11/20], Step [132/627], Loss: 0.1287
Epoch [11/20], Step [133/627], Loss: 0.2829
Epoch [11/20], Step [134/627], Loss: 0.6208
Epoch [11/20], Step [135/627], Loss: 0.2229
Epoch [11/20], Step [136/627], Loss: 0.2161
Epoch [11/20], Step [137/627], Loss: 0.2267
Epoch [11/20], Step [138/627], L

Epoch [11/20], Step [307/627], Loss: 0.1589
Epoch [11/20], Step [308/627], Loss: 0.2316
Epoch [11/20], Step [309/627], Loss: 0.2267
Epoch [11/20], Step [310/627], Loss: 0.6297
Epoch [11/20], Step [311/627], Loss: 0.1541
Epoch [11/20], Step [312/627], Loss: 0.2236
Epoch [11/20], Step [313/627], Loss: 0.2660
Epoch [11/20], Step [314/627], Loss: 0.1566
Epoch [11/20], Step [315/627], Loss: 0.3442
Epoch [11/20], Step [316/627], Loss: 0.1253
Epoch [11/20], Step [317/627], Loss: 0.2086
Epoch [11/20], Step [318/627], Loss: 0.7101
Epoch [11/20], Step [319/627], Loss: 0.0905
Epoch [11/20], Step [320/627], Loss: 0.1148
Epoch [11/20], Step [321/627], Loss: 0.3105
Epoch [11/20], Step [322/627], Loss: 0.4553
Epoch [11/20], Step [323/627], Loss: 0.4743
Epoch [11/20], Step [324/627], Loss: 0.3226
Epoch [11/20], Step [325/627], Loss: 0.1830
Epoch [11/20], Step [326/627], Loss: 0.1920
Epoch [11/20], Step [327/627], Loss: 0.4481
Epoch [11/20], Step [328/627], Loss: 0.2379
Epoch [11/20], Step [329/627], L

Epoch [11/20], Step [496/627], Loss: 0.7377
Epoch [11/20], Step [497/627], Loss: 0.3583
Epoch [11/20], Step [498/627], Loss: 0.4581
Epoch [11/20], Step [499/627], Loss: 0.3443
Epoch [11/20], Step [500/627], Loss: 0.3341
Epoch [11/20], Step [501/627], Loss: 0.1781
Epoch [11/20], Step [502/627], Loss: 0.2284
Epoch [11/20], Step [503/627], Loss: 0.6267
Epoch [11/20], Step [504/627], Loss: 0.3490
Epoch [11/20], Step [505/627], Loss: 0.6177
Epoch [11/20], Step [506/627], Loss: 0.2413
Epoch [11/20], Step [507/627], Loss: 0.2817
Epoch [11/20], Step [508/627], Loss: 0.3147
Epoch [11/20], Step [509/627], Loss: 0.2832
Epoch [11/20], Step [510/627], Loss: 0.1582
Epoch [11/20], Step [511/627], Loss: 0.4084
Epoch [11/20], Step [512/627], Loss: 0.1498
Epoch [11/20], Step [513/627], Loss: 0.3423
Epoch [11/20], Step [514/627], Loss: 0.1970
Epoch [11/20], Step [515/627], Loss: 0.1167
Epoch [11/20], Step [516/627], Loss: 0.2311
Epoch [11/20], Step [517/627], Loss: 0.2249
Epoch [11/20], Step [518/627], L

Epoch [12/20], Step [59/627], Loss: 0.0728
Epoch [12/20], Step [60/627], Loss: 0.1575
Epoch [12/20], Step [61/627], Loss: 0.3754
Epoch [12/20], Step [62/627], Loss: 0.1970
Epoch [12/20], Step [63/627], Loss: 0.0942
Epoch [12/20], Step [64/627], Loss: 0.4069
Epoch [12/20], Step [65/627], Loss: 0.2323
Epoch [12/20], Step [66/627], Loss: 0.3673
Epoch [12/20], Step [67/627], Loss: 0.1846
Epoch [12/20], Step [68/627], Loss: 0.2410
Epoch [12/20], Step [69/627], Loss: 0.3031
Epoch [12/20], Step [70/627], Loss: 0.4029
Epoch [12/20], Step [71/627], Loss: 0.1665
Epoch [12/20], Step [72/627], Loss: 0.5587
Epoch [12/20], Step [73/627], Loss: 0.3823
Epoch [12/20], Step [74/627], Loss: 0.4533
Epoch [12/20], Step [75/627], Loss: 0.2785
Epoch [12/20], Step [76/627], Loss: 0.3023
Epoch [12/20], Step [77/627], Loss: 0.1760
Epoch [12/20], Step [78/627], Loss: 0.1255
Epoch [12/20], Step [79/627], Loss: 0.2181
Epoch [12/20], Step [80/627], Loss: 0.1985
Epoch [12/20], Step [81/627], Loss: 0.1640
Epoch [12/2

Epoch [12/20], Step [247/627], Loss: 0.1532
Epoch [12/20], Step [248/627], Loss: 0.5244
Epoch [12/20], Step [249/627], Loss: 0.1256
Epoch [12/20], Step [250/627], Loss: 0.5837
Epoch [12/20], Step [251/627], Loss: 0.3438
Epoch [12/20], Step [252/627], Loss: 0.2569
Epoch [12/20], Step [253/627], Loss: 0.2458
Epoch [12/20], Step [254/627], Loss: 0.3065
Epoch [12/20], Step [255/627], Loss: 0.2421
Epoch [12/20], Step [256/627], Loss: 0.2532
Epoch [12/20], Step [257/627], Loss: 0.4930
Epoch [12/20], Step [258/627], Loss: 0.2273
Epoch [12/20], Step [259/627], Loss: 0.0819
Epoch [12/20], Step [260/627], Loss: 0.1988
Epoch [12/20], Step [261/627], Loss: 0.2434
Epoch [12/20], Step [262/627], Loss: 0.3714
Epoch [12/20], Step [263/627], Loss: 0.3066
Epoch [12/20], Step [264/627], Loss: 0.1432
Epoch [12/20], Step [265/627], Loss: 0.0904
Epoch [12/20], Step [266/627], Loss: 0.1677
Epoch [12/20], Step [267/627], Loss: 0.3037
Epoch [12/20], Step [268/627], Loss: 0.1646
Epoch [12/20], Step [269/627], L

Epoch [12/20], Step [437/627], Loss: 0.4354
Epoch [12/20], Step [438/627], Loss: 0.3337
Epoch [12/20], Step [439/627], Loss: 0.1512
Epoch [12/20], Step [440/627], Loss: 0.1669
Epoch [12/20], Step [441/627], Loss: 0.4379
Epoch [12/20], Step [442/627], Loss: 0.1509
Epoch [12/20], Step [443/627], Loss: 0.2192
Epoch [12/20], Step [444/627], Loss: 0.3827
Epoch [12/20], Step [445/627], Loss: 0.2513
Epoch [12/20], Step [446/627], Loss: 0.2148
Epoch [12/20], Step [447/627], Loss: 0.4103
Epoch [12/20], Step [448/627], Loss: 0.1704
Epoch [12/20], Step [449/627], Loss: 0.3157
Epoch [12/20], Step [450/627], Loss: 0.5252
Epoch [12/20], Step [451/627], Loss: 0.0762
Epoch [12/20], Step [452/627], Loss: 0.1032
Epoch [12/20], Step [453/627], Loss: 0.1622
Epoch [12/20], Step [454/627], Loss: 0.3134
Epoch [12/20], Step [455/627], Loss: 0.2856
Epoch [12/20], Step [456/627], Loss: 0.3924
Epoch [12/20], Step [457/627], Loss: 0.3443
Epoch [12/20], Step [458/627], Loss: 0.3884
Epoch [12/20], Step [459/627], L

Epoch [12/20], Step [625/627], Loss: 0.2140
Epoch [12/20], Step [626/627], Loss: 0.2008
Epoch [12/20], Step [627/627], Loss: 0.2089
rmse improved at epoch  12 ; best_mse,best_ci,best_r: 0.7925021010928085 0.7303496184919442 0.4043708688001691
Epoch [13/20], Step [1/627], Loss: 0.1375
Epoch [13/20], Step [2/627], Loss: 0.0828
Epoch [13/20], Step [3/627], Loss: 0.2624
Epoch [13/20], Step [4/627], Loss: 0.1746
Epoch [13/20], Step [5/627], Loss: 0.1952
Epoch [13/20], Step [6/627], Loss: 0.3449
Epoch [13/20], Step [7/627], Loss: 0.0981
Epoch [13/20], Step [8/627], Loss: 0.0321
Epoch [13/20], Step [9/627], Loss: 0.2075
Epoch [13/20], Step [10/627], Loss: 0.3492
Epoch [13/20], Step [11/627], Loss: 0.1241
Epoch [13/20], Step [12/627], Loss: 0.1217
Epoch [13/20], Step [13/627], Loss: 0.1326
Epoch [13/20], Step [14/627], Loss: 0.2153
Epoch [13/20], Step [15/627], Loss: 0.2189
Epoch [13/20], Step [16/627], Loss: 0.2884
Epoch [13/20], Step [17/627], Loss: 0.2066
Epoch [13/20], Step [18/627], Loss:

Epoch [13/20], Step [185/627], Loss: 0.3347
Epoch [13/20], Step [186/627], Loss: 0.2896
Epoch [13/20], Step [187/627], Loss: 0.1092
Epoch [13/20], Step [188/627], Loss: 0.4272
Epoch [13/20], Step [189/627], Loss: 0.1753
Epoch [13/20], Step [190/627], Loss: 0.2865
Epoch [13/20], Step [191/627], Loss: 0.3152
Epoch [13/20], Step [192/627], Loss: 0.2448
Epoch [13/20], Step [193/627], Loss: 0.2715
Epoch [13/20], Step [194/627], Loss: 0.1969
Epoch [13/20], Step [195/627], Loss: 0.2957
Epoch [13/20], Step [196/627], Loss: 0.1206
Epoch [13/20], Step [197/627], Loss: 0.2428
Epoch [13/20], Step [198/627], Loss: 0.1456
Epoch [13/20], Step [199/627], Loss: 0.1483
Epoch [13/20], Step [200/627], Loss: 0.1224
Epoch [13/20], Step [201/627], Loss: 0.1658
Epoch [13/20], Step [202/627], Loss: 0.1815
Epoch [13/20], Step [203/627], Loss: 0.2789
Epoch [13/20], Step [204/627], Loss: 0.1995
Epoch [13/20], Step [205/627], Loss: 0.0839
Epoch [13/20], Step [206/627], Loss: 0.3787
Epoch [13/20], Step [207/627], L

Epoch [13/20], Step [374/627], Loss: 0.3759
Epoch [13/20], Step [375/627], Loss: 0.2484
Epoch [13/20], Step [376/627], Loss: 0.3062
Epoch [13/20], Step [377/627], Loss: 0.3161
Epoch [13/20], Step [378/627], Loss: 0.2085
Epoch [13/20], Step [379/627], Loss: 0.1749
Epoch [13/20], Step [380/627], Loss: 0.3899
Epoch [13/20], Step [381/627], Loss: 0.9147
Epoch [13/20], Step [382/627], Loss: 0.4038
Epoch [13/20], Step [383/627], Loss: 0.1814
Epoch [13/20], Step [384/627], Loss: 0.3103
Epoch [13/20], Step [385/627], Loss: 0.2507
Epoch [13/20], Step [386/627], Loss: 0.1328
Epoch [13/20], Step [387/627], Loss: 0.2160
Epoch [13/20], Step [388/627], Loss: 0.3693
Epoch [13/20], Step [389/627], Loss: 0.2197
Epoch [13/20], Step [390/627], Loss: 0.1822
Epoch [13/20], Step [391/627], Loss: 0.1471
Epoch [13/20], Step [392/627], Loss: 0.1451
Epoch [13/20], Step [393/627], Loss: 0.6232
Epoch [13/20], Step [394/627], Loss: 0.2927
Epoch [13/20], Step [395/627], Loss: 0.1744
Epoch [13/20], Step [396/627], L

Epoch [13/20], Step [565/627], Loss: 0.0955
Epoch [13/20], Step [566/627], Loss: 0.2190
Epoch [13/20], Step [567/627], Loss: 0.2921
Epoch [13/20], Step [568/627], Loss: 0.2685
Epoch [13/20], Step [569/627], Loss: 0.0985
Epoch [13/20], Step [570/627], Loss: 0.2077
Epoch [13/20], Step [571/627], Loss: 0.1647
Epoch [13/20], Step [572/627], Loss: 0.1032
Epoch [13/20], Step [573/627], Loss: 0.1660
Epoch [13/20], Step [574/627], Loss: 0.2299
Epoch [13/20], Step [575/627], Loss: 0.1485
Epoch [13/20], Step [576/627], Loss: 0.2366
Epoch [13/20], Step [577/627], Loss: 0.2439
Epoch [13/20], Step [578/627], Loss: 0.1948
Epoch [13/20], Step [579/627], Loss: 0.1173
Epoch [13/20], Step [580/627], Loss: 0.2551
Epoch [13/20], Step [581/627], Loss: 0.2510
Epoch [13/20], Step [582/627], Loss: 0.1556
Epoch [13/20], Step [583/627], Loss: 0.3335
Epoch [13/20], Step [584/627], Loss: 0.1774
Epoch [13/20], Step [585/627], Loss: 0.1702
Epoch [13/20], Step [586/627], Loss: 0.2636
Epoch [13/20], Step [587/627], L

Epoch [14/20], Step [127/627], Loss: 0.1699
Epoch [14/20], Step [128/627], Loss: 0.5139
Epoch [14/20], Step [129/627], Loss: 0.2348
Epoch [14/20], Step [130/627], Loss: 0.1576
Epoch [14/20], Step [131/627], Loss: 0.1905
Epoch [14/20], Step [132/627], Loss: 0.1013
Epoch [14/20], Step [133/627], Loss: 0.1130
Epoch [14/20], Step [134/627], Loss: 0.2510
Epoch [14/20], Step [135/627], Loss: 0.2591
Epoch [14/20], Step [136/627], Loss: 0.2986
Epoch [14/20], Step [137/627], Loss: 0.1987
Epoch [14/20], Step [138/627], Loss: 0.1785
Epoch [14/20], Step [139/627], Loss: 0.1291
Epoch [14/20], Step [140/627], Loss: 0.2108
Epoch [14/20], Step [141/627], Loss: 0.1698
Epoch [14/20], Step [142/627], Loss: 0.2357
Epoch [14/20], Step [143/627], Loss: 0.1719
Epoch [14/20], Step [144/627], Loss: 0.1561
Epoch [14/20], Step [145/627], Loss: 0.1936
Epoch [14/20], Step [146/627], Loss: 0.2454
Epoch [14/20], Step [147/627], Loss: 0.2160
Epoch [14/20], Step [148/627], Loss: 0.1279
Epoch [14/20], Step [149/627], L

Epoch [14/20], Step [317/627], Loss: 0.3456
Epoch [14/20], Step [318/627], Loss: 0.2520
Epoch [14/20], Step [319/627], Loss: 0.1066
Epoch [14/20], Step [320/627], Loss: 0.1650
Epoch [14/20], Step [321/627], Loss: 0.2076
Epoch [14/20], Step [322/627], Loss: 0.1197
Epoch [14/20], Step [323/627], Loss: 0.1100
Epoch [14/20], Step [324/627], Loss: 0.1159
Epoch [14/20], Step [325/627], Loss: 0.2242
Epoch [14/20], Step [326/627], Loss: 0.3053
Epoch [14/20], Step [327/627], Loss: 0.1022
Epoch [14/20], Step [328/627], Loss: 0.0731
Epoch [14/20], Step [329/627], Loss: 0.4606
Epoch [14/20], Step [330/627], Loss: 0.2375
Epoch [14/20], Step [331/627], Loss: 0.1025
Epoch [14/20], Step [332/627], Loss: 0.2812
Epoch [14/20], Step [333/627], Loss: 0.2713
Epoch [14/20], Step [334/627], Loss: 0.1746
Epoch [14/20], Step [335/627], Loss: 0.1362
Epoch [14/20], Step [336/627], Loss: 0.2642
Epoch [14/20], Step [337/627], Loss: 0.1974
Epoch [14/20], Step [338/627], Loss: 0.2807
Epoch [14/20], Step [339/627], L

Epoch [14/20], Step [504/627], Loss: 0.1190
Epoch [14/20], Step [505/627], Loss: 0.3715
Epoch [14/20], Step [506/627], Loss: 0.1899
Epoch [14/20], Step [507/627], Loss: 0.1142
Epoch [14/20], Step [508/627], Loss: 0.2877
Epoch [14/20], Step [509/627], Loss: 0.3483
Epoch [14/20], Step [510/627], Loss: 0.3532
Epoch [14/20], Step [511/627], Loss: 0.2995
Epoch [14/20], Step [512/627], Loss: 0.1438
Epoch [14/20], Step [513/627], Loss: 0.2070
Epoch [14/20], Step [514/627], Loss: 0.3039
Epoch [14/20], Step [515/627], Loss: 0.3873
Epoch [14/20], Step [516/627], Loss: 0.2720
Epoch [14/20], Step [517/627], Loss: 0.1493
Epoch [14/20], Step [518/627], Loss: 0.1263
Epoch [14/20], Step [519/627], Loss: 0.0991
Epoch [14/20], Step [520/627], Loss: 0.2092
Epoch [14/20], Step [521/627], Loss: 0.5953
Epoch [14/20], Step [522/627], Loss: 0.3101
Epoch [14/20], Step [523/627], Loss: 0.0583
Epoch [14/20], Step [524/627], Loss: 0.2135
Epoch [14/20], Step [525/627], Loss: 0.2403
Epoch [14/20], Step [526/627], L

Epoch [15/20], Step [66/627], Loss: 0.1322
Epoch [15/20], Step [67/627], Loss: 0.1400
Epoch [15/20], Step [68/627], Loss: 0.2257
Epoch [15/20], Step [69/627], Loss: 0.1193
Epoch [15/20], Step [70/627], Loss: 0.2344
Epoch [15/20], Step [71/627], Loss: 0.0819
Epoch [15/20], Step [72/627], Loss: 0.1235
Epoch [15/20], Step [73/627], Loss: 0.3065
Epoch [15/20], Step [74/627], Loss: 0.1346
Epoch [15/20], Step [75/627], Loss: 0.2530
Epoch [15/20], Step [76/627], Loss: 0.2291
Epoch [15/20], Step [77/627], Loss: 0.1091
Epoch [15/20], Step [78/627], Loss: 0.1970
Epoch [15/20], Step [79/627], Loss: 0.1809
Epoch [15/20], Step [80/627], Loss: 0.2974
Epoch [15/20], Step [81/627], Loss: 0.1479
Epoch [15/20], Step [82/627], Loss: 0.1433
Epoch [15/20], Step [83/627], Loss: 0.0872
Epoch [15/20], Step [84/627], Loss: 0.1372
Epoch [15/20], Step [85/627], Loss: 0.3488
Epoch [15/20], Step [86/627], Loss: 0.2383
Epoch [15/20], Step [87/627], Loss: 0.1164
Epoch [15/20], Step [88/627], Loss: 0.2519
Epoch [15/2

Epoch [15/20], Step [256/627], Loss: 0.0774
Epoch [15/20], Step [257/627], Loss: 0.2229
Epoch [15/20], Step [258/627], Loss: 0.1403
Epoch [15/20], Step [259/627], Loss: 0.1401
Epoch [15/20], Step [260/627], Loss: 0.1502
Epoch [15/20], Step [261/627], Loss: 0.0738
Epoch [15/20], Step [262/627], Loss: 0.1350
Epoch [15/20], Step [263/627], Loss: 0.3131
Epoch [15/20], Step [264/627], Loss: 0.1572
Epoch [15/20], Step [265/627], Loss: 0.1735
Epoch [15/20], Step [266/627], Loss: 0.6700
Epoch [15/20], Step [267/627], Loss: 0.2364
Epoch [15/20], Step [268/627], Loss: 0.1629
Epoch [15/20], Step [269/627], Loss: 0.1099
Epoch [15/20], Step [270/627], Loss: 0.3154
Epoch [15/20], Step [271/627], Loss: 0.2260
Epoch [15/20], Step [272/627], Loss: 0.1498
Epoch [15/20], Step [273/627], Loss: 0.2653
Epoch [15/20], Step [274/627], Loss: 0.3550
Epoch [15/20], Step [275/627], Loss: 0.1412
Epoch [15/20], Step [276/627], Loss: 0.0887
Epoch [15/20], Step [277/627], Loss: 0.1347
Epoch [15/20], Step [278/627], L

Epoch [15/20], Step [445/627], Loss: 0.2190
Epoch [15/20], Step [446/627], Loss: 0.2215
Epoch [15/20], Step [447/627], Loss: 0.3353
Epoch [15/20], Step [448/627], Loss: 0.1199
Epoch [15/20], Step [449/627], Loss: 0.1133
Epoch [15/20], Step [450/627], Loss: 0.3527
Epoch [15/20], Step [451/627], Loss: 0.3047
Epoch [15/20], Step [452/627], Loss: 0.1067
Epoch [15/20], Step [453/627], Loss: 0.1614
Epoch [15/20], Step [454/627], Loss: 0.1238
Epoch [15/20], Step [455/627], Loss: 0.3360
Epoch [15/20], Step [456/627], Loss: 0.1925
Epoch [15/20], Step [457/627], Loss: 0.2351
Epoch [15/20], Step [458/627], Loss: 0.2502
Epoch [15/20], Step [459/627], Loss: 0.3492
Epoch [15/20], Step [460/627], Loss: 0.1939
Epoch [15/20], Step [461/627], Loss: 0.3257
Epoch [15/20], Step [462/627], Loss: 0.1146
Epoch [15/20], Step [463/627], Loss: 0.1102
Epoch [15/20], Step [464/627], Loss: 0.1173
Epoch [15/20], Step [465/627], Loss: 0.1942
Epoch [15/20], Step [466/627], Loss: 0.2730
Epoch [15/20], Step [467/627], L

Epoch [16/20], Step [5/627], Loss: 0.0679
Epoch [16/20], Step [6/627], Loss: 0.1549
Epoch [16/20], Step [7/627], Loss: 0.1478
Epoch [16/20], Step [8/627], Loss: 0.1578
Epoch [16/20], Step [9/627], Loss: 0.4777
Epoch [16/20], Step [10/627], Loss: 0.1390
Epoch [16/20], Step [11/627], Loss: 0.2887
Epoch [16/20], Step [12/627], Loss: 0.1711
Epoch [16/20], Step [13/627], Loss: 0.2569
Epoch [16/20], Step [14/627], Loss: 0.2766
Epoch [16/20], Step [15/627], Loss: 0.1701
Epoch [16/20], Step [16/627], Loss: 0.0925
Epoch [16/20], Step [17/627], Loss: 0.0654
Epoch [16/20], Step [18/627], Loss: 0.2990
Epoch [16/20], Step [19/627], Loss: 0.2419
Epoch [16/20], Step [20/627], Loss: 0.3798
Epoch [16/20], Step [21/627], Loss: 0.1087
Epoch [16/20], Step [22/627], Loss: 0.1806
Epoch [16/20], Step [23/627], Loss: 0.1459
Epoch [16/20], Step [24/627], Loss: 0.2154
Epoch [16/20], Step [25/627], Loss: 0.1699
Epoch [16/20], Step [26/627], Loss: 0.1768
Epoch [16/20], Step [27/627], Loss: 0.1627
Epoch [16/20], S

Epoch [16/20], Step [194/627], Loss: 0.1408
Epoch [16/20], Step [195/627], Loss: 0.1641
Epoch [16/20], Step [196/627], Loss: 0.1397
Epoch [16/20], Step [197/627], Loss: 0.2179
Epoch [16/20], Step [198/627], Loss: 0.1904
Epoch [16/20], Step [199/627], Loss: 0.2539
Epoch [16/20], Step [200/627], Loss: 0.0813
Epoch [16/20], Step [201/627], Loss: 0.1056
Epoch [16/20], Step [202/627], Loss: 0.1550
Epoch [16/20], Step [203/627], Loss: 0.2783
Epoch [16/20], Step [204/627], Loss: 0.0740
Epoch [16/20], Step [205/627], Loss: 0.1585
Epoch [16/20], Step [206/627], Loss: 0.1750
Epoch [16/20], Step [207/627], Loss: 0.1486
Epoch [16/20], Step [208/627], Loss: 0.1695
Epoch [16/20], Step [209/627], Loss: 0.1385
Epoch [16/20], Step [210/627], Loss: 0.2623
Epoch [16/20], Step [211/627], Loss: 0.1849
Epoch [16/20], Step [212/627], Loss: 0.0998
Epoch [16/20], Step [213/627], Loss: 0.1534
Epoch [16/20], Step [214/627], Loss: 0.2181
Epoch [16/20], Step [215/627], Loss: 0.1760
Epoch [16/20], Step [216/627], L

Epoch [16/20], Step [381/627], Loss: 0.0864
Epoch [16/20], Step [382/627], Loss: 0.2229
Epoch [16/20], Step [383/627], Loss: 0.0728
Epoch [16/20], Step [384/627], Loss: 0.1853
Epoch [16/20], Step [385/627], Loss: 0.3101
Epoch [16/20], Step [386/627], Loss: 0.1104
Epoch [16/20], Step [387/627], Loss: 0.1110
Epoch [16/20], Step [388/627], Loss: 0.1128
Epoch [16/20], Step [389/627], Loss: 0.2001
Epoch [16/20], Step [390/627], Loss: 0.2703
Epoch [16/20], Step [391/627], Loss: 0.4472
Epoch [16/20], Step [392/627], Loss: 0.1617
Epoch [16/20], Step [393/627], Loss: 0.1452
Epoch [16/20], Step [394/627], Loss: 0.2043
Epoch [16/20], Step [395/627], Loss: 0.1701
Epoch [16/20], Step [396/627], Loss: 0.1113
Epoch [16/20], Step [397/627], Loss: 0.1366
Epoch [16/20], Step [398/627], Loss: 0.3379
Epoch [16/20], Step [399/627], Loss: 0.1569
Epoch [16/20], Step [400/627], Loss: 0.1668
Epoch [16/20], Step [401/627], Loss: 0.1416
Epoch [16/20], Step [402/627], Loss: 0.0885
Epoch [16/20], Step [403/627], L

Epoch [16/20], Step [571/627], Loss: 0.2495
Epoch [16/20], Step [572/627], Loss: 0.2556
Epoch [16/20], Step [573/627], Loss: 0.2587
Epoch [16/20], Step [574/627], Loss: 0.2888
Epoch [16/20], Step [575/627], Loss: 0.2520
Epoch [16/20], Step [576/627], Loss: 0.2489
Epoch [16/20], Step [577/627], Loss: 0.2102
Epoch [16/20], Step [578/627], Loss: 0.0917
Epoch [16/20], Step [579/627], Loss: 0.2036
Epoch [16/20], Step [580/627], Loss: 0.1484
Epoch [16/20], Step [581/627], Loss: 0.1095
Epoch [16/20], Step [582/627], Loss: 0.1693
Epoch [16/20], Step [583/627], Loss: 0.2652
Epoch [16/20], Step [584/627], Loss: 0.1448
Epoch [16/20], Step [585/627], Loss: 0.1376
Epoch [16/20], Step [586/627], Loss: 0.3871
Epoch [16/20], Step [587/627], Loss: 0.1355
Epoch [16/20], Step [588/627], Loss: 0.2750
Epoch [16/20], Step [589/627], Loss: 0.0748
Epoch [16/20], Step [590/627], Loss: 0.2386
Epoch [16/20], Step [591/627], Loss: 0.3103
Epoch [16/20], Step [592/627], Loss: 0.1795
Epoch [16/20], Step [593/627], L

Epoch [17/20], Step [133/627], Loss: 0.1103
Epoch [17/20], Step [134/627], Loss: 0.2398
Epoch [17/20], Step [135/627], Loss: 0.1376
Epoch [17/20], Step [136/627], Loss: 0.0978
Epoch [17/20], Step [137/627], Loss: 0.1274
Epoch [17/20], Step [138/627], Loss: 0.1082
Epoch [17/20], Step [139/627], Loss: 0.2848
Epoch [17/20], Step [140/627], Loss: 0.2674
Epoch [17/20], Step [141/627], Loss: 0.1926
Epoch [17/20], Step [142/627], Loss: 0.1702
Epoch [17/20], Step [143/627], Loss: 0.1251
Epoch [17/20], Step [144/627], Loss: 0.2010
Epoch [17/20], Step [145/627], Loss: 0.1602
Epoch [17/20], Step [146/627], Loss: 0.1763
Epoch [17/20], Step [147/627], Loss: 0.1726
Epoch [17/20], Step [148/627], Loss: 0.1437
Epoch [17/20], Step [149/627], Loss: 0.0849
Epoch [17/20], Step [150/627], Loss: 0.3046
Epoch [17/20], Step [151/627], Loss: 0.0598
Epoch [17/20], Step [152/627], Loss: 0.4551
Epoch [17/20], Step [153/627], Loss: 0.2609
Epoch [17/20], Step [154/627], Loss: 0.2511
Epoch [17/20], Step [155/627], L

Epoch [17/20], Step [323/627], Loss: 0.1306
Epoch [17/20], Step [324/627], Loss: 0.0952
Epoch [17/20], Step [325/627], Loss: 0.4759
Epoch [17/20], Step [326/627], Loss: 0.2458
Epoch [17/20], Step [327/627], Loss: 0.1365
Epoch [17/20], Step [328/627], Loss: 0.1285
Epoch [17/20], Step [329/627], Loss: 0.2675
Epoch [17/20], Step [330/627], Loss: 0.1823
Epoch [17/20], Step [331/627], Loss: 0.3534
Epoch [17/20], Step [332/627], Loss: 0.1047
Epoch [17/20], Step [333/627], Loss: 0.1641
Epoch [17/20], Step [334/627], Loss: 0.2373
Epoch [17/20], Step [335/627], Loss: 0.0674
Epoch [17/20], Step [336/627], Loss: 0.0889
Epoch [17/20], Step [337/627], Loss: 0.1717
Epoch [17/20], Step [338/627], Loss: 0.0560
Epoch [17/20], Step [339/627], Loss: 0.2101
Epoch [17/20], Step [340/627], Loss: 0.2760
Epoch [17/20], Step [341/627], Loss: 0.2271
Epoch [17/20], Step [342/627], Loss: 0.1854
Epoch [17/20], Step [343/627], Loss: 0.2032
Epoch [17/20], Step [344/627], Loss: 0.2944
Epoch [17/20], Step [345/627], L

Epoch [17/20], Step [512/627], Loss: 0.1896
Epoch [17/20], Step [513/627], Loss: 0.1497
Epoch [17/20], Step [514/627], Loss: 0.0745
Epoch [17/20], Step [515/627], Loss: 0.1269
Epoch [17/20], Step [516/627], Loss: 0.0767
Epoch [17/20], Step [517/627], Loss: 0.1165
Epoch [17/20], Step [518/627], Loss: 0.0834
Epoch [17/20], Step [519/627], Loss: 0.1148
Epoch [17/20], Step [520/627], Loss: 0.0989
Epoch [17/20], Step [521/627], Loss: 0.1382
Epoch [17/20], Step [522/627], Loss: 0.2577
Epoch [17/20], Step [523/627], Loss: 0.2032
Epoch [17/20], Step [524/627], Loss: 0.2659
Epoch [17/20], Step [525/627], Loss: 0.2005
Epoch [17/20], Step [526/627], Loss: 0.1712
Epoch [17/20], Step [527/627], Loss: 0.3829
Epoch [17/20], Step [528/627], Loss: 0.1775
Epoch [17/20], Step [529/627], Loss: 0.2151
Epoch [17/20], Step [530/627], Loss: 0.1885
Epoch [17/20], Step [531/627], Loss: 0.1141
Epoch [17/20], Step [532/627], Loss: 0.1006
Epoch [17/20], Step [533/627], Loss: 0.1594
Epoch [17/20], Step [534/627], L

Epoch [18/20], Step [71/627], Loss: 0.1850
Epoch [18/20], Step [72/627], Loss: 0.0481
Epoch [18/20], Step [73/627], Loss: 0.2030
Epoch [18/20], Step [74/627], Loss: 0.1155
Epoch [18/20], Step [75/627], Loss: 0.2155
Epoch [18/20], Step [76/627], Loss: 0.1207
Epoch [18/20], Step [77/627], Loss: 0.2024
Epoch [18/20], Step [78/627], Loss: 0.1223
Epoch [18/20], Step [79/627], Loss: 0.0513
Epoch [18/20], Step [80/627], Loss: 0.2134
Epoch [18/20], Step [81/627], Loss: 0.2338
Epoch [18/20], Step [82/627], Loss: 0.0592
Epoch [18/20], Step [83/627], Loss: 0.2560
Epoch [18/20], Step [84/627], Loss: 0.1029
Epoch [18/20], Step [85/627], Loss: 0.0994
Epoch [18/20], Step [86/627], Loss: 0.1071
Epoch [18/20], Step [87/627], Loss: 0.0980
Epoch [18/20], Step [88/627], Loss: 0.1550
Epoch [18/20], Step [89/627], Loss: 0.0898
Epoch [18/20], Step [90/627], Loss: 0.0786
Epoch [18/20], Step [91/627], Loss: 0.1072
Epoch [18/20], Step [92/627], Loss: 0.0493
Epoch [18/20], Step [93/627], Loss: 0.0585
Epoch [18/2

Epoch [18/20], Step [260/627], Loss: 0.3462
Epoch [18/20], Step [261/627], Loss: 0.1079
Epoch [18/20], Step [262/627], Loss: 0.1144
Epoch [18/20], Step [263/627], Loss: 0.1772
Epoch [18/20], Step [264/627], Loss: 0.1400
Epoch [18/20], Step [265/627], Loss: 0.2884
Epoch [18/20], Step [266/627], Loss: 0.1238
Epoch [18/20], Step [267/627], Loss: 0.2039
Epoch [18/20], Step [268/627], Loss: 0.0872
Epoch [18/20], Step [269/627], Loss: 0.1685
Epoch [18/20], Step [270/627], Loss: 0.1512
Epoch [18/20], Step [271/627], Loss: 0.0990
Epoch [18/20], Step [272/627], Loss: 0.1865
Epoch [18/20], Step [273/627], Loss: 0.4092
Epoch [18/20], Step [274/627], Loss: 0.2394
Epoch [18/20], Step [275/627], Loss: 0.2296
Epoch [18/20], Step [276/627], Loss: 0.1165
Epoch [18/20], Step [277/627], Loss: 0.2403
Epoch [18/20], Step [278/627], Loss: 0.2586
Epoch [18/20], Step [279/627], Loss: 0.4097
Epoch [18/20], Step [280/627], Loss: 0.1465
Epoch [18/20], Step [281/627], Loss: 0.0834
Epoch [18/20], Step [282/627], L

Epoch [18/20], Step [450/627], Loss: 0.1978
Epoch [18/20], Step [451/627], Loss: 0.1525
Epoch [18/20], Step [452/627], Loss: 0.1008
Epoch [18/20], Step [453/627], Loss: 0.0729
Epoch [18/20], Step [454/627], Loss: 0.1184
Epoch [18/20], Step [455/627], Loss: 0.1103
Epoch [18/20], Step [456/627], Loss: 0.3012
Epoch [18/20], Step [457/627], Loss: 0.1124
Epoch [18/20], Step [458/627], Loss: 0.1305
Epoch [18/20], Step [459/627], Loss: 0.1075
Epoch [18/20], Step [460/627], Loss: 0.0709
Epoch [18/20], Step [461/627], Loss: 0.3735
Epoch [18/20], Step [462/627], Loss: 0.1110
Epoch [18/20], Step [463/627], Loss: 0.1376
Epoch [18/20], Step [464/627], Loss: 0.1768
Epoch [18/20], Step [465/627], Loss: 0.1473
Epoch [18/20], Step [466/627], Loss: 0.1083
Epoch [18/20], Step [467/627], Loss: 0.1150
Epoch [18/20], Step [468/627], Loss: 0.1122
Epoch [18/20], Step [469/627], Loss: 0.1497
Epoch [18/20], Step [470/627], Loss: 0.1878
Epoch [18/20], Step [471/627], Loss: 0.1384
Epoch [18/20], Step [472/627], L

Epoch [19/20], Step [10/627], Loss: 0.2560
Epoch [19/20], Step [11/627], Loss: 0.1277
Epoch [19/20], Step [12/627], Loss: 0.1621
Epoch [19/20], Step [13/627], Loss: 0.1952
Epoch [19/20], Step [14/627], Loss: 0.1408
Epoch [19/20], Step [15/627], Loss: 0.1110
Epoch [19/20], Step [16/627], Loss: 0.1140
Epoch [19/20], Step [17/627], Loss: 0.0864
Epoch [19/20], Step [18/627], Loss: 0.1591
Epoch [19/20], Step [19/627], Loss: 0.2817
Epoch [19/20], Step [20/627], Loss: 0.1292
Epoch [19/20], Step [21/627], Loss: 0.1646
Epoch [19/20], Step [22/627], Loss: 0.1238
Epoch [19/20], Step [23/627], Loss: 0.1078
Epoch [19/20], Step [24/627], Loss: 0.1190
Epoch [19/20], Step [25/627], Loss: 0.1266
Epoch [19/20], Step [26/627], Loss: 0.1364
Epoch [19/20], Step [27/627], Loss: 0.1250
Epoch [19/20], Step [28/627], Loss: 0.2189
Epoch [19/20], Step [29/627], Loss: 0.0897
Epoch [19/20], Step [30/627], Loss: 0.1842
Epoch [19/20], Step [31/627], Loss: 0.0995
Epoch [19/20], Step [32/627], Loss: 0.1215
Epoch [19/2

Epoch [19/20], Step [201/627], Loss: 0.2487
Epoch [19/20], Step [202/627], Loss: 0.0319
Epoch [19/20], Step [203/627], Loss: 0.2028
Epoch [19/20], Step [204/627], Loss: 0.1096
Epoch [19/20], Step [205/627], Loss: 0.0558
Epoch [19/20], Step [206/627], Loss: 0.0936
Epoch [19/20], Step [207/627], Loss: 0.1472
Epoch [19/20], Step [208/627], Loss: 0.1405
Epoch [19/20], Step [209/627], Loss: 0.0579
Epoch [19/20], Step [210/627], Loss: 0.3410
Epoch [19/20], Step [211/627], Loss: 0.1123
Epoch [19/20], Step [212/627], Loss: 0.1723
Epoch [19/20], Step [213/627], Loss: 0.0671
Epoch [19/20], Step [214/627], Loss: 0.1441
Epoch [19/20], Step [215/627], Loss: 0.1321
Epoch [19/20], Step [216/627], Loss: 0.2011
Epoch [19/20], Step [217/627], Loss: 0.0559
Epoch [19/20], Step [218/627], Loss: 0.1001
Epoch [19/20], Step [219/627], Loss: 0.1007
Epoch [19/20], Step [220/627], Loss: 0.0649
Epoch [19/20], Step [221/627], Loss: 0.0451
Epoch [19/20], Step [222/627], Loss: 0.4417
Epoch [19/20], Step [223/627], L

Epoch [19/20], Step [389/627], Loss: 0.0537
Epoch [19/20], Step [390/627], Loss: 0.1909
Epoch [19/20], Step [391/627], Loss: 0.2339
Epoch [19/20], Step [392/627], Loss: 0.1008
Epoch [19/20], Step [393/627], Loss: 0.0595
Epoch [19/20], Step [394/627], Loss: 0.0923
Epoch [19/20], Step [395/627], Loss: 0.1753
Epoch [19/20], Step [396/627], Loss: 0.1225
Epoch [19/20], Step [397/627], Loss: 0.1166
Epoch [19/20], Step [398/627], Loss: 0.1511
Epoch [19/20], Step [399/627], Loss: 0.1105
Epoch [19/20], Step [400/627], Loss: 0.0541
Epoch [19/20], Step [401/627], Loss: 0.0906
Epoch [19/20], Step [402/627], Loss: 0.3249
Epoch [19/20], Step [403/627], Loss: 0.1970
Epoch [19/20], Step [404/627], Loss: 0.0452
Epoch [19/20], Step [405/627], Loss: 0.1239
Epoch [19/20], Step [406/627], Loss: 0.0575
Epoch [19/20], Step [407/627], Loss: 0.0593
Epoch [19/20], Step [408/627], Loss: 0.0894
Epoch [19/20], Step [409/627], Loss: 0.2424
Epoch [19/20], Step [410/627], Loss: 0.2118
Epoch [19/20], Step [411/627], L

Epoch [19/20], Step [578/627], Loss: 0.2069
Epoch [19/20], Step [579/627], Loss: 0.0980
Epoch [19/20], Step [580/627], Loss: 0.1908
Epoch [19/20], Step [581/627], Loss: 0.1251
Epoch [19/20], Step [582/627], Loss: 0.1368
Epoch [19/20], Step [583/627], Loss: 0.1076
Epoch [19/20], Step [584/627], Loss: 0.1572
Epoch [19/20], Step [585/627], Loss: 0.0976
Epoch [19/20], Step [586/627], Loss: 0.1032
Epoch [19/20], Step [587/627], Loss: 0.2341
Epoch [19/20], Step [588/627], Loss: 0.0526
Epoch [19/20], Step [589/627], Loss: 0.1072
Epoch [19/20], Step [590/627], Loss: 0.0743
Epoch [19/20], Step [591/627], Loss: 0.1707
Epoch [19/20], Step [592/627], Loss: 0.1411
Epoch [19/20], Step [593/627], Loss: 0.2955
Epoch [19/20], Step [594/627], Loss: 0.1114
Epoch [19/20], Step [595/627], Loss: 0.1049
Epoch [19/20], Step [596/627], Loss: 0.1077
Epoch [19/20], Step [597/627], Loss: 0.1568
Epoch [19/20], Step [598/627], Loss: 0.0413
Epoch [19/20], Step [599/627], Loss: 0.1896
Epoch [19/20], Step [600/627], L

Epoch [20/20], Step [142/627], Loss: 0.0706
Epoch [20/20], Step [143/627], Loss: 0.3258
Epoch [20/20], Step [144/627], Loss: 0.0841
Epoch [20/20], Step [145/627], Loss: 0.0696
Epoch [20/20], Step [146/627], Loss: 0.0918
Epoch [20/20], Step [147/627], Loss: 0.0902
Epoch [20/20], Step [148/627], Loss: 0.0426
Epoch [20/20], Step [149/627], Loss: 0.0830
Epoch [20/20], Step [150/627], Loss: 0.0818
Epoch [20/20], Step [151/627], Loss: 0.0372
Epoch [20/20], Step [152/627], Loss: 0.0588
Epoch [20/20], Step [153/627], Loss: 0.1126
Epoch [20/20], Step [154/627], Loss: 0.3691
Epoch [20/20], Step [155/627], Loss: 0.1007
Epoch [20/20], Step [156/627], Loss: 0.3815
Epoch [20/20], Step [157/627], Loss: 0.1526
Epoch [20/20], Step [158/627], Loss: 0.1116
Epoch [20/20], Step [159/627], Loss: 0.1574
Epoch [20/20], Step [160/627], Loss: 0.1052
Epoch [20/20], Step [161/627], Loss: 0.1394
Epoch [20/20], Step [162/627], Loss: 0.0711
Epoch [20/20], Step [163/627], Loss: 0.0594
Epoch [20/20], Step [164/627], L

Epoch [20/20], Step [329/627], Loss: 0.1712
Epoch [20/20], Step [330/627], Loss: 0.1102
Epoch [20/20], Step [331/627], Loss: 0.1558
Epoch [20/20], Step [332/627], Loss: 0.2400
Epoch [20/20], Step [333/627], Loss: 0.2213
Epoch [20/20], Step [334/627], Loss: 0.2656
Epoch [20/20], Step [335/627], Loss: 0.0644
Epoch [20/20], Step [336/627], Loss: 0.2133
Epoch [20/20], Step [337/627], Loss: 0.2185
Epoch [20/20], Step [338/627], Loss: 0.3851
Epoch [20/20], Step [339/627], Loss: 0.1042
Epoch [20/20], Step [340/627], Loss: 0.1179
Epoch [20/20], Step [341/627], Loss: 0.2352
Epoch [20/20], Step [342/627], Loss: 0.1773
Epoch [20/20], Step [343/627], Loss: 0.1335
Epoch [20/20], Step [344/627], Loss: 0.0539
Epoch [20/20], Step [345/627], Loss: 0.0870
Epoch [20/20], Step [346/627], Loss: 0.0714
Epoch [20/20], Step [347/627], Loss: 0.0414
Epoch [20/20], Step [348/627], Loss: 0.0557
Epoch [20/20], Step [349/627], Loss: 0.1333
Epoch [20/20], Step [350/627], Loss: 0.1003
Epoch [20/20], Step [351/627], L

Epoch [20/20], Step [518/627], Loss: 0.1368
Epoch [20/20], Step [519/627], Loss: 0.0748
Epoch [20/20], Step [520/627], Loss: 0.1280
Epoch [20/20], Step [521/627], Loss: 0.1304
Epoch [20/20], Step [522/627], Loss: 0.2236
Epoch [20/20], Step [523/627], Loss: 0.0716
Epoch [20/20], Step [524/627], Loss: 0.1908
Epoch [20/20], Step [525/627], Loss: 0.1767
Epoch [20/20], Step [526/627], Loss: 0.0986
Epoch [20/20], Step [527/627], Loss: 0.2276
Epoch [20/20], Step [528/627], Loss: 0.1134
Epoch [20/20], Step [529/627], Loss: 0.1102
Epoch [20/20], Step [530/627], Loss: 0.0863
Epoch [20/20], Step [531/627], Loss: 0.1026
Epoch [20/20], Step [532/627], Loss: 0.1043
Epoch [20/20], Step [533/627], Loss: 0.2019
Epoch [20/20], Step [534/627], Loss: 0.0780
Epoch [20/20], Step [535/627], Loss: 0.1427
Epoch [20/20], Step [536/627], Loss: 0.0553
Epoch [20/20], Step [537/627], Loss: 0.0733
Epoch [20/20], Step [538/627], Loss: 0.0884
Epoch [20/20], Step [539/627], Loss: 0.0606
Epoch [20/20], Step [540/627], L

In [41]:
# Display the epoch stored in `best_epoch` (assigned outside this cell;
# presumably the epoch whose checkpoint was kept as best -- confirm in the training cell).
best_epoch

17

In [42]:
# Evaluate the model currently held in memory on the test set.
# eval() switches the network to inference mode, which turns Dropout into a no-op.
model.eval()

pred_chunks = []
label_chunks = []
with torch.no_grad():  # evaluation only: no autograd graph is needed
    for batch in test_loader:
        images = batch['outer_product'].to(device)

        # Forward pass; flatten so every batch contributes a 1-D vector.
        outputs = model(images)
        pred_chunks.append(outputs.cpu().detach().numpy().flatten())
        # Labels are only compared on the host, so they are not moved to the device.
        label_chunks.append(batch['Label'].cpu().detach().numpy().flatten())

# Concatenate once instead of re-copying the growing array on every batch.
# The leading empty float64 array keeps the result dtype float64 and makes an
# empty loader yield empty arrays, matching the previous accumulation exactly.
total_preds = np.concatenate([np.array([]), *pred_chunks])
total_labels = np.concatenate([np.array([]), *label_chunks])

In [43]:
# G = ground-truth labels, P = model predictions, both gathered by the
# evaluation loop in the previous cell.
G,P = total_labels, total_preds

In [44]:
# Root-mean-square error between labels G and predictions P
# (`rmse` is defined outside this cell).
rmse(G,P)

0.9435996056646103

In [45]:
# Mean squared error between labels G and predictions P
# (`mse` is defined outside this cell).
mse(G,P)

0.8903802158104082

In [46]:
# Presumably the Pearson correlation coefficient between G and P --
# `pearson` is defined outside this cell, confirm there.
pearson(G,P)

0.35047573919117125

In [47]:
# Presumably the concordance index between G and P --
# `ci` is defined outside this cell, confirm there.
ci(G,P)

0.68872536919979

In [48]:
# Build a fresh ConvNet on `device`; its initial weights are replaced by the
# checkpoint loaded in the next cell.
model = ConvNet().to(device)

In [50]:
# Restore the weights stored in the fold-2x checkpoint file.
# map_location remaps the saved tensors onto `device`, so a checkpoint written
# from GPU tensors also loads on a CPU-only machine.
model.load_state_dict(torch.load('./best_sim-CNN-DTA_davis_fold2x.model', map_location=device))

<All keys matched successfully>

In [51]:
# Switch the reloaded model to inference mode (Dropout becomes a no-op).
# eval() returns the module itself, so the cell output is the module repr.
model.eval()


ConvNet(
  (conv1): Conv2d(1, 32, kernel_size=(5, 5), stride=(1, 1))
  (pool1): MaxPool2d(kernel_size=2, stride=2, padding=0, dilation=1, ceil_mode=False)
  (conv2): Conv2d(32, 18, kernel_size=(3, 3), stride=(1, 1))
  (pool2): MaxPool2d(kernel_size=2, stride=2, padding=0, dilation=1, ceil_mode=False)
  (fc1): Linear(in_features=17820, out_features=128, bias=True)
  (fc2): Linear(in_features=128, out_features=1, bias=True)
  (dropout): Dropout(p=0.1, inplace=False)
)

In [52]:
# Evaluate the reloaded checkpoint on the test set and gather predictions
# and labels as flat NumPy arrays.
pred_chunks = []
label_chunks = []
with torch.no_grad():  # evaluation only: no autograd graph is needed
    for batch in test_loader:
        images = batch['outer_product'].to(device)

        # Forward pass; flatten so every batch contributes a 1-D vector.
        outputs = model(images)
        pred_chunks.append(outputs.cpu().detach().numpy().flatten())
        # Labels are only compared on the host, so they are not moved to the device.
        label_chunks.append(batch['Label'].cpu().detach().numpy().flatten())

# Concatenate once instead of re-copying the growing array on every batch.
# The leading empty float64 array keeps the result dtype float64 and makes an
# empty loader yield empty arrays, matching the previous accumulation exactly.
total_preds = np.concatenate([np.array([]), *pred_chunks])
total_labels = np.concatenate([np.array([]), *label_chunks])

In [53]:
# G = ground-truth labels, P = predictions of the reloaded checkpoint, both
# gathered by the evaluation loop in the previous cell.
G,P = total_labels, total_preds

In [54]:
# Root-mean-square error between labels G and predictions P
# (`rmse` is defined outside this cell).
rmse(G,P)

0.8857288421190969

In [55]:
# Print every test-set metric for the current G/P pair in one place.
# Each label keeps its trailing space; print's default separator adds the second one.
for label, metric in (("MSE = ", mse), ("R = ", pearson), ("CI = ", ci), ("RMSE = ", rmse)):
    print(label, metric(G, P))


MSE =  0.7845155817616359
R =  0.4063060107522774
CI =  0.720438629378811
RMSE =  0.8857288421190969
