In [1]:
import torch 
import json,pickle,math
import pandas as pd
import numpy as np
import torch.nn as nn
import torchvision
import torchvision.transforms as transforms


In [2]:
full_df = pd.read_csv(open('../davis_all_pairs.csv','r'))

In [3]:
all_9_folds={}
for i in [0,1,2]:
    for j in [0,1,2]:
        file_name = 'fold' +str(i) +str(j) 
        
        temp = open('../data/davis/DAVIS_9_FOLDS/' + file_name +'.pkl', 'rb')
        new_df = pd.read_pickle(temp)
        all_9_folds.update({file_name:new_df})
        temp.close()
        

In [5]:
def create_davis_test_train(test_fold_number,all_9_folds):
    test_protein_fold_id = test_fold_number[0]
    test_ligand_fold_id = test_fold_number[1]
    test_set = pd.DataFrame(columns = full_df.columns)
    train_set = pd.DataFrame(columns= full_df.columns)
    for i in [0,1,2]:
        for j in [0,1,2]:
            fold_name = 'fold' + str(i) + str(j)
            df = all_9_folds[fold_name]
            
            if str(i) == test_protein_fold_id:
                test_set = pd.concat([test_set, df.copy()], ignore_index=True)
                
            if str(i) != test_protein_fold_id:
                print("train ->",i, j)
                train_set = pd.concat([train_set, df.copy()], ignore_index=True)
                
                
    return train_set, test_set


# Create train test split on these 9 folds
## fold_number is the id of fold. For example, test = fold00, train = fold 11,22,12,21

In [6]:
fold_number = '1x'

In [7]:
train, test = create_davis_test_train(test_fold_number=fold_number, all_9_folds=all_9_folds)

train -> 0 0
train -> 0 1
train -> 0 2
train -> 2 0
train -> 2 1
train -> 2 2


In [9]:
# train

In [11]:
# test

# To ensure that there are no common targets or drugs in train and test


In [12]:
test_smiles = list(test['SMILES'])
test_targets = list(test['Target Sequence'])
train_smiles = list(train['SMILES'])
train_targets = list(train['Target Sequence'])

# for i in test_smiles:
#     if i in train_smiles:
#         print("common entity present")
for i in test_targets:
    if i in train_targets:
        print("common entity present")


# Creating similarity matrices for this fold

In [13]:
import rdkit
from rdkit.Chem import AllChem as Chem
from rdkit.Chem import AllChem
from rdkit.DataStructs import FingerprintSimilarity as fs
from rdkit.Chem.Fingerprints import FingerprintMols
from Bio import pairwise2

In [14]:
train_targets = list(set(list(train['Target Sequence'])))
train_smiles = list(set(list(train['SMILES'])))

def computeLigandSimilarity(smiles):
    fingerprints = {}
    for smile in smiles:
        mol = AllChem.MolFromSmiles(smile)
        if mol == None:
            mol = AllChem.MolFromSmiles(smile, sanitize=False)
        fp = FingerprintMols.FingerprintMol(mol)
        fingerprints[smile] = fp
    
    n = len(smiles)
    sims = np.zeros((n, n))
    for i in range(n):
        for j in range(i+1):
            fpi = fingerprints[smiles[i]]
            fpj = fingerprints[smiles[j]]
            sim = fs(fpi, fpj)
            sims[i, j] = sims[j, i] = sim
    return sims

def computeProteinSimilarity(targets):
    n = len(targets)
    mat = np.zeros((n,n))
    mat_i = np.zeros(n)
    for i in range(n):
        seq = targets[i]
        s = pairwise2.align.localxx(seq,seq, score_only=True)
        mat_i[i] = s
        
    for i in range(n):
        print(i)
        for j in range(n):
            if mat[i][j] == 0 :
                s1 = targets[i]
                s2 = targets[j]
                sw_ij = pairwise2.align.localxx(s1,s2,score_only=True)
                normalized_score = sw_ij /math.sqrt(mat_i[i]*mat_i[j])
                mat[i][j] = mat[j][i] = normalized_score
    
    return mat

In [15]:
ligand_similarity_matrix = computeLigandSimilarity(train_smiles)

In [16]:
np.shape(ligand_similarity_matrix)

(68, 68)

In [17]:
print(len(train_targets))
protein_similarity_matrix = computeProteinSimilarity(train_targets)

248
0
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247


In [18]:
np.shape(protein_similarity_matrix)

(248, 248)

In [19]:
LSM = ligand_similarity_matrix
PSM = protein_similarity_matrix

# creating outer products for train set

In [20]:
outer_train_prods = []
for i,row in train.iterrows():
#     print(i)
    smi = row['SMILES']
    seq = row['Target Sequence']
    target_id = train_targets.index(seq)
    smi_id = train_smiles.index(smi)
    ki=LSM[smi_id]
    kj=PSM[target_id]
    ki_x_kj = np.outer(ki,kj)
    outer_train_prods.append([ki_x_kj])
outer_train_prods = np.array(outer_train_prods)
print(np.shape(outer_train_prods))

(20060, 1, 68, 248)


# Creating similarity matrcies for test set

In [21]:
test_targets = list(set(list(test['Target Sequence'])))
test_smiles = list(set(list(test['SMILES'])))

In [22]:
test_PSM = np.zeros((len(test_targets), len(train_targets)))
np.shape(test_PSM)

(131, 248)

In [23]:
s_train_PSM = np.zeros(len(train_targets))
s_test_PSM = np.zeros(len(test_targets))

for i in range(len(train_targets)):
    seq = train_targets[i]
    s_train_PSM[i] = pairwise2.align.localxx(seq,seq, score_only=True)
    
for i in range(len(test_targets)):
    seq = test_targets[i]
    s_test_PSM[i] = pairwise2.align.localxx(seq,seq, score_only=True)
    
for i in range(len(test_targets)):
    print(i)
    for j in range(len(train_targets)):
        seq1 = test_targets[i]
        seq2 = train_targets[j]
        s_ij=pairwise2.align.localxx(seq1, seq2, score_only=True)
        N_S = s_ij / math.sqrt(s_train_PSM[j] * s_test_PSM[i])
        test_PSM[i][j] = N_S

0
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130


In [24]:
test_LSM = np.zeros((len(test_smiles), len(train_smiles)))
np.shape(test_LSM)

(68, 68)

In [25]:
for i in range(len(test_smiles)):
    print(i)
    for j in range(len(train_smiles)):
        smi1 = test_smiles[i]
        smi2 = train_smiles[j]
        
        mol1 = AllChem.MolFromSmiles(smi1)
        if mol1 == None:
            mol1= AllChem.MolFromSmiles(smi1, sanitize=False)
        fp1 = FingerprintMols.FingerprintMol(mol1)
        
        mol2 = AllChem.MolFromSmiles(smi2)
        if mol2 == None:
            mol2= AllChem.MolFromSmiles(smi2, sanitize=False)
        fp2 = FingerprintMols.FingerprintMol(mol2)
        
        test_LSM[i][j] = fs(fp1,fp2)

0
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67


# Creating outer products for test set

In [26]:
outer_test_prods = []
for i,row in test.iterrows():
#     print(i)
    smi = row['SMILES']
    seq = row['Target Sequence']
    target_id = test_targets.index(seq)
    smi_id = test_smiles.index(smi)
    ki=test_LSM[smi_id]
    kj=test_PSM[target_id]
    ki_x_kj = np.outer(ki,kj)
    outer_test_prods.append([ki_x_kj])
outer_test_prods = np.array(outer_test_prods)
print(np.shape(outer_test_prods))

(9996, 1, 68, 248)


In [27]:
# Device configuration
device = torch.device('cuda:0' if torch.cuda.is_available() else 'cpu')

# Hyper parameters
num_epochs = 20
# num_classes = 10
batch_size = 32
learning_rate = 0.001

In [28]:
device

device(type='cuda', index=0)

In [29]:
class custom_dataset(torch.utils.data.Dataset):
    def __init__(self, dataframe, outer_prods, transform=None):
#         self.df = pd.read_csv(open(csv_file))
        self.df = dataframe
#         self.root_dir = root_dir
        self.transform = transform
        self.outer_prods = outer_prods
        
    def __len__(self):
        return len(self.df)
    
    def __getitem__(self, idx):
        output = {'outer_product': self.outer_prods[idx] , 'Label':self.df.iloc[idx]['Label']}
        return output

In [30]:
train_dataset = custom_dataset(dataframe = train, outer_prods = outer_train_prods)
test_dataset = custom_dataset(dataframe = test, outer_prods = outer_test_prods)


In [31]:
train_loader= torch.utils.data.DataLoader(train_dataset, batch_size=batch_size, shuffle=True)
test_loader= torch.utils.data.DataLoader(test_dataset, batch_size=batch_size, shuffle=True)

In [32]:
print(len(train_loader)*32, len(test_loader)*32)

20064 10016


In [35]:
# for i in test_loader:
#     a = i['outer_product']
#     b= i['Label']
#     break
# conv1 = nn.Conv2d(1,32,5).double()
# pool = nn.MaxPool2d(2,2).double()
# conv2 = nn.Conv2d(32,18,3).double()
# fc1 = nn.Linear(18*15*60, 128).double()
# fc2 = nn.Linear(128,1).double()
# dropout = nn.Dropout(0.1).double()
# x= conv1(a)
# print(x.shape)
# x = pool(x)
# print(x.shape)
# x= conv2(x)
# print(x.shape)
# x = pool(x)
# print(x.shape)
# x = x.view(-1,18*15*60)
# print(x.shape)
# x = dropout(x)
# print(x.shape)
# x = fc1(x)
# print(x.shape)
# x = fc2(x)
# print(x.shape)

In [37]:
import torch.nn.functional as F

class ConvNet(nn.Module):
    def __init__(self):
        super(ConvNet, self).__init__()
        self.conv1 = nn.Conv2d(1,32, 5).double()
        self.pool1 = nn.MaxPool2d(2,2).double()
        self.conv2 = nn.Conv2d(32,18,3).double()
        self.pool2 = nn.MaxPool2d(2,2).double()
        self.fc1 = nn.Linear(18*15*60, 128).double()
        self.fc2 = nn.Linear(128,1).double()
        self.dropout = nn.Dropout(0.1).double()
    def forward(self, x):
        x = F.relu(self.conv1(x))
        x = self.pool1(x)
        x = F.relu(self.conv2(x))
        x = self.pool2(x)
        x = x.view(-1,18*15*60)
        x = self.dropout(x)
        x = F.relu(self.fc1(x))
        x = self.fc2(x)
        
        
        return x
    

In [38]:
model = ConvNet().to(device)

In [39]:
# Loss and optimizer
criterion = nn.MSELoss()
optimizer = torch.optim.Adam(model.parameters(), lr=learning_rate)


# Evaluation metrics

In [40]:
def rmse(y,f):
    rmse = math.sqrt(((y - f)**2).mean(axis=0))
    return rmse
def mse(y,f):
    mse = ((y - f)**2).mean(axis=0)
    return mse
def pearson(y,f):
    rp = np.corrcoef(y, f)[0,1]
    return rp
from lifelines.utils import concordance_index
def ci(y,f):
    return concordance_index(y,f)

In [41]:
def predicting(model, device, test_loader):
    model.eval()
    total_preds = np.array([])
    total_labels = np.array([])
    with torch.no_grad():
        for i in test_loader:
            images = i['outer_product']
            labels = i['Label']
            images = images.to(device)
            labels = labels.to(device)

            # Forward pass
            outputs = model(images) 
            outputs = outputs.cpu().detach().numpy().flatten()
            labels =labels.cpu().detach().numpy().flatten()
            total_preds = np.concatenate([total_preds, outputs])
            total_labels = np.concatenate([total_labels, labels])
    
    model.train()
    return total_labels, total_preds

# Train the model


In [42]:
model_file_name = 'best_sim-CNN-DTA_davis_fold' + fold_number +  '.model'
result_file_name = 'best_result_sim-CNNDTA_davis_fold'+fold_number + '.csv'

In [43]:
# Train the model
best_mse = 1000
best_ci = 0

total_step = len(train_loader)
for epoch in range(num_epochs):
    c=0
    for i in train_loader:
        c=c+1
        images = i['outer_product']
        labels = i['Label']
        images = images.to(device)
        labels = labels.to(device)
        
        # Forward pass
        outputs = model(images)
        loss = criterion(outputs.flatten(), labels)
        
        # Backward and optimize
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()
           
        print ('Epoch [{}/{}], Step [{}/{}], Loss: {:.4f}' 
               .format(epoch+1, num_epochs, c, total_step, loss.item()))
    
    # taking best model so far
    G,P = predicting(model, device, test_loader)
    ret = [rmse(G, P), mse(G, P), pearson(G, P), ci(G, P)]
    if ret[1] < best_mse:
        torch.save(model.state_dict(), model_file_name)
        with open(result_file_name, 'w') as f:
            f.write(','.join(map(str, ret)))
        best_epoch = epoch+1
        best_mse = ret[1]
        best_ci = ret[-1]
        best_r = ret[2]
        
        print('rmse improved at epoch ', best_epoch,
                      '; best_mse,best_ci,best_r:', best_mse, best_ci,best_r)
        
        

Epoch [1/20], Step [1/627], Loss: 32.7357
Epoch [1/20], Step [2/627], Loss: 13.1218
Epoch [1/20], Step [3/627], Loss: 1.7689
Epoch [1/20], Step [4/627], Loss: 13.6573
Epoch [1/20], Step [5/627], Loss: 7.4127
Epoch [1/20], Step [6/627], Loss: 1.2893
Epoch [1/20], Step [7/627], Loss: 0.9056
Epoch [1/20], Step [8/627], Loss: 2.9469
Epoch [1/20], Step [9/627], Loss: 5.7408
Epoch [1/20], Step [10/627], Loss: 3.8345
Epoch [1/20], Step [11/627], Loss: 4.6607
Epoch [1/20], Step [12/627], Loss: 2.2109
Epoch [1/20], Step [13/627], Loss: 0.3441
Epoch [1/20], Step [14/627], Loss: 1.3227
Epoch [1/20], Step [15/627], Loss: 1.5263
Epoch [1/20], Step [16/627], Loss: 2.8759
Epoch [1/20], Step [17/627], Loss: 2.0767
Epoch [1/20], Step [18/627], Loss: 1.6039
Epoch [1/20], Step [19/627], Loss: 0.5003
Epoch [1/20], Step [20/627], Loss: 0.3320
Epoch [1/20], Step [21/627], Loss: 0.9651
Epoch [1/20], Step [22/627], Loss: 1.4105
Epoch [1/20], Step [23/627], Loss: 2.9576
Epoch [1/20], Step [24/627], Loss: 1.127

Epoch [1/20], Step [195/627], Loss: 0.4198
Epoch [1/20], Step [196/627], Loss: 0.8411
Epoch [1/20], Step [197/627], Loss: 1.5083
Epoch [1/20], Step [198/627], Loss: 0.8217
Epoch [1/20], Step [199/627], Loss: 0.3428
Epoch [1/20], Step [200/627], Loss: 1.2091
Epoch [1/20], Step [201/627], Loss: 0.8951
Epoch [1/20], Step [202/627], Loss: 0.4687
Epoch [1/20], Step [203/627], Loss: 1.2850
Epoch [1/20], Step [204/627], Loss: 0.3859
Epoch [1/20], Step [205/627], Loss: 0.2431
Epoch [1/20], Step [206/627], Loss: 0.7551
Epoch [1/20], Step [207/627], Loss: 0.6036
Epoch [1/20], Step [208/627], Loss: 1.0901
Epoch [1/20], Step [209/627], Loss: 0.4512
Epoch [1/20], Step [210/627], Loss: 0.6756
Epoch [1/20], Step [211/627], Loss: 0.6241
Epoch [1/20], Step [212/627], Loss: 0.1999
Epoch [1/20], Step [213/627], Loss: 1.2124
Epoch [1/20], Step [214/627], Loss: 1.0988
Epoch [1/20], Step [215/627], Loss: 0.8403
Epoch [1/20], Step [216/627], Loss: 0.3440
Epoch [1/20], Step [217/627], Loss: 0.4665
Epoch [1/20

Epoch [1/20], Step [390/627], Loss: 1.0355
Epoch [1/20], Step [391/627], Loss: 0.3865
Epoch [1/20], Step [392/627], Loss: 0.1918
Epoch [1/20], Step [393/627], Loss: 0.6508
Epoch [1/20], Step [394/627], Loss: 0.5955
Epoch [1/20], Step [395/627], Loss: 0.7984
Epoch [1/20], Step [396/627], Loss: 0.7968
Epoch [1/20], Step [397/627], Loss: 0.9288
Epoch [1/20], Step [398/627], Loss: 1.1351
Epoch [1/20], Step [399/627], Loss: 1.0189
Epoch [1/20], Step [400/627], Loss: 0.7427
Epoch [1/20], Step [401/627], Loss: 0.5901
Epoch [1/20], Step [402/627], Loss: 0.3341
Epoch [1/20], Step [403/627], Loss: 0.5085
Epoch [1/20], Step [404/627], Loss: 0.9117
Epoch [1/20], Step [405/627], Loss: 0.5158
Epoch [1/20], Step [406/627], Loss: 1.0352
Epoch [1/20], Step [407/627], Loss: 1.1088
Epoch [1/20], Step [408/627], Loss: 0.7156
Epoch [1/20], Step [409/627], Loss: 1.0124
Epoch [1/20], Step [410/627], Loss: 0.3907
Epoch [1/20], Step [411/627], Loss: 0.7887
Epoch [1/20], Step [412/627], Loss: 0.9136
Epoch [1/20

Epoch [1/20], Step [585/627], Loss: 0.9651
Epoch [1/20], Step [586/627], Loss: 0.3563
Epoch [1/20], Step [587/627], Loss: 0.4585
Epoch [1/20], Step [588/627], Loss: 0.4912
Epoch [1/20], Step [589/627], Loss: 0.2974
Epoch [1/20], Step [590/627], Loss: 0.3622
Epoch [1/20], Step [591/627], Loss: 0.2161
Epoch [1/20], Step [592/627], Loss: 0.6654
Epoch [1/20], Step [593/627], Loss: 0.5663
Epoch [1/20], Step [594/627], Loss: 0.3167
Epoch [1/20], Step [595/627], Loss: 0.4088
Epoch [1/20], Step [596/627], Loss: 0.4825
Epoch [1/20], Step [597/627], Loss: 0.4366
Epoch [1/20], Step [598/627], Loss: 0.3414
Epoch [1/20], Step [599/627], Loss: 0.3909
Epoch [1/20], Step [600/627], Loss: 0.2245
Epoch [1/20], Step [601/627], Loss: 0.7655
Epoch [1/20], Step [602/627], Loss: 1.6613
Epoch [1/20], Step [603/627], Loss: 0.2568
Epoch [1/20], Step [604/627], Loss: 0.4675
Epoch [1/20], Step [605/627], Loss: 0.6812
Epoch [1/20], Step [606/627], Loss: 0.3536
Epoch [1/20], Step [607/627], Loss: 0.3507
Epoch [1/20

Epoch [2/20], Step [150/627], Loss: 0.5188
Epoch [2/20], Step [151/627], Loss: 0.2279
Epoch [2/20], Step [152/627], Loss: 0.7949
Epoch [2/20], Step [153/627], Loss: 0.5608
Epoch [2/20], Step [154/627], Loss: 0.3271
Epoch [2/20], Step [155/627], Loss: 0.7572
Epoch [2/20], Step [156/627], Loss: 0.6748
Epoch [2/20], Step [157/627], Loss: 0.5816
Epoch [2/20], Step [158/627], Loss: 0.2190
Epoch [2/20], Step [159/627], Loss: 0.6624
Epoch [2/20], Step [160/627], Loss: 0.6138
Epoch [2/20], Step [161/627], Loss: 0.8242
Epoch [2/20], Step [162/627], Loss: 0.3301
Epoch [2/20], Step [163/627], Loss: 0.2854
Epoch [2/20], Step [164/627], Loss: 0.5950
Epoch [2/20], Step [165/627], Loss: 1.2367
Epoch [2/20], Step [166/627], Loss: 0.4674
Epoch [2/20], Step [167/627], Loss: 0.4415
Epoch [2/20], Step [168/627], Loss: 0.5765
Epoch [2/20], Step [169/627], Loss: 0.6912
Epoch [2/20], Step [170/627], Loss: 0.3529
Epoch [2/20], Step [171/627], Loss: 0.3115
Epoch [2/20], Step [172/627], Loss: 1.1553
Epoch [2/20

Epoch [2/20], Step [345/627], Loss: 0.3980
Epoch [2/20], Step [346/627], Loss: 0.5261
Epoch [2/20], Step [347/627], Loss: 0.2630
Epoch [2/20], Step [348/627], Loss: 0.5232
Epoch [2/20], Step [349/627], Loss: 0.7561
Epoch [2/20], Step [350/627], Loss: 0.5067
Epoch [2/20], Step [351/627], Loss: 0.9999
Epoch [2/20], Step [352/627], Loss: 0.3808
Epoch [2/20], Step [353/627], Loss: 0.8227
Epoch [2/20], Step [354/627], Loss: 0.4197
Epoch [2/20], Step [355/627], Loss: 0.7055
Epoch [2/20], Step [356/627], Loss: 0.3647
Epoch [2/20], Step [357/627], Loss: 0.4493
Epoch [2/20], Step [358/627], Loss: 0.6495
Epoch [2/20], Step [359/627], Loss: 0.3596
Epoch [2/20], Step [360/627], Loss: 0.8021
Epoch [2/20], Step [361/627], Loss: 0.4741
Epoch [2/20], Step [362/627], Loss: 0.5823
Epoch [2/20], Step [363/627], Loss: 0.8156
Epoch [2/20], Step [364/627], Loss: 0.4922
Epoch [2/20], Step [365/627], Loss: 0.9637
Epoch [2/20], Step [366/627], Loss: 1.0748
Epoch [2/20], Step [367/627], Loss: 0.4331
Epoch [2/20

Epoch [2/20], Step [540/627], Loss: 0.4131
Epoch [2/20], Step [541/627], Loss: 0.3385
Epoch [2/20], Step [542/627], Loss: 0.1556
Epoch [2/20], Step [543/627], Loss: 0.6628
Epoch [2/20], Step [544/627], Loss: 0.6267
Epoch [2/20], Step [545/627], Loss: 0.6234
Epoch [2/20], Step [546/627], Loss: 0.5203
Epoch [2/20], Step [547/627], Loss: 0.4736
Epoch [2/20], Step [548/627], Loss: 0.9809
Epoch [2/20], Step [549/627], Loss: 0.7071
Epoch [2/20], Step [550/627], Loss: 0.3379
Epoch [2/20], Step [551/627], Loss: 0.3445
Epoch [2/20], Step [552/627], Loss: 0.7577
Epoch [2/20], Step [553/627], Loss: 0.3677
Epoch [2/20], Step [554/627], Loss: 0.3366
Epoch [2/20], Step [555/627], Loss: 0.9879
Epoch [2/20], Step [556/627], Loss: 0.4350
Epoch [2/20], Step [557/627], Loss: 0.8844
Epoch [2/20], Step [558/627], Loss: 0.2053
Epoch [2/20], Step [559/627], Loss: 0.4493
Epoch [2/20], Step [560/627], Loss: 0.5241
Epoch [2/20], Step [561/627], Loss: 0.9664
Epoch [2/20], Step [562/627], Loss: 0.5783
Epoch [2/20

Epoch [3/20], Step [111/627], Loss: 0.5618
Epoch [3/20], Step [112/627], Loss: 0.5032
Epoch [3/20], Step [113/627], Loss: 0.5929
Epoch [3/20], Step [114/627], Loss: 0.6333
Epoch [3/20], Step [115/627], Loss: 0.9562
Epoch [3/20], Step [116/627], Loss: 0.7600
Epoch [3/20], Step [117/627], Loss: 0.6919
Epoch [3/20], Step [118/627], Loss: 0.5753
Epoch [3/20], Step [119/627], Loss: 0.3907
Epoch [3/20], Step [120/627], Loss: 0.5913
Epoch [3/20], Step [121/627], Loss: 0.4108
Epoch [3/20], Step [122/627], Loss: 0.5137
Epoch [3/20], Step [123/627], Loss: 0.5379
Epoch [3/20], Step [124/627], Loss: 0.3693
Epoch [3/20], Step [125/627], Loss: 0.2334
Epoch [3/20], Step [126/627], Loss: 0.2434
Epoch [3/20], Step [127/627], Loss: 0.3291
Epoch [3/20], Step [128/627], Loss: 0.5878
Epoch [3/20], Step [129/627], Loss: 0.8672
Epoch [3/20], Step [130/627], Loss: 0.5850
Epoch [3/20], Step [131/627], Loss: 0.6562
Epoch [3/20], Step [132/627], Loss: 0.6517
Epoch [3/20], Step [133/627], Loss: 0.9397
Epoch [3/20

Epoch [3/20], Step [306/627], Loss: 0.5488
Epoch [3/20], Step [307/627], Loss: 0.3955
Epoch [3/20], Step [308/627], Loss: 0.7494
Epoch [3/20], Step [309/627], Loss: 0.3452
Epoch [3/20], Step [310/627], Loss: 0.8352
Epoch [3/20], Step [311/627], Loss: 0.2353
Epoch [3/20], Step [312/627], Loss: 0.3482
Epoch [3/20], Step [313/627], Loss: 0.7363
Epoch [3/20], Step [314/627], Loss: 0.4444
Epoch [3/20], Step [315/627], Loss: 0.2762
Epoch [3/20], Step [316/627], Loss: 0.4066
Epoch [3/20], Step [317/627], Loss: 0.3322
Epoch [3/20], Step [318/627], Loss: 0.3446
Epoch [3/20], Step [319/627], Loss: 0.8125
Epoch [3/20], Step [320/627], Loss: 0.4564
Epoch [3/20], Step [321/627], Loss: 0.2569
Epoch [3/20], Step [322/627], Loss: 0.4093
Epoch [3/20], Step [323/627], Loss: 0.6853
Epoch [3/20], Step [324/627], Loss: 0.3588
Epoch [3/20], Step [325/627], Loss: 0.3194
Epoch [3/20], Step [326/627], Loss: 0.6385
Epoch [3/20], Step [327/627], Loss: 0.3636
Epoch [3/20], Step [328/627], Loss: 1.3490
Epoch [3/20

Epoch [3/20], Step [501/627], Loss: 0.7040
Epoch [3/20], Step [502/627], Loss: 0.3867
Epoch [3/20], Step [503/627], Loss: 0.3413
Epoch [3/20], Step [504/627], Loss: 0.3729
Epoch [3/20], Step [505/627], Loss: 0.5646
Epoch [3/20], Step [506/627], Loss: 0.2231
Epoch [3/20], Step [507/627], Loss: 1.0353
Epoch [3/20], Step [508/627], Loss: 1.0001
Epoch [3/20], Step [509/627], Loss: 0.1414
Epoch [3/20], Step [510/627], Loss: 0.5096
Epoch [3/20], Step [511/627], Loss: 0.7331
Epoch [3/20], Step [512/627], Loss: 0.3499
Epoch [3/20], Step [513/627], Loss: 0.8506
Epoch [3/20], Step [514/627], Loss: 0.3040
Epoch [3/20], Step [515/627], Loss: 0.3483
Epoch [3/20], Step [516/627], Loss: 1.0198
Epoch [3/20], Step [517/627], Loss: 0.7053
Epoch [3/20], Step [518/627], Loss: 0.6882
Epoch [3/20], Step [519/627], Loss: 0.2509
Epoch [3/20], Step [520/627], Loss: 0.6764
Epoch [3/20], Step [521/627], Loss: 0.3289
Epoch [3/20], Step [522/627], Loss: 0.7293
Epoch [3/20], Step [523/627], Loss: 0.6359
Epoch [3/20

Epoch [4/20], Step [71/627], Loss: 0.1149
Epoch [4/20], Step [72/627], Loss: 0.8059
Epoch [4/20], Step [73/627], Loss: 0.3440
Epoch [4/20], Step [74/627], Loss: 0.2970
Epoch [4/20], Step [75/627], Loss: 0.4110
Epoch [4/20], Step [76/627], Loss: 0.8999
Epoch [4/20], Step [77/627], Loss: 0.4017
Epoch [4/20], Step [78/627], Loss: 0.6372
Epoch [4/20], Step [79/627], Loss: 0.6637
Epoch [4/20], Step [80/627], Loss: 0.5995
Epoch [4/20], Step [81/627], Loss: 0.5990
Epoch [4/20], Step [82/627], Loss: 0.3578
Epoch [4/20], Step [83/627], Loss: 0.2933
Epoch [4/20], Step [84/627], Loss: 0.4550
Epoch [4/20], Step [85/627], Loss: 0.2791
Epoch [4/20], Step [86/627], Loss: 0.2869
Epoch [4/20], Step [87/627], Loss: 0.6978
Epoch [4/20], Step [88/627], Loss: 0.6277
Epoch [4/20], Step [89/627], Loss: 0.2211
Epoch [4/20], Step [90/627], Loss: 0.3115
Epoch [4/20], Step [91/627], Loss: 0.6109
Epoch [4/20], Step [92/627], Loss: 0.7408
Epoch [4/20], Step [93/627], Loss: 0.9659
Epoch [4/20], Step [94/627], Loss:

Epoch [4/20], Step [266/627], Loss: 0.7592
Epoch [4/20], Step [267/627], Loss: 0.3916
Epoch [4/20], Step [268/627], Loss: 1.0166
Epoch [4/20], Step [269/627], Loss: 0.3917
Epoch [4/20], Step [270/627], Loss: 0.4627
Epoch [4/20], Step [271/627], Loss: 0.6702
Epoch [4/20], Step [272/627], Loss: 0.5160
Epoch [4/20], Step [273/627], Loss: 0.2786
Epoch [4/20], Step [274/627], Loss: 0.3475
Epoch [4/20], Step [275/627], Loss: 0.4048
Epoch [4/20], Step [276/627], Loss: 0.8322
Epoch [4/20], Step [277/627], Loss: 0.3223
Epoch [4/20], Step [278/627], Loss: 0.2560
Epoch [4/20], Step [279/627], Loss: 0.3237
Epoch [4/20], Step [280/627], Loss: 0.6341
Epoch [4/20], Step [281/627], Loss: 0.5879
Epoch [4/20], Step [282/627], Loss: 0.2357
Epoch [4/20], Step [283/627], Loss: 0.7985
Epoch [4/20], Step [284/627], Loss: 0.3443
Epoch [4/20], Step [285/627], Loss: 0.5032
Epoch [4/20], Step [286/627], Loss: 0.3413
Epoch [4/20], Step [287/627], Loss: 0.4459
Epoch [4/20], Step [288/627], Loss: 0.4116
Epoch [4/20

Epoch [4/20], Step [461/627], Loss: 0.2090
Epoch [4/20], Step [462/627], Loss: 0.1108
Epoch [4/20], Step [463/627], Loss: 0.2738
Epoch [4/20], Step [464/627], Loss: 0.3053
Epoch [4/20], Step [465/627], Loss: 0.6423
Epoch [4/20], Step [466/627], Loss: 0.2091
Epoch [4/20], Step [467/627], Loss: 0.2839
Epoch [4/20], Step [468/627], Loss: 0.6534
Epoch [4/20], Step [469/627], Loss: 0.5115
Epoch [4/20], Step [470/627], Loss: 0.5090
Epoch [4/20], Step [471/627], Loss: 0.3308
Epoch [4/20], Step [472/627], Loss: 0.1823
Epoch [4/20], Step [473/627], Loss: 0.3286
Epoch [4/20], Step [474/627], Loss: 0.2465
Epoch [4/20], Step [475/627], Loss: 0.3128
Epoch [4/20], Step [476/627], Loss: 0.1618
Epoch [4/20], Step [477/627], Loss: 0.8483
Epoch [4/20], Step [478/627], Loss: 0.2366
Epoch [4/20], Step [479/627], Loss: 0.6529
Epoch [4/20], Step [480/627], Loss: 0.4774
Epoch [4/20], Step [481/627], Loss: 0.5284
Epoch [4/20], Step [482/627], Loss: 0.4514
Epoch [4/20], Step [483/627], Loss: 0.2597
Epoch [4/20

Epoch [5/20], Step [26/627], Loss: 0.3965
Epoch [5/20], Step [27/627], Loss: 0.5719
Epoch [5/20], Step [28/627], Loss: 0.5304
Epoch [5/20], Step [29/627], Loss: 0.1883
Epoch [5/20], Step [30/627], Loss: 0.3381
Epoch [5/20], Step [31/627], Loss: 0.4265
Epoch [5/20], Step [32/627], Loss: 0.2711
Epoch [5/20], Step [33/627], Loss: 0.2625
Epoch [5/20], Step [34/627], Loss: 0.1111
Epoch [5/20], Step [35/627], Loss: 0.3823
Epoch [5/20], Step [36/627], Loss: 0.6196
Epoch [5/20], Step [37/627], Loss: 0.3872
Epoch [5/20], Step [38/627], Loss: 0.3755
Epoch [5/20], Step [39/627], Loss: 0.2138
Epoch [5/20], Step [40/627], Loss: 0.6944
Epoch [5/20], Step [41/627], Loss: 0.7416
Epoch [5/20], Step [42/627], Loss: 0.6635
Epoch [5/20], Step [43/627], Loss: 0.2608
Epoch [5/20], Step [44/627], Loss: 0.9483
Epoch [5/20], Step [45/627], Loss: 0.5351
Epoch [5/20], Step [46/627], Loss: 0.6190
Epoch [5/20], Step [47/627], Loss: 0.3174
Epoch [5/20], Step [48/627], Loss: 0.2964
Epoch [5/20], Step [49/627], Loss:

Epoch [5/20], Step [221/627], Loss: 0.3809
Epoch [5/20], Step [222/627], Loss: 0.2444
Epoch [5/20], Step [223/627], Loss: 0.2507
Epoch [5/20], Step [224/627], Loss: 0.4734
Epoch [5/20], Step [225/627], Loss: 0.2122
Epoch [5/20], Step [226/627], Loss: 0.1040
Epoch [5/20], Step [227/627], Loss: 0.3669
Epoch [5/20], Step [228/627], Loss: 0.1510
Epoch [5/20], Step [229/627], Loss: 0.4135
Epoch [5/20], Step [230/627], Loss: 0.4370
Epoch [5/20], Step [231/627], Loss: 0.4757
Epoch [5/20], Step [232/627], Loss: 0.8129
Epoch [5/20], Step [233/627], Loss: 0.3279
Epoch [5/20], Step [234/627], Loss: 0.2604
Epoch [5/20], Step [235/627], Loss: 0.6432
Epoch [5/20], Step [236/627], Loss: 0.1753
Epoch [5/20], Step [237/627], Loss: 0.6606
Epoch [5/20], Step [238/627], Loss: 0.2022
Epoch [5/20], Step [239/627], Loss: 0.6184
Epoch [5/20], Step [240/627], Loss: 0.1755
Epoch [5/20], Step [241/627], Loss: 0.1661
Epoch [5/20], Step [242/627], Loss: 0.4327
Epoch [5/20], Step [243/627], Loss: 0.7076
Epoch [5/20

Epoch [5/20], Step [416/627], Loss: 0.3833
Epoch [5/20], Step [417/627], Loss: 0.6777
Epoch [5/20], Step [418/627], Loss: 0.3595
Epoch [5/20], Step [419/627], Loss: 0.2162
Epoch [5/20], Step [420/627], Loss: 0.2987
Epoch [5/20], Step [421/627], Loss: 0.5061
Epoch [5/20], Step [422/627], Loss: 0.3747
Epoch [5/20], Step [423/627], Loss: 0.3612
Epoch [5/20], Step [424/627], Loss: 0.4489
Epoch [5/20], Step [425/627], Loss: 0.5798
Epoch [5/20], Step [426/627], Loss: 0.2955
Epoch [5/20], Step [427/627], Loss: 0.2834
Epoch [5/20], Step [428/627], Loss: 0.2266
Epoch [5/20], Step [429/627], Loss: 0.4575
Epoch [5/20], Step [430/627], Loss: 0.4105
Epoch [5/20], Step [431/627], Loss: 0.3208
Epoch [5/20], Step [432/627], Loss: 0.4653
Epoch [5/20], Step [433/627], Loss: 0.4243
Epoch [5/20], Step [434/627], Loss: 0.7523
Epoch [5/20], Step [435/627], Loss: 0.5690
Epoch [5/20], Step [436/627], Loss: 0.8291
Epoch [5/20], Step [437/627], Loss: 0.3685
Epoch [5/20], Step [438/627], Loss: 0.6755
Epoch [5/20

Epoch [5/20], Step [611/627], Loss: 0.6038
Epoch [5/20], Step [612/627], Loss: 0.5293
Epoch [5/20], Step [613/627], Loss: 0.2016
Epoch [5/20], Step [614/627], Loss: 0.3773
Epoch [5/20], Step [615/627], Loss: 0.2807
Epoch [5/20], Step [616/627], Loss: 0.3400
Epoch [5/20], Step [617/627], Loss: 0.1995
Epoch [5/20], Step [618/627], Loss: 0.1751
Epoch [5/20], Step [619/627], Loss: 0.1978
Epoch [5/20], Step [620/627], Loss: 0.3440
Epoch [5/20], Step [621/627], Loss: 0.4502
Epoch [5/20], Step [622/627], Loss: 0.2231
Epoch [5/20], Step [623/627], Loss: 0.5023
Epoch [5/20], Step [624/627], Loss: 0.1957
Epoch [5/20], Step [625/627], Loss: 0.5639
Epoch [5/20], Step [626/627], Loss: 0.8419
Epoch [5/20], Step [627/627], Loss: 0.2373
rmse improved at epoch  5 ; best_mse,best_ci,best_r: 0.9052509167615512 0.7213496019957586 0.42482394936808665
Epoch [6/20], Step [1/627], Loss: 0.2939
Epoch [6/20], Step [2/627], Loss: 0.2061
Epoch [6/20], Step [3/627], Loss: 0.4002
Epoch [6/20], Step [4/627], Loss: 0

Epoch [6/20], Step [175/627], Loss: 0.4101
Epoch [6/20], Step [176/627], Loss: 0.6421
Epoch [6/20], Step [177/627], Loss: 0.3586
Epoch [6/20], Step [178/627], Loss: 0.3961
Epoch [6/20], Step [179/627], Loss: 0.3011
Epoch [6/20], Step [180/627], Loss: 0.4540
Epoch [6/20], Step [181/627], Loss: 1.0333
Epoch [6/20], Step [182/627], Loss: 0.3076
Epoch [6/20], Step [183/627], Loss: 0.6520
Epoch [6/20], Step [184/627], Loss: 0.3247
Epoch [6/20], Step [185/627], Loss: 0.5061
Epoch [6/20], Step [186/627], Loss: 0.1884
Epoch [6/20], Step [187/627], Loss: 0.3855
Epoch [6/20], Step [188/627], Loss: 0.2906
Epoch [6/20], Step [189/627], Loss: 0.2921
Epoch [6/20], Step [190/627], Loss: 0.5567
Epoch [6/20], Step [191/627], Loss: 0.2343
Epoch [6/20], Step [192/627], Loss: 0.2738
Epoch [6/20], Step [193/627], Loss: 0.2606
Epoch [6/20], Step [194/627], Loss: 0.2398
Epoch [6/20], Step [195/627], Loss: 0.3356
Epoch [6/20], Step [196/627], Loss: 0.6721
Epoch [6/20], Step [197/627], Loss: 0.5427
Epoch [6/20

Epoch [6/20], Step [370/627], Loss: 0.2939
Epoch [6/20], Step [371/627], Loss: 0.4961
Epoch [6/20], Step [372/627], Loss: 0.7053
Epoch [6/20], Step [373/627], Loss: 0.2940
Epoch [6/20], Step [374/627], Loss: 0.1214
Epoch [6/20], Step [375/627], Loss: 0.2642
Epoch [6/20], Step [376/627], Loss: 0.6693
Epoch [6/20], Step [377/627], Loss: 0.1566
Epoch [6/20], Step [378/627], Loss: 0.2284
Epoch [6/20], Step [379/627], Loss: 0.1407
Epoch [6/20], Step [380/627], Loss: 0.2854
Epoch [6/20], Step [381/627], Loss: 0.3346
Epoch [6/20], Step [382/627], Loss: 0.9449
Epoch [6/20], Step [383/627], Loss: 0.2726
Epoch [6/20], Step [384/627], Loss: 0.1866
Epoch [6/20], Step [385/627], Loss: 0.8904
Epoch [6/20], Step [386/627], Loss: 0.5389
Epoch [6/20], Step [387/627], Loss: 0.5015
Epoch [6/20], Step [388/627], Loss: 0.3590
Epoch [6/20], Step [389/627], Loss: 0.5242
Epoch [6/20], Step [390/627], Loss: 0.5160
Epoch [6/20], Step [391/627], Loss: 0.3087
Epoch [6/20], Step [392/627], Loss: 0.1553
Epoch [6/20

Epoch [6/20], Step [565/627], Loss: 0.3810
Epoch [6/20], Step [566/627], Loss: 0.9800
Epoch [6/20], Step [567/627], Loss: 0.5328
Epoch [6/20], Step [568/627], Loss: 0.8534
Epoch [6/20], Step [569/627], Loss: 0.4814
Epoch [6/20], Step [570/627], Loss: 0.7126
Epoch [6/20], Step [571/627], Loss: 0.3994
Epoch [6/20], Step [572/627], Loss: 0.7577
Epoch [6/20], Step [573/627], Loss: 0.4356
Epoch [6/20], Step [574/627], Loss: 0.6460
Epoch [6/20], Step [575/627], Loss: 0.3231
Epoch [6/20], Step [576/627], Loss: 0.4151
Epoch [6/20], Step [577/627], Loss: 0.2964
Epoch [6/20], Step [578/627], Loss: 0.1742
Epoch [6/20], Step [579/627], Loss: 0.4269
Epoch [6/20], Step [580/627], Loss: 0.2715
Epoch [6/20], Step [581/627], Loss: 0.1375
Epoch [6/20], Step [582/627], Loss: 0.5587
Epoch [6/20], Step [583/627], Loss: 0.2982
Epoch [6/20], Step [584/627], Loss: 0.2727
Epoch [6/20], Step [585/627], Loss: 0.1748
Epoch [6/20], Step [586/627], Loss: 0.2548
Epoch [6/20], Step [587/627], Loss: 0.3597
Epoch [6/20

Epoch [7/20], Step [136/627], Loss: 0.9333
Epoch [7/20], Step [137/627], Loss: 0.4584
Epoch [7/20], Step [138/627], Loss: 0.2304
Epoch [7/20], Step [139/627], Loss: 0.3473
Epoch [7/20], Step [140/627], Loss: 0.1484
Epoch [7/20], Step [141/627], Loss: 0.2034
Epoch [7/20], Step [142/627], Loss: 0.1433
Epoch [7/20], Step [143/627], Loss: 0.0956
Epoch [7/20], Step [144/627], Loss: 0.3161
Epoch [7/20], Step [145/627], Loss: 0.2997
Epoch [7/20], Step [146/627], Loss: 0.1479
Epoch [7/20], Step [147/627], Loss: 0.1996
Epoch [7/20], Step [148/627], Loss: 0.5298
Epoch [7/20], Step [149/627], Loss: 0.7220
Epoch [7/20], Step [150/627], Loss: 0.4440
Epoch [7/20], Step [151/627], Loss: 0.5456
Epoch [7/20], Step [152/627], Loss: 0.4192
Epoch [7/20], Step [153/627], Loss: 0.2815
Epoch [7/20], Step [154/627], Loss: 0.5386
Epoch [7/20], Step [155/627], Loss: 0.4136
Epoch [7/20], Step [156/627], Loss: 0.4373
Epoch [7/20], Step [157/627], Loss: 0.4729
Epoch [7/20], Step [158/627], Loss: 0.2274
Epoch [7/20

Epoch [7/20], Step [331/627], Loss: 0.2734
Epoch [7/20], Step [332/627], Loss: 0.1627
Epoch [7/20], Step [333/627], Loss: 0.5500
Epoch [7/20], Step [334/627], Loss: 0.7394
Epoch [7/20], Step [335/627], Loss: 0.1800
Epoch [7/20], Step [336/627], Loss: 0.3064
Epoch [7/20], Step [337/627], Loss: 0.2017
Epoch [7/20], Step [338/627], Loss: 0.2142
Epoch [7/20], Step [339/627], Loss: 0.2392
Epoch [7/20], Step [340/627], Loss: 0.2194
Epoch [7/20], Step [341/627], Loss: 0.2463
Epoch [7/20], Step [342/627], Loss: 0.6198
Epoch [7/20], Step [343/627], Loss: 0.2466
Epoch [7/20], Step [344/627], Loss: 0.3738
Epoch [7/20], Step [345/627], Loss: 0.2893
Epoch [7/20], Step [346/627], Loss: 0.6127
Epoch [7/20], Step [347/627], Loss: 0.4370
Epoch [7/20], Step [348/627], Loss: 0.4242
Epoch [7/20], Step [349/627], Loss: 0.3590
Epoch [7/20], Step [350/627], Loss: 0.5265
Epoch [7/20], Step [351/627], Loss: 0.5032
Epoch [7/20], Step [352/627], Loss: 0.2245
Epoch [7/20], Step [353/627], Loss: 0.8102
Epoch [7/20

Epoch [7/20], Step [526/627], Loss: 0.2979
Epoch [7/20], Step [527/627], Loss: 0.3412
Epoch [7/20], Step [528/627], Loss: 0.3910
Epoch [7/20], Step [529/627], Loss: 0.2656
Epoch [7/20], Step [530/627], Loss: 0.2284
Epoch [7/20], Step [531/627], Loss: 0.2099
Epoch [7/20], Step [532/627], Loss: 0.5434
Epoch [7/20], Step [533/627], Loss: 0.6413
Epoch [7/20], Step [534/627], Loss: 0.2596
Epoch [7/20], Step [535/627], Loss: 0.5113
Epoch [7/20], Step [536/627], Loss: 0.1875
Epoch [7/20], Step [537/627], Loss: 0.4869
Epoch [7/20], Step [538/627], Loss: 0.3762
Epoch [7/20], Step [539/627], Loss: 0.2831
Epoch [7/20], Step [540/627], Loss: 0.3833
Epoch [7/20], Step [541/627], Loss: 0.3656
Epoch [7/20], Step [542/627], Loss: 0.6727
Epoch [7/20], Step [543/627], Loss: 0.6818
Epoch [7/20], Step [544/627], Loss: 0.3125
Epoch [7/20], Step [545/627], Loss: 0.2677
Epoch [7/20], Step [546/627], Loss: 0.2563
Epoch [7/20], Step [547/627], Loss: 0.4878
Epoch [7/20], Step [548/627], Loss: 0.6898
Epoch [7/20

Epoch [8/20], Step [96/627], Loss: 0.1804
Epoch [8/20], Step [97/627], Loss: 0.3962
Epoch [8/20], Step [98/627], Loss: 0.3702
Epoch [8/20], Step [99/627], Loss: 0.3238
Epoch [8/20], Step [100/627], Loss: 0.6579
Epoch [8/20], Step [101/627], Loss: 0.3439
Epoch [8/20], Step [102/627], Loss: 0.5551
Epoch [8/20], Step [103/627], Loss: 0.4327
Epoch [8/20], Step [104/627], Loss: 0.3343
Epoch [8/20], Step [105/627], Loss: 0.7643
Epoch [8/20], Step [106/627], Loss: 0.2834
Epoch [8/20], Step [107/627], Loss: 0.1708
Epoch [8/20], Step [108/627], Loss: 0.4478
Epoch [8/20], Step [109/627], Loss: 0.3541
Epoch [8/20], Step [110/627], Loss: 0.1165
Epoch [8/20], Step [111/627], Loss: 0.2916
Epoch [8/20], Step [112/627], Loss: 0.2558
Epoch [8/20], Step [113/627], Loss: 0.1837
Epoch [8/20], Step [114/627], Loss: 0.2294
Epoch [8/20], Step [115/627], Loss: 0.6193
Epoch [8/20], Step [116/627], Loss: 0.4309
Epoch [8/20], Step [117/627], Loss: 0.3773
Epoch [8/20], Step [118/627], Loss: 0.3133
Epoch [8/20], S

Epoch [8/20], Step [291/627], Loss: 0.1842
Epoch [8/20], Step [292/627], Loss: 0.6890
Epoch [8/20], Step [293/627], Loss: 0.6621
Epoch [8/20], Step [294/627], Loss: 0.4616
Epoch [8/20], Step [295/627], Loss: 0.4022
Epoch [8/20], Step [296/627], Loss: 0.4136
Epoch [8/20], Step [297/627], Loss: 0.3095
Epoch [8/20], Step [298/627], Loss: 0.5194
Epoch [8/20], Step [299/627], Loss: 0.1138
Epoch [8/20], Step [300/627], Loss: 0.2452
Epoch [8/20], Step [301/627], Loss: 0.4602
Epoch [8/20], Step [302/627], Loss: 0.0984
Epoch [8/20], Step [303/627], Loss: 0.1912
Epoch [8/20], Step [304/627], Loss: 0.1308
Epoch [8/20], Step [305/627], Loss: 0.2206
Epoch [8/20], Step [306/627], Loss: 0.2545
Epoch [8/20], Step [307/627], Loss: 0.2889
Epoch [8/20], Step [308/627], Loss: 0.1963
Epoch [8/20], Step [309/627], Loss: 0.2107
Epoch [8/20], Step [310/627], Loss: 0.2247
Epoch [8/20], Step [311/627], Loss: 0.4964
Epoch [8/20], Step [312/627], Loss: 0.2268
Epoch [8/20], Step [313/627], Loss: 0.2168
Epoch [8/20

Epoch [8/20], Step [486/627], Loss: 0.7387
Epoch [8/20], Step [487/627], Loss: 0.2521
Epoch [8/20], Step [488/627], Loss: 0.2967
Epoch [8/20], Step [489/627], Loss: 0.2857
Epoch [8/20], Step [490/627], Loss: 0.4595
Epoch [8/20], Step [491/627], Loss: 0.5418
Epoch [8/20], Step [492/627], Loss: 0.3212
Epoch [8/20], Step [493/627], Loss: 0.1866
Epoch [8/20], Step [494/627], Loss: 0.1645
Epoch [8/20], Step [495/627], Loss: 0.3065
Epoch [8/20], Step [496/627], Loss: 0.2469
Epoch [8/20], Step [497/627], Loss: 0.7230
Epoch [8/20], Step [498/627], Loss: 0.2164
Epoch [8/20], Step [499/627], Loss: 0.3209
Epoch [8/20], Step [500/627], Loss: 0.1594
Epoch [8/20], Step [501/627], Loss: 0.3540
Epoch [8/20], Step [502/627], Loss: 0.2151
Epoch [8/20], Step [503/627], Loss: 0.2883
Epoch [8/20], Step [504/627], Loss: 0.4263
Epoch [8/20], Step [505/627], Loss: 0.1539
Epoch [8/20], Step [506/627], Loss: 0.2404
Epoch [8/20], Step [507/627], Loss: 0.2070
Epoch [8/20], Step [508/627], Loss: 0.2892
Epoch [8/20

Epoch [9/20], Step [51/627], Loss: 0.4786
Epoch [9/20], Step [52/627], Loss: 0.7540
Epoch [9/20], Step [53/627], Loss: 0.3866
Epoch [9/20], Step [54/627], Loss: 0.2512
Epoch [9/20], Step [55/627], Loss: 0.2492
Epoch [9/20], Step [56/627], Loss: 0.3797
Epoch [9/20], Step [57/627], Loss: 0.4793
Epoch [9/20], Step [58/627], Loss: 0.2438
Epoch [9/20], Step [59/627], Loss: 0.3071
Epoch [9/20], Step [60/627], Loss: 0.2422
Epoch [9/20], Step [61/627], Loss: 0.1835
Epoch [9/20], Step [62/627], Loss: 0.2235
Epoch [9/20], Step [63/627], Loss: 0.2347
Epoch [9/20], Step [64/627], Loss: 0.2249
Epoch [9/20], Step [65/627], Loss: 0.5284
Epoch [9/20], Step [66/627], Loss: 0.2081
Epoch [9/20], Step [67/627], Loss: 0.3131
Epoch [9/20], Step [68/627], Loss: 0.2882
Epoch [9/20], Step [69/627], Loss: 0.1775
Epoch [9/20], Step [70/627], Loss: 0.2824
Epoch [9/20], Step [71/627], Loss: 0.3014
Epoch [9/20], Step [72/627], Loss: 0.2994
Epoch [9/20], Step [73/627], Loss: 0.3261
Epoch [9/20], Step [74/627], Loss:

Epoch [9/20], Step [246/627], Loss: 0.6425
Epoch [9/20], Step [247/627], Loss: 0.3998
Epoch [9/20], Step [248/627], Loss: 0.2868
Epoch [9/20], Step [249/627], Loss: 0.7012
Epoch [9/20], Step [250/627], Loss: 0.2608
Epoch [9/20], Step [251/627], Loss: 0.1474
Epoch [9/20], Step [252/627], Loss: 0.5186
Epoch [9/20], Step [253/627], Loss: 0.6659
Epoch [9/20], Step [254/627], Loss: 0.1818
Epoch [9/20], Step [255/627], Loss: 0.1071
Epoch [9/20], Step [256/627], Loss: 0.1373
Epoch [9/20], Step [257/627], Loss: 0.1792
Epoch [9/20], Step [258/627], Loss: 0.1340
Epoch [9/20], Step [259/627], Loss: 0.2316
Epoch [9/20], Step [260/627], Loss: 0.0811
Epoch [9/20], Step [261/627], Loss: 0.2939
Epoch [9/20], Step [262/627], Loss: 0.1000
Epoch [9/20], Step [263/627], Loss: 0.4349
Epoch [9/20], Step [264/627], Loss: 0.2934
Epoch [9/20], Step [265/627], Loss: 0.1802
Epoch [9/20], Step [266/627], Loss: 0.5722
Epoch [9/20], Step [267/627], Loss: 0.2879
Epoch [9/20], Step [268/627], Loss: 0.5672
Epoch [9/20

Epoch [9/20], Step [441/627], Loss: 0.1655
Epoch [9/20], Step [442/627], Loss: 0.4313
Epoch [9/20], Step [443/627], Loss: 0.2330
Epoch [9/20], Step [444/627], Loss: 0.3840
Epoch [9/20], Step [445/627], Loss: 0.1467
Epoch [9/20], Step [446/627], Loss: 0.3174
Epoch [9/20], Step [447/627], Loss: 0.7705
Epoch [9/20], Step [448/627], Loss: 0.4140
Epoch [9/20], Step [449/627], Loss: 0.1216
Epoch [9/20], Step [450/627], Loss: 0.4402
Epoch [9/20], Step [451/627], Loss: 0.4224
Epoch [9/20], Step [452/627], Loss: 0.2378
Epoch [9/20], Step [453/627], Loss: 0.2423
Epoch [9/20], Step [454/627], Loss: 0.9525
Epoch [9/20], Step [455/627], Loss: 0.2122
Epoch [9/20], Step [456/627], Loss: 0.2334
Epoch [9/20], Step [457/627], Loss: 0.1086
Epoch [9/20], Step [458/627], Loss: 0.5551
Epoch [9/20], Step [459/627], Loss: 0.1481
Epoch [9/20], Step [460/627], Loss: 0.4971
Epoch [9/20], Step [461/627], Loss: 0.2200
Epoch [9/20], Step [462/627], Loss: 0.2248
Epoch [9/20], Step [463/627], Loss: 0.1039
Epoch [9/20

Epoch [10/20], Step [5/627], Loss: 0.2342
Epoch [10/20], Step [6/627], Loss: 0.1791
Epoch [10/20], Step [7/627], Loss: 0.3813
Epoch [10/20], Step [8/627], Loss: 0.4318
Epoch [10/20], Step [9/627], Loss: 0.3212
Epoch [10/20], Step [10/627], Loss: 0.3060
Epoch [10/20], Step [11/627], Loss: 0.1855
Epoch [10/20], Step [12/627], Loss: 0.1574
Epoch [10/20], Step [13/627], Loss: 0.2476
Epoch [10/20], Step [14/627], Loss: 0.0819
Epoch [10/20], Step [15/627], Loss: 0.2732
Epoch [10/20], Step [16/627], Loss: 0.1872
Epoch [10/20], Step [17/627], Loss: 0.1856
Epoch [10/20], Step [18/627], Loss: 0.2181
Epoch [10/20], Step [19/627], Loss: 0.1170
Epoch [10/20], Step [20/627], Loss: 0.2182
Epoch [10/20], Step [21/627], Loss: 0.0874
Epoch [10/20], Step [22/627], Loss: 0.3385
Epoch [10/20], Step [23/627], Loss: 0.2015
Epoch [10/20], Step [24/627], Loss: 0.1109
Epoch [10/20], Step [25/627], Loss: 0.1133
Epoch [10/20], Step [26/627], Loss: 0.1913
Epoch [10/20], Step [27/627], Loss: 0.1517
Epoch [10/20], S

Epoch [10/20], Step [195/627], Loss: 1.7117
Epoch [10/20], Step [196/627], Loss: 0.2035
Epoch [10/20], Step [197/627], Loss: 0.0747
Epoch [10/20], Step [198/627], Loss: 0.1694
Epoch [10/20], Step [199/627], Loss: 0.1679
Epoch [10/20], Step [200/627], Loss: 0.7212
Epoch [10/20], Step [201/627], Loss: 0.2231
Epoch [10/20], Step [202/627], Loss: 0.1276
Epoch [10/20], Step [203/627], Loss: 0.2679
Epoch [10/20], Step [204/627], Loss: 0.1908
Epoch [10/20], Step [205/627], Loss: 0.2499
Epoch [10/20], Step [206/627], Loss: 0.1379
Epoch [10/20], Step [207/627], Loss: 0.3692
Epoch [10/20], Step [208/627], Loss: 0.4028
Epoch [10/20], Step [209/627], Loss: 0.2366
Epoch [10/20], Step [210/627], Loss: 0.3564
Epoch [10/20], Step [211/627], Loss: 0.1660
Epoch [10/20], Step [212/627], Loss: 0.3787
Epoch [10/20], Step [213/627], Loss: 0.4357
Epoch [10/20], Step [214/627], Loss: 0.3006
Epoch [10/20], Step [215/627], Loss: 0.4458
Epoch [10/20], Step [216/627], Loss: 0.1409
Epoch [10/20], Step [217/627], L

Epoch [10/20], Step [385/627], Loss: 0.2508
Epoch [10/20], Step [386/627], Loss: 0.4626
Epoch [10/20], Step [387/627], Loss: 0.1823
Epoch [10/20], Step [388/627], Loss: 0.1288
Epoch [10/20], Step [389/627], Loss: 0.1931
Epoch [10/20], Step [390/627], Loss: 0.3451
Epoch [10/20], Step [391/627], Loss: 0.1222
Epoch [10/20], Step [392/627], Loss: 0.2186
Epoch [10/20], Step [393/627], Loss: 0.3072
Epoch [10/20], Step [394/627], Loss: 0.2860
Epoch [10/20], Step [395/627], Loss: 0.2191
Epoch [10/20], Step [396/627], Loss: 0.2915
Epoch [10/20], Step [397/627], Loss: 0.0363
Epoch [10/20], Step [398/627], Loss: 0.3504
Epoch [10/20], Step [399/627], Loss: 0.1289
Epoch [10/20], Step [400/627], Loss: 0.4559
Epoch [10/20], Step [401/627], Loss: 0.2596
Epoch [10/20], Step [402/627], Loss: 0.3033
Epoch [10/20], Step [403/627], Loss: 0.3527
Epoch [10/20], Step [404/627], Loss: 0.3034
Epoch [10/20], Step [405/627], Loss: 0.3323
Epoch [10/20], Step [406/627], Loss: 0.5121
Epoch [10/20], Step [407/627], L

Epoch [10/20], Step [575/627], Loss: 0.4049
Epoch [10/20], Step [576/627], Loss: 0.2599
Epoch [10/20], Step [577/627], Loss: 0.2424
Epoch [10/20], Step [578/627], Loss: 0.7455
Epoch [10/20], Step [579/627], Loss: 0.3816
Epoch [10/20], Step [580/627], Loss: 0.2898
Epoch [10/20], Step [581/627], Loss: 0.2153
Epoch [10/20], Step [582/627], Loss: 0.3937
Epoch [10/20], Step [583/627], Loss: 0.1141
Epoch [10/20], Step [584/627], Loss: 0.4303
Epoch [10/20], Step [585/627], Loss: 0.1460
Epoch [10/20], Step [586/627], Loss: 0.1337
Epoch [10/20], Step [587/627], Loss: 0.3149
Epoch [10/20], Step [588/627], Loss: 0.6797
Epoch [10/20], Step [589/627], Loss: 0.2526
Epoch [10/20], Step [590/627], Loss: 0.0924
Epoch [10/20], Step [591/627], Loss: 0.3165
Epoch [10/20], Step [592/627], Loss: 0.2318
Epoch [10/20], Step [593/627], Loss: 0.2923
Epoch [10/20], Step [594/627], Loss: 0.1831
Epoch [10/20], Step [595/627], Loss: 0.1778
Epoch [10/20], Step [596/627], Loss: 0.7318
Epoch [10/20], Step [597/627], L

Epoch [11/20], Step [141/627], Loss: 0.2432
Epoch [11/20], Step [142/627], Loss: 0.1835
Epoch [11/20], Step [143/627], Loss: 0.1664
Epoch [11/20], Step [144/627], Loss: 0.3665
Epoch [11/20], Step [145/627], Loss: 0.1912
Epoch [11/20], Step [146/627], Loss: 0.1988
Epoch [11/20], Step [147/627], Loss: 0.0890
Epoch [11/20], Step [148/627], Loss: 0.3813
Epoch [11/20], Step [149/627], Loss: 0.3219
Epoch [11/20], Step [150/627], Loss: 0.1609
Epoch [11/20], Step [151/627], Loss: 0.3224
Epoch [11/20], Step [152/627], Loss: 0.3063
Epoch [11/20], Step [153/627], Loss: 0.2790
Epoch [11/20], Step [154/627], Loss: 0.1617
Epoch [11/20], Step [155/627], Loss: 0.1481
Epoch [11/20], Step [156/627], Loss: 0.3950
Epoch [11/20], Step [157/627], Loss: 0.1356
Epoch [11/20], Step [158/627], Loss: 0.3565
Epoch [11/20], Step [159/627], Loss: 0.2043
Epoch [11/20], Step [160/627], Loss: 0.3769
Epoch [11/20], Step [161/627], Loss: 0.5560
Epoch [11/20], Step [162/627], Loss: 0.2873
Epoch [11/20], Step [163/627], L

Epoch [11/20], Step [331/627], Loss: 0.1480
Epoch [11/20], Step [332/627], Loss: 0.2395
Epoch [11/20], Step [333/627], Loss: 0.1862
Epoch [11/20], Step [334/627], Loss: 0.3037
Epoch [11/20], Step [335/627], Loss: 0.3557
Epoch [11/20], Step [336/627], Loss: 0.6081
Epoch [11/20], Step [337/627], Loss: 0.3701
Epoch [11/20], Step [338/627], Loss: 0.3235
Epoch [11/20], Step [339/627], Loss: 0.3080
Epoch [11/20], Step [340/627], Loss: 0.5003
Epoch [11/20], Step [341/627], Loss: 0.3587
Epoch [11/20], Step [342/627], Loss: 0.1741
Epoch [11/20], Step [343/627], Loss: 0.7705
Epoch [11/20], Step [344/627], Loss: 0.3514
Epoch [11/20], Step [345/627], Loss: 0.1484
Epoch [11/20], Step [346/627], Loss: 0.3677
Epoch [11/20], Step [347/627], Loss: 0.0775
Epoch [11/20], Step [348/627], Loss: 0.1958
Epoch [11/20], Step [349/627], Loss: 0.1279
Epoch [11/20], Step [350/627], Loss: 0.1123
Epoch [11/20], Step [351/627], Loss: 0.2573
Epoch [11/20], Step [352/627], Loss: 0.1754
Epoch [11/20], Step [353/627], L

Epoch [11/20], Step [521/627], Loss: 0.0849
Epoch [11/20], Step [522/627], Loss: 0.3699
Epoch [11/20], Step [523/627], Loss: 0.3884
Epoch [11/20], Step [524/627], Loss: 0.3824
Epoch [11/20], Step [525/627], Loss: 0.1304
Epoch [11/20], Step [526/627], Loss: 0.2528
Epoch [11/20], Step [527/627], Loss: 0.1080
Epoch [11/20], Step [528/627], Loss: 0.1907
Epoch [11/20], Step [529/627], Loss: 0.3368
Epoch [11/20], Step [530/627], Loss: 0.4214
Epoch [11/20], Step [531/627], Loss: 0.2825
Epoch [11/20], Step [532/627], Loss: 0.2586
Epoch [11/20], Step [533/627], Loss: 0.1811
Epoch [11/20], Step [534/627], Loss: 0.3065
Epoch [11/20], Step [535/627], Loss: 0.1827
Epoch [11/20], Step [536/627], Loss: 0.2745
Epoch [11/20], Step [537/627], Loss: 0.2842
Epoch [11/20], Step [538/627], Loss: 0.0912
Epoch [11/20], Step [539/627], Loss: 0.1204
Epoch [11/20], Step [540/627], Loss: 0.1818
Epoch [11/20], Step [541/627], Loss: 0.2527
Epoch [11/20], Step [542/627], Loss: 0.4737
Epoch [11/20], Step [543/627], L

Epoch [12/20], Step [86/627], Loss: 0.2348
Epoch [12/20], Step [87/627], Loss: 0.4624
Epoch [12/20], Step [88/627], Loss: 0.3615
Epoch [12/20], Step [89/627], Loss: 0.1842
Epoch [12/20], Step [90/627], Loss: 0.1816
Epoch [12/20], Step [91/627], Loss: 0.0955
Epoch [12/20], Step [92/627], Loss: 0.1385
Epoch [12/20], Step [93/627], Loss: 0.1830
Epoch [12/20], Step [94/627], Loss: 0.2317
Epoch [12/20], Step [95/627], Loss: 0.1003
Epoch [12/20], Step [96/627], Loss: 0.1222
Epoch [12/20], Step [97/627], Loss: 0.1289
Epoch [12/20], Step [98/627], Loss: 0.3608
Epoch [12/20], Step [99/627], Loss: 0.1868
Epoch [12/20], Step [100/627], Loss: 0.1755
Epoch [12/20], Step [101/627], Loss: 0.1552
Epoch [12/20], Step [102/627], Loss: 0.1537
Epoch [12/20], Step [103/627], Loss: 0.4373
Epoch [12/20], Step [104/627], Loss: 0.7223
Epoch [12/20], Step [105/627], Loss: 0.1156
Epoch [12/20], Step [106/627], Loss: 0.2892
Epoch [12/20], Step [107/627], Loss: 0.7183
Epoch [12/20], Step [108/627], Loss: 0.4467
Ep

Epoch [12/20], Step [276/627], Loss: 0.0809
Epoch [12/20], Step [277/627], Loss: 0.2506
Epoch [12/20], Step [278/627], Loss: 0.3773
Epoch [12/20], Step [279/627], Loss: 0.5210
Epoch [12/20], Step [280/627], Loss: 0.1649
Epoch [12/20], Step [281/627], Loss: 0.0894
Epoch [12/20], Step [282/627], Loss: 0.2062
Epoch [12/20], Step [283/627], Loss: 0.3241
Epoch [12/20], Step [284/627], Loss: 0.3024
Epoch [12/20], Step [285/627], Loss: 0.4461
Epoch [12/20], Step [286/627], Loss: 0.1387
Epoch [12/20], Step [287/627], Loss: 0.2505
Epoch [12/20], Step [288/627], Loss: 0.2074
Epoch [12/20], Step [289/627], Loss: 0.1409
Epoch [12/20], Step [290/627], Loss: 0.2096
Epoch [12/20], Step [291/627], Loss: 0.2489
Epoch [12/20], Step [292/627], Loss: 0.1087
Epoch [12/20], Step [293/627], Loss: 0.1466
Epoch [12/20], Step [294/627], Loss: 0.4486
Epoch [12/20], Step [295/627], Loss: 0.5845
Epoch [12/20], Step [296/627], Loss: 0.0778
Epoch [12/20], Step [297/627], Loss: 0.2042
Epoch [12/20], Step [298/627], L

Epoch [12/20], Step [466/627], Loss: 0.1855
Epoch [12/20], Step [467/627], Loss: 0.2003
Epoch [12/20], Step [468/627], Loss: 0.8079
Epoch [12/20], Step [469/627], Loss: 0.1932
Epoch [12/20], Step [470/627], Loss: 0.2121
Epoch [12/20], Step [471/627], Loss: 0.2338
Epoch [12/20], Step [472/627], Loss: 0.1955
Epoch [12/20], Step [473/627], Loss: 0.1655
Epoch [12/20], Step [474/627], Loss: 0.1535
Epoch [12/20], Step [475/627], Loss: 0.3687
Epoch [12/20], Step [476/627], Loss: 0.2525
Epoch [12/20], Step [477/627], Loss: 0.3215
Epoch [12/20], Step [478/627], Loss: 0.2402
Epoch [12/20], Step [479/627], Loss: 0.1250
Epoch [12/20], Step [480/627], Loss: 0.3227
Epoch [12/20], Step [481/627], Loss: 0.2534
Epoch [12/20], Step [482/627], Loss: 0.1922
Epoch [12/20], Step [483/627], Loss: 0.4163
Epoch [12/20], Step [484/627], Loss: 0.1681
Epoch [12/20], Step [485/627], Loss: 0.1249
Epoch [12/20], Step [486/627], Loss: 0.1214
Epoch [12/20], Step [487/627], Loss: 0.1414
Epoch [12/20], Step [488/627], L

Epoch [13/20], Step [26/627], Loss: 0.3987
Epoch [13/20], Step [27/627], Loss: 0.2615
Epoch [13/20], Step [28/627], Loss: 0.1131
Epoch [13/20], Step [29/627], Loss: 0.2799
Epoch [13/20], Step [30/627], Loss: 0.2044
Epoch [13/20], Step [31/627], Loss: 0.2250
Epoch [13/20], Step [32/627], Loss: 0.4235
Epoch [13/20], Step [33/627], Loss: 0.2476
Epoch [13/20], Step [34/627], Loss: 0.0854
Epoch [13/20], Step [35/627], Loss: 0.1936
Epoch [13/20], Step [36/627], Loss: 0.1310
Epoch [13/20], Step [37/627], Loss: 0.1739
Epoch [13/20], Step [38/627], Loss: 0.1550
Epoch [13/20], Step [39/627], Loss: 0.4810
Epoch [13/20], Step [40/627], Loss: 0.3470
Epoch [13/20], Step [41/627], Loss: 0.2733
Epoch [13/20], Step [42/627], Loss: 0.5209
Epoch [13/20], Step [43/627], Loss: 0.3011
Epoch [13/20], Step [44/627], Loss: 0.3807
Epoch [13/20], Step [45/627], Loss: 0.3864
Epoch [13/20], Step [46/627], Loss: 0.3034
Epoch [13/20], Step [47/627], Loss: 0.1781
Epoch [13/20], Step [48/627], Loss: 0.4954
Epoch [13/2

Epoch [13/20], Step [216/627], Loss: 0.2138
Epoch [13/20], Step [217/627], Loss: 0.2313
Epoch [13/20], Step [218/627], Loss: 0.3759
Epoch [13/20], Step [219/627], Loss: 0.3629
Epoch [13/20], Step [220/627], Loss: 0.1022
Epoch [13/20], Step [221/627], Loss: 0.4883
Epoch [13/20], Step [222/627], Loss: 0.2809
Epoch [13/20], Step [223/627], Loss: 0.1849
Epoch [13/20], Step [224/627], Loss: 0.2387
Epoch [13/20], Step [225/627], Loss: 0.3963
Epoch [13/20], Step [226/627], Loss: 0.2862
Epoch [13/20], Step [227/627], Loss: 0.3512
Epoch [13/20], Step [228/627], Loss: 0.5177
Epoch [13/20], Step [229/627], Loss: 0.1187
Epoch [13/20], Step [230/627], Loss: 0.1126
Epoch [13/20], Step [231/627], Loss: 0.1834
Epoch [13/20], Step [232/627], Loss: 0.2091
Epoch [13/20], Step [233/627], Loss: 0.5831
Epoch [13/20], Step [234/627], Loss: 0.1848
Epoch [13/20], Step [235/627], Loss: 0.4253
Epoch [13/20], Step [236/627], Loss: 0.1627
Epoch [13/20], Step [237/627], Loss: 0.3581
Epoch [13/20], Step [238/627], L

Epoch [13/20], Step [406/627], Loss: 0.2612
Epoch [13/20], Step [407/627], Loss: 0.2113
Epoch [13/20], Step [408/627], Loss: 0.0405
Epoch [13/20], Step [409/627], Loss: 0.2829
Epoch [13/20], Step [410/627], Loss: 0.1482
Epoch [13/20], Step [411/627], Loss: 0.2215
Epoch [13/20], Step [412/627], Loss: 0.1759
Epoch [13/20], Step [413/627], Loss: 0.1700
Epoch [13/20], Step [414/627], Loss: 0.1551
Epoch [13/20], Step [415/627], Loss: 0.1440
Epoch [13/20], Step [416/627], Loss: 0.3819
Epoch [13/20], Step [417/627], Loss: 0.4816
Epoch [13/20], Step [418/627], Loss: 0.3101
Epoch [13/20], Step [419/627], Loss: 0.2297
Epoch [13/20], Step [420/627], Loss: 0.1222
Epoch [13/20], Step [421/627], Loss: 0.1882
Epoch [13/20], Step [422/627], Loss: 0.3073
Epoch [13/20], Step [423/627], Loss: 0.0949
Epoch [13/20], Step [424/627], Loss: 0.0869
Epoch [13/20], Step [425/627], Loss: 0.1582
Epoch [13/20], Step [426/627], Loss: 0.1957
Epoch [13/20], Step [427/627], Loss: 0.1362
Epoch [13/20], Step [428/627], L

Epoch [13/20], Step [596/627], Loss: 0.1897
Epoch [13/20], Step [597/627], Loss: 0.0885
Epoch [13/20], Step [598/627], Loss: 0.3006
Epoch [13/20], Step [599/627], Loss: 0.2437
Epoch [13/20], Step [600/627], Loss: 0.2637
Epoch [13/20], Step [601/627], Loss: 0.6186
Epoch [13/20], Step [602/627], Loss: 0.2485
Epoch [13/20], Step [603/627], Loss: 0.1483
Epoch [13/20], Step [604/627], Loss: 0.0931
Epoch [13/20], Step [605/627], Loss: 0.2396
Epoch [13/20], Step [606/627], Loss: 0.1225
Epoch [13/20], Step [607/627], Loss: 0.4837
Epoch [13/20], Step [608/627], Loss: 0.4076
Epoch [13/20], Step [609/627], Loss: 0.1500
Epoch [13/20], Step [610/627], Loss: 0.0981
Epoch [13/20], Step [611/627], Loss: 0.3859
Epoch [13/20], Step [612/627], Loss: 0.2730
Epoch [13/20], Step [613/627], Loss: 0.1177
Epoch [13/20], Step [614/627], Loss: 0.2329
Epoch [13/20], Step [615/627], Loss: 0.1765
Epoch [13/20], Step [616/627], Loss: 0.2666
Epoch [13/20], Step [617/627], Loss: 0.3057
Epoch [13/20], Step [618/627], L

Epoch [14/20], Step [161/627], Loss: 0.1308
Epoch [14/20], Step [162/627], Loss: 0.1557
Epoch [14/20], Step [163/627], Loss: 0.1056
Epoch [14/20], Step [164/627], Loss: 0.2988
Epoch [14/20], Step [165/627], Loss: 0.3924
Epoch [14/20], Step [166/627], Loss: 0.4329
Epoch [14/20], Step [167/627], Loss: 0.1360
Epoch [14/20], Step [168/627], Loss: 0.1872
Epoch [14/20], Step [169/627], Loss: 0.2969
Epoch [14/20], Step [170/627], Loss: 0.1672
Epoch [14/20], Step [171/627], Loss: 0.2094
Epoch [14/20], Step [172/627], Loss: 0.0922
Epoch [14/20], Step [173/627], Loss: 0.1366
Epoch [14/20], Step [174/627], Loss: 0.0979
Epoch [14/20], Step [175/627], Loss: 0.0610
Epoch [14/20], Step [176/627], Loss: 0.2229
Epoch [14/20], Step [177/627], Loss: 0.1866
Epoch [14/20], Step [178/627], Loss: 0.2370
Epoch [14/20], Step [179/627], Loss: 0.0746
Epoch [14/20], Step [180/627], Loss: 0.1398
Epoch [14/20], Step [181/627], Loss: 0.1386
Epoch [14/20], Step [182/627], Loss: 0.1516
Epoch [14/20], Step [183/627], L

Epoch [14/20], Step [351/627], Loss: 0.3923
Epoch [14/20], Step [352/627], Loss: 0.2058
Epoch [14/20], Step [353/627], Loss: 0.2471
Epoch [14/20], Step [354/627], Loss: 0.1653
Epoch [14/20], Step [355/627], Loss: 0.1573
Epoch [14/20], Step [356/627], Loss: 0.1908
Epoch [14/20], Step [357/627], Loss: 0.1892
Epoch [14/20], Step [358/627], Loss: 0.2902
Epoch [14/20], Step [359/627], Loss: 0.1134
Epoch [14/20], Step [360/627], Loss: 0.2563
Epoch [14/20], Step [361/627], Loss: 0.1327
Epoch [14/20], Step [362/627], Loss: 0.1048
Epoch [14/20], Step [363/627], Loss: 0.2378
Epoch [14/20], Step [364/627], Loss: 0.1468
Epoch [14/20], Step [365/627], Loss: 0.0831
Epoch [14/20], Step [366/627], Loss: 0.2079
Epoch [14/20], Step [367/627], Loss: 0.1985
Epoch [14/20], Step [368/627], Loss: 0.2882
Epoch [14/20], Step [369/627], Loss: 0.1781
Epoch [14/20], Step [370/627], Loss: 0.1972
Epoch [14/20], Step [371/627], Loss: 0.1364
Epoch [14/20], Step [372/627], Loss: 0.1629
Epoch [14/20], Step [373/627], L

Epoch [14/20], Step [541/627], Loss: 0.1583
Epoch [14/20], Step [542/627], Loss: 0.0780
Epoch [14/20], Step [543/627], Loss: 0.3446
Epoch [14/20], Step [544/627], Loss: 0.1676
Epoch [14/20], Step [545/627], Loss: 0.3512
Epoch [14/20], Step [546/627], Loss: 0.2839
Epoch [14/20], Step [547/627], Loss: 0.1647
Epoch [14/20], Step [548/627], Loss: 0.2293
Epoch [14/20], Step [549/627], Loss: 0.2558
Epoch [14/20], Step [550/627], Loss: 0.1182
Epoch [14/20], Step [551/627], Loss: 0.3689
Epoch [14/20], Step [552/627], Loss: 0.3307
Epoch [14/20], Step [553/627], Loss: 0.1707
Epoch [14/20], Step [554/627], Loss: 0.1838
Epoch [14/20], Step [555/627], Loss: 0.3913
Epoch [14/20], Step [556/627], Loss: 0.3026
Epoch [14/20], Step [557/627], Loss: 0.1989
Epoch [14/20], Step [558/627], Loss: 0.1803
Epoch [14/20], Step [559/627], Loss: 0.1473
Epoch [14/20], Step [560/627], Loss: 0.2430
Epoch [14/20], Step [561/627], Loss: 0.4878
Epoch [14/20], Step [562/627], Loss: 0.3577
Epoch [14/20], Step [563/627], L

Epoch [15/20], Step [106/627], Loss: 0.1946
Epoch [15/20], Step [107/627], Loss: 0.1663
Epoch [15/20], Step [108/627], Loss: 0.2338
Epoch [15/20], Step [109/627], Loss: 0.0854
Epoch [15/20], Step [110/627], Loss: 0.2104
Epoch [15/20], Step [111/627], Loss: 0.1581
Epoch [15/20], Step [112/627], Loss: 0.2349
Epoch [15/20], Step [113/627], Loss: 0.1024
Epoch [15/20], Step [114/627], Loss: 0.1479
Epoch [15/20], Step [115/627], Loss: 0.1421
Epoch [15/20], Step [116/627], Loss: 0.1512
Epoch [15/20], Step [117/627], Loss: 0.2120
Epoch [15/20], Step [118/627], Loss: 0.3374
Epoch [15/20], Step [119/627], Loss: 0.1233
Epoch [15/20], Step [120/627], Loss: 0.3014
Epoch [15/20], Step [121/627], Loss: 0.2246
Epoch [15/20], Step [122/627], Loss: 0.1629
Epoch [15/20], Step [123/627], Loss: 0.2282
Epoch [15/20], Step [124/627], Loss: 0.2109
Epoch [15/20], Step [125/627], Loss: 0.1270
Epoch [15/20], Step [126/627], Loss: 0.1776
Epoch [15/20], Step [127/627], Loss: 0.1335
Epoch [15/20], Step [128/627], L

Epoch [15/20], Step [296/627], Loss: 0.1189
Epoch [15/20], Step [297/627], Loss: 0.1983
Epoch [15/20], Step [298/627], Loss: 0.2289
Epoch [15/20], Step [299/627], Loss: 0.1497
Epoch [15/20], Step [300/627], Loss: 0.2728
Epoch [15/20], Step [301/627], Loss: 0.1168
Epoch [15/20], Step [302/627], Loss: 0.0696
Epoch [15/20], Step [303/627], Loss: 0.5040
Epoch [15/20], Step [304/627], Loss: 0.1263
Epoch [15/20], Step [305/627], Loss: 0.1454
Epoch [15/20], Step [306/627], Loss: 0.1140
Epoch [15/20], Step [307/627], Loss: 0.1238
Epoch [15/20], Step [308/627], Loss: 0.1700
Epoch [15/20], Step [309/627], Loss: 0.2313
Epoch [15/20], Step [310/627], Loss: 0.1516
Epoch [15/20], Step [311/627], Loss: 0.1514
Epoch [15/20], Step [312/627], Loss: 0.0920
Epoch [15/20], Step [313/627], Loss: 0.1980
Epoch [15/20], Step [314/627], Loss: 0.1692
Epoch [15/20], Step [315/627], Loss: 0.3537
Epoch [15/20], Step [316/627], Loss: 0.1629
Epoch [15/20], Step [317/627], Loss: 0.1269
Epoch [15/20], Step [318/627], L

Epoch [15/20], Step [486/627], Loss: 0.1102
Epoch [15/20], Step [487/627], Loss: 0.2889
Epoch [15/20], Step [488/627], Loss: 0.1395
Epoch [15/20], Step [489/627], Loss: 0.1030
Epoch [15/20], Step [490/627], Loss: 0.1106
Epoch [15/20], Step [491/627], Loss: 0.2146
Epoch [15/20], Step [492/627], Loss: 0.0752
Epoch [15/20], Step [493/627], Loss: 0.1023
Epoch [15/20], Step [494/627], Loss: 0.1743
Epoch [15/20], Step [495/627], Loss: 0.1280
Epoch [15/20], Step [496/627], Loss: 0.2720
Epoch [15/20], Step [497/627], Loss: 0.4001
Epoch [15/20], Step [498/627], Loss: 0.3013
Epoch [15/20], Step [499/627], Loss: 0.0766
Epoch [15/20], Step [500/627], Loss: 0.3204
Epoch [15/20], Step [501/627], Loss: 0.1273
Epoch [15/20], Step [502/627], Loss: 0.2615
Epoch [15/20], Step [503/627], Loss: 0.1226
Epoch [15/20], Step [504/627], Loss: 0.1628
Epoch [15/20], Step [505/627], Loss: 0.1479
Epoch [15/20], Step [506/627], Loss: 0.1378
Epoch [15/20], Step [507/627], Loss: 0.1774
Epoch [15/20], Step [508/627], L

Epoch [16/20], Step [51/627], Loss: 0.0656
Epoch [16/20], Step [52/627], Loss: 0.1991
Epoch [16/20], Step [53/627], Loss: 0.0810
Epoch [16/20], Step [54/627], Loss: 0.1246
Epoch [16/20], Step [55/627], Loss: 0.1636
Epoch [16/20], Step [56/627], Loss: 0.0768
Epoch [16/20], Step [57/627], Loss: 0.1161
Epoch [16/20], Step [58/627], Loss: 0.2655
Epoch [16/20], Step [59/627], Loss: 0.1685
Epoch [16/20], Step [60/627], Loss: 0.1159
Epoch [16/20], Step [61/627], Loss: 0.1239
Epoch [16/20], Step [62/627], Loss: 0.2566
Epoch [16/20], Step [63/627], Loss: 0.0505
Epoch [16/20], Step [64/627], Loss: 0.0951
Epoch [16/20], Step [65/627], Loss: 0.0895
Epoch [16/20], Step [66/627], Loss: 0.2052
Epoch [16/20], Step [67/627], Loss: 0.1418
Epoch [16/20], Step [68/627], Loss: 0.1717
Epoch [16/20], Step [69/627], Loss: 0.0731
Epoch [16/20], Step [70/627], Loss: 0.1465
Epoch [16/20], Step [71/627], Loss: 0.1775
Epoch [16/20], Step [72/627], Loss: 0.0521
Epoch [16/20], Step [73/627], Loss: 0.3054
Epoch [16/2

Epoch [16/20], Step [241/627], Loss: 0.2157
Epoch [16/20], Step [242/627], Loss: 0.1540
Epoch [16/20], Step [243/627], Loss: 0.1013
Epoch [16/20], Step [244/627], Loss: 0.1068
Epoch [16/20], Step [245/627], Loss: 0.2550
Epoch [16/20], Step [246/627], Loss: 0.3126
Epoch [16/20], Step [247/627], Loss: 0.1515
Epoch [16/20], Step [248/627], Loss: 0.0914
Epoch [16/20], Step [249/627], Loss: 0.2204
Epoch [16/20], Step [250/627], Loss: 0.2250
Epoch [16/20], Step [251/627], Loss: 0.1991
Epoch [16/20], Step [252/627], Loss: 0.2393
Epoch [16/20], Step [253/627], Loss: 0.2660
Epoch [16/20], Step [254/627], Loss: 0.2768
Epoch [16/20], Step [255/627], Loss: 0.1517
Epoch [16/20], Step [256/627], Loss: 0.1881
Epoch [16/20], Step [257/627], Loss: 0.0757
Epoch [16/20], Step [258/627], Loss: 0.1575
Epoch [16/20], Step [259/627], Loss: 0.1328
Epoch [16/20], Step [260/627], Loss: 0.2872
Epoch [16/20], Step [261/627], Loss: 0.1140
Epoch [16/20], Step [262/627], Loss: 0.0908
Epoch [16/20], Step [263/627], L

Epoch [16/20], Step [431/627], Loss: 0.3045
Epoch [16/20], Step [432/627], Loss: 0.1186
Epoch [16/20], Step [433/627], Loss: 0.2453
Epoch [16/20], Step [434/627], Loss: 0.1123
Epoch [16/20], Step [435/627], Loss: 0.3230
Epoch [16/20], Step [436/627], Loss: 0.2586
Epoch [16/20], Step [437/627], Loss: 0.1729
Epoch [16/20], Step [438/627], Loss: 0.1766
Epoch [16/20], Step [439/627], Loss: 0.2354
Epoch [16/20], Step [440/627], Loss: 0.2740
Epoch [16/20], Step [441/627], Loss: 0.1277
Epoch [16/20], Step [442/627], Loss: 0.0358
Epoch [16/20], Step [443/627], Loss: 0.1936
Epoch [16/20], Step [444/627], Loss: 0.0857
Epoch [16/20], Step [445/627], Loss: 0.1511
Epoch [16/20], Step [446/627], Loss: 0.1639
Epoch [16/20], Step [447/627], Loss: 0.1198
Epoch [16/20], Step [448/627], Loss: 0.0613
Epoch [16/20], Step [449/627], Loss: 0.2562
Epoch [16/20], Step [450/627], Loss: 0.0738
Epoch [16/20], Step [451/627], Loss: 0.2525
Epoch [16/20], Step [452/627], Loss: 0.2078
Epoch [16/20], Step [453/627], L

Epoch [16/20], Step [621/627], Loss: 0.0975
Epoch [16/20], Step [622/627], Loss: 0.1567
Epoch [16/20], Step [623/627], Loss: 0.0862
Epoch [16/20], Step [624/627], Loss: 0.2082
Epoch [16/20], Step [625/627], Loss: 0.1421
Epoch [16/20], Step [626/627], Loss: 0.0579
Epoch [16/20], Step [627/627], Loss: 0.0815
Epoch [17/20], Step [1/627], Loss: 0.5071
Epoch [17/20], Step [2/627], Loss: 0.1076
Epoch [17/20], Step [3/627], Loss: 0.0846
Epoch [17/20], Step [4/627], Loss: 0.1559
Epoch [17/20], Step [5/627], Loss: 0.1569
Epoch [17/20], Step [6/627], Loss: 0.1718
Epoch [17/20], Step [7/627], Loss: 0.2438
Epoch [17/20], Step [8/627], Loss: 0.1107
Epoch [17/20], Step [9/627], Loss: 0.1836
Epoch [17/20], Step [10/627], Loss: 0.0670
Epoch [17/20], Step [11/627], Loss: 0.0308
Epoch [17/20], Step [12/627], Loss: 0.0599
Epoch [17/20], Step [13/627], Loss: 0.3676
Epoch [17/20], Step [14/627], Loss: 0.0927
Epoch [17/20], Step [15/627], Loss: 0.0965
Epoch [17/20], Step [16/627], Loss: 0.2287
Epoch [17/20]

Epoch [17/20], Step [186/627], Loss: 0.1535
Epoch [17/20], Step [187/627], Loss: 0.1213
Epoch [17/20], Step [188/627], Loss: 0.1844
Epoch [17/20], Step [189/627], Loss: 0.0873
Epoch [17/20], Step [190/627], Loss: 0.1113
Epoch [17/20], Step [191/627], Loss: 0.1674
Epoch [17/20], Step [192/627], Loss: 0.1124
Epoch [17/20], Step [193/627], Loss: 0.1828
Epoch [17/20], Step [194/627], Loss: 0.0685
Epoch [17/20], Step [195/627], Loss: 0.1112
Epoch [17/20], Step [196/627], Loss: 0.1050
Epoch [17/20], Step [197/627], Loss: 0.0620
Epoch [17/20], Step [198/627], Loss: 0.0657
Epoch [17/20], Step [199/627], Loss: 0.1905
Epoch [17/20], Step [200/627], Loss: 0.1810
Epoch [17/20], Step [201/627], Loss: 0.1819
Epoch [17/20], Step [202/627], Loss: 0.3219
Epoch [17/20], Step [203/627], Loss: 0.0964
Epoch [17/20], Step [204/627], Loss: 0.1725
Epoch [17/20], Step [205/627], Loss: 0.1569
Epoch [17/20], Step [206/627], Loss: 0.1059
Epoch [17/20], Step [207/627], Loss: 0.1806
Epoch [17/20], Step [208/627], L

Epoch [17/20], Step [376/627], Loss: 0.2222
Epoch [17/20], Step [377/627], Loss: 0.1990
Epoch [17/20], Step [378/627], Loss: 0.1050
Epoch [17/20], Step [379/627], Loss: 0.0989
Epoch [17/20], Step [380/627], Loss: 0.1332
Epoch [17/20], Step [381/627], Loss: 0.2795
Epoch [17/20], Step [382/627], Loss: 0.1005
Epoch [17/20], Step [383/627], Loss: 0.1701
Epoch [17/20], Step [384/627], Loss: 0.0429
Epoch [17/20], Step [385/627], Loss: 0.1732
Epoch [17/20], Step [386/627], Loss: 0.0838
Epoch [17/20], Step [387/627], Loss: 0.2145
Epoch [17/20], Step [388/627], Loss: 0.1008
Epoch [17/20], Step [389/627], Loss: 0.1710
Epoch [17/20], Step [390/627], Loss: 0.0769
Epoch [17/20], Step [391/627], Loss: 0.0587
Epoch [17/20], Step [392/627], Loss: 0.0521
Epoch [17/20], Step [393/627], Loss: 0.1798
Epoch [17/20], Step [394/627], Loss: 0.2392
Epoch [17/20], Step [395/627], Loss: 0.1212
Epoch [17/20], Step [396/627], Loss: 0.0948
Epoch [17/20], Step [397/627], Loss: 0.1087
Epoch [17/20], Step [398/627], L

Epoch [17/20], Step [566/627], Loss: 0.1348
Epoch [17/20], Step [567/627], Loss: 0.1255
Epoch [17/20], Step [568/627], Loss: 0.1031
Epoch [17/20], Step [569/627], Loss: 0.1084
Epoch [17/20], Step [570/627], Loss: 0.1494
Epoch [17/20], Step [571/627], Loss: 0.1320
Epoch [17/20], Step [572/627], Loss: 0.2308
Epoch [17/20], Step [573/627], Loss: 0.2357
Epoch [17/20], Step [574/627], Loss: 0.0370
Epoch [17/20], Step [575/627], Loss: 0.2357
Epoch [17/20], Step [576/627], Loss: 0.3204
Epoch [17/20], Step [577/627], Loss: 0.1217
Epoch [17/20], Step [578/627], Loss: 0.1558
Epoch [17/20], Step [579/627], Loss: 0.2594
Epoch [17/20], Step [580/627], Loss: 0.0748
Epoch [17/20], Step [581/627], Loss: 0.0804
Epoch [17/20], Step [582/627], Loss: 0.1908
Epoch [17/20], Step [583/627], Loss: 0.2831
Epoch [17/20], Step [584/627], Loss: 0.0628
Epoch [17/20], Step [585/627], Loss: 0.1035
Epoch [17/20], Step [586/627], Loss: 0.1217
Epoch [17/20], Step [587/627], Loss: 0.1314
Epoch [17/20], Step [588/627], L

Epoch [18/20], Step [131/627], Loss: 0.2439
Epoch [18/20], Step [132/627], Loss: 0.0356
Epoch [18/20], Step [133/627], Loss: 0.1459
Epoch [18/20], Step [134/627], Loss: 0.0866
Epoch [18/20], Step [135/627], Loss: 0.0875
Epoch [18/20], Step [136/627], Loss: 0.0749
Epoch [18/20], Step [137/627], Loss: 0.1082
Epoch [18/20], Step [138/627], Loss: 0.0990
Epoch [18/20], Step [139/627], Loss: 0.1165
Epoch [18/20], Step [140/627], Loss: 0.0503
Epoch [18/20], Step [141/627], Loss: 0.1908
Epoch [18/20], Step [142/627], Loss: 0.2489
Epoch [18/20], Step [143/627], Loss: 0.1415
Epoch [18/20], Step [144/627], Loss: 0.0780
Epoch [18/20], Step [145/627], Loss: 0.1241
Epoch [18/20], Step [146/627], Loss: 0.1239
Epoch [18/20], Step [147/627], Loss: 0.1480
Epoch [18/20], Step [148/627], Loss: 0.2107
Epoch [18/20], Step [149/627], Loss: 0.1631
Epoch [18/20], Step [150/627], Loss: 0.1200
Epoch [18/20], Step [151/627], Loss: 0.0723
Epoch [18/20], Step [152/627], Loss: 0.0501
Epoch [18/20], Step [153/627], L

Epoch [18/20], Step [321/627], Loss: 0.2094
Epoch [18/20], Step [322/627], Loss: 0.1102
Epoch [18/20], Step [323/627], Loss: 0.1513
Epoch [18/20], Step [324/627], Loss: 0.0788
Epoch [18/20], Step [325/627], Loss: 0.1072
Epoch [18/20], Step [326/627], Loss: 0.1123
Epoch [18/20], Step [327/627], Loss: 0.1807
Epoch [18/20], Step [328/627], Loss: 0.1578
Epoch [18/20], Step [329/627], Loss: 0.1261
Epoch [18/20], Step [330/627], Loss: 0.3238
Epoch [18/20], Step [331/627], Loss: 0.0998
Epoch [18/20], Step [332/627], Loss: 0.2361
Epoch [18/20], Step [333/627], Loss: 0.1023
Epoch [18/20], Step [334/627], Loss: 0.1863
Epoch [18/20], Step [335/627], Loss: 0.2785
Epoch [18/20], Step [336/627], Loss: 0.2491
Epoch [18/20], Step [337/627], Loss: 0.1012
Epoch [18/20], Step [338/627], Loss: 0.0921
Epoch [18/20], Step [339/627], Loss: 0.2214
Epoch [18/20], Step [340/627], Loss: 0.0466
Epoch [18/20], Step [341/627], Loss: 0.0958
Epoch [18/20], Step [342/627], Loss: 0.0717
Epoch [18/20], Step [343/627], L

Epoch [18/20], Step [511/627], Loss: 0.0562
Epoch [18/20], Step [512/627], Loss: 0.2437
Epoch [18/20], Step [513/627], Loss: 0.1981
Epoch [18/20], Step [514/627], Loss: 0.1134
Epoch [18/20], Step [515/627], Loss: 0.1566
Epoch [18/20], Step [516/627], Loss: 0.1112
Epoch [18/20], Step [517/627], Loss: 0.1268
Epoch [18/20], Step [518/627], Loss: 0.2155
Epoch [18/20], Step [519/627], Loss: 0.1927
Epoch [18/20], Step [520/627], Loss: 0.0721
Epoch [18/20], Step [521/627], Loss: 0.0776
Epoch [18/20], Step [522/627], Loss: 0.1732
Epoch [18/20], Step [523/627], Loss: 0.1347
Epoch [18/20], Step [524/627], Loss: 0.1476
Epoch [18/20], Step [525/627], Loss: 0.1390
Epoch [18/20], Step [526/627], Loss: 0.1699
Epoch [18/20], Step [527/627], Loss: 0.1425
Epoch [18/20], Step [528/627], Loss: 0.2300
Epoch [18/20], Step [529/627], Loss: 0.0420
Epoch [18/20], Step [530/627], Loss: 0.0478
Epoch [18/20], Step [531/627], Loss: 0.0908
Epoch [18/20], Step [532/627], Loss: 0.0793
Epoch [18/20], Step [533/627], L

Epoch [19/20], Step [76/627], Loss: 0.1224
Epoch [19/20], Step [77/627], Loss: 0.1855
Epoch [19/20], Step [78/627], Loss: 0.1622
Epoch [19/20], Step [79/627], Loss: 0.1552
Epoch [19/20], Step [80/627], Loss: 0.0692
Epoch [19/20], Step [81/627], Loss: 0.0416
Epoch [19/20], Step [82/627], Loss: 0.2218
Epoch [19/20], Step [83/627], Loss: 0.0835
Epoch [19/20], Step [84/627], Loss: 0.3203
Epoch [19/20], Step [85/627], Loss: 0.0978
Epoch [19/20], Step [86/627], Loss: 0.1305
Epoch [19/20], Step [87/627], Loss: 0.2749
Epoch [19/20], Step [88/627], Loss: 0.1645
Epoch [19/20], Step [89/627], Loss: 0.0799
Epoch [19/20], Step [90/627], Loss: 0.1273
Epoch [19/20], Step [91/627], Loss: 0.1752
Epoch [19/20], Step [92/627], Loss: 0.1101
Epoch [19/20], Step [93/627], Loss: 0.1156
Epoch [19/20], Step [94/627], Loss: 0.1553
Epoch [19/20], Step [95/627], Loss: 0.0652
Epoch [19/20], Step [96/627], Loss: 0.1562
Epoch [19/20], Step [97/627], Loss: 0.1355
Epoch [19/20], Step [98/627], Loss: 0.1291
Epoch [19/2

Epoch [19/20], Step [266/627], Loss: 0.0809
Epoch [19/20], Step [267/627], Loss: 0.1164
Epoch [19/20], Step [268/627], Loss: 0.0985
Epoch [19/20], Step [269/627], Loss: 0.1373
Epoch [19/20], Step [270/627], Loss: 0.2022
Epoch [19/20], Step [271/627], Loss: 0.1070
Epoch [19/20], Step [272/627], Loss: 0.0604
Epoch [19/20], Step [273/627], Loss: 0.0849
Epoch [19/20], Step [274/627], Loss: 0.1098
Epoch [19/20], Step [275/627], Loss: 0.1446
Epoch [19/20], Step [276/627], Loss: 0.0559
Epoch [19/20], Step [277/627], Loss: 0.0433
Epoch [19/20], Step [278/627], Loss: 0.0519
Epoch [19/20], Step [279/627], Loss: 0.1647
Epoch [19/20], Step [280/627], Loss: 0.0728
Epoch [19/20], Step [281/627], Loss: 0.1035
Epoch [19/20], Step [282/627], Loss: 0.0561
Epoch [19/20], Step [283/627], Loss: 0.1389
Epoch [19/20], Step [284/627], Loss: 0.1599
Epoch [19/20], Step [285/627], Loss: 0.1720
Epoch [19/20], Step [286/627], Loss: 0.0761
Epoch [19/20], Step [287/627], Loss: 0.0629
Epoch [19/20], Step [288/627], L

Epoch [19/20], Step [456/627], Loss: 0.0640
Epoch [19/20], Step [457/627], Loss: 0.2300
Epoch [19/20], Step [458/627], Loss: 0.1647
Epoch [19/20], Step [459/627], Loss: 0.1297
Epoch [19/20], Step [460/627], Loss: 0.1306
Epoch [19/20], Step [461/627], Loss: 0.0724
Epoch [19/20], Step [462/627], Loss: 0.1141
Epoch [19/20], Step [463/627], Loss: 0.0530
Epoch [19/20], Step [464/627], Loss: 0.1410
Epoch [19/20], Step [465/627], Loss: 0.1705
Epoch [19/20], Step [466/627], Loss: 0.1320
Epoch [19/20], Step [467/627], Loss: 0.0997
Epoch [19/20], Step [468/627], Loss: 0.2023
Epoch [19/20], Step [469/627], Loss: 0.1987
Epoch [19/20], Step [470/627], Loss: 0.0631
Epoch [19/20], Step [471/627], Loss: 0.1249
Epoch [19/20], Step [472/627], Loss: 0.0780
Epoch [19/20], Step [473/627], Loss: 0.0955
Epoch [19/20], Step [474/627], Loss: 0.1036
Epoch [19/20], Step [475/627], Loss: 0.1174
Epoch [19/20], Step [476/627], Loss: 0.2194
Epoch [19/20], Step [477/627], Loss: 0.1080
Epoch [19/20], Step [478/627], L

Epoch [20/20], Step [15/627], Loss: 0.0782
Epoch [20/20], Step [16/627], Loss: 0.0826
Epoch [20/20], Step [17/627], Loss: 0.0601
Epoch [20/20], Step [18/627], Loss: 0.1198
Epoch [20/20], Step [19/627], Loss: 0.0210
Epoch [20/20], Step [20/627], Loss: 0.0714
Epoch [20/20], Step [21/627], Loss: 0.0541
Epoch [20/20], Step [22/627], Loss: 0.1102
Epoch [20/20], Step [23/627], Loss: 0.1873
Epoch [20/20], Step [24/627], Loss: 0.1069
Epoch [20/20], Step [25/627], Loss: 0.1179
Epoch [20/20], Step [26/627], Loss: 0.0827
Epoch [20/20], Step [27/627], Loss: 0.2937
Epoch [20/20], Step [28/627], Loss: 0.0457
Epoch [20/20], Step [29/627], Loss: 0.0567
Epoch [20/20], Step [30/627], Loss: 0.0882
Epoch [20/20], Step [31/627], Loss: 0.1038
Epoch [20/20], Step [32/627], Loss: 0.0964
Epoch [20/20], Step [33/627], Loss: 0.0743
Epoch [20/20], Step [34/627], Loss: 0.0794
Epoch [20/20], Step [35/627], Loss: 0.1527
Epoch [20/20], Step [36/627], Loss: 0.3640
Epoch [20/20], Step [37/627], Loss: 0.0910
Epoch [20/2

Epoch [20/20], Step [205/627], Loss: 0.0698
Epoch [20/20], Step [206/627], Loss: 0.0626
Epoch [20/20], Step [207/627], Loss: 0.0420
Epoch [20/20], Step [208/627], Loss: 0.0808
Epoch [20/20], Step [209/627], Loss: 0.1656
Epoch [20/20], Step [210/627], Loss: 0.0585
Epoch [20/20], Step [211/627], Loss: 0.0703
Epoch [20/20], Step [212/627], Loss: 0.0928
Epoch [20/20], Step [213/627], Loss: 0.0921
Epoch [20/20], Step [214/627], Loss: 0.0471
Epoch [20/20], Step [215/627], Loss: 0.0356
Epoch [20/20], Step [216/627], Loss: 0.1333
Epoch [20/20], Step [217/627], Loss: 0.1234
Epoch [20/20], Step [218/627], Loss: 0.1121
Epoch [20/20], Step [219/627], Loss: 0.0244
Epoch [20/20], Step [220/627], Loss: 0.1266
Epoch [20/20], Step [221/627], Loss: 0.0888
Epoch [20/20], Step [222/627], Loss: 0.0800
Epoch [20/20], Step [223/627], Loss: 0.2588
Epoch [20/20], Step [224/627], Loss: 0.1945
Epoch [20/20], Step [225/627], Loss: 0.0519
Epoch [20/20], Step [226/627], Loss: 0.1620
Epoch [20/20], Step [227/627], L

Epoch [20/20], Step [395/627], Loss: 0.3924
Epoch [20/20], Step [396/627], Loss: 0.0632
Epoch [20/20], Step [397/627], Loss: 0.1718
Epoch [20/20], Step [398/627], Loss: 0.1156
Epoch [20/20], Step [399/627], Loss: 0.0836
Epoch [20/20], Step [400/627], Loss: 0.0687
Epoch [20/20], Step [401/627], Loss: 0.0811
Epoch [20/20], Step [402/627], Loss: 0.0670
Epoch [20/20], Step [403/627], Loss: 0.1464
Epoch [20/20], Step [404/627], Loss: 0.1249
Epoch [20/20], Step [405/627], Loss: 0.0724
Epoch [20/20], Step [406/627], Loss: 0.0464
Epoch [20/20], Step [407/627], Loss: 0.3452
Epoch [20/20], Step [408/627], Loss: 0.1928
Epoch [20/20], Step [409/627], Loss: 0.0481
Epoch [20/20], Step [410/627], Loss: 0.1747
Epoch [20/20], Step [411/627], Loss: 0.1552
Epoch [20/20], Step [412/627], Loss: 0.3042
Epoch [20/20], Step [413/627], Loss: 0.1494
Epoch [20/20], Step [414/627], Loss: 0.1333
Epoch [20/20], Step [415/627], Loss: 0.1283
Epoch [20/20], Step [416/627], Loss: 0.0618
Epoch [20/20], Step [417/627], L

Epoch [20/20], Step [585/627], Loss: 0.1926
Epoch [20/20], Step [586/627], Loss: 0.1826
Epoch [20/20], Step [587/627], Loss: 0.1069
Epoch [20/20], Step [588/627], Loss: 0.1825
Epoch [20/20], Step [589/627], Loss: 0.0686
Epoch [20/20], Step [590/627], Loss: 0.2291
Epoch [20/20], Step [591/627], Loss: 0.1572
Epoch [20/20], Step [592/627], Loss: 0.0587
Epoch [20/20], Step [593/627], Loss: 0.1003
Epoch [20/20], Step [594/627], Loss: 0.1543
Epoch [20/20], Step [595/627], Loss: 0.2220
Epoch [20/20], Step [596/627], Loss: 0.1835
Epoch [20/20], Step [597/627], Loss: 0.0879
Epoch [20/20], Step [598/627], Loss: 0.1396
Epoch [20/20], Step [599/627], Loss: 0.1100
Epoch [20/20], Step [600/627], Loss: 0.1072
Epoch [20/20], Step [601/627], Loss: 0.1371
Epoch [20/20], Step [602/627], Loss: 0.0968
Epoch [20/20], Step [603/627], Loss: 0.0523
Epoch [20/20], Step [604/627], Loss: 0.0658
Epoch [20/20], Step [605/627], Loss: 0.0949
Epoch [20/20], Step [606/627], Loss: 0.1898
Epoch [20/20], Step [607/627], L

In [44]:
best_epoch

19

In [45]:
model.eval()
# eval mode (batchnorm uses moving mean/variance instead of mini-batch mean/variance)
total_preds = np.array([])
total_labels = np.array([])
with torch.no_grad():
    correct = 0
    total = 0
    for i in test_loader:
        images = i['outer_product']
        labels = i['Label']
        images = images.to(device)
        labels = labels.to(device)
        
        # Forward pass
        outputs = model(images) 
        outputs = outputs.cpu().detach().numpy().flatten()
        labels =labels.cpu().detach().numpy().flatten()
        total_preds = np.concatenate([total_preds, outputs])
        total_labels = np.concatenate([total_labels, labels])
#         total_preds = torch.cat(total_preds, outputs.cpu(), 0 )
#         total_labels = torch.cat(total_labels, labels.cpu(), 0)
#         break

In [46]:
G,P = total_labels, total_preds

In [47]:
rmse(G,P)

1.0090536904610754

In [48]:
mse(G,P)

1.0181893502331156

In [49]:
pearson(G,P)

0.43066980360698215

In [50]:
ci(G,P)

0.6985993820628222

In [51]:
model = ConvNet().to(device)

In [52]:
model.load_state_dict(torch.load('./best_sim-CNN-DTA_davis_fold1x.model'))

<All keys matched successfully>

In [53]:
model.eval()


ConvNet(
  (conv1): Conv2d(1, 32, kernel_size=(5, 5), stride=(1, 1))
  (pool1): MaxPool2d(kernel_size=2, stride=2, padding=0, dilation=1, ceil_mode=False)
  (conv2): Conv2d(32, 18, kernel_size=(3, 3), stride=(1, 1))
  (pool2): MaxPool2d(kernel_size=2, stride=2, padding=0, dilation=1, ceil_mode=False)
  (fc1): Linear(in_features=16200, out_features=128, bias=True)
  (fc2): Linear(in_features=128, out_features=1, bias=True)
  (dropout): Dropout(p=0.1, inplace=False)
)

In [54]:
total_preds = np.array([])
total_labels = np.array([])
with torch.no_grad():
    correct = 0
    total = 0
    for i in test_loader:
        images = i['outer_product']
        labels = i['Label']
        images = images.to(device)
        labels = labels.to(device)
        
        # Forward pass
        outputs = model(images) 
        outputs = outputs.cpu().detach().numpy().flatten()
        labels =labels.cpu().detach().numpy().flatten()
        total_preds = np.concatenate([total_preds, outputs])
        total_labels = np.concatenate([total_labels, labels])
#         total_preds = torch.cat(total_preds, outputs.cpu(), 0 )
#         total_labels = torch.cat(total_labels, labels.cpu(), 0)
#         break

In [55]:
G,P = total_labels, total_preds

In [56]:
rmse(G,P)

0.9417070648264768

In [60]:
print("MSE = ",mse(G,P))
print("R = ",pearson(G,P))
print("CI = ",ci(G,P))
print("RMSE = ",rmse(G,P))


MSE =  0.8868121959440982
R =  0.4284664823235108
CI =  0.7183587860551893
RMSE =  0.9417070648264768
