In [1]:
import tensorflow as tf
import numpy as np
tf.__version__

'2.0.0'

In [2]:
class MNISTLoader():
    """Load MNIST through ``tf.keras.datasets`` and serve random training batches.

    Attributes:
        train_data / test_data: float32 images scaled to [0, 1] with a trailing
            channel axis ([60000, 28, 28, 1] and [10000, 28, 28, 1] for MNIST).
        train_label / test_label: int32 class labels ([60000] and [10000]).
        num_train_data / num_test_data: number of samples in each split.
    """

    def __init__(self):
        """Fetch the dataset and normalise it."""
        (train_images, train_labels), (test_images, test_labels) = tf.keras.datasets.mnist.load_data()
        # MNIST images are uint8 (0-255) by default: rescale them to floats in
        # [0, 1] and append one trailing axis that acts as the colour channel.
        self.train_data = (train_images.astype(np.float32) / 255.0)[..., np.newaxis]
        self.test_data = (test_images.astype(np.float32) / 255.0)[..., np.newaxis]
        self.train_label = train_labels.astype(np.int32)
        self.test_label = test_labels.astype(np.int32)
        self.num_train_data = self.train_data.shape[0]
        self.num_test_data = self.test_data.shape[0]

    def get_batch(self, batch_size):
        """Return ``batch_size`` randomly chosen training samples.

        Indices are drawn with ``np.random.randint``, i.e. with replacement,
        so the same sample may appear more than once in a batch.

        Args:
            batch_size: number of samples to draw.

        Returns:
            A ``(data, labels)`` tuple whose first dimension is ``batch_size``.
        """
        picks = np.random.randint(0, self.train_data.shape[0], batch_size)
        return self.train_data[picks], self.train_label[picks]

In [3]:
class MLP(tf.keras.Model):
    """Multilayer perceptron: flatten -> Dense(100, ReLU) -> Dense(10) -> softmax."""

    def __init__(self):
        super().__init__()
        # Collapses every non-batch axis into a single feature vector.
        self.flatten = tf.keras.layers.Flatten()
        # Hidden layer of 100 units with ReLU activation.
        self.dense1 = tf.keras.layers.Dense(100, activation=tf.nn.relu)
        # Output layer: 10 units, no activation (softmax is applied in call()).
        self.dense2 = tf.keras.layers.Dense(10)

    def call(self, inputs):
        """Run the forward pass and return the softmax of the output layer.

        Args:
            inputs: batch of inputs; flattened before the dense layers.

        Returns:
            Tensor with 10 softmax-normalised values per sample.
        """
        hidden = self.dense1(self.flatten(inputs))
        logits = self.dense2(hidden)
        return tf.nn.softmax(logits)

In [4]:
# Training hyperparameters.
batch_size = 50          # samples drawn per training step
num_batches = 10000      # number of training steps to run
learning_rate = 1e-3     # step size handed to the optimizer

# Data source and the model to be trained.
data_loader = MNISTLoader()
model = MLP()

In [5]:
# Adam optimizer configured with the learning rate chosen above.
optimizer = tf.keras.optimizers.Adam(
    learning_rate=learning_rate,
)

实例化记录器，并在训练循环中将每个 batch 的损失写入 TensorBoard

In [6]:
# Create the summary writer; TensorBoard event files are written to ./tensorboard.
summary_writer = tf.summary.create_file_writer('./tensorboard')
for batch_index in range(num_batches):
    X, y = data_loader.get_batch(batch_size)
    # Only the forward pass and the loss computation need to be recorded on
    # the tape; logging is kept out of this scope.
    with tf.GradientTape() as tape:
        y_pred = model(X)
        loss = tf.keras.losses.sparse_categorical_crossentropy(y_true=y, y_pred=y_pred)
        loss = tf.reduce_mean(loss)
    print("batch %d: loss %f" % (batch_index, loss.numpy()))
    with summary_writer.as_default():                           # select the writer to log to
        tf.summary.scalar("loss", loss, step=batch_index)       # record the current loss value
    # Differentiate with respect to the trainable variables only, so the
    # update keeps working if the model ever gains non-trainable variables.
    grads = tape.gradient(loss, model.trainable_variables)
    optimizer.apply_gradients(grads_and_vars=zip(grads, model.trainable_variables))
# Make sure the buffered events reach disk before TensorBoard is opened.
summary_writer.flush()

batch 0: loss 2.341841
batch 1: loss 2.229311
batch 2: loss 2.253901
batch 3: loss 2.103704
batch 4: loss 1.988687
batch 5: loss 2.001765
batch 6: loss 1.917500
batch 7: loss 1.874986
batch 8: loss 1.823159
batch 9: loss 1.672640
batch 10: loss 1.638416
batch 11: loss 1.617443
batch 12: loss 1.502446
batch 13: loss 1.573944
batch 14: loss 1.426760
batch 15: loss 1.357222
batch 16: loss 1.382384
batch 17: loss 1.195881
batch 18: loss 1.336071
batch 19: loss 1.182269
batch 20: loss 1.175822
batch 21: loss 1.273833
batch 22: loss 1.118905
batch 23: loss 0.922557
batch 24: loss 0.894505
batch 25: loss 1.036744
batch 26: loss 0.998775
batch 27: loss 1.207561
batch 28: loss 1.088631
batch 29: loss 0.935906
batch 30: loss 0.833973
batch 31: loss 0.911847
batch 32: loss 0.884330
batch 33: loss 0.927670
batch 34: loss 0.802239
batch 35: loss 0.788868
batch 36: loss 0.796847
batch 37: loss 0.771140
batch 38: loss 0.592976
batch 39: loss 0.817199
batch 40: loss 0.651403
batch 41: loss 0.641124
ba

batch 341: loss 0.207769
batch 342: loss 0.360769
batch 343: loss 0.624532
batch 344: loss 0.136707
batch 345: loss 0.326883
batch 346: loss 0.210817
batch 347: loss 0.380202
batch 348: loss 0.213622
batch 349: loss 0.254146
batch 350: loss 0.256316
batch 351: loss 0.274970
batch 352: loss 0.335548
batch 353: loss 0.474327
batch 354: loss 0.281958
batch 355: loss 0.169646
batch 356: loss 0.264483
batch 357: loss 0.119932
batch 358: loss 0.295862
batch 359: loss 0.715190
batch 360: loss 0.519560
batch 361: loss 0.354562
batch 362: loss 0.320491
batch 363: loss 0.206907
batch 364: loss 0.197776
batch 365: loss 0.146945
batch 366: loss 0.462555
batch 367: loss 0.352268
batch 368: loss 0.324025
batch 369: loss 0.161426
batch 370: loss 0.249026
batch 371: loss 0.376522
batch 372: loss 0.257896
batch 373: loss 0.584276
batch 374: loss 0.474710
batch 375: loss 0.181638
batch 376: loss 0.142422
batch 377: loss 0.448354
batch 378: loss 0.138191
batch 379: loss 0.116747
batch 380: loss 0.148273


batch 688: loss 0.191543
batch 689: loss 0.105134
batch 690: loss 0.204547
batch 691: loss 0.232714
batch 692: loss 0.096405
batch 693: loss 0.230100
batch 694: loss 0.222839
batch 695: loss 0.175036
batch 696: loss 0.235688
batch 697: loss 0.064055
batch 698: loss 0.197620
batch 699: loss 0.393011
batch 700: loss 0.349919
batch 701: loss 0.327615
batch 702: loss 0.079568
batch 703: loss 0.220764
batch 704: loss 0.225040
batch 705: loss 0.222821
batch 706: loss 0.183251
batch 707: loss 0.205227
batch 708: loss 0.148898
batch 709: loss 0.180713
batch 710: loss 0.227692
batch 711: loss 0.315524
batch 712: loss 0.180612
batch 713: loss 0.185178
batch 714: loss 0.393899
batch 715: loss 0.105562
batch 716: loss 0.258666
batch 717: loss 0.485322
batch 718: loss 0.285872
batch 719: loss 0.046478
batch 720: loss 0.486898
batch 721: loss 0.402708
batch 722: loss 0.073246
batch 723: loss 0.233368
batch 724: loss 0.238674
batch 725: loss 0.217219
batch 726: loss 0.196126
batch 727: loss 0.363675


batch 1034: loss 0.178744
batch 1035: loss 0.089267
batch 1036: loss 0.242335
batch 1037: loss 0.092178
batch 1038: loss 0.168661
batch 1039: loss 0.467352
batch 1040: loss 0.204233
batch 1041: loss 0.174045
batch 1042: loss 0.182518
batch 1043: loss 0.197729
batch 1044: loss 0.113805
batch 1045: loss 0.108399
batch 1046: loss 0.207288
batch 1047: loss 0.157888
batch 1048: loss 0.302930
batch 1049: loss 0.458521
batch 1050: loss 0.087831
batch 1051: loss 0.075939
batch 1052: loss 0.197717
batch 1053: loss 0.093672
batch 1054: loss 0.208499
batch 1055: loss 0.127700
batch 1056: loss 0.100815
batch 1057: loss 0.303627
batch 1058: loss 0.067883
batch 1059: loss 0.092563
batch 1060: loss 0.077659
batch 1061: loss 0.220269
batch 1062: loss 0.231388
batch 1063: loss 0.113248
batch 1064: loss 0.195973
batch 1065: loss 0.088825
batch 1066: loss 0.123109
batch 1067: loss 0.099912
batch 1068: loss 0.182325
batch 1069: loss 0.177144
batch 1070: loss 0.309261
batch 1071: loss 0.170927
batch 1072: 

batch 1380: loss 0.037030
batch 1381: loss 0.152531
batch 1382: loss 0.097677
batch 1383: loss 0.236242
batch 1384: loss 0.146873
batch 1385: loss 0.136957
batch 1386: loss 0.158714
batch 1387: loss 0.053015
batch 1388: loss 0.218857
batch 1389: loss 0.274785
batch 1390: loss 0.076857
batch 1391: loss 0.086710
batch 1392: loss 0.081679
batch 1393: loss 0.045379
batch 1394: loss 0.163303
batch 1395: loss 0.058162
batch 1396: loss 0.109033
batch 1397: loss 0.138378
batch 1398: loss 0.131426
batch 1399: loss 0.151675
batch 1400: loss 0.151530
batch 1401: loss 0.219366
batch 1402: loss 0.193573
batch 1403: loss 0.242846
batch 1404: loss 0.081721
batch 1405: loss 0.200461
batch 1406: loss 0.049240
batch 1407: loss 0.131572
batch 1408: loss 0.160617
batch 1409: loss 0.193592
batch 1410: loss 0.088336
batch 1411: loss 0.152382
batch 1412: loss 0.063758
batch 1413: loss 0.143838
batch 1414: loss 0.168342
batch 1415: loss 0.090870
batch 1416: loss 0.187520
batch 1417: loss 0.107062
batch 1418: 

batch 1731: loss 0.141741
batch 1732: loss 0.127804
batch 1733: loss 0.141942
batch 1734: loss 0.140920
batch 1735: loss 0.044613
batch 1736: loss 0.112961
batch 1737: loss 0.137069
batch 1738: loss 0.335977
batch 1739: loss 0.287816
batch 1740: loss 0.225024
batch 1741: loss 0.129135
batch 1742: loss 0.207349
batch 1743: loss 0.083102
batch 1744: loss 0.254630
batch 1745: loss 0.261602
batch 1746: loss 0.062531
batch 1747: loss 0.262123
batch 1748: loss 0.141555
batch 1749: loss 0.163447
batch 1750: loss 0.085080
batch 1751: loss 0.200324
batch 1752: loss 0.083811
batch 1753: loss 0.065836
batch 1754: loss 0.171661
batch 1755: loss 0.125887
batch 1756: loss 0.040978
batch 1757: loss 0.103389
batch 1758: loss 0.224384
batch 1759: loss 0.093452
batch 1760: loss 0.121311
batch 1761: loss 0.157619
batch 1762: loss 0.024669
batch 1763: loss 0.355400
batch 1764: loss 0.094199
batch 1765: loss 0.152386
batch 1766: loss 0.064062
batch 1767: loss 0.123314
batch 1768: loss 0.097899
batch 1769: 

batch 2078: loss 0.072999
batch 2079: loss 0.143378
batch 2080: loss 0.023814
batch 2081: loss 0.060470
batch 2082: loss 0.075717
batch 2083: loss 0.068420
batch 2084: loss 0.127440
batch 2085: loss 0.080401
batch 2086: loss 0.150586
batch 2087: loss 0.058326
batch 2088: loss 0.269115
batch 2089: loss 0.147297
batch 2090: loss 0.075662
batch 2091: loss 0.085604
batch 2092: loss 0.053452
batch 2093: loss 0.107915
batch 2094: loss 0.186235
batch 2095: loss 0.048786
batch 2096: loss 0.037859
batch 2097: loss 0.209843
batch 2098: loss 0.020360
batch 2099: loss 0.036925
batch 2100: loss 0.049780
batch 2101: loss 0.161319
batch 2102: loss 0.222721
batch 2103: loss 0.336393
batch 2104: loss 0.307254
batch 2105: loss 0.079505
batch 2106: loss 0.134670
batch 2107: loss 0.060791
batch 2108: loss 0.098293
batch 2109: loss 0.148545
batch 2110: loss 0.170276
batch 2111: loss 0.157902
batch 2112: loss 0.291207
batch 2113: loss 0.159874
batch 2114: loss 0.193551
batch 2115: loss 0.158860
batch 2116: 

batch 2428: loss 0.051337
batch 2429: loss 0.055098
batch 2430: loss 0.038637
batch 2431: loss 0.092462
batch 2432: loss 0.100115
batch 2433: loss 0.074432
batch 2434: loss 0.130499
batch 2435: loss 0.125214
batch 2436: loss 0.323290
batch 2437: loss 0.027688
batch 2438: loss 0.043856
batch 2439: loss 0.068315
batch 2440: loss 0.160572
batch 2441: loss 0.082843
batch 2442: loss 0.107363
batch 2443: loss 0.160329
batch 2444: loss 0.030336
batch 2445: loss 0.139864
batch 2446: loss 0.059811
batch 2447: loss 0.137981
batch 2448: loss 0.076300
batch 2449: loss 0.232970
batch 2450: loss 0.084967
batch 2451: loss 0.099431
batch 2452: loss 0.042289
batch 2453: loss 0.109709
batch 2454: loss 0.032666
batch 2455: loss 0.080559
batch 2456: loss 0.297844
batch 2457: loss 0.092654
batch 2458: loss 0.044569
batch 2459: loss 0.217496
batch 2460: loss 0.114590
batch 2461: loss 0.117576
batch 2462: loss 0.290047
batch 2463: loss 0.175579
batch 2464: loss 0.076042
batch 2465: loss 0.055235
batch 2466: 

batch 2780: loss 0.107896
batch 2781: loss 0.029767
batch 2782: loss 0.034108
batch 2783: loss 0.091396
batch 2784: loss 0.150534
batch 2785: loss 0.126600
batch 2786: loss 0.073975
batch 2787: loss 0.066559
batch 2788: loss 0.101545
batch 2789: loss 0.123030
batch 2790: loss 0.143097
batch 2791: loss 0.199666
batch 2792: loss 0.052956
batch 2793: loss 0.051120
batch 2794: loss 0.079227
batch 2795: loss 0.051373
batch 2796: loss 0.062995
batch 2797: loss 0.033280
batch 2798: loss 0.082320
batch 2799: loss 0.147251
batch 2800: loss 0.027537
batch 2801: loss 0.094580
batch 2802: loss 0.332917
batch 2803: loss 0.015369
batch 2804: loss 0.064742
batch 2805: loss 0.068023
batch 2806: loss 0.120563
batch 2807: loss 0.084520
batch 2808: loss 0.036918
batch 2809: loss 0.049283
batch 2810: loss 0.038877
batch 2811: loss 0.026573
batch 2812: loss 0.037452
batch 2813: loss 0.114789
batch 2814: loss 0.082535
batch 2815: loss 0.048664
batch 2816: loss 0.033974
batch 2817: loss 0.042019
batch 2818: 

batch 3135: loss 0.020396
batch 3136: loss 0.102010
batch 3137: loss 0.062816
batch 3138: loss 0.062541
batch 3139: loss 0.217855
batch 3140: loss 0.120841
batch 3141: loss 0.125222
batch 3142: loss 0.162283
batch 3143: loss 0.021822
batch 3144: loss 0.182005
batch 3145: loss 0.083694
batch 3146: loss 0.034802
batch 3147: loss 0.040494
batch 3148: loss 0.147968
batch 3149: loss 0.162919
batch 3150: loss 0.029666
batch 3151: loss 0.048760
batch 3152: loss 0.106652
batch 3153: loss 0.014905
batch 3154: loss 0.108241
batch 3155: loss 0.184403
batch 3156: loss 0.068053
batch 3157: loss 0.046013
batch 3158: loss 0.023122
batch 3159: loss 0.025479
batch 3160: loss 0.044269
batch 3161: loss 0.093285
batch 3162: loss 0.071312
batch 3163: loss 0.072396
batch 3164: loss 0.141514
batch 3165: loss 0.012247
batch 3166: loss 0.035742
batch 3167: loss 0.057176
batch 3168: loss 0.129363
batch 3169: loss 0.041788
batch 3170: loss 0.148460
batch 3171: loss 0.240944
batch 3172: loss 0.102158
batch 3173: 

batch 3451: loss 0.033004
batch 3452: loss 0.092276
batch 3453: loss 0.157029
batch 3454: loss 0.078561
batch 3455: loss 0.044846
batch 3456: loss 0.127300
batch 3457: loss 0.018092
batch 3458: loss 0.079608
batch 3459: loss 0.048459
batch 3460: loss 0.080585
batch 3461: loss 0.059219
batch 3462: loss 0.043174
batch 3463: loss 0.032074
batch 3464: loss 0.134535
batch 3465: loss 0.059884
batch 3466: loss 0.168122
batch 3467: loss 0.117150
batch 3468: loss 0.180753
batch 3469: loss 0.036124
batch 3470: loss 0.070294
batch 3471: loss 0.059724
batch 3472: loss 0.157173
batch 3473: loss 0.048780
batch 3474: loss 0.026278
batch 3475: loss 0.137694
batch 3476: loss 0.107056
batch 3477: loss 0.071328
batch 3478: loss 0.033303
batch 3479: loss 0.215349
batch 3480: loss 0.075251
batch 3481: loss 0.026237
batch 3482: loss 0.133558
batch 3483: loss 0.040125
batch 3484: loss 0.122849
batch 3485: loss 0.120536
batch 3486: loss 0.075076
batch 3487: loss 0.021951
batch 3488: loss 0.084332
batch 3489: 

batch 3804: loss 0.149810
batch 3805: loss 0.074238
batch 3806: loss 0.161097
batch 3807: loss 0.045559
batch 3808: loss 0.101627
batch 3809: loss 0.050140
batch 3810: loss 0.018567
batch 3811: loss 0.149170
batch 3812: loss 0.028904
batch 3813: loss 0.032472
batch 3814: loss 0.078550
batch 3815: loss 0.102614
batch 3816: loss 0.057427
batch 3817: loss 0.029670
batch 3818: loss 0.094832
batch 3819: loss 0.040400
batch 3820: loss 0.082056
batch 3821: loss 0.160933
batch 3822: loss 0.051890
batch 3823: loss 0.029136
batch 3824: loss 0.006456
batch 3825: loss 0.047867
batch 3826: loss 0.026073
batch 3827: loss 0.017974
batch 3828: loss 0.037551
batch 3829: loss 0.059597
batch 3830: loss 0.093175
batch 3831: loss 0.041765
batch 3832: loss 0.180943
batch 3833: loss 0.031805
batch 3834: loss 0.022999
batch 3835: loss 0.056085
batch 3836: loss 0.031358
batch 3837: loss 0.018550
batch 3838: loss 0.055721
batch 3839: loss 0.042080
batch 3840: loss 0.080708
batch 3841: loss 0.061684
batch 3842: 

batch 4155: loss 0.062599
batch 4156: loss 0.085880
batch 4157: loss 0.102617
batch 4158: loss 0.062598
batch 4159: loss 0.118287
batch 4160: loss 0.117684
batch 4161: loss 0.078616
batch 4162: loss 0.129325
batch 4163: loss 0.056176
batch 4164: loss 0.031902
batch 4165: loss 0.006697
batch 4166: loss 0.064497
batch 4167: loss 0.072829
batch 4168: loss 0.082151
batch 4169: loss 0.138571
batch 4170: loss 0.041704
batch 4171: loss 0.020547
batch 4172: loss 0.133772
batch 4173: loss 0.083424
batch 4174: loss 0.012578
batch 4175: loss 0.182278
batch 4176: loss 0.028525
batch 4177: loss 0.127529
batch 4178: loss 0.251097
batch 4179: loss 0.026816
batch 4180: loss 0.037697
batch 4181: loss 0.167429
batch 4182: loss 0.034807
batch 4183: loss 0.065205
batch 4184: loss 0.076600
batch 4185: loss 0.047198
batch 4186: loss 0.027960
batch 4187: loss 0.034775
batch 4188: loss 0.025013
batch 4189: loss 0.117284
batch 4190: loss 0.058016
batch 4191: loss 0.036090
batch 4192: loss 0.032060
batch 4193: 

batch 4502: loss 0.090254
batch 4503: loss 0.019102
batch 4504: loss 0.169211
batch 4505: loss 0.058249
batch 4506: loss 0.035633
batch 4507: loss 0.144909
batch 4508: loss 0.042768
batch 4509: loss 0.055035
batch 4510: loss 0.076349
batch 4511: loss 0.077877
batch 4512: loss 0.053178
batch 4513: loss 0.015255
batch 4514: loss 0.020347
batch 4515: loss 0.015366
batch 4516: loss 0.028888
batch 4517: loss 0.044413
batch 4518: loss 0.037659
batch 4519: loss 0.174422
batch 4520: loss 0.017114
batch 4521: loss 0.060446
batch 4522: loss 0.033101
batch 4523: loss 0.011896
batch 4524: loss 0.077011
batch 4525: loss 0.109664
batch 4526: loss 0.102244
batch 4527: loss 0.193097
batch 4528: loss 0.181899
batch 4529: loss 0.057968
batch 4530: loss 0.081514
batch 4531: loss 0.059173
batch 4532: loss 0.098701
batch 4533: loss 0.051781
batch 4534: loss 0.015011
batch 4535: loss 0.098714
batch 4536: loss 0.020390
batch 4537: loss 0.170356
batch 4538: loss 0.027680
batch 4539: loss 0.011035
batch 4540: 

batch 4818: loss 0.062909
batch 4819: loss 0.016393
batch 4820: loss 0.047271
batch 4821: loss 0.075633
batch 4822: loss 0.003447
batch 4823: loss 0.016678
batch 4824: loss 0.016595
batch 4825: loss 0.015282
batch 4826: loss 0.029771
batch 4827: loss 0.057154
batch 4828: loss 0.024713
batch 4829: loss 0.015799
batch 4830: loss 0.087323
batch 4831: loss 0.070648
batch 4832: loss 0.018904
batch 4833: loss 0.007667
batch 4834: loss 0.027475
batch 4835: loss 0.006447
batch 4836: loss 0.037732
batch 4837: loss 0.028122
batch 4838: loss 0.012982
batch 4839: loss 0.020124
batch 4840: loss 0.117992
batch 4841: loss 0.034714
batch 4842: loss 0.017718
batch 4843: loss 0.025144
batch 4844: loss 0.060212
batch 4845: loss 0.014784
batch 4846: loss 0.084174
batch 4847: loss 0.027810
batch 4848: loss 0.020395
batch 4849: loss 0.034980
batch 4850: loss 0.090504
batch 4851: loss 0.108852
batch 4852: loss 0.009541
batch 4853: loss 0.014698
batch 4854: loss 0.041172
batch 4855: loss 0.031799
batch 4856: 

batch 5138: loss 0.134024
batch 5139: loss 0.081058
batch 5140: loss 0.052740
batch 5141: loss 0.031912
batch 5142: loss 0.030367
batch 5143: loss 0.027484
batch 5144: loss 0.030731
batch 5145: loss 0.032110
batch 5146: loss 0.058888
batch 5147: loss 0.020827
batch 5148: loss 0.021852
batch 5149: loss 0.085394
batch 5150: loss 0.065532
batch 5151: loss 0.067027
batch 5152: loss 0.010151
batch 5153: loss 0.026201
batch 5154: loss 0.025422
batch 5155: loss 0.071446
batch 5156: loss 0.026136
batch 5157: loss 0.039496
batch 5158: loss 0.018145
batch 5159: loss 0.063201
batch 5160: loss 0.042642
batch 5161: loss 0.082564
batch 5162: loss 0.050110
batch 5163: loss 0.007328
batch 5164: loss 0.020301
batch 5165: loss 0.042303
batch 5166: loss 0.074729
batch 5167: loss 0.050232
batch 5168: loss 0.008743
batch 5169: loss 0.010627
batch 5170: loss 0.169464
batch 5171: loss 0.013610
batch 5172: loss 0.068785
batch 5173: loss 0.005424
batch 5174: loss 0.022451
batch 5175: loss 0.050686
batch 5176: 

batch 5489: loss 0.082862
batch 5490: loss 0.024344
batch 5491: loss 0.089417
batch 5492: loss 0.031527
batch 5493: loss 0.042002
batch 5494: loss 0.010697
batch 5495: loss 0.067573
batch 5496: loss 0.054818
batch 5497: loss 0.017637
batch 5498: loss 0.061812
batch 5499: loss 0.116164
batch 5500: loss 0.047219
batch 5501: loss 0.015263
batch 5502: loss 0.090442
batch 5503: loss 0.009078
batch 5504: loss 0.011144
batch 5505: loss 0.020106
batch 5506: loss 0.064788
batch 5507: loss 0.047312
batch 5508: loss 0.068474
batch 5509: loss 0.018971
batch 5510: loss 0.048704
batch 5511: loss 0.008539
batch 5512: loss 0.050976
batch 5513: loss 0.017585
batch 5514: loss 0.088828
batch 5515: loss 0.092592
batch 5516: loss 0.122892
batch 5517: loss 0.007865
batch 5518: loss 0.128015
batch 5519: loss 0.039608
batch 5520: loss 0.008941
batch 5521: loss 0.019713
batch 5522: loss 0.019731
batch 5523: loss 0.054825
batch 5524: loss 0.030871
batch 5525: loss 0.138515
batch 5526: loss 0.140827
batch 5527: 

batch 5806: loss 0.042631
batch 5807: loss 0.144079
batch 5808: loss 0.185123
batch 5809: loss 0.016079
batch 5810: loss 0.050959
batch 5811: loss 0.024144
batch 5812: loss 0.027387
batch 5813: loss 0.065350
batch 5814: loss 0.032741
batch 5815: loss 0.013262
batch 5816: loss 0.174418
batch 5817: loss 0.034539
batch 5818: loss 0.016849
batch 5819: loss 0.012801
batch 5820: loss 0.038296
batch 5821: loss 0.006621
batch 5822: loss 0.032498
batch 5823: loss 0.095389
batch 5824: loss 0.022960
batch 5825: loss 0.029482
batch 5826: loss 0.027813
batch 5827: loss 0.060201
batch 5828: loss 0.069425
batch 5829: loss 0.019023
batch 5830: loss 0.011763
batch 5831: loss 0.012107
batch 5832: loss 0.063475
batch 5833: loss 0.014242
batch 5834: loss 0.027408
batch 5835: loss 0.081527
batch 5836: loss 0.042824
batch 5837: loss 0.009274
batch 5838: loss 0.057442
batch 5839: loss 0.036107
batch 5840: loss 0.015206
batch 5841: loss 0.066504
batch 5842: loss 0.006907
batch 5843: loss 0.029818
batch 5844: 

batch 6161: loss 0.007043
batch 6162: loss 0.004236
batch 6163: loss 0.130959
batch 6164: loss 0.045677
batch 6165: loss 0.008519
batch 6166: loss 0.134176
batch 6167: loss 0.053995
batch 6168: loss 0.078967
batch 6169: loss 0.027180
batch 6170: loss 0.064778
batch 6171: loss 0.087330
batch 6172: loss 0.073931
batch 6173: loss 0.082476
batch 6174: loss 0.024074
batch 6175: loss 0.008576
batch 6176: loss 0.074504
batch 6177: loss 0.048466
batch 6178: loss 0.122816
batch 6179: loss 0.011010
batch 6180: loss 0.009820
batch 6181: loss 0.027545
batch 6182: loss 0.037189
batch 6183: loss 0.005326
batch 6184: loss 0.018062
batch 6185: loss 0.067187
batch 6186: loss 0.009861
batch 6187: loss 0.007670
batch 6188: loss 0.013452
batch 6189: loss 0.093661
batch 6190: loss 0.008550
batch 6191: loss 0.116281
batch 6192: loss 0.025487
batch 6193: loss 0.059222
batch 6194: loss 0.007145
batch 6195: loss 0.024013
batch 6196: loss 0.041730
batch 6197: loss 0.007816
batch 6198: loss 0.062233
batch 6199: 

batch 6511: loss 0.008405
batch 6512: loss 0.007842
batch 6513: loss 0.008271
batch 6514: loss 0.095721
batch 6515: loss 0.002852
batch 6516: loss 0.067460
batch 6517: loss 0.048053
batch 6518: loss 0.035925
batch 6519: loss 0.079319
batch 6520: loss 0.039076
batch 6521: loss 0.087361
batch 6522: loss 0.013024
batch 6523: loss 0.057058
batch 6524: loss 0.023079
batch 6525: loss 0.009913
batch 6526: loss 0.021560
batch 6527: loss 0.083124
batch 6528: loss 0.041653
batch 6529: loss 0.081319
batch 6530: loss 0.056274
batch 6531: loss 0.026144
batch 6532: loss 0.085401
batch 6533: loss 0.025484
batch 6534: loss 0.027425
batch 6535: loss 0.059929
batch 6536: loss 0.011121
batch 6537: loss 0.153088
batch 6538: loss 0.053143
batch 6539: loss 0.020833
batch 6540: loss 0.054181
batch 6541: loss 0.070127
batch 6542: loss 0.096211
batch 6543: loss 0.010114
batch 6544: loss 0.003554
batch 6545: loss 0.024250
batch 6546: loss 0.132853
batch 6547: loss 0.047557
batch 6548: loss 0.011001
batch 6549: 

batch 6857: loss 0.032111
batch 6858: loss 0.116740
batch 6859: loss 0.004825
batch 6860: loss 0.014404
batch 6861: loss 0.087985
batch 6862: loss 0.013669
batch 6863: loss 0.101880
batch 6864: loss 0.026841
batch 6865: loss 0.009705
batch 6866: loss 0.006257
batch 6867: loss 0.009877
batch 6868: loss 0.004488
batch 6869: loss 0.048370
batch 6870: loss 0.008151
batch 6871: loss 0.203324
batch 6872: loss 0.013114
batch 6873: loss 0.020232
batch 6874: loss 0.054734
batch 6875: loss 0.041718
batch 6876: loss 0.040621
batch 6877: loss 0.085145
batch 6878: loss 0.017309
batch 6879: loss 0.021231
batch 6880: loss 0.007926
batch 6881: loss 0.017378
batch 6882: loss 0.019491
batch 6883: loss 0.028366
batch 6884: loss 0.018232
batch 6885: loss 0.040294
batch 6886: loss 0.013709
batch 6887: loss 0.014167
batch 6888: loss 0.070656
batch 6889: loss 0.034630
batch 6890: loss 0.025507
batch 6891: loss 0.028024
batch 6892: loss 0.027523
batch 6893: loss 0.100632
batch 6894: loss 0.043688
batch 6895: 

batch 7204: loss 0.200477
batch 7205: loss 0.019908
batch 7206: loss 0.003822
batch 7207: loss 0.004193
batch 7208: loss 0.117421
batch 7209: loss 0.017676
batch 7210: loss 0.012604
batch 7211: loss 0.066966
batch 7212: loss 0.048229
batch 7213: loss 0.016499
batch 7214: loss 0.053153
batch 7215: loss 0.011726
batch 7216: loss 0.032439
batch 7217: loss 0.052273
batch 7218: loss 0.034019
batch 7219: loss 0.033327
batch 7220: loss 0.053906
batch 7221: loss 0.012921
batch 7222: loss 0.014231
batch 7223: loss 0.071572
batch 7224: loss 0.023689
batch 7225: loss 0.022486
batch 7226: loss 0.013582
batch 7227: loss 0.019259
batch 7228: loss 0.023390
batch 7229: loss 0.070503
batch 7230: loss 0.081226
batch 7231: loss 0.009238
batch 7232: loss 0.068681
batch 7233: loss 0.039679
batch 7234: loss 0.003844
batch 7235: loss 0.056883
batch 7236: loss 0.059008
batch 7237: loss 0.073387
batch 7238: loss 0.039297
batch 7239: loss 0.025374
batch 7240: loss 0.043782
batch 7241: loss 0.033511
batch 7242: 

batch 7555: loss 0.212738
batch 7556: loss 0.025244
batch 7557: loss 0.017591
batch 7558: loss 0.048964
batch 7559: loss 0.018544
batch 7560: loss 0.082902
batch 7561: loss 0.051808
batch 7562: loss 0.105462
batch 7563: loss 0.004775
batch 7564: loss 0.011313
batch 7565: loss 0.007820
batch 7566: loss 0.023090
batch 7567: loss 0.120019
batch 7568: loss 0.010860
batch 7569: loss 0.060822
batch 7570: loss 0.008310
batch 7571: loss 0.033510
batch 7572: loss 0.035271
batch 7573: loss 0.016401
batch 7574: loss 0.006350
batch 7575: loss 0.026283
batch 7576: loss 0.039104
batch 7577: loss 0.035285
batch 7578: loss 0.004889
batch 7579: loss 0.025668
batch 7580: loss 0.097194
batch 7581: loss 0.229462
batch 7582: loss 0.009343
batch 7583: loss 0.011109
batch 7584: loss 0.069459
batch 7585: loss 0.008486
batch 7586: loss 0.038942
batch 7587: loss 0.066611
batch 7588: loss 0.013788
batch 7589: loss 0.012301
batch 7590: loss 0.034269
batch 7591: loss 0.047629
batch 7592: loss 0.046389
batch 7593: 

batch 7875: loss 0.023134
batch 7876: loss 0.015313
batch 7877: loss 0.019000
batch 7878: loss 0.050971
batch 7879: loss 0.168333
batch 7880: loss 0.017901
batch 7881: loss 0.062342
batch 7882: loss 0.006407
batch 7883: loss 0.004927
batch 7884: loss 0.053947
batch 7885: loss 0.018733
batch 7886: loss 0.040363
batch 7887: loss 0.022091
batch 7888: loss 0.027892
batch 7889: loss 0.016128
batch 7890: loss 0.017502
batch 7891: loss 0.008629
batch 7892: loss 0.113453
batch 7893: loss 0.106214
batch 7894: loss 0.012800
batch 7895: loss 0.006046
batch 7896: loss 0.009788
batch 7897: loss 0.004499
batch 7898: loss 0.055111
batch 7899: loss 0.007790
batch 7900: loss 0.030874
batch 7901: loss 0.018689
batch 7902: loss 0.105383
batch 7903: loss 0.006533
batch 7904: loss 0.013541
batch 7905: loss 0.023177
batch 7906: loss 0.049250
batch 7907: loss 0.006279
batch 7908: loss 0.019850
batch 7909: loss 0.077154
batch 7910: loss 0.082263
batch 7911: loss 0.022405
batch 7912: loss 0.044649
batch 7913: 

batch 8221: loss 0.014813
batch 8222: loss 0.014198
batch 8223: loss 0.026760
batch 8224: loss 0.043147
batch 8225: loss 0.078632
batch 8226: loss 0.046486
batch 8227: loss 0.078196
batch 8228: loss 0.035458
batch 8229: loss 0.081567
batch 8230: loss 0.034955
batch 8231: loss 0.021134
batch 8232: loss 0.012061
batch 8233: loss 0.009154
batch 8234: loss 0.041827
batch 8235: loss 0.087332
batch 8236: loss 0.004573
batch 8237: loss 0.010764
batch 8238: loss 0.045806
batch 8239: loss 0.181718
batch 8240: loss 0.071720
batch 8241: loss 0.093611
batch 8242: loss 0.006177
batch 8243: loss 0.003297
batch 8244: loss 0.005679
batch 8245: loss 0.025508
batch 8246: loss 0.002079
batch 8247: loss 0.056695
batch 8248: loss 0.074513
batch 8249: loss 0.057836
batch 8250: loss 0.027722
batch 8251: loss 0.127679
batch 8252: loss 0.014250
batch 8253: loss 0.081537
batch 8254: loss 0.016556
batch 8255: loss 0.032591
batch 8256: loss 0.035392
batch 8257: loss 0.037965
batch 8258: loss 0.009158
batch 8259: 

batch 8576: loss 0.046807
batch 8577: loss 0.072869
batch 8578: loss 0.063603
batch 8579: loss 0.079728
batch 8580: loss 0.018124
batch 8581: loss 0.031507
batch 8582: loss 0.114374
batch 8583: loss 0.005396
batch 8584: loss 0.063198
batch 8585: loss 0.035441
batch 8586: loss 0.009003
batch 8587: loss 0.007683
batch 8588: loss 0.355235
batch 8589: loss 0.010546
batch 8590: loss 0.049214
batch 8591: loss 0.007479
batch 8592: loss 0.041901
batch 8593: loss 0.009522
batch 8594: loss 0.094277
batch 8595: loss 0.074390
batch 8596: loss 0.084151
batch 8597: loss 0.107078
batch 8598: loss 0.105134
batch 8599: loss 0.012731
batch 8600: loss 0.020741
batch 8601: loss 0.048017
batch 8602: loss 0.017025
batch 8603: loss 0.043195
batch 8604: loss 0.012815
batch 8605: loss 0.056716
batch 8606: loss 0.007317
batch 8607: loss 0.055752
batch 8608: loss 0.011687
batch 8609: loss 0.003082
batch 8610: loss 0.044397
batch 8611: loss 0.008879
batch 8612: loss 0.137966
batch 8613: loss 0.008566
batch 8614: 

batch 8925: loss 0.005969
batch 8926: loss 0.031355
batch 8927: loss 0.102423
batch 8928: loss 0.014443
batch 8929: loss 0.003451
batch 8930: loss 0.022257
batch 8931: loss 0.174368
batch 8932: loss 0.011774
batch 8933: loss 0.007533
batch 8934: loss 0.022859
batch 8935: loss 0.141565
batch 8936: loss 0.021431
batch 8937: loss 0.037694
batch 8938: loss 0.148548
batch 8939: loss 0.044511
batch 8940: loss 0.006303
batch 8941: loss 0.088946
batch 8942: loss 0.005742
batch 8943: loss 0.063063
batch 8944: loss 0.108472
batch 8945: loss 0.077071
batch 8946: loss 0.031255
batch 8947: loss 0.024251
batch 8948: loss 0.009898
batch 8949: loss 0.046350
batch 8950: loss 0.018017
batch 8951: loss 0.126179
batch 8952: loss 0.019463
batch 8953: loss 0.031130
batch 8954: loss 0.009382
batch 8955: loss 0.028710
batch 8956: loss 0.126737
batch 8957: loss 0.090228
batch 8958: loss 0.011267
batch 8959: loss 0.032135
batch 8960: loss 0.024747
batch 8961: loss 0.058595
batch 8962: loss 0.020769
batch 8963: 

batch 9276: loss 0.116181
batch 9277: loss 0.016987
batch 9278: loss 0.044181
batch 9279: loss 0.034406
batch 9280: loss 0.013389
batch 9281: loss 0.008821
batch 9282: loss 0.029188
batch 9283: loss 0.023880
batch 9284: loss 0.004540
batch 9285: loss 0.014670
batch 9286: loss 0.059701
batch 9287: loss 0.007854
batch 9288: loss 0.017587
batch 9289: loss 0.004706
batch 9290: loss 0.024479
batch 9291: loss 0.005344
batch 9292: loss 0.002928
batch 9293: loss 0.007503
batch 9294: loss 0.064050
batch 9295: loss 0.015541
batch 9296: loss 0.008756
batch 9297: loss 0.005156
batch 9298: loss 0.030585
batch 9299: loss 0.058266
batch 9300: loss 0.038226
batch 9301: loss 0.038622
batch 9302: loss 0.012481
batch 9303: loss 0.008127
batch 9304: loss 0.007492
batch 9305: loss 0.021550
batch 9306: loss 0.021945
batch 9307: loss 0.023315
batch 9308: loss 0.054920
batch 9309: loss 0.015428
batch 9310: loss 0.087382
batch 9311: loss 0.029526
batch 9312: loss 0.000858
batch 9313: loss 0.011087
batch 9314: 

batch 9626: loss 0.013456
batch 9627: loss 0.042646
batch 9628: loss 0.012434
batch 9629: loss 0.061825
batch 9630: loss 0.003532
batch 9631: loss 0.084013
batch 9632: loss 0.010417
batch 9633: loss 0.025028
batch 9634: loss 0.036971
batch 9635: loss 0.014411
batch 9636: loss 0.006046
batch 9637: loss 0.008316
batch 9638: loss 0.059270
batch 9639: loss 0.050468
batch 9640: loss 0.020817
batch 9641: loss 0.007244
batch 9642: loss 0.111028
batch 9643: loss 0.004653
batch 9644: loss 0.068449
batch 9645: loss 0.017948
batch 9646: loss 0.009906
batch 9647: loss 0.023678
batch 9648: loss 0.059574
batch 9649: loss 0.029078
batch 9650: loss 0.004772
batch 9651: loss 0.041860
batch 9652: loss 0.006386
batch 9653: loss 0.036375
batch 9654: loss 0.023628
batch 9655: loss 0.005489
batch 9656: loss 0.003635
batch 9657: loss 0.003827
batch 9658: loss 0.026556
batch 9659: loss 0.037185
batch 9660: loss 0.011163
batch 9661: loss 0.009404
batch 9662: loss 0.038456
batch 9663: loss 0.030161
batch 9664: 

batch 9975: loss 0.065486
batch 9976: loss 0.075565
batch 9977: loss 0.009092
batch 9978: loss 0.022786
batch 9979: loss 0.003516
batch 9980: loss 0.010673
batch 9981: loss 0.021867
batch 9982: loss 0.039896
batch 9983: loss 0.021303
batch 9984: loss 0.012209
batch 9985: loss 0.015465
batch 9986: loss 0.059400
batch 9987: loss 0.114808
batch 9988: loss 0.002620
batch 9989: loss 0.033956
batch 9990: loss 0.063090
batch 9991: loss 0.001569
batch 9992: loss 0.014490
batch 9993: loss 0.008548
batch 9994: loss 0.004492
batch 9995: loss 0.017643
batch 9996: loss 0.029310
batch 9997: loss 0.002204
batch 9998: loss 0.004479
batch 9999: loss 0.008705


SyntaxError: invalid syntax (<ipython-input-8-c7df4e95a9d9>, line 1)