In [31]:
from gensim.models import KeyedVectors
from sklearn.model_selection import train_test_split
import pandas as pd
import numpy as np

# load the word embeddings into the model from file
filename = 'word2vecSmall.bin.gz'
model = KeyedVectors.load_word2vec_format(filename, binary=True)


In [32]:
# load csv
df = pd.read_csv('../yelp_demo/yelp_reviews.csv')


In [33]:
df['tokenized'] = df['text'].apply(lambda x: x.split())

In [34]:
df['tokenized'] = df['tokenized'].apply(lambda x: [word for word in x if word in model])

In [35]:
df['word_count'] = df['tokenized'].apply(lambda x: len(x))

In [36]:
avg_review_length = int(df['word_count'].mean() - 1)

In [37]:
avg_review_length

73

In [38]:
# split up our dataset into train and test sets using a handy sklearn function
X_train, X_test, y_train, y_test = train_test_split(df['tokenized'].values, df['pos_neg'].values, test_size=0.2)


In [39]:
y_train = np.array([np.array([1.0 if x > 0 else 0.0, 1.0 if x <= 0 else 0.0]) for x in y_train])


In [40]:
y_test = np.array([np.array([1.0 if x > 0 else 0.0, 1.0 if x <= 0 else 0.0]) for x in y_test])


In [41]:
X_train_embeddings = []

for review in X_train:
    if len(review) == 0:
        X_train_embeddings.append(np.zeros((avg_review_length, 300)))
        continue
    embeddings = model[review]
    if len(embeddings) > avg_review_length:
        embeddings = embeddings[:avg_review_length]
    elif len(embeddings) < avg_review_length:
        padding = avg_review_length - len(embeddings)
        padding = np.zeros((padding, 300))
        embeddings = np.concatenate((embeddings, padding))
        X_train_embeddings.append(embeddings)

In [42]:
X_test_embeddings = []

for review in X_test:
    if len(review) == 0:
        X_test_embeddings.append(np.zeros((avg_review_length, 300)))
        continue
    embeddings = model[review]
    if len(embeddings) > avg_review_length:
        embeddings = embeddings[:avg_review_length]
    elif len(embeddings) < avg_review_length:
        padding = avg_review_length - len(embeddings)
        padding = np.zeros((padding, 300))
        embeddings = np.concatenate((embeddings, padding))
        X_test_embeddings.append(embeddings)

In [44]:
import torch
import torch.nn as nn
import torch.nn.functional as F

from model import YelpNet

In [45]:
net = YelpNet(300, avg_review_length)

In [46]:
from torch.autograd import Variable

review = Variable(torch.Tensor(X_test_embeddings[0]))
print(review.shape)
prediction = net.forward(review)

torch.Size([73, 300])
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.1699, -0.2676,  0.1475,  ..., -0.0781, -0.0645,  0.0728],
        [ 0.1094,  0.1406, -0.0317,  ...,  0.0077,  0.1201, -0.1797],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.0053, 0.0084], grad_fn=<ReluBackward0>)


In [47]:
print(prediction)

tensor([0.4992, 0.5008], grad_fn=<DivBackward0>)


In [48]:
optimizer = torch.optim.SGD(net.parameters(), lr=0.005)

for i in range(len(X_train_embeddings)):
    try:
        review = Variable(torch.Tensor(X_train_embeddings[i]))
        correct_label = 0 if y_train[i][0] == 1 else 1

        prediction = net.forward(review)

        loss = torch.log(1 + torch.exp(-prediction[correct_label]))

        loss.backward()
        optimizer.step()
        optimizer.zero_grad()
    except:
        print('ouch')
            
torch.save(net, "trained_net.pb")

tensor([[ 0.0747, -0.0903, -0.0559,  ..., -0.2617, -0.2061, -0.1748],
        [ 0.0679, -0.0413,  0.1001,  ...,  0.1045, -0.0854, -0.1543],
        [-0.0062, -0.0243,  0.0156,  ...,  0.0991,  0.0062,  0.0820],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0., 0.], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.1602,  ...,  0.1279,  0.1211, -0.2295],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.0192, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.2773,  0.1445, -0.0557,  ...

tensor([[-0.0535,  0.1309,  0.2656,  ..., -0.0042,  0.2197, -0.1777],
        [ 0.0400, -0.1167, -0.0364,  ..., -0.2500,  0.0540, -0.0435],
        [-0.0581,  0.0581,  0.0133,  ..., -0.1748, -0.0231, -0.0435],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.0735, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.3145, -0.0026, -0.1670,  ..., -0.2324,  0.1069, -0.0284],
        [-0.1455, -0.0059, -0.1230,  ..., -0.1699,  0.1387, -0.2012],
        [-0.0557,  0.0089, -0.0923,  ...,  0.0032,  0.2871, -0.1416],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.0394, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0311, -0.1904,  0.03

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.0864,  0.2578,  0.0281,  ..., -0.2715,  0.1729,  0.0422],
        [-0.0249,  0.0220, -0.0354,  ...,  0.0108, -0.0188, -0.0688],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.0273, 0.0181], grad_fn=<ReluBackward0>)
tensor([[ 0.1504, -0.0566,  0.2012,  ..., -0.1035,  0.1001, -0.0283],
        [-0.5195, -0.0337, -0.0208,  ..., -0.2373, -0.1982, -0.1069],
        [ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.0285, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.3262,  0.18

tensor([0.0470, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.1602,  ...,  0.1279,  0.1211, -0.2295],
        [-0.0449, -0.0304,  0.0023,  ...,  0.0123, -0.0884, -0.0156],
        [-0.2285, -0.0884,  0.1279,  ..., -0.2129,  0.1885, -0.1455],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.0511, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2432, -0.0085,  0.2051,  ...,  0.0337,  0.1289,  0.0708],
        [ 0.0260, -0.0019,  0.1855,  ..., -0.1216,  0.2217, -0.0220],
        [ 0.1582,  0.1060, -0.1895,  ..., -0.2676,  0.0084, -0.2139],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.0108, 0.0000], grad_fn

tensor([[ 0.0334,  0.0020,  0.0613,  ..., -0.0148,  0.0216, -0.0330],
        [ 0.1699,  0.0143, -0.0454,  ...,  0.0415, -0.1001, -0.1885],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.0721, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0437,  0.0928,  0.0564,  ..., -0.1641, -0.0483, -0.0549],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        [-0.0078, -0.0280,  0.0405,  ...,  0.0396, -0.0605,  0.0081],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.0602, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([[ 0.1104, -0.1235,  0.1406,  ..., -0.3770,  0.0300, -0.0840],
        [ 0.1895,  0.1367, -0.0947,  ...,  0.0762,  0.0154, -0.0503],
        [-0.1953, -0.1328,  0.2695,  ...,  0.1738,  0.1748,  0.1396],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.0349, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0664, -0.0240,  0.0544,  ..., -0.1396,  0.0610, -0.2969],
        [ 0.1030, -0.1523,  0.0259,  ..., -0.1982, -0.1230,  0.0649],
        [ 0.1094,  0.1406, -0.0317,  ...,  0.0077,  0.1201, -0.1797],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.0464, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([0.0891, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1104, -0.1235,  0.1406,  ..., -0.3770,  0.0300, -0.0840],
        [-0.1494,  0.1670,  0.0723,  ...,  0.0728,  0.1533, -0.1436],
        [-0.0581,  0.0581,  0.0133,  ..., -0.1748, -0.0231, -0.0435],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.0600, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1011, -0.0515,  0.1504,  ...,  0.1807, -0.2422,  0.1348],
        [ 0.1055, -0.1206,  0.0991,  ...,  0.1235,  0.1299, -0.2539],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.0725, 0.0000], grad_fn

tensor([[-0.2891,  0.1992,  0.1602,  ...,  0.1279,  0.1211, -0.2295],
        [-0.2070,  0.2031,  0.0420,  ...,  0.1387,  0.0369, -0.0287],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.1130, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1621,  0.0869,  0.2012,  ..., -0.0840,  0.0449, -0.1797],
        [ 0.0942, -0.0228,  0.0522,  ..., -0.0469,  0.1611, -0.1992],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.1129, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1953,  0.0042, -0.12

tensor([[-0.1729,  0.2793,  0.1069,  ...,  0.1230,  0.1299, -0.1826],
        [-0.1816,  0.1650, -0.1660,  ...,  0.1592,  0.1279,  0.0022],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.0481, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0195,  0.0613,  0.0023,  ...,  0.1206,  0.0291, -0.0825],
        [-0.0613,  0.1436, -0.2109,  ...,  0.1182,  0.0356, -0.0281],
        [ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.1708, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.2891, -0.0703, -0.09

tensor([0.0898, 0.0019], grad_fn=<ReluBackward0>)
tensor([[-0.1729,  0.2793,  0.1069,  ...,  0.1230,  0.1299, -0.1826],
        [ 0.2715, -0.1621,  0.1611,  ..., -0.0491,  0.1270,  0.1787],
        [-0.1484,  0.1289, -0.0737,  ...,  0.2930,  0.2090, -0.2031],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.1119, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0820,  0.0645,  0.1226,  ..., -0.0598, -0.1631, -0.0991],
        [-0.0579,  0.0132,  0.1152,  ...,  0.0864,  0.0299,  0.0078],
        [ 0.0265,  0.0192,  0.0220,  ...,  0.0601,  0.0713, -0.0583],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.0724, 0.0000], grad_fn

tensor([[ 0.0215, -0.2119, -0.1172,  ..., -0.0903, -0.0544,  0.1797],
        [ 0.1094,  0.1406, -0.0317,  ...,  0.0077,  0.1201, -0.1797],
        [ 0.0605,  0.1406,  0.0845,  ..., -0.2441, -0.0081, -0.1885],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.1633, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0359, -0.0160, -0.2949,  ..., -0.2559,  0.0177, -0.0688],
        [-0.0586, -0.0376,  0.0728,  ..., -0.1079, -0.0864, -0.0320],
        [ 0.3301,  0.1216, -0.0210,  ..., -0.1230,  0.0669, -0.0952],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.1373, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1260,  0.1904,  0.06

tensor([0.1805, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.3262,  0.1895,  ...,  0.1377,  0.0938, -0.1592],
        [ 0.1030, -0.1523,  0.0259,  ..., -0.1982, -0.1230,  0.0649],
        [ 0.0381,  0.2969,  0.1748,  ..., -0.3086, -0.0107,  0.3359],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.1198, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0006, -0.2090,  0.1914,  ..., -0.1836, -0.0898,  0.2490],
        [ 0.1094,  0.1406, -0.0317,  ...,  0.0077,  0.1201, -0.1797],
        [-0.2070,  0.2031,  0.0420,  ...,  0.1387,  0.0369, -0.0287],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.1570, 0.0000], grad_fn

tensor([[ 0.1738, -0.2539, -0.1846,  ..., -0.0474, -0.0052,  0.0244],
        [-0.0408,  0.2520, -0.2158,  ..., -0.2021,  0.1021,  0.0337],
        [-0.0249,  0.0220, -0.0354,  ...,  0.0108, -0.0188, -0.0688],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.1276, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1943,  0.0510,  0.0967,  ..., -0.1348,  0.1309,  0.0762],
        [ 0.1133,  0.2441,  0.0286,  ..., -0.0074,  0.0236,  0.1914],
        [ 0.2148,  0.2637, -0.0408,  ..., -0.0332,  0.0815,  0.0217],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.1883, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0070, -0.0732,  0.17

tensor([[ 0.1104, -0.1235,  0.1406,  ..., -0.3770,  0.0300, -0.0840],
        [ 0.0327, -0.0962,  0.0442,  ..., -0.1768,  0.0159, -0.0854],
        [ 0.1172, -0.0349, -0.1089,  ..., -0.0040,  0.0815,  0.0459],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.1814, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0820,  0.0645,  0.1226,  ..., -0.0598, -0.1631, -0.0991],
        [ 0.0620,  0.1084, -0.0967,  ..., -0.2598,  0.0123, -0.0442],
        [-0.3672, -0.0344,  0.0498,  ...,  0.1279,  0.1504, -0.3203],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.2412, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([[-5.4443e-02,  1.8848e-01, -1.3770e-01,  ..., -2.3145e-01,
          4.1016e-01, -1.6992e-01],
        [ 5.8105e-02, -1.7452e-04,  7.6172e-02,  ...,  1.0132e-02,
          6.4453e-02, -2.9663e-02],
        [ 6.8848e-02,  5.7373e-02, -1.1914e-01,  ..., -8.7891e-02,
          6.4453e-02,  1.7285e-01],
        ...,
        [ 0.0000e+00,  0.0000e+00,  0.0000e+00,  ...,  0.0000e+00,
          0.0000e+00,  0.0000e+00],
        [ 0.0000e+00,  0.0000e+00,  0.0000e+00,  ...,  0.0000e+00,
          0.0000e+00,  0.0000e+00],
        [ 0.0000e+00,  0.0000e+00,  0.0000e+00,  ...,  0.0000e+00,
          0.0000e+00,  0.0000e+00]])
tensor([0.1894, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1729,  0.2793,  0.1069,  ...,  0.1230,  0.1299, -0.1826],
        [-0.1270,  0.0220,  0.2871,  ..., -0.1016, -0.0903,  0.0884],
        [-0.2451, -0.1562,  0.1001,  ..., -0.0879, -0.0081,  0.0496],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000

tensor([[-0.0275,  0.0459,  0.3438,  ...,  0.1177,  0.1865,  0.0393],
        [ 0.1445,  0.0471,  0.1006,  ...,  0.0023,  0.0981, -0.0669],
        [-0.0630, -0.0297,  0.1973,  ..., -0.2871, -0.0525,  0.0233],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.1295, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.1030, -0.1523,  0.0259,  ..., -0.1982, -0.1230,  0.0649],
        [ 0.1094,  0.1406, -0.0317,  ...,  0.0077,  0.1201, -0.1797],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.2159, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1011,  0.0177,  0.01

tensor([[ 0.0304, -0.2227, -0.2275,  ..., -0.0718,  0.0757,  0.0422],
        [ 0.0166,  0.0457, -0.1191,  ...,  0.0165,  0.2637,  0.0845],
        [ 0.0303, -0.0227, -0.0364,  ...,  0.0471,  0.1562, -0.0234],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.1252, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        [-0.2676,  0.0522,  0.0092,  ...,  0.0396, -0.1494,  0.0913],
        [ 0.0260, -0.0019,  0.1855,  ..., -0.1216,  0.2217, -0.0220],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.1754, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1309, -0.0280, -0.23

tensor([[-0.2891,  0.3262,  0.1895,  ...,  0.1377,  0.0938, -0.1592],
        [-0.0967, -0.0264,  0.0903,  ..., -0.0197,  0.2139,  0.1367],
        [-0.3164,  0.0593, -0.1094,  ...,  0.0454, -0.0244, -0.3594],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.2449, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1025, -0.0125, -0.1787,  ..., -0.2041,  0.1553,  0.1855],
        [-0.1816,  0.1650, -0.1660,  ...,  0.1592,  0.1279,  0.0022],
        [ 0.1230, -0.0461, -0.2021,  ..., -0.0913,  0.2891, -0.0292],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.2541, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([[-0.2891,  0.3262,  0.1895,  ...,  0.1377,  0.0938, -0.1592],
        [ 0.0864,  0.2578,  0.0281,  ..., -0.2715,  0.1729,  0.0422],
        [-0.0118, -0.0474,  0.0447,  ...,  0.0713, -0.0349,  0.0242],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.2560, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.2715, -0.1621,  0.1611,  ..., -0.0491,  0.1270,  0.1787],
        [ 0.0378, -0.0601, -0.0581,  ..., -0.1396, -0.0053,  0.0085],
        [ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.3360, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1104, -0.1235,  0.14

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.0269,  0.3242, -0.0510,  ..., -0.1006,  0.3984, -0.3789],
        [ 0.1201, -0.0201,  0.2070,  ...,  0.2295, -0.2949,  0.0119],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.3084, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.0581,  0.0581,  0.0133,  ..., -0.1748, -0.0231, -0.0435],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.1637, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1895,  0.1104,  0.00

tensor([0.2832, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1729,  0.2793,  0.1069,  ...,  0.1230,  0.1299, -0.1826],
        [-0.3535, -0.2471,  0.2041,  ...,  0.1206, -0.2246, -0.1660],
        [-0.0571, -0.2578, -0.1147,  ..., -0.1807,  0.2119,  0.1670],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.3700, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1729,  0.2793,  0.1069,  ...,  0.1230,  0.1299, -0.1826],
        [-0.0249,  0.0220, -0.0354,  ...,  0.0108, -0.0188, -0.0688],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.3541, 0.0000], grad_fn

tensor([[ 0.1396,  0.1514, -0.2158,  ..., -0.1719, -0.1235,  0.2197],
        [ 0.1279,  0.1191, -0.0869,  ..., -0.1670,  0.1807, -0.0073],
        [-0.0249,  0.0220, -0.0354,  ...,  0.0108, -0.0188, -0.0688],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.2150, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0304, -0.2227, -0.2275,  ..., -0.0718,  0.0757,  0.0422],
        [-0.1816,  0.1650, -0.1660,  ...,  0.1592,  0.1279,  0.0022],
        [-0.0586, -0.0376,  0.0728,  ..., -0.1079, -0.0864, -0.0320],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.3613, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.3262,  0.18

tensor([[-0.1729,  0.2793,  0.1069,  ...,  0.1230,  0.1299, -0.1826],
        [-0.1582, -0.0708, -0.2461,  ...,  0.0864,  0.0850,  0.2793],
        [-0.1318,  0.0874, -0.1816,  ..., -0.0664,  0.1396, -0.1475],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.3432, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0118, -0.1943,  0.2637,  ..., -0.1533, -0.1030, -0.2949],
        [-0.1777, -0.2334, -0.1572,  ...,  0.0064, -0.1602, -0.0549],
        [-0.0378, -0.0757,  0.1309,  ..., -0.0894, -0.2969, -0.1582],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.2118, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1855,  0.3223,  0.25

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.1235,  0.0320,  0.1504,  ..., -0.2129, -0.0064, -0.0801],
        [ 0.0850, -0.0952,  0.1191,  ..., -0.1089,  0.0488, -0.1309],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.4862, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1021, -0.2676, -0.2373,  ...,  0.0525,  0.1973, -0.0796],
        [ 0.2285,  0.0452,  0.0952,  ..., -0.0806, -0.0840,  0.0161],
        [ 0.0718,  0.2080, -0.0284,  ..., -0.1680, -0.0209, -0.1426],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.3418, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0645, -0.0796, -0.17

tensor([[-0.1162, -0.1177,  0.0815,  ...,  0.1943,  0.0302,  0.4434],
        [-0.1396,  0.2314, -0.1309,  ...,  0.0732,  0.2949,  0.3008],
        [-0.0903,  0.0579, -0.0811,  ..., -0.0239, -0.2236, -0.1133],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.2294, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1104, -0.1235,  0.1406,  ..., -0.3770,  0.0300, -0.0840],
        [-0.0129, -0.0850,  0.0796,  ..., -0.0033,  0.0879,  0.2578],
        [ 0.0708, -0.0264,  0.1953,  ..., -0.0820, -0.1108, -0.1768],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.3048, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0654,  0.1270,  0.09

tensor([[ 0.1533,  0.1230,  0.1650,  ..., -0.2871, -0.3125,  0.1318],
        [ 0.0850, -0.0952,  0.1191,  ..., -0.1089,  0.0488, -0.1309],
        [-0.0096, -0.0845, -0.1089,  ...,  0.0184,  0.2422, -0.0193],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.5026, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0535,  0.1309,  0.2656,  ..., -0.0042,  0.2197, -0.1777],
        [ 0.0393, -0.1963, -0.1064,  ..., -0.0757,  0.0466, -0.0840],
        [ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.5584, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.0830,  0.1001,  0.2158,  ..., -0.0068, -0.0129,  0.0898],
        [-0.0118, -0.0474,  0.0447,  ...,  0.0713, -0.0349,  0.0242],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.3686, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0654,  0.1270,  0.0923,  ...,  0.1475,  0.2490,  0.1113],
        [-0.1816, -0.1328,  0.0391,  ..., -0.2227,  0.1445,  0.1270],
        [-0.2480, -0.2080, -0.1328,  ...,  0.0410,  0.0525,  0.0952],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.1943, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0659, -0.0796,  0.10

tensor([[ 0.1367,  0.0166, -0.3223,  ...,  0.1387,  0.0933, -0.1147],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        [-0.2539,  0.0286,  0.1045,  ..., -0.0815, -0.0928, -0.0688],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.2483, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.3125,  0.0879, -0.0510,  ..., -0.1670,  0.1206, -0.0461],
        [-0.0273,  0.0449,  0.0767,  ..., -0.1250,  0.1089, -0.1436],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.4318, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1621,  0.0869,  0.20

tensor([[ 0.1089, -0.1436, -0.1069,  ..., -0.6211, -0.2793, -0.0067],
        [-0.2451,  0.1245, -0.1299,  ...,  0.1445, -0.0713,  0.0117],
        [ 0.0476,  0.1973, -0.0608,  ..., -0.0035,  0.1011,  0.1226],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.3714, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1729,  0.2793,  0.1069,  ...,  0.1230,  0.1299, -0.1826],
        [-0.1816,  0.1650, -0.1660,  ...,  0.1592,  0.1279,  0.0022],
        [ 0.0260, -0.0019,  0.1855,  ..., -0.1216,  0.2217, -0.0220],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.6211, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.3945,  0.0461, -0.42

tensor([[-0.1729,  0.2793,  0.1069,  ...,  0.1230,  0.1299, -0.1826],
        [-0.1816,  0.1650, -0.1660,  ...,  0.1592,  0.1279,  0.0022],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.4919, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1582,  0.1963, -0.1836,  ..., -0.5078,  0.0179,  0.1865],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        [-0.1787,  0.1128, -0.1719,  ...,  0.0183, -0.2598, -0.0972],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.6518, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.2285,  0.0820,  0.03

tensor([[-0.1855,  0.3223,  0.2520,  ..., -0.1367,  0.1621, -0.0771],
        [-0.1006, -0.0247,  0.0923,  ..., -0.1455,  0.2598,  0.0041],
        [ 0.1108, -0.1582,  0.0208,  ...,  0.1514, -0.1650,  0.0198],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.5425, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0535,  0.1309,  0.2656,  ..., -0.0042,  0.2197, -0.1777],
        [ 0.1426,  0.0723,  0.0303,  ..., -0.1416,  0.0344, -0.1523],
        [ 0.1387,  0.0294, -0.1865,  ...,  0.1006, -0.0991, -0.0317],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.5324, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0535,  0.1309,  0.26

tensor([[ 0.0679,  0.1953,  0.1206,  ..., -0.2080, -0.0452, -0.1328],
        [ 0.1396, -0.0062,  0.2148,  ...,  0.0571,  0.0996, -0.2344],
        [-0.1514,  0.2285,  0.2119,  ...,  0.0087, -0.0037,  0.1260],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.6421, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.1157,  0.0315,  0.4160,  ...,  0.1338,  0.0266,  0.0178],
        [-0.2949, -0.2412,  0.0923,  ...,  0.1680,  0.0923,  0.0364],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.3722, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0361,  0.0481, -0.16

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.1396, -0.0347, -0.0537,  ..., -0.1182, -0.0025, -0.0723],
        [ 0.0845, -0.0004,  0.0532,  ...,  0.0171,  0.0608, -0.1089],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.6961, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0215, -0.2119, -0.1172,  ..., -0.0903, -0.0544,  0.1797],
        [ 0.1104,  0.2480, -0.0077,  ..., -0.0762,  0.1309, -0.2217],
        [-0.0273,  0.0449,  0.0767,  ..., -0.1250,  0.1089, -0.1436],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.6043, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0605,  0.1406,  0.08

tensor([0.6532, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1299, -0.1729, -0.2217,  ..., -0.3867, -0.0698,  0.1797],
        [ 0.1094,  0.1406, -0.0317,  ...,  0.0077,  0.1201, -0.1797],
        [-0.2070,  0.2031,  0.0420,  ...,  0.1387,  0.0369, -0.0287],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.7827, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0148, -0.1123, -0.1602,  ...,  0.0437, -0.1924, -0.0752],
        [-0.2070,  0.2031,  0.0420,  ...,  0.1387,  0.0369, -0.0287],
        [ 0.1328, -0.1099, -0.1973,  ...,  0.0151, -0.0874, -0.2412],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.4287, 0.0000], grad_fn

tensor([[ 0.1582,  0.1963, -0.1836,  ..., -0.5078,  0.0179,  0.1865],
        [ 0.0942, -0.0228,  0.0522,  ..., -0.0469,  0.1611, -0.1992],
        [-0.0170,  0.0432,  0.0503,  ...,  0.0625,  0.2402, -0.1025],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.8463, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1089, -0.1436, -0.1069,  ..., -0.6211, -0.2793, -0.0067],
        [-0.0510,  0.0042,  0.0249,  ..., -0.0981,  0.0515,  0.0123],
        [ 0.1108, -0.1582,  0.0208,  ...,  0.1514, -0.1650,  0.0198],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.5866, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1699,  0.2012,  0.20

tensor([0.7060, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.1602,  ...,  0.1279,  0.1211, -0.2295],
        [-0.2070,  0.2031,  0.0420,  ...,  0.1387,  0.0369, -0.0287],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.9175, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.1758,  0.2129, -0.0713,  ...,  0.1147,  0.3301, -0.1680],
        [ 0.1729,  0.1357, -0.1611,  ..., -0.1904, -0.1650, -0.0244],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.5958, 0.0000], grad_fn

tensor([0.6002, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 2.5586e-01,  1.9336e-01,  1.3184e-01,  ...,  4.6875e-02,
         -7.6172e-02,  3.1738e-02],
        [ 5.8105e-02, -1.7452e-04,  7.6172e-02,  ...,  1.0132e-02,
          6.4453e-02, -2.9663e-02],
        [ 3.4912e-02,  8.4961e-02,  6.2500e-02,  ..., -1.9043e-02,
         -8.9111e-03,  2.2095e-02],
        ...,
        [ 0.0000e+00,  0.0000e+00,  0.0000e+00,  ...,  0.0000e+00,
          0.0000e+00,  0.0000e+00],
        [ 0.0000e+00,  0.0000e+00,  0.0000e+00,  ...,  0.0000e+00,
          0.0000e+00,  0.0000e+00],
        [ 0.0000e+00,  0.0000e+00,  0.0000e+00,  ...,  0.0000e+00,
          0.0000e+00,  0.0000e+00]])
tensor([0.5154, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1172, -0.0618,  0.1357,  ..., -0.2432,  0.2539, -0.0396],
        [-0.0312,  0.3125,  0.0903,  ...,  0.0030,  0.1138, -0.0874],
        [ 0.0703,  0.0869,  0.0879,  ..., -0.0476,  0.0145, -0.0625],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.

tensor([[ 0.0525, -0.0596, -0.0053,  ..., -0.0306, -0.2637,  0.0205],
        [ 0.0038,  0.0247,  0.0120,  ...,  0.1143, -0.1943,  0.2129],
        [ 0.1445,  0.0471,  0.1006,  ...,  0.0023,  0.0981, -0.0669],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.7181, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1167, -0.0801, -0.1924,  ..., -0.1035, -0.0090,  0.0796],
        [-0.1816,  0.1650, -0.1660,  ...,  0.1592,  0.1279,  0.0022],
        [-0.2129, -0.0043, -0.1807,  ..., -0.1299, -0.2158,  0.0123],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.4134, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.2285,  0.0820,  0.03

tensor([[-0.2734,  0.1250,  0.0889,  ..., -0.0684,  0.0991, -0.2559],
        [ 0.0869,  0.1514, -0.0232,  ..., -0.2041,  0.0447, -0.1807],
        [ 0.0737,  0.0041, -0.1357,  ..., -0.1416, -0.1504, -0.1377],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.5111, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.1602,  ...,  0.1279,  0.1211, -0.2295],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        [ 0.0457, -0.1455,  0.1562,  ..., -0.0159,  0.0067, -0.0019],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.8100, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1060,  0.2139,  0.11

tensor([0.5692, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0605,  0.1406,  0.0845,  ..., -0.2441, -0.0081, -0.1885],
        [-0.1050,  0.1270,  0.2236,  ...,  0.1387, -0.1582,  0.0134],
        [-0.1729,  0.2793,  0.1069,  ...,  0.1230,  0.1299, -0.1826],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.8595, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0605,  0.1406,  0.0845,  ..., -0.2441, -0.0081, -0.1885],
        [ 0.0679, -0.0413,  0.1001,  ...,  0.1045, -0.0854, -0.1543],
        [-0.0476,  0.0815,  0.0457,  ..., -0.0557,  0.1050, -0.1084],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.5134, 0.0000], grad_fn

tensor([[ 0.2393,  0.0698,  0.0068,  ..., -0.0156,  0.0417,  0.0620],
        [ 0.0645, -0.1611, -0.1187,  ..., -0.0287,  0.2285, -0.0410],
        [ 0.2061,  0.1157, -0.1699,  ..., -0.0879,  0.1123,  0.0227],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.8411, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1328,  0.0718,  0.1904,  ..., -0.2129,  0.1074,  0.1816],
        [-0.0747, -0.0588,  0.0457,  ...,  0.0938,  0.0280, -0.1152],
        [-0.0249,  0.0220, -0.0354,  ...,  0.0108, -0.0188, -0.0688],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.7833, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0420, -0.1235,  0.15

tensor([[-0.2100, -0.0354, -0.1582,  ..., -0.2148,  0.1289,  0.1133],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        [-0.0118, -0.0474,  0.0447,  ...,  0.0713, -0.0349,  0.0242],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.7492, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0559,  0.1177,  0.2109,  ..., -0.0427,  0.1475, -0.1826],
        [ 0.0845, -0.0004,  0.0532,  ...,  0.0171,  0.0608, -0.1089],
        [-0.0571, -0.0305, -0.0055,  ..., -0.0199,  0.1426, -0.0005],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.4972, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.1396, -0.0347, -0.0537,  ..., -0.1182, -0.0025, -0.0723],
        [ 0.2021,  0.1138,  0.2412,  ..., -0.0752, -0.1631,  0.0291],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.8500, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1445,  0.0471,  0.1006,  ...,  0.0023,  0.0981, -0.0669],
        [ 0.1079, -0.0300,  0.0332,  ..., -0.2197, -0.0488,  0.1758],
        [ 0.0510,  0.2773, -0.0283,  ..., -0.0527,  0.3770,  0.0427],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.6375, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([[-0.0168, -0.0669,  0.1465,  ...,  0.0253, -0.0315,  0.0806],
        [ 0.0299,  0.0564,  0.0037,  ..., -0.0242,  0.0109, -0.1475],
        [ 0.1157,  0.0315,  0.4160,  ...,  0.1338,  0.0266,  0.0178],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.8717, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1006,  0.2793,  0.3184,  ...,  0.1602,  0.2148,  0.0237],
        [-0.2354,  0.1187,  0.1445,  ...,  0.1914, -0.1406,  0.2178],
        [-0.0273,  0.1055, -0.0266,  ..., -0.3457,  0.4004,  0.0242],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.5238, 0.0089], grad_fn=<ReluBackward0>)
tensor([[ 0.3945,  0.0461, -0.42

tensor([[ 0.0605,  0.1406,  0.0845,  ..., -0.2441, -0.0081, -0.1885],
        [-0.2070,  0.2031,  0.0420,  ...,  0.1387,  0.0369, -0.0287],
        [-0.0118, -0.0474,  0.0447,  ...,  0.0713, -0.0349,  0.0242],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.5570, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.2285, -0.0601,  0.1396,  ...,  0.0483, -0.1436,  0.3262],
        [ 0.0166,  0.0457, -0.1191,  ...,  0.0165,  0.2637,  0.0845],
        [-0.0742,  0.1128,  0.0947,  ...,  0.0266,  0.1943,  0.0698],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.0270, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1060,  0.2139,  0.11

tensor([[-0.0986,  0.0547,  0.1836,  ..., -0.0344, -0.0537, -0.1016],
        [ 0.1396, -0.0062,  0.2148,  ...,  0.0571,  0.0996, -0.2344],
        [ 0.0977, -0.0356,  0.0918,  ..., -0.1934, -0.1177,  0.0508],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.9002, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0757,  0.2969, -0.0215,  ...,  0.0186, -0.1021,  0.2129],
        [-0.1816,  0.1650, -0.1660,  ...,  0.1592,  0.1279,  0.0022],
        [-0.1367, -0.2773,  0.0474,  ..., -0.0223,  0.1177, -0.0669],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.5840, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0275,  0.0459,  0.34

tensor([[ 0.3945,  0.0461, -0.4258,  ..., -0.5664,  0.0640, -0.0114],
        [-0.0273,  0.0449,  0.0767,  ..., -0.1250,  0.1089, -0.1436],
        [-0.0118, -0.0474,  0.0447,  ...,  0.0713, -0.0349,  0.0242],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.9125, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2480, -0.2080, -0.1328,  ...,  0.0410,  0.0525,  0.0952],
        [-0.3496,  0.0762,  0.0952,  ...,  0.0894, -0.2129,  0.1182],
        [ 0.3027,  0.3672, -0.0498,  ..., -0.0403,  0.0425, -0.1250],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.7346, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.16

tensor([0.3125, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0581,  0.0581,  0.0133,  ..., -0.1748, -0.0231, -0.0435],
        [ 0.0732,  0.1963,  0.0005,  ...,  0.0152,  0.0679,  0.0579],
        [ 0.1147, -0.0835,  0.0337,  ..., -0.1123, -0.0728,  0.0752],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.5626, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.1030, -0.1523,  0.0259,  ..., -0.1982, -0.1230,  0.0649],
        [ 0.1504,  0.0447, -0.0825,  ...,  0.0381,  0.2266,  0.0923],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.8445, 0.0000], grad_fn

tensor([[-0.1396,  0.2314, -0.1309,  ...,  0.0732,  0.2949,  0.3008],
        [-0.0615,  0.4941,  0.0080,  ..., -0.1992, -0.1289, -0.1631],
        [-0.0249,  0.0220, -0.0354,  ...,  0.0108, -0.0188, -0.0688],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.4552, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.1396, -0.0347, -0.0537,  ..., -0.1182, -0.0025, -0.0723],
        [-0.1011,  0.0177,  0.0147,  ..., -0.0835,  0.0056, -0.0178],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.1079, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([[ 0.0938,  0.3086, -0.1221,  ..., -0.0649,  0.0339,  0.3125],
        [ 0.1689,  0.0640, -0.0845,  ..., -0.1719, -0.0293, -0.2061],
        [ 0.1777, -0.0371,  0.0056,  ..., -0.0435,  0.0986,  0.2559],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.8458, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1299, -0.0684, -0.0520,  ..., -0.2432, -0.0991,  0.0957],
        [-0.0249,  0.0220, -0.0354,  ...,  0.0108, -0.0188, -0.0688],
        [ 0.0063,  0.0193, -0.0898,  ..., -0.1611,  0.0012, -0.1064],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.6739, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.16

tensor([0.5870, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0403,  0.0928,  0.1553,  ...,  0.1250,  0.0449,  0.0344],
        [ 0.1504,  0.0447, -0.0825,  ...,  0.0381,  0.2266,  0.0923],
        [ 0.0703,  0.0869,  0.0879,  ..., -0.0476,  0.0145, -0.0625],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.5515, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1504,  0.1025, -0.0064,  ..., -0.0172, -0.2930, -0.0981],
        [ 0.0249,  0.2383,  0.1416,  ...,  0.1602, -0.0311,  0.0081],
        [-0.1157, -0.0315,  0.1592,  ...,  0.0262, -0.0625, -0.0415],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.9193, 0.0000], grad_fn

tensor([[-0.1621,  0.0869,  0.2012,  ..., -0.0840,  0.0449, -0.1797],
        [ 0.2041,  0.0132,  0.0757,  ..., -0.2119, -0.1328,  0.1084],
        [-0.0967, -0.0264,  0.0903,  ..., -0.0197,  0.2139,  0.1367],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.1218, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1089, -0.1436, -0.1069,  ..., -0.6211, -0.2793, -0.0067],
        [ 0.1445,  0.0471,  0.1006,  ...,  0.0023,  0.0981, -0.0669],
        [-0.1748, -0.1328, -0.2930,  ..., -0.0723, -0.2676,  0.0150],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.8079, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.3262,  0.18

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.4102,  0.0371,  0.1934,  ..., -0.1328, -0.1138,  0.0244],
        [ 0.0649, -0.0518, -0.1396,  ..., -0.1221, -0.0179,  0.2031],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.0359, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1396,  0.2314, -0.1309,  ...,  0.0732,  0.2949,  0.3008],
        [-0.1689,  0.3438,  0.2715,  ..., -0.0076,  0.0461,  0.0332],
        [ 0.1562, -0.2119, -0.0684,  ...,  0.0181,  0.0835,  0.1172],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.9184, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.16

tensor([[ 0.1504, -0.0566,  0.2012,  ..., -0.1035,  0.1001, -0.0283],
        [ 0.2402,  0.2012,  0.1621,  ...,  0.0349,  0.0315,  0.0145],
        [-0.0118, -0.0474,  0.0447,  ...,  0.0713, -0.0349,  0.0242],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.2188, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0437,  0.0928,  0.0564,  ..., -0.1641, -0.0483, -0.0549],
        [-0.0157, -0.0283,  0.0835,  ...,  0.0069,  0.0610, -0.1484],
        [ 0.0260, -0.0019,  0.1855,  ..., -0.1216,  0.2217, -0.0220],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.2944, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([[-0.0488, -0.0757, -0.0354,  ..., -0.0557,  0.2266, -0.2295],
        [ 0.0703,  0.0869,  0.0879,  ..., -0.0476,  0.0145, -0.0625],
        [ 0.1094,  0.1406, -0.0317,  ...,  0.0077,  0.1201, -0.1797],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.0238, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0845, -0.0004,  0.0532,  ...,  0.0171,  0.0608, -0.1089],
        [ 0.0894,  0.1299,  0.2129,  ..., -0.1523,  0.0055, -0.1006],
        [-0.1396, -0.0347, -0.0537,  ..., -0.1182, -0.0025, -0.0723],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.6642, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0118, -0.0474,  0.04

tensor([0.8342, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0645, -0.0796, -0.1768,  ..., -0.0078,  0.1836, -0.2402],
        [-0.1572, -0.3379, -0.0718,  ...,  0.0771,  0.0437, -0.1299],
        [-0.2676,  0.0928, -0.2383,  ...,  0.0583,  0.0226, -0.1011],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.5253, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.1396, -0.0347, -0.0537,  ..., -0.1182, -0.0025, -0.0723],
        [ 0.0239, -0.0461,  0.0039,  ..., -0.2695, -0.0688, -0.2754],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.1245, 0.0000], grad_fn

tensor([[-0.0535,  0.1309,  0.2656,  ..., -0.0042,  0.2197, -0.1777],
        [ 0.1226, -0.0894,  0.0270,  ..., -0.0640, -0.0718, -0.1387],
        [-0.1260,  0.1245,  0.0036,  ...,  0.0364,  0.1377, -0.2383],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.1819, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.1030, -0.1523,  0.0259,  ..., -0.1982, -0.1230,  0.0649],
        [ 0.1094,  0.1406, -0.0317,  ...,  0.0077,  0.1201, -0.1797],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.4489, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([[-0.0291,  0.0762,  0.2676,  ...,  0.0601,  0.3301,  0.0703],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        [-0.2676, -0.0781,  0.3086,  ..., -0.4258, -0.0840,  0.0603],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.9608, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1196,  0.1079, -0.2002,  ..., -0.0444, -0.0369, -0.1523],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        [ 0.1260,  0.1904,  0.0698,  ...,  0.0613,  0.1729, -0.0786],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.5760, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0781, -0.1128,  0.01

tensor([[-0.1729,  0.2793,  0.1069,  ...,  0.1230,  0.1299, -0.1826],
        [-0.2188,  0.0498, -0.1201,  ..., -0.3418, -0.1226,  0.1533],
        [-0.0449, -0.0304,  0.0023,  ...,  0.0123, -0.0884, -0.0156],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.9323, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0786, -0.0233, -0.1699,  ..., -0.0383,  0.1572,  0.0713],
        [-0.0586, -0.0376,  0.0728,  ..., -0.1079, -0.0864, -0.0320],
        [-0.0811,  0.1699, -0.1836,  ...,  0.0752,  0.1445, -0.1367],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.7636, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1699, -0.2676,  0.14

tensor([[ 5.7129e-02,  9.1553e-03,  6.3965e-02,  ..., -1.7090e-01,
          2.2339e-02,  1.0840e-01],
        [ 7.1777e-02,  2.0801e-01, -2.8442e-02,  ..., -1.6797e-01,
         -2.0874e-02, -1.4258e-01],
        [-3.5352e-01, -6.1768e-02,  1.2012e-01,  ...,  8.1055e-02,
         -2.4567e-03, -8.4877e-05],
        ...,
        [ 0.0000e+00,  0.0000e+00,  0.0000e+00,  ...,  0.0000e+00,
          0.0000e+00,  0.0000e+00],
        [ 0.0000e+00,  0.0000e+00,  0.0000e+00,  ...,  0.0000e+00,
          0.0000e+00,  0.0000e+00],
        [ 0.0000e+00,  0.0000e+00,  0.0000e+00,  ...,  0.0000e+00,
          0.0000e+00,  0.0000e+00]])
tensor([0.4846, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1182,  0.1318, -0.0559,  ...,  0.0608,  0.1226, -0.2988],
        [ 0.0306, -0.0192,  0.0388,  ..., -0.0062, -0.0248,  0.1001],
        [-0.1729,  0.2793,  0.1069,  ...,  0.1230,  0.1299, -0.1826],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000

tensor([[ 0.1582,  0.1060, -0.1895,  ..., -0.2676,  0.0084, -0.2139],
        [ 0.0166,  0.0457, -0.1191,  ...,  0.0165,  0.2637,  0.0845],
        [ 0.0240,  0.3145, -0.0262,  ...,  0.0153,  0.0649,  0.1426],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.4171, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.3574, -0.0366,  0.1562,  ..., -0.2773, -0.2031,  0.0603],
        [-0.1157, -0.0315,  0.1592,  ...,  0.0262, -0.0625, -0.0415],
        [ 0.1094,  0.1406, -0.0317,  ...,  0.0077,  0.1201, -0.1797],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.1927, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.1030, -0.1523,  0.0259,  ..., -0.1982, -0.1230,  0.0649],
        [ 0.1094,  0.1406, -0.0317,  ...,  0.0077,  0.1201, -0.1797],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.1542, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.2285, -0.0601,  0.1396,  ...,  0.0483, -0.1436,  0.3262],
        [ 0.0825, -0.1514,  0.0659,  ..., -0.1016, -0.1084, -0.2051],
        [-0.0762, -0.0210, -0.0029,  ...,  0.0254, -0.0791, -0.2275],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.9546, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1533,  0.1230,  0.16

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.0260, -0.0019,  0.1855,  ..., -0.1216,  0.2217, -0.0220],
        [ 0.0166,  0.0457, -0.1191,  ...,  0.0165,  0.2637,  0.0845],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.3762, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.1035,  0.1377, -0.0030,  ...,  0.0439, -0.1455,  0.0713],
        [-0.0264,  0.0684, -0.0311,  ..., -0.1709,  0.1963, -0.0996],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.2911, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([[-1.5723e-01,  1.0645e-01,  3.1445e-01,  ...,  2.5195e-01,
         -1.8262e-01,  3.3398e-01],
        [ 1.1133e-01, -1.5723e-01,  4.4189e-02,  ..., -3.9453e-01,
         -1.6992e-01,  3.1006e-02],
        [ 8.4473e-02, -3.5286e-04,  5.3223e-02,  ...,  1.7090e-02,
          6.0791e-02, -1.0889e-01],
        ...,
        [-1.1780e-02, -4.7363e-02,  4.4678e-02,  ...,  7.1289e-02,
         -3.4912e-02,  2.4170e-02],
        [-1.0449e-01,  2.9755e-03, -1.0107e-01,  ..., -6.2500e-02,
          5.9326e-02, -2.1094e-01],
        [ 0.0000e+00,  0.0000e+00,  0.0000e+00,  ...,  0.0000e+00,
          0.0000e+00,  0.0000e+00]])
tensor([1.4635, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1089, -0.0747, -0.0454,  ..., -0.3594,  0.0486,  0.1611],
        [ 0.0078,  0.1641,  0.1855,  ...,  0.2178,  0.2061, -0.0596],
        [-0.1934, -0.1836,  0.3066,  ...,  0.0291,  0.1279, -0.0894],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000

tensor([[-0.0275,  0.0459,  0.3438,  ...,  0.1177,  0.1865,  0.0393],
        [-0.1270,  0.0220,  0.2871,  ..., -0.1016, -0.0903,  0.0884],
        [-0.1465, -0.0542, -0.0850,  ...,  0.0320, -0.0005, -0.1050],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.6114, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0654,  0.1270,  0.0923,  ...,  0.1475,  0.2490,  0.1113],
        [ 0.1147,  0.0669, -0.1523,  ..., -0.0557, -0.2305, -0.1611],
        [-0.1465,  0.1865,  0.2197,  ...,  0.2891, -0.1060,  0.1660],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.1783, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1104, -0.1235,  0.14

tensor([[-0.1133, -0.1172,  0.0850,  ...,  0.0038, -0.1934,  0.0219],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        [ 0.0718,  0.2080, -0.0284,  ..., -0.1680, -0.0209, -0.1426],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.0394, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0747,  0.1943, -0.1475,  ..., -0.2637, -0.0942,  0.0510],
        [-0.3418, -0.4102,  0.4512,  ..., -0.0432,  0.1445,  0.2471],
        [ 0.0505, -0.2363,  0.0177,  ..., -0.0510,  0.3066,  0.0850],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.6466, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1729,  0.2793,  0.10

tensor([[ 0.0786,  0.1318,  0.1895,  ..., -0.2236, -0.1011,  0.0339],
        [-0.0469,  0.0669,  0.0093,  ..., -0.0120,  0.1650, -0.0317],
        [ 0.0845, -0.0004,  0.0532,  ...,  0.0171,  0.0608, -0.1089],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.3113, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.1602,  ...,  0.1279,  0.1211, -0.2295],
        [-0.1514,  0.0236,  0.1328,  ...,  0.1211,  0.2656, -0.0061],
        [-0.0237,  0.0493,  0.1816,  ...,  0.0220, -0.1504,  0.0123],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.3389, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0056, -0.0938,  0.04

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.4102, -0.0640, -0.1387,  ..., -0.2793,  0.0601, -0.1475],
        [ 0.1108, -0.1582,  0.0208,  ...,  0.1514, -0.1650,  0.0198],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.4623, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0275,  0.0459,  0.3438,  ...,  0.1177,  0.1865,  0.0393],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        [-0.1270,  0.0220,  0.2871,  ..., -0.1016, -0.0903,  0.0884],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.2535, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0605,  0.1406,  0.08

tensor([1.3787, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1094,  0.1406, -0.0317,  ...,  0.0077,  0.1201, -0.1797],
        [ 0.1895,  0.1367, -0.0947,  ...,  0.0762,  0.0154, -0.0503],
        [ 0.0752, -0.0189, -0.0054,  ..., -0.0403,  0.1128, -0.2012],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.4684, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1396,  0.2314, -0.1309,  ...,  0.0732,  0.2949,  0.3008],
        [-0.0298,  0.0718, -0.0212,  ..., -0.1167, -0.1250,  0.2871],
        [ 0.0146,  0.3477,  0.0430,  ..., -0.1992,  0.0728,  0.0237],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.1390, 0.0000], grad_fn

tensor([[-0.1953, -0.0776,  0.0874,  ..., -0.1777,  0.0933, -0.0106],
        [ 0.1445,  0.0471,  0.1006,  ...,  0.0023,  0.0981, -0.0669],
        [ 0.1533,  0.0718, -0.0242,  ...,  0.0284, -0.0996,  0.0325],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.2833, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2061, -0.1270,  0.1289,  ..., -0.2031, -0.2617,  0.0718],
        [ 0.2041,  0.0132,  0.0757,  ..., -0.2119, -0.1328,  0.1084],
        [ 0.0378,  0.1328, -0.0165,  ..., -0.3887, -0.0554, -0.1602],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.5576, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0479, -0.2949,  0.37

tensor([0.8380, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1167, -0.0801, -0.1924,  ..., -0.1035, -0.0090,  0.0796],
        [ 0.0146,  0.3477,  0.0430,  ..., -0.1992,  0.0728,  0.0237],
        [-0.0530,  0.2832,  0.2207,  ..., -0.1260,  0.0488, -0.0820],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.7696, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1060,  0.2139,  0.1187,  ...,  0.1069,  0.0237, -0.0354],
        [ 0.0791, -0.1201, -0.0942,  ..., -0.1357, -0.0322, -0.0728],
        [-0.2070,  0.2031,  0.0420,  ...,  0.1387,  0.0369, -0.0287],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.1849, 0.0000], grad_fn

tensor([[-0.1904, -0.0376, -0.1177,  ...,  0.2080,  0.1387,  0.1631],
        [ 0.0703,  0.0869,  0.0879,  ..., -0.0476,  0.0145, -0.0625],
        [-0.1240,  0.0786, -0.0100,  ...,  0.0767, -0.1172, -0.0452],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.2983, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0403,  0.0928,  0.1553,  ...,  0.1250,  0.0449,  0.0344],
        [ 0.0718,  0.0161, -0.1191,  ...,  0.1377, -0.1240,  0.0142],
        [ 0.0444, -0.1875, -0.3691,  ...,  0.1133, -0.0859,  0.3828],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.4217, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1504, -0.0566,  0.20

tensor([[-0.2891,  0.1992,  0.1602,  ...,  0.1279,  0.1211, -0.2295],
        [-0.2070,  0.2031,  0.0420,  ...,  0.1387,  0.0369, -0.0287],
        [ 0.0830, -0.0125,  0.0413,  ..., -0.1553,  0.2441,  0.1396],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.0693, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.0962, -0.0287, -0.1084,  ...,  0.0693,  0.1045, -0.1641],
        [-0.0811,  0.1040, -0.2695,  ..., -0.2002,  0.2256, -0.1465],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.6875, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1729,  0.2793,  0.10

tensor([[ 0.1943,  0.0510,  0.0967,  ..., -0.1348,  0.1309,  0.0762],
        [-0.1816,  0.1650, -0.1660,  ...,  0.1592,  0.1279,  0.0022],
        [-0.2246,  0.0522, -0.1953,  ...,  0.0864, -0.0771,  0.1729],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.1609, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.1602,  ...,  0.1279,  0.1211, -0.2295],
        [-0.2070,  0.2031,  0.0420,  ...,  0.1387,  0.0369, -0.0287],
        [ 0.0260, -0.0019,  0.1855,  ..., -0.1216,  0.2217, -0.0220],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.2647, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1089, -0.1436, -0.10

tensor([[-0.0403,  0.0928,  0.1553,  ...,  0.1250,  0.0449,  0.0344],
        [ 0.0630,  0.1245,  0.1133,  ..., -0.0635,  0.1147,  0.0310],
        [ 0.0378, -0.0601, -0.0581,  ..., -0.1396, -0.0053,  0.0085],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.0320, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.2080, -0.1543, -0.0070,  ...,  0.0059,  0.2988,  0.2158],
        [-0.2041,  0.0894, -0.1318,  ..., -0.0840,  0.6797,  0.1719],
        [-0.1904,  0.1475,  0.0339,  ..., -0.0400,  0.0776,  0.0679],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.7509, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0820,  0.0645,  0.12

tensor([[-0.2266,  0.1533,  0.0889,  ..., -0.0182, -0.0522, -0.1089],
        [ 0.0703,  0.0869,  0.0879,  ..., -0.0476,  0.0145, -0.0625],
        [-0.0078, -0.0280,  0.0405,  ...,  0.0396, -0.0605,  0.0081],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.6926, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0535,  0.1309,  0.2656,  ..., -0.0042,  0.2197, -0.1777],
        [-0.0884, -0.1270, -0.0147,  ..., -0.0820, -0.0791, -0.1177],
        [ 0.1138,  0.1108,  0.0432,  ..., -0.1611,  0.0376,  0.1729],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.3065, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0130,  0.1484, -0.04

tensor([1.1109, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0273,  0.0449,  0.0767,  ..., -0.1250,  0.1089, -0.1436],
        [ 0.0317, -0.1064,  0.0024,  ..., -0.0625, -0.1030,  0.0293],
        [-0.0579,  0.2617, -0.0302,  ...,  0.0168,  0.0072, -0.0493],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.5843, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0996,  0.1338,  0.1050,  ..., -0.1504,  0.0918,  0.0825],
        [-0.1758,  0.0010, -0.0034,  ..., -0.1147, -0.1338, -0.0583],
        [ 0.1245,  0.0908, -0.0049,  ..., -0.1494, -0.0732,  0.3340],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.2128, 0.0000], grad_fn

tensor([[ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        [ 0.0786,  0.1318,  0.1895,  ..., -0.2236, -0.1011,  0.0339],
        [ 0.0332, -0.0898, -0.2949,  ..., -0.1270,  0.1611, -0.1602],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.7411, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.1602,  ...,  0.1279,  0.1211, -0.2295],
        [-0.2070,  0.2031,  0.0420,  ...,  0.1387,  0.0369, -0.0287],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.3005, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0679,  0.1953,  0.12

tensor([[-1.0889e-01, -7.4707e-02, -4.5410e-02,  ..., -3.5938e-01,
          4.8584e-02,  1.6113e-01],
        [-2.3071e-02,  1.5332e-01,  1.5234e-01,  ...,  1.4453e-01,
          1.3281e-01, -8.5938e-02],
        [ 8.4473e-02, -3.5286e-04,  5.3223e-02,  ...,  1.7090e-02,
          6.0791e-02, -1.0889e-01],
        ...,
        [ 0.0000e+00,  0.0000e+00,  0.0000e+00,  ...,  0.0000e+00,
          0.0000e+00,  0.0000e+00],
        [ 0.0000e+00,  0.0000e+00,  0.0000e+00,  ...,  0.0000e+00,
          0.0000e+00,  0.0000e+00],
        [ 0.0000e+00,  0.0000e+00,  0.0000e+00,  ...,  0.0000e+00,
          0.0000e+00,  0.0000e+00]])
tensor([1.2897, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0581,  0.0581,  0.0133,  ..., -0.1748, -0.0231, -0.0435],
        [-0.3242, -0.0835, -0.0168,  ..., -0.1602, -0.2285,  0.0015],
        [-0.0078, -0.0280,  0.0405,  ...,  0.0396, -0.0605,  0.0081],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000

tensor([[-0.1709,  0.2383, -0.0237,  ...,  0.0337,  0.2197, -0.0564],
        [-0.1816,  0.1650, -0.1660,  ...,  0.1592,  0.1279,  0.0022],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.2415, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.1035,  0.1377, -0.0030,  ...,  0.0439, -0.1455,  0.0713],
        [ 0.0732,  0.1963,  0.0005,  ...,  0.0152,  0.0679,  0.0579],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.7776, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1768,  0.1670,  0.00

tensor([[-0.1011,  0.0177,  0.0147,  ..., -0.0835,  0.0056, -0.0178],
        [ 0.1348, -0.0014,  0.0854,  ..., -0.0566, -0.2676,  0.1084],
        [ 0.0349,  0.0850,  0.0625,  ..., -0.0190, -0.0089,  0.0221],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.3963, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0215, -0.2119, -0.1172,  ..., -0.0903, -0.0544,  0.1797],
        [ 0.1094,  0.1406, -0.0317,  ...,  0.0077,  0.1201, -0.1797],
        [-0.2891,  0.3262,  0.1895,  ...,  0.1377,  0.0938, -0.1592],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.4707, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1504, -0.0566,  0.20

tensor([1.6402, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1094,  0.1123,  0.1914,  ...,  0.0703,  0.0830,  0.0530],
        [ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.1396, -0.0347, -0.0537,  ..., -0.1182, -0.0025, -0.0723],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.9158, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.1602,  ...,  0.1279,  0.1211, -0.2295],
        [-0.2070,  0.2031,  0.0420,  ...,  0.1387,  0.0369, -0.0287],
        [-0.0449, -0.0304,  0.0023,  ...,  0.0123, -0.0884, -0.0156],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.6926, 0.0000], grad_fn

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.0698, -0.0127, -0.1040,  ..., -0.1475,  0.0295,  0.2080],
        [ 0.0547, -0.0096,  0.2617,  ...,  0.0791, -0.2451, -0.0613],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.7247, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0605,  0.1406,  0.0845,  ..., -0.2441, -0.0081, -0.1885],
        [-0.1973,  0.2500,  0.0522,  ...,  0.1680,  0.0488, -0.0889],
        [-0.0118, -0.1943,  0.2637,  ..., -0.1533, -0.1030, -0.2949],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.1807, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1001,  0.1758,  0.04

tensor([0.5629, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-4.7363e-02, -1.4160e-01,  4.9072e-02,  ..., -3.4961e-01,
         -1.4062e-01,  1.0449e-01],
        [ 4.1748e-02,  3.1836e-01, -2.6978e-02,  ..., -1.1536e-02,
          1.3965e-01,  1.8954e-05],
        [-1.3184e-01,  1.7456e-02,  5.0391e-01,  ..., -1.0742e-01,
         -3.2031e-01,  3.3203e-01],
        ...,
        [ 0.0000e+00,  0.0000e+00,  0.0000e+00,  ...,  0.0000e+00,
          0.0000e+00,  0.0000e+00],
        [ 0.0000e+00,  0.0000e+00,  0.0000e+00,  ...,  0.0000e+00,
          0.0000e+00,  0.0000e+00],
        [ 0.0000e+00,  0.0000e+00,  0.0000e+00,  ...,  0.0000e+00,
          0.0000e+00,  0.0000e+00]])
tensor([0.8850, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1011,  0.0177,  0.0147,  ..., -0.0835,  0.0056, -0.0178],
        [-0.0273,  0.0449,  0.0767,  ..., -0.1250,  0.1089, -0.1436],
        [ 0.1934, -0.0043, -0.0322,  ...,  0.0520,  0.0276, -0.0066],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.

tensor([[-0.1011,  0.0177,  0.0147,  ..., -0.0835,  0.0056, -0.0178],
        [ 0.1934,  0.1543,  0.0413,  ...,  0.3594,  0.0664,  0.0498],
        [ 0.2812,  0.2539,  0.1128,  ...,  0.2412, -0.2539, -0.2598],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.6267, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0231,  0.1533,  0.1523,  ...,  0.1445,  0.1328, -0.0859],
        [ 0.1260,  0.1904,  0.0698,  ...,  0.0613,  0.1729, -0.0786],
        [ 0.0737,  0.0041, -0.1357,  ..., -0.1416, -0.1504, -0.1377],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.4664, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2256, -0.0195,  0.09

tensor([[-0.1260,  0.0547,  0.0781,  ..., -0.1309,  0.3379,  0.1445],
        [ 0.2002,  0.1543,  0.1030,  ..., -0.2432,  0.0078, -0.1445],
        [ 0.0718,  0.2080, -0.0284,  ..., -0.1680, -0.0209, -0.1426],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.4843, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1118,  0.1807,  0.2051,  ...,  0.2266,  0.1289,  0.0405],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        [-0.1270,  0.0220,  0.2871,  ..., -0.1016, -0.0903,  0.0884],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.4438, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0957,  0.0036,  0.13

tensor([1.0126, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1504, -0.0566,  0.2012,  ..., -0.1035,  0.1001, -0.0283],
        [ 0.0732, -0.0059,  0.1338,  ..., -0.3379, -0.2119,  0.0801],
        [-0.0344,  0.1035,  0.0216,  ...,  0.0732,  0.0332,  0.0383],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.4472, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.3223,  0.1768,  0.1533,  ...,  0.2490,  0.0918,  0.1299],
        [ 0.1094,  0.2285, -0.2715,  ...,  0.0133, -0.1299, -0.1592],
        [ 0.0574,  0.1230, -0.0864,  ..., -0.0339,  0.0781,  0.0547],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.3837, 0.0000], grad_fn

tensor([1.7326, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0055, -0.0112,  0.1270,  ..., -0.0189,  0.1836, -0.1289],
        [ 0.0317, -0.1064,  0.0024,  ..., -0.0625, -0.1030,  0.0293],
        [-0.0579,  0.2617, -0.0302,  ...,  0.0168,  0.0072, -0.0493],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.4857, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.1157,  0.0315,  0.4160,  ...,  0.1338,  0.0266,  0.0178],
        [-0.1348, -0.0240,  0.0442,  ...,  0.1016,  0.0669,  0.1011],
        ...,
        [ 0.1094,  0.1406, -0.0317,  ...,  0.0077,  0.1201, -0.1797],
        [-0.2070,  0.2031,  0.0420,  ...,  0.1387,  0.0369, -0.0287],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.6541, 0.0000], grad_fn

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.0342,  0.3887,  0.1602,  ..., -0.1729,  0.0991, -0.1191],
        [ 0.1943,  0.0996,  0.0825,  ..., -0.1738, -0.1592,  0.1797],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.8338, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0427, -0.3398,  0.0913,  ...,  0.0991, -0.0430, -0.0649],
        [ 0.2373,  0.2773, -0.0811,  ..., -0.0308,  0.0376, -0.1650],
        [-0.0449, -0.0304,  0.0023,  ...,  0.0123, -0.0884, -0.0156],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.3622, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0466,  0.0713, -0.18

tensor([[-0.2891,  0.1992,  0.1602,  ...,  0.1279,  0.1211, -0.2295],
        [-0.2070,  0.2031,  0.0420,  ...,  0.1387,  0.0369, -0.0287],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.6952, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0659,  0.1562,  0.1025,  ...,  0.0332,  0.1670,  0.0698],
        [ 0.0894,  0.0195, -0.0352,  ..., -0.0515,  0.1826, -0.0302],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.0391, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0361, -0.1211,  0.13

tensor([[-0.2891,  0.1992,  0.1602,  ...,  0.1279,  0.1211, -0.2295],
        [ 0.0260, -0.0019,  0.1855,  ..., -0.1216,  0.2217, -0.0220],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.7182, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1133, -0.1172,  0.0850,  ...,  0.0038, -0.1934,  0.0219],
        [ 0.0260, -0.0019,  0.1855,  ..., -0.1216,  0.2217, -0.0220],
        [-0.4297,  0.1436,  0.0918,  ...,  0.2373, -0.0128, -0.0654],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.6934, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1729,  0.2793,  0.10

tensor([1.8552, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.4121,  0.3184,  0.1260,  ...,  0.0654,  0.2002, -0.2256],
        [-0.2070,  0.2031,  0.0420,  ...,  0.1387,  0.0369, -0.0287],
        [ 0.0703,  0.0869,  0.0879,  ..., -0.0476,  0.0145, -0.0625],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.8733, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1895,  0.1816,  0.3359,  ...,  0.1167,  0.0569,  0.1055],
        [ 0.0444,  0.1875, -0.0549,  ..., -0.0508, -0.2578,  0.1465],
        [ 0.1631,  0.0271,  0.1445,  ...,  0.3145,  0.0786, -0.0356],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.0115, 0.0000], grad_fn

tensor([[-0.2500,  0.1934, -0.0469,  ...,  0.1475,  0.2910, -0.2754],
        [-0.1396,  0.2314, -0.1309,  ...,  0.0732,  0.2949,  0.3008],
        [-0.2383,  0.0092, -0.0435,  ...,  0.0245, -0.2148, -0.0167],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.9880, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0605,  0.1406,  0.0845,  ..., -0.2441, -0.0081, -0.1885],
        [ 0.1299, -0.1206,  0.0025,  ...,  0.4062, -0.0552,  0.0330],
        [ 0.0146,  0.3477,  0.0430,  ..., -0.1992,  0.0728,  0.0237],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.6202, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1621,  0.0527, -0.06

tensor([[ 0.1582,  0.1963, -0.1836,  ..., -0.5078,  0.0179,  0.1865],
        [ 0.0703,  0.0869,  0.0879,  ..., -0.0476,  0.0145, -0.0625],
        [ 0.0332, -0.0898, -0.2949,  ..., -0.1270,  0.1611, -0.1602],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.8852, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0820,  0.0645,  0.1226,  ..., -0.0598, -0.1631, -0.0991],
        [ 0.1094,  0.1406, -0.0317,  ...,  0.0077,  0.1201, -0.1797],
        [-0.1729,  0.2793,  0.1069,  ...,  0.1230,  0.1299, -0.1826],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.6857, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.16

tensor([[ 0.0605,  0.1406,  0.0845,  ..., -0.2441, -0.0081, -0.1885],
        [ 0.0674, -0.0811, -0.1030,  ..., -0.1660, -0.0796,  0.0723],
        [-0.1729,  0.2793,  0.1069,  ...,  0.1230,  0.1299, -0.1826],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.7501, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1011,  0.0177,  0.0147,  ..., -0.0835,  0.0056, -0.0178],
        [ 0.2129,  0.1494,  0.0139,  ...,  0.0574, -0.0811, -0.0294],
        [ 0.2402,  0.2012,  0.1621,  ...,  0.0349,  0.0315,  0.0145],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.9138, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0781, -0.1128,  0.01

tensor([2.0768, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        [-0.1953, -0.1147, -0.2148,  ...,  0.0249,  0.0151,  0.0806],
        [-0.1699,  0.2012,  0.2051,  ...,  0.1797,  0.2119, -0.1865],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.6234, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2520, -0.0771, -0.0184,  ..., -0.3945, -0.0942,  0.0005],
        [ 0.0006,  0.0618, -0.1250,  ..., -0.2852,  0.0449,  0.0393],
        [-0.0615, -0.0850, -0.1504,  ..., -0.0669, -0.0220,  0.0515],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.6873, 0.0000], grad_fn

tensor([1.7635, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2373,  0.0771, -0.0476,  ..., -0.2598,  0.0194, -0.1445],
        [ 0.0518,  0.0679, -0.0864,  ..., -0.0767,  0.4258, -0.1592],
        [-0.0811,  0.1040, -0.2695,  ..., -0.2002,  0.2256, -0.1465],
        ...,
        [ 0.1133, -0.1367,  0.1069,  ...,  0.1572, -0.0294,  0.1157],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.2380, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.2891, -0.0703, -0.0972,  ..., -0.2324,  0.2158,  0.2539],
        [-0.1367,  0.1260,  0.2178,  ...,  0.1836,  0.1494, -0.0898],
        [-0.1816,  0.1650, -0.1660,  ...,  0.1592,  0.1279,  0.0022],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.6855, 0.0000], grad_fn

tensor([1.9416, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.0013, -0.0483, -0.2832,  ..., -0.1836,  0.3027, -0.1484],
        [-0.0510,  0.1416, -0.0732,  ...,  0.0148, -0.0084,  0.1582],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.0573, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0718,  0.2080, -0.0284,  ..., -0.1680, -0.0209, -0.1426],
        [ 0.0718,  0.2080, -0.0284,  ..., -0.1680, -0.0209, -0.1426],
        [-0.2695,  0.2451,  0.5156,  ..., -0.0562, -0.1543, -0.1143],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.6264, 0.0000], grad_fn

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.0209,  0.0219, -0.0835,  ...,  0.0801,  0.1221, -0.1914],
        [ 0.0110,  0.0508,  0.2227,  ...,  0.0061, -0.2080,  0.0311],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.9636, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.3574, -0.0366,  0.1562,  ..., -0.2773, -0.2031,  0.0603],
        [ 0.0703,  0.0869,  0.0879,  ..., -0.0476,  0.0145, -0.0625],
        [ 0.2373, -0.1011, -0.0728,  ..., -0.1011, -0.1016,  0.0150],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.4537, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0605,  0.1406,  0.08

tensor([1.6958, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.1602,  ...,  0.1279,  0.1211, -0.2295],
        [ 0.0260, -0.0019,  0.1855,  ..., -0.1216,  0.2217, -0.0220],
        [ 0.0608, -0.0138,  0.0217,  ...,  0.1089,  0.0388,  0.1445],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.9952, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2500,  0.1934, -0.0469,  ...,  0.1475,  0.2910, -0.2754],
        [ 0.0605,  0.1406,  0.0845,  ..., -0.2441, -0.0081, -0.1885],
        [-0.0703, -0.0244, -0.1885,  ..., -0.1582,  0.0747, -0.2441],
        ...,
        [ 0.0625, -0.1992, -0.0383,  ...,  0.0036, -0.2148,  0.2236],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.1655, 0.0000], grad_fn

tensor([[-0.2676, -0.1357, -0.0996,  ...,  0.0033,  0.1187, -0.0737],
        [-0.1797,  0.1758,  0.0221,  ...,  0.1934,  0.2139,  0.0045],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.0504, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1201,  0.0957,  0.1689,  ..., -0.0278,  0.0879,  0.2891],
        [-0.0928,  0.1689,  0.1963,  ..., -0.0286, -0.1748,  0.2207],
        [ 0.2021,  0.2324,  0.0255,  ..., -0.3379,  0.1973,  0.0908],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.6168, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1729,  0.2793,  0.10

tensor([2.0587, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1094,  0.1123,  0.1914,  ...,  0.0703,  0.0830,  0.0530],
        [-0.1816, -0.1328,  0.0391,  ..., -0.2227,  0.1445,  0.1270],
        [ 0.1445,  0.0471,  0.1006,  ...,  0.0023,  0.0981, -0.0669],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.0565, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1729,  0.2793,  0.1069,  ...,  0.1230,  0.1299, -0.1826],
        [-0.1270,  0.0220,  0.2871,  ..., -0.1016, -0.0903,  0.0884],
        [ 0.0306,  0.0708,  0.0723,  ..., -0.0099, -0.0245,  0.0140],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.9542, 0.0000], grad_fn

tensor([[-0.2891,  0.3262,  0.1895,  ...,  0.1377,  0.0938, -0.1592],
        [ 0.0583, -0.0679,  0.2021,  ..., -0.2500,  0.1738,  0.0767],
        [-0.1982,  0.1729,  0.0854,  ...,  0.1021,  0.1709, -0.1230],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.9652, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.1602,  ...,  0.1279,  0.1211, -0.2295],
        [-0.2070,  0.2031,  0.0420,  ...,  0.1387,  0.0369, -0.0287],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.9866, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([[ 0.1768,  0.1670,  0.0045,  ..., -0.3848, -0.2734,  0.1484],
        [ 0.1445,  0.0471,  0.1006,  ...,  0.0023,  0.0981, -0.0669],
        [ 0.1309,  0.0084,  0.0334,  ...,  0.2285, -0.1494, -0.1504],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.2035, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1396,  0.2314, -0.1309,  ...,  0.0732,  0.2949,  0.3008],
        [ 0.0525,  0.0109,  0.0289,  ..., -0.0781,  0.0474, -0.1016],
        [-0.1396,  0.2314, -0.1309,  ...,  0.0732,  0.2949,  0.3008],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.5262, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0562, -0.0277, -0.02

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.1030, -0.1523,  0.0259,  ..., -0.1982, -0.1230,  0.0649],
        [-0.0175, -0.0359,  0.0305,  ..., -0.0181, -0.1455, -0.0170],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.3645, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1113,  0.2061,  0.2266,  ..., -0.0830,  0.0095, -0.0400],
        [-0.0118, -0.0474,  0.0447,  ...,  0.0713, -0.0349,  0.0242],
        [ 0.1719,  0.1035,  0.0237,  ...,  0.0004, -0.2295,  0.0425],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.8621, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.3770, -0.2812, -0.08

tensor([[-0.2891,  0.1992,  0.1602,  ...,  0.1279,  0.1211, -0.2295],
        [ 0.0260, -0.0019,  0.1855,  ..., -0.1216,  0.2217, -0.0220],
        [ 0.1445,  0.0471,  0.1006,  ...,  0.0023,  0.0981, -0.0669],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.6797, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1582,  0.1963, -0.1836,  ..., -0.5078,  0.0179,  0.1865],
        [-0.0273,  0.0449,  0.0767,  ..., -0.1250,  0.1089, -0.1436],
        [-0.0118, -0.0474,  0.0447,  ...,  0.0713, -0.0349,  0.0242],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.0051, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0605,  0.1406,  0.08

tensor([[-0.1787,  0.1387, -0.2363,  ..., -0.3496,  0.1211,  0.1211],
        [ 0.1572, -0.0708,  0.0540,  ...,  0.0098, -0.0049, -0.0330],
        [ 0.1011,  0.0496, -0.1172,  ..., -0.2471, -0.0938,  0.1787],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.8642, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0535,  0.1309,  0.2656,  ..., -0.0042,  0.2197, -0.1777],
        [ 0.0708, -0.2139,  0.1533,  ..., -0.2168, -0.0198,  0.1064],
        [ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.9016, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.2236,  0.4629,  0.09

tensor([[ 0.2969, -0.0664,  0.1846,  ..., -0.2217,  0.1235,  0.1104],
        [ 0.0679, -0.0413,  0.1001,  ...,  0.1045, -0.0854, -0.1543],
        [ 0.0248,  0.0640, -0.0508,  ..., -0.0186, -0.0237, -0.1768],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.8025, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1582,  0.1963, -0.1836,  ..., -0.5078,  0.0179,  0.1865],
        [ 0.0942, -0.0228,  0.0522,  ..., -0.0469,  0.1611, -0.1992],
        [-0.0281,  0.0586,  0.1895,  ..., -0.0913, -0.0332,  0.0229],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.3021, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1621,  0.0869,  0.20

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.0688, -0.1377, -0.1367,  ..., -0.2695,  0.1475, -0.2148],
        [ 0.1260,  0.1904,  0.0698,  ...,  0.0613,  0.1729, -0.0786],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.9731, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0579, -0.0510, -0.2070,  ..., -0.0442, -0.0513, -0.2178],
        [ 0.0260, -0.0019,  0.1855,  ..., -0.1216,  0.2217, -0.0220],
        [-0.2383,  0.0092, -0.0435,  ...,  0.0245, -0.2148, -0.0167],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.9995, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.1030, -0.1523,  0.0259,  ..., -0.1982, -0.1230,  0.0649],
        [ 0.0405,  0.0625, -0.0175,  ..., -0.1562,  0.0019, -0.0698],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.5485, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.1396, -0.0347, -0.0537,  ..., -0.1182, -0.0025, -0.0723],
        [-0.0361, -0.1211,  0.1338,  ..., -0.0864,  0.1436,  0.0273],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.9948, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([[-0.3887,  0.2432, -0.0869,  ..., -0.3047, -0.1777,  0.1680],
        [ 0.0260, -0.0019,  0.1855,  ..., -0.1216,  0.2217, -0.0220],
        [ 0.0146,  0.3477,  0.0430,  ..., -0.1992,  0.0728,  0.0237],
        ...,
        [ 0.0260, -0.0019,  0.1855,  ..., -0.1216,  0.2217, -0.0220],
        [ 0.0850, -0.0952,  0.1191,  ..., -0.1089,  0.0488, -0.1309],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.2103, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.1396, -0.0347, -0.0537,  ..., -0.1182, -0.0025, -0.0723],
        [-0.1011,  0.0177,  0.0147,  ..., -0.0835,  0.0056, -0.0178],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.2815, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([[-0.0591, -0.0311,  0.1602,  ...,  0.1177,  0.2754,  0.0267],
        [-0.3906, -0.0693,  0.2344,  ...,  0.0033,  0.0771,  0.1924],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.8618, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0508,  0.0928, -0.3984,  ..., -0.3125,  0.0588, -0.0576],
        [-0.0078, -0.0280,  0.0405,  ...,  0.0396, -0.0605,  0.0081],
        [ 0.1445,  0.0471,  0.1006,  ...,  0.0023,  0.0981, -0.0669],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.1783, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0796, -0.0767, -0.16

tensor([[ 0.0405,  0.0625, -0.0175,  ..., -0.1562,  0.0019, -0.0698],
        [-0.0005,  0.1602,  0.0016,  ..., -0.0354,  0.0889, -0.3027],
        [-0.2158,  0.0143, -0.0791,  ...,  0.0991, -0.1523, -0.0845],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.1730, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1113,  0.0610, -0.2402,  ...,  0.1211,  0.0374, -0.2617],
        [ 0.3184,  0.1768,  0.0586,  ..., -0.0981,  0.0525, -0.0023],
        [-0.1816,  0.0017, -0.3047,  ..., -0.0408,  0.0996, -0.1875],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.3660, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0605,  0.1406,  0.08

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.1396, -0.0347, -0.0537,  ..., -0.1182, -0.0025, -0.0723],
        [-0.1011,  0.0177,  0.0147,  ..., -0.0835,  0.0056, -0.0178],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.3420, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1299, -0.1729, -0.2217,  ..., -0.3867, -0.0698,  0.1797],
        [ 0.0942, -0.0228,  0.0522,  ..., -0.0469,  0.1611, -0.1992],
        [ 0.1069, -0.1055,  0.0532,  ..., -0.1475, -0.0625,  0.0767],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.5228, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0708, -0.0349,  0.06

tensor([[-0.1621,  0.2256,  0.0151,  ...,  0.0143, -0.0674, -0.0461],
        [ 0.2559,  0.0356,  0.0420,  ..., -0.1777, -0.0942, -0.1377],
        [-0.0476,  0.0815,  0.0457,  ..., -0.0557,  0.1050, -0.1084],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.1826, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.2100,  0.1079,  0.1299,  ..., -0.3223,  0.0718,  0.2598],
        [ 0.1885,  0.0072, -0.0518,  ...,  0.0471, -0.0090, -0.2734],
        [-0.0315,  0.0645, -0.0605,  ...,  0.0388,  0.1523, -0.0269],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.2193, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.0260, -0.0019,  0.1855,  ..., -0.1216,  0.2217, -0.0220],
        [ 0.0703,  0.0869,  0.0879,  ..., -0.0476,  0.0145, -0.0625],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.4281, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1729,  0.2793,  0.1069,  ...,  0.1230,  0.1299, -0.1826],
        [-0.2070,  0.2031,  0.0420,  ...,  0.1387,  0.0369, -0.0287],
        [ 0.0240,  0.3145, -0.0262,  ...,  0.0153,  0.0649,  0.1426],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.8332, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1035,  0.0131, -0.08

tensor([[ 0.0796, -0.0767, -0.1631,  ..., -0.1787, -0.0047, -0.0459],
        [-0.1133, -0.1172,  0.0850,  ...,  0.0038, -0.1934,  0.0219],
        [-0.1816,  0.1650, -0.1660,  ...,  0.1592,  0.1279,  0.0022],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.9626, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.1670, -0.0664,  0.0574,  ..., -0.0542,  0.1172,  0.0840],
        [ 0.0554, -0.0004, -0.0148,  ...,  0.1289, -0.1299, -0.1069],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.3486, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0820,  0.0645,  0.12

tensor([2.5344, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.1602,  ...,  0.1279,  0.1211, -0.2295],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        [ 0.0718,  0.2080, -0.0284,  ..., -0.1680, -0.0209, -0.1426],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.3981, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.3496,  0.0138, -0.2012,  ..., -0.0566,  0.1855,  0.0747],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        [-0.0732,  0.0603,  0.4590,  ...,  0.0344,  0.0312,  0.3613],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.6575, 0.0000], grad_fn

tensor([[ 0.1289,  0.1982,  0.1357,  ...,  0.0718,  0.3066, -0.0349],
        [-0.1289, -0.1484,  0.2480,  ..., -0.3574, -0.1738,  0.1167],
        [-0.1484, -0.1240,  0.0413,  ..., -0.0947,  0.1377,  0.1143],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.3940, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2734,  0.1250,  0.0889,  ..., -0.0684,  0.0991, -0.2559],
        [ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.0581,  0.0581,  0.0133,  ..., -0.1748, -0.0231, -0.0435],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.9891, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1582,  0.1963, -0.18

tensor([[-0.4121,  0.3184,  0.1260,  ...,  0.0654,  0.2002, -0.2256],
        [ 0.0378, -0.0601, -0.0581,  ..., -0.1396, -0.0053,  0.0085],
        [-0.0249,  0.0220, -0.0354,  ...,  0.0108, -0.0188, -0.0688],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.3304, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1167, -0.0801, -0.1924,  ..., -0.1035, -0.0090,  0.0796],
        [ 0.0718,  0.2080, -0.0284,  ..., -0.1680, -0.0209, -0.1426],
        [-0.0183,  0.0557, -0.0115,  ..., -0.3457,  0.1108,  0.0334],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.0095, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.16

tensor([[-0.2461,  0.0481,  0.2031,  ...,  0.2441, -0.1719,  0.2520],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        [ 0.1582,  0.1060, -0.1895,  ..., -0.2676,  0.0084, -0.2139],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.6181, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0605,  0.1406,  0.0845,  ..., -0.2441, -0.0081, -0.1885],
        [-0.1816,  0.1650, -0.1660,  ...,  0.1592,  0.1279,  0.0022],
        [ 0.0146,  0.3477,  0.0430,  ..., -0.1992,  0.0728,  0.0237],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.7555, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0767,  0.0967,  0.01

tensor([1.7762, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1191,  0.1011, -0.1299,  ..., -0.0737, -0.0464,  0.2344],
        [ 0.0260, -0.1016, -0.3047,  ...,  0.1465,  0.2158,  0.0278],
        [ 0.0488,  0.1670,  0.1689,  ..., -0.2295, -0.0097, -0.0957],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.3041, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.1670, -0.0664,  0.0574,  ..., -0.0542,  0.1172,  0.0840],
        [-0.0571, -0.0305, -0.0055,  ..., -0.0199,  0.1426, -0.0005],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.6076, 0.0000], grad_fn

tensor([1.2077, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0713, -0.0903,  0.1270,  ...,  0.0278,  0.1206, -0.1777],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        [ 0.1416, -0.0271, -0.1846,  ...,  0.0143,  0.1484, -0.0383],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.6685, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.2715, -0.1621,  0.1611,  ..., -0.0491,  0.1270,  0.1787],
        [-0.2070,  0.2031,  0.0420,  ...,  0.1387,  0.0369, -0.0287],
        [ 0.0332, -0.0898, -0.2949,  ..., -0.1270,  0.1611, -0.1602],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.0203, 0.0000], grad_fn

tensor([[ 0.0635, -0.0297, -0.1934,  ...,  0.0199,  0.0059, -0.0879],
        [ 0.0260, -0.0019,  0.1855,  ..., -0.1216,  0.2217, -0.0220],
        [-0.0381,  0.3457,  0.1030,  ..., -0.0884,  0.2090, -0.2080],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.3898, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 2.8906e-01,  6.9336e-02, -6.8848e-02,  ..., -9.4238e-02,
          1.6797e-01, -2.4121e-01],
        [-1.2988e-01, -1.3184e-01,  4.0039e-01,  ..., -1.2305e-01,
          1.1719e-01, -2.2949e-02],
        [ 5.8105e-02, -1.7452e-04,  7.6172e-02,  ...,  1.0132e-02,
          6.4453e-02, -2.9663e-02],
        ...,
        [ 0.0000e+00,  0.0000e+00,  0.0000e+00,  ...,  0.0000e+00,
          0.0000e+00,  0.0000e+00],
        [ 0.0000e+00,  0.0000e+00,  0.0000e+00,  ...,  0.0000e+00,
          0.0000e+00,  0

tensor([[-0.2520, -0.0771, -0.0184,  ..., -0.3945, -0.0942,  0.0005],
        [-0.1709,  0.1797,  0.0229,  ...,  0.0388, -0.0099, -0.0315],
        [-0.0118, -0.0474,  0.0447,  ...,  0.0713, -0.0349,  0.0242],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.5670, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0879, -0.1895,  0.1553,  ..., -0.0199, -0.0515,  0.2676],
        [ 0.2002,  0.1543,  0.1030,  ..., -0.2432,  0.0078, -0.1445],
        [-0.0183,  0.0557, -0.0115,  ..., -0.3457,  0.1108,  0.0334],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.3484, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.16

tensor([[-0.1699,  0.2012,  0.2051,  ...,  0.1797,  0.2119, -0.1865],
        [ 0.0962, -0.0287, -0.1084,  ...,  0.0693,  0.1045, -0.1641],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.9638, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0957,  0.2432,  0.2305,  ..., -0.0991,  0.0461,  0.0640],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        [ 0.0718,  0.2080, -0.0284,  ..., -0.1680, -0.0209, -0.1426],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.1736, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1729,  0.2793,  0.10

tensor([[ 0.0260, -0.0019,  0.1855,  ..., -0.1216,  0.2217, -0.0220],
        [ 0.0942, -0.0228,  0.0522,  ..., -0.0469,  0.1611, -0.1992],
        [ 0.0388,  0.1592, -0.0889,  ...,  0.1523, -0.0100, -0.1494],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.9211, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.3262,  0.1895,  ...,  0.1377,  0.0938, -0.1592],
        [ 0.1011, -0.0038,  0.0182,  ..., -0.0447, -0.0266, -0.1050],
        [-0.0581,  0.0581,  0.0133,  ..., -0.1748, -0.0231, -0.0435],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.4828, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1729,  0.2793,  0.10

tensor([[-0.0659, -0.0635, -0.1226,  ..., -0.5000, -0.3379, -0.0043],
        [-0.1396, -0.0347, -0.0537,  ..., -0.1182, -0.0025, -0.0723],
        [ 0.0767,  0.0097, -0.0801,  ...,  0.0337, -0.0894, -0.0223],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.7555, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.4160,  0.0898,  0.1660,  ...,  0.1660, -0.1016, -0.0374],
        [ 0.0260, -0.0019,  0.1855,  ..., -0.1216,  0.2217, -0.0220],
        [ 0.1641, -0.1699, -0.2715,  ...,  0.0635,  0.1631,  0.1602],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.3304, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.3262,  0.18

tensor([[-0.4121,  0.3184,  0.1260,  ...,  0.0654,  0.2002, -0.2256],
        [ 0.0869,  0.0300, -0.0459,  ..., -0.0200,  0.0559,  0.1099],
        [ 0.1895,  0.1367, -0.0947,  ...,  0.0762,  0.0154, -0.0503],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.3536, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0092, -0.1621, -0.1514,  ..., -0.1445,  0.2119,  0.2871],
        [-0.0129, -0.0850,  0.0796,  ..., -0.0033,  0.0879,  0.2578],
        [-0.2070,  0.2031,  0.0420,  ...,  0.1387,  0.0369, -0.0287],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.3580, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1709, -0.2139, -0.16

tensor([[-0.0664,  0.1309,  0.0471,  ..., -0.2109,  0.0493,  0.0077],
        [-0.0786,  0.3125, -0.0055,  ..., -0.2441,  0.1064, -0.0796],
        [ 0.3027,  0.0430, -0.0339,  ..., -0.2617, -0.1025, -0.0265],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.5184, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0913,  0.1318,  0.0197,  ..., -0.3613,  0.0442,  0.0728],
        [-0.0273,  0.0449,  0.0767,  ..., -0.1250,  0.1089, -0.1436],
        [-0.0118, -0.0474,  0.0447,  ...,  0.0713, -0.0349,  0.0242],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.2786, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2520, -0.0771, -0.01

tensor([[ 0.0260, -0.0019,  0.1855,  ..., -0.1216,  0.2217, -0.0220],
        [ 0.0166,  0.0457, -0.1191,  ...,  0.0165,  0.2637,  0.0845],
        [-0.3613,  0.0544, -0.0076,  ...,  0.2207, -0.1514, -0.0947],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.7523, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0605,  0.1406,  0.0845,  ..., -0.2441, -0.0081, -0.1885],
        [-0.1904,  0.1475,  0.0339,  ..., -0.0400,  0.0776,  0.0679],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.0022, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([[-0.2891,  0.3262,  0.1895,  ...,  0.1377,  0.0938, -0.1592],
        [-0.0209,  0.0219, -0.0835,  ...,  0.0801,  0.1221, -0.1914],
        [-0.0791,  0.1592, -0.0146,  ..., -0.0669,  0.1318,  0.0205],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.6212, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1816, -0.1328,  0.0391,  ..., -0.2227,  0.1445,  0.1270],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        [-0.1836, -0.3027, -0.0259,  ...,  0.0928,  0.3984,  0.2109],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.0918, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1011,  0.0177,  0.01

tensor([[-0.2891,  0.1992,  0.1602,  ...,  0.1279,  0.1211, -0.2295],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        [ 0.0718,  0.2080, -0.0284,  ..., -0.1680, -0.0209, -0.1426],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.3345, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1953, -0.0776,  0.0874,  ..., -0.1777,  0.0933, -0.0106],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        [ 0.1533,  0.0718, -0.0242,  ...,  0.0284, -0.0996,  0.0325],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.5962, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0444,  0.2285,  0.04

tensor([[ 0.0322,  0.1221,  0.2256,  ...,  0.0493, -0.0518, -0.1245],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        [ 0.2334,  0.1709,  0.0562,  ..., -0.1099,  0.2021,  0.0884],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.0121, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.1602,  ...,  0.1279,  0.1211, -0.2295],
        [ 0.0327, -0.0962,  0.0442,  ..., -0.1768,  0.0159, -0.0854],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.4814, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0466,  0.0713, -0.18

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.0703,  0.0918,  0.1445,  ..., -0.2402, -0.0767,  0.0170],
        [-0.0361, -0.1211,  0.1338,  ..., -0.0864,  0.1436,  0.0273],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.8123, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0879, -0.1182,  0.0879,  ..., -0.0366,  0.1260,  0.0522],
        [-0.0535,  0.1309,  0.2656,  ..., -0.0042,  0.2197, -0.1777],
        [ 0.1680,  0.1631, -0.0913,  ...,  0.0811,  0.0292,  0.2090],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.5706, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.1396, -0.0347, -0.0537,  ..., -0.1182, -0.0025, -0.0723],
        [ 0.0938, -0.0933,  0.0544,  ..., -0.0928, -0.0245, -0.0850],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.1761, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1582,  0.1963, -0.1836,  ..., -0.5078,  0.0179,  0.1865],
        [-0.0273,  0.0449,  0.0767,  ..., -0.1250,  0.1089, -0.1436],
        [-0.0118, -0.0474,  0.0447,  ...,  0.0713, -0.0349,  0.0242],
        ...,
        [ 0.1299,  0.1318, -0.0330,  ..., -0.0659,  0.0330,  0.2090],
        [ 0.0659,  0.0349, -0.1152,  ...,  0.0618,  0.0081, -0.1348],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.9798, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0781, -0.1128,  0.01

tensor([[ 0.0820,  0.0645,  0.1226,  ..., -0.0598, -0.1631, -0.0991],
        [ 0.0864,  0.2578,  0.0281,  ..., -0.2715,  0.1729,  0.0422],
        [-0.0273,  0.0449,  0.0767,  ..., -0.1250,  0.1089, -0.1436],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.7275, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1030,  0.2432,  0.2637,  ..., -0.2578, -0.0021,  0.1172],
        [-0.1123, -0.1230, -0.0845,  ..., -0.0081,  0.2109,  0.3398],
        [-0.0449, -0.0304,  0.0023,  ...,  0.0123, -0.0884, -0.0156],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.5641, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0275,  0.0459,  0.34

tensor([[ 0.0820,  0.0645,  0.1226,  ..., -0.0598, -0.1631, -0.0991],
        [ 0.0620,  0.1084, -0.0967,  ..., -0.2598,  0.0123, -0.0442],
        [ 0.1445,  0.0471,  0.1006,  ...,  0.0023,  0.0981, -0.0669],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.7826, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.0977, -0.0356,  0.0918,  ..., -0.1934, -0.1177,  0.0508],
        [ 0.0850, -0.0952,  0.1191,  ..., -0.1089,  0.0488, -0.1309],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.6909, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0713, -0.0903,  0.12

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.2793, -0.0148,  0.0679,  ...,  0.0649, -0.1240,  0.2061],
        [-0.1641,  0.0108,  0.0332,  ...,  0.0005,  0.2295, -0.0315],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.6520, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.1030, -0.1523,  0.0259,  ..., -0.1982, -0.1230,  0.0649],
        [ 0.0938,  0.0918, -0.0050,  ...,  0.0359, -0.1348,  0.0459],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.0274, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.2285, -0.0601,  0.13

tensor([[-0.1196,  0.2041, -0.2275,  ...,  0.2178,  0.1807, -0.0588],
        [ 0.1885, -0.1738,  0.1533,  ..., -0.2061,  0.0172, -0.0986],
        [ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.0752, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1167, -0.0801, -0.1924,  ..., -0.1035, -0.0090,  0.0796],
        [-0.1904,  0.1475,  0.0339,  ..., -0.0400,  0.0776,  0.0679],
        [-0.0967, -0.0264,  0.0903,  ..., -0.0197,  0.2139,  0.1367],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.3550, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1128, -0.0118,  0.11

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.1030, -0.1523,  0.0259,  ..., -0.1982, -0.1230,  0.0649],
        [ 0.1094,  0.1406, -0.0317,  ...,  0.0077,  0.1201, -0.1797],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.2721, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0251, -0.2363, -0.0403,  ..., -0.0491,  0.1221,  0.1895],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        [-0.0737,  0.2578, -0.1826,  ...,  0.1050,  0.1123,  0.0127],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.1794, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1582,  0.1963, -0.18

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.1030, -0.1523,  0.0259,  ..., -0.1982, -0.1230,  0.0649],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.4394, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1729,  0.2793,  0.1069,  ...,  0.1230,  0.1299, -0.1826],
        [-0.1260,  0.0254,  0.1670,  ...,  0.0698, -0.0850, -0.1553],
        [ 0.0260, -0.0019,  0.1855,  ..., -0.1216,  0.2217, -0.0220],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.4171, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1094,  0.1123,  0.19

tensor([[-0.1309, -0.0845, -0.0967,  ..., -0.1670, -0.0923,  0.3516],
        [ 0.1099, -0.0850,  0.1167,  ..., -0.0859,  0.0972, -0.1318],
        [-0.0903,  0.2520,  0.0552,  ..., -0.1328,  0.1118, -0.0613],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.0101, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0129, -0.0850,  0.0796,  ..., -0.0033,  0.0879,  0.2578],
        [ 0.1270,  0.2637, -0.0698,  ..., -0.1855, -0.0366, -0.2256],
        [-0.0118, -0.0474,  0.0447,  ...,  0.0713, -0.0349,  0.0242],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.9425, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1768,  0.1670,  0.00

tensor([[ 6.0547e-02,  1.4062e-01,  8.4473e-02,  ..., -2.4414e-01,
         -8.0566e-03, -1.8848e-01],
        [ 1.1182e-01,  2.3560e-02, -1.5039e-01,  ...,  9.4727e-02,
         -7.7148e-02,  8.0566e-03],
        [-6.8848e-02, -7.7148e-02,  8.8501e-03,  ...,  8.8379e-02,
          2.2411e-04, -5.5176e-02],
        ...,
        [ 0.0000e+00,  0.0000e+00,  0.0000e+00,  ...,  0.0000e+00,
          0.0000e+00,  0.0000e+00],
        [ 0.0000e+00,  0.0000e+00,  0.0000e+00,  ...,  0.0000e+00,
          0.0000e+00,  0.0000e+00],
        [ 0.0000e+00,  0.0000e+00,  0.0000e+00,  ...,  0.0000e+00,
          0.0000e+00,  0.0000e+00]])
tensor([2.3583, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0688,  0.3848, -0.1123,  ..., -0.0096,  0.1133,  0.3750],
        [-0.2891,  0.0957,  0.1826,  ..., -0.0101, -0.1973, -0.0031],
        [-0.1006, -0.0247,  0.0923,  ..., -0.1455,  0.2598,  0.0041],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000

tensor([[-0.0664,  0.1309,  0.0471,  ..., -0.2109,  0.0493,  0.0077],
        [ 0.1895,  0.1367, -0.0947,  ...,  0.0762,  0.0154, -0.0503],
        [-0.1260,  0.0254,  0.1670,  ...,  0.0698, -0.0850, -0.1553],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.8941, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1816,  0.1650, -0.1660,  ...,  0.1592,  0.1279,  0.0022],
        [ 0.0260, -0.0019,  0.1855,  ..., -0.1216,  0.2217, -0.0220],
        [-0.0476,  0.0815,  0.0457,  ..., -0.0557,  0.1050, -0.1084],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.4422, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([[ 0.0679,  0.1953,  0.1206,  ..., -0.2080, -0.0452, -0.1328],
        [ 0.1445,  0.0471,  0.1006,  ...,  0.0023,  0.0981, -0.0669],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.0865, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1729,  0.2793,  0.1069,  ...,  0.1230,  0.1299, -0.1826],
        [ 0.1660, -0.0820,  0.4512,  ..., -0.1504,  0.0913,  0.1631],
        [ 0.0261,  0.0144, -0.0344,  ...,  0.1562,  0.0996,  0.1270],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.1466, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.2119,  0.0248, -0.07

tensor([[ 0.2695,  0.0698,  0.1216,  ..., -0.0742,  0.0479,  0.1445],
        [ 0.1553,  0.1060,  0.0122,  ..., -0.1006, -0.0217,  0.0216],
        [ 0.2188, -0.0090, -0.1182,  ...,  0.0854, -0.0537, -0.0928],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.4354, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.1602,  ...,  0.1279,  0.1211, -0.2295],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.7173, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([[ 0.0747,  0.1221,  0.0144,  ...,  0.0884, -0.0564,  0.1201],
        [ 0.0742, -0.1650, -0.1079,  ..., -0.0986,  0.1182, -0.1885],
        [-0.0449, -0.0304,  0.0023,  ...,  0.0123, -0.0884, -0.0156],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.1269, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0605,  0.1406,  0.0845,  ..., -0.2441, -0.0081, -0.1885],
        [ 0.0170,  0.0173, -0.0417,  ..., -0.1924,  0.1777, -0.3047],
        [ 0.0388, -0.2168, -0.0535,  ..., -0.0908,  0.1611,  0.1279],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.7369, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0425,  0.2197, -0.13

tensor([[-0.1113,  0.1436,  0.1895,  ...,  0.0342,  0.1602, -0.2500],
        [-0.1006, -0.0247,  0.0923,  ..., -0.1455,  0.2598,  0.0041],
        [-0.0588, -0.1367, -0.1348,  ..., -0.0737, -0.0547, -0.2871],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.7627, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.3906,  0.0038, -0.1680,  ..., -0.0542, -0.0981, -0.0378],
        [-0.0850,  0.2363, -0.2715,  ...,  0.1572, -0.0574, -0.1494],
        [-0.0070, -0.0437, -0.1680,  ...,  0.1387,  0.2334,  0.0576],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.5818, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.0630, -0.1050, -0.0046,  ..., -0.1011, -0.0231, -0.1973],
        [-0.1396, -0.0347, -0.0537,  ..., -0.1182, -0.0025, -0.0723],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.7675, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2715,  0.2178, -0.2373,  ..., -0.2422,  0.0476, -0.0361],
        [ 0.2021, -0.0811,  0.1836,  ...,  0.0664,  0.0537, -0.1719],
        [ 0.1514,  0.2422,  0.0933,  ..., -0.0620,  0.0552, -0.1699],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.9801, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([[-0.0275,  0.0459,  0.3438,  ...,  0.1177,  0.1865,  0.0393],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        [-0.1270,  0.0220,  0.2871,  ..., -0.1016, -0.0903,  0.0884],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.1069, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.2930, -0.1660, -0.1108,  ..., -0.0107,  0.0243, -0.1206],
        [-0.0845, -0.0869, -0.0261,  ...,  0.1816,  0.1465, -0.1543],
        [ 0.1650,  0.0703,  0.0388,  ..., -0.0033,  0.1641, -0.1089],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.2728, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0080, -0.0262,  0.09

tensor([1.9506, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0654,  0.1270,  0.0923,  ...,  0.1475,  0.2490,  0.1113],
        [ 0.1094,  0.1406, -0.0317,  ...,  0.0077,  0.1201, -0.1797],
        [-0.0527,  0.0854,  0.0469,  ..., -0.1064,  0.2168, -0.2178],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.6757, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0605,  0.1406,  0.0845,  ..., -0.2441, -0.0081, -0.1885],
        [ 0.0605,  0.1406,  0.0845,  ..., -0.2441, -0.0081, -0.1885],
        [ 0.1104, -0.1235,  0.1406,  ..., -0.3770,  0.0300, -0.0840],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.0661, 0.0000], grad_fn

tensor([[-0.1011,  0.0177,  0.0147,  ..., -0.0835,  0.0056, -0.0178],
        [ 0.1230, -0.0461, -0.2021,  ..., -0.0913,  0.2891, -0.0292],
        [-0.0005,  0.1602,  0.0016,  ..., -0.0354,  0.0889, -0.3027],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.1637, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1797,  0.1865,  0.0009,  ...,  0.2695,  0.0576, -0.0996],
        [ 0.1875,  0.0157, -0.0586,  ..., -0.0815, -0.1709, -0.1543],
        [-0.0630, -0.0297,  0.1973,  ..., -0.2871, -0.0525,  0.0233],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.7365, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0381,  0.3457,  0.10

tensor([2.4574, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.2197,  0.0118, -0.0515,  ..., -0.2334, -0.0214, -0.0947],
        [ 0.1201, -0.0201,  0.2070,  ...,  0.2295, -0.2949,  0.0119],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.5088, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.3926,  0.1992, -0.0505,  ..., -0.2441, -0.1602,  0.4648],
        [ 0.1035,  0.1377, -0.0030,  ...,  0.0439, -0.1455,  0.0713],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.7219, 0.0000], grad_fn

tensor([[-0.1816, -0.0408, -0.0825,  ..., -0.0542,  0.0908, -0.0776],
        [ 0.0854, -0.1064, -0.1719,  ..., -0.1157, -0.0898,  0.1064],
        [-0.3652,  0.0413, -0.0625,  ..., -0.0344,  0.0613,  0.1719],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.9710, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.1602,  ...,  0.1279,  0.1211, -0.2295],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.4315, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0820,  0.0645,  0.12

tensor([[-0.0737, -0.1582, -0.1846,  ..., -0.0947, -0.1235, -0.0923],
        [-0.1816,  0.1650, -0.1660,  ...,  0.1592,  0.1279,  0.0022],
        [ 0.0679, -0.0413,  0.1001,  ...,  0.1045, -0.0854, -0.1543],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.5117, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1348,  0.1846,  0.1230,  ..., -0.1201,  0.3105,  0.2227],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([0.5020, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.3047,  0.1240, -0.26

tensor([[ 0.2158,  0.1216, -0.0249,  ...,  0.1167,  0.0405,  0.1182],
        [ 0.3184,  0.1768,  0.0586,  ..., -0.0981,  0.0525, -0.0023],
        [ 0.0393, -0.1963, -0.1064,  ..., -0.0757,  0.0466, -0.0840],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.9152, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1201, -0.0201,  0.2070,  ...,  0.2295, -0.2949,  0.0119],
        [-0.0586, -0.0376,  0.0728,  ..., -0.1079, -0.0864, -0.0320],
        [-0.0070, -0.0437, -0.1680,  ...,  0.1387,  0.2334,  0.0576],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.6177, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.16

tensor([3.1078, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1729,  0.2793,  0.1069,  ...,  0.1230,  0.1299, -0.1826],
        [-0.1816,  0.1650, -0.1660,  ...,  0.1592,  0.1279,  0.0022],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.2242, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2256, -0.0195,  0.0908,  ...,  0.0282, -0.1777, -0.0060],
        [-0.0259,  0.0977,  0.0090,  ..., -0.0256, -0.0762, -0.1279],
        [-0.0078, -0.0280,  0.0405,  ...,  0.0396, -0.0605,  0.0081],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.9057, 0.0000], grad_fn

tensor([[ 0.2285, -0.0601,  0.1396,  ...,  0.0483, -0.1436,  0.3262],
        [ 0.2812,  0.2539,  0.1128,  ...,  0.2412, -0.2539, -0.2598],
        [ 0.0938, -0.0933,  0.0544,  ..., -0.0928, -0.0245, -0.0850],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.6978, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2520, -0.0771, -0.0184,  ..., -0.3945, -0.0942,  0.0005],
        [ 0.0718,  0.2080, -0.0284,  ..., -0.1680, -0.0209, -0.1426],
        [ 0.0962,  0.1475,  0.0913,  ..., -0.0352,  0.0126, -0.0762],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.0672, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1729,  0.2793,  0.10

tensor([[-0.0535,  0.1309,  0.2656,  ..., -0.0042,  0.2197, -0.1777],
        [-0.0188, -0.1182, -0.1436,  ..., -0.0557,  0.1226, -0.1025],
        [ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.1010, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        [-0.1816,  0.1650, -0.1660,  ...,  0.1592,  0.1279,  0.0022],
        [ 0.0260, -0.0019,  0.1855,  ..., -0.1216,  0.2217, -0.0220],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.1834, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1768,  0.1670,  0.00

tensor([[ 0.0698, -0.0378, -0.0400,  ...,  0.0041,  0.0009, -0.1196],
        [ 0.1094,  0.1406, -0.0317,  ...,  0.0077,  0.1201, -0.1797],
        [-0.2070,  0.2031,  0.0420,  ...,  0.1387,  0.0369, -0.0287],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.0438, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.1030, -0.1523,  0.0259,  ..., -0.1982, -0.1230,  0.0649],
        [ 0.0884, -0.0317, -0.1226,  ...,  0.0234,  0.2480, -0.1177],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.3589, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1104, -0.1235,  0.14

tensor([[ 0.0215, -0.2119, -0.1172,  ..., -0.0903, -0.0544,  0.1797],
        [ 0.1094,  0.1406, -0.0317,  ...,  0.0077,  0.1201, -0.1797],
        [ 0.0605,  0.1406,  0.0845,  ..., -0.2441, -0.0081, -0.1885],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.6239, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2520, -0.0771, -0.0184,  ..., -0.3945, -0.0942,  0.0005],
        [-0.1934,  0.0226, -0.2266,  ...,  0.0972, -0.1069,  0.0194],
        [ 0.1387,  0.0294, -0.1865,  ...,  0.1006, -0.0991, -0.0317],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.6833, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1445, -0.0124,  0.11

tensor([[ 0.3652,  0.1455,  0.0344,  ..., -0.0417,  0.0835,  0.0459],
        [ 0.3145,  0.3672,  0.1514,  ...,  0.1040,  0.1226,  0.0688],
        [ 0.0166,  0.0457, -0.1191,  ...,  0.0165,  0.2637,  0.0845],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.5992, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.0581,  0.0581,  0.0133,  ..., -0.1748, -0.0231, -0.0435],
        [ 0.0996,  0.1338,  0.1050,  ..., -0.1504,  0.0918,  0.0825],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.3074, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0535,  0.1309,  0.26

tensor([3.1859, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0146,  0.3477,  0.0430,  ..., -0.1992,  0.0728,  0.0237],
        [-0.2266,  0.1533,  0.0889,  ..., -0.0182, -0.0522, -0.1089],
        [ 0.0493, -0.1001,  0.0067,  ..., -0.0248, -0.1592, -0.0228],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.5079, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.3711,  0.3789, -0.0957,  ..., -0.4199, -0.2002,  0.1562],
        [-0.2891,  0.3262,  0.1895,  ...,  0.1377,  0.0938, -0.1592],
        [ 0.0688, -0.1377, -0.1367,  ..., -0.2695,  0.1475, -0.2148],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.9074, 0.0000], grad_fn

tensor([[ 0.0605,  0.1406,  0.0845,  ..., -0.2441, -0.0081, -0.1885],
        [-0.1904,  0.1475,  0.0339,  ..., -0.0400,  0.0776,  0.0679],
        [-0.0640, -0.2207, -0.2021,  ..., -0.2295,  0.0186, -0.1514],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.0403, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2520, -0.0771, -0.0184,  ..., -0.3945, -0.0942,  0.0005],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        [-0.0112,  0.2051, -0.1289,  ...,  0.2314, -0.0820,  0.1108],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.0438, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0535,  0.1309,  0.26

tensor([[ 0.0605,  0.1406,  0.0845,  ..., -0.2441, -0.0081, -0.1885],
        [ 0.1895,  0.1367, -0.0947,  ...,  0.0762,  0.0154, -0.0503],
        [-0.2695,  0.1050,  0.1040,  ..., -0.0349,  0.0918,  0.1089],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.8601, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1855,  0.3223,  0.2520,  ..., -0.1367,  0.1621, -0.0771],
        [-0.1396, -0.0347, -0.0537,  ..., -0.1182, -0.0025, -0.0723],
        [ 0.1260,  0.1904,  0.0698,  ...,  0.0613,  0.1729, -0.0786],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.8499, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0605,  0.1406,  0.08

tensor([[-0.0986,  0.0547,  0.1836,  ..., -0.0344, -0.0537, -0.1016],
        [ 0.1904,  0.0972, -0.2676,  ...,  0.1494,  0.1128, -0.2832],
        [-0.0027, -0.0317, -0.1455,  ..., -0.1924,  0.2217,  0.2500],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.1827, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1396,  0.2314, -0.1309,  ...,  0.0732,  0.2949,  0.3008],
        [ 0.0405,  0.0625, -0.0175,  ..., -0.1562,  0.0019, -0.0698],
        [ 0.2773, -0.1069, -0.0747,  ...,  0.2109,  0.3457,  0.1631],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.2725, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1729,  0.2793,  0.10

tensor([[ 0.0605,  0.1406,  0.0845,  ..., -0.2441, -0.0081, -0.1885],
        [ 0.0117, -0.0967,  0.1689,  ..., -0.0630, -0.0737,  0.2812],
        [-0.1816,  0.1650, -0.1660,  ...,  0.1592,  0.1279,  0.0022],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.9101, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.0620,  0.1084, -0.0967,  ..., -0.2598,  0.0123, -0.0442],
        [-0.3145, -0.0879,  0.1816,  ...,  0.1846, -0.2471,  0.2354],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.4290, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.16

tensor([[-0.0129, -0.0850,  0.0796,  ..., -0.0033,  0.0879,  0.2578],
        [-0.1270,  0.0220,  0.2871,  ..., -0.1016, -0.0903,  0.0884],
        [-0.3672, -0.0344,  0.0498,  ...,  0.1279,  0.1504, -0.3203],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.7970, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1729,  0.2793,  0.1069,  ...,  0.1230,  0.1299, -0.1826],
        [-0.1270,  0.0220,  0.2871,  ..., -0.1016, -0.0903,  0.0884],
        [ 0.1118,  0.0236, -0.1504,  ...,  0.0947, -0.0771,  0.0081],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.1673, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0231,  0.1533,  0.15

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.0364, -0.0215, -0.0354,  ..., -0.0874,  0.0515,  0.0175],
        [ 0.0571, -0.0527, -0.1172,  ..., -0.0444,  0.0138, -0.0381],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.4759, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0129, -0.0850,  0.0796,  ..., -0.0033,  0.0879,  0.2578],
        [-0.2930,  0.2949,  0.0771,  ...,  0.1543,  0.2949,  0.2520],
        [ 0.1055,  0.0420, -0.0099,  ..., -0.3223,  0.2754, -0.2070],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.3156, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1030, -0.0087,  0.23

tensor([2.3393, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.1016,  0.1260,  0.0889,  ...,  0.0518,  0.0356, -0.0645],
        [ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.1372, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1011,  0.0177,  0.0147,  ..., -0.0835,  0.0056, -0.0178],
        [ 0.0654,  0.1035,  0.2314,  ...,  0.2178, -0.0479, -0.0096],
        [-0.0118, -0.0474,  0.0447,  ...,  0.0713, -0.0349,  0.0242],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.8796, 0.0000], grad_fn

tensor([[ 0.0850,  0.0962, -0.0272,  ...,  0.0693,  0.0194,  0.0742],
        [ 0.2637,  0.1914, -0.2637,  ..., -0.3066,  0.3184,  0.0581],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.0282, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.3496,  0.0138, -0.2012,  ..., -0.0566,  0.1855,  0.0747],
        [ 0.0260, -0.0019,  0.1855,  ..., -0.1216,  0.2217, -0.0220],
        [-0.0581,  0.0581,  0.0133,  ..., -0.1748, -0.0231, -0.0435],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.8124, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0055,  0.1030, -0.17

tensor([[-0.2266, -0.0156, -0.0593,  ..., -0.0957, -0.1621,  0.1758],
        [-0.0530,  0.2832,  0.2207,  ..., -0.1260,  0.0488, -0.0820],
        [-0.0825,  0.0225, -0.1494,  ..., -0.0312,  0.0444, -0.1475],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.1436, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.3945,  0.0461, -0.4258,  ..., -0.5664,  0.0640, -0.0114],
        [ 0.0703,  0.0869,  0.0879,  ..., -0.0476,  0.0145, -0.0625],
        [-0.0118, -0.0474,  0.0447,  ...,  0.0713, -0.0349,  0.0242],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.3300, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([[-0.0275,  0.0459,  0.3438,  ...,  0.1177,  0.1865,  0.0393],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        [-0.1445,  0.0128, -0.0303,  ..., -0.0613, -0.1309, -0.0166],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.9755, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0684,  0.0369, -0.1128,  ...,  0.0493,  0.0889,  0.0684],
        [ 0.0718,  0.2080, -0.0284,  ..., -0.1680, -0.0209, -0.1426],
        [-0.0581,  0.0581,  0.0133,  ..., -0.1748, -0.0231, -0.0435],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.3512, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0664,  0.1309,  0.04

tensor([[-0.1729,  0.2793,  0.1069,  ...,  0.1230,  0.1299, -0.1826],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        [ 0.0962, -0.0287, -0.1084,  ...,  0.0693,  0.1045, -0.1641],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.4696, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1699,  0.2012,  0.2051,  ...,  0.1797,  0.2119, -0.1865],
        [-0.0449, -0.0304,  0.0023,  ...,  0.0123, -0.0884, -0.0156],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.7864, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([[-0.0129, -0.0850,  0.0796,  ..., -0.0033,  0.0879,  0.2578],
        [-0.1963, -0.3848, -0.1582,  ...,  0.0913,  0.1436,  0.3965],
        [ 0.0703,  0.0869,  0.0879,  ..., -0.0476,  0.0145, -0.0625],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.4515, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        [-0.0075,  0.0082,  0.0737,  ...,  0.0325, -0.1182,  0.0776],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.5254, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.3828,  0.1426, -0.12

tensor([[-0.3496,  0.0138, -0.2012,  ..., -0.0566,  0.1855,  0.0747],
        [ 0.0260, -0.0019,  0.1855,  ..., -0.1216,  0.2217, -0.0220],
        [-0.1816, -0.1328,  0.0391,  ..., -0.2227,  0.1445,  0.1270],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.7831, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1729,  0.2793,  0.1069,  ...,  0.1230,  0.1299, -0.1826],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        [-0.1299, -0.0684, -0.0520,  ..., -0.2432, -0.0991,  0.0957],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.1339, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.3262,  0.18

tensor([[-0.0129, -0.0850,  0.0796,  ..., -0.0033,  0.0879,  0.2578],
        [-0.1328, -0.1943,  0.0718,  ...,  0.1973, -0.0903, -0.0698],
        [ 0.0703,  0.0869,  0.0879,  ..., -0.0476,  0.0145, -0.0625],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.7425, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1011,  0.0177,  0.0147,  ..., -0.0835,  0.0056, -0.0178],
        [ 0.0493, -0.1001,  0.0067,  ..., -0.0248, -0.1592, -0.0228],
        [-0.0474,  0.1875,  0.0023,  ..., -0.0036, -0.0625, -0.0557],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.2273, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1992,  0.2363,  0.08

tensor([[ 0.1504, -0.0566,  0.2012,  ..., -0.1035,  0.1001, -0.0283],
        [-0.0474,  0.1875,  0.0023,  ..., -0.0036, -0.0625, -0.0557],
        [ 0.1982,  0.1069, -0.0913,  ...,  0.0176, -0.1953, -0.0190],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.4813, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.3535, -0.2471,  0.2041,  ...,  0.1206, -0.2246, -0.1660],
        [-0.1338, -0.3301, -0.1221,  ..., -0.0291, -0.0618, -0.0771],
        [ 0.0513, -0.0369, -0.0034,  ..., -0.0693,  0.1777,  0.0544],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.1849, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([[ 0.0977, -0.0356,  0.0918,  ..., -0.1934, -0.1177,  0.0508],
        [-0.0557,  0.0089, -0.0923,  ...,  0.0032,  0.2871, -0.1416],
        [ 0.1445,  0.0471,  0.1006,  ...,  0.0023,  0.0981, -0.0669],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.6281, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.0581,  0.0581,  0.0133,  ..., -0.1748, -0.0231, -0.0435],
        [ 0.1641,  0.1924,  0.0923,  ..., -0.1582,  0.1377,  0.1138],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.5221, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0664,  0.1309,  0.04

tensor([2.9908, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2393, -0.1250, -0.2070,  ..., -0.0957,  0.0630, -0.1553],
        [-0.0535,  0.1309,  0.2656,  ..., -0.0042,  0.2197, -0.1777],
        [-0.0630, -0.0297,  0.1973,  ..., -0.2871, -0.0525,  0.0233],
        ...,
        [ 0.2002, -0.1543,  0.1455,  ..., -0.0786,  0.2598, -0.2217],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.5982, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0264,  0.0684, -0.0311,  ..., -0.1709,  0.1963, -0.0996],
        [ 0.0942, -0.0228,  0.0522,  ..., -0.0469,  0.1611, -0.1992],
        [ 0.0679, -0.0413,  0.1001,  ...,  0.1045, -0.0854, -0.1543],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.9643, 0.0000], grad_fn

tensor([[-0.1089, -0.0747, -0.0454,  ..., -0.3594,  0.0486,  0.1611],
        [-0.0359,  0.0996,  0.3516,  ..., -0.1699, -0.2559, -0.0581],
        [-0.0903,  0.1738,  0.1523,  ..., -0.3008,  0.0957, -0.2344],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.3393, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2061, -0.1270,  0.1289,  ..., -0.2031, -0.2617,  0.0718],
        [ 0.2041,  0.0132,  0.0757,  ..., -0.2119, -0.1328,  0.1084],
        [ 0.1533, -0.1118, -0.2334,  ..., -0.0104,  0.1099, -0.0043],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.7223, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.3086, -0.0669, -0.19

tensor([[ 0.0796, -0.0767, -0.1631,  ..., -0.1787, -0.0047, -0.0459],
        [-0.1729,  0.2793,  0.1069,  ...,  0.1230,  0.1299, -0.1826],
        [ 0.1885,  0.0072, -0.0518,  ...,  0.0471, -0.0090, -0.2734],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.8583, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0605,  0.1406,  0.0845,  ..., -0.2441, -0.0081, -0.1885],
        [-0.1738,  0.0240, -0.0302,  ..., -0.2520,  0.1533,  0.0879],
        [ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.0313, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0737, -0.1582, -0.18

tensor([[ 0.0605,  0.1406,  0.0845,  ..., -0.2441, -0.0081, -0.1885],
        [-0.0075,  0.0082,  0.0737,  ...,  0.0325, -0.1182,  0.0776],
        [ 0.0146,  0.3477,  0.0430,  ..., -0.1992,  0.0728,  0.0237],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.2953, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0364, -0.0215, -0.0354,  ..., -0.0874,  0.0515,  0.0175],
        [ 0.0332, -0.0898, -0.2949,  ..., -0.1270,  0.1611, -0.1602],
        [ 0.0693, -0.0525,  0.1631,  ...,  0.0481,  0.0383, -0.0830],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.4372, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0801,  0.1050,  0.04

tensor([[ 0.0562, -0.0277, -0.0204,  ...,  0.1113,  0.0332, -0.1406],
        [ 0.0405,  0.0625, -0.0175,  ..., -0.1562,  0.0019, -0.0698],
        [ 0.0405,  0.0625, -0.0175,  ..., -0.1562,  0.0019, -0.0698],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.7571, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1309, -0.0280, -0.2334,  ...,  0.0500,  0.1035, -0.1846],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        [-0.2383,  0.0092, -0.0435,  ...,  0.0245, -0.2148, -0.0167],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.3795, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0889,  0.1465,  0.11

tensor([[-0.2891,  0.1992,  0.1602,  ...,  0.1279,  0.1211, -0.2295],
        [-0.2070,  0.2031,  0.0420,  ...,  0.1387,  0.0369, -0.0287],
        [-0.0449, -0.0304,  0.0023,  ...,  0.0123, -0.0884, -0.0156],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.6464, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1396,  0.2314, -0.1309,  ...,  0.0732,  0.2949,  0.3008],
        [-0.1396,  0.2314, -0.1309,  ...,  0.0732,  0.2949,  0.3008],
        [-0.0566, -0.2969, -0.4648,  ..., -0.0215,  0.0400,  0.3164],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.3414, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1582,  0.1963, -0.18

tensor([[ 7.9102e-02, -5.0354e-03,  1.1182e-01,  ..., -6.7749e-03,
          4.2725e-02, -1.0352e-01],
        [-4.1748e-02, -4.3945e-02,  2.2656e-01,  ..., -1.6016e-01,
          2.6703e-04, -9.8633e-02],
        [ 3.3936e-02,  8.3496e-02, -1.2402e-01,  ...,  4.8828e-02,
         -2.8320e-01,  9.8145e-02],
        ...,
        [ 0.0000e+00,  0.0000e+00,  0.0000e+00,  ...,  0.0000e+00,
          0.0000e+00,  0.0000e+00],
        [ 0.0000e+00,  0.0000e+00,  0.0000e+00,  ...,  0.0000e+00,
          0.0000e+00,  0.0000e+00],
        [ 0.0000e+00,  0.0000e+00,  0.0000e+00,  ...,  0.0000e+00,
          0.0000e+00,  0.0000e+00]])
tensor([3.1120, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.1030, -0.1523,  0.0259,  ..., -0.1982, -0.1230,  0.0649],
        [ 0.1445,  0.0471,  0.1006,  ...,  0.0023,  0.0981, -0.0669],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000

tensor([[ 0.0786,  0.1318,  0.1895,  ..., -0.2236, -0.1011,  0.0339],
        [-0.0703,  0.0918,  0.1445,  ..., -0.2402, -0.0767,  0.0170],
        [-0.2285, -0.0884,  0.1279,  ..., -0.2129,  0.1885, -0.1455],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.5576, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.0962, -0.0287, -0.1084,  ...,  0.0693,  0.1045, -0.1641],
        [-0.0811,  0.1040, -0.2695,  ..., -0.2002,  0.2256, -0.1465],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.4224, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0129, -0.0850,  0.07

tensor([2.8578, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.1602,  ...,  0.1279,  0.1211, -0.2295],
        [-0.2070,  0.2031,  0.0420,  ...,  0.1387,  0.0369, -0.0287],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.0416, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.3262,  0.1895,  ...,  0.1377,  0.0938, -0.1592],
        [-0.0143,  0.2871, -0.1182,  ..., -0.1216,  0.1367, -0.0540],
        [ 0.0111, -0.1357,  0.1064,  ..., -0.0045, -0.1138,  0.0325],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.4446, 0.0000], grad_fn

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.0679,  0.0996,  0.1016,  ..., -0.1040,  0.2422, -0.0942],
        [ 0.0845, -0.0004,  0.0532,  ...,  0.0171,  0.0608, -0.1089],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.8883, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0535,  0.1309,  0.2656,  ..., -0.0042,  0.2197, -0.1777],
        [-0.0374, -0.2637, -0.1377,  ..., -0.0977,  0.0356,  0.0796],
        [ 0.0903,  0.1484, -0.0618,  ..., -0.2188,  0.1660,  0.1514],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.2260, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([[ 0.0015, -0.1445,  0.2461,  ..., -0.2148,  0.1050,  0.1235],
        [-0.1025, -0.0474,  0.2461,  ..., -0.0791,  0.1211,  0.0737],
        [ 0.0342, -0.3203,  0.1807,  ..., -0.1846, -0.0732, -0.0603],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.3589, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1465, -0.0620,  0.1138,  ..., -0.1973,  0.0535, -0.0320],
        [ 0.0864,  0.2578,  0.0281,  ..., -0.2715,  0.1729,  0.0422],
        [ 0.0942, -0.0228,  0.0522,  ..., -0.0469,  0.1611, -0.1992],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.9046, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1729,  0.2793,  0.10

tensor([[ 0.0605,  0.1406,  0.0845,  ..., -0.2441, -0.0081, -0.1885],
        [-0.1816,  0.1650, -0.1660,  ...,  0.1592,  0.1279,  0.0022],
        [-0.0586, -0.0376,  0.0728,  ..., -0.1079, -0.0864, -0.0320],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.1205, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0129, -0.0850,  0.0796,  ..., -0.0033,  0.0879,  0.2578],
        [-0.1455,  0.2480, -0.1514,  ..., -0.0029,  0.1436, -0.1279],
        [-0.2178, -0.0337,  0.0228,  ...,  0.0884,  0.0126,  0.1050],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.1157, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0275,  0.0459,  0.34

tensor([[-0.1289,  0.1191,  0.0267,  ...,  0.0066,  0.1543,  0.0605],
        [-0.1699,  0.2012,  0.2051,  ...,  0.1797,  0.2119, -0.1865],
        [ 0.0260, -0.0019,  0.1855,  ..., -0.1216,  0.2217, -0.0220],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.8075, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.1602,  ...,  0.1279,  0.1211, -0.2295],
        [-0.0356, -0.1338, -0.0732,  ...,  0.0295, -0.0850, -0.2236],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.0035, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0129, -0.0850,  0.07

tensor([[-0.2891,  0.1992,  0.1602,  ...,  0.1279,  0.1211, -0.2295],
        [ 0.0260, -0.0019,  0.1855,  ..., -0.1216,  0.2217, -0.0220],
        [ 0.1113,  0.1060, -0.0737,  ..., -0.0723,  0.0374, -0.1562],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.2247, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.0260, -0.0019,  0.1855,  ..., -0.1216,  0.2217, -0.0220],
        [ 0.0239, -0.0461,  0.0039,  ..., -0.2695, -0.0688, -0.2754],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.5712, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0275,  0.0459,  0.34

tensor([[ 0.0938,  0.3086, -0.1221,  ..., -0.0649,  0.0339,  0.3125],
        [ 0.0630,  0.1245,  0.1133,  ..., -0.0635,  0.1147,  0.0310],
        [ 0.1094,  0.1406, -0.0317,  ...,  0.0077,  0.1201, -0.1797],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.5849, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0508, -0.0933,  0.0649,  ..., -0.1689, -0.0415,  0.0082],
        [ 0.1641,  0.1885,  0.1416,  ..., -0.0713, -0.1021,  0.0145],
        [-0.0118, -0.0474,  0.0447,  ...,  0.0713, -0.0349,  0.0242],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.1163, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.3496,  0.0330,  0.00

tensor([[-0.0664, -0.0240,  0.0544,  ..., -0.1396,  0.0610, -0.2969],
        [ 0.0996,  0.1338,  0.1050,  ..., -0.1504,  0.0918,  0.0825],
        [-0.2100, -0.0084,  0.1729,  ...,  0.0576,  0.0728, -0.0605],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.6813, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0535,  0.1309,  0.2656,  ..., -0.0042,  0.2197, -0.1777],
        [-0.1011,  0.2041,  0.0150,  ..., -0.1123,  0.1240,  0.1592],
        [ 0.1030, -0.1523,  0.0259,  ..., -0.1982, -0.1230,  0.0649],
        ...,
        [ 0.0718,  0.2080, -0.0284,  ..., -0.1680, -0.0209, -0.1426],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([4.0300, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.3262,  0.18

tensor([[-0.1006, -0.0247,  0.0923,  ..., -0.1455,  0.2598,  0.0041],
        [-0.1709,  0.2100,  0.0216,  ..., -0.0249,  0.3066,  0.2715],
        [-0.1006, -0.0247,  0.0923,  ..., -0.1455,  0.2598,  0.0041],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.0321, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0664,  0.1309,  0.0471,  ..., -0.2109,  0.0493,  0.0077],
        [-0.1729,  0.2793,  0.1069,  ...,  0.1230,  0.1299, -0.1826],
        [-0.1289, -0.0530, -0.2988,  ..., -0.0486,  0.1816,  0.0815],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.1622, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1396,  0.2314, -0.13

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.1396, -0.0347, -0.0537,  ..., -0.1182, -0.0025, -0.0723],
        [-0.1011,  0.0177,  0.0147,  ..., -0.0835,  0.0056, -0.0178],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.9566, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1582,  0.1963, -0.1836,  ..., -0.5078,  0.0179,  0.1865],
        [ 0.1709,  0.0493,  0.0840,  ...,  0.1807,  0.2402,  0.4434],
        [ 0.1030, -0.0087,  0.2393,  ...,  0.0464,  0.1104, -0.1689],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.8305, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.2949,  0.4961, -0.00

tensor([[-0.1167, -0.0801, -0.1924,  ..., -0.1035, -0.0090,  0.0796],
        [-0.2451, -0.1562,  0.1001,  ..., -0.0879, -0.0081,  0.0496],
        [-0.2246,  0.0522, -0.1953,  ...,  0.0864, -0.0771,  0.1729],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.0799, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.0977, -0.0356,  0.0918,  ..., -0.1934, -0.1177,  0.0508],
        [-0.1572, -0.1074, -0.0315,  ..., -0.0483,  0.2100, -0.0518],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.7244, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.16

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.0239, -0.0461,  0.0039,  ..., -0.2695, -0.0688, -0.2754],
        [-0.0581,  0.0581,  0.0133,  ..., -0.1748, -0.0231, -0.0435],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.3263, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1167, -0.0801, -0.1924,  ..., -0.1035, -0.0090,  0.0796],
        [-0.0962, -0.1025,  0.0767,  ..., -0.0322,  0.3125, -0.2080],
        [-0.0549, -0.1172,  0.0278,  ..., -0.1865,  0.1562, -0.0649],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.8916, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1729,  0.2793,  0.10

tensor([[-0.4121,  0.3184,  0.1260,  ...,  0.0654,  0.2002, -0.2256],
        [-0.1504,  0.2305,  0.4004,  ..., -0.1807, -0.1816,  0.0099],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.9200, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0491, -0.2295,  0.1357,  ...,  0.0139,  0.0265, -0.0186],
        [-0.1309,  0.1562, -0.1885,  ...,  0.0121, -0.0366,  0.0089],
        [ 0.0260, -0.0019,  0.1855,  ..., -0.1216,  0.2217, -0.0220],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.3258, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1089, -0.0747, -0.04

tensor([[-0.0118, -0.1943,  0.2637,  ..., -0.1533, -0.1030, -0.2949],
        [-0.1157,  0.0613,  0.1514,  ..., -0.0776, -0.0608,  0.1953],
        [-0.1895,  0.1816,  0.3359,  ...,  0.1167,  0.0569,  0.1055],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.1038, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0188, -0.1182, -0.1436,  ..., -0.0557,  0.1226, -0.1025],
        [-0.0615, -0.0850, -0.1504,  ..., -0.0669, -0.0220,  0.0515],
        [ 0.1377, -0.1543,  0.1553,  ..., -0.2236,  0.0996, -0.0625],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.5316, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1699,  0.2012,  0.20

tensor([[-0.0425,  0.0092,  0.1631,  ..., -0.1309, -0.2227,  0.0253],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        [-0.1270,  0.0220,  0.2871,  ..., -0.1016, -0.0903,  0.0884],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.4333, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0557,  0.0089, -0.0923,  ...,  0.0032,  0.2871, -0.1416],
        [ 0.0183, -0.2100, -0.1426,  ...,  0.0593,  0.2324, -0.0864],
        [-0.0118, -0.0474,  0.0447,  ...,  0.0713, -0.0349,  0.0242],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.2120, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0605,  0.1406,  0.08

tensor([[ 0.3926,  0.1099, -0.1436,  ..., -0.0212, -0.1514,  0.2715],
        [ 0.1094,  0.1406, -0.0317,  ...,  0.0077,  0.1201, -0.1797],
        [-0.2070,  0.2031,  0.0420,  ...,  0.1387,  0.0369, -0.0287],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.2594, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0304, -0.2227, -0.2275,  ..., -0.0718,  0.0757,  0.0422],
        [-0.0583,  0.0679, -0.0540,  ...,  0.0845,  0.0231,  0.2432],
        [-0.1533, -0.1709, -0.0310,  ...,  0.0240, -0.3555, -0.2051],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.7873, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0535,  0.1309,  0.26

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.1260,  0.1279,  0.1963,  ..., -0.1484,  0.1904, -0.0391],
        [-0.0273,  0.0449,  0.0767,  ..., -0.1250,  0.1089, -0.1436],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.3581, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0231,  0.1533,  0.1523,  ...,  0.1445,  0.1328, -0.0859],
        [ 0.1641,  0.1875, -0.0410,  ...,  0.1089, -0.0102,  0.0208],
        [ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.3796, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0820,  0.2168, -0.12

tensor([[-0.1089, -0.0747, -0.0454,  ..., -0.3594,  0.0486,  0.1611],
        [-0.1855,  0.3223,  0.2520,  ..., -0.1367,  0.1621, -0.0771],
        [ 0.0977, -0.0356,  0.0918,  ..., -0.1934, -0.1177,  0.0508],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.9837, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0713, -0.0903,  0.1270,  ...,  0.0278,  0.1206, -0.1777],
        [ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.0581,  0.0581,  0.0133,  ..., -0.1748, -0.0231, -0.0435],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.2974, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1201,  0.2256,  0.15

tensor([[-0.0231,  0.1533,  0.1523,  ...,  0.1445,  0.1328, -0.0859],
        [ 0.1167, -0.0864,  0.0874,  ...,  0.1553, -0.0986, -0.1079],
        [ 0.0845, -0.0004,  0.0532,  ...,  0.0171,  0.0608, -0.1089],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.4137, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.1699, -0.2676,  0.1475,  ..., -0.0781, -0.0645,  0.0728],
        [ 0.1094,  0.1406, -0.0317,  ...,  0.0077,  0.1201, -0.1797],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.8389, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0022, -0.0178,  0.26

tensor([[-0.1621,  0.0869,  0.2012,  ..., -0.0840,  0.0449, -0.1797],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        [ 0.2891,  0.0698,  0.1621,  ..., -0.1245,  0.0215, -0.0437],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.4250, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.0679,  0.0996,  0.1016,  ..., -0.1040,  0.2422, -0.0942],
        [-0.2070,  0.2031,  0.0420,  ...,  0.1387,  0.0369, -0.0287],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.2163, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0129, -0.0850,  0.07

tensor([[ 0.2451, -0.0210, -0.0554,  ..., -0.0138,  0.0898, -0.1318],
        [ 0.1069, -0.1055,  0.0532,  ..., -0.1475, -0.0625,  0.0767],
        [-0.0184,  0.1709,  0.1108,  ..., -0.1348, -0.0162,  0.0167],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.5145, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.1602,  ...,  0.1279,  0.1211, -0.2295],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        [ 0.1260,  0.1904,  0.0698,  ...,  0.0613,  0.1729, -0.0786],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.1818, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0013, -0.0483, -0.28

tensor([[-0.2891,  0.3262,  0.1895,  ...,  0.1377,  0.0938, -0.1592],
        [-0.0581,  0.0581,  0.0133,  ..., -0.1748, -0.0231, -0.0435],
        [ 0.0850,  0.0962, -0.0272,  ...,  0.0693,  0.0194,  0.0742],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.4237, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.4121,  0.3184,  0.1260,  ...,  0.0654,  0.2002, -0.2256],
        [-0.0188, -0.1182, -0.1436,  ..., -0.0557,  0.1226, -0.1025],
        [-0.0449, -0.0304,  0.0023,  ...,  0.0123, -0.0884, -0.0156],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.1196, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.11

tensor([[ 0.0605,  0.1406,  0.0845,  ..., -0.2441, -0.0081, -0.1885],
        [-0.4121,  0.3184,  0.1260,  ...,  0.0654,  0.2002, -0.2256],
        [-0.1484, -0.2070, -0.2139,  ..., -0.0225,  0.2305, -0.0830],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.3195, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0562,  0.1230, -0.3496,  ...,  0.0294, -0.0260, -0.0415],
        [-0.1699,  0.2012,  0.2051,  ...,  0.1797,  0.2119, -0.1865],
        [ 0.1455,  0.0168,  0.0236,  ...,  0.0659,  0.0067,  0.0156],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.3649, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.16

tensor([[-0.2891,  0.3262,  0.1895,  ...,  0.1377,  0.0938, -0.1592],
        [ 0.1030, -0.1523,  0.0259,  ..., -0.1982, -0.1230,  0.0649],
        [ 0.1094,  0.1406, -0.0317,  ...,  0.0077,  0.1201, -0.1797],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.8199, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.3262,  0.1895,  ...,  0.1377,  0.0938, -0.1592],
        [-0.0581,  0.0581,  0.0133,  ..., -0.1748, -0.0231, -0.0435],
        [-0.2061, -0.1069, -0.2158,  ...,  0.2168,  0.0674,  0.1504],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.8825, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1729,  0.2793,  0.10

In [49]:
correct_count = 0
wrong_count = 0

for i in range(len(X_test_embeddings)):
    review = Variable(torch.Tensor(X_test_embeddings[i]))
    correct_label = 0 if y_test[i][0] == 1 else 1
    predictions = net.forward(review)

    # the model's prediction is the digit with the max probability ... how do we find that?
    value, prediction = predictions.max(0)

    if prediction == correct_label:
        correct_count += 1
    else:
        wrong_count += 1

print(correct_count, wrong_count)
print(correct_count / (correct_count + wrong_count))

tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [-0.1699, -0.2676,  0.1475,  ..., -0.0781, -0.0645,  0.0728],
        [ 0.1094,  0.1406, -0.0317,  ...,  0.0077,  0.1201, -0.1797],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.3376, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0376,  0.2031,  0.0226,  ...,  0.1396,  0.3047, -0.0674],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        [-0.1836,  0.2891,  0.2656,  ..., -0.1367, -0.3008,  0.1973],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.2158, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1729,  0.2793,  0.10

tensor([[-0.1631, -0.0242, -0.0962,  ...,  0.0796, -0.1494,  0.0618],
        [-0.2070,  0.2031,  0.0420,  ...,  0.1387,  0.0369, -0.0287],
        [ 0.1069, -0.0630, -0.4141,  ..., -0.3770,  0.0071, -0.1143],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.5277, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.1602,  ...,  0.1279,  0.1211, -0.2295],
        [ 0.1445,  0.0471,  0.1006,  ...,  0.0023,  0.0981, -0.0669],
        [ 0.0747,  0.0164,  0.0879,  ..., -0.0457,  0.0139, -0.0840],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.2049, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.1992,  0.16

tensor([3.3732, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1953, -0.0776,  0.0874,  ..., -0.1777,  0.0933, -0.0106],
        [ 0.1445,  0.0471,  0.1006,  ...,  0.0023,  0.0981, -0.0669],
        [ 0.1226, -0.0894,  0.0270,  ..., -0.0640, -0.0718, -0.1387],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.5940, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0781, -0.1128,  0.0187,  ..., -0.2090,  0.1631,  0.0172],
        [-0.0045, -0.1245,  0.0004,  ...,  0.0488,  0.0674,  0.1924],
        [ 0.1494,  0.0403, -0.0776,  ...,  0.0079,  0.0654, -0.2578],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.5872, 0.0000], grad_fn

tensor([[ 0.1367, -0.0046, -0.3184,  ...,  0.1143,  0.1582, -0.2383],
        [ 0.1455,  0.0168,  0.0236,  ...,  0.0659,  0.0067,  0.0156],
        [ 0.0703,  0.0869,  0.0879,  ..., -0.0476,  0.0145, -0.0625],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.2551, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0742,  0.0669,  0.0583,  ..., -0.0564, -0.0574, -0.3340],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.2734, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1689,  0.0259,  0.09

tensor([3.5540, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.3086, -0.1147,  0.2090,  ..., -0.1182,  0.0210, -0.2061],
        [ 0.1797, -0.0913, -0.1553,  ..., -0.1143, -0.0378, -0.1514],
        [ 0.1729, -0.1426,  0.0659,  ...,  0.3262, -0.1504, -0.1445],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.0449, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.2676,  0.0659, -0.2637,  ..., -0.3887,  0.1768, -0.0613],
        [ 0.1260,  0.1348, -0.0625,  ..., -0.1387,  0.2227, -0.2793],
        [ 0.0160,  0.0684, -0.1699,  ...,  0.0825, -0.0491,  0.0211],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.5511, 0.0000], grad_fn

tensor([2.3195, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.3906,  0.0038, -0.1680,  ..., -0.0542, -0.0981, -0.0378],
        [-0.2285, -0.0884,  0.1279,  ..., -0.2129,  0.1885, -0.1455],
        [-0.2207,  0.1113,  0.0337,  ...,  0.0967,  0.1084, -0.0566],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.0030, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.2041,  0.0132,  0.0757,  ..., -0.2119, -0.1328,  0.1084],
        [-0.1006, -0.0247,  0.0923,  ..., -0.1455,  0.2598,  0.0041],
        [-0.2891,  0.1992,  0.1602,  ...,  0.1279,  0.1211, -0.2295],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.2382, 0.0000], grad_fn

tensor([[ 0.1279, -0.0559,  0.0112,  ..., -0.1475,  0.0623,  0.1855],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        [-0.1270,  0.0220,  0.2871,  ..., -0.1016, -0.0903,  0.0884],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.2342, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1167, -0.0801, -0.1924,  ..., -0.1035, -0.0090,  0.0796],
        [-0.1699,  0.0596, -0.0845,  ..., -0.0879,  0.2656,  0.1641],
        [ 0.2021, -0.0811,  0.1836,  ...,  0.0664,  0.0537, -0.1719],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.0924, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1367,  0.1787,  0.09

tensor([[-0.1201,  0.2256,  0.1543,  ...,  0.1914,  0.0757,  0.0140],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        [ 0.0737,  0.0041, -0.1357,  ..., -0.1416, -0.1504, -0.1377],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.8743, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2520, -0.0771, -0.0184,  ..., -0.3945, -0.0942,  0.0005],
        [ 0.0239, -0.0461,  0.0039,  ..., -0.2695, -0.0688, -0.2754],
        [ 0.2021,  0.1138,  0.2412,  ..., -0.0752, -0.1631,  0.0291],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.2965, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.3262,  0.18

tensor([[-0.2891,  0.3262,  0.1895,  ...,  0.1377,  0.0938, -0.1592],
        [-0.1006, -0.0247,  0.0923,  ..., -0.1455,  0.2598,  0.0041],
        [ 0.1504,  0.0447, -0.0825,  ...,  0.0381,  0.2266,  0.0923],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.2608, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1079,  0.0120, -0.2061,  ..., -0.0525, -0.1475,  0.1846],
        [ 0.1445,  0.0471,  0.1006,  ...,  0.0023,  0.0981, -0.0669],
        [ 0.0393, -0.1963, -0.1064,  ..., -0.0757,  0.0466, -0.0840],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.9219, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1396,  0.1514, -0.21

tensor([3.7023, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0664,  0.1309,  0.0471,  ..., -0.2109,  0.0493,  0.0077],
        [ 0.0166,  0.0457, -0.1191,  ...,  0.0165,  0.2637,  0.0845],
        [-0.3496,  0.0138, -0.2012,  ..., -0.0566,  0.1855,  0.0747],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.9464, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0118, -0.1943,  0.2637,  ..., -0.1533, -0.1030, -0.2949],
        [ 0.1079,  0.0166,  0.0762,  ..., -0.3047, -0.1035,  0.0225],
        [ 0.2695,  0.0859,  0.0942,  ...,  0.1230, -0.0184, -0.1670],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.5200, 0.0000], grad_fn

tensor([[-0.1167, -0.0801, -0.1924,  ..., -0.1035, -0.0090,  0.0796],
        [-0.3047, -0.1230, -0.1836,  ..., -0.1055,  0.1406,  0.1475],
        [ 0.0166,  0.0457, -0.1191,  ...,  0.0165,  0.2637,  0.0845],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.8952, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1196,  0.0879,  0.0182,  ..., -0.2236,  0.0300,  0.1387],
        [ 0.1201, -0.0201,  0.2070,  ...,  0.2295, -0.2949,  0.0119],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.6698, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0055, -0.0112,  0.12

tensor([[-0.0449, -0.0304,  0.0023,  ...,  0.0123, -0.0884, -0.0156],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        [-0.1270,  0.0220,  0.2871,  ..., -0.1016, -0.0903,  0.0884],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.9079, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.2480,  0.2314,  0.0415,  ...,  0.0221,  0.1621,  0.1396],
        [-0.0908,  0.1113,  0.3340,  ...,  0.1177,  0.0693, -0.1348],
        [ 0.0942, -0.0228,  0.0522,  ..., -0.0469,  0.1611, -0.1992],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.1853, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.2559,  0.1934,  0.13

tensor([1.7033, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0605,  0.1406,  0.0845,  ..., -0.2441, -0.0081, -0.1885],
        [ 0.0679, -0.0413,  0.1001,  ...,  0.1045, -0.0854, -0.1543],
        [ 0.0063,  0.0193, -0.0898,  ..., -0.1611,  0.0012, -0.1064],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.8359, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0605,  0.1406,  0.0845,  ..., -0.2441, -0.0081, -0.1885],
        [-0.1738,  0.0240, -0.0302,  ..., -0.2520,  0.1533,  0.0879],
        [-0.2930, -0.0557, -0.0500,  ..., -0.1445,  0.1699,  0.0140],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.2071, 0.0000], grad_fn

tensor([3.4118, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.4570,  0.2598,  0.2793,  ...,  0.2412,  0.2129, -0.0649],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        [ 0.0669, -0.1797,  0.0187,  ...,  0.0325,  0.2793,  0.2451],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.5135, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0703,  0.0869,  0.0879,  ..., -0.0476,  0.0145, -0.0625],
        [-0.0977,  0.0571, -0.0092,  ..., -0.0271, -0.0114, -0.1914],
        [-0.0118, -0.0474,  0.0447,  ...,  0.0713, -0.0349,  0.0242],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.5924, 0.0000], grad_fn

tensor([3.4269, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.0378,  0.0381,  0.0298,  ..., -0.3379, -0.2734,  0.2773],
        [ 0.1030, -0.1523,  0.0259,  ..., -0.1982, -0.1230,  0.0649],
        [ 0.1094,  0.1406, -0.0317,  ...,  0.0077,  0.1201, -0.1797],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.2796, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2520, -0.0771, -0.0184,  ..., -0.3945, -0.0942,  0.0005],
        [ 0.1260,  0.1904,  0.0698,  ...,  0.0613,  0.1729, -0.0786],
        [ 0.1641, -0.1699, -0.2715,  ...,  0.0635,  0.1631,  0.1602],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.7706, 0.0000], grad_fn

tensor([[ 0.0605,  0.1406,  0.0845,  ..., -0.2441, -0.0081, -0.1885],
        [ 0.1348,  0.3711, -0.0240,  ..., -0.0243,  0.0442, -0.2051],
        [-0.0249,  0.0220, -0.0354,  ...,  0.0108, -0.0188, -0.0688],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.2880, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.1074, -0.2285,  0.0204,  ...,  0.0160,  0.0942, -0.0066],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.9627, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 3.6523e-01,  1.4551e-0

tensor([3.8058, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1729,  0.2793,  0.1069,  ...,  0.1230,  0.1299, -0.1826],
        [ 0.1045,  0.1035,  0.1387,  ...,  0.0913,  0.1992,  0.1504],
        [-0.1006, -0.0247,  0.0923,  ..., -0.1455,  0.2598,  0.0041],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.7547, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.3262,  0.1895,  ...,  0.1377,  0.0938, -0.1592],
        [-0.2227,  0.0588, -0.1748,  ..., -0.4746,  0.3535,  0.1079],
        [-0.0273,  0.0449,  0.0767,  ..., -0.1250,  0.1089, -0.1436],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.6993, 0.0000], grad_fn

tensor([3.4407, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0688,  0.1865,  0.0227,  ..., -0.0649, -0.0422,  0.1533],
        [ 0.0332, -0.0898, -0.2949,  ..., -0.1270,  0.1611, -0.1602],
        [ 0.1445,  0.0471,  0.1006,  ...,  0.0023,  0.0981, -0.0669],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.8538, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0605,  0.1406,  0.0845,  ..., -0.2441, -0.0081, -0.1885],
        [ 0.2285, -0.0601,  0.1396,  ...,  0.0483, -0.1436,  0.3262],
        [ 0.0850, -0.0952,  0.1191,  ..., -0.1089,  0.0488, -0.1309],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.7371, 0.0000], grad_fn

tensor([[ 0.0466,  0.0713, -0.1846,  ..., -0.0544, -0.0065, -0.3418],
        [-0.0121,  0.2949, -0.0801,  ..., -0.0032, -0.1445, -0.0554],
        [ 0.2285,  0.0452,  0.0952,  ..., -0.0806, -0.0840,  0.0161],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.1394, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1729,  0.2793,  0.1069,  ...,  0.1230,  0.1299, -0.1826],
        [-0.1641, -0.0618, -0.0542,  ..., -0.0330,  0.1934, -0.0593],
        [-0.0586, -0.0376,  0.0728,  ..., -0.1079, -0.0864, -0.0320],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.2243, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0215, -0.2119, -0.11

tensor([3.2978, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0605,  0.1406,  0.0845,  ..., -0.2441, -0.0081, -0.1885],
        [-0.0884,  0.3613, -0.0442,  ...,  0.1318,  0.2910, -0.3125],
        [ 0.0410,  0.0344,  0.2461,  ...,  0.3047, -0.1953, -0.2021],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.5918, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1699,  0.2012,  0.2051,  ...,  0.1797,  0.2119, -0.1865],
        [ 0.0962, -0.0287, -0.1084,  ...,  0.0693,  0.1045, -0.1641],
        [ 0.0070, -0.0732,  0.1719,  ...,  0.0112,  0.1641,  0.1069],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([4.0978, 0.0000], grad_fn

tensor([3.2094, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1729,  0.2793,  0.1069,  ...,  0.1230,  0.1299, -0.1826],
        [ 0.1641,  0.1924,  0.0923,  ..., -0.1582,  0.1377,  0.1138],
        [ 0.0679, -0.0413,  0.1001,  ...,  0.1045, -0.0854, -0.1543],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.6627, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0791, -0.0050,  0.1118,  ..., -0.0068,  0.0427, -0.1035],
        [ 0.0894,  0.1299,  0.2129,  ..., -0.1523,  0.0055, -0.1006],
        [ 0.1035,  0.1377, -0.0030,  ...,  0.0439, -0.1455,  0.0713],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([1.7228, 0.0000], grad_fn

tensor([[ 0.1147, -0.0508,  0.0674,  ..., -0.0864, -0.0566,  0.0815],
        [-0.1279,  0.2461, -0.0679,  ...,  0.2617,  0.0928, -0.1260],
        [-0.0078, -0.0280,  0.0405,  ...,  0.0396, -0.0605,  0.0081],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.0142, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.1060,  0.2139,  0.1187,  ...,  0.1069,  0.0237, -0.0354],
        [ 0.0962, -0.0287, -0.1084,  ...,  0.0693,  0.1045, -0.1641],
        [ 0.0718,  0.2080, -0.0284,  ..., -0.1680, -0.0209, -0.1426],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.6674, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.3398, -0.1797, -0.07

tensor([3.5218, 0.0000], grad_fn=<ReluBackward0>)
tensor([[ 0.0669, -0.1797,  0.0187,  ...,  0.0325,  0.2793,  0.2451],
        [ 0.0801,  0.1050,  0.0498,  ...,  0.0037,  0.0476, -0.0688],
        [-0.1011,  0.2041,  0.0150,  ..., -0.1123,  0.1240,  0.1592],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([2.8350, 0.0000], grad_fn=<ReluBackward0>)
tensor([[-0.2891,  0.3262,  0.1895,  ...,  0.1377,  0.0938, -0.1592],
        [-0.0581,  0.0581,  0.0133,  ..., -0.1748, -0.0231, -0.0435],
        [-0.2061, -0.1069, -0.2158,  ...,  0.2168,  0.0674,  0.1504],
        ...,
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000],
        [ 0.0000,  0.0000,  0.0000,  ...,  0.0000,  0.0000,  0.0000]])
tensor([3.3164, 0.0000], grad_fn