attn_weights tensor([[[[ 1.5886e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.1406e-01, -3.7227e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.2901e-01, -1.4754e+00, -1.3682e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-3.3851e-01, -1.9934e+00, -1.8157e+00, ..., -2.4630e+00, -3.4028e+38, -3.4028e+38], [-8.5572e-01, -1.6032e+00, -1.6190e+00, ..., -1.1067e+00, -5.2037e-01, -3.4028e+38], [-1.0739e+00, -4.1311e+00, -1.8456e+00, ..., -3.0839e+00, -2.9772e+00, -4.3772e+00]], [[ 4.9801e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.1083e+00, 3.8895e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.2395e+00, 3.3452e+00, 8.1080e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.3570e+00, 2.1203e+00, 4.3021e+00, ..., 8.6404e+00, -3.4028e+38, -3.4028e+38], [ 1.6422e+00, 1.6619e+00, 2.4619e+00, ..., 1.4925e+00, 9.3353e+00, -3.4028e+38], [-2.2587e+00, 3.7379e+00, -1.7587e+00, ..., -6.7492e+00, -5.7719e+00, 3.7754e+00]], [[-8.1685e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.4874e-01, -7.4014e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-4.5773e-01, -1.1369e+00, -1.5733e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-7.6691e-01, -1.5972e+00, -1.4952e+00, ..., -2.1660e+00, -3.4028e+38, -3.4028e+38], [-9.3493e-01, -1.7857e+00, -1.7580e+00, ..., -1.2111e+00, -2.3295e+00, -3.4028e+38], [-1.8281e+00, -5.9342e-01, -2.4992e+00, ..., -3.6709e+00, -4.1456e+00, -7.0534e-01]], ..., [[-4.5338e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-6.8989e-01, -1.3212e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-8.0877e-01, -1.2086e+00, -1.6255e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.4420e+00, -1.7200e+00, -1.9151e+00, ..., -3.6196e+00, -3.4028e+38, -3.4028e+38], [-1.5779e+00, -1.7665e+00, -1.9595e+00, ..., -1.7388e+00, -3.4492e+00, -3.4028e+38], [-1.2321e+00, -1.4967e+00, -1.5727e+00, ..., -2.4541e+00, -2.5550e+00, -1.7038e+00]], [[ 2.3908e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.0778e+00, 2.3298e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.9623e+00, 3.1252e+00, 3.9533e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.3894e+00, 1.9812e+00, 1.8545e+00, ..., 2.4025e+00, -3.4028e+38, -3.4028e+38], [ 1.2180e+00, 1.2443e+00, 7.9313e-01, ..., 2.0279e-01, 2.0380e+00, -3.4028e+38], [ 1.1238e+00, 1.1937e+00, 9.2528e-01, ..., -1.9060e-01, -2.1234e-01, 7.0923e-01]], [[-1.0287e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-8.5334e-01, -1.1953e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.3778e+00, -1.8176e+00, -3.0492e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.3321e+00, -1.9475e+00, -3.3753e+00, ..., -2.4721e+00, -3.4028e+38, -3.4028e+38], [-1.4442e+00, -2.4030e+00, -2.8946e+00, ..., -2.8746e+00, -1.9727e+00, -3.4028e+38], [-1.6640e+00, -2.2097e+00, -3.6145e+00, ..., -2.4098e+00, -2.0495e+00, -2.0280e+00]]], [[[ 1.5886e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.1406e-01, -3.7227e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.2901e-01, -1.4754e+00, -1.3682e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-3.3851e-01, -1.9934e+00, -1.8157e+00, ..., -2.4630e+00, -3.4028e+38, -3.4028e+38], [-8.5572e-01, -1.6032e+00, -1.6190e+00, ..., -1.1067e+00, -5.2037e-01, -3.4028e+38], [-1.0739e+00, -4.1311e+00, -1.8456e+00, ..., -3.0839e+00, -2.9772e+00, -4.3772e+00]], [[ 4.9801e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.1083e+00, 3.8895e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.2395e+00, 3.3452e+00, 8.1080e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.3570e+00, 2.1203e+00, 4.3021e+00, ..., 8.6404e+00, -3.4028e+38, -3.4028e+38], [ 1.6422e+00, 1.6619e+00, 2.4619e+00, ..., 1.4925e+00, 9.3353e+00, -3.4028e+38], [-2.2587e+00, 3.7379e+00, -1.7587e+00, ..., -6.7492e+00, -5.7719e+00, 3.7754e+00]], [[-8.1685e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.4874e-01, -7.4014e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-4.5773e-01, -1.1369e+00, -1.5733e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-7.6691e-01, -1.5972e+00, -1.4952e+00, ..., -2.1660e+00, -3.4028e+38, -3.4028e+38], [-9.3493e-01, -1.7857e+00, -1.7580e+00, ..., -1.2111e+00, -2.3295e+00, -3.4028e+38], [-1.8281e+00, -5.9342e-01, -2.4992e+00, ..., -3.6709e+00, -4.1456e+00, -7.0534e-01]], ..., [[-4.5338e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-6.8989e-01, -1.3212e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-8.0877e-01, -1.2086e+00, -1.6255e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.4420e+00, -1.7200e+00, -1.9151e+00, ..., -3.6196e+00, -3.4028e+38, -3.4028e+38], [-1.5779e+00, -1.7665e+00, -1.9595e+00, ..., -1.7388e+00, -3.4492e+00, -3.4028e+38], [-1.2321e+00, -1.4967e+00, -1.5727e+00, ..., -2.4541e+00, -2.5550e+00, -1.7038e+00]], [[ 2.3908e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.0778e+00, 2.3298e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.9623e+00, 3.1252e+00, 3.9533e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.3894e+00, 1.9812e+00, 1.8545e+00, ..., 2.4025e+00, -3.4028e+38, -3.4028e+38], [ 1.2180e+00, 1.2443e+00, 7.9313e-01, ..., 2.0279e-01, 2.0380e+00, -3.4028e+38], [ 1.1238e+00, 1.1937e+00, 9.2528e-01, ..., -1.9060e-01, -2.1234e-01, 7.0923e-01]], [[-1.0287e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-8.5334e-01, -1.1953e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.3778e+00, -1.8176e+00, -3.0492e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.3321e+00, -1.9475e+00, -3.3753e+00, ..., -2.4721e+00, -3.4028e+38, -3.4028e+38], [-1.4442e+00, -2.4030e+00, -2.8946e+00, ..., -2.8746e+00, -1.9727e+00, -3.4028e+38], [-1.6640e+00, -2.2097e+00, -3.6145e+00, ..., -2.4098e+00, -2.0495e+00, -2.0280e+00]]], [[[ 1.5886e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.1406e-01, -3.7227e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.2901e-01, -1.4754e+00, -1.3682e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-3.3851e-01, -1.9934e+00, -1.8157e+00, ..., -2.4630e+00, -3.4028e+38, -3.4028e+38], [-8.5572e-01, -1.6032e+00, -1.6190e+00, ..., -1.1067e+00, -5.2037e-01, -3.4028e+38], [-1.0739e+00, -4.1311e+00, -1.8456e+00, ..., -3.0839e+00, -2.9772e+00, -4.3772e+00]], [[ 4.9801e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.1083e+00, 3.8895e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.2395e+00, 3.3452e+00, 8.1080e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.3570e+00, 2.1203e+00, 4.3021e+00, ..., 8.6404e+00, -3.4028e+38, -3.4028e+38], [ 1.6422e+00, 1.6619e+00, 2.4619e+00, ..., 1.4925e+00, 9.3353e+00, -3.4028e+38], [-2.2587e+00, 3.7379e+00, -1.7587e+00, ..., -6.7492e+00, -5.7719e+00, 3.7754e+00]], [[-8.1685e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.4874e-01, -7.4014e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-4.5773e-01, -1.1369e+00, -1.5733e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-7.6691e-01, -1.5972e+00, -1.4952e+00, ..., -2.1660e+00, -3.4028e+38, -3.4028e+38], [-9.3493e-01, -1.7857e+00, -1.7580e+00, ..., -1.2111e+00, -2.3295e+00, -3.4028e+38], [-1.8281e+00, -5.9342e-01, -2.4992e+00, ..., -3.6709e+00, -4.1456e+00, -7.0534e-01]], ..., [[-4.5338e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-6.8989e-01, -1.3212e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-8.0877e-01, -1.2086e+00, -1.6255e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.4420e+00, -1.7200e+00, -1.9151e+00, ..., -3.6196e+00, -3.4028e+38, -3.4028e+38], [-1.5779e+00, -1.7665e+00, -1.9595e+00, ..., -1.7388e+00, -3.4492e+00, -3.4028e+38], [-1.2321e+00, -1.4967e+00, -1.5727e+00, ..., -2.4541e+00, -2.5550e+00, -1.7038e+00]], [[ 2.3908e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.0778e+00, 2.3298e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.9623e+00, 3.1252e+00, 3.9533e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.3894e+00, 1.9812e+00, 1.8545e+00, ..., 2.4025e+00, -3.4028e+38, -3.4028e+38], [ 1.2180e+00, 1.2443e+00, 7.9313e-01, ..., 2.0279e-01, 2.0380e+00, -3.4028e+38], [ 1.1238e+00, 1.1937e+00, 9.2528e-01, ..., -1.9060e-01, -2.1234e-01, 7.0923e-01]], [[-1.0287e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-8.5334e-01, -1.1953e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.3778e+00, -1.8176e+00, -3.0492e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.3321e+00, -1.9475e+00, -3.3753e+00, ..., -2.4721e+00, -3.4028e+38, -3.4028e+38], [-1.4442e+00, -2.4030e+00, -2.8946e+00, ..., -2.8746e+00, -1.9727e+00, -3.4028e+38], [-1.6640e+00, -2.2097e+00, -3.6145e+00, ..., -2.4098e+00, -2.0495e+00, -2.0280e+00]]], [[[ 1.5886e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.1406e-01, -3.7227e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.2901e-01, -1.4754e+00, -1.3682e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-3.3851e-01, -1.9934e+00, -1.8157e+00, ..., -2.4630e+00, -3.4028e+38, -3.4028e+38], [-8.5572e-01, -1.6032e+00, -1.6190e+00, ..., -1.1067e+00, -5.2037e-01, -3.4028e+38], [-1.0739e+00, -4.1311e+00, -1.8456e+00, ..., -3.0839e+00, -2.9772e+00, -4.3772e+00]], [[ 4.9801e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.1083e+00, 3.8895e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.2395e+00, 3.3452e+00, 8.1080e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.3570e+00, 2.1203e+00, 4.3021e+00, ..., 8.6404e+00, -3.4028e+38, -3.4028e+38], [ 1.6422e+00, 1.6619e+00, 2.4619e+00, ..., 1.4925e+00, 9.3353e+00, -3.4028e+38], [-2.2587e+00, 3.7379e+00, -1.7587e+00, ..., -6.7492e+00, -5.7719e+00, 3.7754e+00]], [[-8.1685e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.4874e-01, -7.4014e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-4.5773e-01, -1.1369e+00, -1.5733e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-7.6691e-01, -1.5972e+00, -1.4952e+00, ..., -2.1660e+00, -3.4028e+38, -3.4028e+38], [-9.3493e-01, -1.7857e+00, -1.7580e+00, ..., -1.2111e+00, -2.3295e+00, -3.4028e+38], [-1.8281e+00, -5.9342e-01, -2.4992e+00, ..., -3.6709e+00, -4.1456e+00, -7.0534e-01]], ..., [[-4.5338e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-6.8989e-01, -1.3212e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-8.0877e-01, -1.2086e+00, -1.6255e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.4420e+00, -1.7200e+00, -1.9151e+00, ..., -3.6196e+00, -3.4028e+38, -3.4028e+38], [-1.5779e+00, -1.7665e+00, -1.9595e+00, ..., -1.7388e+00, -3.4492e+00, -3.4028e+38], [-1.2321e+00, -1.4967e+00, -1.5727e+00, ..., -2.4541e+00, -2.5550e+00, -1.7038e+00]], [[ 2.3908e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.0778e+00, 2.3298e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.9623e+00, 3.1252e+00, 3.9533e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.3894e+00, 1.9812e+00, 1.8545e+00, ..., 2.4025e+00, -3.4028e+38, -3.4028e+38], [ 1.2180e+00, 1.2443e+00, 7.9313e-01, ..., 2.0279e-01, 2.0380e+00, -3.4028e+38], [ 1.1238e+00, 1.1937e+00, 9.2528e-01, ..., -1.9060e-01, -2.1234e-01, 7.0923e-01]], [[-1.0287e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-8.5334e-01, -1.1953e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.3778e+00, -1.8176e+00, -3.0492e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.3321e+00, -1.9475e+00, -3.3753e+00, ..., -2.4721e+00, -3.4028e+38, -3.4028e+38], [-1.4442e+00, -2.4030e+00, -2.8946e+00, ..., -2.8746e+00, -1.9727e+00, -3.4028e+38], [-1.6640e+00, -2.2097e+00, -3.6145e+00, ..., -2.4098e+00, -2.0495e+00, -2.0280e+00]]], [[[ 1.5886e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.1406e-01, -3.7227e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.2901e-01, -1.4754e+00, -1.3682e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-3.3851e-01, -1.9934e+00, -1.8157e+00, ..., -2.4630e+00, -3.4028e+38, -3.4028e+38], [-8.5572e-01, -1.6032e+00, -1.6190e+00, ..., -1.1067e+00, -5.2037e-01, -3.4028e+38], [-1.0739e+00, -4.1311e+00, -1.8456e+00, ..., -3.0839e+00, -2.9772e+00, -4.3772e+00]], [[ 4.9801e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.1083e+00, 3.8895e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.2395e+00, 3.3452e+00, 8.1080e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.3570e+00, 2.1203e+00, 4.3021e+00, ..., 8.6404e+00, -3.4028e+38, -3.4028e+38], [ 1.6422e+00, 1.6619e+00, 2.4619e+00, ..., 1.4925e+00, 9.3353e+00, -3.4028e+38], [-2.2587e+00, 3.7379e+00, -1.7587e+00, ..., -6.7492e+00, -5.7719e+00, 3.7754e+00]], [[-8.1685e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.4874e-01, -7.4014e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-4.5773e-01, -1.1369e+00, -1.5733e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-7.6691e-01, -1.5972e+00, -1.4952e+00, ..., -2.1660e+00, -3.4028e+38, -3.4028e+38], [-9.3493e-01, -1.7857e+00, -1.7580e+00, ..., -1.2111e+00, -2.3295e+00, -3.4028e+38], [-1.8281e+00, -5.9342e-01, -2.4992e+00, ..., -3.6709e+00, -4.1456e+00, -7.0534e-01]], ..., [[-4.5338e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-6.8989e-01, -1.3212e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-8.0877e-01, -1.2086e+00, -1.6255e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.4420e+00, -1.7200e+00, -1.9151e+00, ..., -3.6196e+00, -3.4028e+38, -3.4028e+38], [-1.5779e+00, -1.7665e+00, -1.9595e+00, ..., -1.7388e+00, -3.4492e+00, -3.4028e+38], [-1.2321e+00, -1.4967e+00, -1.5727e+00, ..., -2.4541e+00, -2.5550e+00, -1.7038e+00]], [[ 2.3908e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.0778e+00, 2.3298e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.9623e+00, 3.1252e+00, 3.9533e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.3894e+00, 1.9812e+00, 1.8545e+00, ..., 2.4025e+00, -3.4028e+38, -3.4028e+38], [ 1.2180e+00, 1.2443e+00, 7.9313e-01, ..., 2.0279e-01, 2.0380e+00, -3.4028e+38], [ 1.1238e+00, 1.1937e+00, 9.2528e-01, ..., -1.9060e-01, -2.1234e-01, 7.0923e-01]], [[-1.0287e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-8.5334e-01, -1.1953e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.3778e+00, -1.8176e+00, -3.0492e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.3321e+00, -1.9475e+00, -3.3753e+00, ..., -2.4721e+00, -3.4028e+38, -3.4028e+38], [-1.4442e+00, -2.4030e+00, -2.8946e+00, ..., -2.8746e+00, -1.9727e+00, -3.4028e+38], [-1.6640e+00, -2.2097e+00, -3.6145e+00, ..., -2.4098e+00, -2.0495e+00, -2.0280e+00]]]]) attn_weights tensor([[[[ 1.2823e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1981e+00, -1.2028e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.6485e+00, -4.8753e-01, -5.8615e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-6.7973e-01, -1.8233e+00, -1.7457e+00, ..., -9.1193e-01, -3.4028e+38, -3.4028e+38], [-2.1149e+00, -2.7591e+00, -2.0481e+00, ..., -1.2349e+00, -1.3748e+00, -3.4028e+38], [-1.4793e-01, -2.3528e+00, -5.1867e-01, ..., -5.7342e-01, 1.4240e-01, -7.4004e-01]], [[ 5.2174e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.3098e+00, -5.5193e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4165e-01, -3.6863e-01, -1.6412e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-2.3674e-01, -1.1929e+00, -1.5160e+00, ..., -1.6464e+00, -3.4028e+38, -3.4028e+38], [-9.3387e-01, -1.7905e+00, -1.9955e+00, ..., -2.0768e+00, -2.0107e+00, -3.4028e+38], [-8.0515e-03, -1.7177e+00, -1.5425e+00, ..., -1.6193e+00, -7.5606e-01, -2.6929e-01]], [[-9.5129e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-5.1648e-01, -3.9159e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.3196e+00, -3.3901e+00, -2.3023e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.8268e+00, -3.3415e+00, -2.5802e+00, ..., -2.8411e+00, -3.4028e+38, -3.4028e+38], [-2.1672e+00, -3.3389e+00, -2.7820e+00, ..., -2.9644e+00, -2.5428e+00, -3.4028e+38], [-2.2269e+00, -3.5804e+00, -2.9344e+00, ..., -3.0596e+00, -2.6335e+00, -1.7759e+00]], ..., [[-1.4098e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.9724e+00, -4.8375e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.5309e+00, -6.5884e-01, -7.6767e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.6823e+00, -3.5325e-01, -1.6668e-01, ..., -1.1548e+00, -3.4028e+38, -3.4028e+38], [ 1.3219e+00, -3.0234e-01, 7.9925e-02, ..., -8.3700e-01, -1.4604e+00, -3.4028e+38], [ 1.3191e+00, -5.0901e-01, -3.6811e-01, ..., -1.2528e+00, -1.2815e+00, -9.4165e-01]], [[-8.5641e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.9938e+00, -6.1290e-02, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.1440e+00, -9.2050e-01, -9.7892e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-6.4869e+00, -1.2307e+00, -1.2148e+00, ..., -9.2694e-01, -3.4028e+38, -3.4028e+38], [-6.1790e+00, -1.4306e+00, -1.4742e+00, ..., -1.1063e+00, -9.8613e-01, -3.4028e+38], [-5.8402e+00, -1.8115e+00, -1.7621e+00, ..., -1.3260e+00, -1.1715e+00, -1.2679e+00]], [[ 1.8292e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 9.5365e-01, -4.6707e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 8.0555e-01, 6.5082e-02, 2.3727e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 9.7184e-01, -8.8981e-03, -3.2301e+00, ..., 2.9439e+00, -3.4028e+38, -3.4028e+38], [ 1.6527e+00, 6.4238e-01, -1.3935e+00, ..., -9.6682e-01, 4.1661e+00, -3.4028e+38], [-6.2612e-01, -1.0668e+00, -1.7231e+00, ..., -2.6845e+00, -2.5670e+00, -1.1238e+00]]], [[[ 1.2823e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1981e+00, -1.2028e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.6485e+00, -4.8753e-01, -5.8615e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-6.7973e-01, -1.8233e+00, -1.7457e+00, ..., -9.1193e-01, -3.4028e+38, -3.4028e+38], [-2.1149e+00, -2.7591e+00, -2.0481e+00, ..., -1.2349e+00, -1.3748e+00, -3.4028e+38], [-1.4793e-01, -2.3528e+00, -5.1867e-01, ..., -5.7342e-01, 1.4240e-01, -7.4004e-01]], [[ 5.2174e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.3098e+00, -5.5193e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4165e-01, -3.6863e-01, -1.6412e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-2.3674e-01, -1.1929e+00, -1.5160e+00, ..., -1.6464e+00, -3.4028e+38, -3.4028e+38], [-9.3387e-01, -1.7905e+00, -1.9955e+00, ..., -2.0768e+00, -2.0107e+00, -3.4028e+38], [-8.0515e-03, -1.7177e+00, -1.5425e+00, ..., -1.6193e+00, -7.5606e-01, -2.6929e-01]], [[-9.5129e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-5.1648e-01, -3.9159e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.3196e+00, -3.3901e+00, -2.3023e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.8268e+00, -3.3415e+00, -2.5802e+00, ..., -2.8411e+00, -3.4028e+38, -3.4028e+38], [-2.1672e+00, -3.3389e+00, -2.7820e+00, ..., -2.9644e+00, -2.5428e+00, -3.4028e+38], [-2.2269e+00, -3.5804e+00, -2.9344e+00, ..., -3.0596e+00, -2.6335e+00, -1.7759e+00]], ..., [[-1.4098e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.9724e+00, -4.8375e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.5309e+00, -6.5884e-01, -7.6767e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.6823e+00, -3.5325e-01, -1.6668e-01, ..., -1.1548e+00, -3.4028e+38, -3.4028e+38], [ 1.3219e+00, -3.0234e-01, 7.9925e-02, ..., -8.3700e-01, -1.4604e+00, -3.4028e+38], [ 1.3191e+00, -5.0901e-01, -3.6811e-01, ..., -1.2528e+00, -1.2815e+00, -9.4165e-01]], [[-8.5641e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.9938e+00, -6.1290e-02, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.1440e+00, -9.2050e-01, -9.7892e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-6.4869e+00, -1.2307e+00, -1.2148e+00, ..., -9.2694e-01, -3.4028e+38, -3.4028e+38], [-6.1790e+00, -1.4306e+00, -1.4742e+00, ..., -1.1063e+00, -9.8613e-01, -3.4028e+38], [-5.8402e+00, -1.8115e+00, -1.7621e+00, ..., -1.3260e+00, -1.1715e+00, -1.2679e+00]], [[ 1.8292e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 9.5365e-01, -4.6707e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 8.0555e-01, 6.5082e-02, 2.3727e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 9.7184e-01, -8.8981e-03, -3.2301e+00, ..., 2.9439e+00, -3.4028e+38, -3.4028e+38], [ 1.6527e+00, 6.4238e-01, -1.3935e+00, ..., -9.6682e-01, 4.1661e+00, -3.4028e+38], [-6.2612e-01, -1.0668e+00, -1.7231e+00, ..., -2.6845e+00, -2.5670e+00, -1.1238e+00]]], [[[ 1.2823e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1981e+00, -1.2028e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.6485e+00, -4.8753e-01, -5.8615e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-6.7973e-01, -1.8233e+00, -1.7457e+00, ..., -9.1193e-01, -3.4028e+38, -3.4028e+38], [-2.1149e+00, -2.7591e+00, -2.0481e+00, ..., -1.2349e+00, -1.3748e+00, -3.4028e+38], [-1.4793e-01, -2.3528e+00, -5.1867e-01, ..., -5.7342e-01, 1.4240e-01, -7.4004e-01]], [[ 5.2174e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.3098e+00, -5.5193e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4165e-01, -3.6863e-01, -1.6412e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-2.3674e-01, -1.1929e+00, -1.5160e+00, ..., -1.6464e+00, -3.4028e+38, -3.4028e+38], [-9.3387e-01, -1.7905e+00, -1.9955e+00, ..., -2.0768e+00, -2.0107e+00, -3.4028e+38], [-8.0515e-03, -1.7177e+00, -1.5425e+00, ..., -1.6193e+00, -7.5606e-01, -2.6929e-01]], [[-9.5129e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-5.1648e-01, -3.9159e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.3196e+00, -3.3901e+00, -2.3023e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.8268e+00, -3.3415e+00, -2.5802e+00, ..., -2.8411e+00, -3.4028e+38, -3.4028e+38], [-2.1672e+00, -3.3389e+00, -2.7820e+00, ..., -2.9644e+00, -2.5428e+00, -3.4028e+38], [-2.2269e+00, -3.5804e+00, -2.9344e+00, ..., -3.0596e+00, -2.6335e+00, -1.7759e+00]], ..., [[-1.4098e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.9724e+00, -4.8375e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.5309e+00, -6.5884e-01, -7.6767e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.6823e+00, -3.5325e-01, -1.6668e-01, ..., -1.1548e+00, -3.4028e+38, -3.4028e+38], [ 1.3219e+00, -3.0234e-01, 7.9925e-02, ..., -8.3700e-01, -1.4604e+00, -3.4028e+38], [ 1.3191e+00, -5.0901e-01, -3.6811e-01, ..., -1.2528e+00, -1.2815e+00, -9.4165e-01]], [[-8.5641e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.9938e+00, -6.1290e-02, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.1440e+00, -9.2050e-01, -9.7892e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-6.4869e+00, -1.2307e+00, -1.2148e+00, ..., -9.2694e-01, -3.4028e+38, -3.4028e+38], [-6.1790e+00, -1.4306e+00, -1.4742e+00, ..., -1.1063e+00, -9.8613e-01, -3.4028e+38], [-5.8402e+00, -1.8115e+00, -1.7621e+00, ..., -1.3260e+00, -1.1715e+00, -1.2679e+00]], [[ 1.8292e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 9.5365e-01, -4.6707e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 8.0555e-01, 6.5082e-02, 2.3727e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 9.7184e-01, -8.8981e-03, -3.2301e+00, ..., 2.9439e+00, -3.4028e+38, -3.4028e+38], [ 1.6527e+00, 6.4238e-01, -1.3935e+00, ..., -9.6682e-01, 4.1661e+00, -3.4028e+38], [-6.2612e-01, -1.0668e+00, -1.7231e+00, ..., -2.6845e+00, -2.5670e+00, -1.1238e+00]]], [[[ 1.2823e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1981e+00, -1.2028e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.6485e+00, -4.8753e-01, -5.8615e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-6.7973e-01, -1.8233e+00, -1.7457e+00, ..., -9.1193e-01, -3.4028e+38, -3.4028e+38], [-2.1149e+00, -2.7591e+00, -2.0481e+00, ..., -1.2349e+00, -1.3748e+00, -3.4028e+38], [-1.4793e-01, -2.3528e+00, -5.1867e-01, ..., -5.7342e-01, 1.4240e-01, -7.4004e-01]], [[ 5.2174e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.3098e+00, -5.5193e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4165e-01, -3.6863e-01, -1.6412e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-2.3674e-01, -1.1929e+00, -1.5160e+00, ..., -1.6464e+00, -3.4028e+38, -3.4028e+38], [-9.3387e-01, -1.7905e+00, -1.9955e+00, ..., -2.0768e+00, -2.0107e+00, -3.4028e+38], [-8.0515e-03, -1.7177e+00, -1.5425e+00, ..., -1.6193e+00, -7.5606e-01, -2.6929e-01]], [[-9.5129e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-5.1648e-01, -3.9159e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.3196e+00, -3.3901e+00, -2.3023e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.8268e+00, -3.3415e+00, -2.5802e+00, ..., -2.8411e+00, -3.4028e+38, -3.4028e+38], [-2.1672e+00, -3.3389e+00, -2.7820e+00, ..., -2.9644e+00, -2.5428e+00, -3.4028e+38], [-2.2269e+00, -3.5804e+00, -2.9344e+00, ..., -3.0596e+00, -2.6335e+00, -1.7759e+00]], ..., [[-1.4098e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.9724e+00, -4.8375e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.5309e+00, -6.5884e-01, -7.6767e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.6823e+00, -3.5325e-01, -1.6668e-01, ..., -1.1548e+00, -3.4028e+38, -3.4028e+38], [ 1.3219e+00, -3.0234e-01, 7.9925e-02, ..., -8.3700e-01, -1.4604e+00, -3.4028e+38], [ 1.3191e+00, -5.0901e-01, -3.6811e-01, ..., -1.2528e+00, -1.2815e+00, -9.4165e-01]], [[-8.5641e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.9938e+00, -6.1290e-02, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.1440e+00, -9.2050e-01, -9.7892e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-6.4869e+00, -1.2307e+00, -1.2148e+00, ..., -9.2694e-01, -3.4028e+38, -3.4028e+38], [-6.1790e+00, -1.4306e+00, -1.4742e+00, ..., -1.1063e+00, -9.8613e-01, -3.4028e+38], [-5.8402e+00, -1.8115e+00, -1.7621e+00, ..., -1.3260e+00, -1.1715e+00, -1.2679e+00]], [[ 1.8292e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 9.5365e-01, -4.6707e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 8.0555e-01, 6.5082e-02, 2.3727e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 9.7184e-01, -8.8981e-03, -3.2301e+00, ..., 2.9439e+00, -3.4028e+38, -3.4028e+38], [ 1.6527e+00, 6.4238e-01, -1.3935e+00, ..., -9.6682e-01, 4.1661e+00, -3.4028e+38], [-6.2612e-01, -1.0668e+00, -1.7231e+00, ..., -2.6845e+00, -2.5670e+00, -1.1238e+00]]], [[[ 1.2823e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1981e+00, -1.2028e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.6485e+00, -4.8753e-01, -5.8615e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-6.7973e-01, -1.8233e+00, -1.7457e+00, ..., -9.1193e-01, -3.4028e+38, -3.4028e+38], [-2.1149e+00, -2.7591e+00, -2.0481e+00, ..., -1.2349e+00, -1.3748e+00, -3.4028e+38], [-1.4793e-01, -2.3528e+00, -5.1867e-01, ..., -5.7342e-01, 1.4240e-01, -7.4004e-01]], [[ 5.2174e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.3098e+00, -5.5193e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4165e-01, -3.6863e-01, -1.6412e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-2.3674e-01, -1.1929e+00, -1.5160e+00, ..., -1.6464e+00, -3.4028e+38, -3.4028e+38], [-9.3387e-01, -1.7905e+00, -1.9955e+00, ..., -2.0768e+00, -2.0107e+00, -3.4028e+38], [-8.0516e-03, -1.7177e+00, -1.5425e+00, ..., -1.6193e+00, -7.5606e-01, -2.6929e-01]], [[-9.5129e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-5.1648e-01, -3.9159e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.3196e+00, -3.3901e+00, -2.3023e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.8268e+00, -3.3415e+00, -2.5802e+00, ..., -2.8411e+00, -3.4028e+38, -3.4028e+38], [-2.1672e+00, -3.3389e+00, -2.7820e+00, ..., -2.9644e+00, -2.5428e+00, -3.4028e+38], [-2.2269e+00, -3.5804e+00, -2.9344e+00, ..., -3.0596e+00, -2.6335e+00, -1.7759e+00]], ..., [[-1.4098e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.9724e+00, -4.8375e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.5309e+00, -6.5884e-01, -7.6767e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.6823e+00, -3.5325e-01, -1.6668e-01, ..., -1.1548e+00, -3.4028e+38, -3.4028e+38], [ 1.3219e+00, -3.0234e-01, 7.9926e-02, ..., -8.3700e-01, -1.4604e+00, -3.4028e+38], [ 1.3191e+00, -5.0901e-01, -3.6811e-01, ..., -1.2528e+00, -1.2815e+00, -9.4165e-01]], [[-8.5641e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.9938e+00, -6.1289e-02, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.1440e+00, -9.2050e-01, -9.7892e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-6.4869e+00, -1.2307e+00, -1.2148e+00, ..., -9.2694e-01, -3.4028e+38, -3.4028e+38], [-6.1790e+00, -1.4306e+00, -1.4742e+00, ..., -1.1063e+00, -9.8613e-01, -3.4028e+38], [-5.8402e+00, -1.8115e+00, -1.7621e+00, ..., -1.3260e+00, -1.1715e+00, -1.2679e+00]], [[ 1.8292e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 9.5365e-01, -4.6707e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 8.0555e-01, 6.5082e-02, 2.3727e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 9.7184e-01, -8.8983e-03, -3.2301e+00, ..., 2.9439e+00, -3.4028e+38, -3.4028e+38], [ 1.6527e+00, 6.4237e-01, -1.3935e+00, ..., -9.6682e-01, 4.1661e+00, -3.4028e+38], [-6.2612e-01, -1.0668e+00, -1.7231e+00, ..., -2.6845e+00, -2.5670e+00, -1.1238e+00]]]]) attn_weights tensor([[[[ 1.3748e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.6654e-01, -3.3128e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.3153e+00, -3.2569e+00, -2.7809e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.4341e+00, -3.5812e+00, -2.6179e+00, ..., -4.1122e+00, -3.4028e+38, -3.4028e+38], [-1.3845e+00, -3.4265e+00, -2.2172e+00, ..., -2.7752e+00, -3.8452e+00, -3.4028e+38], [-1.5200e+00, -4.4548e+00, -2.1332e+00, ..., -3.4747e+00, -3.7491e+00, -3.1071e+00]], [[-6.3877e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.1421e+00, -1.5785e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.9012e+00, -6.6309e-01, -3.1614e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.2875e+00, -1.1435e+00, -2.6240e+00, ..., -9.5481e-01, -3.4028e+38, -3.4028e+38], [ 1.3192e+00, -1.2463e+00, -1.9914e+00, ..., -1.1514e+00, -1.8577e+00, -3.4028e+38], [ 1.6156e+00, -3.6972e-01, -1.4811e+00, ..., -9.1212e-01, -2.0355e+00, -8.8567e-01]], [[-8.8605e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 7.5355e-01, -5.6728e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-4.3371e+00, -3.6768e+00, -7.3714e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-5.9483e+00, -6.1223e+00, -6.7826e+00, ..., -6.1076e+00, -3.4028e+38, -3.4028e+38], [-5.5088e+00, -7.5049e+00, -5.9768e+00, ..., -3.4767e+00, -5.5521e+00, -3.4028e+38], [-8.0000e+00, -1.2842e+01, -9.0073e+00, ..., -6.9437e+00, -5.1912e+00, -5.5434e+00]], ..., [[-8.3518e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.5486e+00, -3.6403e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.3697e+00, -4.5553e+00, -5.3841e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-3.5115e+00, -4.7484e+00, -3.6419e+00, ..., -3.4534e+00, -3.4028e+38, -3.4028e+38], [-4.3902e+00, -5.9234e+00, -5.0463e+00, ..., -2.5518e+00, -4.7106e+00, -3.4028e+38], [-4.7555e+00, -8.3231e+00, -6.2912e+00, ..., -3.3778e+00, -2.5709e+00, -4.3723e+00]], [[ 4.2285e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-4.8483e-01, -3.1191e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-9.4446e-01, -3.0129e+00, -2.6438e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.1266e+00, -3.0494e+00, -2.7580e+00, ..., -1.7309e+00, -3.4028e+38, -3.4028e+38], [-8.3933e-01, -2.8693e+00, -2.5396e+00, ..., -1.6617e+00, -1.3670e+00, -3.4028e+38], [-1.2489e+00, -3.3855e+00, -2.9559e+00, ..., -2.0913e+00, -2.0099e+00, -2.2985e+00]], [[-7.9506e-02, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.2294e+00, -4.5237e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.1646e+00, -4.1651e+00, -3.6994e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-9.0788e-01, -4.2754e+00, -3.8699e+00, ..., -3.0398e+00, -3.4028e+38, -3.4028e+38], [-9.7489e-01, -4.4548e+00, -4.1134e+00, ..., -3.3533e+00, -3.1403e+00, -3.4028e+38], [-9.7120e-01, -4.9190e+00, -4.3547e+00, ..., -3.5138e+00, -3.2427e+00, -3.2375e+00]]], [[[ 1.3748e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.6654e-01, -3.3128e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.3153e+00, -3.2569e+00, -2.7809e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.4341e+00, -3.5812e+00, -2.6179e+00, ..., -4.1122e+00, -3.4028e+38, -3.4028e+38], [-1.3845e+00, -3.4265e+00, -2.2172e+00, ..., -2.7752e+00, -3.8452e+00, -3.4028e+38], [-1.5200e+00, -4.4548e+00, -2.1332e+00, ..., -3.4747e+00, -3.7491e+00, -3.1071e+00]], [[-6.3877e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.1421e+00, -1.5785e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.9012e+00, -6.6309e-01, -3.1614e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.2875e+00, -1.1435e+00, -2.6240e+00, ..., -9.5481e-01, -3.4028e+38, -3.4028e+38], [ 1.3192e+00, -1.2463e+00, -1.9914e+00, ..., -1.1514e+00, -1.8577e+00, -3.4028e+38], [ 1.6156e+00, -3.6972e-01, -1.4811e+00, ..., -9.1212e-01, -2.0355e+00, -8.8567e-01]], [[-8.8605e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 7.5355e-01, -5.6728e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-4.3371e+00, -3.6768e+00, -7.3714e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-5.9483e+00, -6.1223e+00, -6.7826e+00, ..., -6.1076e+00, -3.4028e+38, -3.4028e+38], [-5.5088e+00, -7.5049e+00, -5.9768e+00, ..., -3.4767e+00, -5.5521e+00, -3.4028e+38], [-8.0000e+00, -1.2842e+01, -9.0073e+00, ..., -6.9437e+00, -5.1912e+00, -5.5434e+00]], ..., [[-8.3518e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.5486e+00, -3.6403e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.3697e+00, -4.5553e+00, -5.3841e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-3.5115e+00, -4.7484e+00, -3.6419e+00, ..., -3.4534e+00, -3.4028e+38, -3.4028e+38], [-4.3902e+00, -5.9234e+00, -5.0463e+00, ..., -2.5518e+00, -4.7106e+00, -3.4028e+38], [-4.7555e+00, -8.3231e+00, -6.2912e+00, ..., -3.3778e+00, -2.5709e+00, -4.3723e+00]], [[ 4.2285e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-4.8483e-01, -3.1191e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-9.4446e-01, -3.0129e+00, -2.6438e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.1266e+00, -3.0494e+00, -2.7580e+00, ..., -1.7309e+00, -3.4028e+38, -3.4028e+38], [-8.3933e-01, -2.8693e+00, -2.5396e+00, ..., -1.6617e+00, -1.3670e+00, -3.4028e+38], [-1.2489e+00, -3.3855e+00, -2.9559e+00, ..., -2.0913e+00, -2.0099e+00, -2.2985e+00]], [[-7.9506e-02, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.2294e+00, -4.5237e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.1646e+00, -4.1651e+00, -3.6994e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-9.0788e-01, -4.2754e+00, -3.8699e+00, ..., -3.0398e+00, -3.4028e+38, -3.4028e+38], [-9.7489e-01, -4.4548e+00, -4.1134e+00, ..., -3.3533e+00, -3.1403e+00, -3.4028e+38], [-9.7120e-01, -4.9190e+00, -4.3547e+00, ..., -3.5138e+00, -3.2427e+00, -3.2375e+00]]], [[[ 1.3748e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.6654e-01, -3.3128e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.3153e+00, -3.2569e+00, -2.7809e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.4341e+00, -3.5812e+00, -2.6179e+00, ..., -4.1122e+00, -3.4028e+38, -3.4028e+38], [-1.3845e+00, -3.4265e+00, -2.2172e+00, ..., -2.7752e+00, -3.8452e+00, -3.4028e+38], [-1.5200e+00, -4.4548e+00, -2.1332e+00, ..., -3.4747e+00, -3.7491e+00, -3.1071e+00]], [[-6.3877e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.1421e+00, -1.5785e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.9012e+00, -6.6309e-01, -3.1614e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.2875e+00, -1.1435e+00, -2.6240e+00, ..., -9.5481e-01, -3.4028e+38, -3.4028e+38], [ 1.3192e+00, -1.2463e+00, -1.9914e+00, ..., -1.1514e+00, -1.8577e+00, -3.4028e+38], [ 1.6156e+00, -3.6972e-01, -1.4811e+00, ..., -9.1212e-01, -2.0355e+00, -8.8567e-01]], [[-8.8605e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 7.5355e-01, -5.6728e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-4.3371e+00, -3.6768e+00, -7.3714e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-5.9483e+00, -6.1223e+00, -6.7826e+00, ..., -6.1076e+00, -3.4028e+38, -3.4028e+38], [-5.5088e+00, -7.5049e+00, -5.9768e+00, ..., -3.4767e+00, -5.5521e+00, -3.4028e+38], [-8.0000e+00, -1.2842e+01, -9.0073e+00, ..., -6.9437e+00, -5.1912e+00, -5.5434e+00]], ..., [[-8.3518e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.5486e+00, -3.6403e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.3697e+00, -4.5553e+00, -5.3841e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-3.5115e+00, -4.7484e+00, -3.6419e+00, ..., -3.4534e+00, -3.4028e+38, -3.4028e+38], [-4.3902e+00, -5.9234e+00, -5.0463e+00, ..., -2.5518e+00, -4.7106e+00, -3.4028e+38], [-4.7555e+00, -8.3231e+00, -6.2912e+00, ..., -3.3778e+00, -2.5709e+00, -4.3723e+00]], [[ 4.2285e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-4.8483e-01, -3.1191e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-9.4446e-01, -3.0129e+00, -2.6438e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.1266e+00, -3.0494e+00, -2.7580e+00, ..., -1.7309e+00, -3.4028e+38, -3.4028e+38], [-8.3933e-01, -2.8693e+00, -2.5396e+00, ..., -1.6617e+00, -1.3670e+00, -3.4028e+38], [-1.2489e+00, -3.3855e+00, -2.9559e+00, ..., -2.0913e+00, -2.0099e+00, -2.2985e+00]], [[-7.9506e-02, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.2294e+00, -4.5237e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.1646e+00, -4.1651e+00, -3.6994e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-9.0788e-01, -4.2754e+00, -3.8699e+00, ..., -3.0398e+00, -3.4028e+38, -3.4028e+38], [-9.7489e-01, -4.4548e+00, -4.1134e+00, ..., -3.3533e+00, -3.1403e+00, -3.4028e+38], [-9.7120e-01, -4.9190e+00, -4.3547e+00, ..., -3.5138e+00, -3.2427e+00, -3.2375e+00]]], [[[ 1.3748e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.6654e-01, -3.3128e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.3153e+00, -3.2569e+00, -2.7809e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.4341e+00, -3.5812e+00, -2.6179e+00, ..., -4.1122e+00, -3.4028e+38, -3.4028e+38], [-1.3845e+00, -3.4265e+00, -2.2172e+00, ..., -2.7752e+00, -3.8452e+00, -3.4028e+38], [-1.5200e+00, -4.4548e+00, -2.1332e+00, ..., -3.4747e+00, -3.7491e+00, -3.1071e+00]], [[-6.3877e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.1421e+00, -1.5785e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.9012e+00, -6.6309e-01, -3.1614e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.2875e+00, -1.1435e+00, -2.6240e+00, ..., -9.5481e-01, -3.4028e+38, -3.4028e+38], [ 1.3192e+00, -1.2463e+00, -1.9914e+00, ..., -1.1514e+00, -1.8577e+00, -3.4028e+38], [ 1.6156e+00, -3.6972e-01, -1.4811e+00, ..., -9.1212e-01, -2.0355e+00, -8.8567e-01]], [[-8.8605e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 7.5355e-01, -5.6728e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-4.3371e+00, -3.6768e+00, -7.3714e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-5.9483e+00, -6.1223e+00, -6.7826e+00, ..., -6.1076e+00, -3.4028e+38, -3.4028e+38], [-5.5088e+00, -7.5049e+00, -5.9768e+00, ..., -3.4767e+00, -5.5521e+00, -3.4028e+38], [-8.0000e+00, -1.2842e+01, -9.0073e+00, ..., -6.9437e+00, -5.1912e+00, -5.5434e+00]], ..., [[-8.3518e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.5486e+00, -3.6403e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.3697e+00, -4.5553e+00, -5.3841e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-3.5115e+00, -4.7484e+00, -3.6419e+00, ..., -3.4534e+00, -3.4028e+38, -3.4028e+38], [-4.3902e+00, -5.9234e+00, -5.0463e+00, ..., -2.5518e+00, -4.7106e+00, -3.4028e+38], [-4.7555e+00, -8.3231e+00, -6.2912e+00, ..., -3.3778e+00, -2.5709e+00, -4.3723e+00]], [[ 4.2285e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-4.8483e-01, -3.1191e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-9.4446e-01, -3.0129e+00, -2.6438e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.1266e+00, -3.0494e+00, -2.7580e+00, ..., -1.7309e+00, -3.4028e+38, -3.4028e+38], [-8.3933e-01, -2.8693e+00, -2.5396e+00, ..., -1.6617e+00, -1.3670e+00, -3.4028e+38], [-1.2489e+00, -3.3855e+00, -2.9559e+00, ..., -2.0913e+00, -2.0099e+00, -2.2985e+00]], [[-7.9506e-02, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.2294e+00, -4.5237e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.1646e+00, -4.1651e+00, -3.6994e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-9.0788e-01, -4.2754e+00, -3.8699e+00, ..., -3.0398e+00, -3.4028e+38, -3.4028e+38], [-9.7489e-01, -4.4548e+00, -4.1134e+00, ..., -3.3533e+00, -3.1403e+00, -3.4028e+38], [-9.7120e-01, -4.9190e+00, -4.3547e+00, ..., -3.5138e+00, -3.2427e+00, -3.2375e+00]]], [[[ 1.3748e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.6654e-01, -3.3128e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.3153e+00, -3.2569e+00, -2.7809e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.4341e+00, -3.5812e+00, -2.6179e+00, ..., -4.1122e+00, -3.4028e+38, -3.4028e+38], [-1.3845e+00, -3.4265e+00, -2.2172e+00, ..., -2.7752e+00, -3.8452e+00, -3.4028e+38], [-1.5200e+00, -4.4548e+00, -2.1332e+00, ..., -3.4747e+00, -3.7491e+00, -3.1071e+00]], [[-6.3877e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.1421e+00, -1.5785e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.9012e+00, -6.6309e-01, -3.1614e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.2875e+00, -1.1435e+00, -2.6240e+00, ..., -9.5480e-01, -3.4028e+38, -3.4028e+38], [ 1.3192e+00, -1.2463e+00, -1.9914e+00, ..., -1.1514e+00, -1.8577e+00, -3.4028e+38], [ 1.6156e+00, -3.6972e-01, -1.4811e+00, ..., -9.1212e-01, -2.0355e+00, -8.8567e-01]], [[-8.8605e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 7.5356e-01, -5.6728e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-4.3371e+00, -3.6768e+00, -7.3714e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-5.9483e+00, -6.1223e+00, -6.7826e+00, ..., -6.1076e+00, -3.4028e+38, -3.4028e+38], [-5.5088e+00, -7.5049e+00, -5.9768e+00, ..., -3.4767e+00, -5.5521e+00, -3.4028e+38], [-8.0000e+00, -1.2842e+01, -9.0073e+00, ..., -6.9437e+00, -5.1912e+00, -5.5434e+00]], ..., [[-8.3518e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.5486e+00, -3.6403e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.3697e+00, -4.5553e+00, -5.3841e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-3.5115e+00, -4.7484e+00, -3.6419e+00, ..., -3.4534e+00, -3.4028e+38, -3.4028e+38], [-4.3902e+00, -5.9234e+00, -5.0463e+00, ..., -2.5518e+00, -4.7106e+00, -3.4028e+38], [-4.7555e+00, -8.3231e+00, -6.2912e+00, ..., -3.3778e+00, -2.5709e+00, -4.3723e+00]], [[ 4.2285e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-4.8483e-01, -3.1191e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-9.4446e-01, -3.0129e+00, -2.6438e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.1266e+00, -3.0494e+00, -2.7580e+00, ..., -1.7309e+00, -3.4028e+38, -3.4028e+38], [-8.3933e-01, -2.8693e+00, -2.5396e+00, ..., -1.6617e+00, -1.3670e+00, -3.4028e+38], [-1.2489e+00, -3.3855e+00, -2.9559e+00, ..., -2.0913e+00, -2.0099e+00, -2.2985e+00]], [[-7.9506e-02, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.2294e+00, -4.5237e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.1646e+00, -4.1651e+00, -3.6994e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-9.0788e-01, -4.2754e+00, -3.8699e+00, ..., -3.0398e+00, -3.4028e+38, -3.4028e+38], [-9.7489e-01, -4.4548e+00, -4.1134e+00, ..., -3.3533e+00, -3.1403e+00, -3.4028e+38], [-9.7120e-01, -4.9190e+00, -4.3547e+00, ..., -3.5138e+00, -3.2427e+00, -3.2375e+00]]]]) attn_weights tensor([[[[ 1.3370e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.5414e+00, -1.6294e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.4093e+00, -6.9634e-01, 1.9286e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 6.0392e+00, 4.6373e-02, -2.6897e+00, ..., 3.3760e+00, -3.4028e+38, -3.4028e+38], [ 6.9797e+00, 2.7495e-02, -1.5893e+00, ..., -2.6536e+00, 4.1670e+00, -3.4028e+38], [ 4.2373e+00, -3.6097e-01, -6.3418e-01, ..., -1.8845e+00, -3.1868e+00, -1.3555e+00]], [[ 3.4118e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.6398e+00, -4.7433e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.5557e+00, -4.3980e+00, -4.5282e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-2.4479e+00, -4.7177e+00, -3.6020e+00, ..., -5.1523e+00, -3.4028e+38, -3.4028e+38], [-2.6117e+00, -4.5784e+00, -3.5189e+00, ..., -4.9561e+00, -4.7676e+00, -3.4028e+38], [-2.8735e+00, -6.2049e+00, -3.9204e+00, ..., -6.8048e+00, -6.4545e+00, -3.9316e+00]], [[ 5.5059e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.3774e+00, -5.4990e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-3.6143e+00, -2.8628e+00, -4.3562e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-3.3383e+00, -5.3564e+00, -6.0400e+00, ..., -5.0555e+00, -3.4028e+38, -3.4028e+38], [-4.6294e+00, -6.1786e+00, -6.2973e+00, ..., -4.2973e+00, -4.7165e+00, -3.4028e+38], [-5.1593e+00, -8.4877e+00, -5.5703e+00, ..., -5.7308e+00, -5.6637e+00, -5.3823e+00]], ..., [[ 3.3260e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.6109e-01, -4.5554e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.3602e+00, -2.6441e+00, -3.3708e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.5410e+00, -3.8240e+00, -3.0517e+00, ..., -3.8653e+00, -3.4028e+38, -3.4028e+38], [-1.8272e+00, -3.6314e+00, -3.2827e+00, ..., -4.3390e+00, -4.7114e+00, -3.4028e+38], [-2.3302e+00, -4.9356e+00, -9.1044e-01, ..., -4.5500e+00, -4.9485e+00, -3.2114e+00]], [[ 4.8039e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-3.8261e-01, -6.9913e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.0456e-01, -5.0639e+00, -3.3534e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-7.5388e-01, -4.8873e+00, -5.1537e+00, ..., -2.1962e+00, -3.4028e+38, -3.4028e+38], [-9.4377e-01, -5.4111e+00, -5.6368e+00, ..., -2.1397e+00, -2.1948e+00, -3.4028e+38], [-1.2924e+00, -5.6647e+00, -4.4875e+00, ..., -3.7709e+00, -4.1344e+00, -2.9016e+00]], [[ 4.3822e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.0858e+00, -5.4014e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.0319e+00, -3.9772e+00, -4.4307e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.7595e+00, -4.4810e+00, -4.3304e+00, ..., -3.6133e+00, -3.4028e+38, -3.4028e+38], [-2.4498e+00, -4.8306e+00, -4.5289e+00, ..., -2.8773e+00, -2.9931e+00, -3.4028e+38], [-3.0744e+00, -5.5903e+00, -5.0912e+00, ..., -3.3333e+00, -3.3298e+00, -3.1947e+00]]], [[[ 1.3370e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.5414e+00, -1.6294e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.4093e+00, -6.9634e-01, 1.9286e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 6.0392e+00, 4.6373e-02, -2.6897e+00, ..., 3.3760e+00, -3.4028e+38, -3.4028e+38], [ 6.9797e+00, 2.7495e-02, -1.5893e+00, ..., -2.6536e+00, 4.1670e+00, -3.4028e+38], [ 4.2373e+00, -3.6097e-01, -6.3418e-01, ..., -1.8845e+00, -3.1868e+00, -1.3555e+00]], [[ 3.4118e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.6398e+00, -4.7433e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.5557e+00, -4.3980e+00, -4.5282e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-2.4479e+00, -4.7177e+00, -3.6020e+00, ..., -5.1523e+00, -3.4028e+38, -3.4028e+38], [-2.6117e+00, -4.5784e+00, -3.5189e+00, ..., -4.9561e+00, -4.7676e+00, -3.4028e+38], [-2.8735e+00, -6.2049e+00, -3.9204e+00, ..., -6.8048e+00, -6.4545e+00, -3.9316e+00]], [[ 5.5059e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.3774e+00, -5.4990e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-3.6143e+00, -2.8628e+00, -4.3562e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-3.3383e+00, -5.3564e+00, -6.0400e+00, ..., -5.0555e+00, -3.4028e+38, -3.4028e+38], [-4.6294e+00, -6.1786e+00, -6.2973e+00, ..., -4.2973e+00, -4.7165e+00, -3.4028e+38], [-5.1593e+00, -8.4877e+00, -5.5703e+00, ..., -5.7308e+00, -5.6637e+00, -5.3823e+00]], ..., [[ 3.3260e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.6109e-01, -4.5554e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.3602e+00, -2.6441e+00, -3.3708e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.5410e+00, -3.8240e+00, -3.0517e+00, ..., -3.8653e+00, -3.4028e+38, -3.4028e+38], [-1.8272e+00, -3.6314e+00, -3.2827e+00, ..., -4.3390e+00, -4.7114e+00, -3.4028e+38], [-2.3302e+00, -4.9356e+00, -9.1044e-01, ..., -4.5500e+00, -4.9485e+00, -3.2114e+00]], [[ 4.8039e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-3.8261e-01, -6.9913e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.0456e-01, -5.0639e+00, -3.3534e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-7.5388e-01, -4.8873e+00, -5.1537e+00, ..., -2.1962e+00, -3.4028e+38, -3.4028e+38], [-9.4377e-01, -5.4111e+00, -5.6368e+00, ..., -2.1397e+00, -2.1948e+00, -3.4028e+38], [-1.2924e+00, -5.6647e+00, -4.4875e+00, ..., -3.7709e+00, -4.1344e+00, -2.9016e+00]], [[ 4.3822e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.0858e+00, -5.4014e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.0319e+00, -3.9772e+00, -4.4307e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.7595e+00, -4.4810e+00, -4.3304e+00, ..., -3.6133e+00, -3.4028e+38, -3.4028e+38], [-2.4498e+00, -4.8306e+00, -4.5289e+00, ..., -2.8773e+00, -2.9931e+00, -3.4028e+38], [-3.0744e+00, -5.5903e+00, -5.0912e+00, ..., -3.3333e+00, -3.3298e+00, -3.1947e+00]]], [[[ 1.3370e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.5414e+00, -1.6294e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.4093e+00, -6.9634e-01, 1.9286e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 6.0392e+00, 4.6373e-02, -2.6897e+00, ..., 3.3760e+00, -3.4028e+38, -3.4028e+38], [ 6.9797e+00, 2.7495e-02, -1.5893e+00, ..., -2.6536e+00, 4.1670e+00, -3.4028e+38], [ 4.2373e+00, -3.6097e-01, -6.3418e-01, ..., -1.8845e+00, -3.1868e+00, -1.3555e+00]], [[ 3.4118e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.6398e+00, -4.7433e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.5557e+00, -4.3980e+00, -4.5282e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-2.4479e+00, -4.7177e+00, -3.6020e+00, ..., -5.1523e+00, -3.4028e+38, -3.4028e+38], [-2.6117e+00, -4.5784e+00, -3.5189e+00, ..., -4.9561e+00, -4.7676e+00, -3.4028e+38], [-2.8735e+00, -6.2049e+00, -3.9204e+00, ..., -6.8048e+00, -6.4545e+00, -3.9316e+00]], [[ 5.5059e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.3774e+00, -5.4990e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-3.6143e+00, -2.8628e+00, -4.3562e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-3.3383e+00, -5.3564e+00, -6.0400e+00, ..., -5.0555e+00, -3.4028e+38, -3.4028e+38], [-4.6294e+00, -6.1786e+00, -6.2973e+00, ..., -4.2973e+00, -4.7165e+00, -3.4028e+38], [-5.1593e+00, -8.4877e+00, -5.5703e+00, ..., -5.7308e+00, -5.6637e+00, -5.3823e+00]], ..., [[ 3.3260e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.6109e-01, -4.5554e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.3602e+00, -2.6441e+00, -3.3708e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.5410e+00, -3.8240e+00, -3.0517e+00, ..., -3.8653e+00, -3.4028e+38, -3.4028e+38], [-1.8272e+00, -3.6314e+00, -3.2827e+00, ..., -4.3390e+00, -4.7114e+00, -3.4028e+38], [-2.3302e+00, -4.9356e+00, -9.1044e-01, ..., -4.5500e+00, -4.9485e+00, -3.2114e+00]], [[ 4.8039e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-3.8261e-01, -6.9913e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.0456e-01, -5.0639e+00, -3.3534e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-7.5388e-01, -4.8873e+00, -5.1537e+00, ..., -2.1962e+00, -3.4028e+38, -3.4028e+38], [-9.4377e-01, -5.4111e+00, -5.6368e+00, ..., -2.1397e+00, -2.1948e+00, -3.4028e+38], [-1.2924e+00, -5.6647e+00, -4.4875e+00, ..., -3.7709e+00, -4.1344e+00, -2.9016e+00]], [[ 4.3822e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.0858e+00, -5.4014e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.0319e+00, -3.9772e+00, -4.4307e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.7595e+00, -4.4810e+00, -4.3304e+00, ..., -3.6133e+00, -3.4028e+38, -3.4028e+38], [-2.4498e+00, -4.8306e+00, -4.5289e+00, ..., -2.8773e+00, -2.9931e+00, -3.4028e+38], [-3.0744e+00, -5.5903e+00, -5.0912e+00, ..., -3.3333e+00, -3.3298e+00, -3.1947e+00]]], [[[ 1.3370e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.5414e+00, -1.6294e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.4093e+00, -6.9634e-01, 1.9286e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 6.0392e+00, 4.6373e-02, -2.6897e+00, ..., 3.3760e+00, -3.4028e+38, -3.4028e+38], [ 6.9797e+00, 2.7495e-02, -1.5893e+00, ..., -2.6536e+00, 4.1670e+00, -3.4028e+38], [ 4.2373e+00, -3.6097e-01, -6.3418e-01, ..., -1.8845e+00, -3.1868e+00, -1.3555e+00]], [[ 3.4118e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.6398e+00, -4.7433e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.5557e+00, -4.3980e+00, -4.5282e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-2.4479e+00, -4.7177e+00, -3.6020e+00, ..., -5.1523e+00, -3.4028e+38, -3.4028e+38], [-2.6117e+00, -4.5784e+00, -3.5189e+00, ..., -4.9561e+00, -4.7676e+00, -3.4028e+38], [-2.8735e+00, -6.2049e+00, -3.9204e+00, ..., -6.8048e+00, -6.4545e+00, -3.9316e+00]], [[ 5.5059e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.3774e+00, -5.4990e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-3.6143e+00, -2.8628e+00, -4.3562e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-3.3383e+00, -5.3564e+00, -6.0400e+00, ..., -5.0555e+00, -3.4028e+38, -3.4028e+38], [-4.6294e+00, -6.1786e+00, -6.2973e+00, ..., -4.2973e+00, -4.7165e+00, -3.4028e+38], [-5.1593e+00, -8.4877e+00, -5.5703e+00, ..., -5.7308e+00, -5.6637e+00, -5.3823e+00]], ..., [[ 3.3260e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.6109e-01, -4.5554e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.3602e+00, -2.6441e+00, -3.3708e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.5410e+00, -3.8240e+00, -3.0517e+00, ..., -3.8653e+00, -3.4028e+38, -3.4028e+38], [-1.8272e+00, -3.6314e+00, -3.2827e+00, ..., -4.3390e+00, -4.7114e+00, -3.4028e+38], [-2.3302e+00, -4.9356e+00, -9.1044e-01, ..., -4.5500e+00, -4.9485e+00, -3.2114e+00]], [[ 4.8039e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-3.8261e-01, -6.9913e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.0456e-01, -5.0639e+00, -3.3534e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-7.5388e-01, -4.8873e+00, -5.1537e+00, ..., -2.1962e+00, -3.4028e+38, -3.4028e+38], [-9.4377e-01, -5.4111e+00, -5.6368e+00, ..., -2.1397e+00, -2.1948e+00, -3.4028e+38], [-1.2924e+00, -5.6647e+00, -4.4875e+00, ..., -3.7709e+00, -4.1344e+00, -2.9016e+00]], [[ 4.3822e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.0858e+00, -5.4014e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.0319e+00, -3.9772e+00, -4.4307e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.7595e+00, -4.4810e+00, -4.3304e+00, ..., -3.6133e+00, -3.4028e+38, -3.4028e+38], [-2.4498e+00, -4.8306e+00, -4.5289e+00, ..., -2.8773e+00, -2.9931e+00, -3.4028e+38], [-3.0744e+00, -5.5903e+00, -5.0912e+00, ..., -3.3333e+00, -3.3298e+00, -3.1947e+00]]], [[[ 1.3370e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.5414e+00, -1.6294e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.4093e+00, -6.9634e-01, 1.9286e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 6.0392e+00, 4.6375e-02, -2.6897e+00, ..., 3.3760e+00, -3.4028e+38, -3.4028e+38], [ 6.9797e+00, 2.7497e-02, -1.5893e+00, ..., -2.6536e+00, 4.1670e+00, -3.4028e+38], [ 4.2373e+00, -3.6097e-01, -6.3418e-01, ..., -1.8845e+00, -3.1868e+00, -1.3555e+00]], [[ 3.4118e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.6398e+00, -4.7433e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.5557e+00, -4.3980e+00, -4.5282e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-2.4479e+00, -4.7177e+00, -3.6020e+00, ..., -5.1523e+00, -3.4028e+38, -3.4028e+38], [-2.6117e+00, -4.5784e+00, -3.5189e+00, ..., -4.9561e+00, -4.7676e+00, -3.4028e+38], [-2.8735e+00, -6.2049e+00, -3.9204e+00, ..., -6.8048e+00, -6.4545e+00, -3.9316e+00]], [[ 5.5059e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.3774e+00, -5.4990e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-3.6143e+00, -2.8628e+00, -4.3561e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-3.3383e+00, -5.3563e+00, -6.0400e+00, ..., -5.0555e+00, -3.4028e+38, -3.4028e+38], [-4.6294e+00, -6.1786e+00, -6.2973e+00, ..., -4.2973e+00, -4.7165e+00, -3.4028e+38], [-5.1593e+00, -8.4877e+00, -5.5703e+00, ..., -5.7308e+00, -5.6636e+00, -5.3823e+00]], ..., [[ 3.3260e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.6109e-01, -4.5554e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.3602e+00, -2.6441e+00, -3.3708e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.5410e+00, -3.8240e+00, -3.0517e+00, ..., -3.8653e+00, -3.4028e+38, -3.4028e+38], [-1.8272e+00, -3.6314e+00, -3.2827e+00, ..., -4.3390e+00, -4.7114e+00, -3.4028e+38], [-2.3302e+00, -4.9356e+00, -9.1045e-01, ..., -4.5500e+00, -4.9485e+00, -3.2114e+00]], [[ 4.8039e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-3.8262e-01, -6.9913e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.0456e-01, -5.0639e+00, -3.3534e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-7.5388e-01, -4.8873e+00, -5.1537e+00, ..., -2.1962e+00, -3.4028e+38, -3.4028e+38], [-9.4377e-01, -5.4111e+00, -5.6368e+00, ..., -2.1397e+00, -2.1948e+00, -3.4028e+38], [-1.2924e+00, -5.6647e+00, -4.4875e+00, ..., -3.7709e+00, -4.1344e+00, -2.9016e+00]], [[ 4.3822e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.0858e+00, -5.4014e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.0319e+00, -3.9772e+00, -4.4307e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.7595e+00, -4.4810e+00, -4.3304e+00, ..., -3.6133e+00, -3.4028e+38, -3.4028e+38], [-2.4498e+00, -4.8306e+00, -4.5289e+00, ..., -2.8773e+00, -2.9931e+00, -3.4028e+38], [-3.0744e+00, -5.5903e+00, -5.0912e+00, ..., -3.3333e+00, -3.3298e+00, -3.1947e+00]]]]) attn_weights tensor([[[[ 5.2258e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.2839e+00, -5.4823e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.0979e+00, -4.0280e+00, -5.0245e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-2.5159e+00, -4.9556e+00, -4.6603e+00, ..., -4.8628e+00, -3.4028e+38, -3.4028e+38], [-2.5849e+00, -5.5911e+00, -4.8803e+00, ..., -4.4907e+00, -3.7806e+00, -3.4028e+38], [-3.2263e+00, -6.3212e+00, -5.3159e+00, ..., -5.8555e+00, -4.9175e+00, -3.8112e+00]], [[ 3.4998e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.2955e+00, -5.5388e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.2073e+00, -2.1659e+00, -3.4009e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.6912e+00, -3.7512e+00, -3.0170e+00, ..., -4.9112e+00, -3.4028e+38, -3.4028e+38], [-1.7998e+00, -4.9061e+00, -4.0080e+00, ..., -4.5563e+00, -3.8540e+00, -3.4028e+38], [-2.1657e+00, -4.8217e+00, -4.0915e+00, ..., -5.3257e+00, -4.1937e+00, -3.2829e+00]], [[ 2.1360e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 8.5725e-02, -3.8091e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-3.3048e-01, -1.6859e+00, -3.6940e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.0814e-01, -2.5439e+00, -3.4072e+00, ..., -3.2358e+00, -3.4028e+38, -3.4028e+38], [ 1.4362e-01, -2.4037e+00, -3.2379e+00, ..., -3.8533e+00, -3.7491e+00, -3.4028e+38], [-3.6946e-01, -2.1885e+00, -3.0159e+00, ..., -3.7366e+00, -2.6264e+00, -2.3752e+00]], ..., [[ 3.3960e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-3.0455e-01, -3.8327e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-9.7245e-01, -1.3171e+00, -3.9416e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-6.7002e-01, -3.4138e+00, -3.3929e+00, ..., -4.5815e+00, -3.4028e+38, -3.4028e+38], [-6.6821e-01, -3.8797e+00, -3.9224e+00, ..., -4.1135e+00, -2.9419e+00, -3.4028e+38], [-1.3882e+00, -3.6128e+00, -3.0081e+00, ..., -4.0574e+00, -2.6247e+00, -3.2819e+00]], [[ 3.1170e-02, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.7083e+00, -2.1508e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.3599e+00, -1.0954e+00, -2.7121e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.3384e+00, -3.2187e+00, -3.9064e+00, ..., -1.8745e+00, -3.4028e+38, -3.4028e+38], [ 1.4236e+00, -2.9822e+00, -3.0266e+00, ..., -3.9205e+00, -2.3232e+00, -3.4028e+38], [ 1.1624e+00, -1.7251e+00, -2.2940e+00, ..., -2.7855e+00, -2.8873e+00, -1.7182e+00]], [[-3.9109e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 6.0680e+00, -1.7440e+01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-6.8638e+00, 2.3113e+00, -8.4546e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-6.9636e+00, -5.6462e+00, -3.7359e+00, ..., -3.0332e+00, -3.4028e+38, -3.4028e+38], [-5.6381e-01, -1.2027e+01, -1.6009e+01, ..., 1.5152e+01, 6.2844e+00, -3.4028e+38], [-4.6380e+00, -2.6326e+01, -2.4489e+01, ..., 1.0146e+00, 1.4930e+01, -2.1059e+00]]], [[[ 5.2258e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.2839e+00, -5.4823e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.0979e+00, -4.0280e+00, -5.0245e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-2.5159e+00, -4.9556e+00, -4.6603e+00, ..., -4.8628e+00, -3.4028e+38, -3.4028e+38], [-2.5849e+00, -5.5911e+00, -4.8803e+00, ..., -4.4907e+00, -3.7806e+00, -3.4028e+38], [-3.2263e+00, -6.3212e+00, -5.3159e+00, ..., -5.8555e+00, -4.9175e+00, -3.8112e+00]], [[ 3.4998e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.2955e+00, -5.5388e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.2073e+00, -2.1659e+00, -3.4009e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.6912e+00, -3.7512e+00, -3.0170e+00, ..., -4.9112e+00, -3.4028e+38, -3.4028e+38], [-1.7998e+00, -4.9061e+00, -4.0080e+00, ..., -4.5563e+00, -3.8540e+00, -3.4028e+38], [-2.1657e+00, -4.8217e+00, -4.0915e+00, ..., -5.3257e+00, -4.1937e+00, -3.2829e+00]], [[ 2.1360e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 8.5725e-02, -3.8091e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-3.3048e-01, -1.6859e+00, -3.6940e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.0814e-01, -2.5439e+00, -3.4072e+00, ..., -3.2358e+00, -3.4028e+38, -3.4028e+38], [ 1.4362e-01, -2.4037e+00, -3.2379e+00, ..., -3.8533e+00, -3.7491e+00, -3.4028e+38], [-3.6946e-01, -2.1885e+00, -3.0159e+00, ..., -3.7366e+00, -2.6264e+00, -2.3752e+00]], ..., [[ 3.3960e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-3.0455e-01, -3.8327e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-9.7245e-01, -1.3171e+00, -3.9416e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-6.7002e-01, -3.4138e+00, -3.3929e+00, ..., -4.5815e+00, -3.4028e+38, -3.4028e+38], [-6.6821e-01, -3.8797e+00, -3.9224e+00, ..., -4.1135e+00, -2.9419e+00, -3.4028e+38], [-1.3882e+00, -3.6128e+00, -3.0081e+00, ..., -4.0574e+00, -2.6247e+00, -3.2819e+00]], [[ 3.1170e-02, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.7083e+00, -2.1508e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.3599e+00, -1.0954e+00, -2.7121e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.3384e+00, -3.2187e+00, -3.9064e+00, ..., -1.8745e+00, -3.4028e+38, -3.4028e+38], [ 1.4236e+00, -2.9822e+00, -3.0266e+00, ..., -3.9205e+00, -2.3232e+00, -3.4028e+38], [ 1.1624e+00, -1.7251e+00, -2.2940e+00, ..., -2.7855e+00, -2.8873e+00, -1.7182e+00]], [[-3.9109e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 6.0680e+00, -1.7440e+01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-6.8638e+00, 2.3113e+00, -8.4546e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-6.9636e+00, -5.6462e+00, -3.7359e+00, ..., -3.0332e+00, -3.4028e+38, -3.4028e+38], [-5.6381e-01, -1.2027e+01, -1.6009e+01, ..., 1.5152e+01, 6.2844e+00, -3.4028e+38], [-4.6380e+00, -2.6326e+01, -2.4489e+01, ..., 1.0146e+00, 1.4930e+01, -2.1059e+00]]], [[[ 5.2258e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.2839e+00, -5.4823e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.0979e+00, -4.0280e+00, -5.0245e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-2.5159e+00, -4.9556e+00, -4.6603e+00, ..., -4.8628e+00, -3.4028e+38, -3.4028e+38], [-2.5849e+00, -5.5911e+00, -4.8803e+00, ..., -4.4907e+00, -3.7806e+00, -3.4028e+38], [-3.2263e+00, -6.3212e+00, -5.3159e+00, ..., -5.8555e+00, -4.9175e+00, -3.8112e+00]], [[ 3.4998e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.2955e+00, -5.5388e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.2073e+00, -2.1659e+00, -3.4009e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.6912e+00, -3.7512e+00, -3.0170e+00, ..., -4.9112e+00, -3.4028e+38, -3.4028e+38], [-1.7998e+00, -4.9061e+00, -4.0080e+00, ..., -4.5563e+00, -3.8540e+00, -3.4028e+38], [-2.1657e+00, -4.8217e+00, -4.0915e+00, ..., -5.3257e+00, -4.1937e+00, -3.2829e+00]], [[ 2.1360e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 8.5725e-02, -3.8091e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-3.3048e-01, -1.6859e+00, -3.6940e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.0814e-01, -2.5439e+00, -3.4072e+00, ..., -3.2358e+00, -3.4028e+38, -3.4028e+38], [ 1.4362e-01, -2.4037e+00, -3.2379e+00, ..., -3.8533e+00, -3.7491e+00, -3.4028e+38], [-3.6946e-01, -2.1885e+00, -3.0159e+00, ..., -3.7366e+00, -2.6264e+00, -2.3752e+00]], ..., [[ 3.3960e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-3.0455e-01, -3.8327e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-9.7245e-01, -1.3171e+00, -3.9416e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-6.7002e-01, -3.4138e+00, -3.3929e+00, ..., -4.5815e+00, -3.4028e+38, -3.4028e+38], [-6.6821e-01, -3.8797e+00, -3.9224e+00, ..., -4.1135e+00, -2.9419e+00, -3.4028e+38], [-1.3882e+00, -3.6128e+00, -3.0081e+00, ..., -4.0574e+00, -2.6247e+00, -3.2819e+00]], [[ 3.1170e-02, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.7083e+00, -2.1508e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.3599e+00, -1.0954e+00, -2.7121e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.3384e+00, -3.2187e+00, -3.9064e+00, ..., -1.8745e+00, -3.4028e+38, -3.4028e+38], [ 1.4236e+00, -2.9822e+00, -3.0266e+00, ..., -3.9205e+00, -2.3232e+00, -3.4028e+38], [ 1.1624e+00, -1.7251e+00, -2.2940e+00, ..., -2.7855e+00, -2.8873e+00, -1.7182e+00]], [[-3.9109e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 6.0680e+00, -1.7440e+01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-6.8638e+00, 2.3113e+00, -8.4546e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-6.9636e+00, -5.6462e+00, -3.7359e+00, ..., -3.0332e+00, -3.4028e+38, -3.4028e+38], [-5.6381e-01, -1.2027e+01, -1.6009e+01, ..., 1.5152e+01, 6.2844e+00, -3.4028e+38], [-4.6380e+00, -2.6326e+01, -2.4489e+01, ..., 1.0146e+00, 1.4930e+01, -2.1059e+00]]], [[[ 5.2258e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.2839e+00, -5.4823e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.0979e+00, -4.0280e+00, -5.0245e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-2.5159e+00, -4.9556e+00, -4.6603e+00, ..., -4.8628e+00, -3.4028e+38, -3.4028e+38], [-2.5849e+00, -5.5911e+00, -4.8803e+00, ..., -4.4907e+00, -3.7806e+00, -3.4028e+38], [-3.2263e+00, -6.3212e+00, -5.3159e+00, ..., -5.8555e+00, -4.9175e+00, -3.8112e+00]], [[ 3.4998e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.2955e+00, -5.5388e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.2073e+00, -2.1659e+00, -3.4009e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.6912e+00, -3.7512e+00, -3.0170e+00, ..., -4.9112e+00, -3.4028e+38, -3.4028e+38], [-1.7998e+00, -4.9061e+00, -4.0080e+00, ..., -4.5563e+00, -3.8540e+00, -3.4028e+38], [-2.1657e+00, -4.8217e+00, -4.0915e+00, ..., -5.3257e+00, -4.1937e+00, -3.2829e+00]], [[ 2.1360e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 8.5725e-02, -3.8091e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-3.3048e-01, -1.6859e+00, -3.6940e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.0814e-01, -2.5439e+00, -3.4072e+00, ..., -3.2358e+00, -3.4028e+38, -3.4028e+38], [ 1.4362e-01, -2.4037e+00, -3.2379e+00, ..., -3.8533e+00, -3.7491e+00, -3.4028e+38], [-3.6946e-01, -2.1885e+00, -3.0159e+00, ..., -3.7366e+00, -2.6264e+00, -2.3752e+00]], ..., [[ 3.3960e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-3.0455e-01, -3.8327e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-9.7245e-01, -1.3171e+00, -3.9416e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-6.7002e-01, -3.4138e+00, -3.3929e+00, ..., -4.5815e+00, -3.4028e+38, -3.4028e+38], [-6.6821e-01, -3.8797e+00, -3.9224e+00, ..., -4.1135e+00, -2.9419e+00, -3.4028e+38], [-1.3882e+00, -3.6128e+00, -3.0081e+00, ..., -4.0574e+00, -2.6247e+00, -3.2819e+00]], [[ 3.1170e-02, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.7083e+00, -2.1508e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.3599e+00, -1.0954e+00, -2.7121e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.3384e+00, -3.2187e+00, -3.9064e+00, ..., -1.8745e+00, -3.4028e+38, -3.4028e+38], [ 1.4236e+00, -2.9822e+00, -3.0266e+00, ..., -3.9205e+00, -2.3232e+00, -3.4028e+38], [ 1.1624e+00, -1.7251e+00, -2.2940e+00, ..., -2.7855e+00, -2.8873e+00, -1.7182e+00]], [[-3.9109e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 6.0680e+00, -1.7440e+01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-6.8638e+00, 2.3113e+00, -8.4546e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-6.9636e+00, -5.6462e+00, -3.7359e+00, ..., -3.0332e+00, -3.4028e+38, -3.4028e+38], [-5.6381e-01, -1.2027e+01, -1.6009e+01, ..., 1.5152e+01, 6.2844e+00, -3.4028e+38], [-4.6380e+00, -2.6326e+01, -2.4489e+01, ..., 1.0146e+00, 1.4930e+01, -2.1059e+00]]], [[[ 5.2258e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.2839e+00, -5.4823e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.0979e+00, -4.0280e+00, -5.0245e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-2.5159e+00, -4.9556e+00, -4.6603e+00, ..., -4.8628e+00, -3.4028e+38, -3.4028e+38], [-2.5849e+00, -5.5911e+00, -4.8803e+00, ..., -4.4907e+00, -3.7806e+00, -3.4028e+38], [-3.2263e+00, -6.3212e+00, -5.3159e+00, ..., -5.8554e+00, -4.9175e+00, -3.8112e+00]], [[ 3.4998e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.2955e+00, -5.5388e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.2073e+00, -2.1659e+00, -3.4009e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.6912e+00, -3.7512e+00, -3.0170e+00, ..., -4.9112e+00, -3.4028e+38, -3.4028e+38], [-1.7998e+00, -4.9061e+00, -4.0080e+00, ..., -4.5563e+00, -3.8540e+00, -3.4028e+38], [-2.1657e+00, -4.8217e+00, -4.0915e+00, ..., -5.3257e+00, -4.1937e+00, -3.2829e+00]], [[ 2.1360e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 8.5724e-02, -3.8090e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-3.3048e-01, -1.6859e+00, -3.6940e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.0814e-01, -2.5439e+00, -3.4072e+00, ..., -3.2358e+00, -3.4028e+38, -3.4028e+38], [ 1.4362e-01, -2.4037e+00, -3.2379e+00, ..., -3.8533e+00, -3.7491e+00, -3.4028e+38], [-3.6946e-01, -2.1885e+00, -3.0159e+00, ..., -3.7366e+00, -2.6264e+00, -2.3752e+00]], ..., [[ 3.3960e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-3.0455e-01, -3.8327e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-9.7245e-01, -1.3171e+00, -3.9416e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-6.7002e-01, -3.4138e+00, -3.3929e+00, ..., -4.5815e+00, -3.4028e+38, -3.4028e+38], [-6.6821e-01, -3.8797e+00, -3.9224e+00, ..., -4.1135e+00, -2.9419e+00, -3.4028e+38], [-1.3882e+00, -3.6128e+00, -3.0081e+00, ..., -4.0574e+00, -2.6247e+00, -3.2819e+00]], [[ 3.1170e-02, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.7083e+00, -2.1508e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.3599e+00, -1.0954e+00, -2.7121e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.3384e+00, -3.2187e+00, -3.9064e+00, ..., -1.8745e+00, -3.4028e+38, -3.4028e+38], [ 1.4236e+00, -2.9822e+00, -3.0266e+00, ..., -3.9205e+00, -2.3232e+00, -3.4028e+38], [ 1.1624e+00, -1.7251e+00, -2.2940e+00, ..., -2.7855e+00, -2.8873e+00, -1.7182e+00]], [[-3.9109e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 6.0680e+00, -1.7440e+01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-6.8638e+00, 2.3113e+00, -8.4546e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-6.9636e+00, -5.6462e+00, -3.7359e+00, ..., -3.0332e+00, -3.4028e+38, -3.4028e+38], [-5.6382e-01, -1.2027e+01, -1.6009e+01, ..., 1.5152e+01, 6.2845e+00, -3.4028e+38], [-4.6380e+00, -2.6326e+01, -2.4489e+01, ..., 1.0146e+00, 1.4930e+01, -2.1058e+00]]]]) attn_weights tensor([[[[ 5.5354e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.9950e+00, -2.7194e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.6488e+00, -2.6353e+00, -7.4467e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.0505e+00, -5.6088e+00, -5.4696e+00, ..., -2.1410e+00, -3.4028e+38, -3.4028e+38], [ 2.5608e+00, -6.4551e+00, -6.5813e+00, ..., -3.3749e+00, -3.6944e-01, -3.4028e+38], [ 2.8821e+00, -7.1525e+00, -1.5454e+00, ..., -1.9061e+00, -9.8796e-01, -2.9037e-01]], [[ 3.0970e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.2565e+00, -3.6192e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.8378e+00, -6.0636e+00, -1.8980e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.2379e+00, -1.2538e+01, -1.0748e+01, ..., -1.8623e+00, -3.4028e+38, -3.4028e+38], [ 4.7958e+00, -1.7049e+01, -1.5393e+01, ..., -4.9939e+00, 4.2980e-02, -3.4028e+38], [ 4.5539e+00, -1.4754e+01, -6.3261e+00, ..., -2.8039e+00, -5.1020e+00, -1.0666e+00]], [[ 1.9081e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 6.3271e-01, -5.8182e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.6856e-01, 4.6776e-01, -2.1147e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 5.6895e-01, -1.5966e+00, -1.9752e+00, ..., -3.3202e+00, -3.4028e+38, -3.4028e+38], [ 2.3748e-01, -2.5037e+00, -3.4269e+00, ..., -1.6147e+00, -3.3750e+00, -3.4028e+38], [-2.2952e-01, -2.5554e+00, -1.9919e+00, ..., -1.4025e+00, -1.8757e+00, -3.0655e+00]], ..., [[ 3.3014e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4848e+00, -4.0527e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.1000e+00, -2.6197e+00, -4.1458e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.1817e+00, -2.9270e+00, -4.0100e+00, ..., -2.5781e+00, -3.4028e+38, -3.4028e+38], [ 1.1613e+00, -3.0490e+00, -3.4711e+00, ..., -1.2918e+00, -2.4897e+00, -3.4028e+38], [ 1.0506e+00, -3.1133e+00, -2.9903e+00, ..., -2.0384e+00, -2.0099e+00, -1.4311e+00]], [[ 4.3132e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.7105e+00, -4.2972e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.3278e+00, -1.3996e+00, -1.7276e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.2652e+00, 1.7028e+00, 2.0620e-01, ..., 3.0405e+00, -3.4028e+38, -3.4028e+38], [ 2.9009e+00, -7.9501e-01, 1.4879e-01, ..., 2.1620e-01, 1.3044e+00, -3.4028e+38], [ 1.9817e+00, -1.2267e+00, -4.1662e-01, ..., -1.8797e-01, 1.1607e+00, 9.2088e-01]], [[ 3.5336e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4178e+00, -2.3004e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.1436e+00, -3.3290e-01, 1.3263e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 8.2124e-01, -3.2162e+00, -2.9845e+00, ..., -2.0351e+00, -3.4028e+38, -3.4028e+38], [ 9.6905e-01, -3.6250e+00, -3.6459e+00, ..., -2.2789e+00, -2.3357e+00, -3.4028e+38], [ 1.0930e+00, -1.7560e+00, -1.9461e+00, ..., -1.0655e+00, -2.9021e+00, -2.2092e-01]]], [[[ 5.5354e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.9950e+00, -2.7194e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.6488e+00, -2.6353e+00, -7.4467e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.0505e+00, -5.6088e+00, -5.4696e+00, ..., -2.1410e+00, -3.4028e+38, -3.4028e+38], [ 2.5608e+00, -6.4551e+00, -6.5813e+00, ..., -3.3749e+00, -3.6944e-01, -3.4028e+38], [ 2.8821e+00, -7.1525e+00, -1.5454e+00, ..., -1.9061e+00, -9.8796e-01, -2.9037e-01]], [[ 3.0970e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.2565e+00, -3.6192e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.8378e+00, -6.0636e+00, -1.8980e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.2379e+00, -1.2538e+01, -1.0748e+01, ..., -1.8623e+00, -3.4028e+38, -3.4028e+38], [ 4.7958e+00, -1.7049e+01, -1.5393e+01, ..., -4.9939e+00, 4.2980e-02, -3.4028e+38], [ 4.5539e+00, -1.4754e+01, -6.3261e+00, ..., -2.8039e+00, -5.1020e+00, -1.0666e+00]], [[ 1.9081e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 6.3271e-01, -5.8182e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.6856e-01, 4.6776e-01, -2.1147e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 5.6895e-01, -1.5966e+00, -1.9752e+00, ..., -3.3202e+00, -3.4028e+38, -3.4028e+38], [ 2.3748e-01, -2.5037e+00, -3.4269e+00, ..., -1.6147e+00, -3.3750e+00, -3.4028e+38], [-2.2952e-01, -2.5554e+00, -1.9919e+00, ..., -1.4025e+00, -1.8757e+00, -3.0655e+00]], ..., [[ 3.3014e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4848e+00, -4.0527e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.1000e+00, -2.6197e+00, -4.1458e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.1817e+00, -2.9270e+00, -4.0100e+00, ..., -2.5781e+00, -3.4028e+38, -3.4028e+38], [ 1.1613e+00, -3.0490e+00, -3.4711e+00, ..., -1.2918e+00, -2.4897e+00, -3.4028e+38], [ 1.0506e+00, -3.1133e+00, -2.9903e+00, ..., -2.0384e+00, -2.0099e+00, -1.4311e+00]], [[ 4.3132e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.7105e+00, -4.2972e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.3278e+00, -1.3996e+00, -1.7276e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.2652e+00, 1.7028e+00, 2.0620e-01, ..., 3.0405e+00, -3.4028e+38, -3.4028e+38], [ 2.9009e+00, -7.9501e-01, 1.4879e-01, ..., 2.1620e-01, 1.3044e+00, -3.4028e+38], [ 1.9817e+00, -1.2267e+00, -4.1662e-01, ..., -1.8797e-01, 1.1607e+00, 9.2088e-01]], [[ 3.5336e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4178e+00, -2.3004e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.1436e+00, -3.3290e-01, 1.3263e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 8.2124e-01, -3.2162e+00, -2.9845e+00, ..., -2.0351e+00, -3.4028e+38, -3.4028e+38], [ 9.6905e-01, -3.6250e+00, -3.6459e+00, ..., -2.2789e+00, -2.3357e+00, -3.4028e+38], [ 1.0930e+00, -1.7560e+00, -1.9461e+00, ..., -1.0655e+00, -2.9021e+00, -2.2092e-01]]], [[[ 5.5354e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.9950e+00, -2.7194e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.6488e+00, -2.6353e+00, -7.4467e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.0505e+00, -5.6088e+00, -5.4696e+00, ..., -2.1410e+00, -3.4028e+38, -3.4028e+38], [ 2.5608e+00, -6.4551e+00, -6.5813e+00, ..., -3.3749e+00, -3.6944e-01, -3.4028e+38], [ 2.8821e+00, -7.1525e+00, -1.5454e+00, ..., -1.9061e+00, -9.8796e-01, -2.9037e-01]], [[ 3.0970e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.2565e+00, -3.6192e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.8378e+00, -6.0636e+00, -1.8980e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.2379e+00, -1.2538e+01, -1.0748e+01, ..., -1.8623e+00, -3.4028e+38, -3.4028e+38], [ 4.7958e+00, -1.7049e+01, -1.5393e+01, ..., -4.9939e+00, 4.2980e-02, -3.4028e+38], [ 4.5539e+00, -1.4754e+01, -6.3261e+00, ..., -2.8039e+00, -5.1020e+00, -1.0666e+00]], [[ 1.9081e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 6.3271e-01, -5.8182e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.6856e-01, 4.6776e-01, -2.1147e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 5.6895e-01, -1.5966e+00, -1.9752e+00, ..., -3.3202e+00, -3.4028e+38, -3.4028e+38], [ 2.3748e-01, -2.5037e+00, -3.4269e+00, ..., -1.6147e+00, -3.3750e+00, -3.4028e+38], [-2.2952e-01, -2.5554e+00, -1.9919e+00, ..., -1.4025e+00, -1.8757e+00, -3.0655e+00]], ..., [[ 3.3014e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4848e+00, -4.0527e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.1000e+00, -2.6197e+00, -4.1458e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.1817e+00, -2.9270e+00, -4.0100e+00, ..., -2.5781e+00, -3.4028e+38, -3.4028e+38], [ 1.1613e+00, -3.0490e+00, -3.4711e+00, ..., -1.2918e+00, -2.4897e+00, -3.4028e+38], [ 1.0506e+00, -3.1133e+00, -2.9903e+00, ..., -2.0384e+00, -2.0099e+00, -1.4311e+00]], [[ 4.3132e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.7105e+00, -4.2972e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.3278e+00, -1.3996e+00, -1.7276e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.2652e+00, 1.7028e+00, 2.0620e-01, ..., 3.0405e+00, -3.4028e+38, -3.4028e+38], [ 2.9009e+00, -7.9501e-01, 1.4879e-01, ..., 2.1620e-01, 1.3044e+00, -3.4028e+38], [ 1.9817e+00, -1.2267e+00, -4.1662e-01, ..., -1.8797e-01, 1.1607e+00, 9.2088e-01]], [[ 3.5336e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4178e+00, -2.3004e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.1436e+00, -3.3290e-01, 1.3263e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 8.2124e-01, -3.2162e+00, -2.9845e+00, ..., -2.0351e+00, -3.4028e+38, -3.4028e+38], [ 9.6905e-01, -3.6250e+00, -3.6459e+00, ..., -2.2789e+00, -2.3357e+00, -3.4028e+38], [ 1.0930e+00, -1.7560e+00, -1.9461e+00, ..., -1.0655e+00, -2.9021e+00, -2.2092e-01]]], [[[ 5.5354e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.9950e+00, -2.7194e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.6488e+00, -2.6353e+00, -7.4467e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.0505e+00, -5.6088e+00, -5.4696e+00, ..., -2.1410e+00, -3.4028e+38, -3.4028e+38], [ 2.5608e+00, -6.4551e+00, -6.5813e+00, ..., -3.3749e+00, -3.6944e-01, -3.4028e+38], [ 2.8821e+00, -7.1525e+00, -1.5454e+00, ..., -1.9061e+00, -9.8796e-01, -2.9037e-01]], [[ 3.0970e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.2565e+00, -3.6192e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.8378e+00, -6.0636e+00, -1.8980e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.2379e+00, -1.2538e+01, -1.0748e+01, ..., -1.8623e+00, -3.4028e+38, -3.4028e+38], [ 4.7958e+00, -1.7049e+01, -1.5393e+01, ..., -4.9939e+00, 4.2980e-02, -3.4028e+38], [ 4.5539e+00, -1.4754e+01, -6.3261e+00, ..., -2.8039e+00, -5.1020e+00, -1.0666e+00]], [[ 1.9081e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 6.3271e-01, -5.8182e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.6856e-01, 4.6776e-01, -2.1147e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 5.6895e-01, -1.5966e+00, -1.9752e+00, ..., -3.3202e+00, -3.4028e+38, -3.4028e+38], [ 2.3748e-01, -2.5037e+00, -3.4269e+00, ..., -1.6147e+00, -3.3750e+00, -3.4028e+38], [-2.2952e-01, -2.5554e+00, -1.9919e+00, ..., -1.4025e+00, -1.8757e+00, -3.0655e+00]], ..., [[ 3.3014e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4848e+00, -4.0527e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.1000e+00, -2.6197e+00, -4.1458e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.1817e+00, -2.9270e+00, -4.0100e+00, ..., -2.5781e+00, -3.4028e+38, -3.4028e+38], [ 1.1613e+00, -3.0490e+00, -3.4711e+00, ..., -1.2918e+00, -2.4897e+00, -3.4028e+38], [ 1.0506e+00, -3.1133e+00, -2.9903e+00, ..., -2.0384e+00, -2.0099e+00, -1.4311e+00]], [[ 4.3132e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.7105e+00, -4.2972e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.3278e+00, -1.3996e+00, -1.7276e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.2652e+00, 1.7028e+00, 2.0620e-01, ..., 3.0405e+00, -3.4028e+38, -3.4028e+38], [ 2.9009e+00, -7.9501e-01, 1.4879e-01, ..., 2.1620e-01, 1.3044e+00, -3.4028e+38], [ 1.9817e+00, -1.2267e+00, -4.1662e-01, ..., -1.8797e-01, 1.1607e+00, 9.2088e-01]], [[ 3.5336e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4178e+00, -2.3004e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.1436e+00, -3.3290e-01, 1.3263e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 8.2124e-01, -3.2162e+00, -2.9845e+00, ..., -2.0351e+00, -3.4028e+38, -3.4028e+38], [ 9.6905e-01, -3.6250e+00, -3.6459e+00, ..., -2.2789e+00, -2.3357e+00, -3.4028e+38], [ 1.0930e+00, -1.7560e+00, -1.9461e+00, ..., -1.0655e+00, -2.9021e+00, -2.2092e-01]]], [[[ 5.5354e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.9950e+00, -2.7194e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.6488e+00, -2.6353e+00, -7.4467e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.0505e+00, -5.6088e+00, -5.4696e+00, ..., -2.1410e+00, -3.4028e+38, -3.4028e+38], [ 2.5608e+00, -6.4551e+00, -6.5813e+00, ..., -3.3749e+00, -3.6944e-01, -3.4028e+38], [ 2.8821e+00, -7.1525e+00, -1.5454e+00, ..., -1.9061e+00, -9.8796e-01, -2.9037e-01]], [[ 3.0970e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.2565e+00, -3.6192e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.8378e+00, -6.0635e+00, -1.8980e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.2379e+00, -1.2538e+01, -1.0748e+01, ..., -1.8623e+00, -3.4028e+38, -3.4028e+38], [ 4.7958e+00, -1.7049e+01, -1.5393e+01, ..., -4.9939e+00, 4.2987e-02, -3.4028e+38], [ 4.5539e+00, -1.4754e+01, -6.3261e+00, ..., -2.8039e+00, -5.1020e+00, -1.0666e+00]], [[ 1.9081e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 6.3271e-01, -5.8182e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.6856e-01, 4.6777e-01, -2.1147e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 5.6895e-01, -1.5966e+00, -1.9752e+00, ..., -3.3202e+00, -3.4028e+38, -3.4028e+38], [ 2.3748e-01, -2.5037e+00, -3.4269e+00, ..., -1.6147e+00, -3.3750e+00, -3.4028e+38], [-2.2952e-01, -2.5554e+00, -1.9919e+00, ..., -1.4025e+00, -1.8757e+00, -3.0655e+00]], ..., [[ 3.3014e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4848e+00, -4.0527e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.1000e+00, -2.6197e+00, -4.1458e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.1817e+00, -2.9270e+00, -4.0100e+00, ..., -2.5781e+00, -3.4028e+38, -3.4028e+38], [ 1.1613e+00, -3.0490e+00, -3.4711e+00, ..., -1.2918e+00, -2.4897e+00, -3.4028e+38], [ 1.0506e+00, -3.1133e+00, -2.9903e+00, ..., -2.0384e+00, -2.0099e+00, -1.4311e+00]], [[ 4.3132e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.7105e+00, -4.2972e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.3278e+00, -1.3996e+00, -1.7276e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.2652e+00, 1.7028e+00, 2.0620e-01, ..., 3.0405e+00, -3.4028e+38, -3.4028e+38], [ 2.9009e+00, -7.9500e-01, 1.4880e-01, ..., 2.1620e-01, 1.3044e+00, -3.4028e+38], [ 1.9817e+00, -1.2267e+00, -4.1662e-01, ..., -1.8797e-01, 1.1607e+00, 9.2088e-01]], [[ 3.5336e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4178e+00, -2.3004e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.1436e+00, -3.3289e-01, 1.3263e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 8.2124e-01, -3.2162e+00, -2.9845e+00, ..., -2.0351e+00, -3.4028e+38, -3.4028e+38], [ 9.6905e-01, -3.6250e+00, -3.6459e+00, ..., -2.2789e+00, -2.3357e+00, -3.4028e+38], [ 1.0930e+00, -1.7560e+00, -1.9461e+00, ..., -1.0655e+00, -2.9021e+00, -2.2092e-01]]]]) attn_weights tensor([[[[ 1.5595e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.5765e-01, -4.0991e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.5063e-02, -3.4246e+00, -4.1524e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-5.9888e-01, -2.0496e+00, -1.3279e+00, ..., -3.4410e+00, -3.4028e+38, -3.4028e+38], [-9.2254e-01, -2.9364e+00, -1.4567e+00, ..., -3.0546e+00, -3.3132e+00, -3.4028e+38], [-1.1129e+00, -2.3744e+00, -1.7321e+00, ..., -2.9090e+00, -2.5140e+00, -4.1522e+00]], [[ 6.9327e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 8.9727e-01, -2.4576e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 8.3690e-01, -2.7503e+00, -4.1970e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.1480e+00, -3.4138e+00, -3.0397e+00, ..., -1.6469e+00, -3.4028e+38, -3.4028e+38], [ 1.0910e+00, -3.7025e+00, -3.0896e+00, ..., -3.4788e+00, -1.2586e+00, -3.4028e+38], [-1.0161e+00, -3.8263e+00, -3.3365e+00, ..., -2.7629e+00, -1.9914e+00, -3.0287e+00]], [[ 9.2910e-02, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.5609e-01, -2.7191e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.8650e-01, -2.6593e+00, -3.1961e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.3325e-01, -2.9602e+00, -2.5710e+00, ..., -3.8998e+00, -3.4028e+38, -3.4028e+38], [ 4.7021e-01, -2.7205e+00, -2.8626e+00, ..., -3.1182e+00, -2.8122e+00, -3.4028e+38], [ 1.7110e-01, -2.6445e+00, -2.3916e+00, ..., -3.8227e+00, -3.5177e+00, -2.4957e+00]], ..., [[ 7.6010e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.0351e+00, 3.5953e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.7429e+00, -2.4632e+00, -6.4991e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.7784e+00, -1.0140e+01, -4.4584e+00, ..., -5.3343e-01, -3.4028e+38, -3.4028e+38], [ 5.0191e+00, -1.3655e+01, -8.5537e+00, ..., -1.9203e+00, 1.2180e+00, -3.4028e+38], [ 3.9097e+00, -9.0159e+00, -1.9880e+00, ..., -1.2924e+00, -2.5101e+00, -8.1018e-01]], [[ 3.5066e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.2273e+00, -1.5272e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.4265e+00, -2.6305e+00, -1.3850e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.9407e+00, -3.6736e+00, -2.4991e+00, ..., -1.7253e+00, -3.4028e+38, -3.4028e+38], [ 3.0804e+00, -3.3241e+00, -3.2150e+00, ..., -2.3451e+00, -1.0231e+00, -3.4028e+38], [ 2.9385e+00, -2.9038e+00, -4.0955e-01, ..., -1.1902e+00, -4.6012e-01, -1.0046e+00]], [[ 3.7192e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.4048e-01, -1.7917e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-4.1549e-01, -4.7461e-01, -3.3203e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.0951e-01, -1.7285e+00, -2.3677e+00, ..., -3.8545e+00, -3.4028e+38, -3.4028e+38], [-1.5241e-01, -1.6843e+00, -2.1289e+00, ..., -3.7978e+00, -2.6874e+00, -3.4028e+38], [-4.2704e-01, -1.9172e+00, -2.4153e+00, ..., -4.7899e+00, -2.5532e+00, -3.6891e+00]]], [[[ 1.5595e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.5765e-01, -4.0991e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.5063e-02, -3.4246e+00, -4.1524e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-5.9888e-01, -2.0496e+00, -1.3279e+00, ..., -3.4410e+00, -3.4028e+38, -3.4028e+38], [-9.2254e-01, -2.9364e+00, -1.4567e+00, ..., -3.0546e+00, -3.3132e+00, -3.4028e+38], [-1.1129e+00, -2.3744e+00, -1.7321e+00, ..., -2.9090e+00, -2.5140e+00, -4.1522e+00]], [[ 6.9327e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 8.9727e-01, -2.4576e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 8.3690e-01, -2.7503e+00, -4.1970e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.1480e+00, -3.4138e+00, -3.0397e+00, ..., -1.6469e+00, -3.4028e+38, -3.4028e+38], [ 1.0910e+00, -3.7025e+00, -3.0896e+00, ..., -3.4788e+00, -1.2586e+00, -3.4028e+38], [-1.0161e+00, -3.8263e+00, -3.3365e+00, ..., -2.7629e+00, -1.9914e+00, -3.0287e+00]], [[ 9.2910e-02, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.5609e-01, -2.7191e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.8650e-01, -2.6593e+00, -3.1961e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.3325e-01, -2.9602e+00, -2.5710e+00, ..., -3.8998e+00, -3.4028e+38, -3.4028e+38], [ 4.7021e-01, -2.7205e+00, -2.8626e+00, ..., -3.1182e+00, -2.8122e+00, -3.4028e+38], [ 1.7110e-01, -2.6445e+00, -2.3916e+00, ..., -3.8227e+00, -3.5177e+00, -2.4957e+00]], ..., [[ 7.6010e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.0351e+00, 3.5953e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.7429e+00, -2.4632e+00, -6.4991e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.7784e+00, -1.0140e+01, -4.4584e+00, ..., -5.3343e-01, -3.4028e+38, -3.4028e+38], [ 5.0191e+00, -1.3655e+01, -8.5537e+00, ..., -1.9203e+00, 1.2180e+00, -3.4028e+38], [ 3.9097e+00, -9.0159e+00, -1.9880e+00, ..., -1.2924e+00, -2.5101e+00, -8.1018e-01]], [[ 3.5066e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.2273e+00, -1.5272e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.4265e+00, -2.6305e+00, -1.3850e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.9407e+00, -3.6736e+00, -2.4991e+00, ..., -1.7253e+00, -3.4028e+38, -3.4028e+38], [ 3.0804e+00, -3.3241e+00, -3.2150e+00, ..., -2.3451e+00, -1.0231e+00, -3.4028e+38], [ 2.9385e+00, -2.9038e+00, -4.0955e-01, ..., -1.1902e+00, -4.6012e-01, -1.0046e+00]], [[ 3.7192e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.4048e-01, -1.7917e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-4.1549e-01, -4.7461e-01, -3.3203e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.0951e-01, -1.7285e+00, -2.3677e+00, ..., -3.8545e+00, -3.4028e+38, -3.4028e+38], [-1.5241e-01, -1.6843e+00, -2.1289e+00, ..., -3.7978e+00, -2.6874e+00, -3.4028e+38], [-4.2704e-01, -1.9172e+00, -2.4153e+00, ..., -4.7899e+00, -2.5532e+00, -3.6891e+00]]], [[[ 1.5595e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.5765e-01, -4.0991e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.5063e-02, -3.4246e+00, -4.1524e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-5.9888e-01, -2.0496e+00, -1.3279e+00, ..., -3.4410e+00, -3.4028e+38, -3.4028e+38], [-9.2254e-01, -2.9364e+00, -1.4567e+00, ..., -3.0546e+00, -3.3132e+00, -3.4028e+38], [-1.1129e+00, -2.3744e+00, -1.7321e+00, ..., -2.9090e+00, -2.5140e+00, -4.1522e+00]], [[ 6.9327e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 8.9727e-01, -2.4576e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 8.3690e-01, -2.7503e+00, -4.1970e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.1480e+00, -3.4138e+00, -3.0397e+00, ..., -1.6469e+00, -3.4028e+38, -3.4028e+38], [ 1.0910e+00, -3.7025e+00, -3.0896e+00, ..., -3.4788e+00, -1.2586e+00, -3.4028e+38], [-1.0161e+00, -3.8263e+00, -3.3365e+00, ..., -2.7629e+00, -1.9914e+00, -3.0287e+00]], [[ 9.2910e-02, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.5609e-01, -2.7191e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.8650e-01, -2.6593e+00, -3.1961e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.3325e-01, -2.9602e+00, -2.5710e+00, ..., -3.8998e+00, -3.4028e+38, -3.4028e+38], [ 4.7021e-01, -2.7205e+00, -2.8626e+00, ..., -3.1182e+00, -2.8122e+00, -3.4028e+38], [ 1.7110e-01, -2.6445e+00, -2.3916e+00, ..., -3.8227e+00, -3.5177e+00, -2.4957e+00]], ..., [[ 7.6010e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.0351e+00, 3.5953e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.7429e+00, -2.4632e+00, -6.4991e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.7784e+00, -1.0140e+01, -4.4584e+00, ..., -5.3343e-01, -3.4028e+38, -3.4028e+38], [ 5.0191e+00, -1.3655e+01, -8.5537e+00, ..., -1.9203e+00, 1.2180e+00, -3.4028e+38], [ 3.9097e+00, -9.0159e+00, -1.9880e+00, ..., -1.2924e+00, -2.5101e+00, -8.1018e-01]], [[ 3.5066e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.2273e+00, -1.5272e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.4265e+00, -2.6305e+00, -1.3850e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.9407e+00, -3.6736e+00, -2.4991e+00, ..., -1.7253e+00, -3.4028e+38, -3.4028e+38], [ 3.0804e+00, -3.3241e+00, -3.2150e+00, ..., -2.3451e+00, -1.0231e+00, -3.4028e+38], [ 2.9385e+00, -2.9038e+00, -4.0955e-01, ..., -1.1902e+00, -4.6012e-01, -1.0046e+00]], [[ 3.7192e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.4048e-01, -1.7917e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-4.1549e-01, -4.7461e-01, -3.3203e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.0951e-01, -1.7285e+00, -2.3677e+00, ..., -3.8545e+00, -3.4028e+38, -3.4028e+38], [-1.5241e-01, -1.6843e+00, -2.1289e+00, ..., -3.7978e+00, -2.6874e+00, -3.4028e+38], [-4.2704e-01, -1.9172e+00, -2.4153e+00, ..., -4.7899e+00, -2.5532e+00, -3.6891e+00]]], [[[ 1.5595e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.5765e-01, -4.0991e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.5063e-02, -3.4246e+00, -4.1524e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-5.9888e-01, -2.0496e+00, -1.3279e+00, ..., -3.4410e+00, -3.4028e+38, -3.4028e+38], [-9.2254e-01, -2.9364e+00, -1.4567e+00, ..., -3.0546e+00, -3.3132e+00, -3.4028e+38], [-1.1129e+00, -2.3744e+00, -1.7321e+00, ..., -2.9090e+00, -2.5140e+00, -4.1522e+00]], [[ 6.9327e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 8.9727e-01, -2.4576e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 8.3690e-01, -2.7503e+00, -4.1970e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.1480e+00, -3.4138e+00, -3.0397e+00, ..., -1.6469e+00, -3.4028e+38, -3.4028e+38], [ 1.0910e+00, -3.7025e+00, -3.0896e+00, ..., -3.4788e+00, -1.2586e+00, -3.4028e+38], [-1.0161e+00, -3.8263e+00, -3.3365e+00, ..., -2.7629e+00, -1.9914e+00, -3.0287e+00]], [[ 9.2910e-02, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.5609e-01, -2.7191e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.8650e-01, -2.6593e+00, -3.1961e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.3325e-01, -2.9602e+00, -2.5710e+00, ..., -3.8998e+00, -3.4028e+38, -3.4028e+38], [ 4.7021e-01, -2.7205e+00, -2.8626e+00, ..., -3.1182e+00, -2.8122e+00, -3.4028e+38], [ 1.7110e-01, -2.6445e+00, -2.3916e+00, ..., -3.8227e+00, -3.5177e+00, -2.4957e+00]], ..., [[ 7.6010e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.0351e+00, 3.5953e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.7429e+00, -2.4632e+00, -6.4991e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.7784e+00, -1.0140e+01, -4.4584e+00, ..., -5.3343e-01, -3.4028e+38, -3.4028e+38], [ 5.0191e+00, -1.3655e+01, -8.5537e+00, ..., -1.9203e+00, 1.2180e+00, -3.4028e+38], [ 3.9097e+00, -9.0159e+00, -1.9880e+00, ..., -1.2924e+00, -2.5101e+00, -8.1018e-01]], [[ 3.5066e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.2273e+00, -1.5272e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.4265e+00, -2.6305e+00, -1.3850e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.9407e+00, -3.6736e+00, -2.4991e+00, ..., -1.7253e+00, -3.4028e+38, -3.4028e+38], [ 3.0804e+00, -3.3241e+00, -3.2150e+00, ..., -2.3451e+00, -1.0231e+00, -3.4028e+38], [ 2.9385e+00, -2.9038e+00, -4.0955e-01, ..., -1.1902e+00, -4.6012e-01, -1.0046e+00]], [[ 3.7192e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.4048e-01, -1.7917e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-4.1549e-01, -4.7461e-01, -3.3203e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.0951e-01, -1.7285e+00, -2.3677e+00, ..., -3.8545e+00, -3.4028e+38, -3.4028e+38], [-1.5241e-01, -1.6843e+00, -2.1289e+00, ..., -3.7978e+00, -2.6874e+00, -3.4028e+38], [-4.2704e-01, -1.9172e+00, -2.4153e+00, ..., -4.7899e+00, -2.5532e+00, -3.6891e+00]]], [[[ 1.5595e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.5765e-01, -4.0991e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-2.5063e-02, -3.4246e+00, -4.1524e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-5.9888e-01, -2.0496e+00, -1.3279e+00, ..., -3.4410e+00, -3.4028e+38, -3.4028e+38], [-9.2253e-01, -2.9364e+00, -1.4567e+00, ..., -3.0546e+00, -3.3132e+00, -3.4028e+38], [-1.1129e+00, -2.3744e+00, -1.7321e+00, ..., -2.9090e+00, -2.5140e+00, -4.1522e+00]], [[ 6.9327e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 8.9727e-01, -2.4576e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 8.3690e-01, -2.7503e+00, -4.1970e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.1480e+00, -3.4138e+00, -3.0397e+00, ..., -1.6469e+00, -3.4028e+38, -3.4028e+38], [ 1.0910e+00, -3.7025e+00, -3.0896e+00, ..., -3.4788e+00, -1.2586e+00, -3.4028e+38], [-1.0161e+00, -3.8262e+00, -3.3365e+00, ..., -2.7629e+00, -1.9914e+00, -3.0287e+00]], [[ 9.2910e-02, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.5609e-01, -2.7191e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.8650e-01, -2.6593e+00, -3.1961e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.3325e-01, -2.9602e+00, -2.5710e+00, ..., -3.8998e+00, -3.4028e+38, -3.4028e+38], [ 4.7021e-01, -2.7205e+00, -2.8626e+00, ..., -3.1182e+00, -2.8122e+00, -3.4028e+38], [ 1.7110e-01, -2.6445e+00, -2.3916e+00, ..., -3.8227e+00, -3.5177e+00, -2.4957e+00]], ..., [[ 7.6010e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.0351e+00, 3.5953e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.7429e+00, -2.4632e+00, -6.4992e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.7784e+00, -1.0140e+01, -4.4584e+00, ..., -5.3343e-01, -3.4028e+38, -3.4028e+38], [ 5.0191e+00, -1.3655e+01, -8.5537e+00, ..., -1.9203e+00, 1.2181e+00, -3.4028e+38], [ 3.9097e+00, -9.0159e+00, -1.9880e+00, ..., -1.2924e+00, -2.5101e+00, -8.1019e-01]], [[ 3.5066e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.2273e+00, -1.5272e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.4265e+00, -2.6305e+00, -1.3850e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.9407e+00, -3.6736e+00, -2.4991e+00, ..., -1.7253e+00, -3.4028e+38, -3.4028e+38], [ 3.0804e+00, -3.3241e+00, -3.2150e+00, ..., -2.3451e+00, -1.0231e+00, -3.4028e+38], [ 2.9385e+00, -2.9038e+00, -4.0954e-01, ..., -1.1902e+00, -4.6011e-01, -1.0046e+00]], [[ 3.7192e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-1.4048e-01, -1.7917e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-4.1549e-01, -4.7461e-01, -3.3202e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-1.0951e-01, -1.7285e+00, -2.3677e+00, ..., -3.8545e+00, -3.4028e+38, -3.4028e+38], [-1.5241e-01, -1.6843e+00, -2.1289e+00, ..., -3.7978e+00, -2.6874e+00, -3.4028e+38], [-4.2705e-01, -1.9172e+00, -2.4153e+00, ..., -4.7899e+00, -2.5532e+00, -3.6891e+00]]]]) attn_weights tensor([[[[ 6.4607e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.9392e-01, -3.9598e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-4.5956e-01, -2.2953e+00, -4.9260e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-5.9144e-01, -3.6522e+00, -2.6094e+00, ..., -3.9763e+00, -3.4028e+38, -3.4028e+38], [-9.4251e-01, -3.9073e+00, -3.7773e+00, ..., -9.4786e-01, -2.6399e+00, -3.4028e+38], [-4.7146e-01, -8.0164e+00, -6.1332e+00, ..., -1.7563e+00, -1.7872e+00, -5.8059e+00]], [[ 6.8526e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.8190e+00, -6.0814e-02, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.2354e+00, -7.5352e-01, -6.0059e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.8032e+00, -3.0752e+00, -2.0034e+00, ..., -8.3330e-01, -3.4028e+38, -3.4028e+38], [ 4.0580e+00, -3.0920e+00, -1.7418e+00, ..., -1.0613e+00, 9.2449e-01, -3.4028e+38], [ 3.0283e+00, -3.5681e+00, -1.3349e+00, ..., -1.7087e+00, 8.4612e-02, -4.1233e-02]], [[ 1.3787e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 6.3006e+00, 8.0642e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 6.4115e+00, -1.2489e+00, -4.7462e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 6.9786e+00, -4.1326e+00, -3.9646e+00, ..., 7.2068e-01, -3.4028e+38, -3.4028e+38], [ 7.0681e+00, -5.8946e+00, -5.8948e+00, ..., -4.2750e-01, 2.5653e+00, -3.4028e+38], [ 6.0738e+00, -5.9986e+00, -2.3732e+00, ..., -5.3912e-02, 3.9439e-01, 7.3023e-02]], ..., [[ 5.0789e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 7.2909e-01, -1.9870e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.4326e-01, -1.6554e-01, -1.4205e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 6.5270e-01, -2.5560e+00, -2.6788e+00, ..., -2.3513e+00, -3.4028e+38, -3.4028e+38], [ 5.3415e-01, -2.2216e+00, -2.0947e+00, ..., -1.4977e+00, -2.2002e+00, -3.4028e+38], [ 5.3781e-01, -1.6909e+00, -2.2131e+00, ..., -2.5316e+00, -2.3404e+00, -2.2779e+00]], [[ 1.0446e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.3920e+00, 1.2534e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.2788e+00, -7.2871e-01, -1.2566e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 5.3586e+00, -6.3253e+00, -2.9825e+00, ..., 8.0093e-02, -3.4028e+38, -3.4028e+38], [ 5.1771e+00, -6.8257e+00, -4.1586e+00, ..., -3.3961e-01, 2.1551e+00, -3.4028e+38], [ 3.1287e+00, -5.8198e+00, -2.4226e+00, ..., -1.7002e+00, -1.3727e+00, -1.3577e+00]], [[ 7.0237e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.3685e+00, -1.7167e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.5399e+00, -2.6213e+00, -2.2255e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.2013e+00, -3.5816e+00, -4.5842e+00, ..., -2.2539e+00, -3.4028e+38, -3.4028e+38], [ 3.3943e+00, -3.5959e+00, -4.4567e+00, ..., -2.2558e+00, -3.1685e-01, -3.4028e+38], [ 3.2275e+00, -4.1261e+00, 2.9801e-01, ..., -1.0985e+00, -2.1517e+00, -1.4103e+00]]], [[[ 6.4607e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.9392e-01, -3.9598e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-4.5956e-01, -2.2953e+00, -4.9260e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-5.9144e-01, -3.6522e+00, -2.6094e+00, ..., -3.9763e+00, -3.4028e+38, -3.4028e+38], [-9.4251e-01, -3.9073e+00, -3.7773e+00, ..., -9.4786e-01, -2.6399e+00, -3.4028e+38], [-4.7146e-01, -8.0164e+00, -6.1332e+00, ..., -1.7563e+00, -1.7872e+00, -5.8059e+00]], [[ 6.8526e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.8190e+00, -6.0814e-02, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.2354e+00, -7.5352e-01, -6.0059e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.8032e+00, -3.0752e+00, -2.0034e+00, ..., -8.3330e-01, -3.4028e+38, -3.4028e+38], [ 4.0580e+00, -3.0920e+00, -1.7418e+00, ..., -1.0613e+00, 9.2449e-01, -3.4028e+38], [ 3.0283e+00, -3.5681e+00, -1.3349e+00, ..., -1.7087e+00, 8.4612e-02, -4.1233e-02]], [[ 1.3787e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 6.3006e+00, 8.0642e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 6.4115e+00, -1.2489e+00, -4.7462e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 6.9786e+00, -4.1326e+00, -3.9646e+00, ..., 7.2068e-01, -3.4028e+38, -3.4028e+38], [ 7.0681e+00, -5.8946e+00, -5.8948e+00, ..., -4.2750e-01, 2.5653e+00, -3.4028e+38], [ 6.0738e+00, -5.9986e+00, -2.3732e+00, ..., -5.3912e-02, 3.9439e-01, 7.3023e-02]], ..., [[ 5.0789e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 7.2909e-01, -1.9870e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.4326e-01, -1.6554e-01, -1.4205e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 6.5270e-01, -2.5560e+00, -2.6788e+00, ..., -2.3513e+00, -3.4028e+38, -3.4028e+38], [ 5.3415e-01, -2.2216e+00, -2.0947e+00, ..., -1.4977e+00, -2.2002e+00, -3.4028e+38], [ 5.3781e-01, -1.6909e+00, -2.2131e+00, ..., -2.5316e+00, -2.3404e+00, -2.2779e+00]], [[ 1.0446e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.3920e+00, 1.2534e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.2788e+00, -7.2871e-01, -1.2566e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 5.3586e+00, -6.3253e+00, -2.9825e+00, ..., 8.0093e-02, -3.4028e+38, -3.4028e+38], [ 5.1771e+00, -6.8257e+00, -4.1586e+00, ..., -3.3961e-01, 2.1551e+00, -3.4028e+38], [ 3.1287e+00, -5.8198e+00, -2.4226e+00, ..., -1.7002e+00, -1.3727e+00, -1.3577e+00]], [[ 7.0237e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.3685e+00, -1.7167e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.5399e+00, -2.6213e+00, -2.2255e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.2013e+00, -3.5816e+00, -4.5842e+00, ..., -2.2539e+00, -3.4028e+38, -3.4028e+38], [ 3.3943e+00, -3.5959e+00, -4.4567e+00, ..., -2.2558e+00, -3.1685e-01, -3.4028e+38], [ 3.2275e+00, -4.1261e+00, 2.9801e-01, ..., -1.0985e+00, -2.1517e+00, -1.4103e+00]]], [[[ 6.4607e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.9392e-01, -3.9598e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-4.5956e-01, -2.2953e+00, -4.9260e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-5.9144e-01, -3.6522e+00, -2.6094e+00, ..., -3.9763e+00, -3.4028e+38, -3.4028e+38], [-9.4251e-01, -3.9073e+00, -3.7773e+00, ..., -9.4786e-01, -2.6399e+00, -3.4028e+38], [-4.7146e-01, -8.0164e+00, -6.1332e+00, ..., -1.7563e+00, -1.7872e+00, -5.8059e+00]], [[ 6.8526e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.8190e+00, -6.0814e-02, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.2354e+00, -7.5352e-01, -6.0059e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.8032e+00, -3.0752e+00, -2.0034e+00, ..., -8.3330e-01, -3.4028e+38, -3.4028e+38], [ 4.0580e+00, -3.0920e+00, -1.7418e+00, ..., -1.0613e+00, 9.2449e-01, -3.4028e+38], [ 3.0283e+00, -3.5681e+00, -1.3349e+00, ..., -1.7087e+00, 8.4612e-02, -4.1233e-02]], [[ 1.3787e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 6.3006e+00, 8.0642e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 6.4115e+00, -1.2489e+00, -4.7462e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 6.9786e+00, -4.1326e+00, -3.9646e+00, ..., 7.2068e-01, -3.4028e+38, -3.4028e+38], [ 7.0681e+00, -5.8946e+00, -5.8948e+00, ..., -4.2750e-01, 2.5653e+00, -3.4028e+38], [ 6.0738e+00, -5.9986e+00, -2.3732e+00, ..., -5.3912e-02, 3.9439e-01, 7.3023e-02]], ..., [[ 5.0789e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 7.2909e-01, -1.9870e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.4326e-01, -1.6554e-01, -1.4205e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 6.5270e-01, -2.5560e+00, -2.6788e+00, ..., -2.3513e+00, -3.4028e+38, -3.4028e+38], [ 5.3415e-01, -2.2216e+00, -2.0947e+00, ..., -1.4977e+00, -2.2002e+00, -3.4028e+38], [ 5.3781e-01, -1.6909e+00, -2.2131e+00, ..., -2.5316e+00, -2.3404e+00, -2.2779e+00]], [[ 1.0446e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.3920e+00, 1.2534e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.2788e+00, -7.2871e-01, -1.2566e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 5.3586e+00, -6.3253e+00, -2.9825e+00, ..., 8.0093e-02, -3.4028e+38, -3.4028e+38], [ 5.1771e+00, -6.8257e+00, -4.1586e+00, ..., -3.3961e-01, 2.1551e+00, -3.4028e+38], [ 3.1287e+00, -5.8198e+00, -2.4226e+00, ..., -1.7002e+00, -1.3727e+00, -1.3577e+00]], [[ 7.0237e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.3685e+00, -1.7167e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.5399e+00, -2.6213e+00, -2.2255e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.2013e+00, -3.5816e+00, -4.5842e+00, ..., -2.2539e+00, -3.4028e+38, -3.4028e+38], [ 3.3943e+00, -3.5959e+00, -4.4567e+00, ..., -2.2558e+00, -3.1685e-01, -3.4028e+38], [ 3.2275e+00, -4.1261e+00, 2.9801e-01, ..., -1.0985e+00, -2.1517e+00, -1.4103e+00]]], [[[ 6.4607e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.9392e-01, -3.9598e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-4.5956e-01, -2.2953e+00, -4.9260e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-5.9144e-01, -3.6522e+00, -2.6094e+00, ..., -3.9763e+00, -3.4028e+38, -3.4028e+38], [-9.4251e-01, -3.9073e+00, -3.7773e+00, ..., -9.4786e-01, -2.6399e+00, -3.4028e+38], [-4.7146e-01, -8.0164e+00, -6.1332e+00, ..., -1.7563e+00, -1.7872e+00, -5.8059e+00]], [[ 6.8526e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.8190e+00, -6.0814e-02, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.2354e+00, -7.5352e-01, -6.0059e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.8032e+00, -3.0752e+00, -2.0034e+00, ..., -8.3330e-01, -3.4028e+38, -3.4028e+38], [ 4.0580e+00, -3.0920e+00, -1.7418e+00, ..., -1.0613e+00, 9.2449e-01, -3.4028e+38], [ 3.0283e+00, -3.5681e+00, -1.3349e+00, ..., -1.7087e+00, 8.4612e-02, -4.1233e-02]], [[ 1.3787e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 6.3006e+00, 8.0642e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 6.4115e+00, -1.2489e+00, -4.7462e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 6.9786e+00, -4.1326e+00, -3.9646e+00, ..., 7.2068e-01, -3.4028e+38, -3.4028e+38], [ 7.0681e+00, -5.8946e+00, -5.8948e+00, ..., -4.2750e-01, 2.5653e+00, -3.4028e+38], [ 6.0738e+00, -5.9986e+00, -2.3732e+00, ..., -5.3912e-02, 3.9439e-01, 7.3023e-02]], ..., [[ 5.0789e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 7.2909e-01, -1.9870e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.4326e-01, -1.6554e-01, -1.4205e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 6.5270e-01, -2.5560e+00, -2.6788e+00, ..., -2.3513e+00, -3.4028e+38, -3.4028e+38], [ 5.3415e-01, -2.2216e+00, -2.0947e+00, ..., -1.4977e+00, -2.2002e+00, -3.4028e+38], [ 5.3781e-01, -1.6909e+00, -2.2131e+00, ..., -2.5316e+00, -2.3404e+00, -2.2779e+00]], [[ 1.0446e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.3920e+00, 1.2534e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.2788e+00, -7.2871e-01, -1.2566e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 5.3586e+00, -6.3253e+00, -2.9825e+00, ..., 8.0093e-02, -3.4028e+38, -3.4028e+38], [ 5.1771e+00, -6.8257e+00, -4.1586e+00, ..., -3.3961e-01, 2.1551e+00, -3.4028e+38], [ 3.1287e+00, -5.8198e+00, -2.4226e+00, ..., -1.7002e+00, -1.3727e+00, -1.3577e+00]], [[ 7.0237e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.3685e+00, -1.7167e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.5399e+00, -2.6213e+00, -2.2255e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.2013e+00, -3.5816e+00, -4.5842e+00, ..., -2.2539e+00, -3.4028e+38, -3.4028e+38], [ 3.3943e+00, -3.5959e+00, -4.4567e+00, ..., -2.2558e+00, -3.1685e-01, -3.4028e+38], [ 3.2275e+00, -4.1261e+00, 2.9801e-01, ..., -1.0985e+00, -2.1517e+00, -1.4103e+00]]], [[[ 6.4607e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-7.9392e-01, -3.9598e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [-4.5956e-01, -2.2953e+00, -4.9260e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [-5.9144e-01, -3.6522e+00, -2.6094e+00, ..., -3.9763e+00, -3.4028e+38, -3.4028e+38], [-9.4251e-01, -3.9073e+00, -3.7773e+00, ..., -9.4785e-01, -2.6399e+00, -3.4028e+38], [-4.7146e-01, -8.0164e+00, -6.1332e+00, ..., -1.7563e+00, -1.7872e+00, -5.8059e+00]], [[ 6.8526e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.8190e+00, -6.0810e-02, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.2354e+00, -7.5352e-01, -6.0059e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.8032e+00, -3.0752e+00, -2.0034e+00, ..., -8.3331e-01, -3.4028e+38, -3.4028e+38], [ 4.0580e+00, -3.0920e+00, -1.7418e+00, ..., -1.0614e+00, 9.2449e-01, -3.4028e+38], [ 3.0283e+00, -3.5681e+00, -1.3349e+00, ..., -1.7087e+00, 8.4611e-02, -4.1240e-02]], [[ 1.3787e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 6.3006e+00, 8.0642e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 6.4115e+00, -1.2489e+00, -4.7462e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 6.9786e+00, -4.1326e+00, -3.9646e+00, ..., 7.2067e-01, -3.4028e+38, -3.4028e+38], [ 7.0681e+00, -5.8946e+00, -5.8948e+00, ..., -4.2750e-01, 2.5653e+00, -3.4028e+38], [ 6.0738e+00, -5.9986e+00, -2.3732e+00, ..., -5.3917e-02, 3.9439e-01, 7.3023e-02]], ..., [[ 5.0789e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 7.2909e-01, -1.9869e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.4326e-01, -1.6554e-01, -1.4205e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 6.5270e-01, -2.5560e+00, -2.6788e+00, ..., -2.3514e+00, -3.4028e+38, -3.4028e+38], [ 5.3415e-01, -2.2216e+00, -2.0947e+00, ..., -1.4977e+00, -2.2002e+00, -3.4028e+38], [ 5.3781e-01, -1.6909e+00, -2.2131e+00, ..., -2.5316e+00, -2.3404e+00, -2.2779e+00]], [[ 1.0446e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.3920e+00, 1.2534e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.2788e+00, -7.2871e-01, -1.2566e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 5.3586e+00, -6.3253e+00, -2.9825e+00, ..., 8.0093e-02, -3.4028e+38, -3.4028e+38], [ 5.1771e+00, -6.8257e+00, -4.1586e+00, ..., -3.3962e-01, 2.1551e+00, -3.4028e+38], [ 3.1287e+00, -5.8198e+00, -2.4226e+00, ..., -1.7002e+00, -1.3727e+00, -1.3577e+00]], [[ 7.0237e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.3685e+00, -1.7167e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.5399e+00, -2.6213e+00, -2.2255e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.2013e+00, -3.5816e+00, -4.5842e+00, ..., -2.2539e+00, -3.4028e+38, -3.4028e+38], [ 3.3943e+00, -3.5960e+00, -4.4567e+00, ..., -2.2558e+00, -3.1685e-01, -3.4028e+38], [ 3.2275e+00, -4.1261e+00, 2.9801e-01, ..., -1.0985e+00, -2.1517e+00, -1.4103e+00]]]]) attn_weights tensor([[[[ 1.1839e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.2352e+00, -1.8526e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.1215e+00, -1.1034e+00, -1.1380e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.0699e+00, -2.2538e+00, -2.9190e+00, ..., -2.7522e+00, -3.4028e+38, -3.4028e+38], [ 1.2503e+00, -2.3520e+00, -3.0299e+00, ..., -3.9587e+00, -2.3545e+00, -3.4028e+38], [ 1.1445e+00, -2.4599e+00, -1.4675e+00, ..., -4.5715e+00, -2.6766e+00, -3.2961e+00]], [[ 9.1653e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.4314e+00, 1.4052e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.8482e+00, -1.1521e+00, -2.2733e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.9443e+00, -2.2000e+00, -2.6604e+00, ..., 3.7069e-01, -3.4028e+38, -3.4028e+38], [ 5.1623e+00, -2.4533e+00, -2.8417e+00, ..., 1.8455e-01, 2.3588e+00, -3.4028e+38], [ 2.5013e+00, -3.2726e+00, -5.2775e-01, ..., 3.4743e-02, -4.2228e-01, -1.3789e+00]], [[ 5.5456e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.7686e+00, -5.9669e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.0608e+00, -2.9295e-01, -1.9495e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.2496e+00, -5.6383e-01, -1.7735e+00, ..., -7.2414e-01, -3.4028e+38, -3.4028e+38], [ 2.3608e+00, -4.4634e-01, -2.1191e+00, ..., -1.3539e+00, -1.7769e+00, -3.4028e+38], [ 1.9967e+00, -1.8365e-01, -1.5309e+00, ..., -9.5818e-01, -1.9410e+00, -1.3713e+00]], ..., [[ 4.1511e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4833e+00, -1.8749e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.2216e+00, -2.0234e+00, -2.1622e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.4239e+00, -3.5226e+00, -3.8543e+00, ..., 2.9924e-01, -3.4028e+38, -3.4028e+38], [ 1.5677e+00, -3.4006e+00, -3.4238e+00, ..., -1.7730e-01, -6.5243e-01, -3.4028e+38], [ 1.1460e+00, -2.7953e+00, -1.9780e+00, ..., -1.0973e+00, -9.9403e-01, -1.8633e+00]], [[ 4.7874e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.5284e+00, -8.1035e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4687e+00, -1.4795e+00, -1.8821e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.4817e+00, -2.0753e+00, -2.2936e+00, ..., -7.7886e-01, -3.4028e+38, -3.4028e+38], [ 1.3715e+00, -2.6386e+00, -2.7770e+00, ..., -1.5484e+00, -1.2749e+00, -3.4028e+38], [ 1.0764e+00, -1.5915e+00, -1.0792e+00, ..., -1.6231e+00, -1.4165e+00, -8.4046e-01]], [[ 9.3109e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 9.6087e-01, -2.6589e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4291e+00, -2.2902e+00, -3.5433e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.7776e+00, -2.7550e+00, -3.5866e+00, ..., -6.7503e-01, -3.4028e+38, -3.4028e+38], [ 1.5765e+00, -2.7960e+00, -3.4092e+00, ..., -1.9036e+00, -2.3868e+00, -3.4028e+38], [ 3.7332e-01, -2.6504e+00, -3.4292e+00, ..., -2.2849e+00, -2.7734e+00, -3.7061e+00]]], [[[ 1.1839e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.2352e+00, -1.8526e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.1215e+00, -1.1034e+00, -1.1380e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.0699e+00, -2.2538e+00, -2.9190e+00, ..., -2.7522e+00, -3.4028e+38, -3.4028e+38], [ 1.2503e+00, -2.3520e+00, -3.0299e+00, ..., -3.9587e+00, -2.3545e+00, -3.4028e+38], [ 1.1445e+00, -2.4599e+00, -1.4675e+00, ..., -4.5715e+00, -2.6766e+00, -3.2961e+00]], [[ 9.1653e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.4314e+00, 1.4052e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.8482e+00, -1.1521e+00, -2.2733e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.9443e+00, -2.2000e+00, -2.6604e+00, ..., 3.7069e-01, -3.4028e+38, -3.4028e+38], [ 5.1623e+00, -2.4533e+00, -2.8417e+00, ..., 1.8455e-01, 2.3588e+00, -3.4028e+38], [ 2.5013e+00, -3.2726e+00, -5.2775e-01, ..., 3.4743e-02, -4.2228e-01, -1.3789e+00]], [[ 5.5456e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.7686e+00, -5.9669e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.0608e+00, -2.9295e-01, -1.9495e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.2496e+00, -5.6383e-01, -1.7735e+00, ..., -7.2414e-01, -3.4028e+38, -3.4028e+38], [ 2.3608e+00, -4.4634e-01, -2.1191e+00, ..., -1.3539e+00, -1.7769e+00, -3.4028e+38], [ 1.9967e+00, -1.8365e-01, -1.5309e+00, ..., -9.5818e-01, -1.9410e+00, -1.3713e+00]], ..., [[ 4.1511e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4833e+00, -1.8749e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.2216e+00, -2.0234e+00, -2.1622e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.4239e+00, -3.5226e+00, -3.8543e+00, ..., 2.9924e-01, -3.4028e+38, -3.4028e+38], [ 1.5677e+00, -3.4006e+00, -3.4238e+00, ..., -1.7730e-01, -6.5243e-01, -3.4028e+38], [ 1.1460e+00, -2.7953e+00, -1.9780e+00, ..., -1.0973e+00, -9.9403e-01, -1.8633e+00]], [[ 4.7874e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.5284e+00, -8.1035e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4687e+00, -1.4795e+00, -1.8821e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.4817e+00, -2.0753e+00, -2.2936e+00, ..., -7.7886e-01, -3.4028e+38, -3.4028e+38], [ 1.3715e+00, -2.6386e+00, -2.7770e+00, ..., -1.5484e+00, -1.2749e+00, -3.4028e+38], [ 1.0764e+00, -1.5915e+00, -1.0792e+00, ..., -1.6231e+00, -1.4165e+00, -8.4046e-01]], [[ 9.3109e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 9.6087e-01, -2.6589e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4291e+00, -2.2902e+00, -3.5433e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.7776e+00, -2.7550e+00, -3.5866e+00, ..., -6.7503e-01, -3.4028e+38, -3.4028e+38], [ 1.5765e+00, -2.7960e+00, -3.4092e+00, ..., -1.9036e+00, -2.3868e+00, -3.4028e+38], [ 3.7332e-01, -2.6504e+00, -3.4292e+00, ..., -2.2849e+00, -2.7734e+00, -3.7061e+00]]], [[[ 1.1839e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.2352e+00, -1.8526e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.1215e+00, -1.1034e+00, -1.1380e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.0699e+00, -2.2538e+00, -2.9190e+00, ..., -2.7522e+00, -3.4028e+38, -3.4028e+38], [ 1.2503e+00, -2.3520e+00, -3.0299e+00, ..., -3.9587e+00, -2.3545e+00, -3.4028e+38], [ 1.1445e+00, -2.4599e+00, -1.4675e+00, ..., -4.5715e+00, -2.6766e+00, -3.2961e+00]], [[ 9.1653e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.4314e+00, 1.4052e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.8482e+00, -1.1521e+00, -2.2733e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.9443e+00, -2.2000e+00, -2.6604e+00, ..., 3.7069e-01, -3.4028e+38, -3.4028e+38], [ 5.1623e+00, -2.4533e+00, -2.8417e+00, ..., 1.8455e-01, 2.3588e+00, -3.4028e+38], [ 2.5013e+00, -3.2726e+00, -5.2775e-01, ..., 3.4743e-02, -4.2228e-01, -1.3789e+00]], [[ 5.5456e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.7686e+00, -5.9669e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.0608e+00, -2.9295e-01, -1.9495e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.2496e+00, -5.6383e-01, -1.7735e+00, ..., -7.2414e-01, -3.4028e+38, -3.4028e+38], [ 2.3608e+00, -4.4634e-01, -2.1191e+00, ..., -1.3539e+00, -1.7769e+00, -3.4028e+38], [ 1.9967e+00, -1.8365e-01, -1.5309e+00, ..., -9.5818e-01, -1.9410e+00, -1.3713e+00]], ..., [[ 4.1511e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4833e+00, -1.8749e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.2216e+00, -2.0234e+00, -2.1622e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.4239e+00, -3.5226e+00, -3.8543e+00, ..., 2.9924e-01, -3.4028e+38, -3.4028e+38], [ 1.5677e+00, -3.4006e+00, -3.4238e+00, ..., -1.7730e-01, -6.5243e-01, -3.4028e+38], [ 1.1460e+00, -2.7953e+00, -1.9780e+00, ..., -1.0973e+00, -9.9403e-01, -1.8633e+00]], [[ 4.7874e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.5284e+00, -8.1035e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4687e+00, -1.4795e+00, -1.8821e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.4817e+00, -2.0753e+00, -2.2936e+00, ..., -7.7886e-01, -3.4028e+38, -3.4028e+38], [ 1.3715e+00, -2.6386e+00, -2.7770e+00, ..., -1.5484e+00, -1.2749e+00, -3.4028e+38], [ 1.0764e+00, -1.5915e+00, -1.0792e+00, ..., -1.6231e+00, -1.4165e+00, -8.4046e-01]], [[ 9.3109e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 9.6087e-01, -2.6589e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4291e+00, -2.2902e+00, -3.5433e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.7776e+00, -2.7550e+00, -3.5866e+00, ..., -6.7503e-01, -3.4028e+38, -3.4028e+38], [ 1.5765e+00, -2.7960e+00, -3.4092e+00, ..., -1.9036e+00, -2.3868e+00, -3.4028e+38], [ 3.7332e-01, -2.6504e+00, -3.4292e+00, ..., -2.2849e+00, -2.7734e+00, -3.7061e+00]]], [[[ 1.1839e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.2352e+00, -1.8526e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.1215e+00, -1.1034e+00, -1.1380e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.0699e+00, -2.2538e+00, -2.9190e+00, ..., -2.7522e+00, -3.4028e+38, -3.4028e+38], [ 1.2503e+00, -2.3520e+00, -3.0299e+00, ..., -3.9587e+00, -2.3545e+00, -3.4028e+38], [ 1.1445e+00, -2.4599e+00, -1.4675e+00, ..., -4.5715e+00, -2.6766e+00, -3.2961e+00]], [[ 9.1653e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.4314e+00, 1.4052e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.8482e+00, -1.1521e+00, -2.2733e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.9443e+00, -2.2000e+00, -2.6604e+00, ..., 3.7069e-01, -3.4028e+38, -3.4028e+38], [ 5.1623e+00, -2.4533e+00, -2.8417e+00, ..., 1.8455e-01, 2.3588e+00, -3.4028e+38], [ 2.5013e+00, -3.2726e+00, -5.2775e-01, ..., 3.4743e-02, -4.2228e-01, -1.3789e+00]], [[ 5.5456e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.7686e+00, -5.9669e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.0608e+00, -2.9295e-01, -1.9495e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.2496e+00, -5.6383e-01, -1.7735e+00, ..., -7.2414e-01, -3.4028e+38, -3.4028e+38], [ 2.3608e+00, -4.4634e-01, -2.1191e+00, ..., -1.3539e+00, -1.7769e+00, -3.4028e+38], [ 1.9967e+00, -1.8365e-01, -1.5309e+00, ..., -9.5818e-01, -1.9410e+00, -1.3713e+00]], ..., [[ 4.1511e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4833e+00, -1.8749e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.2216e+00, -2.0234e+00, -2.1622e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.4239e+00, -3.5226e+00, -3.8543e+00, ..., 2.9924e-01, -3.4028e+38, -3.4028e+38], [ 1.5677e+00, -3.4006e+00, -3.4238e+00, ..., -1.7730e-01, -6.5243e-01, -3.4028e+38], [ 1.1460e+00, -2.7953e+00, -1.9780e+00, ..., -1.0973e+00, -9.9403e-01, -1.8633e+00]], [[ 4.7874e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.5284e+00, -8.1035e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4687e+00, -1.4795e+00, -1.8821e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.4817e+00, -2.0753e+00, -2.2936e+00, ..., -7.7886e-01, -3.4028e+38, -3.4028e+38], [ 1.3715e+00, -2.6386e+00, -2.7770e+00, ..., -1.5484e+00, -1.2749e+00, -3.4028e+38], [ 1.0764e+00, -1.5915e+00, -1.0792e+00, ..., -1.6231e+00, -1.4165e+00, -8.4046e-01]], [[ 9.3109e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 9.6087e-01, -2.6589e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4291e+00, -2.2902e+00, -3.5433e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.7776e+00, -2.7550e+00, -3.5866e+00, ..., -6.7503e-01, -3.4028e+38, -3.4028e+38], [ 1.5765e+00, -2.7960e+00, -3.4092e+00, ..., -1.9036e+00, -2.3868e+00, -3.4028e+38], [ 3.7332e-01, -2.6504e+00, -3.4292e+00, ..., -2.2849e+00, -2.7734e+00, -3.7061e+00]]], [[[ 1.1840e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.2352e+00, -1.8526e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.1215e+00, -1.1034e+00, -1.1380e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.0699e+00, -2.2538e+00, -2.9190e+00, ..., -2.7522e+00, -3.4028e+38, -3.4028e+38], [ 1.2503e+00, -2.3520e+00, -3.0299e+00, ..., -3.9587e+00, -2.3545e+00, -3.4028e+38], [ 1.1445e+00, -2.4599e+00, -1.4675e+00, ..., -4.5715e+00, -2.6766e+00, -3.2961e+00]], [[ 9.1653e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.4314e+00, 1.4052e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.8482e+00, -1.1521e+00, -2.2733e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.9443e+00, -2.2000e+00, -2.6604e+00, ..., 3.7069e-01, -3.4028e+38, -3.4028e+38], [ 5.1623e+00, -2.4533e+00, -2.8417e+00, ..., 1.8455e-01, 2.3588e+00, -3.4028e+38], [ 2.5013e+00, -3.2726e+00, -5.2775e-01, ..., 3.4745e-02, -4.2228e-01, -1.3789e+00]], [[ 5.5456e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.7686e+00, -5.9669e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.0608e+00, -2.9295e-01, -1.9495e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.2496e+00, -5.6383e-01, -1.7735e+00, ..., -7.2413e-01, -3.4028e+38, -3.4028e+38], [ 2.3608e+00, -4.4634e-01, -2.1191e+00, ..., -1.3539e+00, -1.7769e+00, -3.4028e+38], [ 1.9967e+00, -1.8365e-01, -1.5309e+00, ..., -9.5818e-01, -1.9410e+00, -1.3713e+00]], ..., [[ 4.1511e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4833e+00, -1.8749e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.2216e+00, -2.0234e+00, -2.1622e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.4239e+00, -3.5226e+00, -3.8543e+00, ..., 2.9924e-01, -3.4028e+38, -3.4028e+38], [ 1.5677e+00, -3.4006e+00, -3.4238e+00, ..., -1.7729e-01, -6.5243e-01, -3.4028e+38], [ 1.1460e+00, -2.7953e+00, -1.9780e+00, ..., -1.0973e+00, -9.9403e-01, -1.8633e+00]], [[ 4.7874e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.5284e+00, -8.1035e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4687e+00, -1.4795e+00, -1.8821e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.4817e+00, -2.0753e+00, -2.2936e+00, ..., -7.7886e-01, -3.4028e+38, -3.4028e+38], [ 1.3715e+00, -2.6386e+00, -2.7770e+00, ..., -1.5484e+00, -1.2749e+00, -3.4028e+38], [ 1.0764e+00, -1.5915e+00, -1.0792e+00, ..., -1.6231e+00, -1.4165e+00, -8.4047e-01]], [[ 9.3109e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 9.6087e-01, -2.6589e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.4291e+00, -2.2902e+00, -3.5433e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.7776e+00, -2.7550e+00, -3.5866e+00, ..., -6.7503e-01, -3.4028e+38, -3.4028e+38], [ 1.5765e+00, -2.7960e+00, -3.4092e+00, ..., -1.9036e+00, -2.3868e+00, -3.4028e+38], [ 3.7332e-01, -2.6504e+00, -3.4292e+00, ..., -2.2849e+00, -2.7734e+00, -3.7061e+00]]]]) attn_weights tensor([[[[ 1.2326e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.9418e+00, -1.0453e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.1731e+00, 7.2706e-01, -1.3961e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.7916e+00, -2.1471e+00, -2.7213e+00, ..., 3.5003e-01, -3.4028e+38, -3.4028e+38], [ 3.0402e+00, -2.7829e+00, -3.0008e+00, ..., -4.4084e-01, 1.0752e+00, -3.4028e+38], [ 2.0144e+00, -3.4351e+00, -2.7223e+00, ..., -8.7706e-02, 1.1748e+00, -2.9702e+00]], [[ 1.2333e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.3506e+00, 1.0742e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1625e+00, 3.2890e-01, -7.2091e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.5396e+00, -2.2646e+00, -3.7860e+00, ..., -2.1670e+00, -3.4028e+38, -3.4028e+38], [ 3.9361e+00, -1.4939e+00, -2.2751e+00, ..., -2.1288e+00, 2.7269e-01, -3.4028e+38], [ 2.5850e+00, -1.3266e+00, -1.1517e+00, ..., -1.7115e+00, -1.4336e+00, -1.6978e+00]], [[ 8.1681e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.6893e+00, -1.3733e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.2223e+00, -3.9066e-01, -9.5447e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.7165e+00, -2.5697e+00, -2.1829e+00, ..., -6.4560e-01, -3.4028e+38, -3.4028e+38], [ 3.0942e+00, -3.8041e+00, -3.5734e+00, ..., -1.2352e+00, -3.6663e-01, -3.4028e+38], [ 1.8164e+00, -3.8503e+00, -3.1246e+00, ..., -7.3449e-01, 1.0787e-01, -2.2610e+00]], ..., [[ 1.6889e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.7467e+00, -4.2717e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.0788e+00, -9.6161e-01, -2.0221e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 5.4608e+00, -2.7451e+00, -3.3223e+00, ..., 8.4800e-01, -3.4028e+38, -3.4028e+38], [ 5.2924e+00, -1.8860e+00, -2.2697e+00, ..., 8.8408e-01, 3.4495e+00, -3.4028e+38], [ 3.1222e+00, -2.4772e+00, -2.3100e+00, ..., 2.6781e-01, 1.1221e+00, -2.4833e+00]], [[ 1.3264e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 9.1998e-01, -2.0401e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 9.1255e-01, -6.0814e-01, -1.8739e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.2184e+00, -2.8972e+00, -2.6823e+00, ..., -2.4023e+00, -3.4028e+38, -3.4028e+38], [ 7.1134e-01, -3.4722e+00, -2.4964e+00, ..., -1.7251e+00, -2.0181e+00, -3.4028e+38], [ 3.0304e-01, -3.4860e+00, -2.3905e+00, ..., -1.7509e+00, -1.0019e+00, -2.4684e+00]], [[ 1.3739e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.8188e+00, 9.6610e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1034e+00, -9.8246e-01, -2.1082e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.8828e+00, -5.3131e-02, -2.1060e+00, ..., -1.8354e+00, -3.4028e+38, -3.4028e+38], [ 4.1489e+00, 1.2443e-01, -2.6470e+00, ..., -2.8027e+00, -1.5234e+00, -3.4028e+38], [ 3.9344e+00, -1.2475e+00, 7.6831e-01, ..., -1.5362e+00, -1.6578e+00, -1.0489e+00]]], [[[ 1.2326e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.9418e+00, -1.0453e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.1731e+00, 7.2706e-01, -1.3961e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.7916e+00, -2.1471e+00, -2.7213e+00, ..., 3.5003e-01, -3.4028e+38, -3.4028e+38], [ 3.0402e+00, -2.7829e+00, -3.0008e+00, ..., -4.4084e-01, 1.0752e+00, -3.4028e+38], [ 2.0144e+00, -3.4351e+00, -2.7223e+00, ..., -8.7706e-02, 1.1748e+00, -2.9702e+00]], [[ 1.2333e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.3506e+00, 1.0742e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1625e+00, 3.2890e-01, -7.2091e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.5396e+00, -2.2646e+00, -3.7860e+00, ..., -2.1670e+00, -3.4028e+38, -3.4028e+38], [ 3.9361e+00, -1.4939e+00, -2.2751e+00, ..., -2.1288e+00, 2.7269e-01, -3.4028e+38], [ 2.5850e+00, -1.3266e+00, -1.1517e+00, ..., -1.7115e+00, -1.4336e+00, -1.6978e+00]], [[ 8.1681e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.6893e+00, -1.3733e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.2223e+00, -3.9066e-01, -9.5447e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.7165e+00, -2.5697e+00, -2.1829e+00, ..., -6.4560e-01, -3.4028e+38, -3.4028e+38], [ 3.0942e+00, -3.8041e+00, -3.5734e+00, ..., -1.2352e+00, -3.6663e-01, -3.4028e+38], [ 1.8164e+00, -3.8503e+00, -3.1246e+00, ..., -7.3449e-01, 1.0787e-01, -2.2610e+00]], ..., [[ 1.6889e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.7467e+00, -4.2717e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.0788e+00, -9.6161e-01, -2.0221e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 5.4608e+00, -2.7451e+00, -3.3223e+00, ..., 8.4800e-01, -3.4028e+38, -3.4028e+38], [ 5.2924e+00, -1.8860e+00, -2.2697e+00, ..., 8.8408e-01, 3.4495e+00, -3.4028e+38], [ 3.1222e+00, -2.4772e+00, -2.3100e+00, ..., 2.6781e-01, 1.1221e+00, -2.4833e+00]], [[ 1.3264e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 9.1998e-01, -2.0401e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 9.1255e-01, -6.0814e-01, -1.8739e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.2184e+00, -2.8972e+00, -2.6823e+00, ..., -2.4023e+00, -3.4028e+38, -3.4028e+38], [ 7.1134e-01, -3.4722e+00, -2.4964e+00, ..., -1.7251e+00, -2.0181e+00, -3.4028e+38], [ 3.0304e-01, -3.4860e+00, -2.3905e+00, ..., -1.7509e+00, -1.0019e+00, -2.4684e+00]], [[ 1.3739e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.8188e+00, 9.6610e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1034e+00, -9.8246e-01, -2.1082e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.8828e+00, -5.3131e-02, -2.1060e+00, ..., -1.8354e+00, -3.4028e+38, -3.4028e+38], [ 4.1489e+00, 1.2443e-01, -2.6470e+00, ..., -2.8027e+00, -1.5234e+00, -3.4028e+38], [ 3.9344e+00, -1.2475e+00, 7.6831e-01, ..., -1.5362e+00, -1.6578e+00, -1.0489e+00]]], [[[ 1.2326e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.9418e+00, -1.0453e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.1731e+00, 7.2706e-01, -1.3961e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.7916e+00, -2.1471e+00, -2.7213e+00, ..., 3.5003e-01, -3.4028e+38, -3.4028e+38], [ 3.0402e+00, -2.7829e+00, -3.0008e+00, ..., -4.4084e-01, 1.0752e+00, -3.4028e+38], [ 2.0144e+00, -3.4351e+00, -2.7223e+00, ..., -8.7706e-02, 1.1748e+00, -2.9702e+00]], [[ 1.2333e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.3506e+00, 1.0742e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1625e+00, 3.2890e-01, -7.2091e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.5396e+00, -2.2646e+00, -3.7860e+00, ..., -2.1670e+00, -3.4028e+38, -3.4028e+38], [ 3.9361e+00, -1.4939e+00, -2.2751e+00, ..., -2.1288e+00, 2.7269e-01, -3.4028e+38], [ 2.5850e+00, -1.3266e+00, -1.1517e+00, ..., -1.7115e+00, -1.4336e+00, -1.6978e+00]], [[ 8.1681e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.6893e+00, -1.3733e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.2223e+00, -3.9066e-01, -9.5447e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.7165e+00, -2.5697e+00, -2.1829e+00, ..., -6.4560e-01, -3.4028e+38, -3.4028e+38], [ 3.0942e+00, -3.8041e+00, -3.5734e+00, ..., -1.2352e+00, -3.6663e-01, -3.4028e+38], [ 1.8164e+00, -3.8503e+00, -3.1246e+00, ..., -7.3449e-01, 1.0787e-01, -2.2610e+00]], ..., [[ 1.6889e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.7467e+00, -4.2717e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.0788e+00, -9.6161e-01, -2.0221e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 5.4608e+00, -2.7451e+00, -3.3223e+00, ..., 8.4800e-01, -3.4028e+38, -3.4028e+38], [ 5.2924e+00, -1.8860e+00, -2.2697e+00, ..., 8.8408e-01, 3.4495e+00, -3.4028e+38], [ 3.1222e+00, -2.4772e+00, -2.3100e+00, ..., 2.6781e-01, 1.1221e+00, -2.4833e+00]], [[ 1.3264e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 9.1998e-01, -2.0401e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 9.1255e-01, -6.0814e-01, -1.8739e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.2184e+00, -2.8972e+00, -2.6823e+00, ..., -2.4023e+00, -3.4028e+38, -3.4028e+38], [ 7.1134e-01, -3.4722e+00, -2.4964e+00, ..., -1.7251e+00, -2.0181e+00, -3.4028e+38], [ 3.0304e-01, -3.4860e+00, -2.3905e+00, ..., -1.7509e+00, -1.0019e+00, -2.4684e+00]], [[ 1.3739e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.8188e+00, 9.6610e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1034e+00, -9.8246e-01, -2.1082e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.8828e+00, -5.3131e-02, -2.1060e+00, ..., -1.8354e+00, -3.4028e+38, -3.4028e+38], [ 4.1489e+00, 1.2443e-01, -2.6470e+00, ..., -2.8027e+00, -1.5234e+00, -3.4028e+38], [ 3.9344e+00, -1.2475e+00, 7.6831e-01, ..., -1.5362e+00, -1.6578e+00, -1.0489e+00]]], [[[ 1.2326e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.9418e+00, -1.0453e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.1731e+00, 7.2706e-01, -1.3961e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.7916e+00, -2.1471e+00, -2.7213e+00, ..., 3.5003e-01, -3.4028e+38, -3.4028e+38], [ 3.0402e+00, -2.7829e+00, -3.0008e+00, ..., -4.4084e-01, 1.0752e+00, -3.4028e+38], [ 2.0144e+00, -3.4351e+00, -2.7223e+00, ..., -8.7706e-02, 1.1748e+00, -2.9702e+00]], [[ 1.2333e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.3506e+00, 1.0742e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1625e+00, 3.2890e-01, -7.2091e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.5396e+00, -2.2646e+00, -3.7860e+00, ..., -2.1670e+00, -3.4028e+38, -3.4028e+38], [ 3.9361e+00, -1.4939e+00, -2.2751e+00, ..., -2.1288e+00, 2.7269e-01, -3.4028e+38], [ 2.5850e+00, -1.3266e+00, -1.1517e+00, ..., -1.7115e+00, -1.4336e+00, -1.6978e+00]], [[ 8.1681e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.6893e+00, -1.3733e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.2223e+00, -3.9066e-01, -9.5447e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.7165e+00, -2.5697e+00, -2.1829e+00, ..., -6.4560e-01, -3.4028e+38, -3.4028e+38], [ 3.0942e+00, -3.8041e+00, -3.5734e+00, ..., -1.2352e+00, -3.6663e-01, -3.4028e+38], [ 1.8164e+00, -3.8503e+00, -3.1246e+00, ..., -7.3449e-01, 1.0787e-01, -2.2610e+00]], ..., [[ 1.6889e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.7467e+00, -4.2717e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.0788e+00, -9.6161e-01, -2.0221e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 5.4608e+00, -2.7451e+00, -3.3223e+00, ..., 8.4800e-01, -3.4028e+38, -3.4028e+38], [ 5.2924e+00, -1.8860e+00, -2.2697e+00, ..., 8.8408e-01, 3.4495e+00, -3.4028e+38], [ 3.1222e+00, -2.4772e+00, -2.3100e+00, ..., 2.6781e-01, 1.1221e+00, -2.4833e+00]], [[ 1.3264e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 9.1998e-01, -2.0401e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 9.1255e-01, -6.0814e-01, -1.8739e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.2184e+00, -2.8972e+00, -2.6823e+00, ..., -2.4023e+00, -3.4028e+38, -3.4028e+38], [ 7.1134e-01, -3.4722e+00, -2.4964e+00, ..., -1.7251e+00, -2.0181e+00, -3.4028e+38], [ 3.0304e-01, -3.4860e+00, -2.3905e+00, ..., -1.7509e+00, -1.0019e+00, -2.4684e+00]], [[ 1.3739e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.8188e+00, 9.6610e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1034e+00, -9.8246e-01, -2.1082e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.8828e+00, -5.3131e-02, -2.1060e+00, ..., -1.8354e+00, -3.4028e+38, -3.4028e+38], [ 4.1489e+00, 1.2443e-01, -2.6470e+00, ..., -2.8027e+00, -1.5234e+00, -3.4028e+38], [ 3.9344e+00, -1.2475e+00, 7.6831e-01, ..., -1.5362e+00, -1.6578e+00, -1.0489e+00]]], [[[ 1.2326e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.9418e+00, -1.0453e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.1731e+00, 7.2706e-01, -1.3961e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.7916e+00, -2.1471e+00, -2.7213e+00, ..., 3.5003e-01, -3.4028e+38, -3.4028e+38], [ 3.0402e+00, -2.7829e+00, -3.0008e+00, ..., -4.4083e-01, 1.0752e+00, -3.4028e+38], [ 2.0144e+00, -3.4351e+00, -2.7223e+00, ..., -8.7704e-02, 1.1748e+00, -2.9702e+00]], [[ 1.2333e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.3506e+00, 1.0742e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1625e+00, 3.2890e-01, -7.2091e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.5396e+00, -2.2646e+00, -3.7860e+00, ..., -2.1670e+00, -3.4028e+38, -3.4028e+38], [ 3.9361e+00, -1.4939e+00, -2.2751e+00, ..., -2.1288e+00, 2.7270e-01, -3.4028e+38], [ 2.5850e+00, -1.3266e+00, -1.1517e+00, ..., -1.7115e+00, -1.4336e+00, -1.6978e+00]], [[ 8.1681e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.6893e+00, -1.3733e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.2223e+00, -3.9066e-01, -9.5447e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.7165e+00, -2.5697e+00, -2.1829e+00, ..., -6.4560e-01, -3.4028e+38, -3.4028e+38], [ 3.0942e+00, -3.8041e+00, -3.5734e+00, ..., -1.2352e+00, -3.6663e-01, -3.4028e+38], [ 1.8164e+00, -3.8503e+00, -3.1246e+00, ..., -7.3449e-01, 1.0787e-01, -2.2610e+00]], ..., [[ 1.6889e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.7467e+00, -4.2717e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 5.0788e+00, -9.6161e-01, -2.0221e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 5.4608e+00, -2.7451e+00, -3.3223e+00, ..., 8.4800e-01, -3.4028e+38, -3.4028e+38], [ 5.2924e+00, -1.8860e+00, -2.2697e+00, ..., 8.8408e-01, 3.4495e+00, -3.4028e+38], [ 3.1222e+00, -2.4772e+00, -2.3100e+00, ..., 2.6781e-01, 1.1221e+00, -2.4833e+00]], [[ 1.3264e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 9.1998e-01, -2.0401e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 9.1255e-01, -6.0814e-01, -1.8739e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 1.2184e+00, -2.8972e+00, -2.6823e+00, ..., -2.4023e+00, -3.4028e+38, -3.4028e+38], [ 7.1134e-01, -3.4722e+00, -2.4964e+00, ..., -1.7251e+00, -2.0181e+00, -3.4028e+38], [ 3.0304e-01, -3.4860e+00, -2.3905e+00, ..., -1.7508e+00, -1.0019e+00, -2.4684e+00]], [[ 1.3739e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.8188e+00, 9.6610e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1034e+00, -9.8245e-01, -2.1082e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.8828e+00, -5.3131e-02, -2.1060e+00, ..., -1.8354e+00, -3.4028e+38, -3.4028e+38], [ 4.1489e+00, 1.2443e-01, -2.6470e+00, ..., -2.8027e+00, -1.5234e+00, -3.4028e+38], [ 3.9344e+00, -1.2475e+00, 7.6831e-01, ..., -1.5362e+00, -1.6578e+00, -1.0489e+00]]]]) attn_weights tensor([[[[ 1.8881e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.2298e+00, -1.3076e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.8242e+00, -2.4116e+00, -3.1160e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.4476e+00, -3.7197e+00, -3.3517e+00, ..., 2.3371e-01, -3.4028e+38, -3.4028e+38], [ 3.6899e+00, -3.4981e+00, -3.6427e+00, ..., 2.9593e-01, 7.7326e-01, -3.4028e+38], [ 2.4215e+00, -2.9721e+00, -3.3145e+00, ..., 4.5769e-01, 2.3140e-02, -2.7213e+00]], [[ 2.1284e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.5454e+00, 1.0637e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.0354e+00, 5.9217e-02, 2.1205e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 5.0357e+00, -2.8943e+00, -3.3918e+00, ..., 4.4465e-01, -3.4028e+38, -3.4028e+38], [ 4.8038e+00, -1.8523e+00, -2.4606e+00, ..., 6.3463e-01, 1.5785e+00, -3.4028e+38], [ 2.9741e+00, -1.3757e+00, -1.8934e+00, ..., 3.3296e-02, -4.0932e-01, -1.0441e+00]], [[ 2.0295e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.5071e+00, 5.4534e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.8420e+00, -5.2520e-01, -1.5990e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.2170e+00, -8.7713e-01, -2.0740e+00, ..., -1.0717e-02, -3.4028e+38, -3.4028e+38], [ 3.6595e+00, -7.8555e-01, -2.3994e+00, ..., -5.5738e-01, 6.0999e-01, -3.4028e+38], [ 2.7088e+00, -5.4943e-01, -8.2674e-01, ..., -3.2392e-01, 2.1910e-01, -9.7538e-01]], ..., [[ 1.3065e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.5816e-01, -1.8347e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.0854e+00, -2.8548e+00, -3.5144e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 9.7506e-01, -2.0979e+00, -2.6546e+00, ..., -1.4572e+00, -3.4028e+38, -3.4028e+38], [ 1.3201e-01, -3.9611e+00, -3.5308e+00, ..., -4.9247e-02, -9.2960e-01, -3.4028e+38], [ 4.8744e-01, -2.4605e+00, -1.0405e+00, ..., -1.2589e+00, -1.1491e+00, -8.9671e-01]], [[ 9.9695e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.3862e+00, -6.7815e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.9141e+00, -1.4110e+00, -1.9299e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.6747e+00, -1.5715e+00, -2.1566e+00, ..., -1.0629e+00, -3.4028e+38, -3.4028e+38], [ 3.9921e+00, -1.4977e+00, -2.1482e+00, ..., 3.6741e-01, 3.7661e-01, -3.4028e+38], [ 2.6573e+00, -2.1113e+00, -1.0212e+00, ..., -4.4855e-01, -8.3410e-01, -2.2498e+00]], [[ 2.3315e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.8503e+00, 3.6000e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1284e+00, 3.0324e-01, -6.2687e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.6108e+00, 5.5104e-01, 1.2587e+00, ..., 1.0846e+00, -3.4028e+38, -3.4028e+38], [ 5.3505e+00, -5.4460e-02, 1.6678e+00, ..., 8.4944e-01, 2.5584e+00, -3.4028e+38], [ 3.3526e+00, -5.9194e-01, 4.5551e-02, ..., 2.4971e+00, 2.6994e+00, 1.4745e-01]]], [[[ 1.8881e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.2298e+00, -1.3076e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.8242e+00, -2.4116e+00, -3.1160e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.4476e+00, -3.7197e+00, -3.3517e+00, ..., 2.3371e-01, -3.4028e+38, -3.4028e+38], [ 3.6899e+00, -3.4981e+00, -3.6427e+00, ..., 2.9593e-01, 7.7326e-01, -3.4028e+38], [ 2.4215e+00, -2.9721e+00, -3.3145e+00, ..., 4.5769e-01, 2.3140e-02, -2.7213e+00]], [[ 2.1284e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.5454e+00, 1.0637e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.0354e+00, 5.9217e-02, 2.1205e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 5.0357e+00, -2.8943e+00, -3.3918e+00, ..., 4.4465e-01, -3.4028e+38, -3.4028e+38], [ 4.8038e+00, -1.8523e+00, -2.4606e+00, ..., 6.3463e-01, 1.5785e+00, -3.4028e+38], [ 2.9741e+00, -1.3757e+00, -1.8934e+00, ..., 3.3296e-02, -4.0932e-01, -1.0441e+00]], [[ 2.0295e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.5071e+00, 5.4534e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.8420e+00, -5.2520e-01, -1.5990e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.2170e+00, -8.7713e-01, -2.0740e+00, ..., -1.0717e-02, -3.4028e+38, -3.4028e+38], [ 3.6595e+00, -7.8555e-01, -2.3994e+00, ..., -5.5738e-01, 6.0999e-01, -3.4028e+38], [ 2.7088e+00, -5.4943e-01, -8.2674e-01, ..., -3.2392e-01, 2.1910e-01, -9.7538e-01]], ..., [[ 1.3065e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.5816e-01, -1.8347e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.0854e+00, -2.8548e+00, -3.5144e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 9.7506e-01, -2.0979e+00, -2.6546e+00, ..., -1.4572e+00, -3.4028e+38, -3.4028e+38], [ 1.3201e-01, -3.9611e+00, -3.5308e+00, ..., -4.9247e-02, -9.2960e-01, -3.4028e+38], [ 4.8744e-01, -2.4605e+00, -1.0405e+00, ..., -1.2589e+00, -1.1491e+00, -8.9671e-01]], [[ 9.9695e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.3862e+00, -6.7815e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.9141e+00, -1.4110e+00, -1.9299e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.6747e+00, -1.5715e+00, -2.1566e+00, ..., -1.0629e+00, -3.4028e+38, -3.4028e+38], [ 3.9921e+00, -1.4977e+00, -2.1482e+00, ..., 3.6741e-01, 3.7661e-01, -3.4028e+38], [ 2.6573e+00, -2.1113e+00, -1.0212e+00, ..., -4.4855e-01, -8.3410e-01, -2.2498e+00]], [[ 2.3315e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.8503e+00, 3.6000e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1284e+00, 3.0324e-01, -6.2687e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.6108e+00, 5.5104e-01, 1.2587e+00, ..., 1.0846e+00, -3.4028e+38, -3.4028e+38], [ 5.3505e+00, -5.4460e-02, 1.6678e+00, ..., 8.4944e-01, 2.5584e+00, -3.4028e+38], [ 3.3526e+00, -5.9194e-01, 4.5551e-02, ..., 2.4971e+00, 2.6994e+00, 1.4745e-01]]], [[[ 1.8881e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.2298e+00, -1.3076e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.8242e+00, -2.4116e+00, -3.1160e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.4476e+00, -3.7197e+00, -3.3517e+00, ..., 2.3371e-01, -3.4028e+38, -3.4028e+38], [ 3.6899e+00, -3.4981e+00, -3.6427e+00, ..., 2.9593e-01, 7.7326e-01, -3.4028e+38], [ 2.4215e+00, -2.9721e+00, -3.3145e+00, ..., 4.5769e-01, 2.3140e-02, -2.7213e+00]], [[ 2.1284e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.5454e+00, 1.0637e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.0354e+00, 5.9217e-02, 2.1205e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 5.0357e+00, -2.8943e+00, -3.3918e+00, ..., 4.4465e-01, -3.4028e+38, -3.4028e+38], [ 4.8038e+00, -1.8523e+00, -2.4606e+00, ..., 6.3463e-01, 1.5785e+00, -3.4028e+38], [ 2.9741e+00, -1.3757e+00, -1.8934e+00, ..., 3.3296e-02, -4.0932e-01, -1.0441e+00]], [[ 2.0295e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.5071e+00, 5.4534e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.8420e+00, -5.2520e-01, -1.5990e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.2170e+00, -8.7713e-01, -2.0740e+00, ..., -1.0717e-02, -3.4028e+38, -3.4028e+38], [ 3.6595e+00, -7.8555e-01, -2.3994e+00, ..., -5.5738e-01, 6.0999e-01, -3.4028e+38], [ 2.7088e+00, -5.4943e-01, -8.2674e-01, ..., -3.2392e-01, 2.1910e-01, -9.7538e-01]], ..., [[ 1.3065e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.5816e-01, -1.8347e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.0854e+00, -2.8548e+00, -3.5144e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 9.7506e-01, -2.0979e+00, -2.6546e+00, ..., -1.4572e+00, -3.4028e+38, -3.4028e+38], [ 1.3201e-01, -3.9611e+00, -3.5308e+00, ..., -4.9247e-02, -9.2960e-01, -3.4028e+38], [ 4.8744e-01, -2.4605e+00, -1.0405e+00, ..., -1.2589e+00, -1.1491e+00, -8.9671e-01]], [[ 9.9695e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.3862e+00, -6.7815e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.9141e+00, -1.4110e+00, -1.9299e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.6747e+00, -1.5715e+00, -2.1566e+00, ..., -1.0629e+00, -3.4028e+38, -3.4028e+38], [ 3.9921e+00, -1.4977e+00, -2.1482e+00, ..., 3.6741e-01, 3.7661e-01, -3.4028e+38], [ 2.6573e+00, -2.1113e+00, -1.0212e+00, ..., -4.4855e-01, -8.3410e-01, -2.2498e+00]], [[ 2.3315e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.8503e+00, 3.6000e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1284e+00, 3.0324e-01, -6.2687e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.6108e+00, 5.5104e-01, 1.2587e+00, ..., 1.0846e+00, -3.4028e+38, -3.4028e+38], [ 5.3505e+00, -5.4460e-02, 1.6678e+00, ..., 8.4944e-01, 2.5584e+00, -3.4028e+38], [ 3.3526e+00, -5.9194e-01, 4.5551e-02, ..., 2.4971e+00, 2.6994e+00, 1.4745e-01]]], [[[ 1.8881e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.2298e+00, -1.3076e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.8242e+00, -2.4116e+00, -3.1160e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.4476e+00, -3.7197e+00, -3.3517e+00, ..., 2.3371e-01, -3.4028e+38, -3.4028e+38], [ 3.6899e+00, -3.4981e+00, -3.6427e+00, ..., 2.9593e-01, 7.7326e-01, -3.4028e+38], [ 2.4215e+00, -2.9721e+00, -3.3145e+00, ..., 4.5769e-01, 2.3140e-02, -2.7213e+00]], [[ 2.1284e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.5454e+00, 1.0637e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.0354e+00, 5.9217e-02, 2.1205e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 5.0357e+00, -2.8943e+00, -3.3918e+00, ..., 4.4465e-01, -3.4028e+38, -3.4028e+38], [ 4.8038e+00, -1.8523e+00, -2.4606e+00, ..., 6.3463e-01, 1.5785e+00, -3.4028e+38], [ 2.9741e+00, -1.3757e+00, -1.8934e+00, ..., 3.3296e-02, -4.0932e-01, -1.0441e+00]], [[ 2.0295e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.5071e+00, 5.4534e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.8420e+00, -5.2520e-01, -1.5990e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.2170e+00, -8.7713e-01, -2.0740e+00, ..., -1.0717e-02, -3.4028e+38, -3.4028e+38], [ 3.6595e+00, -7.8555e-01, -2.3994e+00, ..., -5.5738e-01, 6.0999e-01, -3.4028e+38], [ 2.7088e+00, -5.4943e-01, -8.2674e-01, ..., -3.2392e-01, 2.1910e-01, -9.7538e-01]], ..., [[ 1.3065e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.5816e-01, -1.8347e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.0854e+00, -2.8548e+00, -3.5144e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 9.7506e-01, -2.0979e+00, -2.6546e+00, ..., -1.4572e+00, -3.4028e+38, -3.4028e+38], [ 1.3201e-01, -3.9611e+00, -3.5308e+00, ..., -4.9247e-02, -9.2960e-01, -3.4028e+38], [ 4.8744e-01, -2.4605e+00, -1.0405e+00, ..., -1.2589e+00, -1.1491e+00, -8.9671e-01]], [[ 9.9695e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.3862e+00, -6.7815e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.9141e+00, -1.4110e+00, -1.9299e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.6747e+00, -1.5715e+00, -2.1566e+00, ..., -1.0629e+00, -3.4028e+38, -3.4028e+38], [ 3.9921e+00, -1.4977e+00, -2.1482e+00, ..., 3.6741e-01, 3.7661e-01, -3.4028e+38], [ 2.6573e+00, -2.1113e+00, -1.0212e+00, ..., -4.4855e-01, -8.3410e-01, -2.2498e+00]], [[ 2.3315e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.8503e+00, 3.6000e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1284e+00, 3.0324e-01, -6.2687e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.6108e+00, 5.5104e-01, 1.2587e+00, ..., 1.0846e+00, -3.4028e+38, -3.4028e+38], [ 5.3505e+00, -5.4460e-02, 1.6678e+00, ..., 8.4944e-01, 2.5584e+00, -3.4028e+38], [ 3.3526e+00, -5.9194e-01, 4.5551e-02, ..., 2.4971e+00, 2.6994e+00, 1.4745e-01]]], [[[ 1.8881e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.2298e+00, -1.3076e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.8242e+00, -2.4116e+00, -3.1160e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.4476e+00, -3.7197e+00, -3.3517e+00, ..., 2.3372e-01, -3.4028e+38, -3.4028e+38], [ 3.6899e+00, -3.4981e+00, -3.6427e+00, ..., 2.9593e-01, 7.7326e-01, -3.4028e+38], [ 2.4215e+00, -2.9721e+00, -3.3145e+00, ..., 4.5769e-01, 2.3144e-02, -2.7213e+00]], [[ 2.1284e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.5454e+00, 1.0637e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.0354e+00, 5.9217e-02, 2.1205e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 5.0357e+00, -2.8943e+00, -3.3918e+00, ..., 4.4465e-01, -3.4028e+38, -3.4028e+38], [ 4.8038e+00, -1.8523e+00, -2.4606e+00, ..., 6.3463e-01, 1.5785e+00, -3.4028e+38], [ 2.9741e+00, -1.3757e+00, -1.8934e+00, ..., 3.3296e-02, -4.0932e-01, -1.0441e+00]], [[ 2.0295e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.5071e+00, 5.4534e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.8420e+00, -5.2520e-01, -1.5990e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.2170e+00, -8.7713e-01, -2.0740e+00, ..., -1.0718e-02, -3.4028e+38, -3.4028e+38], [ 3.6595e+00, -7.8555e-01, -2.3994e+00, ..., -5.5739e-01, 6.0999e-01, -3.4028e+38], [ 2.7088e+00, -5.4943e-01, -8.2674e-01, ..., -3.2393e-01, 2.1910e-01, -9.7538e-01]], ..., [[ 1.3065e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.5817e-01, -1.8347e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.0854e+00, -2.8548e+00, -3.5144e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 9.7506e-01, -2.0979e+00, -2.6546e+00, ..., -1.4572e+00, -3.4028e+38, -3.4028e+38], [ 1.3201e-01, -3.9611e+00, -3.5308e+00, ..., -4.9249e-02, -9.2960e-01, -3.4028e+38], [ 4.8744e-01, -2.4605e+00, -1.0406e+00, ..., -1.2589e+00, -1.1491e+00, -8.9671e-01]], [[ 9.9695e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.3862e+00, -6.7815e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.9141e+00, -1.4110e+00, -1.9299e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.6747e+00, -1.5715e+00, -2.1566e+00, ..., -1.0629e+00, -3.4028e+38, -3.4028e+38], [ 3.9921e+00, -1.4977e+00, -2.1482e+00, ..., 3.6741e-01, 3.7661e-01, -3.4028e+38], [ 2.6573e+00, -2.1113e+00, -1.0212e+00, ..., -4.4854e-01, -8.3410e-01, -2.2498e+00]], [[ 2.3315e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.8503e+00, 3.5999e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1284e+00, 3.0323e-01, -6.2687e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.6108e+00, 5.5103e-01, 1.2587e+00, ..., 1.0846e+00, -3.4028e+38, -3.4028e+38], [ 5.3505e+00, -5.4460e-02, 1.6678e+00, ..., 8.4944e-01, 2.5584e+00, -3.4028e+38], [ 3.3526e+00, -5.9194e-01, 4.5552e-02, ..., 2.4971e+00, 2.6994e+00, 1.4745e-01]]]]) attn_weights tensor([[[[ 9.3403e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.8162e+00, 1.5035e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.7618e+00, 1.4776e+00, 8.1584e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.3868e+00, -3.4901e-01, -3.9808e-01, ..., 2.8684e-01, -3.4028e+38, -3.4028e+38], [ 2.1974e+00, -1.6077e-01, -8.2324e-01, ..., 7.2925e-01, 2.4942e-01, -3.4028e+38], [ 1.4640e+00, 7.9651e-01, 7.0362e-01, ..., 4.4562e-01, 7.5156e-01, 5.4296e-01]], [[ 2.5191e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.0207e+00, 2.1622e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1977e+00, -2.2375e-01, -7.4322e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.0347e+00, 2.4517e-01, -3.9776e-01, ..., -1.1429e+00, -3.4028e+38, -3.4028e+38], [ 4.5153e+00, 2.7451e-01, -5.1057e-01, ..., -1.2249e-01, 1.2522e+00, -3.4028e+38], [ 3.0509e+00, 5.5994e-01, -2.1430e-01, ..., 9.6363e-02, 1.5116e-01, 2.5033e-01]], [[ 4.3664e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.1365e+00, 3.6792e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.0077e+00, -4.5816e-01, -1.6199e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.6984e+00, -7.1395e-01, -1.9006e+00, ..., -4.9143e-02, -3.4028e+38, -3.4028e+38], [ 3.5790e+00, -4.9234e-01, -1.6544e+00, ..., 6.5879e-01, 9.1659e-01, -3.4028e+38], [ 2.5168e+00, -3.3554e-01, -1.4784e+00, ..., 2.4055e-01, -3.3571e-01, -6.5984e-01]], ..., [[ 9.6859e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.6863e+00, 5.6616e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.8816e+00, 6.1601e-01, 1.3178e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.7246e+00, -2.0344e+00, -3.3243e+00, ..., 4.3718e-04, -3.4028e+38, -3.4028e+38], [ 4.9006e+00, -1.4718e+00, -1.8556e+00, ..., 2.4667e-01, 1.7712e+00, -3.4028e+38], [ 3.4096e+00, -7.4837e-01, -1.5285e+00, ..., 2.5732e-01, 5.4028e-01, -6.1303e-01]], [[ 1.4775e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.7727e+00, 1.3764e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1652e+00, 1.3400e+00, 2.2661e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.5977e+00, -5.2545e-01, -1.6165e+00, ..., 1.5376e+00, -3.4028e+38, -3.4028e+38], [ 2.6520e+00, -9.3807e-01, -1.6327e+00, ..., 1.9087e+00, 1.8026e+00, -3.4028e+38], [ 2.5376e+00, 6.5691e-01, 1.1826e-01, ..., 1.2616e+00, 8.5567e-01, 1.0550e+00]], [[ 5.9822e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.3106e+00, -1.7496e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.3510e+00, 1.9541e-01, 1.5621e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.5344e+00, -7.4712e-02, -5.8267e-01, ..., 1.4142e+00, -3.4028e+38, -3.4028e+38], [ 3.4322e+00, -2.0629e-01, -8.1913e-01, ..., 1.4649e+00, 3.3822e-01, -3.4028e+38], [ 2.0776e+00, 6.7556e-03, -1.1207e+00, ..., 1.3069e+00, 1.1824e+00, 4.8304e-01]]], [[[ 9.3403e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.8162e+00, 1.5035e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.7618e+00, 1.4776e+00, 8.1584e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.3868e+00, -3.4901e-01, -3.9808e-01, ..., 2.8684e-01, -3.4028e+38, -3.4028e+38], [ 2.1974e+00, -1.6077e-01, -8.2324e-01, ..., 7.2925e-01, 2.4942e-01, -3.4028e+38], [ 1.4640e+00, 7.9651e-01, 7.0362e-01, ..., 4.4562e-01, 7.5156e-01, 5.4296e-01]], [[ 2.5191e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.0207e+00, 2.1622e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1977e+00, -2.2375e-01, -7.4322e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.0347e+00, 2.4517e-01, -3.9776e-01, ..., -1.1429e+00, -3.4028e+38, -3.4028e+38], [ 4.5153e+00, 2.7451e-01, -5.1057e-01, ..., -1.2249e-01, 1.2522e+00, -3.4028e+38], [ 3.0509e+00, 5.5994e-01, -2.1430e-01, ..., 9.6363e-02, 1.5116e-01, 2.5033e-01]], [[ 4.3664e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.1365e+00, 3.6792e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.0077e+00, -4.5816e-01, -1.6199e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.6984e+00, -7.1395e-01, -1.9006e+00, ..., -4.9143e-02, -3.4028e+38, -3.4028e+38], [ 3.5790e+00, -4.9234e-01, -1.6544e+00, ..., 6.5879e-01, 9.1659e-01, -3.4028e+38], [ 2.5168e+00, -3.3554e-01, -1.4784e+00, ..., 2.4055e-01, -3.3571e-01, -6.5984e-01]], ..., [[ 9.6859e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.6863e+00, 5.6616e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.8816e+00, 6.1601e-01, 1.3178e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.7246e+00, -2.0344e+00, -3.3243e+00, ..., 4.3718e-04, -3.4028e+38, -3.4028e+38], [ 4.9006e+00, -1.4718e+00, -1.8556e+00, ..., 2.4667e-01, 1.7712e+00, -3.4028e+38], [ 3.4096e+00, -7.4837e-01, -1.5285e+00, ..., 2.5732e-01, 5.4028e-01, -6.1303e-01]], [[ 1.4775e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.7727e+00, 1.3764e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1652e+00, 1.3400e+00, 2.2661e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.5977e+00, -5.2545e-01, -1.6165e+00, ..., 1.5376e+00, -3.4028e+38, -3.4028e+38], [ 2.6520e+00, -9.3807e-01, -1.6327e+00, ..., 1.9087e+00, 1.8026e+00, -3.4028e+38], [ 2.5376e+00, 6.5691e-01, 1.1826e-01, ..., 1.2616e+00, 8.5567e-01, 1.0550e+00]], [[ 5.9822e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.3106e+00, -1.7496e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.3510e+00, 1.9541e-01, 1.5621e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.5344e+00, -7.4712e-02, -5.8267e-01, ..., 1.4142e+00, -3.4028e+38, -3.4028e+38], [ 3.4322e+00, -2.0629e-01, -8.1913e-01, ..., 1.4649e+00, 3.3822e-01, -3.4028e+38], [ 2.0776e+00, 6.7556e-03, -1.1207e+00, ..., 1.3069e+00, 1.1824e+00, 4.8304e-01]]], [[[ 9.3403e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.8162e+00, 1.5035e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.7618e+00, 1.4776e+00, 8.1584e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.3868e+00, -3.4901e-01, -3.9808e-01, ..., 2.8684e-01, -3.4028e+38, -3.4028e+38], [ 2.1974e+00, -1.6077e-01, -8.2324e-01, ..., 7.2925e-01, 2.4942e-01, -3.4028e+38], [ 1.4640e+00, 7.9651e-01, 7.0362e-01, ..., 4.4562e-01, 7.5156e-01, 5.4296e-01]], [[ 2.5191e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.0207e+00, 2.1622e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1977e+00, -2.2375e-01, -7.4322e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.0347e+00, 2.4517e-01, -3.9776e-01, ..., -1.1429e+00, -3.4028e+38, -3.4028e+38], [ 4.5153e+00, 2.7451e-01, -5.1057e-01, ..., -1.2249e-01, 1.2522e+00, -3.4028e+38], [ 3.0509e+00, 5.5994e-01, -2.1430e-01, ..., 9.6363e-02, 1.5116e-01, 2.5033e-01]], [[ 4.3664e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.1365e+00, 3.6792e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.0077e+00, -4.5816e-01, -1.6199e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.6984e+00, -7.1395e-01, -1.9006e+00, ..., -4.9143e-02, -3.4028e+38, -3.4028e+38], [ 3.5790e+00, -4.9234e-01, -1.6544e+00, ..., 6.5879e-01, 9.1659e-01, -3.4028e+38], [ 2.5168e+00, -3.3554e-01, -1.4784e+00, ..., 2.4055e-01, -3.3571e-01, -6.5984e-01]], ..., [[ 9.6859e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.6863e+00, 5.6616e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.8816e+00, 6.1601e-01, 1.3178e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.7246e+00, -2.0344e+00, -3.3243e+00, ..., 4.3718e-04, -3.4028e+38, -3.4028e+38], [ 4.9006e+00, -1.4718e+00, -1.8556e+00, ..., 2.4667e-01, 1.7712e+00, -3.4028e+38], [ 3.4096e+00, -7.4837e-01, -1.5285e+00, ..., 2.5732e-01, 5.4028e-01, -6.1303e-01]], [[ 1.4775e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.7727e+00, 1.3764e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1652e+00, 1.3400e+00, 2.2661e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.5977e+00, -5.2545e-01, -1.6165e+00, ..., 1.5376e+00, -3.4028e+38, -3.4028e+38], [ 2.6520e+00, -9.3807e-01, -1.6327e+00, ..., 1.9087e+00, 1.8026e+00, -3.4028e+38], [ 2.5376e+00, 6.5691e-01, 1.1826e-01, ..., 1.2616e+00, 8.5567e-01, 1.0550e+00]], [[ 5.9822e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.3106e+00, -1.7496e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.3510e+00, 1.9541e-01, 1.5621e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.5344e+00, -7.4712e-02, -5.8267e-01, ..., 1.4142e+00, -3.4028e+38, -3.4028e+38], [ 3.4322e+00, -2.0629e-01, -8.1913e-01, ..., 1.4649e+00, 3.3822e-01, -3.4028e+38], [ 2.0776e+00, 6.7556e-03, -1.1207e+00, ..., 1.3069e+00, 1.1824e+00, 4.8304e-01]]], [[[ 9.3403e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.8162e+00, 1.5035e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.7618e+00, 1.4776e+00, 8.1584e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.3868e+00, -3.4901e-01, -3.9808e-01, ..., 2.8684e-01, -3.4028e+38, -3.4028e+38], [ 2.1974e+00, -1.6077e-01, -8.2324e-01, ..., 7.2925e-01, 2.4942e-01, -3.4028e+38], [ 1.4640e+00, 7.9651e-01, 7.0362e-01, ..., 4.4562e-01, 7.5156e-01, 5.4296e-01]], [[ 2.5191e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.0207e+00, 2.1622e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1977e+00, -2.2375e-01, -7.4322e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.0347e+00, 2.4517e-01, -3.9776e-01, ..., -1.1429e+00, -3.4028e+38, -3.4028e+38], [ 4.5153e+00, 2.7451e-01, -5.1057e-01, ..., -1.2249e-01, 1.2522e+00, -3.4028e+38], [ 3.0509e+00, 5.5994e-01, -2.1430e-01, ..., 9.6363e-02, 1.5116e-01, 2.5033e-01]], [[ 4.3664e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.1365e+00, 3.6792e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.0077e+00, -4.5816e-01, -1.6199e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.6984e+00, -7.1395e-01, -1.9006e+00, ..., -4.9143e-02, -3.4028e+38, -3.4028e+38], [ 3.5790e+00, -4.9234e-01, -1.6544e+00, ..., 6.5879e-01, 9.1659e-01, -3.4028e+38], [ 2.5168e+00, -3.3554e-01, -1.4784e+00, ..., 2.4055e-01, -3.3571e-01, -6.5984e-01]], ..., [[ 9.6859e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.6863e+00, 5.6616e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.8816e+00, 6.1601e-01, 1.3178e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.7246e+00, -2.0344e+00, -3.3243e+00, ..., 4.3718e-04, -3.4028e+38, -3.4028e+38], [ 4.9006e+00, -1.4718e+00, -1.8556e+00, ..., 2.4667e-01, 1.7712e+00, -3.4028e+38], [ 3.4096e+00, -7.4837e-01, -1.5285e+00, ..., 2.5732e-01, 5.4028e-01, -6.1303e-01]], [[ 1.4775e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.7727e+00, 1.3764e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1652e+00, 1.3400e+00, 2.2661e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.5977e+00, -5.2545e-01, -1.6165e+00, ..., 1.5376e+00, -3.4028e+38, -3.4028e+38], [ 2.6520e+00, -9.3807e-01, -1.6327e+00, ..., 1.9087e+00, 1.8026e+00, -3.4028e+38], [ 2.5376e+00, 6.5691e-01, 1.1826e-01, ..., 1.2616e+00, 8.5567e-01, 1.0550e+00]], [[ 5.9822e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.3106e+00, -1.7496e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.3510e+00, 1.9541e-01, 1.5621e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.5344e+00, -7.4712e-02, -5.8267e-01, ..., 1.4142e+00, -3.4028e+38, -3.4028e+38], [ 3.4322e+00, -2.0629e-01, -8.1913e-01, ..., 1.4649e+00, 3.3822e-01, -3.4028e+38], [ 2.0776e+00, 6.7556e-03, -1.1207e+00, ..., 1.3069e+00, 1.1824e+00, 4.8304e-01]]], [[[ 9.3403e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.8162e+00, 1.5035e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 1.7618e+00, 1.4776e+00, 8.1584e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.3868e+00, -3.4901e-01, -3.9808e-01, ..., 2.8684e-01, -3.4028e+38, -3.4028e+38], [ 2.1974e+00, -1.6077e-01, -8.2324e-01, ..., 7.2925e-01, 2.4942e-01, -3.4028e+38], [ 1.4640e+00, 7.9651e-01, 7.0362e-01, ..., 4.4562e-01, 7.5156e-01, 5.4296e-01]], [[ 2.5191e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.0207e+00, 2.1622e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1977e+00, -2.2375e-01, -7.4322e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.0347e+00, 2.4517e-01, -3.9776e-01, ..., -1.1429e+00, -3.4028e+38, -3.4028e+38], [ 4.5153e+00, 2.7451e-01, -5.1057e-01, ..., -1.2249e-01, 1.2522e+00, -3.4028e+38], [ 3.0509e+00, 5.5994e-01, -2.1430e-01, ..., 9.6363e-02, 1.5116e-01, 2.5034e-01]], [[ 4.3664e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.1365e+00, 3.6792e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.0077e+00, -4.5816e-01, -1.6199e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.6984e+00, -7.1395e-01, -1.9006e+00, ..., -4.9144e-02, -3.4028e+38, -3.4028e+38], [ 3.5790e+00, -4.9234e-01, -1.6544e+00, ..., 6.5879e-01, 9.1659e-01, -3.4028e+38], [ 2.5168e+00, -3.3554e-01, -1.4784e+00, ..., 2.4055e-01, -3.3571e-01, -6.5984e-01]], ..., [[ 9.6859e-01, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.6863e+00, 5.6616e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.8816e+00, 6.1601e-01, 1.3179e-01, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 4.7246e+00, -2.0344e+00, -3.3243e+00, ..., 4.3841e-04, -3.4028e+38, -3.4028e+38], [ 4.9006e+00, -1.4718e+00, -1.8556e+00, ..., 2.4667e-01, 1.7712e+00, -3.4028e+38], [ 3.4096e+00, -7.4837e-01, -1.5285e+00, ..., 2.5732e-01, 5.4028e-01, -6.1303e-01]], [[ 1.4775e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.7727e+00, 1.3764e+00, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 4.1652e+00, 1.3400e+00, 2.2661e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 2.5977e+00, -5.2545e-01, -1.6165e+00, ..., 1.5376e+00, -3.4028e+38, -3.4028e+38], [ 2.6520e+00, -9.3807e-01, -1.6327e+00, ..., 1.9087e+00, 1.8026e+00, -3.4028e+38], [ 2.5376e+00, 6.5692e-01, 1.1826e-01, ..., 1.2616e+00, 8.5567e-01, 1.0550e+00]], [[ 5.9822e+00, -3.4028e+38, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 2.3106e+00, -1.7496e-01, -3.4028e+38, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], [ 3.3510e+00, 1.9541e-01, 1.5621e+00, ..., -3.4028e+38, -3.4028e+38, -3.4028e+38], ..., [ 3.5344e+00, -7.4712e-02, -5.8266e-01, ..., 1.4142e+00, -3.4028e+38, -3.4028e+38], [ 3.4322e+00, -2.0630e-01, -8.1913e-01, ..., 1.4649e+00, 3.3822e-01, -3.4028e+38], [ 2.0776e+00, 6.7569e-03, -1.1207e+00, ..., 1.3069e+00, 1.1824e+00, 4.8304e-01]]]]) attn_weights tensor([[[[-0.0798, -2.1474, -1.5407, -1.5691, -2.9588, -1.8992, -1.6757, -2.3966, -1.5106]], [[ 2.6039, 2.3946, 7.2129, 1.0428, 0.7915, 0.4085, -2.0849, 1.5277, 6.9595]], [[-1.0434, -1.6345, -1.6926, -1.2905, -2.4269, -2.1491, -2.6025, -1.9524, -1.9215]], [[-2.6518, -4.6685, -1.6706, -0.8495, -2.8074, -2.8491, -2.1379, -0.5764, 3.2903]], [[-0.0539, -2.2498, -1.8439, -0.2455, -1.7541, -1.3389, -0.8291, -0.7274, 0.0851]], [[ 6.4396, 4.2452, 10.1010, 4.6820, 1.8988, 2.8373, -0.2217, 2.3963, 9.3917]], [[ 0.2892, -3.3889, -3.0983, -1.1834, -3.2794, -0.5845, -0.6989, -3.9417, -3.2199]], [[-4.6883, -5.7521, -6.1726, -5.1989, -4.8819, -5.5271, -4.2133, -3.5242, -3.5253]], [[-2.8595, -1.6545, -2.6239, -3.1154, -1.2141, -3.0024, -3.0473, -1.1753, -2.3429]], [[-1.3124, -1.5544, -1.8940, -2.3286, -1.8695, -2.3505, -2.4226, -1.7268, -2.0146]], [[ 2.1596, 1.5996, 2.8789, 1.4594, 1.0875, 0.3397, 0.0379, 0.9302, 2.4431]], [[-1.7957, -2.3958, -3.8272, -2.6368, -2.7319, -2.5468, -2.1996, -2.1609, -3.7873]]], [[[-0.9845, -3.2803, -1.6961, -1.8158, -2.9628, -2.1719, -2.5522, -3.3868, -3.3294]], [[-1.7068, 2.3602, -0.2458, -3.0730, -1.3521, -3.6299, -0.6442, 1.7784, 5.8404]], [[-1.9238, -2.1375, -2.9957, -2.9591, -3.4084, -3.2124, -3.2406, -2.3162, -0.5724]], [[-2.5726, -2.5392, -4.3275, -4.4061, -2.6839, -3.6602, -2.6177, 0.8507, 0.7913]], [[-1.0457, -1.8328, -1.4138, -0.6329, -0.7770, -0.6840, 0.1486, -0.1417, 0.5663]], [[ 1.5802, 2.8632, 1.5566, 0.0501, 3.2875, 0.3651, 0.7443, 1.9400, 3.9360]], [[-0.3494, -3.9777, -3.3119, -1.6683, -3.8833, -1.3316, -1.0931, -4.3411, -4.0269]], [[-5.2380, -6.1702, -5.4598, -5.6298, -5.1617, -4.5828, -4.5746, -3.8300, -3.4598]], [[-3.4877, -1.4497, -2.6723, -3.5059, -0.9521, -3.5928, -3.8673, -0.6566, -0.9291]], [[-1.2442, -1.4845, -1.5884, -2.2013, -1.7155, -2.4086, -2.4843, -1.6582, -1.5202]], [[ 1.0672, 1.2002, 1.0209, 0.2786, 0.8994, -0.1584, -0.0716, 0.7684, 0.8933]], [[-1.8198, -2.2605, -3.8847, -2.6789, -2.8852, -2.5311, -2.2192, -2.0157, -1.9576]]], [[[-0.9235, -2.4637, -0.9331, -1.2395, -2.2748, -2.1184, -2.2933, -2.4999, -2.1335]], [[ 1.9277, 2.1089, 3.7756, 0.8738, 1.5047, 0.3788, -0.7318, 0.9827, 8.1551]], [[-1.4468, -1.9047, -1.8864, -1.6449, -2.7361, -2.9876, -2.7908, -2.2349, -2.3692]], [[-1.7352, -3.8234, -2.2647, -2.3437, -2.2819, -3.8051, -1.6782, -0.3832, 3.2432]], [[ 0.4260, -1.4144, -0.8869, 0.5136, 0.0644, 0.5470, 0.6118, 0.1666, 2.1204]], [[ 5.3131, 3.2686, 3.9519, 0.7112, 2.4524, 2.9691, -0.1816, 1.2209, 8.7830]], [[ 0.4160, -2.5208, -2.2530, -0.6992, -2.2930, -0.3884, -0.2683, -2.7914, -1.9054]], [[-4.8318, -5.7982, -5.3948, -5.8307, -4.9958, -5.3301, -4.9810, -3.6281, -4.1576]], [[-2.2559, -1.0489, -1.5622, -2.4777, -0.7255, -2.8111, -3.4033, -0.5477, -1.7368]], [[-1.3870, -1.7591, -1.8605, -2.4153, -1.9276, -2.4692, -2.6824, -1.9151, -1.9928]], [[ 1.2629, 0.7603, 1.0595, 0.2564, 0.4346, -0.2890, -0.5002, 0.2572, 1.4384]], [[-1.2017, -2.1416, -3.6385, -2.1759, -3.0905, -2.4398, -2.2869, -2.0386, -1.7573]]], [[[-0.7487, -2.8765, -1.7882, -1.7501, -3.2866, -2.1736, -2.0146, -3.0334, -3.1944]], [[-0.6458, 0.0670, -0.3608, -2.6292, 5.8080, -3.1639, -3.3633, -1.0466, 5.7086]], [[-1.8932, -2.0249, -2.6022, -2.5460, -3.3139, -3.1323, -2.8666, -2.1769, -3.3667]], [[-2.5386, -3.7706, -4.1929, -3.7776, -1.7819, -3.3706, -2.0495, -0.4137, 1.0763]], [[-0.7344, -2.2668, -2.3658, -0.8635, -1.0912, -0.7980, -0.3318, -0.7645, 0.3158]], [[ 1.6379, 3.4558, 2.6782, 1.7160, 5.3328, 0.7371, 0.7813, 2.4272, 5.0206]], [[-0.4329, -4.2077, -3.1755, -1.3752, -4.2025, -1.0380, -1.0600, -4.6688, -4.1188]], [[-5.6770, -6.5120, -6.1128, -5.8756, -5.8265, -5.2067, -5.0879, -4.0886, -4.0279]], [[-3.3978, -1.7586, -2.9122, -3.2783, -0.6224, -3.5000, -2.9795, -0.9033, -0.2424]], [[-1.3104, -1.4389, -1.5693, -2.2230, -1.6347, -2.3239, -2.3408, -1.5983, -1.6234]], [[ 1.2546, 1.1839, 0.9788, 0.1698, 1.6633, -0.4271, -0.1957, 0.6874, 1.4596]], [[-1.5784, -2.2760, -3.6780, -2.5658, -2.5407, -2.4508, -2.0948, -2.1256, -2.4641]]], [[[-0.9089, -2.6152, -1.0567, -1.1952, -2.1079, -2.0326, -1.9905, -2.6810, -2.2111]], [[-0.1807, 1.8628, 2.4014, 0.7449, 3.6651, -1.9493, -1.4352, 0.6084, 8.2212]], [[-1.5268, -2.0036, -2.2240, -1.9799, -2.8265, -2.1780, -2.9658, -2.2748, -2.7778]], [[-3.9704, -6.0184, -6.3757, -3.6408, -3.8943, -5.5445, -3.7222, -1.8008, 2.5719]], [[-0.0125, -1.6894, -1.3991, 0.3541, -0.5212, -0.6082, 0.4462, -0.0491, 1.8142]], [[ 3.9613, 3.5298, 2.8912, 0.9590, 2.9914, 2.4504, 0.0756, 1.4641, 9.2752]], [[-0.0877, -2.8921, -2.4292, -0.6778, -2.8010, -0.2901, -0.5838, -3.0913, -1.3465]], [[-5.0285, -5.9961, -5.6946, -5.7435, -5.0344, -4.7105, -5.2426, -3.5825, -3.9192]], [[-3.3186, -1.9512, -2.6627, -3.1220, -1.6836, -3.0795, -3.3089, -1.2196, -2.6289]], [[-1.3914, -1.7197, -1.7862, -2.3665, -1.8785, -2.3754, -2.7023, -1.8758, -2.1289]], [[ 0.9908, 0.9741, 1.0427, 0.1292, 0.8925, -0.4218, -0.6076, 0.5622, 1.6939]], [[-1.2978, -2.1920, -3.6429, -2.2983, -2.7662, -2.5662, -2.2536, -2.0776, -2.2897]]]]) attn_weights tensor([[[[-0.0772, -1.8960, -1.9366, -0.8638, -0.6478, -1.0308, -0.2090, 0.0142, 0.1019]], [[-0.7678, -1.4176, -2.5195, -1.6528, -1.6140, -1.7906, -1.2552, 0.3902, -0.7590]], [[-2.5842, -3.8197, -3.1798, -3.6114, -2.8814, -3.3711, -2.8861, -2.0937, -2.2958]], [[-0.0610, -2.5560, -2.3520, -2.3687, -2.2971, -2.1529, -1.9670, -1.8486, -1.8147]], [[-0.4090, -2.4281, -2.4691, -2.4380, -2.3203, -1.9705, -1.8728, -1.8988, -1.9256]], [[-0.0967, -0.3370, -0.6386, -1.6321, -1.7316, -4.2667, -3.9272, -0.4400, -0.7362]], [[ 0.5067, -1.6331, -2.2765, -1.9740, -1.6467, -1.9932, -2.2904, -1.8251, -2.6558]], [[-0.4575, -2.1280, -2.9211, -2.3356, -2.4164, -1.9030, -1.6968, -1.8555, -2.9105]], [[-0.4197, -1.4261, -2.6499, -2.3645, -1.7430, -2.3511, -2.5827, -1.4910, -2.5081]], [[ 1.1663, -0.5993, -0.5290, -0.7581, 0.0150, -1.6587, -1.5491, -0.8249, -0.4253]], [[-5.6297, -1.9983, -1.8776, -1.9058, -1.8698, -1.4833, -1.3162, -1.4053, -1.2618]], [[-2.5537, -2.0772, -0.1471, -4.2197, -3.7901, -6.1865, -4.8687, -1.6565, 0.2255]]], [[[-0.8034, -2.4987, -1.2443, -0.9047, -0.6847, -0.6600, -0.8132, -0.6421, -0.0690]], [[-0.2808, -1.3229, -1.8183, -1.3337, -1.3033, -1.8405, -1.3285, 0.4073, -0.3308]], [[-2.3917, -3.6936, -3.0435, -3.4652, -2.8037, -3.1806, -2.7510, -1.9955, -2.0716]], [[ 0.0442, -2.4704, -2.2917, -2.3059, -2.2623, -2.0510, -1.8688, -1.7905, -1.7631]], [[-0.4641, -2.5378, -2.4985, -2.4740, -2.4719, -1.9154, -1.8602, -1.9712, -1.8954]], [[ 1.1259, 0.5968, -1.5090, -1.5847, -0.8383, -2.5409, -2.4245, 0.7929, 1.0195]], [[ 0.8414, -1.0111, -1.0849, -0.7362, -0.4036, -1.6140, -1.8332, -1.0098, -1.5533]], [[ 0.2862, -1.8183, -1.8094, -1.0456, -1.7520, -1.7295, -1.2743, -1.2553, -1.2981]], [[-0.0652, -1.1046, -1.6693, -1.8696, -1.3732, -1.8557, -2.0764, -1.1097, -1.3705]], [[ 1.4916, -0.6627, -0.1659, -0.6510, 0.0619, -1.1102, -1.1143, -1.0014, -0.5972]], [[-5.7045, -1.8777, -1.7911, -1.8182, -1.8187, -1.3783, -1.2083, -1.3177, -1.2656]], [[ 1.1872, 0.4989, -1.0690, -0.7680, -0.9851, -2.4312, -3.3971, 0.4566, 2.1492]]], [[[-0.5638, -2.6416, -0.7927, -0.5365, -0.7707, -1.8527, -1.7276, -0.5118, -0.6131]], [[-1.0793, -1.7621, -2.0061, -1.8154, -1.7270, -1.5995, -1.3641, 0.2728, -1.0675]], [[-2.5185, -3.7486, -3.1174, -3.5921, -2.8523, -3.2581, -2.8571, -2.0601, -2.5197]], [[-0.0307, -2.5316, -2.3297, -2.3749, -2.2646, -2.0448, -1.8778, -1.7827, -1.8624]], [[-0.4522, -2.5911, -2.5755, -2.6150, -2.5226, -2.0004, -1.9612, -2.0025, -2.0167]], [[ 0.9436, 0.7610, -0.9606, -0.3164, -0.5125, -2.6611, -2.4397, 0.8109, 0.6581]], [[ 1.3020, -0.7699, -0.8758, -0.7667, -0.2966, -1.7255, -1.6912, -1.1513, -1.9267]], [[ 0.4478, -1.7696, -1.9452, -1.1429, -1.9939, -2.1334, -1.4380, -1.3327, -1.4394]], [[-0.2907, -1.4795, -2.2960, -2.3104, -1.6839, -2.2157, -2.3777, -1.4594, -1.6701]], [[ 1.4588, -0.3633, 0.1145, -0.7919, 0.2625, -1.3009, -1.1379, -0.6552, -0.3530]], [[-5.7732, -1.9752, -1.8550, -1.9364, -1.8303, -1.4186, -1.2378, -1.3813, -1.3062]], [[ 1.3993, 0.7709, -1.9989, -2.9697, -1.5994, -1.3983, -2.4161, 0.9330, 3.4033]]], [[[-0.9855, -2.5436, -1.6444, -1.2763, -2.0599, -1.7731, -1.2059, -0.6472, -0.5021]], [[-0.5722, -1.5736, -1.8632, -1.3769, -2.1331, -1.8396, -1.0705, 0.5036, -0.6718]], [[-2.4254, -3.6621, -3.0700, -3.4747, -2.6735, -3.1531, -2.7159, -1.9625, -2.1967]], [[ 0.0228, -2.4677, -2.2931, -2.3230, -2.1668, -2.0388, -1.8670, -1.7649, -1.8426]], [[-0.4420, -2.4936, -2.5558, -2.4862, -2.3191, -1.8945, -1.8001, -1.8704, -1.9098]], [[ 0.1498, 0.0253, -1.6417, -0.7784, -1.2133, -2.1082, -1.9730, 0.1324, -1.2794]], [[ 0.9093, -1.1081, -1.3032, -1.3269, -1.1796, -1.2929, -1.1275, -1.1614, -1.3131]], [[-0.0114, -1.9413, -2.0253, -1.7102, -2.0233, -1.7464, -1.5774, -1.4428, -1.8576]], [[-0.2288, -1.1106, -1.9656, -2.0616, -1.4825, -2.0817, -2.2102, -1.2232, -1.4388]], [[ 1.3498, -0.5944, -0.1739, -0.7017, 0.0723, -1.1834, -1.2041, -0.8457, 0.1493]], [[-5.7640, -1.9584, -1.8509, -1.8684, -1.7689, -1.4026, -1.2512, -1.3623, -1.3754]], [[-1.6495, -2.0153, -4.0248, -4.4429, 0.8202, -5.3397, -5.8397, -1.6055, 1.0492]]], [[[-0.3989, -2.1827, -0.6050, -0.0123, -0.8163, -1.6438, -1.4922, -0.0378, -0.1441]], [[-0.0399, -1.1746, -1.5115, -1.4040, -1.0268, -1.6319, -0.9589, 0.8043, -0.7634]], [[-2.4922, -3.7171, -3.1559, -3.5980, -2.8242, -3.2885, -2.8284, -1.9868, -2.6657]], [[-0.0412, -2.4538, -2.3244, -2.3684, -2.2543, -2.0066, -1.8791, -1.7525, -1.9548]], [[-0.3879, -2.3843, -2.4662, -2.4412, -2.3056, -1.9022, -1.7893, -1.7485, -1.9431]], [[ 0.9471, 0.4035, -1.0588, -0.7028, -0.4724, -2.3488, -2.9581, 0.3435, 0.4198]], [[ 1.7535, -0.3674, -0.7407, -0.2994, 0.0792, -0.5609, -0.6613, -0.7638, -0.1864]], [[ 0.2397, -1.7631, -2.0260, -1.2188, -1.8467, -1.4245, -1.0613, -1.3089, -1.2424]], [[-0.5714, -1.5686, -2.2506, -2.3405, -1.6842, -2.2301, -2.4647, -1.5995, -1.7230]], [[ 1.3632, -0.6080, -0.1011, -1.0041, 0.0130, -1.2997, -1.2270, -0.8214, -0.2235]], [[-5.8714, -2.0366, -1.9517, -1.9989, -1.8911, -1.4939, -1.3016, -1.4221, -1.5000]], [[ 0.8635, 0.2775, -2.6386, -1.5585, -2.7891, -2.7389, -4.8506, 0.5611, 3.1056]]]]) attn_weights tensor([[[[ -1.6968, -4.3665, -3.5790, -2.9085, -3.0930, -3.5633, -3.5622, -2.8674, -1.7888]], [[ 1.5058, -0.7862, -2.2796, -0.8063, -2.4486, -1.0932, -2.1188, -1.2693, -3.3712]], [[ -7.3032, -10.9628, -13.9395, -9.3861, -8.1439, -7.9178, -5.2798, -3.9846, -6.2656]], [[ -3.2671, -6.4556, -6.4841, -5.4689, -3.2199, -4.6533, -4.4167, -3.1490, -3.1344]], [[ -2.2765, -4.7716, -7.1417, -4.3727, -3.8664, -4.6989, -3.9923, -1.6853, -3.7704]], [[ -4.7520, -6.9816, -8.8924, -6.6148, -5.9127, -6.6370, -5.6892, -2.4773, -4.4756]], [[ -1.4946, -4.1813, -4.7217, -3.5000, -4.1630, -4.0792, -4.1936, -2.6876, -3.2374]], [[ -1.4849, -4.2228, -2.4652, -2.0911, -2.1386, -1.3537, -1.4222, -1.0892, -0.4392]], [[ -3.3181, -5.5337, -7.5965, -2.9998, -4.1904, -4.3435, -3.9355, -2.9427, -4.2052]], [[ -4.7980, -8.5199, -9.2804, -7.5468, -6.1519, -4.2145, -3.5511, -4.0949, -4.9718]], [[ -1.8167, -3.6230, -3.3337, -2.9567, -3.2389, -2.5253, -2.4473, -2.5655, -2.2079]], [[ -0.8617, -4.6970, -4.4391, -4.1304, -4.0535, -3.5213, -3.2656, -3.2421, -2.9958]]], [[[ -1.5958, -3.9044, -2.4654, -3.1626, -3.0487, -3.6161, -3.5281, -2.3730, -1.8306]], [[ 1.6022, -0.9078, -1.9269, -1.1507, -2.6887, -1.8723, -2.5966, -1.2126, -1.4644]], [[ -7.7746, -11.5559, -10.1042, -10.2055, -8.5752, -8.3941, -6.2910, -4.2890, -6.6051]], [[ -3.4698, -6.1968, -3.8586, -4.4903, -2.4037, -4.9861, -3.9973, -3.2120, -3.0860]], [[ -2.0532, -4.9413, -5.2790, -4.4566, -3.9891, -6.7435, -7.7324, -2.0917, -3.5048]], [[ -4.2937, -6.3480, -6.2852, -5.5744, -5.1182, -5.6549, -4.7073, -1.9493, -4.2097]], [[ -1.2736, -4.1434, -3.7951, -3.3792, -3.8251, -4.0621, -4.0661, -2.8851, -2.1633]], [[ -1.4541, -4.3810, -2.5201, -2.1685, -2.2306, -1.2259, -1.3590, -1.1136, -1.1800]], [[ -3.5011, -5.7736, -6.0545, -2.4610, -3.9458, -5.1825, -4.0941, -3.0762, -3.6691]], [[ -5.1031, -8.1362, -6.2161, -6.5284, -5.9591, -3.9166, -3.3874, -4.1921, -5.1861]], [[ -1.4507, -3.5349, -3.1436, -2.8967, -3.2354, -2.2156, -2.1653, -2.4531, -2.5324]], [[ -0.8130, -4.7776, -4.4105, -4.1885, -4.2370, -3.4634, -3.2194, -3.2601, -3.5073]]], [[[ -1.7109, -4.3818, -2.5007, -3.6324, -3.1737, -3.1768, -3.8592, -2.7922, -1.8916]], [[ 1.4870, 0.0711, -2.2140, -1.1632, -2.7318, -1.7735, -2.6665, -0.8887, -2.3327]], [[ -7.6039, -12.2237, -9.4796, -9.0273, -9.2357, -8.8331, -7.7148, -4.4527, -6.7737]], [[ -3.1771, -6.2996, -4.2985, -5.3096, -2.4341, -4.2919, -3.3351, -3.2724, -3.0251]], [[ -2.1162, -4.9887, -4.7072, -3.8313, -4.0952, -7.3515, -6.2257, -1.9933, -5.5374]], [[ -4.8980, -6.8229, -7.3980, -6.4676, -5.9936, -5.8171, -5.7606, -2.6793, -5.1416]], [[ -1.3689, -3.8808, -3.8031, -3.2089, -3.6153, -4.0522, -3.8040, -2.7695, -1.9975]], [[ -1.4815, -4.1486, -2.5494, -2.2275, -2.1487, -1.3604, -1.5155, -1.0961, -1.1029]], [[ -3.7323, -5.8797, -6.5019, -2.9351, -3.2727, -4.1640, -3.7836, -2.8786, -3.8020]], [[ -4.2632, -7.0920, -5.7899, -6.0331, -4.9288, -2.9688, -2.7684, -3.1252, -4.2077]], [[ -1.6813, -3.6601, -3.2818, -2.8760, -3.2370, -2.4091, -2.4576, -2.5153, -2.1527]], [[ -0.8469, -4.7211, -4.4255, -4.0394, -4.0750, -3.4417, -3.2347, -3.1967, -2.9802]]], [[[ -1.6842, -4.3379, -2.5161, -3.5950, -3.6945, -3.1804, -3.4802, -2.8724, -2.3024]], [[ 1.6622, -1.3382, -1.5157, -1.0048, -2.3162, -1.6178, -1.8575, -1.2593, -2.6257]], [[ -8.6537, -12.1342, -9.9533, -9.6179, -12.2874, -7.9151, -6.7911, -4.4657, -6.5278]], [[ -3.2069, -6.1138, -5.0044, -5.9203, -5.5599, -4.8626, -3.8777, -2.9837, -2.8900]], [[ -2.4369, -4.7982, -4.6661, -4.3780, -5.5800, -5.6241, -3.3795, -1.6777, -3.0136]], [[ -4.6164, -6.3824, -7.1138, -6.1399, -7.7932, -5.1791, -5.0771, -2.3186, -4.7830]], [[ -1.1534, -3.9500, -3.4838, -3.5823, -3.8023, -4.1761, -4.1583, -2.5344, -2.5952]], [[ -1.4942, -4.3531, -2.5712, -2.2550, -2.1285, -1.3517, -1.4623, -1.1718, -0.9450]], [[ -4.1062, -6.8801, -7.0667, -3.8512, -7.0563, -5.3159, -3.8905, -3.6578, -4.5961]], [[ -4.3823, -7.2613, -6.0506, -6.7778, -7.6291, -3.3720, -2.8909, -3.5690, -4.5395]], [[ -1.5358, -3.4009, -3.0856, -2.8081, -2.9044, -2.2078, -2.0998, -2.3569, -2.1717]], [[ -0.8073, -4.6696, -4.3682, -4.0978, -4.0141, -3.4057, -3.1759, -3.1918, -3.0906]]], [[[ -1.8130, -4.5548, -3.0249, -3.5680, -3.2677, -3.6640, -3.2439, -3.0657, -2.7054]], [[ 1.3829, -0.8351, -1.8931, -0.9926, -2.6728, -2.0972, -2.7477, -1.3689, -1.7300]], [[ -7.9290, -11.3746, -8.8050, -9.5818, -7.5545, -7.9141, -5.9651, -3.6199, -6.6790]], [[ -3.2847, -5.9630, -5.0034, -5.4744, -2.8535, -5.0828, -4.4281, -2.7214, -3.3412]], [[ -2.6133, -4.8632, -5.1354, -5.0069, -3.3643, -7.5567, -5.0659, -1.5655, -4.2392]], [[ -4.4976, -6.6623, -7.1244, -6.4942, -5.2899, -5.8287, -4.7702, -2.1495, -5.2769]], [[ -1.0346, -3.5672, -3.0845, -3.1086, -3.4940, -4.0918, -4.0988, -2.3545, -3.0112]], [[ -1.5435, -4.4635, -2.7231, -2.3546, -2.3337, -1.4367, -1.5274, -1.1182, -1.3701]], [[ -3.7436, -5.9134, -6.8124, -2.7655, -3.8983, -4.8608, -4.3177, -2.6441, -3.3993]], [[ -4.4766, -7.1307, -5.7675, -6.7431, -4.9708, -3.4214, -3.4791, -3.5872, -4.4400]], [[ -1.6502, -3.3526, -3.2092, -2.9269, -3.1161, -2.4190, -2.2373, -2.2912, -2.1113]], [[ -0.9678, -4.6589, -4.5664, -4.3455, -4.1882, -3.6405, -3.3297, -3.2791, -3.1639]]]]) attn_weights tensor([[[[ 4.2728, -0.1995, 1.9111, -2.2852, -0.7780, -4.1645, -3.4287, -0.6093, 1.3047]], [[ -2.9989, -6.0399, -5.5310, -4.6812, -5.3849, -5.1004, -6.1096, -3.4553, -3.6954]], [[ -4.6544, -6.7866, -8.0430, -4.9193, -4.4627, -6.4895, -7.4996, -3.4747, -3.6960]], [[ -5.2299, -9.3578, -13.2670, -11.2389, -10.6908, -8.3974, -9.8543, -4.8719, -8.1318]], [[ 0.6043, -3.1108, -3.1331, -3.5077, -3.5117, -3.2003, -2.9512, -2.6837, -2.9946]], [[ -0.2414, -1.5526, -2.7205, -0.9378, -1.6933, -3.2176, -3.0416, -2.7307, -3.2096]], [[ -3.5850, -6.1111, -5.0983, -5.6588, -4.3563, -3.8613, -5.3358, -4.1859, -2.7565]], [[ -6.3133, -10.1591, -11.6793, -9.7232, -7.8472, -6.2268, -5.1337, -5.1784, -6.8329]], [[ -4.3534, -6.6875, -8.8684, -6.3698, -7.6489, -6.8108, -6.3901, -2.5411, -4.5876]], [[ -1.9450, -4.1921, -4.4171, -1.7184, -3.0993, -5.3316, -5.7309, -3.1636, -3.1951]], [[ -1.1463, -5.0668, -3.7867, -4.2640, -3.4064, -3.8417, -4.2610, -2.9781, -2.4272]], [[ -2.8309, -5.2912, -5.7601, -4.1481, -3.4849, -2.7711, -3.5061, -3.3202, -3.5324]]], [[[ 4.4476, -0.7140, -1.8837, -1.4257, -0.1094, -3.3831, -4.2224, -1.3852, -0.2039]], [[ -2.6062, -5.9397, -4.2439, -4.3486, -5.2625, -7.1883, -6.7084, -3.6693, -4.0850]], [[ -4.4793, -6.9548, -4.5462, -4.3006, -3.7977, -6.1059, -6.0566, -3.5612, -4.4968]], [[ -5.2666, -9.7591, -10.2752, -10.8883, -10.1651, -9.5934, -9.1383, -5.2470, -8.1106]], [[ 1.3541, -3.1936, -3.1331, -3.4792, -4.4726, -4.0375, -5.0187, -1.7925, -2.0230]], [[ -0.2712, -1.5647, -2.4574, -1.4726, -1.2342, -2.8090, -2.4886, -1.8515, -3.1938]], [[ -3.7393, -6.8182, -2.6846, -4.2154, -3.9304, -4.5622, -4.5463, -4.5307, -4.7855]], [[ -6.0973, -11.0484, -9.0366, -8.8435, -8.7032, -6.8167, -5.2775, -5.5460, -7.2924]], [[ -3.8183, -6.7303, -6.8612, -6.1333, -7.0076, -8.0343, -5.8840, -2.6020, -4.3065]], [[ -1.9514, -4.2758, -2.4889, -1.2985, -3.0055, -4.8964, -4.6139, -3.1510, -3.1863]], [[ -1.0800, -5.3508, -4.2394, -4.5163, -3.5527, -4.1093, -4.5974, -3.2465, -3.2563]], [[ -2.5002, -5.0176, -5.1837, -3.9133, -2.8678, -2.7630, -2.8795, -2.8381, -2.3942]]], [[[ 4.7720, -0.5353, -3.4534, -4.2362, -0.5440, -2.1481, -4.5203, -1.2969, 1.9329]], [[ -2.4002, -5.1261, -3.6794, -4.2781, -5.2119, -6.1315, -6.3463, -3.2537, -4.2348]], [[ -4.5538, -7.2736, -6.3154, -5.4339, -5.3538, -5.9261, -6.1785, -3.6744, -5.7504]], [[ -4.2611, -8.9993, -9.9396, -9.6296, -10.0193, -9.5152, -10.4464, -4.4984, -7.3720]], [[ 1.4638, -3.1195, -3.4764, -3.0232, -4.0222, -3.2744, -3.9675, -1.7160, -2.6691]], [[ -0.2542, -2.0518, -3.3510, -1.6563, -1.3958, -2.6073, -2.3160, -2.2398, -3.9927]], [[ -3.2264, -5.6745, -2.6845, -3.8483, -4.5497, -4.6707, -5.2186, -4.3928, -3.4685]], [[ -5.8923, -10.4387, -9.9676, -9.1446, -8.5284, -6.8968, -6.0075, -5.5000, -8.3672]], [[ -3.6978, -6.2180, -6.3553, -6.9250, -7.4953, -6.7023, -6.1668, -2.0450, -4.1820]], [[ -1.6919, -4.1043, -2.3242, -1.6744, -4.2053, -3.8156, -3.9036, -3.4264, -4.2617]], [[ -0.9538, -6.2593, -5.0689, -5.1786, -3.8473, -4.0428, -4.5112, -3.1600, -3.3277]], [[ -2.3509, -5.0162, -6.4660, -4.4286, -3.3957, -2.2614, -2.9169, -2.4766, -3.6755]]], [[[ 3.8174, -1.1851, -3.2352, -2.2225, 1.3859, -4.2007, -4.1615, -1.7086, 1.2300]], [[ -2.9225, -6.1084, -4.5445, -4.2759, -5.4964, -5.9804, -5.8967, -3.2296, -4.0029]], [[ -4.8420, -6.9103, -6.2767, -5.3832, -7.8034, -6.2749, -5.6076, -3.2812, -3.8176]], [[ -5.4572, -9.4851, -10.6315, -10.8147, -12.2932, -9.1069, -8.6744, -4.9111, -7.4324]], [[ 0.7086, -3.0314, -3.1182, -3.1967, -2.9175, -2.7929, -3.5646, -2.3769, -2.2814]], [[ -0.2255, -1.8678, -3.1348, -2.4116, -2.1510, -2.8129, -2.6021, -2.2385, -2.5015]], [[ -3.9254, -6.8810, -3.3097, -5.0078, -6.6346, -3.2760, -3.9817, -4.2680, -3.8605]], [[ -6.4394, -10.8353, -9.1401, -8.7188, -10.4802, -5.2072, -4.4100, -5.1518, -6.8067]], [[ -4.4310, -6.4652, -6.6039, -6.8857, -8.8878, -6.2316, -6.0798, -2.2584, -5.3000]], [[ -2.2983, -4.6082, -3.2606, -2.0135, -3.9261, -4.8824, -3.1370, -2.8530, -3.1149]], [[ -1.2156, -5.8160, -4.6691, -5.2258, -3.6826, -3.8916, -4.0245, -3.2411, -2.4446]], [[ -2.6065, -5.4440, -5.2084, -3.9867, -5.2275, -3.7148, -3.7395, -3.1746, -4.0097]]], [[[ 4.8049, -1.0053, -2.8728, -2.6945, -1.3578, -6.0921, -6.7668, -1.9710, 1.3005]], [[ -3.0205, -6.7231, -4.8593, -5.3325, -4.9260, -6.2643, -6.4694, -3.9906, -4.2203]], [[ -4.7735, -7.5388, -6.5397, -6.2856, -4.9065, -6.1653, -7.4000, -3.9784, -5.7678]], [[ -5.2056, -9.9627, -10.0996, -10.6708, -10.9322, -10.7432, -10.3563, -5.2252, -8.3701]], [[ 1.2316, -3.3079, -3.4481, -2.8615, -3.3422, -4.1038, -4.1330, -2.7015, -4.3049]], [[ -0.1977, -2.4510, -3.4433, -2.3345, -1.8413, -3.4928, -3.8255, -2.4136, -2.9573]], [[ -3.7279, -7.1198, -3.9382, -5.8761, -5.7999, -4.7807, -5.6578, -4.1050, -3.9156]], [[ -6.4020, -10.8163, -9.8030, -8.8029, -8.4541, -6.3153, -5.5768, -5.3353, -7.3640]], [[ -4.3187, -7.0824, -7.1432, -7.8962, -8.9700, -7.7751, -6.8810, -2.6354, -5.8578]], [[ -2.0391, -4.6782, -3.4551, -1.8099, -3.0980, -4.4158, -3.2689, -2.7380, -3.5378]], [[ -1.1611, -5.8492, -4.9948, -4.7285, -3.4020, -4.1608, -4.8426, -3.6819, -3.4235]], [[ -2.6793, -5.2841, -5.0497, -3.8900, -3.0174, -3.9452, -5.0566, -3.5246, -3.8669]]]]) attn_weights tensor([[[[-2.9054e+00, -7.3528e+00, -7.8702e+00, -5.1620e+00, -5.9462e+00, -7.2230e+00, -7.5548e+00, -4.2604e+00, -5.3871e+00]], [[-2.8431e+00, -4.6759e+00, -5.3462e+00, -4.0567e+00, -4.9035e+00, -4.2142e+00, -4.9490e+00, -1.0199e+00, -2.0467e+00]], [[-4.1467e-01, -2.5619e+00, -4.3731e+00, -3.4050e+00, -5.0696e+00, -4.7052e+00, -4.4862e+00, -2.8013e+00, -4.4997e+00]], [[-2.3674e+00, -5.2470e+00, -6.1372e+00, -4.4864e+00, -4.6024e+00, -4.1607e+00, -3.5156e+00, -4.0776e+00, -4.2196e+00]], [[ 1.1237e+00, -1.3242e+00, -8.1226e-01, -1.4939e+00, -8.4204e-01, -2.5794e+00, -3.8694e+00, -1.6970e+00, -9.1558e-01]], [[-2.6212e+00, -7.5787e+00, -7.3236e+00, -6.2517e+00, -5.6186e+00, -5.5145e+00, -5.8578e+00, -5.5948e+00, -5.7688e+00]], [[-2.3897e+00, -4.4448e+00, -6.1540e+00, -4.6426e+00, -3.7370e+00, -3.7327e+00, -4.1705e+00, -3.9143e+00, -4.7776e+00]], [[-1.4787e-01, -5.4077e+00, -2.4835e-01, -1.4593e+00, -1.5740e+00, -2.4108e+00, -1.7567e+00, -6.8747e-01, 7.9299e-01]], [[ 1.6358e+00, -2.5679e+00, -2.9760e+00, -2.2585e+00, -1.4506e+00, -2.5328e+00, -2.6592e+00, -1.4533e+00, -2.1685e+00]], [[-1.4661e+00, -3.0664e+00, -4.4436e+00, -2.8770e+00, -1.7464e+00, -3.9873e+00, -3.1154e+00, -3.3027e+00, -3.5246e+00]], [[ 1.2865e+00, -1.7915e+00, -2.9583e+00, -3.1440e+00, -2.7846e+00, -2.5197e+00, -3.2658e+00, -1.5940e+00, -2.7694e+00]], [[-6.5255e+00, -1.2462e+01, -1.9823e+01, -1.7472e+01, -2.2333e+01, -1.3431e+01, -1.3525e+01, 7.7157e+00, -5.1484e+00]]], [[[-2.9267e+00, -7.4517e+00, -6.4142e+00, -3.6042e+00, -3.9618e+00, -6.3730e+00, -5.4991e+00, -5.5066e+00, -4.2158e+00]], [[-1.8748e+00, -5.1472e+00, -5.2901e+00, -3.8394e+00, -5.5186e+00, -5.2451e+00, -5.1505e+00, -3.1776e+00, -3.4753e+00]], [[-2.1034e-01, -2.1794e+00, -3.1493e+00, -2.7033e+00, -3.9165e+00, -4.0905e+00, -3.7241e+00, -2.2114e+00, -2.7523e+00]], [[-2.7427e+00, -5.3727e+00, -3.3481e+00, -2.5048e+00, -3.5112e+00, -3.3229e+00, -1.6286e+00, -4.1980e+00, -4.1744e+00]], [[ 1.0325e+00, -2.0381e+00, -1.3662e+00, -1.8332e+00, -1.3563e+00, -2.3353e+00, -3.6074e+00, -1.6034e+00, -1.0462e+00]], [[-2.5372e+00, -7.0201e+00, -5.4270e+00, -4.9096e+00, -4.1678e+00, -5.4631e+00, -5.2500e+00, -5.6646e+00, -6.4778e+00]], [[-2.1577e+00, -4.2973e+00, -4.1781e+00, -3.8655e+00, -3.2932e+00, -3.4594e+00, -3.7488e+00, -3.7326e+00, -3.9468e+00]], [[ 2.9110e-01, -4.3093e+00, -1.4409e-01, -7.4080e-02, -4.7288e-01, -1.4563e+00, 1.7975e-01, -2.3292e-01, 1.8062e+00]], [[ 1.7844e+00, -2.8968e+00, -2.7385e+00, -2.2592e+00, -2.4879e+00, -3.2321e+00, -2.1091e+00, -9.7486e-01, -1.4003e+00]], [[-1.4307e+00, -3.3516e+00, -2.8917e+00, -2.1139e+00, -1.4211e+00, -4.0846e+00, -3.0046e+00, -2.8194e+00, -4.0436e+00]], [[ 1.2360e+00, -1.9248e+00, -2.5179e+00, -3.7866e+00, -3.4764e+00, -4.1476e+00, -3.0828e+00, -1.7262e+00, -7.6304e-01]], [[-5.7507e+00, -1.3986e+01, -1.9757e+01, -1.7027e+01, -2.1530e+01, -1.1882e+01, -8.8331e+00, 8.3721e+00, -1.1587e+00]]], [[[-2.5505e+00, -6.8559e+00, -6.6593e+00, -4.2599e+00, -4.3389e+00, -6.3774e+00, -5.3522e+00, -4.4277e+00, -5.5281e+00]], [[-1.8862e+00, -4.8502e+00, -4.5443e+00, -4.2481e+00, -5.2755e+00, -4.7415e+00, -3.9814e+00, -2.0207e+00, -3.1098e+00]], [[ 1.2369e-02, -1.2230e+00, -2.8710e+00, -3.2149e+00, -4.3791e+00, -4.4118e+00, -4.0991e+00, -2.4428e+00, -3.4534e+00]], [[-2.3241e+00, -4.1258e+00, -3.6927e+00, -2.0455e+00, -2.3997e+00, -1.9756e+00, -1.7099e+00, -2.8788e+00, -4.1713e+00]], [[ 1.2270e+00, -2.0851e+00, -1.2748e+00, -1.2578e+00, -3.8511e-01, -1.7480e+00, -3.9477e+00, -1.8124e+00, -1.0650e+00]], [[-2.3717e+00, -6.6775e+00, -5.7050e+00, -5.5804e+00, -4.6904e+00, -5.0611e+00, -5.1842e+00, -4.9045e+00, -5.2207e+00]], [[-2.1205e+00, -4.2269e+00, -4.6122e+00, -3.9904e+00, -3.7803e+00, -3.3832e+00, -3.5999e+00, -3.4203e+00, -3.6964e+00]], [[ 1.7491e-01, -3.9021e+00, -3.2873e-01, -4.3235e-01, -6.0145e-01, -2.0737e+00, -6.6535e-01, 4.9424e-01, 1.8811e+00]], [[ 1.6181e+00, -2.4844e+00, -2.0187e+00, -2.4112e+00, -2.3990e+00, -2.7616e+00, -2.3115e+00, -5.5427e-01, -1.1762e+00]], [[-1.3841e+00, -3.1764e+00, -3.1605e+00, -1.7343e+00, -8.3559e-01, -3.3616e+00, -1.7780e+00, -2.0154e+00, -3.7082e+00]], [[ 1.3619e+00, -1.5850e+00, -2.1431e+00, -3.8520e+00, -2.9257e+00, -4.0750e+00, -3.3190e+00, -1.8011e+00, -1.0918e+00]], [[-8.2955e+00, -1.3790e+01, -1.8276e+01, -1.7337e+01, -2.2028e+01, -1.5600e+01, -1.6485e+01, 6.1511e+00, -3.9340e+00]]], [[[-3.7370e+00, -7.0531e+00, -6.0757e+00, -3.4624e+00, -4.2700e+00, -6.0594e+00, -5.0144e+00, -3.5632e+00, -5.7158e+00]], [[-2.3718e+00, -5.2191e+00, -4.7572e+00, -4.6116e+00, -7.2254e+00, -6.1904e+00, -5.6339e+00, -1.8644e+00, -4.1357e+00]], [[-3.8489e-01, -2.3842e+00, -3.1107e+00, -2.6354e+00, -3.8662e+00, -4.1307e+00, -3.3445e+00, -2.2604e+00, -4.1024e+00]], [[-2.9876e+00, -5.7394e+00, -4.6084e+00, -4.5856e+00, -5.1396e+00, -2.4248e+00, -2.3682e+00, -3.7069e+00, -4.1985e+00]], [[ 9.6661e-01, -2.4232e+00, -2.7800e+00, -3.1794e+00, -8.7256e-01, -1.1775e+00, -2.5435e+00, -1.5318e+00, -3.4053e-01]], [[-2.6866e+00, -7.7649e+00, -4.9996e+00, -4.8096e+00, -6.1259e+00, -5.2540e+00, -4.8898e+00, -5.5315e+00, -5.4246e+00]], [[-2.3905e+00, -4.7289e+00, -5.1316e+00, -4.8043e+00, -4.5808e+00, -3.9716e+00, -4.7160e+00, -3.8226e+00, -4.1158e+00]], [[-3.4584e-01, -5.0529e+00, -8.1443e-01, -2.0007e+00, -7.8345e-01, -1.7222e+00, -1.2591e+00, -1.0883e+00, 1.0334e+00]], [[ 1.4311e+00, -3.6134e+00, -3.1733e+00, -2.8995e+00, -3.2145e+00, -3.0209e+00, -2.2731e+00, -7.6854e-01, -1.0498e+00]], [[-1.4757e+00, -3.4716e+00, -3.7669e+00, -3.3449e+00, -2.0559e+00, -4.1855e+00, -2.7482e+00, -2.5887e+00, -3.2802e+00]], [[ 1.1092e+00, -2.5785e+00, -3.3692e+00, -3.7459e+00, -3.4592e+00, -3.5993e+00, -2.7596e+00, -1.6370e+00, -2.4305e+00]], [[-6.5548e+00, -1.1141e+01, -1.5619e+01, -1.2122e+01, -2.1349e+01, -1.1126e+01, -1.1519e+01, 1.0348e+01, -2.2228e+00]]], [[[-2.9898e+00, -6.4672e+00, -5.5086e+00, -3.7849e+00, -3.1957e+00, -6.7128e+00, -4.9417e+00, -3.4870e+00, -5.4688e+00]], [[-2.5007e+00, -4.8230e+00, -4.9610e+00, -5.1474e+00, -4.5291e+00, -4.0796e+00, -6.4286e+00, -1.9768e+00, -2.8419e+00]], [[-2.7627e-01, -2.0375e+00, -3.0511e+00, -3.0901e+00, -3.6764e+00, -4.0689e+00, -2.8607e+00, -2.0866e+00, -3.3499e+00]], [[-2.5951e+00, -4.6382e+00, -3.2778e+00, -2.8243e+00, -3.4036e+00, -2.6036e+00, -2.0041e+00, -2.9326e+00, -4.0450e+00]], [[ 1.2985e+00, -1.7230e+00, -2.1001e+00, -3.4256e+00, -1.7641e+00, -2.6173e+00, -3.9890e+00, -1.7316e+00, -7.6486e-01]], [[-2.5254e+00, -6.8978e+00, -4.5788e+00, -4.8020e+00, -4.5875e+00, -6.1126e+00, -5.6622e+00, -4.8196e+00, -7.4075e+00]], [[-2.4808e+00, -4.4690e+00, -4.3468e+00, -4.4059e+00, -3.6798e+00, -4.2495e+00, -4.1078e+00, -3.4276e+00, -4.3254e+00]], [[ 1.2468e-01, -5.8080e+00, -6.4287e-01, -1.2783e+00, -1.0612e+00, -2.2171e+00, -1.6937e+00, -9.6663e-01, 6.8767e-01]], [[ 1.5684e+00, -2.6941e+00, -2.9250e+00, -2.8441e+00, -2.1730e+00, -3.0219e+00, -2.1807e+00, -1.3143e+00, -2.1049e+00]], [[-1.5872e+00, -2.5839e+00, -2.9711e+00, -1.8943e+00, 3.1354e-01, -2.9832e+00, -2.3078e+00, -1.4681e+00, -3.2633e+00]], [[ 1.3910e+00, -1.5729e+00, -2.0508e+00, -3.2234e+00, -2.8409e+00, -4.0584e+00, -4.1616e+00, -1.7848e+00, -1.6919e+00]], [[-8.3144e+00, -1.1055e+01, -1.5602e+01, -1.2846e+01, -1.8319e+01, -1.3835e+01, -1.3232e+01, 1.0451e+01, -6.7900e+00]]]]) attn_weights tensor([[[[ 2.2477e+00, -3.3101e+00, -3.9717e+00, -2.4559e-01, -1.6403e+00, -1.2238e+00, -2.6200e+00, -7.7814e-01, -3.5812e-01]], [[ 4.3495e+00, -9.1664e+00, -7.5811e+00, 1.3684e+00, -1.9247e+00, -1.4472e+00, -6.5338e+00, -4.9363e+00, -2.0767e+00]], [[-1.5245e-01, -2.4472e+00, -3.9156e+00, -2.4713e+00, -1.8754e+00, -1.9030e+00, -2.8744e+00, -2.6064e+00, -3.3627e+00]], [[-5.5045e-02, -1.1059e+00, -3.0914e+00, -1.6019e+00, -2.2744e+00, -2.7286e+00, -2.4354e+00, -2.0496e+00, -2.6859e+00]], [[-3.2071e-01, -3.5719e+00, -4.9128e+00, -1.9039e+00, -1.8988e+00, -1.5556e+00, -1.1838e+00, -1.1773e+00, -2.8892e+00]], [[ 1.4590e+00, -4.0244e+00, -4.0156e+00, -9.5966e-01, -1.5257e+00, -1.0106e+00, -3.5271e+00, -2.7560e+00, -2.7012e+00]], [[ 8.8737e-01, -6.7224e+00, -7.7923e+00, -7.4374e+00, -6.5074e+00, -1.7232e+00, -6.3147e-01, -1.1480e-01, -2.5658e+00]], [[ 7.1169e-01, -4.0652e+00, -5.3947e+00, -5.4209e+00, -4.6556e+00, -4.6491e+00, -1.8367e+00, -3.5998e+00, -3.8393e+00]], [[ 7.3555e-01, -3.7955e+00, -4.3095e+00, 9.7568e-03, -4.2846e-01, -1.8453e+00, -3.8235e+00, -2.4922e+00, -1.6772e+00]], [[ 6.5595e-01, -2.4872e+00, -3.7841e+00, -3.0673e+00, -2.6581e+00, -2.5846e+00, -2.4739e+00, -2.0428e+00, -3.0569e+00]], [[ 2.0135e+00, -1.6550e+00, -1.3686e+00, -1.1428e+00, 6.8246e-01, 2.9146e-01, 1.5230e+00, 1.4804e+00, -3.5744e-01]], [[ 1.0260e+00, -1.8232e+00, -9.4293e-01, -9.4669e-01, -7.7716e-01, -2.3796e+00, -4.3188e+00, -1.3938e+00, -4.4907e-02]]], [[[ 2.4835e+00, -4.3437e+00, -8.7496e-01, 3.2219e-01, -2.2510e+00, -1.6611e+00, -1.2261e+00, -1.9400e+00, 6.0925e-01]], [[ 4.7046e+00, -1.2046e+01, -7.7103e+00, -6.7322e+00, -6.9164e+00, -3.4348e+00, -8.2382e+00, -7.1911e+00, -1.4623e+00]], [[-2.9512e-01, -1.4405e+00, -1.4805e+00, -5.3468e-01, 1.1848e-01, -7.6918e-01, -1.7212e+00, -1.5661e+00, -3.4237e+00]], [[ 2.2289e-01, -2.2733e-01, -1.0785e+00, -5.7946e-01, -1.5608e+00, -2.3006e+00, -2.6596e+00, -2.0978e+00, -1.6536e+00]], [[-3.2859e-01, -3.2113e+00, -3.3144e+00, -1.2038e+00, -7.8842e-01, -1.1715e+00, -5.2668e-01, -1.4433e+00, -1.6585e+00]], [[ 1.4713e+00, -6.5027e+00, -4.0174e+00, -4.5376e+00, -3.8284e+00, -2.8018e+00, -3.5613e+00, -2.8357e+00, -2.5286e+00]], [[ 7.8930e-01, -7.5282e+00, -5.6029e+00, -5.0617e+00, -4.5273e+00, -2.6398e+00, -1.1054e+00, -8.6933e-01, -1.9012e+00]], [[ 8.3304e-01, -4.1251e+00, -4.6061e+00, -4.3908e+00, -3.2971e+00, -4.7898e+00, -2.5285e+00, -3.6541e+00, -3.9954e+00]], [[ 6.1825e-01, -3.3755e+00, -1.3720e+00, -1.8725e-01, -1.0775e+00, -2.5673e+00, -3.4260e+00, -2.5535e+00, -2.5738e+00]], [[ 1.0533e+00, -3.3253e+00, -2.7185e+00, -2.6825e+00, -2.3466e+00, -2.3546e+00, -2.6496e+00, -2.0149e+00, -1.8162e+00]], [[ 1.9450e+00, -1.4104e+00, -8.2101e-01, -6.9026e-01, -4.2436e-01, -1.0210e+00, 7.1636e-01, 7.0972e-01, -1.2824e+00]], [[ 9.8486e-01, -3.4001e+00, -2.8601e+00, -1.8959e+00, -1.2401e+00, -4.0624e+00, -4.1969e+00, -2.1961e+00, -5.1155e-01]]], [[[ 2.8453e+00, -3.1127e+00, -2.7810e+00, -1.2084e+00, -3.2282e+00, -2.3829e+00, -2.4455e+00, -1.3489e+00, -1.2667e+00]], [[ 4.7067e+00, -5.7425e+00, -3.6097e+00, -4.6039e+00, -6.3483e+00, -2.6573e+00, -6.1932e+00, -5.4886e+00, -1.7109e+00]], [[-1.3329e-01, -2.2073e+00, -2.4493e+00, -1.2369e+00, -1.0226e+00, -1.6014e+00, -2.0622e+00, -2.0609e+00, -3.1127e+00]], [[ 3.1450e-01, -3.7769e-01, -6.6998e-01, -8.8703e-01, -1.3490e+00, -2.2569e+00, -2.5875e+00, -2.1096e+00, -2.1727e+00]], [[-1.1731e-01, -3.1896e+00, -3.4323e+00, -1.3491e+00, -9.9446e-01, -2.0824e+00, -7.8394e-01, -9.0660e-01, -1.9537e+00]], [[ 1.8546e+00, -4.2403e+00, -2.6796e+00, -4.0577e+00, -5.2745e+00, -2.2815e+00, -2.1644e+00, -3.4458e+00, -2.1799e+00]], [[ 9.9437e-01, -7.7183e+00, -6.1355e+00, -4.9725e+00, -4.3059e+00, -2.5822e+00, -1.6560e+00, -7.3487e-01, -3.4049e+00]], [[ 7.8928e-01, -3.8781e+00, -3.1992e+00, -3.6956e+00, -3.4387e+00, -5.2811e+00, -2.0389e+00, -3.2018e+00, -4.9622e+00]], [[ 7.6407e-01, -1.3082e+00, -1.7428e+00, -8.2658e-01, -1.3357e+00, -2.1159e+00, -2.8715e+00, -2.0729e+00, -1.8418e+00]], [[ 1.1459e+00, -3.1405e+00, -3.0082e+00, -2.6293e+00, -2.3241e+00, -2.5559e+00, -3.0815e+00, -2.1135e+00, -2.4794e+00]], [[ 2.3675e+00, -1.3848e+00, -6.0084e-01, -5.0838e-01, -2.4015e-01, 5.1777e-01, 8.4877e-01, 1.1216e+00, -1.7363e+00]], [[ 1.1035e+00, -3.8409e+00, -2.3688e+00, -2.4070e+00, -1.8407e+00, -2.6902e+00, -4.3632e+00, -1.9479e+00, -5.4277e-01]]], [[[ 1.8294e+00, -4.6686e+00, -4.5845e+00, -1.8142e+00, -4.7119e+00, -5.1902e-01, -4.1618e-01, -1.8234e-01, -2.1377e+00]], [[ 4.3238e+00, -1.2916e+01, -9.2656e+00, -6.3980e+00, -7.9706e+00, 1.2459e+00, -4.4659e+00, -3.5871e+00, -1.3802e+00]], [[-1.7855e-01, -2.4133e+00, -3.5653e+00, -2.4785e+00, -1.7456e+00, -1.5661e+00, -1.7795e+00, -1.2659e+00, -2.6649e+00]], [[ 8.7734e-02, -8.0656e-01, -1.9598e+00, -8.0933e-01, -1.3494e+00, -2.0697e+00, -2.2917e+00, -1.4136e+00, -2.3882e+00]], [[-2.5242e-01, -3.4590e+00, -3.3426e+00, -2.0584e+00, -2.8716e+00, -1.7459e+00, -9.5852e-01, -9.3794e-01, -1.9121e+00]], [[ 1.6813e+00, -8.3938e+00, -5.8427e+00, -5.5275e+00, -6.5259e+00, -1.3165e+00, -3.0981e+00, -1.5519e+00, -1.7651e+00]], [[ 9.3803e-01, -6.6906e+00, -6.0991e+00, -6.4179e+00, -6.6541e+00, -1.8210e+00, -1.1513e+00, -6.7719e-01, -3.3955e+00]], [[ 7.7234e-01, -4.8644e+00, -4.9371e+00, -3.9850e+00, -4.0010e+00, -3.5214e+00, -2.1137e+00, -3.3530e+00, -3.4238e+00]], [[ 4.6172e-01, -6.3279e+00, -5.7685e+00, -4.0064e+00, -6.7469e+00, -1.0206e+00, -1.7678e+00, -6.5208e-01, -2.1994e+00]], [[ 7.3076e-01, -3.0359e+00, -3.2093e+00, -2.6350e+00, -1.9835e+00, -1.8248e+00, -1.9770e+00, -1.5938e+00, -1.6688e+00]], [[ 2.0474e+00, -1.4399e+00, -6.6797e-01, -5.9531e-01, 7.5170e-02, 4.1430e-02, 1.2293e+00, 1.1589e+00, -1.0215e+00]], [[ 9.6046e-01, -3.7932e+00, -3.3762e+00, -3.2685e+00, -1.6926e+00, -1.9586e+00, -3.6606e+00, -1.6805e+00, 2.7587e-01]]], [[[ 2.5000e+00, -3.4488e+00, -3.3292e+00, -2.5421e+00, -3.1874e+00, -2.0264e+00, -2.3833e+00, -1.7053e+00, -2.5097e+00]], [[ 4.7266e+00, -8.8315e+00, -8.0936e+00, -7.4232e+00, -5.8962e+00, -4.1757e+00, -8.5900e+00, -7.9486e+00, -3.6171e+00]], [[-1.7167e-01, -2.3613e+00, -3.3346e+00, -2.5804e+00, -1.6477e+00, -5.6322e-01, -1.4252e+00, -7.3183e-01, -2.4426e+00]], [[-2.6749e-02, -6.6547e-01, -1.8748e+00, -1.5754e+00, -1.8200e+00, -2.6664e+00, -3.0309e+00, -1.9257e+00, -2.1965e+00]], [[-3.2267e-01, -3.8552e+00, -4.1334e+00, -3.4226e+00, -1.8858e+00, -1.8439e+00, -1.0324e+00, -1.3212e+00, -1.7731e+00]], [[ 1.6654e+00, -5.9146e+00, -4.2627e+00, -5.6186e+00, -4.0390e+00, -2.9622e+00, -4.8287e+00, -4.3567e+00, -3.3122e+00]], [[ 8.8535e-01, -6.5178e+00, -6.5930e+00, -5.6357e+00, -4.9444e+00, -1.4391e+00, -1.1850e+00, -1.5282e+00, -3.8119e+00]], [[ 1.0891e+00, -4.0663e+00, -4.4655e+00, -4.2573e+00, -2.4855e+00, -4.1707e+00, -2.1651e+00, -2.4675e+00, -3.6676e+00]], [[ 4.7784e-01, -3.3771e+00, -4.6331e+00, -4.2982e+00, -1.3715e+00, -1.6824e+00, -2.5682e+00, -1.8543e+00, -3.6323e+00]], [[ 1.0879e+00, -3.0072e+00, -3.2870e+00, -3.1900e+00, -2.3912e+00, -2.1293e+00, -2.4821e+00, -1.5095e+00, -2.3279e+00]], [[ 2.2046e+00, -1.5388e+00, -1.3797e+00, -7.4532e-01, -3.8291e-02, -1.2926e+00, 2.0113e-01, 9.6695e-01, -4.0293e-01]], [[ 8.7173e-01, -3.6538e+00, -3.1897e+00, -2.4523e+00, -1.9597e+00, -1.5820e+00, -3.6221e+00, -2.0125e+00, -9.6129e-02]]]]) attn_weights tensor([[[[-0.6548, -4.0688, -4.3097, -3.6230, -3.9221, -4.0897, -2.9426, -3.2640, -3.1066]], [[-1.0134, -3.5067, -4.5635, -1.6355, -1.8380, -2.9206, -3.4818, -3.6636, -3.1667]], [[ 0.2123, -2.5102, -2.7732, -3.1224, -3.5647, -3.7341, -3.7183, -2.4715, -2.4018]], [[-0.1024, -1.8133, -3.4487, -1.8991, -0.8258, -2.6542, -2.6452, -1.5915, -2.7093]], [[ 1.2363, -1.3533, -2.5484, -2.4437, -1.9882, -3.0994, -1.6481, -1.2234, -2.3905]], [[-0.8050, -2.9626, -3.8342, -2.9063, -3.8351, -4.3437, -3.3116, -3.5632, -3.0146]], [[ 1.8777, -2.6727, -0.8338, -1.4768, -1.5148, -2.3604, -2.9280, -0.9536, 0.5937]], [[-0.8966, -3.5795, -4.8512, -3.6819, -2.9846, -2.1522, -1.1333, -2.1589, -3.8464]], [[-1.5751, -4.9790, -5.8083, -5.5496, -4.9134, -3.6522, -3.0794, -2.3669, -3.6850]], [[ 3.6974, -5.7265, -5.4598, 1.5312, -2.8025, -0.7587, -4.6834, -3.3275, -2.8163]], [[ 2.9892, -3.2001, -1.8690, -0.3680, -0.3378, -1.6427, -0.5237, -1.4429, 0.4428]], [[-0.2376, -2.5319, -4.2419, -3.9260, -3.2312, -3.8979, -3.5046, -1.8345, -1.9160]]], [[[-0.8026, -3.0528, -1.5578, -1.4387, -2.7819, -2.5075, -2.4057, -4.6106, -4.9505]], [[-0.8980, -2.3899, -2.5773, -1.6746, -1.8025, -3.0551, -2.6616, -2.9344, -2.7755]], [[ 0.2743, -3.1718, -2.8078, -3.1256, -3.4468, -4.2354, -3.7955, -2.9298, -3.2671]], [[-0.1593, -2.4030, -3.2598, -2.4797, -0.7704, -1.6646, -1.7728, -0.9154, -1.9469]], [[ 1.1842, -0.9864, -1.6229, -1.6234, -1.6242, -2.0456, -0.6749, -0.2039, -1.4658]], [[-0.5499, -2.9464, -3.4532, -3.0868, -3.6672, -4.3893, -3.9381, -3.7179, -2.6983]], [[ 2.0275, -2.6171, -1.0231, -1.5639, -0.9695, -2.3170, -3.1053, -1.2773, 0.4769]], [[-0.6564, -3.3546, -3.9547, -3.4108, -2.9081, -1.3441, -0.2563, -1.8384, -3.4405]], [[-1.6547, -4.5856, -4.4016, -4.9635, -3.7499, -3.4518, -2.4199, -2.3202, -4.8361]], [[ 4.0891, -6.5793, -2.9199, -3.0366, -3.2328, -1.7223, -4.9690, -4.8772, -1.1347]], [[ 3.1235, -3.1696, -1.6534, -2.2139, -1.5764, -2.4613, -1.2852, -1.3566, -0.5228]], [[ 0.0128, -2.3080, -2.4897, -2.5025, -3.2192, -5.3216, -2.8592, -4.2723, -2.7834]]], [[[-0.7744, -3.3002, -2.0405, -1.6287, -2.8930, -3.1365, -2.8340, -3.8003, -3.5979]], [[-0.0133, -1.6464, -3.1943, -1.7018, -2.1476, -3.3721, -3.4931, -1.9282, -3.3379]], [[ 0.1020, -3.1945, -3.2627, -3.5320, -3.6756, -3.8585, -3.4698, -2.8590, -3.9215]], [[-0.2613, -2.4416, -2.8898, -1.6232, -0.5472, -2.0079, -1.5269, -0.6070, -1.4983]], [[ 1.3217, -1.0123, -1.8140, -2.0531, -1.5598, -2.1072, -0.8157, -0.7166, -1.4087]], [[-0.5192, -2.3408, -3.6771, -2.8864, -3.9096, -4.2625, -3.8302, -3.5996, -2.6277]], [[ 2.1362, -2.2375, -1.1283, -1.6963, -1.6365, -1.3975, -2.4857, -1.2752, 0.2287]], [[-0.9774, -2.9568, -3.7824, -3.0648, -1.9632, -1.4657, -0.4019, -1.3987, -3.3635]], [[-1.3633, -4.2869, -4.8839, -4.7720, -3.9880, -4.3420, -3.9398, -2.6868, -3.9681]], [[ 4.8039, -2.0897, -1.0802, -2.2523, -3.8100, -0.5780, -5.5887, -4.0946, -1.8945]], [[ 2.9557, -3.3557, -1.1601, -1.2251, -1.4686, -2.1999, -1.3096, -1.4072, -0.4352]], [[ 0.0344, -1.1316, -2.4319, -2.8446, -3.7281, -5.7257, -3.5426, -3.0162, -4.5570]]], [[[-1.7783, -3.2042, -2.8784, -1.9729, -1.4931, -2.7414, -2.0765, -1.1598, -3.3315]], [[-0.9130, -3.9703, -3.5334, -3.6908, -4.0498, -0.9102, -1.2734, -1.1404, -2.7498]], [[ 0.2676, -3.1572, -3.0806, -3.4172, -3.5977, -4.2970, -3.8568, -2.6116, -2.5877]], [[ 0.2596, -3.1910, -4.5951, -4.0318, -3.2280, -3.8149, -3.5523, -3.1994, -3.6734]], [[ 1.1498, -1.4281, -1.9163, -1.9620, -1.8170, -1.3755, -0.8426, -0.9412, -1.7739]], [[-0.8367, -3.3557, -4.1896, -3.8996, -4.2034, -3.8240, -3.2978, -3.3887, -3.3123]], [[ 2.0287, -3.8172, -3.1926, -3.9665, -1.3477, -1.5382, -1.8675, -1.3286, 0.4711]], [[-0.5857, -4.1734, -4.5502, -4.3199, -4.3208, -2.7519, -1.7246, -3.1049, -3.8102]], [[-1.8767, -5.1934, -6.0994, -6.1585, -5.3172, -3.5704, -2.7345, -2.6075, -4.5872]], [[ 3.6556, -9.0527, -6.9472, -4.2212, -5.8349, 1.1415, -3.3824, -1.5834, -2.7370]], [[ 2.9081, -4.4453, -1.7752, -1.0491, -1.9144, -1.9264, -0.9743, -1.8868, 0.1695]], [[-0.6864, -3.0730, -3.4007, -2.5274, -2.7126, -4.0827, -2.9498, -1.4158, -2.4181]]], [[[-0.9277, -3.7660, -3.0636, -1.6879, -2.6122, -4.1050, -3.2543, -3.4590, -4.2265]], [[-1.1737, -2.7561, -3.1993, -3.2468, -0.1971, -2.8448, -1.2711, -2.0246, -3.1401]], [[ 0.1792, -3.0635, -2.7835, -3.5205, -3.5374, -4.1928, -3.8046, -2.9487, -2.9692]], [[ 0.3544, -2.3897, -3.2980, -2.9472, -2.2720, -2.3563, -2.6785, -2.2763, -1.9680]], [[ 1.4058, -1.1200, -1.9120, -2.4478, -1.9590, -2.8510, -1.3332, -1.3280, -0.5725]], [[-0.5612, -2.9643, -4.0324, -4.1082, -3.7053, -4.5868, -3.7442, -3.9326, -3.4818]], [[ 1.8054, -3.5581, -3.1551, -2.9603, -1.4327, -2.4000, -2.8659, -1.5116, 0.0184]], [[-0.5833, -3.8152, -4.4827, -4.0507, -2.9915, -3.1335, -1.4161, -1.6439, -3.9023]], [[-1.5585, -5.6408, -6.4597, -5.9395, -4.4261, -2.9966, -2.2824, -2.7701, -5.7059]], [[ 4.7339, -5.9426, -5.4733, -4.7576, -2.3654, -1.0903, -6.6534, -4.3797, -4.7260]], [[ 3.2219, -3.7997, -2.3110, -2.1968, -2.3892, -2.8535, -1.2689, -2.1416, -2.2266]], [[-0.2258, -2.5521, -3.1134, -2.4407, -1.6387, -4.0739, -2.7468, -1.9171, -2.8956]]]]) attn_weights tensor([[[[-2.8204e-01, -6.6029e+00, -8.2104e+00, -6.2800e+00, -6.1182e+00, -3.4351e+00, -3.7215e+00, -2.3528e+00, -4.4333e+00]], [[ 2.0891e+00, -2.2701e+00, -2.0365e+00, -2.3404e+00, 2.3090e-01, -2.7818e-02, 1.6406e+00, 1.6346e+00, 4.1578e-01]], [[ 5.6558e+00, -2.9073e+00, -4.0102e+00, 4.4282e-01, -1.4892e+00, 1.5370e-01, -2.0318e+00, -2.1609e+00, -2.8048e-01]], [[ 3.7917e-01, -2.3879e+00, -3.0530e+00, -1.8136e+00, -1.4274e+00, -2.8435e+00, -2.1697e+00, -1.5293e+00, -1.8843e+00]], [[ 6.7895e-01, -2.8343e+00, -3.3772e+00, -2.9988e+00, -3.0935e+00, -3.3625e+00, -2.2650e+00, -2.8269e+00, -3.6401e+00]], [[ 2.7736e-01, 1.4807e-01, -9.6324e-01, 8.5267e-01, 6.8089e-01, -3.9187e+00, -9.9039e-01, 6.6568e-01, -1.6458e+00]], [[ 1.0863e+00, -2.1715e+00, -2.4046e+00, -1.8329e+00, -2.0870e+00, -1.8317e+00, -1.7160e+00, -2.3691e+00, -2.2780e+00]], [[ 2.8928e+00, -1.5288e+00, -2.0560e+00, -2.0459e+00, -2.7875e-01, -1.1285e-01, -4.3750e-02, 4.2432e-01, -9.9876e-01]], [[-6.6669e-01, -3.9397e+00, -4.4951e+00, -3.4745e+00, -2.0514e+00, -2.0383e+00, -8.0689e-01, -1.2222e+00, -3.2892e+00]], [[ 7.5659e-02, -1.3615e+00, -2.9300e+00, -3.0201e+00, -3.4562e+00, -2.6434e+00, -1.8026e+00, -7.4293e-01, -1.9198e+00]], [[ 2.8876e+00, -2.0841e+00, -3.6582e+00, 1.5620e+00, -1.7664e+00, -2.0455e+00, -2.6517e+00, -1.0943e+00, -1.1134e+00]], [[ 3.0010e+00, -2.5294e+00, -2.2957e+00, 1.9870e+00, -1.0058e+00, -1.4804e+00, -3.2657e+00, -2.9523e+00, -1.0518e+00]]], [[[-3.0169e-01, -4.7706e+00, -5.0917e+00, -4.0785e+00, -3.4034e+00, -2.7113e+00, -3.0289e+00, -2.0077e+00, -4.8910e+00]], [[ 2.8672e+00, -2.5317e+00, -9.7803e-01, -2.2170e+00, -1.2782e+00, -1.5388e+00, 7.8214e-02, -4.9797e-01, -1.5416e+00]], [[ 6.4370e+00, -3.8889e+00, -1.5177e+00, -1.9811e+00, -1.0342e+00, 1.3774e-01, -2.6441e+00, -2.5160e+00, 1.0412e+00]], [[ 4.5274e-01, -2.7000e+00, -1.5692e+00, -1.4997e+00, -9.5723e-01, -2.5444e+00, -2.1876e+00, -1.5420e+00, -7.9017e-01]], [[-8.1276e-02, -1.5220e+00, -1.2947e+00, -6.6392e-01, -9.7303e-01, -2.5266e+00, -1.5135e+00, -2.8534e+00, -4.0203e+00]], [[ 1.0383e+00, -4.0546e-01, -1.4549e-01, 3.4982e-01, -9.1559e-01, -3.8531e+00, -1.1856e+00, -8.8490e-01, -1.3551e+00]], [[ 1.1436e+00, -2.2907e+00, -2.1397e+00, -2.4705e+00, -2.8958e+00, -2.1347e+00, -1.7768e+00, -1.5826e+00, -1.4076e+00]], [[ 2.8665e+00, -1.3730e+00, -1.6301e+00, -1.5596e+00, 3.5243e-01, -7.9713e-01, -2.5133e-01, -7.1768e-02, -2.5809e-01]], [[-5.2301e-01, -3.9979e+00, -3.4342e+00, -3.1822e+00, -2.5419e+00, -2.2795e+00, -1.2900e+00, -1.1707e+00, -3.7863e+00]], [[ 3.5997e-01, -4.4763e-01, -1.1629e+00, -1.5837e+00, -3.1110e+00, -2.6180e+00, -1.5631e+00, -1.4070e+00, -1.1695e+00]], [[ 2.9353e+00, -3.3742e+00, -1.5200e+00, -2.6281e+00, -2.0749e+00, -1.7804e+00, -2.0994e+00, -1.9444e+00, -1.0310e+00]], [[ 2.7618e+00, -3.1108e+00, -1.5018e+00, -2.6593e+00, -2.0044e+00, -2.4863e+00, -4.4246e+00, -3.6837e+00, -1.2445e+00]]], [[[-3.2794e-01, -5.5386e+00, -6.6423e+00, -6.0026e+00, -5.2457e+00, -3.0128e+00, -3.6369e+00, -2.1789e+00, -3.4713e+00]], [[ 3.0944e+00, -2.0085e+00, -1.4911e+00, -2.5283e+00, -1.5928e+00, -2.0419e+00, -7.0649e-01, -3.5804e-01, -9.0796e-01]], [[ 6.2911e+00, -1.5428e+00, -1.1092e+00, -1.6149e+00, -2.8558e+00, -1.3186e-01, -1.0022e+00, -2.4127e+00, -1.4081e-02]], [[ 3.7201e-01, -2.2871e+00, -2.2918e+00, -1.9432e+00, -2.1304e+00, -3.1658e+00, -2.7672e+00, -1.7234e+00, 7.4006e-02]], [[ 4.2960e-01, -1.3707e+00, -1.7780e+00, -1.1590e+00, -2.1060e+00, -3.9309e+00, -2.9327e+00, -3.4952e+00, -3.8757e+00]], [[ 9.0044e-01, 4.4895e-01, 1.4852e-01, -2.2522e-01, -8.5752e-01, -3.6314e+00, -1.0133e+00, -4.8013e-01, -1.3637e+00]], [[ 1.3924e+00, -1.7127e+00, -2.0618e+00, -2.5610e+00, -2.6548e+00, -2.9001e+00, -2.2099e+00, -1.5392e+00, -1.7362e+00]], [[ 3.3777e+00, -1.2809e+00, -1.5005e+00, -1.4695e+00, 6.5514e-03, -8.1403e-01, -1.1022e+00, -7.7485e-01, -2.5295e-01]], [[-3.8248e-01, -3.7219e+00, -3.2018e+00, -2.8154e+00, -2.0139e+00, -2.3823e+00, -1.0766e+00, -9.4916e-01, -2.3370e+00]], [[ 3.6878e-01, 2.9620e-01, -5.2729e-01, -1.0848e+00, -2.1413e+00, -3.1431e+00, -2.0260e+00, -1.5615e+00, -1.6057e+00]], [[ 3.9671e+00, -1.6310e+00, -1.6938e+00, -1.5154e+00, -1.5410e+00, -5.5251e-01, -1.0249e+00, -1.4791e+00, -8.6593e-01]], [[ 3.1021e+00, -1.2642e+00, -9.8509e-01, -1.7277e+00, -1.5762e+00, -2.1311e+00, -4.1136e+00, -3.0170e+00, -1.0819e+00]]], [[[-9.5689e-01, -4.9225e+00, -5.3643e+00, -4.1481e+00, -3.9767e+00, -2.3107e+00, -2.7038e+00, -7.7448e-01, -3.2798e+00]], [[ 2.6388e+00, -3.4861e+00, -1.6507e+00, -2.6129e+00, -2.9082e+00, -2.9812e-01, 1.2987e+00, 9.5432e-02, -1.2122e+00]], [[ 5.9836e+00, -4.4687e+00, -3.5130e+00, -2.0044e+00, -1.9945e+00, 3.0122e+00, -3.6163e-01, -2.5692e+00, -3.1904e-01]], [[ 5.0065e-01, -3.6007e+00, -3.8927e+00, -4.0487e+00, -3.2569e+00, -2.1763e+00, -2.5053e+00, -2.5965e+00, -2.8360e+00]], [[ 6.6605e-01, -3.8645e+00, -3.8054e+00, -3.2724e+00, -3.7068e+00, -3.2164e+00, -2.1685e+00, -2.3042e+00, -3.7679e+00]], [[ 7.5692e-01, -2.4229e+00, -2.0305e+00, -1.0845e+00, -8.3484e-01, -2.5670e+00, -6.2781e-01, -5.0764e-01, -1.3828e+00]], [[ 1.3101e+00, -2.9536e+00, -2.8661e+00, -3.1528e+00, -3.4846e+00, -1.5759e+00, -1.2520e+00, -2.1223e+00, -2.2655e+00]], [[ 2.3675e+00, -2.9840e+00, -3.3660e+00, -3.3410e+00, -2.7571e+00, 2.6565e-01, 1.3638e+00, 1.5556e-02, -1.3016e+00]], [[-6.8334e-01, -4.4705e+00, -3.1434e+00, -2.6189e+00, -2.6631e+00, -1.8003e+00, -1.0943e+00, -2.0090e+00, -3.3996e+00]], [[ 1.6219e-01, -3.3779e+00, -4.2205e+00, -4.2949e+00, -5.0929e+00, -2.4722e+00, -2.7077e+00, -2.5621e+00, -3.8818e+00]], [[ 3.1038e+00, -3.5526e+00, -3.6781e+00, -2.5631e+00, -4.8659e+00, 7.7374e-01, -2.0512e+00, -1.7189e+00, -3.2822e+00]], [[ 2.1673e+00, -4.3740e+00, -4.3424e+00, -3.2351e+00, -2.9327e+00, 3.2729e-01, -2.0744e+00, -3.2460e+00, -2.3978e+00]]], [[[-6.5480e-01, -4.9823e+00, -5.8638e+00, -4.4701e+00, -3.2780e+00, -2.4404e+00, -2.7435e+00, -1.9246e+00, -4.8625e+00]], [[ 3.1243e+00, -2.9926e+00, -2.2189e+00, -2.9752e+00, -1.3400e+00, -1.7916e+00, -8.3232e-01, -1.8842e-01, -3.5587e+00]], [[ 6.0146e+00, -3.1219e+00, -4.9931e+00, -5.6758e+00, -3.9830e+00, -9.3095e-01, -4.4641e+00, -3.8958e+00, -2.8467e+00]], [[ 3.4273e-01, -3.0311e+00, -2.4511e+00, -3.4807e+00, -3.1153e+00, -1.6537e+00, -1.5726e+00, -6.3395e-01, -1.3301e+00]], [[ 1.6339e-01, -2.8711e+00, -3.5570e+00, -3.2347e+00, -3.1270e+00, -2.9548e+00, -1.7724e+00, -1.6716e+00, -3.9850e+00]], [[ 1.4083e+00, -2.3576e+00, -2.0118e+00, -1.9035e+00, -1.7463e+00, -4.1640e+00, -2.3667e+00, -1.7992e+00, -3.1684e+00]], [[ 1.2795e+00, -2.6619e+00, -2.7773e+00, -3.1240e+00, -3.3004e+00, -2.5543e+00, -1.9228e+00, -2.5309e+00, -3.4367e+00]], [[ 1.8638e+00, -3.0465e+00, -2.5082e+00, -2.7024e+00, -1.5360e+00, -3.8660e-01, 1.5395e+00, 1.0289e+00, -1.1138e+00]], [[-1.1645e+00, -4.3718e+00, -3.8147e+00, -2.6635e+00, -1.8463e+00, -2.3847e+00, -1.8537e+00, -1.3600e+00, -3.4594e+00]], [[-3.1159e-02, -1.7320e+00, -1.6811e+00, -2.5713e+00, -2.5402e+00, -1.1543e+00, -1.6700e+00, -4.3193e-01, -1.6313e+00]], [[ 2.6926e+00, -2.7106e+00, -2.9651e+00, -4.1101e+00, -1.1840e+00, -1.8496e+00, -3.4855e+00, -2.3090e+00, -3.2589e+00]], [[ 2.5553e+00, -2.5877e+00, -3.3689e+00, -4.2383e+00, -1.8563e+00, -2.2493e+00, -3.8389e+00, -4.1017e+00, -4.6460e+00]]]]) attn_weights tensor([[[[ 9.9314e-01, -1.8044e+00, -1.8037e+00, -2.7680e+00, -1.4818e+00, -3.8524e+00, -1.9558e+00, -2.2023e+00, -1.2209e+00]], [[ 3.3124e+00, -3.1100e+00, -4.0009e+00, 9.2298e-01, -3.0541e-02, -1.0906e+00, -2.7716e+00, -2.4482e+00, -2.8581e+00]], [[ 2.3604e+00, -1.3853e+00, -2.7507e+00, -4.4790e-01, -1.1132e+00, -8.5111e-01, -1.7596e+00, -1.3330e+00, -2.9090e+00]], [[ 2.2659e+00, -2.5062e+00, -2.5593e+00, -2.0310e+00, -1.5658e+00, -1.5998e+00, -1.5983e+00, -1.5722e+00, -1.8226e+00]], [[-4.2500e-01, -3.2333e+00, -4.1323e+00, -4.2740e+00, -3.2856e+00, -2.9267e+00, -2.2112e+00, -1.0982e+00, -3.0140e+00]], [[-9.5604e-01, -2.7633e+00, -3.8438e+00, -3.3592e+00, -3.1591e+00, -3.0812e+00, -2.9770e+00, -1.5306e+00, -3.0229e+00]], [[ 1.5957e+00, -2.8872e+00, -2.7323e+00, -2.0382e+00, -4.7867e-01, -9.9539e-01, -9.3999e-01, -1.6650e+00, -1.7235e+00]], [[-3.9800e-01, -5.1439e+00, -6.5279e+00, -6.2841e+00, -5.4294e+00, -3.7986e+00, -3.4768e+00, -2.6623e+00, -3.8945e+00]], [[ 3.0167e-01, -2.7992e+00, -3.5371e+00, -3.5369e+00, -2.6348e+00, -2.0398e+00, -1.0582e+00, -1.1752e+00, -3.3078e+00]], [[ 9.3574e-01, -3.7129e+00, -3.3513e+00, -3.4379e+00, -2.6642e+00, -1.3469e+00, -8.4168e-01, -1.7489e+00, -2.0369e+00]], [[ 1.0450e+00, -3.3975e+00, -2.8428e+00, -2.1922e+00, -1.3889e+00, -2.2913e+00, -2.0345e+00, -1.2117e+00, -1.0663e+00]], [[ 5.6089e-01, -2.7588e+00, -3.5041e+00, -1.7148e+00, -3.3146e+00, -1.9878e+00, -1.7250e+00, -2.3520e+00, -4.0377e+00]]], [[[ 1.0374e+00, -1.5945e+00, -1.0929e+00, -1.8804e+00, -1.4059e+00, -4.3318e+00, -2.0483e+00, -2.2281e+00, -2.8785e+00]], [[ 2.9669e+00, -2.0096e+00, -4.9533e-01, 2.1122e-01, 2.3224e-01, -4.0874e-01, -9.6771e-01, -2.0658e+00, -3.4851e-01]], [[ 1.8734e+00, -7.1116e-02, -7.1415e-01, -5.4020e-01, -7.4936e-01, -2.1304e-01, -7.7517e-01, -8.3164e-01, -1.5070e+00]], [[ 1.8742e+00, -1.1114e+00, -1.8217e+00, -1.8720e+00, -1.6289e+00, -1.7130e+00, -1.2918e+00, -3.5436e-01, -9.6134e-01]], [[ 1.7518e-01, -2.7547e+00, -2.5755e+00, -1.6801e+00, -3.5022e+00, -3.3051e+00, -2.0877e+00, -1.8015e+00, -2.4615e+00]], [[-6.2576e-01, -3.0297e+00, -1.9863e+00, -2.5826e+00, -3.2730e+00, -2.7115e+00, -2.2440e+00, -1.9394e+00, -3.4175e+00]], [[ 1.3478e+00, -1.8112e+00, -6.1929e-01, -1.4091e+00, -1.5082e+00, -6.9512e-01, -9.9812e-01, -2.8204e+00, -2.0541e+00]], [[-1.4478e-01, -4.8286e+00, -5.4872e+00, -5.1549e+00, -4.1747e+00, -4.1764e+00, -3.5185e+00, -3.0648e+00, -3.8557e+00]], [[ 5.2842e-01, -1.3793e+00, -1.3334e+00, -2.2163e+00, -2.3825e+00, -6.7450e-01, -2.2443e-01, -3.2027e-02, -7.6409e-01]], [[ 1.1324e+00, -2.7066e+00, -1.7513e+00, -2.1263e+00, -1.8978e+00, -1.4162e+00, -1.0053e+00, -1.5459e+00, -1.9320e+00]], [[ 1.1244e+00, -2.3249e+00, -1.1464e+00, -1.4032e+00, -1.0416e+00, -1.6064e+00, -1.7835e+00, -1.4515e+00, -5.0547e-01]], [[ 1.0073e+00, -2.2755e+00, -2.8678e+00, -2.6360e+00, -2.9805e+00, -1.5756e+00, -1.9818e+00, -2.7498e+00, -3.7459e+00]]], [[[ 1.1369e+00, -1.7758e+00, -1.7797e+00, -1.9787e+00, -1.8212e+00, -4.3944e+00, -2.0115e+00, -2.6814e+00, -1.6633e+00]], [[ 5.0259e+00, -1.6050e-01, 2.2021e-01, 1.8816e+00, 3.3120e-01, -9.1288e-01, -1.6158e+00, -1.0122e+00, -1.8478e-01]], [[ 1.6437e+00, 9.4572e-03, -4.5607e-01, -3.4379e-01, -8.3586e-01, -5.8567e-01, -1.2229e+00, -8.8963e-01, -9.1630e-01]], [[ 1.9390e+00, -1.5580e+00, -2.0604e+00, -2.2394e+00, -1.7592e+00, -3.0287e+00, -2.0733e+00, -1.0056e+00, -1.7531e+00]], [[ 2.3612e-01, -2.3284e+00, -3.2444e+00, -3.5035e+00, -4.3141e+00, -3.8342e+00, -2.6020e+00, -2.4015e+00, -2.3707e+00]], [[-6.6359e-01, -2.4461e+00, -2.1823e+00, -3.0853e+00, -3.4088e+00, -2.6413e+00, -2.0499e+00, -2.4519e+00, -2.0583e+00]], [[ 2.8001e+00, -1.7746e-01, 4.5867e-01, -5.3396e-01, -2.1935e+00, -3.0524e+00, -2.6246e+00, -1.4762e+00, -1.8078e+00]], [[-3.9131e-02, -4.3952e+00, -6.0771e+00, -6.0361e+00, -5.6783e+00, -4.1214e+00, -3.7500e+00, -3.0898e+00, -3.1860e+00]], [[ 4.7835e-01, -1.6630e+00, -1.8982e+00, -2.3884e+00, -2.7291e+00, -6.6530e-01, -2.7130e-01, -6.3695e-02, -7.5394e-01]], [[ 1.1069e+00, -2.1039e+00, -1.3052e+00, -1.4827e+00, -1.4148e+00, -1.7338e+00, -9.6051e-01, -1.1857e+00, -1.8687e+00]], [[ 1.1267e+00, -2.1481e+00, -1.7190e+00, -1.7314e+00, -1.4850e+00, -2.8703e+00, -2.6998e+00, -2.2320e+00, -1.2234e+00]], [[ 1.0604e+00, -2.1623e+00, -3.0042e+00, -2.3795e+00, -3.0702e+00, -2.2280e+00, -1.7066e+00, -2.3952e+00, -3.4530e+00]]], [[[ 8.5180e-01, -3.6293e+00, -2.9164e+00, -3.4067e+00, -2.1060e+00, -4.3521e+00, -2.5141e+00, -2.4143e+00, -1.3220e+00]], [[ 2.7600e+00, -2.7956e+00, -3.9475e+00, -1.9141e+00, -2.0542e+00, 1.1414e+00, -5.5154e-01, -1.8667e+00, -6.3307e-01]], [[ 1.7608e+00, -1.2772e+00, -2.1552e+00, -1.8344e+00, -5.2228e-01, -6.2597e-02, -3.5388e-01, -1.0183e+00, -6.9953e-02]], [[ 2.6913e+00, -2.0835e+00, -1.4948e+00, -2.2313e+00, -1.8318e+00, -3.2648e-01, 1.7884e+00, 4.5051e-01, 6.3927e-02]], [[-4.1202e-01, -4.1465e+00, -4.8007e+00, -4.6416e+00, -4.2277e+00, -3.9512e+00, -2.8165e+00, -2.3189e+00, -4.1767e+00]], [[-1.0469e+00, -4.0209e+00, -4.7749e+00, -3.3123e+00, -3.7892e+00, -2.7927e+00, -3.0117e+00, -1.7149e+00, -3.9645e+00]], [[ 1.3272e+00, -4.0906e+00, -4.0642e+00, -4.4720e+00, -3.5209e+00, 2.3073e+00, 1.9150e+00, -2.2586e+00, -1.0231e+00]], [[-1.5361e+00, -5.8492e+00, -5.2385e+00, -4.1619e+00, -3.2436e+00, -3.1551e+00, -2.6622e+00, -1.7762e+00, -2.9105e+00]], [[ 3.1983e-01, -3.4689e+00, -3.7866e+00, -3.7102e+00, -3.5810e+00, -5.3680e-01, 9.8161e-02, -1.1217e+00, -2.8958e+00]], [[ 1.2212e+00, -4.5739e+00, -3.9854e+00, -4.3657e+00, -2.7622e+00, -7.7398e-01, -1.1475e+00, -2.4230e+00, -1.7621e+00]], [[ 1.1671e+00, -3.9786e+00, -3.3823e+00, -4.1764e+00, -2.7406e+00, -2.5601e-01, -2.5386e-01, -5.7694e-01, -4.5894e-01]], [[ 4.7364e-01, -3.4408e+00, -3.1746e+00, -3.1530e+00, -3.1619e+00, -3.3084e-01, -1.5713e+00, -2.8678e+00, -3.3648e+00]]], [[[ 7.0731e-01, -2.8422e+00, -2.5602e+00, -3.0444e+00, -1.7575e+00, -4.6981e+00, -2.2788e+00, -2.3462e+00, -2.8571e+00]], [[ 1.6589e+00, -2.1812e+00, -1.8434e+00, -1.5058e+00, 8.9850e-01, 3.9559e-01, 7.9826e-01, -9.5213e-01, -1.4984e+00]], [[ 1.1374e+00, -4.8082e-01, -1.1045e+00, -1.6863e+00, 7.5310e-02, -5.9543e-01, -3.5272e-01, -4.5323e-01, -1.2469e+00]], [[ 2.4882e+00, -2.7271e+00, -2.5081e+00, -2.9570e+00, -2.3931e+00, 1.9107e-03, 8.7045e-01, 6.2464e-02, -1.0422e+00]], [[ 3.2084e-02, -5.3627e+00, -4.4644e+00, -3.6185e+00, -3.5414e+00, -4.2169e+00, -2.5178e+00, -4.2093e+00, -4.8039e+00]], [[-1.0473e+00, -3.4548e+00, -3.0378e+00, -2.1201e+00, -2.5699e+00, -2.7162e+00, -2.5613e+00, -1.9802e+00, -3.8676e+00]], [[ 5.6282e-01, -3.3852e+00, -3.3190e+00, -4.3458e+00, -2.0809e+00, 2.1929e+00, 2.0561e+00, -1.5873e+00, -2.8693e+00]], [[-1.1913e+00, -6.5674e+00, -5.9009e+00, -4.5802e+00, -3.1405e+00, -2.3492e+00, -1.8381e+00, -2.7856e+00, -4.7052e+00]], [[-6.4323e-01, -1.5677e+00, -1.6034e+00, -2.0158e+00, -2.3146e+00, -2.2402e-01, 4.6173e-01, 7.9169e-01, -3.8650e+00]], [[ 9.8474e-01, -2.5647e+00, -1.7490e+00, -2.3449e+00, -1.2623e+00, -4.4894e-01, -2.5005e-01, -1.0505e+00, -2.1765e+00]], [[ 1.1346e+00, -3.4735e+00, -2.6557e+00, -3.5555e+00, -1.8279e+00, -4.0323e-01, -7.1463e-01, -9.6473e-01, -1.4461e+00]], [[ 1.6833e+00, -2.3199e+00, -3.4272e+00, -3.8307e+00, -3.3441e+00, -1.9919e+00, -2.6527e+00, -2.1336e+00, -5.7772e+00]]]]) attn_weights tensor([[[[ 1.8249e+00, -2.5190e+00, -3.3110e+00, -2.5549e+00, -2.4072e+00, 2.7882e-02, 1.6111e+00, -5.6210e-01, -3.2413e+00]], [[ 2.9651e+00, -1.4520e+00, -2.1103e+00, 3.3157e-01, -6.0324e-01, -2.6063e+00, -1.7560e+00, -2.4811e+00, -1.6259e+00]], [[ 1.2406e+00, -3.1980e+00, -3.6996e+00, -3.7036e+00, -2.2110e+00, -9.2774e-01, -1.6615e-01, -1.4684e+00, -3.1662e+00]], [[-9.5421e-01, -2.8340e+00, -4.0773e+00, -3.3428e+00, -4.6898e+00, -1.8520e+00, -1.4357e+00, -1.6029e+00, -3.4133e+00]], [[ 2.6244e+00, -2.6079e+00, -3.8661e+00, -3.6859e+00, -2.6045e+00, -2.3423e+00, -2.0336e+00, -1.6330e+00, -3.1584e+00]], [[ 1.6906e+00, -2.7901e+00, -3.1429e+00, -2.6573e+00, -2.5067e+00, -2.6855e+00, -2.3734e+00, -2.4654e+00, -2.7833e+00]], [[ 2.9420e+00, -3.1472e+00, -4.3023e+00, -1.5597e+00, -1.8834e+00, -2.1963e+00, -1.4416e+00, -2.1083e+00, -2.5127e+00]], [[ 4.6860e-01, -3.4581e+00, -4.2871e+00, -3.4161e+00, -2.7866e+00, -3.4596e+00, -3.0075e+00, -2.9626e+00, -4.0188e+00]], [[ 1.8138e+00, -3.4552e+00, -3.7648e+00, -2.7112e+00, -2.8289e+00, -1.4279e+00, -7.1869e-01, -2.5444e+00, -3.1626e+00]], [[ 3.7852e+00, -2.7587e+00, -2.7130e+00, -6.5464e-03, -6.5361e-01, -1.2535e+00, 2.5237e-01, -1.7460e+00, -1.2360e+00]], [[ 4.8509e-01, -3.0634e+00, -3.6031e+00, -2.7471e+00, -2.5236e+00, -1.7686e+00, -9.7240e-01, -5.7989e-01, -1.7103e+00]], [[ 3.4763e+00, -2.2545e+00, -2.7949e+00, 1.5829e+00, -1.2639e+00, -3.1802e+00, -2.1425e+00, -3.2139e+00, -2.7066e+00]]], [[[ 1.7416e+00, -1.2632e+00, -1.6293e+00, -1.7409e+00, -2.8801e+00, 2.6320e-01, 8.4871e-01, -1.3660e+00, -2.4462e+00]], [[ 2.7306e+00, -1.7193e+00, -1.4362e+00, -1.8308e+00, -1.4599e+00, -2.0072e+00, -9.5698e-01, -2.3340e+00, -5.9816e-01]], [[ 1.3383e+00, -3.0965e+00, -2.5699e+00, -3.1316e+00, -2.4839e+00, -6.6115e-01, -2.5032e-01, -1.7578e+00, -3.0309e+00]], [[-9.2614e-01, -1.5283e+00, -2.2863e+00, -2.4286e+00, -4.0735e+00, -1.7739e+00, -1.0333e+00, -1.2234e+00, -2.7723e+00]], [[ 2.2770e+00, -2.0505e+00, -3.2420e+00, -2.8005e+00, -2.2012e+00, -1.5385e+00, -1.1864e+00, -1.7998e+00, -3.6404e+00]], [[ 1.6725e+00, -2.1006e+00, -2.1631e+00, -2.6556e+00, -2.2007e+00, -1.2045e+00, -1.1311e+00, -1.8453e+00, -1.6790e+00]], [[ 2.6468e+00, -3.3659e+00, -3.0659e+00, -3.5696e+00, -2.8824e+00, 4.1841e-02, 7.3195e-02, -2.9346e+00, -2.9305e+00]], [[-6.2596e-02, -3.4142e+00, -3.5329e+00, -3.5181e+00, -2.6382e+00, -2.2370e+00, -2.0576e+00, -2.6982e+00, -3.2183e+00]], [[ 1.5156e+00, -2.6768e+00, -3.0365e+00, -2.3420e+00, -2.6901e+00, -2.3272e-01, -3.5158e-01, -2.4866e+00, -3.2210e+00]], [[ 3.0064e+00, -2.7747e+00, -2.2014e+00, -2.5600e+00, -2.0796e+00, 4.8959e-01, 3.6926e-01, -2.7484e+00, -2.7858e+00]], [[ 9.8150e-01, -2.7967e+00, -2.7784e+00, -2.3500e+00, -2.5564e+00, -2.2398e+00, -1.5537e+00, -1.1848e+00, -1.2409e+00]], [[ 3.5867e+00, -1.0341e+00, -1.2726e+00, -4.3469e-01, -3.6790e-01, -1.3626e+00, -1.6794e+00, -2.5426e+00, -6.1915e-01]]], [[[ 1.5413e+00, -1.1212e+00, -1.7515e+00, -2.6665e+00, -3.2706e+00, -2.7514e-01, 3.1950e-01, -1.3330e+00, -2.6580e+00]], [[ 3.4172e+00, -9.7469e-01, -1.8446e+00, -1.4895e+00, -1.3226e+00, -2.6842e+00, -2.3936e+00, -2.0904e+00, -5.1317e-01]], [[ 1.1227e+00, -2.3000e+00, -2.2714e+00, -2.6411e+00, -2.1116e+00, -2.1769e+00, -9.3204e-01, -1.4408e+00, -2.6770e+00]], [[-6.2742e-01, -7.5964e-01, -1.9197e+00, -2.7966e+00, -4.3410e+00, -2.4631e+00, -1.8922e+00, -1.3330e+00, -1.8480e+00]], [[ 2.2444e+00, -1.1893e+00, -2.5231e+00, -2.5880e+00, -1.7478e+00, -2.7907e+00, -1.9120e+00, -1.6525e+00, -2.3827e+00]], [[ 1.7486e+00, -1.1797e+00, -1.9291e+00, -2.9678e+00, -3.0043e+00, -1.4842e+00, -1.9576e+00, -1.8746e+00, -1.4900e+00]], [[ 2.4292e+00, -3.1800e+00, -3.1837e+00, -3.3978e+00, -2.9444e+00, -1.6431e+00, -1.3428e+00, -3.0559e+00, -3.1254e+00]], [[-5.0047e-03, -3.4464e+00, -3.5396e+00, -3.4487e+00, -3.0289e+00, -3.2840e+00, -2.6407e+00, -2.6319e+00, -2.5208e+00]], [[ 1.7913e+00, -2.5689e+00, -2.8038e+00, -2.2709e+00, -2.7442e+00, -6.7523e-01, -8.2896e-01, -2.3580e+00, -3.0129e+00]], [[ 3.0909e+00, -3.1351e+00, -3.0185e+00, -2.8042e+00, -2.7402e+00, -6.9505e-01, -6.9947e-01, -3.3767e+00, -2.8440e+00]], [[ 9.9941e-01, -3.1156e+00, -3.6808e+00, -3.2444e+00, -3.0205e+00, -2.6044e+00, -1.7368e+00, -1.9143e+00, -1.4379e+00]], [[ 3.7248e+00, -1.5423e-01, -5.3461e-01, -8.0421e-01, -2.2718e-01, -1.8683e+00, -2.2392e+00, -2.1137e+00, -8.7645e-01]]], [[[ 2.2509e+00, -3.3698e+00, -2.6284e+00, -1.9152e+00, -2.6643e+00, 2.1212e+00, 2.2259e+00, -1.8316e+00, -1.5606e+00]], [[ 2.7110e+00, -2.8297e+00, -2.9154e+00, -2.2770e+00, -1.6502e+00, 1.8251e-01, -3.1192e-01, -2.6890e+00, -1.0641e+00]], [[ 1.5182e+00, -4.1259e+00, -3.5729e+00, -3.5012e+00, -3.5045e+00, 8.6509e-01, 7.3312e-01, -2.3158e+00, -2.7696e+00]], [[-1.2235e+00, -3.4417e+00, -3.6690e+00, -2.7904e+00, -3.5804e+00, -1.9807e+00, -1.3745e+00, -1.3500e+00, -1.9154e+00]], [[ 3.6003e+00, -2.3797e+00, -3.5703e+00, -3.8975e+00, -3.8059e+00, -1.1862e-01, 1.5308e+00, -1.6871e+00, -2.1442e+00]], [[ 1.9191e+00, -3.7311e+00, -3.9686e+00, -3.4332e+00, -2.9130e+00, -2.0126e-01, -4.7386e-01, -2.1612e+00, -5.1511e-01]], [[ 4.1200e+00, -3.6728e+00, -4.4462e+00, -3.7692e+00, -3.7873e+00, 2.2276e+00, 2.2421e+00, -2.3575e+00, -1.6549e+00]], [[ 6.8426e-01, -4.6911e+00, -4.8241e+00, -5.7386e+00, -4.2120e+00, -1.8429e+00, -2.6979e+00, -4.3277e+00, -4.0493e+00]], [[ 1.4757e+00, -2.8791e+00, -3.1291e+00, -2.1083e+00, -2.5805e+00, 1.8713e-01, 1.4372e-01, -1.8218e+00, -1.9574e+00]], [[ 4.7441e+00, -2.2057e+00, -2.6796e+00, -2.4173e+00, -2.3670e+00, 2.2378e+00, 2.6498e+00, -1.1854e+00, -3.4518e-01]], [[ 3.8838e-01, -3.8777e+00, -4.1108e+00, -3.6828e+00, -3.2965e+00, -2.2465e+00, -2.2235e+00, -1.9748e+00, -2.3227e+00]], [[ 3.6665e+00, -1.2984e+00, -2.4768e+00, -1.0079e+00, -1.6114e+00, -9.4178e-01, -7.1754e-01, -2.5414e+00, -7.8398e-01]]], [[[ 2.1544e+00, -1.9412e+00, -1.3333e+00, -1.2653e+00, -1.6592e+00, 1.3437e+00, 1.1284e+00, -1.3294e+00, -2.5165e+00]], [[ 3.6772e+00, -2.3650e+00, -3.2125e+00, -3.4486e+00, -1.4459e+00, -1.0369e+00, -1.3780e+00, -3.9256e+00, -6.6341e-01]], [[ 1.2549e+00, -3.2539e+00, -2.3752e+00, -2.4083e+00, -1.7335e+00, 5.8259e-01, -1.6348e-01, -1.8157e+00, -1.7632e+00]], [[-1.2280e+00, -3.2680e+00, -4.6336e+00, -3.3788e+00, -3.2108e+00, -1.6214e+00, -2.0165e+00, -2.3229e+00, -3.9430e+00]], [[ 3.3098e+00, -2.3809e+00, -2.3395e+00, -2.4259e+00, -1.7177e+00, -3.0992e-01, 1.1795e+00, -1.7163e-01, -6.1551e-01]], [[ 1.7928e+00, -3.6452e+00, -3.5605e+00, -3.0901e+00, -1.8229e+00, -1.7549e+00, -1.2627e+00, -2.4648e+00, -8.9420e-02]], [[ 4.1271e+00, -2.4648e+00, -2.9315e+00, -3.1965e+00, -2.5868e+00, 1.3073e+00, 7.1244e-01, -1.8547e+00, -1.7976e+00]], [[ 3.2874e-01, -4.2532e+00, -3.1938e+00, -3.9794e+00, -3.0123e+00, 3.7858e-01, -4.5263e-01, -2.6490e+00, -4.3102e+00]], [[ 1.7646e+00, -2.3877e+00, -3.1897e+00, -2.6551e+00, -3.0146e+00, 2.6366e-01, -1.1005e-01, -2.0542e+00, -3.9210e+00]], [[ 5.0589e+00, -1.4219e+00, -1.0566e+00, -2.1294e+00, -4.5343e-01, 2.0565e+00, 1.2188e+00, -1.3510e+00, 5.8406e-01]], [[ 8.9410e-01, -5.0714e+00, -4.8692e+00, -3.7486e+00, -2.1837e+00, -2.7231e+00, -2.1448e+00, -3.0218e+00, -1.8002e+00]], [[ 3.6557e+00, -1.0638e+00, -2.4382e+00, -1.5424e+00, -2.2071e-02, -1.2048e+00, -1.2950e+00, -2.1992e+00, -2.4920e+00]]]]) attn_weights tensor([[[[ 2.4591, -3.9407, -4.0866, -2.9030, -3.3275, 0.1968, -0.1260, -2.7867, -3.9264]], [[ 3.3396, -2.1110, -1.5385, 1.8440, -1.3518, -1.1861, -0.2830, -0.9712, -0.9351]], [[ 3.2349, -2.0940, -2.2503, -1.2544, -1.3635, -1.9966, -0.3090, -1.7690, -1.2567]], [[ 2.9578, -1.2497, -2.8031, -1.4982, -1.3452, 0.4302, 0.4614, -1.2481, -2.1508]], [[ 2.0243, -1.2168, -1.9231, -1.2584, -0.6591, -0.4596, 0.7290, -0.3082, -0.9023]], [[ 0.9828, -1.5897, -2.7590, -3.0170, -2.6706, -1.8833, -2.3858, -1.2399, -2.0042]], [[ 3.0232, -3.6146, -4.0098, -2.2752, -2.3485, -0.7911, 0.8892, -2.8973, -3.1995]], [[ 2.6579, -1.6523, -1.1074, -0.8351, -1.1630, -1.5624, -0.7551, -0.4666, -0.9076]], [[ 3.3548, -1.2854, -2.6593, -0.5440, -1.0429, -2.1263, -2.1554, -2.3187, -2.2949]], [[ 1.3427, -4.1395, -3.3396, -2.8007, -2.8373, -2.0832, -2.4015, -3.0779, -2.8716]], [[ 3.2651, -2.5602, -2.4092, -0.9566, -2.4959, -1.2116, -0.6371, -2.2538, -1.8665]], [[ 4.6153, -0.8377, -0.2907, -1.8732, -2.5216, -0.3691, 0.8535, 1.1023, 0.4067]]], [[[ 1.9893, -2.7727, -3.4372, -3.1696, -2.9160, 1.7620, 0.2956, -2.4268, -2.8246]], [[ 2.8590, -2.0735, -2.7127, -2.0914, -2.2919, 0.6900, -0.3098, -1.8595, -1.9209]], [[ 2.4738, -1.4029, -1.1441, -2.6489, -2.0174, -0.2368, -0.1074, -1.5253, -1.3785]], [[ 2.2995, -0.5843, -2.1824, -2.0585, -2.2813, 1.2075, -0.8785, -1.0993, -1.2992]], [[ 2.1586, -0.3295, -1.7994, -1.6974, -0.7256, 0.6263, 1.0440, 0.1688, -0.4341]], [[ 1.4229, -1.5306, -1.5104, -2.4009, -3.1501, -2.0991, -2.6916, -1.4656, -1.7168]], [[ 2.4690, -3.2315, -3.4483, -2.9719, -3.4117, 0.2289, -0.1270, -2.8515, -3.0187]], [[ 1.6859, -1.5615, -1.4666, -2.4824, -1.7586, 0.7248, -0.5509, -0.5350, -0.6792]], [[ 2.9149, -2.0015, -2.2519, -2.6025, -0.9620, -2.6051, -3.4829, -2.8010, -0.7855]], [[ 0.5955, -2.0433, -0.9618, -0.9672, -1.2127, -1.5443, -1.0542, 0.0940, -1.3090]], [[ 2.9419, -2.6286, -1.4272, -2.0272, -2.4521, 0.3266, -0.5122, -2.9280, -2.7678]], [[ 2.1476, -0.7563, -1.1925, -2.7537, -2.2529, 2.2337, 1.9015, 0.8896, -0.1360]]], [[[ 2.0405, -3.1744, -3.7376, -3.7368, -3.5964, 1.0927, -0.4080, -3.1430, -3.6333]], [[ 3.1054, -2.0964, -2.7350, -2.4952, -2.8929, -0.2075, -1.5641, -2.3701, -1.6286]], [[ 2.2425, -1.1978, -0.8898, -2.3123, -2.0424, -1.2645, -1.3538, -2.1818, -1.5154]], [[ 2.2187, 0.0058, -1.9648, -1.9841, -2.3288, 0.5035, -1.3993, -0.9060, -1.3809]], [[ 2.0236, -0.2000, -1.4171, -1.0472, -1.0734, -0.1744, -0.0175, -0.1055, -0.7762]], [[ 1.4082, -1.0381, -1.9757, -2.3279, -3.3752, -2.6155, -2.8892, -1.7999, -1.1279]], [[ 2.5522, -3.0449, -3.4136, -2.9037, -3.5091, -0.3417, -0.8181, -3.1293, -3.1680]], [[ 1.7748, -1.4164, -1.2598, -2.4132, -1.7638, -1.2445, -1.9201, -0.7330, -0.4160]], [[ 3.0613, -0.8264, -1.7077, -2.4243, -1.8620, -3.3946, -4.3174, -2.9357, -1.4013]], [[ 0.5759, -2.1430, -0.7099, -1.2542, -1.2212, -1.8959, -1.0482, -0.3302, -1.2825]], [[ 2.8258, -2.6699, -1.1859, -1.7007, -2.5658, -0.4698, -0.8960, -2.8226, -2.5741]], [[ 2.3624, -0.6078, -1.1225, -3.1710, -3.1104, 0.9753, 0.3488, 0.4222, 0.2000]]], [[[ 2.5446, -2.4670, -3.3039, -2.6659, -2.8442, 1.8084, 0.8019, -2.1292, -1.9321]], [[ 3.6572, -1.8472, -3.3466, -1.9036, -1.8240, 1.7269, 1.0380, -1.0802, 0.4971]], [[ 3.7471, -2.0067, -3.0260, -3.1967, -2.8032, 1.5165, 1.4521, -2.0134, -0.9129]], [[ 2.6523, -1.5163, -3.5936, -2.6408, -2.6262, 1.8988, 0.7501, -1.5962, -0.7414]], [[ 1.9757, -1.6721, -2.1641, -1.8745, -1.1207, 1.5774, 1.4991, -0.9959, 0.0832]], [[ 1.8801, -3.3738, -4.1836, -4.6160, -4.5676, -1.7759, -2.9804, -2.5597, -3.6829]], [[ 3.0209, -2.9154, -3.6806, -2.6848, -2.8768, 1.1142, 0.7454, -2.4939, -1.7540]], [[ 1.5761, -2.5170, -2.8860, -3.3192, -1.9301, 3.4325, 1.2928, -0.4789, -0.5457]], [[ 3.5117, -0.6868, -2.4299, -1.9654, -2.5362, 0.2103, -0.3112, -1.3437, -0.8974]], [[ 1.0469, -3.7628, -4.5340, -3.1522, -2.5049, -1.6795, -2.3078, -2.0496, -2.0644]], [[ 3.5520, -1.7381, -2.7136, -2.3723, -2.2645, 1.7070, 0.7762, -1.2479, -0.2242]], [[ 3.3769, -0.0733, -0.1156, -0.3958, -0.4638, 4.7653, 5.2202, 2.6203, 2.4421]]], [[[ 2.7429, -1.6856, -2.1544, -2.2939, -1.8982, 2.8835, 1.4955, -1.1263, -1.2621]], [[ 4.0729, -1.5960, -3.1510, -2.2901, -1.3416, 1.9843, 0.4015, -0.5786, 1.5815]], [[ 3.3991, -0.9231, -2.0140, -3.4961, -1.8049, 0.6169, 0.6399, -1.2007, -1.6382]], [[ 2.9408, -1.7198, -2.2909, -2.4176, -1.5890, 1.2150, -0.2180, -0.6450, -1.2955]], [[ 2.4805, -0.8716, -1.2972, -1.9756, -1.6732, 0.5458, -0.1085, -1.2572, -0.7833]], [[ 1.8341, -3.1246, -3.4632, -3.3897, -3.6888, -3.0529, -3.7079, -3.0360, -2.3876]], [[ 3.3471, -2.1570, -2.8255, -2.5023, -1.8501, 1.3147, 0.3763, -1.4105, -1.5068]], [[ 1.1374, -2.6592, -2.3348, -3.2779, -1.8685, 2.2650, -0.3101, -0.8197, -1.7596]], [[ 3.3936, -1.9887, -2.5434, -3.3036, -0.5628, -1.0572, -1.6255, -1.8925, 0.1168]], [[ 0.1488, -3.6615, -3.9110, -2.4789, -1.8565, -1.5938, -1.3689, -1.5000, -2.6853]], [[ 3.7721, -1.8900, -1.3863, -1.7583, -0.9652, 1.2505, 0.0781, -1.1892, -0.8971]], [[ 3.2646, -0.8006, 0.2218, -0.2277, 1.2460, 3.4178, 3.4993, 2.4975, 2.0147]]]]) attn_weights tensor([[[[ 1.5866, 0.5327, -0.1381, 0.4010, 0.8136, 0.7047, 0.8231, 0.4033, -0.3409]], [[ 4.0471, -1.3284, -1.3137, -0.4354, -1.0694, -1.9550, -0.6527, -1.0563, -1.6661]], [[ 3.6110, -1.5611, -2.0099, -1.5413, -2.0228, -0.9218, -0.4709, -1.4886, -1.7940]], [[ 1.2439, -1.5028, -1.1534, -1.6701, -1.5944, 0.4814, -0.0673, 0.1607, -0.7992]], [[ 2.0948, -1.0047, -1.5983, -0.6079, -1.3587, -1.9923, -1.9962, -0.8723, -1.3616]], [[ 4.3082, 0.2359, 0.7417, 1.2587, 0.6224, -0.3812, 1.9006, 1.0917, 1.1368]], [[ 3.5225, -2.1724, -1.9257, -1.9578, -2.4854, -1.2815, -1.2457, -2.4684, -2.4978]], [[ 5.1837, -0.8287, -1.9109, -2.5489, -1.0456, 0.5372, 0.0979, -1.5789, -2.3019]], [[-3.3324, 4.6790, 5.9045, 4.6711, 4.4403, 4.3920, 4.3486, 4.6935, 5.6862]], [[ 4.3109, -0.4583, -0.9707, -0.6911, -0.7533, -1.0226, 0.7171, 0.5876, -0.2695]], [[ 3.4735, 0.2081, 1.8180, 1.2698, 0.3167, -0.0848, 0.7873, 1.4299, 2.0600]], [[ 2.8276, -0.8487, 0.4630, -0.6201, -1.3425, 1.5627, 1.6460, 0.4087, 0.9565]]], [[[ 1.5376, 1.0801, 0.8824, 0.8337, 1.0263, 0.9966, 0.4967, 0.7711, 1.7527]], [[ 3.2977, -0.4306, -1.2726, -0.8513, -0.0623, 0.0369, 0.0784, 0.2572, 0.2294]], [[ 2.7829, -0.4102, -1.7792, -2.3833, -1.8490, 0.4982, -0.0746, -0.2854, -0.6354]], [[ 1.1019, -0.3766, -1.9384, -1.8190, -0.7196, 0.8480, 0.8623, 0.1010, -0.4502]], [[ 2.1715, -0.4426, -0.1247, -0.4458, -0.4832, -0.9518, -1.9876, -0.1537, 0.4406]], [[ 3.5632, 0.5853, 1.3769, 0.0084, -0.9069, 1.2019, 2.8170, 1.1388, 0.9241]], [[ 3.0777, -1.5113, -2.0275, -1.9432, -1.8138, -0.2345, -1.4288, -1.8314, -1.8338]], [[ 3.2660, 1.1518, -1.0751, 0.1704, 0.8565, 2.5286, 0.7834, 1.4977, 1.3237]], [[-3.7308, 5.5210, 5.2974, 4.9377, 4.2808, 4.4481, 4.2614, 5.4370, 5.1675]], [[ 3.4174, -1.0683, -1.8813, -2.1227, -1.8971, 0.3339, 0.1733, -0.9005, -0.5857]], [[ 2.6380, 0.6521, 0.8439, 0.0891, -0.2819, 2.3659, 1.2342, 1.4707, 1.6770]], [[ 2.6322, 0.3075, -0.9373, -0.4653, -0.7311, 1.5477, 0.9155, 0.4130, 0.3883]]], [[[ 1.2427, 1.9151, 1.2425, 1.3682, 1.6163, 0.6332, 0.7533, 1.4198, 2.1484]], [[ 2.8678, -0.1861, -0.9491, -0.4343, -0.5404, -0.3454, -0.2612, 0.0554, -0.2993]], [[ 2.5031, -0.3157, -1.9791, -2.6050, -2.3635, 0.1491, -0.5042, -0.4441, -1.1854]], [[ 0.8167, -0.5076, -1.7609, -1.8612, -1.2666, 0.4885, 0.6466, 0.0428, -0.4823]], [[ 1.7752, -0.4550, -0.0595, -0.5427, -0.6279, -1.7192, -2.3954, -0.0976, 0.0343]], [[ 3.2921, 1.2718, 1.1444, 0.1894, -0.7706, 0.8560, 1.7317, 1.0522, 1.1400]], [[ 2.8263, -1.8130, -2.0857, -2.2720, -2.1499, -0.8743, -1.8265, -2.3572, -1.9632]], [[ 3.0197, 1.1860, -0.8535, 0.5137, 0.6577, 1.8363, 0.4648, 1.5735, 1.3188]], [[-3.3546, 5.3202, 5.2422, 4.5078, 4.1343, 4.1133, 4.1006, 5.5822, 4.5868]], [[ 3.1340, -0.9154, -1.7828, -2.3762, -2.3804, -0.5897, -0.7852, -1.2678, -0.7582]], [[ 2.7571, 1.1517, 0.7746, -0.0902, -0.5699, 1.1513, -0.1414, 1.2770, 1.5830]], [[ 2.0077, 0.0890, -0.6681, -0.4003, -1.2170, 1.1300, 0.4751, 0.5025, 0.4771]]], [[[ 1.7835, 0.5759, -0.8245, -0.0419, 1.0932, 1.4547, 0.3824, 0.6766, 0.9898]], [[ 3.6261, -0.4172, -1.1939, -1.1117, 0.5403, 0.5427, 0.8379, 0.4523, 0.8496]], [[ 3.2125, -0.9819, -1.5262, -1.5209, -1.1729, 0.8702, 0.8893, -0.2386, -0.0522]], [[ 1.2487, -0.8735, -1.8254, -1.8666, -0.6918, 0.0451, 0.2637, 0.1331, -0.8658]], [[ 2.4138, -0.7416, -1.4197, -1.2718, -0.8433, -0.3554, -1.4428, -0.8422, -0.3006]], [[ 4.0105, -0.6053, -1.1102, -1.0719, -1.3093, 2.2817, 3.4471, -0.4680, 0.1148]], [[ 3.4533, -1.5858, -2.4874, -2.2337, -1.4147, 0.0845, -0.4262, -0.9930, -0.8094]], [[ 3.7573, -0.2690, -0.9303, -1.5330, 0.1067, 2.3542, 0.9608, 0.1474, 1.1608]], [[-3.6325, 1.8436, 2.2364, 2.0905, 2.3133, 2.5605, 1.6914, 1.8923, 2.5038]], [[ 3.9527, -1.0897, -2.3324, -2.3887, -1.9605, 1.6945, 1.4592, -0.9183, -0.8286]], [[ 2.6870, -0.4358, -1.3203, -0.8758, -0.0355, 3.2874, 2.5865, 1.4475, 1.3553]], [[ 2.9938, -0.1495, -1.7097, -1.2618, -0.0526, 1.7002, 0.7739, 0.6416, 0.3999]]], [[[ 1.4435, 0.7275, -0.0459, -0.0172, 0.5940, 1.0285, 0.8967, 0.7350, 0.8947]], [[ 3.6912, -0.6848, -0.8568, -1.1294, 0.4298, -0.2517, 0.3064, 0.3560, 0.1674]], [[ 3.2108, -0.5724, -1.6821, -1.7872, -1.2194, 0.2105, 0.5964, -0.3803, -0.9228]], [[ 0.9754, -0.3849, -1.6936, -1.1554, 0.5264, 0.4744, 0.0143, -0.2662, -2.3778]], [[ 2.1179, -1.2373, -1.3978, -1.6709, -0.5474, -0.6400, -1.7085, -0.9272, -1.1248]], [[ 4.2278, -0.1721, 0.0508, -1.2453, -0.2903, 1.9365, 2.9288, 0.7131, 1.5187]], [[ 3.4630, -1.5979, -2.0844, -1.7215, -1.0949, -0.1936, -0.6069, -1.0631, -1.3696]], [[ 4.0607, 0.6609, -0.7502, -1.0890, 0.2467, 1.6482, 0.2790, 0.6985, 0.5666]], [[-4.8185, 3.1245, 3.7469, 3.4138, 3.2919, 3.4911, 2.4585, 3.0433, 3.4442]], [[ 4.3870, -1.5788, -2.0257, -2.6495, -1.6737, 1.1863, 0.7406, -0.7312, 0.5865]], [[ 2.5692, -0.7943, -1.0320, -0.8558, -0.1786, 1.9523, 1.1097, 0.9941, 1.2748]], [[ 2.7097, 0.4973, -1.4880, -0.3053, 0.8954, 1.4238, 1.0451, 1.3223, -0.6501]]]]) attn_weights tensor([[[[ 1.3223e-01, -1.3066e+00, -6.5525e-01, -9.8950e-01, -1.7088e+00, -1.8769e+00, -1.9034e+00, -1.4442e+00, -5.4331e-01, -9.0032e-01]], [[ 2.8544e+00, 3.1763e+00, 3.2770e+00, 9.6656e+00, 1.9641e+00, 3.4051e+00, 1.0931e+00, 1.8129e+00, 2.3296e+00, 9.3874e+00]], [[-9.9929e-01, -1.9513e+00, -1.3785e+00, -1.5243e+00, -2.0776e+00, -2.3043e+00, -2.4831e+00, -2.4093e+00, -1.5672e+00, -1.6826e+00]], [[-7.6734e-01, -3.9325e+00, 8.3902e-01, 9.4932e-01, -2.3792e+00, -1.4916e+00, -3.5628e+00, -6.0685e-01, 5.2167e+00, 5.1652e+00]], [[-7.9949e-01, -2.4999e+00, -2.3660e+00, -4.4876e-01, -1.7697e+00, -2.1249e+00, -7.6837e-01, -1.0125e+00, -4.9974e-01, 1.6247e+00]], [[ 7.5872e+00, 1.9975e+00, 5.4857e+00, 1.1109e+01, 1.4531e+00, 1.7433e+00, 2.1101e+00, -6.6111e-01, 4.2159e+00, 1.0602e+01]], [[-8.7340e-02, -2.1182e+00, -3.0462e+00, -1.6108e+00, -2.2519e+00, -1.1853e+00, -1.1621e+00, -2.4215e+00, -3.1473e+00, -1.5194e+00]], [[-5.1438e+00, -5.8607e+00, -5.3890e+00, -6.0763e+00, -4.9726e+00, -6.4725e+00, -5.5330e+00, -3.5591e+00, -2.5523e+00, -3.4927e+00]], [[-1.5232e+00, -1.1149e+00, -1.6270e+00, -2.3350e+00, -1.4427e+00, -3.1417e+00, -2.9858e+00, -1.0328e+00, -1.5392e+00, -2.2698e+00]], [[-1.6539e+00, -1.9317e+00, -2.1701e+00, -2.7670e+00, -2.2767e+00, -2.4829e+00, -2.7036e+00, -2.0933e+00, -2.2356e+00, -2.7811e+00]], [[ 1.5150e+00, 1.2463e+00, 1.8818e+00, 1.9409e+00, 7.8715e-01, 1.1792e-02, -1.1000e-01, 7.5780e-01, 1.5142e+00, 1.6460e+00]], [[-1.2317e+00, -1.8459e+00, -3.4657e+00, -1.8812e+00, -2.0752e+00, -2.3689e+00, -2.2055e+00, -1.8256e+00, -3.5991e+00, -1.8298e+00]]], [[[-1.1271e-01, -2.2372e+00, -1.5871e+00, -1.6264e+00, -3.0445e+00, -1.9477e+00, -1.7383e+00, -2.4865e+00, -2.4499e+00, -1.5168e+00]], [[ 2.5218e+00, 2.2823e+00, 7.0753e+00, 9.3104e-01, 6.7244e-01, 2.7222e-01, -2.1874e+00, 1.4988e+00, 8.4253e-01, 6.8940e+00]], [[-1.1160e+00, -1.7058e+00, -1.7414e+00, -1.3160e+00, -2.4905e+00, -2.1961e+00, -2.6214e+00, -1.9980e+00, -1.6517e+00, -1.9402e+00]], [[-2.8405e+00, -5.1153e+00, -2.1787e+00, -1.3739e+00, -3.4321e+00, -3.4516e+00, -2.7425e+00, -1.1458e+00, -4.9725e-01, 3.4890e+00]], [[-1.1071e-01, -2.3776e+00, -1.9755e+00, -3.8656e-01, -1.9210e+00, -1.5482e+00, -1.0579e+00, -9.1656e-01, -5.7987e-02, 2.5108e-01]], [[ 6.3933e+00, 4.2133e+00, 1.0186e+01, 4.7555e+00, 1.9223e+00, 2.8054e+00, -2.0971e-01, 2.3561e+00, 1.1214e+00, 9.4507e+00]], [[ 1.8842e-01, -3.5118e+00, -3.2276e+00, -1.2735e+00, -3.3941e+00, -6.5614e-01, -7.5053e-01, -4.0453e+00, -4.2367e+00, -3.3447e+00]], [[-4.8214e+00, -6.0586e+00, -6.5438e+00, -5.5440e+00, -5.2722e+00, -5.9762e+00, -4.5924e+00, -3.9248e+00, -3.3077e+00, -3.5467e+00]], [[-2.9352e+00, -1.7316e+00, -2.7088e+00, -3.1778e+00, -1.2832e+00, -3.0082e+00, -3.0857e+00, -1.2367e+00, -1.2235e+00, -2.3558e+00]], [[-1.3707e+00, -1.6162e+00, -1.9432e+00, -2.3725e+00, -1.9223e+00, -2.3895e+00, -2.4602e+00, -1.7768e+00, -1.6767e+00, -2.0397e+00]], [[ 1.9833e+00, 1.4021e+00, 2.7162e+00, 1.3303e+00, 9.4369e-01, 2.4497e-01, -4.6179e-02, 8.1838e-01, 8.3666e-01, 2.3292e+00]], [[-1.7715e+00, -2.4005e+00, -3.8147e+00, -2.6363e+00, -2.7541e+00, -2.5427e+00, -2.1868e+00, -2.1978e+00, -2.2796e+00, -3.8087e+00]]], [[[-1.1271e-01, -2.2372e+00, -1.5871e+00, -1.6264e+00, -3.0445e+00, -1.9477e+00, -1.7383e+00, -2.4865e+00, -1.2599e+00, -1.5168e+00]], [[ 2.5218e+00, 2.2823e+00, 7.0753e+00, 9.3104e-01, 6.7244e-01, 2.7222e-01, -2.1874e+00, 1.4988e+00, 1.2396e+00, 6.8940e+00]], [[-1.1160e+00, -1.7058e+00, -1.7414e+00, -1.3160e+00, -2.4905e+00, -2.1961e+00, -2.6214e+00, -1.9980e+00, -2.2193e+00, -1.9402e+00]], [[-2.8405e+00, -5.1153e+00, -2.1787e+00, -1.3739e+00, -3.4321e+00, -3.4516e+00, -2.7425e+00, -1.1458e+00, 2.4468e-01, 3.4890e+00]], [[-1.1071e-01, -2.3776e+00, -1.9755e+00, -3.8656e-01, -1.9210e+00, -1.5482e+00, -1.0579e+00, -9.1656e-01, 8.0910e-02, 2.5108e-01]], [[ 6.3933e+00, 4.2133e+00, 1.0186e+01, 4.7555e+00, 1.9223e+00, 2.8054e+00, -2.0971e-01, 2.3561e+00, 3.1647e+00, 9.4507e+00]], [[ 1.8842e-01, -3.5118e+00, -3.2276e+00, -1.2735e+00, -3.3941e+00, -6.5614e-01, -7.5053e-01, -4.0453e+00, -2.7018e+00, -3.3447e+00]], [[-4.8214e+00, -6.0586e+00, -6.5438e+00, -5.5440e+00, -5.2722e+00, -5.9762e+00, -4.5924e+00, -3.9248e+00, -3.5454e+00, -3.5467e+00]], [[-2.9352e+00, -1.7316e+00, -2.7088e+00, -3.1778e+00, -1.2832e+00, -3.0082e+00, -3.0857e+00, -1.2367e+00, -2.7504e+00, -2.3558e+00]], [[-1.3707e+00, -1.6162e+00, -1.9432e+00, -2.3725e+00, -1.9223e+00, -2.3895e+00, -2.4602e+00, -1.7768e+00, -1.8302e+00, -2.0397e+00]], [[ 1.9833e+00, 1.4021e+00, 2.7162e+00, 1.3303e+00, 9.4369e-01, 2.4497e-01, -4.6179e-02, 8.1838e-01, 1.0966e+00, 2.3292e+00]], [[-1.7715e+00, -2.4005e+00, -3.8147e+00, -2.6363e+00, -2.7541e+00, -2.5427e+00, -2.1868e+00, -2.1978e+00, -2.2247e+00, -3.8087e+00]]], [[[ 4.4311e-01, -5.4062e-01, -6.0528e-01, -1.1238e+00, -5.7384e-01, -4.9784e-02, 3.5463e-01, -9.3044e-01, -6.3975e-01, 3.1196e-01]], [[ 2.0355e+00, 2.3553e+00, 2.9903e+00, 3.7092e+00, 3.7854e+00, 3.6698e+00, 4.5867e+00, 7.7820e-01, 3.3784e+00, 1.2446e+01]], [[-1.1225e+00, -1.8671e+00, -1.7681e+00, -2.1873e+00, -1.6276e+00, -3.4498e-01, -1.9174e+00, -2.1164e+00, -1.6813e+00, -2.1390e+00]], [[-8.6761e-01, -6.4282e+00, -4.7132e+00, -3.8976e+00, -4.4826e+00, -3.3765e+00, -2.7032e+00, -3.4920e+00, -1.8470e+00, 4.6033e+00]], [[ 3.4024e-01, -2.5907e+00, -2.8681e+00, -1.2896e+00, -1.7515e+00, -1.2541e+00, -4.3416e-01, -1.4361e+00, -5.7441e-01, 3.8002e+00]], [[ 7.9561e+00, 9.8314e-01, 2.3448e+00, 2.7211e+00, 3.6357e-01, 9.8731e-01, 4.2520e+00, -1.7477e+00, -4.1623e-01, 1.3293e+01]], [[ 6.7716e-01, -1.1676e+00, -2.0089e+00, -1.4133e+00, -1.4349e+00, 2.1297e-01, -1.6873e-01, -1.6273e+00, -1.5444e+00, -8.5542e-02]], [[-3.5169e+00, -4.0782e+00, -3.7960e+00, -3.9471e+00, -3.0160e+00, -2.9976e+00, -2.9997e+00, -1.8754e+00, -1.4743e+00, -3.6198e+00]], [[-1.4081e+00, -2.0684e+00, -2.2915e+00, -2.9323e+00, -2.0036e+00, -1.8782e+00, -7.9468e-01, -2.2248e+00, -1.9592e+00, -2.2792e+00]], [[-1.7195e+00, -1.8962e+00, -2.1745e+00, -2.4662e+00, -2.0839e+00, -2.4684e+00, -2.4491e+00, -2.0864e+00, -2.0938e+00, -3.6328e+00]], [[ 1.0893e+00, 1.0602e+00, 1.0113e+00, 5.4586e-01, 1.0177e+00, 2.5291e-01, 5.1708e-01, 6.4932e-01, 7.9642e-01, 2.0031e+00]], [[-1.7297e+00, -1.9891e+00, -2.8888e+00, -2.5611e+00, -2.7882e+00, -2.5766e+00, -2.0672e+00, -2.0813e+00, -2.7797e+00, -2.3902e+00]]], [[[-7.1924e-01, -2.5991e+00, -1.7832e+00, -1.4832e+00, -3.0342e+00, -2.2948e+00, -2.2146e+00, -2.6908e+00, -2.3678e+00, -2.7854e+00]], [[-4.1931e-01, 1.5890e-01, -5.7845e-02, -5.8459e-01, 5.6286e+00, -1.9110e+00, -1.8148e+00, -1.0529e+00, 1.4082e+00, 7.8331e+00]], [[-1.5854e+00, -1.9755e+00, -2.2528e+00, -2.2206e+00, -2.7952e+00, -2.6276e+00, -2.8005e+00, -2.1782e+00, -2.4483e+00, -2.9912e+00]], [[-2.3735e+00, -4.8670e+00, -4.5868e+00, -4.3893e+00, -2.2617e+00, -3.7763e+00, -2.4544e+00, -1.3911e+00, 9.6583e-02, 2.3918e+00]], [[-7.8927e-01, -2.4232e+00, -2.5316e+00, -1.5519e+00, -1.4980e+00, -1.0707e+00, -4.0759e-01, -8.7056e-01, 1.7405e-01, 9.7651e-01]], [[ 3.0348e+00, 3.0722e+00, 2.2675e+00, 2.5190e+00, 5.4407e+00, 6.7007e-01, 1.5333e+00, 1.7766e+00, 2.5832e+00, 7.9278e+00]], [[-4.0647e-01, -3.6402e+00, -2.8942e+00, -1.5351e+00, -3.6453e+00, -1.1266e+00, -9.9714e-01, -4.0071e+00, -2.2961e+00, -3.0727e+00]], [[-5.3108e+00, -6.2318e+00, -5.8128e+00, -5.9555e+00, -5.4806e+00, -5.5096e+00, -4.8642e+00, -3.8368e+00, -3.1050e+00, -3.3003e+00]], [[-2.9872e+00, -1.7032e+00, -2.6062e+00, -2.7833e+00, -7.7039e-01, -3.2802e+00, -2.5874e+00, -9.8196e-01, -2.1329e+00, -8.3875e-01]], [[-1.3899e+00, -1.5201e+00, -1.5803e+00, -2.2217e+00, -1.6706e+00, -2.2608e+00, -2.3988e+00, -1.6517e+00, -1.9185e+00, -1.8165e+00]], [[ 1.1889e+00, 1.2476e+00, 1.0104e+00, 3.2072e-01, 1.7288e+00, -4.0189e-01, 1.4818e-02, 8.1478e-01, 6.8745e-01, 1.6673e+00]], [[-1.6219e+00, -2.2853e+00, -3.6452e+00, -2.6118e+00, -2.7893e+00, -2.4489e+00, -2.0016e+00, -2.1841e+00, -2.4798e+00, -2.6974e+00]]]]) attn_weights tensor([[[[-2.2924e+00, -3.7690e+00, -2.3774e+00, -3.8370e+00, -2.4050e+00, -3.3606e+00, -3.4884e+00, -1.5610e+00, -8.7155e-02, -1.6525e+00]], [[-6.1098e-01, -1.3529e+00, -2.3915e+00, -2.6606e+00, -1.7945e+00, -1.7697e+00, -1.3336e+00, 3.2504e-01, -6.3290e-01, -1.0099e+00]], [[-2.6387e+00, -3.7066e+00, -3.2004e+00, -3.5543e+00, -2.9147e+00, -3.3725e+00, -2.9099e+00, -2.1427e+00, -2.3947e+00, -2.8128e+00]], [[-9.6491e-02, -2.6458e+00, -2.5453e+00, -2.5336e+00, -2.4500e+00, -2.2722e+00, -2.0786e+00, -1.9701e+00, -2.0137e+00, -2.0792e+00]], [[-5.0789e-01, -2.4500e+00, -2.6032e+00, -2.4857e+00, -2.4798e+00, -2.0760e+00, -1.9766e+00, -2.0041e+00, -2.0690e+00, -1.9828e+00]], [[ 3.9209e-02, -5.5007e-01, -1.0731e+00, 1.8046e-02, -1.0707e+00, -3.9710e+00, -4.0197e+00, -5.9582e-01, -1.2265e+00, -6.5052e-02]], [[ 1.4154e+00, -3.0427e-01, -1.0396e+00, -1.8392e+00, -3.1546e-01, -1.7997e+00, -2.1218e+00, -6.0106e-01, -1.6042e+00, -2.4084e+00]], [[-1.6530e-01, -1.6698e+00, -2.8241e+00, -2.3218e+00, -2.0385e+00, -1.8754e+00, -1.6442e+00, -1.3765e+00, -2.8737e+00, -2.3752e+00]], [[-8.1596e-01, -2.0662e+00, -2.5291e+00, -2.6844e+00, -2.3324e+00, -2.6819e+00, -3.0409e+00, -1.9319e+00, -2.3360e+00, -2.4913e+00]], [[ 1.2970e+00, -4.4122e-01, -6.5117e-01, -1.0026e+00, 1.6137e-01, -1.3702e+00, -1.4687e+00, -5.8016e-01, -5.6039e-01, -9.1894e-01]], [[-5.6816e+00, -2.0417e+00, -1.9900e+00, -1.9253e+00, -1.9193e+00, -1.5537e+00, -1.3575e+00, -1.4690e+00, -1.3896e+00, -1.3749e+00]], [[-4.9901e-01, -8.0798e-01, -3.3212e+00, 1.7563e+00, -3.5457e+00, -4.3692e+00, -5.6141e+00, -4.4447e-01, -3.3050e+00, 2.1109e+00]]], [[[-7.5662e-02, -2.1358e+00, -1.7076e+00, -8.9500e-01, -9.9976e-01, -1.3179e+00, -5.7016e-01, -2.8523e-01, 1.0033e+00, 6.7714e-01]], [[-5.5618e-01, -1.3530e+00, -2.3298e+00, -1.4935e+00, -1.6181e+00, -1.7823e+00, -1.3369e+00, 3.7724e-01, 6.0076e-01, -3.6116e-01]], [[-2.7363e+00, -3.9346e+00, -3.3373e+00, -3.7556e+00, -3.0600e+00, -3.5032e+00, -3.0241e+00, -2.2782e+00, -2.4529e+00, -2.4331e+00]], [[-3.8779e-02, -2.6905e+00, -2.4919e+00, -2.5065e+00, -2.4406e+00, -2.2900e+00, -2.0962e+00, -1.9728e+00, -2.0188e+00, -1.8784e+00]], [[-4.1958e-01, -2.4452e+00, -2.5033e+00, -2.4696e+00, -2.3618e+00, -2.0120e+00, -1.9227e+00, -1.9443e+00, -2.0432e+00, -1.8500e+00]], [[-4.1646e-01, -6.6857e-01, -8.2020e-01, -1.8215e+00, -2.0766e+00, -4.7189e+00, -4.3000e+00, -7.2127e-01, -2.1461e+00, -9.4113e-01]], [[ 2.4289e-01, -1.9933e+00, -2.5691e+00, -2.1969e+00, -2.0145e+00, -2.3325e+00, -2.4795e+00, -2.1822e+00, -2.5237e+00, -2.9114e+00]], [[-7.0013e-01, -2.4342e+00, -2.9998e+00, -2.5237e+00, -2.7807e+00, -2.1531e+00, -1.9433e+00, -2.1416e+00, -2.5490e+00, -2.9751e+00]], [[-1.9784e-01, -1.0312e+00, -2.3463e+00, -1.9213e+00, -1.4302e+00, -2.0857e+00, -2.3032e+00, -1.1277e+00, -1.6239e+00, -2.2311e+00]], [[ 1.2096e+00, -4.8279e-01, -3.6569e-01, -5.3987e-01, 1.5731e-01, -1.4956e+00, -1.3604e+00, -7.4173e-01, -6.2466e-01, -3.3592e-01]], [[-5.5054e+00, -2.0760e+00, -1.9428e+00, -1.9722e+00, -1.9405e+00, -1.5387e+00, -1.3667e+00, -1.4546e+00, -1.4889e+00, -1.2107e+00]], [[-2.9547e+00, -2.3761e+00, -3.7506e-01, -4.4363e+00, -4.0831e+00, -6.4913e+00, -5.0751e+00, -1.9250e+00, -2.9251e+00, 1.9031e-02]]], [[[-3.7743e-01, -2.2729e+00, -2.2864e+00, -1.3094e+00, -1.1384e+00, -1.5990e+00, -7.9393e-01, -3.6418e-01, 3.8036e-01, -5.7246e-02]], [[-9.1538e-01, -1.6129e+00, -2.6771e+00, -1.8852e+00, -1.8505e+00, -1.9837e+00, -1.5381e+00, 1.7325e-01, 1.3843e-01, -6.2603e-01]], [[-2.7058e+00, -3.8586e+00, -3.2855e+00, -3.7052e+00, -3.0063e+00, -3.4404e+00, -2.9711e+00, -2.2339e+00, -2.6947e+00, -2.3648e+00]], [[-5.4723e-02, -2.7167e+00, -2.5195e+00, -2.5437e+00, -2.4608e+00, -2.3066e+00, -2.1155e+00, -1.9987e+00, -2.0921e+00, -1.8903e+00]], [[-4.8238e-01, -2.4617e+00, -2.5413e+00, -2.5119e+00, -2.3939e+00, -2.0344e+00, -1.9482e+00, -1.9776e+00, -2.0004e+00, -1.9152e+00]], [[-1.0481e-01, -4.0589e-01, -5.5712e-01, -1.5469e+00, -1.7121e+00, -4.3992e+00, -4.1218e+00, -4.6450e-01, -1.8377e+00, -5.6684e-01]], [[ 5.4276e-01, -1.6014e+00, -2.3155e+00, -1.9994e+00, -1.5895e+00, -2.0078e+00, -2.3526e+00, -1.7806e+00, -2.3377e+00, -2.6506e+00]], [[-3.5386e-01, -2.0299e+00, -2.9026e+00, -2.4184e+00, -2.4974e+00, -1.8610e+00, -1.6764e+00, -1.8096e+00, -2.4904e+00, -2.9416e+00]], [[-5.3074e-01, -1.5915e+00, -2.7680e+00, -2.4287e+00, -1.8420e+00, -2.4448e+00, -2.6814e+00, -1.6352e+00, -2.1308e+00, -2.6561e+00]], [[ 1.1148e+00, -5.9959e-01, -5.1916e-01, -7.8219e-01, 3.8195e-02, -1.6578e+00, -1.5568e+00, -8.1510e-01, -1.4211e-01, -4.5507e-01]], [[-5.4354e+00, -2.1058e+00, -1.9810e+00, -2.0196e+00, -1.9683e+00, -1.5700e+00, -1.3978e+00, -1.4910e+00, -1.4437e+00, -1.2547e+00]], [[-2.3748e+00, -1.9194e+00, -3.6546e-02, -4.0745e+00, -3.7656e+00, -6.1402e+00, -4.8454e+00, -1.5334e+00, -3.6038e+00, 5.2518e-01]]], [[[-7.7420e-01, -1.8451e+00, -2.0213e+00, -1.7930e+00, -2.8610e-04, -2.8960e-01, -9.2065e-04, 2.9274e-01, 1.6434e+00, 1.0312e+00]], [[-8.6249e-01, -1.9822e+00, -2.1907e+00, -2.0086e+00, -2.2794e+00, -2.1619e+00, -1.5145e+00, 7.7920e-02, -7.0449e-01, -1.3874e+00]], [[-2.6865e+00, -3.7377e+00, -3.2873e+00, -3.6588e+00, -3.0324e+00, -3.3967e+00, -2.9985e+00, -2.2090e+00, -2.5951e+00, -3.0714e+00]], [[ 6.7460e-02, -2.5168e+00, -2.3783e+00, -2.4471e+00, -2.3951e+00, -2.1451e+00, -1.9385e+00, -1.8613e+00, -2.0573e+00, -1.9405e+00]], [[-4.1233e-01, -2.3632e+00, -2.6520e+00, -2.5683e+00, -2.5345e+00, -2.0928e+00, -1.9217e+00, -2.0229e+00, -2.2023e+00, -1.6709e+00]], [[ 7.0174e-01, 4.7828e-01, -1.5676e+00, -1.6442e+00, 1.7151e-01, -6.8457e-02, 3.7868e-01, 2.8294e-02, -1.2242e-02, -2.9747e-01]], [[ 2.6642e+00, 4.4604e-01, -9.1943e-02, -6.1170e-01, -2.0042e-01, 1.7560e+00, 9.6833e-01, -7.1734e-02, -3.5029e-01, 1.2892e+00]], [[-2.8470e-01, -2.5578e+00, -2.4175e+00, -2.3057e+00, -2.8290e+00, -1.1825e+00, -1.4369e+00, -2.1127e+00, -2.4907e+00, -2.1073e+00]], [[-6.2861e-01, -1.2647e+00, -1.5883e+00, -2.1304e+00, -1.6095e+00, -1.9974e+00, -2.3555e+00, -1.3583e+00, -1.5191e+00, -2.5745e+00]], [[ 1.5924e+00, -2.1408e-01, -1.9937e-01, -4.1257e-01, 2.0956e-01, -3.5332e-01, -1.0307e+00, -4.4024e-01, 2.7718e-01, -1.6039e+00]], [[-5.7250e+00, -1.7665e+00, -1.7108e+00, -1.7322e+00, -1.7176e+00, -1.3154e+00, -1.1344e+00, -1.2235e+00, -1.3500e+00, -1.0272e+00]], [[ 1.4088e+00, 6.4864e-01, -3.0169e+00, -1.9315e+00, -2.1347e+00, -5.8900e-01, -1.3140e+00, 7.0601e-01, -2.6183e+00, 4.2487e+00]]], [[[-8.1333e-01, -2.3256e+00, -1.2666e+00, -1.1197e+00, -1.7736e+00, -1.6481e+00, -1.1174e+00, -6.0123e-01, 6.7363e-01, -2.4344e-01]], [[-3.9350e-02, -1.0639e+00, -1.3400e+00, -1.1216e+00, -1.5999e+00, -1.3349e+00, -7.1988e-01, 8.5798e-01, 9.2169e-02, 9.8712e-02]], [[-2.5641e+00, -3.7362e+00, -3.2023e+00, -3.5719e+00, -2.8094e+00, -3.2555e+00, -2.8258e+00, -2.0783e+00, -2.7614e+00, -2.2580e+00]], [[ 1.7761e-02, -2.5884e+00, -2.4300e+00, -2.4368e+00, -2.2952e+00, -2.1141e+00, -1.9395e+00, -1.8482e+00, -2.1127e+00, -1.8909e+00]], [[-4.5284e-01, -2.5035e+00, -2.5794e+00, -2.4951e+00, -2.3245e+00, -1.8874e+00, -1.7963e+00, -1.8863e+00, -2.0174e+00, -1.7518e+00]], [[ 1.5298e-01, 2.9839e-01, -1.5515e+00, -6.7033e-01, -8.2584e-01, -2.1454e+00, -1.8512e+00, 2.6343e-01, -9.7210e-01, -1.1989e+00]], [[ 1.3380e+00, -4.7231e-01, -7.7556e-01, -1.1845e+00, -7.0951e-01, -2.9542e-01, -2.6782e-02, -5.5607e-01, -4.2553e-01, -8.4986e-01]], [[ 2.9210e-01, -1.5807e+00, -1.7828e+00, -1.6425e+00, -1.6973e+00, -1.3232e+00, -1.1268e+00, -1.1337e+00, -1.4236e+00, -1.5371e+00]], [[-3.3136e-01, -1.0519e+00, -1.8726e+00, -1.9859e+00, -1.3186e+00, -1.9649e+00, -2.1727e+00, -1.1725e+00, -1.4745e+00, -1.3742e+00]], [[ 1.3759e+00, -3.6508e-01, 8.4215e-02, -4.7914e-01, 3.6301e-01, -8.1586e-01, -9.8576e-01, -6.6229e-01, -1.3409e-02, 3.7753e-01]], [[-5.6293e+00, -2.0817e+00, -1.9830e+00, -1.9822e+00, -1.8794e+00, -1.5108e+00, -1.3404e+00, -1.4667e+00, -1.5753e+00, -1.3665e+00]], [[-1.4906e+00, -1.7714e+00, -4.4728e+00, -3.8534e+00, -1.1890e-01, -4.8007e+00, -5.2708e+00, -1.3091e+00, -3.5494e+00, 1.2126e+00]]]]) attn_weights tensor([[[[ -1.8112, -4.3338, -3.7458, -4.2861, -3.7199, -3.7012, -3.5661, -2.8873, -2.0032, -2.5598]], [[ 1.4441, -0.7842, -2.6178, -1.4823, -2.2157, -1.6235, -2.6118, -1.5366, -3.8227, -2.3418]], [[ -8.4601, -13.2004, -11.9848, -14.0436, -8.9022, -9.0241, -7.2320, -6.2330, -4.6671, -6.9095]], [[ -3.9666, -7.0554, -6.6335, -8.3984, -4.2924, -5.2393, -4.7985, -3.6199, -3.2194, -4.9296]], [[ -2.0020, -4.5944, -5.6824, -5.4740, -3.8598, -5.6729, -5.5713, -1.9444, -2.5814, -2.4352]], [[ -4.8244, -7.0517, -7.8677, -8.1038, -5.9755, -6.5009, -6.1121, -2.6813, -3.7412, -4.3186]], [[ -1.2205, -3.9667, -4.7183, -3.9462, -3.8964, -3.9050, -3.5850, -2.3882, -3.3362, -2.9181]], [[ -1.4260, -4.1062, -2.6358, -2.2697, -2.2823, -1.5037, -1.5740, -1.4123, -0.7938, -0.9123]], [[ -2.9822, -4.9910, -7.7650, -5.3717, -3.7523, -4.3522, -3.8276, -2.3735, -4.4469, -2.1806]], [[ -4.9286, -7.8770, -7.6697, -8.2581, -6.5659, -4.3256, -4.0471, -4.2487, -3.7991, -4.4022]], [[ -2.0298, -3.7938, -3.5326, -3.1692, -3.4147, -2.8026, -2.6385, -2.8344, -2.4459, -2.2691]], [[ -0.8959, -4.9319, -4.5811, -4.3582, -4.1687, -3.7852, -3.5171, -3.3983, -3.1341, -3.1279]]], [[[ -1.7516, -4.2899, -4.0484, -3.3666, -3.4557, -3.6852, -3.6720, -2.7396, -0.9365, -2.2575]], [[ 1.3838, -1.0164, -2.2885, -1.0264, -2.6437, -1.2226, -2.1323, -1.5433, -1.3641, -3.3871]], [[ -7.1517, -11.2122, -14.2582, -9.7425, -8.5556, -8.7803, -6.1833, -4.8373, -3.7183, -6.0032]], [[ -3.1834, -6.6352, -6.4161, -5.6139, -3.1101, -4.8823, -4.7741, -3.8463, -2.1631, -3.1411]], [[ -2.2935, -5.0885, -7.4272, -4.6516, -4.2567, -5.1080, -4.3815, -2.2117, -0.8088, -3.6953]], [[ -4.5601, -7.0724, -9.1897, -6.8770, -6.0461, -6.7264, -6.0898, -2.7924, -2.8658, -4.2163]], [[ -1.5062, -4.2623, -4.3602, -3.2177, -4.3219, -4.2638, -4.2008, -2.7948, -2.1102, -2.7427]], [[ -1.4254, -4.1284, -2.3901, -2.0239, -2.1555, -1.3090, -1.3866, -1.1992, -1.2766, -0.3589]], [[ -3.1345, -5.3647, -7.4652, -2.3293, -4.2100, -4.7341, -4.2478, -3.2060, -2.2537, -3.8659]], [[ -4.4494, -8.2602, -8.8106, -7.3083, -5.9330, -4.1128, -3.6316, -4.3262, -3.8320, -4.1834]], [[ -1.8422, -3.7918, -3.3220, -2.9458, -3.3882, -2.4872, -2.4212, -2.7778, -2.6484, -1.9775]], [[ -0.7762, -4.7998, -4.4742, -4.1864, -4.2241, -3.4744, -3.2640, -3.5267, -3.4771, -2.8171]]], [[[ -1.8238, -4.4757, -4.1160, -3.4521, -3.5970, -3.7572, -3.6582, -2.9890, -2.3465, -2.0605]], [[ 1.4084, -0.8122, -1.9761, -0.8173, -2.6639, -1.0025, -1.9563, -1.4534, -1.5009, -3.0361]], [[ -7.3649, -11.6385, -14.8725, -10.3990, -9.0488, -9.2396, -6.3256, -5.0396, -4.3214, -6.2624]], [[ -3.4612, -7.1298, -7.2923, -6.4545, -3.8086, -5.3373, -5.0877, -3.7873, -1.7808, -3.3980]], [[ -2.1735, -4.9088, -7.4268, -4.8263, -4.2068, -5.1327, -4.5504, -2.0069, -1.0417, -3.7015]], [[ -4.7956, -7.3175, -9.3647, -7.1133, -6.3765, -7.1564, -6.2589, -2.9150, -2.9360, -4.2879]], [[ -1.5247, -4.2201, -4.5878, -3.6523, -4.2651, -4.1084, -4.1944, -2.7425, -1.9871, -3.0758]], [[ -1.4507, -4.2094, -2.5237, -2.1522, -2.2552, -1.4264, -1.4972, -1.2755, -0.9294, -0.4517]], [[ -3.2383, -5.7886, -8.3403, -3.4982, -4.7326, -5.1634, -4.5568, -3.2252, -1.6821, -4.3836]], [[ -4.8196, -8.8022, -9.5719, -8.1334, -6.6776, -4.6323, -4.0275, -4.6493, -4.2247, -4.7531]], [[ -1.9168, -3.7805, -3.4938, -3.1068, -3.4625, -2.6373, -2.5694, -2.7907, -2.1828, -2.1816]], [[ -0.8423, -4.9057, -4.6412, -4.2793, -4.3280, -3.6687, -3.4448, -3.5416, -3.0453, -2.9513]]], [[[ -1.5560, -4.1803, -2.6958, -4.0357, -3.9201, -3.6332, -3.9558, -2.9624, -2.5864, -3.5757]], [[ 1.3185, -1.9365, -2.1538, -0.7010, -2.4256, -1.0142, -1.4070, -1.9071, -2.0304, -1.3461]], [[ -6.3653, -9.6434, -9.1851, -8.8446, -7.2307, -6.5605, -5.4852, -3.6106, -2.6822, -3.9178]], [[ -3.3429, -5.8339, -4.5206, -5.5071, -3.8307, -4.6324, -4.2929, -2.6199, -1.5032, -2.9719]], [[ -1.4988, -4.0089, -4.4346, -5.8264, -4.2573, -5.5726, -5.2793, -1.5415, -1.9999, -3.5060]], [[ -4.4086, -5.7483, -6.0763, -5.9468, -6.1434, -5.6133, -4.4719, -2.2411, -3.4766, -5.4293]], [[ -0.6026, -3.7393, -3.3657, -3.8689, -3.6643, -4.3606, -3.7140, -2.2930, -2.2809, -3.5664]], [[ -1.3266, -3.9835, -2.4679, -2.3407, -2.3005, -1.3507, -1.3545, -1.3064, -1.2455, -0.9437]], [[ -3.3426, -6.0746, -5.7243, -4.0367, -5.2265, -5.7168, -3.2605, -2.8885, -2.9553, -4.3103]], [[ -4.1226, -7.2179, -5.7831, -6.5503, -6.5217, -3.5263, -3.8314, -3.9979, -3.7381, -3.0719]], [[ -1.5981, -3.5766, -3.4555, -3.1512, -3.3129, -2.3205, -2.1275, -2.4926, -2.5647, -1.9385]], [[ -0.7418, -4.4918, -4.4172, -4.2410, -4.0799, -3.4567, -3.2807, -3.0358, -3.1583, -2.9283]]], [[[ -1.8238, -4.3675, -3.3266, -4.3204, -4.0967, -3.4558, -3.2774, -2.7173, -1.9702, -2.4992]], [[ 1.5870, -1.5244, -1.0511, -0.9353, -2.1864, -1.7167, -1.7689, -1.5672, -1.1608, -2.4936]], [[ -8.4794, -12.5419, -9.9172, -10.8768, -12.3297, -8.5068, -7.2554, -5.2659, -4.2940, -5.7841]], [[ -3.1754, -6.1998, -5.2474, -6.5677, -5.4955, -4.8387, -4.1086, -2.9762, -2.6469, -2.0109]], [[ -2.2449, -4.6988, -4.6812, -5.0821, -5.3410, -6.3998, -4.4492, -1.7435, -2.0333, -2.6144]], [[ -4.5800, -6.1993, -7.0497, -6.2241, -7.8331, -5.3508, -5.0442, -2.1749, -3.5094, -4.0162]], [[ -0.7575, -3.7225, -3.0599, -3.5733, -3.5776, -4.0604, -3.8615, -2.1835, -3.1074, -2.6397]], [[ -1.4850, -4.3846, -2.6498, -2.3453, -2.2203, -1.3929, -1.5129, -1.3171, -1.4412, -1.2194]], [[ -4.2655, -7.0624, -7.5114, -4.2180, -7.4177, -5.6660, -4.3130, -3.5877, -3.1206, -4.4176]], [[ -4.2981, -6.9243, -5.7597, -6.6469, -7.4148, -3.0413, -2.9094, -3.5164, -3.0689, -3.7949]], [[ -1.4361, -3.5667, -3.2014, -2.8697, -3.0023, -2.2356, -2.1052, -2.5393, -2.1854, -2.1415]], [[ -0.8253, -4.8465, -4.5607, -4.2436, -4.2441, -3.5683, -3.3781, -3.4620, -3.3457, -3.1330]]]]) attn_weights tensor([[[[ 3.7633, -0.9201, -0.6244, 2.5715, -1.0310, -5.4231, -3.9030, -1.3241, -1.1900, 1.2408]], [[ -2.9789, -6.4869, -6.0075, -6.8490, -5.8327, -4.5282, -6.0001, -3.3566, -4.0397, -4.8120]], [[ -4.2118, -6.8727, -6.9373, -8.7739, -6.2385, -7.2030, -7.7924, -4.3113, -2.7847, -4.8054]], [[ -4.6845, -9.4602, -10.5282, -11.3021, -10.2825, -8.8730, -10.2144, -5.5584, -5.7481, -6.8968]], [[ 0.6722, -3.5806, -3.3552, -2.0050, -2.9285, -4.0854, -2.8360, -3.2985, -3.3813, -1.9828]], [[ -0.2063, -2.1438, -3.1653, -2.3407, -1.8762, -3.1523, -2.8757, -2.9580, -3.7415, -3.1479]], [[ -2.8942, -6.3530, -4.1685, -5.9080, -5.0810, -4.0806, -4.8855, -3.5560, -0.8635, -2.9296]], [[ -5.6715, -9.7551, -10.8096, -11.0560, -8.2107, -6.4830, -6.6567, -5.4343, -6.1667, -6.6523]], [[ -4.1322, -6.3329, -8.5702, -8.6599, -7.8296, -5.8217, -5.9127, -2.8069, -4.7457, -5.2489]], [[ -1.6025, -4.1498, -5.2065, -4.4308, -5.0945, -5.7049, -5.7015, -3.2621, -3.9704, -3.2613]], [[ -1.0881, -4.7319, -4.5790, -3.9156, -3.5786, -3.6070, -4.2167, -3.1605, -3.2992, -2.7958]], [[ -2.5755, -5.4940, -6.5190, -5.8729, -4.6504, -3.6347, -4.3773, -4.0399, -4.4916, -4.1200]]], [[[ 3.9789, -0.6265, 1.5282, -2.5938, -1.1194, -4.2932, -3.5710, -0.8045, -1.3982, 0.2905]], [[ -2.7651, -5.6144, -5.6839, -4.4953, -5.8369, -5.7913, -6.3228, -3.1814, -3.1008, -3.3168]], [[ -4.2935, -7.0380, -8.1333, -5.3769, -5.6170, -7.0482, -8.9105, -4.6498, -2.9917, -3.4265]], [[ -5.2801, -8.7438, -12.9025, -10.0915, -10.3422, -8.6368, -10.9234, -5.3088, -4.4628, -7.8788]], [[ 0.6305, -3.2893, -3.3001, -3.7562, -3.5849, -3.5762, -3.2287, -2.9588, -2.5864, -3.3603]], [[ -0.2480, -2.5266, -2.3342, -0.4600, -1.3653, -3.5813, -3.6108, -3.4540, -3.7613, -3.3244]], [[ -3.2564, -5.9273, -4.6904, -5.5036, -4.7817, -4.5058, -6.1010, -4.6354, -3.3362, -2.6110]], [[ -6.2042, -9.4840, -10.5349, -8.8865, -7.5111, -7.0650, -7.0480, -5.6976, -5.6309, -5.6935]], [[ -3.9614, -6.7752, -9.3487, -6.2407, -8.6514, -8.1249, -7.7577, -3.1627, -2.8261, -4.9982]], [[ -1.5479, -4.2701, -4.3906, -1.6985, -4.0308, -5.9671, -6.6628, -3.6422, -2.4108, -2.1193]], [[ -0.9547, -5.2403, -3.6767, -4.6053, -3.9280, -4.0489, -4.8683, -3.5639, -2.1184, -2.3495]], [[ -2.4271, -5.4365, -5.7519, -4.9079, -3.8789, -2.9009, -4.5916, -4.0051, -2.6399, -2.6573]]], [[[ 4.4618, -0.1525, 2.0436, -1.8960, -0.5542, -3.8934, -2.8146, -0.4016, -2.0266, 1.3931]], [[ -2.7665, -5.9838, -6.0717, -5.7403, -6.5935, -5.7618, -6.8132, -3.6425, -2.5087, -3.7189]], [[ -4.3647, -7.6139, -8.8826, -6.3255, -6.3988, -7.9312, -8.8929, -4.9316, -5.3571, -4.1210]], [[ -5.0919, -9.9193, -14.3660, -11.6250, -11.4180, -9.1908, -11.5760, -6.2192, -5.6821, -9.1176]], [[ 0.8182, -3.3805, -3.0825, -3.7366, -3.5304, -3.2731, -3.1255, -3.0999, -2.9842, -2.9367]], [[ -0.1807, -2.0663, -2.4716, -0.9317, -1.4699, -3.0355, -3.1335, -3.0064, -3.0478, -2.5295]], [[ -3.2438, -6.8426, -6.1729, -6.9628, -5.8556, -4.8235, -6.3590, -4.8931, -3.3645, -3.2665]], [[ -5.8928, -10.4285, -12.3306, -10.6290, -8.4495, -7.2415, -7.7170, -6.1652, -6.0154, -6.9563]], [[ -4.0085, -7.2411, -9.6028, -6.9755, -8.8498, -8.5024, -8.2331, -3.7834, -2.9956, -5.0026]], [[ -1.5125, -4.8026, -5.2160, -2.8205, -4.6041, -6.2374, -6.1263, -3.6581, -1.1670, -2.9533]], [[ -1.0815, -4.6180, -3.8653, -4.8076, -3.7425, -3.9814, -4.6495, -3.6829, -3.1840, -2.2330]], [[ -2.4382, -5.9537, -7.1072, -6.2304, -4.7564, -4.7326, -5.7688, -4.1804, -2.3992, -4.2622]]], [[[ 6.0110, 0.3053, -4.4105, -2.5406, -0.1636, -2.2173, -1.3168, -0.7663, -1.8615, 3.3581]], [[ -2.5450, -6.1961, -4.3683, -4.7668, -4.2683, -5.0942, -5.2744, -3.3076, -2.6335, -5.2039]], [[ -3.6687, -7.9295, -7.1767, -6.7357, -5.9835, -7.1859, -6.6259, -3.8534, -2.1819, -3.8674]], [[ -4.2084, -9.7058, -12.6230, -11.1982, -10.5032, -8.4070, -10.4390, -5.5777, -6.6087, -5.9810]], [[ 1.4201, -3.3120, -4.3315, -4.6244, -3.0726, -2.2946, -1.8948, -2.8794, -3.3075, -4.1168]], [[ 0.1130, -2.9828, -4.7752, -3.5546, -2.7480, -1.6669, -2.0136, -2.6966, -2.8826, -2.4444]], [[ -3.0960, -6.4150, -4.2481, -5.4986, -5.2999, -3.7408, -4.8671, -3.4591, -2.7179, -2.7038]], [[ -5.1736, -10.3706, -8.9578, -8.9855, -9.4480, -5.4958, -7.8137, -5.4873, -5.9582, -5.4394]], [[ -4.0426, -7.1260, -6.9257, -6.5541, -7.0331, -6.5632, -6.4673, -2.6430, -3.7618, -6.0107]], [[ -1.7062, -4.8336, -3.6219, -2.9927, -3.4965, -4.5800, -3.9722, -3.0026, -1.8834, -3.6439]], [[ -0.8557, -5.5804, -5.7933, -6.7201, -4.3972, -2.8546, -3.3018, -3.2230, -2.7560, -1.2253]], [[ -1.9272, -5.7717, -5.8412, -4.8882, -6.0446, -4.4060, -5.0365, -2.9474, -4.2146, -2.1894]]], [[[ 4.1785, -1.5588, -3.3563, -1.7855, 0.1060, -4.8820, -2.7349, -1.9954, -2.6077, 1.0304]], [[ -3.0153, -6.3331, -4.5507, -5.2818, -6.1214, -6.7138, -6.6879, -3.2460, -2.7018, -4.5854]], [[ -5.0819, -7.1226, -6.1535, -4.8720, -8.1501, -6.8260, -6.7832, -3.4178, -1.9880, -3.3450]], [[ -5.9144, -9.9563, -10.7556, -10.0696, -12.1482, -10.0728, -9.3931, -5.3431, -5.9632, -8.0506]], [[ 0.9745, -3.5583, -3.4863, -3.7406, -2.8872, -2.7799, -3.3651, -3.1444, -4.0472, -3.3838]], [[ -0.0639, -2.6615, -3.2491, -2.8344, -2.4241, -3.2863, -3.4114, -2.8615, -3.0832, -2.5784]], [[ -4.0743, -7.1777, -3.1270, -5.4450, -7.6440, -3.5348, -4.8821, -3.9850, -2.6677, -4.5754]], [[ -6.6326, -11.0731, -9.1859, -9.3532, -10.5022, -5.7216, -6.7181, -5.7196, -6.6929, -6.9577]], [[ -4.8130, -7.0293, -6.7876, -6.5208, -9.0459, -6.9260, -7.0054, -3.0269, -3.6451, -6.1051]], [[ -2.2493, -5.6189, -3.7825, -2.5524, -4.6957, -5.3213, -3.0665, -3.2001, -1.9673, -3.6091]], [[ -1.1914, -5.6923, -5.0301, -5.2648, -3.9994, -3.7730, -4.5118, -3.8496, -2.9469, -2.2662]], [[ -2.5335, -6.1415, -5.8678, -5.5029, -6.2285, -5.4195, -5.0538, -3.6404, -2.2405, -3.8209]]]]) attn_weights tensor([[[[-2.4854e+00, -7.4783e+00, -7.1239e+00, -6.9737e+00, -7.4615e+00, -7.0741e+00, -7.3889e+00, -4.9031e+00, -5.1301e+00, -5.0570e+00]], [[-2.8389e+00, -3.9204e+00, -4.3735e+00, -4.6083e+00, -4.5303e+00, -3.4085e+00, -4.3579e+00, -1.0979e-01, -1.1870e+00, -2.1627e+00]], [[-4.0068e-01, -2.0400e+00, -3.4336e+00, -3.3811e+00, -4.2862e+00, -4.2425e+00, -3.9877e+00, -2.3520e+00, -3.6048e+00, -3.6607e+00]], [[-1.9062e+00, -5.3567e+00, -3.9144e+00, -4.5070e+00, -4.2380e+00, -4.0066e+00, -4.1996e+00, -3.7802e+00, -2.1050e+00, -2.8967e+00]], [[ 1.3670e+00, -1.5330e+00, -4.3864e-01, -8.1115e-02, -1.4782e+00, -3.2753e+00, -3.7014e+00, -1.6421e+00, -4.0998e-01, -1.1287e-01]], [[-2.2386e+00, -6.5402e+00, -6.0438e+00, -6.3379e+00, -6.0072e+00, -6.2529e+00, -6.1297e+00, -4.5424e+00, -4.5127e+00, -4.7885e+00]], [[-2.2857e+00, -4.4613e+00, -5.9641e+00, -5.9214e+00, -3.8906e+00, -3.8237e+00, -3.2895e+00, -3.8354e+00, -4.7296e+00, -4.9001e+00]], [[ 6.0883e-01, -4.8714e+00, -1.7098e+00, 5.9374e-01, -8.9044e-01, -2.0809e+00, -3.2458e+00, -2.2629e+00, -1.4298e+00, 7.1415e-01]], [[ 1.4764e+00, -1.9850e+00, -2.5566e+00, -2.1295e+00, -1.6329e+00, -2.8412e+00, -2.1412e+00, -1.4646e+00, -2.1929e+00, -2.2502e+00]], [[-1.2555e+00, -2.6833e+00, -4.2679e+00, -4.7419e+00, -2.7439e+00, -4.2222e+00, -3.0198e+00, -3.1023e+00, -3.4802e+00, -3.9543e+00]], [[ 1.1298e+00, -1.7138e+00, -2.3396e+00, -2.2142e+00, -2.4544e+00, -2.7058e+00, -3.0833e+00, -1.9137e+00, -2.2865e+00, -2.5945e+00]], [[-2.5287e+00, -1.6405e+01, 6.4008e-01, -8.1727e+00, -1.4795e+01, -1.2464e+01, -2.0909e+01, -6.5599e+00, 1.2998e+01, 5.0083e+00]]], [[[-2.1681e+00, -7.3192e+00, -7.7328e+00, -5.2007e+00, -7.0135e+00, -7.2967e+00, -9.4960e+00, -6.1896e+00, -5.0593e+00, -4.7831e+00]], [[-2.3335e+00, -4.5837e+00, -6.4170e+00, -4.8538e+00, -6.2222e+00, -5.2537e+00, -5.6426e+00, -3.2179e+00, -1.2527e+00, -2.8549e+00]], [[-1.0776e-01, -2.3940e+00, -3.9404e+00, -3.0860e+00, -4.5716e+00, -4.9688e+00, -4.8435e+00, -2.8688e+00, -2.8990e+00, -4.4293e+00]], [[-2.1300e+00, -5.9640e+00, -6.0388e+00, -4.0569e+00, -4.3511e+00, -4.3595e+00, -3.4584e+00, -4.5981e+00, -4.0240e+00, -3.7210e+00]], [[ 1.2791e+00, -1.7202e+00, -4.3090e-01, -1.3155e+00, -1.0895e+00, -3.2101e+00, -4.1862e+00, -2.1589e+00, -1.6233e+00, -9.1225e-01]], [[-1.8271e+00, -5.7713e+00, -7.2121e+00, -6.2183e+00, -6.8524e+00, -7.7536e+00, -8.1720e+00, -4.8837e+00, -6.3839e+00, -4.8564e+00]], [[-2.1311e+00, -4.8516e+00, -6.0189e+00, -5.0225e+00, -4.3187e+00, -4.1123e+00, -4.1649e+00, -4.3579e+00, -4.0897e+00, -4.7012e+00]], [[ 4.8049e-01, -5.6392e+00, -2.4355e+00, -2.1411e+00, -2.7526e+00, -3.5406e+00, -4.0319e+00, -2.9928e+00, -7.0004e-01, 3.4161e-01]], [[ 1.9146e+00, -3.2909e+00, -3.0541e+00, -2.8639e+00, -2.0805e+00, -3.4281e+00, -2.5593e+00, -2.6598e+00, -1.5511e+00, -2.6433e+00]], [[-1.2561e+00, -3.4624e+00, -4.1234e+00, -2.6288e+00, -1.2275e+00, -3.8761e+00, -3.3958e+00, -3.3230e+00, -4.3038e+00, -3.7945e+00]], [[ 1.4271e+00, -2.1685e+00, -3.2316e+00, -3.3190e+00, -3.1041e+00, -2.8251e+00, -3.8172e+00, -2.0134e+00, -7.3826e-01, -3.1042e+00]], [[-4.3338e+00, -1.1226e+01, -1.7237e+01, -1.5948e+01, -2.0632e+01, -1.7218e+01, -2.7022e+01, -2.1181e+00, 1.2556e+01, 3.6298e-01]]], [[[-2.3108e+00, -8.7465e+00, -8.8623e+00, -6.9917e+00, -8.3492e+00, -8.5469e+00, -9.8157e+00, -6.9795e+00, -6.5778e+00, -5.7081e+00]], [[-2.4454e+00, -5.0127e+00, -5.9821e+00, -5.4077e+00, -6.5258e+00, -4.7513e+00, -5.6840e+00, -3.4680e+00, -1.9830e+00, -2.5730e+00]], [[ 6.9462e-03, -2.0425e+00, -3.1048e+00, -3.2113e+00, -4.6546e+00, -5.1818e+00, -4.2595e+00, -3.2773e+00, -3.0428e+00, -4.5068e+00]], [[-1.9803e+00, -5.8540e+00, -5.8671e+00, -4.8161e+00, -4.8148e+00, -4.7309e+00, -4.4841e+00, -4.7989e+00, -4.5815e+00, -3.3940e+00]], [[ 1.4018e+00, -1.9765e+00, -6.3641e-01, -1.1823e+00, -1.4512e+00, -3.2481e+00, -3.6750e+00, -2.3701e+00, -6.7174e-01, -1.2027e+00]], [[-1.9453e+00, -6.9100e+00, -7.9006e+00, -7.7579e+00, -7.5697e+00, -7.8870e+00, -8.4622e+00, -5.7538e+00, -5.9867e+00, -5.2417e+00]], [[-2.0349e+00, -5.0544e+00, -6.6133e+00, -5.4772e+00, -4.5109e+00, -4.2672e+00, -4.2071e+00, -4.5044e+00, -4.3611e+00, -4.8778e+00]], [[ 5.6100e-01, -4.1179e+00, -1.4033e+00, -2.0635e+00, -2.8238e+00, -2.8718e+00, -3.5119e+00, -2.5542e+00, -4.0085e-01, 8.0336e-01]], [[ 1.7254e+00, -3.0139e+00, -3.0873e+00, -2.7819e+00, -1.8007e+00, -2.7836e+00, -2.2590e+00, -2.5083e+00, -1.3147e+00, -2.8172e+00]], [[-1.0872e+00, -4.2609e+00, -5.0595e+00, -3.8094e+00, -3.1497e+00, -3.7098e+00, -2.8342e+00, -3.6721e+00, -3.8087e+00, -3.5783e+00]], [[ 1.5135e+00, -2.0874e+00, -3.1651e+00, -2.7430e+00, -3.0255e+00, -2.7886e+00, -3.8830e+00, -2.1148e+00, -1.6949e+00, -2.8180e+00]], [[-8.8264e+00, -8.9894e+00, -1.4883e+01, -1.6883e+01, -1.8837e+01, -1.6039e+01, -2.3571e+01, -6.0723e+00, 8.1710e+00, 5.4941e-01]]], [[[-3.0942e+00, -7.4916e+00, -6.3175e+00, -4.4136e+00, -4.2549e+00, -5.8310e+00, -4.7978e+00, -3.3874e+00, -3.5579e+00, -5.6129e+00]], [[-2.1439e+00, -5.4310e+00, -3.6959e+00, -4.9395e+00, -5.1370e+00, -6.0026e+00, -5.8999e+00, -1.2859e+00, -2.1427e+00, -4.6310e+00]], [[ 3.4008e-03, -2.3167e+00, -2.9642e+00, -2.7726e+00, -2.3566e+00, -3.7802e+00, -3.1838e+00, -1.7744e+00, -3.0453e+00, -4.3731e+00]], [[-1.3164e+00, -6.0568e+00, -3.9381e+00, -4.2015e+00, -4.1879e+00, -2.5650e+00, -4.8390e+00, -3.7620e+00, -3.9241e+00, -3.2633e+00]], [[ 1.7525e+00, -3.5506e+00, -4.4006e+00, -5.1350e+00, -2.1311e+00, -1.2235e+00, -2.0277e+00, -1.5476e+00, -1.0362e+00, -1.0432e+00]], [[-1.7612e+00, -6.6719e+00, -5.1124e+00, -5.7133e+00, -7.1565e+00, -4.9046e+00, -5.3644e+00, -3.7484e+00, -4.1946e+00, -2.7859e+00]], [[-1.7838e+00, -4.5614e+00, -5.3708e+00, -5.3295e+00, -4.9751e+00, -4.0606e+00, -4.5996e+00, -3.5911e+00, -4.0599e+00, -4.7914e+00]], [[ 4.7195e-02, -5.1183e+00, -2.2446e+00, -3.6278e+00, -2.1901e+00, 3.6380e-01, -2.5191e+00, -2.4413e+00, -1.5808e+00, 1.7856e+00]], [[ 1.6873e+00, -5.0220e+00, -4.5142e+00, -3.7062e+00, -2.9419e+00, -8.1928e-01, -2.3707e+00, -2.0564e+00, -1.6621e+00, -2.9367e+00]], [[-9.7514e-01, -3.5785e+00, -3.5677e+00, -3.9127e+00, -2.5667e+00, -4.5686e+00, -3.4091e+00, -2.5349e+00, -3.3977e+00, -4.7594e+00]], [[ 1.3079e+00, -3.9476e+00, -3.1466e+00, -4.5555e+00, -4.0235e+00, -3.5326e+00, -1.8289e+00, -2.4627e+00, -2.5869e+00, -3.3517e+00]], [[-7.5509e+00, -1.1089e+01, -8.0675e+00, -9.1486e+00, 2.0586e-01, -2.8517e+00, -1.9204e+01, -5.0056e-01, 1.3736e+01, -2.4940e-01]]], [[[-3.8267e+00, -7.2274e+00, -6.2555e+00, -3.5257e+00, -5.1738e+00, -7.3378e+00, -5.8517e+00, -3.6452e+00, -3.6379e+00, -4.5497e+00]], [[-2.8673e+00, -4.9690e+00, -4.8505e+00, -5.6244e+00, -7.5032e+00, -4.4492e+00, -5.4000e+00, -1.8776e+00, -1.6477e+00, -3.9015e+00]], [[-2.3930e-01, -2.7958e+00, -3.4112e+00, -3.3701e+00, -4.2153e+00, -4.1940e+00, -2.8719e+00, -2.4645e+00, -3.0587e+00, -4.5654e+00]], [[-3.0233e+00, -5.4252e+00, -3.3005e+00, -3.2000e+00, -5.1562e+00, -1.7912e+00, -1.9310e+00, -2.7087e+00, -2.9222e+00, -4.5369e+00]], [[ 1.1118e+00, -3.2204e+00, -2.4415e+00, -2.9002e+00, -9.0216e-01, -1.6444e+00, -3.2190e+00, -2.1786e+00, -4.3880e-01, -6.5314e-01]], [[-2.4001e+00, -5.8670e+00, -4.5381e+00, -4.8386e+00, -6.7733e+00, -6.2625e+00, -5.5774e+00, -3.8689e+00, -4.2786e+00, -5.2924e+00]], [[-2.3619e+00, -5.0203e+00, -5.4311e+00, -5.4288e+00, -5.2804e+00, -4.2113e+00, -4.3265e+00, -3.9171e+00, -4.1435e+00, -4.8460e+00]], [[-9.6478e-02, -4.1427e+00, -3.0176e+00, -2.7813e+00, -1.4726e+00, -1.7486e+00, -2.3907e+00, -1.9289e+00, -6.2301e-01, 8.9234e-01]], [[ 1.6567e+00, -3.8525e+00, -3.2902e+00, -3.0773e+00, -2.9394e+00, -4.0467e+00, -2.1828e+00, -2.0028e+00, -2.0070e+00, -2.0842e+00]], [[-1.4295e+00, -2.9763e+00, -3.7734e+00, -3.7774e+00, -2.7035e+00, -3.8328e+00, -2.3756e+00, -2.5769e+00, -4.1214e+00, -2.9068e+00]], [[ 1.2492e+00, -3.3082e+00, -3.4182e+00, -3.4085e+00, -2.8536e+00, -3.3770e+00, -3.6017e+00, -3.2252e+00, -3.7412e+00, -3.0530e+00]], [[-7.6135e+00, -1.4563e+01, -1.9278e+01, -1.4622e+01, -1.8069e+01, -1.3888e+01, -1.8626e+01, -8.4118e+00, 7.9123e+00, -1.2235e+00]]]]) attn_weights tensor([[[[ 1.9943e+00, -4.2663e+00, -3.8905e+00, -3.3862e+00, 2.4115e-01, -5.0490e-01, -2.1549e+00, -1.0895e+00, -1.2492e+00, -1.0773e+00]], [[ 4.3798e+00, -1.0221e+01, -7.4569e+00, -3.6811e+00, 2.9392e+00, 5.3263e-01, -7.4849e+00, -6.7235e+00, -3.3320e+00, -9.9119e-01]], [[ 6.4693e-02, -2.7194e+00, -3.6182e+00, -5.3551e+00, -3.2739e+00, -2.6759e+00, -2.7698e+00, -2.3351e+00, -2.1976e+00, -4.2820e+00]], [[-2.4868e-01, -1.0045e+00, -2.5898e+00, -2.6965e+00, -2.5482e+00, -2.0172e+00, -1.5989e+00, -1.2270e+00, -1.3752e+00, -2.1232e+00]], [[-4.4911e-01, -3.8347e+00, -5.0098e+00, -5.0203e+00, -2.8512e+00, -2.1992e+00, -1.7794e+00, -8.6841e-01, -2.4712e+00, -2.6061e+00]], [[ 1.7745e+00, -5.0060e+00, -3.6681e+00, -3.3549e+00, 5.3638e-01, -7.9352e-01, -4.0571e+00, -2.4619e+00, -2.4847e+00, -3.7198e+00]], [[ 9.6244e-01, -4.6784e+00, -3.0568e+00, -4.2632e+00, -4.5467e+00, -3.0295e+00, -4.1407e+00, -1.5949e+00, 1.9763e-01, -1.6989e+00]], [[ 6.3201e-01, -3.7750e+00, -5.8789e+00, -6.2435e+00, -4.3752e+00, -3.6820e+00, -2.3351e+00, -3.7879e+00, -4.2109e+00, -4.6508e+00]], [[ 8.6460e-01, -4.7844e+00, -4.7103e+00, -4.8154e+00, 3.9846e-01, -1.3828e+00, -3.0295e+00, -1.7907e+00, -2.6283e+00, -3.4979e+00]], [[ 5.6012e-01, -2.6142e+00, -3.3720e+00, -3.4752e+00, -2.2936e+00, -1.6790e+00, -1.5669e+00, -1.6824e+00, -2.6488e+00, -3.3383e+00]], [[ 1.5842e+00, -1.1151e+00, -8.4445e-01, -7.7031e-01, 6.0438e-01, -4.4454e-01, 1.3742e+00, 1.5837e+00, -3.4677e-02, -7.8604e-01]], [[ 9.9134e-01, -2.9614e+00, -2.8105e+00, -4.5242e-01, -8.0074e-01, -2.4521e+00, -3.8079e+00, -2.0706e+00, -2.0188e+00, 2.8271e-01]]], [[[ 2.0312e+00, -4.0360e+00, -4.1221e+00, -8.5134e-01, -1.6336e+00, -1.0359e+00, -2.4255e+00, -1.9337e+00, -7.4776e-01, -9.4966e-01]], [[ 4.2229e+00, -7.3423e+00, -6.7914e+00, 1.4581e+00, -1.7727e+00, -2.0277e+00, -7.6816e+00, -8.2086e+00, -4.8148e+00, -7.1895e-01]], [[-9.0811e-02, -2.3736e+00, -2.9314e+00, -1.1383e+00, -6.9287e-01, -2.1669e+00, -2.4733e+00, -2.8219e+00, -3.1740e+00, -3.3586e+00]], [[ 6.5297e-02, -3.9905e-01, -1.6240e+00, -4.8947e-01, -1.5631e+00, -2.3289e+00, -1.7405e+00, -2.1642e+00, -9.1703e-01, -1.9265e+00]], [[-2.0061e-02, -4.5836e+00, -6.3713e+00, -3.3558e+00, -3.1490e+00, -2.6699e+00, -2.0210e+00, -2.9873e+00, -2.0801e+00, -3.2736e+00]], [[ 1.3970e+00, -3.3745e+00, -3.4751e+00, -4.2148e-01, -7.3599e-01, -6.7198e-01, -3.1649e+00, -2.4802e+00, -1.8566e+00, -2.2976e+00]], [[ 1.1232e+00, -5.6055e+00, -6.9360e+00, -7.2231e+00, -5.8819e+00, -3.1653e+00, -4.0132e+00, -2.2521e+00, 4.3810e-01, -2.0751e+00]], [[ 9.9324e-01, -4.1226e+00, -5.6915e+00, -6.1508e+00, -4.9808e+00, -4.9538e+00, -1.9234e+00, -4.2187e+00, -2.9829e+00, -3.9737e+00]], [[ 7.5642e-01, -3.8180e+00, -4.1111e+00, 1.8940e-01, -3.5135e-03, -1.5285e+00, -3.5282e+00, -2.8549e+00, -2.0789e+00, -1.3307e+00]], [[ 6.6843e-01, -2.5455e+00, -3.4168e+00, -2.9651e+00, -2.4520e+00, -2.0469e+00, -2.3854e+00, -2.1009e+00, -2.5510e+00, -3.1697e+00]], [[ 1.7932e+00, -1.1055e+00, -1.1008e+00, -1.1479e+00, 5.9882e-01, 5.9012e-01, 2.1116e+00, 1.6577e+00, -1.0511e+00, -3.1588e-01]], [[ 9.9492e-01, -2.7062e+00, -1.7645e+00, -1.7546e+00, -1.1360e+00, -3.3412e+00, -4.2590e+00, -2.5250e+00, -1.9288e+00, 3.8038e-02]]], [[[ 2.2895e+00, -4.4893e+00, -4.8016e+00, -1.6245e+00, -1.1966e+00, -1.3134e+00, -2.7742e+00, -2.4428e+00, -2.5855e+00, -1.4047e+00]], [[ 4.4989e+00, -6.3279e+00, -5.1063e+00, 1.5785e+00, -1.5168e+00, -2.5202e+00, -8.3295e+00, -9.0121e+00, -6.4754e+00, -1.8729e+00]], [[ 1.7948e-01, -2.7948e+00, -4.2023e+00, -3.2903e+00, -2.2165e+00, -2.3076e+00, -2.0227e+00, -2.7214e+00, -2.6618e+00, -3.1576e+00]], [[ 1.3467e-01, -1.0214e+00, -1.7262e+00, -1.2092e+00, -2.0347e+00, -2.1576e+00, -2.0740e+00, -2.0459e+00, -1.3872e+00, -1.6226e+00]], [[ 4.7475e-02, -4.5705e+00, -6.2605e+00, -3.5392e+00, -3.8664e+00, -3.1153e+00, -2.1440e+00, -3.5997e+00, -1.4172e+00, -2.8005e+00]], [[ 1.6611e+00, -3.0435e+00, -3.0216e+00, -5.3034e-01, -8.4064e-01, -7.8383e-01, -3.2690e+00, -2.9929e+00, -2.3108e+00, -2.7791e+00]], [[ 1.6753e+00, -4.5723e+00, -6.2149e+00, -6.7415e+00, -5.5814e+00, -2.8387e+00, -4.4570e+00, -2.6368e+00, -5.7182e-01, -2.6532e+00]], [[ 9.4557e-01, -4.3037e+00, -5.4012e+00, -5.7879e+00, -4.9636e+00, -4.9688e+00, -1.6799e+00, -4.9587e+00, -2.6496e+00, -3.4295e+00]], [[ 7.7235e-01, -2.6223e+00, -4.0384e+00, -4.6504e-01, 3.7336e-02, -1.2827e+00, -2.9825e+00, -2.3080e+00, -3.0514e+00, -2.4355e+00]], [[ 8.0030e-01, -2.4870e+00, -3.5171e+00, -3.1582e+00, -2.7774e+00, -2.5155e+00, -2.6954e+00, -2.7284e+00, -3.3663e+00, -3.3736e+00]], [[ 2.0153e+00, -1.5693e+00, -1.4951e+00, -1.4235e+00, 2.9907e-01, 2.2341e-01, 1.7911e+00, 1.4342e+00, -1.1854e+00, -1.1691e+00]], [[ 9.6412e-01, -3.1774e+00, -2.2081e+00, -2.6833e+00, -2.3372e+00, -2.9177e+00, -4.5373e+00, -2.8688e+00, -1.5371e+00, -7.5921e-01]]], [[[ 2.3183e+00, -6.6559e+00, -6.1706e+00, -6.7583e+00, -7.4574e+00, -2.4396e+00, 1.6209e+00, 6.6534e-01, -2.2364e+00, -2.4908e+00]], [[ 4.4356e+00, -1.9070e+01, -1.7582e+01, -1.4491e+01, -1.4096e+01, -5.1143e+00, -4.5233e+00, -4.8523e+00, -6.6369e+00, -3.1607e+00]], [[ 2.7611e-01, -3.1785e+00, -4.3825e+00, -3.9608e+00, -2.0468e+00, -3.1620e+00, -2.0433e+00, -1.3042e+00, -1.3943e+00, -3.0767e+00]], [[ 1.8833e-01, -1.4521e+00, -2.5800e+00, -1.5670e+00, -1.6358e+00, -2.3444e+00, -1.7912e+00, -9.7137e-01, -1.1746e+00, -2.1225e+00]], [[-1.5045e-01, -4.3364e+00, -4.3170e+00, -4.3500e+00, -4.4392e+00, -2.7528e+00, -2.8034e+00, -1.1674e+00, -1.2220e+00, -3.1381e+00]], [[ 2.5301e+00, -1.4008e+01, -1.0071e+01, -8.6471e+00, -7.5198e+00, -4.4559e+00, -3.8165e+00, -3.5564e+00, -2.1009e+00, -3.2961e+00]], [[ 1.1955e+00, -5.5290e+00, -5.7458e+00, -5.1567e+00, -3.6307e+00, -1.7360e+00, -4.3325e+00, -1.7078e+00, -1.3626e+00, -2.4159e+00]], [[ 1.4778e+00, -6.7526e+00, -7.0278e+00, -6.4976e+00, -4.2088e+00, -3.6273e+00, -2.1587e+00, -4.1725e+00, -3.9217e+00, -2.6995e+00]], [[ 6.7927e-01, -7.3985e+00, -7.5066e+00, -6.5876e+00, -6.3407e+00, -3.8006e+00, -1.4001e+00, -1.6570e+00, -2.8110e+00, -2.6790e+00]], [[ 1.2481e+00, -4.3574e+00, -4.1459e+00, -3.9721e+00, -3.3867e+00, -1.4306e+00, -1.0515e+00, -1.2116e+00, -2.4821e+00, -4.1518e+00]], [[ 3.0233e+00, -2.5684e+00, -2.1392e+00, -1.3017e+00, -9.4736e-01, 1.8817e+00, 1.8626e+00, 7.7333e-01, -8.6893e-01, 1.0233e+00]], [[ 9.0988e-01, -4.6210e+00, -4.0555e+00, -4.3310e+00, -4.0105e+00, -2.4630e+00, -2.8372e+00, -2.1727e+00, -2.4109e+00, -2.6643e+00]]], [[[ 1.7160e+00, -4.4367e+00, -5.6512e+00, -4.0282e+00, -5.1789e+00, -1.0149e+00, 2.2217e-01, -5.2337e-01, -1.9481e+00, -2.3960e+00]], [[ 4.3099e+00, -1.4165e+01, -1.1942e+01, -8.8681e+00, -7.9734e+00, -1.1817e+00, -6.5087e+00, -8.7503e+00, -6.2162e+00, -2.7952e+00]], [[-1.0730e-01, -3.1318e+00, -4.7069e+00, -3.2331e+00, -2.4644e+00, -2.0898e+00, -1.4535e+00, -1.3304e+00, -1.5457e+00, -3.4761e+00]], [[-1.9231e-02, -1.3697e+00, -2.1416e+00, -1.7808e+00, -2.0691e+00, -2.2685e+00, -2.6947e+00, -1.7395e+00, -1.7437e+00, -2.5246e+00]], [[-2.6476e-01, -4.2414e+00, -4.2287e+00, -3.5047e+00, -4.2615e+00, -1.9995e+00, -2.0821e+00, -1.6776e+00, -5.8001e-02, -2.4009e+00]], [[ 1.7358e+00, -9.3356e+00, -6.1293e+00, -5.1979e+00, -5.4177e+00, -1.1415e+00, -3.7339e+00, -2.3755e+00, -1.9364e+00, -2.9034e+00]], [[ 8.3814e-01, -4.7982e+00, -4.7223e+00, -5.2066e+00, -5.9301e+00, -3.6386e+00, -5.8719e+00, -3.6150e+00, -9.7634e-01, -3.2836e+00]], [[ 8.0179e-01, -3.8078e+00, -4.4804e+00, -5.1129e+00, -4.1485e+00, -2.6526e+00, -1.6088e+00, -2.9264e+00, -2.3162e+00, -2.6529e+00]], [[ 5.2814e-01, -6.5633e+00, -6.4356e+00, -5.2587e+00, -6.3708e+00, -7.3172e-01, -1.5797e+00, -5.4980e-01, -1.0950e+00, -3.9553e+00]], [[ 6.3528e-01, -3.1028e+00, -3.7592e+00, -3.5797e+00, -2.5365e+00, -2.0479e+00, -1.8129e+00, -1.7673e+00, -2.2171e+00, -2.8521e+00]], [[ 1.8783e+00, -5.7904e-01, -4.0995e-01, -2.1178e-01, -3.6789e-02, 2.0946e-01, 1.2067e+00, 1.3048e+00, -9.6748e-02, -1.3901e+00]], [[ 8.8093e-01, -3.5581e+00, -3.4297e+00, -3.8962e+00, -1.5867e+00, -1.8722e+00, -3.5920e+00, -2.0349e+00, -2.1631e+00, 7.9901e-02]]]]) attn_weights tensor([[[[-1.1240e+00, -3.8250e+00, -2.9900e+00, -4.5846e+00, -4.6378e+00, -4.7275e+00, -3.7883e+00, -3.1817e+00, -1.0721e+00, -3.1393e+00]], [[-1.0884e+00, -3.6033e+00, -3.8744e+00, -4.2849e+00, -1.8437e+00, -1.2253e+00, -1.7274e+00, -3.3679e+00, -2.6995e+00, -3.1474e+00]], [[ 6.3332e-02, -2.3286e+00, -2.7274e+00, -2.9878e+00, -3.6832e+00, -3.6919e+00, -3.3940e+00, -2.2139e+00, -2.3730e+00, -3.1540e+00]], [[-2.4892e-01, -1.9227e+00, -3.7752e+00, -2.8214e+00, -1.2013e+00, -2.4358e+00, -2.4147e+00, -1.2560e+00, -2.8202e+00, -2.8257e+00]], [[ 9.3373e-01, -1.0952e+00, -1.9492e+00, -2.1228e+00, -1.4046e+00, -2.8902e+00, -1.7240e+00, -1.0733e+00, -2.0020e+00, -2.6783e+00]], [[-9.7759e-01, -3.6314e+00, -4.3237e+00, -4.0624e+00, -4.2521e+00, -3.9686e+00, -3.6815e+00, -3.7829e+00, -3.1652e+00, -2.9750e+00]], [[ 1.6573e+00, -2.7913e+00, -1.6051e+00, -8.2845e-01, -7.9751e-01, -1.9847e+00, -2.4817e+00, -8.1766e-01, 3.2489e-01, 5.5271e-01]], [[-8.8579e-01, -3.9245e+00, -4.8980e+00, -4.5435e+00, -3.9474e+00, -2.1265e+00, -1.2140e+00, -2.1025e+00, -3.8895e+00, -3.5125e+00]], [[-1.9737e+00, -4.0411e+00, -3.7627e+00, -6.2591e+00, -4.7817e+00, -3.1460e+00, -3.8946e+00, -2.0954e+00, -1.5422e+00, -4.1502e+00]], [[ 3.8388e+00, -5.8413e+00, -5.4786e+00, -3.1166e+00, 1.8137e+00, 2.7454e-01, -5.0549e+00, -3.8954e+00, -4.1875e+00, -2.4349e+00]], [[ 2.5900e+00, -3.6120e+00, -2.1183e+00, -1.4418e+00, -5.6042e-01, -1.0963e+00, -2.5214e-01, -9.8757e-01, -3.1694e-01, 2.7902e-01]], [[-9.4743e-01, -2.4212e+00, -3.8035e+00, -4.8999e+00, -3.2966e+00, -2.9134e+00, -2.7685e+00, -1.0248e+00, -8.6401e-01, -2.5431e+00]]], [[[-7.4567e-01, -3.7842e+00, -3.7982e+00, -2.7968e+00, -2.9887e+00, -3.8808e+00, -3.0530e+00, -3.8433e+00, -2.7946e+00, -2.7181e+00]], [[-4.8573e-01, -3.2703e+00, -4.8454e+00, -1.7969e+00, -2.2553e+00, -2.8208e+00, -3.4617e+00, -3.2966e+00, -2.1971e+00, -3.1477e+00]], [[ 2.9304e-01, -2.7430e+00, -2.5883e+00, -3.1615e+00, -3.4598e+00, -3.7434e+00, -3.4044e+00, -2.4362e+00, -2.7537e+00, -2.8395e+00]], [[-6.9826e-02, -2.6203e+00, -4.0848e+00, -2.6639e+00, -8.5795e-01, -2.1042e+00, -1.6839e+00, -9.1405e-01, -1.1565e+00, -3.1722e+00]], [[ 1.0672e+00, -9.6084e-01, -1.9435e+00, -1.7356e+00, -1.3646e+00, -2.6680e+00, -1.3877e+00, -6.6669e-01, -1.7851e+00, -2.6949e+00]], [[-6.6582e-01, -4.0044e+00, -4.5142e+00, -3.4301e+00, -4.0238e+00, -4.6498e+00, -3.4593e+00, -4.4522e+00, -3.4296e+00, -2.5628e+00]], [[ 2.0752e+00, -2.6800e+00, -6.0279e-01, -8.5651e-01, -1.0527e+00, -2.4879e+00, -3.0207e+00, -1.3418e+00, -1.0227e-01, 1.0035e+00]], [[-7.9984e-01, -3.5817e+00, -4.5331e+00, -3.6022e+00, -2.8650e+00, -1.5429e+00, -3.0227e-01, -1.9662e+00, -3.2138e+00, -4.1350e+00]], [[-1.7064e+00, -4.6435e+00, -4.7586e+00, -5.5103e+00, -5.3169e+00, -4.3862e+00, -4.2050e+00, -3.8671e+00, -2.2332e+00, -3.4743e+00]], [[ 3.8284e+00, -5.0569e+00, -5.0300e+00, 1.6285e+00, -1.8034e+00, -1.4496e+00, -5.5391e+00, -4.8013e+00, -3.8280e+00, -1.0876e+00]], [[ 2.9187e+00, -3.5690e+00, -3.4063e+00, -2.9159e+00, -1.7140e+00, -2.0358e+00, -1.2183e+00, -1.5366e+00, -7.7401e-01, -4.5903e-01]], [[ 1.1935e-02, -2.8778e+00, -4.5462e+00, -4.8153e+00, -4.4650e+00, -5.2654e+00, -4.1640e+00, -3.9153e+00, -1.2987e+00, -2.5812e+00]]], [[[-7.7178e-01, -4.1683e+00, -3.6559e+00, -2.8299e+00, -3.1697e+00, -3.9556e+00, -3.1211e+00, -3.9743e+00, -3.2896e+00, -2.6465e+00]], [[ 5.5570e-02, -3.5493e+00, -5.3986e+00, -2.9030e+00, -2.4543e+00, -2.7144e+00, -3.0662e+00, -3.1220e+00, -4.7472e+00, -3.7823e+00]], [[ 2.3568e-01, -2.7693e+00, -2.6085e+00, -3.0538e+00, -3.3134e+00, -3.4088e+00, -3.3247e+00, -2.2232e+00, -2.6903e+00, -2.6299e+00]], [[-1.8640e-01, -2.6088e+00, -3.2812e+00, -2.0854e+00, -7.4759e-01, -2.1329e+00, -1.1187e+00, -9.1226e-01, -8.3588e-01, -2.3441e+00]], [[ 1.1440e+00, -1.0659e+00, -1.7225e+00, -1.3018e+00, -1.0053e+00, -2.7839e+00, -1.3357e+00, -8.2371e-01, -1.4065e+00, -1.6373e+00]], [[-6.9608e-01, -3.9812e+00, -4.5521e+00, -3.2960e+00, -3.8304e+00, -4.4171e+00, -3.4871e+00, -4.1369e+00, -2.4555e+00, -3.0763e+00]], [[ 2.1776e+00, -2.2975e+00, -6.9813e-01, -9.8962e-01, -1.8474e+00, -2.6134e+00, -3.3807e+00, -1.8090e+00, -5.8805e-01, 7.9548e-01]], [[-9.9789e-01, -3.4583e+00, -4.4962e+00, -3.3520e+00, -2.3332e+00, -1.5030e+00, -3.2151e-01, -1.7797e+00, -3.3293e+00, -3.7225e+00]], [[-1.4952e+00, -5.0002e+00, -5.5467e+00, -6.3479e+00, -5.6082e+00, -4.5477e+00, -4.4286e+00, -4.0254e+00, -2.8734e+00, -3.7114e+00]], [[ 4.0780e+00, -4.5231e+00, -3.6409e+00, 1.6757e+00, -2.3023e+00, -1.3966e+00, -5.6451e+00, -4.6426e+00, -3.7644e+00, -1.7936e+00]], [[ 2.6732e+00, -3.3679e+00, -3.0981e+00, -2.7011e+00, -1.8667e+00, -2.3048e+00, -1.5109e+00, -1.4497e+00, -1.4605e+00, -3.0229e-01]], [[-3.4991e-01, -2.8893e+00, -4.5664e+00, -4.9056e+00, -4.3753e+00, -5.0551e+00, -3.8521e+00, -3.6762e+00, -2.1759e+00, -3.1646e+00]]], [[[-1.0794e+00, -3.5953e+00, -3.9065e+00, -3.5589e+00, -2.4497e+00, -3.9215e+00, -2.8807e+00, -1.4876e+00, -1.4534e+00, -3.8941e+00]], [[ 1.1870e-01, -3.7730e+00, -3.4292e+00, -4.6218e+00, -3.3199e+00, -2.3187e+00, -1.3917e+00, -1.6194e+00, -3.0605e+00, -2.6668e+00]], [[ 4.1077e-01, -3.4651e+00, -3.5863e+00, -3.7931e+00, -3.5112e+00, -3.8045e+00, -3.3641e+00, -2.4245e+00, -2.3221e+00, -3.7766e+00]], [[ 7.3247e-01, -3.5885e+00, -5.0502e+00, -4.9283e+00, -3.9702e+00, -3.2896e+00, -2.9255e+00, -3.4080e+00, -4.1256e+00, -4.2745e+00]], [[ 2.1480e+00, -3.5236e+00, -3.1099e+00, -3.4775e+00, -3.1379e+00, -7.4920e-01, -4.7956e-01, -1.7095e+00, -2.4327e+00, -4.0592e-01]], [[-2.2502e-01, -3.8906e+00, -4.4102e+00, -4.4593e+00, -4.3272e+00, -3.7136e+00, -3.6932e+00, -3.2576e+00, -3.1255e+00, -3.1767e+00]], [[ 2.3873e+00, -4.1509e+00, -4.8325e+00, -5.1781e+00, -3.7498e+00, -1.4503e+00, -1.0339e+00, -1.9290e+00, -1.6688e+00, -2.1925e-01]], [[ 3.0636e-01, -3.6853e+00, -3.5550e+00, -3.6522e+00, -4.1531e+00, -3.2719e+00, -2.2058e+00, -3.5840e+00, -4.1438e+00, -1.6488e+00]], [[-5.6920e-01, -5.8953e+00, -6.7344e+00, -7.0852e+00, -4.9319e+00, -4.0559e+00, -3.4828e+00, -3.5275e+00, -2.8635e+00, -3.7794e+00]], [[ 4.9873e+00, -1.4813e+01, -1.1940e+01, -1.1422e+01, -6.9075e+00, -2.9576e+00, -5.5007e+00, -4.1100e+00, -4.0842e+00, -1.6170e+00]], [[ 3.1463e+00, -6.0835e+00, -4.7746e+00, -4.7544e+00, -3.8904e+00, -2.1570e+00, -1.3779e+00, -2.6188e+00, -2.5939e+00, -2.5294e+00]], [[-3.9840e-01, -3.2587e+00, -3.7537e+00, -3.8205e+00, -2.6450e+00, -3.9135e+00, -2.8036e+00, -9.8345e-01, -1.2009e+00, -2.9910e+00]]], [[[-1.8819e+00, -4.4723e+00, -3.6314e+00, -2.2745e+00, -2.2311e+00, -3.0813e+00, -2.6869e+00, -2.8184e+00, -1.5279e+00, -3.6111e+00]], [[-1.5960e+00, -4.2515e+00, -3.1256e+00, -4.9014e+00, -3.5175e+00, 7.9754e-02, -2.7675e-01, -1.7594e+00, -3.5640e+00, -3.3364e+00]], [[ 2.5518e-01, -3.5354e+00, -3.4299e+00, -4.4100e+00, -4.2154e+00, -4.6324e+00, -4.3212e+00, -3.1946e+00, -3.5016e+00, -3.7843e+00]], [[ 3.4141e-01, -3.4852e+00, -4.6373e+00, -4.3667e+00, -3.6238e+00, -3.9831e+00, -3.6577e+00, -3.2443e+00, -3.3051e+00, -3.9552e+00]], [[ 1.4042e+00, -1.5738e+00, -2.2464e+00, -2.2043e+00, -1.9090e+00, -2.1682e+00, -1.5265e+00, -1.0786e+00, -1.5804e+00, -2.4565e+00]], [[-8.0641e-01, -4.3689e+00, -5.1483e+00, -5.4359e+00, -4.8080e+00, -4.6719e+00, -4.0417e+00, -4.3381e+00, -2.8006e+00, -3.4440e+00]], [[ 1.9753e+00, -4.0140e+00, -4.2720e+00, -4.2400e+00, -1.8152e+00, -1.9722e+00, -1.8824e+00, -2.0026e+00, -2.1879e+00, 3.7729e-01]], [[-7.2578e-01, -4.0151e+00, -4.4783e+00, -4.0317e+00, -3.8660e+00, -2.8282e+00, -1.7011e+00, -2.8988e+00, -4.6397e+00, -4.1833e+00]], [[-1.9192e+00, -5.3075e+00, -5.9409e+00, -5.9876e+00, -5.2854e+00, -3.7464e+00, -3.9092e+00, -4.1349e+00, -3.5157e+00, -4.8806e+00]], [[ 3.4827e+00, -8.9393e+00, -7.0195e+00, -4.0614e+00, -4.1177e+00, 4.1053e-01, -5.2599e+00, -3.4012e+00, -4.0831e+00, -2.2146e-01]], [[ 3.1279e+00, -4.6572e+00, -3.7287e+00, -3.4325e+00, -3.3450e+00, -2.4622e+00, -1.3874e+00, -2.6921e+00, -2.7160e+00, -1.6920e+00]], [[-6.5141e-01, -4.2100e+00, -4.8035e+00, -3.7554e+00, -3.2620e+00, -4.1088e+00, -3.6592e+00, -2.7406e+00, -6.4533e-01, -2.3991e+00]]]]) attn_weights tensor([[[[-5.6689e-01, -5.9636e+00, -5.3437e+00, -6.5440e+00, -5.9696e+00, -3.8050e+00, -4.6354e+00, -3.0968e+00, -2.1940e+00, -3.6409e+00]], [[ 2.2951e+00, -2.2858e+00, -2.0181e+00, -3.5661e+00, -7.5168e-01, -4.6977e-01, 7.7755e-01, 8.9294e-01, -8.0999e-02, -1.8457e+00]], [[ 5.8894e+00, -4.2281e+00, -4.1733e+00, -2.7402e+00, 1.6844e+00, 1.1434e+00, -1.6922e+00, -2.3825e+00, -2.3767e+00, -6.3501e-01]], [[ 2.1727e-01, -2.9776e+00, -3.3476e+00, -3.5739e+00, -2.1216e+00, -2.2815e+00, -1.8575e+00, -9.0335e-01, -1.5259e+00, -2.0151e+00]], [[ 6.1704e-01, -3.6563e+00, -3.7417e+00, -4.2316e+00, -3.7626e+00, -3.4031e+00, -2.4025e+00, -3.0637e+00, -3.7851e+00, -4.3417e+00]], [[ 2.9166e-01, -9.8374e-01, -1.2924e+00, -1.1037e+00, -6.9956e-01, -3.7381e+00, -1.3280e+00, 5.3005e-02, -1.3288e+00, -1.9718e+00]], [[ 1.0795e+00, -2.9415e+00, -2.8853e+00, -3.1291e+00, -2.7937e+00, -1.7121e+00, -1.9497e+00, -2.4875e+00, -2.6429e+00, -2.5901e+00]], [[ 2.2802e+00, -2.1799e+00, -2.5544e+00, -2.6793e+00, -6.7917e-01, 8.5172e-01, 1.3871e+00, 1.4668e+00, -7.2546e-01, -7.0013e-01]], [[-9.2661e-01, -3.8550e+00, -2.7885e+00, -3.7763e+00, -2.6149e+00, -1.5547e+00, -7.8915e-01, -1.6123e+00, -1.6656e+00, -3.2625e+00]], [[-1.9413e-01, -1.6519e+00, -2.4697e+00, -3.9839e+00, -4.1638e+00, -2.7152e+00, -1.8831e+00, -1.2147e+00, -1.1001e+00, -2.8643e+00]], [[ 3.0807e+00, -2.5515e+00, -3.6004e+00, -2.9286e+00, 6.3311e-01, -1.7642e+00, -3.5887e+00, -1.7636e+00, -2.0592e+00, -1.7134e+00]], [[ 2.5827e+00, -3.4913e+00, -3.0058e+00, -1.6029e+00, 8.1724e-01, -9.1764e-01, -2.9838e+00, -3.6889e+00, -2.4450e+00, -8.2732e-01]]], [[[-4.2979e-01, -6.4953e+00, -7.5400e+00, -5.8352e+00, -6.1409e+00, -5.3541e+00, -5.5487e+00, -4.4485e+00, -2.4173e+00, -3.9692e+00]], [[ 2.7539e+00, -1.8592e+00, -1.9200e+00, -2.6135e+00, -7.4552e-03, -4.5933e-01, 1.3538e+00, 1.4497e+00, 1.8443e-01, -6.0628e-01]], [[ 6.3710e+00, -3.3790e+00, -3.9432e+00, 5.5473e-01, -8.7185e-01, -7.1958e-02, -2.7913e+00, -2.8144e+00, -9.0102e-01, -2.1795e-01]], [[ 3.0184e-01, -3.0636e+00, -3.2637e+00, -2.1663e+00, -1.5656e+00, -2.5765e+00, -1.7011e+00, -1.4973e+00, -1.0208e+00, -2.0437e+00]], [[ 8.6004e-01, -2.7685e+00, -3.3405e+00, -2.7578e+00, -3.1279e+00, -3.6791e+00, -3.0116e+00, -3.8964e+00, -3.7747e+00, -3.9097e+00]], [[ 7.1763e-01, -3.5984e-02, -6.4789e-01, 7.0253e-01, -7.4658e-03, -4.7076e+00, -1.7235e+00, -1.9091e-01, -4.9550e-01, -2.2834e+00]], [[ 1.4196e+00, -1.9475e+00, -2.3393e+00, -2.1570e+00, -2.6056e+00, -1.8857e+00, -1.7767e+00, -1.8147e+00, -1.2820e+00, -2.1872e+00]], [[ 3.5560e+00, -2.0832e+00, -2.8549e+00, -3.5122e+00, -1.2362e+00, -1.0807e+00, -6.9741e-01, 2.2036e-01, 4.2917e-01, -9.1087e-01]], [[-7.7202e-01, -3.0787e+00, -4.0414e+00, -3.1063e+00, -1.7153e+00, -1.7643e+00, -5.3233e-01, -8.5439e-01, -1.6583e+00, -2.7512e+00]], [[ 1.6800e-01, -7.8739e-01, -1.6564e+00, -2.2034e+00, -2.6830e+00, -2.7840e+00, -1.5201e+00, -1.6375e+00, -5.2553e-01, -1.6954e+00]], [[ 3.7632e+00, -1.5009e+00, -3.3359e+00, 1.0749e+00, -1.9401e+00, -2.1635e+00, -2.6561e+00, -1.5052e+00, -1.2192e+00, -2.6541e-01]], [[ 3.2722e+00, -2.7444e+00, -2.9165e+00, 2.0889e+00, -1.1459e+00, -1.7418e+00, -3.6614e+00, -2.9358e+00, -2.5851e+00, -3.8522e-01]]], [[[-5.1481e-01, -6.6217e+00, -7.7427e+00, -7.0733e+00, -7.5026e+00, -5.8282e+00, -6.1020e+00, -5.1645e+00, -2.7458e+00, -4.1636e+00]], [[ 2.8315e+00, -1.6202e+00, -2.0189e+00, -2.3846e+00, 1.6384e-01, -7.7204e-01, 1.2353e+00, 1.7868e+00, -9.0499e-02, -3.6695e-01]], [[ 6.3698e+00, -2.2099e+00, -2.7554e+00, 1.7571e+00, -1.2247e+00, -1.9618e-01, -2.5566e+00, -2.9895e+00, -7.4410e-01, 1.4823e-01]], [[ 1.9652e-01, -3.0296e+00, -3.3684e+00, -2.2027e+00, -1.8394e+00, -2.8453e+00, -1.9814e+00, -1.5971e+00, 5.9984e-01, -1.5715e+00]], [[ 1.0931e+00, -3.1248e+00, -3.6923e+00, -3.6248e+00, -3.5696e+00, -4.5778e+00, -3.9971e+00, -4.8572e+00, -4.0060e+00, -3.8999e+00]], [[ 8.6951e-01, 4.4875e-01, -6.4441e-01, 1.9699e-01, -9.9458e-01, -3.9506e+00, -9.1511e-01, 2.2336e-01, 4.6567e-01, -1.7197e+00]], [[ 1.5332e+00, -2.1007e+00, -2.3396e+00, -2.5601e+00, -2.3527e+00, -2.3345e+00, -2.1882e+00, -2.1074e+00, -1.7869e+00, -2.0925e+00]], [[ 3.7580e+00, -1.9843e+00, -2.8904e+00, -3.2117e+00, -1.0778e+00, -1.0229e+00, -1.0542e+00, -4.6962e-01, -1.2685e+00, -1.3899e+00]], [[-6.1847e-01, -3.7621e+00, -4.1478e+00, -3.8157e+00, -2.7337e+00, -2.3420e+00, -1.2842e+00, -2.2007e+00, -1.6151e+00, -2.8378e+00]], [[ 2.5358e-01, -7.0557e-01, -1.0875e+00, -2.1163e+00, -2.1483e+00, -3.2184e+00, -2.0499e+00, -2.4668e+00, -1.0985e+00, -2.1371e+00]], [[ 4.2840e+00, -7.3590e-01, -2.2002e+00, 1.9630e+00, -1.2627e+00, -2.0946e+00, -1.9118e+00, -1.2052e+00, -7.3079e-01, -3.2028e-01]], [[ 3.4969e+00, -2.9431e+00, -2.7233e+00, 2.0517e+00, -1.4943e+00, -2.2649e+00, -3.4776e+00, -2.6554e+00, -2.2037e+00, -8.0622e-01]]], [[[-8.6311e-01, -4.7650e+00, -3.7576e+00, -4.2928e+00, -2.7600e+00, -4.4479e+00, -4.2240e+00, -6.8453e-01, -1.3628e-01, -3.4830e+00]], [[ 4.1015e+00, -5.5342e+00, -3.8901e+00, -4.2501e+00, -4.1997e+00, -2.7367e+00, -1.0770e-01, -7.4969e-01, -1.5513e+00, 1.1071e-01]], [[ 6.4441e+00, -6.5787e+00, -7.2476e+00, -6.4098e+00, -4.3735e+00, -1.0837e-01, 9.3118e-01, -1.6685e+00, -1.8134e+00, 1.0169e+00]], [[ 7.0128e-01, -5.6413e+00, -5.2083e+00, -6.5872e+00, -6.2556e+00, -2.0373e+00, -2.5489e+00, -4.0182e+00, -4.0821e+00, -1.6893e+00]], [[ 8.1465e-01, -5.9718e+00, -5.2184e+00, -5.4048e+00, -4.9082e+00, -3.7717e+00, -3.8280e+00, -3.6692e+00, -2.9104e+00, -3.2622e+00]], [[ 9.1897e-01, -3.2764e+00, -2.5315e+00, -2.8196e+00, -1.5396e+00, -3.5242e+00, -2.0362e+00, -1.2065e+00, -7.6916e-01, -3.6770e+00]], [[ 1.6440e+00, -4.1760e+00, -3.8757e+00, -5.1946e+00, -4.0988e+00, -2.0985e+00, -1.3777e+00, -2.7368e+00, -1.5937e+00, -1.4164e+00]], [[ 2.4610e+00, -5.4069e+00, -5.6292e+00, -6.0130e+00, -4.8355e+00, -2.0638e+00, 3.8165e-01, 7.6836e-01, -8.8122e-01, -8.3615e-01]], [[ 3.4328e-01, -6.0987e+00, -4.9165e+00, -4.9162e+00, -4.9728e+00, -4.2820e+00, -3.3696e+00, -3.8334e+00, -4.3314e+00, -3.2170e+00]], [[ 4.0420e-01, -4.1638e+00, -4.1592e+00, -5.4924e+00, -5.5593e+00, -2.2862e+00, -2.6362e+00, -2.1939e+00, -2.5717e+00, -3.1682e+00]], [[ 4.6471e+00, -8.7224e+00, -8.0866e+00, -7.7851e+00, -6.3853e+00, -1.2528e+00, -1.0566e+00, -2.1414e+00, -3.7292e+00, -1.2908e+00]], [[ 2.7117e+00, -4.2245e+00, -5.1587e+00, -6.4009e+00, -4.0048e+00, -9.3809e-02, 6.3409e-01, -9.3850e-01, -2.3201e+00, -6.1426e-01]]], [[[-8.8823e-01, -5.7773e+00, -6.5617e+00, -4.9233e+00, -4.7571e+00, -4.1241e+00, -4.5229e+00, -3.7856e+00, -2.1367e+00, -4.1357e+00]], [[ 2.8133e+00, -3.0931e+00, -1.8733e+00, -2.8381e+00, -2.0475e+00, -1.9340e+00, -2.8473e-02, 2.8799e-01, -2.2352e+00, -7.4467e-01]], [[ 5.9991e+00, -4.9474e+00, -5.5890e+00, -4.8847e+00, -3.4960e+00, 6.7337e-01, -4.1829e+00, -6.0899e+00, -4.1665e+00, 3.2940e-01]], [[ 1.1101e-01, -3.7105e+00, -3.0847e+00, -4.3378e+00, -4.0291e+00, -4.9321e-01, -4.4846e-01, -1.0102e+00, -1.1276e+00, -2.2183e+00]], [[ 8.1254e-01, -4.5501e+00, -4.2225e+00, -3.9722e+00, -4.8660e+00, -3.6394e+00, -2.5663e+00, -3.7727e+00, -3.3777e+00, -5.3168e+00]], [[ 1.3079e+00, -3.3177e+00, -2.4458e+00, -2.4966e+00, -3.4877e+00, -3.6073e+00, -1.9170e+00, -2.4984e+00, -3.3662e+00, -3.1492e+00]], [[ 1.2748e+00, -3.3172e+00, -3.5681e+00, -4.3692e+00, -4.1111e+00, -2.0166e+00, -1.6252e+00, -2.3341e+00, -3.3612e+00, -2.6577e+00]], [[ 1.3689e+00, -4.1055e+00, -4.5042e+00, -4.3025e+00, -3.1262e+00, 4.3435e-02, 2.4626e+00, 2.4023e-01, -6.0089e-01, -1.6264e+00]], [[-1.2605e+00, -3.9081e+00, -2.9019e+00, -1.6328e+00, -1.9556e+00, -9.7088e-01, -1.4093e+00, -1.9857e+00, -3.6920e+00, -4.2725e+00]], [[-3.3821e-01, -3.1414e+00, -3.2459e+00, -4.1479e+00, -4.1147e+00, -1.8027e+00, -1.7144e+00, -2.7148e+00, -8.2121e-01, -2.9500e+00]], [[ 2.5980e+00, -4.8642e+00, -5.1543e+00, -4.2703e+00, -3.3699e+00, 3.2208e-01, -2.7143e+00, -2.4649e+00, -3.8095e+00, -2.6312e+00]], [[ 1.5086e+00, -4.0366e+00, -4.1665e+00, -4.5717e+00, -2.6061e+00, 1.9127e-01, -2.2782e+00, -3.8032e+00, -5.1199e+00, -2.5409e+00]]]]) attn_weights tensor([[[[ 8.9732e-01, -2.8390e+00, -2.3809e+00, -2.7554e+00, -1.9986e+00, -4.0807e+00, -1.9751e+00, -2.7654e+00, -1.7131e+00, -1.9430e+00]], [[ 3.1760e+00, -3.0693e+00, -3.2085e+00, -2.7552e+00, 1.8707e+00, 5.3912e-01, -1.6160e+00, -2.2334e+00, -2.0109e+00, -1.6276e+00]], [[ 1.7768e+00, -1.7984e+00, -2.5976e+00, -2.6251e+00, -1.0550e+00, -4.6768e-01, -7.6573e-01, -1.3432e+00, -2.5427e+00, -2.2171e+00]], [[ 2.9361e+00, -2.5794e+00, -2.3932e+00, -2.3761e+00, -1.8488e+00, -8.5080e-01, -5.3871e-01, -1.2299e+00, -1.1497e+00, -1.2277e+00]], [[-8.9967e-01, -3.2649e+00, -3.3660e+00, -4.9371e+00, -3.4102e+00, -3.0717e+00, -2.3055e+00, -2.2434e+00, -2.4108e+00, -4.2740e+00]], [[-1.2409e+00, -3.6338e+00, -3.5066e+00, -4.7506e+00, -4.0682e+00, -2.6515e+00, -3.2658e+00, -1.9302e+00, -1.9939e+00, -3.8617e+00]], [[ 1.2169e+00, -3.6474e+00, -3.9568e+00, -4.5923e+00, -1.0484e+00, 6.9731e-01, 1.0536e+00, -1.4623e+00, -3.0060e+00, -3.4755e+00]], [[-7.7548e-01, -6.2165e+00, -4.5153e+00, -6.3420e+00, -4.8344e+00, -2.4641e+00, -2.5019e+00, -2.8771e+00, -2.1155e+00, -4.3131e+00]], [[-5.1767e-02, -2.8836e+00, -3.6239e+00, -3.9245e+00, -2.9089e+00, -1.2304e+00, -7.6152e-01, -8.7678e-01, -2.9885e+00, -3.2881e+00]], [[ 8.6382e-01, -3.6222e+00, -3.4593e+00, -3.9631e+00, -2.7666e+00, -1.2213e+00, -8.0281e-01, -1.7217e+00, -2.0924e+00, -2.2823e+00]], [[ 1.1912e+00, -3.7176e+00, -3.2978e+00, -3.4025e+00, -1.1885e+00, -1.1324e+00, -8.1445e-01, -2.5688e-01, -9.5171e-01, -1.0918e+00]], [[ 8.4162e-01, -3.5075e+00, -3.8241e+00, -3.2938e+00, -3.5542e+00, -1.9255e+00, -2.3608e+00, -3.0170e+00, -4.3306e+00, -3.7773e+00]]], [[[ 1.0944e+00, -1.9328e+00, -1.5809e+00, -2.5229e+00, -1.8686e+00, -4.0444e+00, -1.8371e+00, -2.6444e+00, -3.1731e+00, -1.7210e+00]], [[ 4.8728e+00, -2.7277e+00, -3.8867e+00, 6.6323e-01, -2.5548e-01, -1.2716e+00, -2.4632e+00, -2.4866e+00, -1.5959e+00, -1.6104e+00]], [[ 2.1421e+00, -1.1811e+00, -2.6257e+00, -4.0959e-01, -1.2308e+00, -7.7767e-01, -1.2713e+00, -1.4844e+00, -1.9416e+00, -2.3487e+00]], [[ 2.6916e+00, -2.0080e+00, -2.3422e+00, -2.1322e+00, -1.7882e+00, -1.4687e+00, -1.7127e+00, -9.0895e-01, -1.0953e+00, -2.6783e+00]], [[-3.4202e-01, -2.7636e+00, -3.2376e+00, -3.4857e+00, -3.2343e+00, -2.8485e+00, -2.2414e+00, -2.1856e+00, -1.2319e+00, -2.6925e+00]], [[-9.8194e-01, -2.6256e+00, -3.0833e+00, -3.0458e+00, -2.9301e+00, -3.0544e+00, -2.6518e+00, -1.9129e+00, -1.7895e+00, -3.0530e+00]], [[ 2.3045e+00, -2.1241e+00, -1.9622e+00, -1.6508e+00, -3.2788e-01, -1.7584e+00, -1.3081e+00, -1.3813e+00, -1.5239e-01, -1.9771e+00]], [[-2.4881e-01, -4.8862e+00, -6.1275e+00, -6.3205e+00, -5.3746e+00, -4.5574e+00, -4.2876e+00, -3.5205e+00, -2.4710e+00, -4.0768e+00]], [[ 4.5881e-01, -1.9708e+00, -2.6572e+00, -2.8598e+00, -2.0662e+00, -1.1838e+00, -6.5308e-01, -2.1579e-01, -5.1189e-01, -2.7140e+00]], [[ 9.6156e-01, -3.7126e+00, -3.3302e+00, -3.6181e+00, -2.7945e+00, -1.3160e+00, -6.0326e-01, -1.9651e+00, -1.9606e+00, -2.4593e+00]], [[ 1.1701e+00, -3.2473e+00, -2.6992e+00, -1.9127e+00, -1.1376e+00, -2.5401e+00, -2.2461e+00, -1.6390e+00, -9.7133e-01, -1.8424e+00]], [[ 1.1468e+00, -2.2285e+00, -3.4470e+00, -1.7857e+00, -3.6668e+00, -1.8962e+00, -1.4526e+00, -2.0954e+00, -2.8739e+00, -3.9356e+00]]], [[[ 1.2021e+00, -2.3398e+00, -1.9188e+00, -2.6478e+00, -2.0942e+00, -4.1539e+00, -1.9414e+00, -3.1649e+00, -2.5062e+00, -2.4891e+00]], [[ 5.3810e+00, -1.9552e+00, -3.2128e+00, 1.0123e+00, -3.6297e-03, -1.6755e+00, -2.6742e+00, -2.3826e+00, -2.0222e+00, -1.3138e+00]], [[ 2.3140e+00, -1.3053e+00, -3.0362e+00, -6.7487e-01, -1.3951e+00, -1.1217e+00, -1.4538e+00, -1.5902e+00, -1.4886e+00, -2.5611e+00]], [[ 3.1408e+00, -2.1569e+00, -2.4842e+00, -2.3021e+00, -1.8709e+00, -2.5416e+00, -2.0421e+00, -1.6354e+00, -2.0585e+00, -3.0751e+00]], [[-1.6979e-01, -2.5318e+00, -3.5482e+00, -4.2504e+00, -3.9404e+00, -2.7994e+00, -2.3773e+00, -2.2267e+00, -8.6022e-01, -2.0987e+00]], [[-7.2897e-01, -2.5066e+00, -3.1634e+00, -3.3716e+00, -3.4242e+00, -3.6692e+00, -2.9500e+00, -2.3608e+00, -5.3967e-01, -2.7693e+00]], [[ 2.7198e+00, -1.9087e+00, -2.1131e+00, -1.7329e+00, -6.3785e-01, -2.7161e+00, -1.7647e+00, -1.5567e+00, -1.1054e+00, -1.7551e+00]], [[-2.8580e-01, -4.6227e+00, -6.6685e+00, -6.9430e+00, -6.0678e+00, -4.9990e+00, -5.0116e+00, -3.6430e+00, -3.2554e+00, -3.9845e+00]], [[ 7.1935e-01, -2.1516e+00, -3.0613e+00, -3.2470e+00, -2.6039e+00, -1.3913e+00, -9.4403e-01, -5.4899e-01, -7.7536e-01, -3.0065e+00]], [[ 9.9303e-01, -3.4018e+00, -2.9942e+00, -3.3191e+00, -2.8260e+00, -1.8626e+00, -7.7790e-01, -2.1201e+00, -2.0892e+00, -1.9923e+00]], [[ 1.2300e+00, -3.5003e+00, -3.3347e+00, -2.3248e+00, -1.7049e+00, -2.9778e+00, -2.5426e+00, -2.2746e+00, -1.7015e+00, -2.2865e+00]], [[ 1.6034e+00, -1.9531e+00, -3.6514e+00, -2.2067e+00, -4.1923e+00, -2.3158e+00, -1.6327e+00, -2.2471e+00, -3.5654e+00, -4.2441e+00]]], [[[ 8.3142e-01, -3.2167e+00, -3.4154e+00, -3.5022e+00, -2.7417e+00, -4.0331e+00, -2.6257e+00, -1.2734e+00, -1.9976e+00, -3.5041e+00]], [[ 3.3347e+00, -3.3482e+00, -4.4591e+00, -4.6784e+00, -3.1281e+00, 6.1593e-01, 2.5417e+00, -3.0365e-02, -1.0065e+00, -8.7989e-01]], [[ 2.1562e+00, -2.4596e+00, -3.3946e+00, -3.1041e+00, -1.3923e+00, -1.8297e+00, -1.6383e+00, -1.6457e+00, -5.8795e-01, -1.9854e+00]], [[ 2.4487e+00, -2.9356e+00, -1.8456e+00, -2.4233e+00, -1.5711e+00, -4.3249e-01, 1.2793e+00, 1.2178e+00, -8.4204e-02, -1.5329e+00]], [[ 3.8213e-01, -6.2715e+00, -6.5925e+00, -6.0801e+00, -3.8673e+00, -5.4188e+00, -4.3666e+00, -4.0019e+00, -3.4687e+00, -3.1628e+00]], [[-8.3480e-01, -5.0027e+00, -4.6984e+00, -4.7711e+00, -3.3795e+00, -3.2972e+00, -3.7165e+00, -2.2202e+00, -1.7485e+00, -3.3609e+00]], [[ 2.1661e+00, -4.1448e+00, -4.0196e+00, -4.7297e+00, -4.2467e+00, 7.1486e-01, 1.4282e+00, -1.3291e+00, -1.2959e+00, -1.2862e+00]], [[-1.0902e+00, -5.4325e+00, -4.9189e+00, -3.8261e+00, -2.0017e+00, -4.1487e+00, -3.6597e+00, -1.3489e+00, 3.5088e-01, -3.3117e+00]], [[ 1.0505e+00, -4.6137e+00, -3.7765e+00, -3.7894e+00, -3.5923e+00, -1.4722e+00, -1.1573e+00, -2.4734e+00, -3.1586e+00, -1.0378e+00]], [[ 1.4447e+00, -5.0607e+00, -5.2264e+00, -5.7332e+00, -4.3571e+00, -9.6226e-01, -1.5133e+00, -3.0568e+00, -2.2262e+00, -1.5577e-01]], [[ 1.2963e+00, -4.1860e+00, -3.5006e+00, -4.1002e+00, -3.5910e+00, -1.6778e-01, 2.2487e-02, -9.0365e-01, -1.6906e+00, 1.5650e-01]], [[ 5.6568e-01, -4.4438e+00, -3.2539e+00, -3.4460e+00, -3.8648e+00, -1.4937e+00, -1.4537e+00, -2.5197e+00, -3.3048e+00, -2.0610e+00]]], [[[ 6.8174e-01, -3.6088e+00, -2.9343e+00, -3.3599e+00, -2.0325e+00, -4.7419e+00, -1.9398e+00, -2.9785e+00, -2.9617e+00, -7.6968e-01]], [[ 3.1708e+00, -2.6186e+00, -4.0802e+00, -3.1299e+00, -2.4964e+00, 1.3480e-01, 4.1629e-01, -3.2385e+00, -2.0040e+00, -4.8411e-01]], [[ 7.3637e-01, -5.0079e-01, -1.5202e+00, -1.7527e+00, -2.5581e-01, 2.2153e-01, 5.8268e-01, -8.6532e-01, -1.1720e+00, -1.4781e+00]], [[ 3.5336e+00, -2.7414e+00, -1.7307e+00, -3.0953e+00, -2.8316e+00, -1.7224e-01, 2.9901e+00, 8.8200e-01, -4.4466e-01, -3.3328e-01]], [[ 3.5147e-01, -5.1202e+00, -4.5978e+00, -5.3408e+00, -5.3252e+00, -4.6323e+00, -3.6266e+00, -5.5108e+00, -1.9522e+00, -3.2332e+00]], [[-1.1523e+00, -4.1154e+00, -4.4763e+00, -3.5078e+00, -4.1017e+00, -2.8297e+00, -2.5432e+00, -3.1535e+00, -9.8393e-01, -3.2302e+00]], [[ 5.6424e-01, -4.0459e+00, -3.9624e+00, -5.7776e+00, -4.4796e+00, 3.1951e+00, 2.4750e+00, -2.9727e+00, -4.1170e+00, -3.5279e+00]], [[-1.1881e+00, -7.0278e+00, -5.5729e+00, -4.6040e+00, -3.9170e+00, -3.7890e+00, -3.7604e+00, -4.4818e+00, -3.5862e+00, -4.3918e+00]], [[-5.0125e-01, -1.4993e+00, -2.3887e+00, -2.6384e+00, -2.7824e+00, 2.2275e-01, 1.3274e+00, 5.6684e-01, -4.1120e+00, -3.4641e+00]], [[ 1.1280e+00, -3.2471e+00, -2.3875e+00, -2.9809e+00, -1.8415e+00, -9.8158e-02, -6.7474e-01, -1.8851e+00, -3.2635e+00, -2.6932e+00]], [[ 1.1268e+00, -4.1837e+00, -3.7719e+00, -4.7436e+00, -3.0296e+00, 3.2102e-01, 1.2277e-02, -1.3531e+00, -1.5912e+00, 1.5369e-01]], [[ 2.0845e+00, -1.4590e+00, -2.9506e+00, -2.9372e+00, -3.3251e+00, -9.6192e-01, -1.5350e+00, -1.6970e+00, -5.8350e+00, -2.8705e+00]]]]) attn_weights tensor([[[[ 2.1219, -2.4070, -1.6356, -1.8316, -1.9670, 1.4540, 1.6863, -0.8485, -1.6707, -1.4016]], [[ 2.7888, -2.7337, -2.6052, -2.0592, -0.0338, -1.5732, -0.7580, -2.5979, -1.6227, -1.0497]], [[ 1.4016, -3.1653, -2.5837, -3.3475, -2.4613, 0.5000, 0.4233, -1.1570, -2.1159, -2.4503]], [[-1.0278, -3.1983, -3.1259, -4.8129, -5.1899, -2.1077, -1.8087, -2.2710, -2.0893, -3.8381]], [[ 3.3082, -3.1764, -3.4485, -3.6357, -2.1587, -1.1193, 0.3783, -1.3530, -2.5777, -2.7033]], [[ 1.8768, -3.7896, -3.4965, -3.1601, -2.4889, -1.3617, -1.3068, -2.6659, -2.8220, -2.0252]], [[ 3.9918, -3.4945, -3.5037, -3.1679, -1.0600, 0.6346, 0.6661, -2.2448, -1.7845, -1.2260]], [[ 0.4725, -3.6228, -3.9296, -4.3507, -2.5195, -1.7113, -1.9056, -2.9639, -3.3367, -3.8200]], [[ 1.5378, -2.7854, -3.0936, -3.1709, -2.5845, -0.1225, -0.1785, -2.1595, -2.4633, -2.1500]], [[ 4.5286, -2.4460, -1.7624, -1.2299, 0.7782, 0.4386, 1.0666, -1.7048, -0.7758, -0.0661]], [[ 0.2590, -3.5028, -1.8599, -3.9994, -3.1123, -2.1939, -1.4993, -1.1647, -0.1326, -2.1709]], [[ 3.5019, -1.6594, -2.5603, -0.4049, 0.1849, -1.5387, -1.4959, -2.8354, -2.6559, -0.0960]]], [[[ 1.7968, -0.6468, -2.1488, -1.8594, -2.1123, -0.1067, 1.2047, 0.0925, -1.6679, -2.3332]], [[ 3.8142, -0.6792, -1.6848, 0.4439, -0.3570, -2.4017, -1.5477, -1.7693, -0.6886, -1.5742]], [[ 1.5877, -1.3842, -2.4629, -2.9295, -1.7190, -1.0953, -0.3018, -0.3282, -1.3873, -2.7970]], [[-0.9142, -2.4209, -3.2827, -2.8685, -4.5170, -2.1408, -1.3031, -1.6220, -1.2262, -2.9227]], [[ 2.9681, -1.8265, -3.3758, -3.3090, -2.6571, -3.1399, -2.3833, -1.9824, -3.1022, -4.3562]], [[ 1.9068, -2.4698, -2.6768, -2.6240, -2.6449, -2.6274, -2.7040, -2.6574, -2.5914, -2.6521]], [[ 3.3311, -2.9408, -3.9807, -1.5382, -1.9453, -2.2771, -1.5479, -2.6750, -2.4504, -2.6487]], [[ 0.5740, -2.8725, -4.2262, -2.9274, -2.5970, -3.4023, -2.6345, -2.3300, -2.5922, -4.0774]], [[ 1.9103, -3.1620, -3.3745, -2.5399, -2.5962, -1.3162, -0.5482, -2.3387, -1.9040, -3.1557]], [[ 4.5838, -2.4094, -2.6272, 0.1282, -0.8636, -1.1816, -0.0216, -1.8904, -1.9253, -2.2665]], [[ 0.5821, -2.5952, -3.1545, -2.6788, -2.7179, -1.9806, -1.4208, -1.2217, 0.2308, -1.6370]], [[ 3.7698, -1.8384, -2.8066, 1.1437, -1.4220, -3.2441, -2.3092, -3.4122, -2.1104, -3.0461]]], [[[ 1.8951, -0.6077, -2.1043, -1.8854, -2.3156, -0.7313, 0.7632, 0.1109, -1.9903, -1.9412]], [[ 3.9931, -0.5849, -2.1994, 0.1965, -0.4966, -2.7230, -1.9124, -1.6701, -0.4184, -1.5953]], [[ 1.9521, -1.5169, -2.4087, -2.7500, -1.4827, -2.1336, -1.0113, -0.6125, -1.1916, -2.1246]], [[-0.6590, -2.8158, -3.9068, -3.7174, -5.2270, -2.7353, -2.2949, -2.5235, -1.2967, -3.5241]], [[ 2.9985, -1.5342, -2.8648, -3.0960, -2.3130, -3.8549, -2.4280, -1.8083, -2.3323, -3.2113]], [[ 2.0481, -2.0807, -2.5182, -2.7613, -2.9297, -2.9792, -3.1177, -2.8803, -2.7208, -2.9256]], [[ 3.6176, -2.4696, -3.8720, -0.9524, -1.9398, -2.7189, -1.9418, -2.6410, -2.6058, -2.8516]], [[ 0.7087, -3.1109, -4.6911, -3.4533, -3.1052, -3.9484, -3.2839, -2.5775, -2.4313, -4.0561]], [[ 2.2576, -2.9255, -3.1391, -2.7101, -2.8760, -1.9968, -1.2225, -2.6084, -1.3651, -2.7240]], [[ 4.8187, -2.0760, -2.6485, 0.3217, -1.2053, -1.6298, -0.2057, -1.7402, -1.5543, -2.1810]], [[ 0.7292, -2.7021, -3.4279, -3.2873, -3.2861, -2.6845, -1.8507, -1.6738, 0.6335, -1.2603]], [[ 3.6582, -1.8372, -2.6520, 1.0165, -1.2611, -3.2318, -2.3994, -3.8635, -3.1266, -2.9687]]], [[[ 2.3338, -4.7773, -3.2014, -2.5574, -4.0185, -0.1643, 0.7663, -3.3054, -3.2077, -0.3181]], [[ 3.2545, -4.5729, -4.6298, -4.5300, -4.0705, -1.7332, 0.5273, -3.3177, -2.7675, -0.4844]], [[ 2.1325, -5.6341, -3.8506, -3.7193, -3.8981, -0.4373, -0.4628, -2.9960, -3.5004, -0.7183]], [[-0.9546, -4.2094, -4.2593, -3.4875, -2.1671, -3.8217, -3.6363, -1.9401, -0.1595, -3.1499]], [[ 3.4163, -3.7153, -3.9534, -4.1376, -3.4565, -1.1144, 1.0478, -1.4491, -2.3821, -2.1926]], [[ 1.9946, -3.8048, -4.2406, -4.0660, -3.0406, -1.6533, -1.3472, -2.3717, -0.9859, -0.6384]], [[ 3.8467, -4.1687, -4.8598, -4.1198, -4.3420, 0.9401, 2.0736, -2.8352, -3.0271, 0.1245]], [[ 0.4651, -4.1432, -4.7084, -5.4917, -4.3889, -2.7060, -3.4811, -3.8008, -4.5016, -4.6058]], [[ 2.3801, -3.6284, -4.0006, -2.7148, -3.3830, -0.6813, -1.4297, -2.8899, -3.3164, -0.5640]], [[ 4.6542, -2.8879, -3.3520, -3.4423, -2.4608, 2.1579, 2.5496, -1.2524, -1.4634, 1.1564]], [[ 0.9870, -4.6406, -4.6411, -4.4938, -2.2733, -3.9083, -4.1586, -2.6486, -0.8875, -2.9725]], [[ 3.3569, -2.0047, -3.7282, -2.8079, -2.9366, -1.9644, -0.7849, -1.8480, -1.8834, -1.2126]]], [[[ 2.0182, -1.3553, -0.4270, -0.1565, -0.9781, 3.1895, 2.0811, -0.8055, -2.4681, -1.9861]], [[ 4.1001, -2.5026, -5.0280, -4.2256, -2.4328, -0.8483, 0.5467, -3.1326, -1.7627, -0.0153]], [[ 1.2996, -2.5196, -1.8449, -2.2407, -1.6372, 1.8387, 0.8512, -1.2473, -2.5020, -1.2758]], [[-1.4711, -3.6129, -3.8010, -3.1324, -3.2715, -1.7291, -1.5872, -2.1911, -0.2461, -1.2927]], [[ 3.9247, -2.3745, -2.8330, -3.3333, -3.1396, 0.0748, 1.9862, -1.4564, -1.9968, -1.3997]], [[ 2.0690, -3.9596, -3.6665, -3.2392, -2.0906, -0.6713, -0.5442, -2.3241, -0.0695, 1.0046]], [[ 4.7574, -2.0276, -2.3565, -2.4667, -3.0063, 1.1480, 0.6019, -1.6289, -1.5937, -1.5695]], [[ 0.3275, -4.1623, -3.4421, -4.2230, -3.5093, 1.2884, 0.3866, -2.8984, -5.0364, -5.2356]], [[ 1.7337, -1.7800, -2.6701, -1.5278, -2.1906, 1.1486, 1.2479, -1.4698, -3.2671, -3.6927]], [[ 6.2774, -0.6214, -0.4890, -1.3136, -0.2821, 2.7484, 2.3490, 0.4207, 0.4814, 2.3687]], [[ 0.8604, -4.9529, -4.9984, -4.9890, -4.0211, -3.3624, -3.6664, -4.8592, -1.1466, -1.7879]], [[ 3.9286, -1.3309, -3.1262, -1.3687, -0.9466, -1.0413, -0.9294, -2.8557, -2.9144, -0.9862]]]]) attn_weights tensor([[[[ 2.6038e+00, -2.8731e+00, -3.2582e+00, -2.8387e+00, -2.3358e+00, 9.5209e-01, 2.3964e-02, -2.3242e+00, -3.3365e+00, -2.6327e+00]], [[ 3.8587e+00, -1.2434e+00, -2.2451e+00, -8.0034e-01, -2.9590e-01, 1.1467e+00, 2.1461e-01, -1.5269e+00, -1.9948e+00, 1.9371e-01]], [[ 3.3142e+00, -8.5431e-01, -1.5213e+00, -1.6262e+00, -7.0560e-01, 8.0007e-01, 1.3039e+00, -3.3824e-01, -9.9534e-01, -2.7412e-01]], [[ 2.9238e+00, -3.1740e-01, -1.9054e+00, -1.4641e+00, -3.8635e-01, 4.0939e-01, 2.3549e-01, -9.2362e-01, -1.5182e+00, -9.8126e-01]], [[ 1.9253e+00, -1.1172e+00, -1.4956e+00, -1.5890e+00, -6.6692e-01, 1.2153e-01, 7.6951e-01, -4.8664e-01, -7.7265e-01, -9.1749e-01]], [[ 9.9058e-01, -1.3648e+00, -1.9288e+00, -3.2459e+00, -2.2340e+00, -1.5507e+00, -1.9238e+00, -8.5506e-01, -9.9243e-01, -2.2711e+00]], [[ 3.1714e+00, -2.6814e+00, -2.6798e+00, -2.4173e+00, -1.3075e+00, 4.2645e-01, 1.1309e+00, -2.0185e+00, -2.1765e+00, -1.8550e+00]], [[ 1.6107e+00, -2.1400e+00, -1.7458e+00, -2.3343e+00, -1.2642e+00, 9.3029e-01, -6.7215e-01, -6.2989e-01, -1.3769e+00, -1.3776e+00]], [[ 3.3459e+00, -1.8796e+00, -2.1874e+00, -1.9787e+00, 1.0707e+00, -8.1146e-01, -1.2767e+00, -1.2813e+00, -1.3208e+00, -9.1313e-01]], [[ 7.0734e-01, -3.0884e+00, -2.7036e+00, -2.3467e+00, -1.9286e+00, -1.2351e+00, -1.2321e+00, -1.1139e+00, -1.7930e+00, -1.6910e+00]], [[ 3.3590e+00, -2.0810e+00, -1.6178e+00, -1.4989e+00, -1.3378e+00, -6.4736e-02, -4.7165e-01, -1.7191e+00, -1.4633e+00, -1.1877e+00]], [[ 4.6757e+00, -1.6827e-02, 1.6249e+00, -6.0169e-01, 7.8123e-01, 2.1424e+00, 2.9909e+00, 2.3956e+00, 2.9335e+00, 1.3378e+00]]], [[[ 2.7751e+00, -3.7577e+00, -3.9950e+00, -2.9393e+00, -3.6317e+00, 1.1962e-01, -2.8929e-01, -2.8775e+00, -3.5098e+00, -4.0639e+00]], [[ 3.7541e+00, -1.6744e+00, -1.1539e+00, 2.0015e+00, -1.5570e+00, -1.3109e+00, -7.9201e-01, -1.1407e+00, -1.1685e+00, -3.7138e-01]], [[ 3.3553e+00, -1.7769e+00, -2.0300e+00, -9.5345e-01, -1.1147e+00, -2.0818e+00, -4.5339e-01, -1.6206e+00, -5.2236e-01, -1.5184e+00]], [[ 3.1306e+00, -6.3974e-01, -2.4978e+00, -9.8565e-01, -1.2034e+00, 3.5476e-01, 3.0426e-01, -1.1496e+00, -1.4314e+00, -2.1219e+00]], [[ 2.3826e+00, -6.8209e-01, -1.1100e+00, -5.0663e-01, -1.1239e-01, -5.6924e-01, 7.7142e-01, -4.4371e-01, 4.7881e-02, -5.5616e-01]], [[ 1.0685e+00, -1.5786e+00, -2.6401e+00, -2.9489e+00, -2.6857e+00, -2.0024e+00, -2.5370e+00, -1.7081e+00, -1.1009e+00, -2.2712e+00]], [[ 3.2528e+00, -2.9922e+00, -3.8014e+00, -1.9528e+00, -2.1262e+00, -8.9307e-01, 6.5190e-01, -2.6518e+00, -2.5082e+00, -3.1242e+00]], [[ 2.8138e+00, -1.6053e+00, -1.0369e+00, -6.6088e-01, -1.2787e+00, -2.2407e+00, -1.6203e+00, -9.1431e-01, -3.4484e-01, -6.4731e-01]], [[ 3.5212e+00, -1.5122e+00, -2.8424e+00, -5.8584e-01, -1.3111e+00, -2.2596e+00, -1.9504e+00, -2.8690e+00, -1.6557e+00, -2.5494e+00]], [[ 1.4385e+00, -4.0223e+00, -3.2801e+00, -2.9602e+00, -2.8466e+00, -2.2027e+00, -2.4622e+00, -3.3219e+00, -3.4213e+00, -2.9855e+00]], [[ 3.5076e+00, -2.1986e+00, -2.2615e+00, -6.2093e-01, -2.4773e+00, -1.3281e+00, -9.0250e-01, -2.0276e+00, -1.4280e+00, -2.0295e+00]], [[ 4.1461e+00, -3.5635e-01, -4.3911e-01, -1.6873e+00, -2.2081e+00, -9.8341e-01, -1.4835e-01, 9.5567e-01, 8.6115e-01, -3.0959e-02]]], [[[ 2.9351e+00, -3.6803e+00, -3.7878e+00, -2.7933e+00, -3.3823e+00, -4.6258e-01, -9.7174e-01, -2.7745e+00, -3.7307e+00, -3.4651e+00]], [[ 4.1086e+00, -1.5569e+00, -1.2229e+00, 1.8231e+00, -1.6946e+00, -1.8448e+00, -1.0462e+00, -1.3340e+00, -1.7605e+00, -2.9811e-01]], [[ 3.3524e+00, -1.7715e+00, -2.1173e+00, -9.9819e-01, -1.1492e+00, -2.5661e+00, -7.5303e-01, -1.8303e+00, -1.0849e+00, -1.6172e+00]], [[ 3.4476e+00, -4.9977e-01, -2.4782e+00, -1.0232e+00, -1.4716e+00, -2.3078e-01, 4.0310e-03, -1.5907e+00, -1.5761e+00, -1.6635e+00]], [[ 2.5792e+00, -9.3619e-01, -1.6366e+00, -8.6762e-01, -3.6252e-01, -1.2444e+00, 6.6096e-02, -3.3378e-01, -2.8108e-01, -1.0026e+00]], [[ 1.1008e+00, -1.6724e+00, -2.4561e+00, -3.0722e+00, -3.0548e+00, -2.3504e+00, -2.7902e+00, -2.2208e+00, -1.1337e+00, -2.4025e+00]], [[ 3.5132e+00, -2.7783e+00, -3.6158e+00, -1.6817e+00, -2.2420e+00, -1.4919e+00, 5.1143e-02, -2.6005e+00, -2.5207e+00, -2.9362e+00]], [[ 2.8290e+00, -2.1533e+00, -1.5132e+00, -1.2345e+00, -1.7414e+00, -2.7233e+00, -2.0340e+00, -1.2742e+00, -8.4464e-01, -9.3133e-01]], [[ 3.4510e+00, -1.3473e+00, -2.9640e+00, -7.1139e-01, -1.9603e+00, -2.5671e+00, -2.3696e+00, -3.1775e+00, -2.4783e+00, -2.7046e+00]], [[ 1.5447e+00, -3.9779e+00, -3.3313e+00, -3.3036e+00, -3.1110e+00, -2.9526e+00, -2.9878e+00, -3.6550e+00, -4.0843e+00, -2.8377e+00]], [[ 3.7530e+00, -2.0278e+00, -1.9833e+00, -2.7813e-01, -2.2461e+00, -1.7877e+00, -9.6425e-01, -1.8081e+00, -1.5889e+00, -1.8994e+00]], [[ 3.9702e+00, -6.0129e-01, -1.2083e+00, -2.1289e+00, -2.8688e+00, -1.4702e+00, -5.9950e-01, 4.5691e-01, 6.0761e-01, -3.1161e-01]]], [[[ 2.8631e+00, -3.3817e+00, -3.7898e+00, -3.5875e+00, -3.3363e+00, 1.1041e+00, 1.2540e+00, -2.4478e+00, -1.9746e+00, 4.9157e-01]], [[ 4.3655e+00, -2.4236e+00, -3.6682e+00, -3.1637e+00, -2.9964e+00, 1.3925e+00, 1.4702e+00, -1.4458e+00, -7.7857e-01, 1.6220e+00]], [[ 3.9001e+00, -2.6386e+00, -3.5446e+00, -4.0859e+00, -3.4072e+00, 2.0253e-01, 1.6484e+00, -2.0358e+00, -1.2160e+00, 6.4411e-02]], [[ 2.9670e+00, -2.9561e+00, -3.9205e+00, -3.8466e+00, -3.4359e+00, 4.1268e-01, 3.0273e-01, -1.9400e+00, -2.2232e+00, -8.3901e-01]], [[ 2.3698e+00, -3.0970e+00, -3.4134e+00, -4.0759e+00, -1.6427e+00, -1.0924e+00, -8.2384e-01, -1.8297e+00, -5.9688e-01, -9.0459e-01]], [[ 1.7027e+00, -3.5824e+00, -4.4407e+00, -4.8517e+00, -3.5305e+00, -3.6559e+00, -4.0378e+00, -2.9352e+00, -2.6092e+00, -3.6934e+00]], [[ 3.1457e+00, -3.9062e+00, -3.8253e+00, -3.2210e+00, -3.1690e+00, 4.6884e-01, 8.1372e-01, -2.0161e+00, -1.7986e+00, 5.4390e-01]], [[ 2.2508e+00, -2.6110e+00, -3.2770e+00, -3.7727e+00, -2.2053e+00, 1.6641e+00, 6.3089e-01, -6.0196e-01, -8.5646e-01, -3.7905e-01]], [[ 3.4686e+00, -1.9993e+00, -2.6225e+00, -3.2043e+00, -2.6951e+00, -9.9170e-01, -5.8868e-01, -1.2916e+00, -7.6859e-01, -4.5619e-01]], [[ 7.6249e-01, -5.0370e+00, -4.6553e+00, -4.9066e+00, -2.5003e+00, -2.5830e+00, -2.7723e+00, -2.7539e+00, -6.6235e-01, -1.7396e+00]], [[ 3.7717e+00, -2.0816e+00, -2.4184e+00, -2.4581e+00, -1.8994e+00, 8.2206e-01, 1.2496e+00, -8.6101e-01, -3.8942e-01, 9.8622e-01]], [[ 3.8838e+00, -1.2760e+00, -8.3134e-01, -1.5687e+00, 2.0308e-02, 2.6829e+00, 3.8388e+00, 9.5385e-01, 2.2208e+00, 9.3905e-02]]], [[[ 2.9502e+00, -7.1647e-01, -1.8282e+00, -1.6071e+00, -1.0837e+00, 3.0745e+00, 1.8561e+00, 1.9402e-01, -1.2964e+00, -9.7667e-01]], [[ 4.7269e+00, -6.1550e-01, -2.5057e+00, -2.2706e+00, -1.3683e+00, 1.1590e+00, -1.0972e-01, 8.8517e-02, 1.0594e+00, 1.8469e+00]], [[ 4.1333e+00, -6.0116e-01, -2.0402e+00, -2.9925e+00, -1.8000e+00, 1.3394e+00, 1.7543e+00, -1.3037e+00, -1.1980e+00, -2.7331e-02]], [[ 3.4964e+00, -1.2436e+00, -2.3791e+00, -2.0917e+00, -1.6946e+00, 6.6135e-01, -9.3671e-02, -1.0049e+00, -1.8384e+00, -1.3462e+00]], [[ 2.3851e+00, -1.5810e+00, -2.0910e+00, -2.1585e+00, -1.5640e+00, 2.0097e+00, 6.1874e-01, -1.9021e+00, -7.5456e-01, -6.5519e-01]], [[ 2.2736e+00, -4.1836e+00, -3.8288e+00, -4.4356e+00, -4.6412e+00, -3.2778e+00, -4.5276e+00, -3.7453e+00, -2.4974e+00, -3.3939e+00]], [[ 3.8927e+00, -1.0994e+00, -2.5176e+00, -1.7359e+00, -2.5582e-02, 1.2886e+00, 4.3120e-01, -2.2377e-01, -1.1421e+00, -7.9401e-01]], [[ 1.1515e+00, -3.2801e+00, -3.1619e+00, -3.9988e+00, -2.3882e+00, 3.1531e+00, 9.5191e-01, -9.7117e-01, -2.6185e+00, -1.3359e+00]], [[ 3.6785e+00, -1.3911e+00, -2.0949e+00, -2.9542e+00, -2.4278e+00, -1.4059e+00, -1.1700e+00, -2.5452e+00, -1.8346e+00, -6.9138e-02]], [[ 1.0140e+00, -3.6483e+00, -3.8650e+00, -2.7377e+00, -1.9782e+00, -1.8355e+00, -2.0937e+00, -2.9151e+00, -1.2721e+00, -1.3355e+00]], [[ 4.2276e+00, -1.5161e-01, -4.7434e-01, -6.7105e-01, 1.1143e-01, 1.2457e+00, 6.6037e-01, 4.9669e-01, 5.0073e-02, 7.4367e-01]], [[ 3.4396e+00, -6.1723e-02, -5.1201e-02, 5.1962e-01, -3.9856e-01, 3.5023e+00, 3.9316e+00, 2.4797e+00, 3.6176e+00, 4.1247e+00]]]]) attn_weights tensor([[[[ 1.3807e+00, 1.1774e+00, 1.0050e+00, 7.5113e-01, 1.3428e+00, 9.1879e-01, 9.3019e-01, 9.8355e-01, 8.4874e-01, 4.6784e-01]], [[ 3.9062e+00, 1.7045e-01, -4.0189e-01, -3.2391e-01, 1.2052e+00, 1.8160e-01, 5.4780e-01, 7.7722e-01, -4.2555e-01, -2.5851e-01]], [[ 2.9586e+00, -3.8834e-01, -1.2265e+00, -1.5327e+00, -9.7377e-01, 4.7457e-01, -1.8764e-01, -4.4125e-01, -1.4121e+00, -1.2888e+00]], [[ 1.1811e+00, -3.0158e-02, -6.5579e-01, -1.4228e+00, -6.1672e-01, -1.4019e-02, -1.3971e-02, 2.4341e-01, -1.0822e+00, -1.9395e+00]], [[ 2.0723e+00, -1.0117e+00, -1.4684e+00, -1.5615e+00, -5.1307e-01, -8.3476e-01, -1.4192e+00, -7.1873e-01, -1.2306e+00, -1.0923e+00]], [[ 4.3001e+00, 7.4045e-01, 4.3015e-01, -5.1069e-01, 1.5377e+00, 1.1343e+00, 2.5052e+00, 1.5783e+00, 1.2698e+00, 3.4100e-01]], [[ 3.2721e+00, -1.0436e+00, -1.3070e+00, -1.3741e+00, -3.7969e-01, 3.5071e-01, -6.2955e-02, -6.3484e-01, -1.4169e+00, -1.1304e+00]], [[ 3.8194e+00, 3.8707e-01, -1.3730e+00, -1.0598e+00, 7.2962e-01, 1.9530e+00, 6.9423e-01, 3.6427e-01, -1.6667e+00, -1.0993e+00]], [[-4.1669e+00, 3.4593e+00, 3.8875e+00, 3.2781e+00, 3.3341e+00, 3.4632e+00, 3.6170e+00, 3.5794e+00, 4.2946e+00, 4.0541e+00]], [[ 4.4022e+00, -5.0841e-01, -8.1179e-01, -1.1393e+00, -8.3088e-02, 6.2671e-03, 9.9810e-01, 1.1435e-01, -1.8543e-01, 1.4823e-01]], [[ 2.6726e+00, 2.0562e-01, 9.1352e-01, -4.8397e-02, 4.1573e-01, 1.7316e+00, 9.3839e-01, 1.0779e+00, 1.1345e+00, 2.9467e-01]], [[ 3.2196e+00, 2.7276e-01, 5.4384e-01, 1.3782e-02, 2.8872e-01, 1.3217e+00, 1.5095e+00, 9.3591e-01, 6.8455e-01, 1.3283e-02]]], [[[ 1.5463e+00, 7.5222e-01, 7.2871e-02, 4.8912e-01, 9.3924e-01, 7.7224e-01, 6.3982e-01, 5.6886e-01, 8.2621e-01, 2.9836e-01]], [[ 4.1837e+00, -1.2856e+00, -1.1329e+00, -4.8943e-01, -1.3528e+00, -2.0119e+00, -8.7893e-01, -9.9281e-01, -5.6031e-01, -1.4191e+00]], [[ 3.8549e+00, -1.4656e+00, -1.8588e+00, -1.5250e+00, -2.0408e+00, -1.0890e+00, -5.4929e-01, -1.4400e+00, -1.6166e+00, -1.7735e+00]], [[ 1.3918e+00, -1.3583e+00, -7.9401e-01, -1.5152e+00, -1.5873e+00, 3.9447e-01, -2.0187e-01, 1.1155e-01, -9.8716e-01, -6.8303e-01]], [[ 2.0843e+00, -9.5946e-01, -1.7277e+00, -3.6754e-01, -1.4389e+00, -1.9996e+00, -1.7939e+00, -7.2734e-01, 2.1162e-01, -1.2115e+00]], [[ 4.4207e+00, 3.8806e-01, 1.1356e+00, 8.5568e-01, 5.4354e-01, -9.4845e-01, 1.3966e+00, 9.3553e-01, 9.7013e-01, 1.4769e+00]], [[ 3.7360e+00, -2.2814e+00, -1.9011e+00, -1.9287e+00, -2.4250e+00, -1.2785e+00, -1.1847e+00, -2.5196e+00, -2.2021e+00, -2.6736e+00]], [[ 5.5466e+00, -4.6459e-01, -1.8180e+00, -2.3699e+00, -1.0486e+00, 2.6475e-01, -1.4408e-01, -1.5829e+00, -1.6075e+00, -2.5700e+00]], [[-3.1882e+00, 4.5699e+00, 6.3070e+00, 5.0220e+00, 4.0782e+00, 3.8263e+00, 3.6615e+00, 4.6180e+00, 4.8533e+00, 5.4501e+00]], [[ 4.5550e+00, -3.0210e-02, -5.0477e-01, -2.4380e-01, -3.1522e-01, -1.4373e+00, 1.7555e-01, 7.0356e-01, 1.4433e+00, 1.3836e-01]], [[ 3.3439e+00, 1.5873e-01, 2.1880e+00, 1.3005e+00, 5.1813e-01, -4.2037e-02, 4.6344e-01, 1.0831e+00, 1.0946e+00, 1.9495e+00]], [[ 3.0493e+00, -1.0394e+00, 7.9705e-01, -2.0634e-01, -8.2419e-01, 1.6560e+00, 1.5711e+00, -2.2782e-01, -1.6539e-01, 1.1021e+00]]], [[[ 1.6259e+00, 6.1266e-01, 1.5470e-01, 6.1633e-01, 6.8673e-01, 4.4161e-01, 5.1264e-01, 5.2969e-01, 5.7650e-01, 5.0809e-01]], [[ 4.1723e+00, -1.4001e+00, -1.1809e+00, -6.8209e-01, -1.6691e+00, -2.4758e+00, -1.0951e+00, -1.2119e+00, -1.4661e+00, -1.3533e+00]], [[ 3.8960e+00, -1.5486e+00, -1.8126e+00, -1.4963e+00, -2.0946e+00, -1.6289e+00, -7.9637e-01, -1.5599e+00, -2.4943e+00, -1.8842e+00]], [[ 1.4406e+00, -1.8262e+00, -1.1260e+00, -2.0287e+00, -2.2030e+00, -4.3094e-01, -6.5124e-01, -2.7680e-01, -1.5711e+00, -5.8258e-01]], [[ 2.1008e+00, -1.0056e+00, -1.6992e+00, -2.5752e-01, -1.5009e+00, -2.1620e+00, -1.7616e+00, -9.4687e-01, -2.9417e-01, -1.0291e+00]], [[ 4.3556e+00, 4.8785e-01, 9.7564e-01, 8.5093e-01, 1.8732e-01, -1.1677e+00, 9.4261e-01, 5.1749e-01, 6.0445e-01, 1.3065e+00]], [[ 3.8415e+00, -2.2953e+00, -1.7704e+00, -1.6986e+00, -2.5050e+00, -1.7156e+00, -1.3737e+00, -2.5663e+00, -2.4554e+00, -2.2889e+00]], [[ 5.5181e+00, -4.1391e-01, -1.7429e+00, -2.4485e+00, -1.2839e+00, -3.1059e-01, -3.2026e-01, -1.5214e+00, -2.3278e+00, -2.5173e+00]], [[-2.2587e+00, 4.3195e+00, 6.2101e+00, 4.7848e+00, 3.7232e+00, 3.5040e+00, 3.5144e+00, 4.4671e+00, 4.2206e+00, 5.6188e+00]], [[ 4.5556e+00, 1.9706e-02, -6.4420e-01, -3.7323e-01, -6.8882e-01, -2.1729e+00, -3.1606e-01, 3.0714e-01, 4.4296e-01, 1.0171e-01]], [[ 3.3637e+00, 2.6324e-02, 2.0426e+00, 9.4895e-01, 2.2160e-01, -7.9822e-01, -4.1133e-01, 5.7574e-01, 7.5969e-01, 1.9536e+00]], [[ 2.8469e+00, -1.5213e+00, 6.1777e-01, -6.3536e-01, -1.4398e+00, 1.0176e+00, 9.5854e-01, -7.5709e-01, -7.5356e-01, 1.0912e+00]]], [[[ 2.0793e+00, -4.7280e-01, -1.7911e+00, -5.2788e-01, -3.1510e-01, 2.7963e-01, -2.8844e-01, -2.0381e-01, -8.4950e-01, -3.4631e-01]], [[ 4.1314e+00, -9.6376e-01, -1.8757e+00, -1.5533e+00, 6.2123e-01, 3.7829e-01, 1.3554e+00, 4.3237e-01, 1.6079e+00, -1.6621e-01]], [[ 3.3767e+00, -1.0438e+00, -1.5942e+00, -2.0963e+00, -1.2401e+00, 2.6037e-01, 1.0702e+00, -3.9121e-01, 1.4942e-02, -2.8584e-01]], [[ 1.7130e+00, -1.6362e+00, -2.5985e+00, -2.5955e+00, -8.7116e-01, -8.8650e-01, -8.0540e-01, -5.9627e-01, -6.4152e-01, -7.0329e-01]], [[ 2.3095e+00, -1.0866e+00, -1.3442e+00, -1.3258e+00, -1.1630e+00, -6.3881e-01, -9.1033e-01, -8.8115e-01, -5.6309e-01, -1.3736e-01]], [[ 4.0629e+00, -1.0212e+00, -1.5576e+00, -1.1679e+00, -9.1887e-01, 1.0000e+00, 3.2419e+00, -4.2303e-01, 3.4384e-02, 4.2101e-01]], [[ 3.5850e+00, -1.6326e+00, -2.8154e+00, -1.7666e+00, -1.3753e+00, -7.1937e-02, 5.5167e-02, -7.8912e-01, -5.5589e-01, 4.0437e-03]], [[ 4.2295e+00, -7.3687e-01, -7.7019e-01, -1.0215e+00, 2.9963e-02, 2.0859e+00, 1.3910e+00, 3.9473e-01, 1.3857e+00, 1.6591e+00]], [[-2.7575e+00, 6.8465e-01, 1.2055e+00, 6.1366e-01, 2.6079e+00, 2.6847e+00, 1.9014e+00, 1.3198e+00, 2.5677e+00, 1.5036e+00]], [[ 4.3119e+00, -1.6694e+00, -3.0583e+00, -2.9125e+00, -2.2468e+00, 6.9772e-01, 1.6177e+00, -1.1851e+00, -1.1553e+00, 8.6314e-01]], [[ 2.4526e+00, -9.7549e-01, -1.9535e+00, -1.5203e+00, -2.9537e-02, 2.0493e+00, 2.1575e+00, 5.6644e-01, 1.4404e+00, 1.2858e+00]], [[ 3.1788e+00, -1.2949e-01, -1.9102e+00, -1.3412e+00, 4.5183e-01, 1.1859e+00, 5.1454e-01, 5.7462e-01, 8.1149e-01, 7.0354e-02]]], [[[ 1.8756e+00, 2.8681e-01, -7.4961e-01, -3.8363e-01, 3.8032e-01, 1.2978e+00, 5.7640e-01, 6.0076e-01, 6.1512e-01, 1.0951e+00]], [[ 4.0547e+00, -6.1399e-01, -1.0592e+00, -5.0376e-01, 1.2292e+00, -2.2716e-01, 7.5597e-01, 3.3740e-01, 5.6116e-01, 1.2632e-01]], [[ 3.7248e+00, -5.6999e-01, -1.3088e+00, -1.4962e+00, -3.4739e-01, -5.3947e-01, 9.2231e-01, -8.7422e-02, -8.2907e-01, -1.6230e+00]], [[ 1.1430e+00, -4.6103e-01, -1.3708e+00, -1.0613e+00, 3.5928e-01, 5.6390e-01, 2.2681e-01, -3.2377e-02, -1.1997e+00, -1.2856e+00]], [[ 2.3984e+00, -3.8553e-01, -8.5597e-01, -5.9811e-01, -2.8323e-01, 2.3943e-01, -9.1689e-01, -2.7136e-01, -3.1988e-01, -4.7491e-01]], [[ 4.4205e+00, -3.4946e-01, -1.4803e-01, -6.8279e-01, -5.8695e-01, 9.0987e-01, 2.4060e+00, 2.1393e-02, -4.3596e-02, 8.5894e-02]], [[ 4.0571e+00, -1.0179e+00, -1.7334e+00, -7.7467e-01, -5.9424e-01, -5.2320e-01, -1.6979e-01, -2.5946e-01, -1.3942e+00, -1.0976e+00]], [[ 4.5027e+00, 6.3733e-01, -1.6531e-01, -8.0640e-01, 2.6395e-01, 1.1322e+00, 7.5595e-01, 9.5370e-01, 2.7787e-01, 7.4801e-01]], [[-2.8157e+00, 1.7414e+00, 3.0485e+00, 2.0556e+00, 2.0312e+00, 2.1485e+00, 1.1200e+00, 1.9251e+00, 2.8804e+00, 1.3745e+00]], [[ 4.7040e+00, -8.8932e-01, -1.5019e+00, -1.9724e+00, -2.9969e-01, 9.1901e-01, 4.9717e-01, -3.1942e-01, 1.1035e-01, -1.1319e+00]], [[ 2.3822e+00, -8.9244e-01, 1.1706e-01, -6.0192e-01, 5.1083e-01, 3.2340e+00, 2.5899e+00, 1.2090e+00, 2.1748e+00, 1.5009e+00]], [[ 3.0827e+00, -4.1938e-01, -1.2285e+00, -4.8517e-01, 1.2749e+00, 1.9120e+00, 9.4741e-01, -2.9655e-01, -2.7424e-01, -3.1112e-02]]]]) attn_weights tensor([[[[-2.7769e-01, -2.0583e+00, -1.6912e+00, -6.0701e-01, -2.5635e+00, -1.9286e+00, -1.1225e+00, -2.2301e+00, -1.6224e+00, -4.3043e-01, -2.8681e+00]], [[ 2.8547e+00, 1.9209e+00, 3.8613e+00, 2.1419e+00, 1.7349e+00, 3.0893e+00, 1.1153e+00, 6.5562e-01, 3.1998e+00, 1.4870e+00, 9.4475e+00]], [[-6.8518e-01, -2.2776e+00, -2.1177e+00, -1.7923e+00, -1.7333e+00, -2.5182e+00, -2.4599e+00, -2.7302e+00, -2.3092e+00, -1.8657e+00, -2.2115e+00]], [[-4.0572e-01, -5.2547e+00, -3.0793e+00, -3.1305e+00, -4.7709e+00, -9.5759e-01, -2.2864e+00, -3.0200e+00, 5.6703e-02, 7.7727e-02, 4.9547e+00]], [[-1.2213e-01, -2.1174e+00, -2.7159e+00, -1.6630e+00, -1.6394e+00, -1.5094e+00, -4.7043e-01, -1.2797e+00, -1.3109e+00, -2.1530e-01, 1.6588e+00]], [[ 8.3318e+00, 1.7752e+00, 3.0423e+00, 1.0790e+00, 5.0148e-01, 6.1261e+00, 2.7250e+00, -1.4671e+00, 1.3283e+00, -3.6450e-01, 1.2403e+01]], [[ 2.5413e-01, -2.1116e+00, -2.2945e+00, -2.2679e+00, -2.5797e+00, 2.8958e-01, 1.9441e-01, -2.7977e+00, -2.6681e+00, -2.5244e+00, -6.4706e-01]], [[-5.5392e+00, -5.7257e+00, -5.0018e+00, -5.5757e+00, -4.8176e+00, -4.0824e+00, -4.7885e+00, -3.6702e+00, -2.6775e+00, -3.1993e+00, -4.0328e+00]], [[-2.3683e+00, -2.5889e+00, -2.6410e+00, -2.9144e+00, -2.5875e+00, -1.1215e+00, -3.2390e+00, -2.6723e+00, -2.5804e+00, -2.8428e+00, -3.2731e+00]], [[-1.5661e+00, -2.0762e+00, -2.2561e+00, -2.6133e+00, -2.3144e+00, -2.5066e+00, -2.3924e+00, -2.2826e+00, -2.3572e+00, -2.6330e+00, -3.2113e+00]], [[ 1.2997e+00, 8.0641e-01, 9.9437e-01, 3.1965e-01, 5.8784e-01, 7.9647e-01, -1.6075e-01, 5.0282e-01, 7.0836e-01, 2.6026e-02, 1.9538e+00]], [[-1.1421e+00, -1.6681e+00, -3.3603e+00, -2.2660e+00, -2.4606e+00, -2.2557e+00, -1.9087e+00, -1.7054e+00, -3.5659e+00, -2.2980e+00, -2.1763e+00]]], [[[ 7.3664e-02, -1.3794e+00, -7.2458e-01, -1.0660e+00, -1.7886e+00, -1.9213e+00, -1.9342e+00, -1.5099e+00, -1.3952e+00, -5.5938e-01, -9.4821e-01]], [[ 2.7469e+00, 3.0361e+00, 3.1128e+00, 9.5499e+00, 1.8255e+00, 3.3140e+00, 9.7177e-01, 1.7309e+00, 7.7559e-01, 2.1418e+00, 9.2755e+00]], [[-1.0358e+00, -2.0283e+00, -1.4134e+00, -1.5208e+00, -2.0967e+00, -2.3265e+00, -2.5100e+00, -2.4675e+00, -2.0389e+00, -1.6053e+00, -1.6620e+00]], [[-9.4084e-01, -4.3288e+00, 3.6683e-01, 5.0525e-01, -2.9265e+00, -2.0300e+00, -4.0596e+00, -1.1582e+00, -7.6994e-01, 5.3875e+00, 5.2761e+00]], [[-8.2665e-01, -2.5857e+00, -2.4670e+00, -5.5558e-01, -1.9177e+00, -2.3260e+00, -9.3861e-01, -1.1801e+00, -2.8935e-01, -3.1866e-01, 1.8370e+00]], [[ 7.5776e+00, 1.9998e+00, 5.5365e+00, 1.1142e+01, 1.4583e+00, 1.7819e+00, 2.0952e+00, -6.6485e-01, -1.3725e+00, 4.2017e+00, 1.0591e+01]], [[-1.6934e-01, -2.2556e+00, -3.1644e+00, -1.7322e+00, -2.3706e+00, -1.2834e+00, -1.2321e+00, -2.5494e+00, -2.5576e+00, -3.2442e+00, -1.5985e+00]], [[-5.2963e+00, -6.0967e+00, -5.6695e+00, -6.3481e+00, -5.2997e+00, -6.7750e+00, -5.8600e+00, -3.8802e+00, -3.2594e+00, -2.4130e+00, -3.3927e+00]], [[-1.5765e+00, -1.1930e+00, -1.7178e+00, -2.3979e+00, -1.5307e+00, -3.1735e+00, -3.0280e+00, -1.1019e+00, -1.2272e+00, -1.5899e+00, -2.3086e+00]], [[-1.7182e+00, -2.0089e+00, -2.2420e+00, -2.8242e+00, -2.3495e+00, -2.5160e+00, -2.7536e+00, -2.1618e+00, -2.0861e+00, -2.2831e+00, -2.8159e+00]], [[ 1.3361e+00, 1.0522e+00, 1.7026e+00, 1.7992e+00, 6.3295e-01, -8.3290e-02, -2.1922e-01, 6.3567e-01, 6.7819e-01, 1.3746e+00, 1.5341e+00]], [[-1.2282e+00, -1.8544e+00, -3.4902e+00, -1.8703e+00, -2.0895e+00, -2.4075e+00, -2.2433e+00, -1.8522e+00, -1.7552e+00, -3.6695e+00, -1.8198e+00]]], [[[-1.9112e-01, -1.6284e+00, -6.4950e-01, -1.3055e+00, -1.9839e+00, -1.4906e+00, -1.6617e+00, -1.7298e+00, -9.3618e-01, -4.9683e-01, -1.3541e+00]], [[ 1.8770e+00, 2.8527e+00, 4.1041e+00, 4.3514e+00, 4.7030e-01, -1.8660e-01, -7.8036e-01, 1.6906e+00, 1.9177e+00, 3.4525e+00, 9.9226e+00]], [[-1.2460e+00, -1.9922e+00, -1.9755e+00, -2.0929e+00, -2.4964e+00, -2.5029e+00, -2.4577e+00, -2.3111e+00, -1.9538e+00, -2.1515e+00, -2.5729e+00]], [[-2.7874e+00, -7.0924e+00, -5.5764e+00, -4.1672e+00, -5.9134e+00, -5.6093e+00, -4.4464e+00, -3.3835e+00, -2.3227e+00, -3.0968e-01, 3.3576e+00]], [[-6.1588e-01, -2.1783e+00, -2.2425e+00, -1.4513e+00, -2.0330e+00, -2.4615e+00, -8.5719e-01, -8.4710e-01, -7.1534e-01, -7.5485e-02, 2.0398e+00]], [[ 6.3769e+00, 3.6419e+00, 4.9098e+00, 4.5020e+00, 8.8842e-01, 9.8693e-01, 1.6680e+00, 9.2482e-01, 1.6430e+00, 3.2009e+00, 1.1673e+01]], [[ 6.3398e-01, -1.8549e+00, -2.2250e+00, -7.4500e-01, -1.9380e+00, -9.1113e-02, -4.3602e-01, -2.1141e+00, -1.3724e+00, -2.2947e+00, -2.5346e-01]], [[-4.9993e+00, -6.1379e+00, -5.2937e+00, -6.1238e+00, -5.2651e+00, -5.8464e+00, -5.4853e+00, -3.9224e+00, -3.8252e+00, -2.3632e+00, -3.5826e+00]], [[-2.2612e+00, -1.7133e+00, -1.2911e+00, -2.7709e+00, -1.9796e+00, -3.4449e+00, -3.8250e+00, -1.5970e+00, -2.0399e+00, -1.0292e+00, -2.4266e+00]], [[-1.6403e+00, -2.0570e+00, -2.0611e+00, -2.5667e+00, -2.2335e+00, -2.6990e+00, -2.7501e+00, -2.1671e+00, -1.9921e+00, -2.0531e+00, -2.5125e+00]], [[ 1.1045e+00, 8.0532e-01, 1.1708e+00, 7.8607e-01, 3.9791e-01, -3.3961e-01, -6.3904e-01, 5.1819e-01, 7.2278e-01, 8.8220e-01, 1.6104e+00]], [[-1.0839e+00, -2.0257e+00, -3.5453e+00, -1.7966e+00, -2.4821e+00, -2.6213e+00, -2.4924e+00, -2.0202e+00, -2.1081e+00, -3.7134e+00, -2.3347e+00]]], [[[-1.1249e+00, -1.9629e+00, -1.9009e+00, -1.8641e+00, -1.6221e+00, -1.3173e+00, -6.9999e-01, -2.2347e+00, -1.5342e+00, -4.8702e-01, -5.7729e-01]], [[ 1.2045e+00, 1.0020e+00, 1.6680e+00, 1.6426e+00, -1.0223e+00, 1.0199e+00, 9.1275e+00, -4.8488e-01, -1.5860e+00, 3.0048e+00, 9.0472e+00]], [[-1.1707e+00, -2.1021e+00, -1.9553e+00, -2.1598e+00, -1.8168e+00, -1.3247e+00, -2.4107e+00, -2.5897e+00, -1.9269e+00, -2.4336e+00, -2.4563e+00]], [[-2.4217e+00, -7.9099e+00, -7.6811e+00, -6.6226e+00, -6.2033e+00, -3.3328e+00, 1.2915e+00, -4.5384e+00, -3.5497e+00, 7.1092e-01, 3.8525e+00]], [[-5.6768e-01, -2.2092e+00, -3.3454e+00, -3.7982e+00, -2.3564e+00, -1.7573e+00, 1.4855e+00, -1.3081e+00, -1.2880e+00, 2.2564e+00, 2.7118e+00]], [[ 6.6268e+00, 1.6500e+00, 1.6347e+00, 1.1028e+00, 8.4248e-01, 2.9894e+00, 1.2344e+01, -9.1540e-01, 2.9936e-02, 3.5567e+00, 1.2087e+01]], [[-2.5831e-02, -2.1952e+00, -2.4775e+00, -2.0547e+00, -2.9267e+00, -1.0103e+00, -9.3560e-01, -2.6194e+00, -3.0253e+00, -3.1951e-01, -8.7421e-01]], [[-4.4310e+00, -5.7625e+00, -5.3642e+00, -5.9905e+00, -4.7812e+00, -3.7387e+00, -4.7804e+00, -3.2256e+00, -3.1442e+00, -2.1574e+00, -3.2075e+00]], [[-1.5769e+00, -2.1150e+00, -2.9692e+00, -2.4585e+00, -2.0138e+00, -2.6222e+00, -3.2302e+00, -2.1008e+00, -1.9089e+00, -3.2524e+00, -3.1473e+00]], [[-1.8554e+00, -2.0608e+00, -2.2224e+00, -2.6067e+00, -2.1397e+00, -1.8731e+00, -3.6281e+00, -2.2121e+00, -2.1115e+00, -2.2116e+00, -3.6088e+00]], [[ 4.0312e-01, 3.9998e-01, 1.8267e-02, -1.4041e-01, 3.8616e-01, -1.7662e-01, 1.7050e+00, 1.9028e-01, 2.5916e-01, 3.2301e-01, 1.6363e+00]], [[-1.4576e+00, -2.4834e+00, -2.9796e+00, -2.8454e+00, -3.1217e+00, -3.0063e+00, -2.0951e+00, -2.6101e+00, -3.1005e+00, -2.1518e+00, -2.0325e+00]]], [[[-2.4603e-02, -1.8958e+00, -1.4931e+00, -1.1381e+00, -2.1818e+00, -3.0796e-01, -1.5977e+00, -2.2822e+00, -2.1040e+00, -2.1367e+00, -1.1555e+00]], [[ 1.6427e+00, 6.7832e-02, 1.5865e+00, 8.2084e-01, 4.0978e-01, 2.7956e+00, 2.2452e+00, -1.5078e+00, 2.8668e-01, 1.1020e+00, 9.1502e+00]], [[-4.7623e-01, -1.6455e+00, -2.0455e+00, -1.5906e+00, -1.5461e+00, -8.7211e-01, -2.3624e+00, -2.0876e+00, -2.1546e+00, -1.6960e+00, -3.1622e+00]], [[-1.7342e+00, -7.9737e+00, -7.1968e+00, -6.0175e+00, -6.0543e+00, -4.5314e+00, -3.0990e+00, -4.9993e+00, -2.9995e+00, -2.3057e+00, 3.6816e+00]], [[-4.3775e-02, -2.2566e+00, -2.7972e+00, -1.7419e+00, -1.8821e+00, -1.0325e+00, 1.5467e-01, -1.2169e+00, -6.0848e-01, 3.3911e-01, 2.5418e+00]], [[ 6.4767e+00, 1.8935e+00, 1.0238e+00, -1.4909e+00, 6.7190e-01, 4.4261e+00, 3.4602e+00, -2.7889e-01, -4.7419e-01, 1.0577e+00, 1.2658e+01]], [[ 2.1027e-01, -1.9342e+00, -2.3819e+00, -1.7348e+00, -3.0397e+00, -6.3036e-01, -2.4496e-01, -2.5227e+00, -2.9772e+00, -2.7477e+00, -9.5201e-01]], [[-5.1970e+00, -6.1217e+00, -5.1701e+00, -4.9124e+00, -5.0589e+00, -3.0168e+00, -4.8477e+00, -3.8116e+00, -3.5776e+00, -2.7471e+00, -4.3507e+00]], [[-1.0349e+00, -1.9414e+00, -1.5947e+00, -2.9145e+00, -2.4109e+00, -2.9232e+00, -1.9725e+00, -2.1199e+00, -1.8789e+00, -2.4124e+00, -3.0017e+00]], [[-1.8940e+00, -2.1048e+00, -2.3504e+00, -2.6762e+00, -2.2065e+00, -2.4792e+00, -2.8664e+00, -2.2952e+00, -2.5328e+00, -2.2910e+00, -4.3998e+00]], [[ 7.7637e-01, 5.4256e-01, 1.7900e-01, -1.9233e-02, 4.7793e-01, 3.7704e-01, -3.9760e-02, 2.4921e-01, -7.7062e-03, 4.0224e-01, 1.5370e+00]], [[-1.1828e+00, -2.1444e+00, -3.0453e+00, -2.3001e+00, -2.9403e+00, -2.6877e+00, -2.0355e+00, -2.1294e+00, -2.2120e+00, -2.6529e+00, -1.5218e+00]]]]) attn_weights tensor([[[[-2.1543, -3.2118, -1.9549, -2.3166, -1.8609, -1.6290, -1.7416, -0.9635, -0.0587, -0.5485, -1.0776]], [[-1.9190, -2.7370, -2.8124, -2.3755, -2.3072, -3.1871, -2.6309, -0.4879, -0.7422, -0.4396, -1.6535]], [[-2.6842, -3.5815, -3.2176, -3.5931, -2.9842, -3.3299, -2.8792, -2.2000, -2.4936, -2.9122, -2.4250]], [[ 0.0962, -2.8242, -2.6292, -2.6642, -2.5704, -2.4018, -2.1778, -2.0507, -2.0807, -2.1962, -1.8040]], [[-0.5586, -2.4733, -2.7066, -2.6895, -2.5671, -2.1575, -2.0661, -2.0774, -2.2510, -2.2369, -1.6661]], [[ 0.9263, 0.5537, -0.7983, -0.1225, -0.1753, 1.3603, -0.4121, 0.1612, -1.3551, -0.7189, -0.1681]], [[ 2.2739, 0.6132, -0.3496, -0.0565, -0.4100, 1.3260, -1.4068, -0.1508, -1.1352, -0.7249, 0.3959]], [[ 0.4191, -1.3828, -1.2092, -1.6477, -1.8311, -1.7983, -0.2771, -1.4691, -1.3194, -1.8284, -2.3534]], [[-0.6089, -1.8547, -2.0076, -2.2495, -1.9774, -2.4255, -2.7697, -1.7292, -1.8811, -2.0382, -2.6111]], [[ 1.1203, -0.3237, -0.1476, -0.5217, 0.2118, -1.4310, -1.4566, -0.6277, -0.2110, -0.4317, -1.5719]], [[-5.2673, -2.0080, -1.9394, -1.9326, -1.9267, -1.5289, -1.3105, -1.4273, -1.3619, -1.3965, -0.7603]], [[ 1.4173, 0.5565, -1.9142, -2.2222, -1.2816, 0.4046, -1.9165, 0.7848, -2.2929, -2.5121, 4.6258]]], [[[-2.3768, -3.9802, -2.3314, -3.9936, -2.6932, -3.6105, -3.7512, -1.8264, -1.2409, 0.2453, -1.4638]], [[-0.5600, -1.3986, -2.3448, -2.6472, -1.8742, -1.8660, -1.4864, 0.2161, 0.3372, -0.3476, -0.7512]], [[-2.7892, -3.7925, -3.3334, -3.6743, -3.0628, -3.4833, -3.0289, -2.2985, -2.4686, -2.5207, -2.8633]], [[-0.0795, -2.7958, -2.6957, -2.6801, -2.5973, -2.4161, -2.2150, -2.1019, -2.1428, -2.0822, -2.1348]], [[-0.5378, -2.4666, -2.6423, -2.5229, -2.5207, -2.1203, -2.0232, -2.0419, -2.1296, -2.0009, -1.9212]], [[-0.2676, -0.8623, -1.2030, -0.1256, -1.3776, -4.2349, -4.2635, -0.8496, -1.6442, -1.3760, -0.1452]], [[ 1.1593, -0.6202, -1.2901, -2.0451, -0.6799, -1.9645, -2.1840, -0.8932, -1.3482, -1.8085, -2.6135]], [[-0.4020, -1.9323, -2.8849, -2.4542, -2.3403, -2.0748, -1.8120, -1.6141, -2.0677, -2.9289, -2.4834]], [[-0.6916, -1.8234, -2.3197, -2.4163, -2.1357, -2.5105, -2.8746, -1.7320, -2.2262, -2.1590, -2.2233]], [[ 1.2959, -0.4040, -0.5360, -0.8891, 0.2553, -1.3014, -1.4023, -0.5619, -0.4496, -0.5407, -0.8514]], [[-5.5516, -2.1373, -2.0720, -2.0041, -1.9980, -1.6253, -1.4250, -1.5332, -1.5444, -1.3559, -1.3339]], [[-0.8119, -1.0305, -3.5615, 1.5458, -3.8603, -4.6254, -5.8052, -0.6441, -1.6528, -3.5428, 2.0094]]], [[[-1.6482, -3.0152, -1.1951, -2.3025, -2.4900, -3.0859, -3.3057, -1.0159, -0.1618, 1.2393, -0.8368]], [[-0.6339, -1.2257, -1.7269, -1.8216, -0.9883, -1.5263, -1.0679, 0.6287, 0.4816, 0.5012, -0.7464]], [[-2.7735, -3.8710, -3.3966, -3.7057, -3.0717, -3.5216, -3.0368, -2.2768, -2.7099, -2.5102, -3.2064]], [[-0.0974, -2.7470, -2.6326, -2.6126, -2.5514, -2.3369, -2.1560, -2.0482, -2.1265, -1.9872, -2.2920]], [[-0.5229, -2.4999, -2.6750, -2.4743, -2.4975, -2.1471, -2.0659, -1.9913, -2.0231, -1.9702, -2.1376]], [[ 0.4269, -0.1675, -0.7396, 0.5633, -0.5717, -3.8871, -3.6365, 0.0241, -0.3262, -1.0057, -0.4447]], [[ 1.8744, -0.2182, -0.8067, -1.2113, 0.2216, -1.4778, -1.1083, -0.3503, -0.1430, -1.3471, -2.1317]], [[ 0.6776, -0.9676, -2.2615, -1.4067, -1.5481, -1.1558, -1.1943, -0.7552, -1.5245, -2.4028, -1.8809]], [[-0.8729, -2.0601, -2.1668, -2.5050, -2.2654, -2.5132, -2.8128, -1.9596, -2.2717, -2.0192, -2.6450]], [[ 1.4454, -0.5146, -0.1221, -1.1274, 0.0674, -1.1608, -1.2087, -0.5834, 0.0451, -0.0627, -0.6941]], [[-5.7233, -2.1569, -2.0756, -2.0029, -2.0528, -1.6262, -1.4575, -1.5580, -1.4683, -1.3476, -1.6749]], [[ 0.1997, 0.1362, -2.8034, -0.7586, -3.0026, -4.1241, -4.9218, 0.4155, -3.0253, -2.9604, 3.0930]]], [[[-2.0768, -2.8045, -2.4829, -3.1173, -1.5157, -1.5596, -1.5267, -0.7310, 0.1009, -0.0526, -0.6356]], [[-1.1634, -2.2421, -2.3717, -2.3765, -2.2262, -2.6410, -2.6444, -0.2549, -0.7594, -1.7510, -1.5617]], [[-2.7749, -3.6155, -3.2876, -3.6153, -3.0223, -3.3588, -2.9683, -2.2320, -2.6199, -3.0604, -2.5845]], [[ 0.0970, -2.7429, -2.5825, -2.5933, -2.5405, -2.3812, -2.1834, -2.0582, -2.2160, -2.1546, -1.8983]], [[-0.5809, -2.3319, -2.6377, -2.5707, -2.4955, -2.2039, -1.9653, -1.9659, -2.1518, -1.7432, -1.6842]], [[-0.5285, -0.3525, -1.3264, -2.0707, -0.8382, -0.7959, -0.6605, -0.7333, -0.8817, -0.8435, -0.5646]], [[ 2.2852, 0.4610, 0.1916, -0.9323, -0.1811, -2.0796, 1.2512, 0.0585, -0.5285, 2.1779, 1.0626]], [[-0.0944, -2.1166, -2.3254, -2.2461, -2.5036, -1.0030, -2.5830, -1.6689, -2.1942, -1.0241, -2.6301]], [[-0.7129, -1.5506, -2.2787, -2.5226, -1.8550, -2.3928, -2.8269, -1.6291, -1.7705, -2.7882, -2.5473]], [[ 1.1226, -0.2976, 0.1159, -0.2957, 0.1818, -0.7337, -1.5438, -0.6914, 0.2196, -1.5285, -1.0258]], [[-5.4322, -1.8857, -1.8782, -1.8561, -1.8396, -1.4721, -1.3407, -1.3617, -1.4791, -1.1957, -0.9811]], [[-1.9387, -1.9888, -4.1020, -5.3361, -4.5247, -3.5531, 1.5595, -1.4685, -4.3133, -2.9212, 1.1334]]], [[[-2.8094, -3.4879, -3.2033, -2.9863, -1.7453, -1.8076, -0.7172, -1.1866, -0.2657, 0.3215, -0.8722]], [[-1.2447, -2.2910, -2.6621, -2.3623, -1.8840, -2.5170, -1.9522, -0.2747, -1.0206, -0.4209, -1.4042]], [[-2.6929, -3.4991, -3.2006, -3.6067, -2.9518, -3.2878, -2.8978, -2.1834, -2.9126, -2.5146, -2.5741]], [[ 0.0611, -2.7833, -2.6231, -2.6583, -2.5550, -2.3533, -2.1492, -2.0336, -2.3414, -2.1902, -1.8744]], [[-0.5919, -2.4082, -2.7010, -2.7422, -2.6311, -2.1642, -1.9938, -2.1079, -2.3368, -2.2260, -1.6464]], [[ 0.3275, -0.2687, -2.3736, -1.8517, -0.5365, 0.1727, 0.0733, -0.6566, -1.3836, -0.7902, 0.5005]], [[ 1.6805, 0.2812, -0.5677, -1.3382, -0.8440, 0.6048, -0.5470, -0.1990, -2.4441, -0.8041, 0.2495]], [[-0.5372, -2.1624, -2.2324, -2.0932, -2.2910, -1.3887, -1.6444, -1.8034, -2.2310, -2.2337, -2.5889]], [[-0.6384, -1.7708, -2.0079, -2.5320, -1.8055, -2.2853, -2.7588, -1.6571, -1.5890, -1.7794, -2.3109]], [[ 1.2199, -0.1776, 0.0512, -0.4837, 0.0258, -0.5331, -1.2598, -0.5298, 0.0096, -0.0440, -1.2721]], [[-5.3408, -1.8719, -1.7935, -1.8716, -1.8472, -1.4555, -1.2789, -1.3424, -1.5457, -1.3773, -0.8667]], [[-0.3465, -0.6373, -4.7299, -4.2378, -3.0629, -2.7793, -2.0693, -0.4314, -3.1478, -2.7056, 2.7204]]]]) attn_weights tensor([[[[ -1.6164, -4.5646, -3.2663, -5.0323, -4.2261, -4.4295, -3.8716, -3.0438, -1.4839, -3.4737, -3.4594]], [[ 1.6846, -1.3272, -2.1937, -1.1100, -2.2788, -0.3281, -1.3510, -1.6461, -2.9500, -1.7632, -0.6391]], [[ -6.2494, -10.3336, -9.8940, -10.6124, -7.3004, -7.9414, -6.1213, -4.5385, -3.5520, -4.2835, -5.3463]], [[ -3.2708, -6.0724, -5.7321, -6.2038, -2.8254, -5.6812, -4.4880, -3.6268, -2.9261, -3.3351, -3.3851]], [[ -1.8398, -4.6972, -4.9321, -4.4307, -3.0570, -4.2788, -4.7664, -1.6995, -1.7920, -1.5454, -4.0944]], [[ -4.8019, -6.4943, -6.8889, -6.8317, -5.8618, -6.2786, -5.0526, -2.3624, -2.8751, -3.0922, -4.9611]], [[ -1.0338, -4.0582, -4.1915, -4.7320, -3.8769, -4.0160, -3.5547, -2.4557, -2.7561, -3.6248, -2.6863]], [[ -1.2658, -4.1110, -2.5913, -2.3895, -2.3202, -1.6352, -1.6810, -1.5511, -0.9155, -1.1639, -0.7472]], [[ -3.2862, -5.6667, -7.6979, -4.6480, -3.9121, -5.9792, -4.6632, -3.1171, -4.5780, -1.8658, -2.6554]], [[ -4.2416, -7.7277, -6.8629, -7.5603, -5.8827, -4.9601, -3.2972, -4.4062, -3.3007, -3.9921, -4.0885]], [[ -1.7486, -3.7856, -3.4998, -3.1829, -3.2937, -2.7384, -2.4307, -2.7861, -2.4247, -2.2890, -1.6485]], [[ -0.6835, -4.8600, -4.5269, -4.3709, -4.1830, -3.8706, -3.4918, -3.5124, -3.1874, -3.2101, -2.7400]]], [[[ -1.8442, -4.3001, -4.0879, -4.6597, -4.0199, -3.8548, -3.6958, -2.8385, -1.1344, -2.3807, -2.8126]], [[ 1.3215, -0.9427, -2.5154, -1.5370, -2.3458, -1.6661, -2.5133, -1.7755, -1.6910, -3.6761, -2.3763]], [[ -8.3397, -13.5661, -12.4786, -14.6246, -9.5154, -9.8297, -8.1297, -7.0733, -6.2662, -4.6721, -6.8951]], [[ -3.8962, -7.2204, -6.6685, -8.5367, -4.3582, -5.5211, -5.1683, -4.1608, -2.8274, -3.1493, -4.7708]], [[ -2.0370, -4.9201, -6.0119, -5.8047, -4.2647, -6.0973, -5.9847, -2.4217, -1.1454, -2.4205, -2.2715]], [[ -4.7048, -7.1718, -8.1667, -8.4234, -6.2010, -6.6961, -6.4810, -2.9949, -2.8266, -3.6924, -4.1800]], [[ -1.2010, -3.9890, -4.4368, -3.7737, -4.0025, -4.0842, -3.6174, -2.4366, -1.8717, -2.8799, -2.5787]], [[ -1.3922, -4.1272, -2.6412, -2.2708, -2.3385, -1.5152, -1.5861, -1.5259, -1.4695, -0.7497, -0.8037]], [[ -2.8669, -4.9296, -7.7775, -5.0938, -3.8931, -4.6661, -4.1294, -2.6082, -1.1927, -4.2354, -1.6635]], [[ -4.7550, -7.8141, -7.5359, -8.2625, -6.5870, -4.4518, -4.2956, -4.5206, -3.8420, -3.2138, -3.9181]], [[ -2.0341, -3.9332, -3.5489, -3.1810, -3.5302, -2.7929, -2.6316, -3.0039, -2.7739, -2.2720, -2.1210]], [[ -0.8457, -5.0626, -4.6694, -4.4566, -4.3388, -3.8121, -3.5770, -3.6458, -3.4670, -3.0298, -3.0426]]], [[[ -2.0393, -4.6240, -3.9217, -3.3408, -3.9572, -4.1706, -3.4552, -2.9475, -2.8543, -1.7506, -2.3402]], [[ 1.7558, -0.7988, -2.5906, -1.4475, -2.3653, -1.8420, -2.4133, -1.3000, -1.5138, -3.6741, -2.8689]], [[ -8.1182, -13.8596, -12.7610, -13.6363, -9.9787, -10.2096, -7.7867, -6.5321, -5.3272, -3.9577, -6.6367]], [[ -3.8791, -7.2806, -7.2292, -6.7742, -4.5694, -5.7983, -5.2117, -3.8895, -2.5372, -3.4865, -4.8622]], [[ -2.3379, -5.5204, -5.7263, -6.1897, -4.1811, -8.0845, -5.5631, -2.3881, -2.1219, -2.1270, -4.1057]], [[ -4.6618, -7.0617, -8.2379, -7.5158, -6.3068, -6.8459, -6.4511, -2.7615, -2.6305, -3.3413, -4.7366]], [[ -1.2586, -3.8399, -4.6568, -3.4849, -3.8888, -3.7299, -3.9233, -2.4922, -2.2016, -3.2883, -3.0030]], [[ -1.4353, -4.0132, -2.5983, -2.2011, -2.3560, -1.5080, -1.5294, -1.3171, -1.0525, -0.5938, -1.1964]], [[ -3.1126, -5.3060, -8.0816, -4.1107, -4.2633, -5.0815, -4.5246, -2.5554, -2.0180, -4.0587, -2.0818]], [[ -4.6036, -7.6295, -7.4228, -8.0379, -6.2627, -4.0926, -3.4769, -4.2361, -3.8722, -2.8888, -4.2027]], [[ -1.9814, -3.6916, -3.4398, -2.8979, -3.3982, -2.6660, -2.5274, -2.6865, -2.1487, -2.1473, -2.4002]], [[ -0.9129, -4.9227, -4.7953, -4.3540, -4.4968, -3.9200, -3.6483, -3.5866, -3.2092, -3.0674, -3.1613]]], [[[ -1.4358, -4.2703, -2.8097, -3.6294, -3.6496, -3.6509, -4.9046, -2.7184, -2.1664, -2.0645, -4.0304]], [[ 1.2647, -2.2582, -2.3936, -1.1298, -2.6787, -1.2528, -2.1383, -2.3092, -2.1351, -1.0993, -2.5519]], [[ -6.4955, -11.6014, -10.0842, -10.9523, -10.0641, -7.5965, -9.3883, -5.0900, -4.7246, -3.2576, -5.1237]], [[ -3.0967, -6.1130, -5.8104, -4.9884, -4.3043, -5.4237, -5.3316, -2.8498, -1.7778, -2.6567, -3.7418]], [[ -1.7176, -4.0989, -4.6761, -5.3184, -4.0035, -4.5236, -5.5210, -1.3949, -1.3914, -2.1922, -3.5521]], [[ -4.6910, -6.7650, -7.4193, -6.8654, -6.9900, -6.4794, -6.8817, -2.8037, -3.9757, -4.4954, -4.1848]], [[ -0.7987, -3.8157, -3.1814, -3.6530, -3.3190, -4.8346, -4.3187, -2.2029, -2.0117, -3.7032, -3.3637]], [[ -1.3828, -4.1313, -2.4739, -2.4958, -2.4017, -1.5897, -1.6418, -1.4896, -1.3387, -1.1749, -0.5066]], [[ -3.2954, -6.3601, -5.9017, -4.4177, -5.7621, -6.0387, -6.1297, -2.9460, -3.2201, -3.3434, -4.5498]], [[ -5.0613, -8.1267, -7.4155, -7.6604, -7.5127, -4.9264, -6.6654, -4.6016, -4.5955, -2.6656, -3.9770]], [[ -1.5128, -3.2332, -2.9834, -2.8677, -2.7660, -2.1851, -1.9391, -2.2029, -2.0655, -1.7819, -1.3419]], [[ -0.7647, -4.7222, -4.4607, -4.3316, -4.0496, -3.7357, -3.6017, -3.2508, -3.2368, -3.1073, -2.8208]]], [[[ -1.4692, -3.9631, -3.3188, -4.6998, -4.1792, -3.6242, -3.4835, -2.7593, -1.2774, -2.6379, -3.1309]], [[ 1.7140, -2.0615, -2.8329, -1.7906, -2.3510, -1.2669, -1.4434, -1.4156, -1.3327, -1.6940, -0.9632]], [[ -6.8278, -11.3160, -10.8629, -10.1004, -9.9541, -8.0646, -7.8850, -5.2510, -4.1400, -4.1008, -5.5632]], [[ -3.4548, -6.5444, -5.6922, -6.1303, -4.4355, -5.1636, -4.0380, -3.0048, -2.5512, -1.2296, -3.5209]], [[ -1.8905, -4.5455, -5.2644, -4.7558, -4.5448, -5.3725, -4.4731, -1.8882, -2.3523, -1.4143, -3.4331]], [[ -4.4554, -6.2331, -6.9444, -6.2760, -6.7684, -6.0934, -5.1577, -2.1973, -3.3904, -3.3071, -4.0399]], [[ -0.3858, -3.4093, -2.8429, -3.5031, -3.4464, -4.2977, -3.5705, -1.8769, -2.2234, -2.2589, -3.4670]], [[ -1.3768, -4.0919, -2.4482, -2.3413, -2.3379, -1.5046, -1.4790, -1.4203, -1.6500, -1.4538, -0.5664]], [[ -3.6881, -6.0774, -6.0216, -3.6887, -5.6526, -5.2551, -4.2161, -2.7489, -2.5077, -3.0465, -3.8012]], [[ -4.4316, -7.0525, -6.4052, -6.5535, -6.6565, -3.2656, -3.6550, -3.5875, -3.0921, -3.4450, -2.7869]], [[ -1.5507, -3.5332, -3.1737, -2.9583, -3.0017, -2.2187, -1.9782, -2.3633, -2.1932, -2.0868, -1.4556]], [[ -0.7694, -4.6246, -4.5011, -4.2753, -4.0262, -3.5443, -3.3010, -3.3373, -3.3774, -3.1062, -2.7830]]]]) attn_weights tensor([[[[ 5.3101, -0.5637, -2.6752, -1.6014, -0.1388, -1.8984, -0.8495, -1.1926, -3.0325, -2.4273, 1.6073]], [[ -2.5890, -6.1686, -5.1110, -5.8210, -6.0012, -6.1155, -6.1710, -2.9920, -2.8782, -3.6568, -4.9982]], [[ -4.2967, -8.4237, -7.2096, -6.8292, -5.5982, -7.1876, -7.6802, -4.9729, -2.6967, -2.9569, -5.0355]], [[ -4.4620, -9.0080, -12.7327, -11.9865, -11.2459, -9.7515, -10.7504, -6.4043, -8.5037, -7.9475, -9.0593]], [[ 1.2321, -3.4472, -4.1320, -3.2330, -3.5312, -3.6018, -2.4478, -2.7599, -4.0749, -3.3886, -4.1690]], [[ -0.0716, -2.2200, -2.6903, -1.9833, -1.8602, -2.4444, -2.2251, -3.1588, -3.1165, -2.3951, -2.6258]], [[ -2.9421, -6.3285, -3.1153, -3.8859, -6.7042, -4.9720, -4.6473, -3.7781, -0.1172, -1.3193, -3.2693]], [[ -5.5395, -9.3561, -10.2877, -9.9461, -6.9194, -7.0389, -7.5590, -5.1497, -5.9182, -6.0923, -6.5809]], [[ -4.0971, -7.4774, -8.6269, -7.3681, -7.5509, -7.1913, -7.4508, -3.4316, -4.3455, -3.7112, -5.1862]], [[ -1.4437, -4.4670, -4.0081, -1.8907, -2.3619, -4.0578, -6.1160, -2.9042, -2.3497, -0.8762, -3.8697]], [[ -0.8853, -5.2806, -4.4387, -4.6889, -3.1918, -4.0020, -3.6271, -3.2530, -3.2873, -3.6175, -2.0227]], [[ -2.5256, -5.5478, -5.6596, -6.2828, -4.0231, -4.2680, -5.3499, -3.5244, -3.2669, -4.3310, -5.3411]]], [[[ 3.7575, -1.1278, -0.8388, 2.3300, -1.2397, -5.5228, -3.9345, -1.3791, -1.7932, -1.7466, 0.8396]], [[ -2.8951, -6.2856, -5.8959, -6.4729, -5.8287, -5.3098, -6.4619, -3.2556, -3.1203, -3.5804, -4.1781]], [[ -4.2022, -7.1174, -6.9309, -8.8781, -6.3863, -7.7308, -8.9941, -5.1725, -3.4594, -2.5315, -4.4812]], [[ -4.7455, -9.4451, -10.7427, -11.0074, -10.3154, -9.6048, -11.3267, -6.0686, -5.9036, -5.9009, -6.2493]], [[ 0.6829, -3.6298, -3.3984, -2.1471, -2.9555, -4.1143, -2.9166, -3.2738, -2.8658, -3.6465, -2.2026]], [[ -0.2696, -2.4264, -2.6797, -1.7826, -1.5803, -3.2082, -2.9520, -3.2534, -3.0886, -3.6378, -2.7295]], [[ -2.8519, -6.2361, -3.7068, -5.7181, -5.2092, -4.6305, -5.6983, -3.9782, -3.6901, -0.6968, -2.7095]], [[ -5.7681, -9.6298, -10.3176, -10.6861, -8.2307, -7.2427, -7.9171, -5.9736, -5.9773, -5.4002, -5.8485]], [[ -4.0585, -6.6474, -8.7913, -8.5328, -8.1844, -6.8369, -7.0240, -3.4186, -2.6126, -4.6246, -4.3362]], [[ -1.4984, -4.3243, -5.0522, -4.1686, -5.3044, -6.0009, -6.4615, -3.6300, -3.0145, -3.1554, -2.5712]], [[ -0.9928, -5.0946, -4.6794, -4.3212, -4.0962, -3.8996, -4.7984, -3.5908, -3.0538, -3.2116, -2.8057]], [[ -2.4608, -5.5566, -6.3976, -6.2222, -4.7369, -3.8648, -4.9893, -4.2932, -2.8476, -3.4005, -3.7335]]], [[[ 4.6839, -0.7412, -1.9787, -0.1359, -1.1946, -4.2734, -5.4666, -1.2484, -3.3836, -2.2772, 0.5497]], [[ -2.9422, -6.7522, -5.8982, -6.4420, -6.0867, -5.3730, -7.0925, -3.9075, -3.4151, -3.8075, -5.6778]], [[ -4.4819, -8.5749, -7.7642, -8.1455, -6.6584, -7.5679, -8.7799, -5.5357, -5.8648, -2.5206, -5.0756]], [[ -4.8791, -10.3590, -12.3307, -11.6536, -11.7394, -11.3915, -13.0776, -6.9492, -5.3695, -6.6033, -8.1033]], [[ 1.2136, -3.1583, -3.7706, -2.4989, -3.1839, -3.9106, -3.0158, -2.9428, -4.2675, -3.7301, -4.4047]], [[ -0.1686, -2.1319, -3.7030, -1.6200, -1.8779, -3.1007, -3.1846, -3.0331, -3.1629, -3.5076, -3.1299]], [[ -2.9740, -7.3784, -5.5324, -6.3890, -6.2563, -5.8117, -6.7878, -4.1721, -4.3759, -1.4653, -3.0854]], [[ -5.8467, -11.6042, -11.9435, -10.9475, -9.8911, -7.7879, -8.8187, -7.1165, -6.4550, -5.9441, -7.3994]], [[ -4.3542, -7.9165, -9.8769, -8.1878, -9.2331, -7.8705, -7.7294, -4.0614, -2.9115, -4.6648, -5.2928]], [[ -1.5298, -5.2313, -5.0715, -4.8147, -5.3567, -6.8567, -5.8352, -3.4125, 0.7975, -2.6510, -3.3010]], [[ -1.1111, -4.6799, -4.5074, -3.5040, -4.0735, -4.3832, -5.0533, -3.8614, -3.7355, -2.6088, -3.2207]], [[ -2.4488, -6.2275, -6.7997, -6.6339, -5.6844, -5.5117, -7.2140, -4.5527, -2.6632, -3.5756, -3.7022]]], [[[ 4.6078, 0.3416, -1.1292, -1.6191, -0.5588, -2.2514, 4.3638, 0.0770, -1.6902, -2.1101, 2.6091]], [[ -2.7791, -5.8605, -4.4596, -4.5863, -4.6713, -5.6473, -5.2072, -3.0337, -3.0135, -5.1550, -4.1500]], [[ -4.6623, -8.1146, -8.5102, -7.3782, -5.6878, -7.2853, -7.6160, -3.3319, -1.6272, -3.4352, -4.4928]], [[ -4.7289, -10.4078, -13.9073, -12.0000, -11.3079, -8.3241, -10.8937, -6.5183, -7.4681, -5.1599, -6.4023]], [[ 0.6556, -3.3164, -3.5198, -3.5357, -2.6338, -1.1154, -4.1983, -3.0757, -2.5470, -1.3662, -3.9742]], [[ -0.1297, -2.9287, -3.0293, -2.8976, -2.2369, -2.2528, -2.4260, -2.7590, -2.3714, -2.1193, -2.9859]], [[ -3.8395, -5.5537, -4.6412, -5.3526, -4.6541, -3.8077, -6.2197, -3.0298, -2.6033, -1.7301, -3.4835]], [[ -5.7404, -11.1071, -9.9657, -9.2867, -10.2001, -7.1662, -10.0201, -7.0314, -7.0203, -4.2429, -5.9940]], [[ -4.7207, -7.7842, -7.6050, -7.0226, -7.0785, -6.3925, -7.4997, -3.3686, -4.5837, -5.2197, -5.1403]], [[ -1.9459, -4.7290, -4.4162, -3.8542, -3.9171, -5.5841, -5.4651, -3.1911, -2.7089, -3.3184, -4.5658]], [[ -1.1158, -5.4540, -5.9063, -6.4903, -5.2652, -2.7728, -3.2272, -3.1440, -3.6870, -2.1350, -1.9072]], [[ -2.3499, -6.1727, -6.2008, -4.7840, -6.0865, -4.9981, -5.9222, -2.5883, -3.4830, -1.0103, -4.3520]]], [[[ 5.8887, 0.4696, -3.9345, -2.7473, 0.7326, -2.7643, -1.8781, -1.1300, -4.7941, -0.8803, 3.4073]], [[ -2.6795, -6.3533, -4.5995, -5.4240, -5.3234, -6.0767, -5.5482, -3.5024, -3.3419, -3.6281, -5.7446]], [[ -3.8579, -8.5016, -8.9424, -7.0386, -6.5292, -7.7161, -7.6913, -4.1003, -3.2975, -2.0583, -3.8705]], [[ -4.5337, -9.5779, -12.6344, -10.6190, -11.5030, -8.2710, -10.4015, -6.2192, -7.0369, -6.6751, -7.3290]], [[ 1.1991, -3.7770, -3.8282, -4.4419, -2.9878, -2.3614, -2.1555, -3.1701, -4.6430, -3.2887, -4.8947]], [[ 0.0151, -2.3068, -2.8723, -2.3372, -1.9787, -2.1157, -1.3142, -2.8237, -3.0654, -2.7239, -2.4009]], [[ -3.4890, -7.1329, -5.4325, -7.0904, -6.1050, -3.9350, -5.8699, -4.0332, -3.6527, -2.9064, -2.8944]], [[ -5.3846, -10.0950, -9.5844, -9.8134, -10.1134, -6.6232, -9.2230, -6.2044, -6.8903, -6.1615, -6.4984]], [[ -4.4627, -7.9047, -7.2734, -6.6188, -8.2563, -7.1629, -6.8675, -3.6657, -3.4432, -4.6608, -5.3878]], [[ -1.8828, -5.3995, -5.3046, -4.1498, -4.0452, -4.7118, -3.3840, -2.8642, -3.5851, -2.9461, -3.9813]], [[ -0.8766, -5.7341, -6.0428, -6.6740, -5.3491, -3.3283, -4.0312, -3.7122, -4.6742, -3.3956, -1.8956]], [[ -2.0537, -6.1693, -5.2026, -5.1863, -6.7208, -4.7800, -4.7362, -3.8162, -2.4662, -3.8940, -3.0888]]]]) attn_weights tensor([[[[-1.4202e+00, -8.6091e+00, -6.7980e+00, -6.2468e+00, -4.4402e+00, -7.4254e+00, -8.1296e+00, -4.8989e+00, -4.0679e+00, -3.9679e+00, -4.1532e+00]], [[-2.5455e+00, -5.2040e+00, -4.5295e+00, -4.5938e+00, -4.9122e+00, -3.6263e+00, -3.2149e+00, -1.1182e+00, -1.3422e+00, -2.1919e+00, -3.1475e+00]], [[ 3.1358e-02, -2.0800e+00, -3.2541e+00, -3.1407e+00, -4.3959e+00, -4.5737e+00, -3.7265e+00, -3.0096e+00, -3.7753e+00, -3.6585e+00, -3.3117e+00]], [[-1.6270e+00, -4.4404e+00, -3.1502e+00, -3.7677e+00, -2.8390e+00, -3.5799e+00, -3.5426e+00, -3.5008e+00, -1.2299e+00, -2.4194e+00, -4.0296e+00]], [[ 1.7845e+00, -1.9281e+00, -1.2757e+00, -1.3258e+00, -2.3546e+00, -2.5332e+00, -3.7709e+00, -2.1028e+00, -1.4821e+00, -1.5294e+00, -1.6154e+00]], [[-1.9461e+00, -6.6562e+00, -6.3550e+00, -5.9690e+00, -4.7601e+00, -7.7717e+00, -7.3584e+00, -4.9360e+00, -4.5128e+00, -4.4640e+00, -4.7896e+00]], [[-1.7707e+00, -4.9387e+00, -5.9867e+00, -5.7145e+00, -4.0651e+00, -3.7011e+00, -3.9648e+00, -4.1146e+00, -4.8513e+00, -4.5794e+00, -4.5707e+00]], [[ 6.5683e-01, -5.0974e+00, -2.8767e+00, -8.8908e-01, 6.7380e-01, -1.8740e+00, -2.5970e+00, -1.3209e+00, -1.8499e+00, -3.2611e-01, 1.6603e+00]], [[ 1.6598e+00, -2.6243e+00, -2.2329e+00, -1.3890e+00, -1.5345e+00, -2.4475e+00, -1.7127e+00, -1.5796e+00, -2.1288e+00, -1.8945e+00, -2.1549e+00]], [[-1.1283e+00, -2.6294e+00, -3.2632e+00, -2.4108e+00, -2.8369e+00, -3.0848e+00, -2.8261e+00, -2.4493e+00, -2.0663e+00, -1.5876e+00, -2.3107e+00]], [[ 1.4924e+00, -2.7674e+00, -3.4076e+00, -3.1864e+00, -3.3251e+00, -2.7707e+00, -2.7552e+00, -3.1777e+00, -3.5217e+00, -3.5366e+00, -3.1215e+00]], [[-6.2477e+00, -2.1620e+01, -1.3719e+01, -1.4904e+00, -7.0458e+00, -1.2228e+01, -1.5830e+01, -5.6276e+00, 1.2490e+00, 1.1485e+01, 7.2643e-02]]], [[[-2.0404e+00, -7.4163e+00, -7.0164e+00, -6.8149e+00, -7.7507e+00, -7.2564e+00, -9.1795e+00, -6.5776e+00, -4.8132e+00, -4.3716e+00, -4.3861e+00]], [[-2.4950e+00, -4.4384e+00, -5.5442e+00, -5.4422e+00, -5.4357e+00, -4.6582e+00, -5.2929e+00, -2.8474e+00, -3.2224e-01, -2.0985e+00, -2.2749e+00]], [[-1.8384e-01, -1.7749e+00, -2.9668e+00, -3.0477e+00, -4.0073e+00, -4.2086e+00, -4.2556e+00, -2.4398e+00, -2.5684e+00, -3.2424e+00, -3.2375e+00]], [[-1.9309e+00, -5.8660e+00, -4.0858e+00, -4.2942e+00, -4.4244e+00, -4.3554e+00, -4.2206e+00, -4.6050e+00, -3.0687e+00, -1.9770e+00, -2.1411e+00]], [[ 1.3466e+00, -1.7643e+00, -1.8836e-01, -2.3705e-03, -1.2988e+00, -3.4686e+00, -3.9378e+00, -1.9533e+00, -2.0792e+00, -3.6021e-01, -1.5526e-01]], [[-1.8462e+00, -5.6043e+00, -6.3013e+00, -6.4813e+00, -6.3376e+00, -7.8131e+00, -8.1641e+00, -4.7893e+00, -5.1665e+00, -3.9968e+00, -4.2956e+00]], [[-2.1073e+00, -4.8487e+00, -5.7109e+00, -6.0503e+00, -4.0898e+00, -4.2307e+00, -3.3716e+00, -4.3141e+00, -4.0691e+00, -4.4606e+00, -4.9592e+00]], [[ 9.6176e-01, -5.3493e+00, -3.4710e+00, -1.6391e-01, -1.6104e+00, -3.0038e+00, -4.6169e+00, -4.0146e+00, -2.3952e+00, -8.6996e-01, 1.0326e+00]], [[ 1.5003e+00, -2.1914e+00, -2.3825e+00, -2.2206e+00, -1.7871e+00, -3.2367e+00, -2.0369e+00, -2.1540e+00, -1.2729e+00, -2.3264e+00, -2.3721e+00]], [[-1.0556e+00, -3.1841e+00, -3.9335e+00, -4.5507e+00, -2.1850e+00, -4.5212e+00, -3.5012e+00, -3.3792e+00, -4.1193e+00, -3.4904e+00, -3.9772e+00]], [[ 1.2087e+00, -1.6881e+00, -2.2704e+00, -2.2763e+00, -2.6338e+00, -2.8618e+00, -3.2856e+00, -1.9064e+00, -1.0382e+00, -2.3003e+00, -2.8540e+00]], [[-7.5157e-01, -1.7217e+01, -9.2062e-01, -9.4465e+00, -1.5929e+01, -1.6027e+01, -2.7419e+01, -1.2923e+01, -1.5465e+00, 1.5926e+01, 7.1531e+00]]], [[[-2.1229e+00, -8.3231e+00, -7.9158e+00, -7.6513e+00, -7.8335e+00, -9.4810e+00, -8.9969e+00, -6.3705e+00, -5.6830e+00, -4.6851e+00, -5.3841e+00]], [[-2.4739e+00, -5.8177e+00, -5.9963e+00, -6.5670e+00, -6.4418e+00, -4.3612e+00, -7.1079e+00, -3.5338e+00, -1.6535e+00, -2.2651e+00, -2.3296e+00]], [[-3.2983e-03, -1.7818e+00, -2.6135e+00, -3.2911e+00, -4.2173e+00, -5.0066e+00, -3.6390e+00, -2.8445e+00, -3.5193e+00, -3.3094e+00, -3.7505e+00]], [[-2.4254e+00, -5.7234e+00, -5.2825e+00, -5.3617e+00, -5.0908e+00, -4.6547e+00, -4.2380e+00, -4.6558e+00, -4.1935e+00, -2.6770e+00, -4.0326e+00]], [[ 1.4440e+00, -2.4533e+00, -5.9810e-01, -1.3471e+00, -2.2768e+00, -3.4938e+00, -4.4894e+00, -2.2493e+00, -2.0008e+00, -1.3399e+00, -1.8185e+00]], [[-1.9309e+00, -6.7950e+00, -7.2643e+00, -7.8596e+00, -7.7361e+00, -8.5604e+00, -9.0157e+00, -5.1315e+00, -5.8393e+00, -4.3350e+00, -6.6802e+00]], [[-2.1285e+00, -5.5190e+00, -6.1677e+00, -5.5962e+00, -4.9003e+00, -4.1762e+00, -4.0161e+00, -4.7100e+00, -4.7907e+00, -4.3047e+00, -4.6337e+00]], [[ 8.3849e-01, -3.9570e+00, -2.0543e+00, 6.6841e-01, -1.5839e+00, -2.0905e+00, -3.4943e+00, -2.3268e+00, -1.4010e+00, 3.2285e-01, 1.3314e+00]], [[ 1.6877e+00, -3.1114e+00, -2.3608e+00, -2.3117e+00, -2.1960e+00, -2.6202e+00, -1.7329e+00, -2.2977e+00, -1.8739e+00, -2.1484e+00, -3.8371e+00]], [[-9.6063e-01, -4.1172e+00, -4.2325e+00, -4.7970e+00, -2.7075e+00, -2.6938e+00, -1.8416e+00, -3.2918e+00, -3.7696e+00, -2.4304e+00, -3.4671e+00]], [[ 1.5584e+00, -1.9058e+00, -2.8084e+00, -3.1164e+00, -3.0650e+00, -3.1255e+00, -4.6228e+00, -2.1968e+00, -1.8946e+00, -3.0434e+00, -4.3647e+00]], [[-3.6855e+00, -1.6094e+01, -2.3307e+00, -6.3169e+00, -1.1819e+01, -1.2986e+01, -2.6505e+01, -1.1994e+01, -7.9160e-02, 1.5547e+01, 4.2497e+00]]], [[[-3.0522e+00, -6.5650e+00, -6.4546e+00, -3.6271e+00, -4.4193e+00, -7.0774e+00, -6.7770e+00, -3.7034e+00, -3.9205e+00, -5.6867e+00, -5.5668e+00]], [[-2.4679e+00, -6.2479e+00, -4.8403e+00, -5.2688e+00, -5.6446e+00, -6.7030e+00, -5.7359e+00, -1.6242e+00, -2.4114e+00, -4.0293e+00, -3.7803e+00]], [[-2.3512e-01, -2.9423e+00, -3.3121e+00, -2.9933e+00, -3.2037e+00, -4.0661e+00, -4.0212e+00, -2.1063e+00, -3.4552e+00, -4.1053e+00, -4.0978e+00]], [[-2.3092e+00, -4.0736e+00, -3.7609e+00, -4.0287e+00, -4.2568e+00, -3.2533e+00, -5.5701e+00, -3.3741e+00, -3.9407e+00, -2.1441e+00, -3.1825e+00]], [[ 1.3450e+00, -2.2118e+00, -2.8458e+00, -3.9054e+00, -1.7373e+00, -6.1426e-01, -8.5858e-01, -9.3924e-01, -3.8055e-01, -8.4363e-01, -4.2268e-01]], [[-2.4521e+00, -5.8005e+00, -5.2653e+00, -5.6495e+00, -6.4642e+00, -5.6621e+00, -5.8603e+00, -3.3926e+00, -3.6577e+00, -2.4856e+00, -4.8863e+00]], [[-2.0358e+00, -4.2576e+00, -5.6920e+00, -5.1135e+00, -4.4957e+00, -3.2098e+00, -5.8027e+00, -3.5726e+00, -4.4379e+00, -2.9957e+00, -4.8591e+00]], [[ 2.6202e-02, -4.6855e+00, -3.3001e+00, -3.9272e+00, -3.5024e+00, -5.3895e-01, -9.5681e-01, -2.0675e+00, -2.1641e+00, 1.2023e+00, 1.4516e+00]], [[ 1.8086e+00, -4.5234e+00, -4.5304e+00, -4.0759e+00, -3.4028e+00, -9.2760e-01, -2.0158e+00, -1.4543e+00, -1.1222e+00, -1.8786e+00, -2.5287e+00]], [[-1.0739e+00, -4.1194e+00, -4.4248e+00, -4.1617e+00, -3.1299e+00, -5.2934e+00, -4.4977e+00, -3.1802e+00, -3.4395e+00, -3.9108e+00, -4.4412e+00]], [[ 1.1041e+00, -3.6748e+00, -3.3690e+00, -3.9111e+00, -3.0937e+00, -3.4750e+00, -1.5515e+00, -2.8460e+00, -2.8585e+00, -4.3447e+00, -2.7577e+00]], [[-1.6652e+00, -1.4471e+01, -2.3955e+01, -2.7933e+01, -2.1762e+01, -7.6523e-01, -1.1287e+01, -8.6022e+00, -6.9766e+00, 1.8131e+01, 5.7024e+00]]], [[[-3.2590e+00, -7.3258e+00, -6.2600e+00, -3.6091e+00, -3.5000e+00, -6.3517e+00, -5.3524e+00, -3.9580e+00, -4.8318e+00, -3.3120e+00, -4.9018e+00]], [[-2.2913e+00, -5.9511e+00, -4.9200e+00, -5.0805e+00, -6.1078e+00, -5.2960e+00, -5.1740e+00, -2.6248e+00, -1.2145e+00, -2.4708e+00, -3.6003e+00]], [[-1.9713e-02, -3.5513e+00, -4.0108e+00, -3.2709e+00, -3.1096e+00, -2.7788e+00, -2.6148e+00, -2.2130e+00, -2.8194e+00, -2.5758e+00, -3.9276e+00]], [[-2.1364e+00, -5.6527e+00, -3.0925e+00, -2.9790e+00, -4.9349e+00, -2.5774e+00, -3.8120e+00, -4.1590e+00, -4.0854e+00, -5.4292e+00, -3.2206e+00]], [[ 1.5200e+00, -2.9924e+00, -3.8388e+00, -2.3234e+00, -1.2555e+00, -1.8298e+00, -3.1748e+00, -2.1965e+00, -2.6984e+00, -9.6051e-01, -7.2334e-01]], [[-1.8226e+00, -6.2592e+00, -5.7490e+00, -5.7455e+00, -6.5106e+00, -5.8353e+00, -5.3156e+00, -3.5432e+00, -5.0218e+00, -4.4920e+00, -3.5704e+00]], [[-2.0070e+00, -4.7623e+00, -4.4004e+00, -4.8560e+00, -4.4988e+00, -2.5163e+00, -3.8963e+00, -4.0034e+00, -3.8612e+00, -3.9703e+00, -4.2086e+00]], [[ 6.4481e-02, -5.2342e+00, -3.5337e+00, -3.4003e+00, -1.6761e+00, -1.5615e-01, -2.7766e+00, -3.2078e+00, -2.8170e+00, -1.4888e+00, 7.9138e-01]], [[ 1.8692e+00, -4.3540e+00, -4.8999e+00, -3.3727e+00, -3.2831e+00, -2.7828e-01, -1.6818e+00, -2.4890e+00, -2.2189e+00, -1.5932e+00, -2.4592e+00]], [[-1.1383e+00, -3.9172e+00, -3.7168e+00, -3.7481e+00, -2.6511e+00, -2.8941e+00, -1.4472e+00, -3.4676e+00, -4.4282e+00, -2.5721e+00, -3.0925e+00]], [[ 1.3265e+00, -4.6601e+00, -4.1783e+00, -4.9870e+00, -2.9244e+00, -3.6588e+00, -2.3606e+00, -4.1550e+00, -4.0476e+00, -2.7099e+00, -3.2988e+00]], [[-5.0103e+00, -1.4652e+01, -1.5702e+01, -1.4318e+01, -4.6955e+00, -4.4836e+00, -1.9108e+01, -8.6864e+00, -3.2794e-01, 1.3909e+01, -5.2829e-01]]]]) attn_weights tensor([[[[ 2.1583e+00, -3.5417e+00, -5.9781e+00, -6.1771e+00, -3.1164e+00, -1.1603e+00, -4.4169e-02, 7.9757e-01, -1.8858e+00, -4.3037e+00, -1.3282e+00]], [[ 4.2291e+00, -8.6734e+00, -8.6176e+00, -7.6106e+00, -4.4179e+00, -1.2393e+00, -6.1683e+00, -4.9559e+00, -5.8654e+00, -6.7785e+00, -3.0629e+00]], [[ 2.1816e-01, -3.2669e+00, -2.9599e+00, -3.4797e+00, -4.5073e+00, -3.4317e+00, -3.4685e+00, -3.1235e+00, -1.1954e+00, -2.2157e+00, -3.0822e+00]], [[-2.3291e-01, -2.2344e-01, -1.0659e+00, -1.0274e+00, -1.4638e+00, -2.3454e+00, -1.4278e+00, -3.7451e-01, 4.8822e-01, -4.2647e-01, -9.0924e-01]], [[-8.9219e-03, -4.1364e+00, -4.2612e+00, -4.0994e+00, -3.2148e+00, -1.8822e+00, -1.9004e+00, -1.4402e+00, -1.6646e+00, -1.8053e+00, -1.2547e+00]], [[ 2.1647e+00, -4.7805e+00, -3.3359e+00, -2.6265e+00, -3.1091e+00, -1.9291e+00, -3.2960e+00, -2.5006e+00, -2.4004e+00, -3.5816e+00, -3.5405e+00]], [[ 1.2151e+00, -5.6832e+00, -5.0486e+00, -3.2293e+00, -2.3572e+00, -2.3817e+00, -4.1586e+00, -2.8640e+00, -1.8982e+00, -1.5278e+00, -2.9941e+00]], [[ 1.0843e+00, -4.3317e+00, -5.3709e+00, -4.1089e+00, -3.2507e+00, -2.1629e+00, -1.5785e+00, -3.6799e+00, -3.3050e+00, -2.5019e+00, -1.8979e+00]], [[ 9.2363e-01, -3.7176e+00, -4.3809e+00, -4.1437e+00, -2.9435e+00, -1.5864e+00, -1.2178e+00, -8.9061e-01, -2.3508e+00, -3.3253e+00, -2.8609e+00]], [[ 1.0384e+00, -2.8370e+00, -3.7936e+00, -3.7036e+00, -2.0800e+00, -2.3224e+00, -1.0551e+00, -1.7895e+00, -3.3857e+00, -4.2304e+00, -4.6520e+00]], [[ 2.3198e+00, 5.0107e-01, 9.1203e-01, 4.0473e-01, 3.9341e-01, -1.8751e-01, 2.7052e+00, 1.1609e+00, 6.6544e-01, -3.6071e-01, 1.2632e-01]], [[ 1.1853e+00, -3.2416e+00, -3.4424e+00, -1.5411e+00, -1.3843e+00, -3.3961e+00, -3.2924e+00, -2.5797e+00, -3.0527e+00, -1.2838e+00, -1.0310e+00]]], [[[ 1.8538e+00, -4.9299e+00, -4.0049e+00, -3.9729e+00, -7.0870e-02, -3.7730e-01, -2.3851e+00, -2.2042e+00, -3.9629e-01, -1.7718e+00, -2.8130e+00]], [[ 4.3539e+00, -9.8609e+00, -7.6925e+00, -4.6808e+00, 2.4417e+00, -1.9100e-01, -9.2677e+00, -9.5328e+00, -5.3616e+00, -2.0630e+00, -1.4458e+00]], [[ 1.4120e-02, -2.9015e+00, -2.5677e+00, -3.7729e+00, -2.2346e+00, -2.9882e+00, -2.8215e+00, -3.3389e+00, -3.1834e+00, -2.1198e+00, -3.3705e+00]], [[-1.0881e-01, -6.8719e-01, -1.5270e+00, -1.7738e+00, -2.2969e+00, -1.8506e+00, -1.5763e+00, -1.9398e+00, -6.0889e-01, -1.1574e+00, -1.5021e+00]], [[-2.7796e-01, -4.5172e+00, -5.8706e+00, -6.0186e+00, -3.3707e+00, -3.2913e+00, -2.4118e+00, -2.9228e+00, -2.2188e+00, -2.9082e+00, -2.8496e+00]], [[ 1.8276e+00, -4.5924e+00, -3.2832e+00, -3.2181e+00, 8.0753e-01, -7.1265e-01, -4.2937e+00, -2.7216e+00, -1.3917e+00, -2.6813e+00, -3.8536e+00]], [[ 1.0989e+00, -4.2858e+00, -3.1399e+00, -4.7465e+00, -4.4562e+00, -3.9243e+00, -5.8554e+00, -3.6066e+00, -1.1318e-01, 3.5161e-01, -2.1627e+00]], [[ 7.0098e-01, -3.5922e+00, -5.6904e+00, -6.1977e+00, -4.5179e+00, -4.2272e+00, -2.9194e+00, -4.6351e+00, -3.4446e+00, -4.1973e+00, -4.3594e+00]], [[ 9.3686e-01, -4.8888e+00, -4.1962e+00, -4.3762e+00, 9.2183e-01, -9.2100e-01, -2.8398e+00, -2.2423e+00, -2.2529e+00, -2.2683e+00, -3.1212e+00]], [[ 6.2582e-01, -2.5291e+00, -2.9094e+00, -3.1945e+00, -2.0512e+00, -1.7005e+00, -1.7780e+00, -1.9064e+00, -2.1445e+00, -2.6524e+00, -3.5066e+00]], [[ 1.5686e+00, -7.9059e-01, -4.4836e-01, -6.5338e-01, 7.4027e-01, -5.2518e-01, 1.6720e+00, 1.6882e+00, -9.8733e-01, -1.5620e-01, -1.0791e+00]], [[ 1.0459e+00, -3.2219e+00, -3.1367e+00, -5.6987e-01, -6.7379e-01, -3.1483e+00, -3.6489e+00, -2.6949e+00, -1.8850e+00, -1.7410e+00, 5.4129e-01]]], [[[ 2.4157e+00, -4.1676e+00, -4.3321e+00, -3.2931e+00, -4.9676e-01, -1.1582e+00, -1.7252e+00, -1.4879e+00, -2.6163e+00, -1.0547e+00, -1.6464e+00]], [[ 4.8188e+00, -9.6656e+00, -6.3176e+00, -3.0654e+00, -3.5869e+00, -6.0360e+00, -1.1420e+01, -1.1707e+01, -7.0346e+00, -5.7205e+00, -2.3229e+00]], [[ 2.1686e-01, -2.8631e+00, -3.1897e+00, -4.0482e+00, -3.2392e+00, -2.6932e+00, -3.2172e+00, -3.2021e+00, -2.5977e+00, -1.2750e+00, -2.4096e+00]], [[-1.6386e-01, -1.6605e+00, -2.0565e+00, -2.1639e+00, -2.3960e+00, -2.1305e+00, -2.4828e+00, -1.7660e+00, -9.6095e-01, -8.5365e-01, -1.9985e+00]], [[-5.0578e-01, -4.7983e+00, -5.9630e+00, -4.8071e+00, -3.7804e+00, -3.1836e+00, -2.3115e+00, -3.3479e+00, -1.3448e+00, -2.1196e+00, -2.0226e+00]], [[ 1.8286e+00, -4.6360e+00, -2.7186e+00, -2.2571e+00, -2.0373e+00, -1.7277e+00, -4.4051e+00, -3.6663e+00, -2.0235e+00, -2.9551e+00, -3.1858e+00]], [[ 1.1045e+00, -3.3390e+00, -2.4460e+00, -3.3814e+00, -2.8151e+00, -2.6267e+00, -6.4014e+00, -3.9597e+00, -1.9850e+00, 4.5977e-01, -2.1785e+00]], [[ 9.1308e-01, -4.3272e+00, -6.2944e+00, -6.9791e+00, -4.9556e+00, -4.5449e+00, -6.0568e-01, -4.1605e+00, -2.1775e+00, -3.8647e+00, -2.4340e+00]], [[ 6.6324e-01, -3.8629e+00, -4.3156e+00, -3.3412e+00, -1.5258e+00, -3.3933e+00, -4.7233e+00, -4.0225e+00, -3.4072e+00, -3.0430e+00, -3.1297e+00]], [[ 8.2946e-01, -2.7982e+00, -3.2829e+00, -3.3298e+00, -2.8563e+00, -2.2726e+00, -2.5159e+00, -2.4563e+00, -3.2760e+00, -2.8334e+00, -4.3245e+00]], [[ 1.9162e+00, -1.2524e+00, -1.0755e+00, -1.2710e+00, -4.4239e-01, -5.3136e-01, 1.1551e+00, 1.0616e+00, -1.2112e+00, -1.1508e+00, -2.3522e+00]], [[ 8.9684e-01, -3.8314e+00, -3.3426e+00, -2.2409e+00, -2.7412e+00, -2.9647e+00, -4.9443e+00, -3.7141e+00, -2.4878e+00, -2.5144e+00, -1.4684e+00]]], [[[ 1.9731e+00, -7.6471e+00, -7.1070e+00, -5.7929e+00, -7.0159e+00, -4.2189e+00, -2.4187e+00, 3.1634e-01, -2.4970e+00, -2.8281e+00, -3.4586e+00]], [[ 4.3475e+00, -1.8250e+01, -1.5224e+01, -1.0938e+01, -1.1656e+01, -7.0276e+00, -5.9861e+00, 2.7009e+00, -9.7688e-01, -4.0988e+00, -2.3229e+00]], [[ 1.6645e-02, -2.7948e+00, -4.7602e+00, -3.8023e+00, -1.8245e+00, -2.9585e+00, -3.9488e+00, -2.5262e+00, -1.1299e+00, -1.6191e+00, -3.3728e+00]], [[-1.4304e-01, -1.0964e+00, -2.1410e+00, -1.3530e+00, -1.4433e+00, -1.9135e+00, -2.1819e+00, -8.1666e-01, -4.1362e-01, -1.2650e+00, -1.6618e+00]], [[-4.0378e-01, -3.4842e+00, -3.8019e+00, -3.8496e+00, -3.4024e+00, -3.3821e+00, -2.9701e+00, -7.4480e-01, -6.4868e-01, -2.3475e+00, -2.2014e+00]], [[ 2.2594e+00, -1.1835e+01, -8.7625e+00, -6.1219e+00, -5.3988e+00, -3.1631e+00, -4.3119e+00, 3.1903e+00, 1.2488e+00, -1.1511e+00, -3.0668e+00]], [[ 9.0652e-01, -8.2010e+00, -9.1288e+00, -8.5523e+00, -7.3750e+00, -2.7219e+00, -4.0309e+00, -4.0863e+00, -3.6619e+00, 1.5752e+00, -3.5407e-01]], [[ 1.1601e+00, -4.9748e+00, -5.7984e+00, -6.6451e+00, -3.7393e+00, -4.7874e+00, -3.1878e+00, -3.6274e+00, -2.5821e+00, -1.9068e+00, -2.6014e+00]], [[ 6.1184e-01, -8.0592e+00, -7.4307e+00, -5.8431e+00, -6.2002e+00, -4.7546e+00, -4.1477e+00, 1.0382e+00, -5.5178e-01, -3.2716e+00, -4.4051e+00]], [[ 6.7746e-01, -3.4095e+00, -3.8543e+00, -3.0099e+00, -2.3946e+00, -8.4105e-01, -2.1833e+00, -7.8690e-01, -2.1924e+00, -2.8583e+00, -3.3097e+00]], [[ 2.8044e+00, -1.3573e+00, -8.6662e-01, 1.1840e-01, -4.7920e-01, -4.6382e-01, 1.7186e+00, 1.2503e+00, -9.0522e-01, 2.5241e-01, 8.4786e-01]], [[ 8.2130e-01, -3.2898e+00, -3.4967e+00, -3.8042e+00, -3.1977e+00, -2.5086e+00, -2.4435e+00, -1.5974e+00, -2.0595e+00, -2.0259e+00, -2.0140e+00]]], [[[ 2.4167e+00, -6.0602e+00, -6.8811e+00, -5.9327e+00, -5.9152e+00, -3.9682e+00, 8.3261e-01, -5.4867e-01, -2.9712e+00, -1.2929e+00, -1.0346e+00]], [[ 4.2475e+00, -1.5371e+01, -1.3459e+01, -1.1165e+01, -1.2254e+01, -6.7655e+00, -4.4121e+00, -4.3062e+00, -4.7726e+00, -3.2350e+00, -1.1636e+00]], [[ 2.6397e-01, -3.2868e+00, -4.3200e+00, -3.1399e+00, -2.2401e+00, -4.3840e+00, -3.3615e+00, -2.8366e+00, -2.3530e+00, -2.0135e+00, -4.0527e+00]], [[ 3.4405e-01, -2.2825e+00, -2.7702e+00, -2.3945e+00, -2.8357e+00, -2.5956e+00, -2.5518e+00, -2.0985e+00, -1.4671e+00, -1.9752e+00, -2.8626e+00]], [[-2.8131e-01, -4.3644e+00, -4.0810e+00, -3.6563e+00, -3.7229e+00, -2.8888e+00, -2.6513e+00, -1.7332e+00, -6.7680e-01, -1.7146e+00, -2.7225e+00]], [[ 2.1290e+00, -1.0930e+01, -7.0054e+00, -7.8874e+00, -8.0313e+00, -4.3961e+00, -4.8281e+00, -3.9428e+00, -3.9633e+00, -2.9974e+00, -1.8965e+00]], [[ 8.8678e-01, -4.7092e+00, -4.3279e+00, -4.1130e+00, -1.7997e+00, -1.5872e+00, -4.7732e+00, -3.0726e+00, -1.7408e+00, 2.9633e-01, -7.9392e-01]], [[ 1.3941e+00, -4.8702e+00, -5.8049e+00, -5.8605e+00, -3.0632e+00, -2.3803e+00, -9.7205e-01, -3.9848e+00, -3.6261e+00, -2.0542e+00, -2.2103e+00]], [[ 6.9472e-01, -6.8281e+00, -6.1784e+00, -5.8225e+00, -7.0067e+00, -4.2191e+00, -2.8739e+00, -2.4765e+00, -2.3422e+00, -3.5379e+00, -2.9483e+00]], [[ 1.2212e+00, -3.5735e+00, -4.0502e+00, -3.5454e+00, -2.6274e+00, -1.5269e+00, -2.8191e+00, -1.8076e+00, -3.4458e+00, -4.2491e+00, -5.8138e+00]], [[ 3.1652e+00, -1.0274e+00, -7.7135e-01, 6.0298e-01, 4.1150e-01, -1.7462e+00, 1.4201e-01, 8.0090e-01, -1.3616e+00, -1.5606e+00, 6.3606e-01]], [[ 9.5286e-01, -3.7976e+00, -3.9677e+00, -4.3168e+00, -3.7374e+00, -3.6090e+00, -3.1529e+00, -2.4678e+00, -3.7425e+00, -2.5883e+00, -2.5252e+00]]]]) attn_weights tensor([[[[-1.2085e+00, -3.1768e+00, -2.7964e+00, -2.2743e+00, -3.5265e+00, -3.8210e+00, -2.9640e+00, -2.0368e+00, -8.0049e-01, -5.6637e-01, -2.3260e+00]], [[ 5.5095e-02, -3.9966e+00, -4.7059e+00, -5.5957e+00, -3.2472e+00, -2.1641e+00, -1.1127e+00, -3.0318e+00, -3.8550e+00, -5.2643e+00, -2.0446e+00]], [[ 1.6490e-01, -2.9083e+00, -3.4111e+00, -3.5712e+00, -3.7484e+00, -3.7996e+00, -3.3389e+00, -2.5970e+00, -2.9724e+00, -3.6741e+00, -2.8166e+00]], [[ 3.0272e-01, -2.1288e+00, -4.1224e+00, -3.3203e+00, -2.1209e+00, -2.2191e+00, -2.1475e+00, -1.5000e+00, -3.4977e+00, -3.4248e+00, -2.9597e+00]], [[ 1.1264e+00, -8.2795e-01, -1.4998e+00, -1.3884e+00, -1.3968e+00, -2.1110e+00, -1.2293e+00, -7.8196e-01, -2.3446e+00, -2.6165e+00, -1.5461e+00]], [[-6.6449e-01, -3.2144e+00, -4.1410e+00, -3.4609e+00, -4.0969e+00, -4.5873e+00, -4.7607e+00, -3.5707e+00, -2.6914e+00, -2.1233e+00, -2.8352e+00]], [[ 2.2298e+00, -3.6836e+00, -3.1199e+00, -3.1169e+00, -2.2199e+00, -2.2797e+00, -2.3146e+00, -1.7631e+00, -1.6185e+00, -2.0526e+00, -6.4700e-01]], [[-3.6280e-01, -3.8022e+00, -4.6298e+00, -3.9928e+00, -3.6585e+00, -2.3880e+00, -1.3869e+00, -2.5523e+00, -4.1199e+00, -3.4084e+00, -2.7928e+00]], [[-1.2111e+00, -5.8543e+00, -5.1808e+00, -5.1750e+00, -6.9391e+00, -4.9817e+00, -5.0971e+00, -3.9147e+00, -2.4510e+00, -2.4472e+00, -3.8328e+00]], [[ 5.1268e+00, -5.0172e+00, -3.9920e+00, -3.5705e+00, -1.9044e+00, -3.3855e-01, -6.9160e+00, -3.8998e+00, -5.2548e+00, -4.5826e+00, -2.0826e+00]], [[ 2.9100e+00, -4.3415e+00, -3.0836e+00, -2.8910e+00, -1.3896e+00, -1.3830e+00, -4.3455e-01, -3.9335e-01, -6.0146e-01, -1.2884e+00, 5.1920e-01]], [[-5.1556e-01, -3.2072e+00, -3.5089e+00, -3.4164e+00, -3.2529e+00, -2.6799e+00, -2.5120e+00, -6.9989e-01, -3.0539e-01, -6.4422e-01, -1.9510e+00]]], [[[-1.1198e+00, -3.3500e+00, -2.7919e+00, -3.7699e+00, -3.8163e+00, -4.6452e+00, -4.2221e+00, -4.3817e+00, -2.9645e+00, -1.5060e+00, -3.0486e+00]], [[-4.3894e-01, -3.4899e+00, -4.0380e+00, -4.3858e+00, -2.6429e+00, -1.9223e+00, -2.6049e+00, -3.4410e+00, -2.4337e+00, -2.7424e+00, -3.5702e+00]], [[ 1.4171e-01, -2.7297e+00, -2.8087e+00, -3.1985e+00, -3.7451e+00, -3.8300e+00, -3.2896e+00, -2.2275e+00, -2.7635e+00, -3.0719e+00, -3.7016e+00]], [[-1.4311e-01, -2.7256e+00, -4.3439e+00, -3.2643e+00, -1.2953e+00, -2.0721e+00, -1.6480e+00, -9.6630e-01, -9.8489e-01, -3.2667e+00, -3.1059e+00]], [[ 6.2466e-01, -7.5587e-01, -1.4779e+00, -1.2707e+00, -1.0085e+00, -2.4402e+00, -1.4035e+00, -8.1421e-01, -1.4715e+00, -2.2172e+00, -2.5036e+00]], [[-8.2264e-01, -4.3123e+00, -4.6641e+00, -4.3379e+00, -4.4365e+00, -4.6059e+00, -4.0247e+00, -4.7393e+00, -3.9579e+00, -2.8781e+00, -2.9070e+00]], [[ 1.9447e+00, -2.7506e+00, -1.3482e+00, -2.8059e-01, -5.4017e-01, -2.2023e+00, -2.7956e+00, -1.3253e+00, -5.3500e-01, 5.7540e-01, 7.5184e-01]], [[-7.2539e-01, -3.7671e+00, -4.5191e+00, -4.1848e+00, -3.6183e+00, -1.5673e+00, -5.8397e-01, -2.1114e+00, -3.2199e+00, -4.0693e+00, -3.6554e+00]], [[-1.8971e+00, -4.0788e+00, -2.8124e+00, -5.5686e+00, -4.6230e+00, -4.0202e+00, -4.8052e+00, -3.8190e+00, -1.6378e+00, -1.4948e+00, -4.0786e+00]], [[ 4.1327e+00, -5.7626e+00, -5.2990e+00, -3.0640e+00, 2.1532e+00, -9.7820e-02, -5.7689e+00, -4.8100e+00, -4.1660e+00, -2.3963e+00, -2.0938e+00]], [[ 2.5394e+00, -3.3908e+00, -2.7668e+00, -2.9976e+00, -1.5457e+00, -1.3294e+00, -8.8225e-01, -1.3143e+00, -8.8117e-01, -2.8556e-01, -6.2733e-01]], [[-6.8845e-01, -2.5510e+00, -3.9320e+00, -5.6004e+00, -4.4346e+00, -4.3787e+00, -3.4942e+00, -3.6728e+00, -1.1553e+00, -1.7864e+00, -3.2559e+00]]], [[[-1.0466e+00, -3.5773e+00, -2.5581e+00, -4.1173e+00, -4.1022e+00, -5.6310e+00, -5.0240e+00, -4.9407e+00, -2.9038e+00, -1.4729e+00, -3.7723e+00]], [[-1.0878e-01, -3.3339e+00, -4.2300e+00, -3.0195e+00, -2.1844e+00, -1.8537e+00, -2.1285e+00, -2.8603e+00, -4.7238e+00, -3.2821e+00, -4.8252e+00]], [[ 2.5050e-01, -3.2644e+00, -2.5837e+00, -3.4697e+00, -3.3541e+00, -3.9060e+00, -3.6857e+00, -2.8983e+00, -3.1228e+00, -2.8534e+00, -4.3782e+00]], [[-1.5100e-01, -2.7829e+00, -3.8691e+00, -3.0490e+00, -1.5311e+00, -2.3046e+00, -1.9019e+00, -1.3388e+00, -1.1656e+00, -2.5851e+00, -3.1026e+00]], [[ 1.3524e+00, -1.1663e+00, -2.3170e+00, -1.9419e+00, -1.7103e+00, -3.8274e+00, -1.4873e+00, -1.1565e+00, -1.0637e+00, -2.0549e+00, -1.6145e+00]], [[-7.0593e-01, -3.3606e+00, -4.5458e+00, -3.8957e+00, -4.4303e+00, -4.6417e+00, -3.8843e+00, -4.1499e+00, -2.8675e+00, -3.4265e+00, -3.2430e+00]], [[ 1.9542e+00, -2.5431e+00, -8.9041e-01, -8.9402e-01, -1.7906e+00, -2.7486e+00, -3.6310e+00, -2.0612e+00, -7.5919e-01, 9.1847e-02, -3.3385e-01]], [[-1.1714e+00, -3.0582e+00, -3.7750e+00, -3.1894e+00, -2.5589e+00, -2.0896e+00, -7.7271e-01, -1.6448e+00, -3.1515e+00, -3.0047e+00, -2.8203e+00]], [[-1.6650e+00, -5.2324e+00, -5.4931e+00, -7.4733e+00, -6.0124e+00, -4.8812e+00, -5.2341e+00, -4.4225e+00, -3.3126e+00, -3.1829e+00, -5.0558e+00]], [[ 4.4254e+00, -6.3664e+00, -5.1940e+00, -1.3626e+00, -1.0431e+00, -1.7718e+00, -6.5462e+00, -5.4438e+00, -4.2582e+00, -4.4347e+00, -1.3373e+00]], [[ 2.9191e+00, -2.9141e+00, -2.8392e+00, -3.0926e+00, -2.2836e+00, -3.1723e+00, -1.7666e+00, -1.7469e+00, -9.8630e-01, -3.0974e-01, -7.2177e-01]], [[-5.2007e-01, -2.4571e+00, -3.6841e+00, -5.5583e+00, -4.4501e+00, -4.3541e+00, -3.5829e+00, -3.7155e+00, -2.7202e+00, -2.1540e+00, -2.8746e+00]]], [[[-1.8001e+00, -3.2467e+00, -2.7670e+00, -2.3512e+00, -1.1144e+00, -3.7615e+00, -4.0605e+00, -1.2114e+00, -1.1991e+00, -2.7552e+00, -4.0750e+00]], [[-6.2000e-01, -4.3252e+00, -2.9834e+00, -2.8137e+00, -3.2551e+00, -3.1801e+00, -2.3714e+00, -7.9262e-01, -2.8144e+00, -2.5153e+00, -3.6072e+00]], [[ 3.8240e-01, -2.5918e+00, -2.7615e+00, -3.1554e+00, -2.8787e+00, -3.4514e+00, -3.1604e+00, -2.0285e+00, -2.6961e+00, -3.5417e+00, -3.4467e+00]], [[ 2.4905e-01, -3.5644e+00, -5.4068e+00, -4.5728e+00, -3.2654e+00, -3.9190e+00, -3.8255e+00, -3.1259e+00, -3.5430e+00, -3.4698e+00, -4.6290e+00]], [[ 1.8105e+00, -2.3362e+00, -2.8459e+00, -3.0974e+00, -2.5078e+00, -1.6514e+00, -9.4919e-01, -1.3071e+00, -1.9005e+00, -1.8748e+00, -2.5365e+00]], [[-4.9425e-01, -3.6494e+00, -3.9633e+00, -4.1005e+00, -4.2560e+00, -3.7783e+00, -3.8082e+00, -2.9659e+00, -2.7786e+00, -2.5453e+00, -2.3005e+00]], [[ 1.9529e+00, -3.1713e+00, -3.2840e+00, -3.9480e+00, -2.7265e+00, -1.1593e+00, 3.1233e-05, -4.7515e-01, -1.0920e+00, -8.5678e-01, 4.3787e-01]], [[-2.7901e-01, -3.2972e+00, -3.5810e+00, -3.3692e+00, -4.1774e+00, -2.8104e+00, -2.5846e+00, -3.2082e+00, -3.5022e+00, -4.6935e-01, -2.1032e+00]], [[-1.3360e+00, -5.3671e+00, -6.2003e+00, -6.3949e+00, -3.9230e+00, -4.5541e+00, -5.4985e+00, -2.6738e+00, -1.8515e+00, 1.7920e-01, -3.5881e+00]], [[ 4.3236e+00, -1.5363e+01, -1.0385e+01, -7.9278e+00, -6.6851e+00, -3.0104e+00, -2.9114e+00, 2.9039e+00, 1.1419e+00, -9.2601e-02, -3.2330e+00]], [[ 2.9299e+00, -4.2394e+00, -3.0597e+00, -3.0380e+00, -2.8894e+00, -2.4976e+00, -1.6007e+00, -2.1575e+00, -1.4779e+00, -1.6223e+00, -1.4275e-01]], [[-7.1494e-01, -3.2396e+00, -3.5132e+00, -2.2396e+00, -2.2233e+00, -4.6801e+00, -3.6334e+00, -1.0607e+00, -9.9405e-01, -2.4796e+00, -2.5850e+00]]], [[[-1.3764e+00, -5.3878e+00, -4.0420e+00, -3.6923e+00, -2.0909e+00, -4.6154e+00, -4.1004e+00, -3.2054e+00, -1.7336e+00, -7.7492e-01, -3.6042e+00]], [[ 1.3685e-01, -4.8232e+00, -4.6933e+00, -4.0263e+00, -2.7880e+00, -2.3181e+00, -3.4399e-01, -1.0472e+00, -3.9253e+00, -3.3872e+00, -2.8353e+00]], [[ 4.4100e-01, -3.5847e+00, -3.6332e+00, -4.0980e+00, -3.8067e+00, -3.6239e+00, -3.2802e+00, -2.5982e+00, -3.4352e+00, -3.5505e+00, -3.3939e+00]], [[ 7.4079e-01, -3.5155e+00, -4.5949e+00, -3.8611e+00, -3.1636e+00, -3.5183e+00, -3.8348e+00, -3.1381e+00, -3.6345e+00, -4.0042e+00, -4.2046e+00]], [[ 1.9926e+00, -3.7008e+00, -2.9022e+00, -3.5250e+00, -2.1978e+00, -1.0480e+00, -2.7796e-01, -1.4829e+00, -3.4498e+00, -2.2065e+00, -5.7281e-01]], [[-2.3835e-01, -4.6251e+00, -5.3536e+00, -5.1754e+00, -3.9873e+00, -3.9514e+00, -4.4270e+00, -3.5376e+00, -2.0086e+00, -2.0952e+00, -3.4017e+00]], [[ 2.2861e+00, -3.9280e+00, -4.4602e+00, -4.6258e+00, -2.9038e+00, -2.0892e+00, -1.7881e+00, -1.9486e+00, -2.9404e+00, -2.4146e+00, -5.0444e-01]], [[-3.4230e-02, -2.9396e+00, -3.2082e+00, -2.7232e+00, -2.3439e+00, -2.8003e+00, -1.9553e+00, -2.8428e+00, -4.2410e+00, -3.6476e+00, -2.1654e+00]], [[-1.0777e+00, -6.5219e+00, -6.3532e+00, -6.3235e+00, -5.1544e+00, -4.6019e+00, -4.7207e+00, -5.0849e+00, -3.1633e+00, -2.0021e+00, -3.1029e+00]], [[ 4.6451e+00, -1.3504e+01, -6.2178e+00, -6.3668e+00, -6.6664e+00, -2.3568e+00, -1.8560e+00, -1.5072e+00, -1.7545e+00, -2.1793e+00, -1.5847e+00]], [[ 3.0568e+00, -4.3320e+00, -3.8195e+00, -4.5191e+00, -3.6788e+00, -2.5916e+00, -1.1663e+00, -1.9745e+00, -2.3493e+00, -2.3437e+00, -1.8651e+00]], [[-4.1407e-01, -3.7690e+00, -4.1342e+00, -3.5819e+00, -2.6811e+00, -4.5011e+00, -3.4834e+00, -2.6377e+00, -8.5527e-01, -1.3925e+00, -2.8946e+00]]]]) attn_weights tensor([[[[-0.5412, -6.3222, -5.6413, -4.6081, -4.9095, -5.5273, -5.7715, -3.4123, -2.4725, -1.1748, -3.7793]], [[ 3.0976, -1.6562, -1.3826, -2.0793, -1.9341, 0.1887, 1.2175, -0.0956, -0.3984, -0.9745, -0.1248]], [[ 6.5577, -3.4935, -4.3256, -3.6838, -0.5415, 0.7955, -2.0988, -1.6899, -4.3602, -3.7292, 0.7719]], [[ 0.2893, -3.7881, -4.0228, -3.8553, -3.2616, -3.0814, -2.2861, -1.3447, -2.0015, -2.1577, -2.3646]], [[ 0.9619, -4.6077, -4.0718, -4.0681, -5.5308, -3.7918, -3.5683, -3.0652, -3.0537, -3.4758, -2.7053]], [[ 0.5351, -1.3691, -1.2474, -0.8719, -1.1088, -3.6986, -1.2986, -0.2896, -1.8513, -1.7656, -2.4292]], [[ 1.2531, -2.6735, -3.5872, -3.4825, -3.2117, -1.6559, -1.1507, -1.9540, -3.0100, -2.6782, -1.9491]], [[ 2.4451, -3.2698, -2.8432, -3.1270, -1.7556, -0.2534, -0.0095, 1.6414, -0.7837, -1.7197, 0.6668]], [[ 0.2538, -5.1471, -3.9984, -4.2367, -4.3068, -2.9487, -2.4314, -3.5045, -3.6014, -4.0866, -3.0072]], [[ 0.0304, -2.1327, -2.6269, -2.7485, -4.6175, -3.7471, -2.6368, -1.6949, -1.9226, -1.6910, -2.8818]], [[ 4.3261, -3.6195, -3.9441, -3.3119, -2.6566, -1.4285, -2.6106, -2.1554, -3.6947, -3.1582, -1.6397]], [[ 2.4730, -3.3498, -3.9465, -2.6898, -1.4371, -1.1951, -1.9466, -1.7989, -3.6939, -2.4140, -0.3827]]], [[[-0.3777, -5.7697, -5.0660, -6.2131, -5.9401, -5.4896, -6.2996, -5.2026, -2.9663, -2.3474, -3.6363]], [[ 3.0575, -1.5779, -0.8031, -2.7583, -0.5561, -0.8278, 0.4279, 0.5646, -0.1607, 0.0198, -1.8374]], [[ 6.7111, -4.6335, -4.5290, -3.3126, 1.7051, 0.9364, -2.0242, -2.6993, -1.9725, -1.2188, -0.5711]], [[ 0.0856, -3.2063, -2.9142, -3.3190, -2.0639, -1.7852, -1.1591, -0.8377, -1.3401, -1.8073, -2.5100]], [[ 0.7088, -3.3894, -3.2080, -3.4168, -3.3645, -3.7636, -2.8698, -4.3293, -4.6755, -3.8735, -3.8835]], [[ 0.6290, -0.5573, -0.4846, -0.7630, -0.7093, -4.5280, -1.7108, -0.7671, -1.0009, -1.9082, -2.4892]], [[ 1.4076, -2.2558, -2.2605, -2.9480, -2.9362, -1.8043, -1.9690, -1.9506, -1.5005, -2.0035, -2.4766]], [[ 3.3214, -2.2631, -2.6129, -3.4933, -1.0503, 0.1072, 0.5117, 1.1316, 1.2216, -0.1359, -0.5295]], [[-0.7461, -3.1679, -2.0614, -3.5642, -2.3327, -2.0054, -0.9277, -1.3188, -1.3170, -0.7606, -2.7007]], [[-0.0792, -0.9260, -0.8708, -2.7712, -2.8507, -2.5484, -1.2645, -1.9433, -0.4207, -0.9632, -2.7650]], [[ 4.3770, -2.1461, -3.1898, -3.3894, 0.4400, -1.8100, -3.1205, -2.0050, -1.3951, -1.2933, -1.5204]], [[ 3.0897, -3.4908, -2.9028, -1.0257, 1.0685, -0.6334, -2.9452, -3.2624, -2.6787, -1.4211, -0.3845]]], [[[-0.4830, -7.1938, -6.5216, -7.1353, -6.6047, -5.2219, -6.2626, -6.0377, -3.0071, -2.5910, -3.5133]], [[ 3.2534, -1.7673, -1.4753, -1.6640, -0.5076, -1.2705, -0.9390, -0.1896, -0.3415, -0.9806, -1.7820]], [[ 6.1825, -3.8487, -4.7500, -2.8619, -2.9841, -2.3662, -3.8003, -5.5386, -2.0393, -2.1847, -0.8504]], [[ 0.1664, -3.6892, -3.7415, -3.9248, -3.6022, -3.2078, -2.5079, -1.5918, -0.4667, -2.1469, -2.5533]], [[ 1.0018, -3.3893, -3.2475, -4.0533, -3.9466, -5.2575, -4.3082, -4.9321, -4.0903, -2.8458, -5.2640]], [[ 0.9043, -0.7802, -1.6556, -2.4062, -3.0644, -3.8148, -2.6982, -1.2955, 0.2286, -2.4133, -2.0017]], [[ 1.5769, -2.2677, -2.7968, -3.4452, -3.1321, -2.6278, -2.4701, -2.8733, -2.2085, -2.3656, -4.0412]], [[ 3.4626, -3.5313, -3.4517, -4.3608, -2.7646, -2.5119, -2.1361, -1.8870, -1.2962, -1.4426, -1.5183]], [[-0.5178, -4.2820, -4.2339, -5.6237, -4.0631, -3.7691, -2.3528, -3.1724, -2.2543, -2.9141, -3.5413]], [[ 0.3538, -1.0439, -1.1975, -2.8059, -3.1870, -3.2613, -2.7937, -2.6719, -1.2639, -1.6892, -2.7193]], [[ 3.8339, -2.9692, -2.6397, -0.1490, -2.5647, -3.9775, -3.9569, -3.6129, -0.9763, -1.9339, -0.8903]], [[ 3.8577, -3.4618, -2.2623, 3.3535, -1.2914, -2.0849, -3.7020, -3.6057, -2.8113, -0.1156, 1.6920]]], [[[-1.0587, -4.2332, -5.4076, -3.8173, -2.4271, -3.4010, -4.9139, -1.0966, -0.9302, -0.1549, -3.7901]], [[ 3.7306, -3.5904, -2.2196, -2.5972, -2.4801, -1.5288, 0.4414, 0.7051, 0.5024, 0.2188, -0.5250]], [[ 6.5709, -6.2125, -5.6582, -5.1226, -4.4636, -1.2904, -0.3160, 1.9870, 0.5589, -0.3270, 0.2074]], [[ 0.2538, -4.1633, -4.1110, -4.4590, -4.4907, -2.4591, -3.3713, -2.5208, -1.9880, -1.5074, -1.9545]], [[-0.0309, -3.3012, -3.9173, -3.6471, -3.3021, -3.7094, -3.4438, -0.9469, -1.0656, -1.6512, -3.8053]], [[ 1.0591, -2.7880, -2.8385, -2.5611, -2.0383, -4.4039, -2.6476, -2.1485, -1.6391, -3.2847, -2.8352]], [[ 1.5100, -2.8088, -2.6108, -3.4171, -3.2338, -2.5359, -2.4852, -2.5853, -1.6314, -2.8040, -2.7273]], [[ 2.6215, -2.6845, -3.4895, -3.4959, -3.0505, -1.3927, -1.0471, 0.3643, -0.2594, -0.5645, -0.7089]], [[-0.0872, -5.7826, -3.5949, -4.1554, -3.5669, -4.4707, -4.0013, -3.9102, -2.7734, -2.1443, -3.6907]], [[ 0.1822, -2.8168, -3.2272, -3.3440, -4.1967, -3.3866, -3.3981, -1.4179, -1.8380, -2.8407, -3.5391]], [[ 3.9674, -6.8475, -4.7419, -3.4312, -4.0603, -1.9148, -1.1031, 1.4336, 1.5903, -1.0396, -2.9839]], [[ 2.3736, -3.4181, -3.8864, -4.3010, -3.8854, -1.9722, -0.9740, 1.1203, -0.9265, -2.0625, -1.7344]]], [[[-0.6679, -5.5521, -6.2312, -5.6793, -3.7410, -5.0693, -5.6944, -2.9344, -0.5787, 0.3282, -2.2278]], [[ 4.1153, -3.4054, -1.8334, -3.0917, -3.6477, -3.0600, -1.1514, -0.9254, -2.2309, -1.2765, 0.3247]], [[ 6.2724, -5.4766, -6.2032, -7.0910, -7.0785, -2.6271, 0.0695, -1.7315, -3.3165, -0.8773, 1.1389]], [[ 0.4986, -4.9099, -4.6983, -5.3524, -5.0194, -3.2074, -3.1507, -3.1333, -2.2027, -2.7703, -3.0286]], [[ 0.3163, -3.1790, -3.2365, -3.0734, -3.6370, -3.9538, -3.2927, -2.5798, -1.4508, -2.0504, -4.2921]], [[ 1.6387, -4.4514, -3.1544, -3.0415, -3.2611, -3.4032, -1.8995, -2.9998, -3.8097, -2.5385, -2.5387]], [[ 1.6348, -3.6139, -3.7996, -3.8700, -3.6590, -2.2099, -2.0877, -3.0724, -3.5815, -2.9610, -3.0159]], [[ 2.3982, -4.3620, -4.9448, -5.0324, -4.3012, -3.0572, -1.1679, -0.9720, -1.2582, -2.0659, -1.4397]], [[ 0.2560, -4.6216, -2.9462, -3.3671, -3.3419, -3.1895, -2.5284, -3.7225, -4.1600, -3.8987, -3.3436]], [[ 0.3550, -3.1461, -3.3073, -3.6594, -4.4818, -3.8584, -3.8602, -3.6275, -1.1601, -2.4295, -2.8535]], [[ 4.1950, -8.2009, -3.4612, -4.5930, -5.4866, -1.1813, 0.7039, -0.4188, -1.9349, -3.2847, 0.0083]], [[ 2.6241, -3.5700, -5.0664, -4.2693, -5.4665, -2.6840, 1.1099, -0.7832, -4.7874, -4.1097, -3.0207]]]]) attn_weights tensor([[[[ 0.7932, -2.7499, -2.7488, -2.9246, -2.2401, -4.3212, -2.2179, -1.5923, -1.7501, -1.7090, -2.8960]], [[ 3.6653, -2.0911, -2.7285, -1.2788, -0.0768, 0.0330, -0.5439, -0.3650, -1.8150, -0.3379, 0.0836]], [[ 1.4934, -1.3332, -2.1766, -1.5433, -0.9356, -1.1593, -1.6461, -0.9802, -2.3748, -1.3921, -1.5701]], [[ 2.4590, -2.0364, -1.1144, -2.5426, -2.1951, 0.6766, 1.0694, -0.6567, -0.3786, -0.8599, -1.1626]], [[ 0.1411, -5.2321, -4.6295, -4.5567, -4.2256, -3.7432, -2.8819, -3.3843, -3.4251, -3.0806, -2.8351]], [[-1.3855, -3.7055, -3.4337, -2.3500, -3.1135, -3.0409, -3.3297, -1.2404, -1.4311, -0.7823, -2.3930]], [[ 1.9904, -3.1814, -3.0466, -4.1653, -2.6250, 0.2805, -0.0859, -1.1068, -2.6606, -3.4407, -1.7639]], [[-0.1559, -5.7075, -5.3098, -5.1381, -4.6803, -4.4027, -4.4703, -2.7982, -2.0911, -1.5743, -1.1811]], [[ 0.5039, -2.6792, -3.0275, -3.3843, -3.1916, 0.3672, -0.1687, -0.7076, -2.7474, -2.8813, -1.9331]], [[ 1.3128, -3.9332, -4.5684, -4.9393, -3.6092, -0.9995, -1.7461, -2.7565, -3.0762, -3.1048, -1.8910]], [[ 1.2555, -2.8006, -2.2151, -3.3438, -2.6818, -0.4157, -0.9939, -0.9185, -1.2865, -1.8562, -1.6884]], [[ 0.7536, -4.1658, -3.6610, -3.7694, -4.3055, -1.2409, -2.0589, -3.0877, -3.6568, -3.5687, -2.8273]]], [[[ 0.9729, -2.3469, -1.7007, -2.1346, -2.0335, -4.0601, -1.6557, -2.9782, -3.1408, -1.8204, -2.0441]], [[ 4.9405, -2.9317, -3.4958, -3.0002, 1.6395, 0.3952, -1.4928, -2.1920, -0.6739, -1.9041, -1.8237]], [[ 1.6738, -1.2547, -2.4453, -2.3102, -1.1526, -0.6569, -0.5955, -1.2473, -1.9491, -2.2739, -2.0184]], [[ 2.9661, -1.6337, -2.1301, -2.1916, -2.0103, -1.7865, -1.5075, -0.8538, -0.8891, -2.2764, -2.4888]], [[-0.6939, -2.8488, -2.4745, -4.1944, -3.6439, -3.0380, -2.2981, -3.1502, -1.8138, -1.9614, -3.7958]], [[-1.4655, -3.1780, -2.3808, -4.1446, -3.5627, -2.5431, -2.8375, -2.3982, -1.5172, -1.8073, -3.9660]], [[ 2.5666, -2.3498, -2.5829, -3.8909, -1.0481, -1.0506, -0.5809, -1.4779, -1.0671, -2.5122, -3.9912]], [[-0.6075, -5.6769, -4.1878, -6.4107, -5.0689, -3.4297, -3.3801, -3.9880, -3.0212, -2.0121, -4.5443]], [[ 0.2589, -2.0542, -2.2765, -3.0209, -2.2109, -1.1145, -0.9181, -0.2720, -0.5042, -1.9442, -2.6550]], [[ 0.8678, -3.1130, -2.9032, -3.5032, -2.7159, -1.5409, -0.9009, -1.8575, -2.1495, -2.4570, -3.1521]], [[ 1.1962, -3.0093, -3.0004, -2.8261, -0.8282, -2.1998, -1.7619, -0.8410, -0.3180, -1.9037, -1.8637]], [[ 1.2570, -2.8686, -3.9892, -3.5278, -3.9555, -2.1148, -2.1423, -2.7812, -3.7426, -4.5028, -4.2441]]], [[[ 1.1104, -3.2635, -2.5601, -2.6317, -2.3446, -3.0013, -2.0934, -2.9812, -3.3839, -2.8405, -2.4559]], [[ 5.4483, -2.0015, -3.7280, -0.7781, -1.8492, -1.8740, -2.9124, -3.2966, -2.2824, -1.6592, 0.2882]], [[ 2.8900, -1.6661, -3.0694, -0.5090, -0.9104, -1.5525, -2.4846, -2.5682, -1.5774, -3.0259, -2.7773]], [[ 3.0067, -3.1676, -3.3692, -3.7552, -3.5992, -3.9608, -3.4236, -3.7520, -3.3451, -4.1610, -3.2093]], [[ 0.4515, -4.5096, -4.2274, -5.1001, -5.3251, -4.9709, -3.8900, -3.7613, -3.3407, -1.9131, -3.1507]], [[-0.6420, -2.8285, -2.7482, -4.3247, -3.9246, -3.9424, -3.3522, -3.2162, -1.0325, -1.8235, -3.7572]], [[ 2.4964, -2.7089, -3.4670, -3.3886, -2.6827, -3.3844, -3.0762, -3.0294, -2.1734, -2.1129, -2.2518]], [[-0.6772, -5.6163, -6.5454, -8.7341, -7.3435, -5.6666, -6.3598, -5.6051, -5.0240, -3.8473, -3.4683]], [[ 0.4802, -3.0340, -3.4119, -3.7780, -3.1027, -2.4452, -2.1759, -2.1060, -1.4676, -3.2319, -3.2471]], [[ 0.9375, -2.9119, -2.6338, -3.4106, -3.4954, -2.4149, -1.3977, -2.8352, -2.0773, -1.8070, -2.9431]], [[ 1.0865, -3.0588, -3.5619, -3.1149, -2.2416, -2.9488, -3.4169, -2.3928, -1.4271, -2.6029, -2.4593]], [[ 1.2974, -2.8471, -4.4968, -3.4496, -4.7361, -3.5574, -4.1277, -2.9803, -3.1669, -4.1420, -4.4787]]], [[[ 1.4228, -3.2708, -4.0435, -3.5976, -3.3888, -3.4602, -2.4718, -1.7768, -3.0991, -3.5091, -2.2688]], [[ 2.4090, -3.1128, -2.3482, -2.5139, -1.5634, -0.4015, 0.7141, 2.3374, 1.7799, -1.7797, 0.2494]], [[ 2.0718, -0.2689, -1.4819, -0.9511, -0.4471, -1.7579, -2.5385, -0.4872, 0.2729, -2.0262, -2.3281]], [[ 2.1273, -2.4033, -2.2659, -2.3094, -1.5030, -0.8360, -0.8081, 0.4975, -0.2965, -2.9295, -1.8506]], [[-0.0480, -6.1835, -6.4141, -5.5217, -3.1758, -5.4838, -4.2430, -3.7598, -2.8404, -3.2294, -3.8257]], [[-1.4455, -4.1326, -4.3367, -3.9714, -3.6802, -4.0376, -4.5291, -2.3010, -2.7981, -1.9566, -3.6593]], [[ 2.5843, -3.0197, -3.4701, -3.8573, -2.6576, -2.1475, -0.9247, -0.2908, -0.8809, -3.9453, -0.6007]], [[-1.4347, -5.3101, -4.8954, -3.0385, -1.5437, -3.7264, -4.3576, -1.5118, 0.1507, -1.4232, -3.4045]], [[ 1.1586, -4.0382, -4.2277, -4.1375, -3.9096, -3.3322, -2.3776, -2.2597, -3.8160, -2.0918, -2.2102]], [[ 1.1806, -4.2837, -4.6986, -4.7614, -3.3665, -1.1085, -1.3249, -2.3415, -1.7730, -0.3859, -1.6457]], [[ 1.0936, -3.5670, -3.4846, -4.0411, -3.6409, -2.5236, -2.1559, -1.0340, -1.7625, -2.1401, -1.4325]], [[ 1.0661, -3.3569, -4.0160, -3.8977, -3.9195, -2.8045, -2.8023, -2.1906, -3.6733, -3.4358, -1.8415]]], [[[ 1.2888, -3.1894, -3.6225, -3.8360, -3.9441, -3.4407, -1.9959, -2.0504, -4.4575, -3.9738, -2.7944]], [[ 3.3048, -2.7530, -3.0567, -3.9755, -3.4136, -0.9076, 2.4383, 0.6904, -0.8640, -1.3312, -1.3971]], [[ 2.3993, -1.4247, -2.5465, -2.8136, -1.3043, -1.8076, -2.0401, -1.5924, -2.3863, -1.8825, -2.4013]], [[ 2.3103, -1.6963, -2.5583, -2.3962, -1.9393, -1.8810, -0.2141, 0.8389, 0.0367, -1.1581, -1.6495]], [[ 0.8354, -6.0744, -5.6272, -5.0494, -3.9290, -4.9851, -4.4242, -4.9310, -3.3831, -3.2000, -1.8648]], [[-1.0768, -3.1289, -3.8555, -3.5109, -3.0767, -3.7567, -3.4923, -1.9538, -0.1945, -1.0827, -4.0073]], [[ 2.5923, -3.2487, -4.7727, -5.9142, -4.1742, -0.8442, 0.4286, -1.6774, -3.8122, -3.3046, -3.3267]], [[-0.9269, -5.9058, -4.3983, -3.5294, -2.5325, -3.6825, -3.6054, -2.6663, -0.7890, 0.6647, -2.7195]], [[ 1.0600, -3.4144, -3.5779, -3.0928, -2.9848, -0.7932, -0.0935, -1.2388, -5.1325, -4.6277, -1.2646]], [[ 1.8335, -4.2464, -4.5589, -4.4582, -3.8773, -0.8755, -1.9104, -3.3390, -3.9129, -3.7367, -1.0700]], [[ 1.1083, -3.6785, -3.8412, -4.4644, -3.8008, -1.5535, -1.1422, -2.1009, -3.2193, -1.8480, -0.6081]], [[ 0.7718, -3.8118, -4.1409, -3.8897, -3.7785, -2.1234, -2.1434, -2.8142, -5.0160, -4.3505, -2.5493]]]]) attn_weights tensor([[[[ 2.5924, -2.5617, -1.0533, -1.1325, -2.7474, 1.7189, 2.1447, -0.9771, -1.6578, -1.0171, -0.4880]], [[ 2.6351, -2.0329, -2.7141, -2.6089, -1.6883, -1.7754, -0.7912, -2.2642, -2.4513, -2.2733, -0.8574]], [[ 2.1799, -3.3891, -2.5255, -3.6147, -3.8485, 1.2049, 0.4345, -2.0767, -3.1787, -3.2147, -2.4498]], [[-0.6404, -3.1035, -2.8154, -2.9345, -3.9852, -3.6516, -2.9570, -1.5870, -1.5113, -1.3620, -1.7212]], [[ 3.6446, -1.9372, -2.8488, -3.2769, -2.2689, 0.6128, 1.6519, -0.9556, -2.3818, -1.6220, -0.8162]], [[ 1.6128, -3.4561, -3.6567, -3.2475, -2.6709, -0.5964, -0.6068, -1.8797, -2.3430, -1.9908, -0.3374]], [[ 3.5754, -2.8826, -4.3054, -4.8832, -3.9336, 1.1518, 0.9566, -1.8972, -3.6072, -3.5266, -1.1887]], [[ 0.0837, -4.1510, -3.8680, -4.4549, -4.1111, -2.5258, -2.3988, -3.6532, -4.3164, -4.3318, -3.3033]], [[ 1.6401, -2.0498, -2.6505, -1.7813, -1.8645, 0.3976, -0.0927, -1.2448, -2.4460, -1.3459, -1.8219]], [[ 3.9203, -1.6190, -1.9771, -2.6257, -2.2628, 1.2481, 1.0796, -1.3012, -2.0896, -1.9997, 0.6545]], [[ 1.0018, -3.9771, -2.8328, -2.2602, -2.8523, -2.2855, -2.6542, -2.4920, -1.8604, -0.9880, -1.2048]], [[ 2.9751, -0.6370, -2.4252, -1.8893, -1.0522, -1.4102, -1.6754, -0.5536, -2.2707, -1.4014, -1.0252]]], [[[ 1.9617, -1.0035, -1.2203, -1.8547, -2.2858, 0.1617, 0.7347, -0.8288, -1.8925, -1.4526, -2.2360]], [[ 3.5721, -1.7182, -2.1449, -1.4638, 0.6836, -1.8327, -1.0192, -2.1650, -1.2592, -2.1898, -1.5985]], [[ 1.5718, -1.3732, -1.4969, -2.8700, -2.1071, -0.2768, -0.0358, -0.3090, -1.3811, -2.1355, -3.4657]], [[-1.1969, -2.7691, -2.3034, -4.3552, -5.1734, -2.5520, -1.7507, -2.3914, -1.7473, -1.6641, -3.5543]], [[ 3.3784, -2.5718, -3.5696, -3.6213, -2.5690, -2.6202, -1.2317, -2.6699, -3.8931, -4.6035, -4.5856]], [[ 1.9866, -3.0962, -3.1188, -3.1068, -2.5628, -1.9096, -2.3329, -3.1000, -3.1554, -3.1938, -3.3547]], [[ 3.9334, -3.4012, -3.3270, -2.9831, -0.8472, -0.0918, -0.1328, -3.2390, -2.7232, -2.3773, -2.3774]], [[ 0.5982, -3.0581, -4.0418, -3.9919, -2.5487, -2.6862, -2.2103, -2.6527, -2.8105, -3.9120, -3.8560]], [[ 1.6360, -2.6537, -2.9773, -3.2844, -2.6038, -0.5841, -0.6345, -2.0564, -2.1183, -2.8015, -2.7620]], [[ 4.7920, -2.3259, -2.1011, -1.3649, 0.6353, -0.1674, 0.4927, -2.3925, -2.0502, -2.0299, -1.8309]], [[ 0.2379, -3.0696, -1.1261, -3.5394, -2.9928, -2.2802, -1.4538, -1.5825, -0.0350, 0.4523, -1.9809]], [[ 3.8354, -1.3685, -2.7712, -0.6746, -0.0855, -1.6129, -1.5153, -3.1660, -1.6929, -2.9913, -0.8056]]], [[[ 2.7119, -3.0116, -2.4730, -2.7662, -2.5070, -1.8701, -1.0718, -1.8972, -2.7711, -2.3608, -3.4115]], [[ 4.4080, -1.2993, -3.1587, -1.7403, -1.0927, -3.3957, -3.6125, -3.1534, -1.3115, -2.2310, -2.1191]], [[ 3.0538, -3.6485, -3.3358, -4.4345, -3.3340, -3.9575, -3.1816, -2.9880, -3.4948, -3.4796, -5.3756]], [[-0.6669, -3.4697, -3.8066, -5.4081, -5.8625, -4.7183, -4.4157, -4.1828, -3.9340, -3.3106, -5.5885]], [[ 3.4892, -2.9303, -3.7366, -3.7551, -2.2785, -4.2203, -3.4386, -3.0726, -4.2038, -4.9832, -5.6775]], [[ 2.0441, -1.5887, -2.0660, -2.3599, -2.1011, -3.8392, -3.1587, -1.5048, -1.2315, -1.7704, -2.1493]], [[ 3.6856, -0.8360, -2.8437, -1.1208, -1.8871, -5.3982, -5.3825, -1.1817, -2.4199, -2.2201, -2.1870]], [[ 0.8039, -3.8411, -4.8789, -4.3995, -3.7053, -4.1980, -2.7897, -2.0137, -2.5086, -4.2018, -6.7795]], [[ 2.2289, -2.5083, -2.9574, -2.5119, -2.5529, -1.7354, -2.4832, -2.1766, -1.5263, -2.8648, -3.6920]], [[ 5.3177, -1.6726, -2.9466, -2.3638, -3.0587, -2.7188, -2.3961, -2.8543, -2.2758, -3.0906, -3.2539]], [[ 1.5371, -4.3737, -2.8384, -5.9172, -5.5621, -3.9786, -3.8744, -3.6293, -2.2719, -0.9190, -2.2079]], [[ 3.2929, -2.1037, -2.9752, 2.5217, -0.7110, -4.1153, -2.0156, -3.2340, -2.5717, -2.8880, -0.8251]]], [[[ 2.7295, -4.9410, -4.6352, -3.8380, -4.3033, -1.3096, 0.4228, -3.5746, -3.7716, -1.4189, -0.1574]], [[ 2.9207, -1.6555, -2.2435, -2.4559, -1.3465, -2.8423, -1.1307, 0.0267, -0.4768, -2.0074, -1.5339]], [[ 2.4656, -4.9932, -4.3072, -3.9808, -3.5916, -1.7349, -0.6501, -3.0609, -3.0174, -1.5339, -1.1751]], [[-1.0281, -2.7917, -4.0530, -2.6575, -3.0909, -3.4976, -4.1670, -1.8699, -1.7696, -1.7627, -4.1322]], [[ 2.6638, -2.1800, -3.7716, -3.9200, -3.5996, -1.3090, -0.8888, -1.4517, -2.2346, -2.4629, -1.7494]], [[ 1.7638, -3.7629, -4.2282, -3.7062, -3.3909, -3.0643, -2.7649, -1.9840, -2.4597, -3.2078, -2.5685]], [[ 3.3273, -2.8685, -3.3278, -3.3072, -3.0130, -0.0720, 0.6762, -0.0133, -1.3545, -1.6450, -0.3177]], [[ 0.4362, -3.5970, -4.1970, -4.5569, -3.6750, -4.0209, -4.0517, -3.5965, -3.4434, -4.8544, -4.3516]], [[ 2.4097, -3.9758, -3.7277, -2.8720, -3.5555, -2.3613, -2.3003, -2.7662, -3.5359, -2.4614, -2.2143]], [[ 4.0076, -1.4493, -1.8360, -1.7541, -0.7804, 0.7485, 2.1423, 0.8947, 0.4116, -0.5830, 0.8133]], [[ 0.0829, -3.9929, -3.8118, -2.5046, -1.0972, -2.1791, -1.6413, -1.2435, 0.1968, -0.8540, -1.9623]], [[ 3.6267, -1.6848, -2.8321, -3.0910, -2.1178, -3.2734, -2.7860, 0.6415, -0.2531, -3.0268, -2.6552]]], [[[ 2.7693, -4.2311, -3.6223, -3.4020, -3.9365, -0.5389, 1.7929, -2.9703, -4.4609, -3.6109, 1.1502]], [[ 3.9535, -2.8063, -4.6528, -4.5456, -4.4469, -3.4758, -0.0563, -2.4668, -2.3540, -1.7413, -1.2713]], [[ 2.7482, -4.0645, -3.2153, -3.2034, -3.0249, -0.2038, 0.1755, -2.6311, -3.2817, -2.3373, 0.5851]], [[-0.7875, -3.7471, -4.7266, -3.6112, -2.7089, -3.7403, -3.6923, -1.9920, -1.0689, -0.3730, -3.3009]], [[ 3.4839, -2.4870, -3.9502, -4.3050, -4.1312, -2.2043, -0.4641, -2.3101, -2.8434, -2.1252, -1.4154]], [[ 2.0605, -3.3360, -4.1160, -3.9179, -3.0294, -2.3557, -1.7497, -2.3715, -2.2939, -0.8503, -1.6858]], [[ 3.8295, -3.5080, -3.9972, -4.3363, -4.5169, 0.3570, 2.7257, -1.6250, -2.5922, -2.1847, -0.4083]], [[ 0.4945, -3.7303, -3.8413, -4.7729, -4.2315, -3.4906, -3.1902, -3.6464, -5.6411, -5.0426, -4.2814]], [[ 2.4826, -3.0706, -2.8363, -2.2641, -2.8317, -0.5787, -0.9892, -2.9086, -3.5322, -3.4984, 0.3316]], [[ 5.1073, -2.1889, -2.2693, -2.4730, -2.1043, 1.3784, 4.0193, -0.8209, -0.7598, 0.1364, 1.9681]], [[ 1.2388, -5.1270, -4.7803, -4.6439, -2.3394, -3.5349, -3.8601, -4.9216, -1.6898, -0.5844, -1.9455]], [[ 3.9395, -1.3343, -3.6645, -3.0456, -2.6760, -2.8657, -1.7756, -0.0131, -3.0392, -2.0811, -3.1469]]]]) attn_weights tensor([[[[ 2.5428e+00, -3.1774e+00, -4.1538e+00, -3.6270e+00, -3.8792e+00, 2.1749e+00, 1.2425e+00, -2.8253e+00, -4.2946e+00, -3.4257e+00, -1.7794e-01]], [[ 3.6941e+00, -2.0470e+00, -3.4762e+00, -2.3872e+00, -2.6953e+00, 1.3783e+00, 1.3205e-01, -1.9966e+00, -3.4097e+00, -1.3760e+00, 3.9020e-01]], [[ 2.6910e+00, -1.4508e+00, -2.5689e+00, -3.2570e+00, -2.9144e+00, -3.2066e-01, -3.4461e-01, -1.4660e+00, -2.8943e+00, -2.7387e+00, -2.9687e-01]], [[ 2.1122e+00, -6.5155e-01, -3.5256e+00, -3.4559e+00, -2.6695e+00, 1.9248e+00, 3.8979e-02, -4.4934e-01, -3.0994e+00, -2.5412e+00, -8.9836e-01]], [[ 2.2927e+00, 3.2455e-01, -1.3688e+00, -1.5178e+00, -9.4667e-01, 3.7275e-01, 1.3623e+00, 9.1177e-01, -9.7752e-01, -8.7810e-01, -5.4995e-01]], [[ 1.1468e+00, -1.7708e+00, -2.8194e+00, -2.6247e+00, -2.6907e+00, -2.0917e+00, -3.0176e+00, -1.6454e+00, -1.7660e+00, -1.5108e+00, -1.6690e+00]], [[ 2.8006e+00, -2.5915e+00, -3.1127e+00, -2.9246e+00, -3.5231e+00, 1.1303e+00, 5.9152e-01, -2.4481e+00, -3.7834e+00, -3.2408e+00, -7.9439e-01]], [[ 1.7991e+00, -1.4212e+00, -2.3487e+00, -2.8745e+00, -1.6782e+00, 1.7889e+00, 2.4748e-01, 1.2917e-02, -2.3395e+00, -2.3177e+00, 3.3034e-01]], [[ 3.1534e+00, -1.8411e+00, -2.4701e+00, -3.1110e+00, -1.2946e+00, -3.1360e+00, -3.1101e+00, -8.2964e-01, -1.6482e+00, -1.6550e+00, 4.5977e-01]], [[ 2.0664e-01, -2.9411e+00, -2.9615e+00, -3.0298e+00, -3.0998e+00, -1.2697e+00, -1.2783e+00, -1.3755e+00, -2.5527e+00, -2.4755e+00, -6.3138e-01]], [[ 3.0120e+00, -1.3862e+00, -1.9446e+00, -1.8016e+00, -1.8029e+00, 1.3747e+00, -5.0908e-02, -1.3204e+00, -2.2929e+00, -1.6728e+00, -6.2636e-01]], [[ 3.8433e+00, -8.6747e-01, -6.3309e-01, -2.4173e+00, -1.8858e+00, 2.4636e+00, 2.5765e+00, 4.3791e-01, -1.8845e-01, -1.1168e+00, 3.2635e+00]]], [[[ 2.6951e+00, -3.1060e+00, -3.6152e+00, -2.9706e+00, -3.0482e+00, 3.0209e-01, -4.3127e-01, -2.9426e+00, -3.3000e+00, -3.8899e+00, -3.3592e+00]], [[ 4.1780e+00, -1.0440e+00, -1.9526e+00, -8.2827e-01, -5.3722e-01, 7.6520e-01, -2.6241e-01, -2.3767e+00, -2.3028e+00, -2.5603e+00, -1.4518e+00]], [[ 3.2119e+00, -5.0897e-01, -1.1808e+00, -9.3032e-01, -1.5318e-01, 5.1661e-01, 1.1672e+00, -4.1358e-01, -6.2362e-01, -1.3508e+00, -9.3414e-01]], [[ 2.9501e+00, 2.1215e-01, -1.3894e+00, -6.5412e-01, -2.0833e-01, 3.4830e-01, -4.2328e-02, -1.0485e+00, -1.2060e+00, -1.6561e+00, -9.2579e-01]], [[ 2.2296e+00, -3.8182e-01, -8.2736e-02, -5.2492e-01, 1.2362e-01, -6.6883e-01, 7.8925e-01, -7.6722e-01, -4.5452e-02, -4.7294e-02, -3.5974e-01]], [[ 1.2167e+00, -1.5376e+00, -1.6515e+00, -3.2045e+00, -2.2930e+00, -1.7869e+00, -2.1840e+00, -1.6060e+00, -1.0223e+00, -1.0360e+00, -3.0318e+00]], [[ 3.1086e+00, -1.7396e+00, -2.2672e+00, -1.7085e+00, -9.4103e-01, -9.9017e-02, 8.3074e-01, -1.7449e+00, -1.7921e+00, -2.2243e+00, -1.8903e+00]], [[ 1.9435e+00, -1.9647e+00, -1.5628e+00, -1.6918e+00, -1.2713e+00, -1.5406e+00, -2.4885e+00, -1.4680e+00, -1.0759e+00, -1.3845e+00, -1.4879e+00]], [[ 3.5396e+00, -2.3050e+00, -2.7306e+00, -2.3076e+00, 8.5208e-01, -1.2165e+00, -1.2820e+00, -1.9539e+00, -1.2311e+00, -2.6110e+00, -2.1497e+00]], [[ 9.7385e-01, -3.2120e+00, -2.6815e+00, -2.3822e+00, -2.1606e+00, -1.5700e+00, -1.0816e+00, -1.7015e+00, -2.3271e+00, -1.9520e+00, -1.9214e+00]], [[ 3.4603e+00, -2.0689e+00, -1.8335e+00, -1.3347e+00, -1.6549e+00, -7.1989e-01, -8.9695e-01, -2.1359e+00, -2.2715e+00, -2.5019e+00, -1.9891e+00]], [[ 4.5423e+00, 6.8114e-01, 2.4465e+00, -1.9987e-01, 7.7880e-01, 1.2574e+00, 1.5136e+00, 1.9286e+00, 1.4435e+00, 2.5156e+00, 7.6687e-02]]], [[[ 2.2968e+00, -3.8970e+00, -5.6527e+00, -4.0842e+00, -4.5258e+00, -1.1305e+00, -2.3346e+00, -4.7223e+00, -4.9596e+00, -5.4026e+00, -3.6177e+00]], [[ 3.4554e+00, -2.2952e+00, -1.4860e+00, 1.6125e-01, -2.0395e+00, -2.0039e+00, -2.1014e+00, -1.7530e+00, -2.6172e+00, -1.1228e+00, -5.2788e-01]], [[ 2.8326e+00, -9.2152e-01, -2.0841e+00, -1.2942e+00, -1.8703e+00, -3.5623e+00, -2.7173e+00, -2.6481e+00, -2.1255e+00, -2.6533e+00, -5.1501e-01]], [[ 2.9173e+00, -1.8304e+00, -3.3172e+00, -3.3047e+00, -2.4755e+00, -1.4065e+00, -1.5641e+00, -1.7777e+00, -1.9040e+00, -2.3463e+00, -2.3207e+00]], [[ 3.3177e+00, 5.8552e-01, -2.6627e+00, -2.1428e+00, -1.9510e+00, -3.6370e+00, -2.1399e+00, -5.1368e-01, -1.0328e+00, -2.5932e+00, -1.2405e-01]], [[ 2.1517e+00, -2.8343e+00, -1.6700e+00, -4.4109e+00, -3.9720e+00, -3.5802e+00, -4.4066e+00, -2.4212e+00, -2.9819e+00, -1.3654e+00, -4.1109e+00]], [[ 3.6355e+00, -4.3301e+00, -4.7642e+00, -3.4258e+00, -5.3664e+00, -1.5807e+00, -1.5963e+00, -4.8100e+00, -4.5710e+00, -5.0589e+00, -3.1046e+00]], [[ 5.0094e+00, -2.3607e+00, -3.3227e+00, -2.9877e+00, -2.9614e+00, -3.8692e+00, -4.4493e+00, -2.4603e+00, -2.0653e+00, -3.7964e+00, -3.5015e+00]], [[ 3.0877e+00, -2.3892e+00, -4.0349e+00, -2.7496e+00, -3.2531e+00, -3.0774e+00, -3.6286e+00, -2.7275e+00, -2.8840e+00, -3.4782e+00, -2.6297e+00]], [[ 1.5204e+00, -5.5855e+00, -3.7199e+00, -4.1768e+00, -4.3786e+00, -3.3215e+00, -3.3294e+00, -4.7463e+00, -5.2769e+00, -2.6300e+00, -3.2417e+00]], [[ 2.8101e+00, -2.5651e+00, -2.9011e+00, -2.2470e+00, -3.0977e+00, -4.0278e+00, -4.2512e+00, -3.0270e+00, -2.8719e+00, -2.6796e+00, -2.7888e+00]], [[ 4.7928e+00, -1.7397e+00, -2.0605e+00, -3.4888e+00, -2.6413e+00, -3.7557e+00, -2.4628e+00, -1.5457e+00, -2.1703e+00, -2.6550e+00, -2.6347e+00]]], [[[ 3.0906e+00, -3.6384e+00, -4.4425e+00, -4.2234e+00, -4.7745e+00, -6.5656e-01, -2.4410e-01, -2.7279e+00, -3.5799e+00, -8.5946e-01, -7.7273e-01]], [[ 3.7970e+00, -1.4612e+00, -2.2704e+00, -1.2499e+00, -1.2992e+00, 3.3986e-01, 9.0473e-01, -1.2805e-01, 3.4746e-01, 3.4347e-02, -2.9973e-01]], [[ 2.6952e+00, -3.1508e-01, -2.3464e+00, -2.9748e+00, -2.1853e+00, -8.4640e-01, -1.7059e-01, -9.7201e-02, -4.6900e-01, -1.5236e+00, -6.1609e-01]], [[ 2.4663e+00, 1.1491e+00, -2.2112e+00, -2.1808e+00, -1.3661e+00, -1.9823e-01, -1.0631e+00, 1.4810e+00, -1.1421e+00, -2.1536e+00, -1.6298e+00]], [[ 2.1446e+00, -1.0735e-01, -3.4225e+00, -2.2163e+00, -1.8850e+00, -4.3160e+00, -3.1123e+00, -4.4936e-01, -1.2920e+00, -3.3242e+00, -3.4366e+00]], [[-8.2987e-02, -1.7030e+00, -2.0026e+00, -1.1064e+00, -9.1445e-01, -1.3632e+00, -9.7980e-01, -4.6966e-01, -2.0004e-01, -1.3384e+00, -1.8583e+00]], [[ 3.2894e+00, -3.7209e+00, -3.4425e+00, -3.3014e+00, -3.2619e+00, -5.6604e-01, 6.5311e-01, -2.1595e+00, -2.2030e+00, -8.4077e-01, 1.2366e-01]], [[ 2.8216e+00, -1.2059e+00, -1.5567e+00, -2.0068e+00, -9.9088e-01, -1.7211e+00, -4.1772e-01, 6.6856e-01, -3.7551e-01, -3.4204e+00, -4.2071e-01]], [[ 3.4577e+00, -1.0459e+00, -2.0496e+00, -2.3855e+00, -5.6694e-01, -2.0416e+00, -8.3476e-01, 2.6550e-01, 1.4680e-01, -2.8600e+00, -1.7513e+00]], [[ 5.2106e-02, -4.0774e+00, -4.0994e+00, -4.4146e+00, -2.5345e+00, -8.8014e-01, -9.0830e-01, -2.3065e+00, -1.1722e+00, -5.0309e-01, -1.4751e+00]], [[ 3.5480e+00, -2.6518e+00, -2.2294e+00, -2.6729e+00, -2.0879e+00, -1.5038e-01, -4.8880e-02, -1.8831e+00, -1.0039e+00, -9.5338e-01, -8.7308e-01]], [[ 5.0608e+00, -1.7328e+00, 2.7262e-01, -5.8744e-01, -7.2365e-02, 1.3932e+00, 2.9277e+00, 3.9730e-01, 1.2246e+00, 8.2962e-02, 1.8672e+00]]], [[[ 3.3897e+00, -3.4068e+00, -4.1994e+00, -4.0532e+00, -4.0097e+00, 1.8279e-01, 1.4880e+00, -2.2448e+00, -3.4580e+00, -3.2215e+00, -5.5127e-01]], [[ 4.5734e+00, -3.4425e+00, -3.5064e+00, -3.1938e+00, -3.6198e+00, 5.2706e-01, 1.4646e+00, -1.8995e+00, -5.6310e-01, -5.7390e-02, 4.6800e-01]], [[ 3.9827e+00, -1.4787e+00, -3.5948e+00, -4.4208e+00, -3.7232e+00, -1.2006e+00, 3.5251e-01, -1.8256e+00, -2.7079e+00, -2.4041e+00, -1.5251e+00]], [[ 3.3319e+00, -5.5122e-01, -3.8382e+00, -3.4273e+00, -3.1333e+00, 2.2531e-01, -1.7054e-01, 4.8581e-03, -2.1839e+00, -1.5638e+00, -1.0407e+00]], [[ 3.0317e+00, -1.5564e+00, -4.3798e+00, -3.4095e+00, -2.5590e+00, -2.7792e+00, -1.4865e+00, -1.8628e+00, -3.2424e+00, -2.5334e+00, -1.2160e+00]], [[ 1.3923e+00, -3.1387e+00, -2.5800e+00, -2.8502e+00, -2.0939e+00, -2.7546e+00, -2.8897e+00, -2.9900e+00, -1.1450e+00, -1.8892e+00, -2.7502e+00]], [[ 3.5696e+00, -4.3830e+00, -4.6094e+00, -3.4689e+00, -3.2833e+00, 1.6148e-01, 1.9497e+00, -2.6088e+00, -2.6121e+00, -2.2704e+00, -3.0351e-01]], [[ 2.7291e+00, -1.9722e+00, -2.3507e+00, -2.9151e+00, -2.3932e+00, -2.9773e-01, 1.6769e+00, -5.1570e-01, -1.9283e+00, -1.1730e+00, -2.1334e-01]], [[ 3.9477e+00, -7.9926e-01, -2.3827e+00, -2.9477e+00, -1.9254e+00, -1.3221e+00, -3.5375e-02, 3.7619e-01, -1.7086e-01, 5.8221e-01, -1.7425e-01]], [[ 1.2394e+00, -4.2861e+00, -4.1438e+00, -5.0000e+00, -2.8681e+00, -2.1784e+00, -2.1790e+00, -3.5269e+00, -2.8435e+00, -1.8014e+00, -1.9747e+00]], [[ 3.7656e+00, -1.2360e+00, -1.6898e+00, -1.4548e+00, -1.5771e+00, 1.8814e-01, 1.3120e+00, -4.3068e-01, -9.2146e-01, 2.4140e-02, -4.6534e-01]], [[ 4.9295e+00, -1.2941e+00, -5.1057e-01, -4.3359e-01, -3.2745e-01, 2.0529e+00, 4.7139e+00, 1.2084e+00, 1.9920e+00, 2.5596e+00, 1.3477e+00]]]]) attn_weights tensor([[[[ 1.7117e+00, 1.3163e+00, -6.8311e-02, 2.5348e-01, 8.3976e-01, 7.4721e-01, 4.3954e-01, 1.0993e+00, 1.4713e-02, 2.0474e-01, 1.1638e+00]], [[ 3.5721e+00, -9.9471e-01, -1.6557e+00, -1.6798e+00, -1.2513e-01, -1.2685e-01, 3.4067e-01, 8.0802e-02, -1.3683e+00, -1.2295e+00, 8.4783e-01]], [[ 2.7248e+00, -5.2969e-01, -2.0102e+00, -2.1180e+00, -1.5280e+00, 6.2294e-01, 6.1010e-01, 3.0454e-01, -1.9828e+00, -1.5862e+00, -3.3271e-02]], [[ 1.3754e+00, 4.9861e-01, -1.1005e+00, -1.1232e+00, 2.8799e-01, -1.6683e-01, -9.8415e-02, 6.9443e-02, -1.6797e+00, -1.9801e+00, -1.5212e+00]], [[ 2.2045e+00, -7.1010e-01, -1.2563e+00, -1.4788e+00, -9.9288e-01, -7.7132e-01, -1.9661e+00, -7.0437e-01, -1.2620e+00, -1.3133e+00, -2.1177e-01]], [[ 4.0335e+00, -1.6338e-01, -5.8054e-01, -1.3156e+00, -1.4025e+00, 1.6558e+00, 3.4265e+00, 9.6236e-02, -7.8585e-01, -1.5437e+00, 4.5478e-01]], [[ 3.1324e+00, -1.6603e+00, -2.3500e+00, -1.8128e+00, -1.6783e+00, -3.3505e-01, -1.4957e+00, -1.3810e+00, -2.4126e+00, -2.0495e+00, -1.0967e+00]], [[ 3.5680e+00, 6.6192e-01, -9.0993e-01, -7.4807e-01, -1.1264e-01, 1.7804e+00, 3.4262e-01, 1.0228e+00, -4.0775e-01, -6.2227e-01, 1.0790e+00]], [[-3.2305e+00, 3.6959e+00, 3.9505e+00, 3.8462e+00, 2.6389e+00, 3.4924e+00, 3.2892e+00, 4.2462e+00, 4.8352e+00, 4.8208e+00, 3.7451e+00]], [[ 3.7436e+00, -1.3679e+00, -3.2171e+00, -3.1235e+00, -2.6583e+00, 1.2069e+00, 8.1808e-01, -1.2375e+00, -3.5885e+00, -2.9723e+00, -2.9773e-01]], [[ 2.8330e+00, 4.8368e-01, -5.8059e-01, -8.5834e-01, -6.9349e-01, 2.9326e+00, 1.4409e+00, 1.3557e+00, -7.5730e-01, -5.1706e-01, 2.0629e+00]], [[ 3.8777e+00, 7.0559e-01, -1.2318e+00, -8.5181e-01, 8.4126e-01, 2.2096e+00, 8.0921e-01, 8.1290e-01, -1.5551e+00, -1.3592e+00, 1.3248e+00]]], [[[ 1.3953e+00, 1.0859e+00, 9.3119e-01, 7.0835e-01, 1.2171e+00, 5.3843e-01, 7.7694e-01, 6.6472e-01, 1.1206e+00, 1.1725e+00, 6.6804e-01]], [[ 3.9819e+00, 4.2184e-01, -3.1654e-02, -9.4113e-02, 1.0015e+00, 7.6235e-02, 3.0978e-01, 5.4515e-01, 3.7226e-01, -3.2008e-01, -3.7368e-01]], [[ 3.2205e+00, -5.4403e-01, -1.3304e+00, -1.6489e+00, -1.0755e+00, 1.5758e-01, -6.1933e-01, -9.4819e-01, -1.1290e+00, -1.8859e+00, -1.8069e+00]], [[ 1.3697e+00, -1.1526e-01, 2.2666e-03, -1.3096e+00, -1.5506e+00, -1.3054e-01, -1.8209e-01, 2.6398e-02, -3.9612e-01, -4.2690e-01, -1.4983e+00]], [[ 2.0047e+00, -8.6196e-01, -1.6433e+00, -1.0511e+00, -3.5059e-01, -9.2308e-01, -1.1376e+00, -5.6400e-01, -3.6215e-01, -1.8426e+00, -1.0668e+00]], [[ 4.4690e+00, 5.4881e-01, 1.9126e-01, -1.0155e+00, 1.4628e+00, 4.0190e-01, 1.7027e+00, 8.2420e-01, 6.3095e-01, 3.4365e-01, -1.2267e+00]], [[ 3.4537e+00, -1.4271e+00, -1.5545e+00, -1.3951e+00, -5.7153e-01, 2.8185e-01, 4.0301e-02, -1.1441e+00, -1.3623e+00, -2.0969e+00, -1.5566e+00]], [[ 4.1606e+00, 2.5564e-01, -1.6241e+00, -1.1423e+00, 5.2640e-01, 1.5585e+00, 3.1447e-01, -2.5996e-01, -6.6029e-01, -2.5267e+00, -2.0485e+00]], [[-3.7766e+00, 3.1124e+00, 4.3460e+00, 3.2486e+00, 2.7391e+00, 2.8049e+00, 3.0353e+00, 3.1122e+00, 3.4777e+00, 4.1223e+00, 3.6306e+00]], [[ 4.4956e+00, -1.6764e-02, -1.2529e-01, -2.4544e-01, 3.5918e-01, -7.6891e-01, 3.5653e-01, 2.5888e-01, 5.6398e-01, -2.4895e-02, 5.5953e-02]], [[ 2.8483e+00, 1.8813e-02, 1.3970e+00, 3.7144e-01, -6.3458e-02, 3.8046e-01, -2.0433e-02, 2.9317e-01, 5.6021e-01, 1.1665e+00, 1.6527e-01]], [[ 3.3063e+00, -5.3810e-01, 1.1941e+00, 5.1894e-01, -4.0295e-03, 1.4303e+00, 1.4188e+00, -1.9588e-01, 5.0695e-01, 1.6950e+00, 6.4561e-01]]], [[[ 2.7992e+00, -1.6882e+00, -1.8036e+00, -2.2699e+00, -2.0559e+00, -1.1267e+00, -1.2198e+00, -2.2323e+00, -2.4608e+00, -2.1363e+00, 2.1970e+00]], [[ 3.8404e+00, -1.5136e+00, -9.7609e-01, -3.2635e-01, -1.7589e+00, -2.7528e+00, -1.3183e+00, -9.5905e-01, -1.1781e+00, -1.2197e+00, -2.0507e+00]], [[ 4.1037e+00, -4.8415e-01, -1.7596e+00, -1.1590e+00, -2.5315e+00, -1.8969e+00, -1.1467e+00, -1.6719e+00, -2.2089e+00, -2.5829e+00, -1.1830e+00]], [[ 3.3727e+00, -3.5478e+00, -3.8292e+00, -4.5060e+00, -3.2210e+00, -4.5007e+00, -3.8107e+00, -2.3207e+00, -4.1422e+00, -3.9868e+00, -2.4931e+00]], [[ 3.1056e+00, -1.9150e-01, -7.1239e-01, -8.1103e-01, -8.5826e-01, -3.1293e+00, -3.4676e+00, -1.3675e+00, -1.6258e+00, -1.3777e+00, -1.6910e+00]], [[ 4.3110e+00, -7.4882e-01, -7.5514e-01, 4.2453e-01, -8.9276e-01, -7.0662e-01, 5.2261e-01, -1.4301e+00, -1.4480e+00, -1.8046e+00, -1.2217e+00]], [[ 3.0986e+00, -1.8315e+00, -1.5751e+00, -1.3024e+00, -2.4934e+00, -2.3258e+00, -2.5141e+00, -3.2297e+00, -2.9602e+00, -2.5682e+00, -1.3285e+00]], [[ 4.3523e+00, 1.3388e-01, -3.5383e-02, -1.1077e+00, -1.4200e+00, -1.9341e+00, -1.4380e+00, -1.0140e+00, -1.8413e+00, -9.7309e-01, 3.0942e-01]], [[ 1.0727e+00, 8.0018e+00, 9.6364e+00, 7.0624e+00, 6.6186e+00, 7.7271e+00, 9.0987e+00, 1.0042e+01, 9.0004e+00, 1.0383e+01, 1.2220e+01]], [[ 3.3746e+00, -4.9130e-01, -1.8372e+00, -1.6254e+00, -1.7446e+00, -1.0405e+00, -1.2889e+00, -1.8386e+00, -1.5434e+00, -2.7128e+00, -1.2351e+00]], [[ 6.3259e+00, 2.4860e+00, 2.8951e+00, 1.8534e+00, 2.1138e+00, -2.4797e+00, -1.6804e+00, 2.1688e+00, 1.9315e+00, 2.3129e+00, 9.2623e-01]], [[ 7.5151e+00, -1.2005e+00, -2.0441e+00, -1.9357e+00, 6.1214e-02, -4.7785e-02, -2.5891e+00, -4.5732e+00, -2.2227e+00, -2.9275e+00, -3.8153e+01]]], [[[ 1.2588e+00, 1.9719e+00, 7.9437e-02, 5.1797e-01, 1.2469e+00, 9.6878e-01, 6.1558e-01, 1.4205e+00, 8.4090e-01, -2.7343e-02, 9.7413e-01]], [[ 3.9022e+00, -2.7586e-01, -6.2503e-01, 1.5864e-01, 1.1716e+00, -2.9387e-01, 8.5613e-01, 9.0465e-01, 1.3338e+00, -7.4068e-01, 3.8792e-01]], [[ 3.4478e+00, 1.8933e-02, -1.7133e+00, -1.9562e+00, -1.4842e+00, 3.8585e-02, 5.1573e-01, 5.5231e-01, -7.8616e-01, -7.6951e-02, 5.9503e-02]], [[ 1.3890e+00, -1.2633e+00, -2.4555e+00, -2.3301e+00, -1.1914e+00, -9.4993e-01, -9.7303e-01, -4.8533e-01, -8.8430e-01, -6.7416e-01, -1.3977e+00]], [[ 1.8382e+00, -5.2004e-01, -7.7667e-01, -1.4638e+00, -8.5146e-01, -2.0913e+00, -2.3093e+00, -4.8687e-01, -5.1063e-01, -1.8218e+00, -2.2399e+00]], [[ 3.9906e+00, 7.6634e-01, -1.0631e+00, 2.7323e-01, 5.7583e-01, 3.2657e-01, 2.6709e+00, 1.8594e+00, 1.1500e+00, -4.6171e-01, 1.9505e+00]], [[ 3.3395e+00, -1.6576e+00, -2.4282e+00, -1.3110e+00, -1.4413e+00, -7.7186e-01, -6.9563e-01, -9.2078e-01, -7.0796e-01, -1.1999e+00, -1.2738e+00]], [[ 3.6979e+00, 1.2920e+00, -3.3144e-01, 1.5493e-01, 4.2189e-01, 1.4723e+00, 1.4477e+00, 1.5310e+00, 8.2710e-01, 3.6312e-01, 9.0691e-01]], [[-7.6636e+00, 1.7005e+00, 1.1262e+00, 1.1211e+00, 1.3504e+00, 2.9023e+00, 2.6390e+00, 1.9059e+00, 5.1334e-01, 1.2067e+00, 2.1546e+00]], [[ 4.1418e+00, -5.3975e-01, -1.3097e+00, -9.7117e-01, -6.4609e-01, 2.4499e-01, 1.6050e+00, 1.0566e+00, 5.0648e-01, 1.2401e-01, 4.7375e-01]], [[ 3.0164e+00, 3.9177e-01, -1.1311e+00, -4.5151e-01, 4.3244e-01, 7.3767e-01, 1.1080e+00, 1.7032e+00, 1.0980e+00, 5.8877e-01, 1.2032e+00]], [[ 2.6136e+00, 1.5574e+00, -6.4039e-01, -1.6621e-01, 2.3023e-01, 6.3827e-01, 5.6048e-01, 2.3406e+00, 2.7246e-01, 2.7975e-01, 1.1582e-01]]], [[[ 2.3926e+00, -4.4802e-01, -2.1337e+00, -8.8440e-01, -1.0787e+00, 2.9100e-01, -3.1161e-01, -5.7295e-01, -1.2406e+00, -8.9496e-01, -3.3677e-01]], [[ 4.2576e+00, -1.3607e+00, -1.9635e+00, -1.7639e+00, -1.0527e+00, -1.1975e+00, 9.5381e-01, -6.2867e-01, -6.9737e-01, -1.1888e+00, -8.9781e-01]], [[ 3.6958e+00, -2.9450e-01, -1.5299e+00, -2.2424e+00, -1.6107e+00, -5.7835e-01, 1.3957e+00, 1.4393e-02, -1.5115e+00, -1.5966e+00, -9.9411e-01]], [[ 1.9465e+00, -2.4966e+00, -2.9110e+00, -3.2020e+00, -1.8857e+00, -1.2623e+00, -1.2177e+00, -1.5099e+00, -3.5471e+00, -2.3543e+00, -1.2716e+00]], [[ 2.4263e+00, -9.3421e-01, -1.7254e+00, -1.7147e+00, -1.6538e+00, -1.3755e+00, -7.8605e-01, -9.3457e-01, -1.2461e+00, -1.6439e+00, -1.6268e+00]], [[ 4.2507e+00, -5.8296e-01, -1.5662e+00, -4.6984e-01, -6.5384e-01, 7.1866e-02, 3.3505e+00, 3.4714e-02, -1.9953e-01, -6.4860e-01, 2.4122e-01]], [[ 3.5944e+00, -1.7700e+00, -2.7781e+00, -1.6262e+00, -1.6965e+00, -8.5649e-01, 3.5839e-01, -1.0792e+00, -8.2707e-01, -1.4568e+00, -1.4559e+00]], [[ 4.6647e+00, 3.7664e-01, 6.7858e-02, -1.2847e+00, -5.6966e-01, 1.3257e+00, 2.0011e+00, 3.7464e-01, -2.3509e-01, -1.2852e-01, 9.1058e-01]], [[-2.5301e+00, 1.1337e+00, 1.7146e+00, 8.7563e-01, 8.6604e-01, 2.3315e+00, 2.9337e+00, 1.2492e+00, 7.9293e-01, -5.2288e-02, 1.0590e+00]], [[ 4.4539e+00, -1.2304e+00, -2.4893e+00, -2.7310e+00, -2.0826e+00, 3.5482e-02, 2.0206e+00, -5.9002e-01, -2.3092e-01, -4.8425e-01, 2.5086e-01]], [[ 3.0678e+00, -1.0666e+00, -1.9053e+00, -1.9465e+00, -1.3266e+00, 9.6002e-01, 1.9442e+00, 1.4188e-02, -1.8412e-01, 4.6637e-01, 1.0076e+00]], [[ 3.3218e+00, -1.3904e-01, -1.8931e+00, -2.1664e+00, -5.9289e-01, 1.0096e+00, 6.6594e-01, 3.4737e-01, -1.2304e+00, -4.4745e-01, 5.8080e-01]]]]) attn_weights tensor([[[[-9.1344e-01, -3.1558e+00, -1.9875e+00, -1.9361e+00, -3.5518e+00, -2.3624e+00, -2.2157e+00, -3.3045e+00, -1.8538e+00, -1.6673e+00, -1.4524e+00, -3.3509e+00]], [[-9.5989e-01, -3.9004e-01, -9.4804e-01, -3.1085e+00, 5.4493e+00, -3.5950e+00, -3.6807e+00, -1.3085e+00, -1.6881e+00, -3.7017e+00, -3.2120e+00, 5.4600e+00]], [[-2.0451e+00, -2.2416e+00, -2.7670e+00, -2.6235e+00, -3.4759e+00, -3.2631e+00, -2.9753e+00, -2.3279e+00, -2.8422e+00, -2.6121e+00, -2.3247e+00, -3.4627e+00]], [[-3.0572e+00, -4.9898e+00, -5.6810e+00, -5.2733e+00, -3.5097e+00, -5.0753e+00, -3.7174e+00, -2.1105e+00, -2.0285e+00, -1.4685e+00, -8.3533e-01, 1.2549e+00]], [[-9.0432e-01, -2.6312e+00, -2.7967e+00, -1.3361e+00, -1.6455e+00, -1.4408e+00, -9.7716e-01, -1.3658e+00, -1.0982e+00, 5.3171e-01, 6.2621e-01, 7.3730e-01]], [[ 1.4809e+00, 3.4405e+00, 2.7913e+00, 1.7671e+00, 5.4583e+00, 6.6965e-01, 8.1090e-01, 2.4049e+00, 1.8465e+00, 1.0063e+00, 1.5727e+00, 4.9716e+00]], [[-6.9088e-01, -4.6262e+00, -3.5597e+00, -1.6913e+00, -4.5837e+00, -1.3084e+00, -1.2719e+00, -5.0544e+00, -3.4656e+00, -1.4000e+00, -1.2837e+00, -4.4025e+00]], [[-6.0933e+00, -7.3711e+00, -7.0859e+00, -6.8639e+00, -6.9275e+00, -6.3649e+00, -6.2187e+00, -5.2270e+00, -4.6430e+00, -4.4259e+00, -4.3673e+00, -3.9019e+00]], [[-3.5800e+00, -1.9861e+00, -3.1773e+00, -3.4523e+00, -8.3332e-01, -3.5926e+00, -3.1250e+00, -1.0914e+00, -2.6708e+00, -3.0389e+00, -3.6655e+00, -2.0883e-01]], [[-1.4853e+00, -1.6381e+00, -1.7422e+00, -2.3666e+00, -1.8142e+00, -2.4490e+00, -2.4655e+00, -1.7684e+00, -1.8148e+00, -2.3765e+00, -2.2035e+00, -1.7224e+00]], [[ 7.2398e-01, 6.0143e-01, 4.4698e-01, -2.5832e-01, 1.2251e+00, -7.3022e-01, -4.8486e-01, 3.3238e-01, 1.7130e-01, -5.0298e-01, -3.9322e-01, 1.0957e+00]], [[-1.5431e+00, -2.3091e+00, -3.7056e+00, -2.5753e+00, -2.5860e+00, -2.5016e+00, -2.1420e+00, -2.2263e+00, -3.8089e+00, -2.5335e+00, -2.4874e+00, -2.5285e+00]]], [[[-4.5692e-02, -1.8651e+00, -1.0319e+00, -1.0732e+00, -2.2666e+00, -1.0505e+00, -2.2125e+00, -2.0819e+00, -2.0599e+00, -8.6773e-01, -8.7671e-01, -9.9871e-01]], [[ 1.7277e+00, 2.0221e+00, 3.5343e+00, 2.9283e+00, 3.2135e+00, 5.0341e-01, 2.6183e+00, 9.1106e-01, 1.4399e+00, 2.7952e+00, 2.3309e+00, 9.5893e+00]], [[-1.3391e+00, -2.3052e+00, -2.2790e+00, -1.9682e+00, -2.1343e+00, -1.7607e+00, -2.2831e+00, -2.5698e+00, -1.7998e+00, -2.3668e+00, -2.0043e+00, -2.0634e+00]], [[-1.9116e+00, -5.8682e+00, -4.2076e+00, -4.7624e+00, -4.7972e+00, -4.4566e+00, -3.8415e+00, -3.1190e+00, -2.4904e+00, -4.4876e-02, -5.8935e-01, 3.5238e+00]], [[-1.3241e+00, -2.7582e+00, -3.4031e+00, -2.6934e+00, -1.9374e+00, -2.9798e+00, -6.9823e-01, -1.6712e+00, -1.1885e+00, -1.4970e+00, -6.0197e-01, 2.5981e+00]], [[ 6.1381e+00, 1.1971e+00, 2.4496e+00, 2.0404e+00, 5.1804e-01, 1.5307e+00, 2.8256e+00, -2.2847e+00, -9.8357e-01, 3.8864e-01, 5.6452e-01, 1.1428e+01]], [[-3.9159e-01, -2.3667e+00, -3.2026e+00, -2.1397e+00, -2.5279e+00, -1.2883e+00, -9.1002e-01, -2.7277e+00, -2.6738e+00, -3.3573e+00, -2.0789e+00, -1.1369e+00]], [[-4.8171e+00, -5.7309e+00, -5.4133e+00, -5.7768e+00, -5.0411e+00, -5.4688e+00, -5.2244e+00, -3.6670e+00, -3.1803e+00, -2.6487e+00, -3.0072e+00, -2.8755e+00]], [[-1.7523e+00, -1.8519e+00, -1.9169e+00, -2.7048e+00, -1.7051e+00, -2.0043e+00, -2.6920e+00, -1.7734e+00, -1.4348e+00, -1.7831e+00, -2.5894e+00, -3.2080e+00]], [[-1.7560e+00, -2.2149e+00, -2.2499e+00, -2.6515e+00, -2.2975e+00, -2.4727e+00, -2.6401e+00, -2.3214e+00, -2.2160e+00, -2.2501e+00, -2.6019e+00, -2.5918e+00]], [[ 6.9941e-01, 3.6308e-01, 4.7528e-01, -8.6610e-03, 3.5120e-01, -5.5930e-01, -3.6255e-01, 1.2360e-01, 2.3168e-01, 2.8328e-01, -1.9120e-01, 1.5468e+00]], [[-1.3883e+00, -2.2640e+00, -3.6902e+00, -2.2476e+00, -2.9947e+00, -2.4375e+00, -2.2604e+00, -2.1291e+00, -1.9187e+00, -3.7388e+00, -2.0881e+00, -2.1968e+00]]], [[[-8.9709e-01, -2.0216e+00, -1.3328e+00, -1.1369e+00, -2.6822e+00, -1.9364e+00, -2.2756e+00, -2.0860e+00, -1.2178e+00, -1.0248e+00, -5.0814e-01, -2.4420e+00]], [[ 3.7053e-01, 2.0372e+00, 4.7754e-01, 3.7965e+00, 6.3408e-01, -2.1318e+00, -7.2921e-01, 6.9387e-01, 1.6811e+00, -6.5017e-01, 3.9814e+00, 7.7701e+00]], [[-1.2852e+00, -1.6526e+00, -1.9981e+00, -1.4096e+00, -2.8352e+00, -2.9207e+00, -2.8594e+00, -2.0570e+00, -2.3033e+00, -2.2106e+00, -1.4923e+00, -2.1641e+00]], [[-2.2257e+00, -4.2046e+00, -3.2910e+00, -7.9049e-01, -3.9343e+00, -2.8211e+00, -5.4176e+00, -1.4828e+00, -7.1707e-01, 1.1742e+00, 6.0340e+00, 4.3264e+00]], [[-4.1355e+00, -4.7419e+00, -4.8269e+00, -2.4635e+00, -4.7132e+00, -3.8555e+00, -2.1596e+00, -3.3627e+00, -3.5620e+00, -2.8277e+00, 3.6385e+00, 1.3825e+00]], [[ 5.1150e+00, 2.7728e+00, 4.1746e+00, 6.2854e+00, 1.3599e+00, 2.4403e-01, -3.3116e-01, 2.9855e-01, 2.9330e+00, 2.5765e+00, 9.6954e+00, 9.4159e+00]], [[-1.0974e+00, -3.0425e+00, -4.0728e+00, -1.8585e+00, -3.3094e+00, -1.9602e+00, -1.9065e+00, -3.3417e+00, -2.7081e+00, -4.1337e+00, -1.2676e+00, -2.4423e+00]], [[-5.4150e+00, -6.4781e+00, -6.2679e+00, -6.5035e+00, -5.7362e+00, -6.6434e+00, -6.2397e+00, -4.2691e+00, -4.1840e+00, -3.4557e+00, -2.8867e+00, -4.0708e+00]], [[-2.5928e+00, -1.6605e+00, -2.4246e+00, -2.8119e+00, -1.9457e+00, -3.8832e+00, -3.9345e+00, -1.2766e+00, -2.6419e+00, -2.1363e+00, -3.0861e+00, -3.3003e+00]], [[-1.4773e+00, -1.8693e+00, -2.0456e+00, -2.4904e+00, -2.2237e+00, -2.5600e+00, -2.7886e+00, -2.0459e+00, -1.9773e+00, -2.1193e+00, -2.4466e+00, -2.6616e+00]], [[ 1.2296e+00, 1.0453e+00, 9.5251e-01, 7.5304e-01, 5.1486e-01, -4.7723e-01, -6.1962e-01, 6.1192e-01, 5.6656e-01, 4.9288e-01, 8.9041e-01, 1.5630e+00]], [[-1.2939e+00, -1.7888e+00, -3.2907e+00, -2.1145e+00, -2.0879e+00, -2.2263e+00, -2.2740e+00, -1.7204e+00, -2.0993e+00, -3.3788e+00, -2.3886e+00, -2.2252e+00]]], [[[-6.8554e-01, -2.7887e+00, -1.8125e+00, -2.1728e+00, -2.6326e+00, -3.1579e+00, -3.4095e+00, -2.9199e+00, -2.5475e+00, -1.7309e+00, -3.3255e+00, -2.8620e+00]], [[ 1.9182e+00, 1.7637e+00, 1.4554e+00, -2.2928e-02, -1.5317e+00, -2.0590e+00, -9.6384e-01, 8.8786e-01, -1.9587e+00, -5.5245e-01, -1.1939e+00, 7.3532e+00]], [[-9.7679e-01, -1.9082e+00, -1.1069e+00, -1.2400e+00, -2.5702e+00, -2.7441e+00, -3.4880e+00, -2.2675e+00, -2.6790e+00, -2.6341e+00, -3.5466e+00, -1.2434e+00]], [[-7.4161e-01, -3.4350e+00, -1.7456e+00, -2.5264e+00, -2.8250e+00, -3.6920e+00, -3.1158e+00, -8.3079e-01, -3.0328e-01, -4.0489e-01, -8.0608e-01, 4.6485e+00]], [[-5.7176e-02, -1.4019e+00, -1.0461e+00, -4.0758e-01, -9.1935e-01, -1.9009e+00, -7.4013e-01, 1.1238e-01, 3.6779e-01, -2.0914e-02, 5.4193e-01, 1.9548e+00]], [[ 7.0116e+00, 2.3119e+00, 4.0296e+00, 2.0170e+00, 1.1840e+00, 2.3021e+00, 4.0743e-01, 3.7732e-01, 5.3980e-01, 1.1969e+00, -2.3338e-02, 1.0217e+01]], [[ 5.1230e-01, -2.1365e+00, -3.4787e+00, -1.8907e+00, -2.6077e+00, -1.0532e+00, -7.7528e-01, -2.5927e+00, -2.6609e+00, -7.0115e-01, -6.6482e-01, -1.4620e+00]], [[-5.0696e+00, -6.3275e+00, -5.8703e+00, -6.0785e+00, -5.5856e+00, -6.0940e+00, -4.9641e+00, -4.2902e+00, -3.8584e+00, -3.6104e+00, -3.2678e+00, -2.7027e+00]], [[-2.7323e+00, -1.2358e+00, -2.2497e+00, -3.4634e+00, -1.6774e+00, -3.6404e+00, -3.3039e+00, -1.0143e+00, -1.5039e+00, -2.8081e+00, -3.1693e+00, -2.1742e+00]], [[-1.8353e+00, -2.0782e+00, -2.2444e+00, -2.6779e+00, -2.3592e+00, -2.9217e+00, -2.8766e+00, -2.2415e+00, -2.3325e+00, -2.7648e+00, -2.8255e+00, -2.6308e+00]], [[ 1.0074e+00, 5.4632e-01, 6.9959e-01, 1.3674e-02, 2.1138e-01, -6.5661e-01, -6.6719e-01, 2.6729e-01, 8.2931e-02, -1.8644e-01, -7.7113e-01, 1.4070e+00]], [[-1.3719e+00, -2.1469e+00, -3.4357e+00, -2.4055e+00, -2.5378e+00, -2.2159e+00, -2.0908e+00, -2.1599e+00, -2.5551e+00, -1.8622e+00, -2.0566e+00, -2.7436e+00]]], [[[-1.1833e+00, -2.0508e+00, -1.9713e+00, -1.9067e+00, -1.6937e+00, -1.3968e+00, -7.8956e-01, -2.3238e+00, -2.5587e+00, -1.2095e+00, -7.4240e-01, -5.6989e-01]], [[ 1.1388e+00, 8.5054e-01, 1.4818e+00, 1.5039e+00, -1.1974e+00, 9.0455e-01, 9.1299e+00, -5.9305e-01, -8.0932e-01, -1.6990e+00, 1.4293e+00, 9.0932e+00]], [[-1.1936e+00, -2.1586e+00, -2.0160e+00, -2.1986e+00, -1.8721e+00, -1.3622e+00, -2.4632e+00, -2.6324e+00, -2.2619e+00, -2.1553e+00, -2.0393e+00, -2.5131e+00]], [[-2.5466e+00, -8.2683e+00, -8.1173e+00, -7.0702e+00, -6.7324e+00, -3.8170e+00, 7.9626e-01, -5.0786e+00, -4.0787e+00, -3.3344e+00, -4.3020e-01, 3.9458e+00]], [[-6.3834e-01, -2.3450e+00, -3.5283e+00, -4.0121e+00, -2.5896e+00, -1.9766e+00, 1.2656e+00, -1.5342e+00, -1.4641e+00, -1.0865e+00, -5.4777e-01, 2.7904e+00]], [[ 6.6172e+00, 1.6494e+00, 1.6581e+00, 1.0932e+00, 8.6429e-01, 2.9458e+00, 1.2423e+01, -9.2835e-01, -1.6442e+00, 5.7551e-01, 2.9547e+00, 1.2134e+01]], [[-8.1248e-02, -2.3077e+00, -2.5921e+00, -2.1502e+00, -3.0361e+00, -1.0969e+00, -1.0143e+00, -2.7296e+00, -3.1958e+00, -2.9415e+00, -8.1139e-01, -9.5164e-01]], [[-4.5170e+00, -6.0196e+00, -5.6328e+00, -6.3084e+00, -5.0996e+00, -4.0899e+00, -5.1448e+00, -3.5798e+00, -3.6389e+00, -3.0992e+00, -2.2017e+00, -3.2339e+00]], [[-1.6007e+00, -2.1765e+00, -3.0414e+00, -2.4929e+00, -2.0757e+00, -2.6640e+00, -3.2899e+00, -2.1608e+00, -2.9771e+00, -2.2277e+00, -2.0746e+00, -3.1765e+00]], [[-1.9018e+00, -2.1178e+00, -2.2757e+00, -2.6483e+00, -2.1938e+00, -1.9196e+00, -3.6685e+00, -2.2632e+00, -2.6066e+00, -2.2960e+00, -2.8053e+00, -3.6235e+00]], [[ 2.5486e-01, 2.3344e-01, -1.3854e-01, -2.6627e-01, 2.4889e-01, -2.6912e-01, 1.6309e+00, 8.2425e-02, -3.7635e-01, 9.0580e-02, -1.6329e-01, 1.5844e+00]], [[-1.4468e+00, -2.4984e+00, -2.9846e+00, -2.8594e+00, -3.1259e+00, -3.0177e+00, -2.1116e+00, -2.6415e+00, -2.4131e+00, -3.1080e+00, -2.4599e+00, -2.0229e+00]]]]) attn_weights tensor([[[[-1.4972, -3.1589, -2.8069, -2.2276, -2.8516, -2.7045, -2.1156, -1.3071, -1.1235, -0.5393, -0.4358, -0.6445]], [[-0.8685, -1.8813, -2.4189, -2.0586, -2.5690, -2.2553, -1.6771, 0.0471, -0.6565, -0.4081, -0.6177, -0.5669]], [[-2.7920, -3.7787, -3.3879, -3.7490, -3.0238, -3.3866, -2.9777, -2.3535, -2.6050, -3.0107, -2.4351, -2.3101]], [[ 0.0579, -2.9098, -2.7732, -2.8110, -2.6230, -2.4991, -2.3077, -2.1787, -2.2291, -2.3317, -1.8616, -2.0547]], [[-0.5877, -2.5646, -2.7310, -2.6617, -2.4686, -2.0898, -2.0009, -2.0544, -2.2082, -2.1604, -1.6075, -1.8835]], [[ 0.2499, 0.1231, -1.5602, -0.6198, -0.9582, -2.0255, -1.8624, 0.2949, -1.7328, -0.8805, -2.6482, -1.0757]], [[ 1.1356, -0.7252, -1.0180, -1.0097, -0.7383, -1.0595, -0.9039, -0.7305, -1.3382, -1.4162, -0.8203, -0.9611]], [[ 0.2108, -1.6247, -2.1531, -1.9413, -1.8869, -1.4650, -1.4159, -1.2740, -2.1946, -2.0901, -1.3104, -1.7311]], [[-0.5062, -1.4559, -2.1081, -2.2701, -1.7379, -2.3141, -2.4251, -1.5792, -2.0024, -2.1743, -2.3070, -1.6467]], [[ 1.2884, -0.6584, -0.2622, -0.5996, 0.0874, -1.2164, -1.2698, -0.8884, -0.2395, -0.5244, -1.0358, 0.0719]], [[-5.2009, -2.2134, -2.1000, -2.1053, -1.9871, -1.6317, -1.4657, -1.5627, -1.4708, -1.5258, -0.8324, -1.3031]], [[-1.4453, -1.7738, -3.9860, -4.4104, 0.7901, -5.3719, -6.0188, -1.3558, -3.3586, -3.6923, -3.9670, 1.3940]]], [[[-0.8015, -2.0213, -1.4223, -0.3970, -1.1978, -1.5514, -1.7012, -0.0153, 0.7369, 0.8291, 1.8631, 0.3054]], [[-0.4381, -1.6173, -1.9428, -1.6365, -1.6498, -1.7050, -1.3720, 0.2682, 0.2022, 0.0507, 0.3233, -0.6922]], [[-2.9343, -3.8524, -3.5086, -3.8744, -3.1789, -3.5555, -3.1339, -2.4096, -2.5947, -2.7050, -3.0518, -2.8354]], [[-0.0208, -2.9976, -2.8860, -2.9066, -2.7788, -2.5853, -2.3690, -2.2360, -2.2680, -2.2393, -2.3193, -2.1653]], [[-0.5690, -2.6059, -2.8093, -2.7725, -2.6106, -2.2963, -2.0999, -2.0588, -2.1416, -2.1243, -2.1133, -1.6949]], [[ 1.1595, 0.9308, -0.4367, 0.8050, 0.4446, -1.7416, -1.2025, 0.7054, 0.1570, -0.9784, 0.4268, -0.0408]], [[ 0.5687, -0.9758, -1.1823, -1.8494, -1.5145, -1.0378, -1.0648, -1.1328, -1.4347, -1.6341, -2.3847, -1.5705]], [[ 0.4401, -1.3029, -2.1767, -2.2093, -1.9190, -1.0382, -0.6702, -1.0568, -1.6467, -2.1904, -2.3042, -1.9145]], [[-0.6960, -1.7852, -2.0584, -2.2635, -2.0173, -2.4762, -2.6953, -1.7692, -2.0547, -1.9591, -2.1053, -2.4777]], [[ 1.2389, -0.6699, -0.0475, -0.9770, 0.1682, -0.9346, -1.2755, -0.9113, -0.7343, -0.1423, -0.9131, -0.5933]], [[-5.3463, -2.3152, -2.2388, -2.2558, -2.1971, -1.7333, -1.5463, -1.6239, -1.6291, -1.4653, -1.5409, -1.2487]], [[ 1.0785, 0.8187, -1.9582, -2.6809, -1.9352, -3.6379, -3.0410, 0.7714, 0.0968, -2.7230, -3.1319, 4.3139]]], [[[-1.5354, -3.6719, -2.1020, -2.1451, -2.6796, -3.6660, -3.9501, -1.3050, -1.3546, 0.4015, 1.5260, -1.5365]], [[-0.0415, -1.1507, -1.7830, -1.9761, -1.3902, -1.6060, -1.1640, 0.6238, 0.3970, 0.3862, -0.8084, -0.7487]], [[-2.6724, -3.7894, -3.3282, -3.7293, -3.0541, -3.4247, -2.9791, -2.2487, -2.6462, -2.4467, -3.2043, -3.1003]], [[-0.0309, -2.6793, -2.6214, -2.6704, -2.5470, -2.3288, -2.1821, -2.0595, -2.1498, -2.0302, -2.3944, -2.3657]], [[-0.4948, -2.4620, -2.5858, -2.5358, -2.4230, -2.0970, -2.0041, -1.9457, -1.9717, -1.9039, -2.1685, -2.1556]], [[ 1.3308, 0.8459, -0.7776, 0.1510, 0.1532, -3.1270, -3.3372, 0.9328, 0.6873, -0.9077, -0.3087, 0.7440]], [[ 1.4272, -0.6627, -1.0112, -0.8176, -0.0247, -1.5867, -1.4287, -0.9968, -0.8653, -1.4796, -0.8860, -1.0202]], [[ 1.1515, -0.8448, -1.7856, -1.3564, -1.4861, -0.6659, -0.4998, -0.4652, -1.2522, -1.7810, -1.7172, -1.2414]], [[-0.8124, -1.9640, -2.3420, -2.4307, -2.0743, -2.7058, -2.9193, -1.8198, -2.2212, -2.2414, -2.5856, -2.2799]], [[ 1.4385, -0.4585, -0.0257, -0.9078, 0.1641, -1.1286, -1.1308, -0.6380, -0.1068, 0.0351, -0.4815, -0.2961]], [[-5.5592, -2.0976, -2.0693, -2.0696, -1.9977, -1.6218, -1.4382, -1.5283, -1.4216, -1.3738, -1.7199, -1.6731]], [[ 0.5369, 0.0520, -2.8949, -0.9289, -2.8415, -3.4688, -5.5223, 0.4114, -2.7686, -2.7713, 0.3121, 3.3745]]], [[[-0.2154, -1.4997, -1.0103, -0.8718, -1.2537, -1.2488, -0.7382, -0.0881, -0.0445, -0.2686, -0.1668, 0.5418]], [[-0.1949, -1.2328, -2.2511, -2.2178, -2.1246, -2.4347, -2.2730, -0.0510, -1.0618, -1.9934, -1.4243, -0.0314]], [[-2.7423, -3.7655, -3.2467, -3.6497, -3.0591, -3.4028, -3.0345, -2.3546, -2.6233, -3.0495, -2.6273, -2.1397]], [[ 0.2078, -2.7755, -2.5696, -2.6434, -2.5366, -2.3745, -2.1610, -2.0990, -2.1976, -2.1049, -1.8693, -1.5814]], [[-0.5084, -2.5846, -2.6355, -2.6522, -2.5555, -2.1996, -2.0880, -2.1048, -2.1521, -1.6866, -1.7279, -1.5374]], [[ 2.3341, 1.8071, 0.6724, 0.2755, 0.3377, -1.4589, -1.8357, 1.5763, 0.2088, -3.1896, -2.3297, 2.3264]], [[ 0.7500, -0.7912, -1.8892, -2.7445, -2.7795, -1.6913, -2.5580, -1.2008, -2.8482, -2.6236, -2.7711, -0.6018]], [[ 0.1277, -1.9937, -1.5851, -1.2889, -2.4559, -1.7741, -1.4684, -1.7037, -2.3098, -1.2849, -1.6713, -1.2154]], [[-0.0354, -0.6068, -1.6108, -1.7094, -1.1447, -1.3691, -1.7222, -0.8353, -1.1415, -1.8684, -1.5579, -0.9535]], [[ 1.3268, -0.4096, -0.4986, -0.6177, -0.1061, -0.9719, -1.1919, -0.7725, -0.0478, -1.5275, -1.0353, 0.1010]], [[-5.2087, -2.1132, -1.9657, -2.0320, -1.9797, -1.5926, -1.4309, -1.5119, -1.5821, -1.2023, -1.0379, -0.8117]], [[ 1.3867, 0.4327, -1.9042, -1.4776, -2.9905, -3.5377, -2.0067, 0.2989, -3.4036, -2.2789, -2.7012, 3.3903]]], [[[-2.1578, -2.9251, -2.4799, -3.2765, -1.5691, -1.5450, -1.5834, -0.8933, -1.5722, 0.1976, 0.3924, -0.3766]], [[-1.1443, -2.3012, -2.4508, -2.4814, -2.2960, -2.6345, -2.6541, -0.3877, -1.3431, -0.7630, -1.1143, -1.4077]], [[-2.8764, -3.6577, -3.3702, -3.7026, -3.1132, -3.4297, -3.0383, -2.3474, -3.0656, -2.6700, -2.6903, -2.5209]], [[ 0.1077, -2.8696, -2.7065, -2.7254, -2.6551, -2.4959, -2.2947, -2.1873, -2.5007, -2.2978, -1.9696, -1.9330]], [[-0.6311, -2.3568, -2.6712, -2.6280, -2.5390, -2.2822, -2.0438, -2.0166, -2.2367, -2.1670, -1.6329, -1.6282]], [[-1.0953, -0.8248, -1.9191, -2.6316, -1.2998, -1.1107, -1.0976, -1.1020, -3.2324, -1.5817, -0.1828, -0.9212]], [[ 2.1846, 0.6435, 0.2900, -1.1661, -0.1429, -2.3570, 1.2920, 0.2667, -1.5915, -0.0065, 1.5117, 1.0023]], [[-0.2346, -2.2670, -2.4976, -2.4467, -2.7112, -1.0559, -2.7602, -1.8248, -2.1473, -2.3703, -1.3913, -2.8812]], [[-0.8507, -1.5999, -2.3305, -2.6341, -1.8565, -2.4797, -2.9418, -1.6502, -1.8633, -1.9218, -2.5386, -2.5866]], [[ 1.1301, -0.1908, 0.1172, -0.2481, 0.2407, -0.5462, -1.5343, -0.6353, -0.0102, 0.1409, -1.4780, -0.9310]], [[-5.2284, -1.9399, -1.9371, -1.9138, -1.8877, -1.5244, -1.3904, -1.4182, -1.6042, -1.4321, -0.9622, -0.9507]], [[-2.3810, -2.3277, -4.5858, -5.8357, -4.8177, -4.0249, 1.1993, -1.6664, -5.9304, -4.4472, -2.5657, 0.8820]]]]) attn_weights tensor([[[[ -1.9445, -4.5651, -3.7659, -5.2221, -4.9057, -3.8821, -4.1430, -3.0556, -1.9759, -3.5093, -1.7000, -2.6430]], [[ 1.7184, -1.2901, -1.9670, -1.5243, -2.2565, -1.8765, -2.0246, -1.3077, -3.0529, -2.4693, -1.5932, -2.7210]], [[ -8.3496, -14.4715, -13.3600, -13.0723, -15.1692, -10.3149, -9.2352, -7.6571, -5.9635, -6.0313, -3.1834, -5.9566]], [[ -3.2277, -6.9412, -6.4671, -7.4678, -6.7821, -6.1127, -5.2566, -4.1226, -3.3270, -4.1181, -2.3555, -2.6543]], [[ -2.4702, -5.7732, -6.1149, -5.7395, -7.1016, -6.8954, -4.4833, -2.9941, -2.9392, -2.8786, -2.7012, -3.0975]], [[ -4.5596, -6.9739, -8.3055, -7.6671, -9.2983, -6.3757, -6.3144, -3.2928, -4.3354, -3.8487, -4.6764, -4.2742]], [[ -1.0333, -3.9283, -3.9616, -4.1959, -3.8331, -4.1732, -4.1721, -2.2997, -2.6111, -3.1517, -2.6122, -2.4213]], [[ -1.3798, -4.2714, -2.7824, -2.5285, -2.4381, -1.6636, -1.7933, -1.6764, -0.9925, -1.2106, -0.7958, -0.9489]], [[ -4.1417, -7.8155, -8.7997, -6.0542, -8.5375, -6.6227, -5.3761, -4.4904, -5.0999, -2.7093, -0.8179, -4.1347]], [[ -4.5036, -8.5084, -7.9983, -8.8557, -9.5105, -4.7965, -4.4747, -5.0060, -4.0493, -4.9415, -2.2276, -4.5409]], [[ -1.7842, -3.7926, -3.4672, -3.1856, -3.2531, -2.5897, -2.4549, -2.8842, -2.4125, -2.2807, -1.5504, -2.0841]], [[ -0.7544, -5.0717, -4.7853, -4.5236, -4.4495, -3.9091, -3.7046, -3.7433, -3.4419, -3.3511, -2.7228, -2.9959]]], [[[ -1.6690, -4.2476, -4.2112, -5.0355, -4.4681, -3.0219, -3.6541, -2.9560, -1.1616, -2.3636, -3.3124, -2.5034]], [[ 1.0779, -0.9130, -1.0595, -1.3656, -2.4217, -1.3490, -1.2995, -1.8232, -1.7957, -2.3211, -2.2424, -1.7668]], [[ -6.7150, -12.1100, -10.8668, -11.1770, -9.1143, -8.3180, -7.8640, -6.1290, -4.2038, -3.1991, -3.6896, -4.8235]], [[ -2.8990, -6.3816, -6.0589, -7.4634, -3.7070, -5.0007, -4.0920, -3.5748, -2.3373, -2.7612, -3.9358, -3.1301]], [[ -2.2409, -6.6381, -7.9502, -6.3291, -5.0953, -7.1771, -4.2645, -3.4143, -1.9069, -4.1771, -2.6097, -5.7343]], [[ -4.3408, -7.2340, -7.8008, -7.7336, -6.5652, -6.6326, -5.8117, -3.0689, -2.6908, -3.4201, -3.4518, -5.5109]], [[ -1.3042, -4.2354, -4.4391, -4.4157, -4.1295, -4.4178, -4.1209, -2.7341, -2.1558, -2.9501, -3.2546, -3.0817]], [[ -1.3877, -4.2419, -2.7426, -2.3816, -2.4250, -1.7663, -1.8041, -1.5444, -1.5041, -0.8438, -0.9216, -1.2147]], [[ -3.3888, -6.1436, -8.3655, -4.8600, -5.2369, -5.9702, -4.9810, -3.2061, -2.2689, -4.5771, -1.3541, -3.3356]], [[ -4.0606, -8.4154, -7.6005, -8.9697, -7.1148, -4.3356, -4.3299, -4.9448, -4.5151, -3.2086, -4.5901, -4.1225]], [[ -1.8742, -3.9951, -3.6621, -3.3050, -3.5543, -2.8925, -2.6186, -2.9522, -2.7507, -2.4115, -2.2543, -1.9375]], [[ -0.8282, -5.0370, -4.8455, -4.6753, -4.4498, -3.9756, -3.7505, -3.7536, -3.4459, -3.2755, -3.2568, -2.9478]]], [[[ -2.1254, -4.6184, -4.6122, -4.7141, -4.3633, -4.4257, -3.6144, -3.1171, -2.9431, -2.4022, -2.8890, -3.2254]], [[ 1.3061, -1.0711, -1.9188, -1.7202, -2.7539, -2.0670, -2.2383, -1.9538, -2.2092, -3.1261, -2.7311, -2.7316]], [[ -8.4108, -14.2517, -11.6721, -13.4655, -9.8659, -10.4308, -8.6136, -7.3237, -5.9549, -3.0107, -3.9746, -7.5903]], [[ -3.4980, -6.7422, -6.3058, -7.2400, -3.8578, -5.9446, -5.4914, -3.7370, -1.7272, -2.7352, -4.4492, -4.3570]], [[ -2.5704, -5.7981, -6.7848, -6.5760, -4.4335, -8.4868, -5.8736, -2.8495, -2.6007, -3.2684, -2.9257, -5.5713]], [[ -4.5939, -7.3566, -8.4022, -7.8631, -6.2560, -6.9749, -6.3575, -3.1246, -3.4942, -3.5395, -4.9492, -5.2456]], [[ -1.1267, -3.7893, -3.5106, -3.4217, -3.6518, -3.9322, -3.9370, -2.4620, -2.4193, -2.0595, -2.6745, -2.9620]], [[ -1.3515, -4.1144, -2.7654, -2.4394, -2.5239, -1.6695, -1.7934, -1.6027, -1.2811, -0.8564, -1.4932, -1.6140]], [[ -3.5613, -6.0889, -8.4557, -4.1863, -4.4792, -5.6241, -5.3029, -2.9582, -2.0736, -4.4337, -0.7542, -3.2613]], [[ -4.3628, -7.7033, -7.2686, -8.2930, -6.1374, -4.6011, -4.2490, -4.6576, -3.7160, -2.9363, -4.3618, -5.0242]], [[ -2.0129, -3.8115, -3.5213, -3.1903, -3.4882, -2.8172, -2.6619, -2.9299, -2.2586, -2.2525, -2.6524, -2.2385]], [[ -0.9044, -5.1559, -4.8897, -4.5229, -4.5990, -4.0299, -3.7934, -3.8719, -3.4182, -3.1862, -3.4383, -3.2041]]], [[[ -1.1685, -4.6157, -2.4711, -3.1776, -3.1253, -4.1821, -4.0260, -3.8010, -2.1067, -2.6406, -3.3281, -2.7636]], [[ 1.3303, -0.7329, -1.3409, -0.6967, -2.5734, -1.2164, -2.0467, -1.8299, -3.0886, -2.3775, -3.4081, -1.4395]], [[ -6.0556, -12.8990, -11.0933, -10.6399, -9.9087, -8.8289, -8.7115, -7.5117, -5.4385, -4.6060, -4.9733, -4.5411]], [[ -2.6189, -5.6408, -4.6930, -4.7677, -4.0421, -5.1555, -4.8462, -3.2179, -2.0215, -2.6147, -3.4704, -2.7054]], [[ -0.9269, -3.7610, -4.9129, -5.0278, -3.8384, -6.6360, -6.3321, -2.1572, -1.9380, -4.7213, -4.8568, -2.7572]], [[ -3.3513, -6.0825, -6.4732, -6.5074, -6.0561, -6.3352, -5.5056, -3.1223, -3.7543, -4.4620, -3.1563, -2.0946]], [[ -1.5370, -4.2059, -4.1801, -3.5293, -4.0267, -4.6766, -4.0582, -2.8673, -2.8675, -3.3102, -3.1669, -1.5428]], [[ -1.3173, -4.0303, -2.4076, -2.2747, -2.2130, -1.3824, -1.4114, -1.3350, -1.1963, -0.8121, -0.3735, -0.3381]], [[ -2.4417, -5.0375, -4.9393, -3.6689, -4.2930, -5.0635, -4.2042, -3.1347, -2.4190, -3.0412, -3.1308, -2.2493]], [[ -3.8977, -7.7707, -6.9603, -6.7566, -6.2458, -4.9699, -4.2797, -4.7614, -3.7384, -2.6723, -2.2029, -3.2873]], [[ -1.4158, -3.6018, -3.2686, -3.1059, -3.1801, -2.2724, -2.2514, -2.6364, -2.4909, -1.7688, -1.6254, -1.7305]], [[ -0.5646, -5.0820, -4.5159, -4.5053, -4.3704, -3.7024, -3.4828, -3.8389, -3.5231, -3.1145, -2.7145, -2.8514]]], [[[ -1.4527, -4.4548, -3.0666, -3.8454, -4.0315, -3.9788, -5.2885, -2.8903, -1.8364, -2.2538, -1.5738, -3.7563]], [[ 1.5816, -2.0704, -2.6807, -1.5635, -2.6787, -1.6738, -2.4124, -1.8992, -1.9090, -2.0840, -1.2661, -3.7822]], [[ -6.4220, -12.1883, -10.7990, -11.4069, -10.7187, -8.3986, -10.0225, -6.0869, -4.7126, -4.7661, -3.4666, -4.2847]], [[ -3.3633, -6.6370, -6.4041, -5.6123, -4.6225, -5.7619, -5.6442, -3.4173, -3.5531, -1.4627, -2.7943, -3.0209]], [[ -1.4547, -4.1613, -5.0708, -5.5381, -4.1027, -4.9660, -5.6732, -1.7373, -5.5478, -1.3607, -2.8610, -3.3253]], [[ -4.9064, -7.1763, -8.1289, -7.4816, -7.4726, -6.8147, -7.5856, -3.2366, -4.2647, -3.9770, -3.7684, -4.1785]], [[ -0.5129, -3.4319, -2.9976, -3.7572, -3.1803, -4.8464, -4.3214, -1.8341, -2.5644, -2.1348, -3.4424, -3.3325]], [[ -1.3214, -4.0544, -2.4578, -2.5332, -2.4266, -1.6817, -1.7442, -1.6165, -1.8580, -1.6387, -0.7726, -0.5301]], [[ -3.3840, -6.8591, -6.6799, -5.0304, -6.3536, -6.5209, -6.5168, -3.4400, -3.1997, -3.4958, -3.8690, -4.1423]], [[ -5.1341, -8.4460, -7.8317, -8.1545, -7.6800, -5.1676, -7.0768, -4.9941, -4.8767, -4.2890, -2.4746, -3.7659]], [[ -1.7629, -3.3206, -3.0920, -3.0353, -2.9023, -2.3797, -2.1675, -2.3787, -2.2989, -2.1355, -1.6766, -1.4880]], [[ -0.7491, -4.7834, -4.5244, -4.4226, -4.1251, -3.8590, -3.7527, -3.4047, -3.4454, -3.2571, -3.0363, -2.8510]]]]) attn_weights tensor([[[[ 4.4140, -1.2410, -3.2250, -1.7223, 1.3003, -3.3359, -2.6328, -1.6489, -3.4755, -2.6026, -4.1158, 0.8776]], [[ -2.9483, -6.2952, -5.5505, -5.6814, -5.8819, -6.1145, -6.7914, -3.3354, -3.3857, -3.4727, -5.0123, -3.7195]], [[ -5.0319, -10.0508, -10.2900, -9.0356, -10.6625, -8.6907, -7.1675, -6.8726, -5.7156, -4.8798, -3.2417, -4.4303]], [[ -5.7775, -12.1632, -15.7950, -12.8525, -14.9969, -10.8927, -10.1064, -8.7233, -11.0165, -8.5486, -4.6258, -7.8767]], [[ 1.0353, -3.4242, -3.9566, -3.7693, -3.0493, -2.7544, -3.1743, -3.2663, -3.8370, -3.8978, -3.3155, -2.8274]], [[ -0.1633, -2.9036, -3.9753, -3.3687, -3.1075, -2.6802, -2.5222, -3.3092, -4.0523, -3.5871, -2.8971, -2.8027]], [[ -3.8033, -8.2664, -6.2434, -7.0384, -9.0319, -5.0962, -5.4975, -5.3356, -3.0394, -4.2190, -4.1296, -4.7253]], [[ -6.1147, -12.7271, -13.2196, -12.4982, -14.2415, -7.7090, -7.3269, -7.8517, -8.0108, -8.0228, -5.3119, -6.1826]], [[ -4.6713, -8.7629, -10.6108, -8.9979, -10.9929, -7.6135, -7.9210, -5.6039, -6.4814, -5.2335, -3.9679, -5.8166]], [[ -2.3954, -6.2094, -5.7829, -5.3963, -5.5944, -5.9835, -3.9511, -4.0459, -3.4897, -3.1346, -1.8358, -3.3644]], [[ -1.1308, -5.8911, -5.9968, -7.0263, -4.4227, -4.4942, -4.6316, -4.2026, -4.8379, -6.0259, -3.2206, -2.0693]], [[ -2.8217, -6.8437, -8.0097, -7.0632, -7.2574, -5.6530, -5.6192, -4.4115, -5.1953, -4.8672, -3.7336, -4.3953]]], [[[ 5.0615, -1.3404, -2.7535, -1.8761, -1.3643, -5.4335, -2.3423, -1.8152, -2.5312, -3.1823, -2.9041, 2.0766]], [[ -2.5985, -5.8497, -4.9938, -5.7907, -6.2749, -5.6984, -6.3847, -3.4291, -3.0113, -3.0288, -3.7619, -6.7259]], [[ -4.2951, -8.0999, -7.0011, -7.7557, -5.6654, -6.9454, -7.9789, -5.1373, -4.5828, -2.9254, -3.8082, -6.1995]], [[ -4.6353, -9.4962, -13.1521, -10.6308, -10.6788, -10.0338, -10.8911, -6.1205, -6.2604, -8.5382, -6.1564, -7.9539]], [[ 1.3714, -4.1353, -5.3228, -3.7298, -3.4622, -3.5024, -2.1585, -3.5977, -3.2693, -5.3105, -3.9328, -5.7773]], [[ -0.2263, -2.4139, -3.4286, -2.2130, -1.4614, -2.4621, -2.1056, -3.1844, -3.4117, -3.6717, -2.7400, -1.9425]], [[ -2.8009, -6.1614, -3.8883, -4.3129, -5.9629, -4.2303, -5.2716, -3.8960, -3.4350, -1.1639, -1.6948, -3.6388]], [[ -5.6758, -9.3717, -9.5110, -9.8122, -6.9655, -6.8235, -6.0250, -5.2613, -5.7383, -4.9104, -5.7357, -6.9604]], [[ -4.1479, -7.1347, -8.3072, -7.5049, -7.3224, -6.6291, -6.2683, -3.4207, -2.8269, -4.3818, -3.4630, -5.3387]], [[ -1.4936, -4.9067, -4.5227, -2.4258, -3.0324, -4.5603, -3.8871, -3.0868, -2.6576, -2.8326, -1.2809, -4.0079]], [[ -0.8186, -5.3637, -4.6474, -5.4519, -3.9277, -4.4705, -4.5435, -3.4180, -3.2033, -3.5725, -4.2602, -2.1398]], [[ -2.5665, -5.7522, -6.7542, -5.9852, -4.0944, -4.9632, -4.7411, -3.6863, -3.3056, -3.8289, -3.6955, -3.5490]]], [[[ 4.4850, -0.9656, -2.8068, -1.2517, -1.1732, -6.0177, -5.3904, -1.8841, -3.7802, -3.3138, -1.1741, 0.8975]], [[ -2.9638, -6.8328, -5.8323, -7.2949, -6.4398, -5.8166, -6.9951, -4.0121, -3.6526, -3.8185, -5.9572, -5.8832]], [[ -4.9477, -8.5901, -8.0626, -7.5314, -6.1871, -7.7671, -8.9447, -5.8187, -6.6174, -3.0824, -4.2284, -5.7982]], [[ -4.9802, -10.8797, -12.4337, -11.2944, -11.2056, -12.3065, -12.5856, -7.4520, -7.7508, -6.7353, -5.0312, -6.9353]], [[ 1.2289, -3.7274, -3.8472, -2.6992, -3.0382, -4.8765, -3.5077, -3.4496, -4.0046, -3.8336, -3.7904, -3.5888]], [[ -0.1830, -2.7967, -3.9042, -2.3496, -2.4601, -3.2557, -3.5313, -3.2102, -3.9371, -3.8663, -3.4624, -3.2751]], [[ -3.1832, -7.6437, -5.7328, -7.5131, -7.1607, -6.2156, -7.2520, -4.3337, -4.3657, -1.4502, -2.9989, -4.5789]], [[ -5.8305, -11.2553, -11.6641, -10.7865, -9.2966, -7.6891, -8.6032, -6.9192, -6.4994, -5.8275, -6.9645, -7.3554]], [[ -4.5261, -8.1514, -9.6213, -8.3826, -9.7581, -8.6490, -7.9245, -4.7205, -3.3177, -4.9294, -5.2951, -5.2225]], [[ -1.8506, -5.5424, -5.2423, -3.8895, -4.7266, -5.6226, -5.1549, -3.6602, -0.6962, -2.9133, -0.7711, -2.9918]], [[ -1.1374, -5.4155, -4.9871, -3.9734, -3.3643, -4.3846, -5.2384, -4.2295, -4.7839, -3.4727, -4.5713, -3.3919]], [[ -2.4499, -6.1272, -7.4221, -6.6715, -4.9071, -5.8317, -7.5313, -4.4530, -2.8484, -4.3326, -4.1460, -4.6653]]], [[[ 5.2886, 0.6544, -1.9481, -0.8691, -0.2619, -3.6579, -3.4723, -0.5307, -0.9903, -1.7858, -3.8370, 3.3885]], [[ -2.5907, -6.2873, -5.2256, -5.6725, -5.4587, -6.8717, -7.2612, -4.9164, -3.9828, -7.4388, -6.0155, -4.2761]], [[ -4.1770, -8.2665, -8.1534, -8.2731, -6.4734, -8.1690, -8.1330, -5.8347, -3.1995, -5.6637, -5.4041, -5.6006]], [[ -4.3422, -12.3284, -15.4232, -13.9040, -12.8006, -12.1893, -9.9903, -8.9442, -8.8771, -9.0296, -6.8577, -6.3948]], [[ 1.2601, -2.5627, -3.6803, -4.1167, -3.8029, -3.6994, -2.8928, -1.9733, -2.3912, -1.7988, -2.6606, -1.7050]], [[ -0.3157, -1.6209, -1.9431, -1.4975, -1.2951, -2.3735, -2.8108, -2.4253, -2.2496, -2.7449, -3.5998, -3.0332]], [[ -3.3984, -6.8242, -4.3778, -6.0239, -5.6631, -4.7390, -5.8103, -5.5495, -3.2324, -3.0732, -3.7458, -4.4569]], [[ -5.2232, -12.5469, -12.5283, -12.0668, -11.8153, -8.4259, -7.0093, -7.9565, -8.2591, -5.5508, -4.0563, -6.0087]], [[ -3.8735, -8.7960, -8.9609, -8.6019, -7.8025, -8.2668, -6.8667, -5.4909, -4.8820, -7.0241, -4.7210, -3.5294]], [[ -1.6012, -3.8042, -4.6933, -4.5578, -5.6116, -5.1358, -5.4896, -3.3225, -3.2762, -5.0825, -4.6449, -4.2682]], [[ -1.0650, -5.5802, -4.5319, -5.0182, -4.5514, -4.1788, -4.2169, -2.9731, -2.9560, -3.1857, -2.9380, -2.8962]], [[ -2.2689, -6.2272, -5.7679, -4.1566, -5.2313, -4.0656, -4.8571, -4.7791, -4.4125, -2.9366, -4.3225, -3.7280]]], [[[ 4.7274, 0.6865, -0.9804, -1.4257, -0.1961, -2.6393, 4.2332, 0.2491, -4.5439, -1.7760, -1.2808, 2.7406]], [[ -3.0007, -5.9886, -4.6318, -4.9293, -4.6401, -6.2806, -5.8365, -2.8964, -2.5320, -3.1823, -5.4031, -4.7035]], [[ -5.3142, -9.4737, -9.8399, -7.9619, -6.4222, -7.3868, -7.6273, -4.4643, -4.2735, -2.0107, -3.2187, -2.8266]], [[ -5.3195, -12.0684, -14.8799, -13.2681, -12.0657, -8.2106, -10.0747, -7.6219, -8.4951, -6.7847, -3.7788, -5.8204]], [[ 0.5984, -3.5256, -3.4500, -3.6878, -3.0500, -1.3403, -4.8819, -3.2640, -4.0774, -3.1858, -2.0669, -4.4600]], [[ -0.1514, -2.7395, -2.7935, -2.9190, -1.8794, -2.4269, -2.8142, -2.7698, -2.0245, -1.9844, -2.0848, -3.3463]], [[ -4.3958, -6.5847, -6.1009, -6.8655, -5.1745, -3.7674, -6.1993, -3.5672, -3.1087, -2.2053, -1.5374, -3.0664]], [[ -6.5411, -12.7469, -11.5546, -9.8816, -10.9406, -6.5692, -8.6510, -7.3646, -7.4499, -6.5812, -3.0175, -4.8480]], [[ -5.0754, -8.7818, -8.5225, -7.6943, -7.9847, -7.4220, -7.8946, -4.1192, -4.4588, -4.8224, -3.7245, -4.7301]], [[ -2.0178, -4.9997, -4.5852, -4.0619, -4.0758, -6.3522, -5.4877, -3.2206, -3.1174, -2.4184, -4.2697, -3.8573]], [[ -1.3340, -5.8744, -6.4926, -6.3511, -5.4940, -2.9609, -3.4847, -3.6462, -5.0076, -3.9870, -1.5444, -2.1801]], [[ -2.7077, -6.8452, -7.2066, -5.6602, -6.1108, -4.9742, -5.1636, -3.1252, -2.7871, -4.2056, -1.6948, -3.9698]]]]) attn_weights tensor([[[[-3.5888e+00, -9.5342e+00, -9.1733e+00, -7.0523e+00, -8.3222e+00, -7.9386e+00, -7.5110e+00, -6.1633e+00, -6.3091e+00, -4.6534e+00, -1.3176e+00, -4.7757e+00]], [[-2.9928e+00, -6.6680e+00, -5.3443e+00, -6.0216e+00, -7.3904e+00, -4.6586e+00, -4.4688e+00, -2.6137e+00, -2.2458e+00, -3.4339e+00, -3.8028e+00, -5.1694e+00]], [[-3.7210e-01, -2.4928e+00, -3.4200e+00, -3.3986e+00, -4.1138e+00, -4.8198e+00, -3.4417e+00, -2.5784e+00, -3.2755e+00, -3.5183e+00, -3.0626e+00, -3.9088e+00]], [[-2.1915e+00, -5.8632e+00, -4.8946e+00, -4.2896e+00, -5.0653e+00, -3.6558e+00, -3.9514e+00, -4.6273e+00, -3.3047e+00, -3.2095e+00, -2.5475e+00, -3.8541e+00]], [[ 1.3732e+00, -2.6487e+00, -1.9245e+00, -2.8160e+00, -1.8017e+00, -2.7572e+00, -3.7041e+00, -2.4119e+00, -1.8092e+00, -2.8121e+00, -1.2019e+00, -1.1813e+00]], [[-2.3576e+00, -7.3587e+00, -7.5490e+00, -6.8985e+00, -8.1200e+00, -6.9060e+00, -6.8024e+00, -5.4429e+00, -5.4663e+00, -5.1017e+00, -4.8602e+00, -4.6714e+00]], [[-2.0853e+00, -5.4196e+00, -6.2044e+00, -5.9299e+00, -5.6390e+00, -4.3419e+00, -4.6071e+00, -4.5622e+00, -5.0268e+00, -4.8519e+00, -3.8177e+00, -4.2418e+00]], [[ 4.0257e-01, -4.3794e+00, -3.5001e+00, -2.6943e+00, -2.1812e+00, -1.1675e+00, -2.4664e+00, -2.2176e+00, -2.9789e+00, -2.2330e+00, 2.1222e-01, 1.0996e+00]], [[ 1.4614e+00, -3.2563e+00, -3.0428e+00, -2.4014e+00, -2.4578e+00, -2.7344e+00, -1.8950e+00, -1.4909e+00, -2.4125e+00, -2.2346e+00, -1.9133e+00, -1.7240e+00]], [[-1.5312e+00, -3.9103e+00, -3.5804e+00, -3.5875e+00, -4.1123e+00, -3.3059e+00, -2.9417e+00, -3.3655e+00, -2.2470e+00, -2.3662e+00, -1.4917e+00, -3.1084e+00]], [[ 1.1601e+00, -2.7213e+00, -3.2715e+00, -3.6636e+00, -3.1531e+00, -2.9632e+00, -2.7297e+00, -2.6976e+00, -3.1283e+00, -4.0085e+00, -3.3953e+00, -2.7926e+00]], [[-6.8723e+00, -2.2067e+01, -2.6973e+01, -1.7035e+01, -2.1345e+01, -1.3806e+01, -1.2428e+01, -1.0794e+01, -1.6316e+01, -5.7901e+00, 1.2623e+01, 5.0329e+00]]], [[[-1.5195e+00, -8.7545e+00, -7.1717e+00, -6.7217e+00, -5.6865e+00, -7.9216e+00, -8.6505e+00, -6.5901e+00, -3.6485e+00, -3.7247e+00, -3.7258e+00, -4.7589e+00]], [[-2.2856e+00, -5.2832e+00, -5.3672e+00, -5.2656e+00, -5.8754e+00, -5.3156e+00, -4.8555e+00, -3.4805e+00, -1.6923e+00, -2.0660e+00, -2.2121e+00, -4.5291e+00]], [[-9.5828e-03, -1.6491e+00, -2.4648e+00, -3.0969e+00, -4.1058e+00, -5.1909e+00, -3.7990e+00, -3.3241e+00, -2.9337e+00, -3.2020e+00, -3.6644e+00, -3.4438e+00]], [[-2.0012e+00, -4.9253e+00, -2.9055e+00, -2.7565e+00, -3.0704e+00, -3.7088e+00, -3.5510e+00, -4.0152e+00, -1.6964e+00, -4.7907e-01, -7.6007e-01, -2.5871e+00]], [[ 1.5679e+00, -2.6094e+00, -9.3392e-01, -2.9893e-01, -2.4882e+00, -4.6987e+00, -4.0354e+00, -2.4687e+00, -2.9414e+00, -1.0673e+00, -5.1628e-01, -1.8114e+00]], [[-1.7153e+00, -6.3519e+00, -7.1872e+00, -6.7861e+00, -5.9530e+00, -7.9142e+00, -8.6887e+00, -5.5718e+00, -4.8888e+00, -4.6249e+00, -4.6492e+00, -5.3174e+00]], [[-1.8807e+00, -4.9628e+00, -5.3259e+00, -5.2844e+00, -3.9547e+00, -3.7252e+00, -3.8848e+00, -4.2708e+00, -3.4147e+00, -3.9427e+00, -4.1010e+00, -4.3026e+00]], [[ 7.9954e-01, -6.5743e+00, -4.4157e+00, -1.6296e+00, -5.0181e-01, -3.0804e+00, -4.6724e+00, -3.0476e+00, -1.8635e+00, -1.4920e+00, 4.0668e-01, 2.1021e+00]], [[ 1.7463e+00, -2.9769e+00, -2.4169e+00, -1.8796e+00, -1.5469e+00, -2.8638e+00, -1.2984e+00, -2.7514e+00, -1.6478e+00, -1.9712e+00, -1.7774e+00, -1.0385e+00]], [[-8.9292e-01, -1.9809e+00, -2.7550e+00, -1.8271e+00, -1.6927e+00, -4.0180e+00, -3.2384e+00, -2.1039e+00, -2.7761e+00, -1.2276e+00, -7.7860e-01, -2.0021e+00]], [[ 1.5016e+00, -2.5895e+00, -3.5411e+00, -3.6750e+00, -4.5098e+00, -3.9873e+00, -4.0168e+00, -2.9217e+00, -2.7151e+00, -3.9225e+00, -4.1255e+00, -4.7877e+00]], [[-4.8482e+00, -2.1817e+01, -1.5667e+01, -4.0575e+00, -8.1599e+00, -1.3141e+01, -2.2513e+01, -1.2196e+01, -7.8688e+00, -1.4323e+00, 8.8666e+00, -3.6020e+00]]], [[[-2.5038e+00, -8.4107e+00, -7.3407e+00, -6.1027e+00, -7.3441e+00, -9.3407e+00, -8.9707e+00, -5.7249e+00, -6.6062e+00, -4.0441e+00, -2.7395e+00, -3.9600e+00]], [[-2.4732e+00, -5.3766e+00, -5.4421e+00, -6.4982e+00, -5.1334e+00, -4.1028e+00, -7.0966e+00, -2.7518e+00, -9.3993e-01, -1.7854e+00, -2.0637e+00, -2.7930e+00]], [[-4.4201e-02, -1.8628e+00, -2.6819e+00, -3.5297e+00, -4.3389e+00, -4.5434e+00, -2.7555e+00, -2.8019e+00, -3.2070e+00, -3.4703e+00, -3.7959e+00, -3.7441e+00]], [[-2.2188e+00, -5.6320e+00, -3.8573e+00, -4.2243e+00, -5.7096e+00, -5.6793e+00, -5.4023e+00, -4.7737e+00, -3.8880e+00, -1.4920e+00, -2.8847e+00, -3.6549e+00]], [[ 1.4995e+00, -2.6191e+00, -8.0886e-01, -2.3445e+00, -2.6916e+00, -3.3479e+00, -4.8425e+00, -2.5213e+00, -2.6685e+00, -1.5881e+00, -1.2954e+00, -9.5570e-01]], [[-1.9142e+00, -6.6791e+00, -6.6407e+00, -7.1767e+00, -7.0727e+00, -9.0505e+00, -8.9697e+00, -5.5561e+00, -5.7099e+00, -3.6380e+00, -5.6122e+00, -7.6272e+00]], [[-2.0447e+00, -5.5925e+00, -6.4350e+00, -6.1314e+00, -5.1701e+00, -4.6312e+00, -4.0515e+00, -4.7942e+00, -4.3438e+00, -4.7696e+00, -4.8592e+00, -4.8918e+00]], [[ 9.7692e-01, -4.2492e+00, -2.7806e+00, -3.7808e-01, -1.3316e+00, -2.3774e+00, -3.9552e+00, -3.0089e+00, -2.5301e+00, -1.0246e+00, -4.4892e-01, 1.0478e+00]], [[ 1.6119e+00, -2.4463e+00, -2.3876e+00, -2.4632e+00, -1.7916e+00, -2.8834e+00, -1.9186e+00, -2.3220e+00, -1.2928e+00, -2.3993e+00, -3.2061e+00, -2.4274e+00]], [[-9.1871e-01, -3.9871e+00, -4.0824e+00, -4.7828e+00, -2.9605e+00, -2.5917e+00, -1.8018e+00, -2.9327e+00, -3.8608e+00, -2.4597e+00, -2.3580e+00, -3.5421e+00]], [[ 1.3939e+00, -2.0824e+00, -2.4803e+00, -2.9582e+00, -3.0353e+00, -3.0427e+00, -4.4665e+00, -2.2774e+00, -2.0730e+00, -2.7373e+00, -3.9688e+00, -3.1509e+00]], [[-7.0497e+00, -1.9667e+01, -8.9473e+00, -7.2919e+00, -1.2769e+01, -1.4446e+01, -1.6940e+01, -1.1703e+01, 1.1951e-01, 7.3991e+00, 1.4941e+01, 6.7215e+00]]], [[[-2.6212e+00, -8.0761e+00, -7.3274e+00, -5.7425e+00, -5.4805e+00, -8.0624e+00, -6.4853e+00, -5.1118e+00, -4.2953e+00, -8.0722e+00, -6.1174e+00, -4.7846e+00]], [[-2.0407e+00, -5.2789e+00, -5.4532e+00, -4.8318e+00, -6.0341e+00, -6.2526e+00, -5.9183e+00, -2.7527e+00, -3.6767e+00, -5.1796e+00, -4.5594e+00, -2.8692e+00]], [[-8.0594e-02, -2.1330e+00, -2.7643e+00, -2.3363e+00, -4.5814e+00, -4.5157e+00, -3.9220e+00, -2.3326e+00, -4.8848e+00, -5.2132e+00, -4.2619e+00, -2.6873e+00]], [[-2.2843e+00, -4.9944e+00, -5.0562e+00, -4.4577e+00, -4.2791e+00, -3.6085e+00, -3.6665e+00, -3.8486e+00, -3.6359e+00, -2.7454e+00, -2.5495e+00, -4.0369e+00]], [[ 1.2284e+00, -1.6381e+00, -2.6493e+00, -2.6471e+00, -2.4539e+00, -3.1870e+00, -3.1779e+00, -2.4206e+00, -2.8282e+00, -4.4143e+00, -3.5697e+00, -6.6849e-01]], [[-2.4449e+00, -8.2439e+00, -6.8411e+00, -7.3826e+00, -6.2724e+00, -5.4008e+00, -6.7977e+00, -6.6192e+00, -4.2188e+00, -4.5368e+00, -5.9355e+00, -4.4788e+00]], [[-2.0412e+00, -4.3386e+00, -5.3339e+00, -4.5857e+00, -4.0048e+00, -4.0977e+00, -4.5088e+00, -3.6157e+00, -3.6008e+00, -3.4736e+00, -4.0262e+00, -3.8535e+00]], [[-3.2085e-01, -4.8816e+00, -3.8985e+00, -3.0480e+00, -2.7607e+00, -2.7053e+00, -1.0433e+00, -6.5092e-02, -1.2239e+00, -1.5390e+00, -7.8036e-01, 1.2163e+00]], [[ 1.7306e+00, -1.2889e+00, -2.5294e+00, -1.8773e+00, -2.2048e+00, -2.2987e+00, -2.7404e+00, -2.0305e+00, -2.1031e+00, -2.8048e+00, -4.2206e+00, -5.4604e-01]], [[-1.1251e+00, -2.9614e+00, -3.3792e+00, -3.5234e+00, -2.8927e+00, -5.4712e+00, -3.7356e+00, -3.2151e+00, -3.7421e+00, -3.7355e+00, -4.1500e+00, -4.1973e+00]], [[ 1.1921e+00, -1.6534e+00, -2.6485e+00, -3.7162e+00, -3.1221e+00, -2.4801e+00, -4.0436e+00, -1.5099e+00, -2.8507e+00, -5.1867e+00, -5.3129e+00, -1.5832e+00]], [[-5.8819e+00, -3.0455e+01, -2.7978e+01, -2.9174e+01, -2.9216e+01, -8.6238e+00, 1.7946e+00, -9.1895e+00, -1.1023e+01, 1.5730e-01, 1.3496e+01, -2.3909e+00]]], [[[-3.3000e+00, -8.2894e+00, -8.1913e+00, -5.5610e+00, -5.1755e+00, -8.6416e+00, -6.9029e+00, -5.0539e+00, -4.6978e+00, -3.3650e+00, -6.4257e+00, -5.9420e+00]], [[-2.8207e+00, -7.4962e+00, -6.3645e+00, -5.9232e+00, -5.7527e+00, -6.8049e+00, -6.0874e+00, -3.5492e+00, -1.9019e+00, -2.7101e+00, -4.2701e+00, -4.4405e+00]], [[-2.1651e-01, -3.4977e+00, -4.0875e+00, -3.5670e+00, -3.8102e+00, -4.2925e+00, -4.3947e+00, -2.3158e+00, -3.0078e+00, -3.5890e+00, -4.1196e+00, -4.9568e+00]], [[-2.6277e+00, -4.9684e+00, -5.4179e+00, -5.1119e+00, -5.5021e+00, -4.0424e+00, -6.1247e+00, -3.9631e+00, -3.0137e+00, -3.1125e+00, -3.2432e+00, -3.9936e+00]], [[ 1.3955e+00, -2.2692e+00, -3.3452e+00, -4.1500e+00, -2.2155e+00, -7.4560e-01, -1.2768e+00, -1.4450e+00, -4.2828e+00, -1.2235e+00, -1.2271e+00, -4.7576e-01]], [[-3.0022e+00, -6.4357e+00, -6.2212e+00, -6.7500e+00, -6.7366e+00, -6.2837e+00, -6.6175e+00, -3.8529e+00, -3.6210e+00, -3.1535e+00, -3.0579e+00, -5.9106e+00]], [[-2.2123e+00, -4.6365e+00, -6.2028e+00, -5.5414e+00, -4.8141e+00, -3.5348e+00, -5.7712e+00, -3.9743e+00, -3.9797e+00, -3.7627e+00, -2.7882e+00, -4.9026e+00]], [[-1.8380e-01, -5.4744e+00, -4.4564e+00, -4.3215e+00, -3.9978e+00, -1.0679e+00, -7.5388e-01, -1.9658e+00, -2.5989e+00, -2.0985e+00, 1.6338e-01, 5.0985e-01]], [[ 2.0552e+00, -4.8736e+00, -5.1565e+00, -4.2485e+00, -3.4956e+00, -1.5004e+00, -2.5672e+00, -2.3193e+00, -1.8754e+00, -1.3692e+00, -2.2214e+00, -2.4681e+00]], [[-1.0017e+00, -5.1118e+00, -5.1959e+00, -5.3659e+00, -4.0631e+00, -5.8032e+00, -4.6957e+00, -4.3129e+00, -5.0602e+00, -2.5826e+00, -3.5524e+00, -4.3017e+00]], [[ 1.1593e+00, -4.5623e+00, -3.7211e+00, -4.1883e+00, -2.9097e+00, -3.9137e+00, -2.3940e+00, -3.7301e+00, -3.5715e+00, -2.7361e+00, -3.8406e+00, -3.3808e+00]], [[-8.1663e-02, -2.3638e+01, -2.9392e+01, -2.9972e+01, -3.1763e+01, 1.4579e+00, -2.2954e-02, -1.0259e+01, -1.0070e+01, -1.5620e+01, 1.2901e+01, 7.5867e+00]]]]) attn_weights tensor([[[[ 1.8755e+00, -5.5490e+00, -5.7244e+00, -4.0127e+00, -5.0104e+00, -1.5151e+00, -1.6264e+00, -5.9643e-01, -3.2361e+00, -3.3463e+00, -2.4787e+00, -1.3835e+00]], [[ 4.3612e+00, -1.1958e+01, -9.5760e+00, -6.2461e+00, -7.7155e+00, 9.1997e-01, -7.1215e+00, -6.7360e+00, -7.1879e+00, -6.6726e+00, -5.9173e+00, -2.2303e+00]], [[ 3.6211e-01, -3.9194e+00, -3.6740e+00, -4.9288e+00, -5.3845e+00, -3.5267e+00, -3.3383e+00, -4.1869e+00, -2.3624e+00, -3.9060e+00, -1.7812e+00, -4.1021e+00]], [[-2.5170e-01, -1.4155e+00, -1.9216e+00, -1.8462e+00, -2.5575e+00, -2.5087e+00, -1.9789e+00, -1.0600e+00, -2.3629e-01, -9.8960e-01, -1.7567e-01, -2.0787e+00]], [[-2.7159e-01, -5.4611e+00, -5.4284e+00, -5.1454e+00, -6.1076e+00, -2.3996e+00, -2.0005e+00, -2.2905e+00, -2.7063e+00, -3.0120e+00, -9.7890e-01, -2.3636e+00]], [[ 1.8509e+00, -7.1136e+00, -4.4723e+00, -3.3616e+00, -5.8000e+00, -8.0475e-01, -3.3283e+00, -1.7757e+00, -1.6656e+00, -2.8664e+00, -4.8374e+00, -3.4445e+00]], [[ 2.0352e+00, -6.6956e+00, -7.6403e+00, -6.6953e+00, -7.5832e+00, -2.7659e+00, -4.3870e+00, -3.9790e+00, -5.2972e+00, -5.9094e+00, -9.2296e-01, -3.0705e+00]], [[ 8.1486e-01, -4.8447e+00, -5.2070e+00, -4.8169e+00, -5.2747e+00, -3.5865e+00, -1.4509e+00, -3.5880e+00, -3.4645e+00, -3.3462e+00, -7.1867e-01, -2.3703e+00]], [[ 6.0055e-01, -6.0479e+00, -5.7063e+00, -5.0390e+00, -7.0720e+00, -1.3575e+00, -2.0599e+00, -6.3539e-01, -2.8817e+00, -3.6976e+00, -4.4678e+00, -3.9194e+00]], [[ 9.6996e-01, -3.1147e+00, -3.9479e+00, -3.2132e+00, -2.1547e+00, -1.6575e+00, -1.3000e+00, -1.5399e+00, -3.5505e+00, -3.7290e+00, -3.2217e+00, -2.7964e+00]], [[ 2.1342e+00, -3.6217e-01, -5.5480e-01, -1.0433e+00, -6.7718e-01, 2.4665e-01, 1.5875e+00, 3.4073e-01, -3.2600e-01, -1.5462e+00, 4.1342e-02, 3.4946e-02]], [[ 1.0337e+00, -3.5281e+00, -3.7614e+00, -3.4442e+00, -2.0234e+00, -3.4482e+00, -3.8249e+00, -2.8652e+00, -2.6870e+00, -2.5189e+00, -2.5820e+00, -2.4159e-01]]], [[[ 2.0918e+00, -4.0964e+00, -5.1364e+00, -5.3944e+00, -2.1413e+00, -5.2087e-01, -1.3952e+00, -1.0269e+00, -1.0448e+00, -2.8301e+00, -5.2204e+00, -2.9029e+00]], [[ 4.5362e+00, -1.1625e+01, -1.1148e+01, -9.4703e+00, -4.4018e+00, -2.7523e+00, -1.0275e+01, -8.0998e+00, -7.0898e+00, -7.0145e+00, -7.6630e+00, -4.9688e+00]], [[ 2.7894e-01, -2.7428e+00, -2.4408e+00, -2.2670e+00, -3.6532e+00, -3.3858e+00, -3.9992e+00, -4.1608e+00, -3.2031e+00, -2.3807e+00, -2.5288e+00, -3.0063e+00]], [[ 1.4914e-01, -8.7890e-01, -1.1123e+00, -1.1623e+00, -1.8092e+00, -3.3533e+00, -2.4203e+00, -1.8225e+00, -3.4528e-01, -8.3066e-01, -1.0541e+00, -2.4756e+00]], [[ 1.5426e-01, -4.4339e+00, -4.9623e+00, -4.7315e+00, -3.4427e+00, -2.6579e+00, -2.1111e+00, -3.3634e+00, -1.7296e+00, -2.2681e+00, -2.0272e+00, -1.9462e+00]], [[ 2.0530e+00, -9.0757e+00, -6.5460e+00, -5.3097e+00, -3.5468e+00, -2.9822e+00, -7.2256e+00, -3.2003e+00, -2.1138e+00, -3.0055e+00, -4.3656e+00, -4.2124e+00]], [[ 1.2316e+00, -4.7627e+00, -3.6036e+00, -3.2421e+00, -2.3834e+00, -3.7401e+00, -5.3776e+00, -4.1305e+00, -1.7505e+00, -2.5539e-01, -9.9922e-01, -2.9935e+00]], [[ 1.6340e+00, -4.6428e+00, -5.2872e+00, -4.7892e+00, -3.5846e+00, -2.9991e+00, -1.7458e+00, -4.3797e+00, -3.4197e+00, -3.0968e+00, -2.9033e+00, -1.1051e+00]], [[ 7.2804e-01, -5.5486e+00, -5.3132e+00, -4.0335e+00, -2.7543e+00, -2.1835e+00, -4.2959e+00, -2.5765e+00, -2.8527e+00, -3.2575e+00, -3.3282e+00, -3.8933e+00]], [[ 8.8119e-01, -2.9201e+00, -2.5326e+00, -3.0948e+00, -2.2979e+00, -3.2940e+00, -2.3053e+00, -2.8852e+00, -3.7777e+00, -2.9997e+00, -3.8100e+00, -3.8499e+00]], [[ 1.7575e+00, -8.3563e-01, 6.0413e-01, 3.5518e-01, 4.3843e-01, -7.7263e-01, 2.6079e+00, 1.1747e+00, -9.4007e-01, 4.0629e-01, -3.3596e-01, 1.0935e+00]], [[ 1.2065e+00, -3.9113e+00, -2.8444e+00, -1.5141e+00, -1.6679e+00, -4.0479e+00, -4.3090e+00, -2.8267e+00, -2.2659e+00, -1.8585e+00, -6.9035e-01, -1.3863e+00]]], [[[ 2.3129e+00, -4.8236e+00, -4.7047e+00, -3.7055e+00, -3.2045e-01, -1.4741e+00, -3.3461e+00, -3.0898e+00, -3.3363e+00, -2.6731e+00, -2.4411e+00, -2.1854e+00]], [[ 4.8596e+00, -7.1667e+00, -7.0944e+00, -3.8581e+00, -4.0111e+00, -6.5079e+00, -1.4158e+01, -1.4312e+01, -1.0194e+01, -1.0220e+01, -6.2636e+00, -2.1738e+00]], [[ 2.8900e-01, -3.0783e+00, -3.0629e+00, -4.0975e+00, -3.4640e+00, -3.0542e+00, -3.2194e+00, -3.1682e+00, -2.7378e+00, -1.4973e+00, -1.3851e+00, -2.6438e+00]], [[-1.9592e-01, -1.2383e+00, -1.4565e+00, -1.9685e+00, -1.8653e+00, -2.0878e+00, -2.4943e+00, -1.7576e+00, -4.2098e-01, -5.7035e-01, -1.7201e+00, -2.9656e+00]], [[-2.3624e-01, -4.6163e+00, -5.8538e+00, -5.2385e+00, -4.4071e+00, -3.2882e+00, -2.5933e+00, -3.0415e+00, -1.1540e+00, -2.6410e+00, -2.4174e+00, -2.8104e+00]], [[ 1.7814e+00, -3.4597e+00, -2.3380e+00, -2.6516e+00, -1.7815e+00, -1.9329e+00, -5.2440e+00, -4.6166e+00, -2.4941e+00, -4.6942e+00, -4.3801e+00, -3.4536e+00]], [[ 7.8427e-01, -4.2324e+00, -2.2289e+00, -3.0948e+00, -3.5236e+00, -3.2127e+00, -5.5190e+00, -3.7145e+00, -1.9630e+00, -6.2628e-02, -3.0997e-01, -1.6996e+00]], [[ 9.9147e-01, -3.3483e+00, -4.0910e+00, -4.4629e+00, -3.4006e+00, -3.8961e+00, -1.1709e+00, -2.8811e+00, -9.6903e-01, -1.9870e+00, -2.1714e+00, -2.7717e+00]], [[ 8.3041e-01, -3.0654e+00, -4.3520e+00, -3.6134e+00, -4.6440e-01, -2.6249e+00, -4.0068e+00, -4.0665e+00, -3.8131e+00, -3.6747e+00, -3.7823e+00, -3.8876e+00]], [[ 9.6743e-01, -2.8298e+00, -3.2322e+00, -3.3958e+00, -2.8632e+00, -2.3693e+00, -2.5186e+00, -2.4197e+00, -2.9192e+00, -2.9979e+00, -4.2769e+00, -4.0465e+00]], [[ 1.7782e+00, -1.7830e+00, -1.5749e+00, -1.6462e+00, -9.3002e-01, -1.6099e+00, 2.5211e-01, 3.8090e-01, -1.9736e+00, -1.7011e+00, -2.1383e+00, -2.0239e+00]], [[ 9.8320e-01, -4.1574e+00, -3.9284e+00, -2.8303e+00, -2.8683e+00, -3.9842e+00, -4.7875e+00, -3.7584e+00, -3.1016e+00, -2.8067e+00, -2.5611e+00, -9.7730e-02]]], [[[ 2.7418e+00, -2.7642e+00, -3.0018e+00, -2.4275e+00, -3.5808e+00, -3.2329e+00, -5.5212e+00, -3.4421e+00, -1.4271e+00, -2.4326e+00, -4.4520e+00, -3.0284e+00]], [[ 4.1661e+00, -1.0896e+01, -7.7590e+00, -8.6499e+00, -9.1533e+00, -7.1993e+00, -1.0941e+01, -6.1694e+00, -1.8438e+00, -4.7027e+00, -9.2152e+00, -2.6556e+00]], [[-4.3997e-02, -1.5812e+00, -3.1508e+00, -2.4297e+00, -1.7020e+00, -2.1418e+00, -3.2363e+00, -2.5325e+00, -2.0329e+00, -2.7169e+00, -1.8657e+00, -2.3884e+00]], [[ 1.0095e-01, -2.5321e-01, -1.6596e+00, -1.4148e+00, -2.9095e+00, -2.3647e+00, -2.8078e+00, -2.0714e+00, -2.9905e+00, -3.2029e+00, -2.4694e+00, -1.8551e+00]], [[-3.2299e-01, -3.7177e+00, -3.6296e+00, -3.3698e+00, -2.5803e+00, -2.8489e+00, -2.3176e+00, -1.7800e+00, -1.1106e+00, -2.3966e+00, -1.9571e+00, -1.7602e+00]], [[ 2.3078e+00, -6.2942e+00, -2.1302e+00, -4.2269e+00, -4.0509e+00, -3.6692e+00, -6.8288e+00, -5.6225e+00, -1.4904e+00, -3.1812e+00, -6.4552e+00, -2.8588e+00]], [[ 1.5379e+00, -9.4258e+00, -9.1562e+00, -8.3332e+00, -7.8999e+00, -4.3574e+00, -2.8155e+00, -3.4378e+00, -4.1981e+00, -2.3733e+00, -1.1184e+00, -3.5201e+00]], [[ 9.2360e-01, -3.3217e+00, -4.5142e+00, -5.3197e+00, -5.0739e+00, -4.1098e+00, -2.7118e+00, -4.1303e+00, -4.6109e+00, -3.8748e+00, -3.4149e+00, -3.0089e+00]], [[ 9.3384e-01, -4.5671e+00, -3.7547e+00, -4.7528e+00, -4.7807e+00, -5.3715e+00, -7.1560e+00, -5.2190e+00, -1.4116e+00, -3.2439e+00, -5.2630e+00, -2.5316e+00]], [[ 1.1589e+00, -2.9577e+00, -3.4671e+00, -2.7540e+00, -3.3868e+00, -2.8638e+00, -3.3484e+00, -1.5675e+00, -2.0548e+00, -3.4840e+00, -3.9958e+00, -2.7081e+00]], [[ 2.2863e+00, -1.9843e+00, -2.1868e+00, -1.3689e+00, -2.1169e+00, -1.2155e+00, -1.6379e-02, 2.4369e-01, -1.5885e+00, -8.0150e-01, -1.2017e+00, -7.9628e-01]], [[ 1.4007e+00, -2.5689e+00, -2.0735e+00, -1.5573e+00, -2.2674e+00, -2.8253e+00, -3.6703e+00, -9.3865e-01, -1.6080e+00, -3.0148e+00, -3.0110e+00, -1.1388e-01]]], [[[ 2.0047e+00, -8.7834e+00, -9.1515e+00, -8.2662e+00, -8.2101e+00, -5.6863e+00, -3.6109e+00, 1.4478e-01, -2.0643e+00, -4.4809e+00, -2.8357e+00, -2.1601e+00]], [[ 4.4415e+00, -1.9951e+01, -1.8176e+01, -1.5209e+01, -1.4448e+01, -9.2867e+00, -7.5681e+00, 2.7216e+00, -2.1305e+00, -7.2618e+00, -4.2176e+00, -4.8061e-01]], [[-3.2781e-01, -3.8182e+00, -5.6443e+00, -4.7516e+00, -2.8176e+00, -2.2666e+00, -2.9567e+00, -2.9398e+00, -3.2772e+00, -1.1070e+00, -4.3873e-01, -1.7030e+00]], [[-2.4819e-01, -1.6227e+00, -2.4757e+00, -1.8350e+00, -2.0691e+00, -1.9817e+00, -2.6995e+00, -1.4416e+00, -4.6580e-01, -7.9510e-01, -1.8474e+00, -2.3827e+00]], [[-5.2276e-01, -4.0027e+00, -4.3553e+00, -4.3991e+00, -4.1041e+00, -4.2708e+00, -3.6525e+00, -2.0386e+00, -4.1957e-01, -7.5633e-01, -1.8019e+00, -2.1220e+00]], [[ 2.1389e+00, -1.2428e+01, -9.5898e+00, -8.1330e+00, -7.1455e+00, -4.0179e+00, -4.9808e+00, 2.8041e+00, 1.1542e-01, -4.0583e+00, -1.1875e+00, -2.6858e+00]], [[ 1.1164e+00, -8.9025e+00, -9.3536e+00, -8.3016e+00, -8.3767e+00, -1.8836e+00, -2.3727e+00, -4.2358e+00, -3.8711e+00, -3.5664e+00, 2.8796e+00, -4.1497e-01]], [[ 1.0748e+00, -4.6265e+00, -5.1179e+00, -6.1415e+00, -3.8939e+00, -5.7004e+00, -3.1286e+00, -3.6073e+00, -3.6348e+00, -2.2279e+00, -3.6694e+00, -2.2216e+00]], [[ 5.9117e-01, -9.1318e+00, -8.3681e+00, -7.1002e+00, -6.8911e+00, -5.1412e+00, -4.6678e+00, 4.9648e-01, -7.0061e-01, -3.2646e+00, -2.9776e+00, -2.4881e+00]], [[ 6.8355e-01, -3.6125e+00, -4.5856e+00, -3.8510e+00, -3.1644e+00, -1.6054e+00, -2.7793e+00, -1.2931e+00, -2.3087e+00, -3.3305e+00, -3.2434e+00, -3.2990e+00]], [[ 2.5875e+00, -1.8225e+00, -1.8406e+00, -1.0419e+00, -8.9577e-01, -1.3566e+00, 5.9352e-01, 1.3997e-01, -1.2649e+00, -1.4967e+00, 4.5686e-02, 5.8782e-01]], [[ 7.5954e-01, -4.0374e+00, -4.2744e+00, -4.2182e+00, -3.3429e+00, -2.0838e+00, -2.6178e+00, -2.3761e+00, -3.8948e+00, -2.8159e+00, -2.2073e+00, -1.9865e+00]]]]) attn_weights tensor([[[[-1.8702e+00, -3.6965e+00, -3.1296e+00, -3.5424e+00, -4.4712e+00, -3.6326e+00, -3.3646e+00, -3.1973e+00, -1.1612e+00, -2.1191e+00, -9.6775e-01, -3.1488e+00]], [[ 2.2509e-01, -5.1425e+00, -5.9483e+00, -6.1559e+00, -5.0723e+00, -2.3148e+00, -1.5360e+00, -2.7785e+00, -4.5325e+00, -5.9001e+00, -2.2149e+00, -2.1805e+00]], [[ 2.2865e-01, -3.0104e+00, -3.3854e+00, -3.5834e+00, -3.5245e+00, -4.0505e+00, -3.5785e+00, -2.3687e+00, -2.6675e+00, -3.4929e+00, -2.8803e+00, -3.0313e+00]], [[ 1.0951e-01, -3.1254e+00, -4.7477e+00, -4.4522e+00, -3.7658e+00, -3.2774e+00, -2.8002e+00, -2.6324e+00, -4.0400e+00, -4.3403e+00, -3.1272e+00, -2.9745e+00]], [[ 1.0227e+00, -1.4097e+00, -1.8490e+00, -1.7913e+00, -2.0291e+00, -1.6026e+00, -9.5376e-01, -1.2457e+00, -2.5082e+00, -2.5638e+00, -1.4922e+00, -1.5818e+00]], [[-7.9962e-01, -4.2000e+00, -4.8897e+00, -4.4213e+00, -5.4735e+00, -4.6124e+00, -4.5319e+00, -3.8813e+00, -3.0873e+00, -2.8757e+00, -3.3530e+00, -3.9332e+00]], [[ 2.1877e+00, -3.8064e+00, -3.1385e+00, -3.6680e+00, -1.7831e+00, -2.4518e+00, -2.4070e+00, -1.7920e+00, -1.9454e+00, -2.8072e+00, -1.5592e+00, -9.6514e-02]], [[-4.6069e-01, -4.2689e+00, -5.2899e+00, -4.9455e+00, -5.0321e+00, -2.6806e+00, -2.2900e+00, -3.4838e+00, -5.0980e+00, -4.2416e+00, -2.6420e+00, -3.5931e+00]], [[-1.5853e+00, -6.2043e+00, -5.4137e+00, -6.2202e+00, -7.5128e+00, -5.2115e+00, -5.5620e+00, -4.9651e+00, -3.0123e+00, -3.6430e+00, -2.0493e+00, -5.1066e+00]], [[ 4.2741e+00, -7.3738e+00, -5.2034e+00, -2.2905e+00, -3.8084e+00, 8.5190e-01, -6.7790e+00, -3.9686e+00, -4.2618e+00, -2.3501e+00, -3.2248e+00, -1.4742e+00]], [[ 2.8267e+00, -4.5941e+00, -3.6734e+00, -3.5930e+00, -2.2943e+00, -1.3343e+00, -6.2008e-01, -1.0057e+00, -1.5130e+00, -2.0351e+00, -3.1087e-01, -1.4678e+00]], [[-9.7770e-01, -4.2449e+00, -3.6266e+00, -3.7580e+00, -5.0319e+00, -3.6483e+00, -3.3451e+00, -2.2370e+00, -1.2961e+00, -1.5175e+00, -8.9444e-01, -3.2814e+00]]], [[[-8.2332e-01, -3.4873e+00, -2.8915e+00, -2.6196e+00, -4.1725e+00, -4.6900e+00, -4.5067e+00, -4.5299e+00, -3.5168e+00, -2.0002e+00, -2.0468e+00, -3.5246e+00]], [[ 4.2103e-01, -3.3886e+00, -4.3439e+00, -4.4833e+00, -3.3606e+00, -4.1787e+00, -3.8594e+00, -4.9255e+00, -4.1681e+00, -3.7257e+00, -4.2863e+00, -2.4967e+00]], [[ 4.0954e-01, -2.8254e+00, -2.4617e+00, -2.6380e+00, -3.1655e+00, -3.9136e+00, -3.5322e+00, -2.6254e+00, -2.5460e+00, -2.2915e+00, -2.9207e+00, -3.5620e+00]], [[ 1.5277e-01, -1.6628e+00, -3.1481e+00, -2.6887e+00, -1.7467e+00, -1.7903e+00, -1.3600e+00, -1.0667e+00, -1.3409e+00, -2.7845e+00, -3.0223e+00, -2.7725e+00]], [[ 1.3064e+00, -3.0943e-01, -1.1209e+00, -7.9179e-01, -1.0853e+00, -3.3733e+00, -1.0617e+00, -1.1610e+00, -2.0991e+00, -1.9707e+00, -1.9831e+00, -8.9506e-01]], [[-6.4675e-01, -3.7493e+00, -4.1752e+00, -3.8364e+00, -4.0451e+00, -4.7297e+00, -4.6926e+00, -4.0722e+00, -3.1872e+00, -2.7613e+00, -2.4806e+00, -2.9009e+00]], [[ 2.2652e+00, -3.2070e+00, -1.3364e+00, -1.5043e+00, -2.1019e+00, -3.6297e+00, -4.3762e+00, -2.8410e+00, -1.7068e+00, -7.1567e-01, -1.1182e+00, -2.5892e-01]], [[-7.1009e-01, -3.2323e+00, -4.0355e+00, -3.7451e+00, -3.1363e+00, -1.9419e+00, -1.2176e+00, -1.7498e+00, -2.6751e+00, -3.4513e+00, -3.2899e+00, -2.5298e+00]], [[-1.1155e+00, -5.2321e+00, -4.1650e+00, -4.5906e+00, -6.3954e+00, -5.4660e+00, -5.5600e+00, -5.1502e+00, -3.0784e+00, -2.1291e+00, -2.6583e+00, -4.5072e+00]], [[ 5.2563e+00, -7.3681e+00, -8.1033e+00, -6.4861e+00, -3.2049e+00, -2.0959e+00, -1.1248e+01, -6.2256e+00, -6.4362e+00, -5.2993e+00, -5.5787e+00, -4.3557e+00]], [[ 3.0442e+00, -3.3642e+00, -2.7575e+00, -2.8223e+00, -1.5905e+00, -1.7475e+00, -1.0216e+00, -1.0081e+00, 5.2519e-03, -2.6572e-01, -6.7485e-01, -2.5442e-01]], [[ 1.0939e-01, -2.5011e+00, -3.4191e+00, -4.5683e+00, -4.8145e+00, -4.7562e+00, -3.7556e+00, -3.8787e+00, -1.4736e+00, -1.3279e+00, -2.0064e+00, -1.3939e+00]]], [[[-1.0500e+00, -3.7364e+00, -2.4099e+00, -3.3867e+00, -4.3989e+00, -5.1263e+00, -4.4236e+00, -5.1933e+00, -3.0705e+00, -9.1388e-01, -1.8589e+00, -3.5402e+00]], [[ 3.6535e-02, -3.9653e+00, -4.8273e+00, -3.9751e+00, -2.5210e+00, -3.2824e+00, -3.0962e+00, -3.5693e+00, -5.0072e+00, -3.6230e+00, -5.5100e+00, -6.0104e+00]], [[ 1.9567e-01, -3.3592e+00, -3.0836e+00, -3.5034e+00, -3.3846e+00, -3.6135e+00, -3.7247e+00, -2.7417e+00, -3.2524e+00, -3.1820e+00, -4.3407e+00, -3.7884e+00]], [[ 1.5661e-02, -2.8043e+00, -3.8678e+00, -3.1907e+00, -2.1186e+00, -2.2838e+00, -1.8951e+00, -1.6099e+00, -9.1667e-01, -2.2186e+00, -3.0655e+00, -3.6465e+00]], [[ 1.1547e+00, -1.6511e+00, -1.9272e+00, -2.3184e+00, -1.8554e+00, -2.8538e+00, -9.7201e-01, -1.2910e+00, -1.4770e+00, -2.0577e+00, -1.6712e+00, -1.4175e+00]], [[-6.4019e-01, -3.5332e+00, -4.6796e+00, -4.3781e+00, -4.6889e+00, -5.2140e+00, -4.1790e+00, -4.7005e+00, -2.9715e+00, -3.4891e+00, -3.7014e+00, -3.6236e+00]], [[ 2.1480e+00, -3.0591e+00, -1.4131e+00, -1.4032e+00, -1.8936e+00, -3.3544e+00, -4.1077e+00, -2.4895e+00, -1.5650e+00, -3.3358e-01, -1.4323e+00, 1.9872e-01]], [[-7.9797e-01, -3.5157e+00, -4.9956e+00, -4.4292e+00, -3.5961e+00, -2.5552e+00, -1.3439e+00, -2.2075e+00, -4.0506e+00, -4.2248e+00, -4.0143e+00, -4.5577e+00]], [[-1.6494e+00, -5.0296e+00, -5.0794e+00, -6.5529e+00, -5.4463e+00, -5.2564e+00, -5.1766e+00, -3.8014e+00, -3.0290e+00, -3.1664e+00, -2.6349e+00, -5.0137e+00]], [[ 4.6082e+00, -5.3636e+00, -4.8940e+00, -1.5891e+00, -1.6433e+00, -2.2905e+00, -7.7513e+00, -5.8916e+00, -6.2753e+00, -6.4096e+00, -3.0790e+00, -1.0970e+00]], [[ 3.0086e+00, -2.8827e+00, -2.5047e+00, -2.8115e+00, -2.2512e+00, -2.5761e+00, -1.6627e+00, -1.9665e+00, -1.0023e+00, -6.1710e-01, -9.0301e-01, -1.4982e+00]], [[-5.4871e-01, -2.4859e+00, -3.1479e+00, -4.7224e+00, -4.0176e+00, -4.0809e+00, -3.3567e+00, -3.4927e+00, -8.6572e-01, -1.7374e+00, -2.1155e+00, -3.7661e+00]]], [[[-4.0312e-01, -3.4905e+00, -3.6106e+00, -3.0728e+00, -3.2405e+00, -3.3090e+00, -2.8334e+00, -3.5543e+00, -4.1609e+00, -3.8265e+00, -3.7488e+00, -4.0761e+00]], [[-3.0361e-02, -2.9527e+00, -4.1640e+00, -3.4253e+00, -3.3667e+00, -4.9996e+00, -4.4229e+00, -3.2695e+00, -1.9621e+00, -3.4481e+00, -3.9364e+00, -3.3640e+00]], [[ 3.9095e-01, -2.6620e+00, -2.0484e+00, -2.5813e+00, -3.5661e+00, -3.1371e+00, -3.6221e+00, -2.8488e+00, -3.1871e+00, -3.7804e+00, -3.6885e+00, -2.5852e+00]], [[-1.1926e-01, -1.0707e+00, -2.1143e+00, -1.8803e+00, -1.8355e+00, -2.8139e+00, -2.6810e+00, -1.8937e+00, -1.7392e+00, -2.8178e+00, -3.0355e+00, -1.7878e+00]], [[ 1.5064e+00, -3.8584e-01, -7.9175e-01, -1.4109e+00, -2.0997e+00, -2.3169e+00, -1.9055e+00, -1.8428e+00, -2.9599e+00, -2.9717e+00, -2.9339e+00, -2.1583e-01]], [[-5.0207e-01, -3.1670e+00, -4.0620e+00, -4.0059e+00, -4.5414e+00, -4.7029e+00, -4.1177e+00, -3.8534e+00, -3.8069e+00, -3.9211e+00, -3.6127e+00, -2.7848e+00]], [[ 2.0368e+00, -1.9295e+00, -2.0335e+00, -2.8523e+00, -2.9336e+00, -2.9474e+00, -3.1599e+00, -1.6234e+00, -2.4253e+00, -3.6265e+00, -3.2030e+00, -1.5121e-01]], [[-2.5391e-01, -3.3168e+00, -3.6197e+00, -3.3026e+00, -3.0416e+00, -2.4165e+00, -1.5424e+00, -2.5415e+00, -2.2272e+00, -8.5605e-01, -1.3313e+00, -3.1979e+00]], [[-1.2091e+00, -4.2193e+00, -4.7507e+00, -5.1710e+00, -4.7221e+00, -4.4577e+00, -3.3902e+00, -2.6601e+00, -2.8845e+00, -3.1047e+00, -1.8263e+00, -4.1530e+00]], [[ 5.1000e+00, -4.8882e+00, -1.5279e+00, -4.8723e+00, -4.3285e+00, -1.9643e+00, -8.5408e+00, -2.9171e+00, 1.5043e-01, -2.3874e+00, -9.3842e+00, -1.9139e+00]], [[ 3.1947e+00, -1.2974e+00, -1.4215e+00, -1.9140e+00, -1.7671e+00, -1.5817e+00, -1.7672e+00, -2.8814e+00, -1.3947e+00, -2.8121e+00, -1.3610e+00, -1.1900e+00]], [[ 1.3311e-02, -2.2344e+00, -3.9900e+00, -4.1785e+00, -4.8748e+00, -5.1088e+00, -3.5548e+00, -4.0367e+00, -4.3276e+00, -4.6007e+00, -3.7534e+00, -3.3574e+00]]], [[[-1.7008e+00, -4.7490e+00, -3.8664e+00, -3.0882e+00, -1.9146e+00, -4.0636e+00, -4.7872e+00, -3.5282e+00, -1.3762e+00, -1.1443e+00, -3.5458e+00, -4.9693e+00]], [[-1.2078e-01, -4.5247e+00, -3.4190e+00, -4.0993e+00, -3.6099e+00, -3.4443e+00, -2.9364e+00, -1.3230e+00, -1.9349e+00, -3.5914e+00, -3.3249e+00, -3.2883e+00]], [[ 3.3545e-01, -2.9959e+00, -2.9100e+00, -3.4303e+00, -3.2842e+00, -3.3827e+00, -2.8996e+00, -2.4007e+00, -3.0802e+00, -3.4876e+00, -3.0411e+00, -3.3520e+00]], [[ 3.2275e-01, -4.0440e+00, -5.2797e+00, -4.6853e+00, -4.0171e+00, -4.1239e+00, -4.1366e+00, -3.6881e+00, -2.5524e+00, -3.2817e+00, -3.4656e+00, -4.9855e+00]], [[ 1.8015e+00, -2.2269e+00, -2.6210e+00, -3.3066e+00, -2.9158e+00, -1.5847e+00, -9.3665e-01, -1.4020e+00, -2.3021e+00, -2.3083e+00, -1.4993e+00, -1.9270e+00]], [[-5.7460e-01, -4.2574e+00, -4.3596e+00, -5.0364e+00, -4.3669e+00, -3.9027e+00, -4.4268e+00, -3.5376e+00, -1.1591e+00, -2.7429e+00, -2.7004e+00, -2.9683e+00]], [[ 1.9927e+00, -3.3219e+00, -3.9239e+00, -4.1341e+00, -2.9290e+00, -1.4392e+00, -5.4384e-01, -1.1076e+00, -2.8523e+00, -1.9213e+00, -6.2833e-01, -3.0299e-01]], [[-5.3050e-01, -3.7082e+00, -4.0496e+00, -3.9979e+00, -4.2726e+00, -2.3177e+00, -2.5132e+00, -3.4703e+00, -3.9143e+00, -3.9464e+00, 1.4296e-02, -1.9574e+00]], [[-1.3531e+00, -5.5792e+00, -6.2507e+00, -7.0464e+00, -4.4247e+00, -3.4634e+00, -4.6366e+00, -3.7846e+00, -2.8935e+00, -2.0010e+00, 4.2087e-01, -2.2278e+00]], [[ 4.5372e+00, -1.5210e+01, -9.3464e+00, -9.1090e+00, -7.8721e+00, -3.0548e+00, -3.7521e+00, 2.4878e+00, 1.8386e+00, -2.3282e+00, -1.4295e+00, -8.2199e-01]], [[ 2.9228e+00, -3.8177e+00, -3.6273e+00, -4.0237e+00, -3.5476e+00, -2.7549e+00, -1.3328e+00, -1.6926e+00, -1.4821e+00, -2.1078e+00, -1.6808e+00, -5.3036e-01]], [[-7.0768e-01, -3.5226e+00, -4.0339e+00, -3.1709e+00, -2.9404e+00, -5.0259e+00, -4.0548e+00, -2.7102e+00, -6.4221e-01, -1.2117e+00, -2.8512e+00, -3.9970e+00]]]]) attn_weights tensor([[[[-7.2279e-01, -7.4013e+00, -7.2552e+00, -6.7517e+00, -7.0432e+00, -5.8780e+00, -5.5824e+00, -5.3234e+00, -5.0832e+00, -4.1748e+00, -1.5827e+00, -4.4208e+00]], [[ 3.3262e+00, -1.9751e+00, -1.5722e+00, -1.7912e+00, -2.8022e+00, -7.6208e-01, 5.4271e-01, -6.7802e-01, -7.8508e-01, -9.8014e-01, -1.0899e+00, -9.9953e-01]], [[ 6.4199e+00, -3.6641e+00, -4.2857e+00, -1.5220e+00, -2.2542e+00, 2.1446e+00, -2.6949e+00, -2.8794e+00, -4.7671e+00, -2.2985e+00, -6.1292e-01, 6.9863e-01]], [[ 1.9894e-01, -4.3789e+00, -4.7956e+00, -4.8232e+00, -4.8588e+00, -2.6474e+00, -2.4188e+00, -2.2976e+00, -3.1654e+00, -3.4817e+00, -2.4573e+00, -2.9751e+00]], [[ 1.0206e+00, -4.8974e+00, -4.0932e+00, -4.0257e+00, -5.9894e+00, -4.4765e+00, -3.5122e+00, -4.0639e+00, -3.4356e+00, -3.8467e+00, -2.0113e+00, -3.5538e+00]], [[ 6.4564e-01, -2.0674e+00, -1.9094e+00, -1.3677e+00, -2.9603e+00, -3.3864e+00, -1.7196e+00, -1.2721e+00, -2.8080e+00, -2.5745e+00, -1.6191e+00, -2.8962e+00]], [[ 1.3929e+00, -2.6763e+00, -3.3238e+00, -3.2379e+00, -3.2820e+00, -1.8197e+00, -1.1117e+00, -1.7392e+00, -2.7302e+00, -2.4009e+00, -1.9547e+00, -1.9248e+00]], [[ 2.8090e+00, -3.3957e+00, -3.7921e+00, -4.0715e+00, -2.8704e+00, -2.0540e-01, 1.8256e-01, 4.6738e-01, -1.4814e+00, -2.3357e+00, -3.7375e-01, -5.9938e-01]], [[ 9.4288e-02, -4.9747e+00, -4.7848e+00, -5.0933e+00, -5.6181e+00, -4.0886e+00, -3.0676e+00, -3.8072e+00, -4.2194e+00, -4.4381e+00, -1.4477e+00, -3.5494e+00]], [[ 3.7035e-02, -2.3460e+00, -3.1409e+00, -3.6551e+00, -5.8658e+00, -3.2058e+00, -2.4252e+00, -2.1740e+00, -2.0177e+00, -2.2713e+00, -2.5392e+00, -3.8589e+00]], [[ 4.0234e+00, -2.3341e+00, -3.2093e+00, -1.9208e+00, -5.2939e+00, 1.0335e+00, -3.0295e+00, -2.1884e+00, -3.1157e+00, -2.3299e+00, -3.1502e+00, -2.5751e+00]], [[ 2.4976e+00, -5.0076e+00, -5.0558e+00, -2.8560e+00, -3.4171e+00, -7.9835e-01, -3.0503e+00, -2.4441e+00, -3.8570e+00, -2.3660e+00, -1.4547e+00, -2.3962e+00]]], [[[-2.9017e-01, -6.1636e+00, -6.0386e+00, -5.2288e+00, -5.5238e+00, -6.8031e+00, -7.2015e+00, -5.7073e+00, -4.0731e+00, -3.2425e+00, -2.2259e+00, -4.9992e+00]], [[ 2.9393e+00, -1.6048e+00, -2.0045e+00, -3.4581e+00, -1.4576e+00, -3.3638e-01, 7.3898e-03, -1.7250e-01, -4.6447e-01, -5.2032e-01, -2.0051e+00, -3.4057e-01]], [[ 6.9648e+00, -4.2241e+00, -5.4560e+00, -5.4685e+00, -1.5573e+00, -3.9481e-02, -3.0016e+00, -2.2241e+00, -3.1580e+00, -4.7961e+00, -5.8247e+00, -1.0252e+00]], [[ 4.0132e-01, -3.7917e+00, -3.4890e+00, -3.2821e+00, -2.3783e+00, -3.9098e+00, -2.5276e+00, -1.5307e+00, -1.1051e+00, -1.8463e+00, -2.0079e+00, -2.4249e+00]], [[ 9.5780e-01, -3.4431e+00, -3.1691e+00, -3.3810e+00, -4.8241e+00, -4.5675e+00, -4.0251e+00, -5.3367e+00, -4.3230e+00, -3.4406e+00, -3.3787e+00, -3.8776e+00]], [[ 1.0486e+00, -1.2680e+00, -1.3707e+00, -6.7801e-01, -7.2519e-01, -4.3634e+00, -1.9496e+00, -8.8973e-01, -1.3246e+00, -2.3065e+00, -1.8272e+00, -2.3112e+00]], [[ 1.4802e+00, -2.1271e+00, -2.8202e+00, -2.9427e+00, -2.5695e+00, -2.0821e+00, -1.5591e+00, -1.6016e+00, -1.6931e+00, -1.9297e+00, -2.2501e+00, -2.2150e+00]], [[ 3.2976e+00, -2.3197e+00, -1.2362e+00, -2.4519e+00, -1.1556e+00, -6.3865e-01, -1.2210e+00, -3.2427e-01, 6.1614e-01, -1.3243e+00, -2.3404e+00, -1.6063e+00]], [[ 6.1614e-02, -4.1035e+00, -3.3562e+00, -4.0878e+00, -3.0416e+00, -3.3639e+00, -1.6119e+00, -2.3220e+00, -2.1681e+00, -2.5569e+00, -3.4635e+00, -3.1109e+00]], [[ 2.5195e-01, -2.3580e+00, -2.1046e+00, -2.6289e+00, -3.6545e+00, -3.6436e+00, -2.8475e+00, -2.8006e+00, -1.9149e+00, -2.3950e+00, -2.5244e+00, -2.6422e+00]], [[ 5.2829e+00, -3.6688e+00, -4.5149e+00, -4.5200e+00, -3.1641e+00, -2.3597e+00, -4.3176e+00, -2.7451e+00, -3.8969e+00, -4.1961e+00, -4.6495e+00, -2.0695e+00]], [[ 3.4027e+00, -3.6153e+00, -3.9112e+00, -2.5625e+00, -1.8091e+00, -1.2526e+00, -2.3016e+00, -1.8702e+00, -4.0952e+00, -2.5160e+00, -2.2946e+00, -2.1139e+00]]], [[[-4.8829e-01, -7.1000e+00, -6.0095e+00, -6.2065e+00, -6.7924e+00, -6.2458e+00, -6.5518e+00, -6.2599e+00, -3.2335e+00, -2.5434e+00, -2.1532e+00, -4.3180e+00]], [[ 2.8811e+00, -1.6356e+00, -1.3459e+00, -1.8249e+00, -2.2706e-01, -1.4787e+00, -7.2397e-01, 3.0067e-01, -3.1340e-01, -1.1240e+00, -1.7271e+00, -2.2983e+00]], [[ 6.1070e+00, -2.0317e+00, -3.9260e+00, -1.9801e+00, -2.6621e+00, -1.3964e+00, -4.7146e+00, -5.7854e+00, -3.0746e+00, -3.7145e+00, -1.5186e+00, -8.6457e-01]], [[ 5.2637e-02, -3.5507e+00, -3.4344e+00, -3.4415e+00, -3.3348e+00, -3.4629e+00, -2.6979e+00, -1.3201e+00, -9.3688e-03, -1.6153e+00, -2.3193e+00, -2.6279e+00]], [[ 6.8573e-01, -3.0393e+00, -3.2493e+00, -4.0961e+00, -3.6226e+00, -4.3461e+00, -3.9280e+00, -4.2361e+00, -3.2318e+00, -3.1137e+00, -3.9414e+00, -4.2967e+00]], [[ 5.9324e-01, -1.4982e+00, -2.2696e+00, -2.6093e+00, -3.0082e+00, -3.4107e+00, -1.5579e+00, -6.0837e-01, 6.5009e-01, -2.5389e+00, -1.4325e+00, -2.8682e+00]], [[ 1.4609e+00, -2.2275e+00, -2.5477e+00, -3.1086e+00, -2.6438e+00, -2.3721e+00, -2.1431e+00, -2.3332e+00, -1.9061e+00, -2.1141e+00, -3.3400e+00, -3.4713e+00]], [[ 3.1932e+00, -3.9522e+00, -3.6240e+00, -4.7462e+00, -2.9006e+00, -2.4626e+00, -2.1704e+00, -1.9949e+00, -1.9907e+00, -2.0181e+00, -2.0872e+00, -1.6574e+00]], [[-8.4746e-01, -4.3990e+00, -3.6904e+00, -4.6204e+00, -4.0405e+00, -2.6980e+00, -1.4795e+00, -2.2141e+00, -2.1599e+00, -1.9184e+00, -2.6899e+00, -3.8280e+00]], [[ 7.9558e-02, -1.2177e+00, -8.5364e-01, -2.5275e+00, -2.6621e+00, -2.7067e+00, -2.5348e+00, -2.2743e+00, -8.4992e-01, -1.0811e+00, -1.9943e+00, -3.3285e+00]], [[ 3.2500e+00, -1.6335e+00, -1.7496e+00, 1.2940e+00, -1.5466e+00, -2.9395e+00, -2.7906e+00, -2.4879e+00, -1.5910e+00, -2.2411e+00, -4.1242e-01, 6.7577e-02]], [[ 3.2389e+00, -3.4843e+00, -3.8473e+00, -1.1325e+00, -1.7049e+00, -2.6131e+00, -4.3330e+00, -4.2605e+00, -4.5575e+00, -1.8101e+00, -9.3963e-01, -6.3380e-01]]], [[[-2.0521e-01, -7.6831e+00, -6.5991e+00, -6.8593e+00, -5.4143e+00, -2.8030e+00, -2.9133e+00, -5.4264e+00, -4.2322e+00, -2.8159e+00, -2.1583e+00, -4.8165e+00]], [[ 3.3617e+00, -2.9833e+00, -2.0771e+00, -3.1771e+00, -3.0922e+00, -2.4530e+00, -1.6619e+00, -2.2974e+00, -2.4856e+00, -1.8397e+00, -2.2741e+00, -5.2834e-01]], [[ 5.7374e+00, -3.4894e+00, -1.7884e+00, -3.1035e+00, -3.6444e+00, -1.4492e+00, -2.6923e+00, -3.2881e+00, 5.9939e-02, -7.4421e-01, -2.7615e+00, 8.1476e-02]], [[ 6.5628e-01, -2.6881e+00, -2.6803e+00, -3.6132e+00, -4.0740e+00, -4.2721e+00, -4.1781e+00, -3.9903e+00, -3.2819e+00, -3.0477e+00, -3.8273e+00, -2.6193e+00]], [[ 2.7271e-01, -1.4849e+00, -1.2964e+00, -1.5485e+00, -2.0331e+00, -3.0088e+00, -2.0789e+00, -2.5324e+00, -2.9665e+00, -2.8850e+00, -2.4769e+00, -2.2775e+00]], [[ 8.8653e-01, -8.0667e-01, -8.3741e-01, -1.0281e+00, -1.0866e+00, -2.5270e+00, -2.0493e+00, -1.3949e+00, -1.8726e+00, -3.9658e+00, -2.4341e+00, -1.9514e+00]], [[ 1.2601e+00, -1.9866e+00, -2.8954e+00, -2.8768e+00, -3.0372e+00, -2.6669e+00, -2.6399e+00, -2.4484e+00, -1.6685e+00, -2.2852e+00, -2.1025e+00, -1.7201e+00]], [[ 3.3700e+00, 2.6619e-01, -1.2500e+00, -2.1329e+00, -2.0980e+00, -1.8722e+00, -3.5505e+00, -3.8725e+00, -2.7294e+00, -1.2776e+00, -2.7739e+00, -1.6290e+00]], [[-9.2524e-02, -4.6500e+00, -4.1576e+00, -4.0670e+00, -4.7144e+00, -3.9786e+00, -2.7547e+00, -3.5951e+00, -3.8602e+00, -2.9215e+00, -2.5726e+00, -3.8457e+00]], [[ 6.9701e-01, -3.2179e+00, -3.4539e+00, -4.0186e+00, -4.6967e+00, -3.5382e+00, -3.4015e+00, -3.7925e+00, -4.5316e+00, -4.0251e+00, -5.0297e+00, -2.0497e+00]], [[ 3.9090e+00, -3.2324e+00, -1.1024e+00, -3.9616e+00, -3.6817e+00, -2.8191e+00, -3.2391e+00, -4.3584e+00, 1.4531e-01, -2.4116e+00, -4.3644e+00, -2.0844e+00]], [[ 3.6191e+00, -1.5788e+00, -1.1892e+00, -3.6130e+00, -4.2729e+00, -2.4404e+00, -4.4655e+00, -2.9497e+00, -4.4056e-01, -3.4531e+00, -4.2537e+00, -1.4816e+00]]], [[[-1.0102e+00, -5.0167e+00, -6.6753e+00, -4.4595e+00, -2.5301e+00, -3.3983e+00, -5.5506e+00, -3.1025e+00, -9.9915e-01, -1.0605e+00, -1.5083e-01, -3.7610e+00]], [[ 3.6384e+00, -3.6247e+00, -3.0333e+00, -2.9129e+00, -3.0121e+00, -2.6967e+00, -6.0453e-01, 4.7683e-02, -6.1131e-01, -6.3989e-01, -1.0567e+00, -8.9351e-02]], [[ 6.7374e+00, -7.1776e+00, -7.6079e+00, -8.7059e+00, -7.0418e+00, -2.9857e+00, -2.7119e+00, 2.6262e-01, -1.9891e+00, -2.1046e+00, -8.6665e-01, 1.3690e+00]], [[ 1.8588e-01, -3.7576e+00, -3.6860e+00, -4.2082e+00, -4.7845e+00, -2.1144e+00, -2.9103e+00, -2.3892e+00, -1.1023e+00, -1.9317e+00, -2.1807e+00, -1.7314e+00]], [[-2.1943e-01, -2.3977e+00, -2.5860e+00, -2.5348e+00, -2.6187e+00, -2.8986e+00, -2.7735e+00, -7.5375e-01, 9.2574e-01, -7.6127e-01, -3.1501e+00, -4.8175e+00]], [[ 1.4037e+00, -3.1068e+00, -3.2251e+00, -3.3425e+00, -3.4721e+00, -4.3902e+00, -3.0329e+00, -3.0134e+00, -2.2950e+00, -2.2620e+00, -3.5726e+00, -2.7474e+00]], [[ 1.4176e+00, -3.1183e+00, -3.1224e+00, -4.2455e+00, -3.4745e+00, -2.7736e+00, -2.4443e+00, -2.4917e+00, -2.3755e+00, -2.0321e+00, -3.0733e+00, -2.0358e+00]], [[ 2.7439e+00, -2.9789e+00, -3.9807e+00, -4.0073e+00, -3.6597e+00, -2.5194e+00, -2.1673e+00, -1.3918e+00, -6.6440e-01, -1.9141e+00, -2.1721e+00, -2.5723e+00]], [[ 1.4891e-01, -4.8921e+00, -3.5494e+00, -3.8361e+00, -3.0456e+00, -4.7987e+00, -3.8370e+00, -3.8186e+00, -3.5355e+00, -2.9045e+00, -3.2236e+00, -4.1498e+00]], [[ 6.1650e-03, -2.1577e+00, -2.2304e+00, -2.5604e+00, -4.0563e+00, -3.0931e+00, -3.4042e+00, -2.2168e+00, -5.0508e-01, -2.4826e+00, -2.4372e+00, -3.8617e+00]], [[ 3.4924e+00, -6.6390e+00, -4.5428e+00, -4.4428e+00, -4.6641e+00, -2.7144e+00, -2.3998e+00, 6.6286e-01, 9.3724e-01, -1.3140e+00, -1.8797e+00, -1.9334e+00]], [[ 2.4105e+00, -3.1834e+00, -4.3916e+00, -4.6387e+00, -4.6270e+00, -2.5762e+00, -1.6129e+00, 1.0055e+00, -2.5807e+00, -3.3495e+00, -2.8377e+00, -1.8583e+00]]]]) attn_weights tensor([[[[ 0.6670, -3.2306, -3.1049, -3.2156, -2.3556, -4.4845, -2.3755, -2.1793, -1.9252, -2.2614, -2.7027, -1.9720]], [[ 3.6896, -2.6501, -4.2519, -2.5843, -2.9820, 0.6465, -0.6082, -0.7440, -1.9761, -1.2429, -2.0240, -1.2999]], [[ 1.3934, -1.0275, -2.4842, -1.7218, -1.0551, -0.5632, -0.8645, -0.8091, -2.4086, -1.4291, -0.9758, -0.7276]], [[ 2.5613, -2.1981, -1.1065, -2.3300, -2.1241, 0.1251, 1.9457, 0.2018, -0.3040, -0.9592, -2.1169, -1.3713]], [[-0.3536, -5.0123, -5.0280, -5.8478, -6.3044, -4.0461, -3.7003, -3.1322, -3.7933, -4.1828, -2.1994, -4.0916]], [[-2.0555, -4.3290, -4.3274, -3.0860, -4.2197, -3.1487, -3.0645, -1.4448, -1.9036, -1.1079, -1.3703, -3.0282]], [[ 2.1998, -3.0211, -3.8625, -4.7124, -4.2169, 0.4120, 0.0449, -1.6328, -3.5523, -4.8111, -1.8433, -1.8216]], [[-0.8880, -6.2844, -6.0837, -5.7902, -5.7934, -3.4335, -3.1275, -3.4137, -3.4956, -2.7981, 0.4592, -1.4762]], [[ 0.1837, -3.0398, -3.4453, -3.5411, -3.1199, -0.1999, -0.2897, -1.2209, -3.3502, -3.1339, -1.5844, -2.5825]], [[ 1.0078, -4.5493, -4.1532, -4.8528, -3.3994, -1.2233, -1.5291, -2.8413, -3.0023, -3.3695, -2.1435, -2.0989]], [[ 1.0235, -3.3412, -2.8972, -3.7246, -3.2350, -0.5534, -0.8190, -1.2982, -1.7995, -2.2599, -2.1090, -1.7576]], [[ 0.4309, -3.7163, -4.0696, -3.7641, -4.4173, -1.0680, -2.0640, -2.9764, -4.3538, -3.8027, -2.9151, -3.8331]]], [[[ 0.9355, -2.6106, -2.5790, -2.8782, -2.9420, -4.2382, -1.9721, -2.4792, -2.9822, -2.7304, -2.8540, -1.8717]], [[ 5.3487, -1.4958, -3.1383, -1.7224, -0.1326, 0.4784, -1.8142, -1.3274, -1.7201, -1.7377, -0.6215, 0.5052]], [[ 1.5181, -0.7585, -2.2356, -2.1220, -0.8234, -1.0129, -1.1667, -0.5385, -1.4222, -2.2010, -1.8567, -1.5126]], [[ 2.3481, -2.1789, -1.8114, -2.5413, -2.2744, -0.5362, -0.8609, -0.8067, -2.0169, -2.3136, -2.8495, -2.5184]], [[ 0.3932, -4.5030, -4.1690, -4.3912, -4.1077, -3.8127, -3.0752, -3.4397, -3.3328, -3.4132, -3.7822, -2.7641]], [[-1.1624, -3.0681, -3.3389, -2.3360, -3.4894, -3.5774, -3.3931, -2.4026, -2.2427, -2.5581, -1.9809, -2.6759]], [[ 2.9598, -3.6890, -3.3525, -4.3461, -1.9501, -1.6745, -1.5065, -1.5925, -1.6798, -2.8328, -3.6272, -1.3098]], [[-0.2912, -5.7960, -6.0214, -7.0533, -5.8453, -5.1055, -5.0818, -4.3548, -3.5885, -3.7237, -4.6816, -4.1212]], [[ 0.6311, -1.5160, -2.1486, -2.5409, -2.4200, -1.4157, -1.1496, -1.0457, -0.8438, -2.1886, -2.7977, -2.5644]], [[ 1.0351, -4.1593, -4.1276, -5.0232, -3.4855, -1.1115, -1.5238, -2.5358, -2.4387, -3.1751, -3.8745, -2.6150]], [[ 1.1537, -2.9319, -2.4272, -2.8765, -2.4944, -1.8999, -2.1163, -1.3193, -1.5316, -1.9353, -2.2568, -1.6529]], [[ 1.2599, -2.8517, -3.9498, -3.0446, -3.4866, -2.0675, -2.7447, -2.9633, -3.8872, -4.3886, -3.8303, -5.3745]]], [[[ 1.0974, -2.9940, -2.5862, -2.9521, -2.2718, -3.9287, -2.2831, -3.2421, -2.5970, -2.7263, -2.0976, -1.0887]], [[ 5.3766, -2.2675, -3.0166, -0.4800, -0.0738, -1.0523, -3.2666, -4.1221, -2.7645, -1.7535, -0.1360, 0.5023]], [[ 1.9545, -0.7558, -2.3177, -2.0280, -0.8740, -0.9700, -0.8693, -0.5983, -0.8032, -1.9354, -2.3452, -1.9082]], [[ 2.7708, -3.0912, -2.9030, -3.0982, -2.7206, -2.2575, -1.9571, -1.7986, -1.3051, -3.4108, -2.5296, -3.1235]], [[ 0.0718, -4.0162, -3.6532, -3.9084, -5.0220, -3.2729, -2.5390, -3.5459, -2.1710, -1.5589, -0.6278, -2.4534]], [[-1.3507, -3.2643, -2.3371, -3.7914, -4.0052, -2.7946, -2.8417, -2.7027, -0.0878, -0.9917, -1.7686, -3.7292]], [[ 2.6203, -1.3745, -3.0654, -2.6745, -1.1446, -2.5024, -2.7278, -1.6532, -1.4886, -1.9064, -1.2651, -1.7031]], [[-0.3789, -5.9531, -5.5601, -8.0212, -7.8539, -4.1948, -4.9241, -4.8685, -4.1094, -3.1483, -2.9216, -4.6494]], [[-0.3592, -1.1942, -2.1180, -2.1066, -1.8923, 0.0814, -0.6019, 0.1047, -0.1052, -1.9676, -3.2072, -2.5139]], [[ 0.7003, -2.8792, -2.9273, -2.9345, -2.8886, -1.8446, -0.9413, -2.0871, -2.2995, -2.5825, -3.4688, -3.4769]], [[ 1.0898, -3.7034, -4.2502, -3.7926, -2.3203, -2.6623, -3.1847, -2.7222, -1.8540, -3.2066, -3.7621, -1.8568]], [[ 1.4208, -2.8078, -4.8120, -4.0331, -4.5139, -3.7417, -3.3130, -2.9498, -3.7808, -4.5722, -5.0081, -5.0563]]], [[[ 1.4994, -2.0601, -1.9245, -2.4012, -3.1748, -4.2547, -2.2547, -4.1802, -4.2617, -4.5273, -2.7123, -1.5745]], [[ 3.1153, -2.0189, -1.1498, -1.3485, -1.0900, -1.1242, -1.2680, -1.4371, 0.4196, -2.1905, -1.4291, -1.6003]], [[ 2.1083, -0.0405, -1.0053, -1.7187, -0.7607, -0.6227, -1.2713, -1.6494, -1.4220, -1.1872, -1.6632, 1.3200]], [[ 1.4119, -1.3648, -2.0842, -1.5188, -1.4478, -2.1687, -1.6380, -1.4179, -1.8460, -2.5738, -2.6992, 0.1350]], [[ 0.0716, -3.0778, -4.2096, -4.0940, -4.0348, -4.0763, -2.7256, -2.9747, -4.9373, -4.5360, -3.2384, -3.4525]], [[-0.7851, -2.5584, -3.0940, -2.7194, -3.3758, -3.3997, -3.0186, -2.8441, -4.7819, -3.7512, -3.4811, -3.4497]], [[ 2.2318, -0.6761, -0.4112, -2.4756, -2.8081, -2.6590, -2.0695, -2.9019, -1.6679, -3.0519, -2.0997, -2.4818]], [[-0.2527, -5.5484, -5.9655, -5.7932, -4.7705, -3.7125, -3.1307, -4.5694, -5.2302, -5.0765, -3.4789, -4.1232]], [[ 0.6479, -1.2096, -2.4457, -3.3295, -3.5316, -2.0804, -2.3688, -2.5735, -3.0881, -1.8905, -1.9825, -2.7540]], [[ 1.1716, -2.3851, -1.9337, -2.4386, -2.3824, -2.4942, -2.3910, -1.8479, -1.6596, -1.8617, -2.3763, -0.9915]], [[ 1.0556, -1.8324, -2.1814, -2.5372, -2.4408, -2.8248, -2.9378, -2.7607, -2.4258, -2.6501, -3.1979, -1.2643]], [[ 0.9691, -2.0169, -2.8816, -4.0341, -3.0242, -2.5020, -2.0719, -3.1194, -3.2537, -2.4936, -3.1269, -2.6815]]], [[[ 1.5643, -2.5001, -3.3476, -3.2796, -3.8472, -3.3932, -1.9732, -2.2165, -4.7441, -5.5935, -3.9081, -1.3162]], [[ 3.8316, -2.6129, -2.9919, -3.8972, -2.6872, -0.2121, 0.4780, 1.0326, 0.1589, -0.6212, -1.7279, 0.1650]], [[ 1.3771, 0.8505, -0.7020, -0.6785, -0.3874, -1.9197, -2.2417, -0.0801, -0.4509, -1.0078, -2.6721, -2.7298]], [[ 2.1822, -2.2067, -2.3628, -2.2123, -1.6039, -1.4308, -0.6904, 0.2983, -0.4374, -1.5671, -2.6709, -2.2128]], [[ 0.5891, -5.2360, -5.5875, -5.6278, -3.9189, -5.4304, -4.4825, -5.0915, -3.2090, -2.9225, -1.8822, -2.7765]], [[-1.4599, -1.9372, -3.0806, -2.4555, -2.9379, -3.2466, -3.4463, -1.6507, -2.1672, -3.8205, -4.2962, -4.1197]], [[ 3.0681, -2.0370, -3.2172, -4.5751, -2.8539, -2.4882, -1.2356, -0.1511, -2.6585, -3.3284, -5.0710, -0.2081]], [[-1.1594, -5.4213, -5.1395, -3.5011, -1.5564, -4.1570, -4.6295, -3.1444, -0.2160, 1.0833, -2.5930, -3.3423]], [[ 0.9813, -3.0383, -3.1750, -3.4005, -3.4650, -2.5389, -1.5748, -1.9090, -4.2638, -4.0011, -2.2231, -2.3852]], [[ 1.0022, -3.7018, -3.8466, -4.0558, -3.1469, -1.1094, -1.4393, -2.3071, -3.0453, -2.6718, -1.5469, -1.4518]], [[ 0.9839, -3.1174, -3.2903, -3.8568, -3.7582, -1.8710, -1.8030, -1.2973, -2.0818, -1.2444, -1.9765, -0.5920]], [[ 1.2822, -2.6515, -4.2813, -4.1677, -4.1060, -2.8437, -2.9201, -2.2985, -5.4369, -5.1026, -3.3064, -2.9728]]]]) attn_weights tensor([[[[ 2.2704e+00, -3.0819e+00, -1.4400e+00, -1.6152e+00, -3.2327e+00, 1.7126e+00, 2.2791e+00, -1.7721e+00, -2.0903e+00, -1.5571e+00, -3.1257e-01, -1.6194e+00]], [[ 2.7283e+00, -2.4627e+00, -3.3688e+00, -2.4253e+00, -2.0791e+00, -8.1144e-01, -8.8485e-01, -2.3926e+00, -3.2545e+00, -2.5983e+00, -1.9231e+00, -8.6320e-01]], [[ 1.9376e+00, -3.7954e+00, -3.0445e+00, -3.8411e+00, -4.0031e+00, 9.2846e-01, 1.8065e-01, -2.1702e+00, -3.5468e+00, -3.3838e+00, -2.8403e+00, -2.9236e+00]], [[-1.0616e+00, -3.2687e+00, -2.6516e+00, -3.3274e+00, -4.8910e+00, -3.4318e+00, -2.7480e+00, -2.0974e+00, -1.7202e+00, -1.9587e+00, -5.2096e-01, -2.1160e+00]], [[ 3.6793e+00, -2.3100e+00, -3.8921e+00, -4.4234e+00, -4.3565e+00, -2.0624e-01, 1.7872e+00, -2.2887e+00, -3.8195e+00, -3.3290e+00, -2.1832e+00, -2.3048e+00]], [[ 1.7458e+00, -3.1348e+00, -3.6489e+00, -3.4470e+00, -2.9171e+00, -4.0841e-02, -4.9583e-01, -1.9541e+00, -2.7120e+00, -2.4026e+00, -2.6214e-01, -1.3308e+00]], [[ 3.4067e+00, -3.4866e+00, -5.0957e+00, -4.8607e+00, -5.1617e+00, 1.7044e+00, 1.1399e+00, -2.2684e+00, -4.2342e+00, -3.6372e+00, -2.1452e+00, -2.1055e+00]], [[ 3.0314e-01, -4.6196e+00, -4.6670e+00, -5.3717e+00, -4.7684e+00, -2.3089e+00, -2.6727e+00, -3.9781e+00, -4.7138e+00, -5.1200e+00, -3.5585e+00, -3.7370e+00]], [[ 1.4144e+00, -2.5632e+00, -3.0528e+00, -1.8500e+00, -2.5017e+00, 5.0579e-01, 4.1435e-01, -1.6620e+00, -2.7220e+00, -1.2893e+00, -1.1058e+00, -1.3137e+00]], [[ 4.3433e+00, -1.8480e+00, -2.5088e+00, -2.7673e+00, -4.0833e+00, 2.0221e+00, 2.1955e+00, -1.3461e+00, -2.4412e+00, -2.2659e+00, -4.4850e-01, -6.6004e-01]], [[ 4.4283e-01, -3.7874e+00, -3.0140e+00, -3.0933e+00, -3.8915e+00, -2.6676e+00, -2.5504e+00, -2.7602e+00, -1.9604e+00, -1.9514e+00, -7.2726e-01, -1.9442e+00]], [[ 3.1895e+00, -1.1998e+00, -2.7765e+00, -1.7115e+00, -2.1881e+00, -9.0140e-01, -1.0856e+00, -2.2027e+00, -3.0186e+00, -1.7587e+00, -1.4700e+00, -1.3082e+00]]], [[[ 2.3087e+00, -2.0428e+00, -2.9287e+00, -1.9155e+00, -2.3853e+00, -3.5179e-02, 7.0040e-01, -6.4697e-01, -1.8097e+00, -2.6759e+00, -2.1235e+00, -3.0676e+00]], [[ 3.6261e+00, -8.7826e-01, -1.9418e+00, -2.5921e+00, -1.7518e+00, -2.8130e+00, -2.2098e+00, -2.0876e+00, -2.4231e+00, -3.0196e+00, -3.1482e+00, -1.1072e+00]], [[ 2.3035e+00, -2.6340e+00, -2.6404e+00, -3.3085e+00, -2.3989e+00, -1.4882e-03, 1.5313e-01, -7.5685e-01, -1.4733e+00, -2.8723e+00, -3.5116e+00, -2.0201e+00]], [[-9.6133e-01, -2.7960e+00, -3.0322e+00, -3.7413e+00, -5.5532e+00, -4.6077e+00, -4.0929e+00, -2.9240e+00, -2.6205e+00, -2.2115e+00, -2.4554e+00, -3.5301e+00]], [[ 3.3405e+00, -2.8225e+00, -4.8204e+00, -4.5965e+00, -3.1096e+00, -1.5718e+00, -2.1288e+00, -2.6839e+00, -4.4538e+00, -5.2493e+00, -5.0102e+00, -1.7972e+00]], [[ 1.8637e+00, -2.4820e+00, -2.4611e+00, -2.8426e+00, -2.5867e+00, -2.8888e+00, -1.9523e+00, -2.0012e+00, -2.0170e+00, -2.1543e+00, -2.8898e+00, -2.8754e+00]], [[ 3.8062e+00, -2.0783e+00, -3.6423e+00, -3.5029e+00, -2.3530e+00, -4.1497e-01, -1.0336e+00, -1.5598e+00, -2.9369e+00, -3.9515e+00, -4.0146e+00, -2.4794e+00]], [[ 2.3364e-01, -3.7851e+00, -4.0253e+00, -4.3721e+00, -3.8991e+00, -2.8875e+00, -2.8259e+00, -3.2897e+00, -3.9211e+00, -4.1947e+00, -4.5542e+00, -3.9015e+00]], [[ 1.7466e+00, -2.0270e+00, -3.7671e+00, -1.7249e+00, -3.1490e+00, -1.7151e-01, -7.3617e-01, -1.6052e+00, -1.3315e+00, -3.5834e+00, -9.2037e-01, -3.3090e+00]], [[ 4.4738e+00, -2.0058e+00, -4.0497e+00, -3.7105e+00, -2.5616e+00, -4.5328e-01, -7.7933e-01, -1.9076e+00, -2.8213e+00, -4.3116e+00, -4.3112e+00, -2.1500e+00]], [[ 1.2605e+00, -3.9264e+00, -2.4649e+00, -2.6552e+00, -4.5079e+00, -3.5920e+00, -3.2599e+00, -2.6568e+00, -2.1258e+00, -1.0244e+00, -1.0049e+00, -1.6347e+00]], [[ 3.6015e+00, -5.6361e-01, -1.9280e+00, -1.5200e+00, 1.7317e-01, -1.6384e+00, -1.8256e+00, -1.9998e+00, -1.5491e+00, -2.5316e+00, -2.0384e+00, -2.2963e+00]]], [[[ 1.5190e+00, -1.3609e+00, -1.0437e+00, -1.8657e+00, -2.0066e+00, -4.8821e-01, 3.7873e-01, -1.8277e-01, -1.4025e+00, -7.1963e-01, -2.4446e+00, -1.2671e+00]], [[ 4.4906e+00, -7.7907e-01, -4.1828e+00, -2.8651e+00, -1.7395e+00, -2.8865e+00, -3.0985e+00, -3.5168e+00, -1.1674e+00, -3.3901e+00, -3.4686e+00, -1.4979e+00]], [[ 1.2894e+00, -2.4556e+00, -2.5821e+00, -3.2226e+00, -1.7982e+00, -2.3090e+00, -1.8335e+00, -1.4036e+00, -1.9540e+00, -2.1986e+00, -4.5311e+00, -2.7791e+00]], [[-8.9417e-01, -3.9400e+00, -2.9716e+00, -4.4698e+00, -6.5517e+00, -3.4439e+00, -3.2323e+00, -3.4256e+00, -2.1402e+00, -2.2261e+00, -2.1743e+00, -3.6195e+00]], [[ 3.4056e+00, -3.0513e+00, -3.1569e+00, -3.1811e+00, -2.1269e+00, -3.5814e+00, -2.3566e+00, -2.2229e+00, -1.9925e+00, -3.3961e+00, -3.7957e+00, -2.3969e+00]], [[ 2.1608e+00, -2.5902e+00, -3.1127e+00, -3.3192e+00, -3.0789e+00, -3.0571e+00, -2.0815e+00, -2.4281e+00, -2.4756e+00, -2.9233e+00, -3.8011e+00, -3.1448e+00]], [[ 3.7828e+00, -2.9615e+00, -3.8534e+00, -1.5058e+00, -2.8455e+00, -2.8208e+00, -2.8939e+00, -3.7119e+00, -2.8864e+00, -3.1466e+00, -2.7464e+00, -2.3804e+00]], [[ 4.5386e-01, -3.5807e+00, -4.8443e+00, -3.9547e+00, -3.6907e+00, -2.9025e+00, -2.1374e+00, -1.7751e+00, -1.8373e+00, -4.0597e+00, -5.0090e+00, -5.7391e+00]], [[ 2.1734e+00, -2.6961e+00, -2.5505e+00, -3.0460e+00, -2.5105e+00, -1.7207e+00, -8.1423e-01, -2.2128e+00, -9.7651e-01, -2.0822e+00, -3.8954e+00, -3.0514e+00]], [[ 5.2184e+00, -2.0895e+00, -2.0704e+00, -9.3818e-01, -1.9965e+00, -1.5652e+00, -1.4425e+00, -3.4236e+00, -2.3099e+00, -2.7911e+00, -1.5698e+00, -4.0707e-01]], [[ 9.9287e-01, -5.2589e+00, -3.0797e+00, -5.6721e+00, -5.5712e+00, -2.8152e+00, -2.5004e+00, -4.3996e+00, -2.3793e+00, -8.5472e-01, -5.0933e-01, -1.0310e+00]], [[ 3.7050e+00, -1.5289e+00, -2.8264e+00, -1.1591e+00, -1.5380e+00, -2.8297e+00, -2.3429e+00, -3.4979e+00, -3.5334e+00, -3.3793e+00, -3.5576e+00, -2.5833e+00]]], [[[ 1.5595e+00, -1.9734e+00, -2.5997e+00, -2.4934e+00, -3.6199e+00, -7.5141e-01, -7.9914e-01, -3.1100e+00, -3.7605e+00, -9.8489e-01, -1.4856e+00, -1.8905e+00]], [[ 2.3187e+00, -1.4151e+00, -1.8655e+00, -2.6348e+00, -2.2736e+00, -3.5430e+00, -2.5845e+00, -2.5123e+00, -1.6365e+00, -2.9018e+00, -2.9756e+00, -1.7205e+00]], [[ 1.4698e+00, -3.0232e+00, -2.3706e+00, -2.5892e+00, -2.6799e+00, -1.5324e+00, -1.1312e+00, -2.1842e+00, -2.7325e+00, -1.2654e+00, -2.0501e+00, -2.5118e+00]], [[-6.0018e-01, -2.0264e+00, -2.8477e+00, -1.9650e+00, -3.2889e+00, -1.9067e+00, -1.2722e+00, -2.8828e+00, -3.9193e+00, -2.8414e+00, -2.9522e+00, -2.9530e+00]], [[ 1.7773e+00, 1.8611e-01, -2.4272e+00, -2.1125e+00, -2.3271e+00, -2.0486e+00, -2.6103e+00, -2.5440e+00, -3.4078e+00, -3.5951e+00, -3.5071e+00, -1.0953e+00]], [[ 1.5549e+00, -1.2268e+00, -2.0309e+00, -2.6562e+00, -3.5205e+00, -1.7412e+00, -2.5991e+00, -2.3945e+00, -3.6106e+00, -3.2884e+00, -2.7276e+00, -1.0379e+00]], [[ 2.1491e+00, -1.8830e+00, -2.6102e+00, -3.5492e+00, -3.6525e+00, -1.5508e+00, -1.5476e+00, -2.9041e+00, -3.1685e+00, -8.6575e-01, -1.8099e+00, -9.6456e-01]], [[ 1.4309e-01, -3.4797e+00, -3.7326e+00, -3.4973e+00, -3.3945e+00, -3.2109e+00, -3.3959e+00, -4.0189e+00, -3.8324e+00, -3.9648e+00, -3.9604e+00, -3.9503e+00]], [[ 1.8781e+00, -2.1357e+00, -2.4826e+00, -2.7955e+00, -2.7676e+00, -1.1958e+00, -1.4299e+00, -2.5963e+00, -3.0040e+00, -1.8000e+00, -2.0277e+00, -1.6936e+00]], [[ 3.0374e+00, -2.7278e+00, -2.9653e+00, -4.0884e+00, -3.0850e+00, -5.1622e-01, -5.9252e-01, -3.5430e+00, -2.1942e+00, -4.3103e-01, -1.0016e+00, -1.5933e+00]], [[-8.9048e-02, -3.2261e+00, -3.7187e+00, -2.1657e+00, -1.4099e+00, -2.2471e+00, -1.0046e+00, -1.8791e+00, -2.0720e+00, -2.5188e+00, -1.2400e+00, -1.7736e+00]], [[ 3.8843e+00, -2.2902e-01, -9.6013e-01, -2.1047e+00, -2.2858e+00, -2.7782e+00, -3.7248e+00, -2.0016e+00, -1.3527e+00, -3.2454e+00, -4.1102e+00, 1.7382e-01]]], [[[ 2.6610e+00, -3.5294e+00, -4.1139e+00, -3.6477e+00, -3.7445e+00, -1.2935e+00, -9.8419e-02, -3.3225e+00, -5.0738e+00, -4.2258e+00, -1.0651e+00, -1.0691e+00]], [[ 4.0375e+00, -6.3752e-01, -2.2840e+00, -3.0646e+00, -2.1600e+00, -2.9287e+00, -1.8297e+00, -4.6028e-01, -1.2202e+00, -1.8689e+00, -2.7992e+00, -8.8162e-01]], [[ 2.8396e+00, -4.3700e+00, -3.5668e+00, -4.0471e+00, -3.6210e+00, -2.0721e+00, -9.2472e-01, -2.8723e+00, -3.4504e+00, -2.7694e+00, -1.6407e+00, -1.3904e+00]], [[-1.2197e+00, -2.0539e+00, -4.4365e+00, -3.0488e+00, -3.1280e+00, -2.9992e+00, -3.9704e+00, -2.1667e+00, -2.5826e+00, -2.9041e+00, -3.1725e+00, -4.2958e+00]], [[ 2.7054e+00, -1.2346e+00, -3.0244e+00, -3.1296e+00, -3.3087e+00, -2.3376e+00, -1.7830e+00, -2.2588e+00, -3.2775e+00, -2.3048e+00, -3.6839e+00, -3.7609e+00]], [[ 1.8941e+00, -3.0833e+00, -3.6750e+00, -3.6673e+00, -3.4775e+00, -3.8728e+00, -3.4698e+00, -2.2227e+00, -3.1773e+00, -3.0796e+00, -3.9591e+00, -3.0603e+00]], [[ 3.6319e+00, -1.9893e+00, -2.6481e+00, -3.3012e+00, -3.7434e+00, -9.6081e-01, -3.8894e-01, -4.7146e-02, -1.6382e+00, -2.5502e+00, -2.5957e+00, -4.7925e-01]], [[ 4.1189e-01, -2.8809e+00, -4.0280e+00, -3.9339e+00, -3.6567e+00, -3.5364e+00, -2.8544e+00, -2.3022e+00, -3.5701e+00, -3.8916e+00, -4.2324e+00, -3.8522e+00]], [[ 2.3881e+00, -3.5315e+00, -3.2014e+00, -2.8526e+00, -3.5593e+00, -1.6346e+00, -1.6037e+00, -2.8750e+00, -3.5512e+00, -3.8579e+00, -1.6757e+00, -1.7286e+00]], [[ 4.5183e+00, -1.3791e+00, -1.7310e+00, -2.4381e+00, -1.8219e+00, 4.4825e-01, 1.3826e+00, 2.0267e-01, -5.0751e-01, -5.6813e-01, -6.6699e-01, 1.0424e+00]], [[ 3.4059e-01, -4.0071e+00, -4.2207e+00, -3.4792e+00, -1.6489e+00, -2.8479e+00, -2.5779e+00, -3.1581e+00, 1.7148e-01, -1.4089e-01, -8.0613e-01, -1.8266e+00]], [[ 4.0981e+00, -6.4299e-01, -2.6187e+00, -2.8802e+00, -1.7976e+00, -3.2119e+00, -3.0416e+00, 1.1374e+00, -2.0116e+00, -2.1590e+00, -4.1677e+00, -3.6798e+00]]]]) attn_weights tensor([[[[ 2.4005e+00, -2.7458e+00, -4.1358e+00, -2.9655e+00, -3.6351e+00, 1.8027e+00, 1.0430e+00, -2.4965e+00, -4.1188e+00, -3.1004e+00, -5.2031e-01, -2.2552e+00]], [[ 3.4521e+00, -2.0563e+00, -3.5396e+00, -2.1518e+00, -2.6352e+00, 2.0980e+00, 5.8193e-01, -1.8752e+00, -3.3492e+00, -1.4192e+00, -3.2778e-01, 1.0461e-01]], [[ 3.1105e+00, -1.8338e+00, -2.9774e+00, -2.7412e+00, -2.9976e+00, 7.3761e-01, 5.5494e-01, -2.1807e+00, -3.1279e+00, -2.2723e+00, 2.5669e-01, -9.1133e-01]], [[ 2.2885e+00, -1.2993e+00, -3.6526e+00, -3.0822e+00, -3.2451e+00, 2.3889e+00, 5.7494e-01, -1.4728e+00, -3.0677e+00, -2.2896e+00, -9.0507e-01, -1.6560e+00]], [[ 2.2313e+00, -7.5793e-01, -1.7070e+00, -1.3301e+00, -1.2603e+00, 8.7156e-01, 1.3879e+00, -5.2017e-01, -1.3515e+00, -8.2889e-01, 1.8022e-01, -3.8028e-01]], [[ 1.7307e+00, -2.8274e+00, -3.8626e+00, -4.3306e+00, -4.4336e+00, -1.8693e+00, -3.4095e+00, -1.9677e+00, -2.8104e+00, -2.8024e+00, -1.7821e+00, -3.7782e+00]], [[ 2.4869e+00, -2.2643e+00, -3.2690e+00, -2.4613e+00, -3.4797e+00, 9.8464e-01, 3.3928e-01, -2.3670e+00, -3.5717e+00, -2.7816e+00, -1.1285e+00, -1.5340e+00]], [[ 1.7661e+00, -1.9121e+00, -2.7877e+00, -3.0194e+00, -1.9554e+00, 2.6763e+00, 1.1919e+00, -4.3280e-01, -2.5180e+00, -2.3000e+00, 5.6916e-01, 1.8306e-01]], [[ 3.4109e+00, -1.2053e+00, -2.7536e+00, -2.3319e+00, -2.9661e+00, -7.8706e-01, -1.0032e+00, -1.4749e+00, -2.3015e+00, -1.6896e+00, -1.5421e-01, -3.2575e-01]], [[ 1.1460e+00, -3.9984e+00, -4.1075e+00, -4.1225e+00, -3.9722e+00, -2.1926e+00, -2.4974e+00, -3.1846e+00, -3.7707e+00, -3.5249e+00, -1.1830e+00, -2.2422e+00]], [[ 3.1553e+00, -1.8784e+00, -2.9925e+00, -2.5035e+00, -2.6891e+00, 1.8936e+00, 5.8340e-01, -1.5611e+00, -2.7003e+00, -2.0630e+00, -6.4245e-01, -4.2624e-01]], [[ 3.8388e+00, -7.2836e-01, 5.8850e-02, -1.5956e+00, -2.6501e+00, 3.1453e+00, 3.2669e+00, 1.6563e-01, -8.6023e-02, -3.4860e-01, 5.3193e+00, 3.3217e+00]]], [[[ 2.9749e+00, -3.1494e+00, -3.8058e+00, -3.4223e+00, -3.5374e+00, 2.6849e-01, -1.2629e-01, -2.6058e+00, -3.5605e+00, -4.2564e+00, -3.6514e+00, -2.5873e+00]], [[ 4.5583e+00, -1.2760e+00, -2.3984e+00, -1.2151e+00, -1.8149e+00, 4.8610e-01, -4.2168e-01, -1.6008e+00, -2.2419e+00, -2.7609e+00, -1.1459e+00, -6.6922e-01]], [[ 3.1083e+00, -8.2768e-01, -1.3613e+00, -1.2959e+00, -1.1765e+00, -1.0812e+00, -1.1970e+00, -1.1856e+00, -1.0523e+00, -2.1273e+00, -1.9680e+00, -1.1539e+00]], [[ 3.1290e+00, 6.5358e-01, -2.5313e+00, -2.1121e+00, -1.5724e+00, 5.1511e-01, -6.9954e-01, -1.3129e-01, -1.4898e+00, -2.6754e+00, -2.2173e+00, -1.2720e+00]], [[ 2.9012e+00, 6.7310e-01, -7.3481e-01, -6.3008e-01, -3.9763e-01, -1.4021e+00, 8.2054e-02, -1.1322e-01, -2.3000e-01, -1.2790e+00, -3.6589e-01, -9.8178e-01]], [[ 1.4001e+00, -2.5668e+00, -2.8019e+00, -2.6449e+00, -3.2555e+00, -2.6432e+00, -2.9673e+00, -3.2992e+00, -1.7770e+00, -1.8844e+00, -1.4572e+00, -2.5584e+00]], [[ 3.8508e+00, -2.7572e+00, -3.2821e+00, -2.8826e+00, -3.6775e+00, -2.5597e-01, -2.8746e-01, -2.3165e+00, -3.1718e+00, -3.8759e+00, -3.4446e+00, -2.1250e+00]], [[ 2.6631e+00, -1.4164e+00, -2.1232e+00, -2.0915e+00, -2.0606e+00, -2.6129e+00, -3.0398e+00, -7.3303e-01, -1.0543e+00, -2.1042e+00, -1.9721e+00, -1.3730e+00]], [[ 3.9365e+00, -2.0326e+00, -3.4042e+00, -3.5324e+00, -1.7231e+00, -3.3537e+00, -2.7644e+00, -1.8261e+00, -2.6443e+00, -3.1584e+00, -3.3773e+00, -1.6938e+00]], [[ 6.7010e-01, -3.3240e+00, -2.4647e+00, -2.5521e+00, -3.3043e+00, -2.1428e+00, -1.8622e+00, -2.4427e+00, -2.7729e+00, -2.1180e+00, -2.2490e+00, -2.0356e+00]], [[ 3.4718e+00, -1.6749e+00, -2.7280e+00, -2.0286e+00, -2.8995e+00, -1.5154e+00, -2.1561e+00, -2.1731e+00, -2.7449e+00, -3.5473e+00, -2.7314e+00, -2.6862e+00]], [[ 4.9225e+00, -1.9444e-01, 7.2052e-02, -2.3727e+00, -1.9962e+00, 1.5393e+00, 6.1662e-01, 4.7180e-01, -1.5385e-01, 2.7843e-02, -2.6848e+00, -8.9041e-01]]], [[[ 2.6808e+00, -3.3441e+00, -3.1326e+00, -2.7544e+00, -3.3109e+00, 4.1169e-01, -4.7108e-01, -3.0302e+00, -3.2178e+00, -2.8639e+00, -3.4887e+00, -3.1730e+00]], [[ 4.1973e+00, -1.4258e+00, -2.6210e+00, 2.5184e-01, -2.1036e+00, -1.1243e+00, -1.3412e+00, -1.3958e+00, -1.7138e+00, -1.7094e+00, -1.0200e+00, -2.8200e-01]], [[ 3.5776e+00, -9.5691e-01, -1.8054e+00, -1.4198e+00, -1.0914e+00, -1.7538e+00, -3.2106e-01, -1.6992e+00, -7.2851e-01, -1.6768e+00, -7.3392e-01, 1.4782e-01]], [[ 3.2455e+00, -5.7359e-01, -2.3591e+00, -1.3484e+00, -1.5041e+00, -1.4910e-01, -1.0066e-01, -1.2387e+00, -1.2107e+00, -1.3870e+00, -1.3868e+00, -7.1634e-01]], [[ 2.5009e+00, -9.3183e-01, -1.0599e+00, -1.1740e+00, -1.3894e+00, -2.2512e+00, -8.0806e-01, -1.0763e+00, -7.8748e-01, -4.1900e-01, -1.7109e+00, -3.2836e-01]], [[ 1.8347e+00, -2.6423e+00, -2.4506e+00, -4.5839e+00, -3.9492e+00, -2.9897e+00, -2.9965e+00, -3.1985e+00, -2.2138e+00, -1.9219e+00, -2.1703e+00, -2.6033e+00]], [[ 3.2187e+00, -2.2084e+00, -3.3474e+00, -1.8916e+00, -2.1725e+00, -1.3211e+00, -2.4017e-01, -2.0498e+00, -2.0202e+00, -2.7090e+00, -1.4073e+00, -2.0832e+00]], [[ 2.5812e+00, -2.1695e+00, -1.5354e+00, -1.4988e+00, -2.0579e+00, -2.1865e+00, -2.1320e+00, -1.5856e+00, -1.0987e+00, -1.3446e+00, -1.8232e+00, -6.0541e-01]], [[ 3.6885e+00, -1.3901e+00, -3.4728e+00, -2.1989e+00, -2.2485e+00, -2.7167e+00, -2.8077e+00, -2.4650e+00, -2.1953e+00, -2.8226e+00, -2.2498e+00, -1.1000e+00]], [[ 5.7528e-01, -4.7384e+00, -3.0142e+00, -3.3670e+00, -4.2841e+00, -2.6233e+00, -2.5087e+00, -3.2387e+00, -4.0764e+00, -2.1433e+00, -1.5971e+00, -2.2681e+00]], [[ 3.7868e+00, -1.8966e+00, -2.2912e+00, -1.2830e+00, -2.0422e+00, -1.5694e+00, -1.5022e+00, -1.8169e+00, -1.9451e+00, -2.1340e+00, -2.6231e+00, -9.9853e-01]], [[ 4.5488e+00, -6.8922e-02, 2.8965e-01, -8.5544e-01, -1.8872e+00, -1.0435e+00, 3.0293e-01, 2.0178e+00, 2.1431e+00, 1.8656e+00, 2.9109e-01, 1.8568e+00]]], [[[ 2.0230e+00, -2.8763e+00, -3.2173e+00, -3.4335e+00, -3.7817e+00, 8.1543e-01, -5.3847e-01, -3.2392e+00, -3.2647e+00, 5.8280e-01, -1.2640e+00, -1.1325e+00]], [[ 2.9974e+00, -4.7576e-01, -1.8614e+00, -1.6093e+00, -2.1085e+00, -1.4464e-01, -1.4533e+00, -1.5426e+00, -1.8037e+00, 7.6997e-02, -1.9378e+00, -1.0509e-01]], [[ 2.3541e+00, 1.9297e-01, -7.9890e-01, -2.4523e+00, -2.6914e+00, -4.7326e-01, -1.1664e+00, -2.1918e+00, -2.1406e+00, -1.4238e+00, -1.6147e+00, -5.2856e-03]], [[ 2.4254e+00, 3.7375e-01, -1.4477e+00, -1.9493e+00, -2.0383e+00, 1.3355e+00, -1.6395e+00, -1.4248e+00, -2.3498e+00, -1.5289e+00, -2.5340e+00, 1.3670e-01]], [[ 2.3146e+00, 7.3252e-02, -2.4628e+00, -1.3555e+00, -1.6218e+00, -1.6829e+00, -1.1975e+00, -1.4030e+00, -2.2134e+00, -6.0684e-01, -1.9064e+00, -9.7778e-01]], [[ 5.4249e-01, -1.7317e+00, -2.2641e+00, -1.5456e+00, -1.7529e+00, -2.2774e+00, -2.1798e+00, -1.5100e+00, -2.8834e+00, -3.0040e+00, -3.2022e+00, -1.8032e+00]], [[ 2.4132e+00, -2.3658e+00, -2.9384e+00, -2.9027e+00, -3.4069e+00, -1.6997e-01, -7.9637e-01, -3.5889e+00, -3.9392e+00, 3.1826e-02, -1.2788e+00, -2.0935e+00]], [[ 1.8815e+00, -5.9898e-02, -6.3117e-01, -1.8255e+00, -1.6350e+00, -9.7758e-01, -2.4894e+00, -7.2138e-01, -1.2364e+00, -2.6566e+00, -2.4378e+00, -1.1202e-01]], [[ 3.1313e+00, -2.0298e+00, -2.0075e+00, -2.5929e+00, -1.1114e+00, -3.0691e+00, -4.2317e+00, -2.5273e+00, -9.0887e-01, -2.4346e+00, -4.7511e+00, -1.6434e+00]], [[-3.1563e-01, -2.6880e+00, -2.3410e+00, -1.5023e+00, -1.8566e+00, -1.1782e+00, 1.2911e-02, -3.8597e-01, -2.5923e+00, -1.9650e+00, -1.1864e+00, -1.2319e+00]], [[ 2.5711e+00, -1.9839e+00, -1.3530e+00, -1.9956e+00, -2.0619e+00, -4.4327e-01, -1.6669e+00, -2.8311e+00, -1.8066e+00, -7.2683e-01, -1.7865e+00, -1.8660e+00]], [[ 2.4415e+00, -1.1917e+00, -1.6440e+00, -2.5129e+00, -1.8709e+00, 9.8800e-01, 3.1218e-01, -1.6036e+00, -1.2686e+00, -7.2791e-01, 3.8396e-01, -1.6619e+00]]], [[[ 3.4920e+00, -3.1732e+00, -4.4420e+00, -4.3249e+00, -4.6515e+00, -4.4413e-01, -6.0438e-01, -2.5274e+00, -3.4936e+00, -3.1891e+00, -2.0873e+00, -8.8783e-01]], [[ 4.1168e+00, -1.1234e+00, -2.1121e+00, -1.3833e+00, -1.9541e+00, -4.0857e-01, -6.9819e-01, -4.3862e-01, -3.5977e-01, -2.4496e-01, -1.5212e+00, -3.3269e-01]], [[ 2.8881e+00, 4.4290e-01, -1.8883e+00, -2.5781e+00, -2.1254e+00, -6.3979e-01, -1.9441e-01, -1.6127e-02, -1.2980e+00, -1.1946e+00, -2.2869e+00, -1.0915e+00]], [[ 2.6168e+00, 1.6337e+00, -1.7156e+00, -1.9180e+00, -1.2950e+00, 3.4281e-01, -9.3117e-01, 1.2682e+00, -1.8422e+00, -1.8580e+00, -2.4304e+00, -1.3099e+00]], [[ 2.5456e+00, 5.3595e-01, -2.6288e+00, -9.5903e-01, -1.9419e+00, -4.3717e+00, -3.8494e+00, -1.2378e+00, -2.3761e+00, -2.6505e+00, -3.9345e+00, -3.9976e+00]], [[ 2.1035e-01, -1.5538e+00, -1.2100e+00, -5.9011e-01, -5.7652e-01, -9.4534e-01, -9.1859e-01, -9.5479e-01, 3.7502e-01, -5.7694e-01, -1.3981e+00, -2.2831e+00]], [[ 3.4362e+00, -3.5214e+00, -3.6019e+00, -3.6060e+00, -3.2511e+00, -4.9940e-01, 9.6685e-02, -2.4861e+00, -2.5311e+00, -2.2803e+00, -1.0430e+00, -3.1080e-01]], [[ 2.4958e+00, -5.0894e-01, -1.1198e+00, -1.8054e+00, -1.2334e+00, -1.8454e+00, -9.5007e-01, 3.6733e-01, -8.7472e-01, -7.3080e-01, -2.2308e+00, -1.2029e+00]], [[ 3.8474e+00, -8.1319e-01, -2.2496e+00, -2.4078e+00, -8.9202e-01, -1.3775e+00, -9.3066e-01, 8.8387e-01, -1.6262e-01, 6.8168e-01, -1.8317e+00, -5.5832e-01]], [[ 2.8960e-01, -2.5044e+00, -3.6837e+00, -3.3119e+00, -1.8149e+00, -7.3601e-01, -4.6010e-01, -2.1448e+00, -2.3921e+00, -1.6014e+00, -7.3129e-01, -2.0959e+00]], [[ 3.5124e+00, -1.6891e+00, -1.8554e+00, -2.1787e+00, -1.7702e+00, -3.3048e-01, -8.7981e-01, -1.2889e+00, -1.7164e+00, -1.6179e+00, -2.8761e+00, -9.0942e-01]], [[ 4.8727e+00, -1.4657e+00, -3.8143e-01, -5.8912e-01, -2.9712e-01, 2.7093e-01, 1.5724e+00, -9.3664e-01, 2.5672e-01, 5.4247e-01, -1.8058e+00, 1.4239e+00]]]]) attn_weights tensor([[[[ 1.9204e+00, 6.5704e-01, -9.5680e-01, -2.2240e-02, 6.1985e-01, 1.0406e+00, 3.8839e-01, 5.6717e-01, -7.6675e-01, -1.0984e-01, 8.3896e-01, 6.8430e-01]], [[ 3.6521e+00, -1.0823e+00, -1.5976e+00, -1.7216e+00, -4.3302e-01, 4.5805e-01, 4.7705e-01, -1.4695e-01, -1.6422e+00, -1.1731e+00, 6.2938e-01, 7.5783e-01]], [[ 2.9102e+00, -1.0166e+00, -1.8584e+00, -1.7562e+00, -1.4926e+00, 9.6198e-01, 9.0324e-01, -2.1883e-01, -1.7759e+00, -1.2398e+00, 1.7364e-01, 4.9041e-01]], [[ 1.4727e+00, -1.9995e-01, -1.1691e+00, -1.7380e+00, -8.9498e-01, -1.2853e+00, -6.8949e-01, -6.1462e-01, -1.6437e+00, -2.4877e+00, -1.2579e+00, -1.8458e+00]], [[ 2.5600e+00, -9.9111e-01, -1.5815e+00, -1.4419e+00, -1.2232e+00, -1.4893e-01, -1.2917e+00, -1.0914e+00, -1.6249e+00, -1.2881e+00, -2.2449e-02, -3.9191e-01]], [[ 3.9244e+00, -5.5774e-01, -6.8679e-01, -9.6446e-01, -1.4368e+00, 2.3234e+00, 3.7751e+00, -6.9828e-01, -1.0908e+00, -1.3442e+00, 4.5088e-01, 6.0029e-01]], [[ 3.1409e+00, -1.4793e+00, -2.6745e+00, -2.2849e+00, -2.1480e+00, -6.7391e-02, -1.1107e+00, -1.2736e+00, -2.8298e+00, -2.3152e+00, -1.1489e+00, -9.0869e-01]], [[ 3.7616e+00, -2.0967e-01, -1.0014e+00, -1.6336e+00, -4.1072e-01, 2.1599e+00, 4.5686e-01, 1.2521e-01, -1.0012e+00, -1.4175e+00, 2.8875e-01, 1.3581e+00]], [[-1.6028e+00, 2.4030e+00, 3.4062e+00, 2.8856e+00, 2.1874e+00, 2.3758e+00, 2.1219e+00, 2.4118e+00, 3.9658e+00, 3.6927e+00, 3.0686e+00, 2.2405e+00]], [[ 3.9181e+00, -1.1866e+00, -3.0715e+00, -2.7272e+00, -3.1241e+00, 1.7777e+00, 1.1919e+00, -1.3255e+00, -3.1414e+00, -2.4390e+00, -5.0461e-01, -1.2534e+00]], [[ 2.6932e+00, -3.8805e-02, -9.8603e-01, -7.6984e-01, -8.4498e-01, 3.2951e+00, 2.1565e+00, 1.0082e+00, -1.0337e+00, -4.7441e-01, 2.3361e+00, 1.3191e+00]], [[ 3.5577e+00, 4.2467e-01, -1.1143e+00, -1.0893e+00, 3.4489e-01, 1.7215e+00, 5.1861e-01, 4.6919e-01, -1.3635e+00, -1.5447e+00, 1.2195e+00, 2.9026e-01]]], [[[ 1.3303e+00, 1.2622e+00, 3.4920e-01, 2.5183e-02, 1.2844e+00, 5.6652e-01, 2.7818e-01, 6.8715e-01, 1.5315e+00, 6.8808e-01, -2.9789e-02, 1.1947e+00]], [[ 3.9101e+00, -8.6750e-01, -1.4476e+00, -9.9601e-01, -6.9710e-01, -9.3624e-01, -2.2598e-01, -5.4075e-01, -1.9793e-01, -1.2632e+00, -1.4820e+00, -4.9227e-01]], [[ 3.2502e+00, -6.9077e-02, -1.7241e+00, -2.2429e+00, -2.2635e+00, -9.7561e-02, -7.1293e-01, -3.7551e-01, -1.5778e+00, -2.7227e+00, -2.6857e+00, -2.4909e+00]], [[ 1.5612e+00, -3.5098e-01, -1.4582e+00, -1.6088e+00, -1.2345e+00, -1.1593e+00, -8.3413e-01, -9.2294e-02, -6.8130e-01, -2.0426e+00, -2.1484e+00, -2.2062e+00]], [[ 2.1837e+00, -7.5455e-01, -9.2849e-01, -1.5268e+00, -9.4687e-01, -2.1069e+00, -2.3428e+00, -8.4584e-01, -1.0501e+00, -1.2394e+00, -1.9341e+00, -2.0117e+00]], [[ 4.4019e+00, -1.0155e-01, -1.9126e+00, -1.4891e+00, -9.5969e-01, 6.4089e-01, 1.4660e+00, 2.7283e-01, -7.2133e-01, -2.5931e+00, -2.4153e+00, -9.7251e-01]], [[ 3.3118e+00, -1.2227e+00, -1.9302e+00, -1.3773e+00, -9.4095e-01, -8.1005e-01, -1.4819e+00, -1.2076e+00, -1.1381e+00, -2.2458e+00, -1.9911e+00, -1.0556e+00]], [[ 3.8267e+00, 1.1103e+00, -2.0790e+00, 2.3613e-01, 4.4083e-01, 1.2959e+00, 4.4305e-01, 1.8058e+00, 1.1832e+00, -1.7614e+00, -2.7662e-01, 2.1528e+00]], [[-4.5950e+00, 4.1415e+00, 3.2346e+00, 3.7545e+00, 4.2463e+00, 4.3858e+00, 3.9505e+00, 3.9090e+00, 4.0158e+00, 2.6549e+00, 4.2693e+00, 3.9714e+00]], [[ 4.2659e+00, -8.3855e-01, -2.0198e+00, -1.6599e+00, -1.8189e+00, -1.1267e-02, -8.9047e-02, -5.7768e-01, -9.8298e-01, -2.5508e+00, -2.3085e+00, -6.2036e-01]], [[ 4.0734e+00, 1.2656e+00, -4.6997e-02, 1.6221e-01, 1.9199e-02, 4.3717e-01, 1.1314e-01, 1.6588e+00, 1.5672e+00, -8.5237e-01, 1.7421e-02, 3.3166e-03]], [[ 2.2265e+00, 2.3207e+00, -1.6690e-01, -4.4523e-01, -5.2071e-01, 8.9134e-01, -9.9047e-02, 3.4847e+00, 1.6718e+00, -7.9769e-01, -2.8495e-01, -7.9851e-01]]], [[[ 1.2467e+00, 7.6462e-01, 2.5874e-01, 5.2915e-01, 6.9489e-01, 9.0070e-01, 6.8526e-01, 7.8289e-01, 8.6952e-01, 3.5294e-01, -1.2195e+00, 3.9667e-01]], [[ 3.9237e+00, -1.6829e+00, -1.0634e+00, -7.7351e-01, -1.6953e+00, -1.4350e+00, -6.6116e-01, -9.4644e-01, -1.5523e+00, -9.8496e-01, -1.5670e+00, -1.5062e+00]], [[ 3.7656e+00, -1.2170e+00, -2.2216e+00, -1.8213e+00, -1.8592e+00, -1.5795e+00, -4.2459e-01, -1.5255e+00, -1.9543e+00, -2.1220e+00, -1.9422e+00, -2.4686e+00]], [[ 1.1192e+00, -2.1783e+00, -1.0141e+00, -2.6895e+00, -2.5906e+00, 7.6851e-01, -5.0155e-02, -6.4681e-01, -1.5063e+00, -3.5371e-01, -3.7277e+00, -1.4598e+00]], [[ 2.0336e+00, -1.3727e+00, -1.8991e+00, -9.1625e-01, -1.6363e+00, -2.1083e+00, -1.9041e+00, -1.3642e+00, -9.2956e-01, -1.3193e+00, -2.0958e+00, -1.6216e+00]], [[ 4.2474e+00, -1.8398e-01, 2.4805e-01, -1.2689e+00, 7.2495e-01, -1.0086e+00, 9.3103e-01, 2.8115e-02, 3.7321e-01, 1.0045e+00, -8.5628e-01, 8.0918e-01]], [[ 3.5349e+00, -2.3692e+00, -2.4031e+00, -2.3057e+00, -2.6824e+00, -1.5887e+00, -1.1845e+00, -2.3888e+00, -2.2924e+00, -2.6114e+00, -1.9203e+00, -1.9872e+00]], [[ 5.3366e+00, -4.8779e-01, -1.5634e+00, -2.2662e+00, -1.1097e+00, -2.7942e-01, -5.7078e-01, -1.4513e+00, -1.9834e+00, -2.5169e+00, -1.1499e+00, -1.9929e+00]], [[-4.7064e+00, 3.0355e+00, 5.5650e+00, 4.2064e+00, 3.2663e+00, 3.5431e+00, 3.5007e+00, 3.9417e+00, 3.8342e+00, 5.3827e+00, 1.9469e+00, 4.1281e+00]], [[ 4.9536e+00, -5.7524e-01, -7.4140e-01, -1.1469e+00, -9.5872e-01, -2.1662e+00, -4.3415e-01, -1.4929e-01, 3.6187e-01, 3.7530e-01, -1.5388e-01, 9.6830e-01]], [[ 3.1913e+00, -4.2257e-02, 2.7056e+00, 5.1162e-01, -2.9907e-01, -6.9217e-01, -4.8379e-01, 6.0351e-01, 9.0266e-01, 2.8258e+00, 8.6856e-01, 1.5076e+00]], [[ 2.7821e+00, -5.9954e-01, 1.7405e+00, -2.0048e-01, -1.0991e+00, 1.4426e+00, 9.2728e-01, 6.1678e-02, -2.8406e-02, 2.0636e+00, -6.0739e+00, 9.2272e-01]]], [[[ 1.8189e+00, 2.7523e+00, 1.1840e+00, 1.1285e+00, 1.4928e+00, 9.2381e-01, 1.1851e+00, 1.4256e+00, 1.3032e+00, 6.1060e-01, 1.2458e+00, 2.7666e+00]], [[ 2.8227e+00, 5.5998e-01, -6.0588e-01, -5.4412e-02, 2.7137e-01, -3.2912e-01, -4.2255e-01, -5.0347e-02, -2.2893e-01, -6.2221e-01, -1.1418e+00, 9.1055e-02]], [[ 2.7297e+00, 1.1863e-01, -1.3908e+00, -2.0611e+00, -1.9439e+00, -1.8740e-01, -7.9908e-01, -8.5438e-01, -1.6538e+00, -4.3587e-01, -1.8363e+00, 3.8976e-01]], [[ 8.4713e-01, -7.6074e-01, -1.9332e+00, -2.0855e+00, -1.9608e+00, 1.0088e-01, 5.7645e-01, -2.5828e-01, -1.6816e+00, -7.2439e-02, -6.6387e-02, -2.1183e-01]], [[ 1.9949e+00, -3.3209e-01, -1.8244e-01, -1.1158e+00, -6.4373e-01, -1.3799e+00, -2.7709e+00, -1.4557e+00, -7.7607e-01, -1.3673e+00, -2.8642e+00, -1.2239e+00]], [[ 3.1128e+00, 2.1261e+00, 3.6145e-01, 9.0760e-01, -3.3609e-01, 9.9053e-01, 2.0161e+00, 1.5879e+00, -2.2428e-01, -1.5266e-01, 1.5634e+00, 1.5508e+00]], [[ 3.0255e+00, -5.9560e-01, -1.7793e+00, -7.4310e-01, -1.4148e+00, -6.6884e-02, -1.4637e+00, -1.1933e+00, -1.4008e+00, -5.3803e-01, -1.9486e+00, -1.2097e+00]], [[ 2.8314e+00, 1.2881e+00, 2.7510e-02, 4.6888e-01, 5.2815e-01, 2.0060e+00, 7.8482e-01, 1.1423e+00, 2.8178e-01, 5.7431e-01, 6.8562e-02, 1.2432e+00]], [[-4.4901e+00, 3.9100e+00, 3.0297e+00, 2.2987e+00, 2.6609e+00, 3.2210e+00, 3.8054e+00, 4.1053e+00, 1.2988e+00, 1.4441e+00, 2.4442e+00, 5.1134e+00]], [[ 3.3181e+00, 3.4332e-02, -1.3921e+00, -1.6678e+00, -1.9922e+00, 2.5659e-01, 2.1347e-01, -8.5868e-01, -1.4837e+00, 1.0598e+00, -3.7379e-01, 4.4771e-02]], [[ 2.4405e+00, 1.2000e+00, 1.7472e-01, -3.5208e-01, -2.1857e-01, 4.7463e-01, -8.4832e-01, 9.2549e-01, -1.5057e-01, -7.0946e-01, -9.0735e-01, 1.1180e+00]], [[ 1.9551e+00, 3.7714e-01, -9.9529e-01, 1.3580e-01, -1.2006e+00, 1.2803e+00, 8.4054e-01, 4.3604e-01, -6.3566e-01, 3.2042e-01, 1.7944e-01, -2.9925e-01]]], [[[ 1.5480e+00, 2.5080e+00, 3.6895e-01, 5.7667e-01, 1.2750e+00, 1.3524e+00, 6.4713e-01, 1.7344e+00, 9.7073e-01, 1.5340e+00, 8.1818e-02, 8.0299e-01]], [[ 3.6486e+00, 1.1420e-01, -4.7165e-01, 9.9037e-02, 2.8591e-01, -6.4528e-01, 2.0629e-01, 6.1376e-01, 4.9987e-01, -3.2944e-01, -7.0110e-01, -2.0656e-02]], [[ 3.4828e+00, 7.5889e-01, -1.4809e+00, -1.9435e+00, -1.7273e+00, -3.8180e-01, 3.1604e-02, 5.2100e-01, -1.6224e+00, -1.4120e+00, -2.0154e+00, -6.4472e-01]], [[ 1.4320e+00, -2.9610e-01, -2.2663e+00, -1.8838e+00, -8.6406e-01, -1.4993e+00, -1.1812e+00, -6.9860e-01, -2.5826e+00, -2.0965e+00, -8.1506e-01, -1.9120e+00]], [[ 2.0663e+00, 2.1946e-01, -4.0338e-01, -9.8481e-01, -5.5050e-01, -1.9352e+00, -2.1314e+00, -1.6419e-01, -1.8241e+00, -1.1538e+00, -2.6295e+00, -1.6534e+00]], [[ 4.0539e+00, 1.5265e+00, -1.1809e+00, 1.5703e-01, 4.1219e-01, -4.6125e-01, 1.8607e+00, 1.7640e+00, 1.0860e+00, 3.0328e-01, -8.7198e-01, 1.7295e+00]], [[ 3.4801e+00, -9.3587e-01, -1.8884e+00, -8.8270e-01, -1.4622e+00, -4.4653e-01, -7.3164e-01, -9.5342e-01, -7.6961e-01, -1.0477e+00, -2.6006e+00, -1.8338e+00]], [[ 3.7782e+00, 2.4089e+00, 1.4172e-01, 6.5722e-01, 3.6053e-01, 1.1043e+00, 9.6491e-01, 1.7856e+00, 1.0960e+00, 2.7478e-01, -5.3829e-01, 1.4844e+00]], [[-7.2121e+00, 2.2945e+00, 1.7397e+00, 1.2075e+00, 7.8289e-01, 2.1170e+00, 2.5324e+00, 1.6305e+00, 6.2018e-01, -2.2392e+00, 3.5515e-01, 6.1831e-01]], [[ 4.1341e+00, -1.5593e-02, -1.0914e+00, -1.3547e+00, -1.3388e+00, -2.4917e-01, 6.2770e-01, 5.9936e-01, 8.0263e-01, 4.4953e-01, -1.0783e+00, 6.1922e-01]], [[ 2.8370e+00, 8.8263e-01, -1.4703e+00, -1.2493e+00, 6.1449e-02, 5.8716e-01, 4.1184e-01, 1.3835e+00, 3.3774e-01, 8.2970e-01, -2.1133e-01, -1.5617e-01]], [[ 2.6665e+00, 2.0555e+00, -9.4796e-01, -3.2060e-01, 2.0589e-01, 3.2563e-01, -1.3584e-01, 1.9392e+00, -3.4564e-01, 1.9260e-01, -7.1705e-01, -6.6488e-01]]]]) attn_weights tensor([[[[-1.1526e+00, -2.0852e+00, -2.4680e+00, -2.0501e+00, -2.7300e+00, -2.3921e+00, -1.3029e+00, -2.1593e+00, -2.4931e+00, -1.9604e+00, -2.6107e+00, -2.5496e+00, -2.2340e+00]], [[ 2.5831e+00, -4.9413e-01, -1.4965e-01, 3.2499e-01, 1.1993e+00, 1.5223e+00, -3.5264e-01, -1.5251e+00, -6.7945e-01, -2.2441e-03, 8.3734e-01, 9.1956e-01, 6.9637e+00]], [[-1.1987e+00, -2.1584e+00, -2.1512e+00, -2.6184e+00, -2.4289e+00, -2.5926e+00, -2.5361e+00, -2.4806e+00, -2.3115e+00, -2.7091e+00, -2.0971e+00, -2.4718e+00, -2.7060e+00]], [[-9.9438e-01, -6.0534e+00, -6.1964e+00, -6.0436e+00, -5.1990e+00, -3.6851e+00, -3.2660e+00, -3.3949e+00, -2.6850e+00, -2.4790e+00, 4.4782e-01, -6.6474e-01, 4.3227e+00]], [[ 5.3595e-01, -2.4091e+00, -2.8342e+00, -1.4133e+00, -1.2035e+00, -8.2153e-01, -1.1933e+00, -1.7406e+00, -1.7909e+00, -7.5521e-02, 3.6041e-01, 6.8599e-01, 2.6649e+00]], [[ 7.1037e+00, 2.6099e+00, 3.2520e+00, 2.0534e+00, 1.6513e+00, 1.9740e+00, 1.6093e+00, -2.2608e-01, 1.6056e+00, 8.3263e-01, 1.6967e+00, 4.8837e-01, 1.0951e+01]], [[-1.7272e-01, -3.8716e+00, -3.4097e+00, -2.3088e+00, -4.0492e+00, -1.6443e+00, -1.4970e+00, -4.3760e+00, -3.5110e+00, -2.2262e+00, -1.3320e+00, -3.9981e+00, -1.8422e+00]], [[-5.4001e+00, -6.8876e+00, -6.7884e+00, -6.6393e+00, -6.2514e+00, -6.4491e+00, -5.8079e+00, -5.0806e+00, -4.6289e+00, -4.5349e+00, -4.3133e+00, -3.5016e+00, -4.2198e+00]], [[-3.1215e+00, -2.8376e+00, -3.2640e+00, -3.7772e+00, -2.1802e+00, -4.1911e+00, -3.0452e+00, -2.6170e+00, -3.0665e+00, -3.6018e+00, -4.0294e+00, -1.8455e+00, -3.6659e+00]], [[-1.7184e+00, -2.1098e+00, -2.2561e+00, -2.6753e+00, -2.3166e+00, -2.6807e+00, -2.6722e+00, -2.2911e+00, -2.3514e+00, -2.6947e+00, -2.5433e+00, -2.2510e+00, -2.6658e+00]], [[ 6.7607e-01, 1.8846e-01, -2.0569e-01, -4.7392e-01, 1.0593e-01, -4.5408e-01, -6.7618e-01, -1.0171e-01, -4.9444e-01, -7.0857e-01, -4.1738e-01, -4.7583e-02, 1.1996e+00]], [[-1.0977e+00, -2.1049e+00, -3.2122e+00, -2.6511e+00, -2.6738e+00, -2.6083e+00, -2.1281e+00, -2.0187e+00, -3.3361e+00, -2.6836e+00, -2.6516e+00, -2.7049e+00, -2.3192e+00]]], [[[-1.1154e+00, -3.1742e+00, -2.0543e+00, -1.5408e+00, -3.3054e+00, -2.5668e+00, -2.4117e+00, -3.2597e+00, -3.2409e+00, -1.7807e+00, -1.1564e+00, -1.7889e+00, -3.6310e+00]], [[-1.5745e+00, 7.6572e-01, -1.9745e+00, -4.7290e+00, -1.2280e+00, -3.9334e+00, -4.7180e+00, 3.5264e-01, 1.6297e+00, -2.6865e+00, -5.3761e+00, -2.3602e+00, 4.8846e+00]], [[-1.9479e+00, -2.2512e+00, -2.6884e+00, -2.6146e+00, -3.2713e+00, -3.1418e+00, -2.8472e+00, -2.4636e+00, -2.0371e+00, -2.8128e+00, -2.6481e+00, -2.2386e+00, -1.4620e+00]], [[-3.3110e+00, -5.0542e+00, -6.4723e+00, -6.6866e+00, -4.2632e+00, -4.3316e+00, -4.7241e+00, -2.6192e+00, -2.1059e+00, -2.4568e+00, -2.3702e+00, -3.6582e-01, 1.8993e+00]], [[-1.8895e+00, -4.1526e+00, -4.4630e+00, -2.8962e+00, -3.0426e+00, -2.1817e+00, -1.8782e+00, -2.9182e+00, -2.0246e+00, -2.4006e+00, -5.6145e-01, 2.2710e+00, 2.1255e-01]], [[ 1.8320e+00, 2.6310e+00, 2.3283e+00, 2.0344e+00, 4.0044e+00, 9.4246e-01, -6.6706e-02, 1.7049e+00, 2.2927e+00, 1.3558e+00, 1.3087e+00, 1.6764e+00, 4.5248e+00]], [[-9.8111e-01, -4.2936e+00, -3.8625e+00, -2.6188e+00, -4.5619e+00, -2.0435e+00, -2.1001e+00, -4.7118e+00, -4.3327e+00, -3.6798e+00, -2.2154e+00, -1.6662e+00, -5.1052e-01]], [[-6.3645e+00, -7.8117e+00, -7.4810e+00, -7.4417e+00, -7.2142e+00, -7.0799e+00, -6.7049e+00, -5.8556e+00, -5.3835e+00, -4.7255e+00, -4.6988e+00, -3.9110e+00, -4.0767e+00]], [[-3.6331e+00, -1.6112e+00, -2.8616e+00, -3.6640e+00, -1.0217e+00, -3.3345e+00, -3.5791e+00, -8.4420e-01, -6.5595e-01, -2.3981e+00, -3.2832e+00, -3.2699e+00, -3.8125e-01]], [[-1.4479e+00, -1.6632e+00, -1.7483e+00, -2.3126e+00, -1.7435e+00, -2.4110e+00, -2.5689e+00, -1.7722e+00, -1.5770e+00, -1.7791e+00, -2.2913e+00, -1.9076e+00, -1.4381e+00]], [[ 6.1764e-01, 6.9097e-01, 6.6049e-01, -3.5332e-02, 6.8838e-01, -3.1323e-01, -5.0654e-01, 5.1226e-01, 6.8807e-01, 4.2845e-01, -2.6215e-01, 1.7388e-01, 8.6986e-01]], [[-1.5573e+00, -2.2392e+00, -3.5826e+00, -2.4646e+00, -2.6543e+00, -2.6220e+00, -2.1904e+00, -2.1784e+00, -2.2303e+00, -3.7199e+00, -2.4376e+00, -2.4775e+00, -2.1873e+00]]], [[[-5.1274e-01, -2.1069e+00, -1.6119e+00, -1.3376e+00, -2.2217e+00, -1.6789e+00, -1.9340e+00, -2.2237e+00, -1.8704e+00, -1.5646e+00, -1.6787e+00, -2.2418e+00, -2.2742e+00]], [[ 1.7261e+00, 1.8501e-01, 1.6120e+00, 1.9637e+00, 9.0752e-01, -1.7737e+00, -2.7337e-01, -1.0142e+00, 6.1971e-01, 9.2021e-01, 3.1429e+00, 1.4817e+00, 8.1717e+00]], [[-1.5711e+00, -2.4982e+00, -2.4974e+00, -1.9407e+00, -2.6354e+00, -2.1186e+00, -2.4602e+00, -2.6853e+00, -2.2296e+00, -2.5546e+00, -2.0162e+00, -2.6572e+00, -2.2173e+00]], [[-3.2890e+00, -7.0387e+00, -6.7342e+00, -5.9970e+00, -6.1061e+00, -6.5541e+00, -4.8733e+00, -3.7887e+00, -2.3906e+00, -2.0782e+00, 3.0472e-01, -2.0296e-01, 3.7903e+00]], [[-1.1180e-01, -2.2927e+00, -2.8484e+00, -2.6283e+00, -2.1424e+00, -2.5231e+00, -1.5661e+00, -1.3758e+00, -9.1531e-01, -1.0078e+00, 7.0500e-02, -1.1619e+00, 1.5034e+00]], [[ 6.0245e+00, 3.0714e+00, 4.3486e+00, 3.7638e+00, 1.8954e+00, 2.5866e-01, 1.8554e+00, 4.0172e-01, 1.4471e+00, 2.6472e+00, 5.8989e+00, 3.0391e+00, 1.1060e+01]], [[-2.5210e-01, -3.1764e+00, -3.4025e+00, -1.9295e+00, -3.3844e+00, -1.0693e+00, -1.2726e+00, -3.4747e+00, -2.5019e+00, -3.4463e+00, -1.4660e+00, -2.0061e+00, -1.6279e+00]], [[-5.1228e+00, -6.4802e+00, -6.2048e+00, -6.4850e+00, -5.9117e+00, -5.8151e+00, -6.4570e+00, -4.6125e+00, -4.6777e+00, -3.5177e+00, -3.4209e+00, -3.5389e+00, -3.1906e+00]], [[-2.5333e+00, -2.3390e+00, -2.3649e+00, -3.5841e+00, -2.4901e+00, -3.1884e+00, -3.2966e+00, -2.0947e+00, -2.4880e+00, -2.0538e+00, -2.8342e+00, -3.3384e+00, -3.0767e+00]], [[-2.0549e+00, -2.3497e+00, -2.4931e+00, -2.8619e+00, -2.4938e+00, -2.7717e+00, -2.9646e+00, -2.4273e+00, -2.2229e+00, -2.4768e+00, -2.7019e+00, -2.6873e+00, -2.6634e+00]], [[ 6.9078e-01, 1.7478e-01, 2.6405e-01, -4.7653e-02, -4.3243e-02, -1.1204e+00, -8.2263e-01, -4.2666e-02, 1.6581e-01, 1.0839e-01, 9.1829e-02, -3.1314e-02, 1.0151e+00]], [[-1.4226e+00, -2.3673e+00, -3.2538e+00, -2.3848e+00, -2.7741e+00, -2.6842e+00, -2.3107e+00, -2.2703e+00, -2.2606e+00, -3.2675e+00, -2.5988e+00, -2.1835e+00, -2.7664e+00]]], [[[-4.9900e-01, -2.3190e+00, -1.2200e+00, -1.5923e+00, -2.9071e+00, -2.0157e+00, -2.4472e+00, -2.4767e+00, -2.8711e+00, -1.6728e+00, -2.2936e+00, -2.3690e+00, -8.4053e-01]], [[ 1.0454e+00, 1.1538e+00, 5.4525e+00, 5.0064e-01, 2.5088e+00, 2.5771e-01, 2.2333e-01, 5.0794e-02, 2.1505e+00, 7.2349e-01, -4.9651e-02, 9.8848e-01, 9.0502e+00]], [[-1.1245e+00, -2.0640e+00, -1.5902e+00, -9.7497e-01, -2.6689e+00, -2.2555e+00, -2.8870e+00, -2.3169e+00, -2.7628e+00, -2.7053e+00, -2.9118e+00, -1.4978e+00, -1.7818e+00]], [[-3.6533e+00, -7.0178e+00, -6.3025e+00, -5.1501e+00, -6.0587e+00, -7.4047e+00, -6.6083e+00, -3.5907e+00, -3.0913e+00, -4.7309e+00, -3.9183e+00, -1.5737e+00, 3.4356e+00]], [[ 2.8940e-02, -1.3129e+00, -9.6907e-01, 1.0164e-01, -4.1869e-01, -7.5222e-01, -1.1596e-01, 1.5157e-02, 7.2024e-01, 5.1802e-01, 1.0447e+00, 1.8209e+00, 3.1101e+00]], [[ 5.6087e+00, 2.6650e+00, 5.7724e+00, 3.0509e+00, 2.3473e+00, 1.2541e+00, -3.6578e-01, 2.9543e-01, 1.6378e+00, -1.7668e-01, -9.1386e-01, 3.0993e+00, 9.7582e+00]], [[ 6.3243e-01, -2.7398e+00, -2.5916e+00, -1.2173e+00, -2.7841e+00, -8.6451e-01, -4.8699e-01, -3.0412e+00, -2.7818e+00, -2.4870e-01, -3.6053e-01, -8.3616e-01, -2.3778e+00]], [[-5.1963e+00, -6.5233e+00, -6.3825e+00, -5.9373e+00, -5.9587e+00, -6.0746e+00, -6.0826e+00, -4.4955e+00, -4.3036e+00, -4.7512e+00, -4.4735e+00, -2.1422e+00, -2.6630e+00]], [[-2.0965e+00, -9.9065e-01, -1.3157e+00, -2.3774e+00, -7.3975e-01, -2.6308e+00, -2.8904e+00, -5.2116e-01, -5.4191e-01, -2.4821e+00, -2.7506e+00, -1.8232e+00, -1.2668e+00]], [[-1.5973e+00, -1.8502e+00, -1.7039e+00, -2.3138e+00, -2.0232e+00, -2.6065e+00, -2.6970e+00, -1.9124e+00, -1.9998e+00, -2.6073e+00, -2.6414e+00, -1.6793e+00, -1.6521e+00]], [[ 8.6215e-01, 7.1558e-01, 1.0238e+00, 2.3979e-01, 6.1251e-01, -2.6164e-01, -3.9153e-01, 5.1848e-01, 4.6557e-01, -3.8323e-01, -5.2450e-01, 4.5808e-01, 1.9313e+00]], [[-1.6172e+00, -2.3015e+00, -3.6032e+00, -2.5902e+00, -2.7904e+00, -2.6396e+00, -2.3843e+00, -2.1961e+00, -2.7666e+00, -1.9770e+00, -2.3379e+00, -2.3099e+00, -3.1936e+00]]], [[[-1.2967e+00, -4.2521e+00, -2.2967e+00, -2.4058e+00, -3.8062e+00, -2.9188e+00, -3.5834e+00, -4.4924e+00, -3.1641e+00, -3.4990e+00, -2.5524e+00, -3.3441e+00, -4.5852e+00]], [[-1.8559e+00, 5.6544e-01, -2.6926e+00, -3.8142e+00, -4.0039e+00, -6.6778e+00, -4.8485e+00, 3.5246e-01, -5.2088e+00, -5.8228e+00, -6.6297e+00, -5.0526e+00, 3.8553e+00]], [[-1.5294e+00, -2.9050e+00, -1.8346e+00, -1.4006e+00, -3.8323e+00, -3.6159e+00, -3.3002e+00, -3.0741e+00, -2.9443e+00, -3.8398e+00, -3.6483e+00, -3.2585e+00, -2.9152e+00]], [[-2.4377e+00, -4.2854e+00, -5.0547e+00, -3.2933e+00, -4.0997e+00, -3.4501e+00, -2.3952e+00, -1.6782e+00, -6.7624e-01, -9.3061e-01, -1.0254e+00, 5.5918e-01, 1.1504e+00]], [[-1.1045e+00, -2.0096e+00, -2.4522e+00, -1.7730e+00, -1.9017e+00, -2.1116e+00, -1.1877e+00, -7.6380e-01, -6.2992e-02, -1.9055e-01, -2.5648e-01, 3.7322e-01, 1.2804e+00]], [[ 1.4668e+00, 2.5038e+00, 2.5599e+00, 1.6961e+00, 1.8971e+00, -9.7380e-02, -3.3484e-01, 1.8569e+00, 6.1853e-01, 1.1964e+00, -1.1897e+00, -6.1394e-01, 2.7861e+00]], [[-6.3558e-01, -4.9354e+00, -4.4373e+00, -2.6606e+00, -4.9034e+00, -2.2877e+00, -1.8105e+00, -5.5579e+00, -4.1826e+00, -4.3333e+00, -1.8182e+00, -1.5760e+00, -5.6761e+00]], [[-6.1633e+00, -7.4938e+00, -6.6967e+00, -6.8950e+00, -6.6804e+00, -7.1100e+00, -6.6032e+00, -5.5666e+00, -4.8263e+00, -4.6764e+00, -4.7725e+00, -4.5448e+00, -3.2234e+00]], [[-4.0049e+00, -1.7818e+00, -3.5868e+00, -4.9529e+00, -2.3275e+00, -4.9898e+00, -4.8216e+00, -1.2821e+00, -3.7038e+00, -2.8230e+00, -4.5619e+00, -4.6147e+00, -7.4924e-01]], [[-1.4826e+00, -1.8076e+00, -1.7864e+00, -2.2729e+00, -2.0332e+00, -2.5627e+00, -2.6701e+00, -1.9449e+00, -2.0594e+00, -2.1467e+00, -2.4669e+00, -2.6060e+00, -1.7477e+00]], [[ 2.6303e-01, 9.3742e-02, -1.0793e-01, -3.9520e-01, -3.1771e-01, -7.2411e-01, -7.5384e-01, 1.4598e-02, -4.5423e-01, -5.5514e-01, -9.3810e-01, -7.8883e-01, 3.5951e-01]], [[-1.3695e+00, -2.0587e+00, -3.3833e+00, -2.2425e+00, -2.5618e+00, -2.3645e+00, -2.0485e+00, -2.0453e+00, -2.2373e+00, -2.5164e+00, -2.0978e+00, -2.0224e+00, -1.8003e+00]]]]) attn_weights tensor([[[[-2.4581, -3.7180, -3.7607, -3.3199, -1.9208, -2.6160, -1.8729, -1.3274, -1.8147, -1.5185, -0.5677, 0.6508, -0.7645]], [[-0.8370, -2.0131, -2.3641, -2.1189, -2.1189, -2.4261, -1.7820, 0.0075, -0.5247, -0.3816, -0.5882, 0.0545, -0.4370]], [[-2.8705, -3.7515, -3.4207, -3.7984, -3.2170, -3.4398, -3.0182, -2.3882, -2.6581, -3.0718, -2.5271, -2.5063, -2.7166]], [[ 0.0612, -2.9985, -2.8499, -2.8619, -2.7749, -2.5359, -2.3467, -2.2239, -2.2810, -2.3613, -1.9119, -2.1820, -2.1649]], [[-0.5794, -2.4458, -2.7299, -2.7039, -2.6111, -2.1083, -2.0066, -2.0324, -2.2360, -2.2093, -1.5991, -2.0081, -1.7674]], [[ 0.4988, -0.3649, -2.7749, -0.7363, -0.7405, -1.9758, -2.1284, -0.5636, -3.0106, -1.0900, -0.9908, -0.9234, -0.2907]], [[ 0.6294, -1.5439, -1.9377, -1.6546, -1.8484, -1.0008, -1.6832, -1.7888, -2.2959, -2.2605, -0.4521, -2.1136, -0.7223]], [[-0.1669, -2.3001, -2.3423, -2.6960, -2.6874, -1.7162, -1.7520, -1.9480, -2.2563, -2.8182, -1.9706, -2.4034, -2.7415]], [[-0.7936, -1.8595, -2.0389, -2.3616, -1.9761, -2.4174, -2.6882, -1.8842, -1.9165, -2.2121, -2.3195, -1.8495, -2.2982]], [[ 1.2330, -0.4267, -0.1628, -0.2207, 0.5237, -0.7964, -1.3720, -0.6836, -0.2085, -0.1393, -1.2478, 0.4204, -0.5341]], [[-5.3878, -2.2290, -2.1406, -2.0969, -2.1099, -1.6460, -1.4471, -1.5760, -1.5129, -1.5194, -0.8361, -1.4214, -1.1804]], [[ 1.7089, 0.4207, -3.0809, -2.3369, -1.7406, -2.1811, -3.0809, 0.7362, -3.2983, -2.3275, -1.2012, -1.7408, 4.2450]]], [[[-1.7936, -4.2901, -3.5819, -3.0863, -2.8722, -3.6915, -3.4161, -2.0057, -2.2421, -1.4179, -0.9551, 1.6002, -1.5662]], [[-0.1292, -1.2301, -1.7214, -1.6264, -1.2393, -1.5168, -1.3483, 0.3590, 0.2885, -0.0648, 0.0215, -0.0483, 0.1874]], [[-2.9892, -3.8630, -3.5699, -3.8997, -3.2746, -3.5668, -3.1686, -2.5469, -2.7292, -2.7791, -3.0976, -2.8940, -2.3056]], [[ 0.0513, -3.0746, -2.9733, -2.9986, -2.8576, -2.6911, -2.4774, -2.3359, -2.3603, -2.3349, -2.4157, -2.2305, -2.0347]], [[-0.6423, -2.6006, -2.7804, -2.7260, -2.5383, -2.2163, -2.1011, -2.1135, -2.2180, -2.1233, -2.0985, -1.6962, -1.6632]], [[ 0.7599, -0.4976, -1.9454, -1.2815, -0.6269, -2.6117, -3.0486, -0.4911, -0.3368, -2.1962, -1.6385, -1.3695, 1.9888]], [[ 0.8209, -1.3980, -1.6975, -1.2443, -0.7283, -1.3524, -1.9468, -1.3847, -1.2268, -1.8759, -1.5760, -0.2822, -1.4794]], [[ 0.8594, -1.0279, -1.8574, -1.4617, -1.2557, -0.8060, -0.5531, -0.7605, -1.0385, -1.9083, -1.5836, -1.0033, -0.5021]], [[-0.3692, -1.3246, -1.8202, -1.9351, -1.5266, -2.1321, -2.3474, -1.4145, -1.6363, -1.7871, -1.8589, -2.0793, -1.5145]], [[ 1.4581, -0.5476, -0.0996, -0.4604, 0.3188, -1.1782, -1.1011, -0.9076, -0.6920, -0.2654, -0.4991, -0.3065, -0.6865]], [[-4.9544, -2.3177, -2.2417, -2.2042, -2.1933, -1.7725, -1.6056, -1.6708, -1.6688, -1.5107, -1.5103, -1.2744, -1.1571]], [[ 1.5181, 0.3954, -1.9914, -3.2766, -0.8059, -3.4770, -3.2734, 0.5321, 0.5962, -1.7650, -2.8785, -2.0857, 3.1847]]], [[[-3.1301, -4.2256, -3.2667, -3.5023, -3.2607, -4.1177, -3.7677, -1.8351, -1.9556, -0.5880, 0.3283, -0.4521, -1.3053]], [[-0.4812, -1.4506, -2.0936, -2.1771, -1.5581, -1.6724, -1.8699, 0.2014, -0.1556, -0.0449, -0.5566, -0.3695, -0.2793]], [[-3.0132, -3.9430, -3.6435, -3.9708, -3.3091, -3.6220, -3.2211, -2.4914, -2.9162, -2.7781, -3.3636, -3.3421, -2.6371]], [[-0.0286, -3.1539, -3.0396, -3.0364, -2.8895, -2.6924, -2.4730, -2.3336, -2.4290, -2.3218, -2.6251, -2.6412, -2.1208]], [[-0.5261, -2.4580, -2.7898, -2.7033, -2.5665, -2.2053, -2.0980, -2.0172, -2.1184, -2.1732, -2.2203, -2.2793, -1.4969]], [[ 0.4697, 0.0105, -1.8000, -0.3809, -0.2697, -3.3658, -2.7318, 0.0282, -0.6757, -2.0744, -0.7176, -0.5277, -0.8673]], [[ 0.2552, -1.1881, -2.2332, -2.6442, -1.6155, -1.6283, -2.1130, -1.2869, -2.6360, -2.6971, -3.0688, -3.2958, -2.1353]], [[ 0.5400, -1.2250, -2.3300, -2.3271, -1.9102, -0.6853, -0.8253, -1.0588, -2.1458, -2.4941, -2.4729, -2.1485, -2.1186]], [[-0.8247, -1.9192, -2.3657, -2.4676, -2.1740, -2.7387, -3.0372, -1.9004, -2.1759, -2.2947, -2.5344, -2.2516, -2.4190]], [[ 1.2651, -0.3351, -0.0655, -0.5074, 0.3826, -0.9673, -1.3371, -0.6218, 0.0468, -0.1258, -0.4087, -0.1073, -0.2744]], [[-5.2202, -2.3510, -2.2973, -2.2631, -2.2010, -1.7924, -1.5700, -1.6816, -1.5292, -1.5432, -1.8209, -1.7684, -1.1079]], [[ 0.5797, 0.2662, -3.3338, -0.7469, -2.6356, -3.4156, -5.1830, 0.5722, -2.7783, -3.3408, -1.5754, -1.0485, 3.9655]]], [[[ 0.8541, -0.7801, -0.5327, 0.0641, -0.4900, -0.6408, -0.4901, 0.3632, 0.6943, -0.1016, 0.1511, 1.3208, 0.9440]], [[-0.9844, -1.9700, -2.5442, -2.2046, -2.2668, -2.0906, -1.5030, -0.4435, -1.0329, -1.3437, -0.5159, 1.0682, -0.3550]], [[-3.0090, -3.9180, -3.4941, -3.9364, -3.2887, -3.6361, -3.2271, -2.5456, -2.8514, -3.2901, -2.7915, -2.3162, -2.4550]], [[ 0.0477, -3.0742, -2.9419, -3.0258, -2.8546, -2.7185, -2.4976, -2.3663, -2.5023, -2.3991, -2.1768, -1.7819, -1.9866]], [[-0.5366, -2.4980, -2.6233, -2.6750, -2.5247, -2.1999, -2.0146, -2.0787, -2.1584, -1.7043, -1.6366, -1.5202, -1.5551]], [[ 1.0748, 0.2575, -0.4627, -0.3829, -0.3934, -3.1337, -2.0405, 0.2122, -0.5494, -3.0372, -2.6991, -1.5937, 0.8724]], [[ 0.7858, -1.5360, -1.6334, -1.8307, -1.2563, -0.5975, -1.4627, -1.8679, -1.4874, -1.9306, -1.7385, -1.0682, -2.1461]], [[ 0.0487, -2.1267, -1.7267, -1.5823, -2.1356, -1.5676, -1.6586, -1.8594, -2.1020, -1.7169, -1.9906, -1.3267, -2.1132]], [[-0.2283, -0.9783, -1.7979, -1.6892, -1.3331, -1.8619, -2.1445, -1.2017, -1.3475, -2.3396, -2.0077, -1.2079, -1.5707]], [[ 1.2787, -0.3385, -0.1474, -0.5054, 0.5328, -1.2554, -1.3510, -0.6283, 0.5796, -1.9408, -1.1869, -0.0347, 0.0494]], [[-5.2460, -2.2720, -2.1479, -2.2196, -2.1192, -1.7432, -1.5734, -1.6375, -1.7288, -1.3804, -1.1706, -0.8840, -1.0010]], [[-0.0394, -0.0328, -1.7468, -1.9341, -2.8622, -2.9402, -3.2741, 0.1091, -3.0549, -2.6413, -3.7144, -0.2400, 3.0760]]], [[[-0.6088, -2.5435, -1.4979, -1.5695, -1.7088, -1.8436, -1.7415, -1.3279, -0.0061, -0.6498, -0.6944, -0.9306, -0.3429]], [[-0.2300, -1.7083, -2.1984, -2.0526, -2.0393, -2.3784, -1.8520, -0.6155, -1.3758, -1.1120, -1.1269, -1.1573, 0.3322]], [[-2.7252, -3.7884, -3.3270, -3.6968, -3.1078, -3.4162, -3.0032, -2.4050, -2.9602, -2.6175, -2.6445, -2.4525, -1.8543]], [[ 0.2291, -2.9173, -2.7194, -2.7801, -2.6690, -2.5153, -2.3256, -2.2330, -2.4772, -2.3113, -1.9946, -1.9640, -1.5646]], [[-0.6359, -2.4950, -2.6371, -2.6215, -2.5947, -2.1535, -2.0327, -2.1915, -2.2466, -2.1223, -1.6228, -1.5638, -1.5652]], [[ 0.9486, 0.1147, -0.5572, -1.0579, -0.7686, -2.2463, -1.7174, 0.3146, -0.8570, -0.9251, -2.0078, -2.1375, 0.3396]], [[ 0.3088, -1.6401, -2.3127, -2.8962, -2.9228, -1.8711, -2.3930, -1.8603, -2.9839, -3.2098, -1.3261, -2.6582, -0.9198]], [[-0.1125, -2.4701, -2.0185, -1.6505, -2.5481, -1.8911, -1.8452, -2.0864, -1.9995, -2.4321, -1.7823, -2.2978, -1.7417]], [[ 0.6488, -0.0591, -0.6747, -0.8356, -0.4107, -0.7007, -1.0032, -0.3404, -0.5647, -0.5162, -0.9051, -0.9029, 0.1309]], [[ 1.3542, -0.3810, -0.0762, -0.5418, 0.2286, -1.1699, -1.1043, -0.8561, -0.1466, 0.2266, -1.2702, -0.8820, -0.6370]], [[-4.9183, -2.1755, -2.0506, -2.0775, -2.0583, -1.6616, -1.4407, -1.5635, -1.6634, -1.5654, -0.9952, -0.9671, -0.7721]], [[ 0.0725, -0.7617, -1.5494, -1.2171, -0.9016, -2.1080, -1.8123, -1.0037, -2.1970, -1.2656, -2.0176, -2.1200, -0.3160]]]]) attn_weights tensor([[[[ -1.9552, -4.7808, -4.5358, -5.6415, -4.8946, -3.6885, -4.0634, -3.1574, -2.6714, -3.9373, -1.9673, -2.6092, -2.2043]], [[ 1.6754, -1.6103, -2.3011, -2.1365, -2.2988, -2.7294, -2.4948, -1.7762, -3.2190, -2.8870, -2.1041, -2.6138, -2.0615]], [[ -6.2411, -12.8174, -12.6874, -12.9907, -12.1534, -10.3155, -8.9942, -7.0691, -5.9757, -6.4431, -4.7028, -3.9094, -5.0199]], [[ -3.3254, -7.1784, -6.6782, -7.4308, -5.5843, -6.0166, -5.1170, -3.8761, -3.1054, -3.9073, -1.7266, -1.2647, -2.2915]], [[ -1.6802, -5.5881, -6.2274, -5.7800, -5.6776, -6.4833, -5.0957, -2.5683, -3.3514, -2.9778, -3.6534, -1.9220, -4.5778]], [[ -4.4563, -7.0804, -8.2129, -7.5397, -8.3796, -6.7138, -6.0752, -3.3089, -4.2288, -3.8141, -4.4483, -3.4308, -5.2482]], [[ -0.6634, -3.4500, -3.8472, -4.1825, -3.7000, -4.6615, -4.0873, -2.0886, -2.5962, -3.1659, -2.8244, -2.3292, -2.8071]], [[ -1.3442, -4.1690, -2.7904, -2.6755, -2.6658, -1.7411, -1.8350, -1.7535, -1.1295, -1.4254, -1.0831, -1.2344, -0.7992]], [[ -3.4020, -6.9355, -7.4188, -5.4612, -7.2511, -6.7245, -4.1641, -3.9003, -4.0883, -2.5077, -0.5449, -3.2657, -3.5699]], [[ -3.9832, -8.6729, -7.9203, -8.2101, -8.8439, -5.3076, -4.4910, -5.5518, -4.2040, -4.5472, -3.0284, -4.2069, -3.3603]], [[ -1.9061, -3.7473, -3.5901, -3.3268, -3.4503, -2.5193, -2.3901, -2.7686, -2.5189, -2.4098, -1.6140, -2.2523, -1.7655]], [[ -0.7150, -4.9448, -4.8320, -4.5956, -4.5585, -3.9172, -3.7432, -3.6870, -3.5411, -3.4631, -2.8933, -3.1368, -2.8053]]], [[[ -2.3303, -5.0923, -5.1376, -5.8305, -5.1617, -3.8309, -3.9433, -3.2475, -2.0782, -2.9491, -3.7314, -2.5779, -1.7494]], [[ 1.6590, -1.1110, -1.7690, -1.6652, -2.2258, -1.1877, -1.7243, -1.4273, -1.3560, -2.8550, -2.5396, -1.2980, -1.3468]], [[ -7.2417, -15.6069, -14.7882, -14.4456, -11.9485, -11.2644, -10.4319, -8.7828, -7.6864, -6.7748, -6.5765, -3.6314, -7.0265]], [[ -2.9967, -6.7847, -6.2097, -7.5025, -4.0147, -5.7500, -5.3627, -4.0110, -3.3984, -2.6628, -3.6214, -1.7665, -3.9272]], [[ -3.7057, -7.5780, -9.6505, -8.5175, -7.5339, -7.4709, -6.7121, -4.5164, -3.9813, -5.6337, -4.5252, -0.4107, -3.4277]], [[ -4.3343, -7.6423, -8.7167, -8.0401, -7.3501, -7.1495, -6.3583, -3.6410, -3.1260, -3.9848, -3.4672, -4.1043, -3.9571]], [[ -0.7674, -3.7133, -3.2079, -3.7827, -3.5350, -4.1680, -3.9133, -2.2338, -2.0620, -1.8980, -2.7029, -2.8224, -2.0395]], [[ -1.3583, -4.2505, -2.8246, -2.5091, -2.5236, -1.7837, -1.8051, -1.6787, -1.6558, -0.9384, -1.0427, -1.2667, -1.0639]], [[ -3.8914, -7.6491, -9.8212, -6.2875, -6.8436, -7.8326, -7.4431, -4.2282, -3.9689, -5.6307, -2.2637, -1.0005, -4.0055]], [[ -4.7115, -8.6536, -8.2197, -9.1176, -7.4527, -4.9149, -4.7022, -5.0812, -4.9085, -3.7609, -4.5878, -2.7739, -4.6689]], [[ -1.5445, -4.0478, -3.5945, -3.2996, -3.4817, -2.6851, -2.5352, -3.0087, -2.7895, -2.3234, -2.2154, -1.6688, -1.9696]], [[ -0.7831, -5.3983, -4.9913, -4.7431, -4.7596, -4.1340, -4.0183, -4.0677, -3.8456, -3.3950, -3.3467, -3.0082, -3.0818]]], [[[ -2.0268, -4.5482, -4.6656, -5.3162, -4.4696, -3.9529, -3.1839, -2.9566, -3.5386, -2.4808, -2.5061, -2.1065, -2.9553]], [[ 1.3487, -1.1064, -2.2741, -1.6666, -2.4483, -1.6067, -1.5503, -1.7964, -2.1509, -3.1885, -3.1670, -2.4445, -2.6321]], [[ -7.3187, -13.5476, -11.6791, -12.5626, -10.8253, -10.1408, -9.3975, -7.0145, -5.3473, -3.1335, -3.9872, -5.0391, -6.1547]], [[ -3.3056, -6.2711, -6.0116, -6.5556, -3.3080, -4.7957, -4.6020, -3.4099, -2.8263, -2.3468, -2.3756, -2.4657, -2.6800]], [[ -2.4844, -5.6084, -6.9604, -5.8509, -4.5327, -6.7334, -5.9069, -2.8967, -3.0422, -3.0637, -1.4391, -2.7395, -3.4401]], [[ -4.7529, -7.5072, -8.4037, -7.4723, -6.6897, -7.0236, -6.5970, -3.2702, -3.4910, -3.4296, -4.1685, -3.9288, -4.8956]], [[ -0.8099, -3.5696, -3.5808, -3.8717, -3.7090, -4.1984, -3.6473, -2.1184, -1.9486, -2.2241, -3.1725, -3.1577, -3.1199]], [[ -1.3299, -4.2824, -2.8882, -2.5738, -2.5672, -1.8048, -1.8033, -1.7635, -1.3598, -1.0400, -1.5992, -1.6901, -0.9861]], [[ -3.4903, -6.6279, -9.0663, -4.6922, -5.4390, -6.8830, -6.1200, -3.4045, -2.8513, -4.8708, -2.2378, -2.9753, -3.5316]], [[ -4.7957, -8.5379, -7.5770, -9.1062, -7.2439, -5.1561, -4.6520, -5.1894, -5.6920, -3.2696, -4.8709, -5.2317, -4.3714]], [[ -1.9462, -4.0051, -3.7726, -3.3173, -3.5448, -2.7685, -2.5853, -2.9767, -2.2915, -2.4586, -2.6642, -2.3633, -1.6865]], [[ -0.8206, -5.1521, -4.9396, -4.6447, -4.5939, -4.0426, -3.8652, -3.9082, -3.2924, -3.3537, -3.5315, -3.2795, -2.9293]]], [[[ -1.3787, -4.2643, -2.9529, -2.8811, -3.5249, -3.9130, -4.1365, -3.3083, -2.3461, -2.5916, -3.2209, -2.0199, -1.6175]], [[ 1.4432, -1.1128, -1.0791, -0.4697, -2.4004, -1.3858, -2.1410, -1.5308, -2.8944, -1.6986, -3.7413, -0.4365, -2.0528]], [[ -6.5959, -12.4583, -12.4091, -12.2467, -11.8582, -11.0864, -9.8938, -8.4789, -7.9258, -7.8612, -6.4675, -4.0523, -6.3488]], [[ -2.6688, -5.8567, -5.7595, -6.6571, -4.8039, -5.5644, -4.8935, -3.4397, -2.7210, -2.9735, -3.3677, -1.8740, -2.0708]], [[ -1.3827, -5.4181, -6.7565, -7.0953, -5.4258, -7.7054, -7.1656, -3.2030, -3.3493, -6.1034, -5.8469, -3.2405, -5.5156]], [[ -4.1064, -6.8453, -8.1492, -7.4870, -7.2004, -7.3316, -7.1817, -4.1307, -4.9594, -5.5076, -4.7903, -1.8561, -3.7796]], [[ -1.5961, -4.5627, -3.5821, -3.6865, -3.7243, -4.3032, -3.7606, -3.5626, -2.9052, -3.9568, -3.1143, -0.8494, -2.0525]], [[ -1.2709, -3.9413, -2.5385, -2.3387, -2.4127, -1.6212, -1.6544, -1.5306, -1.4633, -1.2687, -0.6001, -0.4512, -0.3234]], [[ -3.0423, -5.6230, -7.8414, -4.5976, -5.4303, -5.5847, -4.6816, -3.7237, -3.6416, -3.9659, -3.3832, -2.3363, -3.2260]], [[ -4.0489, -8.3693, -8.5398, -8.1500, -7.4635, -5.6120, -5.3064, -5.7070, -5.1064, -3.0960, -3.2275, -2.6184, -3.2103]], [[ -1.7577, -3.6792, -3.4857, -3.2257, -3.4344, -2.8823, -2.6214, -2.9307, -2.8290, -2.3517, -2.0117, -1.8327, -1.5381]], [[ -0.6579, -5.1164, -4.9164, -4.7157, -4.6065, -4.1100, -3.8311, -3.9043, -3.8456, -3.4982, -3.1136, -2.9400, -2.6232]]], [[[ -1.0387, -4.2313, -2.6210, -3.2366, -3.2797, -4.2691, -3.8559, -3.5954, -1.6552, -2.3261, -2.8358, -2.8316, -2.2564]], [[ 1.7972, -1.7554, -2.1317, -1.4714, -2.5895, -2.1862, -2.2850, -1.7827, -1.6898, -2.6687, -1.8563, -4.4202, -1.5918]], [[ -6.8407, -14.5558, -11.6506, -12.4516, -10.9880, -10.3744, -9.2647, -10.1315, -7.3520, -6.2498, -5.4204, -4.0370, -4.6201]], [[ -2.5869, -5.6076, -4.5330, -5.0161, -3.6687, -5.2633, -4.6305, -3.6708, -2.9861, -1.9824, -3.1381, -2.9194, -2.9513]], [[ -1.4286, -4.6531, -4.6601, -4.9319, -4.0054, -6.2697, -5.6712, -3.1267, -3.7947, -2.6999, -3.2912, -4.1030, -1.3532]], [[ -3.4201, -5.5622, -7.1144, -6.1746, -5.9350, -6.0173, -5.6710, -3.1534, -5.1341, -3.5541, -3.7664, -3.1570, -1.9794]], [[ -1.0293, -3.9882, -2.5828, -3.1132, -3.3026, -4.2054, -3.6701, -3.1084, -2.6116, -2.5375, -3.4218, -3.0216, -0.5367]], [[ -1.2653, -3.8371, -2.1859, -2.1168, -2.0982, -1.2134, -1.2994, -1.3204, -1.4253, -1.2879, -0.4016, -0.1495, -0.4841]], [[ -2.5521, -5.1015, -5.8939, -3.5015, -4.4929, -5.5938, -5.1442, -3.5715, -1.8327, -2.6809, -3.7388, -3.8165, -1.9966]], [[ -4.0925, -8.2993, -7.5268, -7.1376, -6.6150, -4.5679, -4.2372, -5.8260, -4.2547, -3.8970, -2.1777, -1.7726, -2.8885]], [[ -1.2525, -3.7005, -3.2796, -3.2183, -3.3660, -2.4472, -2.3768, -2.8357, -2.4851, -2.5912, -1.7974, -1.6069, -1.7861]], [[ -0.5387, -5.1087, -4.6173, -4.6042, -4.3654, -3.7689, -3.6052, -3.9630, -3.5457, -3.5013, -2.9327, -2.7790, -2.7160]]]]) attn_weights tensor([[[[ 5.0582, -0.1876, -3.2849, -1.3023, -0.1066, -3.6976, -2.9885, -0.8718, -3.6774, -2.2414, -2.7535, -0.3017, 2.1206]], [[ -2.7906, -5.8898, -5.2012, -5.9611, -5.8676, -6.0833, -6.3406, -3.3875, -3.2450, -3.9263, -4.8317, -3.7234, -4.9316]], [[ -4.5705, -10.1959, -10.4622, -9.4695, -8.8271, -8.2329, -7.7763, -7.0437, -6.3543, -5.5685, -4.8023, -3.6116, -4.5007]], [[ -4.8689, -11.9770, -16.1213, -12.3313, -12.7561, -10.4706, -10.6589, -8.3839, -11.5663, -8.3534, -5.3405, -6.7281, -7.9093]], [[ 1.3098, -3.3501, -4.7020, -4.3377, -3.0012, -2.9192, -2.6215, -3.3296, -4.9029, -4.9644, -3.7269, -3.1551, -4.6639]], [[ -0.2416, -2.4787, -3.9041, -2.5001, -2.3930, -2.1432, -1.8028, -3.2000, -4.0020, -2.9396, -2.4776, -2.5134, -2.4560]], [[ -3.2107, -8.0799, -6.7797, -7.6634, -7.2915, -5.1696, -6.3406, -5.2349, -3.9884, -5.2264, -4.3644, -3.4939, -3.9184]], [[ -5.5609, -11.4620, -12.0911, -11.7125, -12.9417, -7.8341, -8.6076, -7.3860, -7.6120, -7.7479, -6.6148, -6.4327, -6.9655]], [[ -4.7632, -9.5524, -10.5876, -9.2096, -9.4758, -7.6269, -7.2155, -5.9801, -6.5686, -5.4478, -4.0256, -5.1984, -6.9235]], [[ -2.4712, -6.0100, -5.6087, -4.2997, -5.1375, -5.9195, -3.6506, -3.9024, -3.3205, -2.5651, -2.5845, -3.0237, -3.8435]], [[ -1.0626, -6.4473, -6.3435, -7.7271, -6.0644, -3.9484, -3.7546, -4.4525, -5.0960, -6.5983, -4.3662, -3.7216, -2.3931]], [[ -2.4530, -6.3641, -8.0545, -6.5394, -6.9673, -5.7218, -5.2495, -3.8899, -5.5769, -4.7959, -4.7260, -4.2193, -2.7485]]], [[[ 5.0964, -0.6930, -2.1250, -2.6510, -0.2665, -2.8788, -2.2206, -1.6338, -1.1970, -3.0421, -3.8450, -0.3120, -0.1463]], [[ -2.7474, -6.1832, -5.5373, -5.5348, -5.7205, -5.8034, -7.1209, -3.9319, -3.3734, -3.5228, -3.3605, -6.1775, -4.7451]], [[ -4.7846, -8.9768, -9.0338, -7.8691, -6.1259, -8.4827, -8.5143, -6.2866, -5.7232, -4.9620, -3.8367, -3.2051, -4.8185]], [[ -4.8959, -10.8398, -15.3883, -11.9612, -11.2106, -12.1827, -11.7961, -8.0195, -8.6751, -11.3808, -7.6975, -5.6126, -5.6649]], [[ 1.4490, -4.1623, -3.6870, -2.9174, -3.0350, -3.2926, -3.1062, -3.3631, -2.8115, -3.9182, -3.2961, -3.6787, -3.3727]], [[ -0.1164, -2.0661, -3.1047, -2.3548, -2.3040, -2.1149, -1.7042, -2.7678, -2.7974, -3.2280, -2.9056, -2.2094, -2.8292]], [[ -3.4374, -7.3024, -4.9725, -6.2928, -7.2016, -5.3425, -5.5556, -4.7064, -4.2573, -2.1396, -3.4146, -3.4082, -3.8903]], [[ -5.7994, -10.9878, -12.0587, -11.6246, -10.2352, -8.0255, -7.7576, -7.3548, -8.3528, -7.6585, -7.3081, -6.3788, -6.1050]], [[ -4.4537, -8.4208, -9.4179, -8.3301, -10.0701, -9.8402, -7.4304, -5.0002, -4.1421, -5.5751, -4.2687, -6.4240, -4.9259]], [[ -1.7537, -5.5079, -5.5270, -3.7915, -4.4754, -7.1771, -7.1071, -3.7908, -3.3488, -3.2094, -1.4750, -1.0066, -2.3607]], [[ -0.9635, -6.3130, -5.3781, -6.6899, -5.0384, -4.9377, -5.1248, -4.4896, -4.0639, -4.4428, -5.5659, -3.9768, -2.2569]], [[ -2.7129, -6.0832, -7.6270, -7.0089, -4.8793, -4.4856, -5.8889, -4.3609, -3.7879, -5.1919, -4.6449, -3.3701, -3.6628]]], [[[ 5.0151, -0.9851, -2.8804, -1.5351, -0.3730, -5.1322, -4.4159, -1.0346, -3.4301, -3.0012, -3.5641, -1.3108, 1.9439]], [[ -2.8035, -6.6212, -5.5703, -6.5301, -6.4855, -6.7887, -7.1499, -3.9703, -3.4091, -3.4595, -4.4727, -4.5644, -5.9858]], [[ -4.3851, -9.4217, -9.1030, -7.3927, -7.0685, -8.3365, -9.9805, -6.8173, -7.5519, -4.5547, -4.0201, -4.4722, -5.5035]], [[ -4.8237, -10.7730, -12.4643, -11.7916, -11.3429, -12.4241, -12.7636, -7.7449, -7.3397, -7.6102, -6.6796, -6.2396, -7.3885]], [[ 1.2988, -3.4688, -3.7150, -3.0567, -3.0843, -3.5746, -2.9728, -3.3659, -4.1149, -3.7110, -4.4650, -3.5228, -4.6086]], [[ -0.1332, -2.5808, -4.3610, -2.7147, -2.6472, -3.1744, -2.2137, -3.3005, -4.1858, -4.0259, -3.0863, -3.6610, -3.1271]], [[ -3.2231, -7.4746, -5.3268, -7.1871, -7.3954, -6.2167, -6.3298, -4.5413, -5.0510, -1.0384, -2.6222, -3.8157, -4.8700]], [[ -5.7656, -11.1055, -11.3964, -10.3216, -10.2507, -8.7328, -9.7065, -7.4527, -8.1658, -6.2401, -7.4357, -7.4190, -6.7523]], [[ -4.3951, -8.7776, -9.7236, -7.6162, -9.3809, -7.9183, -8.5016, -5.1586, -4.2388, -4.9563, -5.2036, -5.4469, -5.4307]], [[ -1.8051, -5.6546, -4.1305, -4.2639, -4.2423, -6.7228, -5.4086, -3.9468, -2.7775, -1.9346, -1.4403, -3.2521, -2.7291]], [[ -0.8883, -4.9363, -4.9519, -4.5426, -3.9509, -5.3071, -4.9494, -3.9328, -4.7236, -3.7268, -4.7261, -3.4297, -2.5477]], [[ -2.4842, -6.1875, -6.3239, -7.1666, -5.7735, -6.2970, -5.4923, -4.9693, -4.2146, -3.3972, -3.2774, -3.0614, -3.5016]]], [[[ 4.5057, -0.3860, -1.6986, -2.1240, -0.6952, -4.1941, -2.2227, -0.7445, -1.5532, -3.0228, -3.1267, -3.4738, 1.1636]], [[ -2.6756, -6.0047, -6.0791, -5.9611, -6.8632, -5.7137, -6.8329, -4.6092, -5.2819, -6.3821, -5.6145, -3.5741, -5.1299]], [[ -4.2125, -7.6703, -10.3693, -6.8988, -7.0938, -8.6023, -9.0651, -5.2313, -3.8791, -6.0441, -5.7644, -3.8167, -5.0623]], [[ -4.6978, -11.4038, -14.6776, -12.5992, -12.7572, -11.7378, -11.1536, -8.8035, -9.7324, -9.5210, -8.2916, -6.2141, -9.1844]], [[ 1.0060, -3.3197, -3.4930, -4.1201, -3.2453, -3.2898, -2.2881, -2.6377, -2.7790, -3.9189, -2.4459, -2.8172, -3.0662]], [[ -0.2169, -2.2386, -2.6281, -0.6990, -1.4921, -1.6520, -1.9268, -3.0468, -2.3259, -2.1644, -2.4553, -1.7327, -2.7180]], [[ -3.1385, -7.8180, -6.3889, -7.9253, -6.5562, -5.7500, -6.7777, -6.1640, -4.2871, -4.0844, -5.2273, -4.5224, -4.2678]], [[ -5.6573, -11.3359, -11.9680, -11.6941, -10.7458, -8.9481, -8.4636, -8.2367, -7.5396, -6.4890, -5.7423, -4.4882, -6.5833]], [[ -4.0383, -8.0743, -9.7282, -8.9004, -8.7077, -7.9619, -8.0152, -5.4076, -6.5156, -6.6984, -5.6385, -3.4177, -5.6018]], [[ -1.6312, -5.3954, -7.3376, -4.7671, -6.3926, -6.2373, -5.8212, -5.0775, -5.3441, -5.2515, -5.1984, -3.4019, -3.6406]], [[ -1.0537, -5.0724, -4.1188, -4.7230, -4.2459, -4.3392, -4.7980, -3.8729, -3.0821, -3.8796, -3.6340, -3.1645, -2.5280]], [[ -2.2309, -6.9757, -8.0677, -6.6114, -5.4771, -4.5460, -5.6284, -6.0258, -4.5036, -3.8668, -4.7854, -4.3184, -4.5030]]], [[[ 3.6135, -1.0038, -1.7258, -2.4901, -0.6326, -3.1650, -2.3954, -1.7907, -2.5322, -1.4946, -3.3443, -3.8543, -1.1756]], [[ -2.7600, -4.7523, -4.2433, -4.9591, -4.7637, -6.8146, -6.2991, -4.3806, -4.8755, -4.5111, -6.9633, -5.8796, -4.5879]], [[ -4.8783, -7.0893, -7.5406, -6.6834, -5.9244, -7.7214, -7.9579, -5.0880, -5.1271, -3.4790, -5.6471, -4.5816, -5.7085]], [[ -4.8623, -13.0648, -13.2768, -14.3502, -13.2017, -11.5971, -10.3239, -9.4570, -10.0130, -9.5887, -7.6081, -5.9806, -5.7464]], [[ 0.9812, -3.1805, -3.9860, -3.2946, -3.3771, -2.6702, -2.7107, -2.7094, -3.6368, -3.0455, -2.9725, -3.2437, -2.1802]], [[ -0.4296, -2.0409, -1.5893, -1.6740, -1.3139, -2.6057, -2.6207, -2.6606, -2.0840, -2.1968, -3.0974, -3.8784, -3.3113]], [[ -3.9970, -6.9683, -4.0961, -5.6732, -5.3218, -4.4478, -5.5442, -5.9099, -3.6309, -3.2418, -3.0678, -3.3001, -4.4210]], [[ -5.5280, -12.7666, -13.2122, -11.6874, -11.5120, -8.6528, -7.2111, -8.4372, -7.9715, -7.8775, -5.3384, -3.5395, -5.4375]], [[ -4.0689, -7.8974, -8.0176, -7.4714, -7.9034, -8.1117, -6.8111, -5.1965, -4.8464, -5.7374, -5.2689, -4.7616, -3.6924]], [[ -2.1727, -4.3138, -3.7386, -3.0680, -4.2965, -6.8190, -6.8504, -4.0367, -2.0447, -4.6912, -5.7132, -6.5213, -3.7462]], [[ -1.2059, -5.3014, -4.8862, -5.4841, -5.1159, -4.1105, -4.2580, -3.7077, -3.7961, -3.3803, -3.1249, -2.6370, -2.6602]], [[ -2.7264, -6.1795, -5.9513, -4.7014, -5.2166, -4.0891, -4.5780, -4.9635, -2.1453, -4.1066, -4.2914, -4.5199, -3.7187]]]]) attn_weights tensor([[[[-3.6118e+00, -9.1145e+00, -9.6827e+00, -6.3584e+00, -6.8145e+00, -7.5944e+00, -6.3561e+00, -5.9580e+00, -6.6291e+00, -4.1656e+00, -1.1928e+00, -4.4933e+00, -5.7826e+00]], [[-2.5634e+00, -6.4131e+00, -5.6908e+00, -6.3507e+00, -6.6275e+00, -5.5573e+00, -5.5670e+00, -3.3468e+00, -3.1086e+00, -4.0861e+00, -4.4233e+00, -4.4549e+00, -5.7311e+00]], [[-2.2156e-01, -2.2919e+00, -3.0749e+00, -3.1212e+00, -3.5819e+00, -3.8567e+00, -2.7174e+00, -2.7060e+00, -3.2644e+00, -3.4348e+00, -2.9271e+00, -3.6124e+00, -3.6435e+00]], [[-1.8565e+00, -6.0261e+00, -4.9124e+00, -4.3709e+00, -4.5606e+00, -4.4875e+00, -4.2031e+00, -4.8000e+00, -3.3475e+00, -3.4486e+00, -2.4782e+00, -3.1812e+00, -4.2815e+00]], [[ 1.5906e+00, -2.8290e+00, -2.3544e+00, -4.0227e+00, -1.9972e+00, -3.8933e+00, -4.5515e+00, -2.9248e+00, -2.3500e+00, -4.0486e+00, -2.1097e+00, -1.0774e+00, -1.1157e+00]], [[-2.1223e+00, -6.5985e+00, -7.2564e+00, -7.7163e+00, -8.3091e+00, -5.3305e+00, -6.1194e+00, -4.4843e+00, -5.0498e+00, -6.1801e+00, -6.0988e+00, -3.8925e+00, -3.7434e+00]], [[-1.7641e+00, -5.3268e+00, -6.1745e+00, -5.8874e+00, -5.1047e+00, -4.4505e+00, -4.2569e+00, -4.7305e+00, -4.8318e+00, -4.8931e+00, -3.5467e+00, -4.1028e+00, -4.5235e+00]], [[ 5.0616e-01, -4.8752e+00, -3.2746e+00, -2.8904e+00, -2.4800e+00, -8.7666e-02, -2.5863e+00, -2.7525e+00, -2.7468e+00, -2.5514e+00, -1.2119e+00, -4.1242e-01, 1.2737e+00]], [[ 1.7925e+00, -3.1106e+00, -3.6416e+00, -2.5958e+00, -2.0796e+00, -2.4278e+00, -1.7630e+00, -2.5168e+00, -3.1107e+00, -2.4555e+00, -2.0772e+00, -1.2947e+00, -1.8440e+00]], [[-1.2039e+00, -3.5212e+00, -3.4441e+00, -3.8200e+00, -3.7257e+00, -4.6639e+00, -2.7462e+00, -3.3633e+00, -2.5636e+00, -2.6580e+00, -2.3871e+00, -3.0421e+00, -3.3097e+00]], [[ 1.2483e+00, -2.7658e+00, -2.5326e+00, -2.7779e+00, -2.9448e+00, -3.9617e+00, -2.8623e+00, -2.6157e+00, -2.8237e+00, -3.0677e+00, -3.5151e+00, -2.6755e+00, -3.0203e+00]], [[-6.2530e+00, -2.1617e+01, -1.7964e+01, -1.3271e+01, -2.6874e+00, -4.5892e+00, -1.7839e+01, -7.8442e+00, -6.7152e+00, -2.4584e+00, 1.2412e+00, 1.7041e+01, 6.5677e+00]]], [[[-2.0774e+00, -9.2063e+00, -7.2654e+00, -6.3270e+00, -7.2859e+00, -8.5602e+00, -9.3959e+00, -7.8278e+00, -4.9343e+00, -4.1546e+00, -3.6080e+00, -4.2969e+00, -5.0946e+00]], [[-2.6149e+00, -6.1621e+00, -5.7425e+00, -6.1555e+00, -6.9018e+00, -4.3118e+00, -5.0787e+00, -3.9208e+00, -2.3757e+00, -2.8314e+00, -3.2150e+00, -3.8272e+00, -4.8493e+00]], [[-7.7134e-02, -2.0243e+00, -2.8661e+00, -3.0831e+00, -3.6841e+00, -4.6436e+00, -3.6725e+00, -2.8299e+00, -2.9095e+00, -3.1523e+00, -3.4324e+00, -2.4446e+00, -2.9525e+00]], [[-1.9736e+00, -5.2597e+00, -2.4398e+00, -2.5660e+00, -3.2216e+00, -4.0457e+00, -4.0518e+00, -5.1423e+00, -3.0506e+00, -6.5949e-01, -1.1719e+00, -3.0742e+00, -3.3099e+00]], [[ 1.4537e+00, -2.4013e+00, -8.3616e-01, -2.3047e+00, -3.0584e+00, -4.8479e+00, -4.2470e+00, -2.5665e+00, -3.6255e+00, -1.0174e+00, -2.5778e+00, -3.3476e-01, -7.7427e-01]], [[-2.1411e+00, -6.2321e+00, -6.6455e+00, -6.6327e+00, -5.6816e+00, -7.4662e+00, -8.0498e+00, -5.7519e+00, -5.1943e+00, -4.6132e+00, -4.6474e+00, -4.4717e+00, -5.3970e+00]], [[-1.7754e+00, -5.3734e+00, -5.7133e+00, -5.9502e+00, -4.6329e+00, -4.2869e+00, -4.2555e+00, -4.8390e+00, -3.9350e+00, -4.4454e+00, -4.8862e+00, -4.2970e+00, -4.3659e+00]], [[ 1.2118e+00, -4.3699e+00, -4.2279e+00, -2.4261e+00, -1.4553e+00, -2.2462e+00, -2.3417e+00, -2.4018e+00, -2.4863e+00, -2.2608e+00, -1.3740e+00, 4.3471e-01, 2.1850e+00]], [[ 1.5845e+00, -2.7503e+00, -1.7233e+00, -2.0292e+00, -1.5474e+00, -1.5720e+00, -1.1141e+00, -1.9920e+00, -6.9193e-01, -1.2374e+00, -1.9151e+00, -1.0269e-01, -1.0969e+00]], [[-1.2462e+00, -2.8737e+00, -3.5932e+00, -1.7823e+00, -2.5524e+00, -2.7214e+00, -2.5225e+00, -2.8958e+00, -3.1369e+00, -2.0060e+00, -9.0987e-01, 2.8024e-01, -2.0222e+00]], [[ 1.3218e+00, -2.4363e+00, -2.8474e+00, -3.5955e+00, -3.4465e+00, -2.8010e+00, -2.5271e+00, -2.3883e+00, -2.3044e+00, -2.8086e+00, -3.8164e+00, -3.1374e+00, -2.0751e+00]], [[-6.1319e+00, -2.5820e+01, -2.5968e+01, -1.7336e+01, -1.8136e+01, -1.7886e+01, -1.6116e+01, -1.8100e+01, -2.2329e+01, -1.4785e+01, -5.8039e+00, 1.1363e+01, 2.1054e+00]]], [[[-1.8050e+00, -9.5054e+00, -8.0297e+00, -6.9240e+00, -7.9516e+00, -1.0333e+01, -1.0681e+01, -6.4798e+00, -6.1933e+00, -5.1813e+00, -4.0159e+00, -3.7299e+00, -3.0506e+00]], [[-2.6793e+00, -5.8989e+00, -6.0464e+00, -6.1369e+00, -5.8431e+00, -3.3886e+00, -6.1527e+00, -3.1303e+00, -1.5121e+00, -1.8199e+00, -1.7710e+00, -2.1740e+00, -4.6347e+00]], [[-3.3751e-02, -2.6462e+00, -3.1343e+00, -4.0006e+00, -3.8900e+00, -4.6001e+00, -2.6140e+00, -3.2578e+00, -3.2514e+00, -3.3269e+00, -3.9833e+00, -4.0086e+00, -3.4277e+00]], [[-2.1921e+00, -4.9839e+00, -3.6322e+00, -3.4373e+00, -5.4818e+00, -5.3864e+00, -5.0436e+00, -4.8848e+00, -4.4341e+00, -1.4635e+00, -1.8492e+00, -2.7788e+00, -3.5515e+00]], [[ 1.5287e+00, -2.9819e+00, -1.3542e+00, -2.3063e+00, -2.7553e+00, -3.9898e+00, -5.4568e+00, -2.7098e+00, -4.4351e+00, -1.5714e+00, -2.5172e+00, -1.5931e+00, -2.5651e+00]], [[-1.8826e+00, -6.7002e+00, -6.8959e+00, -6.4708e+00, -6.5120e+00, -8.5216e+00, -8.6344e+00, -5.5544e+00, -7.0411e+00, -4.3944e+00, -4.1953e+00, -5.2542e+00, -6.5561e+00]], [[-1.8515e+00, -5.3713e+00, -5.7187e+00, -5.2223e+00, -5.0589e+00, -4.1547e+00, -4.6629e+00, -4.8555e+00, -4.4654e+00, -4.3271e+00, -4.5711e+00, -4.6501e+00, -4.4164e+00]], [[ 9.0888e-01, -3.6094e+00, -3.4091e+00, -6.1405e-01, -1.4071e+00, -2.9494e+00, -4.0010e+00, -2.9253e+00, -3.6276e+00, -1.9787e+00, -1.4599e+00, 7.2933e-02, 9.1525e-01]], [[ 1.5594e+00, -3.2803e+00, -2.9848e+00, -1.9583e+00, -2.1554e+00, -2.2985e+00, -1.2339e+00, -2.7535e+00, -1.6189e+00, -2.8061e+00, -2.6376e+00, -1.4024e+00, -1.8228e+00]], [[-8.9546e-01, -4.0337e+00, -4.2566e+00, -5.4996e+00, -3.7619e+00, -3.9206e+00, -3.0712e+00, -4.2101e+00, -4.8990e+00, -2.9166e+00, -2.1214e+00, -2.8031e+00, -3.3881e+00]], [[ 1.3866e+00, -2.7448e+00, -2.4638e+00, -2.7409e+00, -2.9308e+00, -3.1723e+00, -4.1914e+00, -2.6635e+00, -2.7307e+00, -2.5436e+00, -4.6294e+00, -3.2236e+00, -2.9254e+00]], [[-7.5802e+00, -1.8536e+01, -1.2060e+01, -1.4073e+01, -1.7491e+01, -1.9130e+01, -2.4570e+01, -1.5717e+01, -7.5651e+00, 4.0902e+00, 8.4452e+00, 1.3860e+01, 2.8494e+00]]], [[[-2.5997e+00, -8.9942e+00, -9.1591e+00, -7.0187e+00, -8.1236e+00, -8.7793e+00, -9.2205e+00, -7.2829e+00, -7.4477e+00, -7.6075e+00, -8.6180e+00, -6.2671e+00, -5.0627e+00]], [[-2.3337e+00, -7.1724e+00, -8.3591e+00, -7.6115e+00, -8.6140e+00, -7.1702e+00, -6.7632e+00, -5.5627e+00, -6.9283e+00, -6.9642e+00, -5.8891e+00, -2.1360e+00, -3.9529e+00]], [[-1.6232e-01, -1.4625e+00, -2.3404e+00, -2.5244e+00, -4.1846e+00, -4.8430e+00, -3.1049e+00, -2.4931e+00, -5.0994e+00, -5.1322e+00, -4.0242e+00, -1.0964e+00, -2.5544e+00]], [[-1.6099e+00, -6.7787e+00, -7.1561e+00, -5.9432e+00, -5.6284e+00, -3.0431e+00, -3.9151e+00, -5.3095e+00, -5.5745e+00, -3.7737e+00, -3.5013e+00, -4.5867e+00, -3.5622e+00]], [[ 1.3122e+00, -2.0708e+00, -2.3232e+00, -2.5781e+00, -2.3680e+00, -2.4260e+00, -2.6571e+00, -2.2076e+00, -2.7681e+00, -3.6604e+00, -2.5808e+00, -1.5558e+00, -1.2427e+00]], [[-2.1197e+00, -8.1629e+00, -8.8897e+00, -8.1082e+00, -7.9583e+00, -7.5487e+00, -7.7479e+00, -7.3667e+00, -6.3824e+00, -6.3114e+00, -7.0975e+00, -4.5475e+00, -4.6637e+00]], [[-2.3401e+00, -4.6078e+00, -4.9649e+00, -4.4399e+00, -4.3179e+00, -4.8211e+00, -4.0919e+00, -4.2998e+00, -4.4280e+00, -4.1573e+00, -3.6214e+00, -3.1372e+00, -4.0016e+00]], [[ 3.8215e-02, -6.3934e+00, -2.4313e+00, -3.3576e+00, -4.1879e+00, -3.8487e+00, -3.5480e+00, -3.3990e+00, -2.0800e+00, -2.6549e+00, -2.9316e+00, -5.6643e-01, 1.0234e+00]], [[ 1.3045e+00, -2.5097e+00, -2.0879e+00, -1.7997e+00, -2.0624e+00, -2.7247e+00, -1.4615e+00, -1.6400e+00, -1.0290e+00, -2.2114e+00, -3.1719e+00, -9.8124e-01, -1.5867e+00]], [[-1.2891e+00, -3.4786e+00, -5.2817e+00, -3.7561e+00, -3.4931e+00, -5.3048e+00, -3.7351e+00, -3.5238e+00, -4.6681e+00, -4.3454e+00, -4.3385e+00, -2.5707e+00, -3.2535e+00]], [[ 1.1422e+00, -2.1100e+00, -2.9689e+00, -2.8011e+00, -3.1285e+00, -2.4700e+00, -3.6789e+00, -2.0627e+00, -2.8370e+00, -5.2866e+00, -4.6796e+00, -1.8365e+00, -1.8344e+00]], [[-8.1052e+00, -1.5877e+01, -2.4263e+01, -2.3066e+01, -2.7455e+01, -2.3257e+01, -2.3724e+01, -1.0583e+01, -1.4689e+01, -1.4358e+01, -1.2329e+01, 5.5628e+00, -5.4149e+00]]], [[[-3.3494e+00, -8.1121e+00, -7.8851e+00, -4.7821e+00, -4.5325e+00, -7.5383e+00, -7.6651e+00, -5.5281e+00, -3.9651e+00, -3.7361e+00, -5.7163e+00, -7.6222e+00, -5.6005e+00]], [[-2.2804e+00, -5.6157e+00, -6.6335e+00, -5.3930e+00, -6.4487e+00, -7.0616e+00, -6.1414e+00, -4.1857e+00, -2.4642e+00, -4.4725e+00, -5.5718e+00, -5.1813e+00, -3.6798e+00]], [[-1.1140e-01, -2.2301e+00, -2.8038e+00, -2.7082e+00, -3.4819e+00, -4.2481e+00, -2.8599e+00, -2.6270e+00, -2.6711e+00, -4.0862e+00, -4.0180e+00, -3.7771e+00, -2.0602e+00]], [[-2.6087e+00, -6.3779e+00, -5.0637e+00, -3.7948e+00, -3.9033e+00, -4.2974e+00, -3.8672e+00, -4.8673e+00, -3.7712e+00, -3.2487e+00, -3.9938e+00, -2.2973e+00, -4.2409e+00]], [[ 1.1480e+00, -2.6233e+00, -2.2501e+00, -1.9231e+00, -1.6660e+00, -1.5902e+00, -2.3090e+00, -2.0446e+00, -2.8778e+00, -1.7469e+00, -2.6062e+00, -1.6708e+00, -1.8034e+00]], [[-2.7312e+00, -7.7446e+00, -7.0989e+00, -7.2548e+00, -6.0212e+00, -6.1314e+00, -7.3997e+00, -6.3477e+00, -5.5768e+00, -4.2072e+00, -4.9393e+00, -6.7676e+00, -5.1647e+00]], [[-2.3781e+00, -4.7978e+00, -4.9231e+00, -4.3128e+00, -3.8428e+00, -3.6551e+00, -4.2173e+00, -4.2918e+00, -3.6646e+00, -3.5108e+00, -3.5839e+00, -3.5861e+00, -3.8628e+00]], [[-8.5705e-03, -4.9340e+00, -4.0642e+00, -1.7744e+00, -1.9423e+00, -2.4060e+00, -2.9876e-01, -1.2675e-02, -1.1557e+00, -1.6485e+00, -1.0151e+00, 6.1770e-01, 2.0230e+00]], [[ 1.2835e+00, -3.0073e+00, -3.8259e+00, -3.1850e+00, -3.1601e+00, -2.4333e+00, -1.7859e+00, -2.6548e+00, -1.7634e+00, -2.0296e+00, -1.8146e+00, -3.0049e+00, -1.7174e+00]], [[-1.4636e+00, -3.8022e+00, -3.6093e+00, -2.9731e+00, -2.6427e+00, -4.4966e+00, -3.1631e+00, -3.5058e+00, -3.2639e+00, -2.4100e+00, -4.1785e+00, -3.9581e+00, -4.7276e+00]], [[ 1.1204e+00, -2.9265e+00, -2.9229e+00, -3.6902e+00, -2.5414e+00, -3.2222e+00, -3.0389e+00, -2.8686e+00, -3.2115e+00, -2.2637e+00, -3.3771e+00, -4.3057e+00, -1.6622e+00]], [[-5.9833e+00, -3.3562e+01, -2.8889e+01, -2.7368e+01, -2.9465e+01, -1.1948e+01, 3.3818e+00, -1.3810e+01, -1.4071e+01, -1.4380e+01, 5.7232e+00, 2.0719e+01, -3.8499e+00]]]]) attn_weights tensor([[[[ 2.2653e+00, -6.5720e+00, -4.9758e+00, -4.7396e+00, -4.0260e+00, -2.1615e+00, -1.2448e+00, -1.3801e+00, -3.2864e+00, -4.4555e+00, -2.8158e+00, -2.6546e+00, -1.4483e+00]], [[ 4.4687e+00, -8.2492e+00, -8.0049e+00, -9.0399e+00, -1.0606e+01, -2.2226e+00, -8.3129e+00, -9.4646e+00, -1.0400e+01, -1.1393e+01, -9.3715e+00, -6.9443e+00, -9.6548e-01]], [[ 2.4547e-01, -3.4128e+00, -3.3074e+00, -4.3750e+00, -3.5006e+00, -4.0746e+00, -3.0318e+00, -3.9208e+00, -2.5187e+00, -3.5359e+00, -2.0293e+00, -1.7307e+00, -2.9452e+00]], [[-3.0242e-01, -1.2002e+00, -1.9505e+00, -1.6772e+00, -1.9727e+00, -2.6065e+00, -1.8476e+00, -9.1991e-01, -2.5515e-01, -1.0523e+00, -3.1146e-01, -1.6497e+00, -1.7403e+00]], [[-3.5769e-01, -5.5121e+00, -5.2890e+00, -4.9349e+00, -5.2847e+00, -2.0223e+00, -2.0361e+00, -1.8487e+00, -2.3877e+00, -2.6874e+00, -9.6630e-01, -1.8950e+00, -1.3970e+00]], [[ 2.0427e+00, -4.7131e+00, -2.9891e+00, -5.6841e+00, -7.2084e+00, -3.2878e+00, -5.2550e+00, -4.8994e+00, -3.6999e+00, -6.3911e+00, -6.4655e+00, -5.4634e+00, -3.6190e+00]], [[ 1.2639e+00, -6.0547e+00, -6.1429e+00, -4.4740e+00, -4.0423e+00, -2.2530e+00, -4.2887e+00, -3.4684e+00, -4.0594e+00, -3.3972e+00, -1.3935e+00, -7.3135e-01, -2.6471e+00]], [[ 8.6568e-01, -4.6187e+00, -4.4293e+00, -4.2558e+00, -4.2720e+00, -3.6027e+00, -7.2178e-01, -3.2594e+00, -3.4061e+00, -3.3817e+00, 1.8334e-01, -1.3646e+00, -2.3869e+00]], [[ 4.1028e-01, -5.0524e+00, -5.6178e+00, -6.4481e+00, -7.0105e+00, -2.5776e+00, -3.8355e+00, -3.5113e+00, -4.4984e+00, -5.7321e+00, -6.1475e+00, -4.6201e+00, -2.6102e+00]], [[ 1.2889e+00, -3.3175e+00, -4.6162e+00, -4.0104e+00, -2.6750e+00, -2.2596e+00, -2.4418e+00, -2.1550e+00, -4.1284e+00, -4.5371e+00, -4.3403e+00, -2.8274e+00, -5.3027e+00]], [[ 2.1244e+00, -8.5620e-01, -7.0812e-01, -8.0360e-01, -3.0899e-01, -1.4481e-01, 8.4214e-01, 2.7383e-01, -3.2921e-01, -1.2011e+00, 9.4121e-02, 3.0441e-01, 1.2404e+00]], [[ 1.0700e+00, -4.0296e+00, -4.5287e+00, -3.9735e+00, -3.4800e+00, -3.7436e+00, -3.8476e+00, -4.0068e+00, -4.2888e+00, -3.6943e+00, -3.3884e+00, -2.3334e+00, -1.3061e+00]]], [[[ 2.1201e+00, -6.4386e+00, -5.1663e+00, -4.6492e+00, -2.7428e+00, -1.4235e+00, -2.0698e+00, -1.3394e+00, -1.2859e+00, -3.1173e+00, -4.6851e+00, -3.5692e+00, -2.1895e+00]], [[ 4.5323e+00, -1.1804e+01, -9.7318e+00, -7.6880e+00, -5.7012e+00, -3.3140e+00, -1.2307e+01, -1.0278e+01, -8.1576e+00, -7.1520e+00, -6.9572e+00, -6.9395e+00, -2.1147e+00]], [[ 5.0632e-01, -3.7861e+00, -3.0760e+00, -3.8506e+00, -4.3428e+00, -4.0783e+00, -4.4277e+00, -5.4539e+00, -4.1685e+00, -3.0987e+00, -3.8245e+00, -2.1788e+00, -4.9953e+00]], [[ 1.4381e-01, -1.1958e+00, -1.4504e+00, -2.0081e+00, -2.4260e+00, -3.0928e+00, -2.2844e+00, -2.5341e+00, -1.2509e+00, -1.2936e+00, -1.7998e+00, -1.6166e+00, -3.4076e+00]], [[ 5.2847e-01, -4.7772e+00, -6.0526e+00, -5.9568e+00, -4.8691e+00, -3.4683e+00, -2.4505e+00, -3.3603e+00, -2.7874e+00, -3.8982e+00, -3.4918e+00, -2.8122e+00, -3.6394e+00]], [[ 1.7138e+00, -8.0771e+00, -6.0983e+00, -5.1701e+00, -3.7479e+00, -2.5629e+00, -6.2422e+00, -3.1628e+00, -3.1101e+00, -3.9506e+00, -4.9438e+00, -4.0422e+00, -2.6251e+00]], [[ 1.2276e+00, -5.1359e+00, -5.1447e+00, -4.9019e+00, -4.2433e+00, -3.7261e+00, -4.0209e+00, -3.1518e+00, -2.6647e+00, -2.8235e+00, -3.7654e+00, -8.0345e-01, -2.6158e+00]], [[ 1.6217e+00, -3.9837e+00, -5.1385e+00, -4.4578e+00, -3.1959e+00, -2.8078e+00, -9.3865e-01, -3.4238e+00, -3.4538e+00, -3.6182e+00, -2.8232e+00, -1.0454e+00, -1.2759e+00]], [[ 7.2842e-01, -5.4933e+00, -5.2062e+00, -4.7478e+00, -3.8540e+00, -3.0306e+00, -3.6673e+00, -3.2802e+00, -3.2343e+00, -4.2513e+00, -4.1415e+00, -4.9491e+00, -2.8260e+00]], [[ 1.0117e+00, -2.9176e+00, -3.0708e+00, -3.0538e+00, -2.3733e+00, -2.4884e+00, -1.9986e+00, -2.4838e+00, -3.4812e+00, -3.5211e+00, -3.9975e+00, -3.3063e+00, -3.3634e+00]], [[ 1.7318e+00, -9.1760e-01, -8.9351e-02, -6.6240e-01, -2.4618e-01, -5.5710e-01, 2.1393e+00, 1.1529e+00, -1.2745e+00, -6.1213e-02, -1.2493e+00, 2.2373e-01, -5.2203e-01]], [[ 1.3030e+00, -3.9112e+00, -3.7117e+00, -2.7738e+00, -2.3405e+00, -5.1813e+00, -4.5192e+00, -3.5444e+00, -3.2372e+00, -2.6750e+00, -1.8948e+00, -3.2140e+00, -3.6128e-01]]], [[[ 2.4686e+00, -5.5288e+00, -6.3004e+00, -6.0392e+00, -1.3969e+00, -1.2577e+00, -2.4914e+00, -1.7375e+00, -3.1113e+00, -3.7459e+00, -4.6219e+00, -2.4382e+00, -4.5223e-01]], [[ 4.8320e+00, -9.5133e+00, -1.0080e+01, -9.7282e+00, -5.3555e+00, -6.0818e+00, -1.2923e+01, -1.3362e+01, -1.0559e+01, -1.0560e+01, -1.0308e+01, -7.2839e+00, -2.3433e+00]], [[ 3.0295e-01, -4.2648e+00, -4.3265e+00, -4.7104e+00, -4.5673e+00, -3.4078e+00, -3.1961e+00, -4.1938e+00, -4.0612e+00, -2.5683e+00, -1.9937e+00, -2.0258e+00, -3.7605e+00]], [[-1.1524e-02, -1.7045e+00, -1.7699e+00, -2.8064e+00, -3.2877e+00, -2.2911e+00, -2.5140e+00, -2.1519e+00, -4.4396e-01, -7.1024e-01, -1.3902e+00, -2.0961e+00, -2.1381e+00]], [[ 7.8820e-03, -4.3813e+00, -5.5098e+00, -5.0539e+00, -4.2455e+00, -2.9042e+00, -2.8275e+00, -3.2229e+00, -2.0794e+00, -2.7823e+00, -2.3625e+00, -2.2727e+00, -1.9977e+00]], [[ 2.1511e+00, -4.2945e+00, -4.0653e+00, -4.5606e+00, -4.1571e+00, -1.8844e+00, -6.0731e+00, -4.6784e+00, -2.8678e+00, -3.4510e+00, -5.0881e+00, -5.4993e+00, -1.5524e+00]], [[ 9.2139e-01, -4.9957e+00, -3.8157e+00, -3.7600e+00, -4.1163e+00, -4.3849e+00, -7.7357e+00, -5.5062e+00, -4.2255e+00, -3.0549e+00, -1.0471e+00, -9.4720e-02, -3.1295e+00]], [[ 1.1558e+00, -3.2119e+00, -4.1501e+00, -5.0513e+00, -5.3758e+00, -4.1907e+00, -2.1807e+00, -4.0418e+00, -3.9088e+00, -2.6302e+00, -3.2974e+00, -8.5547e-01, -1.7608e+00]], [[ 9.5737e-01, -4.0616e+00, -5.1906e+00, -6.6369e+00, -3.0638e+00, -1.5496e+00, -3.9040e+00, -3.2028e+00, -3.9768e+00, -3.7351e+00, -5.3470e+00, -6.0159e+00, -3.2413e+00]], [[ 9.0143e-01, -3.0554e+00, -4.0226e+00, -3.8474e+00, -3.3422e+00, -1.7383e+00, -2.0166e+00, -2.6158e+00, -4.0956e+00, -4.1513e+00, -4.7899e+00, -4.6433e+00, -5.0801e+00]], [[ 1.7169e+00, -1.4129e+00, -2.1395e+00, -1.7844e+00, -1.0126e+00, -9.7084e-01, -1.7135e-01, 1.9136e-01, -2.2198e+00, -2.1062e+00, -2.0045e+00, -1.9695e+00, -1.0562e+00]], [[ 1.0612e+00, -4.8861e+00, -5.0517e+00, -3.8843e+00, -2.9442e+00, -3.4824e+00, -4.1056e+00, -3.8550e+00, -3.6276e+00, -3.8258e+00, -3.1376e+00, -2.4473e+00, -1.0559e+00]]], [[[ 1.7962e+00, -2.7994e+00, -6.9451e+00, -3.4765e+00, -3.0421e+00, -2.6171e+00, -3.9676e+00, -4.2929e+00, -5.5060e+00, -3.6921e+00, -4.8324e+00, -3.0731e+00, -2.9739e+00]], [[ 3.6979e+00, -1.1648e+01, -1.0745e+01, -6.2478e+00, -7.8939e+00, -7.1853e+00, -9.3182e+00, -9.8490e+00, -7.2807e+00, -6.8503e+00, -9.8695e+00, -5.6012e+00, -3.9814e+00]], [[ 3.4480e-01, -3.0237e+00, -4.7728e+00, -3.1836e+00, -2.5118e+00, -3.2589e+00, -3.8569e+00, -3.8674e+00, -3.8805e+00, -4.3108e+00, -3.6774e+00, -1.4274e+00, -3.0854e+00]], [[ 3.7301e-02, -1.1937e+00, -2.8914e+00, -1.6939e+00, -2.5210e+00, -2.6558e+00, -2.5971e+00, -2.6555e+00, -3.7643e+00, -3.3956e+00, -2.8264e+00, -1.0266e+00, -1.1847e+00]], [[-1.1508e-01, -4.9648e+00, -5.2704e+00, -4.1614e+00, -2.8285e+00, -3.4633e+00, -1.8586e+00, -2.4213e+00, -3.2853e+00, -3.1058e+00, -2.8940e+00, -1.4437e+00, -2.0773e+00]], [[ 1.3198e+00, -6.6712e+00, -4.8671e+00, -4.9931e+00, -4.9672e+00, -2.4405e+00, -3.5853e+00, -2.9232e+00, -2.6067e+00, -2.7955e+00, -4.2799e+00, -1.8070e+00, -2.2368e+00]], [[ 1.2976e+00, -5.2710e+00, -7.6788e+00, -7.6591e+00, -8.0458e+00, -6.3776e+00, -6.8557e+00, -4.6430e+00, -5.0890e+00, -5.6275e+00, -5.8958e+00, -4.8268e-01, -2.4694e+00]], [[ 7.2641e-01, -3.6905e+00, -4.6576e+00, -4.9403e+00, -3.7115e+00, -4.6763e+00, -2.2121e+00, -3.7019e+00, -3.8204e+00, -3.5313e+00, -3.2964e+00, -2.5992e+00, -3.2202e+00]], [[ 4.5527e-01, -4.5947e+00, -5.1592e+00, -4.9667e+00, -5.1872e+00, -3.6465e+00, -4.0083e+00, -3.0508e+00, -1.3854e+00, -2.3296e+00, -3.6296e+00, -1.1499e+00, -2.5169e+00]], [[ 7.3084e-01, -2.9102e+00, -2.9670e+00, -1.5005e+00, -1.0157e+00, -2.5054e+00, -1.7850e+00, -1.2783e+00, -2.1809e+00, -3.7125e+00, -3.5080e+00, -1.6457e+00, -3.0334e+00]], [[ 2.0058e+00, -9.5915e-01, -4.0301e+00, -2.8980e+00, -2.4427e+00, 1.1642e+00, 1.4195e+00, 1.0689e+00, -9.5616e-01, -1.4223e+00, 1.6597e-01, 1.6004e-01, -8.1236e-01]], [[ 9.3988e-01, -3.6451e+00, -2.1268e+00, -3.0642e+00, -3.2270e+00, -3.0164e+00, -3.6634e+00, -3.0924e+00, -1.9269e+00, -3.2933e+00, -2.7074e+00, -1.4655e+00, 1.6761e-01]]], [[[ 2.4636e+00, -6.1211e+00, -5.6559e+00, -4.9782e+00, -5.8333e+00, -5.1177e+00, -5.8910e+00, -4.3394e+00, -1.9497e+00, -4.2087e+00, -4.6251e+00, -5.5818e+00, -3.2625e+00]], [[ 4.0536e+00, -1.3916e+01, -1.1605e+01, -1.0593e+01, -1.0588e+01, -7.3540e+00, -1.0437e+01, -5.8839e+00, -2.8310e+00, -6.7652e+00, -4.9318e+00, -7.9108e+00, -2.8312e+00]], [[-1.7383e-01, -2.0292e+00, -3.0587e+00, -1.8625e+00, -7.1331e-01, -1.4552e+00, -1.9926e+00, -2.3675e+00, -1.8055e+00, -1.4543e+00, -2.6971e+00, -2.6840e+00, -3.2910e+00]], [[ 5.9419e-02, -6.8391e-02, -9.7358e-01, -1.0951e+00, -2.5709e+00, -2.7392e+00, -3.1026e+00, -2.5405e+00, -1.9103e+00, -3.6102e+00, -4.6367e+00, -3.9694e+00, -1.9242e+00]], [[-2.0797e-01, -3.0479e+00, -2.9579e+00, -2.6215e+00, -2.5089e+00, -2.8717e+00, -2.1590e+00, -1.8208e+00, -8.1536e-01, -1.5229e+00, -3.1335e+00, -2.0036e+00, -1.3425e+00]], [[ 1.7797e+00, -7.4299e+00, -4.0681e+00, -4.3735e+00, -4.7868e+00, -3.5541e+00, -4.2542e+00, -3.0655e+00, -9.6395e-01, -3.3826e+00, -2.4023e+00, -3.8863e+00, -1.4304e+00]], [[ 1.8727e+00, -1.0308e+01, -9.6634e+00, -9.2966e+00, -7.6920e+00, -5.0991e+00, -3.6066e+00, -4.1246e+00, -4.9397e+00, -6.2784e+00, -2.6180e+00, -8.6077e-01, -2.1447e+00]], [[ 9.0935e-01, -3.2642e+00, -3.8319e+00, -4.9694e+00, -3.8592e+00, -5.2595e+00, -1.7839e+00, -2.7177e+00, -1.4661e+00, -1.9569e+00, -2.8864e+00, -2.6112e+00, -2.2439e+00]], [[ 5.7999e-01, -5.2543e+00, -4.3504e+00, -3.7627e+00, -3.6153e+00, -4.1656e+00, -5.6195e+00, -3.9160e+00, -1.5374e+00, -2.1374e+00, -2.9868e+00, -4.6426e+00, -2.8665e+00]], [[ 8.6181e-01, -3.2610e+00, -2.9174e+00, -2.8309e+00, -2.9524e+00, -2.8508e+00, -3.4850e+00, -1.9564e+00, -2.1084e+00, -3.0994e+00, -4.4235e+00, -4.2994e+00, -1.6306e+00]], [[ 2.1555e+00, -2.0544e+00, -1.7567e+00, -1.0598e+00, -6.2222e-01, -1.6072e+00, 4.6489e-01, 9.5179e-01, -6.3866e-01, -1.4898e+00, -1.8430e+00, -8.7405e-01, 7.8398e-01]], [[ 1.1647e+00, -3.0235e+00, -2.7359e+00, -2.9851e+00, -2.3130e+00, -6.2914e-01, -2.5945e+00, -8.8922e-01, -3.0973e+00, -2.9333e+00, -3.4752e+00, -2.8332e+00, 2.0239e-01]]]]) attn_weights tensor([[[[-1.3361, -3.5611, -2.0088, -3.4646, -2.8090, -3.9053, -3.3097, -2.6392, -0.3695, -1.9451, -1.7331, -1.7009, -4.0669]], [[ 0.8709, -4.9341, -5.8000, -5.4660, -5.2524, -2.8327, -2.5325, -3.9479, -4.9954, -5.1398, -3.5638, -2.8674, -1.6385]], [[ 0.3228, -3.0063, -3.2655, -3.7084, -3.6523, -3.8751, -3.4539, -2.7285, -2.7575, -3.5871, -2.6528, -3.0641, -3.7676]], [[ 0.4699, -3.1423, -4.8729, -4.4452, -3.8260, -3.1480, -2.9924, -2.8702, -4.3180, -4.5328, -2.9658, -3.0696, -1.8919]], [[ 1.1225, -1.0306, -0.8207, -1.3081, -1.5753, -1.4943, -0.3900, -0.3367, -1.1617, -2.2487, -1.1017, -1.4168, -1.5898]], [[-0.5584, -4.2308, -5.0966, -4.6640, -5.1899, -3.9166, -4.1972, -3.5661, -3.1079, -3.2381, -3.3538, -3.8385, -3.7134]], [[ 2.3094, -3.6223, -3.6158, -4.0239, -3.1229, -2.7579, -2.6352, -2.5164, -3.0222, -3.6383, -2.3466, -1.4388, -0.7005]], [[-0.1604, -4.4258, -4.3464, -4.2306, -4.1569, -1.9102, -1.7818, -3.5847, -4.0649, -3.9021, -2.8522, -3.4017, -3.5089]], [[-1.1193, -6.0103, -5.0915, -5.1653, -5.2151, -6.1173, -5.2243, -5.5680, -3.3801, -2.7996, -2.1328, -2.3088, -4.2578]], [[ 4.8906, -5.6729, -3.6978, -5.6262, -3.7180, 0.2598, -7.7264, -5.5520, -5.6632, -6.8833, -3.2873, -3.0153, -0.4470]], [[ 2.8977, -4.4311, -2.9234, -3.0538, -1.6452, -0.8694, -0.5727, -0.5722, -0.9297, -2.2023, -0.8410, -1.5990, -0.3397]], [[-0.8029, -4.1781, -3.6229, -4.5040, -4.1498, -4.1809, -3.1885, -2.7544, -1.7021, -2.6272, -1.6306, -2.1137, -3.1983]]], [[[-1.1572, -3.1838, -2.4535, -2.6125, -3.8147, -3.3702, -3.1622, -4.1851, -3.4618, -1.4572, -2.0545, -1.4574, -3.9003]], [[ 0.4184, -3.7453, -5.5732, -4.8529, -3.7077, -3.6137, -2.2414, -4.2384, -4.4260, -4.9814, -4.7671, -4.3759, -4.5428]], [[ 0.5488, -3.0245, -2.5424, -3.2010, -2.8466, -3.5380, -3.1810, -2.2915, -2.4259, -2.0402, -3.2107, -2.9647, -2.7854]], [[ 0.3066, -2.4284, -3.8933, -3.6011, -2.3163, -2.1916, -1.6155, -1.7492, -2.1167, -3.9266, -4.0170, -3.0549, -2.6566]], [[ 0.9565, -1.1981, -1.0670, -0.9860, -0.9742, -1.3442, 0.0446, -0.5815, -1.7637, -1.2138, -1.6034, 0.0103, -0.6430]], [[-0.5679, -4.1539, -4.4275, -4.4777, -4.5534, -4.4530, -4.3776, -4.2369, -3.3898, -2.9143, -3.1435, -3.4589, -2.5926]], [[ 2.3617, -3.5396, -2.5800, -2.8777, -2.4271, -2.8614, -2.6740, -1.9427, -1.8189, -1.5026, -2.2613, -1.9006, 0.2509]], [[-0.5494, -3.5040, -4.3251, -4.0633, -3.1715, -1.6520, -0.9918, -2.1174, -3.0713, -3.9843, -3.6917, -3.1148, -2.8378]], [[-1.3295, -5.3240, -4.4456, -5.6371, -6.4870, -5.8149, -5.0856, -5.0537, -4.0415, -3.2148, -4.0196, -2.2702, -5.2562]], [[ 4.4631, -6.9862, -5.9576, -3.5665, -2.9342, -2.2479, -9.9303, -5.6328, -5.3607, -4.1050, -3.5945, -4.6734, -1.4613]], [[ 3.0022, -4.0033, -3.1447, -3.1784, -2.0342, -1.3417, -0.6521, -0.8503, -0.4801, -0.7121, -1.2066, -0.5383, -0.6674]], [[-0.1588, -3.6010, -3.9005, -4.5848, -4.5295, -4.9301, -3.1684, -3.9049, -2.3336, -2.3681, -2.7585, -1.3460, -2.5905]]], [[[-1.0207, -4.4970, -3.2067, -4.1691, -5.0024, -4.8701, -4.4036, -5.0980, -3.6045, -1.4654, -1.8440, -2.2156, -3.8510]], [[ 0.5567, -4.5251, -6.0618, -5.1312, -4.0318, -5.0543, -4.3323, -5.0948, -6.4922, -5.3646, -5.3192, -5.8637, -4.4547]], [[ 0.3368, -3.8835, -3.2822, -4.2678, -3.7729, -4.2489, -4.1505, -3.3809, -3.1283, -2.9326, -4.1397, -3.8852, -4.5023]], [[ 0.3435, -2.7771, -4.2869, -4.3444, -2.5884, -2.5322, -2.5613, -2.3241, -1.8696, -3.1318, -4.5842, -5.0224, -4.3328]], [[ 1.0912, -2.4621, -2.3160, -2.4837, -1.7639, -2.6617, -1.2637, -1.2327, -2.2203, -2.0345, -1.5170, -1.8853, -1.5305]], [[-0.6244, -4.2717, -5.4740, -5.2545, -5.2195, -5.4678, -4.6749, -4.8625, -3.5019, -3.7934, -3.9026, -3.3620, -3.2791]], [[ 2.1504, -2.9283, -1.9078, -2.0762, -2.4565, -3.4561, -4.8592, -3.5443, -2.3100, -1.3204, -2.5028, -1.8851, -1.0633]], [[-0.5543, -3.8818, -4.1837, -3.9287, -2.9848, -2.6436, -1.3728, -2.2565, -3.3187, -3.3908, -3.5046, -3.9915, -3.8496]], [[-1.5256, -5.9981, -5.6984, -7.2190, -5.9947, -6.0812, -6.1935, -5.0596, -4.0626, -3.6221, -3.5326, -2.8901, -4.5962]], [[ 4.8167, -9.6184, -7.8935, -6.8112, -2.7040, -1.7929, -8.7850, -7.0330, -6.9407, -6.6291, -7.0483, -6.2961, -2.7010]], [[ 3.4544, -3.0488, -2.9636, -3.4488, -2.1887, -2.6765, -1.8761, -2.6895, -1.2651, -1.1471, -1.7975, -2.1813, -1.3945]], [[-0.5982, -3.8193, -3.8714, -5.1436, -4.3624, -4.5069, -4.2617, -4.1321, -2.0989, -2.3987, -2.0835, -1.7179, -3.1568]]], [[[-0.0922, -4.8289, -5.9029, -4.0819, -3.3679, -1.1471, -1.2715, -4.0885, -4.7744, -4.3550, -3.5466, -2.9625, -2.4125]], [[-0.3009, -5.0086, -4.9042, -4.5388, -4.4313, -3.6919, -3.1345, -4.0832, -3.0738, -1.9503, -3.1506, -3.7255, -3.3942]], [[ 0.3714, -2.8403, -2.3680, -2.6303, -3.0565, -3.0939, -3.6380, -2.5756, -2.8177, -3.6070, -3.6492, -1.7311, -2.3117]], [[-0.1248, -2.2715, -3.0139, -2.2378, -1.5080, -2.3961, -1.7985, -1.8116, -2.2912, -3.5884, -3.3639, -2.0281, -3.4076]], [[ 0.9480, -0.6522, -1.3982, -1.4571, -1.7556, -2.0185, -1.6243, -1.4509, -2.1004, -3.1287, -2.8175, -1.3740, -2.6046]], [[-0.6965, -3.5518, -4.8041, -4.0526, -4.4175, -4.2455, -3.4610, -4.2604, -4.6125, -3.6644, -3.3492, -3.1655, -3.5653]], [[ 2.1482, -3.4819, -2.3920, -3.0297, -3.6667, -3.0714, -3.9273, -3.3645, -3.0982, -3.2997, -4.4705, -2.2764, -0.5670]], [[-0.4978, -3.7085, -4.8159, -3.0723, -2.2311, -2.6693, -1.4108, -2.7708, -2.4157, -1.4494, -1.3964, -2.4167, -3.4516]], [[-0.8103, -5.6774, -8.0627, -7.8504, -7.5079, -6.0584, -5.0651, -4.8222, -7.6506, -5.2847, -4.9512, -2.3793, -4.9492]], [[ 4.0574, -8.0546, -7.2008, -3.1714, -4.4845, -2.8932, -4.4087, -3.7456, -5.4207, -3.1573, -7.8194, -2.5738, -2.6483]], [[ 2.8354, -2.2333, -2.3237, -2.0697, -1.9441, -1.5438, -1.0247, -2.2361, -2.0009, -2.4079, -1.2917, -0.9801, -1.1148]], [[ 0.0200, -3.3783, -6.2815, -5.7885, -5.5367, -5.4723, -3.3390, -5.0716, -6.0879, -4.5270, -3.7530, -3.1186, -2.8841]]], [[[-0.6865, -3.3374, -2.4580, -2.4352, -2.3781, -2.6580, -2.1091, -4.0524, -3.0620, -5.0118, -4.4616, -4.7919, -3.7405]], [[-0.3037, -2.3032, -3.4745, -3.4120, -3.1849, -3.6390, -3.3819, -3.7672, -4.0402, -4.3797, -4.0174, -4.2163, -3.0678]], [[ 0.2181, -2.5317, -3.0802, -3.7181, -3.8014, -3.2095, -3.3588, -3.0516, -4.1222, -4.3816, -3.3130, -4.2296, -2.0982]], [[-0.1999, -1.3566, -1.9591, -1.8650, -1.3008, -2.3071, -1.7415, -1.5169, -1.5784, -1.7144, -3.0311, -3.3085, -1.5501]], [[ 1.1065, -0.1674, -0.4894, -1.3258, -1.6737, -2.3274, -1.0077, -1.6071, -1.8455, -2.2269, -1.9108, -2.1687, 0.1091]], [[-0.7547, -2.7991, -4.0664, -3.9488, -3.8502, -4.0967, -3.9057, -3.7382, -1.8085, -3.0561, -3.7481, -3.2243, -2.3351]], [[ 2.1117, -2.3436, -1.8476, -2.6116, -2.2827, -2.4066, -2.7339, -1.6511, -1.9498, -2.1448, -1.9908, -2.8734, -0.2299]], [[-0.7029, -3.6096, -3.7276, -2.9420, -2.2276, -2.1519, -1.1855, -2.2791, -2.5204, -1.6091, -0.5146, -0.9031, -2.7975]], [[-1.3104, -4.7059, -5.0012, -5.4624, -4.6742, -4.2858, -2.9598, -4.0520, -3.0564, -3.2558, -2.4267, -2.2379, -5.8633]], [[ 3.9511, -8.3983, -3.4070, -5.0426, -5.0535, -2.6477, -5.7829, -3.5607, -0.3089, -4.5530, -4.1349, -5.5184, -2.7586]], [[ 2.7846, -2.6151, -2.3385, -2.9477, -3.0938, -2.7759, -1.5298, -3.2014, -2.1442, -2.3935, -2.1603, -0.9968, -0.9673]], [[ 0.0185, -1.4143, -3.9959, -3.2825, -3.4333, -4.9267, -2.9270, -4.9639, -3.7021, -4.5558, -3.9986, -4.6464, -4.0762]]]]) attn_weights tensor([[[[-5.7229e-01, -6.5878e+00, -5.7032e+00, -5.9775e+00, -4.5645e+00, -6.0381e+00, -5.6258e+00, -5.0115e+00, -3.8928e+00, -3.7829e+00, -2.0301e+00, -1.7095e+00, -3.0110e+00]], [[ 3.7772e+00, -2.0872e+00, -1.7848e+00, -2.5006e+00, -2.5305e+00, -3.9422e-01, -2.6434e-01, -9.5927e-01, -9.6962e-01, -1.7540e+00, -1.3898e+00, -1.1823e+00, -7.6233e-01]], [[ 6.6663e+00, -2.9478e+00, -4.2027e+00, -2.8222e+00, -3.7694e+00, 1.7182e+00, -3.4618e+00, -4.2411e+00, -7.4125e+00, -5.2700e+00, -3.3169e+00, -1.8533e+00, 2.2797e+00]], [[ 3.1754e-01, -4.1768e+00, -4.8633e+00, -4.6645e+00, -4.8078e+00, -3.4223e+00, -2.9508e+00, -2.9429e+00, -3.5698e+00, -3.6046e+00, -2.3610e+00, -2.6847e+00, -2.1444e+00]], [[ 1.1643e+00, -5.7815e+00, -4.6644e+00, -4.9857e+00, -5.7204e+00, -5.4771e+00, -4.7064e+00, -5.1775e+00, -4.1356e+00, -4.3312e+00, -3.0888e+00, -3.6975e+00, -4.7953e+00]], [[ 8.5011e-01, -3.0959e+00, -2.2086e+00, -2.5103e+00, -3.4833e+00, -3.9132e+00, -2.4990e+00, -2.1914e+00, -3.1740e+00, -3.5143e+00, -2.2660e+00, -2.5815e+00, -2.6395e+00]], [[ 1.5109e+00, -3.2606e+00, -3.8838e+00, -4.2441e+00, -3.3433e+00, -1.3313e+00, -7.0411e-01, -2.1117e+00, -2.9391e+00, -3.2119e+00, -2.4410e+00, -1.7492e+00, -2.4724e+00]], [[ 2.9383e+00, -3.6412e+00, -3.1768e+00, -3.9557e+00, -2.8611e+00, -7.9706e-01, -4.8285e-01, -3.0338e-01, -1.2044e+00, -2.1528e+00, -9.0420e-01, -1.5966e+00, -1.1490e+00]], [[-1.8428e-02, -5.5556e+00, -5.1444e+00, -4.5498e+00, -4.5178e+00, -3.4404e+00, -2.9376e+00, -4.1793e+00, -4.3058e+00, -3.3174e+00, -1.7675e+00, -2.7608e+00, -4.9749e+00]], [[ 3.3670e-01, -2.7106e+00, -3.3708e+00, -4.2556e+00, -5.4243e+00, -2.2443e+00, -2.6640e+00, -2.1823e+00, -1.8488e+00, -2.3646e+00, -1.9643e+00, -3.1886e+00, -3.6053e+00]], [[ 3.9598e+00, -3.4190e+00, -2.7579e+00, -4.3041e+00, -6.0418e+00, 3.4517e-01, -3.8252e+00, -5.2660e+00, -5.2416e+00, -6.4873e+00, -5.3572e+00, -4.4150e+00, -6.3803e-01]], [[ 2.8861e+00, -3.9367e+00, -5.4170e+00, -4.6174e+00, -3.9901e+00, -1.3975e+00, -3.2752e+00, -3.6674e+00, -5.1849e+00, -4.3238e+00, -1.9163e+00, -2.2783e+00, -1.5553e-01]]], [[[-7.0287e-01, -5.6644e+00, -5.4562e+00, -5.3464e+00, -6.3500e+00, -7.2174e+00, -7.0536e+00, -5.2468e+00, -3.6359e+00, -2.9690e+00, -2.8170e+00, -2.8610e+00, -4.8708e+00]], [[ 2.8359e+00, -1.5664e+00, -1.1772e+00, -1.8272e+00, -8.0321e-01, 1.5742e-01, 1.4435e+00, 1.1272e+00, 1.0737e+00, 3.0447e-01, -5.0235e-01, 2.3236e-03, 6.0890e-01]], [[ 6.3790e+00, -4.4555e+00, -4.5291e+00, -3.3388e+00, -1.2863e+00, -7.5956e-02, -4.3791e+00, -2.4230e+00, -2.2413e+00, -3.3626e+00, -3.1476e+00, -6.1962e-01, 1.1844e+00]], [[ 1.6918e-01, -3.4270e+00, -3.4698e+00, -3.5201e+00, -2.7677e+00, -3.4244e+00, -1.8612e+00, -1.2062e+00, -8.0520e-01, -1.8089e+00, -2.2359e+00, -1.8033e+00, -2.1714e+00]], [[ 7.2123e-01, -3.2478e+00, -3.3760e+00, -3.4430e+00, -4.4797e+00, -3.9361e+00, -3.9011e+00, -4.2302e+00, -3.9897e+00, -3.8223e+00, -3.8339e+00, -3.0961e+00, -4.5690e+00]], [[ 7.5917e-01, -1.1163e+00, -1.2690e+00, -8.8046e-01, -1.4836e+00, -3.9359e+00, -1.2142e+00, -9.6780e-01, -1.2174e+00, -2.2575e+00, -1.9967e+00, -1.3355e+00, -2.6644e+00]], [[ 1.4630e+00, -2.1170e+00, -2.5624e+00, -2.8611e+00, -2.3372e+00, -1.3534e+00, -1.1659e+00, -1.3667e+00, -1.4389e+00, -2.2083e+00, -2.5800e+00, -2.1571e+00, -1.8565e+00]], [[ 3.1475e+00, -2.8522e+00, -2.1355e+00, -3.3879e+00, -2.5790e+00, -9.6542e-01, -1.5054e+00, -7.4032e-01, -4.8283e-02, -2.3302e+00, -3.2182e+00, -2.3453e+00, -2.2077e+00]], [[-3.9866e-01, -2.9515e+00, -2.2791e+00, -3.6421e+00, -2.8643e+00, -2.7160e+00, -7.9970e-01, -1.3711e+00, -1.4016e+00, -2.1008e+00, -3.4125e+00, -2.3077e+00, -3.2088e+00]], [[-4.8423e-02, -2.5860e+00, -1.9093e+00, -2.5949e+00, -3.6540e+00, -2.8041e+00, -2.3607e+00, -2.0267e+00, -2.8714e-01, -9.7925e-01, -1.5220e+00, -1.1070e+00, -1.6912e+00]], [[ 4.4727e+00, -4.5509e+00, -4.2575e+00, -3.1713e+00, -2.9973e+00, -2.0383e+00, -3.0076e+00, -2.4193e+00, -2.3849e+00, -3.6358e+00, -2.9675e+00, -1.8331e+00, 1.6934e-01]], [[ 3.1502e+00, -4.4894e+00, -4.2918e+00, -3.2210e+00, -1.8851e+00, -1.7674e+00, -2.8579e+00, -2.7668e+00, -3.6136e+00, -3.1902e+00, -3.2287e+00, -1.2538e+00, -2.8001e+00]]], [[[-6.2403e-01, -6.7745e+00, -6.2035e+00, -6.9477e+00, -7.4295e+00, -7.5220e+00, -8.2635e+00, -6.4298e+00, -4.3715e+00, -3.0097e+00, -2.8608e+00, -2.6588e+00, -4.9678e+00]], [[ 2.9551e+00, -3.2724e-01, -2.3182e+00, -2.9610e+00, -6.3119e-01, -1.1578e+00, -8.5513e-01, -1.1046e+00, -2.0855e+00, -2.0509e+00, -1.9510e+00, -2.4499e+00, -6.2343e-01]], [[ 6.3916e+00, -3.7451e+00, -3.9277e+00, -6.2866e+00, -2.9979e+00, -1.8151e+00, -4.7235e+00, -7.7455e+00, -5.3109e+00, -4.8980e+00, -6.0932e+00, -5.8195e+00, -1.4264e+00]], [[ 5.5679e-02, -3.9299e+00, -3.3366e+00, -4.0571e+00, -3.7711e+00, -2.8235e+00, -2.7422e+00, -1.9792e+00, -6.5626e-01, -1.3820e+00, -2.1972e+00, -2.3273e+00, -2.5393e+00]], [[ 1.1088e+00, -5.2249e+00, -4.0213e+00, -5.4955e+00, -6.9434e+00, -4.7068e+00, -4.5692e+00, -5.4700e+00, -4.5177e+00, -3.5295e+00, -4.9466e+00, -4.6759e+00, -4.1566e+00]], [[ 8.5890e-01, -2.1026e+00, -3.3907e+00, -4.3336e+00, -4.7356e+00, -4.3258e+00, -3.1128e+00, -1.8386e+00, -9.1271e-01, -3.9179e+00, -2.8107e+00, -3.2490e+00, -3.3020e+00]], [[ 1.4749e+00, -2.4386e+00, -3.5478e+00, -3.3507e+00, -2.9681e+00, -2.6936e+00, -3.0765e+00, -3.1490e+00, -3.0724e+00, -3.4766e+00, -4.2145e+00, -3.9101e+00, -4.6168e+00]], [[ 3.1118e+00, -4.1242e+00, -3.9059e+00, -5.7205e+00, -3.7892e+00, -3.3939e+00, -3.3475e+00, -2.7835e+00, -2.8707e+00, -3.7852e+00, -4.2183e+00, -4.4177e+00, -3.0146e+00]], [[-1.0577e+00, -4.5123e+00, -3.0498e+00, -4.2088e+00, -4.0701e+00, -4.6697e+00, -2.7619e+00, -3.2518e+00, -2.2743e+00, -1.3802e+00, -2.1438e+00, -2.1115e+00, -3.7977e+00]], [[-1.9191e-01, -1.9414e+00, -1.7673e+00, -3.1567e+00, -3.5086e+00, -4.3146e+00, -3.1276e+00, -2.9993e+00, -1.8074e+00, -2.0530e+00, -2.7354e+00, -2.3925e+00, -3.5484e+00]], [[ 4.4375e+00, -2.3250e+00, -2.3240e+00, -3.3288e+00, -1.5148e+00, -1.7820e+00, -3.3326e+00, -2.2930e+00, -4.0674e+00, -3.0953e+00, -5.4733e+00, -4.8636e+00, -2.5182e+00]], [[ 3.1252e+00, -3.8377e+00, -4.6023e+00, -3.7157e+00, -2.6024e+00, -2.8233e+00, -3.8992e+00, -3.8651e+00, -5.8569e+00, -2.7578e+00, -3.6589e+00, -3.0936e+00, -2.9067e+00]]], [[[-1.7880e-01, -7.1405e+00, -7.8580e+00, -7.3399e+00, -7.0393e+00, -6.0260e+00, -6.1187e+00, -6.2677e+00, -6.5309e+00, -5.5105e+00, -6.5234e+00, -2.8943e+00, -4.7336e+00]], [[ 2.4837e+00, -1.9288e+00, -3.3354e+00, -4.5567e+00, -3.5458e+00, -8.5219e-01, -9.3310e-01, -1.0126e+00, -2.0921e+00, -2.4367e+00, -2.4484e+00, -6.4838e-01, -1.4525e+00]], [[ 6.1856e+00, -2.4684e+00, -3.5480e+00, -1.0487e+00, -2.3190e+00, -1.1414e+00, -1.5292e+00, -2.0006e+00, -1.9319e+00, -4.9955e-01, -3.2299e+00, 1.0471e+00, -7.2892e-01]], [[ 3.9790e-01, -3.8020e+00, -4.1800e+00, -3.3588e+00, -3.2383e+00, -3.1735e+00, -2.7131e+00, -2.8131e+00, -3.2431e+00, -2.8811e+00, -2.8853e+00, -1.9340e+00, -1.5977e+00]], [[ 1.1687e+00, -5.1168e+00, -5.0668e+00, -4.8807e+00, -4.1963e+00, -4.4198e+00, -3.3092e+00, -3.2545e+00, -4.8900e+00, -4.7985e+00, -4.6572e+00, -3.0361e+00, -3.2709e+00]], [[ 4.5408e-01, -1.2046e+00, -2.3021e+00, -1.0293e+00, -9.9173e-01, -3.4158e+00, -1.4380e+00, -2.7072e-01, -1.7590e+00, -3.2012e+00, -2.2525e+00, -1.4443e+00, -2.4308e+00]], [[ 1.3881e+00, -1.9742e+00, -2.3456e+00, -2.2236e+00, -2.1198e+00, -2.0670e+00, -1.8977e+00, -2.0255e+00, -1.8522e+00, -1.9140e+00, -2.4074e+00, -1.5791e+00, -2.3425e+00]], [[ 3.2957e+00, -9.0786e-01, -1.9620e+00, -3.0812e+00, -1.8967e+00, -1.7441e+00, -1.5635e+00, -9.7361e-01, -1.4154e+00, -9.4431e-01, -1.7337e+00, -2.0061e-01, -1.5896e+00]], [[-5.5137e-01, -5.6700e+00, -6.1528e+00, -4.4092e+00, -3.6480e+00, -2.2075e+00, -4.5162e-01, -2.7234e+00, -3.8826e+00, -3.6241e+00, -1.5885e+00, -3.1633e+00, -2.4657e+00]], [[ 3.2519e-01, -2.2218e+00, -3.3828e+00, -3.9182e+00, -4.7893e+00, -3.6926e+00, -3.1236e+00, -2.7751e+00, -4.6840e+00, -4.4246e+00, -4.5826e+00, -4.0515e-01, -1.2323e+00]], [[ 3.8033e+00, -3.5616e+00, -3.3949e+00, -2.0936e+00, -3.7379e+00, -3.4146e+00, -1.2904e+00, -1.8666e+00, -2.4318e+00, -3.3691e+00, -4.7622e+00, -1.1468e+00, -8.9264e-01]], [[ 3.3128e+00, -1.6567e+00, -2.6939e+00, 1.8136e+00, -1.3896e+00, -2.4667e+00, -2.3562e+00, -3.1162e+00, -3.5860e+00, -2.4609e+00, -5.1000e+00, -1.5195e+00, -2.1461e+00]]], [[[-8.0017e-02, -7.1151e+00, -6.6027e+00, -6.5036e+00, -5.5839e+00, -4.2610e+00, -3.8920e+00, -6.9912e+00, -5.6211e+00, -5.8017e+00, -3.2119e+00, -3.2827e+00, -6.3191e+00]], [[ 3.0178e+00, -3.6474e+00, -2.4022e+00, -3.3509e+00, -2.6245e+00, -1.5403e+00, -9.8603e-01, -1.4588e+00, -1.9760e+00, -9.1931e-01, -6.9203e-01, -9.6388e-01, 4.6649e-01]], [[ 6.0288e+00, -4.9236e+00, -2.2417e+00, -4.1993e+00, -4.1311e+00, -1.1220e+00, -2.8609e+00, -4.0673e+00, 2.6233e-01, -2.6218e+00, -1.2186e+00, -1.4529e+00, -9.2133e-01]], [[ 5.7432e-01, -2.3028e+00, -2.6662e+00, -2.9887e+00, -3.2896e+00, -4.1585e+00, -3.7803e+00, -3.4041e+00, -1.4775e+00, -2.3664e+00, -3.5143e+00, -4.0778e+00, -2.2614e+00]], [[ 2.6825e-01, -1.0191e+00, -6.0026e-01, -9.2176e-01, -1.6824e+00, -2.9227e+00, -1.9940e+00, -2.3591e+00, -2.4864e+00, -3.8134e+00, -4.8246e+00, -4.3328e+00, -2.4534e+00]], [[ 8.4621e-01, -6.3320e-01, -1.0842e+00, -6.6478e-01, -1.1036e+00, -3.9041e+00, -1.9729e+00, -1.7421e+00, -1.7314e+00, -2.0862e+00, -3.4849e+00, -2.9898e+00, -7.1135e-01]], [[ 1.1535e+00, -1.9992e+00, -2.5277e+00, -2.5510e+00, -2.7474e+00, -2.3626e+00, -2.4568e+00, -2.1492e+00, -1.9717e+00, -2.4384e+00, -2.5469e+00, -2.4177e+00, -1.8189e+00]], [[ 3.2115e+00, 8.7671e-02, -1.4917e+00, -2.1981e+00, -1.4513e+00, -2.1014e+00, -2.8851e+00, -3.7413e+00, -3.9405e+00, -2.1044e+00, -1.6047e+00, -3.5114e+00, -1.4508e+00]], [[-2.0377e-01, -4.1335e+00, -3.6407e+00, -3.0766e+00, -2.8523e+00, -3.4259e+00, -2.3659e+00, -3.4821e+00, -2.9870e+00, -3.3158e+00, -3.8826e+00, -3.7418e+00, -4.1596e+00]], [[ 8.3365e-01, -2.6819e+00, -3.4809e+00, -3.7129e+00, -4.4343e+00, -3.8895e+00, -4.0905e+00, -4.2783e+00, -4.6896e+00, -5.7702e+00, -4.9837e+00, -6.5310e+00, -1.3529e+00]], [[ 3.5115e+00, -5.0980e+00, -1.7113e+00, -3.7597e+00, -3.1984e+00, -1.3643e+00, -3.4601e+00, -3.7089e+00, -1.2269e+00, -2.9778e+00, -1.6137e+00, -4.0434e+00, -2.2440e+00]], [[ 3.0162e+00, -4.0110e+00, -1.8977e+00, -4.1930e+00, -4.9355e+00, -2.3704e+00, -3.5412e+00, -2.8618e+00, -1.8826e+00, -5.0553e+00, -3.6887e+00, -4.4595e+00, -1.5388e+00]]]]) attn_weights tensor([[[[ 7.1797e-01, -3.0150e+00, -2.8575e+00, -3.0115e+00, -2.2168e+00, -4.0658e+00, -2.2827e+00, -2.3997e+00, -2.1421e+00, -2.6692e+00, -3.1919e+00, -1.9775e+00, -1.8681e+00]], [[ 4.8035e+00, -1.9745e-01, -2.4642e+00, -2.5328e+00, -3.0543e+00, 1.8967e-01, -1.0920e+00, -1.4508e+00, -2.5231e+00, -2.2297e+00, -2.1316e+00, -6.7988e-01, 1.9710e+00]], [[ 1.8369e+00, -7.1399e-01, -2.3870e+00, -1.5018e+00, -4.4366e-01, -3.2804e-01, -7.8393e-01, -5.6865e-01, -2.6897e+00, -1.8084e+00, -9.7312e-01, -3.1334e-01, -1.0883e+00]], [[ 2.0966e+00, -2.6928e+00, -2.1169e+00, -2.7656e+00, -2.7450e+00, 7.8204e-01, 8.2250e-01, 2.4681e-01, -1.2639e+00, -1.7619e+00, -2.8501e+00, -2.3625e+00, -2.2423e+00]], [[ 5.2409e-02, -6.9858e+00, -6.6522e+00, -6.8427e+00, -5.7891e+00, -4.2948e+00, -4.0543e+00, -4.4509e+00, -5.5502e+00, -5.3576e+00, -2.7724e+00, -3.1255e+00, -3.9394e+00]], [[-1.7197e+00, -5.1914e+00, -4.3945e+00, -4.2819e+00, -4.3298e+00, -3.7719e+00, -3.4836e+00, -2.8008e+00, -2.1512e+00, -2.3789e+00, -2.0060e+00, -2.5327e+00, -3.4611e+00]], [[ 2.9587e+00, -2.9628e+00, -3.5282e+00, -4.6812e+00, -5.5739e+00, -5.4106e-01, -1.0090e+00, -2.5854e+00, -4.6010e+00, -5.8275e+00, -4.2711e+00, -2.9624e+00, -9.5888e-01]], [[-1.3370e+00, -6.2507e+00, -6.3455e+00, -6.0408e+00, -4.5615e+00, -4.3903e+00, -3.9147e+00, -3.6517e+00, -3.8130e+00, -3.2143e+00, -1.0253e-01, -4.5496e-01, -1.9331e+00]], [[ 3.2598e-01, -2.4613e+00, -2.7605e+00, -2.9300e+00, -2.7268e+00, -5.3524e-02, -8.7515e-01, -1.8938e+00, -3.0787e+00, -2.9226e+00, -1.7117e+00, -2.1411e+00, -1.5131e+00]], [[ 1.2144e+00, -4.1385e+00, -3.7782e+00, -4.3677e+00, -3.2423e+00, -1.0178e-01, -9.4216e-01, -2.5363e+00, -2.6460e+00, -3.1242e+00, -1.5618e+00, -2.1257e+00, -1.8258e+00]], [[ 9.9859e-01, -3.2325e+00, -2.8226e+00, -3.4175e+00, -3.0692e+00, -5.1171e-01, -1.0131e+00, -1.7246e+00, -2.2810e+00, -2.6380e+00, -2.1880e+00, -1.8884e+00, -1.5102e+00]], [[ 3.6805e-01, -4.5246e+00, -3.7459e+00, -3.7683e+00, -4.2089e+00, -7.2163e-01, -1.8534e+00, -2.9018e+00, -3.4905e+00, -3.5252e+00, -2.8179e+00, -3.6341e+00, -3.6750e+00]]], [[[ 1.0149e+00, -3.0099e+00, -2.5861e+00, -3.1676e+00, -2.5603e+00, -4.0257e+00, -1.4977e+00, -2.8253e+00, -3.6472e+00, -2.6204e+00, -3.0284e+00, -1.6385e+00, -5.1540e-01]], [[ 5.2862e+00, -2.6469e+00, -3.1832e+00, -2.4146e+00, 2.9495e-02, 1.5000e-01, -1.3624e+00, -1.7458e+00, -9.5242e-01, -2.0148e+00, -1.4388e+00, -4.6448e-01, 2.0088e+00]], [[ 2.1061e+00, -1.5735e+00, -2.7878e+00, -2.2396e+00, -8.3401e-01, -4.9961e-01, -5.7880e-01, -8.5652e-01, -1.4406e+00, -2.4821e+00, -1.7316e+00, -1.3399e+00, -7.5034e-01]], [[ 2.7245e+00, -1.8992e+00, -1.7945e+00, -2.7269e+00, -2.2605e+00, -7.6851e-01, -5.7301e-01, -2.0187e-01, -5.7466e-01, -1.9543e+00, -2.5290e+00, -2.2449e+00, -1.2477e+00]], [[-1.2185e-01, -5.1464e+00, -3.7981e+00, -4.3195e+00, -3.8750e+00, -2.3491e+00, -1.9616e+00, -3.7662e+00, -3.4146e+00, -3.1967e+00, -3.5799e+00, -2.1520e+00, -1.8104e+00]], [[-1.3716e+00, -4.2328e+00, -3.6993e+00, -3.0618e+00, -3.4986e+00, -3.3658e+00, -3.3181e+00, -3.1474e+00, -2.7017e+00, -2.4357e+00, -2.1394e+00, -1.4653e+00, -3.2162e+00]], [[ 3.3233e+00, -3.8086e+00, -3.4052e+00, -4.6464e+00, -2.6280e+00, -1.8964e+00, -1.5385e+00, -3.4741e+00, -2.3801e+00, -3.7592e+00, -4.8884e+00, -2.7352e+00, -2.8694e+00]], [[-2.1796e-01, -5.4875e+00, -4.8003e+00, -6.1643e+00, -6.1841e+00, -5.0361e+00, -4.5264e+00, -4.0901e+00, -2.7790e+00, -3.0258e+00, -4.5538e+00, -3.8840e+00, -4.0632e+00]], [[ 8.7437e-02, -2.1856e+00, -3.0561e+00, -3.4375e+00, -2.9291e+00, 3.5167e-02, 3.2337e-01, -4.8819e-01, -1.0163e+00, -2.9441e+00, -3.2721e+00, -2.5965e+00, -1.8332e+00]], [[ 1.0332e+00, -3.5760e+00, -3.7812e+00, -4.2941e+00, -2.7311e+00, -5.0836e-02, -1.4344e-01, -1.4708e+00, -2.1857e+00, -3.1843e+00, -3.5066e+00, -2.4962e+00, -2.0372e+00]], [[ 1.2162e+00, -3.3582e+00, -2.9647e+00, -3.6224e+00, -2.6103e+00, -2.0207e+00, -1.1950e+00, -1.1956e+00, -1.3826e+00, -2.2250e+00, -2.7297e+00, -2.7708e+00, -8.9176e-01]], [[ 1.1039e+00, -3.7661e+00, -4.1729e+00, -3.7194e+00, -4.0815e+00, -2.3588e+00, -1.7477e+00, -2.8967e+00, -3.5978e+00, -4.0833e+00, -4.0660e+00, -4.9255e+00, -4.5107e+00]]], [[[ 8.7335e-01, -3.8753e+00, -3.4776e+00, -3.3562e+00, -2.8231e+00, -4.4649e+00, -2.3907e+00, -3.3604e+00, -3.3807e+00, -3.6168e+00, -3.4543e+00, -2.7294e+00, -2.2509e+00]], [[ 5.0023e+00, -1.7045e+00, -2.9846e+00, -3.6689e+00, -1.2566e+00, -1.4483e+00, -2.0184e+00, -2.7641e+00, -2.7681e+00, -3.1086e+00, -3.1167e+00, -3.2677e+00, -1.9048e+00]], [[ 2.0992e+00, -1.0536e+00, -2.0007e+00, -2.2612e+00, -1.1345e+00, -1.0543e+00, -1.4629e+00, -1.5468e+00, -1.7376e+00, -2.3659e+00, -3.1459e+00, -2.5511e+00, -2.1818e+00]], [[ 2.5897e+00, -2.2075e+00, -2.3156e+00, -3.2689e+00, -3.5973e+00, -4.2244e+00, -2.7174e+00, -2.7390e+00, -1.8823e+00, -3.3124e+00, -3.6164e+00, -3.9883e+00, -2.8657e+00]], [[ 5.2573e-01, -4.5145e+00, -4.9295e+00, -6.2233e+00, -6.2871e+00, -4.1868e+00, -3.6993e+00, -4.5220e+00, -5.2035e+00, -3.5262e+00, -2.7492e+00, -1.4964e+00, -2.9602e+00]], [[-1.6572e+00, -3.3035e+00, -3.1040e+00, -4.6608e+00, -4.7492e+00, -3.4778e+00, -3.6197e+00, -3.1158e+00, -1.4899e+00, -2.1335e+00, -2.6582e+00, -1.7462e+00, -2.8605e+00]], [[ 2.4858e+00, -3.0377e+00, -3.5934e+00, -4.9841e+00, -3.4554e+00, -3.8478e+00, -3.5286e+00, -3.1956e+00, -2.2389e+00, -3.1594e+00, -4.6333e+00, -4.8165e+00, -2.9147e+00]], [[-3.0658e-01, -5.7141e+00, -4.7359e+00, -7.6799e+00, -7.6240e+00, -4.9658e+00, -5.7735e+00, -5.5363e+00, -4.1552e+00, -2.3852e+00, -1.7836e+00, -1.9532e+00, -3.7006e+00]], [[ 7.2814e-03, -2.1305e+00, -2.3915e+00, -2.7123e+00, -1.9303e+00, -9.5352e-01, -8.9248e-01, -2.9848e-01, -1.3547e+00, -1.4723e+00, -3.3066e+00, -2.7621e+00, -2.5036e+00]], [[ 9.3270e-01, -3.4592e+00, -2.7538e+00, -3.6451e+00, -3.0634e+00, -2.3473e+00, -1.4755e+00, -2.6044e+00, -2.9583e+00, -2.5634e+00, -3.4461e+00, -4.0827e+00, -3.2883e+00]], [[ 9.9574e-01, -3.5882e+00, -4.1036e+00, -4.3834e+00, -2.8690e+00, -3.5678e+00, -3.8846e+00, -3.6981e+00, -3.2160e+00, -3.8570e+00, -4.8863e+00, -3.1865e+00, -1.8631e+00]], [[ 1.3759e+00, -2.3979e+00, -4.5361e+00, -4.2455e+00, -3.5286e+00, -2.6286e+00, -3.0761e+00, -2.8498e+00, -3.9885e+00, -4.7453e+00, -5.6936e+00, -5.4576e+00, -4.5395e+00]]], [[[ 1.0065e+00, -2.7150e+00, -2.4037e+00, -3.0117e+00, -2.4594e+00, -3.9821e+00, -2.1863e+00, -3.2886e+00, -2.4242e+00, -3.7192e+00, -2.6288e+00, -1.4675e+00, -1.3614e+00]], [[ 4.3183e+00, -2.6958e+00, -3.8915e+00, -2.3315e+00, -2.9556e+00, -2.2803e+00, -9.8489e-01, -2.2710e+00, -2.0620e+00, -2.0840e+00, -1.9581e+00, -1.8049e+00, -2.0315e+00]], [[ 2.4403e+00, -7.4394e-01, -2.0974e+00, -2.6611e-01, -9.7784e-01, -9.3733e-01, -1.1699e+00, -1.0597e+00, -1.0299e+00, -9.0165e-01, -1.7690e+00, 3.1726e-01, -7.6257e-01]], [[ 1.9735e+00, -3.0798e+00, -3.1078e+00, -3.1115e+00, -2.4709e+00, -1.3900e+00, -1.4985e+00, -2.0083e+00, -3.0074e+00, -2.6431e+00, -3.3565e+00, -4.5910e-01, -8.7020e-01]], [[-1.3902e-02, -4.3146e+00, -5.3288e+00, -5.5288e+00, -4.3126e+00, -3.6000e+00, -2.8383e+00, -3.2913e+00, -4.3621e+00, -2.7574e+00, -2.5821e+00, -3.3628e+00, -3.4343e+00]], [[-5.0440e-01, -3.8116e+00, -4.8588e+00, -5.1059e+00, -5.3488e+00, -3.1078e+00, -2.8605e+00, -3.6819e+00, -5.2905e+00, -3.8031e+00, -3.6418e+00, -2.6320e+00, -3.2300e+00]], [[ 1.6767e+00, -3.1609e+00, -3.5650e+00, -3.2294e+00, -1.7606e+00, -2.9737e+00, -2.2476e+00, -2.5225e+00, -1.9331e+00, -3.4302e+00, -3.5956e+00, -1.8312e+00, -2.1798e+00]], [[-1.4545e-01, -6.4287e+00, -7.1699e+00, -6.6420e+00, -5.7410e+00, -4.0287e+00, -3.5976e+00, -4.2793e+00, -5.3546e+00, -4.5783e+00, -3.5285e+00, -2.8114e+00, -3.3446e+00]], [[-1.4592e-02, -3.0049e+00, -4.1978e+00, -4.2186e+00, -3.5620e+00, -2.0057e+00, -1.6572e+00, -1.5728e+00, -3.2662e+00, -1.7169e+00, -1.2743e+00, -2.1877e+00, -2.5611e+00]], [[ 8.5942e-01, -4.4534e+00, -3.8012e+00, -3.6997e+00, -2.1594e+00, -1.5133e+00, -1.0091e+00, -1.8065e+00, -9.2592e-01, -8.1825e-01, -1.4342e+00, -1.8466e+00, -2.1405e+00]], [[ 1.1598e+00, -4.0546e+00, -3.6047e+00, -3.6452e+00, -2.5016e+00, -2.7248e+00, -2.5516e+00, -2.6449e+00, -2.2324e+00, -2.1121e+00, -2.7636e+00, -1.9297e+00, -2.0997e+00]], [[ 9.1981e-01, -4.0646e+00, -4.1876e+00, -3.4027e+00, -4.1481e+00, -2.2189e+00, -2.0626e+00, -3.0618e+00, -4.7809e+00, -2.6933e+00, -2.4598e+00, -3.6032e+00, -3.2293e+00]]], [[[ 1.3831e+00, -1.4728e+00, -2.0248e+00, -2.6385e+00, -2.8095e+00, -4.2825e+00, -1.6614e+00, -4.0988e+00, -4.5547e+00, -5.0751e+00, -4.5693e+00, -2.6797e+00, -1.6710e+00]], [[ 3.4840e+00, -1.8888e+00, -6.7378e-01, -9.7744e-01, -9.6654e-01, -3.8678e-01, -1.3756e+00, -2.4515e+00, -1.9818e-01, -1.8456e+00, -2.0582e+00, -2.6820e+00, -1.9148e+00]], [[ 1.5428e+00, 7.7797e-01, -2.4064e-01, -4.3442e-01, -4.3376e-01, -1.6818e-01, -3.3682e-01, -6.2083e-01, -5.9317e-01, -1.5818e+00, -7.4236e-01, -1.3225e+00, 4.7995e-01]], [[ 1.1558e+00, -1.4102e+00, -1.9158e+00, -1.6488e+00, -1.2388e+00, -3.2090e+00, -1.3705e+00, -1.7076e+00, -2.0957e-01, -1.3239e+00, -2.6311e+00, -2.0142e+00, -7.3016e-01]], [[ 2.5183e-01, -3.2301e+00, -4.4190e+00, -4.6401e+00, -5.4937e+00, -4.1734e+00, -3.8048e+00, -3.9841e+00, -7.4682e+00, -6.9198e+00, -4.5167e+00, -4.9793e+00, -3.1082e+00]], [[-5.4379e-01, -2.6137e+00, -3.0890e+00, -3.1189e+00, -3.7806e+00, -3.4077e+00, -2.7562e+00, -2.8519e+00, -5.3229e+00, -7.3428e+00, -5.5971e+00, -5.1475e+00, -2.7151e+00]], [[ 2.3500e+00, -1.1491e-01, -8.1242e-02, -1.7040e+00, -2.8111e+00, -2.4455e+00, -3.0865e+00, -3.2648e+00, -2.7418e+00, -4.4683e+00, -4.1158e+00, -4.8903e+00, -1.4569e+00]], [[ 1.7781e-01, -6.4795e+00, -6.6446e+00, -6.7372e+00, -5.6290e+00, -4.4219e+00, -3.9912e+00, -6.6245e+00, -4.7578e+00, -5.9493e+00, -5.4239e+00, -4.2038e+00, -4.9957e+00]], [[ 3.5733e-01, -1.1501e+00, -2.0423e+00, -2.8144e+00, -3.1357e+00, -1.3594e+00, -1.6671e+00, -2.2839e+00, -2.2670e+00, -2.0699e+00, -1.0939e+00, -1.3140e+00, -1.3330e+00]], [[ 1.0563e+00, -2.2507e+00, -1.6902e+00, -2.4045e+00, -2.4138e+00, -1.9179e+00, -1.8562e+00, -1.7847e+00, -1.0290e+00, -2.0108e+00, -1.9640e+00, -2.4325e+00, -8.1957e-01]], [[ 9.8478e-01, -1.8535e+00, -1.7293e+00, -2.2720e+00, -2.3296e+00, -2.8735e+00, -2.8757e+00, -2.8003e+00, -1.9186e+00, -2.6351e+00, -2.6625e+00, -2.8557e+00, -1.2332e+00]], [[ 5.8878e-01, -2.7343e+00, -3.1324e+00, -3.4738e+00, -3.3194e+00, -2.2248e+00, -2.2492e+00, -3.8491e+00, -5.1024e+00, -4.7028e+00, -1.9802e+00, -3.6489e+00, -3.0126e+00]]]]) attn_weights tensor([[[[ 1.9289, -3.1912, -1.1654, -1.8254, -2.7044, 2.1483, 1.7856, -1.8488, -1.6099, -1.7947, 0.2510, -1.6750, -2.4420]], [[ 3.7149, -2.7616, -3.8190, -3.7651, -3.3553, -0.9231, -0.3740, -3.0755, -4.2208, -4.3928, -3.3357, -2.2712, -0.0228]], [[ 2.1641, -3.4512, -3.0048, -3.5648, -3.3363, 0.6422, -0.2573, -1.8763, -3.5333, -3.2930, -2.8874, -3.0783, -2.6200]], [[-1.4084, -4.0543, -3.5362, -4.0385, -3.3443, -4.2981, -3.5752, -3.0405, -2.4292, -2.5743, -1.1016, -0.1639, -1.4587]], [[ 3.5353, -2.6652, -3.8791, -4.5580, -3.6474, 0.2386, 0.6898, -2.2707, -3.7605, -3.5623, -2.9551, -2.4611, -2.4422]], [[ 1.8087, -3.3398, -3.5023, -3.8811, -3.5084, -0.7201, -0.8695, -2.4920, -2.5447, -2.8976, -0.4046, -1.5013, -1.4560]], [[ 3.5960, -3.5889, -4.6889, -4.4843, -5.2043, 0.8292, 0.5123, -2.8922, -4.8481, -4.2443, -3.4110, -2.9721, -1.5405]], [[ 0.3659, -4.4400, -4.5942, -5.0216, -4.4445, -2.6509, -3.4588, -3.9838, -4.6358, -5.1494, -3.9330, -3.7569, -3.9255]], [[ 1.4727, -2.8460, -3.1593, -1.8243, -2.6609, -0.0201, 0.0131, -2.5560, -3.0585, -1.5202, -1.5151, -1.7530, -2.0122]], [[ 4.3984, -1.5795, -2.5667, -3.1449, -3.9779, 1.8930, 1.5774, -1.8369, -3.3359, -3.4477, -1.7054, -1.4143, -0.1293]], [[ 1.1383, -4.6010, -3.7636, -4.0516, -3.6349, -4.0309, -4.3536, -3.9020, -2.8818, -2.9478, -1.6109, -1.4978, -2.4152]], [[ 3.6619, -1.0410, -3.3542, -2.7915, -2.5779, -0.7624, -1.0270, -1.7248, -3.8577, -3.0551, -2.4322, -1.6527, -1.1535]]], [[[ 1.9937, -2.6889, -2.4834, -2.0344, -2.9130, 1.3772, 1.8246, -0.8317, -2.5786, -2.1367, -2.2289, -3.9706, -2.0487]], [[ 3.7759, -2.1875, -3.7621, -3.5063, -2.5063, -2.1817, -1.5078, -3.0022, -2.8517, -4.1985, -3.8168, -1.2811, -0.5645]], [[ 1.6423, -2.9865, -3.2107, -3.4875, -2.4628, 0.3329, 0.5510, -0.7484, -1.6392, -3.4614, -3.5961, -2.8222, -2.0431]], [[-1.0785, -3.4052, -2.9111, -3.5838, -4.7983, -3.5167, -3.3940, -2.8039, -1.8192, -1.3769, -1.9760, -1.0449, -2.0183]], [[ 3.7533, -3.2520, -4.7750, -5.1031, -3.4882, -2.1000, -1.4787, -2.6259, -4.0094, -5.0063, -5.1079, -3.1182, -2.6651]], [[ 1.9744, -3.8094, -3.6740, -3.8756, -2.9823, -1.1740, -0.6867, -2.4086, -2.8017, -2.7959, -3.4018, -2.3309, -0.8645]], [[ 3.8435, -3.0154, -3.9800, -3.1052, -2.6616, -0.4108, 0.5794, -2.2347, -2.4986, -3.7694, -3.1661, -1.7330, -1.2169]], [[ 0.6847, -3.5310, -4.4893, -4.5318, -3.9561, -2.6687, -2.5404, -2.9175, -3.3772, -4.5890, -4.5205, -3.4768, -3.9022]], [[ 1.8473, -3.2764, -3.9292, -3.0645, -3.1390, -1.0469, -1.2726, -2.2735, -2.4585, -3.4609, -2.3536, -2.8293, -2.3623]], [[ 4.5793, -2.4308, -3.6839, -2.4262, -2.0585, -0.1002, 0.3378, -1.8188, -2.3087, -3.5856, -3.0818, -1.3275, -0.7477]], [[ 1.1554, -3.8776, -2.8879, -3.3825, -4.4048, -2.1197, -2.4652, -2.5952, -2.5509, -1.8257, -1.8895, -0.9303, -0.8464]], [[ 3.8042, -0.5476, -2.4221, -1.5587, -1.6218, -2.4554, -2.4481, -3.0851, -2.7560, -2.9776, -1.8981, -3.1490, -2.3766]]], [[[ 1.8680, -1.5243, -0.9246, -1.7571, -1.6549, -0.1984, -0.4511, -1.5091, -2.0026, -0.8197, -3.2799, -0.8207, -1.6415]], [[ 3.9277, -2.4230, -3.5889, -3.5981, -2.0271, -2.5599, -3.2633, -4.8196, -1.7589, -3.3322, -5.2577, -2.7982, -0.6107]], [[ 1.3206, -1.9022, -2.1410, -3.4635, -2.0909, -1.7007, -1.7431, -0.9130, -2.2910, -1.9798, -4.4288, -2.3771, -0.2971]], [[-0.8990, -3.6310, -3.2634, -5.5078, -6.9606, -4.4676, -3.7601, -3.6092, -1.2551, -2.1729, -2.3998, -0.8624, -2.6400]], [[ 3.2196, -2.0215, -2.6798, -1.9269, -1.3070, -3.9523, -3.6296, -2.9787, -2.8235, -4.0037, -4.0633, -2.7314, -1.8051]], [[ 1.9114, -2.9030, -3.1814, -3.5484, -3.2766, -2.3999, -2.3362, -3.4807, -3.1603, -3.0707, -4.3006, -3.1935, -2.0392]], [[ 3.8707, -2.7238, -2.6946, -3.2336, -2.3348, -1.5619, -2.9527, -4.1325, -5.1705, -4.1912, -4.6003, -4.1877, -1.9281]], [[ 0.2091, -3.7073, -4.1661, -4.3198, -4.5878, -3.2252, -2.5519, -2.8867, -3.0073, -3.8678, -4.7340, -5.3013, -4.5028]], [[ 1.8441, -2.6201, -2.8875, -2.6811, -2.9921, -1.0672, -0.7329, -2.0206, -2.2098, -2.6449, -3.8077, -3.1221, -2.7861]], [[ 4.4230, -1.4877, -2.2620, -2.3839, -1.4511, -2.1711, -1.8480, -4.0938, -3.6910, -4.4195, -5.6331, -4.2357, -2.1228]], [[ 1.0418, -4.8754, -3.8159, -6.4063, -6.5587, -3.8110, -3.9033, -5.5259, -4.0591, -2.0895, -2.2666, 0.2473, -1.0582]], [[ 3.4572, -1.6801, -2.6267, -2.4139, -0.8283, -1.6806, -1.2321, -2.1232, -3.3470, -3.2159, -5.4964, -3.7019, -3.6343]]], [[[ 1.2979, -4.0310, -5.3820, -4.4196, -3.8135, -0.5065, -0.3290, -2.5376, -2.5112, -1.9971, -0.7859, -3.1265, -1.8522]], [[ 3.1205, -2.0066, -2.8875, -1.1112, -2.2663, -3.9334, -2.6270, -2.6625, -2.1762, -3.5415, -4.1139, -1.9002, -1.8942]], [[ 1.2597, -3.5081, -4.0903, -4.0014, -2.7206, -2.2122, -1.3941, -1.9499, -1.9206, -1.7044, -1.4749, -1.9625, -2.7772]], [[-0.3124, -3.1102, -3.7922, -4.3347, -5.2849, -2.9310, -2.4579, -2.9641, -5.0307, -4.0445, -2.8106, -1.3950, -2.7968]], [[ 2.4488, -2.4544, -3.2614, -3.1855, -2.1336, -2.4964, -2.5790, -1.5179, -2.6260, -2.9008, -3.8760, -1.6864, -2.7928]], [[ 1.9215, -2.7088, -2.2864, -2.9257, -3.5120, -2.6801, -1.7178, -2.7692, -3.1414, -3.3598, -2.5989, -2.5161, -1.5456]], [[ 2.7795, -4.0645, -3.7577, -2.5730, -3.7563, -2.9774, -2.0687, -3.4054, -2.9054, -2.8315, -3.5054, -1.4316, -2.5512]], [[ 0.5115, -3.3029, -3.8713, -3.4929, -2.5936, -4.9971, -3.8792, -2.9049, -3.0295, -5.0914, -4.0797, -2.5263, -3.4648]], [[ 1.9667, -2.7325, -3.0654, -2.0556, -3.0812, -1.9161, -1.0916, -2.2031, -2.6582, -1.8252, -0.8724, -0.5199, -2.0317]], [[ 3.7028, -3.6699, -3.4626, -2.1460, -2.7811, -2.2159, -0.4399, -2.3235, -1.6629, -1.8193, -2.2081, -1.0298, -2.0833]], [[ 0.8380, -3.8176, -4.9726, -4.4914, -4.1589, -2.6638, -2.0645, -2.1166, -2.8833, -2.2190, -2.1944, -1.4245, -1.6845]], [[ 3.3170, -0.6574, -2.6413, 0.7848, -1.7145, -3.7731, -2.7428, -3.2126, -1.6664, -3.2649, -3.6692, 0.2571, -2.0415]]], [[[ 1.6709, -2.2779, -3.0968, -3.3247, -4.3508, -0.6564, -0.2390, -3.5314, -4.8258, -4.5078, 0.0815, -1.2021, -2.2413]], [[ 2.7836, -1.1758, -1.6613, -2.5077, -1.7459, -3.0136, -2.6807, -2.9274, -1.2633, -2.7961, -2.8436, -3.1589, -0.5501]], [[ 1.2866, -2.9920, -2.5574, -2.6957, -2.5617, -1.8921, -1.2762, -2.5476, -3.2113, -2.6560, -1.0250, -2.0539, -1.3139]], [[-0.1697, -2.4357, -3.3379, -3.1861, -4.7048, -3.0174, -2.2492, -3.4302, -4.3912, -5.7708, -4.6349, -4.5696, -3.1393]], [[ 1.8340, -0.2872, -2.6467, -2.3971, -1.9459, -1.3575, -1.9553, -2.0680, -2.3814, -2.3547, -3.5388, -3.1478, -0.6239]], [[ 1.7265, -0.8504, -1.7910, -2.8076, -3.2714, -1.3312, -1.7518, -2.1224, -3.4902, -4.1387, -3.1327, -2.6588, -0.9418]], [[ 2.0895, -2.2954, -2.8023, -3.8366, -3.4454, -0.0378, -0.3028, -3.3981, -2.9943, -3.1349, -0.0483, -1.3792, -2.3357]], [[-0.2064, -3.1502, -3.3851, -3.3614, -3.1914, -3.3031, -3.0483, -3.4585, -2.7632, -3.2756, -3.8955, -3.8828, -3.4655]], [[ 1.5450, -2.7547, -3.4390, -2.4930, -3.1125, -0.5772, -1.1050, -2.7163, -3.4215, -4.3213, -0.6516, -1.6771, -2.6000]], [[ 2.6752, -2.7432, -2.4277, -3.6823, -2.6165, 0.3662, -0.2759, -3.0573, -2.5264, -1.3674, 0.3356, -1.1455, -2.3761]], [[ 0.7786, -2.9048, -3.0784, -2.9659, -2.7928, -3.4085, -2.5106, -2.8407, -2.4403, -3.5448, -3.3574, -2.7145, -1.5284]], [[ 3.7898, -0.9706, -1.3168, -2.4663, -1.8091, -1.8179, -2.8915, -3.5226, -1.5533, -2.1677, -3.1892, -3.9907, -2.0759]]]]) attn_weights tensor([[[[ 2.4317, -2.8555, -3.5818, -2.8731, -3.3910, 1.7475, 1.2190, -2.4742, -3.9032, -3.0020, -0.7270, -2.1607, -2.1641]], [[ 4.1391, -1.9720, -3.4901, -1.8247, -3.3170, 1.5577, 0.1979, -2.4484, -4.3168, -1.6915, -1.0456, -0.8227, 1.2748]], [[ 3.2737, -1.5648, -2.4436, -2.7146, -3.2074, 0.5103, 0.8452, -1.7647, -2.6046, -2.2688, 0.0382, -0.7242, -0.1053]], [[ 2.8683, -0.8363, -2.7522, -2.5280, -2.4393, 2.1964, 0.0495, -0.8649, -3.5461, -2.7085, -1.5514, -1.0628, -0.1485]], [[ 2.5226, -1.2364, -1.7762, -1.8641, -1.2804, 0.8624, 0.4256, -0.8618, -1.7558, -1.1794, -0.5270, -0.3876, 0.3585]], [[ 2.1339, -3.5738, -3.9007, -4.2770, -4.0335, -3.2378, -4.4346, -3.5972, -3.0214, -2.7568, -2.7015, -3.4788, -3.1406]], [[ 2.7127, -2.1788, -3.3867, -2.3709, -2.7535, 1.0468, -0.1598, -2.0558, -3.8228, -2.9052, -1.2627, -1.3776, -1.6316]], [[ 1.8937, -1.6796, -2.7372, -3.1133, -2.1854, 2.3448, 0.4029, -0.6025, -3.0820, -2.9963, -0.3998, -0.3260, -0.9935]], [[ 3.6246, -1.2815, -2.8363, -3.3140, -2.7718, -0.8531, -1.2309, -1.1094, -2.6422, -2.5184, -1.1488, -0.8742, 0.0431]], [[ 1.2304, -4.4526, -4.4068, -4.9023, -2.9878, -2.9964, -2.9852, -3.8136, -3.9499, -4.1800, -1.2364, -0.6489, -1.6471]], [[ 3.3299, -1.6529, -2.3219, -2.0422, -2.3606, 1.4007, 0.1531, -1.5865, -2.4971, -1.9037, -1.1612, -0.4633, -0.5740]], [[ 4.2798, -1.1394, -0.3421, -1.3709, -1.7073, 2.4867, 2.3617, -0.7831, -0.7447, -0.8815, 4.2425, 4.1326, 2.8722]]], [[[ 2.7825, -3.7114, -4.0034, -3.3719, -3.6450, 0.4303, 0.7453, -2.9750, -3.4339, -4.2106, -3.6683, -2.6858, -2.3368]], [[ 4.1002, -2.3660, -2.7396, -1.6407, -2.2416, 0.1940, 0.6860, -1.5469, -1.9491, -2.5447, -1.2284, -1.6162, -0.3058]], [[ 3.4518, -1.6372, -2.1423, -1.8700, -1.0303, -1.4774, -0.5116, -1.9242, -1.5572, -2.6281, -2.2200, -1.0681, -0.8849]], [[ 3.1303, -0.7422, -2.6344, -2.1273, -1.6500, 0.7485, 0.5051, -0.9016, -2.0149, -2.5402, -2.1212, -1.0195, 0.2584]], [[ 2.2705, -1.3461, -1.4044, -1.4517, -0.6383, -0.3331, 1.7279, -0.3414, -0.7865, -0.9223, -0.8109, -0.2632, 0.1287]], [[ 1.7891, -3.1320, -3.1537, -4.0876, -3.5590, -2.8392, -3.6335, -3.5694, -3.0185, -2.6563, -3.2562, -2.7734, -2.3097]], [[ 3.3220, -2.7456, -3.3367, -2.4723, -2.2455, -0.4466, 1.2352, -1.9250, -2.0177, -2.5774, -2.0807, -0.8743, -0.0999]], [[ 2.6340, -2.7953, -2.3503, -2.4993, -2.1375, -1.1708, -0.2411, -0.9182, -1.0815, -1.7850, -1.7866, -1.1520, 0.0938]], [[ 3.2924, -1.9605, -3.4363, -2.3749, -2.0909, -2.7591, -2.2818, -2.2847, -2.1508, -2.9965, -1.7383, -0.9073, -0.5953]], [[ 0.8070, -3.4922, -4.1710, -3.6564, -4.1321, -2.7892, -3.1925, -3.0697, -3.3529, -3.7132, -3.3748, -3.3039, -2.0010]], [[ 3.6663, -1.7217, -2.6495, -1.5711, -2.1889, -1.1962, -0.7165, -1.5402, -1.5503, -2.8658, -1.6817, -1.3810, -0.9359]], [[ 4.8826, -0.2780, 0.5395, -2.6273, -2.0750, 1.2477, 1.5317, 1.6593, 1.3011, 1.4632, -1.6964, 1.1419, 2.4785]]], [[[ 2.7131, -3.1536, -4.1534, -3.6226, -3.7200, -0.7859, -1.8754, -3.6634, -3.4206, -4.2252, -4.0357, -4.5095, -1.7842]], [[ 4.4556, -1.3536, -3.3106, -3.2605, -2.1471, -0.6474, -1.6035, -2.8103, -2.4721, -4.3372, -3.7806, -3.5503, 0.1942]], [[ 3.2235, -1.3436, -2.0061, -3.1774, -1.9173, -0.7402, -0.4617, -2.4749, -2.3588, -2.8299, -3.0717, -3.2762, -0.7844]], [[ 2.7328, -1.9889, -2.1062, -2.5645, -1.8553, -0.4427, -1.4184, -2.1745, -3.1479, -2.6512, -2.5572, -3.0194, -1.0882]], [[ 2.5018, -0.4478, -0.8723, -0.7693, -1.5452, -1.0315, -0.6385, -1.1997, -0.6134, -0.5873, -2.1747, 0.0239, -0.4713]], [[ 1.9851, -2.9367, -2.5717, -4.3090, -4.7017, -3.3459, -3.9447, -3.7672, -3.3244, -2.3223, -1.7171, -1.6892, -2.9053]], [[ 3.0797, -1.6810, -2.8091, -2.7202, -1.9317, -0.9397, -1.4789, -2.6808, -2.8606, -3.5991, -3.1849, -3.7054, -1.2354]], [[ 2.1833, -2.5734, -2.8358, -2.7554, -2.5604, -3.5157, -4.6857, -2.8131, -2.5943, -3.0840, -3.4701, -2.3915, -1.2801]], [[ 3.5183, -2.3639, -2.8044, -4.1308, -1.8336, -3.9264, -3.9500, -2.9704, -2.4829, -3.2452, -2.3705, -2.2124, -0.4776]], [[ 0.4520, -3.2385, -3.2452, -3.9695, -3.9720, -2.6010, -2.2624, -3.3223, -2.3157, -2.2187, -2.6231, -2.0084, -1.6202]], [[ 3.2857, -1.5790, -2.5814, -2.0810, -2.3933, -1.6087, -2.2868, -2.4260, -2.7809, -3.4802, -3.4268, -2.7678, -0.8668]], [[ 4.9465, -0.7799, 1.2474, -0.7912, -2.2342, -0.7820, -0.4459, 0.3549, 0.0765, 1.3640, -1.5714, -0.6696, 1.2673]]], [[[ 2.9443, -4.8579, -5.3655, -4.3748, -5.2815, -0.9240, -0.5660, -4.0061, -5.1804, -1.0463, -2.0079, -1.8826, -3.7564]], [[ 3.6525, -2.7686, -2.4713, 1.1121, -2.8081, -1.9526, -1.5562, -1.2734, -2.1368, -0.9596, -3.0355, -1.5234, -0.7381]], [[ 3.1821, -2.5401, -2.5651, -2.0548, -3.1866, -2.9811, -1.5909, -2.4759, -1.9829, -2.7849, -1.5860, -0.4037, -1.4721]], [[ 2.7514, -2.3557, -3.6559, -2.6409, -3.1550, -1.7493, -1.2509, -2.5202, -2.6504, -2.6459, -2.1831, 0.3777, -2.3544]], [[ 2.3266, -1.2063, -2.0987, -1.2707, -1.3403, -1.4401, 0.3730, -0.8044, -0.6444, -0.6619, -0.1632, -0.6749, -0.3177]], [[ 0.7734, -1.9656, -3.5640, -3.2458, -3.1278, -2.2920, -2.2676, -1.7753, -2.5515, -2.7822, -2.9772, -1.1807, -2.0377]], [[ 3.5217, -5.2000, -5.0662, -4.3438, -4.7260, -1.9249, 0.2556, -4.7951, -4.3360, -1.1567, -0.9374, -3.2479, -3.1816]], [[ 2.8166, -2.1124, -1.7488, -1.9911, -2.4209, -3.1520, -1.8825, -0.9564, -2.3544, -5.2077, -1.8866, -0.2419, -1.2484]], [[ 3.1230, -1.2396, -3.0681, -0.8455, -2.4281, -2.7894, -2.7935, -2.3080, -1.8138, -2.6349, -4.4913, -0.7362, -1.5051]], [[ 0.9341, -4.0086, -2.6889, -2.9486, -2.3894, -1.6616, -1.5100, -2.9820, -3.0339, -3.0362, -3.0570, -2.2964, -1.4009]], [[ 3.0294, -3.0855, -2.7181, -1.6085, -4.0508, -3.0271, -2.1012, -2.5418, -3.8584, -3.0245, -3.4346, -1.7664, -1.7984]], [[ 4.2538, -1.3812, -2.4552, -3.3125, -3.8301, -1.8263, -0.7553, -0.0347, -2.0606, -2.0697, -1.8960, 0.7827, 0.2131]]], [[[ 1.8836, -3.2724, -4.1656, -4.3072, -4.4148, 1.4704, -0.2452, -3.5351, -3.8229, -3.6139, 0.0464, -1.5799, -2.7259]], [[ 2.6695, -1.6893, -2.3958, -2.7215, -2.6392, 0.5131, -1.5009, -2.0909, -1.4234, -1.3496, 0.4509, -1.4687, -0.9430]], [[ 2.4933, -0.8556, -1.4410, -3.2015, -3.2484, -0.8620, -1.8051, -3.3359, -2.0981, -1.9548, -1.2676, -2.1953, -0.9646]], [[ 2.2274, -0.5162, -2.5525, -3.0042, -3.0874, 1.2509, -1.8886, -2.0220, -2.4957, -2.5531, -1.8056, -2.4684, 0.0793]], [[ 2.5124, 0.0765, -2.8524, -1.9863, -1.9687, -1.7506, -0.8331, -1.9637, -2.3434, -3.1724, -0.7012, -1.8019, 0.2174]], [[ 0.9513, -1.5092, -1.8592, -2.1072, -2.4780, -2.2596, -2.2858, -1.2891, -3.6473, -3.8697, -3.7144, -3.9484, -0.9803]], [[ 2.2501, -3.5351, -3.8855, -3.8069, -4.4129, 0.1030, -0.8366, -4.0204, -3.8014, -3.4387, 0.1174, -1.0746, -2.9360]], [[ 2.0757, -0.2167, -0.7359, -2.1613, -1.7922, -0.3755, -1.7429, -0.4052, -1.3090, -1.5877, -1.0433, -2.0980, -0.1579]], [[ 3.0774, -2.5198, -2.4163, -3.1003, -1.9456, -3.0569, -4.2729, -3.8353, -2.1954, -0.9508, -2.5532, -3.6926, -1.6266]], [[ 0.5545, -3.1790, -0.8510, -1.1477, -1.9718, -1.7645, -0.7185, -0.4280, -1.6498, -3.0011, -2.7071, -2.6135, -1.1062]], [[ 2.4385, -3.1470, -2.0722, -2.8924, -2.4532, 0.5529, -1.1521, -3.6568, -2.7414, -2.2111, -0.5633, -1.4445, -2.6891]], [[ 2.8894, -1.5186, -1.7420, -3.2917, -2.3880, 0.9246, 0.1040, -1.7559, -2.2038, -2.4872, 0.5036, -0.2301, -0.6437]]]]) attn_weights tensor([[[[ 1.9948e+00, 5.7403e-01, -8.8786e-01, -6.5304e-02, 2.9232e-01, 8.0140e-01, 3.7400e-01, 4.4484e-01, -6.2319e-01, -2.9331e-01, 8.5993e-01, 6.6714e-01, 4.2429e-01]], [[ 3.7068e+00, -1.1218e+00, -1.7587e+00, -1.6609e+00, 1.0721e-01, -3.8819e-02, 4.3918e-01, -3.0182e-01, -1.7543e+00, -1.2946e+00, 5.1597e-01, 1.2905e+00, 8.8946e-01]], [[ 2.9178e+00, -9.3791e-01, -1.7413e+00, -1.9378e+00, -1.2813e+00, 4.3109e-01, 6.6204e-01, -3.9430e-01, -1.9544e+00, -1.6367e+00, -4.0407e-01, 5.1233e-01, 1.6615e-01]], [[ 1.4051e+00, -5.7593e-01, -1.8070e+00, -2.3146e+00, -8.5091e-01, -1.5834e+00, -1.0090e+00, -7.9589e-01, -2.3276e+00, -3.0741e+00, -1.4446e+00, -9.9051e-01, -1.9283e+00]], [[ 2.3782e+00, -6.9190e-01, -1.2609e+00, -9.8260e-01, -8.4465e-01, -2.2246e-01, -1.0779e+00, -7.4681e-01, -1.3954e+00, -9.7356e-01, 1.4768e-01, -5.9019e-02, 8.0926e-02]], [[ 3.7514e+00, -6.5684e-01, -6.4386e-01, -9.1215e-01, -9.0789e-01, 1.2591e+00, 3.0158e+00, -6.6781e-01, -1.2541e+00, -1.3430e+00, -3.5931e-01, 5.2802e-01, 6.5981e-01]], [[ 3.0940e+00, -1.2716e+00, -2.7101e+00, -1.8181e+00, -1.9242e+00, -2.8086e-01, -1.0006e+00, -1.0620e+00, -3.0714e+00, -2.2679e+00, -1.2515e+00, -7.4773e-01, -6.3046e-01]], [[ 3.8629e+00, 1.5705e-01, -6.3548e-01, -1.4435e+00, -4.1189e-01, 1.5111e+00, 3.6098e-01, 3.5189e-01, -4.2068e-01, -1.3982e+00, 1.1342e-01, 1.5857e+00, 1.4420e+00]], [[-1.3901e+00, 2.6069e+00, 3.4372e+00, 2.6353e+00, 3.0159e+00, 2.4111e+00, 2.2057e+00, 2.4139e+00, 4.0795e+00, 3.1903e+00, 3.6016e+00, 3.9099e+00, 2.7286e+00]], [[ 4.2089e+00, -1.6165e+00, -3.5011e+00, -2.8111e+00, -3.0306e+00, 1.2799e+00, 8.2999e-01, -1.8967e+00, -3.7098e+00, -2.8332e+00, -5.0172e-01, -1.1914e+00, 2.3833e-01]], [[ 2.6464e+00, -4.2579e-03, -2.7274e-01, -6.8771e-01, -2.1715e-01, 2.3346e+00, 1.7256e+00, 9.5739e-01, -3.5782e-01, -6.0982e-01, 1.9833e+00, 1.7334e+00, 5.7025e-01]], [[ 3.4141e+00, -4.5027e-02, -1.8252e+00, -1.1667e+00, 5.9508e-01, 1.9591e+00, 3.6253e-01, 2.0290e-01, -1.8370e+00, -1.6261e+00, 1.2614e+00, 7.8963e-01, -1.6749e-01]]], [[[ 1.6357e+00, 8.3826e-02, -4.3971e-01, -5.3006e-01, 2.8673e-01, 7.8535e-01, 7.5833e-01, 1.4693e-01, 3.7461e-01, -4.0599e-01, -4.3815e-01, 3.6038e-01, 6.8265e-01]], [[ 3.9585e+00, -1.0068e+00, -9.8788e-01, -9.2272e-01, -8.1054e-01, -1.1633e+00, -4.3327e-01, -3.2233e-01, -4.8350e-01, -1.3306e+00, -9.6592e-01, -8.8613e-01, -8.1485e-01]], [[ 3.5150e+00, -1.5510e+00, -2.0537e+00, -2.1515e+00, -2.0804e+00, -7.5025e-01, -2.4166e-01, -1.1354e+00, -1.5674e+00, -2.1344e+00, -1.7810e+00, -1.1114e+00, -1.1776e+00]], [[ 1.6394e+00, -1.8012e+00, -1.0701e+00, -1.8761e+00, -2.5543e+00, -2.3187e-01, -6.5036e-01, -7.4564e-01, -1.5686e+00, -1.1263e+00, -1.8308e+00, -1.2156e+00, -1.7180e+00]], [[ 2.1550e+00, -9.5978e-01, -1.8259e+00, -1.2682e+00, -1.3194e+00, -1.4543e+00, -1.5411e+00, -6.9911e-01, 1.7135e-01, -1.8038e+00, -1.2549e+00, -1.2719e+00, -6.6028e-01]], [[ 4.4310e+00, 6.9316e-01, -2.0553e+00, -1.0841e+00, 2.5066e-01, 1.0281e-01, 1.6601e+00, 9.7632e-01, 1.5656e-01, -2.0226e+00, -1.3651e+00, 6.8226e-02, 6.0474e-01]], [[ 3.5861e+00, -1.9333e+00, -2.6134e+00, -2.4995e+00, -2.1427e+00, -1.3428e+00, -1.2583e+00, -1.2690e+00, -1.5570e+00, -3.0176e+00, -2.7704e+00, -5.1008e-01, -8.6578e-01]], [[ 4.8447e+00, -4.8740e-01, -1.3296e+00, -2.3566e+00, -7.5738e-01, 1.0869e+00, 5.4028e-01, -3.6986e-01, -5.9230e-01, -1.7977e+00, -2.5782e+00, -1.8547e-01, 1.4109e-01]], [[-1.5104e+00, 4.1706e+00, 6.1366e+00, 5.1837e+00, 3.6503e+00, 3.4642e+00, 3.6783e+00, 4.1747e+00, 4.5553e+00, 6.1091e+00, 6.1134e+00, 3.7770e+00, 5.8744e+00]], [[ 4.3281e+00, -2.8763e-01, -1.6331e+00, -2.0674e+00, -8.0315e-01, -7.1553e-01, 2.1085e-01, 6.5612e-01, 2.6039e-01, -1.0418e+00, -1.7022e+00, -1.0478e-01, 1.1565e+00]], [[ 3.1419e+00, -4.0215e-01, 8.8905e-01, 5.6713e-02, -6.9678e-01, 8.9046e-01, 1.2778e+00, 7.5895e-01, 4.5502e-01, 9.2545e-01, 1.5080e-01, 2.6677e+00, 2.0893e+00]], [[ 3.1827e+00, -1.3480e+00, 1.8344e-01, -4.7549e-01, -1.0905e+00, 1.7874e+00, 1.7863e+00, 2.3759e-01, -3.1626e-02, 1.0306e+00, -7.0894e-02, 1.2746e+00, 1.2807e+00]]], [[[ 1.2117e+00, 1.1522e+00, 1.1587e-01, 5.7633e-01, 1.2150e+00, 3.2009e-01, 1.0590e+00, 8.3094e-01, 1.2847e+00, 2.5960e-01, -8.8590e-01, 4.4257e-01, 2.7945e-01]], [[ 3.1064e+00, -1.0560e+00, -1.1522e+00, -1.5411e+00, -5.2352e-01, -4.7204e-01, -7.4924e-01, -4.7347e-01, -8.7182e-01, -1.2802e+00, -2.2487e+00, -1.8270e+00, -8.2146e-01]], [[ 2.9644e+00, -1.5330e+00, -2.1789e+00, -3.0595e+00, -2.6729e+00, -3.6774e-01, -1.1128e+00, -2.0473e+00, -2.2254e+00, -2.3398e+00, -2.7766e+00, -3.3470e+00, -2.8602e+00]], [[ 7.5569e-01, -1.2617e+00, -1.2981e+00, -1.4008e+00, -1.6937e+00, 6.0948e-01, 2.6473e-01, 6.7504e-02, 5.5299e-01, -1.9810e-01, -4.5244e+00, 1.0675e-02, -9.2919e-01]], [[ 1.6506e+00, -1.0799e+00, -1.2626e+00, -1.4048e+00, -1.1245e+00, -1.7640e+00, -2.0208e+00, -1.2183e+00, -1.3860e+00, -1.1925e+00, -2.0905e+00, -1.7936e+00, -2.1099e+00]], [[ 3.5471e+00, -1.3720e+00, -1.3517e+00, -3.1062e+00, -6.6997e-01, 5.7508e-01, 8.2996e-01, -2.0132e+00, -2.4295e+00, -1.8411e+00, -2.7336e+00, -3.1393e+00, -1.9888e+00]], [[ 3.2527e+00, -2.2577e+00, -2.1125e+00, -2.5838e+00, -2.0142e+00, -1.0473e+00, -1.4159e+00, -2.2824e+00, -2.4350e+00, -2.8845e+00, -2.9455e+00, -2.8787e+00, -1.4802e+00]], [[ 3.3064e+00, 3.4951e-01, -1.0533e+00, -9.3666e-01, -5.5983e-01, 6.3469e-01, -7.7058e-01, -3.8341e-01, -9.9836e-01, -1.6446e+00, -1.9749e+00, -1.6462e+00, -6.6930e-01]], [[-3.7241e+00, 1.9678e+00, 3.0022e+00, 2.2442e+00, 1.9926e+00, 2.5523e+00, 2.0959e+00, 2.3208e+00, 3.0344e+00, 2.9542e+00, -1.1752e+00, 3.2262e+00, 1.6370e+00]], [[ 3.7209e+00, -1.1016e+00, -1.2231e+00, -1.9479e+00, -1.0669e+00, -1.1786e+00, -1.4783e+00, -2.2311e+00, -2.1786e+00, -2.1293e+00, -1.7270e+00, -2.0996e+00, -1.6475e-02]], [[ 2.6100e+00, -1.3855e+00, -1.4086e+00, -1.0704e+00, -1.1238e+00, -8.1763e-01, -1.4903e+00, -5.2604e-01, -3.8117e-01, -1.1262e+00, -2.0358e+00, -1.3991e+00, 3.8709e-02]], [[ 2.8816e+00, -5.4192e-01, -1.5524e-01, -5.2535e-01, -5.9117e-01, 1.3937e+00, -3.9319e-01, -2.0989e-01, 6.1077e-01, 3.0363e-01, -5.1242e+00, 2.0251e-01, 1.6699e+00]]], [[[ 1.2954e+00, 1.3782e+00, 7.2446e-01, 8.8869e-01, 1.3545e+00, -1.8737e-02, 8.3043e-01, 1.1855e+00, 1.2991e+00, -4.1780e-01, 9.9229e-01, 1.4820e+00, 1.5337e+00]], [[ 3.8812e+00, -1.8538e+00, -1.8155e+00, -1.4897e+00, -1.7624e+00, -2.3532e+00, -8.7311e-01, -1.4525e+00, -1.7676e+00, -2.0751e+00, -2.0740e+00, -9.8148e-01, -1.1835e+00]], [[ 3.7696e+00, -1.3795e+00, -2.0253e+00, -2.1210e+00, -2.6127e+00, -1.8139e+00, -9.1113e-01, -1.4114e+00, -2.3996e+00, -1.4135e+00, -2.2028e+00, 4.4007e-01, -2.5922e+00]], [[ 1.5845e+00, -2.6511e+00, -2.8276e+00, -3.4059e+00, -3.9545e+00, -1.0993e+00, -7.4125e-01, -1.4029e+00, -3.9087e+00, -2.0366e+00, -1.0049e+00, -1.8427e+00, -1.2950e+00]], [[ 1.7428e+00, -1.5654e+00, -1.3533e+00, -1.5141e+00, -1.5769e+00, -2.8096e+00, -2.3753e+00, -1.3777e+00, -2.3558e+00, -2.9642e+00, -3.0192e+00, -1.2661e+00, -5.8481e-01]], [[ 3.9544e+00, -4.7783e-01, -1.6146e+00, -1.3848e+00, -7.1050e-01, -1.4543e+00, 1.3360e+00, -1.6862e-02, -6.7731e-01, -1.7313e+00, 3.7395e-01, -5.5156e-01, -1.7038e-01]], [[ 3.6943e+00, -2.5357e+00, -2.6108e+00, -1.8009e+00, -2.3577e+00, -2.6359e+00, -2.0293e+00, -2.5273e+00, -2.3218e+00, -2.5120e+00, -2.9690e+00, -2.4060e+00, -1.7331e+00]], [[ 4.5162e+00, -7.9262e-01, -1.2414e+00, -1.7349e+00, -9.9548e-01, -8.0956e-02, 3.4175e-01, -6.4100e-01, -1.3849e+00, -6.8238e-01, -1.1148e+00, 2.3806e-01, -1.4284e+00]], [[-4.5056e+00, 5.2411e+00, 6.4803e+00, 4.4153e+00, 5.3331e+00, 5.0254e+00, 5.2576e+00, 4.7127e+00, 5.1847e+00, 4.8639e+00, 3.5221e+00, 4.8975e+00, 4.8801e+00]], [[ 3.9041e+00, -1.5795e+00, -2.4534e+00, -1.5430e+00, -1.7209e+00, -1.4877e+00, 3.0064e-02, -9.2613e-01, -1.3727e+00, -6.7598e-01, -1.0795e+00, -6.6345e-01, -1.5610e+00]], [[ 3.0459e+00, -7.1506e-01, -1.0448e+00, -8.7751e-01, -8.8719e-01, 1.8231e-01, -5.0712e-02, 9.2395e-01, -4.8032e-01, -1.8873e+00, 3.1240e-02, 3.2999e-02, 1.3187e+00]], [[ 2.7716e+00, 5.2232e-01, -2.9384e-01, -8.1712e-01, -1.5314e+00, 3.3041e-01, 9.2604e-01, 1.3397e+00, -1.2087e+00, -6.7075e-01, 4.5103e-01, 1.6974e+00, 1.0705e+00]]], [[[ 2.5097e+00, 1.9311e+00, 3.5976e-01, 3.8287e-01, 6.6350e-01, 6.7807e-01, 3.2702e-01, 6.8250e-01, -3.9083e-01, 3.3600e-01, 1.4156e-01, 2.9544e-01, 2.7138e+00]], [[ 2.7726e+00, -1.9865e-01, -1.0565e+00, -8.9661e-01, -4.0249e-01, -2.9652e-01, -5.2602e-01, 6.8999e-02, -4.7124e-01, -1.1198e-01, 3.4601e-01, -1.5354e+00, 8.2905e-01]], [[ 2.4625e+00, -1.8100e-01, -1.8022e+00, -2.7379e+00, -2.3150e+00, -1.8608e-01, -7.2834e-01, -5.4371e-01, -1.9681e+00, -1.5478e+00, -1.3213e+00, -2.3333e+00, 3.7590e-01]], [[ 9.8991e-01, -1.2655e+00, -2.7640e+00, -3.1070e+00, -2.4838e+00, -2.2887e-01, 1.0846e-01, -6.3390e-01, -2.8957e+00, -2.9118e+00, -6.6336e-01, -9.2194e-01, -9.3906e-02]], [[ 1.9670e+00, -5.4046e-01, -6.2349e-01, -1.2566e+00, -8.8585e-01, -1.0360e+00, -2.2698e+00, -1.2498e+00, -1.6930e+00, -1.6747e+00, -2.2682e+00, -2.5710e+00, -6.9266e-01]], [[ 2.9187e+00, 1.9900e+00, 2.1096e-01, 1.9230e-01, -7.0402e-01, 1.2051e+00, 1.8494e+00, 1.6843e+00, 6.3355e-01, 8.8796e-01, 7.7061e-01, 1.3431e+00, 2.4710e+00]], [[ 2.8329e+00, -1.6724e+00, -2.4253e+00, -2.0015e+00, -2.0048e+00, -1.3405e-01, -1.6783e+00, -1.9230e+00, -2.0761e+00, -1.3539e+00, -1.2687e+00, -2.7029e+00, -1.5087e+00]], [[ 2.8245e+00, 6.6591e-01, -7.2110e-01, 1.9037e-01, 4.6118e-01, 2.3228e+00, 5.9095e-01, 1.3703e+00, 1.6094e+00, 9.4345e-01, 6.4174e-01, 8.4142e-02, 1.3645e+00]], [[-2.2651e+00, 5.3417e+00, 5.8347e+00, 4.2213e+00, 4.1150e+00, 4.2965e+00, 4.7982e+00, 5.6272e+00, 3.3746e+00, 2.7551e+00, 1.0899e+00, 2.6061e+00, 7.0535e+00]], [[ 2.9530e+00, -6.7727e-01, -1.9217e+00, -2.6564e+00, -2.7660e+00, 1.5121e-01, -4.3328e-01, -1.2381e+00, -1.0141e+00, -1.3037e+00, 2.9497e-01, -9.7000e-01, -5.6016e-01]], [[ 2.7590e+00, 1.1602e+00, 9.8519e-02, -6.2063e-01, -5.4009e-01, 2.1082e+00, 4.1200e-01, 1.1744e+00, 3.2344e-02, -6.3123e-02, 1.4859e-01, -6.0746e-01, 2.3912e+00]], [[ 2.5236e+00, 4.6681e-02, -1.2541e+00, -1.1114e+00, -1.3356e+00, 1.4921e+00, 6.6539e-01, -1.2058e-01, -9.5467e-01, -1.0198e+00, 6.6584e-01, -1.1396e+00, -5.1450e-01]]]]) attn_weights tensor([[[[-8.4191e-01, -2.7179e+00, -2.3755e+00, -2.1246e+00, -2.1412e+00, -2.9143e+00, -2.4080e+00, -3.0995e+00, -2.4414e+00, -2.0004e+00, -1.3506e+00, -1.9458e+00, -1.9830e+00, -2.7255e+00]], [[ 3.7216e+00, 9.6928e-01, 2.9042e+00, 3.1786e+00, 1.1464e+00, 8.1087e+00, 2.6464e-01, -1.7418e-01, 2.2451e+00, 2.7089e+00, 3.0768e+00, 5.6262e-01, 2.0644e+00, 8.0085e+00]], [[-1.1974e+00, -2.1886e+00, -1.8567e+00, -2.4048e+00, -2.4242e+00, -2.4410e+00, -2.0044e+00, -2.5293e+00, -2.0152e+00, -2.4852e+00, -1.2002e+00, -2.5108e+00, -2.3251e+00, -2.4428e+00]], [[ 1.4520e-02, -6.2286e+00, -5.6917e+00, -3.3892e+00, -5.4293e+00, 2.4777e-01, -2.7968e+00, -4.1519e+00, -3.0193e+00, -4.5723e-01, 1.5825e+00, -1.7541e+00, 2.1058e+00, 4.3521e+00]], [[ 4.0912e-01, -2.6616e+00, -3.6266e+00, -2.1320e+00, -2.5935e+00, -3.0769e-01, -1.2820e+00, -2.3057e+00, -2.6799e+00, -1.0362e+00, 1.1809e+00, -9.6005e-01, 9.1977e-01, 1.6079e+00]], [[ 8.7195e+00, 2.0668e+00, 3.9815e+00, 7.7584e-01, -6.5819e-01, 1.2166e+01, 2.9314e+00, -4.6219e-01, 2.5785e+00, -5.2818e-01, 4.3510e+00, -1.9831e+00, 1.3323e+00, 1.1763e+01]], [[-9.9195e-02, -2.8483e+00, -3.8890e+00, -2.9044e+00, -3.4096e+00, -1.2540e+00, -1.0297e+00, -3.3938e+00, -4.2025e+00, -2.9932e+00, -1.5296e+00, -3.4918e+00, -2.1968e+00, -1.0999e+00]], [[-4.1104e+00, -5.5855e+00, -5.4655e+00, -5.0307e+00, -4.8792e+00, -5.5207e+00, -5.0854e+00, -3.8169e+00, -3.7489e+00, -3.1953e+00, -8.8843e-01, -2.6999e+00, -2.5086e+00, -3.0005e+00]], [[-2.0953e+00, -2.4687e+00, -2.8106e+00, -3.2781e+00, -2.6768e+00, -3.4140e+00, -1.9773e+00, -2.5197e+00, -2.7690e+00, -3.2447e+00, -2.3997e+00, -2.5333e+00, -2.8637e+00, -3.2640e+00]], [[-1.9532e+00, -2.2649e+00, -2.4014e+00, -2.6543e+00, -2.5477e+00, -3.9869e+00, -2.3709e+00, -2.4146e+00, -2.4914e+00, -2.6581e+00, -2.6145e+00, -2.5003e+00, -2.5682e+00, -3.9520e+00]], [[ 9.7088e-01, 4.8423e-01, 4.9341e-01, 2.2952e-01, 2.3550e-01, 1.8129e+00, -3.9829e-01, 3.7177e-01, 2.9689e-01, 1.1557e-02, 5.9685e-01, 2.5550e-02, 1.4071e-01, 1.7097e+00]], [[-1.3234e+00, -2.0736e+00, -3.5085e+00, -2.2504e+00, -2.2687e+00, -2.6940e+00, -2.8280e+00, -2.1462e+00, -3.6921e+00, -2.2671e+00, -2.6107e+00, -2.2537e+00, -2.4502e+00, -2.6880e+00]]], [[[-7.8273e-01, -2.6602e+00, -1.7064e+00, -1.1548e+00, -2.6672e+00, -2.6314e+00, -2.8906e+00, -2.8301e+00, -2.5822e+00, -1.4878e+00, -8.2750e-01, -1.5593e+00, -2.7636e+00, -2.7873e+00]], [[ 2.3330e-01, 1.5016e+00, 1.7207e+00, 2.2654e+00, 1.9103e+00, -1.7225e+00, -7.9485e-01, 5.8024e-01, 6.7355e-01, 1.0484e+00, 1.7964e+00, 2.1247e-01, 1.6217e+00, 7.1659e+00]], [[-1.4308e+00, -2.4727e+00, -2.4607e+00, -2.2802e+00, -2.7713e+00, -2.8236e+00, -2.7688e+00, -2.7336e+00, -2.2570e+00, -2.6100e+00, -2.3256e+00, -1.7370e+00, -1.0742e+00, -2.7622e+00]], [[-4.8028e+00, -8.5288e+00, -9.9921e+00, -7.4792e+00, -7.1009e+00, -9.5594e+00, -6.6627e+00, -5.3043e+00, -4.5863e+00, -4.9883e+00, -2.2270e+00, -2.8852e+00, -1.2964e+00, 1.0821e+00]], [[-7.8820e-01, -3.1186e+00, -3.0356e+00, -1.2472e+00, -2.7106e+00, -3.2769e+00, -1.4824e+00, -1.8786e+00, -1.1799e+00, -1.2264e+00, 7.6663e-01, 3.9379e-01, 4.8271e-01, 1.9837e+00]], [[ 3.9039e+00, 3.4324e+00, 3.0097e+00, 3.0576e+00, 3.1049e+00, 1.4835e+00, 1.4303e-01, 1.5126e+00, 6.0869e-01, 1.6365e+00, 2.0366e+00, -5.2925e-01, 1.4787e+00, 8.7145e+00]], [[-4.1095e-01, -3.6150e+00, -3.3351e+00, -1.9642e+00, -3.8308e+00, -1.4410e+00, -1.4126e+00, -3.8888e+00, -3.6167e+00, -3.2727e+00, -1.6981e+00, -1.4123e+00, -3.3020e+00, -3.1562e+00]], [[-5.6010e+00, -7.1622e+00, -6.9472e+00, -7.3660e+00, -6.3890e+00, -7.1317e+00, -6.8337e+00, -5.2278e+00, -4.7247e+00, -4.2916e+00, -4.7424e+00, -3.6460e+00, -3.0970e+00, -3.5462e+00]], [[-2.6703e+00, -2.0906e+00, -2.1068e+00, -3.0132e+00, -1.9808e+00, -3.0423e+00, -3.1454e+00, -1.4824e+00, -1.2714e+00, -1.6078e+00, -2.6140e+00, -2.8218e+00, -8.5750e-01, -1.8089e+00]], [[-1.6968e+00, -2.0018e+00, -2.0749e+00, -2.6058e+00, -2.1812e+00, -2.4862e+00, -2.7786e+00, -2.0646e+00, -1.9281e+00, -2.0727e+00, -2.5539e+00, -2.1279e+00, -1.7392e+00, -2.3015e+00]], [[ 7.0716e-01, 4.2077e-01, 3.7206e-01, 1.2373e-01, 3.4754e-01, -5.1357e-01, -6.0776e-01, 2.7774e-01, 4.2184e-01, 1.7208e-01, -3.8991e-02, -1.3281e-01, 5.1810e-01, 1.3750e+00]], [[-1.4316e+00, -2.1811e+00, -3.3929e+00, -2.3325e+00, -2.9625e+00, -2.6013e+00, -2.2530e+00, -2.3187e+00, -2.0755e+00, -3.6817e+00, -2.4252e+00, -2.4158e+00, -2.4058e+00, -2.6340e+00]]], [[[-7.9532e-01, -2.1080e+00, -1.2961e+00, -1.3690e+00, -2.3697e+00, -1.6948e+00, -1.6372e+00, -2.1918e+00, -2.0397e+00, -1.0974e+00, -1.2841e+00, -1.7087e+00, -1.8353e+00, -1.7912e+00]], [[ 1.6180e+00, 1.0902e+00, 2.8816e+00, 2.0939e-01, 2.8091e+00, 5.6161e-01, -1.1527e+00, -8.1776e-02, 4.0400e+00, 2.3301e+00, 1.4072e+00, -8.4246e-01, -5.3309e-01, 9.0321e+00]], [[-1.5525e+00, -1.8327e+00, -2.3090e+00, -2.2006e+00, -2.4577e+00, -2.4584e+00, -2.4965e+00, -2.0708e+00, -2.0178e+00, -2.4629e+00, -2.4624e+00, -2.3137e+00, -2.1748e+00, -2.9075e+00]], [[-2.1467e+00, -7.0657e+00, -8.1992e+00, -5.2331e+00, -6.1632e+00, -5.0072e+00, -4.0980e+00, -4.6778e+00, -1.1659e+00, -4.3108e+00, -1.9022e+00, -9.5929e-01, -5.6384e-01, 3.7208e+00]], [[-1.0706e+00, -3.1216e+00, -2.9965e+00, -1.9260e+00, -1.9823e+00, -2.5503e+00, -1.5276e+00, -2.0213e+00, -2.9783e-01, -1.1719e+00, -1.6753e-01, -8.5872e-01, 6.8832e-01, 1.2765e+00]], [[ 7.7910e+00, 3.5002e+00, 4.8535e+00, 3.3257e+00, 1.4427e+00, 2.8607e+00, -6.5525e-01, 7.4160e-01, 4.6479e+00, 3.0785e+00, 1.7917e+00, 9.7855e-01, 6.6386e-01, 1.1135e+01]], [[ 1.1580e-01, -2.4715e+00, -2.6147e+00, -1.0960e+00, -2.0439e+00, -6.9653e-01, -6.9100e-01, -2.6511e+00, -1.3681e+00, -2.5722e+00, -5.8727e-01, -1.2018e+00, -1.0729e+00, -6.9838e-01]], [[-5.3913e+00, -6.7227e+00, -6.7842e+00, -6.8064e+00, -6.2457e+00, -8.0661e+00, -6.3993e+00, -5.3097e+00, -5.0849e+00, -4.5091e+00, -4.6972e+00, -3.6750e+00, -3.6576e+00, -4.0676e+00]], [[-2.5136e+00, -2.3156e+00, -2.4183e+00, -2.8975e+00, -1.6288e+00, -3.2206e+00, -3.1793e+00, -1.9008e+00, -2.4223e+00, -2.0570e+00, -2.4595e+00, -2.8189e+00, -2.3590e+00, -2.9956e+00]], [[-1.7823e+00, -2.1458e+00, -2.2401e+00, -2.7980e+00, -2.2692e+00, -2.8357e+00, -2.9668e+00, -2.2794e+00, -2.0973e+00, -2.2706e+00, -2.6774e+00, -2.6347e+00, -2.5186e+00, -2.3713e+00]], [[ 6.3180e-01, 3.4198e-01, 2.0592e-01, -3.4291e-01, 4.2633e-01, -5.7810e-01, -9.3381e-01, 8.2107e-02, 3.1625e-01, -7.6014e-02, -2.6356e-01, -4.9101e-01, -7.8238e-01, 1.3951e+00]], [[-1.3085e+00, -2.2230e+00, -3.5171e+00, -2.2364e+00, -3.0427e+00, -2.4090e+00, -2.0894e+00, -2.1516e+00, -1.9222e+00, -3.6649e+00, -2.1597e+00, -1.9027e+00, -2.2619e+00, -2.3216e+00]]], [[[-8.6695e-01, -3.2442e+00, -1.6906e+00, -1.8006e+00, -3.6106e+00, -2.5889e+00, -2.3190e+00, -3.3960e+00, -3.5281e+00, -2.3171e+00, -2.1350e+00, -2.6180e+00, -1.1828e+00, -3.2929e+00]], [[-1.0564e+00, 1.2284e+00, -2.1423e+00, 2.3100e+00, -3.0755e+00, -3.3075e+00, -2.1469e+00, 6.8376e-01, -3.5002e+00, -2.2794e+00, -2.3639e+00, -2.1633e+00, -2.0342e+00, 5.3132e+00]], [[-1.8726e+00, -2.7073e+00, -2.5066e+00, -1.6708e+00, -3.5566e+00, -2.7774e+00, -3.2613e+00, -2.9028e+00, -3.6478e+00, -3.3882e+00, -3.2641e+00, -2.1970e+00, -2.7463e+00, -2.6559e+00]], [[-2.6544e+00, -4.9744e+00, -4.8361e+00, -4.2138e+00, -5.1377e+00, -4.9774e+00, -6.2358e+00, -1.6995e+00, -2.4377e+00, -3.7999e+00, -3.7416e+00, 3.8838e-01, 4.8326e+00, 3.0501e+00]], [[-7.0057e-01, -2.7646e+00, -2.9668e+00, -2.2438e+00, -2.7411e+00, -2.3493e+00, -1.3569e+00, -1.9723e+00, -1.7859e+00, -1.5677e+00, -2.9990e-01, -1.1562e+00, 4.3715e-01, 8.0987e-01]], [[ 3.2479e+00, 2.8196e+00, 3.5035e+00, 5.0336e+00, 3.4672e+00, 4.3171e-02, 6.5493e-01, 1.6843e+00, 3.1032e+00, 4.6480e-01, 3.5506e-01, 1.4682e+00, 3.1334e+00, 6.1851e+00]], [[-1.0350e+00, -4.4015e+00, -4.3705e+00, -2.7749e+00, -4.5187e+00, -2.1157e+00, -1.9088e+00, -4.5855e+00, -4.4232e+00, -1.4475e+00, -1.7057e+00, -2.1931e+00, -3.5408e+00, -3.8191e+00]], [[-6.1140e+00, -7.7689e+00, -7.6910e+00, -7.5195e+00, -7.2388e+00, -7.6091e+00, -6.8627e+00, -5.8684e+00, -5.6627e+00, -5.6021e+00, -5.2860e+00, -3.7460e+00, -3.4303e+00, -4.3331e+00]], [[-3.1042e+00, -2.1542e+00, -3.5858e+00, -3.3855e+00, -2.3429e+00, -4.5800e+00, -4.3593e+00, -1.6746e+00, -2.1992e+00, -3.4669e+00, -4.2627e+00, -3.4246e+00, -3.1920e+00, -3.5843e-01]], [[-1.7143e+00, -2.0593e+00, -2.1445e+00, -2.6324e+00, -2.3065e+00, -2.6650e+00, -2.6858e+00, -2.1977e+00, -2.3012e+00, -2.7147e+00, -2.6353e+00, -2.0017e+00, -1.9713e+00, -2.1289e+00]], [[ 4.7482e-01, 3.3403e-01, 1.6457e-01, 7.8629e-02, 6.1844e-02, -7.0292e-01, -4.3225e-01, 1.5261e-01, -4.6525e-02, -6.5993e-01, -5.1462e-01, -3.5388e-01, 7.3105e-02, 4.4860e-01]], [[-1.4838e+00, -2.0472e+00, -3.4656e+00, -2.2391e+00, -2.7012e+00, -2.4078e+00, -2.0590e+00, -2.0695e+00, -2.7284e+00, -1.9963e+00, -2.0366e+00, -2.3631e+00, -2.9285e+00, -2.8533e+00]]], [[[-7.0926e-01, -3.7033e+00, -1.5594e+00, -2.6674e+00, -3.4433e+00, -2.8105e+00, -3.3527e+00, -4.1305e+00, -3.6126e+00, -3.0383e+00, -2.2732e+00, -3.1970e+00, -3.9964e+00, -3.5867e+00]], [[-7.9039e-01, 1.0444e+00, -8.6073e-01, -2.7699e+00, -1.0552e+00, -3.6896e+00, -3.3681e+00, 8.7186e-01, -1.6334e+00, -1.8165e+00, -2.9404e+00, -3.5546e+00, 1.3149e+00, 4.7347e+00]], [[-1.3061e+00, -2.3984e+00, -1.3471e+00, -9.6375e-01, -3.4829e+00, -2.9871e+00, -2.9644e+00, -2.4862e+00, -2.4411e+00, -3.4971e+00, -3.0398e+00, -2.9325e+00, -1.8264e+00, -3.1748e+00]], [[-3.1974e+00, -5.3720e+00, -5.4480e+00, -5.7599e+00, -5.2552e+00, -5.5400e+00, -6.7219e+00, -3.1093e+00, -3.2987e+00, -2.1961e+00, -3.0123e+00, -3.8098e+00, -1.4874e+00, 1.7757e-01]], [[-3.2652e-01, -2.1267e+00, -1.2652e+00, -9.4080e-01, -1.2665e+00, -1.8746e+00, -1.5826e+00, -1.1886e+00, 3.3783e-02, 3.4545e-01, -3.2105e-02, -1.9018e-01, 2.4413e-01, 1.5776e+00]], [[ 2.1536e+00, 2.7200e+00, 1.4537e+00, -1.3092e+00, 5.4888e-01, -1.6302e-02, -2.1844e+00, 1.4059e+00, 4.0742e-01, -1.3556e+00, -1.5785e+00, -2.5889e+00, 1.6504e+00, 8.9482e+00]], [[ 4.7703e-01, -4.0010e+00, -2.9747e+00, -2.2354e+00, -4.1924e+00, -9.9942e-01, -9.5578e-01, -4.5883e+00, -3.4022e+00, -3.8288e+00, -7.7300e-01, -8.0296e-01, -4.7170e+00, -4.5360e+00]], [[-5.2749e+00, -6.7165e+00, -6.4453e+00, -6.2051e+00, -6.2297e+00, -6.2476e+00, -5.9473e+00, -4.8366e+00, -4.5711e+00, -4.2112e+00, -4.4575e+00, -3.9648e+00, -1.6604e+00, -2.5524e+00]], [[-2.4841e+00, -1.1134e+00, -2.1527e+00, -3.6141e+00, -1.5015e+00, -3.8632e+00, -3.2695e+00, -9.2502e-01, -2.5965e+00, -1.8972e+00, -3.4563e+00, -3.1345e+00, -6.3987e-01, -4.1285e-01]], [[-1.0743e+00, -1.3553e+00, -1.2777e+00, -1.7832e+00, -1.5205e+00, -2.0046e+00, -2.1476e+00, -1.5004e+00, -1.6419e+00, -1.5950e+00, -2.0499e+00, -2.0993e+00, -1.3243e+00, -1.0135e+00]], [[ 6.3062e-01, 2.9443e-01, 3.3622e-01, -1.1702e-01, 1.0850e-01, -3.5684e-01, -7.2071e-01, 2.3818e-01, -2.9388e-02, -8.5756e-02, -4.0938e-01, -7.7977e-01, 3.5546e-01, 4.4624e-01]], [[-1.1162e+00, -2.1820e+00, -3.2431e+00, -2.3157e+00, -2.4392e+00, -2.3086e+00, -1.8949e+00, -2.1162e+00, -2.2630e+00, -2.4232e+00, -2.0949e+00, -1.8932e+00, -1.9356e+00, -1.6602e+00]]]]) attn_weights tensor([[[[-1.1273e+00, -2.5843e+00, -3.1912e+00, -2.7960e+00, -1.2454e+00, -1.6930e+00, -2.6671e-01, -9.7264e-01, -1.8079e+00, -1.4694e+00, -1.0556e-03, 9.1690e-01, 1.0171e+00, 1.4516e-01]], [[-9.8871e-01, -2.4393e+00, -2.7597e+00, -2.6024e+00, -2.5633e+00, -3.0613e+00, -2.0447e+00, -4.4976e-01, -1.0396e+00, -9.9389e-01, -1.2688e+00, -4.8293e-01, -5.5338e-01, -1.1301e+00]], [[-2.9616e+00, -3.8487e+00, -3.5359e+00, -3.8751e+00, -3.3320e+00, -3.5936e+00, -3.1688e+00, -2.5641e+00, -2.8363e+00, -3.2078e+00, -2.6891e+00, -2.6675e+00, -2.8952e+00, -2.6768e+00]], [[ 9.5294e-02, -3.0835e+00, -2.9234e+00, -2.9645e+00, -2.8907e+00, -2.7314e+00, -2.4512e+00, -2.3588e+00, -2.3991e+00, -2.5082e+00, -2.1149e+00, -2.3428e+00, -2.2881e+00, -2.1224e+00]], [[-5.5354e-01, -2.3919e+00, -2.7359e+00, -2.6834e+00, -2.5941e+00, -2.2014e+00, -2.1239e+00, -2.1167e+00, -2.3626e+00, -2.2942e+00, -1.7620e+00, -2.0911e+00, -1.9147e+00, -1.6044e+00]], [[-7.6720e-01, -4.7044e-01, -3.1273e+00, -2.8720e+00, -1.2972e+00, -1.0055e+00, -2.2554e+00, -5.8812e-01, -3.2225e+00, -3.1248e+00, -1.7323e+00, -1.2629e+00, -1.9173e+00, -1.0355e+00]], [[ 1.8175e+00, 7.3984e-01, -1.0638e+00, -1.1522e+00, -2.7129e-01, 6.3372e-02, -2.4021e+00, 4.2707e-01, -1.4046e+00, -1.6161e+00, 5.1590e-01, -2.7901e-01, -1.0211e+00, -8.6629e-01]], [[-5.4581e-01, -2.1276e+00, -2.6215e+00, -2.7894e+00, -2.9204e+00, -2.7533e+00, -1.0360e+00, -1.8220e+00, -2.5657e+00, -2.8565e+00, -2.0686e+00, -2.6115e+00, -2.4083e+00, -2.5592e+00]], [[-1.0271e+00, -1.8648e+00, -2.1951e+00, -2.5894e+00, -2.0398e+00, -2.7118e+00, -2.8933e+00, -1.8671e+00, -2.0336e+00, -2.4182e+00, -2.4624e+00, -1.8969e+00, -2.2705e+00, -2.2410e+00]], [[ 1.2377e+00, -5.6757e-01, -4.9089e-01, -9.3096e-01, 1.5919e-01, -1.3227e+00, -1.8076e+00, -6.6645e-01, -3.3189e-01, -6.7592e-01, -1.3001e+00, 2.6074e-01, -2.2820e-01, -5.3847e-01]], [[-5.0179e+00, -2.0412e+00, -1.9476e+00, -1.9815e+00, -1.9553e+00, -1.5843e+00, -1.3790e+00, -1.4789e+00, -1.3898e+00, -1.4572e+00, -8.1833e-01, -1.3208e+00, -1.1546e+00, -8.7513e-01]], [[-2.8944e+00, -2.6545e+00, -6.6529e+00, -6.0097e+00, -5.5874e+00, -2.4753e-01, -4.7518e+00, -1.7800e+00, -5.9757e+00, -5.2142e+00, -2.2421e+00, -4.7483e+00, -4.9414e+00, 3.2620e-01]]], [[[-2.2723e+00, -4.5400e+00, -3.7965e+00, -3.9950e+00, -3.7183e+00, -4.4984e+00, -4.4297e+00, -2.1657e+00, -2.3085e+00, -1.4574e+00, -1.7166e+00, 2.8130e-01, 6.3949e-01, -1.8182e+00]], [[-2.9258e-01, -1.6441e+00, -1.9893e+00, -1.9446e+00, -1.6822e+00, -1.9851e+00, -1.8098e+00, 9.4447e-02, -4.6849e-02, -5.9762e-02, -5.4342e-02, -1.0850e-01, 5.0419e-01, 1.7940e-03]], [[-3.2138e+00, -4.0514e+00, -3.7879e+00, -4.0549e+00, -3.4637e+00, -3.7976e+00, -3.3673e+00, -2.6970e+00, -2.8638e+00, -2.9547e+00, -3.2116e+00, -3.0148e+00, -2.5301e+00, -2.6698e+00]], [[ 1.6995e-02, -3.2881e+00, -3.1667e+00, -3.1309e+00, -3.0664e+00, -2.8679e+00, -2.6497e+00, -2.4951e+00, -2.5086e+00, -2.4734e+00, -2.5025e+00, -2.3972e+00, -2.2188e+00, -2.1945e+00]], [[-5.4947e-01, -2.5035e+00, -2.7950e+00, -2.6381e+00, -2.5608e+00, -2.2419e+00, -2.1312e+00, -2.0450e+00, -2.1488e+00, -2.1204e+00, -1.9842e+00, -1.5939e+00, -1.6554e+00, -1.4767e+00]], [[ 1.2525e+00, 5.2607e-01, -5.7173e-01, 2.2473e-01, -3.0279e-02, -2.1348e+00, -2.5219e+00, 3.8563e-01, -1.1397e-01, -1.0687e+00, -2.6486e-01, -4.9582e-01, 2.8051e-01, 3.4772e-01]], [[ 1.6002e+00, -1.1053e+00, -7.9836e-01, -9.2446e-01, -7.0344e-01, -1.1706e+00, -8.3976e-01, -1.2464e+00, -8.4363e-01, -1.2880e+00, -1.5066e+00, -5.4893e-01, -9.2292e-01, -1.1827e+00]], [[ 4.3657e-01, -1.4855e+00, -1.9053e+00, -1.5449e+00, -1.9158e+00, -1.0081e+00, -1.0104e+00, -1.1942e+00, -1.4671e+00, -1.9474e+00, -1.6112e+00, -1.2576e+00, -1.0849e+00, -1.3354e+00]], [[-5.7771e-01, -1.5294e+00, -1.9613e+00, -1.9847e+00, -1.6825e+00, -2.3363e+00, -2.4984e+00, -1.6013e+00, -1.8535e+00, -1.9081e+00, -1.8811e+00, -2.2460e+00, -1.7383e+00, -1.8180e+00]], [[ 1.3401e+00, -4.7985e-01, 1.9834e-02, -4.1088e-01, 4.2941e-01, -1.0390e+00, -1.0935e+00, -8.4090e-01, -6.8725e-01, -1.3740e-01, -4.5964e-01, -3.7105e-01, -5.4051e-01, -2.1444e-01]], [[-4.9558e+00, -2.4856e+00, -2.3598e+00, -2.2650e+00, -2.2656e+00, -1.8794e+00, -1.6630e+00, -1.7507e+00, -1.7510e+00, -1.5855e+00, -1.5383e+00, -1.2777e+00, -1.2843e+00, -1.1743e+00]], [[ 1.0192e+00, 1.6919e-01, -3.1131e+00, 2.6559e-01, -9.5607e-01, -3.0285e+00, -4.5056e+00, 4.2422e-01, 4.5849e-02, -3.1209e+00, 5.1503e-01, -2.7442e+00, 5.1756e-01, 3.8945e+00]]], [[[-1.5949e+00, -3.1349e+00, -4.1910e+00, -2.6812e+00, -2.1056e+00, -3.5745e+00, -2.9617e+00, -8.4381e-01, 1.4556e+00, -1.7076e+00, 4.5763e-01, 1.5000e+00, 1.8265e-01, -1.5585e+00]], [[-7.8868e-01, -1.8602e+00, -2.4510e+00, -2.4804e+00, -1.8028e+00, -2.0634e+00, -1.8151e+00, 5.0611e-02, -5.4798e-01, -2.5086e-01, -1.0004e+00, -4.7930e-01, 3.9189e-01, -1.5811e-01]], [[-3.1547e+00, -3.9572e+00, -3.7615e+00, -4.0929e+00, -3.4674e+00, -3.6378e+00, -3.3159e+00, -2.6722e+00, -3.1350e+00, -2.9083e+00, -3.5906e+00, -3.4938e+00, -2.7905e+00, -3.0014e+00]], [[-5.7761e-02, -3.3478e+00, -3.2389e+00, -3.2805e+00, -3.1178e+00, -2.8233e+00, -2.6688e+00, -2.4985e+00, -2.6074e+00, -2.4844e+00, -2.8205e+00, -2.8114e+00, -2.2772e+00, -2.3612e+00]], [[-7.4355e-01, -2.6876e+00, -2.9373e+00, -2.8944e+00, -2.7248e+00, -2.2450e+00, -2.1880e+00, -2.2084e+00, -2.2990e+00, -2.3117e+00, -2.5320e+00, -2.4462e+00, -1.7045e+00, -1.8108e+00]], [[ 2.2582e+00, 1.7864e+00, -5.2471e-01, 7.3636e-01, 9.5948e-01, -1.0700e+00, -1.5064e+00, 1.8457e+00, 1.9931e+00, -8.3018e-01, 5.8376e-01, 2.2918e+00, 1.5503e-01, 1.1589e+00]], [[ 1.5110e+00, -3.0999e-01, -8.0245e-01, -7.5075e-01, 1.5072e-01, -1.8550e+00, -5.5648e-01, -3.9837e-01, -6.9893e-01, -1.1734e+00, -1.1524e+00, -3.0163e-01, -4.1910e-01, -9.7321e-01]], [[ 9.9109e-01, -1.0368e+00, -1.6572e+00, -1.3195e+00, -1.5426e+00, -8.8179e-01, -9.3660e-01, -7.7454e-01, -1.4446e+00, -1.7298e+00, -1.6854e+00, -1.0293e+00, -8.3904e-01, -1.4133e+00]], [[-1.1754e+00, -2.3521e+00, -2.8274e+00, -2.9614e+00, -2.4538e+00, -3.1021e+00, -3.1762e+00, -2.3572e+00, -2.6801e+00, -2.7567e+00, -2.8486e+00, -2.6841e+00, -2.5378e+00, -2.8446e+00]], [[ 1.1782e+00, -7.5502e-01, -1.4988e-01, -1.0290e+00, 1.9615e-01, -1.1303e+00, -1.1887e+00, -8.5340e-01, -3.1394e-01, -6.4921e-02, -8.1310e-01, -3.3067e-01, -4.6347e-01, -4.6602e-01]], [[-5.1071e+00, -2.4489e+00, -2.3580e+00, -2.4183e+00, -2.2927e+00, -1.8441e+00, -1.6345e+00, -1.7653e+00, -1.7049e+00, -1.5840e+00, -1.9874e+00, -1.8880e+00, -1.2042e+00, -1.3327e+00]], [[ 1.7986e+00, 1.5108e+00, -2.2757e+00, -1.9474e+00, -1.6730e+00, -2.0116e+00, -3.3593e+00, 1.5406e+00, -3.1619e-01, -2.5819e+00, -1.0508e+00, -1.4336e+00, -1.7313e+00, 4.6290e+00]]], [[[-2.4975e+00, -4.2137e+00, -3.5942e+00, -3.9009e+00, -2.3300e+00, -3.2737e+00, -3.2670e+00, -2.1438e+00, -5.1583e-01, -2.4544e+00, -2.5902e+00, -1.7768e+00, 1.7433e+00, -7.3633e-01]], [[-1.0597e+00, -2.0408e+00, -2.7225e+00, -3.2679e+00, -2.4237e+00, -2.4989e+00, -2.1128e+00, -5.3322e-01, -1.2638e+00, -1.6147e+00, -1.0285e+00, 7.0319e-01, 4.8666e-01, 2.6931e-02]], [[-3.1508e+00, -3.9519e+00, -3.6455e+00, -3.9367e+00, -3.4108e+00, -3.6995e+00, -3.2680e+00, -2.7022e+00, -2.9878e+00, -3.3237e+00, -2.8347e+00, -2.4684e+00, -2.6449e+00, -2.4254e+00]], [[ 9.4197e-02, -3.2171e+00, -3.0939e+00, -3.0919e+00, -2.9655e+00, -2.8158e+00, -2.6047e+00, -2.4996e+00, -2.6233e+00, -2.5395e+00, -2.2879e+00, -1.9294e+00, -2.1465e+00, -2.0563e+00]], [[-5.9687e-01, -2.4699e+00, -2.7150e+00, -2.6200e+00, -2.5613e+00, -2.2167e+00, -2.1189e+00, -2.1324e+00, -2.2133e+00, -1.7773e+00, -1.7616e+00, -1.6815e+00, -1.6613e+00, -1.5670e+00]], [[ 1.2814e+00, 4.1611e-01, -1.1895e-01, 1.5223e+00, 3.8428e-03, -2.8859e+00, -2.5474e+00, 2.9298e-01, -1.8893e-01, -3.1052e+00, -3.2135e+00, -1.5988e+00, -4.1913e-01, 2.0479e+00]], [[ 2.4594e+00, 1.0912e-01, 1.1752e-01, -2.6310e-01, 8.2168e-01, -9.0848e-01, -1.1113e+00, -1.3955e-01, 4.1966e-01, -1.8926e+00, -1.8640e+00, 8.8556e-01, 1.8476e-01, 2.7455e-01]], [[ 7.2232e-01, -1.1760e+00, -1.3489e+00, -8.0122e-01, -1.3581e+00, -1.3115e+00, -1.2933e+00, -9.0186e-01, -1.3480e+00, -1.4551e+00, -1.6509e+00, -3.0005e-01, -1.0868e+00, 7.7690e-02]], [[-3.2976e-01, -1.1706e+00, -2.1028e+00, -1.7402e+00, -1.3416e+00, -1.8743e+00, -2.0585e+00, -1.3240e+00, -1.3293e+00, -2.3756e+00, -1.9370e+00, -1.3799e+00, -1.8790e+00, -1.1156e+00]], [[ 1.3979e+00, -3.9981e-01, 1.7703e-02, -4.4197e-01, 2.1594e-01, -1.1630e+00, -1.1822e+00, -7.1697e-01, 2.9968e-01, -1.6877e+00, -1.0714e+00, 1.0026e-01, 3.8666e-01, 1.9012e-01]], [[-5.0130e+00, -2.2973e+00, -2.1979e+00, -2.1529e+00, -2.1468e+00, -1.7963e+00, -1.5931e+00, -1.6751e+00, -1.7601e+00, -1.4047e+00, -1.1903e+00, -9.2445e-01, -1.0186e+00, -1.0576e+00]], [[ 7.7484e-01, -2.6175e-01, -2.4633e+00, 1.9732e+00, -2.1127e+00, -2.7575e+00, -4.3670e+00, -4.6609e-02, -2.2161e+00, -4.3713e+00, -4.5673e+00, -7.5293e-01, -1.2301e+00, 3.8740e+00]]], [[[ 2.9509e-01, -1.2715e+00, -1.1599e+00, -1.1284e+00, -1.0154e+00, -9.4166e-01, -9.6449e-01, -4.0644e-01, -5.1600e-02, 1.5968e-01, -4.9275e-01, -3.8997e-01, 9.3244e-01, 9.0488e-01]], [[ 4.8604e-01, -7.4882e-01, -1.4129e+00, -1.7309e+00, -1.0692e+00, -1.4011e+00, -8.2917e-01, 5.4120e-02, -8.7706e-01, -1.6212e-01, -2.1211e-01, -1.4442e-01, 2.1167e+00, 1.3498e+00]], [[-2.8877e+00, -3.8901e+00, -3.4389e+00, -3.7943e+00, -3.1971e+00, -3.5423e+00, -3.1265e+00, -2.5517e+00, -3.0805e+00, -2.7313e+00, -2.7604e+00, -2.5514e+00, -2.0754e+00, -2.1670e+00]], [[ 3.1780e-01, -2.9173e+00, -2.7690e+00, -2.8275e+00, -2.7410e+00, -2.5887e+00, -2.4487e+00, -2.3562e+00, -2.6170e+00, -2.4272e+00, -2.1552e+00, -2.1033e+00, -1.7199e+00, -1.7744e+00]], [[-3.2935e-01, -2.3109e+00, -2.4268e+00, -2.4883e+00, -2.4111e+00, -1.9404e+00, -1.7686e+00, -2.0915e+00, -2.1141e+00, -1.9579e+00, -1.3028e+00, -1.2358e+00, -1.5026e+00, -1.2295e+00]], [[ 2.0203e+00, -6.5020e-02, -6.5680e-01, -2.2171e+00, 9.9054e-01, -1.2933e+00, -2.3145e+00, -7.0418e-01, -1.7619e+00, 7.5535e-01, -1.3671e+00, -2.7826e+00, -2.9103e-01, 3.3635e+00]], [[ 2.0997e+00, -1.9662e-01, -7.2600e-01, -7.1014e-01, -1.5170e+00, -1.1823e+00, -8.6355e-01, -6.8328e-01, -1.9128e+00, -1.7523e+00, -5.9901e-01, -1.2054e+00, 9.0431e-01, 7.5113e-01]], [[ 6.9023e-01, -2.0994e+00, -9.0195e-01, -1.0525e+00, -1.9110e+00, -1.0792e+00, -6.2404e-01, -1.6741e+00, -1.6315e+00, -1.6722e+00, -7.6270e-01, -9.3039e-01, -1.2866e+00, -1.5199e+00]], [[ 1.2410e+00, 6.8845e-01, 2.9470e-01, 2.8389e-01, 4.7461e-01, 1.5851e-01, -9.6423e-02, 4.0179e-01, 3.8527e-01, 4.4614e-01, 1.0700e-01, -1.1478e-01, 7.0880e-01, 8.4807e-01]], [[ 1.6984e+00, -3.5601e-01, 1.4094e-01, 2.8400e-03, 4.3074e-01, -4.8132e-01, -4.3133e-01, -7.9727e-01, -2.7727e-02, 4.5523e-01, -6.7164e-01, -2.0858e-01, -5.7412e-01, 4.2712e-02]], [[-5.1028e+00, -2.0751e+00, -1.9435e+00, -2.0062e+00, -1.9690e+00, -1.6107e+00, -1.4153e+00, -1.5200e+00, -1.6114e+00, -1.5184e+00, -9.7985e-01, -9.6681e-01, -8.0252e-01, -8.6424e-01]], [[ 1.0317e+00, -2.0372e-03, -1.3802e+00, -1.0732e+00, -2.7182e-01, -1.6517e+00, -1.2063e+00, -4.4461e-01, -1.9183e+00, -7.2386e-01, -2.3682e+00, -1.8792e+00, 2.8889e-01, 1.3098e+00]]]]) attn_weights tensor([[[[-1.4909e+00, -4.6206e+00, -3.8373e+00, -5.0991e+00, -4.5840e+00, -5.7058e+00, -4.3227e+00, -3.3584e+00, -2.2473e+00, -3.5564e+00, -2.7710e+00, -2.3432e+00, -1.0957e+00, -3.6287e+00]], [[ 1.4034e+00, -1.8375e+00, -3.0239e+00, -2.1007e+00, -2.2409e+00, -1.3619e+00, -4.7862e-01, -1.4559e+00, -3.4433e+00, -2.4804e+00, -8.5491e-01, -1.9924e+00, -1.9848e+00, -1.6211e+00]], [[-6.6266e+00, -1.2775e+01, -1.3803e+01, -1.3362e+01, -1.1922e+01, -1.2295e+01, -9.3522e+00, -8.1831e+00, -7.9456e+00, -7.2597e+00, -5.2189e+00, -4.2800e+00, -3.5097e+00, -4.3986e+00]], [[-3.5292e+00, -7.0829e+00, -6.8912e+00, -6.5514e+00, -5.2011e+00, -7.5039e+00, -5.7679e+00, -4.3899e+00, -3.9067e+00, -3.5582e+00, -3.3243e+00, -1.3543e+00, -1.2999e+00, -3.7941e+00]], [[-1.7036e+00, -4.7100e+00, -4.4586e+00, -6.5368e+00, -4.9491e+00, -6.2971e+00, -5.7447e+00, -3.0161e+00, -2.1293e+00, -3.6939e+00, -3.7451e+00, -1.3999e+00, -1.6855e+00, -2.9232e+00]], [[-4.5102e+00, -6.6571e+00, -7.7513e+00, -7.2560e+00, -7.4942e+00, -9.0027e+00, -5.2852e+00, -3.4049e+00, -4.2960e+00, -4.0000e+00, -4.1681e+00, -3.0859e+00, -3.8715e+00, -4.3605e+00]], [[-3.2218e-01, -3.1226e+00, -3.1407e+00, -4.0568e+00, -3.2121e+00, -4.6799e+00, -3.9818e+00, -1.6611e+00, -1.8705e+00, -3.0141e+00, -2.9772e+00, -1.7592e+00, -2.5651e+00, -3.2543e+00]], [[-1.2569e+00, -3.9588e+00, -2.6505e+00, -2.7182e+00, -2.6530e+00, -1.8443e+00, -1.9501e+00, -1.8447e+00, -1.1529e+00, -1.5928e+00, -1.1416e+00, -1.3282e+00, -9.2780e-01, -2.6712e-01]], [[-3.0335e+00, -6.8910e+00, -7.0437e+00, -6.0846e+00, -6.0816e+00, -7.5328e+00, -5.5467e+00, -3.9013e+00, -3.8178e+00, -3.1677e+00, -2.2068e+00, -2.1215e+00, -1.1466e+00, -3.9507e+00]], [[-4.7147e+00, -8.5789e+00, -8.1220e+00, -8.7297e+00, -8.7435e+00, -7.5233e+00, -5.3251e+00, -5.8553e+00, -4.8609e+00, -5.3494e+00, -4.2578e+00, -4.3676e+00, -2.8570e+00, -3.1346e+00]], [[-1.9931e+00, -3.6450e+00, -3.4933e+00, -3.3663e+00, -3.2778e+00, -2.6780e+00, -2.4851e+00, -2.7555e+00, -2.5044e+00, -2.5195e+00, -1.8303e+00, -2.1396e+00, -1.8301e+00, -1.4386e+00]], [[-6.7318e-01, -5.0132e+00, -4.7386e+00, -4.7677e+00, -4.3430e+00, -4.2108e+00, -4.0190e+00, -3.6998e+00, -3.5491e+00, -3.7125e+00, -3.1088e+00, -3.0000e+00, -2.9284e+00, -2.7227e+00]]], [[[-2.3608e+00, -5.0391e+00, -5.6501e+00, -7.4013e+00, -5.7482e+00, -4.2385e+00, -4.3570e+00, -3.3804e+00, -2.5215e+00, -3.5778e+00, -5.3750e+00, -2.2699e+00, -1.2721e+00, -4.9470e+00]], [[ 1.5170e+00, -1.0986e+00, -2.6667e+00, -1.9055e+00, -2.8210e+00, -1.5984e+00, -1.9181e+00, -1.7033e+00, -1.8079e+00, -3.7842e+00, -2.7462e+00, -1.6177e+00, -1.4828e+00, -1.8668e+00]], [[-7.0323e+00, -1.5183e+01, -1.3919e+01, -1.5953e+01, -1.1783e+01, -1.2055e+01, -1.0729e+01, -9.5061e+00, -7.6048e+00, -5.9416e+00, -7.9313e+00, -4.8359e+00, -2.8372e+00, -6.6270e+00]], [[-3.2568e+00, -7.1883e+00, -6.4794e+00, -8.8664e+00, -4.3365e+00, -6.0275e+00, -5.9479e+00, -4.7412e+00, -3.6788e+00, -3.0380e+00, -5.1003e+00, -1.7989e+00, -4.1541e+00, -3.4011e+00]], [[-3.1691e+00, -7.1771e+00, -7.6818e+00, -8.0901e+00, -6.2663e+00, -7.7614e+00, -7.0379e+00, -4.2632e+00, -3.0422e+00, -3.6807e+00, -4.0459e+00, 6.8544e-02, -2.3836e+00, -3.2975e+00]], [[-4.4500e+00, -7.7163e+00, -8.4020e+00, -8.6872e+00, -7.3876e+00, -7.4157e+00, -6.7992e+00, -3.9566e+00, -3.2919e+00, -3.9199e+00, -4.2535e+00, -4.5564e+00, -3.6740e+00, -3.9205e+00]], [[-5.1682e-01, -3.3788e+00, -3.1790e+00, -3.6765e+00, -3.5551e+00, -4.1754e+00, -3.8610e+00, -1.9375e+00, -2.0878e+00, -1.9999e+00, -2.6519e+00, -2.8393e+00, -2.0432e+00, -2.6159e+00]], [[-1.3447e+00, -4.3651e+00, -2.9956e+00, -2.6852e+00, -2.7554e+00, -1.9158e+00, -2.0040e+00, -1.9192e+00, -1.8701e+00, -1.1804e+00, -1.2569e+00, -1.5307e+00, -1.2967e+00, -1.1771e+00]], [[-3.4646e+00, -6.6971e+00, -9.2216e+00, -6.3997e+00, -6.1969e+00, -7.5993e+00, -6.3089e+00, -3.9085e+00, -4.0619e+00, -5.3423e+00, -2.6280e+00, -1.7761e+00, -2.5851e+00, -3.3936e+00]], [[-4.8428e+00, -8.8637e+00, -7.9421e+00, -9.6587e+00, -7.9822e+00, -5.3736e+00, -5.4756e+00, -5.8653e+00, -5.4613e+00, -3.6723e+00, -5.3271e+00, -2.8714e+00, -4.8099e+00, -4.2580e+00]], [[-1.6383e+00, -4.0940e+00, -3.6758e+00, -3.2704e+00, -3.5719e+00, -2.7650e+00, -2.5583e+00, -3.0831e+00, -2.7559e+00, -2.3776e+00, -2.1623e+00, -1.7129e+00, -2.0472e+00, -1.5586e+00]], [[-7.7812e-01, -5.6202e+00, -5.1031e+00, -4.8611e+00, -4.9190e+00, -4.2883e+00, -4.1392e+00, -4.2019e+00, -3.9224e+00, -3.5035e+00, -3.4828e+00, -3.1468e+00, -3.2638e+00, -2.7975e+00]]], [[[-2.1466e+00, -4.9052e+00, -5.1844e+00, -6.0852e+00, -4.8727e+00, -4.2237e+00, -4.7532e+00, -3.1083e+00, -4.3617e+00, -2.7963e+00, -1.6892e+00, -1.0570e+00, -1.4941e+00, -2.2555e+00]], [[ 1.6081e+00, -6.4791e-01, -2.6094e+00, -2.4093e+00, -2.8343e+00, -2.3386e+00, -2.7304e+00, -8.6909e-01, -2.0789e+00, -3.4147e+00, -3.4352e+00, -2.6203e+00, -2.2989e+00, -2.8801e+00]], [[-7.6576e+00, -1.4444e+01, -1.5273e+01, -1.4627e+01, -1.1142e+01, -1.1805e+01, -1.0417e+01, -8.8924e+00, -5.4184e+00, -6.8462e+00, -5.0242e+00, -5.0331e+00, -3.3005e+00, -5.4774e+00]], [[-3.4491e+00, -8.0232e+00, -6.8905e+00, -9.1418e+00, -4.1342e+00, -6.1604e+00, -5.1624e+00, -4.6156e+00, -4.0669e+00, -2.7540e+00, -3.9723e+00, -3.8399e+00, -2.4060e+00, -3.0813e+00]], [[-2.1344e+00, -6.5265e+00, -7.6396e+00, -6.1000e+00, -6.0234e+00, -9.3130e+00, -8.8634e+00, -3.2467e+00, -2.5405e+00, -3.5421e+00, -1.9903e+00, 2.8632e-01, -2.2886e+00, -5.9837e+00]], [[-4.5610e+00, -7.6583e+00, -8.8840e+00, -7.7361e+00, -7.8529e+00, -7.5646e+00, -6.9462e+00, -3.8936e+00, -5.6869e+00, -4.1062e+00, -4.3918e+00, -3.6601e+00, -3.6559e+00, -4.5476e+00]], [[-6.0848e-01, -3.4644e+00, -3.8551e+00, -4.5088e+00, -3.4204e+00, -4.2708e+00, -3.9109e+00, -1.9324e+00, -2.3118e+00, -2.5062e+00, -3.4260e+00, -3.3472e+00, -2.8761e+00, -2.9583e+00]], [[-1.3554e+00, -4.3766e+00, -3.0604e+00, -2.7824e+00, -2.8265e+00, -1.9541e+00, -2.0383e+00, -1.9425e+00, -1.6126e+00, -1.1955e+00, -1.7695e+00, -1.8621e+00, -1.2000e+00, -1.3441e+00]], [[-3.6464e+00, -8.0608e+00, -8.7754e+00, -6.4004e+00, -6.5971e+00, -8.0364e+00, -6.8981e+00, -4.6051e+00, -6.9745e+00, -4.7639e+00, -4.5343e+00, -3.0734e+00, -1.0670e+00, -4.3184e+00]], [[-3.9930e+00, -8.6786e+00, -7.9646e+00, -8.5821e+00, -7.4549e+00, -4.9789e+00, -5.5646e+00, -5.3476e+00, -6.2658e+00, -3.4648e+00, -3.8367e+00, -3.9068e+00, -2.2365e+00, -3.1437e+00]], [[-1.9865e+00, -3.9250e+00, -3.8337e+00, -3.6311e+00, -3.7879e+00, -2.9549e+00, -2.8674e+00, -3.2187e+00, -2.5807e+00, -2.6039e+00, -2.7266e+00, -2.3642e+00, -1.8966e+00, -1.8719e+00]], [[-8.2690e-01, -5.2300e+00, -5.0573e+00, -4.8448e+00, -4.8358e+00, -4.1999e+00, -4.0667e+00, -4.0230e+00, -3.6225e+00, -3.4345e+00, -3.6466e+00, -3.4020e+00, -3.0900e+00, -2.9820e+00]]], [[[-1.4930e+00, -4.6054e+00, -3.9919e+00, -4.5012e+00, -4.1435e+00, -4.6950e+00, -4.3321e+00, -3.7488e+00, -3.0519e+00, -2.8973e+00, -3.5054e+00, -2.5945e+00, -2.3084e+00, -2.0403e+00]], [[ 1.4331e+00, -7.8323e-01, -1.6073e+00, -1.1857e+00, -2.6071e+00, -1.6620e+00, -2.6497e+00, -1.2558e+00, -3.2496e+00, -1.8956e+00, -3.9648e+00, -4.2828e-01, -2.2460e+00, -1.7920e+00]], [[-8.3798e+00, -1.5368e+01, -1.4862e+01, -1.7182e+01, -1.2829e+01, -1.2330e+01, -1.1184e+01, -1.0046e+01, -8.1606e+00, -7.9434e+00, -7.0274e+00, -4.9639e+00, -2.6819e+00, -7.3995e+00]], [[-3.6465e+00, -7.3902e+00, -7.2223e+00, -9.4997e+00, -5.1026e+00, -6.9497e+00, -6.3520e+00, -4.4948e+00, -2.6786e+00, -4.0866e+00, -4.7667e+00, -2.9111e+00, -2.2247e+00, -4.8358e+00]], [[-1.5041e+00, -5.8558e+00, -7.3632e+00, -6.7880e+00, -5.3881e+00, -7.8777e+00, -8.7735e+00, -3.5704e+00, -3.3526e+00, -6.2710e+00, -7.4046e+00, -3.4548e+00, -1.8280e+00, -2.5526e+00]], [[-4.3692e+00, -7.1428e+00, -8.3354e+00, -9.2429e+00, -7.1967e+00, -7.4001e+00, -8.0496e+00, -3.9014e+00, -4.8565e+00, -6.1453e+00, -5.7601e+00, -1.8692e+00, -2.7850e+00, -3.4412e+00]], [[-1.6776e+00, -4.7255e+00, -4.1480e+00, -4.5050e+00, -4.0599e+00, -4.2916e+00, -3.8500e+00, -3.4480e+00, -3.0863e+00, -3.9157e+00, -3.1524e+00, -1.0859e+00, -1.7037e+00, -2.2382e+00]], [[-1.2595e+00, -4.0219e+00, -2.6936e+00, -2.4495e+00, -2.4426e+00, -1.7164e+00, -1.7794e+00, -1.7733e+00, -1.5458e+00, -1.3050e+00, -7.7279e-01, -5.9982e-01, -4.7988e-01, -6.6157e-01]], [[-2.6836e+00, -5.8837e+00, -8.5345e+00, -6.1127e+00, -5.2930e+00, -6.5066e+00, -6.0183e+00, -3.8513e+00, -3.5699e+00, -3.9500e+00, -4.5613e+00, -1.9102e+00, -3.3879e+00, -2.2242e+00]], [[-4.8791e+00, -8.9185e+00, -9.5579e+00, -1.0085e+01, -8.6805e+00, -6.6616e+00, -6.3992e+00, -6.2232e+00, -6.1813e+00, -4.4586e+00, -4.2152e+00, -3.4694e+00, -3.1239e+00, -4.2889e+00]], [[-1.7885e+00, -3.7008e+00, -3.4450e+00, -3.2512e+00, -3.3505e+00, -2.8582e+00, -2.6124e+00, -2.9987e+00, -2.7629e+00, -2.2960e+00, -2.0315e+00, -1.8158e+00, -1.4591e+00, -1.5922e+00]], [[-6.8294e-01, -5.4538e+00, -5.0527e+00, -4.9550e+00, -4.7219e+00, -4.3911e+00, -4.0805e+00, -4.1723e+00, -3.9960e+00, -3.6484e+00, -3.3781e+00, -3.0873e+00, -2.7432e+00, -2.8828e+00]]], [[[-7.3125e-01, -3.4544e+00, -1.8154e+00, -2.5454e+00, -2.6842e+00, -4.1944e+00, -3.6029e+00, -2.8314e+00, -2.1795e+00, -2.2284e+00, -2.8016e+00, -2.8871e+00, -2.3736e+00, -2.3139e+00]], [[ 1.5566e+00, -2.3098e+00, -1.4910e+00, -1.4506e+00, -2.5239e+00, -2.5917e+00, -2.3445e+00, -2.0846e+00, -1.7272e+00, -2.7173e+00, -2.2660e+00, -4.2076e+00, -1.7524e+00, -2.0904e+00]], [[-5.5297e+00, -1.2276e+01, -1.1672e+01, -1.1546e+01, -1.0821e+01, -1.1347e+01, -9.6361e+00, -8.7979e+00, -7.5970e+00, -7.2161e+00, -6.6350e+00, -5.2899e+00, -2.2831e+00, -4.0904e+00]], [[-2.0178e+00, -4.2091e+00, -3.8446e+00, -4.5548e+00, -3.4428e+00, -4.6687e+00, -4.5453e+00, -2.8259e+00, -3.0827e+00, -2.0439e+00, -3.3505e+00, -3.1690e+00, -1.5752e+00, -9.4920e-01]], [[-1.2929e+00, -3.5828e+00, -6.2173e+00, -5.6272e+00, -4.3329e+00, -7.0302e+00, -7.8436e+00, -2.6138e+00, -4.4135e+00, -3.5849e+00, -5.5764e+00, -6.5762e+00, 1.4886e-01, -2.4399e+00]], [[-3.4582e+00, -5.4496e+00, -6.2473e+00, -6.3099e+00, -6.0654e+00, -7.1748e+00, -6.4951e+00, -3.2840e+00, -4.7776e+00, -4.1544e+00, -4.3398e+00, -3.8003e+00, -5.4521e-01, -2.4811e+00]], [[-1.5938e+00, -4.5654e+00, -2.8185e+00, -2.9240e+00, -2.8349e+00, -3.6283e+00, -3.2617e+00, -3.4573e+00, -2.2332e+00, -2.0008e+00, -2.4316e+00, -2.6468e+00, -4.5032e-01, 1.0628e-01]], [[-1.2522e+00, -3.4141e+00, -1.8310e+00, -1.7397e+00, -1.6722e+00, -8.3991e-01, -8.3951e-01, -1.0216e+00, -1.0457e+00, -9.6759e-01, -1.2166e-01, 2.2521e-01, -2.6664e-01, -5.9029e-03]], [[-1.6657e+00, -4.3374e+00, -5.0649e+00, -4.3845e+00, -4.6361e+00, -4.8389e+00, -5.7966e+00, -2.9728e+00, -2.5417e+00, -3.4357e+00, -4.6905e+00, -4.6704e+00, -8.8144e-01, -1.7117e+00]], [[-2.9143e+00, -6.2744e+00, -6.1037e+00, -5.9102e+00, -6.0785e+00, -4.7598e+00, -4.4924e+00, -4.5092e+00, -3.6182e+00, -4.0447e+00, -3.1738e+00, -2.5568e+00, -1.2479e+00, -2.4057e+00]], [[-5.3312e-02, -2.9076e+00, -2.2562e+00, -2.2125e+00, -2.3794e+00, -1.6060e+00, -1.3220e+00, -2.2417e+00, -1.5993e+00, -1.8631e+00, -1.0773e+00, -8.4242e-01, -1.1730e+00, -1.0320e+00]], [[-4.4536e-01, -5.2528e+00, -4.6217e+00, -4.5679e+00, -4.4752e+00, -3.6314e+00, -3.6122e+00, -4.2238e+00, -3.5706e+00, -3.6850e+00, -2.9394e+00, -2.9365e+00, -3.0001e+00, -2.5112e+00]]]]) attn_weights tensor([[[[ 4.8957e+00, 4.2997e-01, -2.1495e+00, -2.7136e+00, -3.1520e-02, 3.2507e+00, -1.4736e+00, 2.8286e-01, -2.4469e+00, -3.3623e+00, -2.3412e+00, -7.6374e-01, -3.9187e+00, 2.6030e+00]], [[-2.6912e+00, -6.8143e+00, -5.7419e+00, -6.2815e+00, -5.9686e+00, -7.5197e+00, -6.5982e+00, -4.0666e+00, -3.5135e+00, -4.0928e+00, -4.9301e+00, -3.6375e+00, -4.5020e+00, -4.5362e+00]], [[-4.3039e+00, -1.1387e+01, -1.2839e+01, -1.1066e+01, -8.3666e+00, -1.0311e+01, -9.5119e+00, -7.7354e+00, -8.5421e+00, -6.8481e+00, -5.6394e+00, -2.3583e+00, -3.1543e+00, -5.4226e+00]], [[-4.9132e+00, -1.3294e+01, -1.5622e+01, -1.3688e+01, -1.3672e+01, -1.1908e+01, -1.2634e+01, -1.0361e+01, -1.1173e+01, -9.5662e+00, -9.0007e+00, -6.6258e+00, -5.1733e+00, -6.7082e+00]], [[ 7.7246e-01, -2.6192e+00, -3.9612e+00, -4.6596e+00, -3.0965e+00, -4.0909e+00, -1.0646e+00, -2.8417e+00, -3.8806e+00, -4.9398e+00, -4.5649e+00, -2.6374e+00, -3.3449e+00, -3.5928e+00]], [[ 1.5070e-01, -3.5157e+00, -4.8918e+00, -4.2156e+00, -3.2108e+00, -3.0247e+00, -2.6936e+00, -3.5345e+00, -4.7694e+00, -4.1957e+00, -3.3466e+00, -2.6315e+00, -2.5455e+00, -2.4051e+00]], [[-3.5426e+00, -8.3674e+00, -8.4047e+00, -8.8976e+00, -7.9587e+00, -6.9561e+00, -8.2446e+00, -5.9248e+00, -5.4748e+00, -6.2250e+00, -5.5631e+00, -3.6219e+00, -2.7835e+00, -4.0676e+00]], [[-5.2865e+00, -1.2222e+01, -1.3627e+01, -1.2934e+01, -1.2670e+01, -1.1047e+01, -1.1253e+01, -9.4863e+00, -9.8799e+00, -9.2500e+00, -7.3136e+00, -6.3143e+00, -5.3794e+00, -6.1335e+00]], [[-4.5351e+00, -1.0404e+01, -1.0965e+01, -9.6509e+00, -9.4919e+00, -1.1598e+01, -8.4010e+00, -7.0219e+00, -7.4269e+00, -6.3589e+00, -4.7650e+00, -4.9083e+00, -5.4536e+00, -6.5796e+00]], [[-1.8145e+00, -5.9448e+00, -6.1877e+00, -6.0036e+00, -5.8726e+00, -6.6274e+00, -5.3839e+00, -4.7441e+00, -4.6179e+00, -4.4378e+00, -3.5355e+00, -2.9333e+00, -2.7942e+00, -3.5760e+00]], [[-1.1015e+00, -5.9600e+00, -7.0947e+00, -7.4581e+00, -5.9462e+00, -3.5059e+00, -3.8446e+00, -4.5851e+00, -5.9373e+00, -6.3261e+00, -4.4409e+00, -3.1467e+00, -2.6512e+00, -1.7766e+00]], [[-2.3633e+00, -7.6963e+00, -8.7915e+00, -7.5115e+00, -7.8586e+00, -7.2990e+00, -5.8923e+00, -4.5692e+00, -6.1417e+00, -5.3190e+00, -5.0107e+00, -4.0831e+00, -1.4236e+00, -4.6062e+00]]], [[[ 5.0038e+00, -1.3347e+00, -2.8710e+00, -1.2404e+00, -4.4874e-01, -2.5221e+00, -3.4554e+00, -1.4353e+00, -1.9801e+00, -3.1837e+00, -1.9770e+00, -2.0026e+00, -8.7021e-01, 2.2735e+00]], [[-2.8376e+00, -6.8177e+00, -5.7838e+00, -6.8200e+00, -5.9679e+00, -7.2577e+00, -8.0068e+00, -4.0899e+00, -3.9655e+00, -3.4803e+00, -4.3490e+00, -5.2994e+00, -5.5562e+00, -4.8406e+00]], [[-4.6823e+00, -9.9007e+00, -9.4149e+00, -9.1986e+00, -7.6016e+00, -8.6772e+00, -9.7621e+00, -7.7249e+00, -6.9259e+00, -5.8262e+00, -5.5266e+00, -4.4394e+00, -5.0774e+00, -5.2067e+00]], [[-5.2997e+00, -1.2190e+01, -1.4736e+01, -1.3566e+01, -1.1947e+01, -1.2523e+01, -1.2215e+01, -8.7415e+00, -9.3150e+00, -1.0305e+01, -9.2667e+00, -5.3674e+00, -5.7975e+00, -7.1595e+00]], [[ 1.3168e+00, -3.7857e+00, -4.1151e+00, -3.5445e+00, -3.1515e+00, -3.4363e+00, -3.0389e+00, -3.2610e+00, -3.0193e+00, -4.1254e+00, -3.8437e+00, -3.2977e+00, -3.2722e+00, -3.3494e+00]], [[-3.0264e-03, -2.9585e+00, -3.8891e+00, -3.3856e+00, -2.7087e+00, -2.7042e+00, -1.9987e+00, -3.2360e+00, -3.5363e+00, -3.8949e+00, -3.6453e+00, -3.2092e+00, -3.1143e+00, -3.1432e+00]], [[-3.8284e+00, -7.6662e+00, -5.1773e+00, -7.5398e+00, -7.9918e+00, -5.6928e+00, -6.3447e+00, -5.3778e+00, -5.1339e+00, -2.2966e+00, -4.5733e+00, -3.5449e+00, -3.7195e+00, -5.0813e+00]], [[-6.5014e+00, -1.1426e+01, -1.1779e+01, -1.3031e+01, -1.0675e+01, -8.7432e+00, -7.8842e+00, -7.5950e+00, -8.5435e+00, -7.2762e+00, -8.5115e+00, -6.6566e+00, -7.0656e+00, -6.6439e+00]], [[-4.6195e+00, -9.1980e+00, -1.0492e+01, -1.1097e+01, -1.0809e+01, -8.9229e+00, -8.7211e+00, -5.7092e+00, -5.7188e+00, -7.1593e+00, -7.1042e+00, -7.2459e+00, -4.8063e+00, -5.8863e+00]], [[-1.8437e+00, -6.2925e+00, -6.4114e+00, -5.1036e+00, -5.1980e+00, -8.8442e+00, -5.6707e+00, -4.3868e+00, -4.8782e+00, -4.4293e+00, -2.8959e+00, -4.8953e-01, -2.1601e+00, -2.6232e+00]], [[-1.0536e+00, -6.4053e+00, -5.7214e+00, -6.9376e+00, -4.9649e+00, -4.8595e+00, -4.9553e+00, -4.7166e+00, -4.7383e+00, -4.7214e+00, -5.6233e+00, -3.9760e+00, -5.1676e+00, -2.5863e+00]], [[-2.8445e+00, -6.5602e+00, -7.5093e+00, -7.8048e+00, -5.1973e+00, -5.5283e+00, -5.8436e+00, -4.9784e+00, -4.7074e+00, -5.0223e+00, -5.3374e+00, -1.7768e+00, -3.3306e+00, -4.2114e+00]]], [[[ 4.6282e+00, -1.3096e+00, -2.9121e+00, -2.2405e+00, -3.3649e-01, -3.2773e+00, -4.0560e+00, -1.5571e+00, -1.8676e+00, -3.2535e+00, -3.3571e+00, -2.6472e+00, -2.9452e+00, 1.4633e+00]], [[-2.7575e+00, -6.2095e+00, -5.4657e+00, -7.0703e+00, -6.3317e+00, -6.6847e+00, -7.2839e+00, -4.2076e+00, -4.0430e+00, -3.5734e+00, -4.8603e+00, -5.0175e+00, -5.8385e+00, -5.1276e+00]], [[-4.5781e+00, -1.1699e+01, -1.1208e+01, -8.9143e+00, -8.7494e+00, -8.8968e+00, -9.6800e+00, -8.8005e+00, -7.2675e+00, -5.6488e+00, -5.8527e+00, -4.4594e+00, -1.3726e+00, -4.8145e+00]], [[-5.1420e+00, -1.2903e+01, -1.5574e+01, -1.2929e+01, -1.2829e+01, -1.2966e+01, -1.2226e+01, -9.6039e+00, -9.5807e+00, -1.1033e+01, -7.3912e+00, -6.4992e+00, -4.4153e+00, -7.5628e+00]], [[ 1.6216e+00, -4.1354e+00, -3.9836e+00, -3.9055e+00, -3.8346e+00, -2.5983e+00, -4.2044e+00, -3.6429e+00, -3.5890e+00, -3.7510e+00, -4.9329e+00, -4.0766e+00, -4.8597e+00, -5.2068e+00]], [[ 1.7067e-01, -3.2170e+00, -4.9244e+00, -4.0106e+00, -3.1354e+00, -2.6893e+00, -3.2864e+00, -3.6369e+00, -4.2068e+00, -4.4630e+00, -3.5119e+00, -3.5382e+00, -2.4080e+00, -2.9104e+00]], [[-3.1337e+00, -7.8141e+00, -6.5236e+00, -7.7134e+00, -9.0985e+00, -6.3591e+00, -6.7852e+00, -5.3419e+00, -6.4022e+00, -2.8845e+00, -4.9054e+00, -3.8947e+00, -4.1451e+00, -4.4882e+00]], [[-5.8495e+00, -1.1852e+01, -1.2986e+01, -1.2164e+01, -1.2713e+01, -9.2040e+00, -9.3606e+00, -8.2477e+00, -1.2055e+01, -7.7322e+00, -7.7897e+00, -8.5367e+00, -4.9338e+00, -6.6474e+00]], [[-4.0972e+00, -9.1179e+00, -1.0389e+01, -9.1361e+00, -1.0631e+01, -9.5771e+00, -9.7398e+00, -6.0475e+00, -9.6072e+00, -6.3984e+00, -5.9317e+00, -6.8268e+00, -4.1201e+00, -6.6775e+00]], [[-1.7954e+00, -5.6247e+00, -5.6624e+00, -5.1856e+00, -4.2551e+00, -6.7938e+00, -5.9017e+00, -3.3529e+00, -6.6988e+00, -3.4361e+00, -1.9661e+00, -2.6646e+00, -3.8747e-01, -3.5544e+00]], [[-8.1763e-01, -5.4975e+00, -6.3030e+00, -7.0194e+00, -5.2481e+00, -4.8025e+00, -5.4112e+00, -4.8023e+00, -6.6247e+00, -5.1915e+00, -5.3533e+00, -3.5594e+00, -3.7874e+00, -2.5553e+00]], [[-2.2720e+00, -6.6641e+00, -7.5970e+00, -8.1259e+00, -5.4824e+00, -7.3646e+00, -6.9605e+00, -4.6824e+00, -6.7276e+00, -4.9484e+00, -3.5170e+00, -2.7908e+00, -3.2356e+00, -3.1003e+00]]], [[[ 4.5946e+00, -9.4692e-01, -1.9832e+00, 1.6301e+00, -7.5263e-01, -5.6415e+00, -3.7605e+00, -9.8738e-01, -1.1274e+00, -5.8176e+00, -4.4651e+00, -3.1593e+00, -2.0049e+00, 1.6052e+00]], [[-2.8656e+00, -7.3561e+00, -7.4716e+00, -8.4215e+00, -8.0456e+00, -6.1416e+00, -7.6125e+00, -5.1382e+00, -6.1526e+00, -7.0950e+00, -6.4866e+00, -3.9119e+00, -5.4040e+00, -4.8968e+00]], [[-4.4310e+00, -8.7895e+00, -1.0731e+01, -1.1654e+01, -8.0027e+00, -1.0410e+01, -1.0304e+01, -7.4635e+00, -5.3266e+00, -7.3313e+00, -7.7437e+00, -5.6535e+00, -3.7884e+00, -5.8091e+00]], [[-4.8412e+00, -1.2530e+01, -1.3960e+01, -1.4190e+01, -1.2119e+01, -1.1730e+01, -1.2377e+01, -9.5502e+00, -9.8242e+00, -1.1996e+01, -1.0174e+01, -6.1273e+00, -5.6958e+00, -6.4323e+00]], [[ 1.1882e+00, -3.8055e+00, -3.5130e+00, -2.0179e+00, -3.1456e+00, -3.3405e+00, -3.3375e+00, -3.3001e+00, -2.9630e+00, -4.1359e+00, -3.4848e+00, -2.7929e+00, -3.8105e+00, -2.1692e+00]], [[-8.0648e-02, -2.9151e+00, -3.5210e+00, -2.3760e+00, -1.4484e+00, -1.9113e+00, -2.0674e+00, -3.4530e+00, -2.2277e+00, -2.5737e+00, -2.7198e+00, -2.7309e+00, -2.7271e+00, -2.6408e+00]], [[-3.0301e+00, -8.6964e+00, -6.7702e+00, -9.3013e+00, -7.7313e+00, -5.7513e+00, -6.6535e+00, -6.2863e+00, -6.1861e+00, -4.6145e+00, -5.1528e+00, -4.6337e+00, -2.9424e+00, -5.3112e+00]], [[-5.7178e+00, -1.2300e+01, -1.3674e+01, -1.3924e+01, -1.1297e+01, -9.6997e+00, -9.3715e+00, -8.6740e+00, -8.7465e+00, -6.9769e+00, -7.6461e+00, -5.8963e+00, -6.0385e+00, -6.7977e+00]], [[-4.2287e+00, -8.5422e+00, -1.0138e+01, -1.1134e+01, -1.0073e+01, -9.3243e+00, -8.7515e+00, -6.3723e+00, -7.8010e+00, -7.9379e+00, -6.8204e+00, -4.8925e+00, -5.9708e+00, -5.5911e+00]], [[-1.5856e+00, -5.9962e+00, -7.5775e+00, -6.4563e+00, -7.6416e+00, -7.3307e+00, -7.1261e+00, -5.6090e+00, -5.9939e+00, -6.3563e+00, -6.3582e+00, -4.5427e+00, -3.5116e+00, -2.8833e+00]], [[-1.0557e+00, -4.7572e+00, -5.5239e+00, -5.0977e+00, -4.7559e+00, -4.5855e+00, -4.8822e+00, -4.1234e+00, -3.7561e+00, -3.8038e+00, -4.0247e+00, -3.8640e+00, -3.4041e+00, -2.7048e+00]], [[-2.3493e+00, -7.3906e+00, -8.7804e+00, -8.2865e+00, -6.3242e+00, -5.7498e+00, -7.2641e+00, -6.7143e+00, -4.8019e+00, -5.6680e+00, -6.6221e+00, -4.1359e+00, -4.6789e+00, -4.8603e+00]]], [[[ 4.6419e+00, 8.1849e-01, -2.5424e+00, -9.5163e-01, 6.5112e-04, -4.1519e+00, -4.2286e+00, -5.9632e-01, -2.9538e+00, -1.6967e+00, -3.8602e+00, -5.5162e+00, -5.3095e-01, 2.1570e+00]], [[-2.3394e+00, -4.6884e+00, -5.2499e+00, -5.5576e+00, -7.0804e+00, -7.6366e+00, -7.4399e+00, -5.1610e+00, -7.0742e+00, -6.3479e+00, -7.7418e+00, -6.5416e+00, -3.2039e+00, -3.9672e+00]], [[-4.2183e+00, -5.6004e+00, -6.5603e+00, -7.1983e+00, -7.0409e+00, -7.0348e+00, -7.8106e+00, -5.0602e+00, -5.6638e+00, -5.5956e+00, -6.5867e+00, -5.6175e+00, -4.1372e+00, -4.4235e+00]], [[-4.6993e+00, -1.1070e+01, -1.2526e+01, -1.2129e+01, -1.2616e+01, -1.0806e+01, -1.0059e+01, -1.0303e+01, -1.1630e+01, -1.0873e+01, -9.0570e+00, -8.1104e+00, -6.2187e+00, -7.3016e+00]], [[ 9.7445e-01, -1.9564e+00, -3.7211e+00, -4.7867e+00, -3.1169e+00, -4.6658e+00, -3.5116e+00, -2.8746e+00, -3.2922e+00, -3.4793e+00, -3.6784e+00, -4.2796e+00, -2.3949e+00, -1.6316e+00]], [[-4.1333e-01, -1.3198e+00, -4.1986e-01, -6.7931e-01, -9.8486e-01, -2.4464e+00, -3.2198e+00, -2.4248e+00, -2.0914e+00, -2.5185e+00, -3.5770e+00, -5.1606e+00, -2.4696e+00, -3.4066e+00]], [[-3.0279e+00, -6.0488e+00, -5.0438e+00, -5.5326e+00, -4.9454e+00, -4.1522e+00, -4.3520e+00, -5.8935e+00, -4.5155e+00, -4.2903e+00, -3.8671e+00, -3.7970e+00, -4.6758e+00, -4.4437e+00]], [[-5.1883e+00, -9.9697e+00, -9.7256e+00, -9.2847e+00, -9.6912e+00, -8.6641e+00, -7.9371e+00, -7.7667e+00, -6.4766e+00, -7.6476e+00, -5.8840e+00, -5.5475e+00, -5.2215e+00, -6.7998e+00]], [[-3.3115e+00, -7.2902e+00, -8.2673e+00, -8.0093e+00, -8.9364e+00, -8.6495e+00, -7.3427e+00, -4.7276e+00, -5.6728e+00, -7.0627e+00, -6.5253e+00, -5.5396e+00, -2.4280e+00, -3.9044e+00]], [[-1.5508e+00, -2.8970e+00, -4.6714e+00, -4.2221e+00, -5.6322e+00, -4.4659e+00, -6.5829e+00, -3.6235e+00, -4.1302e+00, -6.0136e+00, -7.5771e+00, -6.5026e+00, -3.0125e+00, -4.4002e+00]], [[-9.6355e-01, -5.1393e+00, -4.9412e+00, -5.0693e+00, -4.8305e+00, -4.0765e+00, -4.7252e+00, -4.4449e+00, -4.7759e+00, -4.0815e+00, -3.7343e+00, -3.3960e+00, -3.2611e+00, -2.9418e+00]], [[-2.0438e+00, -5.7566e+00, -6.2974e+00, -5.2390e+00, -5.5255e+00, -3.9273e+00, -5.0942e+00, -5.3192e+00, -3.3904e+00, -4.9402e+00, -5.3131e+00, -5.7665e+00, -4.4517e+00, -2.6253e+00]]]]) attn_weights tensor([[[[-3.1516e+00, -8.7058e+00, -9.8753e+00, -6.5485e+00, -6.8870e+00, -8.6486e+00, -6.8709e+00, -5.8984e+00, -7.2546e+00, -4.4068e+00, -2.7100e+00, -4.0517e+00, -4.3333e+00, -5.0957e+00]], [[-2.5019e+00, -7.5158e+00, -6.6972e+00, -6.6013e+00, -6.8928e+00, -7.6650e+00, -5.8925e+00, -4.0231e+00, -4.1750e+00, -4.3530e+00, -4.7392e+00, -4.4377e+00, -5.5799e+00, -5.3424e+00]], [[-3.2112e-01, -2.8948e+00, -3.5718e+00, -3.4156e+00, -3.4535e+00, -4.9834e+00, -3.3907e+00, -2.3706e+00, -3.0104e+00, -3.0918e+00, -3.0437e+00, -2.8347e+00, -3.4968e+00, -4.1267e+00]], [[-1.8664e+00, -6.0726e+00, -5.6302e+00, -6.1666e+00, -6.5169e+00, -5.3805e+00, -7.2207e+00, -5.3561e+00, -4.5369e+00, -4.9565e+00, -4.2152e+00, -4.3178e+00, -3.7922e+00, -2.6146e+00]], [[ 1.5758e+00, -2.7398e+00, -4.8761e+00, -5.5352e+00, -2.2231e+00, -9.0897e-01, -3.3194e+00, -2.1242e+00, -4.5760e+00, -5.4652e+00, -2.1865e+00, -8.9351e-01, 2.9679e-01, -5.4601e-01]], [[-2.5770e+00, -7.0580e+00, -7.7978e+00, -7.2982e+00, -8.0117e+00, -6.7234e+00, -6.4207e+00, -3.9769e+00, -5.2890e+00, -5.1551e+00, -5.2260e+00, -3.6260e+00, -2.1795e+00, -4.4362e+00]], [[-2.0075e+00, -5.7305e+00, -6.2863e+00, -6.5646e+00, -5.7263e+00, -6.2311e+00, -4.0440e+00, -4.8624e+00, -4.9733e+00, -5.4706e+00, -4.0072e+00, -4.2339e+00, -4.1680e+00, -4.7382e+00]], [[ 2.5404e-01, -3.9614e+00, -3.2668e+00, -4.2090e+00, -3.3982e+00, -2.0983e-01, -2.1081e+00, -3.4828e+00, -3.9087e+00, -4.7066e+00, -2.2676e+00, -1.7399e+00, -1.7645e-01, 1.3658e+00]], [[ 1.9296e+00, -5.0911e+00, -4.0697e+00, -4.1666e+00, -3.0696e+00, -3.3280e+00, -2.3513e+00, -2.2566e+00, -3.1880e+00, -3.4619e+00, -3.9928e+00, -2.3030e+00, -1.4976e+00, -2.3499e+00]], [[-1.1035e+00, -4.7600e+00, -4.5176e+00, -5.7027e+00, -4.4272e+00, -6.5865e+00, -4.3875e+00, -4.2249e+00, -3.5348e+00, -4.3170e+00, -3.7298e+00, -2.7434e+00, -2.5297e+00, -4.8608e+00]], [[ 1.1946e+00, -4.1557e+00, -4.2782e+00, -5.9050e+00, -3.5835e+00, -2.6387e+00, -2.2957e+00, -3.4057e+00, -4.1381e+00, -5.5569e+00, -3.5303e+00, -2.8954e+00, -3.0079e+00, -2.5382e+00]], [[-4.6263e+00, -1.7685e+01, -2.5253e+01, -2.7368e+01, -1.9076e+01, -1.0822e+01, -1.8401e+01, -1.8802e+01, -1.9781e+01, -2.0122e+01, -4.0877e+00, 5.0621e+00, 1.4615e+01, 6.7650e+00]]], [[[-2.2784e+00, -1.0130e+01, -8.9178e+00, -1.0219e+01, -1.0603e+01, -1.0119e+01, -1.0264e+01, -8.6302e+00, -7.1363e+00, -6.2361e+00, -7.4638e+00, -6.7712e+00, -5.4881e+00, -4.3207e+00]], [[-3.0154e+00, -6.6274e+00, -6.5438e+00, -6.8824e+00, -7.0911e+00, -4.4068e+00, -5.7173e+00, -3.9976e+00, -3.2763e+00, -3.8942e+00, -4.1941e+00, -2.6928e+00, -4.2995e+00, -3.6138e+00]], [[-1.6581e-01, -2.9587e+00, -3.5456e+00, -3.6341e+00, -4.1978e+00, -4.5594e+00, -3.3354e+00, -2.9889e+00, -3.2918e+00, -3.6307e+00, -3.5893e+00, -3.3861e+00, -3.4586e+00, -3.8280e+00]], [[-2.2591e+00, -5.3506e+00, -3.7809e+00, -4.0846e+00, -4.9093e+00, -4.7639e+00, -4.7983e+00, -5.4741e+00, -4.1997e+00, -1.6410e+00, -2.5527e+00, -4.0444e+00, -4.1353e+00, -3.5326e+00]], [[ 1.5770e+00, -2.3873e+00, -1.4475e+00, -3.1646e+00, -2.7594e+00, -4.3522e+00, -4.0844e+00, -2.4036e+00, -3.8726e+00, -1.6419e+00, -3.4792e+00, -4.7534e-01, -8.3880e-01, -9.9269e-01]], [[-2.3929e+00, -7.3375e+00, -8.3418e+00, -9.5472e+00, -7.4315e+00, -8.4577e+00, -9.1351e+00, -6.3980e+00, -5.7719e+00, -6.0575e+00, -7.4595e+00, -5.8355e+00, -6.2385e+00, -7.2367e+00]], [[-2.0226e+00, -6.1436e+00, -6.4311e+00, -6.7330e+00, -5.4765e+00, -5.4190e+00, -4.9145e+00, -5.4729e+00, -5.2208e+00, -5.3970e+00, -5.7939e+00, -3.9086e+00, -4.3486e+00, -4.6141e+00]], [[ 1.0590e+00, -4.7707e+00, -4.1811e+00, -2.8977e+00, -2.4337e+00, -3.0513e+00, -3.3505e+00, -3.4199e+00, -3.3056e+00, -3.0743e+00, -2.1810e+00, -1.2194e+00, 4.5046e-01, 1.5530e+00]], [[ 1.8224e+00, -3.6642e+00, -2.8012e+00, -3.1880e+00, -2.4069e+00, -2.6128e+00, -1.3817e+00, -2.8191e+00, -1.7069e+00, -2.7119e+00, -3.4926e+00, -2.0859e+00, -2.0239e+00, -2.4131e+00]], [[-1.2305e+00, -4.6216e+00, -5.0930e+00, -4.7154e+00, -4.2620e+00, -4.6234e+00, -3.9059e+00, -4.2776e+00, -4.2374e+00, -3.5873e+00, -3.6199e+00, -3.3077e-01, -1.7207e+00, -3.2016e+00]], [[ 1.4949e+00, -2.7714e+00, -3.6615e+00, -4.2020e+00, -3.4682e+00, -3.6438e+00, -2.9482e+00, -2.1036e+00, -2.6262e+00, -3.6224e+00, -4.4391e+00, -3.5633e+00, -2.5061e+00, -3.3522e+00]], [[-5.8839e+00, -2.4662e+01, -2.6641e+01, -2.1579e+01, -2.4469e+01, -2.7319e+01, -2.8793e+01, -2.2759e+01, -2.1697e+01, -1.3452e+01, -7.6548e+00, 2.7602e+00, 1.5845e+01, 9.9762e+00]]], [[[-2.3852e+00, -1.0438e+01, -8.9713e+00, -7.5600e+00, -7.8305e+00, -8.8870e+00, -8.7837e+00, -6.6076e+00, -9.2399e+00, -5.4034e+00, -4.9919e+00, -4.2944e+00, -1.4565e+00, -5.4164e+00]], [[-2.1024e+00, -6.2947e+00, -5.6924e+00, -5.9283e+00, -6.9611e+00, -4.2862e+00, -5.9929e+00, -3.7662e+00, -4.1731e+00, -2.4950e+00, -3.4174e+00, -2.5902e+00, -3.7919e+00, -3.4005e+00]], [[ 4.2909e-02, -2.5768e+00, -3.3066e+00, -3.5089e+00, -4.2416e+00, -4.4549e+00, -3.8397e+00, -2.9276e+00, -3.2121e+00, -3.5461e+00, -3.6579e+00, -3.3452e+00, -2.4201e+00, -4.4798e+00]], [[-1.9538e+00, -5.7352e+00, -4.1345e+00, -3.4846e+00, -4.7341e+00, -4.7234e+00, -4.4328e+00, -4.8672e+00, -5.2969e+00, -2.1343e+00, -1.8508e+00, -3.3123e+00, -2.8855e+00, -4.9774e+00]], [[ 1.6487e+00, -3.2741e+00, -1.9012e+00, -3.6943e+00, -3.2586e+00, -5.1033e+00, -5.5206e+00, -2.4587e+00, -4.1066e+00, -2.1790e+00, -3.2760e+00, -1.9217e+00, -2.2110e+00, -1.9019e+00]], [[-1.8106e+00, -7.6949e+00, -7.9831e+00, -6.5058e+00, -6.1258e+00, -7.0045e+00, -7.9525e+00, -5.6542e+00, -6.3602e+00, -4.5932e+00, -3.9141e+00, -4.9655e+00, -4.1010e+00, -3.5556e+00]], [[-1.6828e+00, -5.7346e+00, -6.8385e+00, -5.6196e+00, -5.7631e+00, -4.6244e+00, -4.7572e+00, -4.7922e+00, -5.3503e+00, -5.3497e+00, -4.9114e+00, -3.9499e+00, -3.3466e+00, -4.0315e+00]], [[ 7.6926e-01, -2.6640e+00, -3.8660e+00, -2.9724e+00, -1.6437e+00, -2.0744e+00, -3.4393e+00, -3.1656e+00, -3.7023e+00, -2.7086e+00, -3.0128e+00, -1.8795e+00, 4.5504e-01, 1.4758e+00]], [[ 1.6164e+00, -3.5891e+00, -3.2361e+00, -2.2840e+00, -2.3062e+00, -2.7526e+00, -2.7709e+00, -2.1607e+00, -1.7917e+00, -2.8457e+00, -2.9056e+00, -1.4801e+00, -1.5560e+00, -8.2036e-01]], [[-9.8678e-01, -5.6831e+00, -5.0778e+00, -5.0443e+00, -5.1195e+00, -3.6146e+00, -4.7562e+00, -5.1473e+00, -4.2600e+00, -3.0412e+00, -1.9154e+00, -2.7347e+00, -1.0260e+00, -3.2106e+00]], [[ 1.5810e+00, -2.7442e+00, -3.6834e+00, -3.6607e+00, -3.1413e+00, -3.4417e+00, -3.2980e+00, -2.0988e+00, -2.2278e+00, -3.1566e+00, -4.9404e+00, -3.5991e+00, -3.8353e+00, -4.0455e+00]], [[-6.1545e+00, -2.3414e+01, -2.5208e+01, -1.3870e+01, -1.4196e+01, -1.9661e+01, -2.3178e+01, -2.0912e+01, -1.4240e+01, -1.0643e+01, -1.4853e+00, 4.3454e+00, 1.6084e+01, 7.9175e+00]]], [[[-2.5710e+00, -9.4955e+00, -9.5399e+00, -1.0150e+01, -9.7635e+00, -8.8169e+00, -7.9624e+00, -8.1335e+00, -7.6797e+00, -7.7511e+00, -7.4517e+00, -5.3989e+00, -3.7693e+00, -4.4043e+00]], [[-2.6850e+00, -6.5855e+00, -7.9743e+00, -7.6184e+00, -8.1792e+00, -6.6531e+00, -6.4486e+00, -4.4847e+00, -6.1125e+00, -6.2223e+00, -5.2480e+00, -1.9400e+00, -3.1103e+00, -3.5396e+00]], [[-3.5793e-01, -1.4657e+00, -2.4103e+00, -2.8730e+00, -4.0779e+00, -4.5395e+00, -2.7874e+00, -2.0161e+00, -4.4849e+00, -4.4467e+00, -3.4276e+00, -1.4472e+00, -2.2998e+00, -2.5548e+00]], [[-1.8125e+00, -7.5660e+00, -7.0799e+00, -6.8672e+00, -5.8925e+00, -1.7430e+00, -3.5046e+00, -4.7778e+00, -5.0061e+00, -3.1062e+00, -2.7605e+00, -4.6553e+00, -2.0968e+00, -3.1848e+00]], [[ 1.5606e+00, -2.5692e+00, -3.1538e+00, -2.1686e+00, -2.9486e+00, -3.2201e+00, -3.1185e+00, -2.3326e+00, -2.8237e+00, -4.3181e+00, -3.0051e+00, -1.7333e+00, -6.0796e-01, -1.0053e+00]], [[-2.2161e+00, -8.3482e+00, -8.6472e+00, -8.7230e+00, -8.0331e+00, -7.6865e+00, -7.7805e+00, -6.8586e+00, -7.0476e+00, -7.6944e+00, -7.8689e+00, -4.4219e+00, -3.6300e+00, -4.3272e+00]], [[-2.2208e+00, -5.7035e+00, -6.0252e+00, -5.8835e+00, -4.5568e+00, -4.7355e+00, -4.0050e+00, -5.1744e+00, -5.1926e+00, -4.0444e+00, -4.0389e+00, -3.7613e+00, -4.5276e+00, -4.1009e+00]], [[ 7.5151e-01, -6.5432e+00, -3.7060e+00, -2.2314e+00, -4.0616e+00, -3.5589e+00, -4.3492e+00, -3.8845e+00, -3.4891e+00, -2.2282e+00, -3.6260e+00, -1.2171e+00, -3.1661e-01, 6.9068e-01]], [[ 1.3416e+00, -2.6809e+00, -3.0078e+00, -2.6303e+00, -2.4147e+00, -3.0480e+00, -1.4917e+00, -2.2533e+00, -2.0777e+00, -2.6233e+00, -2.5260e+00, -2.2310e+00, -1.9929e+00, -1.7235e+00]], [[-1.1108e+00, -3.7059e+00, -5.7028e+00, -5.9638e+00, -4.6000e+00, -5.0897e+00, -3.1658e+00, -3.8843e+00, -5.6904e+00, -4.1457e+00, -3.2710e+00, -3.3878e+00, -2.8697e+00, -3.3352e+00]], [[ 1.1592e+00, -2.2123e+00, -2.6703e+00, -3.0569e+00, -2.7594e+00, -2.8512e+00, -3.0193e+00, -1.6737e+00, -1.9378e+00, -4.8982e+00, -3.8888e+00, -1.4180e+00, -1.8220e+00, -2.9209e+00]], [[-4.5357e+00, -3.0358e+01, -1.6455e+01, -2.3331e+01, -2.9587e+01, -1.7932e+01, -1.9944e+01, -1.9118e+01, -1.7004e+01, -1.3349e+01, -7.9929e+00, -1.1442e+00, 1.1691e+01, 8.1352e-01]]], [[[-2.8830e+00, -6.2582e+00, -5.9213e+00, -5.1505e+00, -7.0390e+00, -6.7144e+00, -6.2083e+00, -5.7254e+00, -5.7865e+00, -5.4293e+00, -7.9880e+00, -6.2291e+00, -4.0340e+00, -2.8625e+00]], [[-1.3689e+00, -6.2490e+00, -7.8751e+00, -6.5599e+00, -7.7685e+00, -7.8361e+00, -7.4864e+00, -5.2608e+00, -5.3050e+00, -6.7966e+00, -7.5315e+00, -6.8541e+00, -3.6883e+00, -4.7935e+00]], [[ 4.2408e-01, -1.6175e+00, -2.9304e+00, -2.6739e+00, -3.2890e+00, -5.2268e+00, -4.5773e+00, -2.8153e+00, -2.5005e+00, -4.7758e+00, -5.2200e+00, -5.4512e+00, -1.6982e+00, -2.3148e+00]], [[-1.5116e+00, -6.1042e+00, -5.9077e+00, -5.0299e+00, -4.7993e+00, -4.7577e+00, -4.2381e+00, -5.0133e+00, -5.2131e+00, -5.2989e+00, -5.4420e+00, -4.1037e+00, -5.3986e+00, -4.9716e+00]], [[ 1.4541e+00, -2.3956e+00, -2.8326e+00, -2.9493e+00, -2.4035e+00, -3.1765e+00, -2.7354e+00, -3.3421e+00, -5.2953e+00, -2.7727e+00, -3.8003e+00, -2.2367e+00, -2.2043e+00, 1.4783e-03]], [[-1.6505e+00, -7.5672e+00, -6.9489e+00, -6.6528e+00, -7.5090e+00, -7.4768e+00, -9.2565e+00, -7.8758e+00, -6.0042e+00, -6.5281e+00, -6.9329e+00, -8.8241e+00, -4.3869e+00, -4.8378e+00]], [[-2.0833e+00, -3.6284e+00, -4.5086e+00, -3.9698e+00, -3.7426e+00, -4.0658e+00, -4.3879e+00, -3.7117e+00, -3.7906e+00, -4.0284e+00, -3.4739e+00, -4.1836e+00, -3.0797e+00, -3.4712e+00]], [[ 6.8261e-01, -5.1303e+00, -3.1536e+00, -2.1211e+00, -3.3652e+00, -3.6134e+00, -3.2706e+00, -3.0814e+00, -2.5181e+00, -3.4957e+00, -3.7042e+00, -2.8507e+00, -6.0480e-01, 9.5230e-01]], [[ 1.0961e+00, -2.4749e+00, -2.9166e+00, -2.2142e+00, -2.3099e+00, -2.6110e+00, -2.2064e+00, -2.3231e+00, -1.6902e+00, -2.8127e+00, -3.6220e+00, -4.5381e+00, -1.5090e+00, -2.2113e+00]], [[-1.0391e+00, -3.0415e+00, -3.6241e+00, -3.1270e+00, -3.7903e+00, -5.0604e+00, -4.5236e+00, -3.2338e+00, -3.7886e+00, -3.8232e+00, -5.3139e+00, -5.4140e+00, -3.8503e+00, -4.9803e+00]], [[ 1.3761e+00, -1.8568e+00, -2.0366e+00, -2.6441e+00, -2.3188e+00, -3.0142e+00, -2.3627e+00, -1.4519e+00, -2.6881e+00, -1.7390e+00, -3.6119e+00, -3.6485e+00, -1.0389e+00, -7.6239e-01]], [[-7.6221e+00, -1.4024e+01, -1.7546e+01, -1.6116e+01, -2.3093e+01, -2.0162e+01, -1.9664e+01, -4.8419e+00, -8.8095e+00, -1.6516e+01, -1.1274e+01, -1.4302e+01, 7.0494e+00, -1.9931e+00]]]]) attn_weights tensor([[[[ 1.8755e+00, -7.9492e+00, -5.8028e+00, -4.9400e+00, -6.0634e+00, -4.7616e+00, -1.7924e+00, -1.2129e+00, -1.9850e+00, -3.4526e+00, -4.1676e+00, -5.1562e+00, -3.5986e+00, -2.5380e+00]], [[ 3.8377e+00, -1.2773e+01, -9.2870e+00, -9.2289e+00, -1.1902e+01, -6.3842e+00, 3.6981e-01, -3.9689e+00, -5.4462e+00, -8.8231e+00, -9.4786e+00, -9.8071e+00, -6.7856e+00, -2.1939e+00]], [[ 2.6833e-01, -3.1154e+00, -4.2869e+00, -4.7368e+00, -3.0939e+00, -4.3145e+00, -3.3316e+00, -2.9254e+00, -1.9134e+00, -2.6149e+00, -1.0456e+00, -6.2934e-01, -4.7598e-01, -3.3805e+00]], [[-4.3568e-01, -1.1456e+00, -1.5182e+00, -1.4292e+00, -1.3403e+00, -2.4101e+00, -2.0430e+00, -8.4515e-01, 1.0998e-01, -6.6435e-01, 3.4072e-01, -7.7711e-01, -1.0400e+00, -2.1749e+00]], [[-2.1417e-01, -4.5884e+00, -4.9250e+00, -4.8012e+00, -5.0089e+00, -4.2409e+00, -3.6151e+00, -2.1366e+00, -3.0584e+00, -3.2800e+00, -1.8232e+00, -1.8583e+00, -1.5428e+00, -2.1613e+00]], [[ 2.0550e+00, -8.1451e+00, -4.6190e+00, -6.9864e+00, -7.9057e+00, -3.3074e+00, 2.9985e+00, -2.0277e+00, -6.5695e-01, -5.6120e+00, -5.5248e+00, -5.9860e+00, -4.5457e+00, -2.1608e+00]], [[ 1.5467e+00, -6.0543e+00, -7.7115e+00, -8.7676e+00, -6.8558e+00, -3.7380e+00, -7.5238e+00, -5.4985e+00, -7.0336e+00, -8.3353e+00, -4.1330e+00, -4.0721e+00, 1.4328e-01, -1.1336e+00]], [[ 1.1948e+00, -5.0665e+00, -5.9927e+00, -6.1345e+00, -4.4994e+00, -4.5993e+00, -3.1989e+00, -4.0642e+00, -4.6640e+00, -5.0904e+00, -2.4209e+00, -2.0609e+00, -1.4510e+00, -2.2582e+00]], [[ 5.5183e-01, -6.7442e+00, -5.3048e+00, -5.4259e+00, -5.8587e+00, -5.0462e+00, -5.8944e-01, -2.1035e+00, -1.1874e+00, -3.2124e+00, -4.4575e+00, -4.6773e+00, -4.8902e+00, -3.5479e+00]], [[ 1.0398e+00, -3.4443e+00, -4.5958e+00, -4.2110e+00, -3.4438e+00, -2.4984e+00, -5.4973e-01, -1.3008e+00, -3.5850e+00, -4.4014e+00, -3.9952e+00, -3.3560e+00, -3.8009e+00, -2.7843e+00]], [[ 2.9959e+00, -1.4221e-02, -1.3514e+00, -8.2915e-01, -2.3135e-01, 2.4918e+00, 4.5386e-01, 1.1557e+00, -6.2680e-01, -7.1893e-01, -1.2598e+00, 1.7403e-01, -6.5464e-01, 2.5676e+00]], [[ 7.1618e-01, -3.1745e+00, -3.3139e+00, -3.2826e+00, -2.6707e+00, -1.6735e+00, -2.4320e+00, -1.9258e+00, -2.7268e+00, -2.9672e+00, -2.3631e+00, -1.5461e+00, -1.9002e+00, -1.3007e+00]]], [[[ 2.3376e+00, -7.0176e+00, -5.4957e+00, -6.1027e+00, -3.8543e+00, -1.4446e+00, -1.5212e+00, -2.4044e+00, -2.1210e+00, -5.0827e+00, -6.3748e+00, -4.7937e+00, -3.1524e+00, -1.4585e+00]], [[ 4.7557e+00, -1.4729e+01, -1.0464e+01, -1.1536e+01, -3.2480e+00, -1.5606e+00, -9.8077e+00, -1.0993e+01, -8.9458e+00, -9.0924e+00, -1.1701e+01, -5.7159e+00, -3.8557e+00, -1.1646e+00]], [[ 3.0367e-01, -4.4995e+00, -3.7789e+00, -4.4760e+00, -4.4067e+00, -4.3620e+00, -3.8848e+00, -5.0995e+00, -4.1969e+00, -3.1674e+00, -4.0211e+00, -1.5825e+00, -2.8378e+00, -4.1698e+00]], [[ 1.8771e-02, -1.4132e+00, -2.0426e+00, -2.4806e+00, -3.0441e+00, -2.7606e+00, -2.6577e+00, -2.2285e+00, -1.0494e+00, -1.3322e+00, -1.8007e+00, -1.0515e+00, -1.9302e+00, -1.5987e+00]], [[ 5.9038e-02, -4.9226e+00, -5.5381e+00, -7.1152e+00, -5.5871e+00, -3.3680e+00, -2.7492e+00, -3.4780e+00, -3.1926e+00, -3.9989e+00, -5.0958e+00, -2.9800e+00, -2.8905e+00, -2.7492e+00]], [[ 1.8739e+00, -7.1815e+00, -5.4342e+00, -5.3172e+00, -2.1299e+00, -1.6398e+00, -4.7777e+00, -2.4820e+00, -2.1096e+00, -3.9488e+00, -5.6904e+00, -2.8703e+00, -4.4301e+00, -3.2112e+00]], [[ 6.9447e-01, -4.7962e+00, -5.0941e+00, -4.9479e+00, -4.1166e+00, -3.0576e+00, -3.2012e+00, -2.9608e+00, -2.3604e+00, -3.0749e+00, -3.8409e+00, 1.5599e+00, 8.4457e-01, -8.4343e-01]], [[ 8.6510e-01, -3.8275e+00, -5.4641e+00, -4.7661e+00, -3.6121e+00, -3.5267e+00, -1.6270e+00, -3.8505e+00, -3.4664e+00, -4.1831e+00, -3.2174e+00, 5.3545e-01, -3.0675e-01, 4.3604e-03]], [[ 7.0184e-01, -5.3045e+00, -4.1403e+00, -6.4495e+00, -1.3285e+00, -2.1199e-01, -7.3990e-01, -1.0542e+00, -9.0283e-01, -2.8347e+00, -5.8552e+00, -1.4401e+00, -1.8701e+00, -1.9625e+00]], [[ 1.0410e+00, -3.1383e+00, -3.9290e+00, -4.0410e+00, -3.2488e+00, -2.5884e+00, -2.1754e+00, -2.8579e+00, -3.4223e+00, -4.2768e+00, -4.9241e+00, -3.5015e+00, -3.4947e+00, -4.2471e+00]], [[ 1.8240e+00, -9.9955e-01, -4.2455e-01, -4.6973e-01, -6.5621e-02, -5.2424e-01, 1.5920e+00, 1.6800e+00, -8.0253e-01, 1.6961e-01, -7.1661e-01, -1.5227e-01, -3.0999e-01, 2.4400e-01]], [[ 1.3297e+00, -4.1461e+00, -4.0291e+00, -2.6193e+00, -1.6572e+00, -4.3262e+00, -4.1934e+00, -2.9011e+00, -2.6683e+00, -2.9334e+00, -1.9034e+00, -2.4914e+00, -1.6620e+00, -2.3710e-01]]], [[[ 2.4551e+00, -6.3033e+00, -4.3400e+00, -4.6289e+00, -3.8860e+00, -3.5637e+00, -4.6230e+00, -3.8188e+00, -3.5989e+00, -4.5651e+00, -6.3933e+00, -5.3092e+00, -2.6325e+00, -2.7874e+00]], [[ 5.1061e+00, -1.4836e+01, -1.1494e+01, -9.9395e+00, -8.5630e+00, -6.9546e+00, -1.0950e+01, -1.4099e+01, -1.1388e+01, -1.2370e+01, -1.1972e+01, -1.2385e+01, -6.1476e+00, -7.2806e-01]], [[ 3.9161e-01, -5.5568e+00, -3.7567e+00, -4.0587e+00, -5.3254e+00, -4.9749e+00, -4.5013e+00, -6.0976e+00, -4.4813e+00, -2.8162e+00, -2.0924e+00, -2.2766e+00, -1.6504e+00, -3.5717e+00]], [[ 2.7858e-02, -1.8889e+00, -2.4281e+00, -2.7508e+00, -3.7648e+00, -2.5920e+00, -3.2404e+00, -2.1915e+00, -1.4077e+00, -9.4687e-01, -1.6661e+00, -2.6540e+00, -2.2828e+00, -2.8711e+00]], [[ 9.0352e-02, -4.7105e+00, -5.5931e+00, -4.8077e+00, -6.2656e+00, -4.1123e+00, -4.0768e+00, -4.5445e+00, -5.7799e+00, -4.0187e+00, -4.1846e+00, -3.7393e+00, -9.8601e-02, -3.4811e+00]], [[ 2.6367e+00, -9.5255e+00, -5.4318e+00, -5.2837e+00, -4.7296e+00, -2.4275e+00, -6.0618e+00, -6.1423e+00, -3.0799e+00, -5.5573e+00, -5.7487e+00, -6.3960e+00, -2.7103e+00, -2.5527e+00]], [[ 9.6524e-01, -6.1793e+00, -6.5081e+00, -4.2854e+00, -4.6224e+00, -6.2029e+00, -7.1940e+00, -5.3070e+00, -6.0575e+00, -4.5880e+00, -3.5648e+00, -1.4340e+00, 1.0870e+00, -3.1830e+00]], [[ 1.6125e+00, -4.8500e+00, -5.7011e+00, -6.5796e+00, -6.7896e+00, -4.2616e+00, -2.9824e+00, -4.1391e+00, -8.0377e+00, -4.7846e+00, -3.2077e+00, -1.6307e+00, 2.3502e+00, -4.0923e+00]], [[ 1.3337e+00, -6.2633e+00, -4.2873e+00, -5.2716e+00, -5.0919e+00, -2.3229e+00, -3.6157e+00, -3.9670e+00, -4.0326e+00, -4.5027e+00, -5.4957e+00, -6.1728e+00, -2.4671e+00, -2.4954e+00]], [[ 1.3298e+00, -3.7042e+00, -4.4245e+00, -4.4086e+00, -3.3527e+00, -3.0627e+00, -2.3634e+00, -3.0984e+00, -3.5221e+00, -4.6239e+00, -4.9483e+00, -4.8257e+00, -4.0889e+00, -5.0406e+00]], [[ 1.8517e+00, -1.1655e+00, -1.8187e+00, -1.4587e+00, -1.6256e+00, -6.5658e-01, -7.0228e-01, -2.9125e-01, -2.9680e+00, -1.2607e+00, -1.1588e+00, -1.8099e+00, -8.4597e-01, -2.1597e+00]], [[ 1.0996e+00, -3.3705e+00, -3.6539e+00, -3.5885e+00, -3.2621e+00, -4.3808e+00, -4.5597e+00, -2.9532e+00, -3.4194e+00, -3.5932e+00, -3.5541e+00, -2.2862e+00, -1.9858e+00, -6.3800e-01]]], [[[ 1.9371e+00, -3.8668e+00, -5.2013e+00, -5.3467e+00, -1.8946e+00, -2.5682e+00, -4.3899e+00, -4.3374e+00, -4.4209e+00, -4.2910e+00, -4.6868e+00, -4.4071e+00, -3.4865e+00, -3.4659e+00]], [[ 4.1531e+00, -1.3203e+01, -1.2098e+01, -1.1024e+01, -5.1153e+00, -4.5250e+00, -9.2932e+00, -1.0546e+01, -6.8138e+00, -4.2517e+00, -8.9847e+00, -7.0614e+00, -5.2010e+00, -2.1374e+00]], [[ 6.4970e-01, -4.0174e+00, -4.9510e+00, -6.2314e+00, -4.8848e+00, -3.6543e+00, -3.6456e+00, -4.9831e+00, -4.6834e+00, -4.2873e+00, -3.6094e+00, -2.3359e+00, -2.1807e+00, -3.7931e+00]], [[ 5.7604e-02, -1.8206e+00, -3.4266e+00, -3.6244e+00, -4.1105e+00, -3.0796e+00, -3.2892e+00, -3.3570e+00, -4.3128e+00, -3.5892e+00, -3.5121e+00, -1.2810e+00, -1.0523e+00, -2.2060e+00]], [[ 1.3206e-01, -5.9042e+00, -7.2210e+00, -7.3251e+00, -4.6491e+00, -4.8319e+00, -3.1659e+00, -3.7966e+00, -4.2136e+00, -3.8111e+00, -3.8848e+00, -2.5942e+00, -3.3123e+00, -4.0969e+00]], [[ 1.5396e+00, -7.6695e+00, -5.3194e+00, -8.0129e+00, -4.9637e+00, -2.9824e+00, -3.8134e+00, -3.1561e+00, -2.7509e+00, -2.8170e+00, -4.7766e+00, -2.2586e+00, -2.5879e+00, -2.3449e+00]], [[ 1.1441e+00, -7.2542e+00, -6.9963e+00, -7.9773e+00, -8.2194e+00, -5.5247e+00, -5.4869e+00, -5.6929e+00, -4.8320e+00, -4.5793e+00, -4.6751e+00, -1.4017e+00, -1.7817e-01, -1.7361e+00]], [[ 8.2765e-01, -4.8173e+00, -6.4614e+00, -6.7950e+00, -5.1748e+00, -4.3696e+00, -2.3719e+00, -4.6321e+00, -4.8428e+00, -3.0658e+00, -2.6102e+00, -3.8723e+00, -4.2449e+00, -5.0460e+00]], [[ 8.0846e-01, -5.5881e+00, -5.1801e+00, -7.8876e+00, -4.1259e+00, -2.4489e+00, -2.8538e+00, -2.6426e+00, -1.9901e+00, -1.7450e+00, -2.9678e+00, -1.2367e+00, -2.5789e+00, -3.1013e+00]], [[ 8.2803e-01, -3.7207e+00, -3.2426e+00, -2.5728e+00, -1.7617e+00, -2.3300e+00, -1.7185e+00, -1.4662e+00, -2.1923e+00, -3.4028e+00, -2.9255e+00, -1.9772e+00, -2.2577e+00, -2.4934e+00]], [[ 1.7610e+00, -1.2852e+00, -4.1986e+00, -2.9181e+00, -2.3971e+00, 4.3731e-01, 9.0097e-01, 1.0198e+00, -5.5512e-01, -1.8403e+00, -1.0119e-01, -8.2900e-02, -6.5953e-01, -7.2699e-01]], [[ 1.1330e+00, -4.2685e+00, -3.7976e+00, -1.7560e+00, -2.7949e+00, -2.7276e+00, -3.9751e+00, -3.3301e+00, -2.2017e+00, -3.8230e+00, -3.5273e+00, -2.6648e+00, -1.6781e+00, 7.3415e-01]]], [[[ 2.7854e+00, -3.1666e+00, -4.1792e+00, -4.0403e+00, -4.3468e+00, -1.6733e+00, -1.9007e+00, -2.6799e+00, -4.1323e+00, -3.7675e+00, -3.1528e+00, -3.2897e+00, -4.2899e+00, -3.1105e+00]], [[ 4.0573e+00, -6.7628e+00, -7.7657e+00, -7.2606e+00, -7.7482e+00, -3.1439e+00, -8.4968e+00, -8.4080e+00, -5.1423e+00, -6.6025e+00, -4.8459e+00, -8.5264e+00, -7.5648e+00, -1.7756e+00]], [[ 4.5029e-01, -2.1703e+00, -3.6354e+00, -3.3728e+00, -2.7308e+00, -2.9143e+00, -3.5482e+00, -3.6050e+00, -4.2593e+00, -3.8356e+00, -4.2537e+00, -4.6389e+00, -2.5278e+00, -4.9005e+00]], [[ 5.7164e-01, -5.0881e-01, -1.5943e+00, -1.6804e+00, -3.0160e+00, -2.8532e+00, -3.2681e+00, -2.5212e+00, -3.3939e+00, -4.5051e+00, -4.5473e+00, -3.9951e+00, -1.4381e+00, -2.2913e+00]], [[ 1.5848e-01, -3.4178e+00, -3.6900e+00, -3.6490e+00, -3.1207e+00, -4.1473e+00, -3.2779e+00, -3.0989e+00, -2.5648e+00, -3.4805e+00, -4.6404e+00, -3.1425e+00, -2.1116e+00, -4.2195e+00]], [[ 2.3052e+00, -6.3230e+00, -3.2402e+00, -5.8945e+00, -5.0421e+00, -3.4199e+00, -5.0312e+00, -4.3880e+00, -2.7290e+00, -4.8849e+00, -3.5138e+00, -6.0726e+00, -2.8414e+00, -1.7193e+00]], [[ 8.3106e-01, -6.9729e+00, -6.7473e+00, -7.3063e+00, -7.2030e+00, -5.7954e+00, -5.8166e+00, -4.7985e+00, -5.3943e+00, -5.5458e+00, -4.7890e+00, -4.1543e+00, -1.9685e+00, -2.5313e+00]], [[ 1.3476e+00, -2.9038e+00, -3.4370e+00, -5.9156e+00, -4.8722e+00, -5.3071e+00, -2.8352e+00, -2.2984e+00, -3.1036e+00, -4.3867e+00, -5.2079e+00, -3.6211e+00, -2.4486e+00, -2.6058e+00]], [[ 1.0579e+00, -3.1584e+00, -3.3383e+00, -4.3659e+00, -4.1225e+00, -4.2064e+00, -5.2956e+00, -5.1863e+00, -4.0003e+00, -4.8138e+00, -4.0315e+00, -5.4728e+00, -4.2922e+00, -3.8804e+00]], [[ 1.0271e+00, -3.1183e+00, -3.1054e+00, -2.8515e+00, -3.0953e+00, -3.6638e+00, -3.8793e+00, -2.4135e+00, -2.7936e+00, -3.8739e+00, -4.5698e+00, -4.8876e+00, -2.0320e+00, -2.9471e+00]], [[ 2.6081e+00, -1.4557e+00, -2.0104e+00, -1.8457e+00, -2.1771e+00, -1.8716e+00, -8.8447e-01, 1.4874e-01, -1.5305e+00, -2.6405e+00, -3.4055e+00, -2.2566e+00, 4.1913e-01, -1.1389e+00]], [[ 1.1639e+00, -3.4724e+00, -3.2683e+00, -2.7944e+00, -3.1415e+00, -1.0677e+00, -3.6223e+00, -2.1812e+00, -4.2213e+00, -5.2077e+00, -4.1538e+00, -4.5196e+00, -1.7438e+00, -1.7599e+00]]]]) attn_weights tensor([[[[-1.4032e+00, -3.5924e+00, -3.3780e+00, -3.8782e+00, -2.9062e+00, -4.8788e+00, -4.1327e+00, -3.4692e+00, -1.8671e+00, -2.2529e+00, -9.9491e-01, -7.4557e-01, -1.1029e+00, -3.6736e+00]], [[ 7.0542e-01, -4.9520e+00, -4.9953e+00, -5.1844e+00, -5.7955e+00, -4.9647e+00, -1.9560e+00, -1.7526e+00, -3.2306e+00, -4.6870e+00, -4.7509e+00, -4.2014e+00, -1.9963e+00, -2.7624e+00]], [[ 2.6272e-01, -2.5566e+00, -2.6375e+00, -3.2286e+00, -3.1253e+00, -3.5142e+00, -3.0821e+00, -2.1591e+00, -2.4461e+00, -3.3339e+00, -2.2017e+00, -2.6310e+00, -2.8798e+00, -2.8070e+00]], [[ 3.4700e-01, -3.4250e+00, -4.7709e+00, -4.2430e+00, -3.6848e+00, -4.0255e+00, -3.3264e+00, -2.7363e+00, -3.0228e+00, -3.2186e+00, -3.0809e+00, -2.7993e+00, -2.2617e+00, -3.7382e+00]], [[ 1.6818e+00, -2.4564e+00, -2.9207e+00, -3.1158e+00, -2.7722e+00, -1.9756e+00, -8.1120e-01, -1.1769e+00, -2.5316e+00, -2.7276e+00, -2.9231e+00, -1.9669e+00, -1.6341e+00, -1.4385e+00]], [[-4.3404e-01, -3.9949e+00, -4.6117e+00, -4.7296e+00, -4.9017e+00, -4.7998e+00, -4.3497e+00, -3.3750e+00, -2.9151e+00, -3.2864e+00, -2.8892e+00, -3.0480e+00, -3.0255e+00, -3.0625e+00]], [[ 2.2986e+00, -3.6237e+00, -3.7632e+00, -4.0533e+00, -2.8825e+00, -9.2677e-01, -5.8807e-01, -1.5916e+00, -2.6618e+00, -3.2244e+00, -2.5943e+00, -2.1594e+00, -2.2759e+00, -1.2595e-01]], [[ 2.4593e-01, -3.8282e+00, -4.4638e+00, -4.2576e+00, -4.3479e+00, -3.6775e+00, -2.0603e+00, -3.9878e+00, -4.6885e+00, -3.9061e+00, -3.0457e+00, -2.9936e+00, -2.1906e+00, -2.0889e+00]], [[-8.4165e-01, -6.3236e+00, -6.7132e+00, -6.9245e+00, -5.6615e+00, -6.4510e+00, -6.0726e+00, -5.7570e+00, -4.5181e+00, -4.2912e+00, -2.4534e+00, -2.5891e+00, -2.1559e+00, -4.0556e+00]], [[ 4.5336e+00, -1.0996e+01, -4.7937e+00, -7.2942e+00, -5.4606e+00, -1.7576e+00, 3.6794e+00, -1.3530e+00, -1.4273e-01, -4.8772e+00, -3.0157e+00, -5.6837e+00, -3.5791e+00, -2.5569e+00]], [[ 2.9293e+00, -3.7860e+00, -2.9805e+00, -2.8325e+00, -2.0575e+00, -2.2177e+00, -9.1196e-01, -1.0974e+00, -6.0160e-01, -1.1113e+00, -8.1523e-01, -1.4330e+00, -1.4004e+00, -1.2311e+00]], [[-9.3657e-01, -3.8691e+00, -3.8894e+00, -3.8315e+00, -3.9641e+00, -4.5422e+00, -3.3568e+00, -2.8377e+00, -2.3053e+00, -2.3495e+00, -1.2720e+00, -1.4649e+00, -1.3554e+00, -2.8906e+00]]], [[[-1.4658e+00, -2.9166e+00, -2.6809e+00, -2.5918e+00, -4.3047e+00, -4.0553e+00, -3.7528e+00, -3.9557e+00, -2.8350e+00, -6.3223e-01, -1.3206e+00, -4.6922e-01, -1.7551e+00, -2.7606e+00]], [[ 1.4621e-01, -3.9881e+00, -5.4867e+00, -6.5936e+00, -3.6043e+00, -2.5928e+00, -1.1021e+00, -3.3261e+00, -4.3359e+00, -5.6743e+00, -7.3620e+00, -3.8929e+00, -3.5399e+00, -5.0524e+00]], [[ 4.8475e-01, -3.5189e+00, -2.8447e+00, -3.9043e+00, -3.6532e+00, -3.6842e+00, -3.2724e+00, -2.5398e+00, -2.6002e+00, -2.6438e+00, -4.0639e+00, -3.4047e+00, -3.4725e+00, -4.1013e+00]], [[ 4.4098e-01, -2.6862e+00, -4.5102e+00, -4.2349e+00, -3.0128e+00, -2.8438e+00, -2.0659e+00, -2.0535e+00, -2.5091e+00, -4.4824e+00, -4.6205e+00, -3.3743e+00, -3.2938e+00, -4.0431e+00]], [[ 1.1697e+00, -2.0040e+00, -2.0081e+00, -2.0966e+00, -2.0666e+00, -2.6064e+00, -1.4711e+00, -1.8523e+00, -2.3959e+00, -2.4691e+00, -2.5992e+00, -1.1367e+00, -1.8023e+00, -2.2514e+00]], [[-6.2513e-01, -4.6820e+00, -5.1708e+00, -5.4342e+00, -5.0052e+00, -4.5152e+00, -4.8036e+00, -4.6842e+00, -4.0524e+00, -3.6667e+00, -3.9861e+00, -3.8577e+00, -2.8960e+00, -3.0610e+00]], [[ 2.2530e+00, -3.9057e+00, -3.2285e+00, -3.0979e+00, -2.0323e+00, -2.5288e+00, -3.0812e+00, -2.1436e+00, -1.9163e+00, -2.2367e+00, -2.4213e+00, -2.4136e+00, -9.9797e-01, 1.6549e-01]], [[-5.5923e-01, -3.2901e+00, -4.1812e+00, -4.3065e+00, -3.9138e+00, -2.3803e+00, -1.5948e+00, -2.7833e+00, -3.4163e+00, -4.2633e+00, -4.2758e+00, -3.2606e+00, -3.0726e+00, -3.0250e+00]], [[-1.6161e+00, -6.0106e+00, -5.6010e+00, -7.1115e+00, -6.5675e+00, -6.3351e+00, -5.2418e+00, -5.2229e+00, -4.6325e+00, -4.0582e+00, -5.3234e+00, -1.4309e+00, -2.3777e+00, -4.7707e+00]], [[ 5.5435e+00, -9.5739e+00, -6.6838e+00, -5.3311e+00, -7.1638e-01, -8.3165e-01, -9.2072e+00, -7.7572e+00, -6.3957e+00, -5.4683e+00, -5.9027e+00, -2.6581e+00, -2.4409e+00, -4.4331e-01]], [[ 3.0309e+00, -4.4031e+00, -3.2253e+00, -3.3666e+00, -2.8588e+00, -2.2640e+00, -1.3257e+00, -2.2989e+00, -1.6728e+00, -1.5360e+00, -2.0583e+00, -1.1328e+00, -1.1988e+00, -1.7637e+00]], [[-5.5644e-01, -4.2020e+00, -4.8281e+00, -4.9683e+00, -4.9804e+00, -4.9405e+00, -3.5672e+00, -4.3016e+00, -3.3898e+00, -3.5624e+00, -3.5422e+00, -1.1181e+00, -1.3463e+00, -2.0199e+00]]], [[[-1.0503e+00, -5.5866e+00, -4.1709e+00, -4.3516e+00, -5.6820e+00, -3.8454e+00, -3.8106e+00, -4.8852e+00, -4.2524e+00, -2.2511e+00, -2.5355e+00, -1.6964e+00, -9.7581e-01, -3.4897e+00]], [[ 1.4972e+00, -5.4403e+00, -6.9567e+00, -6.7041e+00, -5.5407e+00, -5.1814e+00, -4.9609e+00, -5.8871e+00, -7.8314e+00, -6.1158e+00, -7.8018e+00, -7.4976e+00, -4.1809e+00, -2.9871e+00]], [[ 3.3225e-01, -3.4558e+00, -2.8278e+00, -3.5994e+00, -3.5172e+00, -3.6746e+00, -3.7379e+00, -2.8751e+00, -3.1504e+00, -2.9258e+00, -3.9792e+00, -3.5143e+00, -4.2063e+00, -3.8344e+00]], [[ 2.8831e-01, -3.0235e+00, -4.7588e+00, -4.9665e+00, -3.7926e+00, -2.7902e+00, -2.6945e+00, -1.9958e+00, -2.2854e+00, -3.3824e+00, -4.4705e+00, -4.4527e+00, -4.1630e+00, -4.6164e+00]], [[ 1.2275e+00, -1.8886e+00, -1.5254e+00, -1.9091e+00, -1.6996e+00, -2.8518e+00, -2.2089e+00, -1.2943e+00, -2.3265e+00, -1.4591e+00, -1.5626e+00, -1.4699e+00, -1.4950e+00, -2.1648e+00]], [[-5.1275e-01, -4.2635e+00, -5.3813e+00, -5.7890e+00, -5.5481e+00, -5.9705e+00, -4.8136e+00, -4.7828e+00, -3.9965e+00, -3.9384e+00, -5.5340e+00, -4.4867e+00, -3.9429e+00, -3.6301e+00]], [[ 2.0996e+00, -2.8382e+00, -2.1858e+00, -2.4178e+00, -2.5616e+00, -3.5607e+00, -3.7064e+00, -2.9203e+00, -1.2432e+00, -1.7074e+00, -2.3819e+00, -1.9890e+00, -1.6292e+00, -6.3696e-01]], [[-2.7183e-01, -3.2305e+00, -4.4090e+00, -4.1178e+00, -3.6907e+00, -2.5622e+00, -1.8226e+00, -2.8914e+00, -3.9592e+00, -4.1566e+00, -4.4505e+00, -4.8517e+00, -3.3102e+00, -3.5082e+00]], [[-9.4832e-01, -6.1673e+00, -4.4934e+00, -5.2317e+00, -5.4687e+00, -6.4776e+00, -6.2381e+00, -5.9639e+00, -3.8090e+00, -2.8625e+00, -4.0662e+00, -2.4823e+00, -1.8642e+00, -3.5032e+00]], [[ 4.9435e+00, -1.1229e+01, -6.9710e+00, -5.5684e+00, -2.8132e+00, -2.3307e+00, -7.6946e+00, -7.4082e+00, -7.5511e+00, -7.5971e+00, -7.3771e+00, -8.1380e+00, -3.8685e+00, -4.4244e-01]], [[ 3.0681e+00, -2.9534e+00, -2.8409e+00, -2.7905e+00, -1.7182e+00, -2.3086e+00, -1.1709e+00, -1.6313e+00, -7.9658e-01, -3.7981e-01, -1.0249e+00, -1.5096e+00, -9.5688e-01, -5.0785e-01]], [[-4.2570e-01, -4.5012e+00, -4.7839e+00, -5.3496e+00, -5.8013e+00, -5.1258e+00, -4.2623e+00, -4.6907e+00, -3.2277e+00, -3.2482e+00, -3.4457e+00, -3.3797e+00, -1.8745e+00, -2.7079e+00]]], [[[-7.0303e-01, -5.5041e+00, -5.7184e+00, -5.4512e+00, -4.5868e+00, -1.4127e+00, -2.2360e+00, -5.1037e+00, -4.7243e+00, -3.1847e+00, -3.2426e+00, -2.5336e+00, -9.5771e-01, -2.6199e+00]], [[-1.0308e-01, -5.0079e+00, -4.6079e+00, -6.8818e+00, -4.5761e+00, -2.9665e+00, -3.2591e+00, -4.6745e+00, -3.2708e+00, -2.6095e+00, -3.3816e+00, -4.0862e+00, -2.8200e+00, -3.2414e+00]], [[ 2.5874e-01, -2.9387e+00, -2.5167e+00, -2.7414e+00, -3.4533e+00, -3.5146e+00, -3.4439e+00, -2.6988e+00, -3.0465e+00, -3.9808e+00, -3.5573e+00, -2.0924e+00, -2.4850e+00, -3.0072e+00]], [[-2.3654e-01, -2.4191e+00, -3.2992e+00, -3.1403e+00, -1.7437e+00, -2.5377e+00, -2.0842e+00, -1.6581e+00, -2.2866e+00, -3.3810e+00, -3.0551e+00, -1.7931e+00, -2.9850e+00, -2.8251e+00]], [[ 1.0474e+00, -7.9002e-01, -1.6532e+00, -1.7237e+00, -1.3672e+00, -2.8239e+00, -1.5627e+00, -1.2459e+00, -1.5977e+00, -3.2105e+00, -2.7363e+00, -1.1419e+00, -2.0705e+00, -2.3068e+00]], [[-8.6429e-01, -4.2230e+00, -5.1674e+00, -5.2771e+00, -5.0934e+00, -4.5791e+00, -3.9758e+00, -5.0934e+00, -4.7994e+00, -3.9056e+00, -3.3399e+00, -3.5649e+00, -3.8649e+00, -3.6515e+00]], [[ 2.0867e+00, -3.5818e+00, -2.8127e+00, -2.1640e+00, -2.5336e+00, -2.6112e+00, -2.9811e+00, -2.4629e+00, -2.2106e+00, -2.9056e+00, -3.3059e+00, -2.1480e+00, -1.2452e+00, 6.4159e-02]], [[-7.5093e-01, -3.8490e+00, -4.8997e+00, -3.8592e+00, -2.2873e+00, -1.8780e+00, -1.3657e+00, -2.3068e+00, -2.3496e+00, -9.7975e-01, -1.4983e+00, -2.6660e+00, -2.9688e+00, -3.0618e+00]], [[-1.4229e+00, -5.7818e+00, -6.0392e+00, -8.4775e+00, -7.4530e+00, -5.3279e+00, -5.2016e+00, -5.8315e+00, -7.1025e+00, -5.3403e+00, -4.8843e+00, -3.3103e+00, -2.4321e+00, -4.8461e+00]], [[ 4.5777e+00, -8.7551e+00, -8.4220e+00, -7.6245e+00, -1.9599e+00, -2.3321e+00, -5.8624e+00, -4.9398e+00, -4.8598e+00, -1.7074e+00, -8.3173e+00, -4.4136e+00, -4.3932e+00, -2.4360e+00]], [[ 2.8783e+00, -2.8435e+00, -2.4496e+00, -2.5098e+00, -2.0537e+00, -1.8126e+00, -1.2084e+00, -1.4043e+00, -1.7001e+00, -2.6548e+00, -1.5963e+00, -7.9044e-01, -1.2090e+00, -8.8937e-01]], [[-3.2419e-01, -3.1983e+00, -5.6184e+00, -6.3054e+00, -5.5136e+00, -5.5131e+00, -3.5810e+00, -5.1473e+00, -5.4921e+00, -4.9520e+00, -3.9096e+00, -2.7378e+00, -2.0246e+00, -3.5865e+00]]], [[[ 3.3949e-01, -3.7948e+00, -3.6829e+00, -4.0360e+00, -3.2049e+00, -4.1716e+00, -2.9716e+00, -5.6252e+00, -5.9200e+00, -6.5697e+00, -5.7420e+00, -5.7444e+00, -4.4351e+00, -4.2589e+00]], [[ 1.2634e+00, -2.6192e+00, -4.8832e+00, -3.4326e+00, -4.0777e+00, -4.8949e+00, -4.8811e+00, -5.0966e+00, -7.5222e+00, -6.4012e+00, -5.8387e+00, -5.8071e+00, -4.2117e+00, -4.1228e+00]], [[ 5.0303e-01, -2.7946e+00, -3.3435e+00, -3.4957e+00, -3.3887e+00, -2.9013e+00, -2.9150e+00, -2.5669e+00, -4.2204e+00, -3.9478e+00, -3.4152e+00, -3.9736e+00, -2.2183e+00, -3.4194e+00]], [[ 5.3206e-01, -1.7457e+00, -2.3376e+00, -2.8456e+00, -2.5536e+00, -3.1019e+00, -1.9163e+00, -2.8481e+00, -3.4453e+00, -3.9826e+00, -3.8717e+00, -4.2864e+00, -1.4132e+00, -2.8133e+00]], [[ 1.4293e+00, -2.8173e-01, -1.6926e+00, -1.4260e+00, -2.2392e+00, -2.4850e+00, -9.3029e-01, -1.4053e+00, -2.3324e+00, -2.8583e+00, -1.4048e+00, -1.0470e+00, -6.0087e-01, -3.6737e-01]], [[-3.0565e-01, -3.1578e+00, -3.6053e+00, -3.9747e+00, -4.1555e+00, -4.0641e+00, -4.3210e+00, -3.5904e+00, -2.7029e+00, -3.8233e+00, -4.5156e+00, -4.3889e+00, -2.5690e+00, -3.3755e+00]], [[ 2.4127e+00, -1.6646e+00, -2.0559e+00, -2.7515e+00, -2.8762e+00, -1.8663e+00, -2.8465e+00, -2.3736e+00, -4.2203e+00, -4.4357e+00, -3.3254e+00, -3.9501e+00, -1.8030e+00, -1.0571e+00]], [[-7.6425e-03, -1.9159e+00, -2.6583e+00, -1.9613e+00, -1.6909e+00, -1.2611e+00, -5.4319e-01, -1.2989e+00, -2.9849e+00, -2.8475e+00, -1.2779e+00, -1.2868e+00, -6.4018e-01, -3.0003e+00]], [[-6.4961e-01, -4.6366e+00, -6.6909e+00, -6.5019e+00, -6.3027e+00, -5.0801e+00, -3.8540e+00, -4.4069e+00, -5.2395e+00, -5.3954e+00, -3.7104e+00, -4.1848e+00, -2.4475e+00, -5.9293e+00]], [[ 4.4445e+00, -4.1234e+00, -2.9119e+00, -3.0755e+00, -5.6334e+00, -2.4130e+00, -6.2895e+00, -5.3467e+00, -2.6946e+00, -7.1282e+00, -4.5588e+00, -8.2326e+00, -5.0205e+00, -2.3851e+00]], [[ 2.5662e+00, -3.8763e+00, -2.7843e+00, -4.4747e+00, -4.2632e+00, -3.3441e+00, -1.8707e+00, -4.0771e+00, -3.7293e+00, -3.9504e+00, -3.1398e+00, -2.3061e+00, -2.4528e+00, -1.6638e+00]], [[ 6.6085e-01, -2.7630e+00, -5.4453e+00, -5.4992e+00, -4.2783e+00, -4.8628e+00, -3.4018e+00, -5.1786e+00, -5.6988e+00, -5.8652e+00, -5.2609e+00, -5.1197e+00, -4.8207e+00, -3.8854e+00]]]]) attn_weights tensor([[[[-0.9931, -5.9427, -6.3060, -5.7598, -4.7639, -6.1035, -6.5186, -4.4901, -4.3661, -3.4461, -2.3765, -1.6666, -0.5866, -3.7307]], [[ 4.4279, -3.0697, -2.6195, -4.8982, -4.0816, -1.6507, -0.1632, -0.7066, -0.1203, -2.1552, -2.5230, -1.2362, -1.3849, 0.2074]], [[ 6.3131, -4.6737, -4.1587, -4.2864, -4.4962, -1.0898, 2.6447, 0.5780, -3.1448, -3.4475, -2.9461, -2.4655, -2.0339, 0.5093]], [[ 0.2923, -4.7702, -4.6511, -5.3793, -5.0988, -3.3192, -2.4893, -2.5646, -3.1044, -4.2179, -2.6475, -2.8109, -2.3621, -1.6733]], [[ 0.2475, -3.8974, -3.9618, -3.8259, -3.6506, -3.8243, -3.3740, -3.8303, -3.0421, -2.6946, -1.4865, -1.5961, -1.4164, -3.1522]], [[ 1.0230, -3.0685, -2.1615, -1.9241, -1.8565, -3.2265, -1.4826, -1.3497, -2.4142, -2.4545, -1.6326, -0.9514, -0.8733, -2.1448]], [[ 1.6380, -3.6535, -3.8006, -4.6374, -4.0770, -2.7567, -1.3074, -2.5524, -2.6402, -3.0370, -3.2138, -2.4586, -2.9303, -1.8770]], [[ 3.1893, -2.8997, -3.2369, -3.9259, -2.7623, -2.3295, -1.4393, 0.1591, -0.3737, -1.7004, -1.0119, -2.5849, -2.7461, -1.4343]], [[ 0.4665, -6.7253, -6.0643, -6.8422, -5.8730, -5.4742, -4.7631, -5.8013, -5.4362, -6.0518, -3.1005, -3.4616, -2.3995, -3.2539]], [[ 0.1379, -2.4754, -2.6818, -3.4521, -4.2634, -3.8807, -2.4275, -1.9051, -1.5075, -2.2548, -1.9168, -2.2976, -2.2735, -2.9479]], [[ 4.5706, -5.7051, -3.4723, -5.3579, -6.5815, -1.8769, 2.9431, -1.0557, -0.1377, -2.6253, -3.9439, -4.1420, -2.5917, -2.3242]], [[ 3.1011, -3.4321, -4.9472, -4.8257, -4.4625, -3.3724, 0.2896, -0.0462, -3.8575, -4.4273, -2.9164, -2.7327, -2.8187, -1.2838]]], [[[-0.5588, -5.2465, -6.0558, -6.2840, -6.7008, -7.4085, -8.0662, -5.6050, -4.3859, -3.8817, -4.2518, -2.8288, -2.2953, -3.2238]], [[ 3.0176, -1.2177, -1.4742, -2.7380, -0.9004, -0.5364, 0.2762, 1.1123, 1.0996, 0.0532, -1.5484, -0.1457, 0.0962, -0.6112]], [[ 6.6745, -4.8198, -4.7871, -5.7955, -0.4764, -0.1712, -3.6798, -4.1106, -3.1452, -4.6605, -6.3182, -0.2980, 0.7471, 1.5298]], [[ 0.3261, -3.5502, -3.2184, -3.6220, -2.9181, -3.4314, -2.6777, -1.7384, -1.1917, -1.9060, -2.7078, -1.6957, -2.1047, -2.3482]], [[ 0.9833, -4.1032, -3.6760, -4.3533, -5.0846, -4.2933, -4.1379, -5.2759, -3.8074, -3.9405, -4.3150, -3.3891, -3.7662, -4.1969]], [[ 1.0477, -1.9121, -2.1307, -2.5744, -3.4431, -4.4673, -2.5679, -2.2730, -2.1522, -3.2445, -3.5430, -3.0996, -2.9379, -3.0459]], [[ 1.5450, -2.6305, -2.6031, -2.9416, -2.3434, -1.7024, -1.5142, -1.9647, -1.7088, -2.2612, -2.6753, -2.6645, -2.2632, -2.9336]], [[ 3.0709, -3.8816, -3.3383, -4.4756, -3.0226, -0.5216, -0.8728, 0.0892, 0.0892, -2.5846, -3.9017, -2.2991, -2.6024, -2.4924]], [[-0.4076, -3.4639, -2.9026, -3.5995, -3.7856, -2.9341, -1.6684, -2.0129, -1.7458, -1.9661, -2.8912, -2.4634, -2.1725, -3.0300]], [[-0.0912, -3.2543, -2.3991, -3.1099, -3.7206, -2.2761, -2.2707, -1.6363, 0.1448, -0.6571, -1.3292, -0.5101, -1.1956, -1.9327]], [[ 4.9654, -4.1040, -4.2558, -5.3524, -0.1990, -0.8131, -3.2183, -3.0610, -3.3585, -4.4882, -6.1039, -1.0136, 0.3810, -0.1625]], [[ 3.2932, -4.2090, -4.3381, -4.2875, -1.4128, -1.0338, -2.1889, -2.4429, -3.7255, -3.6543, -4.5782, -1.5349, -2.5819, -2.3386]]], [[[-0.3401, -8.2257, -7.4520, -6.1090, -7.3734, -7.4800, -7.6080, -7.2130, -6.9543, -5.3579, -4.6832, -3.8568, -1.0214, -4.5762]], [[ 2.9451, -0.1588, -1.2287, -1.8164, -1.4618, -0.9092, -1.0268, -1.8538, -2.4584, -1.2108, -1.6937, -2.6546, -1.0489, -0.7636]], [[ 6.8813, -6.9382, -5.5775, -6.0970, -5.1112, -2.8938, -5.4279, -8.8141, -6.3870, -6.7258, -7.2411, -8.0089, -3.4370, -0.7854]], [[ 0.2651, -4.3903, -3.7043, -3.7836, -3.6998, -2.8964, -2.6710, -2.1491, -0.3504, -1.3745, -1.9147, -2.0589, -1.5786, -3.2813]], [[ 0.9119, -5.6718, -3.8177, -4.8073, -5.4816, -4.5364, -4.7478, -5.0947, -3.0792, -2.5735, -3.3627, -3.2450, -3.0973, -3.2976]], [[ 0.7298, -3.5641, -4.0458, -4.2288, -4.8399, -3.7622, -2.4862, -2.3515, -2.3314, -4.2436, -2.9073, -3.6154, -2.5647, -3.1019]], [[ 1.4930, -2.5530, -3.3958, -2.9766, -2.5697, -2.5341, -2.3984, -2.4335, -2.0887, -3.1699, -3.8468, -4.0820, -3.3125, -3.0780]], [[ 2.9549, -4.9549, -4.3351, -6.5945, -5.4153, -4.6229, -3.9500, -3.5689, -3.0056, -3.9301, -5.1927, -5.5411, -4.5141, -2.0683]], [[-0.6503, -4.7017, -3.9789, -3.5662, -3.5358, -3.1238, -1.8063, -1.9749, -3.7002, -2.3088, -1.7997, -2.1099, -0.0733, -2.6234]], [[-0.1884, -2.3393, -1.9333, -2.9209, -4.0626, -3.7763, -2.9750, -2.0932, -1.0088, -1.2039, -2.2013, -2.4939, -2.3028, -2.8327]], [[ 4.9077, -3.8161, -2.1260, -1.5885, -1.4163, -1.4910, -4.1591, -4.0182, -4.1820, -3.8399, -4.8916, -5.7487, -1.5117, 0.0587]], [[ 2.8867, -3.3222, -3.8915, -4.0857, -3.8846, -2.7872, -4.3622, -4.3758, -5.1006, -3.3091, -3.9732, -3.9637, -2.0282, -2.4934]]], [[[-0.3927, -6.7615, -6.0965, -7.4815, -7.0416, -5.6562, -6.2010, -7.3256, -6.4946, -5.9711, -6.6516, -3.8572, -2.7599, -4.7546]], [[ 2.5583, -1.5054, -2.6936, -4.4852, -3.3296, -1.0118, -0.9190, -0.6628, -1.5280, -2.3749, -1.9056, -0.2378, -0.9357, -1.4924]], [[ 6.4084, -4.6472, -4.1527, -4.8521, -1.1278, -0.2932, -1.8324, -2.1648, -2.0283, 0.0761, -3.4288, -0.2905, -0.9152, 1.1374]], [[ 0.3106, -3.9893, -4.2359, -4.3015, -3.7556, -2.7631, -2.2878, -2.3421, -3.1183, -2.2342, -2.3070, -1.8314, -1.3839, -1.6503]], [[ 1.0782, -5.0099, -4.6008, -5.5418, -4.6951, -3.9429, -3.0897, -4.2524, -5.6138, -4.5802, -4.5025, -2.9566, -3.5267, -4.7916]], [[ 0.5744, -0.6277, -1.8039, -1.3086, -0.9907, -3.6200, -1.2561, -0.0808, -1.7341, -3.1443, -1.9537, -1.3563, -1.8157, -1.4777]], [[ 1.4038, -2.0727, -2.6644, -3.2510, -3.0821, -2.1710, -2.2174, -2.1247, -2.3152, -1.8909, -2.5824, -1.5325, -2.0992, -1.9465]], [[ 3.4401, -1.8536, -2.3536, -3.7961, -2.6076, -1.8873, -1.1829, -0.6651, -1.3623, -0.9086, -1.0283, -0.0308, -1.2163, -1.3789]], [[-0.7106, -5.1052, -4.9755, -5.3630, -4.3483, -2.2873, -0.9909, -2.5380, -3.6545, -3.0096, -1.6786, -2.4435, -0.8244, -2.8730]], [[ 0.2322, -1.6553, -2.2105, -3.6568, -4.3471, -2.8218, -2.7834, -2.5859, -3.8845, -3.3797, -3.3295, -0.2057, -0.0924, -2.0857]], [[ 3.6896, -4.7503, -4.5879, -7.1511, -2.7394, -3.0302, -2.5970, -2.3963, -1.8386, -2.5703, -5.0093, -2.0304, -2.3876, -2.2747]], [[ 3.3480, -3.1412, -3.7291, -2.5123, -0.5884, -2.0820, -3.6214, -3.7649, -3.0929, -2.2024, -4.2413, -2.9207, -3.3007, -1.6108]]], [[[-0.1330, -6.0650, -6.0711, -6.2695, -6.2612, -4.9955, -4.6249, -5.7238, -5.7368, -5.8940, -4.6215, -3.9296, -2.7076, -3.2917]], [[ 4.4593, -2.5965, -1.7911, -3.5788, -3.8289, -2.6370, -1.8938, -3.1832, -3.1239, -2.9674, -2.7230, -2.4884, -1.5741, -0.7985]], [[ 6.2740, -3.5004, -4.1197, -4.4009, -4.5352, -1.5990, -4.8920, -7.0829, -3.8891, -5.5368, -3.7772, -5.8032, -5.3721, -1.8036]], [[ 0.8813, -3.1661, -3.5969, -3.9915, -5.0234, -3.3000, -3.2445, -4.8528, -3.6481, -4.8848, -3.6536, -5.0946, -3.5189, -4.1394]], [[ 1.2179, -2.1814, -2.5254, -2.1501, -2.6603, -5.1278, -3.9838, -4.0785, -5.4529, -6.4227, -6.5125, -6.0819, -2.6148, -2.7546]], [[ 1.5913, -2.7995, -3.2369, -3.5638, -3.1280, -5.6679, -3.1928, -3.6803, -4.0925, -3.7775, -4.7851, -4.8049, -3.3547, -2.4352]], [[ 1.6132, -1.7842, -3.1466, -2.8956, -3.3405, -2.9829, -2.6234, -2.6724, -3.2773, -3.6935, -3.1576, -3.4774, -2.4446, -2.3067]], [[ 3.8714, 0.9657, -1.1157, -2.6611, -2.5628, -1.4490, -2.6953, -3.4760, -4.5243, -5.9436, -4.9454, -5.4079, -3.0925, -2.2402]], [[ 0.7016, -3.2155, -3.0644, -2.5872, -3.7110, -3.4580, -2.4668, -3.2684, -6.1422, -5.4259, -5.1759, -4.4491, -2.8527, -3.9722]], [[ 1.7583, -5.3054, -4.8068, -5.5268, -5.2693, -5.1759, -4.6858, -6.6101, -6.0284, -5.8255, -6.1824, -6.9041, -2.7083, -1.4993]], [[ 5.6492, -3.7993, -3.4111, -5.5770, -4.3440, -1.6417, -3.7301, -5.5327, -5.1068, -5.8575, -3.9000, -5.8364, -4.8127, -3.4091]], [[ 3.3074, 0.1793, -2.3660, -1.3483, -2.8773, 0.2322, -2.5583, -3.7278, -3.6069, -5.8241, -3.4564, -5.7563, -1.9152, -2.0040]]]]) attn_weights tensor([[[[ 1.1182, -2.6332, -3.7504, -3.1122, -3.4214, -3.3427, -2.4598, -2.0486, -2.9727, -2.8585, -3.1713, -3.2023, -3.3873, -3.0932]], [[ 4.1218, -1.0656, -1.3785, -2.0606, -2.6463, -0.6198, 1.3622, 1.1858, 0.2309, -1.0817, -1.8360, -1.0072, -1.1393, 0.2324]], [[ 2.1907, -0.7027, -1.8329, -1.8379, -1.1157, -1.3541, -1.5630, -0.8505, -2.0094, -2.1711, -1.9133, -1.3856, -1.6918, -1.8119]], [[ 2.4742, -2.4100, -2.0310, -1.8961, -1.7515, -0.3840, -0.3532, -0.2489, -0.8198, -1.0047, -2.0731, -1.6040, -1.7752, 0.1440]], [[-0.0884, -5.5987, -6.1097, -5.8040, -4.5711, -4.7681, -3.9927, -4.2321, -5.2877, -4.4253, -2.4904, -1.9767, -0.9113, -3.1021]], [[-1.4163, -3.6465, -3.3785, -3.1618, -3.3264, -4.1301, -4.0930, -2.3970, -1.7164, -1.9122, -1.6802, -2.4127, -2.5147, -2.9841]], [[ 3.2070, -2.8463, -3.5911, -4.3111, -4.0314, -1.4886, -0.1459, -0.8059, -3.1059, -4.4604, -3.0130, -2.2470, -2.5334, -0.1571]], [[-1.2240, -6.2353, -6.6313, -6.1037, -4.5014, -5.0637, -5.1698, -3.8833, -4.3265, -3.5277, -0.1582, -0.5657, -0.5839, -2.6362]], [[ 1.3933, -3.9668, -4.3619, -4.6426, -3.8985, -2.2434, -1.4799, -2.5956, -3.8697, -3.9110, -3.8576, -3.5531, -2.3961, -1.8887]], [[ 1.6284, -4.7738, -4.9947, -5.2538, -4.0639, -1.0949, -1.7501, -3.2403, -3.4653, -3.7673, -2.1595, -2.8232, -1.7066, -0.3826]], [[ 1.0824, -2.6907, -2.5199, -2.8800, -2.8227, -1.5398, -1.0922, -0.9988, -1.7789, -2.3648, -2.2479, -1.9319, -2.2383, -0.8344]], [[ 1.0790, -3.5094, -3.9434, -3.4511, -3.8867, -1.7116, -2.2335, -2.3594, -3.5846, -3.6361, -3.3119, -3.6972, -3.3155, -2.0328]]], [[[ 1.0858, -3.0083, -2.6242, -2.5235, -2.7550, -3.4183, -1.3039, -2.7908, -3.2717, -2.9359, -2.4026, -1.3358, -0.7071, -0.5161]], [[ 5.5723, -1.9988, -2.8555, -3.6883, 1.7053, 2.0187, 0.5792, -0.0657, 0.2741, -2.3982, -3.7505, 0.8532, 1.3796, 2.2784]], [[ 2.3201, -1.1470, -2.5836, -2.9595, -0.7917, -0.5868, -0.6774, -0.3577, -1.5982, -2.1106, -2.3222, -1.4953, -0.9715, -1.5638]], [[ 2.1911, -1.8278, -1.7045, -2.7795, -2.0468, -0.8120, -0.5385, 0.3869, -0.2998, -1.7488, -2.5936, -3.1566, -2.5959, -1.7145]], [[-0.1731, -5.9986, -4.9608, -5.9276, -4.8457, -3.2292, -2.3736, -4.8559, -3.8752, -3.6303, -4.5045, -3.1115, -0.7568, -1.9535]], [[-1.3675, -4.3569, -4.2709, -3.8174, -3.5606, -4.2441, -4.1148, -3.4088, -2.9850, -3.0267, -2.8918, -1.0918, -1.7942, -2.6909]], [[ 3.3093, -4.8872, -3.7089, -5.9811, -2.6496, -2.0873, -1.5688, -3.7017, -3.1821, -4.2478, -6.1490, -3.1435, -2.6293, -1.5962]], [[-0.3663, -6.3802, -5.3579, -6.0680, -5.8961, -4.5416, -4.2425, -4.3005, -2.9886, -2.8188, -3.6474, -3.1358, -0.9943, -2.2540]], [[-0.2914, -2.2611, -3.1498, -3.5944, -3.0259, -0.6367, -0.6943, -0.3897, -1.2939, -2.6643, -3.2065, -2.2884, -1.6577, -1.7983]], [[ 0.8791, -3.1240, -2.9292, -3.2850, -2.0158, -0.4083, -0.1395, -0.7273, -1.7320, -2.0187, -2.6582, -1.9507, -1.7334, -1.7656]], [[ 1.1815, -3.3917, -3.4948, -4.1050, -2.0273, -2.7401, -1.7533, -1.1785, -1.4826, -2.6279, -3.1168, -3.0021, -1.3708, -1.0017]], [[ 0.8069, -3.2272, -3.8342, -3.5996, -3.6599, -2.6339, -2.5403, -2.9446, -3.7310, -4.3772, -4.4337, -4.1449, -4.4158, -4.2989]]], [[[ 1.2949, -2.4971, -2.7252, -2.1572, -2.6966, -4.1781, -1.8472, -2.5286, -3.0179, -2.7123, -2.6492, -2.7712, -2.1116, -2.2465]], [[ 5.6453, -2.6199, -3.5896, -3.6342, -2.9310, -2.0728, -3.0643, -3.7783, -3.9447, -4.0009, -3.3406, -4.6517, -2.6818, -0.9309]], [[ 1.9837, -1.2701, -2.0593, -2.0296, -1.8989, -0.9780, -1.0063, -1.5379, -1.1002, -2.0103, -2.0093, -1.9740, -1.6690, -1.1701]], [[ 2.7061, -1.9371, -2.4571, -3.1615, -2.8788, -4.2410, -2.6539, -2.1766, -2.0757, -3.2461, -3.8925, -4.7506, -3.3350, -2.8089]], [[ 0.0947, -5.8454, -5.0334, -5.3795, -5.9986, -4.3934, -3.5351, -4.4601, -3.6099, -3.6526, -2.5121, -2.4367, -0.6678, -2.4344]], [[-1.5544, -3.5757, -2.8431, -3.4798, -4.8116, -3.5767, -3.2483, -3.1655, -1.8390, -2.2057, -3.0277, -2.6930, -2.2288, -3.3711]], [[ 3.4205, -3.8277, -4.1238, -5.6380, -4.5744, -5.0611, -4.7499, -3.8534, -3.5004, -3.4273, -5.2678, -5.8711, -2.6537, -3.0316]], [[-0.3308, -6.3372, -5.4791, -6.3578, -7.8686, -5.4525, -5.9820, -5.9573, -4.6263, -3.2441, -1.8160, -2.4548, 0.0682, -3.9834]], [[-0.1041, -1.7132, -2.1532, -2.2729, -1.6929, -0.9517, -1.0295, 0.2358, -0.7433, -1.2612, -3.0716, -3.1174, -2.1325, -2.8945]], [[ 0.7213, -3.4711, -2.3761, -3.1253, -2.0335, -1.6722, -0.6975, -1.9483, -3.1622, -1.6112, -2.5231, -3.9735, -2.5502, -3.9810]], [[ 1.1401, -3.1758, -3.9230, -4.1431, -2.8478, -2.6724, -3.2798, -2.7670, -2.5339, -3.2581, -3.8616, -2.6228, -1.5265, -2.1292]], [[ 0.9794, -3.8301, -5.6390, -4.8002, -4.7841, -2.8157, -3.0242, -3.2087, -3.8408, -5.8927, -5.8682, -6.4336, -5.1889, -4.4884]]], [[[ 1.0425, -2.9508, -1.7750, -2.3856, -2.6838, -3.6729, -2.1060, -3.3965, -2.5064, -4.2644, -2.8061, -1.8235, -1.2650, -1.6981]], [[ 4.1491, -3.3541, -3.9117, -5.7114, -1.8799, -1.4076, -0.7957, -1.9722, -0.9505, -1.6184, -0.8992, -1.4977, -2.1514, -1.7500]], [[ 2.1059, -1.2839, -1.7723, -2.5767, -0.9231, -1.2763, -0.8323, -0.9431, -0.5834, -1.0521, -1.3135, 0.3043, -0.6059, -1.5082]], [[ 1.9988, -2.9169, -2.8895, -3.4929, -2.3926, -0.2722, -0.6306, -1.1353, -2.1183, -1.4296, -1.2885, 0.1024, -0.6567, -1.7926]], [[-0.2556, -3.8457, -3.9916, -5.2468, -4.8689, -3.7067, -2.9999, -3.4853, -4.8599, -3.2982, -2.9510, -3.1380, -2.0753, -4.3082]], [[-0.8474, -3.9430, -3.9059, -5.3024, -5.1297, -2.4679, -3.0577, -4.0167, -5.2176, -3.9262, -3.6538, -2.6720, -1.4918, -3.0346]], [[ 1.9566, -4.0495, -3.7646, -5.8187, -2.6592, -1.9939, -1.4754, -1.8150, -1.4781, -2.5171, -2.6554, -1.9489, -1.2421, -2.5522]], [[-0.3671, -6.8234, -5.3335, -6.6311, -5.2458, -2.8587, -2.6844, -4.2015, -4.1640, -4.4134, -3.1291, -2.8695, -0.8196, -2.7073]], [[-0.1331, -2.6572, -3.3520, -3.9961, -3.0691, -1.7037, -1.5500, -1.2546, -2.7731, -1.6007, -1.2438, -2.0323, -1.6848, -2.2982]], [[ 0.5961, -4.1798, -3.7322, -4.0114, -2.3887, -1.3821, -0.7972, -1.4844, -0.6747, -0.8090, -1.2154, -1.7563, -1.2824, -1.7296]], [[ 1.1511, -3.8371, -3.6710, -3.9093, -2.1569, -1.9994, -1.5040, -1.6755, -1.3815, -0.8736, -1.6611, -1.6272, -1.9920, -1.3478]], [[ 0.7509, -3.9244, -4.0347, -4.3702, -4.0479, -2.3290, -2.7464, -3.7142, -5.2515, -2.9015, -3.3438, -3.7794, -3.6567, -4.0427]]], [[[ 1.4713, -2.9452, -2.3451, -3.8419, -2.8194, -4.4684, -3.2437, -4.5417, -6.5168, -6.2166, -4.4993, -4.1565, -2.4756, -2.1133]], [[ 4.9055, -2.2571, -3.4826, -3.6571, -2.2649, -1.4181, -3.0931, -4.6693, -4.1038, -5.1094, -3.6532, -4.1853, -4.1807, -4.1073]], [[ 1.7684, -0.9868, -1.1351, -1.9413, -2.3328, -1.4374, -1.4831, -2.2588, -2.2454, -3.2405, -1.1487, -2.1776, -1.2184, -1.0332]], [[ 2.4071, -0.3670, -1.4816, -2.2235, -2.5558, -3.6012, -1.5056, -2.4078, -2.3817, -2.3651, -3.3202, -2.3041, -1.4669, -1.3627]], [[ 0.5997, -3.3449, -5.0518, -4.8361, -5.7523, -4.4153, -4.8797, -3.5070, -6.5755, -5.8663, -5.2452, -5.6473, -2.1051, -2.4261]], [[ 0.3916, -3.8168, -4.7576, -4.8326, -4.7358, -3.5963, -3.2948, -3.6724, -5.9974, -7.2405, -5.2582, -5.7715, -3.3475, -3.5989]], [[ 3.1635, -0.9977, -2.8681, -2.9186, -3.2128, -3.8348, -4.0360, -5.1757, -5.6307, -5.7098, -6.1448, -5.9185, -2.9396, -1.9535]], [[-0.0596, -5.0443, -6.1802, -5.1336, -5.9186, -5.1511, -4.8569, -4.9166, -5.8349, -6.9295, -6.2218, -5.4588, -4.1134, -3.8516]], [[ 1.6495, -2.8116, -2.8140, -3.6272, -4.0820, -2.1881, -3.2086, -4.0056, -4.8840, -4.8168, -3.3832, -4.2301, -2.0759, -3.0757]], [[ 1.2858, -2.1350, -2.0123, -3.2183, -3.1264, -2.4087, -3.1311, -3.0826, -4.1625, -4.8458, -3.4824, -4.1399, -1.0873, -1.2863]], [[ 1.0274, -1.7706, -2.7208, -3.3373, -2.6450, -3.4331, -3.4719, -3.2126, -3.3966, -3.4838, -3.9096, -4.1503, -2.5603, -1.7530]], [[ 1.4270, -2.1993, -3.2606, -3.6855, -4.0305, -2.4281, -3.5232, -4.3417, -6.2532, -5.5464, -2.4594, -5.3901, -3.2672, -3.2816]]]]) attn_weights tensor([[[[ 3.2034, -4.0742, -3.9028, -3.5813, -3.9251, -0.1393, 1.4668, -2.1187, -3.9513, -3.1676, -0.1248, -1.4871, -1.0576, -0.2628]], [[ 3.5853, -2.2557, -3.0182, -2.7212, -2.5236, -3.5907, -0.3708, -0.9308, -2.0801, -2.4282, -2.3719, -1.6451, -1.2238, -2.4889]], [[ 3.3493, -3.5061, -3.4745, -4.0899, -2.9011, -0.7639, -0.3287, -1.7474, -3.8254, -3.7980, -2.5412, -1.8006, -1.0457, -0.7671]], [[-1.0532, -3.9146, -4.7182, -5.2272, -4.7528, -4.9603, -5.0962, -3.2925, -3.2880, -3.8172, -2.3726, -1.5602, -1.1544, -3.1029]], [[ 3.2348, -1.9661, -3.2711, -3.7586, -2.8030, -1.9704, -0.2929, -1.9962, -3.0341, -2.8559, -2.5880, -1.7507, -2.5651, -1.4833]], [[ 1.6551, -2.6831, -3.6519, -3.2188, -2.5947, -1.9430, -2.2282, -1.7470, -3.1501, -2.9851, -2.0911, -1.8671, -2.2149, -1.6876]], [[ 3.8078, -1.9296, -3.8682, -3.5835, -4.4553, -0.9472, 2.6482, -0.7033, -2.8093, -2.7009, -2.1126, -3.2719, -2.7671, -0.5044]], [[ 0.2471, -3.4246, -3.2389, -4.5469, -3.7543, -4.1440, -3.1463, -3.0857, -3.2945, -4.2609, -3.3598, -2.7934, -3.1916, -3.1644]], [[ 2.5964, -3.3663, -4.1105, -2.3649, -3.4702, -0.9730, -0.7187, -2.8402, -4.3595, -2.2108, -2.4626, -2.4316, -2.9464, -1.1236]], [[ 4.5931, -1.0821, -2.2030, -2.3642, -2.5712, 0.3736, 4.5783, -0.6751, -1.9541, -1.9419, 0.0684, -0.5047, -0.6744, 1.2298]], [[ 0.2842, -4.6089, -3.5441, -3.2951, -2.3330, -3.2107, -2.7060, -2.9169, -2.4734, -1.9395, 0.2679, -0.0275, 0.5469, -1.8720]], [[ 3.7648, -0.2537, -2.3862, -2.6508, -1.8888, -3.1144, -2.3670, 0.1675, -2.3083, -2.7318, -2.5089, -1.3920, -2.6705, -3.0536]]], [[[ 2.0808, -1.8274, -2.1523, -1.9848, -3.0758, 0.4099, 0.2336, -1.2323, -2.6925, -2.0430, -2.2089, -3.7306, -1.4848, -1.8906]], [[ 3.5342, -2.0203, -3.4813, -4.6434, -1.7470, -1.9416, -1.4959, -2.6055, -2.8743, -4.1724, -5.3039, -2.7717, -1.8609, -1.0777]], [[ 1.3387, -2.5033, -2.9735, -3.4562, -2.3154, -0.5063, -0.4926, -0.6676, -2.1353, -3.0692, -3.6776, -3.2431, -2.1353, -2.2110]], [[-1.1699, -3.9022, -3.8605, -4.9036, -5.3853, -3.9029, -3.4241, -2.9206, -2.3995, -1.9957, -3.1744, -1.2032, -0.6518, -2.8892]], [[ 3.6450, -3.0209, -3.8282, -4.1803, -2.6946, -1.1011, -1.0129, -1.3587, -2.6559, -3.7719, -3.7436, -3.5818, -2.9690, -2.1403]], [[ 1.8894, -4.0842, -4.6902, -4.4367, -3.2623, -2.0299, -1.5930, -2.2535, -3.0387, -3.5897, -3.6565, -2.7749, -1.7146, -1.2956]], [[ 4.2524, -2.4602, -3.8623, -3.5989, -1.0333, 1.3600, 1.0067, -1.6608, -2.9030, -3.5425, -3.8833, -1.6357, -0.8300, -0.1899]], [[ 0.4726, -3.6822, -4.3005, -4.5039, -3.7063, -2.8954, -2.7529, -3.2710, -3.2319, -4.7148, -4.6386, -4.0942, -4.1331, -4.5305]], [[ 1.6305, -2.8021, -3.6838, -3.2588, -2.9680, -1.2388, -1.8334, -2.4808, -2.8374, -3.4255, -2.8169, -3.7962, -2.2534, -2.8790]], [[ 4.4015, -1.7450, -3.9944, -3.6629, -0.2951, -0.1065, 0.2490, -0.9197, -2.0429, -3.4584, -4.0325, -1.4489, -0.7160, -0.2528]], [[ 0.7837, -4.0376, -4.1301, -4.8676, -5.0602, -2.3546, -2.9591, -3.8392, -3.5884, -2.8493, -3.7410, -1.7871, 0.6151, -0.8583]], [[ 3.7008, -0.8281, -2.5904, -2.2390, -0.5768, -1.5211, -1.2000, -2.3511, -2.2304, -3.0263, -2.9356, -3.3330, -1.5356, -1.9783]]], [[[ 1.4593, -1.2672, -1.0209, -1.5947, -2.3378, -0.4973, -0.2548, -1.5926, -2.7268, -1.4459, -3.1223, -1.8964, -1.3731, -3.6887]], [[ 4.6214, -2.8341, -5.0645, -4.6215, -3.2646, -3.5472, -3.7169, -3.4677, -3.2905, -4.7062, -6.1734, -3.8559, -2.5010, -1.1601]], [[ 1.1288, -2.3907, -2.2375, -3.1428, -1.9880, -1.9224, -1.5913, -0.3847, -2.1572, -1.5379, -4.0845, -2.5461, -1.5158, -1.5927]], [[-0.7790, -5.1046, -4.6708, -5.7004, -7.1593, -4.7083, -4.6800, -3.8940, -2.3964, -3.0041, -3.6547, -2.8968, -1.6528, -2.6424]], [[ 3.5708, -3.3620, -4.1840, -4.4866, -2.9579, -3.3367, -3.3817, -4.1382, -4.1558, -4.7444, -4.8925, -4.2573, -4.1962, -2.2466]], [[ 2.0751, -2.9136, -3.4265, -4.0457, -3.8897, -2.4769, -3.6075, -4.0026, -3.9609, -3.4188, -4.7637, -3.7619, -2.3963, -3.0103]], [[ 4.0646, -4.0277, -4.0899, -4.5435, -3.7089, -0.5172, -2.3047, -5.1390, -5.6030, -5.1879, -6.2282, -5.8318, -3.7496, -1.9371]], [[ 0.4504, -3.9248, -5.2601, -5.3497, -5.1113, -2.6814, -2.9245, -3.0560, -3.4603, -4.9250, -5.5851, -5.6240, -4.0856, -4.4372]], [[ 1.8864, -3.7087, -3.3113, -1.9813, -2.5550, -0.3238, -1.0732, -2.8125, -3.0644, -3.0524, -3.7166, -3.0645, -2.3659, -4.0577]], [[ 4.6138, -2.7578, -3.6412, -4.0013, -3.2788, -1.6523, -1.9893, -5.5356, -4.5384, -5.7299, -5.7932, -5.6995, -2.8076, -1.4895]], [[ 0.8247, -5.4977, -4.3153, -5.2807, -5.7141, -3.8582, -3.5219, -4.9562, -3.8855, -2.3224, -2.5210, -1.5854, 0.5654, -1.1228]], [[ 3.4010, -1.2382, -3.1779, -2.1894, -1.2781, -1.6908, -0.8965, -1.9885, -3.6380, -3.8718, -4.9564, -3.9332, -3.1605, -3.4085]]], [[[ 1.3838, -3.8427, -4.3810, -4.4100, -3.4436, 0.1755, -0.5839, -2.9259, -2.3812, -1.2248, -1.4767, -3.1573, -0.0235, -1.6414]], [[ 2.8068, -2.7715, -2.8943, -2.9453, -0.8646, -3.3968, -2.5816, -2.3814, -1.3398, -3.5145, -3.8797, -1.9519, -2.5409, -1.3219]], [[ 1.2789, -2.7883, -2.9580, -3.6304, -2.3318, -1.3497, -1.3698, -1.4051, -1.1926, -0.8783, -1.2950, -1.4387, -1.5225, -2.6549]], [[-0.7009, -3.3396, -2.8036, -4.7017, -5.0104, -2.5300, -2.5684, -3.5500, -4.8894, -4.6183, -3.4337, -1.6852, -0.9119, -2.7497]], [[ 2.9015, -2.4903, -2.5113, -2.8461, -1.6794, -1.1636, -0.8017, -0.8671, -1.8530, -1.4401, -1.8152, -1.6057, -2.5999, -2.8641]], [[ 1.9241, -2.7908, -2.5621, -2.9623, -3.1330, -2.6960, -2.0510, -2.9819, -2.8274, -3.1695, -2.6863, -3.1324, -2.0633, -1.8243]], [[ 3.3189, -4.2100, -3.2039, -4.1852, -2.6824, -1.2034, -0.9196, -3.0860, -1.4136, -0.3460, -2.2960, -2.1110, -1.7494, -1.1990]], [[ 0.5235, -3.4137, -3.8757, -4.4110, -2.7182, -3.4111, -3.2346, -2.7000, -2.7462, -3.7161, -3.2059, -2.3138, -3.1875, -2.9078]], [[ 1.4825, -2.2949, -2.7911, -2.8890, -2.4805, -0.6697, -0.4753, -1.9663, -2.0230, -0.9672, -0.2680, -1.4095, -1.4183, -2.3839]], [[ 3.6907, -3.9023, -3.5042, -3.9868, -1.6747, -1.2799, -0.6934, -2.9258, -1.1834, -0.2488, -2.4915, -1.6077, -2.1447, -1.9679]], [[ 0.4981, -3.8454, -3.3546, -4.6800, -3.6542, -2.3906, -2.0532, -2.6296, -2.7897, -2.3443, -2.1411, -1.7672, 0.2072, -1.7819]], [[ 3.2045, -0.3649, -1.9953, -0.9199, -0.0857, -2.1040, -2.3158, -3.2194, -0.4507, -2.1731, -3.2243, 0.1259, -1.5753, -1.4774]]], [[[ 2.7586, -2.1754, -2.7649, -3.5224, -4.0434, -1.1075, -0.6552, -3.0752, -4.9731, -4.9633, -1.6866, -2.4014, -2.1427, -3.3230]], [[ 3.1983, -1.4441, -3.2379, -4.2263, -3.7684, -3.2091, -3.2554, -3.5597, -4.3336, -4.8518, -4.0904, -4.4889, -2.3387, -1.5120]], [[ 2.9988, -5.1386, -3.0604, -4.9713, -4.2499, -1.9785, -1.0281, -2.6226, -4.5088, -4.9475, -2.6529, -2.8601, -1.6649, -2.3926]], [[ 0.1440, -4.8009, -6.5514, -6.6809, -6.5541, -4.6971, -4.7343, -4.5708, -5.9479, -6.0532, -6.9297, -6.0641, -3.3444, -2.5016]], [[ 2.3289, -0.6065, -2.3004, -4.2055, -3.8768, -3.5577, -2.5425, -3.2093, -6.7575, -5.7971, -3.5685, -3.7263, -1.5348, -0.0350]], [[ 1.9624, -0.5955, -1.1909, -3.1594, -3.9291, -0.5139, -1.4439, -2.0483, -4.2993, -4.6760, -3.0393, -2.4987, 0.1739, -0.4385]], [[ 3.2192, -2.8347, -2.9027, -3.4676, -3.0692, -1.2438, -1.5253, -3.7270, -4.1480, -3.9254, -2.6783, -2.7482, -2.8395, -1.8013]], [[ 0.2340, -3.4470, -3.9094, -4.7080, -4.4322, -4.8849, -4.7032, -4.9483, -5.6126, -4.4953, -5.1429, -5.1701, -3.5543, -3.2593]], [[ 1.4882, -4.3346, -3.8673, -2.0973, -2.9035, 0.5076, -1.2486, -4.2695, -4.8752, -5.5218, -0.6137, -1.7974, -3.5869, -3.0882]], [[ 3.6950, -3.1640, -2.7675, -4.3473, -3.3157, -0.7869, -1.3080, -3.8138, -2.6978, -3.1270, -2.4356, -3.7560, -2.9168, -3.2744]], [[ 1.3377, -4.2637, -3.8655, -3.8625, -4.6202, -4.0462, -3.8986, -4.2317, -4.6732, -4.8302, -5.5025, -4.4859, -2.3928, -3.1600]], [[ 3.7433, 1.1985, -2.0415, -2.3654, -2.7195, -2.3908, -1.9630, -2.2790, -2.9180, -3.3453, -3.1180, -3.3518, -2.0416, -2.5709]]]]) attn_weights tensor([[[[ 3.5579e+00, -3.7431e+00, -4.2115e+00, -3.8743e+00, -4.0421e+00, -6.3432e-01, 1.7273e+00, -2.5703e+00, -3.8331e+00, -3.3335e+00, -9.5384e-01, -3.0964e+00, -3.1338e+00, -7.8481e-01]], [[ 4.7087e+00, -1.9189e+00, -3.4816e+00, -1.9871e+00, -3.0841e+00, 3.8227e-02, 1.9875e+00, -1.4096e+00, -3.1428e+00, -1.1380e+00, -5.4212e-01, -4.3215e-01, 3.2391e-01, 1.1835e+00]], [[ 3.2701e+00, 1.5981e-01, -1.7304e+00, -2.3235e+00, -2.8958e+00, -1.1911e+00, 7.8755e-01, -2.1526e-03, -1.3455e+00, -1.4186e+00, -3.9961e-01, -9.9463e-01, -1.3164e+00, -1.5821e-01]], [[ 3.1365e+00, 7.5457e-01, -3.1299e+00, -3.0556e+00, -1.9774e+00, -7.1408e-01, -3.3599e-01, 6.7564e-01, -3.1986e+00, -2.8230e+00, -1.9115e+00, -1.4530e+00, -9.3956e-01, -6.0934e-02]], [[ 2.4236e+00, 5.5497e-02, -2.8249e+00, -2.2081e+00, -2.0324e+00, -3.2250e+00, -1.5812e+00, -2.6070e-01, -3.0287e+00, -2.5080e+00, -3.3414e+00, -2.4890e+00, -2.0718e+00, -2.6258e+00]], [[-2.1445e-02, -2.4494e+00, -2.5902e+00, -1.8680e+00, -2.1685e+00, -2.9009e+00, -2.7342e+00, -2.3653e+00, -2.0390e+00, -1.3567e+00, -8.8930e-01, -1.4566e+00, -8.9137e-01, -1.9637e+00]], [[ 3.5429e+00, -3.3332e+00, -3.5942e+00, -3.2237e+00, -3.0729e+00, -7.8380e-01, 1.8364e+00, -3.2593e+00, -3.6103e+00, -2.9477e+00, -5.1427e-01, -1.5481e+00, -1.7430e+00, -6.5161e-01]], [[ 2.3051e+00, -1.9478e+00, -2.4447e+00, -2.9232e+00, -2.2822e+00, -2.0598e-02, 1.3961e+00, -4.8658e-01, -2.1719e+00, -2.1918e+00, -8.4490e-01, -1.0139e+00, -2.1479e+00, 9.8666e-02]], [[ 3.5336e+00, -7.9432e-01, -2.5738e+00, -2.9443e+00, -1.3345e+00, -1.9039e+00, -1.0234e+00, 5.3054e-01, -1.8127e+00, -2.1502e+00, -2.2355e+00, -7.8066e-01, -2.2494e+00, -1.4288e+00]], [[ 4.6237e-01, -3.9481e+00, -4.1754e+00, -5.8068e+00, -3.2199e+00, -2.2820e+00, -1.9187e+00, -4.2684e+00, -3.2854e+00, -5.1691e+00, -3.6320e-01, 4.0383e-02, 3.8346e-01, -5.7016e-01]], [[ 3.4521e+00, -2.4677e+00, -2.2871e+00, -1.9436e+00, -2.3279e+00, -1.5320e+00, 1.6657e-01, -2.2041e+00, -2.3071e+00, -1.7939e+00, -2.0049e+00, -1.2168e+00, -2.1642e+00, -1.1283e+00]], [[ 4.6625e+00, -1.4962e+00, -1.2004e+00, -2.4358e+00, -1.8459e+00, -1.4797e-01, 1.8626e+00, -1.5766e+00, -9.1470e-01, -1.5139e+00, 2.1507e+00, 2.7344e+00, 2.9206e+00, 1.1377e+00]]], [[[ 2.6701e+00, -2.6475e+00, -3.3180e+00, -3.3598e+00, -2.6842e+00, 6.0960e-01, -3.2762e-01, -2.3481e+00, -2.9291e+00, -3.5532e+00, -3.5488e+00, -3.0814e+00, -2.4099e+00, -2.5952e+00]], [[ 4.3741e+00, -1.2538e+00, -3.7758e+00, -2.9460e+00, -9.7302e-01, 1.2743e+00, 2.3781e-01, -1.1996e+00, -1.8276e+00, -3.7531e+00, -2.3878e+00, -1.1306e+00, -9.0416e-01, 1.0717e+00]], [[ 3.6088e+00, -1.2391e+00, -2.1341e+00, -2.8922e+00, -1.0010e+00, 3.4204e-01, 8.7593e-01, -4.6920e-01, -1.1063e+00, -2.1938e+00, -2.5627e+00, -1.3061e+00, -9.0833e-01, -1.1762e+00]], [[ 3.2501e+00, -9.0750e-01, -2.3019e+00, -2.5277e+00, -5.8455e-01, 9.0605e-01, 3.9621e-01, -1.0027e+00, -2.0995e+00, -2.0766e+00, -2.1997e+00, -1.0799e+00, -3.2306e-01, -5.7232e-01]], [[ 2.3377e+00, -1.3417e+00, -9.5665e-01, -1.0586e+00, -7.4571e-01, 2.2680e-01, 7.8852e-01, -4.4357e-01, -4.1437e-01, -6.4758e-01, -2.9633e-01, -1.7971e+00, 9.0694e-02, 4.9297e-01]], [[ 1.7014e+00, -3.4151e+00, -3.2992e+00, -3.8684e+00, -4.2950e+00, -2.2761e+00, -3.1625e+00, -3.9066e+00, -3.3068e+00, -2.6542e+00, -3.3277e+00, -2.2873e+00, -9.2387e-01, -1.5791e+00]], [[ 3.3539e+00, -2.6516e+00, -3.0045e+00, -2.9872e+00, -2.0205e+00, 3.9935e-01, 7.7998e-02, -1.9447e+00, -2.7725e+00, -2.8637e+00, -2.7183e+00, -1.3518e+00, -1.1026e+00, -9.3740e-01]], [[ 2.1389e+00, -2.6099e+00, -2.7565e+00, -2.8162e+00, -1.1159e+00, 1.3004e-01, -8.5787e-01, -7.0211e-01, -1.0334e+00, -2.0797e+00, -1.9095e+00, -2.6866e+00, -7.8342e-01, -7.4192e-01]], [[ 3.5223e+00, -2.0469e+00, -3.7697e+00, -4.3457e+00, -2.3237e-01, -2.2653e+00, -1.1592e+00, -1.0994e+00, -1.5963e+00, -3.6570e+00, -3.8110e+00, -8.9566e-01, -5.3959e-01, -1.4527e-01]], [[ 6.3442e-01, -3.3102e+00, -4.7280e+00, -4.4465e+00, -3.7626e+00, -2.8197e+00, -3.0089e+00, -2.7678e+00, -3.6057e+00, -4.1482e+00, -4.3778e+00, -5.0432e+00, -1.7568e+00, -2.3411e+00]], [[ 3.9026e+00, -1.4293e+00, -2.4283e+00, -2.0290e+00, -1.3045e+00, 3.7645e-01, 1.4123e-02, -8.0416e-01, -2.1189e+00, -2.9185e+00, -2.1869e+00, -1.1317e+00, -1.8118e+00, -1.2254e+00]], [[ 5.4744e+00, -2.8777e-01, 1.6446e+00, -1.5330e+00, -7.4474e-01, 2.4539e+00, 2.3122e+00, 2.6491e+00, 1.8773e+00, 2.6158e+00, -4.5902e-01, 5.3929e-01, 2.9174e+00, 1.6104e+00]]], [[[ 2.3760e+00, -3.1397e+00, -4.3654e+00, -3.9543e+00, -4.5195e+00, -3.8965e-01, -1.3582e+00, -4.4626e+00, -4.1934e+00, -4.7615e+00, -4.1597e+00, -5.5378e+00, -2.4659e+00, -2.8495e+00]], [[ 4.6462e+00, -2.0051e+00, -4.9503e+00, -4.1422e+00, -2.9257e+00, -1.1570e-01, -2.0717e+00, -3.3234e+00, -3.6818e+00, -5.9328e+00, -4.3800e+00, -6.1576e+00, -1.8531e+00, -1.3578e-01]], [[ 3.1530e+00, -1.5181e+00, -2.0613e+00, -2.9089e+00, -2.2477e+00, -1.3922e-01, 2.8353e-01, -2.3094e+00, -1.8789e+00, -2.7867e+00, -3.3397e+00, -4.5047e+00, -1.1967e+00, -1.5062e+00]], [[ 2.7471e+00, -1.1129e+00, -2.4141e+00, -2.1048e+00, -1.8705e+00, 1.1506e-01, -9.0039e-01, -1.7615e+00, -2.7713e+00, -3.0400e+00, -2.6546e+00, -3.4203e+00, -1.4393e+00, -1.7894e+00]], [[ 1.9164e+00, -7.5769e-01, -1.3073e+00, -8.2709e-01, -1.4231e+00, -9.3596e-01, -6.2199e-01, -2.1459e+00, -1.4200e+00, -1.3995e+00, -3.7342e+00, -1.9808e+00, -8.7468e-02, -1.1517e+00]], [[ 1.4644e+00, -3.4321e+00, -3.1458e+00, -3.6747e+00, -4.3436e+00, -3.4750e+00, -3.9851e+00, -4.1287e+00, -2.8870e+00, -2.7564e+00, -2.6556e+00, -3.0547e+00, -2.4730e+00, -1.6893e+00]], [[ 2.8579e+00, -6.2411e-01, -2.8664e+00, -2.5846e+00, -1.7933e+00, -1.2655e+00, -1.6286e+00, -1.5185e+00, -2.0092e+00, -3.2037e+00, -3.2286e+00, -4.1875e+00, -1.3432e+00, -1.2656e+00]], [[ 1.7713e+00, -3.0522e+00, -2.7509e+00, -3.6351e+00, -2.6905e+00, -2.2852e+00, -3.5827e+00, -2.9840e+00, -2.7950e+00, -3.1849e+00, -3.6867e+00, -2.8282e+00, -2.2209e+00, -2.8588e+00]], [[ 3.4443e+00, -1.5712e+00, -3.2495e+00, -4.0775e+00, -2.9846e+00, -2.8443e+00, -2.5428e+00, -2.0951e+00, -2.1102e+00, -3.6138e+00, -3.1427e+00, -3.9839e+00, -2.0895e+00, -2.0970e+00]], [[ 3.6465e-01, -4.1986e+00, -3.8132e+00, -3.9166e+00, -3.6684e+00, -2.7190e+00, -1.9595e+00, -3.6761e+00, -2.7617e+00, -2.7060e+00, -2.6952e+00, -1.7392e+00, 1.0231e-01, -1.1558e-01]], [[ 3.3619e+00, -1.5538e+00, -3.0017e+00, -2.5286e+00, -2.2347e+00, -9.5676e-01, -1.7366e+00, -2.1579e+00, -2.8307e+00, -3.9131e+00, -3.8522e+00, -3.8238e+00, -1.6152e+00, -2.0840e+00]], [[ 4.9419e+00, -9.1840e-01, 4.4400e-01, 7.1767e-01, -3.3681e+00, -2.7064e+00, -1.3804e+00, -1.8961e-01, 1.1909e+00, 1.1941e+00, -6.8367e-01, -2.5814e-01, 4.6464e+00, 3.6165e+00]]], [[[ 2.4678e+00, -3.9197e+00, -3.8604e+00, -3.8790e+00, -3.6534e+00, 6.6621e-01, -2.9328e-01, -3.5307e+00, -3.5200e+00, 4.5782e-01, -2.1037e+00, -1.7366e+00, -2.7504e+00, -3.0200e+00]], [[ 4.0677e+00, -2.2578e+00, -2.9883e+00, -2.0310e+00, -2.0984e+00, -9.1082e-01, -1.6833e+00, -2.4341e+00, -1.2975e+00, 6.6797e-02, -2.4634e+00, -1.9659e+00, -1.4579e+00, 2.2835e-02]], [[ 3.1791e+00, -1.7275e+00, -1.9773e+00, -2.3138e+00, -2.0431e+00, -2.7243e-01, -1.3718e-01, -1.4946e+00, -1.0913e+00, 6.9572e-02, -3.0261e-01, 3.5807e-01, -8.5599e-01, -1.1298e+00]], [[ 2.8032e+00, -1.1670e+00, -2.6552e+00, -2.0680e+00, -1.7271e+00, -4.3094e-01, -8.8403e-01, -2.2366e+00, -1.3190e+00, -1.3813e+00, -2.4348e+00, 1.8299e+00, -1.7057e+00, -7.8325e-01]], [[ 2.3700e+00, -9.2135e-01, -3.9563e-01, -1.1686e+00, -7.4953e-01, -6.4422e-01, 4.3717e-01, -7.1181e-01, -6.3327e-01, 7.1459e-01, 2.4928e-01, -4.2992e-01, 8.2882e-01, 3.0149e-01]], [[ 1.3195e+00, -1.9557e+00, -2.7030e+00, -3.8390e+00, -2.7690e+00, -2.0626e+00, -2.2376e+00, -1.9228e+00, -2.2051e+00, -2.8071e+00, -3.0590e+00, -7.8868e-01, -2.9729e-01, -2.0944e+00]], [[ 3.1673e+00, -4.1577e+00, -3.7741e+00, -4.3168e+00, -3.5082e+00, -2.1827e-01, 5.2027e-02, -3.5660e+00, -2.8776e+00, 5.1646e-01, -1.1434e+00, -2.9060e+00, -2.8658e+00, -3.1178e+00]], [[ 2.0388e+00, -2.0828e+00, -2.0897e+00, -2.7979e+00, -2.1591e+00, -5.5384e-01, -1.2223e+00, -7.4213e-01, -1.2594e+00, -1.7867e+00, -1.4092e+00, -6.4103e-01, -1.4098e+00, -1.0184e+00]], [[ 3.2908e+00, -2.0443e+00, -2.5773e+00, -2.4819e+00, -1.0585e+00, -2.4606e+00, -2.6670e+00, -1.9324e+00, -3.3054e-01, -2.5137e+00, -4.5452e+00, -5.7853e-01, -1.7178e+00, -4.6919e-01]], [[ 3.9554e-01, -3.7426e+00, -2.8974e+00, -2.4033e+00, -2.5600e+00, -1.3618e+00, -1.2476e+00, -1.4573e+00, -2.9590e+00, -2.7860e+00, -2.6723e+00, -1.4013e+00, -4.8155e-01, -7.1552e-01]], [[ 3.1331e+00, -2.9986e+00, -2.3512e+00, -2.4228e+00, -2.8675e+00, -9.9609e-01, -1.6877e+00, -2.3106e+00, -2.6992e+00, -3.0998e-01, -2.9241e+00, -2.4256e+00, -1.9372e+00, -2.0175e+00]], [[ 3.3906e+00, -1.4150e+00, -1.1250e+00, -3.0779e+00, -2.0885e+00, 9.2017e-01, 1.2907e-01, 7.9806e-01, -6.4370e-01, -5.0521e-01, -7.2149e-01, 6.0520e-01, 2.5377e+00, 1.1667e+00]]], [[[ 2.7720e+00, -3.3430e+00, -3.7381e+00, -3.9243e+00, -3.9501e+00, 1.0660e+00, -2.0957e-02, -3.7462e+00, -3.9840e+00, -4.0337e+00, -8.0094e-01, -1.7785e+00, -3.0000e+00, -3.2292e+00]], [[ 3.8252e+00, -2.5147e+00, -2.8729e+00, -2.1650e+00, -2.8397e+00, -1.0149e+00, -2.1005e+00, -3.6148e+00, -3.0812e+00, -3.2754e+00, -1.9090e+00, -3.1219e+00, -2.6220e+00, -2.1971e+00]], [[ 3.5544e+00, -7.8868e-01, -1.5497e+00, -2.6905e+00, -2.1413e+00, -9.0318e-01, -1.9126e+00, -2.6488e+00, -3.6259e+00, -3.3017e+00, -2.0520e+00, -2.6844e+00, -9.7133e-01, 1.6702e-01]], [[ 4.0537e+00, 9.2543e-02, -2.9692e+00, -2.7271e+00, -2.6343e+00, 2.5403e-01, -1.6774e+00, -2.0029e+00, -4.0536e+00, -4.3826e+00, -2.6470e+00, -2.7122e+00, -2.7591e-01, 6.5222e-01]], [[ 3.0210e+00, -1.7946e+00, -3.3661e+00, -3.4512e+00, -3.4144e+00, -2.5641e+00, -1.9843e+00, -3.1340e+00, -4.6378e+00, -5.0276e+00, -1.0703e+00, -3.0592e+00, -6.3449e-02, -1.3800e+00]], [[ 1.4168e+00, -2.6909e+00, -3.5974e+00, -3.1951e+00, -3.6291e+00, -2.9459e+00, -3.7254e+00, -2.7149e+00, -5.6790e+00, -5.3123e+00, -5.0152e+00, -5.2028e+00, -1.5711e+00, -1.3114e+00]], [[ 2.8405e+00, -2.9527e+00, -2.6514e+00, -3.0186e+00, -3.1425e+00, -9.6496e-01, -1.1256e+00, -3.3433e+00, -3.2527e+00, -2.8795e+00, -7.2292e-01, -1.9237e+00, -2.1780e+00, -2.1519e+00]], [[ 2.1318e+00, -1.7490e+00, -2.2827e+00, -3.3016e+00, -2.6660e+00, -2.6542e+00, -3.3537e+00, -2.5877e+00, -3.5244e+00, -2.6420e+00, -2.7109e+00, -3.7801e+00, -1.7180e+00, -1.6039e+00]], [[ 3.4907e+00, -2.0317e+00, -3.2476e+00, -3.1628e+00, -2.9092e+00, -2.3442e+00, -3.2155e+00, -3.5529e+00, -2.8648e+00, -2.1514e+00, -1.8197e+00, -2.8503e+00, -1.7951e+00, -9.0516e-01]], [[ 8.3600e-01, -3.9304e+00, -3.7467e+00, -4.2063e+00, -3.4913e+00, -3.4446e+00, -2.3442e+00, -2.9180e+00, -3.0409e+00, -3.6896e+00, -4.2249e+00, -4.4431e+00, -1.1182e+00, -1.2528e+00]], [[ 2.9577e+00, -1.9046e+00, -1.8857e+00, -2.2575e+00, -2.2158e+00, -8.1358e-01, -2.6382e+00, -2.8200e+00, -2.8266e+00, -2.2241e+00, -2.8214e+00, -3.3571e+00, -2.4432e+00, -2.0899e+00]], [[ 3.5466e+00, -9.0596e-01, -1.9451e+00, -2.1653e+00, -2.0737e+00, 1.2116e-02, -1.6137e+00, -2.6411e+00, -4.0636e+00, -4.4720e+00, -1.9176e+00, -2.5216e+00, -1.1480e+00, -1.5013e+00]]]]) attn_weights tensor([[[[ 1.7736e+00, 9.9098e-01, -4.2903e-01, 9.7026e-02, 1.1520e-01, 6.2933e-01, 2.8077e-01, 5.9648e-01, -4.2205e-01, -3.6668e-01, 4.6385e-01, 4.7221e-01, 4.0443e-01, 9.0328e-01]], [[ 4.0005e+00, -6.2410e-01, -1.1707e+00, -1.1865e+00, -4.9304e-01, -1.4347e+00, 1.0663e+00, 6.3999e-02, -1.0512e+00, -5.8348e-01, 8.6747e-02, 8.6353e-01, 2.0097e-01, 1.4806e-02]], [[ 3.4159e+00, 2.0970e-01, -1.4278e+00, -2.0855e+00, -1.6274e+00, -1.1100e+00, 1.0975e+00, 1.2008e+00, -1.7146e+00, -1.7443e+00, -4.1791e-02, -2.3606e-01, -6.1834e-01, -6.8425e-01]], [[ 1.7831e+00, -1.9613e+00, -2.9477e+00, -3.5580e+00, -2.1143e+00, -2.6443e+00, -1.4311e+00, -2.4397e+00, -3.1011e+00, -3.9694e+00, -2.5616e+00, -1.2413e+00, -1.3973e+00, -1.8849e+00]], [[ 2.1051e+00, -5.0056e-01, -7.6410e-01, -1.0371e+00, -1.1447e+00, -2.1788e+00, -1.8115e+00, -1.5872e-01, -1.0023e+00, -1.1926e+00, -9.2323e-01, -3.3236e-01, -1.0549e+00, -1.5350e+00]], [[ 4.2299e+00, 2.7113e-01, -6.9757e-01, -3.0087e-01, -2.1819e-01, 3.0318e-01, 4.4988e+00, 8.3297e-01, -5.2900e-01, -1.0768e-01, 1.2088e+00, 9.2385e-01, 1.0295e-01, 2.9181e-01]], [[ 3.5106e+00, -1.9296e+00, -2.6828e+00, -1.7308e+00, -2.2916e+00, -1.4699e+00, -7.4054e-01, -1.4901e+00, -2.7008e+00, -1.9745e+00, -1.7839e+00, -1.1110e+00, -1.4876e+00, -7.3579e-01]], [[ 3.9948e+00, 1.5450e+00, 1.9404e-01, 5.6637e-02, -1.3999e-01, 9.1139e-01, 1.6336e+00, 2.0213e+00, 7.5381e-01, 6.4578e-02, 6.7563e-01, 1.4890e+00, 8.3172e-01, 1.9503e+00]], [[-3.8046e+00, 2.7206e+00, 2.7344e+00, 1.9278e+00, 1.1443e+00, 1.8847e+00, 3.2994e+00, 2.3459e+00, 2.1468e+00, 1.4365e+00, 2.7374e+00, 1.2455e+00, 1.7575e+00, 3.0267e+00]], [[ 4.2924e+00, -8.5140e-01, -3.1344e+00, -2.3118e+00, -2.0462e+00, -3.5679e-01, 2.6355e+00, 2.0877e-01, -2.3511e+00, -1.1753e+00, -8.6342e-02, -4.8612e-01, -4.9402e-02, 1.8053e-01]], [[ 2.5251e+00, -2.9911e-01, -1.5200e+00, -1.8672e+00, -8.9776e-01, 2.2888e-01, 2.3790e+00, 5.2378e-01, -1.4036e+00, -2.1110e+00, 1.2647e+00, 1.6513e+00, 9.5196e-01, 9.9204e-01]], [[ 3.8296e+00, 8.2713e-01, -9.0489e-01, -1.0484e+00, 4.9197e-02, 2.5866e-01, 1.3553e+00, 6.0979e-01, -1.1116e+00, -1.6379e+00, 1.5720e+00, 1.0475e+00, 1.2302e+00, 3.7337e-01]]], [[[ 1.3071e+00, 5.2373e-01, 6.8931e-01, -1.4186e-01, 5.6290e-01, 2.9209e-01, 8.9942e-01, 3.8690e-01, 7.8746e-01, 7.1822e-01, -2.0756e-01, 6.6073e-01, 9.1751e-01, 4.5180e-01]], [[ 3.5973e+00, -1.5523e-01, -7.6670e-01, -1.2126e+00, 1.2780e+00, -1.7406e-01, 5.3878e-01, 9.2182e-01, 4.4382e-01, -3.0279e-01, -7.3822e-01, -7.1742e-01, 4.5419e-01, 2.2378e-01]], [[ 3.0087e+00, -1.2839e+00, -2.0505e+00, -2.1911e+00, -9.4231e-01, 5.1862e-01, -1.3948e-02, -8.6046e-01, -1.2501e+00, -2.3353e+00, -1.9279e+00, -1.6648e+00, -1.6833e+00, -2.3843e+00]], [[ 1.0776e+00, -1.0043e+00, -1.1705e+00, -1.1030e+00, -1.2966e+00, 6.9287e-01, 2.2591e-01, -9.7579e-02, -2.3887e-01, -7.4793e-01, -4.8534e-01, -1.2077e+00, 7.9931e-01, 6.3448e-02]], [[ 1.9483e+00, -1.2524e+00, -1.8192e+00, -1.8935e+00, -9.0856e-01, -8.0821e-01, -1.1988e+00, -4.7563e-01, -6.6932e-01, -1.7228e+00, -1.7336e+00, -1.3901e+00, -5.9966e-01, -3.4721e-01]], [[ 4.0962e+00, -1.0083e+00, -2.7704e+00, -4.0108e+00, -7.5779e-01, 7.9869e-01, 1.5806e+00, -1.1775e+00, -1.9882e+00, -2.9460e+00, -4.3889e+00, -6.4373e-01, -6.9979e-01, 1.5767e+00]], [[ 3.4806e+00, -1.2305e+00, -2.0254e+00, -1.9443e+00, -3.2032e-01, 8.9650e-02, -3.5736e-01, -3.6256e-01, -1.1312e+00, -2.4317e+00, -1.7706e+00, -4.3572e-01, -8.1587e-01, -4.8544e-01]], [[ 3.7135e+00, -5.1093e-02, -1.0420e+00, -1.9653e+00, 1.6245e-01, 1.9964e+00, 1.0218e+00, 4.5970e-01, -2.3026e-01, -1.2083e+00, -1.7861e+00, -1.1642e-01, 6.7356e-01, 5.7948e-01]], [[-3.4262e+00, 2.9743e+00, 3.4233e+00, 3.3825e+00, 2.5690e+00, 2.5816e+00, 2.8534e+00, 3.4035e+00, 3.7543e+00, 4.1902e+00, 4.5913e+00, 3.5658e+00, 5.5858e+00, 4.9656e+00]], [[ 4.2057e+00, -6.9618e-01, -2.0608e+00, -2.6272e+00, -6.9394e-01, 6.1106e-02, -3.5559e-01, -9.0089e-01, -1.2030e+00, -2.4300e+00, -2.4183e+00, -6.6800e-01, -2.8278e-01, 4.3909e-01]], [[ 3.0743e+00, -4.8473e-01, -3.5657e-01, 3.4568e-02, -3.8538e-01, 4.5450e-01, -1.1804e-01, 6.5107e-01, 6.8445e-01, -3.1408e-01, 4.8703e-01, 1.2446e+00, 1.3365e+00, 1.3759e+00]], [[ 3.1728e+00, -3.3530e-01, -7.0188e-01, 1.0610e-01, -3.1822e-01, 1.4815e+00, 1.4958e+00, 1.3520e+00, 8.5189e-01, -8.3853e-02, 6.5930e-01, 1.3031e+00, 2.1720e+00, 2.1632e+00]]], [[[ 1.1671e+00, -1.1736e-01, 1.0408e-01, 2.1907e-01, 6.0372e-01, 2.4006e-01, 7.2988e-01, 7.6815e-02, 4.4115e-01, 4.9932e-01, -3.1234e-01, 4.8446e-01, -1.1176e-02, 1.2936e-01]], [[ 2.9499e+00, -1.1383e+00, -1.2274e+00, -2.3219e+00, -1.3374e+00, -8.4821e-01, -1.0960e+00, -9.8613e-01, -1.5480e+00, -1.5213e+00, -3.0340e+00, -2.2422e+00, -5.7341e-01, -8.3753e-01]], [[ 2.8233e+00, -1.0059e+00, -2.3003e+00, -2.9226e+00, -2.4427e+00, 3.0376e-01, -9.1279e-01, -1.2504e+00, -1.5856e+00, -2.3564e+00, -3.4454e+00, -3.8259e+00, -2.6208e+00, -2.1712e+00]], [[ 7.6949e-01, -1.2518e+00, -1.3020e+00, -1.2759e+00, -2.3845e+00, -1.5744e-01, -3.3727e-01, -4.0317e-01, -4.5818e-01, -5.2575e-01, -4.3176e+00, -5.8224e-01, 6.7898e-01, -1.9990e+00]], [[ 1.9234e+00, -9.8202e-01, -1.0362e+00, -1.2158e+00, -1.3784e+00, -1.2524e+00, -2.1918e+00, -7.5925e-01, -7.8099e-01, -1.0439e+00, -2.3508e+00, -1.4038e+00, -5.1249e-01, -1.1311e+00]], [[ 4.1958e+00, -1.6615e+00, -2.5856e+00, -2.5654e+00, -1.7951e+00, -3.6616e-01, 4.4278e-01, -2.7398e+00, -3.4989e+00, -3.2483e+00, -3.6221e+00, -3.5380e+00, -3.0081e+00, -7.3928e-01]], [[ 3.0794e+00, -2.3406e+00, -2.3728e+00, -3.4665e+00, -2.2397e+00, -5.8840e-01, -1.4156e+00, -2.8027e+00, -2.6938e+00, -3.3424e+00, -3.8201e+00, -3.5959e+00, -2.1311e+00, -1.5432e+00]], [[ 3.5005e+00, 2.9466e-01, -8.9020e-01, -2.1262e+00, -1.3154e+00, 4.1510e-01, -5.4430e-01, -1.1501e+00, -1.2199e+00, -1.9277e+00, -2.8036e+00, -3.1726e+00, -1.4690e+00, -1.5897e-01]], [[-3.6737e+00, 7.2708e-02, 1.5803e+00, 3.1807e-01, -1.6364e-01, 6.4640e-02, 2.3341e-01, -2.6433e-01, 3.0688e-02, 1.2229e+00, -3.0550e+00, 1.7283e+00, -4.2850e-02, -7.3990e-01]], [[ 4.2964e+00, -8.8219e-01, -2.0363e+00, -2.7938e+00, -1.3518e+00, -2.3655e+00, -2.7536e+00, -2.5233e+00, -2.0820e+00, -2.8165e+00, -1.8048e+00, -3.3566e+00, -9.5693e-01, 6.4930e-01]], [[ 1.9988e+00, -2.0294e+00, -1.0833e+00, -4.3121e-01, -1.6040e+00, 5.5266e-01, -8.4819e-01, -1.4804e+00, -2.3129e-01, -1.2763e+00, -2.5031e+00, -1.5576e+00, 1.7922e+00, 4.9702e-01]], [[ 2.5560e+00, -1.4075e+00, 1.0618e-01, 4.0946e-01, -4.6552e-01, 1.4471e+00, -1.4208e-01, -1.2661e+00, -7.1264e-01, 2.2399e-01, -6.5707e+00, 9.9416e-01, 2.6765e+00, 1.5777e+00]]], [[[ 1.1440e+00, 1.6469e+00, 1.1490e+00, 1.1256e+00, 1.5455e+00, 5.0074e-01, 1.1284e+00, 1.2124e+00, 1.6497e+00, -7.3243e-02, 1.4875e+00, 1.3577e+00, 1.7624e+00, 1.4795e+00]], [[ 3.5659e+00, -7.9236e-01, -1.1997e+00, -1.7309e+00, -3.2799e-01, -6.0010e-01, -2.7681e-01, 3.0450e-01, -2.8867e-01, -2.6709e-02, -1.3399e+00, 3.1664e-02, -6.2913e-01, -6.1068e-01]], [[ 3.0440e+00, -9.3700e-01, -1.9159e+00, -2.6715e+00, -1.9942e+00, -1.0829e-01, -8.9399e-01, -8.9911e-01, -1.6377e+00, 1.6868e-01, -2.1409e+00, -4.3867e-03, -2.5707e+00, -1.5709e+00]], [[ 1.0780e+00, -1.8087e+00, -2.6186e+00, -3.1182e+00, -2.5699e+00, -1.1425e-01, 5.7875e-02, -6.3526e-01, -2.6474e+00, -8.4308e-01, -6.4933e-01, -3.6820e-01, -6.4878e-01, -1.0043e+00]], [[ 1.7468e+00, -1.4290e+00, -1.4109e+00, -1.7171e+00, -1.1495e+00, -1.8765e+00, -2.2832e+00, -1.0937e+00, -1.1551e+00, -1.3813e+00, -2.8571e+00, -1.4732e+00, -7.2326e-01, -6.4187e-01]], [[ 4.3769e+00, -5.5761e-03, -9.7737e-01, -2.1681e+00, -5.0843e-01, 2.6854e-01, 1.7140e+00, 8.2474e-01, 2.2410e-01, 2.9121e-01, 5.9197e-01, -1.8058e-01, 2.3604e-01, -3.9803e-01]], [[ 3.3522e+00, -1.6885e+00, -1.9588e+00, -2.0889e+00, -1.2665e+00, -8.5378e-01, -1.4936e+00, -1.2185e+00, -1.0780e+00, -3.8105e-02, -2.4736e+00, -1.4934e+00, -1.6155e+00, -1.7341e+00]], [[ 3.3648e+00, 4.3394e-01, -1.0808e+00, -1.1038e-01, 5.2720e-01, 7.5636e-01, -5.5973e-02, 1.3170e+00, -1.5693e-01, 8.0947e-01, -1.3675e+00, 6.0847e-01, -4.6073e-01, 1.1117e-01]], [[-2.1615e+00, 4.7110e+00, 5.6051e+00, 4.1183e+00, 3.7858e+00, 3.9400e+00, 3.8958e+00, 4.7543e+00, 3.7649e+00, 3.0202e+00, 2.3154e+00, 5.2153e+00, 5.6819e+00, 6.0614e+00]], [[ 4.2252e+00, -1.7786e+00, -2.4941e+00, -2.3624e+00, -1.9316e+00, -6.8048e-01, -6.2467e-01, -1.3671e+00, -1.0239e+00, 4.6745e-01, -1.1593e+00, -8.9196e-01, -1.4287e+00, -3.0130e-01]], [[ 2.8912e+00, -4.5854e-01, -7.6206e-01, -1.0633e+00, -9.6842e-01, 9.4719e-01, -3.3509e-01, 4.9979e-01, -1.1593e-01, -7.0002e-01, -4.3809e-01, 5.2715e-02, 5.5262e-01, 1.1068e+00]], [[ 3.0436e+00, -4.7702e-01, -4.1280e-01, -4.3226e-01, -7.4035e-01, 8.3281e-01, 1.0414e+00, 6.4792e-02, -7.2026e-01, -4.0857e-01, 2.0265e-02, -5.9446e-01, 1.2903e+00, 1.0080e+00]]], [[[ 2.4447e+00, -3.0362e-01, -1.2991e+00, -8.3920e-01, -1.7052e-01, 1.9360e-01, -6.0023e-01, -8.5584e-01, -1.7884e+00, -1.0877e+00, -2.2542e-01, -3.2320e-01, 1.4344e+00, 6.1532e-01]], [[ 3.4790e+00, -1.8377e-01, -1.2706e+00, -9.5829e-01, -8.1125e-01, -7.8573e-01, -5.6547e-01, -5.9502e-01, -1.6915e+00, -1.1802e+00, -2.0578e-01, -1.8878e+00, 1.8453e-01, -9.8195e-01]], [[ 3.2637e+00, -6.3196e-01, -1.0652e+00, -2.0153e+00, -1.4351e+00, -3.5377e-01, -7.9227e-01, -1.4512e+00, -2.3454e+00, -2.3398e+00, -1.3358e+00, -2.4202e+00, -2.3439e-01, -5.4628e-01]], [[ 1.2837e+00, -5.3806e-01, -2.5115e+00, -2.2505e+00, -2.0526e+00, -1.9118e-01, 4.6781e-01, 5.9592e-01, -2.3263e+00, -2.7871e+00, -5.4026e-01, -7.5110e-01, 6.7520e-01, -1.3837e+00]], [[ 2.1020e+00, -5.7114e-01, -1.3694e+00, -1.6475e+00, -1.8708e+00, -1.2742e+00, -2.4774e+00, -1.4247e+00, -1.4746e+00, -1.6513e+00, -2.2979e+00, -3.0026e+00, -9.0429e-01, -1.1312e+00]], [[ 3.7109e+00, -1.7165e-01, -2.5378e+00, -1.7895e+00, -2.8581e+00, 6.6063e-01, 7.6945e-01, -1.3097e+00, -2.6866e+00, -1.5724e+00, -8.6393e-01, 7.0319e-02, 2.2258e-01, 9.6225e-02]], [[ 3.4629e+00, -1.3537e+00, -2.2335e+00, -2.6533e+00, -1.9137e+00, -2.6676e-01, -1.5214e+00, -1.8149e+00, -2.8121e+00, -1.4776e+00, -8.3238e-01, -2.3470e+00, -8.6579e-01, -1.6999e+00]], [[ 3.3271e+00, 9.1775e-02, -9.9141e-01, -1.4315e+00, -5.3708e-01, 1.5208e+00, 5.0445e-02, -6.9894e-02, -1.0247e+00, -4.3795e-01, -4.3626e-01, -1.2817e+00, -3.3616e-02, -4.8500e-01]], [[ 2.2538e-01, 5.4550e+00, 5.1217e+00, 3.9117e+00, 5.0272e+00, 6.3576e+00, 7.0334e+00, 6.4204e+00, 4.7377e+00, 5.9001e+00, 5.0487e+00, 5.6676e+00, 6.7454e+00, 6.8836e+00]], [[ 4.1010e+00, -7.8708e-01, -2.0019e+00, -2.7606e+00, -2.0947e+00, 5.2533e-02, -5.8986e-01, -2.1756e+00, -3.3983e+00, -2.5276e+00, -6.8007e-01, -2.1310e+00, -1.1705e+00, -2.3972e+00]], [[ 3.8474e+00, 1.9982e+00, 7.5109e-01, -6.7636e-01, 3.1466e-01, -3.9014e-01, -7.5854e-01, 1.6097e+00, -3.7866e-01, -2.2729e-01, -1.7761e+00, -1.0441e+00, 3.1431e+00, 1.0590e+00]], [[ 1.2937e+00, 1.2994e+00, -1.4960e+00, -2.2281e+00, -2.2570e+00, -5.6089e-01, -8.6440e-01, 1.3503e+00, -1.5875e+00, -1.4391e+00, -1.0919e+00, -1.7443e+00, 4.1275e+00, 5.6255e+00]]]]) attn_weights tensor([[[[-1.1494, -3.2566, -2.3227, -1.6769, -2.9849, -2.2974, -2.6895, -3.3532, -2.1671, -1.3956, -1.7322, -2.7264, -2.1308, -1.9663, -3.5605]], [[-1.1273, 1.2522, -0.4758, -3.8933, -0.2416, -3.1712, -2.3491, 0.6110, -1.1092, -4.6021, -2.2149, -0.6172, -2.3099, -3.6249, 7.2574]], [[-1.7965, -2.2064, -2.5727, -2.8124, -3.1319, -2.9265, -2.9834, -2.3254, -2.6669, -2.8377, -2.6976, -3.1451, -3.1584, -2.8827, -1.7395]], [[-3.7731, -4.5937, -6.6297, -5.7159, -4.0861, -3.8828, -3.4813, -2.5867, -3.7333, -2.6124, -1.6900, 0.1370, 0.6127, 0.5763, 3.2184]], [[-1.3522, -4.0961, -4.3554, -2.2991, -3.1940, -2.9376, -1.8961, -3.2563, -3.0148, -0.7663, -0.7970, -1.1075, -0.5551, -0.5970, -0.0225]], [[ 2.1838, 3.1377, 3.9492, 2.0965, 4.4695, 0.6807, 1.3328, 1.8025, 2.9468, 1.2499, 0.8711, 3.8305, 2.2063, -0.0561, 6.1759]], [[-1.0834, -4.1986, -3.4912, -1.9652, -4.0627, -1.6548, -1.3294, -4.3443, -3.3435, -1.6635, -1.5573, -3.8383, -1.7146, -1.2562, -3.8928]], [[-6.0696, -7.6567, -7.5769, -7.6292, -7.2989, -7.5761, -6.9446, -6.1674, -5.7076, -5.7518, -4.7027, -4.6505, -4.5442, -4.6792, -3.7870]], [[-3.6532, -1.9069, -2.8763, -3.3990, -1.4321, -3.5792, -3.5399, -1.1634, -2.4567, -3.0693, -3.1134, -0.8971, -2.6845, -3.2187, -1.4326]], [[-1.5936, -1.8262, -1.8614, -2.4237, -1.9770, -2.7573, -2.7132, -1.9053, -1.8928, -2.4044, -2.3207, -1.8650, -2.0794, -2.6496, -1.6418]], [[ 0.1501, 0.1994, 0.1287, -0.6422, 0.1429, -0.9567, -0.8108, 0.0647, -0.0166, -0.7936, -0.7726, 0.0758, -0.6173, -1.0547, 1.2394]], [[-1.4857, -2.2334, -3.5815, -2.3541, -2.5841, -2.7652, -2.3984, -2.2653, -3.7980, -2.4063, -2.5599, -2.6244, -2.5316, -2.8011, -2.1773]]], [[[-1.0158, -3.3266, -1.4904, -1.3746, -2.9093, -1.8902, -1.8093, -3.3264, -3.3081, -1.1145, -0.9557, -1.3765, -3.0926, -1.9601, -3.1281]], [[-0.4253, 0.5792, -0.5599, -3.5398, 1.2246, -1.9637, -2.3397, -0.2462, 2.3817, -1.3542, -4.2783, -2.3463, 2.2284, -1.4584, 6.7123]], [[-1.9302, -2.4360, -2.6741, -2.2231, -3.1472, -2.7534, -3.3743, -2.5466, -2.0727, -2.7254, -2.1466, -1.9779, -1.6095, -2.6968, -2.0503]], [[-2.8491, -5.3056, -7.2219, -6.1744, -4.9140, -6.1465, -5.1917, -3.1516, -2.8908, -3.4417, -2.0159, -1.9984, -0.1364, 1.5766, 2.9606]], [[-0.6548, -2.7417, -2.8488, -1.1502, -2.3326, -2.1524, -1.4896, -1.6144, -0.8394, -0.9974, 0.9307, 1.2583, 0.3306, 1.7763, 2.0604]], [[ 2.9851, 3.0679, 2.4955, 1.0352, 3.0455, 1.8401, 0.5928, 1.6061, 2.7496, 1.2378, -0.0519, -0.2462, 1.2080, 1.8109, 7.7504]], [[-0.7965, -3.6863, -3.1173, -1.6173, -3.4011, -1.0714, -0.8707, -3.8311, -3.4721, -2.9562, -1.2860, -1.1005, -3.4005, -2.6766, -2.9767]], [[-5.8870, -7.4629, -7.2939, -7.3535, -7.1504, -7.2854, -6.9666, -5.8033, -5.4827, -4.9947, -4.9241, -4.3753, -4.1387, -3.3447, -3.2358]], [[-3.2719, -1.8216, -2.5328, -3.0681, -1.1809, -3.2740, -3.6602, -0.9918, -0.8338, -1.9711, -2.6188, -2.7531, -0.6739, -1.6345, -1.3905]], [[-1.6762, -2.0087, -2.1003, -2.5640, -2.1464, -2.6295, -2.7157, -2.0772, -1.9128, -2.1053, -2.5146, -2.0826, -1.7660, -2.2236, -1.8962]], [[-0.0806, -0.3663, -0.4108, -0.9666, -0.2513, -0.8438, -0.9863, -0.3754, -0.2236, -0.4410, -1.0112, -0.7012, -0.1528, -0.5526, 0.7988]], [[-1.3218, -2.1311, -3.5958, -2.5077, -2.8531, -2.7908, -2.1902, -2.1925, -2.1614, -3.8768, -2.5981, -2.4081, -2.2562, -2.9552, -2.0684]]], [[[-1.2101, -2.9674, -2.1610, -1.8261, -3.0930, -2.7552, -2.2332, -3.1006, -2.2257, -2.0031, -1.8079, -2.0425, -2.1296, -2.0425, -3.3494]], [[-1.5440, 1.6740, -0.8732, -3.9402, -1.8379, -4.0284, -2.9728, 1.2189, -1.9798, -1.6059, -3.6133, -4.1545, -3.6726, -2.2844, 6.0910]], [[-1.3636, -1.8569, -2.2018, -2.7492, -2.5278, -2.3197, -2.6527, -2.1204, -1.8043, -2.3700, -2.5521, -2.7106, -2.4527, -2.3271, -2.0421]], [[-4.1280, -5.9752, -6.2455, -6.3713, -5.4155, -4.8611, -2.7198, -3.8396, -3.0181, -2.5141, -1.2257, -2.6125, -0.7762, -0.4767, 1.8136]], [[-1.5128, -3.7672, -4.2468, -3.1604, -3.6174, -2.6735, -1.1974, -3.1062, -2.5928, -2.6284, -0.7825, -1.9775, 0.1432, -0.1314, -0.1967]], [[ 0.6191, 3.1698, 2.8224, 1.1365, 4.5164, 0.7205, 0.5153, 2.3187, 1.8174, 1.9598, 0.4881, 1.2752, 1.6797, 1.4945, 4.8575]], [[-1.1853, -4.1301, -3.6559, -2.4074, -4.1704, -1.3747, -1.4365, -4.3880, -2.9506, -3.5541, -2.1245, -2.4908, -2.1046, -2.2456, -4.3337]], [[-6.1713, -7.6690, -7.5433, -7.3865, -7.1402, -6.9087, -6.5319, -6.1026, -5.8799, -5.1425, -5.1531, -4.7792, -4.0297, -3.4819, -3.8406]], [[-3.6185, -1.9341, -3.0588, -3.3587, -0.9855, -3.4591, -3.3312, -1.1539, -2.5579, -2.5876, -2.7542, -3.7751, -2.4450, -2.5105, -1.2428]], [[-1.5375, -1.8071, -1.9373, -2.4620, -1.9462, -2.5036, -2.5549, -1.9225, -1.8137, -1.9743, -2.3655, -2.3500, -2.1464, -1.9678, -1.6954]], [[ 0.4013, 0.4956, 0.0920, -0.4570, 0.3372, -0.4157, -0.5066, 0.3382, -0.1394, -0.1480, -0.7067, -0.7731, -0.8433, 0.0542, 1.2606]], [[-1.7213, -2.3993, -3.6384, -2.5684, -2.7881, -2.5401, -2.1746, -2.3146, -2.4894, -3.7530, -2.5194, -2.8986, -2.6418, -2.6882, -3.2577]]], [[[-1.2361, -3.1135, -1.4404, -1.5530, -2.5574, -2.3975, -2.3365, -3.1734, -2.4191, -1.6319, -2.1549, -2.1882, -0.8045, -2.1727, -2.3235]], [[-0.7751, 1.0589, 1.4459, -0.0357, 2.9144, -2.7271, -1.9868, 0.1423, 2.7665, -0.6554, -2.1441, 0.1901, 2.2924, -0.2378, 8.0667]], [[-1.8114, -2.4101, -2.5113, -2.1535, -3.1167, -2.4159, -3.1630, -2.5705, -3.1760, -3.1420, -3.1492, -1.9560, -2.3847, -2.5259, -2.9343]], [[-4.9883, -8.2865, -9.1266, -6.3881, -7.1694, -8.8200, -6.9986, -5.1661, -4.1432, -5.7129, -4.1507, -2.4680, 0.4283, -0.3244, 3.5923]], [[-0.2295, -2.2579, -2.0790, -0.3698, -1.4759, -1.7781, -0.7385, -1.1869, -0.4954, -1.0262, 0.3193, 0.0890, 1.3202, 1.9587, 2.5319]], [[ 3.7793, 3.4209, 3.0411, 0.9798, 3.0776, 2.3821, 0.0896, 1.3211, 2.3526, -0.7523, -0.4001, 0.5510, 1.4126, 0.4623, 9.3444]], [[-0.5534, -3.5968, -3.1058, -1.2359, -3.4486, -0.7551, -0.9894, -3.7353, -3.3483, -0.3321, -0.7938, -1.7612, -2.3892, -2.6374, -1.5807]], [[-5.7570, -7.4427, -7.3621, -7.4603, -7.0091, -6.8298, -7.3465, -5.7366, -5.5534, -6.1981, -5.8173, -3.7192, -3.6065, -3.5923, -3.5935]], [[-3.6801, -2.4180, -3.1557, -3.4626, -2.1376, -3.2904, -3.6271, -1.6187, -1.8004, -3.4683, -3.3717, -2.9370, -2.1712, -1.6052, -2.6477]], [[-1.7393, -2.1417, -2.1606, -2.6829, -2.2658, -2.6380, -2.9927, -2.2437, -2.2376, -2.5956, -2.9404, -1.9720, -1.9336, -2.1369, -2.3399]], [[ 0.0406, -0.0831, 0.0637, -0.6674, 0.0589, -1.0090, -1.1707, -0.1073, 0.0337, -0.5792, -1.2022, -0.4142, 0.3071, -0.1112, 1.1761]], [[-1.2186, -2.2237, -3.6280, -2.2865, -2.8382, -2.7030, -2.3624, -2.2442, -2.8959, -2.2113, -2.3768, -2.3765, -3.1603, -2.6916, -2.4065]]], [[[-0.7579, -3.7754, -1.6282, -2.7243, -3.4844, -2.9073, -3.3988, -4.2048, -3.6840, -3.0750, -2.3520, -3.2437, -4.0460, -3.6601, -3.6418]], [[-0.8832, 0.9394, -0.9533, -2.8901, -1.1598, -3.8210, -3.4253, 0.8117, -1.6632, -1.9033, -3.0239, -3.5896, 1.2546, 4.6602, 4.6734]], [[-1.3232, -2.4251, -1.3635, -0.9840, -3.5120, -2.9946, -3.0099, -2.5026, -2.4604, -3.5254, -3.0567, -2.9775, -1.8466, -3.2093, -3.1947]], [[-3.3200, -5.6776, -5.7875, -6.1530, -5.7100, -6.0267, -7.2103, -3.6339, -3.8380, -2.8187, -3.5695, -4.3629, -2.0698, -0.4313, 0.1940]], [[-0.3448, -2.2066, -1.3621, -1.0399, -1.4341, -2.0946, -1.7809, -1.3976, -0.2023, 0.0607, -0.2447, -0.4357, -0.0147, 1.3182, 1.6250]], [[ 2.1041, 2.6897, 1.4669, -1.3442, 0.5459, -0.0229, -2.2159, 1.3868, 0.4392, -1.3481, -1.6453, -2.6186, 1.6534, 8.9225, 8.9015]], [[ 0.4368, -4.0933, -3.0438, -2.3107, -4.2683, -1.0732, -1.0058, -4.6741, -3.4615, -3.9001, -0.8272, -0.8492, -4.8004, -4.5898, -4.5758]], [[-5.3699, -6.9153, -6.6735, -6.4482, -6.5213, -6.6071, -6.2410, -5.1709, -4.9311, -4.6434, -4.8052, -4.3227, -2.0560, -2.9602, -2.5422]], [[-2.5222, -1.1805, -2.2097, -3.6673, -1.5690, -3.8811, -3.3205, -0.9873, -2.6599, -1.9639, -3.4607, -3.1856, -0.7108, -0.4690, -0.4446]], [[-1.1245, -1.4252, -1.3402, -1.8343, -1.5912, -2.0461, -2.1991, -1.5635, -1.7090, -1.6673, -2.0750, -2.1502, -1.3795, -1.0673, -1.0427]], [[ 0.5021, 0.1461, 0.1947, -0.2340, -0.0154, -0.4489, -0.8052, 0.1382, -0.1254, -0.1823, -0.4778, -0.8416, 0.2846, 0.3827, 0.3851]], [[-1.0958, -2.1763, -3.2163, -2.3041, -2.4236, -2.3379, -1.9190, -2.1256, -2.2608, -2.4257, -2.1368, -1.9321, -1.9551, -1.6984, -1.6949]]]]) attn_weights tensor([[[[-1.7761, -3.7787, -3.5584, -3.1608, -2.4530, -2.5465, -1.7350, -1.6346, -1.8008, -1.6164, 0.2356, -0.1530, -0.5397, -0.7948, -0.6890]], [[-0.7094, -1.8670, -2.5072, -2.4224, -2.2031, -2.5385, -2.0060, -0.1506, -0.8598, -0.8880, -1.0657, -0.2488, -0.6841, -0.6822, 0.0918]], [[-3.1585, -3.9537, -3.6721, -4.0417, -3.4603, -3.6700, -3.3075, -2.7315, -2.9370, -3.3263, -2.7010, -2.7355, -2.9356, -2.6680, -2.2747]], [[ 0.1119, -3.3259, -3.2065, -3.2588, -3.1213, -2.9483, -2.7388, -2.5584, -2.6340, -2.7461, -2.2375, -2.5033, -2.4732, -2.2680, -2.0549]], [[-0.6573, -2.5596, -2.7721, -2.8312, -2.6195, -2.2628, -2.1871, -2.1295, -2.2689, -2.3186, -1.7207, -2.0179, -1.8481, -1.5479, -1.5770]], [[ 0.9672, -0.3851, -2.2813, -1.1166, -0.4001, -2.5564, -2.3369, -0.3117, -2.4315, -1.4202, -1.3128, -0.6194, -1.4092, -3.3828, 2.1921]], [[ 0.1161, -1.6583, -1.7065, -1.7706, -1.6069, -1.7764, -1.2491, -1.4245, -2.0002, -2.2222, -1.3577, -1.8070, -1.3662, -2.6667, -2.3709]], [[ 0.2052, -1.5359, -2.0635, -1.9657, -1.9096, -1.2689, -1.2319, -1.2780, -2.0958, -2.1206, -1.1935, -1.7772, -1.4916, -1.7413, -1.2288]], [[-0.6672, -1.6198, -2.1437, -2.3656, -1.8510, -2.3814, -2.5222, -1.7617, -2.0529, -2.2557, -2.2832, -1.7611, -2.1582, -2.1006, -1.7381]], [[ 1.2850, -0.6502, -0.0753, -0.6817, 0.1540, -1.2042, -1.3837, -0.9467, -0.1267, -0.6358, -1.1806, 0.0948, -0.2605, -0.9043, -0.3670]], [[-4.7095, -2.4229, -2.3226, -2.3297, -2.2601, -1.8214, -1.6461, -1.7085, -1.6757, -1.7297, -0.9956, -1.5454, -1.3458, -1.0178, -0.8994]], [[ 1.2541, 0.5883, -2.6377, -3.1089, -0.7051, -3.8301, -3.9225, 0.5608, -2.5227, -2.9613, -3.0097, -0.5498, -2.3909, -3.8329, 3.6094]]], [[[-1.5638, -3.6527, -2.9823, -2.7487, -1.9441, -3.2322, -2.8038, -1.6271, -1.3565, -1.0290, -0.9389, 0.1723, -0.0175, 0.2791, -1.7660]], [[-0.6802, -1.9970, -2.4830, -2.6257, -2.2701, -2.3336, -2.1760, -0.4542, -0.4539, -0.7614, -0.8996, -0.2557, 0.0699, 0.0178, -0.1085]], [[-3.2818, -4.0706, -3.8292, -4.1528, -3.5481, -3.7981, -3.4198, -2.8449, -2.9732, -3.0478, -3.3510, -3.1295, -2.6416, -2.8693, -2.4844]], [[ 0.0978, -3.4117, -3.3003, -3.3337, -3.1862, -2.9841, -2.7914, -2.6233, -2.6246, -2.6213, -2.7089, -2.5155, -2.3587, -2.3866, -2.1093]], [[-0.6278, -2.5731, -2.8228, -2.7729, -2.5961, -2.2878, -2.1976, -2.1328, -2.1949, -2.1990, -2.1547, -1.7844, -1.7847, -1.6795, -1.5547]], [[ 0.9998, 0.0927, -1.3049, -0.7558, -0.0803, -1.7095, -2.9857, 0.0799, -0.2115, -1.8680, -1.3080, -1.5320, -0.9952, -0.3897, 2.1867]], [[ 0.2271, -2.0032, -1.8346, -2.3540, -1.8399, -1.6000, -1.8545, -1.6162, -1.8203, -1.7838, -2.7678, -1.1948, -1.6582, -1.9552, -3.0428]], [[ 0.4307, -1.5881, -1.7858, -1.7778, -2.0711, -1.3335, -1.0169, -1.1856, -1.5558, -1.7583, -1.8573, -1.2829, -1.2337, -1.4429, -1.1259]], [[-0.5317, -1.5380, -2.0772, -2.1236, -1.7854, -2.3969, -2.6130, -1.5442, -1.7759, -1.9591, -1.9886, -2.1700, -1.7169, -1.6397, -1.7294]], [[ 1.3889, -0.3346, 0.1219, -0.3052, 0.4710, -1.1671, -1.0519, -0.7355, -0.6425, 0.0170, -0.3108, -0.3442, -0.4756, 0.1014, -0.0443]], [[-4.8489, -2.5098, -2.3672, -2.3784, -2.2879, -1.9061, -1.7110, -1.7760, -1.7616, -1.5977, -1.6547, -1.3641, -1.3137, -1.2781, -0.9900]], [[ 2.2086, 1.2045, -2.5818, -1.7864, -0.5645, -1.3616, -3.6679, 1.3063, 1.2059, -2.8497, -1.7494, -1.4900, 0.5526, 0.0371, 4.8974]]], [[[-2.6474, -4.7147, -4.9339, -4.2757, -2.6258, -2.8468, -1.8203, -2.3462, -2.6097, -2.8377, -1.9927, -2.3936, -1.3474, 0.0819, -1.9303]], [[-0.1781, -1.3062, -1.7188, -1.7149, -1.4292, -1.5550, -1.4045, 0.2786, -0.3853, 0.0904, -0.7770, -0.4056, 0.4689, 0.3171, -0.0286]], [[-2.9959, -3.8773, -3.6083, -3.9253, -3.3391, -3.5497, -3.1787, -2.6240, -3.0821, -2.8005, -3.4556, -3.3430, -2.7122, -3.0073, -2.4760]], [[ 0.0604, -3.2535, -3.1654, -3.2108, -3.0665, -2.8459, -2.6542, -2.5031, -2.6655, -2.5002, -2.8294, -2.8240, -2.3352, -2.4476, -2.3099]], [[-0.6139, -2.5090, -2.7647, -2.7377, -2.5412, -2.1324, -2.0863, -2.1190, -2.2584, -2.1870, -2.4496, -2.3176, -1.5870, -1.9324, -1.8569]], [[ 1.0414, -0.5483, -1.9331, -1.6007, -0.0197, -2.2735, -2.4186, -0.1812, -0.7794, -2.0988, -1.8453, -1.0992, -0.9743, -0.7535, 2.7155]], [[ 1.3695, -0.6307, -0.8387, -0.7777, -0.2263, -1.0893, -0.2822, -0.5918, -0.9455, -1.2127, -1.4621, -0.9412, -0.5073, -0.9970, -0.7215]], [[ 1.3332, -0.6753, -1.3190, -1.1512, -1.0686, -0.2690, -0.4309, -0.4149, -1.1426, -1.4534, -1.4072, -1.0947, -0.8623, -1.1231, -0.1985]], [[-0.6483, -1.7703, -2.1340, -2.3193, -1.8137, -2.4854, -2.6157, -1.7300, -2.0263, -2.0026, -2.3704, -2.0515, -2.1148, -2.3300, -2.0720]], [[ 1.3144, -0.7154, -0.0520, -0.4898, 0.2591, -1.0131, -1.1692, -0.9717, -0.1947, -0.0774, -0.5249, -0.1364, -0.1643, -0.4271, -0.8101]], [[-4.8134, -2.4261, -2.3379, -2.3236, -2.2867, -1.8163, -1.6476, -1.7475, -1.7101, -1.5989, -1.9281, -1.8286, -1.2060, -1.3871, -1.4168]], [[ 1.6064, 0.7601, -2.7454, -2.6209, 0.1410, -2.7717, -4.0036, 0.5910, -2.3042, -2.5630, -2.8986, -1.3847, -1.4232, -1.9123, 3.3476]]], [[[-1.4121, -3.3064, -2.0104, -1.4558, -2.1758, -3.4235, -3.4838, -1.5267, -1.1510, -2.5597, -2.7704, -1.2223, 0.9035, 2.3055, 0.0365]], [[-0.9212, -2.1948, -2.5736, -2.6598, -2.1232, -2.7221, -2.1404, -0.3485, -0.9148, -1.5524, -1.1170, 0.8657, 0.7148, 1.0387, -0.3854]], [[-3.2629, -4.0281, -3.8093, -4.1791, -3.5525, -3.7907, -3.4074, -2.8474, -3.1487, -3.4020, -2.9681, -2.5737, -2.7837, -2.6922, -2.8345]], [[ 0.0676, -3.3526, -3.2640, -3.3345, -3.1551, -2.9319, -2.7689, -2.6281, -2.7998, -2.6536, -2.4154, -1.9985, -2.2504, -2.2883, -2.3510]], [[-0.5807, -2.5049, -2.7159, -2.7101, -2.5537, -2.2283, -2.1240, -2.0959, -2.2373, -1.6981, -1.7734, -1.6374, -1.6485, -1.6335, -1.7023]], [[ 1.3321, 0.6852, -0.7081, -0.3239, -0.0366, -2.1659, -2.7743, 0.7163, -0.2308, -3.1470, -3.1662, -1.2673, -0.6862, 0.4970, 1.1514]], [[ 2.3739, 0.3170, -0.0496, 0.4568, 0.8302, 0.1643, -0.2097, -0.1367, 0.6854, -0.8050, -0.6863, 0.9559, 0.5334, 0.9640, 0.7308]], [[ 0.6829, -1.3284, -1.6369, -1.0179, -1.5715, -1.0936, -0.7018, -1.0461, -1.5638, -1.1684, -1.0928, -0.3211, -1.2232, -0.3265, -0.6948]], [[-0.7556, -1.6243, -2.4192, -2.3097, -1.7066, -2.2877, -2.4820, -1.7641, -1.6929, -2.6741, -2.3241, -1.7145, -2.0084, -1.6179, -1.9311]], [[ 1.2552, -0.5713, 0.1156, -0.7988, 0.2045, -1.1716, -1.2510, -0.8321, 0.3092, -1.6957, -1.0270, -0.2029, 0.4250, -0.0954, -0.2901]], [[-4.9270, -2.5077, -2.3956, -2.4484, -2.2890, -1.9331, -1.7192, -1.8261, -1.8997, -1.5252, -1.2983, -1.0376, -1.1525, -1.3059, -1.2675]], [[ 0.9544, 0.4339, -2.7503, -1.5997, -3.0682, -2.8208, -5.3310, 0.7539, -3.3153, -3.4404, -5.5323, 0.2940, -2.4556, -0.5647, 3.8716]]], [[[-0.4590, -1.8712, -1.7114, -1.8188, -1.7180, -1.6897, -1.8278, -1.0613, -0.9001, -0.6531, -1.2004, -1.2323, 0.3138, 0.2111, 0.2845]], [[-0.2656, -1.3772, -1.9977, -2.3025, -1.6350, -1.9802, -1.4034, -0.4293, -1.3988, -0.7117, -0.7658, -0.6264, 1.5494, 0.9251, 1.0135]], [[-3.1302, -4.0300, -3.6394, -3.9871, -3.4279, -3.7246, -3.3237, -2.7926, -3.2982, -2.9778, -2.9532, -2.7387, -2.2926, -2.3604, -2.1939]], [[ 0.2569, -3.1980, -3.0469, -3.1027, -3.0117, -2.8517, -2.6847, -2.6038, -2.8660, -2.6845, -2.3749, -2.3089, -1.9417, -1.9838, -1.9123]], [[-0.4063, -2.3602, -2.4895, -2.5520, -2.4838, -2.0269, -1.8927, -2.1869, -2.2106, -2.0572, -1.4384, -1.3763, -1.6034, -1.3134, -1.1841]], [[ 1.6996, -0.0200, -0.8993, -2.4775, 0.8527, -1.6720, -2.5867, -0.5272, -1.9528, 0.7324, -1.6602, -2.9821, -0.2068, 3.3994, 3.0583]], [[ 1.4657, -0.4200, -1.1951, -1.3309, -1.5247, -1.5087, -1.3573, -0.8268, -2.2173, -1.8457, -0.8514, -1.6548, 0.6317, 0.0922, 0.2115]], [[ 0.6704, -1.8785, -0.9437, -1.0677, -1.7346, -1.0631, -0.7005, -1.5000, -1.4561, -1.5533, -0.8897, -1.0592, -1.2636, -1.3681, -1.1640]], [[ 0.8573, 0.2017, -0.2496, -0.3342, -0.0370, -0.4445, -0.6799, -0.0426, -0.1146, -0.0636, -0.5072, -0.6524, 0.2544, 0.0172, 0.1229]], [[ 1.5050, -0.3949, -0.0564, -0.2915, 0.3900, -0.6300, -0.7027, -0.8759, -0.1374, 0.4051, -0.8169, -0.5021, -0.7281, -0.2766, -0.3230]], [[-4.9024, -2.2463, -2.0937, -2.1533, -2.1139, -1.7466, -1.5502, -1.6590, -1.7515, -1.6495, -1.0929, -1.0755, -0.9151, -0.9726, -0.8517]], [[ 0.7595, -0.2022, -1.4219, -1.0920, -0.4192, -1.8759, -1.6227, -0.5795, -1.9686, -0.8545, -2.3804, -2.2750, 0.1393, 0.9286, 0.7904]]]]) attn_weights tensor([[[[ -1.9308, -5.1005, -4.7339, -5.3565, -4.9724, -4.6768, -5.0871, -3.3880, -2.7869, -3.6023, -2.1632, -2.6127, -2.6353, -2.6944, -1.1357]], [[ 1.6737, -1.5252, -2.3032, -1.2089, -1.9816, -2.2887, -2.0333, -1.6397, -3.2771, -2.1010, -1.7519, -2.4307, -1.5917, -3.3952, -1.4246]], [[ -6.2599, -15.1166, -14.7269, -14.5667, -13.5413, -11.9424, -10.7323, -9.4945, -8.1103, -8.1315, -5.5023, -5.0931, -5.0732, -3.4944, -5.4052]], [[ -2.5869, -7.0429, -6.0308, -7.5277, -5.0594, -6.7437, -5.6044, -4.8909, -3.3027, -4.6031, -2.5805, -1.4017, -1.1497, -3.0771, -2.4332]], [[ -2.7709, -6.7672, -7.1115, -8.6376, -7.5221, -6.4691, -4.9156, -3.8421, -4.2585, -5.6569, -1.9173, -3.4650, -3.2713, -2.9369, -2.5480]], [[ -4.0420, -7.6171, -8.8027, -7.8192, -8.3085, -7.8554, -7.3265, -4.1595, -4.9765, -4.1247, -4.1602, -3.6363, -4.3115, -3.0214, -3.2735]], [[ -0.2569, -3.3624, -3.3987, -3.5865, -3.5696, -4.6753, -4.5282, -1.9910, -2.2504, -2.7040, -2.9796, -2.3370, -3.0281, -3.5269, -2.0284]], [[ -1.2966, -4.2399, -2.9267, -2.7705, -2.7844, -1.9603, -2.1035, -1.9292, -1.3024, -1.5539, -1.2109, -1.3910, -0.9991, -0.3259, -1.0626]], [[ -3.3581, -7.2546, -7.9394, -5.7888, -7.3362, -7.1753, -6.3585, -4.4500, -4.7458, -2.7519, -1.1870, -3.4646, -2.7941, -3.5498, -2.7864]], [[ -4.3772, -9.3463, -9.0459, -9.6152, -9.3046, -6.1258, -5.5671, -6.2470, -5.5649, -6.0169, -3.2977, -4.6769, -2.7764, -1.6205, -4.2758]], [[ -1.8483, -3.8642, -3.6812, -3.5415, -3.6012, -2.8414, -2.8110, -3.0567, -2.6930, -2.6545, -1.8125, -2.4422, -2.1052, -1.5866, -1.7076]], [[ -0.6612, -5.1689, -5.0974, -4.8669, -4.7357, -4.1808, -4.1688, -4.1145, -3.9079, -3.7837, -3.1297, -3.3561, -3.0408, -2.7144, -2.8447]]], [[[ -2.2294, -5.1879, -5.0499, -6.5926, -5.4933, -4.5799, -5.0652, -3.2863, -2.5767, -3.2297, -4.7096, -2.5666, -1.4847, -4.2119, -1.9501]], [[ 1.4576, -0.9950, -2.2646, -1.7198, -2.6375, -1.3526, -2.1928, -1.6508, -2.0001, -3.5143, -2.5666, -1.9910, -2.0831, -1.8134, -2.1665]], [[ -6.1389, -15.4709, -15.2379, -14.5251, -11.8932, -13.1192, -10.9583, -10.1411, -8.0270, -7.6710, -7.0663, -4.9115, -4.5477, -3.4758, -5.8677]], [[ -2.5729, -7.3690, -6.0154, -7.1170, -3.9963, -6.3593, -5.2427, -4.8018, -3.2576, -2.7354, -3.4878, -1.7514, -2.3882, -1.6291, -2.1714]], [[ -2.6053, -7.3110, -7.3524, -8.2384, -7.2139, -9.1484, -7.8616, -4.5542, -3.8095, -3.5961, -4.7062, -3.2498, -2.6753, -3.7685, -3.3743]], [[ -4.0085, -8.0032, -8.4470, -8.6698, -8.2867, -8.7911, -7.8264, -4.4494, -3.8905, -4.2070, -4.2878, -5.1337, -2.9699, -2.8639, -3.6854]], [[ -0.3951, -3.5703, -3.4450, -4.2187, -3.5499, -4.1237, -4.0220, -1.9361, -1.8495, -2.0850, -3.1137, -3.2289, -2.5355, -2.8414, -2.0019]], [[ -1.3835, -4.4143, -2.9969, -2.7761, -2.7900, -1.9600, -2.0153, -1.9359, -1.8589, -1.1408, -1.3197, -1.6224, -1.3935, -1.2869, -1.0246]], [[ -3.4450, -7.8709, -8.6098, -6.8300, -6.5067, -6.8070, -6.6533, -4.7527, -4.4277, -4.7140, -3.0771, -4.3749, -2.1573, -0.7596, -3.4924]], [[ -4.2271, -9.2552, -8.3917, -9.6022, -8.8025, -5.7578, -6.3252, -6.3316, -5.8239, -4.0762, -5.2208, -3.0707, -4.0092, -3.7018, -4.3428]], [[ -1.6941, -4.2178, -3.7526, -3.3767, -3.7017, -2.7970, -2.6460, -3.2286, -2.9051, -2.4400, -2.2497, -1.9886, -2.2574, -1.7319, -1.8433]], [[ -0.7676, -5.5124, -5.2275, -4.9990, -4.9960, -4.3293, -4.2039, -4.3632, -4.2000, -3.6245, -3.5934, -3.2730, -3.3908, -2.9229, -3.0828]]], [[[ -2.2583, -4.7333, -4.8424, -5.4503, -5.3412, -4.4571, -4.1436, -2.9537, -3.3894, -2.6156, -2.5548, -1.6270, -2.1111, -1.6301, -1.6315]], [[ 1.9063, -1.2511, -2.4730, -1.5893, -2.1449, -1.9842, -2.3397, -1.4057, -2.0326, -3.4227, -2.9251, -2.2037, -1.9926, -2.4803, -1.1687]], [[ -7.3702, -15.5573, -15.7220, -15.2199, -13.9126, -11.2721, -9.4572, -9.1070, -8.3866, -7.1710, -7.8450, -7.1490, -5.2583, -2.1733, -6.6179]], [[ -2.9571, -7.6993, -6.8385, -7.9015, -4.9033, -7.2115, -6.2837, -4.6747, -4.1726, -2.8920, -4.0050, -3.3370, -2.1043, -1.1395, -3.5804]], [[ -4.4184, -8.5881, -10.8909, -9.5544, -9.1824, -6.3340, -4.9818, -5.4465, -9.0248, -6.8077, -6.1131, -5.2498, -6.0761, -2.2073, -4.6958]], [[ -4.2710, -7.5983, -8.4165, -8.0299, -8.5593, -7.0913, -7.2386, -3.7881, -4.6605, -3.6688, -4.6364, -3.6105, -3.4664, -2.9034, -3.9346]], [[ -0.4999, -3.3421, -3.3077, -4.0306, -3.3150, -4.0941, -3.8079, -1.8503, -1.9114, -2.0222, -3.1691, -3.1396, -2.7301, -3.0008, -1.9491]], [[ -1.3568, -4.3015, -2.9754, -2.7447, -2.7488, -1.8037, -1.9390, -1.8490, -1.5739, -1.1045, -1.8265, -1.9034, -1.1536, -1.4019, -1.4243]], [[ -3.3250, -7.0854, -8.7848, -5.8296, -7.5579, -6.5598, -5.9357, -3.7981, -5.1925, -4.6440, -3.7208, -3.1902, -0.4521, -3.3349, -3.3502]], [[ -4.5184, -9.3012, -8.3948, -9.5429, -9.2082, -6.0599, -5.8556, -6.2227, -6.0122, -4.1160, -5.1504, -5.2427, -3.2638, -2.7516, -4.9680]], [[ -1.6251, -3.7156, -3.5646, -3.2899, -3.5187, -2.5071, -2.4937, -2.9588, -2.2679, -2.3388, -2.5913, -2.2776, -1.6576, -1.7850, -2.0680]], [[ -0.7774, -5.3419, -5.1456, -4.8446, -4.8861, -4.2330, -4.1569, -4.1143, -3.7118, -3.5579, -3.7824, -3.7108, -3.1853, -3.0840, -3.2611]]], [[[ -1.8941, -5.0129, -4.4259, -5.3911, -4.9343, -4.8000, -4.3669, -4.0832, -3.9721, -3.5829, -3.6771, -2.9036, -2.4177, -2.3909, -1.8175]], [[ 1.5020, -0.9644, -2.0314, -1.7692, -2.6253, -2.2604, -2.6105, -1.6281, -3.1712, -2.2918, -3.7317, -1.4810, -2.6189, -1.7914, -1.6584]], [[ -7.7586, -15.0687, -13.1303, -15.2894, -12.3525, -12.8486, -11.6336, -9.5684, -8.0453, -8.6584, -7.6341, -6.4042, -3.3377, -4.7465, -6.0955]], [[ -3.3206, -7.2091, -7.0842, -8.1430, -5.0727, -7.4899, -7.0309, -5.0055, -3.1988, -4.2776, -5.5258, -2.7261, -1.3835, -3.0825, -2.9364]], [[ -2.4196, -6.2859, -7.0282, -7.3975, -5.7208, -10.0818, -7.5364, -4.0454, -3.8890, -6.6135, -6.0566, -1.9962, -2.0997, -1.6887, -3.7061]], [[ -4.1135, -7.7731, -8.8652, -9.2817, -7.7198, -8.1675, -7.4503, -4.4019, -5.3905, -5.9579, -4.8785, -2.4684, -3.0843, -2.9164, -4.4456]], [[ -1.6220, -4.5702, -3.7099, -4.3919, -4.0377, -4.2188, -4.2444, -3.3679, -3.1348, -3.7883, -3.5639, -1.3714, -1.4775, -2.3706, -2.4051]], [[ -1.2905, -4.2974, -3.0087, -2.7560, -2.7556, -1.9474, -2.0455, -1.9590, -1.7984, -1.4634, -0.9970, -0.8126, -0.6814, -0.9255, -1.1896]], [[ -3.4944, -6.9312, -9.1220, -5.6583, -5.8650, -7.1027, -6.8831, -4.3424, -4.1987, -5.5369, -5.3144, -3.2000, -3.0021, -0.8323, -3.0459]], [[ -4.3551, -8.8569, -8.3040, -9.9567, -8.0939, -6.1642, -6.5208, -6.7207, -6.0525, -4.5183, -4.5231, -3.7246, -2.2832, -4.1935, -3.7574]], [[ -2.0073, -3.8411, -3.7288, -3.4367, -3.6290, -3.0096, -2.7861, -3.1483, -3.0612, -2.2497, -2.2364, -2.0093, -1.6483, -1.8080, -1.5391]], [[ -0.8017, -5.4977, -5.3831, -5.1676, -5.0700, -4.5433, -4.2898, -4.5209, -4.3235, -3.8002, -3.5914, -3.2078, -2.9543, -3.1307, -2.8356]]], [[[ -0.9185, -3.5263, -2.0725, -2.6687, -2.9009, -4.2344, -3.8936, -2.8800, -2.1276, -2.3999, -2.9807, -3.1212, -2.4386, -2.6307, -2.3603]], [[ 1.7052, -1.7826, -1.1245, -1.1887, -2.1473, -1.9818, -1.9370, -1.4812, -1.3000, -2.3287, -1.9095, -3.7918, -1.2680, -1.8164, -1.7959]], [[ -5.7548, -13.2264, -12.5880, -12.4325, -12.0425, -12.3422, -10.8090, -9.8825, -8.5302, -8.4287, -7.7073, -6.3564, -3.2152, -4.9448, -4.3173]], [[ -2.3147, -4.8088, -4.5259, -5.1915, -4.0069, -5.2672, -5.0844, -3.4271, -3.5869, -2.5412, -3.8999, -3.6381, -2.0257, -1.2879, -1.2372]], [[ -1.4587, -3.7896, -6.3287, -6.0254, -4.6093, -7.3414, -8.3461, -2.9735, -5.2765, -3.9043, -5.7471, -7.0734, -0.1851, -2.6146, -2.6757]], [[ -3.7453, -6.0247, -7.0972, -7.0871, -6.8939, -7.9216, -7.4603, -3.8213, -5.5241, -4.9254, -5.2325, -4.6484, -1.1186, -3.1140, -2.7951]], [[ -2.0653, -5.1972, -3.2424, -3.3262, -3.2872, -3.8459, -3.5214, -4.0577, -2.4716, -2.4600, -2.7513, -2.8561, -0.9170, -0.2543, -0.2825]], [[ -1.2235, -3.5158, -2.0227, -1.9818, -1.9195, -1.0826, -1.1253, -1.3542, -1.3293, -1.2790, -0.4026, -0.0622, -0.6520, -0.3726, -0.0708]], [[ -1.9792, -4.7681, -5.6302, -4.6556, -5.1261, -5.2660, -6.2645, -3.5058, -2.8947, -3.8969, -5.1420, -5.0965, -1.4705, -2.1748, -2.0524]], [[ -3.3394, -6.9644, -6.8876, -6.7762, -6.8743, -5.5109, -5.3622, -5.2325, -4.4747, -4.8127, -3.9250, -3.3784, -1.8709, -3.0042, -2.8026]], [[ -0.3817, -3.0639, -2.4100, -2.3559, -2.5464, -1.7501, -1.4941, -2.4159, -1.7506, -2.0233, -1.2545, -0.9876, -1.3632, -1.3129, -0.9588]], [[ -0.4871, -5.4468, -4.8588, -4.7713, -4.7152, -3.8496, -3.8303, -4.4064, -3.7886, -3.9084, -3.1404, -3.1212, -3.2555, -2.8425, -2.5568]]]]) attn_weights tensor([[[[ 5.2124, -0.8772, -3.2299, -2.3819, -0.6992, -1.6665, -2.0669, -1.1166, -3.8079, -3.3818, -4.9179, -1.0148, -3.7058, -2.2055, 2.8173]], [[ -2.8793, -6.3480, -5.6066, -6.1948, -5.9949, -8.6133, -7.6166, -3.9909, -3.4562, -4.1723, -5.4565, -4.1372, -6.0393, -6.0362, -4.5374]], [[ -4.6740, -12.0159, -11.7958, -11.2725, -9.0448, -10.4942, -9.8444, -9.3408, -7.7785, -7.3890, -5.2590, -3.3019, -3.7961, -5.2152, -6.0843]], [[ -4.8924, -14.3568, -17.5810, -17.7858, -14.6355, -10.7473, -10.4660, -10.4145, -12.4925, -13.4155, -8.1751, -8.1167, -7.6735, -4.6386, -5.6888]], [[ 1.3310, -3.1587, -3.9738, -3.8130, -3.2601, -3.1335, -2.9735, -2.9570, -3.8416, -4.2975, -3.5736, -3.0740, -3.6174, -3.2889, -2.8962]], [[ -0.0769, -3.6994, -4.1949, -3.7977, -3.1620, -2.2899, -2.8825, -3.5064, -3.9977, -3.8055, -2.8744, -2.6040, -1.8061, -2.0453, -2.8116]], [[ -3.7092, -9.0442, -7.4060, -9.1938, -8.4270, -7.6246, -8.8948, -6.1914, -4.6747, -6.6663, -5.5415, -4.4850, -4.4974, -4.0434, -4.3451]], [[ -6.1122, -15.0609, -16.4182, -16.0167, -15.0294, -10.7850, -9.3939, -9.7607, -11.3992, -11.2042, -9.1114, -6.9127, -7.1238, -3.9619, -6.7030]], [[ -4.5700, -9.8226, -11.4258, -10.6894, -11.0333, -11.1107, -10.2588, -7.4602, -8.2026, -7.5567, -5.5130, -6.4381, -7.5881, -6.1764, -4.9520]], [[ -2.3126, -7.1489, -6.2359, -6.0307, -5.4445, -7.3677, -5.3680, -4.4816, -3.6442, -4.1612, -2.5775, -3.2550, -3.6269, -4.0700, -5.6924]], [[ -1.1686, -6.7888, -6.8695, -7.9150, -6.4263, -5.3758, -5.2421, -4.5735, -5.5765, -6.6811, -4.6922, -3.7493, -3.5832, -3.2505, -2.0171]], [[ -3.0366, -7.6539, -8.7330, -7.7795, -7.3464, -6.7437, -5.8356, -4.8067, -5.9622, -5.5912, -3.4452, -4.5294, -1.7939, -4.3344, -3.8230]]], [[[ 5.3512, -1.3097, -2.9657, -2.6648, -0.0949, -0.1461, -3.6056, -1.0140, -0.9724, -3.3897, -3.5542, -5.6278, -2.2257, -1.5050, 2.0860]], [[ -2.7942, -6.8887, -5.9606, -7.1789, -7.2790, -8.0911, -7.9116, -3.9476, -4.0284, -3.6205, -4.6140, -5.6850, -4.8430, -4.8127, -4.7624]], [[ -4.7667, -11.4534, -11.1068, -10.3895, -9.2054, -10.6582, -11.1603, -8.8445, -8.2800, -6.9352, -6.1276, -6.1516, -4.1791, -2.8843, -5.1174]], [[ -5.4506, -14.2554, -17.3742, -15.1205, -13.7776, -11.8065, -14.6284, -9.5960, -10.3808, -12.5802, -10.0896, -7.6879, -5.2951, -4.8512, -6.3434]], [[ 1.4862, -3.7106, -4.3658, -3.3428, -3.7101, -3.9381, -3.6701, -2.9001, -2.9110, -3.8001, -3.1966, -4.5722, -3.9099, -3.8339, -4.1513]], [[ 0.1166, -3.4015, -4.6620, -4.0579, -3.7095, -2.9518, -3.0655, -3.8188, -3.6421, -4.2544, -4.0950, -3.6235, -3.0079, -2.9313, -3.4422]], [[ -3.5171, -8.6034, -5.9573, -6.9410, -7.6446, -6.1702, -7.1425, -6.0919, -5.1859, -3.2877, -4.4303, -3.9901, -3.4347, -3.5893, -4.0285]], [[ -6.5466, -13.2872, -12.8308, -12.8368, -12.7103, -9.6736, -10.2043, -9.2807, -9.9470, -8.0597, -8.2204, -6.9670, -7.1435, -5.0641, -6.6398]], [[ -4.2570, -10.4168, -11.0260, -10.7445, -10.2364, -11.5992, -10.0083, -6.6504, -6.4521, -7.4131, -6.5913, -6.5976, -3.5039, -3.9898, -5.4702]], [[ -1.8433, -6.5613, -6.3528, -6.4861, -5.3050, -5.6226, -5.7420, -4.3105, -4.9161, -4.3453, -4.3321, -3.9324, -1.5514, -0.0250, -4.1380]], [[ -1.0729, -6.0683, -5.7200, -6.1566, -4.9063, -4.6850, -5.7982, -4.9061, -5.1817, -4.9254, -5.0255, -3.9065, -4.3615, -3.2197, -2.4144]], [[ -2.6378, -7.0105, -7.4334, -7.7151, -5.3435, -6.4877, -6.1984, -5.2471, -4.7400, -4.5340, -5.2961, -2.0847, -3.2081, -3.9999, -3.5090]]], [[[ 4.9314, -1.2400, -2.8506, -2.2985, -0.4796, -2.2186, -2.4263, -1.7420, -2.6619, -3.4387, -4.4642, -3.7036, -3.6872, -2.0439, -2.6300]], [[ -2.6937, -6.6167, -6.2949, -7.5857, -6.7229, -7.2331, -7.5846, -4.3899, -5.1284, -4.0192, -5.7323, -5.1547, -5.0385, -4.6229, -5.0941]], [[ -4.5315, -12.1849, -11.7255, -8.8954, -7.9662, -10.2146, -10.5287, -8.7271, -8.1007, -6.7726, -5.3967, -5.0242, -3.0029, -1.8407, -5.2840]], [[ -5.6905, -14.4392, -18.1370, -14.9777, -14.7939, -12.2443, -11.3310, -10.4145, -14.2797, -12.3769, -8.6543, -9.1267, -7.1864, -3.6721, -6.5255]], [[ 1.7347, -4.0392, -4.7890, -4.4873, -3.7632, -3.1868, -3.8331, -3.5993, -4.2563, -4.7392, -5.3061, -4.5981, -4.4786, -5.1696, -4.7048]], [[ 0.1270, -3.5421, -4.5771, -4.2221, -3.8462, -2.6774, -2.8843, -3.8208, -4.8727, -3.9911, -3.6869, -4.1881, -2.7905, -3.1048, -3.3428]], [[ -3.4119, -9.0988, -6.9634, -8.3048, -8.4544, -6.6024, -6.8637, -5.5538, -5.6988, -2.5851, -5.4957, -4.9776, -3.8240, -3.4945, -4.2532]], [[ -6.4544, -13.9628, -14.2636, -13.1353, -13.6176, -9.3598, -10.0089, -9.4917, -10.8694, -8.8991, -7.8463, -8.3765, -5.4305, -6.0734, -6.5734]], [[ -4.5894, -10.3403, -11.0937, -9.4036, -11.5768, -9.8717, -9.7630, -6.7844, -8.4337, -6.6817, -5.6512, -6.3120, -3.3372, -5.2884, -5.0296]], [[ -1.9942, -6.7646, -6.7215, -6.1639, -5.2844, -6.2799, -5.2307, -4.0650, -6.4070, -4.5751, -4.3362, -4.7313, -1.4419, -5.2008, -3.7923]], [[ -1.0283, -6.8793, -6.7378, -7.7024, -6.4920, -5.4394, -5.7709, -4.9671, -6.3782, -5.4122, -7.0824, -5.5287, -4.4759, -2.8521, -2.7053]], [[ -2.9177, -7.5261, -9.1067, -8.5937, -6.1558, -6.6018, -7.2326, -5.3886, -7.3130, -6.0911, -3.8081, -2.7970, -3.5410, -1.2218, -4.1294]]], [[[ 4.4960, -1.1854, -2.6808, -1.6279, -1.1509, -5.3198, -5.8042, -1.6997, -1.9899, -5.6508, -6.1932, -3.2405, -1.7811, -2.2131, 0.9079]], [[ -2.9347, -7.3406, -7.1156, -9.0190, -8.4278, -7.7693, -8.3970, -5.4632, -6.1346, -7.4692, -7.2018, -4.7886, -4.5071, -5.2452, -4.9504]], [[ -4.5178, -10.4906, -11.5739, -11.7797, -8.4224, -9.8412, -11.0364, -8.5133, -7.1007, -8.5599, -8.7048, -6.9312, -5.2613, -5.2068, -6.9693]], [[ -5.0269, -13.6137, -14.9654, -13.6986, -13.1218, -14.2477, -14.7620, -11.1499, -11.5685, -12.6989, -11.6531, -7.4625, -6.5331, -6.0146, -8.1263]], [[ 1.3200, -3.5927, -3.6178, -2.5328, -3.0673, -4.0524, -3.7192, -3.2426, -3.0524, -4.6417, -4.2621, -3.2026, -3.4920, -2.6447, -4.2252]], [[ -0.1094, -3.4551, -3.8498, -2.6188, -2.0971, -2.3476, -3.0109, -3.5208, -2.5634, -3.3435, -3.2119, -3.8057, -2.7307, -2.6042, -2.2413]], [[ -3.2605, -9.3498, -7.0725, -9.2885, -8.9843, -6.7653, -8.0708, -6.6420, -6.5020, -5.3450, -5.8882, -5.2276, -2.9352, -4.4282, -5.4760]], [[ -5.8782, -13.4100, -14.2099, -14.0620, -11.8309, -10.3543, -10.2814, -9.7462, -9.8271, -8.3400, -8.0204, -6.9855, -5.8959, -6.6922, -7.8052]], [[ -4.1168, -9.5805, -11.0134, -11.6667, -11.7323, -10.3922, -10.2275, -7.2804, -9.8468, -8.5197, -8.4993, -5.6854, -6.7260, -5.8367, -7.2195]], [[ -1.4922, -6.8633, -7.1494, -5.8043, -6.7692, -5.9970, -5.6572, -5.7552, -5.4701, -6.0820, -4.8684, -6.1097, -3.4297, -2.2713, -3.9488]], [[ -1.0194, -5.3907, -6.0658, -5.6898, -3.9427, -4.6162, -5.5693, -4.9359, -4.5801, -4.9699, -5.2208, -5.0182, -3.6872, -4.1972, -3.8473]], [[ -2.2985, -7.4667, -8.0473, -7.1740, -5.3322, -6.4838, -8.3758, -6.4222, -4.6976, -6.4834, -7.6643, -4.0612, -4.1301, -3.6703, -3.7917]]], [[[ 4.5911, 0.6003, -2.5471, -1.0697, -0.2732, -4.4556, -4.5421, -0.8794, -2.9947, -1.7986, -3.9910, -5.8818, -0.7385, 1.8823, 1.9128]], [[ -2.3303, -5.1049, -5.5989, -5.8812, -7.6556, -8.3917, -8.0361, -5.3183, -7.2743, -6.7722, -8.1645, -7.1554, -3.1228, -3.5992, -3.6280]], [[ -4.5211, -6.0243, -7.1407, -8.0437, -7.1964, -7.7118, -8.6652, -5.6069, -6.7504, -5.9228, -7.5088, -6.6311, -4.5039, -4.1027, -4.5370]], [[ -4.9593, -11.7316, -13.0196, -12.9388, -12.8064, -11.3989, -10.9132, -11.1816, -12.4762, -11.0365, -9.4383, -9.2833, -6.6265, -7.0617, -7.5889]], [[ 0.9668, -2.1745, -3.6763, -4.6601, -3.1846, -4.4013, -3.4372, -3.0261, -3.1798, -3.3089, -3.5627, -4.2084, -2.3999, -2.0175, -1.4749]], [[ -0.3826, -1.5292, -1.1166, -1.2579, -1.4715, -2.6168, -3.1196, -2.5266, -2.6071, -2.7564, -3.6785, -4.8809, -2.5513, -3.1684, -3.5382]], [[ -3.1267, -6.4283, -5.1972, -5.9180, -5.3955, -4.8861, -5.1445, -6.4991, -5.1715, -5.0233, -4.7778, -4.9243, -4.7426, -4.0307, -4.2189]], [[ -5.6251, -10.3613, -9.8566, -9.6897, -9.7604, -9.0826, -8.4974, -8.3842, -6.9663, -7.9718, -6.7645, -6.6036, -5.6258, -6.8996, -6.7211]], [[ -3.6451, -7.7565, -8.3866, -8.4837, -9.5478, -9.2059, -7.9413, -5.4696, -6.4578, -7.7884, -7.3589, -6.4172, -2.7096, -3.8995, -4.1390]], [[ -1.5512, -3.4641, -4.7914, -4.6018, -5.9990, -5.2374, -7.0650, -4.3009, -4.6573, -6.5051, -8.1026, -7.2368, -3.1318, -5.1572, -4.3081]], [[ -0.9912, -5.3769, -4.9507, -5.4305, -5.0598, -4.3203, -5.0612, -4.8346, -4.9526, -4.3475, -4.0711, -3.8734, -3.4783, -3.0894, -2.9457]], [[ -2.1581, -6.0110, -6.7442, -5.6908, -5.3527, -4.3651, -5.3686, -5.9737, -3.8361, -4.9792, -6.0611, -6.2547, -4.6321, -2.4981, -3.1336]]]]) attn_weights tensor([[[[-3.7813e+00, -9.2428e+00, -8.4033e+00, -7.4219e+00, -7.5129e+00, -9.5555e+00, -7.5709e+00, -6.3651e+00, -5.9977e+00, -5.2849e+00, -1.8435e+00, -3.7715e+00, -4.8536e+00, -5.9157e+00, -4.9231e+00]], [[-2.9865e+00, -7.6029e+00, -6.7581e+00, -7.6308e+00, -7.2746e+00, -5.6226e+00, -5.4902e+00, -4.0915e+00, -4.4028e+00, -5.3954e+00, -5.9329e+00, -5.3377e+00, -5.1739e+00, -3.1987e+00, -5.0619e+00]], [[-3.6284e-01, -2.8304e+00, -3.1482e+00, -3.4463e+00, -3.1691e+00, -4.6276e+00, -4.0585e+00, -2.9701e+00, -3.2587e+00, -3.6311e+00, -2.7205e+00, -3.3174e+00, -3.1218e+00, -4.4728e+00, -3.7863e+00]], [[-2.7711e+00, -6.8492e+00, -5.5881e+00, -5.7035e+00, -5.8829e+00, -3.5724e+00, -3.4274e+00, -4.2131e+00, -3.6108e+00, -3.8853e+00, -3.1515e+00, -2.7958e+00, -2.4184e+00, -2.4390e-01, -2.9918e+00]], [[ 1.4699e+00, -2.6418e+00, -2.7923e+00, -3.7447e+00, -1.8855e+00, -9.3888e-01, -2.2499e+00, -2.3516e+00, -3.2056e+00, -4.3535e+00, -1.9024e+00, -1.6300e+00, -6.8431e-01, -9.1752e-01, -1.0748e+00]], [[-2.8136e+00, -7.7023e+00, -7.7348e+00, -7.4650e+00, -7.8726e+00, -7.0955e+00, -5.8827e+00, -4.7430e+00, -5.2903e+00, -5.7486e+00, -5.5479e+00, -4.0344e+00, -2.7023e+00, -4.5001e+00, -4.5675e+00]], [[-2.1203e+00, -6.1776e+00, -6.4621e+00, -6.5191e+00, -5.7573e+00, -5.6333e+00, -5.3562e+00, -5.3531e+00, -5.2268e+00, -5.3479e+00, -4.5530e+00, -4.6066e+00, -4.0786e+00, -3.8531e+00, -4.2632e+00]], [[ 1.0057e-01, -4.6550e+00, -4.0219e+00, -3.7143e+00, -3.7533e+00, -2.5703e+00, -1.7191e-01, -6.6373e-01, -3.0941e+00, -3.0613e+00, -2.0389e+00, -1.3466e+00, -1.4124e+00, -2.1475e-01, 1.5096e+00]], [[ 1.7986e+00, -4.1760e+00, -3.7678e+00, -3.1693e+00, -2.7933e+00, -3.1236e+00, -2.3200e+00, -2.3147e+00, -3.1203e+00, -2.7907e+00, -3.0320e+00, -1.8854e+00, -1.5034e+00, -2.5690e+00, -1.1258e+00]], [[-1.6696e+00, -4.6262e+00, -3.7746e+00, -4.3712e+00, -2.8016e+00, -5.5371e+00, -3.4793e+00, -3.4330e+00, -2.1133e+00, -3.3128e+00, -1.4835e+00, -1.6051e+00, -1.9634e+00, -4.5555e+00, -2.9237e+00]], [[ 1.1779e+00, -2.8961e+00, -2.7020e+00, -4.3629e+00, -3.2699e+00, -3.8047e+00, -2.0941e+00, -3.3174e+00, -2.5204e+00, -4.4141e+00, -3.7462e+00, -2.8087e+00, -3.3099e+00, -3.4384e+00, -2.4532e+00]], [[-6.2280e+00, -3.1780e+01, -3.2614e+01, -3.5521e+01, -3.6661e+01, -5.9677e+00, 2.2758e+00, -1.2359e+01, -1.7020e+01, -2.0342e+01, -8.7407e+00, -1.2573e+01, -6.6125e+00, 1.8445e+01, 2.0649e+00]]], [[[-2.3106e+00, -1.0771e+01, -9.9320e+00, -9.6450e+00, -8.2424e+00, -8.8418e+00, -8.5562e+00, -8.1082e+00, -7.1048e+00, -7.2559e+00, -6.7285e+00, -7.7889e+00, -5.4425e+00, -1.6719e+00, -6.1571e+00]], [[-2.7703e+00, -6.8843e+00, -6.8495e+00, -5.8895e+00, -6.9615e+00, -4.7843e+00, -6.5959e+00, -3.8446e+00, -3.0350e+00, -3.5973e+00, -3.1648e+00, 2.1299e-02, -2.5515e+00, -2.2087e+00, -4.9653e+00]], [[ 1.0819e-01, -3.3714e+00, -3.5191e+00, -4.2214e+00, -4.6379e+00, -4.3123e+00, -3.4373e+00, -3.7157e+00, -3.6247e+00, -3.8212e+00, -4.2988e+00, -3.9250e+00, -3.4792e+00, -3.4249e+00, -2.0554e+00]], [[-2.3539e+00, -5.8498e+00, -4.5587e+00, -4.2857e+00, -5.8998e+00, -3.7397e+00, -4.5041e+00, -5.6084e+00, -4.5188e+00, -2.4292e+00, -2.8267e+00, -4.1056e+00, -4.1398e+00, -3.5103e+00, -5.0371e+00]], [[ 1.5764e+00, -3.7200e+00, -3.1068e+00, -2.9744e+00, -1.8695e+00, -3.8910e+00, -4.2603e+00, -3.1161e+00, -4.0222e+00, -3.0515e+00, -3.1854e+00, -3.4074e+00, -3.4976e+00, -1.0847e+00, -4.1325e-01]], [[-2.1251e+00, -7.9338e+00, -8.7386e+00, -9.4631e+00, -6.5862e+00, -7.6265e+00, -8.5638e+00, -6.9500e+00, -5.3161e+00, -6.5445e+00, -7.8794e+00, -5.3717e+00, -5.3166e+00, -6.5688e+00, -4.3560e+00]], [[-1.9829e+00, -6.2424e+00, -6.4783e+00, -6.4054e+00, -5.9042e+00, -5.0650e+00, -4.7938e+00, -5.6520e+00, -4.7878e+00, -5.4669e+00, -5.1793e+00, -4.3332e+00, -4.8046e+00, -4.6832e+00, -4.6636e+00]], [[ 6.3736e-01, -5.5257e+00, -4.4887e+00, -3.8279e+00, -1.9113e+00, -2.0010e+00, -2.5566e+00, -3.1596e+00, -2.3594e+00, -3.0532e+00, -2.7148e+00, -9.2570e-01, -1.8816e-01, 6.5471e-01, 1.0465e+00]], [[ 2.0363e+00, -4.3271e+00, -3.3198e+00, -3.8010e+00, -2.8266e+00, -2.2492e+00, -1.4799e+00, -3.1679e+00, -2.3338e+00, -3.4256e+00, -4.4808e+00, -3.0977e+00, -2.3005e+00, -1.9555e+00, -1.7175e+00]], [[-1.0814e+00, -4.6287e+00, -4.6253e+00, -4.1234e+00, -4.3543e+00, -4.1241e+00, -2.8448e+00, -3.6231e+00, -3.4545e+00, -2.7077e+00, -2.7995e+00, -1.7296e+00, -1.4118e+00, -1.3195e+00, -2.4762e+00]], [[ 1.5270e+00, -3.1706e+00, -3.8717e+00, -3.6156e+00, -4.2101e+00, -4.3492e+00, -3.7206e+00, -2.5559e+00, -1.9605e+00, -3.9075e+00, -4.0466e+00, -4.5067e+00, -2.8950e+00, -3.1657e+00, -3.1309e+00]], [[-4.1645e+00, -2.6804e+01, -3.2592e+01, -1.6946e+01, -1.6869e+01, -2.1636e+01, -2.3278e+01, -1.6767e+01, -2.1548e+01, -2.3574e+01, -6.9976e+00, -8.9402e-01, 1.6008e+00, 1.5532e+01, 1.3750e+00]]], [[[-3.3528e+00, -1.0531e+01, -9.4492e+00, -8.1281e+00, -8.3323e+00, -8.1411e+00, -7.8773e+00, -6.8586e+00, -8.9676e+00, -6.3888e+00, -5.5160e+00, -3.5217e+00, -8.2063e-01, -3.7473e+00, -5.6509e+00]], [[-2.6174e+00, -7.4541e+00, -7.3195e+00, -7.4319e+00, -7.4873e+00, -2.2955e+00, -4.3644e+00, -3.6747e+00, -6.1369e+00, -3.3608e+00, -3.8579e+00, -3.5313e+00, -4.4171e+00, -1.8656e+00, -4.6013e+00]], [[ 2.2420e-01, -2.8740e+00, -4.0522e+00, -3.7142e+00, -4.2617e+00, -5.2198e+00, -4.5886e+00, -3.5258e+00, -3.3101e+00, -4.3256e+00, -4.0889e+00, -3.8005e+00, -2.3396e+00, -4.2854e+00, -5.2965e+00]], [[-2.0172e+00, -6.1550e+00, -5.8999e+00, -4.8298e+00, -6.2661e+00, -5.7268e+00, -4.6880e+00, -5.3364e+00, -5.2154e+00, -3.4209e+00, -2.8839e+00, -3.8996e+00, -3.1435e+00, -2.6794e+00, -3.4967e+00]], [[ 1.5078e+00, -3.7317e+00, -2.2357e+00, -4.0420e+00, -3.0038e+00, -5.0336e+00, -5.4955e+00, -2.6875e+00, -3.3252e+00, -2.1993e+00, -2.8944e+00, -1.9896e+00, -2.7967e+00, -1.5046e+00, -1.5614e+00]], [[-2.0851e+00, -7.8218e+00, -8.6433e+00, -7.2817e+00, -6.9746e+00, -7.2332e+00, -7.7511e+00, -5.6788e+00, -7.5485e+00, -5.2881e+00, -5.1805e+00, -5.2543e+00, -2.8695e+00, -8.4506e-01, -4.0624e+00]], [[-1.8345e+00, -5.8582e+00, -5.9906e+00, -5.6999e+00, -5.9653e+00, -5.1895e+00, -5.5818e+00, -5.3607e+00, -5.2143e+00, -4.7752e+00, -4.9671e+00, -4.4896e+00, -3.5492e+00, -3.6431e+00, -4.2077e+00]], [[ 9.5069e-01, -3.9722e+00, -4.2346e+00, -4.0397e+00, -4.1422e+00, -1.9134e+00, -3.4993e+00, -3.5196e+00, -3.9632e+00, -2.9353e+00, -3.3096e+00, -3.1393e+00, -3.4192e-01, 9.4650e-01, 1.8815e+00]], [[ 1.9897e+00, -4.1439e+00, -4.3657e+00, -4.3223e+00, -3.2528e+00, -2.5307e+00, -2.1848e+00, -2.9176e+00, -2.6220e+00, -4.0696e+00, -4.6509e+00, -2.2832e+00, -1.9451e+00, -1.6159e+00, -2.8242e+00]], [[-9.5523e-01, -5.5713e+00, -4.9744e+00, -5.0082e+00, -4.1558e+00, -3.8710e+00, -4.5241e+00, -5.4591e+00, -4.5539e+00, -3.0433e+00, -2.3151e+00, -1.0602e+00, -1.0422e+00, -2.2373e+00, -3.7135e+00]], [[ 1.6550e+00, -3.3883e+00, -3.4390e+00, -3.5598e+00, -3.7417e+00, -3.5416e+00, -3.1662e+00, -2.4312e+00, -2.4529e+00, -2.8444e+00, -4.6047e+00, -3.1692e+00, -2.9906e+00, -3.5720e+00, -3.3498e+00]], [[-4.8430e+00, -2.9226e+01, -3.4640e+01, -3.2233e+01, -2.9672e+01, -1.4253e+01, -2.0990e+01, -2.4695e+01, -1.6807e+01, -1.9487e+01, -1.2194e+01, -5.5831e+00, 1.2088e+00, 1.9081e+01, 7.7835e+00]]], [[[-2.0937e+00, -9.2317e+00, -9.4362e+00, -8.9312e+00, -7.8214e+00, -8.6707e+00, -7.3342e+00, -7.1228e+00, -6.4499e+00, -6.6600e+00, -7.0620e+00, -6.1147e+00, -4.6097e+00, -3.7901e+00, -5.8001e+00]], [[-2.4855e+00, -6.6255e+00, -7.2896e+00, -7.9685e+00, -7.2191e+00, -5.5000e+00, -7.6286e+00, -4.0204e+00, -5.3145e+00, -5.7332e+00, -6.7944e+00, -3.4699e+00, -2.7979e+00, -3.6271e+00, -3.8710e+00]], [[-3.0876e-01, -1.6892e+00, -2.5568e+00, -3.5292e+00, -4.1637e+00, -4.2067e+00, -2.2813e+00, -2.1440e+00, -4.6497e+00, -4.0791e+00, -2.9947e+00, -1.2642e+00, -2.7690e+00, -2.7860e+00, -2.5215e+00]], [[-2.0881e+00, -7.5538e+00, -6.8589e+00, -5.8354e+00, -5.5248e+00, -2.6552e+00, -3.3165e+00, -5.2687e+00, -4.8228e+00, -3.3074e+00, -2.9030e+00, -5.1356e+00, -1.7135e+00, -2.2892e+00, -3.3549e+00]], [[ 1.5351e+00, -2.7980e+00, -2.8736e+00, -2.4531e+00, -2.6928e+00, -3.1237e+00, -3.7680e+00, -2.6395e+00, -2.6018e+00, -4.7674e+00, -3.3383e+00, -2.9024e+00, -3.8858e-01, -1.4199e+00, -4.4986e-01]], [[-1.8557e+00, -7.8906e+00, -8.1655e+00, -8.5902e+00, -7.4083e+00, -8.6355e+00, -8.5205e+00, -6.7819e+00, -6.1304e+00, -7.9491e+00, -7.8297e+00, -4.4157e+00, -4.0652e+00, -4.0107e+00, -5.4291e+00]], [[-2.0466e+00, -6.3356e+00, -6.6097e+00, -6.6357e+00, -5.7435e+00, -5.4715e+00, -4.5403e+00, -5.4542e+00, -5.6168e+00, -4.5766e+00, -4.4253e+00, -4.3365e+00, -4.3111e+00, -4.1808e+00, -4.5131e+00]], [[ 8.5409e-01, -6.2276e+00, -4.7084e+00, -3.3632e+00, -2.5062e+00, -3.5872e+00, -4.1844e+00, -3.8663e+00, -3.6302e+00, -2.8607e+00, -4.1650e+00, -1.3741e+00, -1.0867e+00, -4.6917e-01, 8.2569e-01]], [[ 1.6136e+00, -3.3483e+00, -3.1880e+00, -2.9401e+00, -2.1183e+00, -3.0537e+00, -1.3441e+00, -2.6022e+00, -2.1296e+00, -2.7658e+00, -2.0881e+00, -2.3099e+00, -2.0651e+00, -2.1731e+00, -2.2106e+00]], [[-8.2219e-01, -4.3750e+00, -5.4896e+00, -5.3278e+00, -4.1830e+00, -4.1563e+00, -3.3184e+00, -3.5126e+00, -5.7900e+00, -4.3409e+00, -4.3367e+00, -4.7295e+00, -2.4992e+00, -3.0196e+00, -2.4821e+00]], [[ 1.3876e+00, -2.1941e+00, -2.5016e+00, -2.8876e+00, -2.9794e+00, -3.9380e+00, -4.0189e+00, -2.0544e+00, -2.4101e+00, -5.7576e+00, -5.0961e+00, -1.6220e+00, -2.0529e+00, -2.6711e+00, -3.4525e+00]], [[-7.9640e+00, -3.0528e+01, -2.5827e+01, -9.6765e+00, -1.4900e+01, -1.5594e+01, -1.6410e+01, -1.3583e+01, -1.2439e+01, -1.6557e+01, -1.1977e+01, -4.7695e+00, 2.2228e-01, 1.3243e+01, 5.9883e+00]]], [[[-2.8798e+00, -6.3324e+00, -6.8843e+00, -6.4125e+00, -7.1968e+00, -7.1539e+00, -6.8806e+00, -6.6208e+00, -6.5094e+00, -6.7463e+00, -7.7538e+00, -7.4320e+00, -4.4444e+00, -2.1034e+00, -4.7532e+00]], [[-1.4635e+00, -6.3791e+00, -8.3991e+00, -7.3584e+00, -8.9360e+00, -8.8052e+00, -7.9463e+00, -6.1457e+00, -6.2324e+00, -8.4136e+00, -8.3561e+00, -7.6376e+00, -3.7858e+00, -4.1690e+00, -4.0626e+00]], [[ 4.3584e-01, -1.8294e+00, -2.6367e+00, -2.5467e+00, -3.0699e+00, -4.8389e+00, -4.3791e+00, -3.0772e+00, -3.0363e+00, -4.5448e+00, -5.3367e+00, -5.3218e+00, -1.9433e+00, -2.5823e+00, -2.0297e+00]], [[-1.2146e+00, -6.5642e+00, -6.7013e+00, -5.5335e+00, -5.9440e+00, -5.4829e+00, -4.3393e+00, -6.0698e+00, -7.3555e+00, -7.5999e+00, -6.8188e+00, -5.5866e+00, -5.9407e+00, -4.5761e+00, -4.3397e+00]], [[ 1.5155e+00, -2.5582e+00, -3.1548e+00, -2.3865e+00, -2.4194e+00, -3.3785e+00, -2.8776e+00, -3.4145e+00, -4.9594e+00, -2.9051e+00, -3.7372e+00, -2.3506e+00, -2.3894e+00, -3.0985e-01, -1.4389e-01]], [[-1.6528e+00, -7.6341e+00, -7.2482e+00, -7.3084e+00, -7.9106e+00, -8.3754e+00, -9.5299e+00, -8.4562e+00, -7.1424e+00, -7.5218e+00, -7.6636e+00, -1.0018e+01, -4.8101e+00, -5.5769e+00, -4.4547e+00]], [[-2.1497e+00, -3.8063e+00, -4.7589e+00, -4.5138e+00, -4.0326e+00, -4.2348e+00, -4.4781e+00, -4.1667e+00, -4.4000e+00, -4.8773e+00, -4.0733e+00, -4.6672e+00, -3.4409e+00, -3.7357e+00, -3.5551e+00]], [[ 1.1991e+00, -5.9213e+00, -3.3485e+00, -1.2863e+00, -2.8261e+00, -3.3473e+00, -2.6381e+00, -2.9435e+00, -2.6875e+00, -3.9874e+00, -4.0410e+00, -3.0740e+00, 7.9789e-01, 1.1712e+00, 3.5663e+00]], [[ 9.7895e-01, -2.5298e+00, -2.5237e+00, -2.3564e+00, -2.1675e+00, -2.3910e+00, -1.9391e+00, -2.3213e+00, -1.7256e+00, -2.6496e+00, -3.2733e+00, -3.8564e+00, -1.5807e+00, -1.9386e+00, -1.6759e+00]], [[-1.0265e+00, -3.1155e+00, -3.8837e+00, -3.8211e+00, -4.5779e+00, -5.5772e+00, -4.4743e+00, -3.5335e+00, -4.6088e+00, -5.1151e+00, -5.9224e+00, -5.9677e+00, -4.0145e+00, -4.6881e+00, -4.9285e+00]], [[ 1.4809e+00, -2.2369e+00, -1.9956e+00, -2.7768e+00, -2.6486e+00, -3.7183e+00, -2.4333e+00, -2.0459e+00, -3.2983e+00, -2.1007e+00, -3.7494e+00, -3.7800e+00, -1.2634e+00, -1.3910e+00, -9.4411e-01]], [[-9.0108e+00, -1.7443e+01, -2.0947e+01, -2.0882e+01, -2.5047e+01, -2.1681e+01, -2.2955e+01, -1.1137e+01, -1.4535e+01, -2.1046e+01, -1.8364e+01, -2.2183e+01, 1.6831e+00, 3.0993e+00, 4.0331e+00]]]]) attn_weights tensor([[[[ 2.1023e+00, -6.0258e+00, -6.8866e+00, -5.0946e+00, -5.3335e+00, -3.4136e+00, -2.8287e+00, -1.1830e+00, -3.5997e+00, -3.7443e+00, -4.3421e+00, -3.7496e+00, -2.6597e+00, -1.9276e+00, -2.5419e+00]], [[ 4.1688e+00, -1.0452e+01, -8.7312e+00, -1.0350e+01, -9.0412e+00, -5.4723e+00, -7.3099e+00, -7.1332e+00, -5.9736e+00, -9.8143e+00, -8.6394e+00, -9.7378e+00, -7.1930e+00, -5.9868e+00, -5.5512e+00]], [[ 1.0484e-01, -4.4926e+00, -4.5020e+00, -5.2251e+00, -3.7175e+00, -2.4706e+00, -3.1866e+00, -4.6575e+00, -3.6458e+00, -4.0642e+00, -2.5290e+00, -2.1013e+00, -1.9639e+00, -1.1150e+00, -3.2292e+00]], [[-3.6210e-01, -1.3658e+00, -1.9029e+00, -1.7720e+00, -1.7958e+00, -2.5810e+00, -2.4942e+00, -1.3292e+00, -5.7185e-01, -1.1010e+00, 3.0931e-01, -1.1477e+00, -1.2208e+00, -2.2284e+00, -1.9522e+00]], [[-2.8916e-01, -5.0767e+00, -4.6405e+00, -5.4273e+00, -5.0406e+00, -2.5882e+00, -3.0808e+00, -2.3038e+00, -2.6225e+00, -3.5971e+00, -2.4433e+00, -1.3348e+00, -8.2685e-01, 1.4009e-01, -1.6911e+00]], [[ 1.4476e+00, -6.5872e+00, -4.9521e+00, -6.6268e+00, -6.2841e+00, -3.0624e+00, -2.7270e+00, -1.3675e+00, -2.1278e+00, -5.2201e+00, -5.0191e+00, -5.1957e+00, -4.2081e+00, -3.2011e+00, -2.1684e+00]], [[ 1.9007e+00, -8.9514e+00, -8.4925e+00, -9.1110e+00, -9.7139e+00, -2.3024e+00, -4.3231e+00, -3.9709e+00, -5.0269e+00, -7.2335e+00, -6.4943e+00, -8.1554e+00, -4.9570e+00, 1.8959e-01, -3.4493e+00]], [[ 7.1602e-01, -4.5521e+00, -4.9720e+00, -6.1646e+00, -4.9851e+00, -3.0743e+00, -1.0224e+00, -3.0584e+00, -3.6069e+00, -4.6212e+00, -1.3526e+00, -1.4768e+00, -3.8625e-01, 1.9413e-01, -9.2211e-01]], [[ 2.5748e-01, -4.3243e+00, -4.7206e+00, -4.2721e+00, -4.9007e+00, -4.4694e+00, -4.4789e+00, -2.4075e+00, -3.1150e+00, -3.1638e+00, -5.2080e+00, -3.8616e+00, -3.2456e+00, -2.6331e+00, -2.9500e+00]], [[ 1.0974e+00, -3.8972e+00, -4.4931e+00, -3.9967e+00, -2.5394e+00, -2.2040e+00, -1.5687e+00, -1.8893e+00, -3.7927e+00, -4.3668e+00, -3.3901e+00, -3.1223e+00, -3.3623e+00, -2.2530e+00, -2.6045e+00]], [[ 2.0888e+00, -1.4607e+00, -1.5210e+00, -1.5687e+00, -9.7376e-01, 1.1995e+00, 1.4110e+00, 1.3219e-01, -9.3296e-01, -2.0204e+00, -1.6169e+00, 1.8907e-02, -3.8943e-01, 1.9299e+00, 7.3768e-01]], [[ 1.0351e+00, -3.6380e+00, -4.7737e+00, -4.5703e+00, -3.4885e+00, -2.8529e+00, -3.5920e+00, -2.5196e+00, -4.0726e+00, -4.0100e+00, -3.2971e+00, -1.9704e+00, -1.7031e+00, -2.2663e+00, -3.2896e-01]]], [[[ 2.6370e+00, -5.6776e+00, -4.1520e+00, -5.1464e+00, -5.4884e+00, -3.0356e+00, -1.6149e+00, -3.3416e+00, -3.4352e+00, -5.3787e+00, -6.3888e+00, -6.7770e+00, -5.7307e+00, -3.4979e+00, -1.3398e+00]], [[ 5.1222e+00, -1.3700e+01, -9.7368e+00, -1.1898e+01, -6.0322e+00, -3.1279e+00, -7.5492e+00, -1.2113e+01, -1.0525e+01, -8.0112e+00, -1.2191e+01, -6.1634e+00, -1.0453e+01, -8.1057e+00, -7.8871e-01]], [[ 3.4351e-01, -4.6304e+00, -4.3153e+00, -3.6698e+00, -4.6602e+00, -4.8444e+00, -5.1387e+00, -5.4055e+00, -5.0360e+00, -3.7740e+00, -2.7318e+00, -3.3888e+00, -2.8473e+00, -1.7572e+00, -3.7082e+00]], [[ 1.4340e-01, -2.2358e+00, -3.2064e+00, -2.3190e+00, -3.0155e+00, -2.6296e+00, -2.9546e+00, -1.9340e+00, -1.3871e+00, -1.6967e+00, -1.1345e+00, -4.5720e-01, 3.4497e-01, -2.0574e-01, -3.4394e+00]], [[-2.4508e-01, -5.7697e+00, -6.1801e+00, -5.1353e+00, -5.9109e+00, -4.4689e+00, -3.4330e+00, -4.6207e+00, -3.9167e+00, -4.5765e+00, -3.4263e+00, -3.0939e+00, -3.1698e+00, -9.7644e-01, -2.6204e+00]], [[ 2.1745e+00, -6.9170e+00, -5.5274e+00, -7.3458e+00, -4.8532e+00, -1.6961e+00, -3.4121e+00, -3.1845e+00, -3.3342e+00, -2.7551e+00, -6.5978e+00, -4.3697e+00, -8.7788e+00, -7.9383e+00, -2.9155e+00]], [[ 1.0434e+00, -6.0888e+00, -5.6391e+00, -3.7732e+00, -3.4188e+00, -3.3312e+00, -3.6507e+00, -3.9665e+00, -3.8984e+00, -3.3221e+00, -2.7498e+00, -7.8917e-01, -8.5988e-01, 5.1044e-01, -1.9621e+00]], [[ 1.1676e+00, -4.8408e+00, -6.3267e+00, -7.5863e+00, -5.2788e+00, -4.2153e+00, -1.8917e+00, -5.3156e+00, -4.3256e+00, -5.3577e+00, -6.3621e+00, -2.6407e+00, -2.1762e+00, -8.1950e-01, -1.0989e-01]], [[ 9.2901e-01, -5.8988e+00, -5.1929e+00, -6.3258e+00, -3.5261e+00, -1.0289e+00, -9.0030e-01, -1.1905e+00, -8.0324e-01, -3.0644e+00, -5.5623e+00, -2.4365e+00, -5.0863e+00, -5.3640e+00, -1.5507e+00]], [[ 1.3691e+00, -3.6689e+00, -5.1555e+00, -4.7962e+00, -3.7187e+00, -2.5338e+00, -2.1824e+00, -2.8060e+00, -3.4095e+00, -4.9922e+00, -5.4891e+00, -4.2746e+00, -3.9739e+00, -4.5810e+00, -4.0867e+00]], [[ 2.0584e+00, -1.0133e+00, -4.6494e-01, 1.6365e-01, -2.9551e-02, -6.6948e-01, 5.9375e-01, 1.1886e+00, -1.0901e+00, -3.6262e-01, -6.6732e-01, -1.2207e+00, -1.0376e+00, -3.9223e-01, -9.2667e-01]], [[ 1.3706e+00, -4.2312e+00, -4.9957e+00, -5.6746e+00, -3.3379e+00, -4.1208e+00, -4.9267e+00, -3.2910e+00, -3.5712e+00, -4.0859e+00, -4.8545e+00, -5.5852e+00, -3.8273e+00, -3.7332e+00, -1.0496e+00]]], [[[ 2.8115e+00, -7.4619e+00, -6.1822e+00, -6.2925e+00, -5.1091e+00, -4.3304e+00, -7.9677e+00, -5.5633e+00, -4.4952e+00, -4.7175e+00, -6.4800e+00, -7.1200e+00, -3.5940e+00, -3.2957e+00, -3.1768e+00]], [[ 5.6760e+00, -1.5392e+01, -8.9787e+00, -1.0020e+01, -8.5176e+00, -7.2589e+00, -1.6264e+01, -1.9079e+01, -1.1814e+01, -1.1790e+01, -1.3253e+01, -1.3034e+01, -8.0660e+00, -4.2929e+00, -1.5863e+00]], [[ 5.4148e-01, -4.8591e+00, -4.1841e+00, -4.4563e+00, -4.3535e+00, -5.8860e+00, -5.8427e+00, -6.2390e+00, -3.6608e+00, -3.5095e+00, -2.7078e+00, -1.8765e+00, -1.3057e+00, -8.5230e-01, -3.7033e+00]], [[-3.8637e-02, -2.7211e+00, -3.2970e+00, -3.7159e+00, -4.8481e+00, -3.1580e+00, -3.7021e+00, -3.0372e+00, -1.6308e+00, -2.0603e+00, -2.1408e+00, -2.9641e+00, -2.9007e+00, -3.1385e+00, -5.2401e+00]], [[ 1.7841e-01, -4.7629e+00, -5.8096e+00, -5.0992e+00, -6.1921e+00, -5.1367e+00, -4.5035e+00, -4.9375e+00, -6.1090e+00, -4.0994e+00, -3.6492e+00, -3.3021e+00, 3.8891e-01, -1.5700e+00, -1.4565e+00]], [[ 2.1766e+00, -1.0451e+01, -5.1761e+00, -5.0638e+00, -5.0758e+00, -1.5016e+00, -5.0163e+00, -4.6301e+00, -3.1503e+00, -4.8241e+00, -4.5872e+00, -6.6284e+00, -2.4319e+00, -2.9123e+00, -2.6240e+00]], [[ 1.7893e+00, -8.2728e+00, -7.8040e+00, -5.4967e+00, -5.7999e+00, -4.5845e+00, -7.3410e+00, -6.4168e+00, -6.0881e+00, -5.8934e+00, -4.6138e+00, -3.3178e+00, -1.1410e+00, 9.4357e-01, -1.5886e+00]], [[ 1.2037e+00, -5.3176e+00, -5.2881e+00, -6.1791e+00, -5.4561e+00, -3.9616e+00, -2.0510e+00, -3.0582e+00, -6.5849e+00, -4.4822e+00, -2.9449e+00, -2.9393e+00, 2.0534e+00, -1.4961e+00, -1.5415e+00]], [[ 1.0461e+00, -6.7636e+00, -4.4840e+00, -6.1440e+00, -4.7108e+00, -2.3525e+00, -3.1482e+00, -3.6899e+00, -3.5070e+00, -4.6856e+00, -6.2180e+00, -6.1770e+00, -2.6231e+00, -2.6224e+00, -2.4676e+00]], [[ 1.2416e+00, -3.4755e+00, -4.2355e+00, -4.1042e+00, -3.7585e+00, -3.1111e+00, -1.7938e+00, -2.9001e+00, -3.3276e+00, -4.3233e+00, -4.6189e+00, -4.7702e+00, -4.1516e+00, -4.1115e+00, -5.8702e+00]], [[ 1.8100e+00, -1.4980e+00, -3.0044e+00, -1.9910e+00, -2.1615e+00, -5.6932e-01, -4.3504e-01, 7.8760e-02, -2.4506e+00, -2.6781e+00, -2.1200e+00, -1.8766e+00, -1.1572e+00, -9.2145e-01, -2.5017e+00]], [[ 9.8060e-01, -5.1835e+00, -5.5986e+00, -4.9169e+00, -3.9764e+00, -3.9721e+00, -4.9518e+00, -4.1752e+00, -3.1647e+00, -4.7772e+00, -4.6091e+00, -3.9479e+00, -2.6052e+00, -2.6349e+00, -1.0132e+00]]], [[[ 2.1556e+00, -3.8473e+00, -6.1937e+00, -6.5493e+00, -3.4769e+00, -2.9658e+00, -3.8692e+00, -3.8313e+00, -4.7329e+00, -4.2767e+00, -3.7393e+00, -3.6711e+00, -3.3161e+00, -4.3595e+00, -2.5047e+00]], [[ 4.7657e+00, -1.0258e+01, -1.1720e+01, -1.2234e+01, -7.5187e+00, -6.2840e+00, -1.0372e+01, -1.2325e+01, -9.6057e+00, -8.4086e+00, -1.0127e+01, -8.8624e+00, -7.4643e+00, -6.9633e+00, -2.3343e+00]], [[ 6.4773e-01, -3.7283e+00, -4.3246e+00, -4.2338e+00, -4.9149e+00, -3.2884e+00, -3.9252e+00, -3.7721e+00, -4.0534e+00, -3.7671e+00, -3.5076e+00, -1.5027e+00, -1.4388e+00, -1.7616e+00, -2.1024e+00]], [[-1.7639e-01, -1.5416e+00, -2.7457e+00, -2.8725e+00, -3.3016e+00, -3.4532e+00, -3.5970e+00, -2.8011e+00, -3.1871e+00, -3.0194e+00, -3.2670e+00, -8.7000e-01, -6.0138e-01, -1.2868e+00, -2.0419e+00]], [[ 2.3089e-01, -6.3853e+00, -7.6300e+00, -7.7545e+00, -5.5705e+00, -4.4908e+00, -3.3265e+00, -3.7241e+00, -4.4806e+00, -4.1899e+00, -4.2163e+00, -2.9989e+00, -3.6389e+00, -3.6203e+00, -4.2012e+00]], [[ 1.7253e+00, -6.9396e+00, -4.7603e+00, -7.6557e+00, -5.5266e+00, -2.8975e+00, -3.7573e+00, -3.9049e+00, -2.7146e+00, -2.6004e+00, -4.3859e+00, -2.3882e+00, -2.2348e+00, -2.5120e+00, -1.2307e+00]], [[ 7.3092e-01, -6.9176e+00, -6.4472e+00, -5.7221e+00, -5.2612e+00, -3.6829e+00, -3.8922e+00, -5.1953e+00, -3.9157e+00, -3.8698e+00, -3.7844e+00, -2.7841e+00, -4.5117e-01, -1.6328e-01, -2.2449e+00]], [[ 1.1867e+00, -5.1193e+00, -6.3274e+00, -6.2421e+00, -4.9238e+00, -4.3132e+00, -2.3993e+00, -4.1743e+00, -4.1113e+00, -3.6600e+00, -2.6934e+00, -3.3878e+00, -4.5432e+00, -4.4205e+00, -3.0741e+00]], [[ 7.1975e-01, -5.1854e+00, -6.2159e+00, -8.5318e+00, -3.3792e+00, -1.8660e+00, -2.5456e+00, -2.3361e+00, -3.1314e+00, -2.0708e+00, -3.6032e+00, -1.4074e+00, -3.5236e+00, -4.9341e+00, -2.9291e+00]], [[ 9.4407e-01, -3.5609e+00, -3.2591e+00, -2.5086e+00, -1.8528e+00, -2.5790e+00, -1.9294e+00, -1.5045e+00, -2.6199e+00, -3.4556e+00, -3.2869e+00, -2.1379e+00, -2.5303e+00, -2.4026e+00, -2.3985e+00]], [[ 1.7325e+00, -1.7816e+00, -4.4090e+00, -2.7223e+00, -2.5295e+00, 2.4862e-02, 6.4243e-01, 5.0743e-01, -1.3242e+00, -2.0330e+00, -5.7532e-01, -5.9428e-01, -1.0984e+00, -8.6494e-01, -1.0811e+00]], [[ 1.0669e+00, -5.3006e+00, -4.5022e+00, -3.9266e+00, -3.6422e+00, -2.6330e+00, -4.2917e+00, -3.9726e+00, -4.0389e+00, -4.9673e+00, -3.7765e+00, -3.9352e+00, -2.0427e+00, -1.1357e+00, 2.0765e-01]]], [[[ 2.5367e+00, -2.3865e+00, -5.0839e+00, -3.9089e+00, -3.8548e+00, -2.5568e+00, -3.5330e+00, -4.4556e+00, -4.4740e+00, -5.1053e+00, -4.8624e+00, -5.0687e+00, -5.7242e+00, -3.2292e+00, -1.1832e+00]], [[ 3.7602e+00, -8.5842e+00, -7.6820e+00, -7.5464e+00, -7.1164e+00, -3.6710e+00, -9.0035e+00, -9.9630e+00, -6.1592e+00, -7.3705e+00, -5.8347e+00, -1.0143e+01, -9.2950e+00, -3.1121e+00, -6.9581e-01]], [[ 6.4202e-01, -1.8029e+00, -3.0134e+00, -4.1933e+00, -3.2577e+00, -2.9258e+00, -3.5225e+00, -3.9505e+00, -4.4448e+00, -4.8218e+00, -4.5496e+00, -5.3980e+00, -3.4436e+00, -3.6439e+00, -4.6848e+00]], [[ 5.6591e-01, -9.1055e-01, -1.4375e+00, -2.1000e+00, -2.8129e+00, -2.8064e+00, -2.7339e+00, -2.6940e+00, -3.8169e+00, -4.7680e+00, -3.8997e+00, -4.2326e+00, -1.5811e+00, -8.2311e-01, -1.4838e+00]], [[ 1.1012e-01, -3.3354e+00, -3.6223e+00, -3.4678e+00, -2.6164e+00, -3.4572e+00, -2.7352e+00, -3.2766e+00, -2.8110e+00, -3.7725e+00, -4.4043e+00, -3.0081e+00, -2.2909e+00, -3.8821e+00, -3.7929e+00]], [[ 2.1160e+00, -6.2721e+00, -2.5692e+00, -4.8033e+00, -4.4064e+00, -3.7627e+00, -4.4391e+00, -4.9517e+00, -2.6282e+00, -4.5026e+00, -4.2101e+00, -5.9240e+00, -3.5639e+00, -1.6848e+00, -9.8819e-01]], [[ 6.6039e-01, -5.0293e+00, -5.1762e+00, -5.1159e+00, -4.7924e+00, -5.4616e+00, -6.9553e+00, -4.6034e+00, -4.8127e+00, -4.6116e+00, -5.1002e+00, -6.8629e+00, -3.0482e+00, -1.7823e+00, -2.6414e+00]], [[ 8.9797e-01, -2.2343e+00, -2.7035e+00, -5.5800e+00, -4.7606e+00, -4.9405e+00, -2.5097e+00, -1.8046e+00, -2.1028e+00, -4.7781e+00, -4.9768e+00, -3.0180e+00, -2.4305e+00, -3.5608e+00, -3.7390e+00]], [[ 9.2845e-01, -2.3303e+00, -2.9602e+00, -3.4237e+00, -3.2583e+00, -4.7022e+00, -5.5427e+00, -5.2408e+00, -4.2054e+00, -4.1795e+00, -4.3672e+00, -5.7615e+00, -4.6238e+00, -5.2559e+00, -4.1127e+00]], [[ 9.6719e-01, -2.6453e+00, -1.9550e+00, -2.1429e+00, -2.5848e+00, -3.0303e+00, -3.3518e+00, -2.9635e+00, -2.7603e+00, -3.8853e+00, -4.2986e+00, -4.7679e+00, -2.5323e+00, -3.0032e+00, -2.2346e+00]], [[ 2.1982e+00, -8.1700e-01, -8.9000e-01, -7.6469e-01, -1.3454e+00, -9.4487e-01, -1.4771e-02, 2.4084e-01, -1.3348e+00, -2.2736e+00, -1.9815e+00, -1.4195e+00, 3.8502e-01, -1.7939e-01, -8.0214e-02]], [[ 1.1721e+00, -4.0267e+00, -3.8919e+00, -3.9240e+00, -3.5823e+00, -1.7922e+00, -3.4414e+00, -3.6256e+00, -5.2204e+00, -5.5098e+00, -4.4495e+00, -4.1570e+00, -2.4503e+00, -2.9264e+00, -1.0159e+00]]]]) attn_weights tensor([[[[ -1.7434, -4.1382, -3.0239, -3.5593, -2.8090, -3.3339, -3.4404, -3.6769, -1.5150, -2.3432, -0.8623, -1.2033, -1.9417, -1.9974, -2.8841]], [[ 0.5865, -4.2913, -5.2106, -6.7219, -5.5813, -4.7143, -4.1101, -3.5745, -4.2749, -6.3616, -5.0848, -3.8210, -1.7056, -2.9204, -4.1863]], [[ 0.3412, -3.3703, -3.3587, -3.5076, -3.2054, -3.7801, -3.5865, -2.9153, -3.1306, -3.6340, -2.8100, -2.7733, -3.3564, -3.0712, -2.9512]], [[ 0.3433, -3.0183, -4.3377, -3.9972, -3.6245, -3.3418, -3.4223, -3.0325, -3.6281, -3.8563, -3.2245, -2.6539, -2.1860, -2.5300, -3.6159]], [[ 1.0435, -1.7184, -1.3233, -1.3874, -1.8055, -1.6674, -1.0228, -0.7131, -1.6827, -1.9286, -1.7406, -1.4761, -1.7606, -0.9874, -1.3095]], [[ -0.6218, -5.2032, -5.6948, -5.4132, -5.1768, -5.1092, -5.2683, -4.0277, -3.7488, -3.9744, -3.6602, -3.6405, -3.4836, -3.2179, -2.9610]], [[ 2.2986, -3.6555, -3.8076, -4.7661, -3.2773, -2.2493, -2.4940, -2.3394, -3.4889, -4.2533, -3.2656, -2.1334, -2.2384, -1.2893, -0.4248]], [[ -0.3567, -4.3090, -5.0031, -4.7306, -4.4417, -3.1870, -2.4968, -4.2796, -4.5298, -4.1736, -4.2558, -3.7008, -2.4973, -1.4601, -2.9952]], [[ -1.7531, -7.2342, -6.0942, -7.2305, -5.5553, -3.3038, -4.1450, -6.7076, -4.2483, -4.7033, -2.7206, -2.0413, -1.8913, -0.6627, -3.2907]], [[ 4.4507, -8.4825, -5.9494, -6.9741, -4.7874, -1.3398, -4.9933, -3.7624, -3.7463, -5.3186, -3.4966, -5.5493, -2.9334, -2.8703, -2.6053]], [[ 2.8622, -3.5922, -3.2774, -3.5852, -2.2781, -1.4549, -0.7965, -1.2427, -1.3238, -2.4718, -1.6948, -2.1696, -0.9153, -0.7939, -1.6461]], [[ -1.0711, -3.9125, -3.5024, -3.8176, -3.9792, -4.1911, -3.3284, -2.7975, -1.7868, -2.3495, -2.2155, -1.9668, -1.9775, -2.0267, -2.5541]]], [[[ -1.0143, -3.1448, -3.4546, -3.0055, -4.9256, -3.9967, -3.3729, -3.9552, -2.8034, -1.3870, -1.1252, -0.7319, -0.5536, -0.9635, -3.8854]], [[ 0.4219, -4.3081, -6.1268, -5.5181, -4.7800, -4.4233, -4.6772, -5.3942, -5.7220, -7.8999, -7.4802, -6.5461, -6.5437, -4.9575, -3.6832]], [[ 0.3778, -3.0847, -2.9523, -3.4986, -3.6807, -3.7734, -3.9778, -3.2895, -3.1516, -3.0671, -3.8433, -3.1476, -3.4599, -4.1572, -4.0218]], [[ 0.4331, -3.3949, -4.6206, -4.6713, -3.6378, -3.4909, -3.1620, -3.0365, -3.4926, -4.9026, -5.0824, -4.4138, -4.2150, -4.1159, -3.6036]], [[ 1.2183, -2.1030, -3.3448, -3.2719, -3.0705, -2.7190, -1.3077, -1.7972, -2.9142, -4.1994, -3.8273, -2.6929, -2.5216, -2.4859, -2.5112]], [[ -0.4873, -4.5636, -5.3349, -5.4462, -4.7037, -4.9214, -4.5379, -4.0797, -4.2189, -3.7535, -3.9148, -3.3665, -2.3974, -2.6207, -2.6714]], [[ 2.3478, -3.9064, -3.1823, -3.6273, -2.1979, -2.4463, -3.4693, -2.5681, -1.4902, -2.7564, -2.8315, -3.0016, -2.7832, -2.1411, 0.2689]], [[ -0.1673, -3.2552, -3.7152, -4.0370, -3.5324, -2.6323, -1.4635, -2.9580, -3.3407, -3.9796, -3.9565, -3.9464, -3.5397, -3.1288, -3.2659]], [[ -0.9915, -6.1558, -6.2133, -4.9133, -6.4605, -6.4074, -6.1939, -5.5613, -4.5080, -4.5748, -3.2804, -3.0114, -2.9320, -1.3626, -3.8165]], [[ 5.5165, -9.2673, -5.9775, -5.7517, -0.8222, -0.0353, -7.9949, -7.4902, -6.0055, -4.0922, -7.0288, -3.4898, -7.4147, -6.8412, 0.1851]], [[ 3.0914, -3.5549, -3.0929, -3.7053, -3.3801, -2.3697, -1.3264, -1.6962, -1.3237, -1.8076, -2.1456, -1.7635, -1.8629, -2.3105, -1.3795]], [[ -0.4856, -4.4278, -5.1341, -5.3030, -5.9503, -4.9821, -3.7500, -4.8985, -3.3430, -3.2147, -3.5159, -1.6994, 0.0550, 0.8546, -1.1527]]], [[[ -1.0735, -5.5864, -3.6798, -4.5802, -5.0886, -3.8544, -3.6894, -5.7894, -4.1729, -1.7476, -1.7871, -0.8589, -0.0352, -1.1244, -4.3237]], [[ 1.0434, -5.9784, -5.8219, -5.4264, -4.7089, -4.0351, -5.1589, -6.1233, -5.8680, -4.7291, -6.7129, -6.7940, -2.4713, 0.6720, -1.4433]], [[ 0.4899, -4.0007, -3.5490, -3.6314, -4.0982, -4.4143, -3.8527, -3.2663, -3.9315, -3.6548, -4.7279, -3.8162, -4.1365, -3.9574, -3.7731]], [[ 0.4461, -3.5485, -4.8480, -4.5755, -4.0453, -3.0929, -3.1387, -2.8828, -3.0107, -3.9421, -4.3576, -4.4128, -3.9868, -4.1456, -4.5284]], [[ 1.6110, -2.6612, -2.1744, -2.6612, -2.3027, -3.0228, -2.6711, -2.0330, -3.8820, -2.3737, -2.1509, -2.3291, -2.1928, -2.5260, -3.1531]], [[ -0.6513, -4.5199, -5.2669, -6.0343, -5.9201, -5.8800, -5.5583, -5.2981, -3.9457, -3.8812, -5.7011, -4.5195, -4.4309, -3.9556, -3.2262]], [[ 2.0627, -3.0525, -2.4960, -3.3947, -2.7335, -3.1856, -3.6278, -2.9632, -2.0387, -1.9732, -3.2689, -3.2479, -2.1323, -1.7347, -1.4752]], [[ -0.3639, -3.7779, -4.8363, -4.3206, -4.1067, -2.3843, -1.2310, -2.8526, -4.4723, -4.2581, -4.5245, -5.0428, -3.2904, -4.0860, -3.7622]], [[ -1.0200, -6.6944, -4.1296, -5.3085, -4.6917, -7.6813, -6.5771, -6.9275, -3.6596, -2.7827, -3.5239, -2.0812, -2.0225, -0.8773, -3.4843]], [[ 5.1501, -12.2988, -6.0586, -6.7897, -3.3793, -1.6569, -10.4262, -8.5795, -6.1033, -7.2985, -7.2994, -7.6536, -4.5386, -2.5616, -0.4942]], [[ 3.2215, -3.1700, -3.8581, -4.0169, -3.1369, -2.7923, -2.0834, -2.7960, -1.9974, -1.7332, -2.3437, -2.5643, -2.7808, -2.1566, -2.6578]], [[ -0.6180, -5.4854, -4.6905, -5.3551, -5.4477, -5.3830, -3.9880, -4.6190, -3.9038, -2.6640, -3.4128, -3.1114, -2.2401, -1.2984, -2.9090]]], [[[ -0.8224, -5.0303, -5.3039, -3.2970, -4.2134, -2.4741, -2.7242, -4.9463, -4.7425, -3.4007, -3.0857, -3.5234, -1.2062, -1.2010, -2.6151]], [[ -0.2576, -4.3610, -4.1695, -6.0845, -3.2258, -3.0955, -3.1722, -3.9723, -3.1856, -2.0093, -4.1941, -3.7580, -3.2565, -3.7482, -4.3452]], [[ 0.2646, -3.3665, -2.7971, -3.4155, -3.5983, -3.5940, -3.7364, -3.2838, -3.8241, -4.4671, -4.0775, -2.5198, -2.6845, -3.5259, -3.6014]], [[ 0.1122, -2.4032, -3.5419, -3.1597, -1.7025, -2.1887, -1.8952, -1.8262, -2.1249, -3.3437, -2.6269, -1.5569, -2.9568, -2.4555, -2.2782]], [[ 0.8949, -0.8294, -1.9876, -2.1349, -1.8959, -2.4495, -1.1221, -1.6595, -2.0172, -2.6274, -2.1810, -1.3110, -2.2890, -1.9697, -1.2704]], [[ -0.7542, -4.0771, -5.3710, -5.7552, -5.4127, -5.2269, -4.1296, -5.2406, -4.7959, -4.5368, -3.5615, -4.0026, -4.2082, -4.0817, -3.7016]], [[ 2.0721, -3.7114, -2.9385, -2.8974, -2.7024, -3.0798, -3.5798, -2.9230, -2.5738, -3.1205, -3.5383, -2.5505, -1.4820, -1.1620, -0.1729]], [[ -0.6302, -4.2514, -5.6016, -4.3706, -2.7526, -2.6074, -1.8153, -2.3164, -2.5475, -1.6276, -1.7774, -2.9039, -3.4305, -3.1394, -3.8308]], [[ -1.4146, -6.2886, -6.8365, -6.6809, -7.8564, -6.1410, -4.9505, -5.5860, -6.3498, -5.7657, -4.0852, -4.1187, -2.8363, -2.9822, -4.6060]], [[ 4.9096, -7.6082, -7.1107, -6.2142, -2.2781, -1.9796, -6.8380, -5.3700, -5.9738, -3.0727, -7.3926, -4.2994, -4.9867, -3.4211, -0.5478]], [[ 2.9775, -2.6450, -2.2946, -2.5123, -2.3969, -2.4724, -1.5859, -1.8802, -1.5226, -3.0893, -1.6419, -0.7427, -1.1687, -1.3520, -1.8466]], [[ -0.2446, -3.3571, -4.7693, -5.4698, -5.3358, -4.8052, -3.6912, -4.5985, -4.9520, -4.7991, -3.8841, -3.3628, -2.1869, -2.8614, -3.4942]]], [[[ 0.3096, -3.8651, -3.5451, -4.5489, -3.8500, -4.0871, -3.4421, -6.3168, -6.3219, -7.3408, -6.8955, -5.9070, -4.3530, -2.7854, -4.0166]], [[ 0.7857, -2.8268, -5.1322, -4.3796, -4.7476, -4.1858, -4.7262, -4.5680, -6.7205, -5.6860, -5.0647, -5.0431, -3.5642, -4.4681, -4.9685]], [[ 0.5295, -2.8685, -3.3300, -3.4407, -3.3609, -2.9772, -2.8268, -2.4542, -3.5874, -3.4946, -3.0562, -3.8120, -2.0537, -3.1294, -2.1139]], [[ 0.4771, -1.5015, -2.1046, -2.3493, -2.1111, -2.5838, -1.5893, -2.9826, -3.2156, -3.3142, -3.7659, -3.7664, -1.3448, -1.1032, -1.6903]], [[ 1.0558, -0.3698, -0.4883, -0.4857, -1.2821, -1.7568, -0.1957, -0.5777, -2.1635, -1.9702, -1.0514, -0.3606, 0.4674, 0.4985, 0.4765]], [[ -0.4906, -3.7171, -3.9804, -4.1344, -4.4087, -3.7995, -4.0231, -3.9714, -2.8535, -4.2552, -4.0568, -4.4360, -2.6852, -3.4247, -2.8099]], [[ 2.1445, -1.8289, -2.1457, -2.9356, -2.9472, -2.0617, -2.8652, -2.8036, -4.1835, -3.9773, -3.0567, -3.9028, -2.1834, -2.5310, -0.5510]], [[ -0.0614, -1.9972, -2.4742, -1.9861, -2.3160, -1.2819, -0.6160, -1.1713, -2.8597, -3.0682, -0.9231, -1.1632, -0.3905, -2.5553, -2.8025]], [[ -1.0326, -5.5993, -6.6697, -6.8708, -5.7736, -4.2041, -4.8510, -5.1188, -5.0006, -6.1512, -4.3680, -5.5113, -3.4666, -3.0375, -5.4154]], [[ 3.8347, -4.5564, -2.2129, -4.0571, -4.5075, -3.0172, -5.5195, -6.6418, -3.0264, -5.7868, -5.1523, -7.4934, -5.7712, -2.1222, -1.8208]], [[ 2.5809, -1.9700, -1.3339, -2.8048, -2.9159, -2.6136, -1.7786, -3.8114, -3.1727, -3.8377, -2.7067, -2.5888, -1.5989, -1.1849, -1.3244]], [[ 0.3509, -3.3658, -5.2598, -5.3307, -5.2009, -4.9103, -3.6253, -5.3585, -5.0745, -6.2341, -5.0728, -5.2235, -4.3792, -2.0687, -3.7305]]]]) attn_weights tensor([[[[-4.4166e-01, -9.0674e+00, -8.1817e+00, -9.5424e+00, -8.0292e+00, -4.7891e+00, -5.5510e+00, -5.8734e+00, -5.2437e+00, -6.6361e+00, -5.5740e+00, -4.9749e+00, -3.7146e+00, -2.6093e+00, -4.2575e+00]], [[ 3.1857e+00, -2.2537e+00, -1.4208e+00, -2.3914e+00, -3.2938e+00, 2.4623e-02, -5.9775e-01, -1.4402e+00, -6.9108e-01, -1.5147e+00, -1.5981e+00, -1.8066e+00, -1.7885e+00, 3.9354e-01, -1.5487e+00]], [[ 6.1402e+00, -5.1088e+00, -4.8268e+00, -4.6591e+00, -3.7822e+00, -2.2966e-01, -1.6454e+00, -1.4268e+00, -3.1436e+00, -3.1543e+00, -2.0557e+00, -7.7351e-01, -1.7271e-03, 1.1088e-01, -1.8104e+00]], [[-4.8894e-02, -4.7144e+00, -3.3538e+00, -3.4884e+00, -2.7566e+00, -1.4701e+00, -1.7433e+00, -2.6225e+00, -1.9293e+00, -2.5954e+00, -7.4310e-01, -1.0835e+00, -1.5318e+00, 3.0092e-01, -1.0472e+00]], [[ 4.0115e-01, -5.1557e+00, -4.3201e+00, -4.8698e+00, -5.0655e+00, -4.3325e+00, -3.0883e+00, -4.0024e+00, -3.5921e+00, -4.3113e+00, -1.5966e+00, -2.2278e+00, -2.1820e+00, -3.0682e+00, -4.4957e+00]], [[ 5.3845e-01, -2.5330e+00, -1.6091e+00, -1.6110e+00, -1.8774e+00, -3.2434e+00, -2.3851e+00, -2.0892e+00, -2.6654e+00, -2.7865e+00, -2.0121e+00, -1.2186e+00, -5.1866e-01, -1.7196e+00, -2.3343e+00]], [[ 1.4929e+00, -2.6620e+00, -3.0377e+00, -3.7016e+00, -3.1005e+00, -2.6518e+00, -2.2022e+00, -2.1738e+00, -2.1784e+00, -2.8723e+00, -2.4818e+00, -1.9765e+00, -2.2763e+00, -1.9377e+00, -1.9869e+00]], [[ 3.1413e+00, -2.3756e+00, -3.1331e+00, -4.3384e+00, -3.6438e+00, -1.8871e+00, -1.6276e+00, -5.9645e-01, -1.1576e+00, -2.4486e+00, -1.8854e+00, -2.6074e+00, -1.7453e+00, -6.8305e-01, -2.3325e+00]], [[-2.3233e-01, -5.9863e+00, -4.1313e+00, -5.3321e+00, -3.9996e+00, -3.3519e+00, -2.9879e+00, -5.1005e+00, -3.8748e+00, -4.7852e+00, -2.4047e+00, -2.1551e+00, -7.2410e-01, -1.3856e+00, -3.4209e+00]], [[-3.9454e-01, -3.5952e+00, -3.2451e+00, -3.9174e+00, -4.7196e+00, -2.7777e+00, -3.7248e+00, -1.8425e+00, -8.6151e-01, -1.5935e+00, -1.5509e+00, -2.3264e+00, -2.8983e+00, -2.0988e+00, -2.5216e+00]], [[ 4.0074e+00, -3.9379e+00, -3.9044e+00, -4.3246e+00, -4.3682e+00, -5.2373e-01, -2.5976e+00, -7.9021e-01, -2.2823e+00, -3.0617e+00, -1.3192e+00, -2.9371e+00, -1.1783e+00, -1.8918e+00, -2.4096e+00]], [[ 2.8688e+00, -4.7613e+00, -4.1130e+00, -3.7145e+00, -2.8094e+00, -2.8217e+00, -2.7916e+00, -1.9974e+00, -3.3899e+00, -3.1613e+00, -1.9661e+00, -1.1801e+00, -1.9563e+00, -2.9386e+00, -2.8382e+00]]], [[[-1.0243e-01, -7.5645e+00, -8.0236e+00, -7.4899e+00, -7.3167e+00, -7.4963e+00, -7.6053e+00, -6.0717e+00, -6.9937e+00, -6.5125e+00, -6.0498e+00, -4.2585e+00, -3.4711e+00, -1.5449e+00, -4.3037e+00]], [[ 3.2015e+00, -2.8190e+00, -2.3954e+00, -3.9977e+00, -2.7599e+00, -8.8343e-01, -8.3560e-01, -3.4747e-01, -4.7017e-01, -1.4889e+00, -3.1367e+00, -1.3199e+00, -1.5664e+00, -2.6045e+00, -1.3350e+00]], [[ 6.4281e+00, -3.5830e+00, -3.2358e+00, -4.5805e+00, -9.7861e-01, 6.6998e-01, -1.8369e+00, -3.5708e+00, -2.7973e+00, -3.0538e+00, -5.1383e+00, -3.8485e-01, -2.7444e+00, -2.3547e+00, 3.2192e+00]], [[ 4.2517e-01, -4.7574e+00, -4.0466e+00, -5.2417e+00, -4.8342e+00, -3.6559e+00, -3.7959e+00, -3.5671e+00, -3.0032e+00, -3.5595e+00, -4.8349e+00, -3.1968e+00, -3.1463e+00, -3.5064e+00, -2.6701e+00]], [[ 1.2325e+00, -5.6462e+00, -4.7526e+00, -4.4794e+00, -6.3865e+00, -6.1308e+00, -4.9691e+00, -5.9359e+00, -3.9084e+00, -4.5927e+00, -4.2231e+00, -3.4506e+00, -3.6910e+00, -4.1663e+00, -4.5760e+00]], [[ 1.3771e+00, -4.1211e+00, -3.0105e+00, -3.8514e+00, -4.9873e+00, -4.7695e+00, -2.2534e+00, -2.5780e+00, -2.6860e+00, -4.0933e+00, -4.6354e+00, -2.7869e+00, -1.9894e+00, -1.7989e+00, -2.7582e+00]], [[ 1.6279e+00, -3.8842e+00, -3.7579e+00, -4.2050e+00, -3.9726e+00, -2.3671e+00, -2.4648e+00, -3.0389e+00, -2.9282e+00, -3.4517e+00, -3.4983e+00, -3.3924e+00, -2.7953e+00, -3.1556e+00, -2.9838e+00]], [[ 3.3809e+00, -5.1189e+00, -5.6436e+00, -7.2651e+00, -5.9615e+00, -2.7603e+00, -3.1218e+00, -2.8697e+00, -2.7653e+00, -4.5572e+00, -5.5592e+00, -4.5739e+00, -5.8601e+00, -5.5613e+00, -2.3267e+00]], [[-3.3456e-01, -4.5664e+00, -3.5925e+00, -3.0668e+00, -4.3027e+00, -1.7624e+00, -1.6943e+00, -2.1940e+00, -2.1912e+00, -2.7458e+00, -2.1851e+00, -3.4204e+00, -2.1195e+00, -1.7163e+00, -3.4415e+00]], [[ 3.4887e-01, -4.3288e+00, -3.5542e+00, -3.8272e+00, -4.8489e+00, -3.1892e+00, -3.2955e+00, -2.4040e+00, -8.7605e-01, -1.8044e+00, -1.9113e+00, -1.6404e+00, -1.4820e+00, -2.2662e+00, -3.6590e+00]], [[ 4.6212e+00, -1.8382e+00, -4.4236e+00, -4.7598e+00, -8.0395e-04, 4.8450e-03, -1.1675e+00, -1.9110e+00, -2.9334e+00, -3.8042e+00, -5.3992e+00, -1.2400e+00, -2.6791e+00, -3.4521e+00, 1.0392e+00]], [[ 3.2013e+00, -4.4461e+00, -4.8204e+00, -5.4460e+00, -2.7698e+00, -2.2100e+00, -2.9065e+00, -3.8103e+00, -5.1694e+00, -4.3176e+00, -5.4537e+00, -3.0879e+00, -3.4884e+00, -3.0236e+00, -6.5726e-01]]], [[[-3.9836e-01, -7.6845e+00, -6.5348e+00, -6.2393e+00, -7.3587e+00, -7.6500e+00, -7.0195e+00, -5.8758e+00, -5.4432e+00, -4.7851e+00, -4.2415e+00, -3.5519e+00, -1.0521e+00, -2.8382e+00, -4.3799e+00]], [[ 2.8762e+00, -1.7686e+00, -1.7158e+00, -1.7728e+00, -1.7251e+00, -1.5368e+00, 3.2758e-02, -1.1937e+00, -1.7584e+00, -7.0966e-01, -1.9267e+00, -3.2536e+00, -1.6026e+00, -2.1693e+00, -1.7023e+00]], [[ 7.1616e+00, -7.8383e+00, -4.5590e+00, -7.1028e+00, -4.6763e+00, -2.3002e+00, -7.5214e+00, -1.0383e+01, -5.2812e+00, -6.7781e+00, -7.9589e+00, -7.8242e+00, -4.0110e+00, -2.3625e+00, -8.6201e-01]], [[ 1.1478e-01, -3.8023e+00, -3.4406e+00, -3.8758e+00, -3.6300e+00, -3.4991e+00, -2.8414e+00, -1.8634e+00, -4.2294e-01, -1.3737e+00, -2.3027e+00, -2.4013e+00, -1.7424e+00, -2.6866e+00, -3.0612e+00]], [[ 8.6675e-01, -5.4222e+00, -2.9627e+00, -4.2480e+00, -5.3174e+00, -4.9871e+00, -5.2392e+00, -4.3892e+00, -2.8894e+00, -2.4185e+00, -2.7619e+00, -2.3300e+00, -2.6134e+00, -2.5370e+00, -4.9410e+00]], [[ 8.3135e-01, -3.3765e+00, -3.2244e+00, -3.1160e+00, -3.4502e+00, -2.8530e+00, -2.1154e+00, -1.6104e+00, -1.5660e+00, -3.0740e+00, -2.5413e+00, -2.7220e+00, -1.7438e+00, -2.8672e+00, -3.6354e+00]], [[ 1.4796e+00, -2.4528e+00, -3.5509e+00, -3.3779e+00, -2.9927e+00, -2.2562e+00, -2.3435e+00, -2.2185e+00, -2.1243e+00, -3.2865e+00, -4.0307e+00, -4.1637e+00, -4.0386e+00, -3.8512e+00, -4.1022e+00]], [[ 2.7584e+00, -5.2979e+00, -4.5305e+00, -6.5670e+00, -5.1789e+00, -4.5826e+00, -4.1747e+00, -4.1557e+00, -3.3056e+00, -4.3605e+00, -5.5226e+00, -5.8438e+00, -4.8744e+00, -4.0561e+00, -5.2651e+00]], [[-4.3847e-01, -4.1656e+00, -3.1045e+00, -3.5102e+00, -2.7018e+00, -3.9760e+00, -2.4805e+00, -1.4297e+00, -2.2436e+00, -1.5376e+00, -1.5786e+00, -1.3014e+00, -1.0154e+00, -2.6904e+00, -4.1018e+00]], [[-1.4482e-01, -2.2755e+00, -1.9290e+00, -2.8239e+00, -4.2566e+00, -3.6788e+00, -2.4185e+00, -1.7860e+00, -1.1659e+00, -9.3815e-01, -2.0347e+00, -2.0705e+00, -2.1850e+00, -2.5127e+00, -3.2793e+00]], [[ 5.1807e+00, -5.2986e+00, -1.9248e+00, -4.1223e+00, -1.3930e+00, -2.0791e+00, -5.4146e+00, -5.0213e+00, -3.8753e+00, -4.6267e+00, -6.1776e+00, -5.9994e+00, -2.6070e+00, -2.0980e+00, 3.2109e-01]], [[ 2.9946e+00, -5.8563e+00, -4.0586e+00, -6.9572e+00, -4.6906e+00, -4.0488e+00, -4.8582e+00, -4.9615e+00, -4.6666e+00, -3.3446e+00, -4.3216e+00, -4.3701e+00, -3.4642e+00, -4.2626e+00, -4.8740e+00]]], [[[-6.4981e-01, -7.0453e+00, -7.1171e+00, -5.7125e+00, -6.2720e+00, -5.6660e+00, -5.9514e+00, -7.0520e+00, -6.9071e+00, -6.2921e+00, -6.6793e+00, -4.7827e+00, -3.5256e+00, -3.0289e+00, -5.1237e+00]], [[ 2.5049e+00, -2.2568e+00, -3.3721e+00, -4.6123e+00, -2.9648e+00, -1.7905e+00, -1.8988e+00, -1.2015e+00, -2.1045e+00, -2.1631e+00, -2.7919e+00, -3.0758e-01, -1.4346e+00, -1.5670e+00, -2.4937e+00]], [[ 6.0427e+00, -2.6236e+00, -4.5495e+00, -6.1043e+00, -3.2931e+00, -1.2478e+00, -3.7080e+00, -4.1605e+00, -4.1427e+00, -1.6122e+00, -4.8661e+00, -1.8561e+00, -2.4512e+00, -1.6751e+00, 2.9566e-01]], [[ 2.1511e-01, -4.1163e+00, -3.9176e+00, -4.2697e+00, -3.9483e+00, -3.3742e+00, -3.1127e+00, -2.3295e+00, -3.2377e+00, -2.3631e+00, -2.9392e+00, -2.4632e+00, -1.2738e+00, -1.6971e+00, -2.2436e+00]], [[ 9.2400e-01, -5.2103e+00, -5.1740e+00, -5.5692e+00, -5.5511e+00, -5.0628e+00, -3.9051e+00, -4.6431e+00, -5.9786e+00, -4.6676e+00, -4.8198e+00, -3.0445e+00, -4.1679e+00, -4.6138e+00, -4.9446e+00]], [[ 7.0635e-01, -2.2002e+00, -2.7388e+00, -2.9597e+00, -2.0200e+00, -3.4747e+00, -2.0320e+00, -8.7431e-01, -2.5428e+00, -2.8721e+00, -2.5354e+00, -1.5982e+00, -2.3650e+00, -3.0484e+00, -2.2339e+00]], [[ 1.3649e+00, -2.3619e+00, -2.9081e+00, -3.3930e+00, -2.8644e+00, -2.5302e+00, -2.3583e+00, -2.7313e+00, -2.7295e+00, -2.3162e+00, -2.9301e+00, -2.2644e+00, -2.3154e+00, -2.1539e+00, -2.9445e+00]], [[ 2.9521e+00, -2.8894e+00, -2.9282e+00, -4.5232e+00, -3.4685e+00, -3.0788e+00, -2.3635e+00, -1.5309e+00, -1.9311e+00, -1.8420e+00, -2.1301e+00, -6.1647e-01, -1.9232e+00, -2.7149e+00, -2.0815e+00]], [[-1.0070e+00, -5.8649e+00, -5.3174e+00, -4.4063e+00, -4.0401e+00, -1.7821e+00, -6.9042e-01, -2.1756e+00, -3.6570e+00, -2.4784e+00, -1.4600e+00, -3.0542e+00, -6.7299e-01, -1.3146e+00, -2.6848e+00]], [[ 8.0677e-02, -2.3074e+00, -2.1320e+00, -3.0837e+00, -4.1371e+00, -3.0884e+00, -3.5261e+00, -2.2503e+00, -3.4294e+00, -3.1425e+00, -3.9923e+00, -4.2185e-01, -1.7127e-01, -1.2411e+00, -2.1020e+00]], [[ 3.0472e+00, -3.4840e+00, -3.4426e+00, -5.7211e+00, -2.1359e+00, -2.6973e+00, -2.2832e+00, -2.0232e+00, -1.4004e+00, -2.8531e+00, -4.3567e+00, -1.3381e+00, -2.2326e+00, -2.0815e+00, -1.0512e+00]], [[ 3.2719e+00, -2.4127e+00, -4.1864e+00, -3.4782e+00, -1.7937e+00, -2.4906e+00, -3.9995e+00, -3.8883e+00, -4.2903e+00, -3.3182e+00, -4.0869e+00, -2.8542e+00, -3.8254e+00, -2.6000e+00, -1.5858e+00]]], [[[-7.8452e-01, -4.5835e+00, -4.7751e+00, -5.3415e+00, -5.3397e+00, -3.4410e+00, -4.6627e+00, -4.4115e+00, -5.7349e+00, -5.2252e+00, -3.6875e+00, -4.8814e+00, -1.8962e+00, -7.2970e-01, -3.7294e+00]], [[ 2.9563e+00, -1.9940e+00, -1.3898e+00, -2.7637e+00, -2.0391e+00, -3.4721e-01, -6.6589e-01, -8.8057e-01, -1.2409e+00, -7.1652e-01, -5.7418e-01, -1.2527e+00, 1.1009e-01, 2.0626e-02, -7.1054e-01]], [[ 5.3071e+00, -1.9472e+00, -2.1177e+00, -3.7431e+00, -3.7299e+00, -8.1122e-01, -2.6457e+00, -4.6285e+00, -2.0218e+00, -4.5594e+00, -3.4849e+00, -4.7156e+00, -4.0804e+00, -1.3254e+00, 3.4405e-01]], [[ 7.2191e-01, -2.6758e+00, -2.7844e+00, -3.6308e+00, -4.3503e+00, -4.1305e+00, -3.8909e+00, -4.3794e+00, -3.5402e+00, -3.8352e+00, -4.0858e+00, -4.6429e+00, -3.7161e+00, -3.7272e+00, -3.3489e+00]], [[ 8.3367e-01, -2.0508e+00, -2.3160e+00, -2.8527e+00, -1.8727e+00, -4.2446e+00, -3.4988e+00, -3.9469e+00, -4.8210e+00, -5.0483e+00, -5.4845e+00, -5.5986e+00, -2.4000e+00, -9.7130e-01, -4.1948e+00]], [[ 1.0833e+00, -2.1768e+00, -1.7410e+00, -2.1660e+00, -2.2278e+00, -3.2151e+00, -1.3529e+00, -2.3268e+00, -2.4917e+00, -2.8168e+00, -3.4557e+00, -2.8648e+00, -1.6484e+00, -1.2357e+00, -2.1415e+00]], [[ 1.2997e+00, -1.1785e+00, -2.1544e+00, -1.6008e+00, -2.0311e+00, -2.0993e+00, -2.2278e+00, -1.6980e+00, -2.0514e+00, -2.8472e+00, -2.4284e+00, -2.9390e+00, -1.3699e+00, -2.3493e+00, -2.3428e+00]], [[ 3.3725e+00, 1.8453e+00, 3.8462e-01, -1.1679e+00, -1.0699e+00, -1.5175e+00, -2.4303e+00, -3.0004e+00, -3.9115e+00, -3.9627e+00, -3.0674e+00, -4.1484e+00, -1.9343e+00, -1.3828e+00, -1.0137e+00]], [[ 1.4301e-02, -2.9364e+00, -2.6959e+00, -2.8692e+00, -3.1001e+00, -3.3259e+00, -2.5868e+00, -2.6039e+00, -5.6029e+00, -4.6757e+00, -4.6916e+00, -3.8670e+00, -1.6056e+00, -1.8177e+00, -3.6236e+00]], [[ 1.1493e+00, -4.7343e+00, -4.7261e+00, -5.1202e+00, -5.7378e+00, -4.8163e+00, -5.1866e+00, -5.7099e+00, -5.3984e+00, -6.1862e+00, -4.5076e+00, -6.8396e+00, -1.9196e+00, -8.2247e-01, -2.1431e+00]], [[ 3.5426e+00, -2.9965e+00, -2.1414e+00, -4.4514e+00, -1.8570e+00, -9.7884e-01, -3.0023e+00, -4.5892e+00, -3.5288e+00, -3.2243e+00, -2.9065e+00, -5.1449e+00, -3.7429e+00, -1.8226e+00, -2.2115e+00]], [[ 3.1065e+00, -3.6755e+00, -2.5054e+00, -3.3235e+00, -3.5002e+00, -1.1426e+00, -2.9803e+00, -3.8568e+00, -2.9126e+00, -4.8037e+00, -3.4848e+00, -5.3365e+00, -2.6841e+00, -2.0893e+00, -1.4612e+00]]]]) attn_weights tensor([[[[ 0.7355, -2.9989, -2.5146, -3.0779, -2.0275, -3.8571, -1.8546, -2.3701, -1.2747, -2.0904, -2.4117, -1.9417, -2.4197, -3.2288, -1.2329]], [[ 4.9653, -1.6628, -2.4980, -3.5324, -2.6967, -0.2510, -0.8129, -0.1015, -1.6388, -2.1666, -1.0497, -0.3922, 0.7689, -0.1864, -0.2950]], [[ 1.2931, -0.1224, -0.2213, -0.8683, -0.5108, -1.0296, -1.3551, -0.9199, -0.8569, -1.4371, -1.3560, -0.6847, -1.2291, -0.8694, -1.0289]], [[ 1.8636, -1.6577, -1.0216, -1.5080, -1.8643, 1.5283, -0.6250, 0.4377, -0.9085, -0.8395, -2.3134, -2.3046, -2.1613, 0.8431, -2.3540]], [[ 0.1171, -7.8652, -7.2759, -7.7294, -7.3353, -3.9851, -3.5415, -6.3826, -6.0933, -5.9416, -5.3848, -4.0087, -1.8175, -1.8756, -2.8742]], [[-2.2948, -4.1155, -3.2275, -3.6991, -2.9703, -3.6748, -3.4595, -2.7549, -1.3489, -2.1227, -1.1785, -1.1899, -2.2143, -2.4312, -3.2280]], [[ 3.2316, -2.1671, -2.0492, -3.8321, -3.8284, -0.3848, -1.7569, -1.8619, -2.4004, -4.8941, -3.1135, -1.5045, -0.1667, 0.0722, -1.3225]], [[ 0.5729, -7.6839, -6.2270, -8.0340, -7.4567, -3.5131, -3.9291, -4.8454, -4.0094, -5.7652, -4.4776, -4.1425, -3.1868, -1.6290, -0.9060]], [[ 0.6170, -2.8160, -3.5065, -3.7225, -3.4646, -0.9166, -0.9205, -2.1736, -3.6729, -3.6543, -2.5966, -2.9021, -0.8566, -1.1412, -2.0438]], [[ 1.2870, -4.2554, -3.6844, -4.1230, -2.9453, -0.3111, -1.6594, -2.6607, -2.7599, -3.1350, -2.3290, -2.1286, -1.8761, 0.4253, -2.4495]], [[ 0.9942, -3.6461, -2.3241, -3.4421, -3.2250, -0.6726, -2.1014, -2.0927, -1.6426, -2.5185, -2.7801, -2.3947, -2.1354, -0.1151, -0.6581]], [[ 0.6279, -3.1520, -2.5061, -2.8740, -3.3963, -1.9224, -3.2605, -3.2001, -3.4823, -3.5379, -3.8092, -3.8900, -3.4391, -2.7754, -3.5729]]], [[[ 1.0618, -3.3346, -2.5404, -2.4671, -2.6987, -3.0268, -1.4396, -2.9155, -2.7915, -2.5576, -2.0242, -1.4665, -1.0625, -1.0494, -0.4549]], [[ 5.2834, -0.7922, -2.9220, -1.8841, 1.0350, 1.5439, -0.3279, -0.5071, -0.6873, -3.0998, -3.2753, -0.1824, -0.5976, 0.6527, 2.0557]], [[ 1.7749, -1.0352, -2.0155, -3.0521, -1.6134, -0.8650, -0.6608, -1.1239, -1.6077, -1.4109, -2.4800, -1.3603, -1.0690, -1.7551, -1.5303]], [[ 2.4913, -2.1864, -2.4881, -3.0072, -2.7711, -1.5590, -1.2997, 0.2462, 0.0397, -2.2003, -2.9788, -3.5608, -3.0772, -2.1862, -1.1998]], [[ 0.4463, -5.8745, -5.6891, -4.6427, -4.3399, -3.7351, -2.0777, -3.4740, -4.3104, -4.2507, -3.5056, -4.0610, -1.6495, -0.3890, -2.5831]], [[-1.3566, -4.7034, -4.5048, -3.8543, -3.9596, -3.6289, -3.7262, -3.7322, -2.8943, -3.3420, -2.7028, -1.5600, -1.9238, -1.4101, -3.0577]], [[ 3.4976, -4.7344, -3.5724, -4.8997, -2.6502, -2.8273, -3.3229, -4.0589, -3.0838, -4.2331, -5.1887, -3.8162, -3.3468, -1.1251, 0.2504]], [[ 0.0177, -6.8867, -5.7424, -6.2826, -8.1829, -4.3377, -4.7377, -5.5877, -5.1204, -4.4640, -4.7881, -4.8414, -2.3939, -1.5606, -4.3511]], [[-0.5870, -2.8687, -4.1108, -4.1102, -3.5247, -0.7579, -0.3853, -1.6018, -2.6298, -3.6287, -3.7375, -3.2307, -2.4753, -2.0752, -2.1279]], [[ 1.1234, -4.5482, -4.5019, -4.4076, -2.5808, -0.5177, -0.8393, -2.1457, -3.2737, -4.3720, -4.3682, -3.6228, -2.8567, -2.8107, -2.8376]], [[ 1.2708, -4.1159, -4.2927, -4.9444, -2.6544, -3.0480, -2.2883, -2.0301, -2.5815, -3.7519, -4.0525, -3.4159, -2.0115, -1.4961, -0.2032]], [[ 0.4912, -3.0622, -3.9283, -3.2408, -4.2188, -2.6179, -2.7093, -3.4555, -3.9251, -4.7453, -4.4943, -4.4262, -4.4881, -4.2703, -3.6115]]], [[[ 1.2520, -3.1163, -2.7219, -3.0676, -3.1319, -4.5592, -2.4585, -3.2799, -3.8697, -2.6818, -3.4950, -3.0706, -2.8646, -3.0898, -3.3466]], [[ 5.6637, -3.3576, -3.8727, -3.0602, -1.5286, -1.1287, -2.7365, -3.0435, -3.5066, -4.5012, -3.4281, -4.6015, -1.5165, 1.1828, 1.1990]], [[ 2.1916, -1.4612, -2.1000, -2.8357, -2.2929, -2.0283, -1.8493, -2.7772, -2.6378, -2.7511, -2.9474, -3.4481, -2.6247, -2.3506, -3.0507]], [[ 2.2609, -2.2054, -2.9590, -3.9367, -3.1725, -3.2251, -1.3627, -1.1054, -2.2551, -3.3635, -4.2705, -5.2969, -4.1775, -3.4119, -3.9685]], [[ 0.5969, -6.6426, -5.7008, -6.5408, -6.5264, -4.5611, -4.0662, -5.5601, -5.0046, -4.1969, -3.2162, -2.3635, -1.8757, -2.0248, -3.2820]], [[-1.5595, -3.9324, -2.5567, -4.0522, -4.9732, -3.8481, -3.6230, -3.6423, -2.3640, -1.8735, -2.8577, -2.2115, -2.3442, -2.4701, -5.0287]], [[ 3.5093, -4.1448, -4.1460, -6.2740, -4.7900, -4.1564, -4.2103, -4.1344, -4.2587, -4.2773, -6.3594, -7.5084, -3.4633, -3.2259, -2.6178]], [[-0.7978, -6.1969, -4.8414, -6.5100, -6.1886, -5.7133, -5.7023, -5.6600, -4.3309, -2.8801, -1.9479, -2.1282, -0.1637, -1.1405, -3.0703]], [[ 0.2965, -1.9584, -1.7191, -1.8247, -1.3206, -1.4673, -0.8619, 0.1573, -1.2611, -1.3832, -3.5863, -2.8388, -2.6572, -2.3372, -2.4170]], [[ 0.8326, -3.9868, -3.3363, -3.5417, -2.2330, -1.6064, -1.0401, -1.7750, -3.0090, -2.3573, -2.4690, -4.2977, -3.5295, -4.2665, -4.4712]], [[ 0.9615, -3.9152, -4.1622, -4.5520, -3.3321, -2.2772, -2.6221, -2.8853, -2.6148, -3.2578, -4.5302, -3.2494, -2.7683, -3.1694, -2.3359]], [[ 0.9864, -3.8355, -5.1086, -4.8398, -4.7133, -2.3051, -2.1763, -2.9656, -3.7718, -5.3647, -5.2061, -6.0814, -4.5653, -4.6933, -4.9311]]], [[[ 1.0351, -2.9622, -2.2634, -2.7836, -2.3001, -3.7505, -2.2289, -2.9190, -2.2408, -4.3764, -2.6115, -1.7351, -1.2539, -1.5911, -2.3033]], [[ 3.8818, -3.3358, -4.2114, -5.6000, -2.3202, -1.9563, -0.8691, -2.2563, -1.8426, -2.4317, -2.1006, -1.7794, -1.7814, -1.5136, -0.8339]], [[ 2.0841, -0.8992, -1.2928, -2.6507, -0.7782, -1.2531, -0.8725, -0.2905, -0.0547, -1.0347, -1.1705, 0.5421, -0.2587, -1.3610, -1.2442]], [[ 2.0171, -3.3614, -3.3328, -3.9851, -2.9371, -0.2905, -0.4814, -1.0246, -2.4842, -1.0487, -1.2820, 0.1615, -0.9473, -1.8993, -1.8327]], [[ 0.2152, -5.4095, -5.2561, -4.7022, -5.7994, -4.2989, -3.0794, -4.8085, -5.9193, -3.6112, -3.3900, -4.9192, -2.9474, -2.7905, -2.6215]], [[-0.9073, -4.1725, -4.2755, -3.9851, -4.9719, -3.3306, -3.8516, -4.2565, -5.4889, -4.8302, -4.5834, -3.3739, -1.8500, -1.7532, -3.3471]], [[ 2.1912, -3.7741, -3.9514, -5.8944, -2.7048, -1.7306, -1.5011, -1.9387, -1.8462, -2.7333, -2.3984, -1.6263, -1.2468, -2.2609, -1.8015]], [[-0.8369, -7.6549, -6.2071, -5.9956, -6.0896, -3.4359, -3.2657, -5.2129, -5.5014, -4.8577, -3.9980, -4.0515, -1.4459, -1.9397, -3.1536]], [[-0.6357, -2.4017, -3.1565, -3.7507, -3.0905, -1.3943, -1.5505, -0.7375, -2.4346, -0.9056, -1.1185, -1.6586, -1.4544, -1.6759, -2.2677]], [[ 0.5687, -4.1871, -3.5655, -3.8407, -2.2774, -1.7245, -1.0799, -1.7478, -1.0338, -1.2867, -1.6150, -2.0748, -1.5390, -1.9873, -2.0718]], [[ 1.0245, -4.0313, -4.0094, -4.5950, -2.5074, -1.9589, -1.8723, -2.0608, -1.6803, -1.4187, -2.0562, -1.7046, -2.1237, -1.9584, -1.3026]], [[ 0.9423, -4.0285, -4.8748, -5.4060, -4.4447, -3.2921, -3.5769, -3.7286, -4.3572, -2.9938, -4.5218, -3.6653, -3.2098, -3.0811, -4.1723]]], [[[ 1.3367, -2.8168, -3.1615, -4.8084, -3.4072, -4.5885, -4.0969, -4.7536, -6.5772, -5.5464, -3.7048, -4.5173, -2.8972, -3.4351, -1.6129]], [[ 3.3258, -2.1352, -1.4913, -1.8558, -1.0310, -1.0609, -3.2723, -4.1767, -2.4288, -2.8845, -3.2326, -4.0700, -3.5082, -2.8469, -2.1449]], [[ 1.5300, -0.4067, -0.7360, -1.5677, -1.3520, -1.1267, -1.0105, -1.6112, -1.5184, -2.4953, -1.5640, -2.2322, -0.4838, -0.9903, -0.8279]], [[ 1.5327, -0.0211, -1.0477, -1.3606, -1.2469, -2.7877, -0.6245, -1.4418, -0.6772, -1.6591, -2.8029, -1.4681, -0.7344, -0.8080, -0.6286]], [[ 0.2691, -3.9788, -5.7880, -4.8589, -5.7600, -4.2433, -4.2922, -3.8796, -6.1866, -5.4391, -4.0487, -5.2397, -1.4163, -0.9909, -2.9566]], [[ 0.0748, -3.2988, -4.3857, -4.5941, -4.9073, -3.1835, -3.4306, -4.2149, -5.9886, -6.6451, -5.7429, -6.1396, -3.1054, -0.7407, -3.4054]], [[ 2.0406, -0.3320, -1.1617, -1.6380, -3.7933, -2.8626, -3.1911, -4.5007, -4.2526, -5.4372, -4.5001, -5.2119, -2.3068, -1.3466, -2.0193]], [[-0.4519, -4.5149, -5.0633, -5.8741, -4.6568, -4.8788, -4.5651, -4.6145, -4.9734, -5.6038, -5.9872, -4.5554, -2.7310, -1.8296, -4.4656]], [[ 0.6795, -0.6819, -1.5658, -2.7695, -2.8621, -0.5779, -1.7767, -2.4050, -3.2300, -2.9929, -0.7949, -2.0027, -0.5549, -2.1972, -2.0348]], [[ 0.9595, -1.7956, -1.4854, -2.4716, -2.2355, -1.6401, -1.8207, -1.9969, -2.3956, -3.4594, -2.2949, -3.1551, -0.5196, -1.8183, -1.3729]], [[ 0.9248, -1.2232, -1.9658, -2.6042, -2.1869, -2.4928, -2.3456, -2.6357, -2.9228, -3.1971, -3.1236, -3.3027, -2.2066, -2.4500, -1.9716]], [[ 0.6918, -3.3948, -3.3321, -4.4624, -3.8525, -1.8640, -2.2170, -4.5460, -5.6695, -5.3124, -1.5127, -3.7490, -3.1224, -3.0826, -2.8996]]]]) attn_weights tensor([[[[ 2.6128, -3.9081, -2.4404, -2.8209, -3.4186, 0.7665, 0.9002, -3.3877, -3.6424, -3.4015, -0.7741, -2.1986, -1.8973, 0.4626, -1.7141]], [[ 3.4034, -0.4962, -1.4880, -2.4372, -0.5675, -0.8985, -0.8864, -1.5087, -2.5686, -2.9505, -1.4232, -0.2086, 0.6192, -1.2236, -0.1513]], [[ 2.1065, -3.3799, -4.1053, -4.3226, -3.8204, 0.4521, -0.1561, -3.0454, -5.4210, -4.7944, -2.7731, -2.8961, -1.5463, -0.0859, -2.2277]], [[-0.9232, -2.9332, -2.7614, -3.9369, -4.4278, -3.0553, -2.0690, -2.0376, -2.0413, -2.9010, -2.5253, -2.4384, -2.1393, -1.4861, -1.6973]], [[ 3.3334, -2.1812, -3.0203, -2.6304, -2.0148, -0.9060, -1.8190, -2.0748, -3.5924, -2.8910, -2.8614, -1.7026, -1.3209, -0.9168, -2.4351]], [[ 1.4929, -3.4435, -2.9215, -3.0371, -2.2036, -0.2215, -0.6050, -1.9973, -1.6397, -1.8281, -0.3782, -1.4354, -1.7056, 0.0480, -0.5984]], [[ 3.5414, -2.7128, -2.5010, -3.6143, -3.1495, 1.1602, 0.4513, -2.6047, -3.3518, -3.4679, -0.9407, -3.3601, -2.0442, -0.4941, -2.3711]], [[ 0.1265, -3.4053, -3.6250, -4.4488, -3.5868, -2.7952, -3.6762, -3.3775, -3.3928, -4.1013, -2.2639, -2.5700, -2.6078, -2.2522, -3.2911]], [[ 1.3928, -2.7995, -3.7237, -2.5488, -3.0107, 0.0372, -0.9392, -3.2836, -4.1237, -2.2296, -2.6666, -2.3321, -2.9876, -0.5038, -3.0361]], [[ 3.7887, -1.7570, -1.3719, -1.7241, -0.9663, 1.4239, -0.0111, -1.7902, -2.1996, -2.1723, 0.2442, -0.8558, -0.2561, 0.4465, -0.0375]], [[ 0.7830, -5.1691, -4.9174, -4.5336, -4.0841, -3.1757, -3.4879, -3.7113, -4.1659, -3.8593, -2.5610, -2.5442, -1.1648, -2.0787, -2.6325]], [[ 3.4189, -1.4304, -2.8508, -2.3388, -1.0676, -0.8355, -1.6479, -1.9178, -2.8416, -1.9737, -1.5433, -0.1465, -0.5335, -1.2780, -1.0834]]], [[[ 1.5748, -3.4175, -3.4802, -3.4167, -3.8599, 0.7665, 0.3937, -1.4454, -3.6592, -3.2848, -3.2718, -4.8304, -2.5744, -2.5889, -4.0807]], [[ 4.5835, -1.2589, -4.6483, -4.1431, -2.1452, -1.6734, -1.6959, -2.6621, -3.3413, -5.4168, -4.7818, -3.3091, -1.1625, -0.7038, 0.9282]], [[ 0.7391, -3.3774, -3.9270, -4.2342, -3.1322, -0.0142, -0.2826, -1.3115, -3.1050, -3.9751, -4.6144, -4.2208, -2.9882, -3.2092, -3.4513]], [[-1.0983, -4.1472, -3.4381, -3.6994, -4.2836, -3.0148, -2.5498, -2.8530, -2.3577, -1.8308, -2.2212, -1.8717, -0.1737, -0.6870, -2.4366]], [[ 3.5895, -4.0091, -4.2133, -5.3633, -3.9772, -1.7494, -0.6595, -2.9802, -3.4365, -4.0788, -4.7818, -4.2269, -3.4200, -3.4255, -3.1703]], [[ 1.9889, -4.8683, -4.8496, -5.1079, -3.8474, -1.6120, -1.5697, -3.2047, -3.4470, -3.7183, -4.1040, -3.1637, -1.3813, -1.6365, -1.2509]], [[ 4.0608, -3.3000, -4.6794, -4.5094, -1.6727, 0.4553, 0.0296, -2.1722, -3.8755, -4.4129, -4.9476, -3.7396, -2.1436, -2.5012, -0.4531]], [[ 0.5292, -3.9086, -4.0333, -3.9723, -3.5830, -2.9215, -2.8838, -3.6739, -3.2076, -4.2566, -4.0458, -3.5057, -3.6269, -4.0107, -4.2902]], [[ 1.4876, -3.2646, -3.8221, -3.2863, -3.3804, -0.5598, -1.2223, -3.2503, -3.1780, -3.8257, -3.1723, -4.2354, -2.6869, -3.3177, -2.7110]], [[ 3.9888, -2.9957, -5.9690, -5.5439, -2.4743, -1.3015, -1.2592, -2.5931, -4.1273, -5.8842, -5.9742, -3.1666, -2.5165, -2.7244, -0.4402]], [[ 0.8370, -5.0140, -5.5061, -4.6886, -4.4319, -1.9627, -2.1319, -3.2585, -4.0912, -3.8075, -3.0583, -0.5998, -1.2698, 0.0730, -3.4339]], [[ 3.9362, -1.0390, -3.1041, -1.0920, -1.2294, -1.9296, -1.2528, -3.5030, -2.7705, -3.5584, -1.6359, -3.8162, -1.8889, -1.9533, -2.1738]]], [[[ 1.7723, -1.6782, -1.9750, -1.7360, -2.1239, -0.2602, -0.2170, -1.2132, -2.9246, -1.8476, -3.4867, -2.4745, -2.4727, -3.4101, -2.2959]], [[ 4.3750, -3.4957, -4.9270, -5.5447, -3.2440, -2.8016, -2.5061, -3.8993, -3.3496, -4.5914, -6.2218, -4.1451, -3.1143, -1.1246, -1.7696]], [[ 1.5175, -3.7170, -2.2544, -3.7530, -2.7937, -1.8328, -1.2466, -1.2126, -3.0961, -1.9186, -4.2880, -3.2552, -2.3327, -2.1178, -2.1825]], [[-1.0283, -4.4230, -3.1037, -4.8685, -5.8796, -5.1035, -4.7853, -3.5995, -1.4889, -1.9262, -2.7252, -1.6776, -1.4992, -1.9651, -3.6361]], [[ 3.0347, -2.0285, -2.9062, -2.9701, -2.5747, -2.6586, -2.2938, -1.9713, -2.2193, -3.5660, -4.2627, -3.6293, -3.2715, -2.0475, -2.5392]], [[ 1.8671, -3.3492, -3.0254, -3.7709, -3.8146, -2.1979, -2.8491, -4.0682, -3.7469, -2.6860, -4.2485, -3.0083, -1.4796, -2.6566, -2.4688]], [[ 3.7641, -3.3250, -2.7480, -3.9188, -3.8197, -1.0222, -1.7809, -4.3346, -4.0542, -3.6019, -5.4087, -4.5635, -2.8725, -1.2970, -2.6908]], [[ 0.1529, -4.1099, -4.5618, -4.7000, -4.3095, -1.5194, -1.9593, -2.5736, -3.7515, -4.2506, -5.7467, -4.8909, -3.5186, -3.9766, -3.9417]], [[ 1.6125, -3.0263, -2.8872, -2.0873, -2.6274, -0.7419, -1.4091, -2.5810, -2.3927, -2.9265, -4.2422, -2.8705, -2.4944, -3.3025, -3.3043]], [[ 4.3351, -2.9423, -2.6050, -3.9026, -3.2478, -1.0598, -1.4520, -4.4701, -3.4748, -4.2299, -5.1160, -4.6483, -2.9038, -2.2373, -2.4807]], [[ 1.1711, -5.1967, -3.8226, -5.3591, -4.7776, -4.4931, -3.6781, -3.7456, -3.0281, -1.6920, -2.6359, -1.6376, -0.2406, 0.0752, -1.8491]], [[ 3.0362, -2.8540, -3.6371, -2.4322, -1.3866, -2.1710, -2.4346, -3.3494, -4.3654, -4.1749, -5.2433, -3.0806, -3.1003, -3.7647, -4.4827]]], [[[ 1.4458, -3.7781, -3.7386, -3.9430, -3.0860, 0.0413, -0.7242, -2.6622, -2.3836, -1.7973, -1.5779, -3.1442, -0.2407, -1.5489, -2.4850]], [[ 3.9962, -2.2281, -4.5023, -4.5981, -1.9299, -3.2931, -3.1144, -3.7381, -2.4586, -2.6866, -4.3599, -2.7430, -3.0394, -2.4010, -0.9101]], [[ 1.0068, -3.3771, -3.0781, -3.8698, -2.3107, -1.5158, -2.2185, -2.0140, -1.7820, -1.5570, -2.3474, -2.2064, -2.0446, -2.7878, -2.1797]], [[-0.9370, -4.3417, -4.2399, -4.0207, -5.6747, -3.2852, -3.3948, -4.1423, -5.5540, -4.9682, -4.2107, -2.1515, -2.0003, -1.4413, -2.6128]], [[ 3.0286, -2.8903, -1.8926, -2.6536, -1.7462, -1.4116, -0.9558, -1.0347, -2.8608, -1.9370, -2.1774, -1.4461, -2.9894, -3.7223, -2.0319]], [[ 1.9170, -2.7483, -3.2611, -3.3703, -3.1384, -3.3498, -2.0512, -2.7983, -2.8067, -3.9281, -2.8350, -3.1135, -2.4712, -1.9213, -1.6215]], [[ 3.4164, -3.8016, -3.5018, -4.4324, -3.1705, -0.9447, -1.6985, -3.1222, -2.3119, 0.1445, -3.0121, -1.3345, -2.1169, -2.4073, -1.8270]], [[ 0.3663, -3.2856, -3.4958, -3.5234, -2.6818, -2.0904, -1.8370, -1.6000, -2.0872, -1.3571, -2.1622, -2.3795, -2.3286, -1.9775, -4.1687]], [[ 1.7242, -2.1581, -3.0522, -3.4120, -3.0555, -1.0293, -1.0985, -2.0070, -2.7407, -1.2185, -0.8091, -1.4594, -1.6090, -2.6938, -2.8688]], [[ 4.1665, -3.3785, -3.2588, -5.0437, -2.5717, -0.8924, -0.9661, -3.4447, -1.4686, 0.7909, -1.7550, -2.0615, -2.2017, -3.3391, -0.9429]], [[ 0.6794, -5.7198, -5.5037, -5.3583, -4.9521, -2.6972, -2.3305, -4.7376, -4.8781, -3.2801, -3.5236, -3.4572, -1.9261, -1.9671, -1.2380]], [[ 3.4261, -0.3769, -2.3200, -2.1270, -0.4530, -2.1604, -2.5290, -2.3733, -0.9264, -2.2402, -3.3054, 0.6298, -1.6137, -2.9788, -2.5879]]], [[[ 1.8004, -1.7479, -3.0097, -3.3672, -3.8214, 0.1231, 0.5975, -2.8367, -4.2459, -4.0730, 0.8136, -0.4625, -1.3487, -2.7973, -1.2393]], [[ 2.6812, -0.7384, -1.5535, -2.8611, -2.1520, -2.5718, -2.2140, -2.5035, -1.4261, -2.7299, -3.1726, -3.1470, -0.9702, -2.3911, -1.0558]], [[ 1.6139, -3.2968, -2.1249, -2.8056, -2.8171, -1.3906, -0.7717, -2.0747, -3.2491, -3.3971, -0.7864, -1.7638, -0.6312, -2.2421, -1.4069]], [[-0.1523, -2.8046, -4.6840, -5.1525, -4.8379, -3.0708, -2.6576, -3.2936, -5.2300, -5.2879, -5.3164, -4.8178, -1.6404, -0.4308, -3.2110]], [[ 1.8138, -0.2974, -2.1640, -3.2065, -2.1993, -2.1519, -1.1615, -2.0999, -3.4291, -3.0959, -3.0787, -2.4104, -0.8161, -0.6690, 0.0290]], [[ 1.7625, -1.0763, -1.7143, -2.9623, -3.8091, -0.8652, -1.5653, -2.8128, -4.0025, -4.3840, -2.6490, -2.2811, -1.3489, -3.7437, -2.0861]], [[ 2.6171, -2.7066, -2.2017, -3.4773, -2.9003, 0.4640, 0.3940, -2.9624, -2.9268, -2.9416, 0.4209, -0.5969, -2.3877, -2.9281, -1.3655]], [[ 0.0691, -2.7356, -3.1414, -3.6787, -2.6776, -3.5301, -3.5694, -3.6739, -3.1556, -3.1580, -3.7574, -4.0543, -3.1067, -3.0973, -3.3707]], [[ 1.3512, -2.9842, -3.5705, -2.6417, -3.1336, -0.1418, -0.4719, -3.1981, -3.7469, -4.2897, 0.6909, -0.5708, -2.3648, -2.2373, -1.3802]], [[ 2.8544, -2.5694, -1.7074, -3.3981, -2.0821, 0.4619, 0.1234, -3.0113, -1.9882, -1.5514, 0.3191, -1.4489, -2.1729, -2.6110, -1.7109]], [[ 1.0899, -2.5882, -2.1368, -2.6902, -2.2209, -3.3157, -2.6622, -2.4397, -2.7492, -3.4861, -4.0797, -3.3991, 0.2415, -0.7051, -2.6112]], [[ 3.5726, -0.6995, -2.6119, -2.6292, -2.3033, -2.2252, -2.5173, -3.4002, -3.5103, -3.4418, -3.6783, -4.0547, -2.6742, -3.0681, -1.4378]]]]) attn_weights tensor([[[[ 2.5890e+00, -2.1642e+00, -4.3508e+00, -2.9392e+00, -3.2346e+00, 6.5211e-01, -3.9150e-02, -2.4133e+00, -4.9084e+00, -3.4620e+00, -5.8630e-01, -2.5442e+00, -2.1033e+00, 3.9765e-01, -1.8625e+00]], [[ 3.7798e+00, -2.3988e+00, -3.2791e+00, -2.1459e+00, -2.3445e+00, 9.5971e-01, -9.7775e-02, -2.6480e+00, -4.0483e+00, -2.5590e+00, -6.1641e-01, -1.9090e+00, 5.7306e-01, -9.1588e-02, -4.3883e-01]], [[ 3.3586e+00, -8.4869e-01, -1.5777e+00, -2.3281e+00, -1.9570e+00, -4.3443e-02, -1.8901e-01, -1.7442e+00, -2.7775e+00, -2.9485e+00, -5.1012e-01, -1.6599e+00, -1.6470e+00, -7.1930e-01, -9.0639e-01]], [[ 2.6167e+00, -8.3124e-01, -3.0691e+00, -2.8157e+00, -1.4152e+00, 1.5354e+00, -5.4569e-01, -7.5319e-01, -3.9679e+00, -3.2420e+00, -1.3702e+00, -1.4097e+00, 4.1030e-02, 1.8439e-01, -1.6957e-01]], [[ 2.5286e+00, -1.2380e-01, -1.5378e+00, -1.5542e+00, -1.1579e+00, -1.0986e-01, 1.5595e+00, 4.5526e-01, -1.2865e+00, -9.8985e-01, 6.4475e-02, -2.9484e-01, 9.8639e-01, 6.9666e-01, 3.2124e-01]], [[ 1.4959e+00, -2.3817e+00, -2.9199e+00, -3.0453e+00, -3.4060e+00, -3.3028e+00, -3.7979e+00, -2.9784e+00, -2.6840e+00, -2.5200e+00, -2.3607e+00, -2.7787e+00, -2.8656e+00, -3.4199e+00, -3.7699e+00]], [[ 3.0852e+00, -1.8916e+00, -3.1814e+00, -2.8245e+00, -2.3785e+00, 2.9419e-01, -1.3780e-01, -2.3477e+00, -4.5024e+00, -3.5558e+00, -4.9998e-01, -2.1996e+00, -2.0553e+00, -1.1431e+00, -1.3871e+00]], [[ 1.9303e+00, -2.0995e+00, -2.3782e+00, -3.4649e+00, -2.4685e+00, 2.8475e-01, -1.7901e+00, -1.3028e+00, -2.7637e+00, -3.3897e+00, -6.0936e-01, -1.2045e+00, -1.8330e+00, -1.3143e-01, -9.0854e-01]], [[ 3.1213e+00, -2.0491e+00, -2.8108e+00, -3.4814e+00, -1.7273e+00, -2.3385e+00, -2.5075e+00, -1.3692e+00, -2.8779e+00, -3.1303e+00, -2.0808e+00, -3.3660e-01, -1.1016e+00, -2.5019e+00, -1.1163e+00]], [[ 4.6917e-01, -2.4672e+00, -2.7075e+00, -2.7324e+00, -2.7107e+00, -2.1176e+00, -2.6961e+00, -1.4966e+00, -2.6116e+00, -2.6364e+00, -1.5279e+00, -1.6800e+00, -1.7952e+00, -1.1360e+00, -1.7622e+00]], [[ 3.4770e+00, -1.4994e+00, -1.6779e+00, -1.8262e+00, -1.4589e+00, 2.1161e-01, -9.3057e-01, -2.3518e+00, -2.7308e+00, -2.6252e+00, -1.3551e+00, -1.5905e+00, -1.7784e+00, -9.9028e-01, -1.7023e+00]], [[ 4.0249e+00, -1.4633e+00, -8.3551e-01, -3.2800e+00, -2.5937e+00, 2.5468e+00, 1.8984e+00, -7.1150e-01, -1.8840e+00, -3.3867e+00, -1.0305e+00, -1.9907e+00, -1.6077e+00, 5.9121e-01, 1.1014e+00]]], [[[ 2.2089e+00, -3.3815e+00, -4.0842e+00, -3.8600e+00, -3.0178e+00, 1.2010e+00, 1.0809e-01, -3.8516e+00, -3.8368e+00, -4.2929e+00, -4.1787e+00, -2.6900e+00, -2.5422e+00, -3.0287e+00, -3.0006e+00]], [[ 3.7097e+00, -2.0085e+00, -5.0463e+00, -2.9900e+00, -1.4988e+00, 9.5371e-01, -3.0310e-01, -1.7803e+00, -2.6757e+00, -4.7251e+00, -2.3061e+00, -2.0389e+00, -1.1160e+00, 4.0954e-01, 1.3229e-01]], [[ 3.6168e+00, -2.2130e+00, -2.5497e+00, -2.9777e+00, -1.3341e+00, 5.0136e-01, 6.0612e-01, -9.8193e-01, -1.1359e+00, -2.2288e+00, -2.4450e+00, -1.4354e+00, -1.2674e+00, -1.3410e+00, 7.0354e-02]], [[ 2.9077e+00, -1.7108e+00, -3.0093e+00, -2.8967e+00, -7.9401e-01, 8.9254e-01, 7.1650e-01, -1.3151e+00, -2.6349e+00, -2.8096e+00, -2.4829e+00, -1.3624e+00, -9.1940e-01, -1.6101e+00, -5.1300e-01]], [[ 1.6267e+00, -2.1611e+00, -7.2744e-01, -9.8418e-01, -5.4970e-01, 1.8761e+00, 2.0607e+00, -1.1280e+00, -8.7899e-01, -2.6040e-01, -4.1384e-01, -1.4858e+00, 5.5716e-01, 1.0813e+00, 3.9546e-01]], [[ 1.8106e+00, -4.0118e+00, -4.0355e+00, -4.7695e+00, -5.0289e+00, -2.8896e+00, -3.7436e+00, -4.5069e+00, -4.3773e+00, -3.7563e+00, -4.2186e+00, -3.0586e+00, -2.3119e+00, -2.4662e+00, -4.3722e+00]], [[ 2.8938e+00, -3.7173e+00, -3.4566e+00, -3.4054e+00, -2.3752e+00, 2.6872e-01, -8.5808e-02, -2.6224e+00, -3.5269e+00, -3.1577e+00, -3.1713e+00, -1.2145e+00, -1.4822e+00, -1.8861e+00, -8.2978e-01]], [[ 2.0077e+00, -3.0964e+00, -3.6856e+00, -3.3147e+00, -1.7663e+00, 3.6844e-01, -9.4445e-01, -1.4856e+00, -1.8626e+00, -3.0848e+00, -2.5152e+00, -3.1654e+00, -1.4770e+00, -9.4007e-01, 2.4156e-02]], [[ 3.6280e+00, -2.0407e+00, -4.0648e+00, -4.1155e+00, -9.6815e-01, -2.0166e+00, -9.4345e-01, -1.9526e+00, -1.9948e+00, -3.7315e+00, -3.6054e+00, -1.6340e+00, -8.1570e-01, -5.3727e-01, 4.7626e-01]], [[-5.5186e-02, -4.1021e+00, -3.8589e+00, -2.7709e+00, -2.9977e+00, -1.3114e+00, -2.3561e+00, -3.4199e+00, -3.9490e+00, -3.3836e+00, -2.3283e+00, -3.9144e+00, -1.1708e+00, 2.8459e-01, -7.0266e-01]], [[ 3.5456e+00, -1.8951e+00, -2.7278e+00, -2.5054e+00, -1.4742e+00, 6.3178e-01, 4.1793e-01, -1.1172e+00, -2.1521e+00, -2.7727e+00, -2.3066e+00, -1.0611e+00, -1.6766e+00, -1.4562e+00, -3.5613e-01]], [[ 3.7926e+00, -1.9555e+00, 6.7090e-01, 1.7024e-01, -1.1031e+00, 2.6736e+00, 2.8177e+00, 1.5129e+00, 1.6728e+00, 2.3666e+00, 1.8967e+00, -4.6363e-01, 2.8695e+00, 3.5156e+00, 2.9061e-01]]], [[[ 2.2463e+00, -2.9235e+00, -3.3084e+00, -3.8691e+00, -3.6781e+00, -5.1670e-01, -1.1545e+00, -3.2985e+00, -3.4042e+00, -3.6942e+00, -3.7077e+00, -4.2483e+00, -2.7234e+00, -3.0298e+00, -4.1951e+00]], [[ 4.3289e+00, -2.8604e+00, -4.3351e+00, -3.8370e+00, -3.5325e+00, -1.0048e+00, -1.7144e+00, -3.1121e+00, -3.0716e+00, -4.5716e+00, -3.4353e+00, -5.0809e+00, -1.6971e+00, -1.7328e-01, -9.4162e-01]], [[ 2.9066e+00, -2.1811e+00, -1.7402e+00, -3.3618e+00, -2.7174e+00, -7.6205e-01, -1.2637e-01, -1.8645e+00, -1.7707e+00, -1.8134e+00, -3.5646e+00, -3.7686e+00, -2.8600e+00, -1.9757e+00, -2.8572e+00]], [[ 2.6174e+00, -2.0657e+00, -1.8239e+00, -2.4283e+00, -1.9022e+00, -5.4682e-01, -1.2247e+00, -2.5248e+00, -2.4519e+00, -1.7872e+00, -2.3294e+00, -2.7366e+00, -1.4071e+00, -6.9601e-01, -1.2269e+00]], [[ 2.2733e+00, -2.0682e+00, -1.3879e+00, -2.5287e+00, -1.6034e+00, -1.3165e+00, -1.4708e+00, -1.5908e+00, -1.9043e+00, -1.3510e+00, -4.1800e+00, -2.0743e+00, -9.3836e-01, -1.6029e+00, -1.4376e+00]], [[ 1.7330e+00, -3.2778e+00, -3.2741e+00, -4.4891e+00, -4.7360e+00, -4.1889e+00, -4.9095e+00, -3.9246e+00, -3.5755e+00, -2.8170e+00, -2.7283e+00, -3.4487e+00, -3.6586e+00, -3.2126e+00, -3.8949e+00]], [[ 2.7914e+00, -1.9443e+00, -3.1054e+00, -2.9569e+00, -2.6067e+00, -1.2884e+00, -1.8486e+00, -2.1236e+00, -2.3150e+00, -3.4543e+00, -3.1652e+00, -4.2913e+00, -1.9066e+00, -2.1360e+00, -1.5632e+00]], [[ 1.5169e+00, -3.2011e+00, -2.4022e+00, -3.7345e+00, -2.5193e+00, -2.1708e+00, -3.3396e+00, -2.6723e+00, -2.9106e+00, -2.9122e+00, -3.4203e+00, -3.0920e+00, -3.0843e+00, -2.9700e+00, -1.9578e+00]], [[ 3.3159e+00, -2.1997e+00, -3.2923e+00, -4.3107e+00, -2.6609e+00, -2.7438e+00, -3.5803e+00, -2.3143e+00, -2.5190e+00, -3.4760e+00, -3.4430e+00, -2.2215e+00, -2.0997e+00, -8.4860e-01, -1.2969e+00]], [[-2.0623e-01, -3.5650e+00, -3.0872e+00, -3.7446e+00, -3.7393e+00, -2.5007e+00, -1.6780e+00, -2.1369e+00, -1.8713e+00, -2.1850e+00, -3.2753e+00, -2.5805e+00, -3.6072e-01, -1.0154e+00, -2.6867e+00]], [[ 3.3722e+00, -2.3225e+00, -2.4846e+00, -2.7214e+00, -2.7146e+00, -1.0122e+00, -1.3283e+00, -2.5825e+00, -2.9655e+00, -3.4196e+00, -3.6452e+00, -3.7709e+00, -2.2609e+00, -2.4820e+00, -2.9228e+00]], [[ 4.5911e+00, -2.5173e+00, -8.7316e-01, -1.0118e+00, -2.9779e+00, -3.0864e+00, -1.2411e+00, -1.1174e+00, -4.4946e-01, -6.0937e-01, -1.1988e+00, -2.2858e+00, 1.7827e+00, 2.4469e+00, 9.9133e-01]]], [[[ 2.2647e+00, -3.2683e+00, -3.1978e+00, -3.3758e+00, -3.2835e+00, 1.5051e+00, 7.1735e-02, -3.1426e+00, -3.3414e+00, 8.9359e-01, -1.4328e+00, -1.5137e+00, -2.3798e+00, -2.9864e+00, -1.7380e+00]], [[ 3.9574e+00, -1.5253e+00, -3.5588e+00, -2.5463e+00, -2.2219e+00, -4.9818e-01, -1.8316e+00, -1.5886e+00, -1.4354e+00, 4.7362e-01, -2.6322e+00, -1.0401e+00, -1.5691e+00, -5.3642e-01, -9.9039e-02]], [[ 3.1268e+00, -1.2867e+00, -2.1118e+00, -3.2477e+00, -2.0589e+00, 1.3672e-02, -4.5867e-01, -1.6210e+00, -1.4311e+00, 1.0717e-01, -6.1046e-01, 7.8845e-01, -1.0102e+00, -1.9082e+00, -1.1258e+00]], [[ 2.8036e+00, -1.2843e+00, -2.7586e+00, -2.6982e+00, -2.0352e+00, 9.3456e-02, -7.5589e-01, -1.0830e+00, -1.8753e+00, -1.0031e+00, -2.2097e+00, 2.1086e+00, -1.3285e+00, -1.7227e+00, -1.2773e+00]], [[ 2.6158e+00, -8.0783e-01, -1.6231e+00, -1.9228e+00, -1.9158e+00, -1.5654e+00, -1.2457e+00, -1.5770e+00, -2.5700e+00, -1.9156e+00, -1.7907e+00, -9.0007e-01, -9.0198e-01, -1.2166e+00, 5.9437e-01]], [[ 1.5954e+00, -3.1806e+00, -3.6528e+00, -3.5942e+00, -3.9294e+00, -3.4575e+00, -3.6167e+00, -3.7453e+00, -3.3649e+00, -3.8023e+00, -4.6566e+00, -2.7321e+00, -1.8042e+00, -2.1334e+00, -1.5517e+00]], [[ 3.1708e+00, -3.7048e+00, -3.8324e+00, -4.3045e+00, -3.5580e+00, -2.3371e-04, -7.8536e-02, -3.0603e+00, -3.3814e+00, 6.9119e-01, -1.0813e+00, -2.3527e+00, -2.8433e+00, -3.2356e+00, -2.0870e+00]], [[ 1.7943e+00, -1.8572e+00, -2.2667e+00, -2.9010e+00, -2.0526e+00, -5.4325e-01, -1.8397e+00, -6.0576e-01, -1.5203e+00, -1.5145e+00, -1.9405e+00, -5.0613e-01, -1.6423e+00, -1.5697e+00, -1.4108e+00]], [[ 3.4785e+00, -1.9828e+00, -3.3578e+00, -4.0703e+00, -1.6289e+00, -3.0245e+00, -2.7374e+00, -2.1060e+00, -8.6344e-01, -2.8907e+00, -4.9498e+00, -5.2258e-01, -3.1607e+00, -2.5233e+00, -5.6927e-01]], [[-1.1300e-02, -4.1911e+00, -4.1563e+00, -2.2599e+00, -3.2250e+00, -2.3699e+00, -1.9424e+00, -1.7133e+00, -3.6127e+00, -3.9309e+00, -3.0890e+00, -2.1070e+00, -1.8134e+00, -4.5055e-01, -1.1578e+00]], [[ 3.2418e+00, -3.5010e+00, -2.8330e+00, -3.3931e+00, -2.8320e+00, -3.1557e-01, -1.3222e+00, -2.4515e+00, -2.7114e+00, 1.0915e-01, -2.3478e+00, -2.2989e+00, -2.1609e+00, -2.5035e+00, -2.0797e+00]], [[ 3.2060e+00, -1.2864e+00, -4.0737e-01, -1.8279e+00, -1.9423e+00, 1.7075e+00, 5.9511e-01, 1.7256e+00, -3.3298e-01, 6.8647e-02, -8.4266e-02, 1.3202e+00, 3.2713e+00, 2.1189e+00, 1.5870e+00]]], [[[ 2.5039e+00, -3.2142e+00, -3.7723e+00, -3.8731e+00, -4.3044e+00, 1.6521e+00, 8.3225e-01, -3.5350e+00, -3.4236e+00, -3.5091e+00, 8.7444e-01, -4.3699e-01, -2.6278e+00, -3.0628e+00, -1.2255e+00]], [[ 2.8697e+00, -1.3758e+00, -2.0553e+00, -1.7633e+00, -2.2315e+00, 4.5588e-02, -1.3214e+00, -2.5304e+00, -1.4470e+00, -1.4827e+00, 1.6851e-01, -1.3724e+00, -1.1547e+00, -2.1489e+00, -9.4897e-01]], [[ 2.7091e+00, -5.6367e-01, -8.2934e-01, -2.7350e+00, -2.1337e+00, -4.3794e-01, -1.9261e+00, -2.8574e+00, -2.9050e+00, -2.6201e+00, -1.0055e+00, -2.1971e+00, -4.2237e-01, 5.8885e-01, 7.9871e-01]], [[ 2.7234e+00, -7.0937e-02, -2.4884e+00, -2.5831e+00, -2.9872e+00, 8.2718e-01, -9.5080e-01, -1.8232e+00, -2.9718e+00, -2.9825e+00, -1.5206e+00, -1.7436e+00, 1.2734e-01, 2.6331e-01, 6.0962e-01]], [[ 2.6331e+00, 4.8386e-01, -1.7434e+00, -1.5431e+00, -1.6750e+00, -1.7040e+00, -6.9420e-01, -6.1144e-01, -1.7800e+00, -2.7340e+00, -9.9417e-02, -1.0545e+00, 1.1718e+00, -1.3008e-01, 1.4742e+00]], [[ 9.6581e-01, -1.5320e+00, -2.2441e+00, -2.5887e+00, -3.1909e+00, -2.4612e+00, -2.8107e+00, -1.7426e+00, -4.5920e+00, -4.7685e+00, -4.3859e+00, -4.4816e+00, -5.4672e-01, -6.1448e-01, -1.8574e+00]], [[ 2.4379e+00, -3.0603e+00, -3.2489e+00, -3.2335e+00, -3.8051e+00, 1.8096e-01, -3.5965e-01, -3.7178e+00, -3.4230e+00, -3.1004e+00, 2.7356e-01, -6.4958e-01, -2.4221e+00, -2.4689e+00, -1.6135e+00]], [[ 2.2193e+00, -4.0838e-01, -8.9264e-01, -2.1804e+00, -1.5565e+00, -5.3859e-01, -1.5864e+00, -1.0252e+00, -1.7047e+00, -1.7237e+00, -7.7605e-01, -1.9596e+00, -3.8705e-01, -6.3504e-01, 2.1003e-01]], [[ 2.7318e+00, -1.4219e+00, -2.0000e+00, -2.6463e+00, -1.8921e+00, -1.8920e+00, -3.1808e+00, -3.0134e+00, -1.3708e+00, -4.9773e-01, -1.5233e+00, -3.0406e+00, -1.1307e+00, -1.0830e+00, 2.1975e-01]], [[ 9.9694e-01, -2.5932e+00, -2.1068e+00, -2.6259e+00, -2.7173e+00, -2.3383e+00, -1.1976e+00, -9.4574e-01, -2.6622e+00, -3.5673e+00, -3.2674e+00, -3.2283e+00, -1.5914e-02, 1.4868e-01, -1.1717e+00]], [[ 2.5595e+00, -2.9536e+00, -1.7129e+00, -2.6679e+00, -2.4605e+00, 5.4469e-01, -1.5538e+00, -4.0975e+00, -2.8097e+00, -2.2348e+00, -1.2202e+00, -2.0535e+00, -3.0591e+00, -1.7511e+00, -1.6583e+00]], [[ 2.8906e+00, -7.2656e-01, -1.3528e+00, -2.8144e+00, -2.4251e+00, 8.4235e-01, -5.4732e-01, -1.8460e+00, -3.0752e+00, -2.9158e+00, 3.5009e-01, -1.1568e+00, 5.0361e-01, -3.2407e-01, 6.1148e-01]]]]) attn_weights tensor([[[[ 1.6345e+00, 1.0634e+00, 4.9691e-01, 2.2618e-01, 1.0123e+00, 1.3864e+00, 6.6602e-01, 8.5681e-01, 5.4628e-01, -9.1016e-02, 8.9736e-01, 1.1685e+00, 1.0884e+00, 1.3370e+00, 1.5526e+00]], [[ 3.9180e+00, 4.3532e-01, -9.7421e-01, -4.2400e-01, 8.4041e-01, 2.3710e-01, -8.8647e-03, 6.7317e-01, -1.3849e+00, -8.4422e-01, 2.8744e-01, 6.1518e-01, 1.1880e-01, -6.5106e-01, 5.3654e-01]], [[ 3.1352e+00, 7.0462e-02, -1.5137e+00, -1.8458e+00, -1.3095e+00, 5.8397e-01, -1.9373e-01, -1.4691e-01, -2.5794e+00, -2.0463e+00, -3.3708e-01, -6.5663e-01, -3.0870e-01, -5.9737e-01, 5.5821e-01]], [[ 1.5030e+00, 4.2244e-01, -1.7969e+00, -1.6495e+00, -9.1481e-01, -2.7844e-01, 1.0264e-01, -4.2547e-03, -2.5537e+00, -2.4877e+00, -1.3563e+00, -8.2433e-01, -7.8017e-01, 1.5121e-01, -1.8060e-01]], [[ 2.6694e+00, -1.2275e-01, -5.8664e-01, -8.7006e-01, 1.8722e-01, -2.9510e-01, -1.3892e+00, -1.8248e-01, -6.8623e-01, -8.9684e-01, -2.5980e-01, 3.2968e-01, 4.3033e-01, -6.4776e-01, 4.9305e-01]], [[ 4.2002e+00, 7.2142e-02, -9.4714e-01, -7.6559e-01, -4.6518e-01, 2.2072e+00, 3.1677e+00, 3.0720e-01, -1.6012e+00, -9.5907e-01, 1.1546e+00, 2.0105e-01, 9.1369e-01, 4.0254e-01, 5.1813e-01]], [[ 3.6266e+00, -6.9687e-01, -1.8390e+00, -1.3279e+00, -8.1082e-01, 1.0860e-01, -1.0891e+00, -9.0043e-01, -2.6661e+00, -2.3860e+00, -1.4350e+00, -1.1415e+00, -8.7844e-01, -9.0164e-01, -2.7534e-01]], [[ 3.7546e+00, 1.4783e+00, -7.8377e-01, 1.5387e-01, 1.0843e+00, 2.2654e+00, 5.0657e-01, 1.5688e+00, -1.1806e+00, -9.6099e-02, 1.0138e+00, 1.3154e+00, 1.6065e+00, 9.2744e-01, 2.3682e+00]], [[-4.4364e+00, 3.4915e+00, 2.8681e+00, 3.0770e+00, 2.8402e+00, 3.5002e+00, 3.1725e+00, 3.1794e+00, 3.7808e+00, 3.9264e+00, 4.1601e+00, 3.7075e+00, 2.8462e+00, 2.6697e+00, 3.8892e+00]], [[ 4.0144e+00, -1.1213e+00, -2.7510e+00, -2.8695e+00, -1.7842e+00, 7.9182e-01, 8.1886e-01, -6.9082e-01, -3.0108e+00, -2.5307e+00, -4.9609e-03, -1.1561e+00, 2.6768e-01, -7.8004e-01, 4.3740e-01]], [[ 3.0183e+00, 6.9739e-01, -4.1281e-01, -8.7487e-01, -7.4214e-01, 1.9616e+00, 4.8797e-01, 9.6216e-01, -1.1485e+00, -9.9464e-01, 8.1413e-01, 1.1736e-01, -2.2941e-01, 1.7185e+00, 2.3045e+00]], [[ 3.2723e+00, 1.0487e+00, -1.5059e+00, -1.1224e+00, -5.5298e-01, 1.5234e+00, 3.6321e-01, 8.0366e-01, -2.2401e+00, -1.7602e+00, 2.2801e-01, -1.7903e-01, -2.6711e-01, 6.4868e-01, 5.5272e-01]]], [[[ 1.2892e+00, 2.5050e-01, -3.2797e-01, -5.0607e-01, 9.8602e-01, 6.5423e-01, 9.0756e-01, 8.5512e-01, 1.4905e+00, 2.2663e-01, 7.2828e-02, 9.4850e-01, 1.3222e+00, 2.8466e-01, 4.0140e-01]], [[ 3.4928e+00, -9.0045e-01, -1.0384e+00, -1.2896e+00, 1.0757e+00, 2.9291e-01, 6.9189e-01, 9.1107e-01, 2.7406e-01, -4.6159e-01, -2.8782e-01, -7.6278e-01, 6.4636e-01, 8.7481e-01, 1.5678e+00]], [[ 2.9744e+00, -1.9371e+00, -1.9769e+00, -2.4686e+00, -7.2408e-01, 6.1888e-01, 4.9915e-01, -1.0021e+00, -1.1731e+00, -1.6907e+00, -1.3168e+00, -1.7863e+00, -1.3544e+00, -1.1915e+00, -8.1862e-01]], [[ 8.2023e-01, -1.2666e+00, -1.2777e+00, -2.8411e-01, -1.0871e+00, 4.0185e-01, 5.7957e-01, -4.5924e-01, -7.2947e-01, -9.7562e-01, 5.5018e-01, -1.0229e+00, 9.3028e-01, 2.3201e+00, 1.6180e-01]], [[ 1.7265e+00, -1.3686e+00, -1.7412e+00, -1.7075e+00, -9.5719e-01, -4.1316e-01, -7.9295e-01, -4.0638e-01, 3.5220e-01, -1.3801e+00, -9.2944e-01, -6.3995e-01, 5.8420e-03, 6.4578e-01, 6.7833e-01]], [[ 4.2542e+00, -1.6185e+00, -2.8868e+00, -3.5980e+00, -8.3781e-01, 1.5210e+00, 2.1172e+00, -1.4415e+00, -2.3182e+00, -2.7370e+00, -3.6971e+00, -1.6551e+00, -7.2732e-01, 7.5037e-01, -6.1747e-01]], [[ 3.3372e+00, -1.6572e+00, -2.4817e+00, -2.5333e+00, -2.0419e-01, 4.9812e-01, 1.4430e-01, -4.3892e-01, -1.3117e+00, -2.7515e+00, -1.9428e+00, -3.5920e-01, -1.1601e+00, -3.3999e-01, 9.9855e-01]], [[ 3.4329e+00, -5.5512e-01, -1.0316e+00, -2.4502e+00, 2.0680e-01, 1.8015e+00, 1.1192e+00, 4.0779e-01, -7.7769e-02, -7.4674e-01, -1.4911e+00, -1.3011e-01, 1.1039e+00, 1.0852e+00, 1.5839e+00]], [[-1.5310e+00, 1.5301e+00, 2.9811e+00, 3.3200e+00, 2.0705e+00, 1.7026e+00, 1.1872e+00, 2.1008e+00, 2.7960e+00, 3.6877e+00, 4.8808e+00, 2.4055e+00, 5.4149e+00, 5.6452e+00, 3.8710e+00]], [[ 4.1862e+00, -9.2473e-01, -2.0447e+00, -2.6336e+00, -1.4347e-01, 7.9730e-01, -5.2273e-01, -1.0985e+00, -1.0558e+00, -2.1066e+00, -2.1780e+00, -1.2545e+00, 2.6916e-01, 2.5498e-01, 6.5288e-01]], [[ 2.0903e+00, -2.0773e+00, -1.2245e+00, 3.0285e-01, -2.0556e-01, 2.8612e+00, 7.8409e-01, 1.3877e-01, -9.7337e-02, -8.0279e-01, 1.4875e+00, 1.5443e+00, 1.9262e+00, 3.6286e+00, 2.9640e+00]], [[ 2.8240e+00, -2.2909e+00, -1.5883e+00, 1.7484e-01, 5.0247e-01, 2.4874e+00, 1.9051e+00, -3.5956e-01, -6.0108e-01, -4.2206e-01, 1.5463e+00, 1.6962e+00, 2.2639e+00, 5.3633e+00, 2.0283e+00]]], [[[ 1.1086e+00, 6.6699e-01, -1.3567e-01, 1.5138e-02, 6.2390e-01, 1.6980e-01, 7.8103e-01, 5.8293e-01, 1.4993e+00, 4.6838e-01, -6.7586e-01, -7.6489e-02, 2.5082e-01, 1.7769e-01, 1.1506e+00]], [[ 2.9599e+00, -6.0782e-01, -1.1307e+00, -1.8718e+00, -5.7361e-01, -7.4675e-01, -2.9404e-01, -3.0276e-01, -1.0674e+00, -8.7578e-01, -2.7473e+00, -1.9869e+00, -1.5442e+00, -1.1737e+00, -1.4584e+00]], [[ 2.5216e+00, -1.0045e+00, -2.1656e+00, -2.9962e+00, -2.5610e+00, -2.3877e-01, -5.2069e-01, -1.0144e+00, -1.1479e+00, -2.2850e+00, -2.9284e+00, -3.4047e+00, -2.9309e+00, -2.7392e+00, -3.4060e+00]], [[ 5.4859e-01, -7.4928e-01, -1.5091e+00, -1.7075e+00, -2.0471e+00, 5.3535e-01, -4.9563e-01, -1.2545e-01, 6.5775e-02, -1.1244e+00, -3.8053e+00, -6.9500e-01, -4.7483e-01, -1.8832e+00, -3.5305e+00]], [[ 1.9200e+00, -1.4906e+00, -1.9062e+00, -2.0458e+00, -1.7289e+00, -1.9867e+00, -2.4363e+00, -1.4539e+00, -1.4916e+00, -1.9090e+00, -2.3253e+00, -2.2044e+00, -2.6134e+00, -1.4546e+00, -2.7380e+00]], [[ 3.7989e+00, -9.6710e-01, -1.6515e+00, -2.6718e+00, -1.8344e+00, -5.4426e-01, 4.9542e-01, -1.5135e+00, -2.4784e+00, -2.1177e+00, -3.4920e+00, -2.5998e+00, -2.4947e+00, -6.1391e-01, -6.4257e-01]], [[ 2.9868e+00, -1.8428e+00, -2.0531e+00, -2.5696e+00, -2.3673e+00, -1.1872e+00, -1.5220e+00, -2.0694e+00, -2.0920e+00, -2.8718e+00, -2.8774e+00, -3.0914e+00, -2.6506e+00, -2.2361e+00, -3.2070e+00]], [[ 3.1110e+00, 6.0053e-01, -1.2694e+00, -1.1490e+00, -1.1444e+00, -2.9145e-01, -5.4543e-01, -1.6977e-01, -4.4616e-01, -1.5987e+00, -2.0820e+00, -2.3520e+00, -9.7446e-01, -3.0800e-01, -1.2793e+00]], [[-6.4290e+00, 1.9873e+00, 2.5759e+00, 1.9115e+00, 1.1566e+00, 1.6938e+00, 1.1486e+00, 9.9823e-01, 1.9309e+00, 2.3492e+00, -2.9492e+00, 2.2651e+00, 2.1877e+00, 1.9722e+00, 4.1199e-01]], [[ 3.9292e+00, -1.0278e+00, -1.6604e+00, -2.7369e+00, -1.6651e+00, -1.8939e+00, -1.9845e+00, -1.4909e+00, -1.2305e+00, -2.1281e+00, -1.1748e+00, -2.0846e+00, -1.3826e+00, 2.2252e-01, -5.7218e-01]], [[ 1.8032e+00, -1.4697e+00, -8.8679e-01, -1.1357e+00, -1.9293e+00, -1.0146e+00, -1.1180e+00, -1.1779e+00, -5.4700e-01, -1.2277e+00, -1.3263e+00, -1.4569e+00, -2.9232e-01, -4.8862e-01, -7.0288e-01]], [[ 1.9881e+00, 1.3598e-01, -8.5086e-02, -6.1309e-01, -1.0764e+00, 1.0514e+00, 4.2882e-01, 3.8859e-01, 8.7214e-01, -3.8735e-01, -1.8684e+00, 1.2632e-01, 1.5015e+00, 1.4243e+00, 6.1274e-01]]], [[[ 1.1162e+00, 1.0279e+00, 7.5313e-01, 8.0393e-01, 5.7837e-01, 6.5384e-01, 7.8859e-01, 9.0239e-01, 4.1357e-01, -2.2204e-01, 9.4917e-01, 7.4024e-01, 1.0692e+00, 1.0406e+00, 9.2261e-01]], [[ 3.1865e+00, -1.4019e+00, -1.5580e+00, -2.0493e+00, -1.0459e+00, -5.7260e-01, -5.0720e-01, 7.5287e-02, -9.8661e-01, -2.1391e-01, -1.8031e+00, -2.1337e-01, -8.6541e-01, -1.0039e+00, -8.7348e-01]], [[ 2.8956e+00, -1.1282e+00, -2.4904e+00, -2.7702e+00, -1.6693e+00, 2.7149e-01, -3.1571e-01, -9.8265e-01, -1.6413e+00, 5.3560e-01, -1.6264e+00, 3.2736e-01, -2.4417e+00, -1.6882e+00, -1.4813e+00]], [[ 8.6392e-01, -1.9061e+00, -2.2145e+00, -2.2666e+00, -2.1873e+00, 4.6905e-01, 1.3909e-01, -9.1290e-01, -2.8104e+00, -1.2499e+00, -7.3992e-01, -5.7481e-01, -6.0610e-01, -3.8248e-01, -3.4700e-01]], [[ 1.6729e+00, -1.6811e+00, -1.6613e+00, -1.9730e+00, -1.3765e+00, -1.3105e+00, -2.0570e+00, -1.1296e+00, -1.6029e+00, -1.1580e+00, -2.7249e+00, -1.6984e+00, -1.1215e+00, -9.7447e-01, -6.2772e-01]], [[ 4.2244e+00, -7.7383e-01, -1.1882e+00, -2.6344e+00, -7.9029e-01, 9.6388e-01, 1.8199e+00, 1.9209e-01, -2.7562e-02, 8.9929e-01, 5.0890e-01, -6.7682e-01, -3.7126e-01, -1.4026e+00, 6.2083e-01]], [[ 3.1397e+00, -2.2592e+00, -2.4242e+00, -2.6565e+00, -1.4620e+00, -4.1829e-01, -1.2889e+00, -1.8127e+00, -1.1484e+00, 2.0708e-01, -2.3007e+00, -1.7457e+00, -2.1449e+00, -2.4011e+00, -1.3453e+00]], [[ 3.4283e+00, 9.8416e-02, -5.5189e-01, -6.6396e-01, 2.0842e-01, 9.2976e-01, -2.4591e-01, 8.4936e-01, -4.8305e-01, 1.1265e+00, -1.6337e+00, 1.7231e-01, -7.5061e-01, -4.5002e-01, 2.0000e-01]], [[-3.2330e+00, 3.2830e+00, 4.4796e+00, 3.3181e+00, 2.3075e+00, 3.0688e+00, 2.7247e+00, 3.6430e+00, 2.2557e+00, 1.5756e+00, 1.6669e+00, 3.9215e+00, 4.5865e+00, 5.5205e+00, 4.9333e+00]], [[ 4.3124e+00, -2.0574e+00, -2.7162e+00, -3.1496e+00, -2.5404e+00, -5.3836e-01, -7.2919e-01, -1.5873e+00, -1.7100e+00, 6.1841e-01, -1.4042e+00, -1.2565e+00, -1.7690e+00, -8.2898e-01, 1.2253e+00]], [[ 2.8869e+00, -1.0852e+00, -1.2296e+00, -1.0449e+00, -1.7734e+00, 1.2521e+00, -1.5516e-01, 2.8601e-01, -1.0192e+00, -6.3128e-01, -1.7937e-01, -1.2235e-01, -3.3167e-01, 1.2771e+00, 2.2940e+00]], [[ 2.9864e+00, -1.0579e+00, -9.7677e-01, -7.7823e-02, -9.4003e-01, 1.1738e+00, 1.1451e+00, -5.2907e-01, -1.0211e+00, -3.6603e-01, 4.1455e-02, -1.4583e+00, 6.5404e-01, 1.2032e+00, 1.0097e+00]]], [[[ 2.0063e+00, 2.2218e+00, 6.3290e-01, 6.3148e-01, 1.5166e+00, 6.4333e-01, 6.4968e-01, 1.7574e+00, 4.1720e-01, 8.5107e-01, 7.7230e-01, 8.1383e-01, 1.9760e+00, 1.6724e+00, 1.3459e+00]], [[ 3.1121e+00, 5.0845e-01, -6.0365e-01, -6.8917e-01, -4.6217e-02, 6.5001e-02, -1.7003e-01, 1.2987e-01, -1.0848e+00, -6.7782e-01, 6.7437e-01, -1.7022e+00, 8.7109e-01, 6.8334e-01, 1.4159e+00]], [[ 2.7581e+00, -6.1939e-03, -1.2734e+00, -2.2433e+00, -1.5899e+00, 5.3743e-01, 4.2053e-02, -4.5770e-01, -1.6049e+00, -1.5335e+00, -5.4051e-01, -1.5009e+00, 7.3243e-01, -4.7744e-01, 1.1189e+00]], [[ 1.3142e+00, -5.4492e-01, -2.3623e+00, -2.4159e+00, -2.2942e+00, 4.1626e-02, 1.4545e-01, -2.4382e-01, -3.0861e+00, -2.6847e+00, -5.4026e-01, -7.5005e-01, 2.4981e-01, -6.7602e-01, 1.4762e-01]], [[ 2.1446e+00, -1.6993e-01, -1.8450e-01, -1.6076e+00, -9.7778e-01, -1.3302e+00, -2.8372e+00, -1.0626e+00, -1.6233e+00, -1.5066e+00, -2.5543e+00, -3.3718e+00, -3.7382e-01, -7.9034e-01, 2.0240e-01]], [[ 3.3276e+00, 1.9228e+00, -1.0241e-01, 1.3395e-01, -9.7217e-01, 1.7454e+00, 2.3084e+00, 1.2090e+00, 4.2568e-01, 5.5122e-01, 7.5134e-01, 1.5188e+00, 2.2168e+00, 7.0068e-01, 1.5815e+00]], [[ 3.0367e+00, -1.3427e+00, -2.2735e+00, -1.7360e+00, -1.7267e+00, 2.3719e-01, -1.5159e+00, -1.6785e+00, -2.1669e+00, -1.6173e+00, -9.2281e-01, -2.6309e+00, -1.3507e+00, -2.4208e+00, -9.0552e-01]], [[ 2.9054e+00, 9.8647e-01, 4.5291e-01, -2.3421e-01, 2.1305e-01, 2.1652e+00, 8.4769e-01, 8.1716e-01, 2.8052e-02, 3.4249e-01, 7.9479e-01, -1.9700e-01, 1.3931e+00, -6.8809e-01, 1.2015e+00]], [[-3.2445e+00, 6.2191e+00, 6.6268e+00, 4.2655e+00, 4.3010e+00, 4.2138e+00, 5.2797e+00, 5.7252e+00, 3.1475e+00, 2.7713e+00, 2.7453e+00, 3.5225e+00, 7.9618e+00, 7.0417e+00, 7.7772e+00]], [[ 3.2618e+00, -5.8149e-01, -1.8192e+00, -2.1633e+00, -2.0480e+00, 3.2219e-01, 2.6799e-01, -1.3968e+00, -1.3631e+00, -1.8030e+00, 4.9596e-01, -7.7727e-01, -6.6718e-01, -2.3182e+00, -1.9050e-01]], [[ 3.3360e+00, 1.8787e+00, 7.2369e-01, -1.6783e-01, 4.4298e-01, 2.0740e+00, 8.6596e-01, 1.5704e+00, 5.8618e-01, 9.7090e-01, 1.0460e+00, 2.3900e-01, 3.1248e+00, 1.4685e+00, 3.3779e+00]], [[ 3.1772e+00, 6.3425e-01, -1.1227e+00, -7.7365e-01, -9.5242e-01, 1.2827e+00, 6.1011e-01, 1.0732e-01, -1.0995e+00, -7.4306e-01, 6.6804e-01, -1.2726e+00, -1.6940e-01, -1.2169e+01, -6.1025e+00]]]]) attn_weights tensor([[[[-1.1938e+00, -3.6770e+00, -2.4757e+00, -2.9790e+00, -4.1276e+00, -2.3163e+00, -2.9535e+00, -3.8612e+00, -2.3667e+00, -2.7497e+00, -2.0273e+00, -3.9434e+00, -2.7704e+00, -2.0297e+00, -3.1089e+00, -3.3063e+00]], [[ 1.5073e+00, -5.5403e-02, 1.5957e+00, -2.5774e+00, -4.4778e-01, -3.6216e+00, -4.9285e+00, -8.6050e-01, 1.2671e+00, -3.0431e+00, -2.3844e+00, -7.1931e-01, -3.2079e+00, -4.0006e+00, -1.7040e-01, 6.0024e+00]], [[-1.7243e+00, -2.5983e+00, -2.1776e+00, -1.8172e+00, -2.8313e+00, -2.8915e+00, -2.7422e+00, -2.7599e+00, -2.2526e+00, -1.8208e+00, -1.5810e+00, -2.8388e+00, -2.5004e+00, -2.8552e+00, -1.7281e+00, -2.3814e+00]], [[-3.5980e+00, -7.7055e+00, -8.1809e+00, -6.6237e+00, -7.4244e+00, -7.2211e+00, -6.6628e+00, -5.0835e+00, -4.9269e+00, -3.1179e+00, -1.8878e+00, -2.9988e+00, -2.0154e+00, -2.5622e+00, -5.9031e-01, 2.7160e+00]], [[-7.9697e-01, -3.1168e+00, -3.0991e+00, -2.0558e+00, -3.1370e+00, -2.7991e+00, -2.2685e+00, -2.4494e+00, -2.0240e+00, -7.2696e-01, -1.2767e+00, -1.2332e+00, -8.9224e-01, -5.9092e-01, 5.3468e-01, 9.0978e-01]], [[ 5.5974e+00, 3.0219e+00, 5.2068e+00, 1.6955e+00, 2.3288e+00, 1.4572e+00, -5.0449e-02, 9.9382e-01, 4.0408e+00, 6.0492e-01, 1.2615e+00, 1.3956e+00, 2.9501e+00, 6.3639e-01, 1.5998e+00, 8.8368e+00]], [[-5.3003e-01, -3.9822e+00, -4.3096e+00, -2.7490e+00, -4.4336e+00, -1.7790e+00, -1.6402e+00, -4.2296e+00, -4.3481e+00, -2.5935e+00, -2.3449e+00, -4.3156e+00, -2.6043e+00, -1.4529e+00, -4.0641e+00, -4.6591e+00]], [[-5.5092e+00, -7.3480e+00, -7.3637e+00, -7.5124e+00, -6.9455e+00, -7.5196e+00, -7.2567e+00, -5.9186e+00, -5.7102e+00, -5.7844e+00, -5.7356e+00, -4.4789e+00, -4.6254e+00, -4.8061e+00, -3.3976e+00, -3.4711e+00]], [[-2.3871e+00, -2.0412e+00, -6.4815e-01, -3.0539e+00, -1.8693e+00, -3.3926e+00, -3.2954e+00, -1.7519e+00, -3.0045e-01, -2.8951e+00, -3.6772e+00, -1.6240e+00, -2.9410e+00, -3.1788e+00, -2.0379e+00, -8.4589e-01]], [[-1.8036e+00, -2.3028e+00, -2.2431e+00, -2.6917e+00, -2.5934e+00, -3.0475e+00, -2.8636e+00, -2.4486e+00, -2.2817e+00, -2.6868e+00, -2.7095e+00, -2.5292e+00, -2.5765e+00, -2.9573e+00, -2.3686e+00, -2.5160e+00]], [[ 6.2829e-01, 8.6425e-02, 2.5705e-01, -3.7367e-01, -5.9525e-02, -9.2908e-01, -1.0792e+00, -3.4971e-02, 1.6549e-01, -4.7417e-01, -4.8199e-01, -1.0953e-01, -5.7093e-01, -1.0105e+00, 4.1185e-02, 1.6263e+00]], [[-1.5584e+00, -2.4937e+00, -3.4524e+00, -2.3174e+00, -2.9290e+00, -2.6290e+00, -2.3544e+00, -2.6061e+00, -3.6689e+00, -2.3731e+00, -2.6348e+00, -2.9988e+00, -2.8409e+00, -2.6554e+00, -2.3587e+00, -2.9836e+00]]], [[[ 5.6788e-01, -1.3178e+00, -1.1512e+00, -1.4488e+00, -1.3756e+00, -6.0649e-01, -9.3465e-01, -1.6562e+00, -1.3752e+00, -1.2491e+00, -1.4638e+00, -8.9097e-01, -9.4543e-01, -1.1022e+00, -1.3142e+00, -7.1359e-01]], [[ 2.9770e+00, 1.7580e+00, 2.0911e+00, 3.2052e+00, 2.9869e+00, 5.5003e+00, 2.7418e+00, 6.7004e-01, 2.4862e+00, 1.2023e+00, 2.6811e+00, 2.4375e+00, 1.6490e+00, 3.1689e+00, 3.1350e+00, 1.1591e+01]], [[-1.1363e+00, -1.5451e+00, -1.2648e+00, -1.5525e+00, -1.6117e+00, -1.6135e+00, -1.5952e+00, -1.9047e+00, -2.1941e+00, -1.4012e+00, -1.6380e+00, -1.6646e+00, -2.0493e+00, -1.6723e+00, -1.9941e+00, -1.1570e+00]], [[-1.4434e+00, -9.0893e+00, -1.0045e+01, -6.4748e+00, -8.2973e+00, -3.2975e+00, -6.3128e+00, -6.8532e+00, -6.7852e+00, -6.3405e+00, -2.3164e+00, -2.9653e+00, -3.6402e+00, -1.7224e+00, -1.7671e+00, 6.9003e+00]], [[ 3.2751e-01, -3.2645e+00, -3.7654e+00, -1.6151e+00, -3.4085e+00, -1.7428e+00, -2.5020e+00, -2.7053e+00, -2.6152e+00, -2.4652e+00, -7.6465e-02, -1.6305e+00, -1.6324e+00, -8.7751e-01, 1.9690e-02, 3.8377e+00]], [[ 1.0252e+01, -3.5485e-01, 6.7823e-01, 3.3751e+00, -1.9771e-01, 5.3295e+00, 2.6531e+00, -3.0596e+00, -1.2111e+00, -9.2705e-01, 2.2986e+00, 8.9750e-01, -2.7684e+00, -2.3954e+00, 3.5707e-01, 1.4271e+01]], [[ 6.5489e-01, -1.0463e+00, -2.5452e+00, -2.3711e+00, -1.4920e+00, 6.7285e-02, -3.0610e-01, -1.5666e+00, -1.7297e+00, -3.0446e+00, -2.6550e+00, -1.9704e+00, -2.7181e+00, -2.9548e+00, -2.6897e+00, -2.6039e-01]], [[-4.0991e+00, -5.1490e+00, -4.9048e+00, -5.2757e+00, -4.5891e+00, -5.0374e+00, -4.3990e+00, -3.7810e+00, -3.4661e+00, -3.3551e+00, -3.4072e+00, -3.0510e+00, -2.1185e+00, -2.0667e+00, -1.4846e+00, -2.0829e+00]], [[-1.4298e+00, -1.7591e+00, -1.7640e+00, -2.2554e+00, -2.1076e+00, -1.4065e+00, -2.2222e+00, -1.9377e+00, -1.5761e+00, -1.7693e+00, -2.2060e+00, -2.1570e+00, -1.4951e+00, -1.8737e+00, -1.8118e+00, -2.6574e+00]], [[-1.7546e+00, -2.1449e+00, -2.3057e+00, -2.4795e+00, -2.4782e+00, -2.7401e+00, -2.4178e+00, -2.2830e+00, -2.2164e+00, -2.4064e+00, -2.4994e+00, -2.2891e+00, -2.1896e+00, -2.4703e+00, -2.4702e+00, -3.6177e+00]], [[ 7.4248e-01, 4.1565e-01, 6.5726e-02, -8.7819e-04, 1.5878e-01, 6.9474e-01, -2.9148e-01, 2.4942e-01, 3.5818e-01, -1.8064e-01, -2.1729e-01, 9.8976e-04, 2.9455e-01, -6.2828e-02, 1.8292e-01, 1.8556e+00]], [[-2.1186e+00, -1.2669e+00, -3.3420e+00, -2.7272e+00, -2.4627e+00, -2.9274e+00, -2.2256e+00, -1.3089e+00, -1.9331e+00, -3.5690e+00, -2.7557e+00, -2.1844e+00, -2.5023e+00, -1.8986e+00, -1.5579e+00, -2.7759e+00]]], [[[-1.1225e+00, -3.4765e+00, -2.2646e+00, -2.2191e+00, -3.8524e+00, -2.6115e+00, -2.4413e+00, -3.6320e+00, -2.5487e+00, -2.0877e+00, -2.2372e+00, -2.4920e+00, -2.5034e+00, -2.3674e+00, -3.6516e+00, -3.4504e+00]], [[-1.3243e+00, -9.2771e-01, -1.5883e+00, -3.6411e+00, 5.0159e+00, -4.0939e+00, -4.0753e+00, -1.6613e+00, -1.3771e+00, -2.1753e+00, -4.2725e+00, -4.5402e+00, -1.9093e+00, -1.1567e+00, -9.5902e-01, 5.2211e+00]], [[-2.2486e+00, -2.5001e+00, -2.9730e+00, -2.7848e+00, -3.6830e+00, -3.4458e+00, -3.0594e+00, -2.5168e+00, -2.5518e+00, -2.9691e+00, -2.7348e+00, -3.0439e+00, -2.5730e+00, -3.0561e+00, -1.9284e+00, -3.5718e+00]], [[-3.6352e+00, -6.2700e+00, -7.2719e+00, -6.9245e+00, -5.4870e+00, -7.0603e+00, -5.8015e+00, -4.2999e+00, -4.3662e+00, -3.8652e+00, -2.6476e+00, -3.3682e+00, -1.8258e+00, -1.3073e+00, -2.4617e-01, 1.3669e+00]], [[-9.9666e-01, -2.9438e+00, -3.1930e+00, -1.7444e+00, -2.2151e+00, -2.1125e+00, -1.6978e+00, -2.1585e+00, -1.3493e+00, -1.7168e+00, 4.2127e-01, -1.0238e+00, 1.0788e+00, 3.9800e-01, 7.1509e-01, 1.1947e+00]], [[ 1.3597e+00, 3.3260e+00, 2.8479e+00, 1.7767e+00, 5.5448e+00, 5.9127e-01, 8.3606e-01, 2.2746e+00, 2.5966e+00, 1.8256e+00, 9.7852e-01, 8.9074e-01, 2.0501e+00, 2.2499e+00, 2.2323e+00, 4.9418e+00]], [[-9.8552e-01, -5.0506e+00, -3.9805e+00, -2.0400e+00, -4.9875e+00, -1.5908e+00, -1.5281e+00, -5.4608e+00, -3.2129e+00, -3.8475e+00, -1.7746e+00, -2.3003e+00, -1.7952e+00, -2.1113e+00, -4.7684e+00, -4.5978e+00]], [[-6.4658e+00, -8.1033e+00, -7.9602e+00, -7.7939e+00, -8.0746e+00, -7.6247e+00, -7.4697e+00, -6.5762e+00, -6.6067e+00, -5.7444e+00, -5.4304e+00, -5.4420e+00, -4.8869e+00, -4.4836e+00, -3.9366e+00, -3.6972e+00]], [[-3.8023e+00, -2.2779e+00, -3.4868e+00, -3.6675e+00, -1.1045e+00, -3.7447e+00, -3.3020e+00, -1.3427e+00, -3.0208e+00, -2.8898e+00, -2.9575e+00, -3.8463e+00, -2.8513e+00, -2.9377e+00, -1.6407e+00, -2.2303e-01]], [[-1.7017e+00, -1.9096e+00, -1.9962e+00, -2.5785e+00, -2.0653e+00, -2.6325e+00, -2.6547e+00, -2.0071e+00, -1.9251e+00, -2.0309e+00, -2.4004e+00, -2.4632e+00, -2.2995e+00, -2.0325e+00, -1.7357e+00, -1.8543e+00]], [[ 1.8735e-01, -6.3084e-03, -1.3455e-01, -7.2918e-01, 7.4388e-01, -1.0934e+00, -8.2989e-01, -6.9561e-02, -2.1071e-01, -2.2255e-01, -9.8061e-01, -9.6655e-01, -7.2167e-01, -9.3650e-02, -9.5423e-02, 7.9459e-01]], [[-1.5007e+00, -2.3100e+00, -3.6657e+00, -2.5449e+00, -2.5924e+00, -2.6004e+00, -2.2127e+00, -2.3147e+00, -2.4743e+00, -3.8903e+00, -2.5361e+00, -2.7837e+00, -2.6994e+00, -2.6440e+00, -3.2124e+00, -2.6009e+00]]], [[[-7.8021e-01, -2.4156e+00, -2.1182e+00, -2.4293e+00, -2.9840e+00, -1.7472e+00, -1.7736e+00, -2.5428e+00, -2.9864e+00, -1.7220e+00, -1.6807e+00, -2.5183e+00, -9.9584e-01, -2.5779e+00, -2.3079e+00, -3.5465e+00]], [[ 3.2955e+00, 2.1633e+00, 7.0954e+00, 1.9716e+00, 2.2103e+00, 2.8158e+00, -1.6084e+00, 1.2745e+00, 1.9107e+00, -6.4001e-01, -1.8577e+00, 2.4657e+00, 2.4774e+00, -1.2826e+00, 6.9442e-01, 8.5019e+00]], [[-1.0599e+00, -1.8342e+00, -2.1508e+00, -1.0559e+00, -1.9265e+00, -1.6520e+00, -2.4104e+00, -2.1663e+00, -1.9988e+00, -2.1724e+00, -2.4074e+00, -9.7478e-01, -1.5734e+00, -1.3152e+00, -2.1415e+00, -2.5663e+00]], [[-3.7734e+00, -8.7089e+00, -6.4642e+00, -5.8719e+00, -7.9503e+00, -8.5210e+00, -7.6452e+00, -6.2196e+00, -5.5890e+00, -6.5424e+00, -5.2601e+00, -3.7510e+00, -2.2541e+00, -2.6884e+00, -7.9881e-01, 1.9211e+00]], [[-5.3553e-01, -3.4481e+00, -3.6435e+00, -2.2325e+00, -3.6214e+00, -2.4696e+00, -3.3944e+00, -2.8752e+00, -2.7301e+00, -3.2348e+00, -2.3902e+00, -1.2106e+00, -6.1095e-01, -5.8932e-01, 1.1852e-01, 1.4248e-01]], [[ 7.9370e+00, 4.2123e+00, 8.3545e+00, 4.8655e+00, 2.8040e+00, 5.2651e+00, 1.6798e-01, 1.5098e+00, 1.8752e+00, -4.2398e-01, -4.7214e-01, 3.1464e+00, 1.3984e+00, 1.2251e+00, 1.6245e+00, 1.1085e+01]], [[-1.1789e+00, -3.6691e+00, -4.3214e+00, -2.5395e+00, -3.7965e+00, -1.8799e+00, -1.8764e+00, -3.9048e+00, -3.7455e+00, -1.3031e+00, -1.7321e+00, -1.9650e+00, -3.2621e+00, -3.6743e+00, -2.9425e+00, -3.6655e+00]], [[-5.0796e+00, -6.1583e+00, -6.5389e+00, -6.5342e+00, -6.0570e+00, -6.3133e+00, -6.0772e+00, -5.1156e+00, -4.9032e+00, -6.1576e+00, -4.7640e+00, -3.5236e+00, -3.2698e+00, -3.3668e+00, -2.6204e+00, -3.2637e+00]], [[-2.2727e+00, -1.8861e+00, -3.3314e+00, -2.8668e+00, -1.6665e+00, -2.4472e+00, -3.3105e+00, -1.5828e+00, -1.5215e+00, -3.1525e+00, -3.1882e+00, -2.1008e+00, -2.1611e+00, -1.5302e+00, -2.3108e+00, -3.1716e+00]], [[-1.8635e+00, -2.1331e+00, -2.4866e+00, -2.8555e+00, -2.4711e+00, -2.6799e+00, -2.8394e+00, -2.2715e+00, -2.4618e+00, -2.9473e+00, -2.7765e+00, -2.0961e+00, -2.0855e+00, -2.2250e+00, -2.5226e+00, -2.5295e+00]], [[ 1.0166e+00, 4.0727e-01, 1.6766e+00, 5.3155e-01, 1.8491e-01, -3.6940e-01, -9.1170e-01, 1.7457e-01, 8.8478e-02, -7.0579e-01, -9.8237e-01, 3.1576e-01, 4.6495e-01, 2.4819e-01, 4.6981e-02, 1.6666e+00]], [[-1.4806e+00, -2.3404e+00, -3.7904e+00, -2.2247e+00, -2.8178e+00, -2.5013e+00, -2.2003e+00, -2.4319e+00, -2.8742e+00, -2.0041e+00, -2.2088e+00, -2.4855e+00, -3.5523e+00, -2.7172e+00, -2.5292e+00, -3.3757e+00]]], [[[-3.7861e-01, -1.9352e+00, -1.0537e+00, -1.1806e+00, -2.1697e+00, -1.8922e+00, -1.3178e+00, -2.0735e+00, -1.8960e+00, -1.7702e+00, -7.7713e-01, -1.1193e+00, -2.1321e+00, -2.0177e+00, -1.9905e+00, -8.8966e-01]], [[ 6.3696e-01, 1.5318e+00, 3.3558e+00, -1.4667e-01, 1.8693e+00, 1.0633e-01, -1.5319e+00, 6.0143e-01, 1.3308e+00, 2.6446e+00, 1.0765e+00, -1.8568e+00, -1.2772e+00, 1.7626e+00, 1.7821e+00, 9.8506e+00]], [[-1.5313e+00, -1.9014e+00, -1.3835e+00, -1.2968e+00, -2.2840e+00, -2.0452e+00, -2.0879e+00, -2.1273e+00, -1.9523e+00, -2.2694e+00, -2.3625e+00, -2.0635e+00, -1.1485e+00, -1.8158e+00, -1.8138e+00, -1.3198e+00]], [[-4.8097e+00, -8.2668e+00, -8.9360e+00, -8.0485e+00, -7.9615e+00, -9.2503e+00, -8.6716e+00, -6.0812e+00, -5.4347e+00, -4.1345e+00, -4.3807e+00, -5.6062e+00, -3.5488e+00, -2.2146e+00, -1.4862e+00, 2.9836e+00]], [[-1.6437e-01, -1.8612e+00, -1.6110e+00, -2.0290e+00, -2.1141e+00, -2.3721e+00, -1.5947e+00, -1.1724e+00, -6.2561e-01, -2.9262e-01, -5.6387e-01, -1.9722e-01, 1.6325e-03, 9.7349e-01, 1.3065e+00, 3.3856e+00]], [[ 5.1475e+00, 2.0489e+00, 3.2987e+00, 2.0717e+00, 2.9398e+00, 4.9571e-01, -8.3405e-01, 4.1479e-01, 2.3965e+00, 3.3642e+00, -3.6509e-01, -1.3438e+00, -9.6397e-02, 3.4195e-01, 2.8716e-01, 9.9881e+00]], [[ 5.7187e-01, -2.6342e+00, -2.0941e+00, -9.7727e-01, -2.7074e+00, -1.9319e-01, -4.2291e-01, -2.8906e+00, -2.0833e+00, -2.3311e+00, -2.4359e-01, -2.8908e-01, -2.5378e+00, -2.6801e+00, -2.6572e+00, -1.6372e+00]], [[-5.4027e+00, -6.7183e+00, -6.7357e+00, -6.6843e+00, -6.4331e+00, -7.2373e+00, -6.8478e+00, -5.3364e+00, -5.2087e+00, -4.7176e+00, -5.2747e+00, -4.9685e+00, -2.8519e+00, -2.6127e+00, -2.1644e+00, -2.3275e+00]], [[-2.6176e+00, -1.4525e+00, -2.2189e+00, -2.5855e+00, -1.1799e+00, -3.0368e+00, -2.6976e+00, -8.5774e-01, -1.8840e+00, -1.3474e+00, -2.9140e+00, -2.4466e+00, -6.6538e-01, -1.0435e+00, -9.9482e-01, -1.8544e+00]], [[-1.6270e+00, -1.8578e+00, -1.7929e+00, -2.3443e+00, -2.0153e+00, -2.5391e+00, -2.7257e+00, -1.9325e+00, -2.1134e+00, -2.0928e+00, -2.4293e+00, -2.6460e+00, -1.7685e+00, -1.5981e+00, -1.5681e+00, -1.6095e+00]], [[ 4.6256e-01, 4.9535e-01, 5.0274e-01, -8.6825e-02, 4.9463e-01, -3.8443e-01, -4.8115e-01, 4.0716e-01, -7.2623e-03, 4.4652e-01, -1.5682e-01, -5.7706e-01, 3.7267e-01, 4.8828e-01, 4.8654e-01, 1.6224e+00]], [[-9.8358e-01, -2.0646e+00, -3.1119e+00, -2.4899e+00, -2.2517e+00, -2.7454e+00, -2.3581e+00, -2.0785e+00, -2.2321e+00, -2.3364e+00, -2.6556e+00, -2.3778e+00, -2.1580e+00, -1.5123e+00, -1.5004e+00, -2.3636e+00]]]]) attn_weights tensor([[[[-1.9956e+00, -3.9687e+00, -2.0597e+00, -2.4717e+00, -3.2869e+00, -3.6573e+00, -3.2261e+00, -2.0192e+00, -4.8186e-01, -8.3642e-01, -1.4941e+00, -1.1358e+00, -1.0304e+00, -1.9592e+00, 8.7739e-01, -1.3643e+00]], [[-1.0424e+00, -2.2705e+00, -3.0527e+00, -2.9684e+00, -2.7424e+00, -2.8454e+00, -2.6808e+00, -5.8069e-01, -1.4617e+00, -1.4053e+00, -1.0264e+00, -7.7104e-01, -7.5104e-01, -8.6865e-01, 4.4553e-01, -2.8976e-01]], [[-3.3978e+00, -4.1192e+00, -3.8431e+00, -4.2721e+00, -3.6517e+00, -3.8375e+00, -3.4362e+00, -2.9428e+00, -3.1350e+00, -3.5792e+00, -2.9205e+00, -2.9505e+00, -3.1666e+00, -2.8499e+00, -2.5508e+00, -2.8441e+00]], [[ 7.5111e-02, -3.5108e+00, -3.3594e+00, -3.4692e+00, -3.3178e+00, -3.1458e+00, -2.9305e+00, -2.7665e+00, -2.7653e+00, -2.9322e+00, -2.4008e+00, -2.6771e+00, -2.6374e+00, -2.4307e+00, -2.2502e+00, -2.1748e+00]], [[-7.1659e-01, -2.4718e+00, -2.7787e+00, -2.8454e+00, -2.6264e+00, -2.3665e+00, -2.2554e+00, -2.1833e+00, -2.3401e+00, -2.3803e+00, -1.8471e+00, -2.0915e+00, -1.9427e+00, -1.6738e+00, -1.7721e+00, -1.7486e+00]], [[ 6.4283e-01, -1.8135e-01, 1.5785e-02, -6.6191e-01, -8.9471e-01, -3.5380e+00, -3.4712e+00, -2.0494e-01, -2.4571e-01, -9.3227e-01, -3.2029e+00, -1.0718e+00, -2.4718e+00, -4.1555e+00, -1.9986e+00, 1.1627e-02]], [[ 1.3421e+00, -1.3249e+00, -1.6052e+00, -1.2635e+00, -9.9761e-01, -1.6458e+00, -1.8551e+00, -1.5749e+00, -1.9699e+00, -1.6678e+00, -1.1222e+00, -1.2244e+00, -8.8314e-01, -2.7806e+00, -1.6832e+00, -1.8956e+00]], [[-1.2404e-01, -1.8426e+00, -2.7144e+00, -2.4683e+00, -2.4435e+00, -1.9493e+00, -1.5048e+00, -1.7628e+00, -2.8454e+00, -2.5599e+00, -1.3034e+00, -2.2915e+00, -1.6438e+00, -2.3925e+00, -1.4537e+00, -2.2297e+00]], [[-9.1403e-01, -2.1854e+00, -2.5347e+00, -2.4543e+00, -2.2313e+00, -2.6091e+00, -2.8535e+00, -2.1817e+00, -2.4073e+00, -2.3225e+00, -2.4965e+00, -2.1268e+00, -2.4580e+00, -2.2258e+00, -2.1473e+00, -2.0305e+00]], [[ 1.1133e+00, -6.0105e-01, -1.4477e-01, -7.0291e-01, 7.4730e-02, -1.1171e+00, -1.4320e+00, -7.9477e-01, -1.0387e-01, -5.4376e-01, -1.3473e+00, 8.4120e-02, -5.2299e-01, -6.5370e-01, -4.1996e-01, -3.8065e-02]], [[-4.5732e+00, -2.5665e+00, -2.3661e+00, -2.4305e+00, -2.3369e+00, -1.9159e+00, -1.7342e+00, -1.8327e+00, -1.7071e+00, -1.8147e+00, -1.0607e+00, -1.6120e+00, -1.4209e+00, -1.0960e+00, -1.0334e+00, -1.0057e+00]], [[ 4.3234e-01, -1.3407e-01, -1.7428e+00, -3.1805e+00, -2.1549e+00, -4.8516e+00, -5.2025e+00, 6.0855e-02, -1.7780e+00, -2.9172e+00, -3.8591e+00, -1.9853e+00, -3.2962e+00, -5.2074e+00, -1.6798e+00, 3.0335e+00]]], [[[ 1.0028e-01, -1.5767e+00, -1.9120e+00, -1.1319e+00, -6.9295e-01, -2.0555e-01, -1.9103e-01, -1.2522e-01, 2.0519e-02, -4.1006e-01, 3.5815e-01, 1.3270e+00, 1.1455e+00, 2.5000e+00, 2.8807e+00, 2.3522e+00]], [[-1.1439e+00, -2.7166e+00, -2.8770e+00, -2.8570e+00, -2.9940e+00, -2.9962e+00, -2.7723e+00, -1.1353e+00, -1.1872e+00, -1.1927e+00, -1.1484e+00, -8.6747e-01, -1.0040e+00, -5.6766e-01, 6.8274e-02, -5.8509e-01]], [[-3.2388e+00, -3.9553e+00, -3.7712e+00, -4.1117e+00, -3.6346e+00, -3.7790e+00, -3.4397e+00, -2.8919e+00, -3.0656e+00, -3.1074e+00, -3.4177e+00, -3.2221e+00, -2.7538e+00, -3.0006e+00, -2.5775e+00, -2.9237e+00]], [[ 1.6973e-01, -3.2607e+00, -3.2036e+00, -3.2778e+00, -3.1861e+00, -2.9849e+00, -2.7506e+00, -2.6563e+00, -2.6788e+00, -2.6516e+00, -2.7627e+00, -2.5695e+00, -2.4233e+00, -2.5012e+00, -2.1859e+00, -2.1998e+00]], [[-7.2974e-01, -2.5166e+00, -2.8894e+00, -2.8809e+00, -2.8416e+00, -2.3685e+00, -2.3449e+00, -2.3649e+00, -2.4876e+00, -2.5224e+00, -2.4662e+00, -2.1171e+00, -2.1908e+00, -2.0847e+00, -1.8998e+00, -1.5627e+00]], [[ 5.9199e-01, -9.6167e-02, -1.5542e+00, -1.3356e+00, -4.1347e-01, 1.1775e+00, -8.4177e-01, -4.1453e-01, -4.2497e-01, -1.9126e+00, -1.7434e+00, -4.3090e-01, -8.4091e-01, -1.1588e+00, -7.8321e-01, 1.0046e-01]], [[ 3.8758e+00, 1.4761e+00, 7.6037e-01, 7.5614e-01, 5.6304e-01, 3.8197e+00, 1.3195e+00, 8.6788e-01, 1.0169e+00, 8.3844e-03, 5.9212e-02, -6.6133e-01, 5.4438e-01, 2.1892e-01, -3.1465e-01, 2.1891e+00]], [[ 4.4340e-02, -2.0167e+00, -2.0069e+00, -1.7264e+00, -2.5702e+00, -1.4230e+00, -6.4700e-01, -1.8248e+00, -1.6753e+00, -2.0761e+00, -1.8059e+00, -1.6687e+00, -1.7936e+00, -1.7752e+00, -1.7435e+00, -1.7258e+00]], [[-7.1016e-01, -1.7310e+00, -1.9544e+00, -2.3016e+00, -1.6708e+00, -2.0854e+00, -2.4935e+00, -1.7246e+00, -1.3745e+00, -1.8238e+00, -2.0824e+00, -2.0227e+00, -1.5525e+00, -2.0681e+00, -1.7245e+00, -2.4234e+00]], [[ 1.4501e+00, -1.3999e-01, -2.4951e-02, -1.6699e-01, 4.2200e-01, -3.0603e-01, -5.7587e-01, -3.8780e-01, -4.6277e-01, -1.0899e-01, -5.3499e-02, -3.6229e-01, -3.0231e-01, -1.9572e-01, -4.0267e-01, -1.5968e+00]], [[-5.0605e+00, -2.1363e+00, -2.0649e+00, -2.0855e+00, -2.0690e+00, -1.6745e+00, -1.4642e+00, -1.5632e+00, -1.6003e+00, -1.4291e+00, -1.4630e+00, -1.2192e+00, -1.1309e+00, -1.1543e+00, -8.0927e-01, -7.4397e-01]], [[ 4.3467e-01, -6.2993e-01, -4.6492e+00, -3.5252e+00, -2.4122e+00, -1.0397e+00, -1.0583e+00, -3.4762e-01, -1.1980e+00, -5.3677e+00, -3.9698e+00, -2.2354e+00, -8.6330e-01, -2.4600e+00, -1.6188e+00, 3.4944e+00]]], [[[-1.5372e+00, -3.6715e+00, -3.5106e+00, -2.9980e+00, -3.6529e+00, -3.5874e+00, -2.9912e+00, -2.0749e+00, -2.3232e+00, -1.7590e+00, -1.4986e+00, -1.2104e+00, 8.7675e-02, -4.7678e-02, 2.6461e-01, -4.4615e-01]], [[-6.5607e-01, -2.0861e+00, -2.5425e+00, -2.4240e+00, -3.1019e+00, -2.5159e+00, -2.1001e+00, -4.0302e-01, -1.1522e+00, -7.3993e-01, -1.2173e+00, -1.0646e+00, -5.3514e-01, -3.9317e-01, 1.6699e-01, -4.3854e-01]], [[-3.1590e+00, -3.9962e+00, -3.7615e+00, -4.0862e+00, -3.4591e+00, -3.6564e+00, -3.3048e+00, -2.8239e+00, -3.2571e+00, -2.9780e+00, -3.6210e+00, -3.5424e+00, -2.9035e+00, -3.1389e+00, -2.7162e+00, -2.5362e+00]], [[ 8.1481e-02, -3.3817e+00, -3.2923e+00, -3.3428e+00, -3.1501e+00, -3.0004e+00, -2.7951e+00, -2.6650e+00, -2.8217e+00, -2.6515e+00, -2.9600e+00, -2.9791e+00, -2.5080e+00, -2.5809e+00, -2.5092e+00, -2.2923e+00]], [[-7.1836e-01, -2.6837e+00, -2.9013e+00, -2.8379e+00, -2.6581e+00, -2.2543e+00, -2.1856e+00, -2.2728e+00, -2.4191e+00, -2.3357e+00, -2.5399e+00, -2.4913e+00, -1.8018e+00, -2.0059e+00, -2.0427e+00, -1.8138e+00]], [[ 1.4889e-01, -3.9171e-02, -1.6870e+00, -7.1461e-01, -1.0589e+00, -2.1594e+00, -1.9887e+00, 2.7056e-01, -2.0541e-01, -1.8000e+00, -9.6345e-01, -8.0285e-01, -1.0023e+00, -1.1204e+00, -3.1806e-01, -1.0756e+00]], [[ 1.0581e+00, -9.5368e-01, -1.0852e+00, -1.1794e+00, -1.2047e+00, -6.0705e-01, -5.9514e-01, -9.3142e-01, -1.6459e+00, -1.3590e+00, -1.4232e+00, -1.1476e+00, -6.7798e-01, -1.0891e+00, -1.0028e+00, -1.3593e+00]], [[ 1.8208e-01, -1.8768e+00, -2.0501e+00, -2.1322e+00, -2.3014e+00, -1.2765e+00, -1.3220e+00, -1.5194e+00, -2.1426e+00, -2.0935e+00, -2.2738e+00, -2.1941e+00, -1.9089e+00, -1.7942e+00, -1.5387e+00, -2.0873e+00]], [[-4.9548e-01, -1.3209e+00, -1.8873e+00, -1.9946e+00, -1.5798e+00, -2.2627e+00, -2.3778e+00, -1.4783e+00, -1.8377e+00, -1.8152e+00, -2.1690e+00, -1.8502e+00, -1.8998e+00, -2.2666e+00, -1.9238e+00, -1.6112e+00]], [[ 1.2505e+00, -6.3568e-01, -5.1341e-02, -4.8188e-01, 2.5733e-01, -9.4522e-01, -1.0782e+00, -8.4278e-01, -1.0346e-01, -3.8848e-02, -4.0548e-01, -1.3399e-01, -2.0527e-02, -4.5896e-01, -8.4045e-01, 6.9488e-02]], [[-4.8106e+00, -2.4808e+00, -2.3595e+00, -2.3685e+00, -2.2454e+00, -1.8540e+00, -1.6958e+00, -1.7956e+00, -1.7493e+00, -1.6178e+00, -1.9704e+00, -1.8933e+00, -1.2425e+00, -1.4060e+00, -1.5197e+00, -1.2152e+00]], [[-1.1623e+00, -1.5088e+00, -4.0108e+00, -4.5116e+00, 9.0520e-01, -5.2938e+00, -6.0763e+00, -1.1079e+00, -3.8925e+00, -3.1920e+00, -4.5461e+00, -4.4944e+00, -3.9617e+00, -3.6198e+00, -8.2820e-01, 2.0593e+00]]], [[[-1.9513e+00, -3.8036e+00, -4.1179e+00, -2.9284e+00, -3.3131e+00, -3.8146e+00, -3.4376e+00, -2.1862e+00, -1.9949e+00, -2.2893e+00, -2.5541e+00, -1.3853e+00, 2.0188e-01, 5.2319e-01, 2.0880e-01, -1.1804e+00]], [[-1.2998e+00, -2.4037e+00, -3.2524e+00, -2.5575e+00, -2.3966e+00, -2.6272e+00, -2.5472e+00, -7.6863e-01, -1.2958e+00, -1.5134e+00, -1.5405e+00, 5.5984e-01, 2.4212e-02, 7.0929e-01, 5.4580e-01, 4.8901e-02]], [[-3.5296e+00, -4.1952e+00, -3.9950e+00, -4.2970e+00, -3.6991e+00, -3.9744e+00, -3.5800e+00, -3.0299e+00, -3.3089e+00, -3.6364e+00, -3.1237e+00, -2.7627e+00, -2.9437e+00, -2.7720e+00, -3.0753e+00, -2.6431e+00]], [[ 7.7706e-02, -3.6717e+00, -3.5074e+00, -3.5287e+00, -3.3771e+00, -3.2237e+00, -2.9834e+00, -2.8407e+00, -3.0006e+00, -2.8819e+00, -2.6063e+00, -2.2078e+00, -2.4630e+00, -2.3881e+00, -2.6424e+00, -2.2473e+00]], [[-6.2755e-01, -2.4422e+00, -2.7305e+00, -2.6645e+00, -2.5536e+00, -2.4427e+00, -2.2660e+00, -2.1573e+00, -2.2719e+00, -1.9269e+00, -1.9326e+00, -1.7390e+00, -1.7713e+00, -1.6708e+00, -1.8283e+00, -1.6287e+00]], [[ 6.8746e-01, -1.8591e-01, 7.4132e-01, -5.7447e-01, -9.8525e-01, -3.3114e+00, -3.5866e+00, -1.7595e-01, -1.0377e+00, -5.0135e+00, -4.0631e+00, -1.3141e+00, -4.2786e-01, -3.1506e-01, -1.0856e+00, 1.1999e-01]], [[ 1.3227e+00, -1.1824e+00, -1.5216e+00, -1.5063e+00, -1.5739e+00, -1.2394e+00, -1.8403e+00, -1.3244e+00, -1.6827e+00, -1.9617e+00, -1.9849e+00, -3.0781e-01, -1.1831e+00, -1.0697e+00, -1.3598e+00, -2.2276e+00]], [[ 1.4075e-01, -1.6874e+00, -2.0346e+00, -2.0505e+00, -1.9789e+00, -1.5646e+00, -1.1257e+00, -1.5337e+00, -1.9343e+00, -1.5100e+00, -1.5173e+00, -8.7502e-01, -2.2896e+00, -1.4336e+00, -1.6586e+00, -1.6078e+00]], [[-9.9628e-01, -2.0566e+00, -2.9771e+00, -2.7268e+00, -2.0175e+00, -2.7249e+00, -3.0478e+00, -2.0926e+00, -1.9701e+00, -3.1342e+00, -2.8257e+00, -1.8368e+00, -2.2343e+00, -1.8811e+00, -2.0999e+00, -2.6496e+00]], [[ 1.1369e+00, -4.5575e-01, 2.1142e-01, -5.7888e-01, 2.5854e-01, -1.0618e+00, -1.6421e+00, -7.2374e-01, 3.3107e-01, -1.9706e+00, -1.3240e+00, -3.2990e-01, 1.4389e-01, 3.2004e-01, -6.4103e-02, -2.5281e-01]], [[-4.5404e+00, -2.5456e+00, -2.3912e+00, -2.3866e+00, -2.2855e+00, -1.9630e+00, -1.7421e+00, -1.8277e+00, -1.8999e+00, -1.5510e+00, -1.3115e+00, -1.0366e+00, -1.1533e+00, -1.2421e+00, -1.3445e+00, -8.8160e-01]], [[-2.8944e-01, -2.0380e-01, 6.1014e-01, -2.3386e+00, -2.5998e+00, -4.2734e+00, -4.3107e+00, -6.3651e-02, -2.5822e+00, -4.5631e+00, -4.2031e+00, 2.6159e-01, -1.2931e+00, -2.2314e+00, -2.3714e+00, 2.9335e+00]]], [[[ 7.5638e-01, -8.3373e-01, -1.4272e+00, -1.1043e+00, -6.5640e-01, -6.3179e-01, -5.5135e-01, 1.3341e-02, -8.1394e-01, 2.5255e-01, 7.3131e-01, 3.9609e-01, 1.4626e+00, 2.3221e+00, 2.4920e+00, 1.3608e+00]], [[-6.7438e-01, -2.0017e+00, -2.7532e+00, -2.0697e+00, -2.0600e+00, -2.0748e+00, -1.7759e+00, -6.4164e-01, -1.3707e+00, -9.5609e-01, -7.2334e-01, -6.5374e-01, 1.1300e+00, 1.5405e+00, 1.9053e+00, 6.5011e-01]], [[-3.2539e+00, -3.9312e+00, -3.7127e+00, -4.0934e+00, -3.5376e+00, -3.7610e+00, -3.3980e+00, -2.8585e+00, -3.4452e+00, -3.1422e+00, -3.0292e+00, -2.8235e+00, -2.4215e+00, -2.5052e+00, -2.3301e+00, -2.6025e+00]], [[ 1.9481e-01, -3.4088e+00, -3.3084e+00, -3.3874e+00, -3.2296e+00, -3.0844e+00, -2.8654e+00, -2.7440e+00, -3.0349e+00, -2.8818e+00, -2.5045e+00, -2.4517e+00, -2.0647e+00, -2.1417e+00, -2.0393e+00, -2.1615e+00]], [[-6.3350e-01, -2.5315e+00, -2.7257e+00, -2.7665e+00, -2.6010e+00, -2.2676e+00, -2.1300e+00, -2.2311e+00, -2.3475e+00, -2.1924e+00, -1.6427e+00, -1.6052e+00, -1.7149e+00, -1.5057e+00, -1.3468e+00, -1.3018e+00]], [[ 1.4844e+00, -5.6606e-02, -1.1334e+00, -7.4497e-01, 5.1491e-01, -1.8431e+00, -1.6154e+00, -1.0830e-01, -2.3915e-01, 1.2488e-01, -1.4270e+00, -2.3848e+00, -7.0485e-03, 2.1852e-01, 1.0617e-01, 2.2602e+00]], [[ 2.3561e+00, 8.1787e-02, 5.6107e-01, 4.5245e-01, 4.4301e-02, 8.7216e-02, -2.5628e-01, -2.6198e-01, -1.1735e-01, -1.5595e-01, -3.4954e-01, -8.5897e-01, 2.7498e-01, 7.0324e-01, 4.3738e-01, -3.8264e-01]], [[ 7.6840e-01, -1.6074e+00, -1.0992e+00, -1.0006e+00, -1.4667e+00, -6.6703e-01, -4.6674e-01, -1.3236e+00, -1.1480e+00, -1.3732e+00, -6.9067e-01, -8.7544e-01, -9.1114e-01, -1.2618e+00, -1.2447e+00, -6.8505e-01]], [[ 1.2800e-01, -3.2728e-01, -1.3411e+00, -1.2239e+00, -5.8938e-01, -1.1160e+00, -1.3425e+00, -8.0823e-01, -8.9035e-01, -7.9153e-01, -1.2655e+00, -1.3094e+00, -4.7766e-01, -4.3474e-01, -3.9182e-01, -6.5572e-01]], [[ 1.4886e+00, -3.2944e-01, 2.4711e-01, -1.2019e-01, 6.7671e-01, -6.8195e-01, -1.1781e+00, -6.9400e-01, 2.0520e-01, 6.1914e-01, -1.0473e+00, -9.2287e-01, -5.0961e-01, -5.1150e-01, -4.0143e-01, 4.6901e-01]], [[-5.1120e+00, -2.4283e+00, -2.3066e+00, -2.3522e+00, -2.2766e+00, -1.9165e+00, -1.7162e+00, -1.8127e+00, -1.9583e+00, -1.8364e+00, -1.2528e+00, -1.2366e+00, -1.0902e+00, -1.1241e+00, -1.0036e+00, -9.1983e-01]], [[ 1.2289e+00, 1.4863e-01, -1.2639e+00, -2.5883e+00, -2.4886e+00, -2.9289e+00, -3.6914e+00, -3.6926e-03, -1.9597e+00, -2.2434e+00, -4.6161e+00, -4.7236e+00, 7.0557e-01, 1.0387e+00, 7.5906e-01, 3.9308e+00]]]]) attn_weights tensor([[[[ -1.9280, -4.8445, -4.9087, -5.9456, -5.3720, -5.2074, -5.6710, -3.4941, -3.3514, -4.2686, -3.1564, -3.1858, -2.4947, -3.3598, -0.5811, -2.7632]], [[ 1.7829, -0.3842, -1.1836, -0.5448, -2.1567, -2.1426, -3.0152, -0.9627, -2.5509, -1.5083, -1.0617, -2.7915, -2.5236, -3.5255, -1.2744, -2.8197]], [[ -6.1807, -15.6552, -16.4727, -15.5864, -13.4423, -12.3129, -12.2143, -10.5993, -9.9964, -9.1482, -7.0700, -5.2363, -5.5790, -3.7648, -1.5760, -5.7593]], [[ -3.0667, -7.7203, -7.9799, -8.9914, -6.0677, -7.1530, -6.8307, -5.4563, -5.2029, -5.9663, -4.6067, -2.1570, -2.4201, -3.3286, -0.9811, -2.3406]], [[ -1.8692, -6.6377, -6.9016, -7.1955, -6.4127, -6.6360, -7.8284, -4.3216, -4.3134, -4.5667, -4.3576, -2.8373, -3.0079, -3.3420, -1.8353, -2.7363]], [[ -4.2576, -7.8564, -10.3860, -8.6067, -8.9842, -8.3218, -7.8593, -4.7371, -6.8538, -5.0246, -5.6621, -4.3735, -4.5437, -3.5456, -2.3500, -3.4915]], [[ -0.6452, -3.5541, -2.2067, -3.4399, -4.2674, -5.2327, -4.3970, -2.3717, -1.2792, -2.6253, -3.1133, -3.0916, -3.4691, -4.0187, -2.6687, -2.7856]], [[ -1.2452, -4.0690, -2.7772, -2.6810, -2.8021, -1.9813, -2.0845, -2.0343, -1.2738, -1.5473, -1.2118, -1.4976, -1.0198, -0.4399, -1.2581, -0.8866]], [[ -3.4422, -7.5907, -9.8483, -6.6942, -7.6130, -7.7288, -6.4336, -5.3608, -6.7627, -3.7798, -3.3480, -3.7244, -3.5643, -4.1232, -1.0302, -3.8397]], [[ -4.0815, -9.4128, -10.2334, -9.7748, -8.9251, -6.4351, -6.5054, -6.6634, -6.9855, -6.3087, -4.0167, -4.5932, -3.1506, -2.2225, -3.4859, -3.1655]], [[ -1.9413, -3.8402, -3.5506, -3.3514, -3.6407, -2.9251, -2.7965, -3.1372, -2.5614, -2.4764, -1.8614, -2.5183, -2.2477, -1.7213, -1.9969, -1.6138]], [[ -0.6643, -5.0756, -4.9968, -4.8278, -4.9399, -4.4043, -4.2814, -4.0922, -3.8515, -3.7821, -3.1589, -3.5870, -3.3212, -2.9075, -3.0585, -2.6392]]], [[[ -1.6223, -4.8725, -4.4939, -6.4486, -5.1719, -4.4066, -4.2195, -3.4587, -2.5142, -2.8747, -4.8628, -2.4358, -1.4492, -4.1041, -1.2251, -2.4667]], [[ 1.9125, -1.5066, -2.5500, -1.9691, -2.7877, -0.2049, -1.0196, -1.6267, -1.8717, -3.3556, -2.4938, -2.4007, -1.0562, -1.1953, -1.4316, -0.7654]], [[ -4.8653, -11.4791, -12.0420, -11.9723, -10.6559, -9.7940, -9.4510, -8.1070, -7.6262, -6.2276, -6.0042, -5.9264, -3.0999, -3.7139, -0.8153, -2.4459]], [[ -3.1981, -7.0495, -6.5165, -7.1564, -4.2580, -6.3530, -5.9506, -4.8166, -4.1683, -3.7185, -4.1315, -2.3707, -3.2598, -1.7839, -0.8480, -1.0348]], [[ -0.9032, -4.5047, -6.1904, -6.6551, -5.1287, -6.4146, -5.7333, -2.9082, -2.7592, -3.7210, -4.0145, -4.8196, -2.0792, -2.5237, -0.3304, -2.8801]], [[ -4.0723, -6.9553, -7.8325, -7.9836, -7.7659, -7.9696, -6.6903, -4.0217, -3.7478, -4.1273, -4.2751, -4.6919, -2.9806, -3.3513, -1.7035, -3.4473]], [[ -0.4001, -3.4915, -3.3429, -4.4642, -3.6946, -4.4672, -4.0190, -2.1406, -2.2823, -2.2352, -3.4920, -3.2848, -2.4170, -3.3749, -2.1282, -2.7019]], [[ -1.1031, -3.8885, -2.7164, -2.7614, -2.7715, -1.9193, -1.9946, -1.9947, -1.8815, -1.2382, -1.5946, -1.8257, -1.5158, -1.6086, -1.2262, -0.6568]], [[ -3.0211, -6.8815, -7.8356, -6.4653, -6.1486, -6.8547, -5.6045, -4.1155, -4.4207, -4.4530, -3.2662, -2.3691, -1.7528, -0.1330, -0.4597, -1.3171]], [[ -3.8534, -7.9673, -7.3294, -7.9515, -7.9259, -5.6790, -5.9960, -6.1431, -6.0333, -4.1618, -4.6414, -3.7422, -4.1635, -3.0377, -2.7469, -2.2429]], [[ -2.0557, -3.8733, -3.7049, -3.5654, -3.7092, -2.7508, -2.6309, -3.0505, -2.9049, -2.5349, -2.5305, -2.1716, -2.2637, -2.1362, -1.8138, -1.1375]], [[ -0.5862, -5.0040, -4.8698, -4.8584, -4.7096, -4.0735, -4.0820, -4.0183, -3.9033, -3.5190, -3.6442, -3.3364, -3.3304, -3.1378, -2.9377, -2.4160]]], [[[ -2.0768, -4.8067, -5.1425, -6.7157, -5.8986, -4.2793, -4.6191, -3.2042, -3.8218, -3.1105, -2.7079, -1.7951, -2.9815, -1.9298, -1.0692, -2.9599]], [[ 1.4649, -1.5501, -2.0294, -1.9281, -2.8296, -1.3671, -1.4883, -1.8166, -2.3290, -3.0318, -3.1416, -2.6504, -2.5581, -2.4078, -1.7752, -3.1135]], [[ -7.4092, -15.4049, -14.5768, -14.6953, -17.1245, -12.4543, -11.2696, -10.0319, -8.9304, -6.9857, -7.4335, -6.6458, -5.0807, -3.3193, -2.2004, -5.4211]], [[ -3.0278, -7.3692, -6.9338, -8.6552, -7.6392, -6.6724, -5.9284, -4.9634, -3.5512, -3.5996, -4.4678, -3.8499, -2.8020, -1.3401, -2.7440, -2.1725]], [[ -2.3107, -6.1998, -6.7987, -6.7302, -8.0924, -7.5858, -5.3359, -3.9285, -5.3066, -3.4185, -2.8805, -2.6025, -3.8430, -2.2832, -2.9417, -3.0916]], [[ -4.2675, -7.1253, -8.6915, -8.0347, -10.3168, -6.7994, -6.9470, -4.0488, -4.7352, -4.5234, -5.0843, -3.9327, -4.4369, -4.0303, -3.4592, -4.2083]], [[ -0.4933, -3.6118, -3.0458, -3.7415, -3.6976, -4.2915, -4.1023, -2.0883, -2.0232, -1.7435, -3.0746, -3.1787, -2.7792, -3.2188, -2.1252, -2.2119]], [[ -1.2418, -4.1206, -2.8650, -2.6464, -2.6874, -1.7679, -1.9250, -2.0111, -1.5905, -1.2002, -1.8674, -1.9439, -1.2911, -1.4935, -1.6877, -1.2623]], [[ -3.7448, -7.9932, -9.2209, -6.2839, -9.9173, -7.2120, -5.8483, -5.0894, -4.8380, -5.4019, -4.6625, -4.2518, -1.5189, -3.5924, -2.4736, -4.6238]], [[ -4.1633, -8.5545, -7.9265, -9.2907, -10.3588, -5.3890, -5.5218, -6.0761, -5.6318, -3.9998, -4.4278, -4.7734, -3.2446, -2.4822, -3.8939, -4.3646]], [[ -1.6467, -3.9263, -3.5911, -3.2506, -3.5047, -2.5767, -2.4634, -3.1605, -2.3987, -2.4073, -2.5658, -2.3882, -1.8284, -1.8410, -2.3426, -1.9976]], [[ -0.6130, -5.2038, -5.0182, -4.6479, -4.8458, -4.0680, -3.9590, -4.1120, -3.7258, -3.5077, -3.6715, -3.6909, -3.1178, -2.9306, -3.3210, -2.9871]]], [[[ -1.8409, -5.1244, -4.7973, -5.5664, -5.0610, -4.7667, -4.6426, -4.1589, -3.8167, -3.2591, -3.6831, -2.8482, -2.4221, -2.4252, -1.0908, -2.2957]], [[ 1.9968, -0.3758, -1.5791, -1.5495, -2.1312, -1.1917, -2.5354, -1.3204, -2.9980, -2.2504, -4.2626, -1.3488, -2.9998, -2.0499, -1.8421, -2.9695]], [[ -8.1052, -16.4133, -17.4318, -17.6635, -13.5316, -13.3665, -12.0412, -11.3750, -9.0292, -8.0885, -7.8681, -7.3681, -5.8165, -6.2587, -3.8463, -5.1992]], [[ -3.3025, -8.2106, -8.2240, -9.2188, -5.7564, -7.0268, -6.3914, -5.7025, -3.3136, -3.9552, -4.7015, -3.5569, -1.7503, -3.9323, -1.9462, -2.4868]], [[ -2.1378, -6.5196, -6.6063, -7.1184, -6.3239, -6.3161, -8.0681, -4.5724, -4.3528, -5.4010, -6.6368, -3.4821, -1.4546, -2.6793, -2.8529, -3.8245]], [[ -4.2836, -8.4159, -9.9430, -9.2487, -8.7804, -8.4632, -8.1287, -5.1058, -6.2109, -6.6786, -5.5289, -3.1191, -3.1333, -2.9937, -3.4762, -3.2463]], [[ -1.1891, -4.4251, -4.5418, -4.4628, -4.2607, -4.2997, -4.3503, -2.9827, -3.1575, -3.9670, -3.5332, -0.9337, -1.4374, -2.3522, -2.7641, -2.7503]], [[ -1.2492, -4.4228, -3.1891, -2.9877, -2.9593, -2.2247, -2.3390, -2.2079, -2.0580, -1.8938, -1.3367, -1.0640, -0.8969, -1.0768, -1.5173, -0.6569]], [[ -4.3326, -8.1606, -10.4822, -7.6263, -7.0593, -7.9311, -6.9235, -5.6192, -5.0372, -5.8720, -5.2246, -4.0587, -4.7785, -2.5571, -2.7719, -4.5182]], [[ -4.8859, -9.8445, -9.6795, -10.9616, -9.2061, -6.8304, -6.5091, -7.3739, -6.7296, -4.8074, -4.3966, -4.0722, -3.0393, -4.9330, -3.6911, -3.1937]], [[ -2.2943, -4.1315, -3.8236, -3.6149, -3.7498, -3.1446, -2.9450, -3.4000, -3.1113, -2.6108, -2.3419, -2.0956, -1.7507, -1.9181, -1.9200, -1.5411]], [[ -0.7173, -5.5596, -5.3244, -5.2178, -5.0318, -4.6102, -4.4951, -4.4982, -4.3234, -4.0727, -3.7530, -3.3094, -2.9999, -3.1172, -3.0453, -2.6766]]], [[[ -1.2634, -4.1436, -3.4699, -4.2816, -3.8572, -4.8911, -4.2049, -3.1388, -2.8391, -2.9733, -2.8580, -3.1881, -2.3288, -2.2389, -1.9285, -0.3221]], [[ 1.6131, -1.0885, 0.0619, 0.2800, -1.7644, -1.9365, -2.2616, -1.4977, -0.7713, -2.2969, -2.0165, -4.2537, -1.2432, -1.9829, -1.8927, -1.0659]], [[ -6.4704, -13.1539, -13.2013, -13.4449, -13.0064, -11.9752, -11.8912, -10.1688, -10.0492, -9.2982, -8.8662, -7.7199, -4.5201, -4.3544, -3.4442, -6.0484]], [[ -2.6861, -5.6233, -6.0676, -6.5071, -4.7900, -6.2178, -6.1075, -4.2925, -4.9532, -3.4135, -4.5953, -4.6378, -2.8432, -1.7286, -1.3363, -2.1793]], [[ -0.2979, -4.5108, -6.4537, -6.2639, -5.4056, -5.8620, -8.6230, -3.1494, -5.9740, -3.9812, -5.5594, -6.8564, -0.7593, -2.5420, -2.3092, -2.4496]], [[ -3.2661, -6.5363, -8.2713, -7.5412, -7.4208, -8.4090, -7.1453, -4.4253, -6.3297, -5.2385, -5.2999, -4.5343, -1.8415, -2.4486, -1.9855, -4.0926]], [[ -2.5246, -5.6361, -3.8998, -4.0002, -4.1326, -4.3600, -3.5644, -4.7289, -3.3526, -3.2423, -3.4312, -2.9030, -1.1946, -0.5844, -0.3518, -1.3222]], [[ -1.1551, -3.6403, -2.5080, -2.4282, -2.4103, -1.5823, -1.6671, -1.7663, -2.0231, -1.7878, -0.9137, -0.6040, -1.1249, -1.0342, -0.6648, -0.5965]], [[ -1.8202, -5.0756, -6.7770, -5.1869, -5.7796, -6.4047, -5.8070, -4.0950, -3.8565, -4.4300, -5.5218, -4.5424, -1.7577, -1.7381, -1.4623, -1.8799]], [[ -2.9478, -7.5618, -7.7443, -7.8843, -7.7245, -6.2752, -5.9634, -6.7579, -5.5311, -5.7588, -4.1932, -4.0088, -2.8652, -2.6176, -2.3043, -3.1526]], [[ -1.2003, -3.2570, -3.1849, -3.0499, -3.2717, -2.4780, -2.1531, -2.7642, -2.6656, -2.6733, -1.8393, -1.5583, -1.8418, -1.9532, -1.4779, -1.3220]], [[ -0.6436, -5.5049, -5.2728, -5.0333, -5.0484, -4.2609, -4.1927, -4.4134, -4.3451, -4.2137, -3.5148, -3.3708, -3.2911, -3.2112, -2.8628, -2.9091]]]]) attn_weights tensor([[[[ 5.1121e+00, -6.4348e-01, -2.5379e+00, -2.3270e+00, -1.3091e-03, -3.0981e+00, -5.2409e+00, -1.0744e+00, -2.1873e+00, -2.5249e+00, -2.7104e+00, -4.9417e-01, -3.3794e+00, -3.3418e+00, -3.2778e+00, 2.9567e+00]], [[-2.8711e+00, -6.5085e+00, -5.9097e+00, -6.8609e+00, -6.6542e+00, -7.6443e+00, -8.7929e+00, -3.9555e+00, -4.2156e+00, -4.8709e+00, -5.9436e+00, -5.0278e+00, -6.2741e+00, -5.2145e+00, -4.6142e+00, -4.0810e+00]], [[-4.1993e+00, -1.2499e+01, -1.5008e+01, -1.2923e+01, -1.1332e+01, -1.2648e+01, -1.2364e+01, -1.0833e+01, -1.1337e+01, -8.9372e+00, -7.2702e+00, -5.4849e+00, -5.8240e+00, -7.3446e+00, -4.1025e+00, -4.6833e+00]], [[-5.4004e+00, -1.5558e+01, -1.8488e+01, -1.6530e+01, -1.5382e+01, -1.4007e+01, -1.4133e+01, -1.2187e+01, -1.4177e+01, -1.2519e+01, -9.7682e+00, -8.8234e+00, -7.3366e+00, -7.9337e+00, -4.9148e+00, -9.2164e+00]], [[ 1.2836e+00, -2.8601e+00, -2.2590e+00, -4.0505e+00, -3.5756e+00, -2.8550e+00, -2.8812e+00, -3.0583e+00, -2.5766e+00, -4.5178e+00, -4.1374e+00, -3.2672e+00, -4.1563e+00, -3.5734e+00, -3.6198e+00, -5.4119e+00]], [[-3.6681e-01, -2.0586e+00, -1.7661e+00, -2.3161e+00, -2.4024e+00, -2.9077e+00, -3.5361e+00, -3.0648e+00, -2.2016e+00, -2.6749e+00, -2.4870e+00, -2.3443e+00, -1.9556e+00, -3.2840e+00, -2.5831e+00, -2.1226e+00]], [[-3.5103e+00, -9.8550e+00, -7.4025e+00, -9.2743e+00, -9.4301e+00, -7.9389e+00, -8.8375e+00, -8.0190e+00, -5.2818e+00, -6.9061e+00, -6.3027e+00, -5.5109e+00, -5.3066e+00, -5.3136e+00, -4.6810e+00, -4.7903e+00]], [[-5.9526e+00, -1.4128e+01, -1.7072e+01, -1.5561e+01, -1.4824e+01, -1.1515e+01, -1.0910e+01, -1.0877e+01, -1.3445e+01, -1.1513e+01, -8.7246e+00, -8.4197e+00, -8.0080e+00, -5.5250e+00, -5.9399e+00, -6.7830e+00]], [[-4.2581e+00, -1.1384e+01, -1.4000e+01, -1.2095e+01, -1.3918e+01, -1.1493e+01, -1.0160e+01, -8.5218e+00, -1.0460e+01, -8.4632e+00, -7.4836e+00, -8.0458e+00, -7.5679e+00, -5.9105e+00, -2.6942e+00, -5.5007e+00]], [[-2.4156e+00, -6.9598e+00, -6.7498e+00, -5.1919e+00, -5.6309e+00, -7.6619e+00, -6.4008e+00, -5.2927e+00, -4.9429e+00, -3.6268e+00, -3.6087e+00, -4.1366e+00, -3.7802e+00, -6.1078e+00, -3.5935e+00, -4.0722e+00]], [[-1.1706e+00, -7.0802e+00, -6.0502e+00, -7.2340e+00, -6.5959e+00, -5.6680e+00, -5.8202e+00, -5.4730e+00, -4.9470e+00, -6.0506e+00, -4.8436e+00, -4.5531e+00, -3.8645e+00, -3.8317e+00, -3.8595e+00, -3.1909e+00]], [[-2.9872e+00, -7.4126e+00, -9.3001e+00, -8.6489e+00, -6.9033e+00, -6.5167e+00, -6.4779e+00, -5.9175e+00, -7.2616e+00, -6.5100e+00, -4.7432e+00, -4.5160e+00, -3.3760e+00, -4.8233e+00, -2.4945e+00, -3.8931e+00]]], [[[ 5.7028e+00, 1.8309e-01, -3.1844e+00, -1.1151e+00, 1.4255e-01, 4.8996e-01, 1.5801e-01, -5.2967e-01, -3.7537e-01, -3.7469e+00, -2.2560e+00, -3.6892e+00, -5.4592e-01, -1.4751e+00, -1.7866e+00, 3.8612e+00]], [[-2.4176e+00, -6.4184e+00, -5.1591e+00, -6.6560e+00, -6.5324e+00, -6.8697e+00, -6.5274e+00, -3.8862e+00, -3.2190e+00, -3.1163e+00, -4.6244e+00, -4.2219e+00, -4.1193e+00, -4.6019e+00, -3.7476e+00, -5.7631e+00]], [[-3.3160e+00, -1.0661e+01, -1.0481e+01, -1.0454e+01, -7.9800e+00, -9.9184e+00, -1.0278e+01, -9.1339e+00, -8.3787e+00, -7.1525e+00, -6.6812e+00, -6.3952e+00, -4.0005e+00, -2.6254e+00, -2.0864e+00, -3.4621e+00]], [[-3.7608e+00, -1.2385e+01, -1.5848e+01, -1.3982e+01, -1.4476e+01, -1.1590e+01, -1.4561e+01, -1.0335e+01, -1.0834e+01, -1.2452e+01, -9.9968e+00, -8.8308e+00, -7.0818e+00, -7.6091e+00, -5.7771e+00, -6.2470e+00]], [[ 1.4707e+00, -3.5452e+00, -3.6160e+00, -4.0804e+00, -2.1837e+00, -2.7537e+00, -1.8496e+00, -3.5252e+00, -2.8986e+00, -3.9872e+00, -4.4610e+00, -3.8321e+00, -2.9394e+00, -3.6713e+00, -3.4983e+00, -3.4380e+00]], [[ 1.8634e-01, -2.8596e+00, -4.4194e+00, -3.4921e+00, -2.8883e+00, -1.2073e+00, -1.4174e+00, -3.1275e+00, -2.9335e+00, -4.2972e+00, -3.6431e+00, -3.3084e+00, -3.0094e+00, -2.6290e+00, -2.0847e+00, -2.1399e+00]], [[-2.9781e+00, -8.1504e+00, -5.8360e+00, -7.1047e+00, -8.1740e+00, -6.2184e+00, -7.3387e+00, -6.3321e+00, -5.0658e+00, -3.4077e+00, -4.6889e+00, -5.0974e+00, -3.2476e+00, -3.3861e+00, -3.7506e+00, -3.6104e+00]], [[-4.8928e+00, -1.1843e+01, -1.2104e+01, -1.2650e+01, -1.2257e+01, -9.6221e+00, -1.0506e+01, -9.3837e+00, -9.4933e+00, -8.3161e+00, -8.6784e+00, -6.9069e+00, -6.9312e+00, -6.2326e+00, -6.2480e+00, -5.6298e+00]], [[-3.4495e+00, -1.0247e+01, -1.0190e+01, -1.0317e+01, -1.0797e+01, -9.6368e+00, -9.2689e+00, -6.8555e+00, -6.5297e+00, -6.3638e+00, -6.3087e+00, -4.6831e+00, -2.9748e+00, -3.8944e+00, -3.4787e+00, -4.8474e+00]], [[-1.3112e+00, -6.1206e+00, -6.5526e+00, -6.2468e+00, -5.8803e+00, -5.9403e+00, -6.3801e+00, -4.8321e+00, -4.7664e+00, -4.9622e+00, -4.5289e+00, -3.2973e+00, -2.6362e+00, -1.5186e+00, -4.6915e+00, -3.4670e+00]], [[-7.4329e-01, -6.2510e+00, -6.8731e+00, -7.9594e+00, -5.8236e+00, -4.0155e+00, -4.1381e+00, -4.6619e+00, -4.7666e+00, -6.0332e+00, -6.7943e+00, -4.5316e+00, -4.4565e+00, -4.8571e+00, -4.0813e+00, -1.3106e+00]], [[-1.8464e+00, -7.0012e+00, -7.7070e+00, -7.5214e+00, -6.2313e+00, -6.9005e+00, -6.1925e+00, -5.3952e+00, -5.5199e+00, -5.8472e+00, -5.5951e+00, -3.6371e+00, -3.2884e+00, -3.0686e+00, -1.4703e+00, -2.1320e+00]]], [[[ 4.7438e+00, -1.6525e+00, -3.8726e+00, -2.2289e+00, 1.1967e+00, -3.4375e+00, -3.8302e+00, -2.1791e+00, -3.4593e+00, -4.0241e+00, -4.0837e+00, -4.6703e+00, -5.4028e+00, -3.5415e+00, -3.3902e+00, 7.5500e-01]], [[-3.0053e+00, -6.5243e+00, -6.4740e+00, -7.5009e+00, -7.8473e+00, -7.9450e+00, -7.8302e+00, -4.3423e+00, -3.8960e+00, -4.0870e+00, -5.4378e+00, -4.8595e+00, -5.3908e+00, -5.4907e+00, -5.5787e+00, -4.7800e+00]], [[-5.1042e+00, -1.0962e+01, -1.0463e+01, -9.4705e+00, -1.1886e+01, -1.0120e+01, -9.7376e+00, -8.9732e+00, -6.8995e+00, -6.0994e+00, -5.1649e+00, -4.7284e+00, -4.3888e+00, -3.5334e+00, -2.6647e+00, -4.3244e+00]], [[-6.5154e+00, -1.3474e+01, -1.6575e+01, -1.4520e+01, -1.5778e+01, -1.1349e+01, -1.0711e+01, -1.0790e+01, -1.2537e+01, -1.1708e+01, -9.3038e+00, -9.3863e+00, -7.7734e+00, -5.2396e+00, -7.2644e+00, -7.9203e+00]], [[ 1.4209e+00, -3.6619e+00, -4.2380e+00, -4.2954e+00, -3.1003e+00, -2.6609e+00, -3.4227e+00, -3.5679e+00, -4.4045e+00, -4.3255e+00, -5.5995e+00, -4.7532e+00, -4.4831e+00, -4.9059e+00, -4.7812e+00, -3.5802e+00]], [[-1.5863e-02, -3.0099e+00, -4.0354e+00, -3.8653e+00, -3.6621e+00, -2.7128e+00, -2.6479e+00, -3.5569e+00, -4.5922e+00, -3.7576e+00, -3.6895e+00, -4.1531e+00, -3.1137e+00, -3.2821e+00, -3.0777e+00, -3.1724e+00]], [[-4.1226e+00, -9.1180e+00, -6.5545e+00, -8.4905e+00, -9.2487e+00, -5.5365e+00, -6.3087e+00, -6.0169e+00, -5.0758e+00, -2.8235e+00, -4.9549e+00, -4.9190e+00, -3.8771e+00, -3.4796e+00, -3.9848e+00, -4.2081e+00]], [[-6.7803e+00, -1.3113e+01, -1.3149e+01, -1.2780e+01, -1.4949e+01, -8.2462e+00, -8.9891e+00, -9.4420e+00, -1.0585e+01, -7.9670e+00, -7.6362e+00, -7.7405e+00, -5.7932e+00, -5.8143e+00, -5.3565e+00, -6.5676e+00]], [[-4.6852e+00, -9.8058e+00, -1.1022e+01, -1.0237e+01, -1.2509e+01, -8.9627e+00, -9.2584e+00, -7.2459e+00, -8.4633e+00, -7.0256e+00, -6.4988e+00, -6.6628e+00, -4.6309e+00, -4.8531e+00, -3.9004e+00, -6.7604e+00]], [[-2.5039e+00, -7.2000e+00, -6.5856e+00, -6.2419e+00, -6.9409e+00, -6.3658e+00, -4.5102e+00, -5.0217e+00, -7.5135e+00, -4.4878e+00, -3.6240e+00, -4.9512e+00, -1.5615e+00, -3.6756e+00, -3.5746e+00, -4.7078e+00]], [[-1.0804e+00, -7.0817e+00, -6.6549e+00, -8.1848e+00, -5.9470e+00, -5.2460e+00, -5.6309e+00, -5.4736e+00, -5.9740e+00, -5.6098e+00, -6.6694e+00, -4.8775e+00, -4.9921e+00, -2.9813e+00, -3.4896e+00, -2.4389e+00]], [[-3.0908e+00, -7.4139e+00, -8.8048e+00, -8.3203e+00, -9.2183e+00, -6.7009e+00, -6.4509e+00, -5.1640e+00, -6.6422e+00, -5.8311e+00, -3.8656e+00, -3.0230e+00, -3.6438e+00, -1.3812e+00, -3.9813e+00, -4.5875e+00]]], [[[ 4.2787e+00, -5.6667e-01, 1.5696e+00, -1.6824e+00, -3.0992e-01, -2.8059e+00, -2.4494e+00, -3.8243e-01, -1.3418e+00, -3.8315e+00, -2.9531e+00, -3.1492e+00, -1.2926e+00, -3.3397e+00, -2.2671e+00, 1.5399e+00]], [[-2.9368e+00, -8.2980e+00, -8.2531e+00, -9.5728e+00, -8.8739e+00, -7.2897e+00, -8.1594e+00, -5.6519e+00, -6.5345e+00, -7.2500e+00, -6.7497e+00, -4.8402e+00, -3.1907e+00, -5.3937e+00, -4.6759e+00, -4.5641e+00]], [[-4.4240e+00, -1.2426e+01, -1.5124e+01, -1.2724e+01, -1.0499e+01, -1.1298e+01, -1.2464e+01, -1.0323e+01, -9.7881e+00, -9.7202e+00, -9.6916e+00, -9.4490e+00, -7.7572e+00, -5.8496e+00, -4.4122e+00, -4.5550e+00]], [[-5.8956e+00, -1.5783e+01, -1.9279e+01, -1.6089e+01, -1.5505e+01, -1.3518e+01, -1.5014e+01, -1.2811e+01, -1.3444e+01, -1.1562e+01, -1.1468e+01, -9.2495e+00, -9.4461e+00, -8.1247e+00, -7.7528e+00, -8.7576e+00]], [[ 9.2289e-01, -3.7434e+00, -3.8234e+00, -4.3002e+00, -3.6828e+00, -3.9332e+00, -3.6628e+00, -3.8394e+00, -3.1510e+00, -4.5619e+00, -3.5713e+00, -4.1098e+00, -3.0680e+00, -3.6993e+00, -4.1930e+00, -3.7409e+00]], [[ 1.1225e-01, -3.4661e+00, -2.9091e+00, -2.7027e+00, -2.6716e+00, -2.3810e+00, -3.4761e+00, -4.0558e+00, -3.0267e+00, -3.7527e+00, -3.4976e+00, -4.4516e+00, -2.3436e+00, -2.4307e+00, -2.0030e+00, -2.9770e+00]], [[-3.3809e+00, -9.4628e+00, -8.6052e+00, -1.0283e+01, -9.1397e+00, -6.4414e+00, -9.3695e+00, -7.4932e+00, -7.6537e+00, -6.2998e+00, -7.0045e+00, -6.0609e+00, -3.9804e+00, -5.2092e+00, -2.3511e+00, -2.6422e+00]], [[-5.9481e+00, -1.3898e+01, -1.4005e+01, -1.3443e+01, -1.2556e+01, -1.0941e+01, -1.4415e+01, -1.1063e+01, -1.1325e+01, -9.4289e+00, -1.1192e+01, -8.1902e+00, -7.0752e+00, -6.6913e+00, -6.2594e+00, -6.3858e+00]], [[-4.6456e+00, -1.1282e+01, -1.2367e+01, -1.1079e+01, -1.2425e+01, -1.2028e+01, -9.9558e+00, -8.6596e+00, -1.1222e+01, -7.9024e+00, -7.8257e+00, -6.3309e+00, -6.9166e+00, -4.4656e+00, -4.2775e+00, -5.3398e+00]], [[-2.4334e+00, -7.9178e+00, -8.5257e+00, -6.2131e+00, -6.5787e+00, -6.1163e+00, -5.6165e+00, -6.3290e+00, -5.4982e+00, -5.8205e+00, -4.6964e+00, -5.0928e+00, -3.4304e+00, -2.1873e+00, -2.9950e+00, -2.8605e+00]], [[-1.2033e+00, -5.0999e+00, -5.6202e+00, -5.2755e+00, -4.8015e+00, -4.5142e+00, -5.7101e+00, -4.9912e+00, -4.9675e+00, -4.9615e+00, -5.1756e+00, -4.8892e+00, -3.8228e+00, -3.7895e+00, -3.6361e+00, -2.0114e+00]], [[-2.6694e+00, -8.3654e+00, -9.4405e+00, -9.6609e+00, -7.1213e+00, -7.7851e+00, -7.5997e+00, -6.4364e+00, -5.9726e+00, -5.1432e+00, -5.9121e+00, -4.7355e+00, -4.0393e+00, -4.9833e+00, -2.6470e+00, -3.3222e+00]]], [[[ 4.6845e+00, -1.2861e-01, -3.4404e-01, -2.3274e+00, -1.4883e+00, -2.4778e+00, -5.1791e+00, -3.3758e-01, -6.1897e-01, -4.5080e-01, -1.7040e+00, -6.2036e+00, -3.3375e-01, 1.9280e-01, 1.5699e-01, 7.9465e-01]], [[-2.4727e+00, -6.3393e+00, -5.8722e+00, -6.7212e+00, -8.3296e+00, -8.7698e+00, -7.9347e+00, -5.7554e+00, -6.2925e+00, -7.3614e+00, -7.8385e+00, -7.3227e+00, -3.5900e+00, -3.1418e+00, -2.7905e+00, -4.8979e+00]], [[-4.4892e+00, -8.9010e+00, -1.0043e+01, -8.6455e+00, -8.0895e+00, -9.7592e+00, -1.0365e+01, -7.3213e+00, -8.5752e+00, -6.3172e+00, -8.7888e+00, -8.4145e+00, -4.9002e+00, -3.9223e+00, -3.5684e+00, -6.0077e+00]], [[-4.5239e+00, -1.1266e+01, -1.2763e+01, -1.2858e+01, -1.3329e+01, -1.2001e+01, -1.2413e+01, -9.8218e+00, -1.1578e+01, -1.1187e+01, -1.1519e+01, -1.0333e+01, -5.6356e+00, -5.2737e+00, -5.2238e+00, -8.0913e+00]], [[ 1.0704e+00, -2.6219e+00, -4.2547e+00, -4.2045e+00, -3.6929e+00, -3.7119e+00, -3.8821e+00, -2.4873e+00, -3.4113e+00, -4.0913e+00, -3.8659e+00, -5.0636e+00, -2.5269e+00, -2.2043e+00, -1.7968e+00, -2.7959e+00]], [[-5.9067e-02, -2.7857e+00, -2.7766e+00, -2.1556e+00, -2.3418e+00, -2.8744e+00, -2.8795e+00, -3.1425e+00, -2.8544e+00, -2.7230e+00, -3.2690e+00, -4.4330e+00, -3.0421e+00, -2.4370e+00, -2.5974e+00, -3.1383e+00]], [[-3.1741e+00, -8.5130e+00, -6.7143e+00, -7.9030e+00, -7.2867e+00, -7.2213e+00, -7.1879e+00, -7.2552e+00, -6.2951e+00, -6.0127e+00, -6.1947e+00, -6.1358e+00, -4.8734e+00, -3.9635e+00, -3.6712e+00, -4.2334e+00]], [[-5.7215e+00, -1.2341e+01, -1.2645e+01, -1.2181e+01, -1.2403e+01, -1.0487e+01, -9.4637e+00, -9.9259e+00, -1.0387e+01, -1.0114e+01, -8.2343e+00, -7.5078e+00, -6.3586e+00, -6.5346e+00, -6.1774e+00, -7.0832e+00]], [[-3.6297e+00, -8.3856e+00, -9.8345e+00, -9.8047e+00, -1.1169e+01, -1.1339e+01, -9.7969e+00, -7.2115e+00, -1.0315e+01, -1.0201e+01, -9.7416e+00, -8.1917e+00, -4.0993e+00, -4.1924e+00, -3.9357e+00, -4.9368e+00]], [[-1.4789e+00, -6.2658e+00, -7.3444e+00, -5.8436e+00, -6.6588e+00, -5.1329e+00, -5.7990e+00, -6.7011e+00, -7.8366e+00, -7.3573e+00, -7.0650e+00, -6.0818e+00, -3.5972e+00, -3.3717e+00, -3.4087e+00, -2.8131e+00]], [[-8.6095e-01, -6.2331e+00, -5.0286e+00, -5.3239e+00, -4.8210e+00, -5.0836e+00, -5.3404e+00, -4.8563e+00, -4.8852e+00, -4.5559e+00, -4.9841e+00, -4.5113e+00, -3.8723e+00, -3.4106e+00, -3.1851e+00, -3.3367e+00]], [[-2.1859e+00, -7.4938e+00, -8.5597e+00, -7.6985e+00, -6.5153e+00, -5.1588e+00, -6.5798e+00, -7.2144e+00, -4.6929e+00, -6.0996e+00, -6.2357e+00, -7.1290e+00, -4.7855e+00, -3.0713e+00, -3.0604e+00, -3.6617e+00]]]]) attn_weights tensor([[[[ -2.9953, -9.6649, -10.7845, -10.7369, -10.7823, -9.8300, -9.7153, -9.0306, -9.4323, -9.0930, -8.4495, -6.1269, -6.6369, -5.1611, -1.8014, -4.3607]], [[ -2.8780, -7.1874, -7.3088, -7.7668, -6.6418, -5.0150, -6.9889, -4.8600, -4.8959, -5.7322, -5.2086, -4.8262, -3.8817, -2.6621, -4.7266, -5.6788]], [[ -0.2965, -2.4296, -3.5876, -3.3977, -4.5004, -3.9785, -3.9512, -2.7166, -3.6617, -3.5667, -2.9337, -4.5739, -3.8905, -3.9732, -3.8463, -3.2615]], [[ -1.9960, -8.2356, -9.4229, -7.8565, -8.7480, -7.2923, -6.4848, -6.6533, -7.4857, -6.3135, -4.9452, -5.2332, -4.9988, -4.4041, -4.0234, -3.9274]], [[ 1.5087, -1.4914, -1.5407, -1.6840, -2.5360, -2.3275, -3.8250, -2.8765, -2.3222, -2.6593, -3.5165, -3.5746, -4.2733, -2.7362, -0.9180, -2.1333]], [[ -2.3476, -8.0781, -9.5732, -9.8545, -9.3534, -9.9687, -10.0806, -6.5770, -7.6932, -7.8512, -7.8206, -5.5545, -6.0671, -7.1392, -4.2695, -4.1117]], [[ -2.0376, -5.9309, -5.1362, -4.9802, -5.2161, -4.8084, -5.7208, -5.5230, -4.5821, -4.0449, -3.9694, -4.0252, -3.6918, -3.2407, -3.8885, -6.9272]], [[ 0.3497, -5.8068, -4.6544, -5.6980, -5.3587, -4.1319, -4.6080, -3.1110, -4.3843, -5.2092, -4.2018, -3.1944, -3.3382, -2.5321, -1.1976, 0.1606]], [[ 1.9224, -1.8659, -2.5496, -0.9200, -2.2797, -2.9277, -3.1641, -2.9938, -2.8211, -1.8359, -2.9183, -1.8157, -2.3544, -3.2491, -1.5928, -1.8454]], [[ -1.4214, -4.4762, -4.7835, -3.8354, -3.2570, -3.6839, -3.7354, -4.3657, -3.5179, -2.9595, -0.9402, -2.3020, -1.9024, -3.6221, -2.6807, -2.9915]], [[ 1.3558, -1.9057, -2.3264, -3.1228, -2.8904, -3.6682, -2.5581, -2.7115, -2.3230, -3.7418, -3.5187, -2.9899, -3.7068, -3.9516, -2.0778, -2.7902]], [[ -5.6194, -31.9276, -36.8783, -37.1563, -37.3178, -26.6258, -29.5670, -27.9187, -31.6844, -28.4674, -20.5204, -20.4678, -20.5766, -13.2641, 7.9420, 1.7594]]], [[[ -1.6979, -10.2058, -9.9369, -8.3215, -6.1882, -8.0284, -7.1118, -7.9667, -7.2605, -7.6976, -6.1087, -6.8478, -5.3193, -2.7269, -3.8060, -3.1614]], [[ -1.9128, -7.3971, -6.9310, -6.7820, -6.8248, -5.4979, -6.1791, -4.9113, -4.2088, -4.9226, -4.4961, -3.1642, -4.1383, -2.6159, -3.2173, -3.4450]], [[ 0.3054, -2.7466, -3.2862, -3.9706, -4.0961, -4.2545, -3.7956, -2.8350, -3.1178, -3.2265, -3.8068, -2.5414, -2.4692, -2.9373, -2.8618, -3.5789]], [[ -1.8089, -6.1956, -4.7668, -5.2834, -6.1467, -3.5085, -4.2611, -5.3162, -5.0911, -3.3234, -3.9378, -5.0691, -4.9630, -4.6423, -5.3795, -3.1290]], [[ 1.7650, -3.4231, -3.8009, -2.7859, -2.3067, -1.0972, -1.9573, -1.7142, -2.9876, -3.6121, -2.8462, -3.4147, -2.4454, -1.0581, -0.7741, -1.6270]], [[ -1.7116, -7.8580, -9.1867, -9.8734, -7.4428, -6.7700, -7.9665, -5.7593, -5.4244, -6.8504, -7.5171, -5.5381, -4.9055, -5.3203, 0.5142, -3.9208]], [[ -1.6798, -5.8768, -6.1173, -6.3233, -5.6579, -5.1407, -4.8719, -4.8113, -4.8767, -5.0518, -4.9890, -4.3667, -4.1021, -4.4982, -3.7371, -3.6233]], [[ 0.2847, -4.8223, -4.6869, -4.9919, -2.2498, -1.8355, -2.7577, -3.9072, -3.6981, -4.1513, -4.2305, -1.8448, -0.7157, -0.9159, 0.4831, 1.7154]], [[ 2.1477, -4.8056, -4.8074, -4.6394, -3.2844, -1.9377, -2.1430, -2.5248, -2.5744, -4.5441, -4.9573, -3.1712, -3.0695, -3.0387, -1.5010, -1.8352]], [[ -0.8527, -5.8686, -4.9570, -5.4729, -5.1832, -4.4810, -4.0669, -3.9039, -4.2567, -3.3111, -3.9423, -2.4474, -1.8112, -1.3931, -1.4290, -3.0138]], [[ 1.5914, -4.2591, -4.3485, -5.4613, -4.1642, -4.0618, -2.5616, -2.9296, -3.6749, -4.0541, -5.4877, -4.4189, -3.6381, -3.9513, -3.3642, -3.7204]], [[ -6.2501, -21.5659, -27.4869, -23.7344, -20.2478, -22.2595, -32.9220, -23.1199, -20.7690, -17.4755, -11.6366, -8.1331, -6.3115, -2.0389, 7.6304, -8.1002]]], [[[ -4.2420, -11.1270, -10.0131, -8.3253, -9.6390, -7.0846, -7.3970, -6.6215, -9.0614, -7.0472, -4.8738, -5.0008, -2.4552, -5.9768, -5.4829, -7.4979]], [[ -3.2743, -8.0593, -8.3544, -8.1687, -10.0654, -4.0102, -5.4389, -4.2827, -6.3467, -4.2829, -3.9326, -3.2063, -5.1897, -3.4629, -4.0159, -4.6030]], [[ 0.1147, -3.2942, -4.4841, -4.5802, -5.3855, -5.8414, -3.9863, -3.6709, -3.5531, -4.4675, -4.2021, -3.6590, -3.4508, -4.3031, -5.1753, -4.9374]], [[ -2.7493, -6.7593, -5.8608, -4.7938, -6.8281, -3.9994, -3.7334, -5.2358, -5.6372, -3.2902, -2.5672, -3.3309, -3.0034, -4.0721, -4.0419, -4.8677]], [[ 1.4232, -4.1341, -2.3955, -3.5878, -1.9972, -3.5480, -4.3469, -3.0022, -3.9576, -2.1983, -3.6906, -2.8925, -3.2547, -2.4690, -1.9863, -1.7750]], [[ -2.3698, -7.7039, -8.4943, -7.5863, -9.0021, -6.9436, -7.0161, -5.8565, -7.1820, -5.6477, -5.3254, -5.9346, -2.4085, -0.9882, -3.2720, -4.5658]], [[ -1.9823, -6.4254, -6.9269, -6.7401, -6.9873, -5.3816, -5.7972, -5.7136, -5.4084, -5.5816, -5.3660, -4.4840, -3.6610, -3.9709, -3.9180, -4.9636]], [[ 0.6410, -4.3378, -4.4421, -3.9394, -4.0021, -2.2548, -3.7104, -3.5187, -4.4019, -3.2360, -3.6588, -2.8612, -1.1352, -0.0445, 1.1764, 1.0997]], [[ 2.0737, -5.0162, -4.5019, -3.8947, -3.8546, -3.4418, -2.1789, -3.2208, -2.1499, -3.9274, -4.0704, -2.6332, -2.9992, -1.2447, -2.1346, -2.5862]], [[ -0.9959, -5.4768, -5.5712, -5.4448, -5.1548, -5.4299, -4.5995, -4.9856, -4.5725, -3.5046, -4.4862, -4.4066, -2.6026, -3.3456, -3.8359, -2.8091]], [[ 1.6995, -3.8036, -4.0953, -3.9409, -3.6220, -3.9276, -4.3227, -3.0114, -3.9342, -3.7158, -4.6282, -4.4700, -4.1155, -4.4796, -3.3900, -3.5339]], [[ -5.7964, -25.9266, -41.1297, -32.0919, -34.1379, -26.4325, -36.0701, -25.2518, -22.7222, -29.3724, -23.9799, -12.0403, -6.6730, 5.1353, 19.5742, 9.9221]]], [[[ -2.8417, -11.2790, -9.1542, -8.3529, -6.8354, -8.1013, -9.6594, -9.1994, -7.8574, -7.7307, -8.8214, -9.2096, -5.7306, -5.4056, -4.1323, -4.4984]], [[ -2.4875, -8.3133, -8.0874, -7.0701, -8.3566, -6.0397, -7.0246, -5.6050, -6.8065, -5.4929, -5.9694, -4.6066, -3.7843, -3.4476, -1.3204, -2.4582]], [[ -0.2211, -3.0115, -4.1051, -3.8543, -4.7463, -3.4916, -2.9572, -2.9820, -4.9223, -3.9972, -3.4363, -2.6528, -3.7917, -3.4696, -3.2850, -4.0973]], [[ -1.7848, -9.3735, -8.5649, -7.3223, -6.8201, -4.9970, -5.4675, -7.1098, -5.9071, -5.2237, -5.5905, -7.1793, -4.3859, -3.7324, -3.8517, -3.6339]], [[ 1.6807, -2.0208, -1.0822, -1.5160, -2.0040, -3.9192, -4.2092, -2.5486, -3.1873, -5.7203, -3.6618, -3.2042, -1.5215, -2.2948, -0.6513, -0.7644]], [[ -1.7932, -8.3617, -9.8382, -10.3083, -8.3057, -9.9516, -9.9299, -7.5043, -8.1458, -8.5589, -9.5057, -5.1110, -6.2723, -6.8237, -5.0713, -3.4245]], [[ -1.7512, -6.6844, -8.7616, -7.5599, -6.4753, -4.7488, -4.9905, -6.1632, -6.1505, -4.4061, -4.5938, -4.7649, -4.3962, -4.6672, -2.8743, -4.8570]], [[ 0.8175, -5.7105, -4.5547, -4.3206, -2.4230, -2.6258, -4.2463, -3.9925, -3.8505, -2.6237, -4.2603, -1.4589, -1.2475, -2.0251, -0.2241, 1.4596]], [[ 1.8822, -3.3500, -2.4687, -1.7828, -1.5137, -2.7464, -2.3162, -3.1648, -2.3036, -3.8767, -3.3406, -3.6008, -2.2915, -2.3466, -2.9696, -2.2393]], [[ -0.7469, -5.9418, -6.6866, -6.0409, -5.7896, -4.1996, -3.8985, -5.3678, -6.5763, -4.5058, -3.7709, -3.3872, -2.9474, -3.5808, -2.6313, -4.3262]], [[ 1.5984, -2.9269, -3.5935, -3.8870, -3.2251, -2.6406, -3.7406, -2.7737, -3.2992, -5.1321, -5.0021, -2.9115, -2.8120, -4.1704, -4.1218, -3.9779]], [[ -6.5312, -29.1046, -30.3120, -20.8878, -22.1507, -19.7586, -30.0461, -21.1638, -21.7345, -18.0792, -23.7772, -13.3914, -10.1166, -1.6647, 8.6881, 1.1553]]], [[[ -1.7941, -9.4546, -10.0029, -8.8184, -8.3039, -8.7817, -8.2438, -9.2844, -9.7511, -8.9477, -7.6656, -8.8522, -6.2724, -3.9640, -3.7685, -4.6238]], [[ -1.8372, -6.4175, -8.9476, -7.7152, -8.5794, -5.8470, -6.5733, -6.1855, -6.3585, -8.0101, -6.6318, -6.0862, -3.7748, -2.7302, -2.4017, -4.1899]], [[ 0.5900, -2.6266, -3.1125, -3.4581, -3.3300, -4.8377, -2.8158, -3.2977, -2.9816, -4.6838, -5.1517, -4.7907, -1.6523, -1.5662, -1.6200, -2.4137]], [[ -1.0987, -7.6198, -6.9664, -6.0092, -7.2392, -6.0625, -5.1575, -6.7463, -8.3232, -8.6538, -6.9545, -4.8460, -6.1806, -4.5277, -4.2067, -5.0508]], [[ 1.9591, -2.8873, -4.0979, -4.4846, -3.5893, -2.7290, -3.0673, -3.1687, -4.4484, -3.8278, -3.9937, -3.4643, -2.6775, -1.1420, -0.8296, -0.5690]], [[ -1.8223, -7.7180, -8.5573, -7.8461, -8.5991, -8.5202, -9.7339, -8.7191, -5.8285, -8.1910, -8.5880, -10.3137, -5.8711, -5.4480, -5.3717, -5.7335]], [[ -1.7709, -5.1736, -5.8477, -5.7120, -4.8999, -4.6878, -4.7570, -5.2630, -4.3120, -4.9034, -5.2906, -4.6277, -4.2289, -3.9981, -3.8174, -4.0038]], [[ 1.2568, -7.6400, -4.1601, -3.7469, -4.4566, -4.1197, -4.6895, -5.5238, -3.8043, -5.2583, -4.5538, -5.2792, -3.0623, -1.8382, -1.2385, 1.6475]], [[ 1.1927, -3.3274, -2.8253, -3.4843, -2.8316, -3.1150, -1.8013, -2.3519, -2.7314, -2.6368, -3.4312, -3.8793, -1.8155, -2.0470, -1.8903, -1.9808]], [[ -0.6687, -4.4582, -5.7384, -5.4465, -6.0721, -5.7288, -4.7111, -3.8608, -4.5894, -5.5017, -5.6434, -5.3865, -3.4926, -4.0314, -4.1426, -4.4495]], [[ 1.5105, -2.7000, -2.4404, -2.0832, -2.9920, -3.7179, -3.5003, -2.6949, -3.3988, -2.9796, -4.1308, -4.8530, -1.4218, -1.7677, -1.4845, -2.6153]], [[ -8.1859, -19.6739, -23.4566, -25.6134, -26.5462, -22.6171, -27.1182, -15.3105, -18.9732, -22.5873, -20.6099, -27.2230, -5.6061, 5.9565, 6.3088, -1.6495]]]]) attn_weights tensor([[[[ 2.0742, -1.7820, -4.1064, -3.7530, -1.9086, -3.2338, -3.3691, -2.7233, -4.6254, -3.4490, -2.0578, -3.0054, -3.4552, -2.2258, -4.2403, -2.9511]], [[ 3.9217, -4.7362, -5.3780, -8.9315, -8.3084, -5.1442, -6.8211, -9.8777, -8.5531, -9.2515, -6.6917, -12.0521, -9.0024, -5.6632, -6.5394, -3.3952]], [[ -0.0409, -3.9906, -4.1827, -3.8939, -4.1013, -3.5246, -4.1156, -4.6683, -2.6746, -2.5824, -2.6195, -2.6661, -2.9690, -1.8356, -0.8818, -4.0001]], [[ -0.2922, -1.6337, -2.2718, -2.3977, -2.5560, -2.4740, -2.9701, -1.9974, -0.7026, -1.6612, -0.7741, -1.9598, -2.1621, -2.7138, -2.1113, -2.9534]], [[ -0.3638, -6.0313, -6.4208, -5.5003, -4.6345, -3.6098, -3.2346, -2.6259, -4.6862, -3.8409, -3.2047, -1.8062, -2.3374, -1.1196, -0.4136, -2.1877]], [[ 1.9081, -1.9131, -0.9202, -6.0634, -4.0849, -2.5630, -4.8306, -7.3491, -4.2142, -6.7950, -4.2146, -7.2645, -5.3665, -3.2233, -5.3201, -3.4878]], [[ 1.3404, -6.6352, -8.6448, -8.8936, -7.8032, -2.4007, -3.1242, -3.2244, -5.6381, -7.0328, -5.4702, -4.4300, -4.1481, -0.5802, 0.1873, -1.5817]], [[ 0.3882, -4.4198, -5.3233, -5.8611, -4.5752, -4.0661, -2.2955, -3.5823, -5.0294, -5.3726, -2.2979, -3.0107, -0.8237, -1.8536, -0.9785, -3.3933]], [[ 0.3273, -2.0927, -2.3286, -5.9786, -5.5999, -3.5927, -5.4232, -5.7134, -3.6531, -5.3170, -4.8188, -5.5799, -5.0549, -2.9287, -4.7952, -4.6889]], [[ 1.2154, -3.2396, -2.3849, -2.4628, -1.3952, -1.9245, -1.8985, -1.6855, -2.7024, -3.2434, -1.8074, -1.9681, -1.8654, -2.4792, -2.7714, -6.1110]], [[ 2.7190, 1.1451, -4.3144, -3.8648, -3.5840, -1.9747, -0.4823, 0.0577, -4.2448, -4.6656, -4.6769, -2.2912, -1.2898, -2.0336, -0.5584, 0.6616]], [[ 0.9202, -2.5600, -2.7463, -2.8056, -2.5893, -3.7526, -4.0576, -2.9948, -2.6836, -3.0399, -2.8737, -2.3096, -2.5669, -3.5600, -2.9248, -1.3959]]], [[[ 2.6550, -6.9691, -5.5862, -7.1734, -6.2062, -4.2231, -2.0887, -2.2796, -2.3347, -5.1325, -7.6773, -7.6401, -4.9304, -4.0910, -3.0993, -0.9588]], [[ 4.2236, -10.9468, -11.4943, -13.2599, -12.7356, -6.9048, -7.4188, -5.3633, -8.0730, -10.3795, -13.6454, -13.0207, -7.8506, -6.0618, -6.7270, -4.5459]], [[ 0.4679, -3.8995, -4.4964, -3.5440, -4.1973, -4.6308, -3.9925, -4.2731, -3.9479, -3.3627, -2.6179, -2.7934, -2.7991, -2.0838, -1.1266, -1.7963]], [[ 0.0736, -2.1128, -2.9346, -2.8282, -3.0292, -2.5650, -2.9104, -2.2084, -1.9647, -1.5306, -1.7924, -0.7292, -0.4914, -0.6109, -2.0385, -2.4564]], [[ -0.0596, -5.8295, -5.7089, -6.4919, -6.2337, -5.2989, -4.8762, -4.6358, -4.6981, -4.8339, -5.1440, -4.1234, -3.5759, -2.6437, -1.6997, -2.2130]], [[ 1.6711, -5.9854, -6.2640, -6.9666, -6.4194, -3.8719, -3.0337, -1.2428, -2.4519, -3.9889, -6.8370, -7.7413, -7.1329, -5.2984, -2.9736, -3.3008]], [[ 1.2733, -5.8491, -6.7749, -5.9130, -3.4796, -3.1690, -6.1856, -4.6940, -4.1569, -5.3854, -5.4385, -4.4176, -3.8740, -3.2438, -0.1371, -1.7954]], [[ 1.3882, -5.5329, -7.4492, -7.8166, -5.1738, -3.6975, -0.9865, -4.7517, -5.3838, -6.2590, -6.4636, -4.8111, -4.0847, -2.1429, -1.5603, -0.5968]], [[ 0.7225, -4.4511, -5.3197, -5.8727, -4.7565, -3.3388, -1.4989, -0.9187, -1.6217, -2.9366, -4.7614, -4.6904, -3.9974, -3.3286, -2.6420, -2.2124]], [[ 1.0746, -3.4019, -5.3011, -4.5722, -3.4046, -2.6378, -1.1279, -1.6124, -2.5866, -5.0176, -5.0587, -4.2330, -4.4235, -4.5682, -3.3932, -3.5967]], [[ 2.5143, -0.7119, -2.3338, -1.5047, -1.2137, 1.5345, 1.1100, 0.7153, -0.2812, -2.2410, -2.2040, -3.9207, -1.7502, -1.7282, -0.9907, 0.3224]], [[ 0.9315, -4.8085, -4.6526, -4.6752, -3.4913, -2.3088, -2.7547, -2.2790, -3.2218, -4.6010, -4.9054, -4.3756, -3.9886, -4.3089, -2.9457, -2.3087]]], [[[ 2.7109, -6.4215, -5.5480, -4.8302, -5.5051, -2.5170, -5.1541, -4.2383, -4.1586, -5.7794, -6.4871, -6.6808, -3.5434, -4.1873, -2.2387, -1.5295]], [[ 4.8158, -14.2856, -9.5146, -8.6989, -9.0873, -0.3838, -10.0895, -12.8990, -9.5858, -12.4482, -11.8904, -14.9875, -11.0330, -9.0171, -5.2425, -1.2285]], [[ 0.4256, -4.4675, -4.8201, -4.9325, -4.1237, -4.6390, -4.5757, -4.5793, -2.7477, -3.3644, -2.5430, -1.9479, -2.2117, -0.4437, -1.0124, -2.3255]], [[ 0.0909, -2.6896, -3.4124, -3.5518, -4.1206, -3.3022, -3.4694, -2.6835, -1.8805, -1.8591, -2.2281, -2.8562, -2.4046, -3.1580, -4.5717, -3.3427]], [[ -0.0982, -6.0691, -6.9085, -6.3771, -8.2162, -4.6142, -3.6897, -4.5645, -6.1138, -4.1645, -4.7014, -4.4682, -1.1200, -2.2147, -1.5803, -3.0209]], [[ 2.3609, -9.3684, -5.0405, -5.1057, -6.2820, -0.2966, -4.5024, -3.6789, -2.5072, -4.8111, -3.6834, -7.1115, -4.9117, -4.4736, -4.5612, -3.3423]], [[ 1.5085, -7.8010, -8.6846, -7.2318, -7.0960, -4.3763, -6.6026, -5.0779, -4.9592, -6.7614, -6.0885, -3.8379, -2.7201, -0.1778, 0.4151, -2.5863]], [[ 0.9992, -5.0760, -5.7776, -6.3309, -5.9938, -4.0675, -1.9137, -3.9383, -5.5115, -4.9789, -4.4533, -3.7759, 1.3619, -0.9298, -0.2752, -1.5584]], [[ 0.7972, -6.5702, -5.5002, -6.4115, -7.5644, -0.8552, -1.8830, -1.3748, -3.9090, -5.2500, -5.7528, -6.9058, -5.0111, -5.1484, -4.8543, -3.5842]], [[ 1.1978, -3.4706, -4.7854, -4.4585, -3.9766, -2.8175, -2.1565, -2.7871, -3.6792, -4.6827, -4.7731, -4.8592, -4.0504, -3.6998, -5.2844, -5.2459]], [[ 2.2099, -1.0192, -0.8701, -0.6677, -1.5376, -0.9075, 0.0906, 0.2072, -2.4504, -0.7013, -1.4137, -1.3780, -0.7432, -2.3487, -2.5311, -3.0415]], [[ 0.9422, -5.6588, -5.4842, -5.5747, -3.0134, -3.8083, -4.4279, -3.7799, -3.6331, -4.5483, -4.5935, -3.9453, -2.4136, -3.0588, -2.4252, -0.0305]]], [[[ 2.5566, -3.6461, -7.0489, -5.3775, -3.9804, -3.5409, -1.7060, -2.6506, -4.3496, -5.3679, -5.5059, -3.4642, -5.3606, -5.4173, -4.1526, -1.9463]], [[ 4.9344, -5.7760, -8.3041, -5.5848, -5.2679, -3.5555, -2.4762, -8.9050, -8.3135, -8.3097, -11.2169, -7.3433, -8.6194, -8.8656, -7.1487, -1.3796]], [[ 0.6213, -4.7451, -6.4265, -3.5849, -4.9944, -4.8296, -4.4512, -5.1056, -6.4049, -5.1183, -4.6314, -3.9758, -3.6321, -1.6457, -1.6783, -3.4323]], [[ 0.1142, -3.0820, -4.1928, -4.0550, -4.4568, -3.9583, -3.9400, -3.6830, -3.5395, -3.1849, -3.3352, -1.6675, -1.3129, -1.5156, -1.3231, -2.4365]], [[ -0.0401, -7.0037, -8.0490, -4.7567, -4.9455, -3.6804, -3.2466, -4.6050, -5.6222, -4.4624, -4.0932, -2.4707, -3.0474, -0.7340, 0.9145, -1.9870]], [[ 1.8956, -3.3854, -2.1681, -1.6101, -1.1668, -1.1578, -1.6373, -4.5266, -2.9145, -3.1794, -5.6486, -3.6462, -3.5587, -5.6509, -5.5398, -3.0956]], [[ 1.4215, -8.2825, -7.9444, -6.5581, -6.3880, -4.0817, -6.1880, -6.2757, -6.5643, -4.0581, -5.1263, -6.0955, -2.6935, -2.9129, -1.6438, -0.8805]], [[ 1.0180, -6.1752, -5.9209, -5.4511, -5.1344, -3.5073, -3.5459, -5.7905, -4.9719, -5.3505, -4.1382, -5.5115, -2.4726, -1.8847, -0.2168, -1.7892]], [[ 0.7480, -3.7279, -4.7395, -2.6470, -1.8172, -1.1707, -1.4641, -1.7215, -3.6415, -3.6234, -5.6783, -2.2600, -4.0928, -5.5288, -4.6922, -3.7652]], [[ 0.9408, -3.8965, -5.0477, -4.8694, -3.8655, -2.8159, -3.2121, -3.3522, -3.6474, -3.6306, -4.3722, -3.3994, -3.1301, -3.2000, -3.0529, -4.9881]], [[ 2.1617, -0.8040, -0.5693, 0.4180, -0.1408, -1.5217, 0.6720, 0.7923, -2.7237, -1.9615, -1.8252, -0.9481, -3.2868, -2.8173, -2.4763, -0.6041]], [[ 1.1582, -4.3406, -4.0081, -4.0238, -3.0528, -4.9031, -5.7014, -4.9783, -4.9251, -5.3145, -5.4970, -5.5807, -4.2810, -4.0752, -2.8029, -1.6797]]], [[[ 1.8537, -2.5603, -4.9832, -3.3705, -3.1933, -3.0077, -4.2753, -5.5875, -5.8666, -3.8071, -5.5856, -6.6165, -6.3578, -4.6353, -3.3287, -1.7771]], [[ 4.4961, -10.5704, -9.4728, -8.4213, -7.4850, -6.2757, -13.1814, -15.4037, -10.5559, -9.0582, -8.1975, -16.7258, -15.7971, -7.9002, -3.3124, -2.2394]], [[ 0.8951, -2.5120, -4.1576, -4.8657, -3.6347, -3.4914, -3.7710, -3.8039, -3.9009, -3.9401, -4.8594, -4.8470, -2.5377, -1.3484, -2.2436, -2.9191]], [[ 0.4252, -2.1300, -3.1811, -3.2968, -3.6906, -3.2277, -2.3262, -2.6928, -4.1274, -4.7042, -3.8806, -4.1325, -2.0483, 0.2819, -0.1432, -2.1798]], [[ 0.1223, -5.0642, -6.1236, -5.5310, -4.6810, -4.3236, -3.6949, -4.1873, -5.3903, -5.4802, -5.0902, -4.6762, -3.1124, -2.4148, -2.0085, -2.3104]], [[ 2.1276, -8.1245, -5.1759, -4.4194, -4.3090, -2.9329, -4.7633, -5.2045, -3.8666, -4.6523, -2.6223, -6.3698, -5.0633, -2.6651, -1.4782, -1.9032]], [[ 0.8774, -4.9761, -5.1942, -5.5721, -4.8401, -5.1344, -7.0274, -4.1617, -3.9435, -5.1623, -5.3572, -7.9371, -3.4889, -1.3847, -0.9808, -1.7120]], [[ 1.2517, -4.5968, -5.8901, -6.4651, -4.5804, -4.8677, -2.4665, -4.2738, -5.3887, -4.9490, -3.9901, -4.3549, -3.7658, -4.0289, -4.1336, -3.2203]], [[ 0.9223, -3.2876, -3.3619, -2.4255, -2.6374, -4.3343, -4.9582, -4.6397, -4.8209, -3.4525, -4.7075, -6.3773, -4.2224, -2.9158, -2.6936, -1.9697]], [[ 1.0354, -3.2292, -2.7159, -3.1100, -2.9164, -2.7694, -2.5404, -2.9551, -3.5094, -4.2325, -3.7491, -3.9399, -2.7018, -2.9818, -2.4722, -3.1093]], [[ 1.8531, -2.0442, -1.9204, -1.7264, -1.1868, -0.1811, 0.3936, 0.0605, -1.3685, -2.6642, -1.8898, -1.2483, 0.3463, -0.8794, -0.5053, -1.5732]], [[ 1.0120, -5.0786, -3.8760, -3.8741, -3.9261, -3.4726, -4.6110, -4.3818, -4.5719, -5.0093, -5.5029, -4.8702, -2.9082, -3.2091, -2.5682, -0.9537]]]]) attn_weights tensor([[[[ -0.8180, -4.8939, -6.1046, -6.9686, -7.1273, -5.7126, -5.7868, -6.1846, -4.8791, -5.0658, -4.7000, -5.1081, -4.9761, -4.0181, -3.1144, -3.8779]], [[ 0.5176, -2.8811, -5.1933, -4.1611, -2.7058, -4.8141, -4.8594, -3.4593, -6.4204, -5.7312, -3.3051, -4.1686, -3.2590, -4.4734, -4.7003, -4.4391]], [[ 0.1992, -2.8941, -2.6947, -2.7860, -2.9252, -3.7375, -3.7551, -3.0103, -3.1004, -3.6619, -2.8585, -3.4046, -3.7545, -3.4838, -2.9975, -3.6048]], [[ 0.0727, -2.0275, -2.5761, -3.0092, -3.3463, -2.8410, -2.9315, -2.4915, -2.5859, -3.3415, -2.5327, -2.6693, -2.3791, -3.2086, -3.2549, -3.0060]], [[ 1.2606, -0.4690, -0.0339, -0.6207, -1.6498, -1.0207, -1.7079, -1.6731, -2.0514, -3.2661, -2.1750, -3.4475, -2.3532, -1.2740, -0.9897, -0.3321]], [[ -0.6417, -5.2024, -5.5568, -5.9801, -5.7428, -5.3157, -5.4369, -3.8988, -3.9333, -4.6426, -4.9011, -4.7217, -4.6229, -3.9229, -3.8723, -3.7180]], [[ 2.2133, -1.5261, -1.7828, -2.9062, -2.6800, -2.8967, -3.9484, -2.0143, -2.4630, -3.3534, -3.7463, -3.0742, -3.2009, -2.5602, -2.0106, -0.7091]], [[ -0.4353, -4.0415, -4.4697, -5.1290, -4.3014, -2.7426, -1.8108, -3.1594, -3.9354, -4.7271, -3.4606, -3.2002, -2.1536, -1.1335, -1.2983, -3.5885]], [[ -2.0106, -6.3817, -5.2721, -5.8332, -5.3171, -3.5701, -4.1089, -5.5842, -2.9512, -3.7839, -2.5602, -3.9487, -3.4919, -1.7653, -1.0537, -3.5195]], [[ 4.3710, -2.1638, -0.5221, -3.2974, -3.4857, -1.1602, -5.4151, -6.8630, -5.1354, -4.7789, -3.3504, -7.7281, -4.2861, -2.2973, -4.5618, -3.9164]], [[ 2.9968, -1.4977, -1.8809, -2.2742, -2.0109, -1.6431, -1.1531, -0.5991, -0.3864, -1.7585, -1.2296, -1.5930, -0.8345, -0.9015, -1.3172, -1.0403]], [[ -0.8471, -4.8487, -4.9340, -4.7127, -5.2620, -5.0546, -4.6710, -2.9931, -2.8865, -2.8667, -3.4839, -3.4885, -1.5772, -3.2294, -1.2687, -2.3196]]], [[[ -1.4492, -4.3396, -3.5156, -3.1600, -4.3584, -3.0559, -2.7396, -4.7583, -3.6260, -2.2566, -1.6280, -1.4500, -0.9978, -0.4033, -0.3193, -2.9545]], [[ 0.6713, -5.7087, -5.9527, -7.2074, -6.5169, -4.4466, -4.0396, -4.9604, -5.3564, -5.8036, -7.9793, -7.0635, -5.2877, -6.3670, -5.1499, -2.8869]], [[ 0.1527, -3.0722, -3.2262, -3.8154, -3.1366, -3.6750, -3.0888, -2.4004, -3.1263, -3.1896, -4.2547, -3.3569, -3.2756, -4.0120, -3.6812, -3.6723]], [[ 0.5967, -4.0839, -5.1330, -5.3952, -5.0446, -3.9364, -3.0372, -3.2488, -3.5119, -4.9298, -5.1366, -4.8683, -4.5584, -4.5897, -3.4252, -3.0521]], [[ 2.0642, -2.3455, -3.5528, -3.5254, -3.3329, -2.5930, -1.7190, -1.8992, -2.9793, -4.5753, -3.8295, -2.7377, -2.0987, -2.5385, -2.8144, -2.0645]], [[ -0.5256, -4.7908, -5.7051, -5.8480, -5.3768, -4.7820, -4.5895, -4.3028, -3.9492, -4.1257, -4.4158, -3.9752, -3.3466, -3.3361, -2.4483, -3.2250]], [[ 2.1748, -3.7426, -3.7396, -3.7380, -3.5117, -2.1190, -1.7253, -2.4086, -2.6467, -3.1822, -3.3976, -3.0947, -2.9774, -2.8687, -2.2299, -0.4350]], [[ -0.0895, -2.7077, -3.1479, -3.3676, -3.9821, -3.0018, -2.0636, -3.4643, -3.6299, -4.0717, -3.4188, -4.0757, -3.4396, -2.9789, -3.2114, -1.9980]], [[ -0.8996, -6.7435, -7.4004, -7.1007, -6.6661, -6.2984, -6.5642, -5.9670, -5.0967, -5.5663, -5.1063, -4.0199, -4.2264, -3.3606, -1.6475, -3.0914]], [[ 4.5305, -8.0003, -7.4982, -9.9101, -6.6849, -3.0312, -7.0299, -2.6472, -3.7181, -5.7200, -9.3351, -7.3043, -4.2659, -3.2118, -3.8124, -2.6718]], [[ 3.0427, -4.2652, -3.8511, -4.6782, -3.9151, -3.0822, -1.9016, -1.8595, -1.1122, -1.9316, -2.6252, -2.7084, -2.5821, -3.1025, -1.8946, -1.1536]], [[ -0.4403, -5.2757, -5.8360, -5.9807, -5.0981, -4.7570, -4.2755, -4.9228, -4.5056, -4.5701, -4.6248, -3.4004, -2.4739, -2.2222, -0.1894, -2.7490]]], [[[ -1.9265, -5.2170, -4.7445, -4.0947, -5.0681, -3.1950, -3.9056, -4.7660, -4.1975, -2.5690, -1.8039, -1.4086, -0.8531, -1.0217, -2.3745, -3.8711]], [[ 0.8432, -6.4738, -7.7226, -7.3222, -7.1536, -3.2405, -4.3297, -4.9775, -6.7575, -5.9753, -7.5408, -8.4238, -5.2395, -2.7370, -2.5844, -4.7922]], [[ 0.2728, -4.0768, -3.7576, -4.1466, -4.2671, -4.5227, -4.2104, -3.4608, -3.5088, -3.4268, -5.0230, -4.4889, -4.3367, -4.0946, -4.6723, -4.6396]], [[ 0.1562, -3.7499, -5.4098, -4.9280, -4.1083, -3.5034, -3.0882, -2.7697, -2.6648, -4.2164, -5.1647, -5.7444, -5.0329, -4.9493, -4.2084, -4.5446]], [[ 1.3251, -2.5382, -2.7864, -3.3807, -2.9126, -2.6962, -2.0012, -2.3213, -3.4383, -3.5383, -2.9661, -3.0186, -1.9427, -2.5079, -2.3659, -3.2041]], [[ -0.8924, -4.5924, -5.6378, -6.5283, -6.3946, -5.9099, -4.9087, -5.0866, -4.6622, -4.1706, -5.8887, -4.5742, -4.4564, -3.3190, -2.5789, -2.6776]], [[ 1.9690, -3.5682, -2.7404, -3.3400, -2.3099, -3.1110, -3.2982, -3.2973, -3.0334, -2.2353, -3.9154, -3.1143, -2.3524, -2.3534, -3.7876, -0.7575]], [[ -0.6362, -3.2931, -4.7542, -4.3183, -4.1972, -2.6555, -1.4582, -2.8841, -4.8025, -4.4975, -4.6580, -5.1354, -3.8684, -3.9927, -3.3616, -3.8677]], [[ -1.8142, -5.8908, -4.9857, -6.0929, -5.5401, -7.5556, -6.2907, -5.5002, -3.6743, -3.5872, -3.6955, -2.9386, -2.4924, -1.3500, -2.1058, -3.5192]], [[ 4.9045, -11.0337, -5.0736, -4.3223, -4.1911, 0.8170, -8.5615, -6.4548, -5.7891, -6.4183, -6.2454, -8.9708, -5.2679, -2.9573, -2.0030, -0.7518]], [[ 3.2040, -3.8836, -3.0772, -2.7915, -3.0758, -3.0127, -1.7537, -3.1962, -1.8825, -1.7418, -2.5287, -2.5007, -2.9542, -2.3655, -2.8926, -3.3876]], [[ -0.8337, -4.7123, -5.0537, -5.3087, -5.3635, -5.3144, -4.3597, -4.4770, -3.1737, -3.2049, -3.3135, -3.2034, -0.2598, -0.7979, -1.7933, -2.5648]]], [[[ -0.8223, -6.1048, -6.2386, -4.4163, -5.3374, -5.5795, -4.7746, -5.9021, -6.1816, -5.9517, -5.0621, -4.4370, -2.5801, -2.4118, -1.4242, -3.0556]], [[ 0.2354, -4.6432, -5.0638, -4.0541, -2.4607, -2.8175, -2.9967, -4.6904, -5.3919, -2.9809, -5.3619, -4.3425, -4.2909, -3.8792, -4.9439, -0.0208]], [[ 0.2735, -3.1549, -3.3494, -3.9795, -4.3496, -3.7169, -3.8377, -3.6512, -4.8298, -4.5117, -4.5833, -2.6472, -2.7977, -3.6834, -4.0265, -4.4496]], [[ 0.6587, -3.4117, -4.0506, -3.6048, -3.2460, -3.5667, -3.3362, -3.5871, -3.9119, -4.2700, -4.3251, -3.0958, -2.4704, -2.9202, -3.4326, -3.4351]], [[ 1.2123, -2.0636, -3.0198, -2.9225, -2.6085, -2.5002, -1.6359, -2.4322, -3.2213, -2.7330, -2.2679, -1.8200, -2.7810, -3.0306, -2.7673, -2.3605]], [[ -0.4619, -4.8338, -5.2934, -5.1969, -5.2667, -4.9164, -5.1216, -4.8457, -4.9306, -3.7308, -4.5993, -3.6918, -3.7897, -3.4005, -2.6890, -3.5577]], [[ 2.2949, -3.2274, -2.3066, -2.4594, -2.2291, -3.2089, -3.9375, -3.1926, -3.6129, -4.4546, -4.4213, -2.9234, -2.6133, -2.9527, -2.6675, -1.5387]], [[ -0.0859, -3.7685, -4.9203, -3.9970, -3.1006, -2.0370, -1.9701, -3.3524, -3.4057, -2.1824, -2.5684, -3.5889, -3.3150, -3.2668, -3.6818, -2.6702]], [[ -0.7819, -7.3320, -7.6657, -6.7524, -7.3596, -6.6275, -6.7657, -7.1135, -6.5916, -6.2218, -6.8969, -4.9440, -3.6672, -2.9185, -2.5218, -4.0606]], [[ 4.8670, -3.7066, -1.9358, 0.0162, -1.0080, -1.5838, -3.7345, -6.1357, -4.4021, -3.5550, -12.1126, -4.4518, -5.4463, -4.6962, -5.0016, -0.8870]], [[ 3.3913, -2.6285, -3.0832, -2.9405, -2.0004, -2.0815, -0.5101, -1.0523, -1.7032, -3.0964, -1.0977, -1.6792, -2.0131, -2.6373, -3.6736, -2.3325]], [[ -0.4231, -5.2042, -6.4004, -5.0232, -6.0122, -4.9212, -4.8380, -5.3652, -5.9272, -4.4905, -4.8098, -3.4381, -3.0256, -2.4062, -1.3734, -3.1969]]], [[[ 0.1558, -5.4234, -5.9074, -6.0300, -5.6840, -5.3653, -4.5757, -6.4237, -7.3730, -8.3097, -7.2300, -6.6289, -4.6450, -3.4609, -3.4552, -4.5359]], [[ 0.7322, -3.5275, -6.3276, -4.9961, -4.0233, -3.9977, -3.5484, -6.0962, -6.2660, -6.3996, -6.4349, -5.3655, -3.7526, -4.4836, -4.2741, -3.5037]], [[ 0.4764, -3.1286, -3.6607, -3.4987, -3.4513, -3.3755, -3.1177, -2.7762, -4.1638, -3.8563, -3.4769, -4.2154, -2.3169, -3.1744, -2.5020, -3.0808]], [[ 0.4495, -3.2362, -3.2846, -3.5584, -2.3669, -2.2189, -1.8320, -3.3393, -3.1878, -3.3466, -3.8590, -3.9857, -1.8410, -1.9867, -2.3352, -3.1565]], [[ 1.2122, -1.2453, -0.5356, -0.9396, -1.6792, -1.7445, -1.1510, -1.2873, -2.3595, -2.4918, -2.3630, -2.4836, -0.0721, -0.6406, -0.4395, -2.3861]], [[ -0.4791, -3.9049, -4.6725, -4.7516, -5.3426, -4.9347, -4.4009, -4.8001, -4.3993, -5.8986, -4.9987, -4.9681, -3.1991, -3.1820, -3.0251, -2.8467]], [[ 2.1371, -2.7863, -3.2619, -3.7694, -4.0990, -2.7473, -4.0278, -4.0397, -3.4166, -3.6804, -3.1274, -4.5348, -3.1406, -2.7732, -1.9184, -0.2738]], [[ 0.0262, -3.4512, -4.1484, -3.4823, -2.7756, -2.6338, -1.7745, -2.8997, -4.1932, -3.4428, -1.7117, -1.9180, -1.3579, -2.0526, -2.1295, -3.4359]], [[ -0.8462, -6.7443, -8.8035, -8.4130, -7.3487, -6.5927, -6.3872, -5.9170, -7.5850, -7.1865, -6.9884, -6.5668, -3.9294, -3.1071, -2.7272, -4.8158]], [[ 4.6747, -7.6623, -6.0578, -4.2329, -3.3230, -2.5317, -7.4044, -8.9612, -6.9160, -4.1996, -2.2820, -9.3634, -7.5023, -4.4689, -1.6793, -0.7469]], [[ 2.6180, -1.8946, -2.2644, -3.3519, -2.8571, -2.6589, -1.8811, -3.3431, -2.6548, -3.2121, -2.6582, -3.3984, -1.7016, -2.2803, -2.2947, -1.9815]], [[ 0.3551, -3.6849, -6.5786, -6.2485, -6.4316, -6.2777, -4.7262, -7.2754, -7.5813, -7.8782, -6.4822, -6.1537, -4.3058, -3.1098, -2.9158, -3.2100]]]]) attn_weights tensor([[[[-7.0777e-01, -7.9708e+00, -7.5265e+00, -9.1314e+00, -8.4350e+00, -5.4535e+00, -5.4058e+00, -5.0756e+00, -4.8179e+00, -6.0649e+00, -5.1393e+00, -4.8801e+00, -4.9423e+00, -3.2589e+00, -2.1389e+00, -3.8074e+00]], [[ 3.3498e+00, 4.2205e-01, -2.1277e+00, -2.3706e+00, -1.7061e+00, -1.4251e+00, -2.6692e+00, -3.0700e+00, -3.5100e+00, -3.4502e+00, -2.7120e+00, -2.7309e+00, -2.7592e+00, -2.0424e+00, -2.8661e+00, 4.5365e-01]], [[ 5.9002e+00, -6.2593e-01, -2.4778e+00, -2.7302e+00, -4.7107e+00, -8.8514e-01, -1.1689e+00, -1.2722e+00, -3.6503e+00, -2.8542e+00, -2.4094e+00, -3.1698e+00, -1.6401e+00, -2.9460e-01, -7.9296e-01, -1.3276e-01]], [[-2.5187e-03, -2.7585e+00, -3.5091e+00, -3.3551e+00, -3.5983e+00, -3.1018e+00, -3.1635e+00, -1.7885e+00, -1.8870e+00, -2.2794e+00, -2.6746e+00, -2.5676e+00, -2.5128e+00, -1.9060e+00, -1.4248e+00, -2.1893e+00]], [[ 9.4074e-02, -3.2954e+00, -2.8449e+00, -3.1176e+00, -3.1443e+00, -3.2802e+00, -3.1990e+00, -3.6089e+00, -2.5332e+00, -2.8890e+00, -2.1139e+00, -2.4747e+00, -2.0256e+00, -2.4259e+00, -9.0893e-01, -2.1321e+00]], [[ 1.2407e+00, -2.1240e+00, -2.9471e+00, -2.7435e+00, -3.5699e+00, -3.2078e+00, -2.2193e+00, -2.4033e+00, -3.8246e+00, -3.7958e+00, -3.9614e+00, -3.4062e+00, -2.1014e+00, -2.1513e+00, -1.6510e+00, -1.8344e+00]], [[ 1.3758e+00, -2.1398e+00, -2.6608e+00, -2.4090e+00, -2.7601e+00, -3.1144e+00, -2.7608e+00, -3.1156e+00, -1.8984e+00, -1.6874e+00, -2.5303e+00, -2.0404e+00, -2.8537e+00, -2.8973e+00, -2.2741e+00, -3.2143e+00]], [[ 3.4777e+00, -1.0676e+00, -1.6404e+00, -2.3899e+00, -1.0967e+00, -1.0979e+00, -1.6890e+00, -1.2760e+00, -1.0898e+00, -2.1275e+00, 4.0889e-01, -2.0931e+00, -2.6845e+00, -1.4247e+00, -2.6181e+00, -2.5386e-01]], [[-8.6415e-01, -4.2089e+00, -4.8347e+00, -5.1743e+00, -3.9773e+00, -3.1648e+00, -2.3206e+00, -3.5941e+00, -3.6290e+00, -3.9560e+00, -2.7244e+00, -3.0715e+00, -2.4615e+00, -1.4091e+00, -7.2736e-01, -3.7089e+00]], [[-2.3346e-01, -1.7510e+00, -1.9110e+00, -2.1918e+00, -3.1892e+00, -2.7889e+00, -3.5977e+00, -1.0427e+00, -8.1328e-01, -1.2747e+00, -1.4865e+00, -1.9667e+00, -1.9389e+00, -2.4790e+00, -1.3904e+00, -2.1212e+00]], [[ 3.9913e+00, -1.5747e+00, -9.7011e-01, -2.5143e+00, -3.2587e+00, -1.6372e+00, -2.9994e+00, -4.9369e+00, -1.9334e+00, -2.4834e+00, -2.3034e+00, -4.8752e+00, -1.4839e+00, -2.6585e+00, -1.9951e+00, -1.8873e+00]], [[ 2.6724e+00, -2.0614e+00, -3.4925e+00, -2.5109e+00, -3.6554e+00, -2.9299e+00, -2.7309e+00, -1.3777e+00, -2.6058e+00, -2.0353e+00, -2.1482e+00, -2.7020e+00, -1.9082e+00, -1.3383e+00, -1.2295e+00, -3.0162e+00]]], [[[-9.8672e-01, -6.6082e+00, -7.2913e+00, -6.3707e+00, -5.2652e+00, -7.3911e+00, -8.1624e+00, -5.5178e+00, -5.4506e+00, -5.5191e+00, -4.4311e+00, -4.6897e+00, -3.0025e+00, -5.8413e-01, 2.2041e+00, -4.0082e+00]], [[ 3.8581e+00, -2.3166e+00, -1.5614e+00, -2.8089e+00, -2.8310e+00, -1.1828e+00, -9.0688e-01, -6.0674e-01, -2.1698e-01, -5.5290e-01, -1.1500e+00, -2.4707e+00, -1.4674e+00, -1.4660e+00, -7.0871e-01, -1.1074e-01]], [[ 7.0008e+00, -2.8292e+00, -4.9627e+00, -6.8935e+00, -4.3937e+00, -8.4932e-01, -1.9193e+00, -1.1615e+00, -3.6752e+00, -5.8086e+00, -7.6561e+00, -4.5766e+00, -3.3014e+00, -3.6073e+00, -1.8306e+00, 1.1221e-01]], [[ 2.3909e-01, -5.5323e+00, -4.9238e+00, -5.5664e+00, -4.7369e+00, -2.1041e+00, -3.0788e+00, -3.7093e+00, -3.3933e+00, -3.3407e+00, -3.8269e+00, -3.9108e+00, -2.8084e+00, -2.3575e+00, -2.3827e+00, -1.9805e+00]], [[ 5.7537e-01, -5.2217e+00, -4.2415e+00, -4.9979e+00, -5.5786e+00, -4.4233e+00, -4.7700e+00, -5.5613e+00, -2.9621e+00, -3.3670e+00, -3.5125e+00, -3.7201e+00, -3.2203e+00, -3.0290e+00, -2.0585e+00, -2.5598e+00]], [[ 1.3550e+00, -3.4289e+00, -2.6699e+00, -2.8503e+00, -3.2668e+00, -3.6057e+00, -1.8582e+00, -2.1457e+00, -2.4620e+00, -3.0571e+00, -3.2542e+00, -2.3722e+00, -1.5018e+00, -8.5751e-01, -1.1910e+00, -2.5060e+00]], [[ 1.7507e+00, -2.9564e+00, -3.5170e+00, -4.7469e+00, -3.9822e+00, -1.9649e+00, -2.1436e+00, -2.4677e+00, -2.4945e+00, -3.3096e+00, -3.7355e+00, -4.3655e+00, -2.5869e+00, -3.2352e+00, -3.0669e+00, -2.6918e+00]], [[ 2.8314e+00, -4.4033e+00, -5.3440e+00, -6.5907e+00, -5.7047e+00, -3.3830e+00, -3.2481e+00, -2.4259e+00, -2.7989e+00, -4.6310e+00, -5.1420e+00, -5.2011e+00, -4.5267e+00, -4.8764e+00, -4.4545e+00, -1.8088e+00]], [[ 1.1942e-01, -6.0594e+00, -4.5105e+00, -4.3286e+00, -5.3420e+00, -2.9830e+00, -3.4366e+00, -4.0185e+00, -3.8248e+00, -3.1623e+00, -3.0232e+00, -4.6318e+00, -3.1754e+00, -1.6548e+00, -2.8046e+00, -1.6642e+00]], [[ 1.2384e-01, -3.9521e+00, -3.3024e+00, -4.3727e+00, -4.9160e+00, -2.6535e+00, -3.6642e+00, -2.9030e+00, -2.4040e+00, -2.4525e+00, -3.0413e+00, -2.3772e+00, -1.8651e+00, -2.2486e+00, -2.3550e+00, -2.4952e+00]], [[ 4.7822e+00, -3.6263e+00, -4.8302e+00, -6.0787e+00, -4.1201e+00, -2.0028e+00, -2.4223e+00, -1.9985e+00, -2.6905e+00, -4.4435e+00, -5.4286e+00, -4.2058e+00, -2.9334e+00, -1.4214e+00, -2.2534e+00, -9.8091e-01]], [[ 2.9716e+00, -4.0474e+00, -4.6464e+00, -6.0156e+00, -4.6990e+00, -2.4079e+00, -2.1903e+00, -1.4198e+00, -3.9677e+00, -4.2356e+00, -5.4831e+00, -4.5049e+00, -4.0305e+00, -3.9145e+00, -4.0191e+00, -1.6143e+00]]], [[[-8.7994e-01, -7.7366e+00, -7.6953e+00, -7.2013e+00, -7.5607e+00, -7.5404e+00, -7.3813e+00, -6.2638e+00, -6.0058e+00, -5.3517e+00, -4.8871e+00, -3.6984e+00, -1.6300e+00, -1.9084e+00, -2.5100e+00, -3.1130e+00]], [[ 2.8983e+00, -1.6556e+00, -1.7473e+00, -1.9225e+00, -1.5449e+00, -2.1532e+00, 4.6132e-02, -1.1728e+00, -1.4453e+00, -1.3384e+00, -1.3357e+00, -2.3497e+00, -7.4448e-01, -8.4174e-02, -7.2744e-01, -1.9890e+00]], [[ 6.2780e+00, -5.2398e+00, -4.3500e+00, -4.8046e+00, -5.1461e+00, -1.8721e-02, -5.7206e+00, -9.6255e+00, -5.6807e+00, -7.5996e+00, -6.3117e+00, -8.0574e+00, -3.7559e+00, -2.3742e+00, -3.5476e-01, 8.9498e-01]], [[ 1.2815e-01, -4.1805e+00, -3.6303e+00, -4.3606e+00, -4.2073e+00, -2.3145e+00, -2.3347e+00, -2.4719e+00, -7.0145e-01, -1.6559e+00, -2.5210e+00, -2.9563e+00, -2.7105e+00, -3.3608e+00, -3.2623e+00, -3.1426e+00]], [[ 9.8895e-01, -6.2743e+00, -4.6732e+00, -5.2984e+00, -6.4858e+00, -4.9813e+00, -5.1330e+00, -5.0880e+00, -4.0559e+00, -3.6500e+00, -4.0290e+00, -3.9385e+00, -3.5695e+00, -4.0355e+00, -4.1596e+00, -5.1638e+00]], [[ 9.0381e-01, -3.1511e+00, -4.1765e+00, -3.8997e+00, -4.7996e+00, -3.8524e+00, -2.2734e+00, -1.7529e+00, -1.5176e+00, -4.1149e+00, -3.1822e+00, -4.2169e+00, -2.2393e+00, -3.1409e+00, -3.2559e+00, -3.7781e+00]], [[ 1.5639e+00, -2.5200e+00, -3.4932e+00, -3.9712e+00, -3.5038e+00, -2.3602e+00, -1.9688e+00, -2.3780e+00, -2.5562e+00, -3.3541e+00, -4.3043e+00, -4.8523e+00, -4.5844e+00, -4.4467e+00, -4.2511e+00, -4.2473e+00]], [[ 2.8792e+00, -5.5311e+00, -5.4377e+00, -7.2513e+00, -6.3904e+00, -4.1182e+00, -3.4146e+00, -4.6174e+00, -4.0125e+00, -4.8890e+00, -6.2995e+00, -6.2940e+00, -5.7460e+00, -3.7254e+00, -4.2771e+00, -3.8178e+00]], [[-6.7823e-01, -3.8845e+00, -3.6143e+00, -3.5889e+00, -4.1808e+00, -4.0783e+00, -2.1238e+00, -8.6731e-01, -2.9190e+00, -1.9063e+00, -2.6213e+00, -2.7441e+00, -5.6289e-01, -3.3717e+00, -2.8564e+00, -2.8210e+00]], [[-1.8564e-01, -2.4845e+00, -2.5033e+00, -3.4940e+00, -5.2271e+00, -3.8449e+00, -2.9495e+00, -2.3276e+00, -1.9147e+00, -1.9353e+00, -2.7665e+00, -2.7278e+00, -2.4473e+00, -2.9465e+00, -2.5218e+00, -3.4613e+00]], [[ 4.8477e+00, -3.2094e+00, -1.2153e+00, -2.9996e+00, -3.7898e+00, 9.2385e-01, -4.3701e+00, -4.0149e+00, -3.4291e+00, -3.8996e+00, -4.1338e+00, -5.8676e+00, -3.0563e+00, -1.4804e+00, 4.6438e-01, 8.2957e-01]], [[ 2.9432e+00, -4.5383e+00, -5.8720e+00, -5.6649e+00, -5.1682e+00, -1.6734e+00, -4.4364e+00, -4.6925e+00, -5.7110e+00, -4.6430e+00, -4.8236e+00, -6.2457e+00, -4.5668e+00, -3.8549e+00, -4.5283e+00, -4.5010e+00]]], [[[-2.7589e-01, -7.7971e+00, -8.9773e+00, -5.9530e+00, -7.7824e+00, -7.5779e+00, -7.9294e+00, -6.8523e+00, -7.9685e+00, -7.4609e+00, -8.3284e+00, -5.6110e+00, -4.9753e+00, -2.2932e+00, -3.9850e-01, -3.2152e+00]], [[ 2.5037e+00, -1.5028e+00, -5.7028e-01, -1.0334e+00, 3.1473e-02, -1.6359e+00, -9.6744e-01, 4.7207e-01, -6.1717e-01, -2.8244e+00, -1.8108e+00, 9.2192e-01, -1.5811e+00, -2.5928e+00, -2.3613e+00, 6.7898e-01]], [[ 6.3480e+00, -1.2204e+00, -4.2754e+00, -2.9144e+00, -4.3481e+00, -1.1074e+00, -2.0222e+00, -3.9089e+00, -4.4580e+00, -2.7088e+00, -7.2260e+00, -2.3928e+00, -5.2227e+00, -3.8177e+00, -4.7365e+00, 5.0683e-01]], [[ 2.7531e-01, -3.6860e+00, -3.6664e+00, -4.1306e+00, -4.4694e+00, -4.0422e+00, -3.5167e+00, -2.5454e+00, -3.7537e+00, -3.8977e+00, -3.6261e+00, -2.5356e+00, -1.8979e+00, -2.0974e+00, -2.3307e+00, -1.1150e+00]], [[ 5.8067e-01, -4.6942e+00, -4.2450e+00, -3.0922e+00, -3.7310e+00, -5.1359e+00, -4.2854e+00, -5.8222e+00, -4.7508e+00, -4.4476e+00, -4.1634e+00, -3.1514e+00, -2.4858e+00, -2.4897e+00, -2.0404e+00, -1.3048e+00]], [[ 1.2804e+00, -2.8332e+00, -3.3726e+00, -2.7259e+00, -3.0673e+00, -4.1651e+00, -1.7321e+00, -2.6382e+00, -3.5765e+00, -3.8367e+00, -1.8132e+00, -2.1826e+00, -2.0222e+00, -1.9807e+00, -2.2032e+00, -1.6546e+00]], [[ 1.3784e+00, -2.6486e+00, -3.1737e+00, -2.2245e+00, -2.6742e+00, -1.9660e+00, -2.0855e+00, -2.6247e+00, -2.8134e+00, -2.7481e+00, -2.9911e+00, -2.4218e+00, -2.2899e+00, -1.3817e+00, -2.6552e+00, -3.3166e+00]], [[ 3.2440e+00, -2.3911e+00, -3.0869e+00, -3.1902e+00, -1.9548e+00, -9.7300e-01, -7.9257e-01, 1.9606e-01, -1.4429e+00, -2.2535e+00, -2.2673e+00, -4.7834e-01, -1.7392e+00, -2.6837e+00, -2.1275e+00, 3.8867e-01]], [[-2.4339e-02, -4.3562e+00, -4.9754e+00, -4.4632e+00, -4.1906e+00, -3.9316e+00, -2.7406e+00, -3.1014e+00, -5.0835e+00, -4.4606e+00, -3.9120e+00, -2.6509e+00, -2.6637e+00, -2.7706e+00, -3.0190e+00, -2.7955e+00]], [[ 1.2503e-01, -2.9513e+00, -3.1090e+00, -2.8879e+00, -4.2642e+00, -4.5904e+00, -5.0024e+00, -3.0882e+00, -3.7770e+00, -5.5427e+00, -5.7099e+00, -9.3002e-01, -8.7145e-01, -6.2740e-01, -1.7052e-03, -1.6010e+00]], [[ 3.5263e+00, -2.7283e+00, -1.6750e+00, -1.8539e+00, -1.8566e+00, -2.0467e+00, -1.0090e+00, -3.0959e+00, -1.3910e+00, -2.5858e+00, -6.6013e+00, -2.7959e+00, -3.6870e+00, -4.6964e+00, -5.0621e+00, -1.1527e-01]], [[ 3.0190e+00, -1.3411e+00, -3.6362e+00, -1.1136e+00, -3.3308e+00, -2.5032e+00, -1.8478e+00, -1.3101e+00, -4.0266e+00, -2.9029e+00, -3.9031e+00, -5.1462e-01, -3.2480e+00, -9.9369e-01, -2.2395e+00, -1.8795e+00]]], [[[-5.6351e-01, -6.1682e+00, -7.1759e+00, -7.8474e+00, -7.1501e+00, -6.3867e+00, -7.8542e+00, -7.1283e+00, -8.2754e+00, -7.0712e+00, -6.2894e+00, -8.0030e+00, -3.4125e+00, -2.0030e+00, -1.3476e+00, -3.7602e+00]], [[ 2.7100e+00, -1.6195e+00, -2.3492e+00, -2.7692e+00, -1.8538e+00, -6.8566e-01, -7.1182e-01, -2.5322e-01, -1.5178e+00, 1.0435e-01, -5.1175e-01, -5.2709e-01, 8.5446e-01, 8.2994e-04, -3.4094e-01, -1.7197e+00]], [[ 5.8936e+00, -3.1607e+00, -4.5714e+00, -3.9409e+00, -3.1566e+00, -1.9662e+00, -5.0316e+00, -5.5996e+00, -3.4817e+00, -3.2413e+00, -2.5587e+00, -7.4356e+00, -4.3913e+00, -2.0248e+00, 7.6693e-01, -1.8217e+00]], [[ 7.1803e-01, -4.3296e+00, -4.2460e+00, -4.7145e+00, -4.3249e+00, -3.7916e+00, -3.8346e+00, -4.2333e+00, -4.3669e+00, -4.1513e+00, -4.8899e+00, -4.2356e+00, -2.2571e+00, -2.9465e+00, -2.2208e+00, -3.2026e+00]], [[ 1.3452e+00, -5.6628e+00, -5.3424e+00, -5.1231e+00, -4.5469e+00, -5.8958e+00, -4.9193e+00, -5.4557e+00, -5.7131e+00, -5.7265e+00, -5.6803e+00, -5.5883e+00, -4.1552e+00, -4.0779e+00, -4.4622e+00, -3.9774e+00]], [[ 1.1197e+00, -2.6411e+00, -2.3822e+00, -3.3850e+00, -3.0363e+00, -2.5772e+00, -1.2728e+00, -1.5919e+00, -2.3727e+00, -2.9226e+00, -3.5800e+00, -3.2467e+00, -6.6088e-01, -1.2599e+00, -1.2934e+00, -2.8656e+00]], [[ 1.3720e+00, -1.8878e+00, -2.8303e+00, -3.2471e+00, -3.5812e+00, -2.3049e+00, -2.4398e+00, -2.4991e+00, -2.2098e+00, -2.7363e+00, -2.7918e+00, -3.2450e+00, -1.6617e+00, -1.9263e+00, -2.0803e+00, -2.5491e+00]], [[ 3.4163e+00, -1.2147e+00, -2.3249e+00, -3.7392e+00, -2.5183e+00, -2.3529e+00, -2.1406e+00, -2.7275e+00, -3.6358e+00, -3.2644e+00, -3.6620e+00, -3.3008e+00, -1.3944e+00, -1.3739e+00, -1.1660e+00, -1.4734e+00]], [[ 1.4726e-01, -5.0090e+00, -5.5121e+00, -4.9802e+00, -4.5086e+00, -4.6080e+00, -2.4488e+00, -3.3358e+00, -5.6188e+00, -5.5760e+00, -5.3147e+00, -4.3703e+00, -2.7058e+00, -2.4909e+00, -2.5226e+00, -3.8483e+00]], [[ 6.8862e-01, -3.1726e+00, -4.1058e+00, -4.8942e+00, -5.6023e+00, -3.9714e+00, -4.5896e+00, -4.0125e+00, -6.2653e+00, -7.3522e+00, -5.7111e+00, -6.1066e+00, -1.1043e+00, -1.6993e-01, -1.3763e-01, -1.4471e+00]], [[ 4.2702e+00, -4.2242e+00, -5.3937e+00, -4.3692e+00, -3.1257e+00, -2.6543e+00, -5.2902e+00, -5.0220e+00, -5.7634e+00, -2.3586e+00, -2.0249e+00, -7.0600e+00, -3.2300e+00, -2.3861e+00, -9.4171e-01, -2.0809e+00]], [[ 3.2605e+00, -3.5551e+00, -3.6347e+00, -3.3967e+00, -3.0734e+00, -2.4364e+00, -4.9617e+00, -5.8958e+00, -5.0411e+00, -3.9716e+00, -3.3476e+00, -7.1194e+00, -4.8362e+00, -5.0480e+00, -4.8321e+00, -2.8326e+00]]]]) attn_weights tensor([[[[ 1.2317, -1.0587, -2.4639, -2.8337, -3.5423, -4.6972, -3.2444, -2.9204, -2.7121, -3.5378, -4.5158, -4.1310, -4.1979, -4.0610, -3.6249, -1.7957]], [[ 4.2781, 0.3922, -1.0990, -0.0277, 0.0223, -1.0219, -2.5230, -0.2320, -1.8736, -0.9798, -1.1368, -1.2726, -1.9083, -1.4151, -1.4044, -1.2123]], [[ 1.7837, -0.0926, -1.4950, -1.1075, -0.9957, -0.4218, -1.2928, -0.2505, -1.2075, -1.3248, -2.0081, -1.7801, -1.0794, -0.8319, -1.2906, -1.0210]], [[ 1.8130, -1.1293, -2.0175, -1.5068, -1.9443, -1.8373, -2.2551, -0.7646, -2.5694, -2.2502, -3.2515, -3.0772, -2.5166, -1.8834, -2.5432, -1.2602]], [[-0.7476, -5.9865, -7.1265, -7.0912, -5.4667, -3.8047, -3.2507, -4.3906, -5.6087, -5.0814, -5.0671, -3.8095, -3.6549, -2.4706, -0.3508, -3.9573]], [[-1.7736, -3.0758, -3.9071, -3.7249, -3.6674, -3.8722, -3.9264, -2.6508, -2.5739, -2.8064, -1.6715, -2.3476, -2.6319, -2.7308, -2.6076, -3.3871]], [[ 3.5698, -0.1594, -2.6296, -3.5116, -3.9449, -0.7476, -1.1082, -1.1934, -2.1284, -3.5652, -2.8006, -2.3242, -0.8965, -0.6811, -3.2901, -1.0617]], [[-0.9079, -7.3077, -7.4832, -7.7393, -6.5527, -2.4593, -2.8562, -4.6003, -5.1115, -5.2298, -3.0753, -3.3939, -2.1500, -0.8055, 0.3671, -2.5431]], [[ 0.5922, -2.7814, -3.4274, -3.9051, -4.5475, -1.7158, -1.9339, -2.9493, -3.3452, -3.8771, -2.8039, -3.2931, -1.6641, -1.5574, -1.7622, -1.9418]], [[ 1.2347, -3.5315, -3.8292, -3.6319, -2.9857, -1.6110, -2.0806, -2.4384, -3.2138, -3.2078, -2.3102, -2.3639, -1.9260, -0.7829, -1.9771, -2.2479]], [[ 1.0161, -1.6260, -2.2668, -2.9185, -3.2417, -2.8112, -3.5523, -2.4466, -2.5050, -3.2438, -3.5499, -3.3169, -3.2380, -2.6274, -1.9479, -1.9049]], [[ 0.7190, -2.7667, -3.3560, -3.4791, -3.4136, -2.8643, -3.4072, -2.8783, -3.7328, -4.0221, -3.8948, -4.0859, -4.2839, -3.4284, -3.6197, -3.8808]]], [[[ 1.4444, -3.2336, -3.9864, -3.2268, -3.9542, -3.2427, -2.0609, -2.4680, -2.7404, -3.3431, -2.8866, -3.7301, -2.3405, -2.6991, -2.4672, -2.5058]], [[ 4.9143, -2.6520, -2.8203, -3.9166, -1.2961, -1.3101, -2.3399, -0.0276, -1.0471, -2.3596, -3.0425, -2.6972, -1.4610, -0.4429, -0.1205, 0.6753]], [[ 1.7632, -1.9160, -2.9535, -2.5354, -2.0623, -2.2025, -1.7663, -1.5552, -1.0624, -2.4423, -1.8404, -1.8806, -1.5176, -1.9061, -1.4295, -1.6450]], [[ 2.1729, -3.1551, -2.9425, -2.8241, -2.4792, 0.2212, -1.1746, -0.8188, -1.7289, -2.4623, -2.6627, -3.9882, -3.2681, -2.4170, -1.9945, -0.6113]], [[ 0.3748, -6.9619, -6.8854, -6.4591, -4.4880, -5.3191, -5.0899, -5.8798, -5.2818, -6.6194, -5.9222, -5.6372, -4.3036, -4.2776, 2.0588, -2.9734]], [[-1.5296, -4.8085, -4.8266, -4.9161, -4.8699, -4.7175, -5.3125, -4.2697, -3.7966, -3.8502, -3.8608, -3.2381, -2.8797, -2.6244, -2.3684, -4.0377]], [[ 3.3141, -3.7618, -3.2261, -3.5495, -3.6474, -3.0039, -3.7603, -3.5615, -3.1420, -4.1071, -3.8236, -4.9547, -4.2578, -1.2632, -0.6114, -1.3026]], [[-0.6914, -7.9907, -6.9745, -7.5823, -6.3298, -7.0429, -6.9031, -7.0494, -5.7775, -5.1372, -5.1159, -6.3246, -4.3472, -2.0153, 0.0246, -3.8443]], [[ 1.1434, -3.7381, -3.4695, -3.4886, -3.0945, -1.1641, -1.5280, -2.2054, -3.0382, -3.8358, -3.5205, -5.3358, -3.2936, -2.5377, -2.2853, -0.9612]], [[ 1.7466, -5.0014, -5.1077, -5.8938, -4.4022, -0.7529, -1.6741, -3.7526, -4.7972, -4.3916, -5.2886, -5.5457, -4.7076, -4.3567, -3.6589, -0.6789]], [[ 1.0678, -3.8094, -3.6997, -4.3403, -3.3033, -1.4715, -1.8604, -1.6968, -2.4031, -3.2853, -3.7608, -4.0326, -2.7180, -2.6938, -2.2033, -1.3900]], [[ 0.9371, -4.0116, -3.2850, -3.8741, -3.5743, -2.2976, -2.7055, -2.9783, -4.1997, -3.4090, -4.2831, -5.5436, -4.5387, -3.9642, -4.2226, -3.2646]]], [[[ 1.1402, -3.4143, -3.0003, -3.2463, -2.8602, -5.4578, -2.6523, -3.7509, -3.3414, -2.6368, -3.7623, -3.0748, -2.3930, -2.7065, -3.1818, -1.7011]], [[ 5.2906, -2.5183, -5.3016, -4.5236, -3.9360, -0.8943, -2.7506, -3.3061, -4.2205, -4.8865, -4.0706, -4.6707, -1.7303, 1.0073, 2.7373, 1.2678]], [[ 2.0829, -1.9480, -2.4991, -2.9686, -2.2502, -1.0810, -1.0339, -2.4036, -2.1749, -2.9201, -3.2691, -3.5077, -2.5592, -1.9043, -2.8960, -1.9364]], [[ 2.6717, -1.9060, -2.7155, -3.5327, -3.7850, -3.4531, -1.0131, -1.2188, -1.4699, -3.2119, -3.8473, -4.7684, -3.7096, -3.9734, -4.9017, -3.6013]], [[ 0.1147, -5.2692, -5.4592, -6.1878, -6.8249, -5.4936, -4.5143, -4.9537, -5.0846, -4.6271, -3.0051, -1.6584, -0.8145, -1.3243, -1.0770, -1.3984]], [[-1.7052, -4.1157, -4.0511, -4.5061, -5.9371, -4.0045, -3.7985, -3.9399, -2.7894, -3.3533, -3.9363, -3.2852, -2.8152, -2.9987, -3.9292, -4.2057]], [[ 3.3490, -3.7423, -5.3308, -6.6975, -5.7448, -3.7665, -3.2362, -3.8631, -4.0068, -4.9756, -7.2467, -7.5427, -3.5326, -2.8410, -0.9840, -2.2799]], [[-0.9867, -6.4985, -5.5455, -7.2681, -6.9872, -6.7429, -6.4075, -6.1692, -4.2408, -3.2637, -2.1448, -2.6188, -0.2783, -1.4317, -2.1223, -1.7092]], [[-0.2803, -1.8791, -2.4381, -2.2509, -2.2510, -1.0544, -0.4503, -0.1478, -1.1424, -2.0886, -4.0439, -3.6286, -2.6112, -2.6678, -1.8335, -2.4020]], [[ 0.7995, -3.7240, -2.9421, -3.2669, -2.1046, -1.2075, -0.7200, -2.0802, -3.4407, -2.7303, -3.5328, -4.6524, -3.4017, -4.4362, -4.2909, -4.0428]], [[ 1.0243, -3.9769, -4.5946, -4.7990, -3.4136, -2.3925, -2.5410, -2.9534, -2.8319, -3.6218, -4.5809, -3.1166, -2.1789, -2.6154, -1.8065, -1.3416]], [[ 0.9243, -3.0371, -5.1467, -4.4028, -4.2291, -2.4544, -2.6484, -2.9440, -3.8201, -5.2988, -5.7948, -6.1299, -4.4913, -4.7486, -4.2650, -4.7233]]], [[[ 1.3363, -2.2856, -3.2488, -3.3996, -3.1066, -3.1366, -1.7987, -2.4960, -2.5921, -3.0435, -1.6050, -1.3189, -1.8946, -2.0095, -2.7070, -2.9467]], [[ 4.1839, -1.3560, -2.0239, -0.5727, 0.2054, -1.5138, -0.8190, -1.3020, -0.2473, -2.3278, -3.1414, -1.2498, -0.4094, 0.2589, -0.2346, 0.7247]], [[ 2.0770, -0.0901, -1.4652, -1.3020, -0.7664, -1.3970, -1.3488, -0.0438, -0.3505, -1.7558, -1.7809, 1.2067, -0.0308, -0.0736, -0.0969, -1.7101]], [[ 1.7039, -2.9349, -3.1987, -2.3271, -2.1652, -2.9906, -2.7681, -2.1339, -3.0752, -4.1095, -3.6055, -0.4357, -2.1952, -1.7730, -1.0469, -0.5405]], [[ 0.3145, -5.7950, -6.0242, -5.4270, -6.4253, -4.8766, -3.7811, -5.8452, -6.6449, -5.7447, -4.3925, -4.0945, -3.4157, -1.1838, 0.2286, -1.6346]], [[-1.0162, -3.9010, -5.2639, -5.0704, -5.2895, -5.2867, -5.3888, -5.4423, -5.7030, -5.4741, -4.8705, -3.0527, -2.5876, -2.7218, -0.6549, -2.2049]], [[ 3.3623, -2.2868, -2.7332, -3.3735, -2.4471, -2.9374, -2.0781, -1.6863, -2.3111, -4.5159, -2.1278, -2.2121, -1.8929, -1.4222, -1.6073, -1.1221]], [[-0.6088, -7.8471, -6.1152, -4.9207, -5.4178, -4.9220, -4.9914, -6.2975, -5.7519, -6.0923, -5.1956, -3.7840, -1.2891, -0.2837, 0.0221, -2.9586]], [[ 0.0716, -2.7516, -2.5930, -2.4430, -1.8796, -1.8911, -1.5557, -0.9662, -2.4736, -2.1881, -1.3768, -1.2487, -2.3646, -2.2617, -2.8754, -1.4697]], [[ 1.2780, -3.1650, -3.0787, -3.2203, -2.1982, -2.3478, -1.5872, -1.8215, -2.0084, -1.6771, -1.9913, -1.4877, -2.4017, -2.6294, -2.6643, -1.4304]], [[ 1.0179, -3.4837, -3.8672, -3.7178, -3.0531, -3.0942, -2.8646, -2.4476, -2.8883, -3.7667, -2.8953, -1.6697, -2.4942, -2.4196, -2.1502, -1.4954]], [[ 0.8975, -2.8480, -4.1393, -3.8190, -3.7183, -3.4105, -3.2217, -2.8698, -4.1100, -5.0871, -3.8192, -3.1826, -2.8120, -2.3485, -3.9855, -4.3810]]], [[[ 0.9664, -3.7128, -3.4143, -4.0572, -3.6940, -5.1127, -3.0884, -3.6918, -4.3796, -3.3253, -4.4096, -3.4335, -2.5674, -2.2569, -1.3890, -1.7483]], [[ 4.4022, -3.2000, -2.6664, -2.1382, -1.1486, -1.9821, -3.2937, -3.4691, -0.9660, -1.2716, -2.8167, -4.1250, -1.9062, -1.4910, -0.4732, -2.2422]], [[ 1.4285, -1.3591, -2.0360, -2.6377, -2.3753, -1.3608, -1.2907, -2.1004, -1.9538, -2.3576, -1.3422, -2.1179, -1.1896, -1.4469, -0.6234, -1.9862]], [[ 1.9063, -2.0605, -1.4485, -2.4460, -1.4799, 0.8412, 0.6507, -0.2308, -1.2697, 0.4096, -2.4569, 1.3678, 0.0824, -0.6859, -0.5250, -0.8542]], [[ 0.6493, -5.2011, -6.6037, -6.0123, -5.6392, -3.9097, -3.2022, -4.5340, -7.3539, -6.4593, -4.2874, -4.4641, -3.7310, -3.3682, -2.7223, -4.2979]], [[ 0.0199, -4.1248, -5.3993, -5.4572, -6.7902, -4.8438, -4.5847, -5.4135, -6.5771, -8.0017, -6.6080, -6.6773, -3.2030, -1.6767, -1.7663, -3.7389]], [[ 2.6750, -3.1157, -2.8455, -4.4747, -3.6968, -2.2824, -3.0652, -3.9246, -3.3167, -3.6676, -4.4946, -4.3653, -2.4585, -1.5584, -0.9641, -1.5794]], [[ 0.1552, -5.8261, -7.2906, -6.8548, -6.4814, -4.6921, -4.5624, -5.1801, -6.1442, -6.9504, -6.3953, -5.9016, -3.7922, -2.9338, -2.7374, -3.3248]], [[ 0.3568, -1.0417, -2.2358, -2.6235, -2.4215, -0.6758, -1.2960, -1.4072, -2.4012, -2.1588, -1.4681, -2.2877, -0.2555, -2.0000, -1.1429, -2.1092]], [[ 0.5637, -3.0687, -2.2123, -3.0273, -2.0216, -0.8611, -0.5931, -1.2134, -1.8171, -1.7701, -1.2291, -1.1113, -0.5224, -1.7992, -0.7579, -1.4794]], [[ 1.1754, -3.4639, -3.2554, -3.7808, -2.9349, -1.3636, -2.0607, -2.6714, -2.3471, -2.0180, -3.1052, -2.9363, -2.2940, -2.5989, -2.3241, -1.6881]], [[ 1.0389, -3.1259, -3.4988, -4.2382, -3.6006, -1.5287, -2.3267, -3.6077, -6.1842, -4.8605, -1.9132, -4.0488, -2.5847, -2.5269, -2.8676, -3.6246]]]]) attn_weights tensor([[[[ 2.6810, -2.2078, -4.0078, -3.8065, -3.9813, 0.1595, -0.1269, -2.9748, -5.4162, -4.5402, -2.0382, -2.8818, -2.4734, -0.4690, -1.8966, -2.1080]], [[ 2.9660, -0.9476, -2.4238, -2.7449, -1.5579, -2.4172, -2.4439, -0.7890, -2.8577, -3.3277, -3.3259, -1.7239, -0.3640, -2.5638, -1.1947, -0.7960]], [[ 2.1886, -3.1387, -3.7786, -3.9663, -3.3155, 0.0813, -0.9659, -2.4743, -4.6321, -4.1803, -3.2636, -3.0342, -1.8635, -0.4447, -2.8115, -1.3672]], [[-1.2061, -3.0977, -5.1937, -5.1067, -5.4213, -3.4113, -2.6868, -2.7626, -4.4430, -4.8212, -4.5407, -4.1389, -3.9208, -2.1900, -2.8513, -3.9359]], [[ 3.0505, -0.0367, -3.6750, -2.8296, -2.5835, -0.6172, -1.5592, -2.2169, -4.0183, -2.5998, -3.3605, -2.4113, -2.4885, -1.1159, -2.4224, -0.4884]], [[ 1.6049, -1.6667, -2.9887, -2.9618, -2.2845, -1.8044, -2.6581, -1.2854, -2.3622, -2.9308, -3.1652, -2.8044, -3.4617, -1.6057, -2.0000, -2.7007]], [[ 3.1694, -1.3456, -3.7447, -3.4833, -3.6696, -0.0496, -0.0204, -0.9067, -3.9320, -3.4323, -2.5560, -4.3014, -2.6089, -1.1878, -3.2926, -2.0603]], [[ 0.3264, -3.2584, -4.2330, -4.3337, -3.9565, -3.6102, -3.4550, -3.1111, -4.6671, -4.3821, -4.2114, -3.5100, -2.8995, -3.2309, -4.5295, -3.2247]], [[ 1.8540, -2.9277, -3.2371, -2.2742, -2.6514, -0.3214, -1.4446, -1.9466, -3.3054, -1.8856, -3.1786, -2.2887, -2.6911, -0.9447, -1.8397, -2.5653]], [[ 4.3110, -0.8681, -2.5753, -2.7470, -2.1036, 0.8280, 0.7008, -1.7820, -3.1776, -3.0005, -1.7801, -2.2268, -1.1853, -0.1304, -1.0158, -1.4292]], [[-0.1514, -4.3891, -3.9630, -3.2843, -3.0255, -2.9901, -2.0884, -3.0602, -3.4092, -2.5605, -1.6159, -1.6962, -1.0717, -1.9015, -0.7588, -1.8293]], [[ 3.3707, -0.2875, -2.4695, -2.1890, -2.1753, -2.6865, -3.0244, 0.3332, -2.2397, -2.1281, -1.8525, -0.9432, -2.0147, -2.8075, -1.4672, -1.5395]]], [[[ 2.7257, -3.0042, -2.7337, -2.4617, -3.5635, -0.7594, -1.0330, -1.9841, -3.4240, -3.2244, -2.7631, -5.2154, -4.0936, -3.0374, -3.2033, -1.1786]], [[ 3.8311, -1.9633, -3.0019, -3.7784, -2.6098, -2.3663, -1.3966, -1.8236, -2.0198, -3.1986, -3.5121, -4.4326, -2.7558, -2.4527, -0.7822, -2.1480]], [[ 3.0945, -3.1794, -2.9189, -3.5524, -3.2171, -1.6115, -1.8286, -2.0249, -3.2748, -3.7956, -4.2537, -5.1864, -4.1581, -4.0492, -3.5950, -1.0000]], [[-0.5378, -4.9805, -5.3883, -6.2997, -6.0077, -6.2398, -5.9697, -4.4627, -4.3727, -4.2558, -4.7307, -4.7941, -3.1720, -3.1371, -2.1704, -4.8807]], [[ 2.9863, -2.1761, -4.1809, -4.2558, -3.1674, -1.5544, -3.0940, -2.2172, -2.9010, -4.0111, -3.5514, -3.4223, -3.1880, -1.4133, -1.6074, -1.4474]], [[ 1.7727, -4.2037, -4.9746, -5.3315, -4.2345, -3.4204, -3.3405, -2.7141, -3.4342, -4.2404, -4.7388, -4.5878, -3.3582, -3.8822, -3.0919, -2.9317]], [[ 4.0227, -1.5806, -3.3137, -3.6123, -2.6997, -0.8105, -0.9387, -1.0245, -2.1578, -2.4530, -2.8628, -2.2220, -1.5671, -1.7263, -2.3940, -0.5300]], [[ 0.3314, -3.8872, -3.8818, -4.0296, -3.9970, -4.5365, -3.7600, -3.2357, -3.8291, -4.2132, -3.9746, -4.7103, -3.4566, -3.6709, -2.9882, -3.5826]], [[ 2.8169, -3.2754, -3.4948, -2.9521, -3.1569, -1.4620, -2.0827, -3.3688, -2.9978, -3.9019, -2.7677, -3.8253, -2.4764, -3.2925, -2.7842, -1.3451]], [[ 4.7649, -1.0636, -3.0157, -3.5691, -1.9619, -0.3974, -0.5464, -0.9586, -1.4908, -2.8435, -3.3086, -2.6289, -1.2886, -2.1085, -1.8456, -0.3183]], [[ 1.4849, -7.5706, -6.6995, -6.8562, -5.4551, -3.5574, -4.1476, -6.8640, -5.6389, -4.9292, -4.9563, -3.3266, -1.8745, -1.5396, 0.5325, -1.2982]], [[ 3.3592, -1.3578, -3.5190, -3.5432, -2.6265, -3.3404, -2.5712, -1.3035, -2.0462, -3.7706, -3.3673, -3.9921, -2.3763, -3.2437, -2.6477, -2.9929]]], [[[ 1.1194, -1.7187, -0.7860, -1.0574, -1.6914, 0.8241, 0.9403, -1.1347, -2.1428, -0.6258, -2.9882, -1.4077, -1.1488, -2.9180, -1.8642, -2.2467]], [[ 4.1402, -3.0970, -5.3284, -4.8509, -4.5542, -1.7569, -1.9056, -4.6251, -3.7557, -5.2939, -4.8823, -4.2479, -2.3014, -0.3971, -0.9427, -1.0824]], [[ 0.9025, -3.0377, -2.7172, -3.1681, -2.2953, -1.1568, -1.0220, -1.0277, -2.7937, -2.5597, -3.4181, -2.8312, -1.2388, -1.9367, -1.6726, -2.2775]], [[-1.3232, -4.5196, -3.9919, -5.0811, -6.4724, -4.5170, -4.2068, -3.8439, -1.8539, -2.6205, -3.3593, -1.8206, -1.7332, -1.3563, -1.8739, -2.4099]], [[ 3.2572, -3.0127, -4.1489, -4.1566, -4.2455, -2.3091, -1.6497, -3.8239, -3.8885, -4.9607, -5.0023, -4.5788, -4.0925, -2.6184, -3.0274, -2.3803]], [[ 1.8800, -3.3186, -3.7509, -3.9503, -3.6009, -2.2320, -3.0399, -4.0641, -4.3090, -3.5849, -5.2994, -3.7654, -2.2266, -3.5300, -3.5150, -2.2455]], [[ 3.6621, -3.2369, -3.4491, -3.4085, -4.9009, 0.2993, -0.4891, -4.7768, -4.0254, -4.7081, -4.8633, -4.9433, -2.5627, -2.5042, -2.6271, -2.6095]], [[ 0.5028, -4.4287, -4.8240, -5.3890, -5.2628, -1.7879, -2.2901, -3.3309, -3.6209, -4.7801, -6.1167, -5.5587, -3.6766, -3.8181, -3.9275, -3.8717]], [[ 1.5290, -3.5387, -3.6000, -2.8764, -3.0115, -0.1401, -0.9320, -2.4810, -2.4693, -3.2784, -4.0217, -3.1976, -2.4516, -3.4937, -3.2174, -2.6809]], [[ 4.4905, -2.3055, -2.9201, -2.8905, -4.4333, 0.2391, 0.5573, -4.7929, -3.4481, -5.3811, -4.0849, -4.3992, -1.8778, -1.9199, -2.4967, -2.2484]], [[ 0.6164, -5.4160, -4.5928, -5.5165, -5.0091, -3.5942, -3.5974, -5.0466, -3.9140, -2.7721, -2.1023, -1.5229, 0.6369, 0.9368, -0.4545, -0.5798]], [[ 3.4252, -2.3128, -3.9613, -2.8057, -2.8009, -1.6164, -1.7056, -3.8191, -5.0595, -4.9013, -5.7776, -5.1903, -3.1850, -3.8149, -4.5989, -3.2718]]], [[[ 2.0409, -3.9311, -3.4350, -3.6930, -2.6575, -0.6084, -0.6170, -2.4318, -3.3167, -2.1066, -1.7105, -3.2106, -2.7999, -3.9764, -4.2917, -2.6361]], [[ 4.2783, -0.8257, -3.0401, -2.9817, -0.9778, -4.1469, -2.0790, -1.4106, -1.4628, -2.4907, -3.9359, -3.4496, -3.0397, -2.7915, -1.6387, 0.0148]], [[ 1.9861, -3.7989, -3.2981, -3.9585, -2.1957, -2.2889, -2.2932, -1.9079, -2.3247, -2.5477, -2.5505, -2.5583, -3.0142, -3.9204, -3.0744, -0.2123]], [[-0.7172, -4.9585, -5.8922, -5.6939, -6.5906, -4.9243, -4.9084, -5.2259, -6.0583, -5.4215, -4.9390, -1.7555, -3.2937, -2.6937, -1.7762, -3.1765]], [[ 3.4147, -1.9038, -3.2778, -2.9578, -2.7169, -1.8927, -2.6587, -2.5567, -4.0037, -4.1335, -3.9368, -2.7184, -3.7384, -4.2744, -2.8611, -1.7572]], [[ 1.8414, -2.9281, -3.6971, -3.9471, -3.1834, -3.6058, -2.6043, -2.3931, -3.4300, -4.4914, -2.8061, -1.3973, -2.6704, -2.7551, -2.2177, -1.8662]], [[ 3.7633, -2.1340, -3.4636, -2.3567, -2.7861, -1.4192, -1.0781, -2.0753, -3.2389, -2.3905, -2.8552, 0.2356, -2.9529, -3.2073, -3.2967, -1.4888]], [[ 0.4992, -3.7886, -4.2954, -4.2618, -3.9489, -3.6345, -2.8564, -2.5288, -3.2642, -3.2397, -3.2189, -3.1869, -3.6705, -3.5147, -4.7496, -4.4310]], [[ 2.0733, -3.3264, -3.5833, -2.2357, -2.5654, -2.1128, -2.6102, -2.5298, -2.7698, -2.7013, -2.2746, -1.2978, -2.5685, -1.2008, -1.4031, -3.3965]], [[ 4.8025, -1.5180, -2.2714, -2.2541, -1.8118, -1.2006, 0.9183, -1.7685, -1.6650, -2.2791, -1.2952, -0.9321, -2.7995, -2.8899, -2.4937, -0.5341]], [[ 1.1064, -6.2962, -7.4728, -5.8999, -5.4448, -3.5776, -4.2481, -6.3818, -5.0392, -3.5330, -4.4704, -4.7084, -4.0286, -2.7596, 0.0151, -0.6787]], [[ 3.8668, 0.0902, -1.7463, -1.4793, -1.3409, -3.3981, -2.5224, 0.1426, -1.3777, -4.0985, -3.6903, 2.0288, -0.1111, -1.1519, -1.7125, -2.0087]]], [[[ 2.1446, -2.0733, -2.5401, -2.9198, -2.8383, 0.0202, 0.0734, -2.6636, -3.7980, -3.4128, -0.2821, -0.9850, -1.2983, -2.4749, -0.6661, -2.3850]], [[ 3.8526, -1.6814, -3.3974, -4.4281, -2.1717, -1.7299, -1.9929, -2.7904, -1.2245, -1.2807, -1.7556, -3.4751, -0.8979, -2.1623, -0.5649, -1.4012]], [[ 1.8354, -3.2302, -3.6785, -3.7976, -3.4262, -1.3273, -1.1749, -2.9355, -3.3732, -2.7634, -0.3170, -1.3913, -0.9708, -1.6417, -0.7110, -3.3112]], [[ 0.1728, -3.5589, -4.9573, -5.1575, -6.3290, -4.5024, -4.0740, -4.0436, -5.0683, -5.8604, -5.4121, -5.2644, -2.2546, -1.6060, -1.0403, -3.4390]], [[ 2.6520, -1.8057, -2.3548, -3.2042, -1.9116, 0.8248, 0.2771, -0.7564, -2.4411, -1.1104, -2.2929, -0.1363, -0.7125, -1.1442, 0.0239, -2.3606]], [[ 1.9281, -2.3429, -2.8829, -3.3149, -3.0349, -1.5005, -2.3194, -3.2091, -3.4436, -2.8073, -2.8548, -3.1761, -3.4905, -4.2761, -2.1712, -0.9984]], [[ 3.3432, -2.9017, -3.2813, -3.4045, -2.9464, 0.6996, -0.0687, -3.4760, -2.5879, -1.8144, 0.7058, -2.3845, -3.2889, -2.6122, -0.8522, -2.0983]], [[ 0.3592, -2.7768, -3.6187, -3.8901, -2.9546, -2.6002, -3.4182, -2.8378, -2.4757, -2.9709, -4.9094, -4.8093, -2.8149, -3.6249, -2.8712, -4.0141]], [[ 1.5295, -2.7027, -3.3722, -3.3682, -3.2345, 0.8575, -0.1483, -2.8099, -4.2612, -3.7064, 0.4828, -0.7286, -1.6313, -1.6167, -0.7314, -2.0552]], [[ 3.6799, -2.1373, -2.1619, -3.1901, -1.6511, -0.2508, -1.5005, -3.1449, -2.4164, -0.2948, 0.9298, -3.2904, -2.1755, -1.4768, -1.4453, -1.6869]], [[ 1.4439, -3.0494, -4.1208, -4.2730, -4.5957, -4.4000, -3.6400, -2.7619, -3.4565, -4.7068, -5.3374, -4.7332, -0.4101, -1.6261, -0.5137, -2.3605]], [[ 3.7572, -0.7765, -2.8496, -1.7304, -1.3392, -1.0068, -2.2840, -4.3057, -4.0739, -1.6649, -1.7114, -3.2360, -3.2566, -3.4748, -1.5121, -2.7686]]]]) attn_weights tensor([[[[ 2.6274e+00, -2.4994e+00, -4.2999e+00, -3.5429e+00, -4.2968e+00, 3.0291e-01, -1.1851e+00, -2.6772e+00, -4.8482e+00, -3.9163e+00, -1.5047e+00, -3.4970e+00, -3.2836e+00, 3.6874e-01, -2.6784e+00, -3.1103e+00]], [[ 3.8779e+00, 1.9592e-01, -2.4529e+00, 1.4168e-01, -1.8967e+00, 1.2841e+00, -4.3194e-01, -7.4861e-01, -3.3568e+00, 3.3203e-02, -1.9420e+00, -2.2456e+00, -5.1787e-01, -1.6628e-01, -3.5640e-01, -6.5346e-01]], [[ 2.5013e+00, 1.3446e+00, -1.0561e+00, -1.6343e+00, -1.6520e+00, 4.0787e-01, 9.6317e-02, -3.2802e-01, -1.7685e+00, -1.6477e+00, -1.3054e+00, -1.1129e+00, -8.2938e-01, -5.4280e-01, -7.2395e-01, -5.5188e-01]], [[ 2.2413e+00, 2.2420e+00, -2.8516e+00, -2.0432e+00, -1.1801e+00, 1.7220e+00, -1.8772e+00, 1.0958e+00, -3.5784e+00, -2.7016e+00, -2.9403e+00, -1.8466e+00, -4.4490e-01, 1.2094e+00, -9.0076e-02, -5.2704e-01]], [[ 2.4002e+00, 2.1741e+00, -1.9600e+00, -7.2250e-01, -1.8592e+00, -1.9783e+00, -1.0432e+00, 6.5199e-01, -3.2775e+00, -1.9320e+00, -2.7321e+00, -2.0436e+00, -1.5445e+00, -2.1323e+00, -3.0559e+00, -2.1672e+00]], [[-4.5765e-01, -1.6890e+00, -2.3207e+00, -1.2790e+00, -1.6636e+00, -2.1919e+00, -1.6275e+00, -1.9401e+00, -2.4240e+00, -1.4513e+00, -9.4642e-01, -1.5133e+00, -9.2808e-01, -1.3233e+00, -1.9920e+00, -2.1311e+00]], [[ 3.0960e+00, -2.9071e+00, -3.6223e+00, -3.1519e+00, -3.2206e+00, 6.7494e-01, -4.5559e-01, -3.2818e+00, -4.3789e+00, -3.4049e+00, -7.5321e-01, -2.7593e+00, -2.6066e+00, -9.9031e-03, -2.2090e+00, -3.0404e-01]], [[ 2.0755e+00, -1.0430e+00, -1.5918e+00, -2.8012e+00, -2.2881e+00, -1.2006e+00, -2.6934e+00, -7.9841e-01, -2.0912e+00, -2.6122e+00, -1.8111e+00, -1.9639e+00, -2.9772e+00, -1.5415e+00, -1.6670e+00, -1.3125e+00]], [[ 3.1282e+00, 2.3230e-01, -2.4459e+00, -2.5642e+00, -9.7673e-01, -2.5005e+00, -2.5046e+00, 5.7231e-01, -2.9178e+00, -2.9508e+00, -3.6096e+00, -1.2318e+00, -2.5887e+00, -2.7598e+00, 4.7007e-02, -5.4659e-01]], [[-3.4342e-01, -4.0099e+00, -5.1033e+00, -5.1096e+00, -4.8837e+00, -1.8461e+00, -1.8267e+00, -2.6949e+00, -4.5219e+00, -4.6120e+00, -1.6807e+00, -2.8253e+00, -2.3026e+00, -4.4041e-02, -1.5212e+00, -1.8764e+00]], [[ 3.0523e+00, -1.7094e+00, -1.8918e+00, -2.3526e+00, -1.3056e+00, -5.6633e-01, -1.0083e+00, -2.1066e+00, -2.4100e+00, -2.5085e+00, -2.8888e+00, -1.9424e+00, -3.2212e+00, -1.6709e+00, -2.3948e+00, -1.8905e+00]], [[ 3.9127e+00, -2.3623e+00, -2.0091e+00, -2.4744e+00, -3.4015e+00, 1.9163e+00, 1.8535e+00, -2.2392e+00, -2.4779e+00, -2.2077e+00, -1.1211e+00, -1.9875e+00, -2.1901e+00, 7.8997e-02, 1.3522e+00, 6.6525e-01]]], [[[ 3.2179e+00, -2.2733e+00, -3.6802e+00, -3.2645e+00, -3.2799e+00, -5.8095e-01, -9.2001e-01, -2.0755e+00, -2.7574e+00, -3.6709e+00, -3.3594e+00, -3.7290e+00, -2.7208e+00, -3.6088e+00, -3.5144e+00, -1.9315e+00]], [[ 4.2618e+00, -8.1774e-01, -3.7840e+00, -1.2924e+00, -2.1957e+00, -8.7316e-02, -1.2562e+00, -3.1843e-01, -1.4884e+00, -3.7642e+00, -1.4156e+00, -2.2794e+00, -2.1781e+00, -2.5017e+00, -2.0543e+00, -7.6335e-02]], [[ 3.0171e+00, -5.4732e-02, -1.7143e+00, -1.5320e+00, -2.2373e+00, -6.8108e-01, 3.1342e-01, -3.4062e-01, -7.1941e-01, -2.2080e+00, -1.7309e+00, -2.4926e+00, -1.7465e+00, -2.0059e+00, -2.2530e+00, -8.3941e-01]], [[ 2.2030e+00, -2.5616e-02, -2.7844e+00, -1.9591e+00, -1.7090e+00, -6.0946e-01, -1.5658e+00, -1.9691e-01, -1.2349e+00, -2.9633e+00, -2.5887e+00, -2.1748e+00, -8.8640e-01, -2.2410e+00, -2.1752e+00, -1.6970e+00]], [[ 2.3868e+00, -1.9672e-01, -2.5898e+00, -2.2271e+00, -2.1006e+00, -3.0507e+00, -2.3257e+00, -8.4221e-01, -1.0676e+00, -2.7213e+00, -1.9070e+00, -3.3722e+00, -2.2452e+00, -2.5876e+00, -2.0474e+00, -2.2262e+00]], [[ 8.7080e-01, -3.6028e+00, -4.4503e+00, -4.4422e+00, -4.1423e+00, -2.6043e+00, -3.4197e+00, -3.7291e+00, -2.4733e+00, -2.8906e+00, -3.2533e+00, -2.9215e+00, -1.4656e+00, -1.5026e+00, 3.8502e-01, -1.8200e+00]], [[ 3.8924e+00, -3.6035e+00, -3.9337e+00, -4.2043e+00, -3.8675e+00, 2.4616e-02, -6.2246e-01, -3.3742e+00, -4.0983e+00, -4.3763e+00, -4.7229e+00, -2.0912e+00, -3.5848e+00, -3.4356e+00, -3.7079e+00, -5.9663e-01]], [[ 2.3375e+00, -2.0079e+00, -2.4715e+00, -3.1222e+00, -2.3797e+00, -6.7029e-01, -2.1912e+00, -7.0124e-01, -1.1631e+00, -2.3733e+00, -2.7699e+00, -2.5755e+00, -1.5406e+00, -2.0911e+00, -1.5496e+00, -7.7687e-01]], [[ 3.0663e+00, -2.6833e+00, -4.2423e+00, -4.3886e+00, -2.2016e+00, -3.4730e+00, -2.7817e+00, -1.1858e+00, -2.6905e+00, -4.0007e+00, -3.9169e+00, -3.2758e+00, -1.8453e+00, -2.0159e+00, -2.0910e+00, -5.5687e-01]], [[ 5.7644e-01, -5.3547e+00, -4.0753e+00, -5.3566e+00, -4.0871e+00, -3.4012e+00, -4.0466e+00, -5.2774e+00, -4.0818e+00, -3.1505e+00, -4.3451e+00, -5.2598e+00, -2.7703e+00, -1.9022e+00, -9.4156e-03, -2.4072e+00]], [[ 3.6024e+00, -1.3104e+00, -2.1314e+00, -1.6018e+00, -1.3642e+00, -1.3412e+00, -1.0920e+00, -1.5864e+00, -1.9331e+00, -2.8111e+00, -1.9464e+00, -2.4520e+00, -2.3413e+00, -2.1206e+00, -2.2731e+00, -1.2923e+00]], [[ 5.2482e+00, -1.8705e+00, -5.7214e-01, -4.9817e-01, -8.2070e-01, 4.7481e-01, 3.5426e-01, -1.2988e+00, -1.3074e+00, -1.1355e+00, -5.9925e-01, -1.2175e+00, -1.7143e+00, 2.0193e+00, -5.5326e-01, 1.5940e+00]]], [[[ 2.3943e+00, -3.0880e+00, -3.8998e+00, -3.3841e+00, -4.0009e+00, -3.0282e-01, -8.9710e-01, -3.9361e+00, -3.4106e+00, -4.2448e+00, -4.3118e+00, -5.0836e+00, -2.2282e+00, -3.2632e+00, -4.1397e+00, -3.5657e+00]], [[ 4.4531e+00, -1.5325e+00, -4.3010e+00, -3.1128e+00, -3.1594e+00, 3.0505e-02, -1.1179e+00, -2.6159e+00, -2.4082e+00, -4.7948e+00, -3.5758e+00, -4.8937e+00, -1.1896e+00, -1.0432e+00, -8.2125e-01, -5.9468e-01]], [[ 3.3258e+00, -2.1723e+00, -2.3393e+00, -2.8874e+00, -2.8833e+00, 4.4702e-01, 3.8845e-01, -2.6295e+00, -1.7227e+00, -2.4884e+00, -3.4862e+00, -3.2301e+00, -1.0240e+00, -1.2584e+00, -2.1514e+00, -9.9446e-01]], [[ 2.6974e+00, -2.2736e+00, -3.0899e+00, -2.5665e+00, -3.0854e+00, -4.8776e-02, -5.7302e-01, -2.7623e+00, -2.9170e+00, -2.8760e+00, -2.1300e+00, -3.4007e+00, -1.0813e+00, -2.0952e+00, -2.0720e+00, -1.8291e+00]], [[ 2.0415e+00, -2.1342e+00, -1.3587e+00, -1.4450e+00, -1.5856e+00, -1.0655e+00, -7.4062e-01, -2.5429e+00, -1.4957e+00, -8.3865e-01, -4.1533e+00, -2.1418e+00, 1.1877e-01, -1.1393e+00, -7.1718e-01, -1.3729e+00]], [[ 2.1977e+00, -4.2110e+00, -4.2843e+00, -5.3279e+00, -5.8094e+00, -3.5851e+00, -4.6990e+00, -4.2608e+00, -3.7266e+00, -3.2307e+00, -2.6254e+00, -3.4959e+00, -2.6844e+00, -2.8981e+00, -3.4624e+00, -3.9365e+00]], [[ 2.8414e+00, -1.1443e+00, -2.9883e+00, -1.8668e+00, -1.8025e+00, -9.1762e-01, -1.0117e+00, -2.1231e+00, -2.0328e+00, -3.2865e+00, -2.8402e+00, -3.3621e+00, -1.0219e+00, -2.1441e+00, -1.2102e+00, -1.3635e+00]], [[ 1.6738e+00, -3.6401e+00, -3.6250e+00, -4.0848e+00, -2.8145e+00, -1.1549e+00, -2.1095e+00, -2.7756e+00, -2.7995e+00, -3.4518e+00, -3.7102e+00, -3.3031e+00, -2.6429e+00, -3.8591e+00, -2.0563e+00, -2.2223e+00]], [[ 3.7484e+00, -1.6087e+00, -3.6661e+00, -3.6444e+00, -3.8309e+00, -1.5073e+00, -1.9728e+00, -2.6243e+00, -2.2394e+00, -4.2624e+00, -3.3368e+00, -3.5073e+00, -1.7181e+00, -1.6543e+00, -2.3376e+00, -1.9213e+00]], [[ 5.5780e-01, -4.0236e+00, -4.5110e+00, -4.6905e+00, -4.1101e+00, -3.1671e+00, -2.2523e+00, -3.5111e+00, -2.8525e+00, -3.2699e+00, -4.0064e+00, -2.6586e+00, -1.4143e+00, -1.1481e+00, -1.0905e+00, -1.6066e+00]], [[ 3.2006e+00, -1.5964e+00, -3.2838e+00, -2.4531e+00, -2.8840e+00, -5.5926e-01, -1.1036e+00, -1.5902e+00, -2.0543e+00, -3.6185e+00, -3.2414e+00, -3.3967e+00, -1.4417e+00, -2.0492e+00, -2.1114e+00, -1.4517e+00]], [[ 4.2427e+00, -1.5143e+00, -4.0197e-01, 5.1867e-01, -2.4276e+00, -2.3463e+00, -3.4609e-01, -5.5692e-01, 5.6772e-01, 2.1141e-01, -1.5883e+00, -5.0660e-01, 4.0695e+00, 3.4940e+00, 3.4627e+00, 3.4488e+00]]], [[[ 3.1802e+00, -3.5483e+00, -3.7609e+00, -3.5174e+00, -4.1081e+00, -4.1362e-01, -9.6133e-01, -2.9185e+00, -4.6776e+00, -1.3639e+00, -2.1748e+00, -7.9847e-01, -3.3648e+00, -3.2889e+00, -3.2726e+00, -2.7068e+00]], [[ 4.3394e+00, -1.0935e+00, -2.3067e+00, 2.3275e-01, -1.9320e+00, -1.5748e+00, -8.1585e-01, -9.2882e-01, -1.8756e+00, -8.8645e-01, -2.3706e+00, -3.3991e-01, -2.5411e+00, -3.8201e-01, -8.9183e-01, 1.0385e+00]], [[ 3.2026e+00, 1.8376e-03, -1.8579e+00, -2.3711e+00, -1.9599e+00, -8.5804e-01, -4.8861e-01, -1.0113e+00, -2.0647e+00, -1.9126e+00, -8.2774e-01, 1.8940e+00, -1.0635e+00, -2.1838e+00, -2.0629e+00, -1.7235e+00]], [[ 2.8373e+00, 1.1887e+00, -1.8019e+00, -1.5153e+00, -1.1613e+00, 5.1915e-01, -1.3669e+00, 1.1833e+00, -2.5418e+00, -2.7488e+00, -2.8202e+00, 3.3325e+00, -1.0344e+00, -1.4933e+00, -2.2018e+00, -1.7448e+00]], [[ 2.7728e+00, -5.6396e-01, -2.2712e+00, -1.4813e+00, -2.4164e+00, -3.3202e+00, -2.9100e+00, -1.5208e+00, -3.2260e+00, -2.9370e+00, -3.8688e+00, -1.9484e-01, -2.0353e+00, -1.3113e+00, -9.5888e-01, -1.6752e+00]], [[ 1.3639e+00, -4.1095e+00, -4.4666e+00, -3.3469e+00, -3.2410e+00, -3.7380e+00, -4.5893e+00, -4.3552e+00, -3.2544e+00, -3.5938e+00, -5.9258e+00, -3.3134e+00, -2.8807e+00, -1.7680e+00, -4.8093e-01, -1.4076e+00]], [[ 3.4365e+00, -3.9709e+00, -3.7920e+00, -3.2035e+00, -3.1806e+00, -4.3196e-01, 2.7832e-01, -3.2382e+00, -3.9807e+00, -9.0177e-01, -9.2928e-01, -2.7011e+00, -3.9366e+00, -3.5980e+00, -2.7172e+00, -1.8126e+00]], [[ 2.5988e+00, -1.5118e+00, -1.4762e+00, -1.6438e+00, -1.9366e+00, -2.2933e+00, -2.1272e+00, -6.1591e-01, -2.3080e+00, -3.7973e+00, -2.3604e+00, -6.1769e-02, -1.5801e+00, -1.1042e+00, -1.6677e+00, -1.8876e+00]], [[ 3.9398e+00, -1.3938e-01, -2.9355e+00, -2.4618e+00, -1.6817e+00, -3.5007e+00, -3.1597e+00, -3.4809e-01, -2.1122e+00, -3.5002e+00, -4.6842e+00, -3.5427e-01, -3.0590e+00, -2.2131e+00, -2.1448e+00, 1.9854e-01]], [[ 6.0382e-01, -5.5644e+00, -5.2177e+00, -4.3115e+00, -4.3657e+00, -3.5921e+00, -3.0957e+00, -5.2144e+00, -4.9113e+00, -4.6036e+00, -4.7157e+00, -4.4857e+00, -4.7693e+00, -3.2742e+00, -2.2614e+00, -8.7037e-01]], [[ 3.3998e+00, -2.5573e+00, -1.8157e+00, -1.5937e+00, -2.6110e+00, -2.0336e+00, -7.6800e-01, -2.7382e+00, -3.3398e+00, -2.1568e+00, -2.2190e+00, -1.1776e+00, -2.7994e+00, -2.8522e+00, -3.3098e+00, -1.6988e+00]], [[ 4.2333e+00, -1.6566e+00, -9.5193e-01, -6.0579e-01, -1.3103e+00, 5.7080e-01, 6.6983e-02, -3.9355e-01, -1.0349e+00, -2.5721e+00, -7.7594e-01, -4.8170e-01, 2.7600e-01, 1.0356e+00, 2.5109e+00, 1.6977e+00]]], [[[ 2.1961e+00, -3.0702e+00, -4.2528e+00, -3.8697e+00, -3.4722e+00, 2.0717e+00, 5.2634e-01, -2.7392e+00, -3.6926e+00, -2.9191e+00, 8.6166e-01, -1.8039e+00, -2.1385e+00, -2.3475e+00, -5.0673e-01, -2.7693e+00]], [[ 3.6210e+00, -2.6961e+00, -4.0107e+00, -2.8546e+00, -3.0417e+00, 8.8400e-02, -1.4272e+00, -2.3452e+00, -1.3133e+00, -9.6989e-01, 7.9988e-01, -2.8020e+00, -1.9880e+00, -2.6577e+00, -9.2996e-01, -4.7651e-01]], [[ 3.3861e+00, -2.4302e+00, -2.0091e+00, -3.1294e+00, -2.8393e+00, -1.2562e-01, -9.0986e-01, -2.5688e+00, -2.8895e+00, -1.6550e+00, -1.4322e-01, -2.4831e+00, -1.8210e+00, -2.0019e+00, -6.0416e-01, -2.2627e+00]], [[ 2.7370e+00, -1.6618e+00, -2.9885e+00, -2.4545e+00, -2.7323e+00, 1.0004e+00, -5.2668e-01, -1.7935e+00, -2.8917e+00, -1.9303e+00, -8.1623e-01, -2.1844e+00, -4.5369e-01, 9.3047e-02, 4.6091e-01, -9.6341e-01]], [[ 2.7771e+00, -1.0794e+00, -2.6657e+00, -2.5896e+00, -1.8653e+00, -2.9634e-01, -4.6435e-01, -1.0322e+00, -1.6170e+00, -1.9574e+00, 1.0600e+00, -1.4577e+00, -1.4791e+00, -1.6009e+00, -5.5876e-01, -1.0910e+00]], [[ 2.1565e+00, -2.9592e+00, -3.5035e+00, -3.7085e+00, -4.4742e+00, -4.3157e+00, -5.0594e+00, -3.4900e+00, -3.9158e+00, -4.3679e+00, -5.4844e+00, -7.1567e+00, -2.8331e+00, -3.3778e+00, -2.1004e+00, -3.6692e+00]], [[ 2.9581e+00, -3.5481e+00, -3.7653e+00, -3.7011e+00, -3.3944e+00, 4.8333e-01, -5.7545e-01, -3.5917e+00, -3.6257e+00, -2.7949e+00, 9.3621e-01, -1.6897e+00, -3.5606e+00, -2.5181e+00, -1.7369e+00, -2.3416e+00]], [[ 1.7704e+00, -2.1892e+00, -2.2792e+00, -3.2603e+00, -2.0630e+00, 1.5758e+00, -8.0334e-01, -8.9471e-01, -2.0908e+00, -8.2708e-01, -6.5868e-01, -1.8331e+00, -8.8277e-01, -9.8350e-01, -3.5349e-01, -8.6398e-01]], [[ 3.1646e+00, -1.9403e+00, -3.0172e+00, -2.8660e+00, -2.4230e+00, -2.3217e+00, -3.1848e+00, -2.2934e+00, -2.4418e+00, -2.9596e-01, -1.2318e+00, -3.7554e+00, -1.5865e+00, -1.5568e-01, 5.3588e-01, -7.3830e-01]], [[ 1.2261e+00, -2.7340e+00, -2.9642e+00, -3.2773e+00, -3.1073e+00, -3.3882e+00, -2.9772e+00, -2.3188e+00, -3.9888e+00, -4.3023e+00, -5.5025e+00, -5.3085e+00, -1.0028e+00, -7.6665e-01, 2.9651e-03, -2.1735e+00]], [[ 3.1231e+00, -2.1040e+00, -2.1431e+00, -2.2377e+00, -1.3952e+00, 9.5739e-01, -4.9523e-01, -2.0903e+00, -2.4775e+00, -1.2917e+00, -1.5482e-01, -2.3686e+00, -1.2606e+00, -7.3697e-01, -3.6623e-01, -1.5957e+00]], [[ 4.0619e+00, -2.1258e-01, -1.6395e+00, -3.8388e+00, -3.4391e+00, 2.1779e+00, 1.0983e+00, 3.2558e-01, -2.1674e+00, -1.9732e+00, 1.4126e+00, 1.2169e-02, 1.6784e+00, 2.8000e-01, 1.9935e+00, -1.6207e-01]]]]) attn_weights tensor([[[[ 1.4429e+00, 1.9077e+00, 9.1515e-01, 9.2087e-01, 3.9077e-01, 9.0982e-01, 4.0808e-01, 6.6584e-01, 4.9109e-01, -8.0179e-02, 1.2084e-01, 7.0412e-01, 1.0734e+00, 5.6058e-01, 7.3687e-01, 1.4442e+00]], [[ 3.3605e+00, 1.2879e+00, 1.7834e-01, 1.7155e-01, 1.0141e-01, 2.4689e-01, -1.5839e-01, 1.9837e-01, -1.0853e+00, -8.3123e-01, -4.1562e-01, -7.4354e-01, -8.4701e-01, -4.9143e-01, -2.6806e-01, 2.6920e-01]], [[ 3.0076e+00, 1.0656e+00, -1.6571e+00, -1.6368e+00, -1.5954e+00, 3.2574e-01, -1.1722e-02, 6.0451e-01, -2.8603e+00, -2.0880e+00, -1.2216e+00, -1.3049e+00, -1.2968e+00, -6.3037e-01, -6.9292e-01, -2.1788e+00]], [[ 1.2464e+00, -1.1903e-01, -2.5792e+00, -2.9629e+00, -2.1441e+00, -1.5583e+00, -6.2402e-01, -9.7949e-01, -3.6594e+00, -3.7224e+00, -1.9944e+00, -1.9441e+00, -1.9740e+00, -7.3991e-01, -4.5437e-01, -1.6600e+00]], [[ 1.9655e+00, -2.6785e-02, -7.6978e-01, -1.0009e+00, -4.4172e-01, -1.4110e+00, -2.3035e+00, -2.3031e-01, -1.0885e+00, -1.3599e+00, -1.9031e+00, -5.1962e-01, -1.0258e+00, -1.5635e+00, -2.7337e-01, -1.3517e+00]], [[ 3.6157e+00, 8.5651e-01, -9.8772e-01, 2.0664e-01, -8.4617e-01, 1.8127e+00, 2.7391e+00, 4.9954e-01, -1.7588e+00, -4.9716e-01, 1.7794e-01, -1.0337e+00, -1.2092e+00, 8.4766e-02, -2.6089e-01, 7.8595e-01]], [[ 3.1727e+00, -1.2087e+00, -1.9893e+00, -1.3403e+00, -1.2575e+00, -2.6239e-01, -2.0772e+00, -1.7063e+00, -2.7831e+00, -2.1981e+00, -1.8913e+00, -1.8888e+00, -2.0603e+00, -1.5374e+00, -1.2632e+00, -2.0989e+00]], [[ 3.4413e+00, 2.0093e+00, 4.6775e-01, 2.1696e-01, 3.1182e-01, 1.5451e+00, 2.7483e-01, 4.7400e-01, -9.6931e-01, -1.6028e+00, -7.5414e-01, -4.1089e-01, -1.4450e-01, 3.9218e-02, 2.9309e-01, -1.4003e-01]], [[-6.6341e+00, 2.8798e+00, 1.7479e+00, 9.7644e-01, 9.9247e-01, 2.5150e+00, 2.9534e+00, 2.2602e+00, 7.1925e-01, 3.0648e-01, 1.7858e+00, 5.0076e-02, 4.3825e-03, 2.6279e+00, 1.3600e+00, 1.9278e+00]], [[ 3.7267e+00, -4.0815e-01, -2.3355e+00, -2.4711e+00, -2.5711e+00, 8.9454e-01, 6.8541e-01, -8.4124e-01, -3.0632e+00, -2.7119e+00, -1.4829e+00, -2.3145e+00, -1.1551e+00, -7.5850e-01, -1.3752e+00, -6.9762e-01]], [[ 2.5157e+00, 9.6369e-01, -1.6236e+00, -1.5817e+00, -1.2577e+00, 1.5204e+00, -2.9274e-02, 6.1627e-01, -2.5719e+00, -2.0314e+00, 6.8069e-01, -3.0542e-01, -9.2670e-01, 8.9467e-01, 8.4518e-01, 1.9403e-01]], [[ 2.7366e+00, 1.3525e+00, -1.8165e+00, -5.3594e-01, -8.3171e-01, 1.2678e+00, 7.7502e-01, 1.4755e+00, -2.6362e+00, -7.3264e-01, 1.3828e+00, -1.9917e-01, -4.4074e-01, 7.7841e-01, 3.4292e-01, -6.3522e-02]]], [[[ 9.8251e-01, 1.4294e+00, 5.1924e-01, 1.8588e-01, 8.3822e-01, 3.9251e-01, 4.2621e-01, 8.2292e-01, 1.6735e+00, 6.7045e-01, 1.5301e-01, 4.9096e-01, 1.0232e+00, 4.8604e-01, 6.3382e-01, 2.7633e-01]], [[ 3.9907e+00, -9.3808e-01, -1.4644e+00, -7.1396e-01, -2.0799e-01, -8.6840e-01, 5.8786e-02, -1.3738e-01, -5.2749e-01, -1.0177e+00, -4.8249e-01, -4.7186e-01, 1.4595e-01, -4.2290e-01, -5.8040e-01, 1.0613e+00]], [[ 3.5980e+00, 5.7246e-01, -1.8739e+00, -1.5666e+00, -1.4087e+00, -3.5973e-01, 2.4485e-02, 1.0640e+00, -4.5714e-01, -2.7509e+00, -1.7333e+00, -2.2646e+00, -1.3686e+00, -2.3288e+00, -2.4272e+00, -8.2181e-01]], [[ 1.6865e+00, -1.5773e+00, -2.6545e+00, -2.8296e+00, -1.4471e+00, -1.1326e+00, -9.8780e-01, -1.1347e+00, -1.0998e+00, -3.0241e+00, -2.9675e+00, -2.4168e+00, -2.4037e+00, -1.2878e+00, -1.5811e+00, -2.4523e+00]], [[ 2.3752e+00, -3.6446e-01, -9.7443e-01, -1.4124e+00, -7.5176e-01, -1.5718e+00, -1.9218e+00, -3.7908e-01, -1.1632e+00, -1.0532e+00, -1.7551e+00, -2.2515e+00, -9.2307e-01, -2.0955e+00, -1.3618e+00, -1.3003e+00]], [[ 3.9370e+00, 9.1163e-02, -1.8184e+00, -2.2820e+00, -6.8922e-01, 3.3523e-02, 1.3972e+00, 5.4433e-01, -1.4173e-01, -2.0608e+00, -2.7188e+00, -9.5743e-01, -1.7649e+00, -5.0562e-01, -7.2690e-01, -1.0305e-01]], [[ 3.6473e+00, -1.5445e+00, -2.0784e+00, -1.4018e+00, -6.1036e-01, -5.9543e-01, -9.3033e-01, -1.3294e+00, -1.5739e+00, -2.5847e+00, -1.5629e+00, -1.2010e+00, -7.6914e-01, -1.1671e+00, -7.2058e-01, -5.4086e-02]], [[ 3.4188e+00, 7.6505e-01, -1.2110e+00, -7.4897e-01, -1.3741e-01, 1.1037e+00, 9.7990e-01, 9.5669e-01, 1.8413e-01, -1.1209e+00, -7.6537e-01, 5.2336e-02, 5.3591e-01, 2.4387e-01, -1.1859e+00, 6.3121e-01]], [[-5.3025e+00, 1.3859e+00, 1.1177e+00, 7.2769e-01, 1.1484e+00, 2.1454e+00, 1.8859e+00, 1.2075e+00, 1.5556e+00, 9.9682e-01, 1.3457e+00, 2.4687e+00, 2.4462e+00, 3.0279e+00, 2.6990e+00, 2.0633e+00]], [[ 4.5641e+00, -4.4095e-01, -2.1960e+00, -1.8185e+00, -2.0678e+00, -1.0458e-01, 1.8277e-01, -1.5282e-01, -8.6087e-01, -2.8097e+00, -2.1182e+00, -6.3613e-01, -1.1670e+00, -1.3535e+00, -9.6433e-01, 6.2849e-01]], [[ 3.1248e+00, 3.5745e-01, -4.9887e-01, -7.4585e-01, -5.3595e-01, 8.2964e-01, -2.1196e-01, 9.2089e-01, 9.0761e-01, -1.2680e+00, -7.2346e-01, -3.7706e-01, -6.6199e-01, -3.2877e-01, -8.1751e-01, 9.5895e-01]], [[ 2.6469e+00, 2.6416e+00, -5.5701e-02, -2.8248e-02, -2.2343e-01, 1.1377e+00, 1.0676e+00, 3.3225e+00, 1.7998e+00, -9.2341e-01, 1.7749e-01, -6.0684e-01, -2.1870e-01, 7.6526e-01, -4.3896e-01, 1.3713e+00]]], [[[ 1.5912e+00, -4.9851e-01, -5.5557e-01, -5.1595e-01, 2.1259e-01, 4.2914e-01, 4.4325e-01, -2.4881e-01, 2.7739e-03, -1.7004e-01, -1.2766e+00, -9.9000e-02, -2.9058e-01, -2.0313e-01, 4.3618e-01, -1.6823e-01]], [[ 2.9182e+00, -1.6863e+00, -1.2353e+00, -1.9422e+00, -1.8968e+00, -4.0361e-01, -6.0275e-01, -9.2757e-01, -2.0720e+00, -1.4560e+00, -3.1223e+00, -2.1829e+00, -1.2903e+00, -1.2627e+00, -7.2627e-01, -8.7384e-01]], [[ 2.8425e+00, -2.3505e+00, -2.5136e+00, -2.9517e+00, -2.6997e+00, 2.1004e-01, -3.9000e-01, -2.0077e+00, -1.7686e+00, -2.4110e+00, -3.2281e+00, -3.3443e+00, -2.5769e+00, -1.9018e+00, -1.8899e+00, -1.7022e+00]], [[ 9.0330e-01, -2.1400e+00, -1.9378e+00, -2.0445e+00, -2.7737e+00, -4.1467e-01, -8.8845e-01, -7.7109e-01, -3.8103e-01, -9.3718e-01, -4.2316e+00, -9.9639e-01, -1.3811e-02, -9.6727e-01, -1.4606e+00, -1.2969e+00]], [[ 1.9320e+00, -1.6055e+00, -2.2082e+00, -1.7347e+00, -2.1581e+00, -1.5011e+00, -2.0629e+00, -1.3746e+00, -1.0210e+00, -2.0304e+00, -3.0676e+00, -1.8546e+00, -8.4637e-01, -1.5692e+00, -6.4556e-01, -1.8019e+00]], [[ 4.1325e+00, -1.4487e+00, -2.0242e+00, -2.4811e+00, -2.5670e+00, 4.7981e-01, 8.8628e-01, -2.8174e+00, -2.8974e+00, -2.6364e+00, -2.6262e+00, -3.0678e+00, -3.1385e+00, -3.8546e-01, -8.5461e-01, -1.1846e-02]], [[ 3.3163e+00, -2.7562e+00, -2.8631e+00, -3.7718e+00, -3.1217e+00, -8.0582e-01, -1.4126e+00, -2.9450e+00, -3.0289e+00, -3.7248e+00, -3.3214e+00, -3.8497e+00, -2.2038e+00, -1.8833e+00, -2.5525e+00, -2.3504e+00]], [[ 3.6054e+00, -7.8858e-01, -1.4942e+00, -2.7003e+00, -1.7105e+00, 6.6395e-01, -3.9380e-01, -1.3015e+00, -2.3236e+00, -2.2971e+00, -2.8947e+00, -3.2709e+00, -3.0579e+00, -1.9709e+00, -2.4663e+00, -1.0695e+00]], [[-4.2573e+00, 4.9768e-01, 2.2614e+00, 1.0374e+00, 4.9729e-01, 6.5289e-01, 2.1289e-01, 2.1911e-01, 3.6167e-01, 1.6197e+00, -6.0067e+00, 2.3695e+00, 5.0027e-01, -5.0642e-01, 2.8570e-02, 4.2999e-01]], [[ 4.3725e+00, -9.8886e-01, -2.0799e+00, -2.4995e+00, -1.8215e+00, -1.2623e+00, -1.3015e+00, -2.1152e+00, -1.4090e+00, -2.3967e+00, -1.4641e+00, -1.5373e+00, -5.5545e-01, -1.3552e-01, 3.3046e-01, 4.0739e-01]], [[ 1.4236e+00, -2.9994e+00, -2.0492e+00, -1.6594e+00, -1.8695e+00, -5.8048e-01, -1.1932e+00, -2.3112e+00, -1.5099e+00, -2.0528e+00, -1.6619e+00, -1.7061e+00, 2.2093e-01, 5.6488e-01, 1.0766e+00, 2.3238e-01]], [[ 2.9714e+00, -2.1534e+00, -5.0138e-01, -2.9457e-01, -5.4367e-01, 9.5982e-01, -3.3119e-02, -1.9735e+00, -8.9996e-01, -2.8573e-01, -1.0893e+01, 8.1685e-01, 1.9192e+00, 2.3855e+00, 1.5930e+00, 1.4842e+00]]], [[[ 1.6350e+00, 6.2852e-01, -2.0411e-02, 7.2886e-02, -5.5926e-02, -1.2871e-01, 3.9314e-01, 2.2042e-01, -5.2051e-01, -5.0843e-01, 7.1628e-01, 3.9392e-01, 1.0447e+00, 2.7736e-01, 2.3245e-01, -1.4213e-01]], [[ 3.8590e+00, -5.7023e-01, -2.0750e-01, -1.6229e-01, -9.7498e-01, -1.2362e+00, -5.7894e-02, -5.0452e-01, -1.6987e+00, -2.0988e+00, -1.6350e+00, 5.1410e-01, -6.8183e-01, -5.3783e-01, -6.2432e-01, 2.8404e-01]], [[ 3.6091e+00, -6.9393e-01, -2.5482e+00, -1.8142e+00, -1.9252e+00, -5.4204e-01, 3.0414e-01, -6.5594e-01, -2.3718e+00, -4.9585e-01, -1.1666e+00, 1.9817e+00, -2.9014e+00, -1.8947e+00, -2.3249e+00, -2.6762e+00]], [[ 1.1666e+00, -1.7834e+00, -1.7831e+00, -1.7597e+00, -1.7018e+00, -9.1174e-01, -1.0434e+00, -1.1307e+00, -3.0611e+00, -2.4228e+00, -1.3933e+00, -8.3196e-01, -7.1538e-01, -4.7279e-01, -1.2117e+00, -1.7283e+00]], [[ 2.0174e+00, -7.0896e-01, -1.2963e+00, -1.0133e+00, -1.2931e+00, -2.0877e+00, -1.9723e+00, 9.7224e-02, -2.0196e+00, -2.2815e+00, -2.7772e+00, -5.9755e-01, -6.6393e-01, -6.7145e-01, -1.5566e+00, -2.0496e+00]], [[ 4.3974e+00, 1.2134e-01, -1.5534e+00, -1.6224e-01, -1.7958e-01, 5.9961e-01, 2.3885e+00, 3.0824e-01, -5.5866e-01, -7.1889e-01, 1.5152e+00, -2.4231e-01, -1.3381e+00, -1.0638e+00, 5.8381e-01, 5.7432e-01]], [[ 3.6068e+00, -2.0974e+00, -1.9306e+00, -1.7442e+00, -1.5085e+00, -9.7789e-01, -9.8676e-01, -2.0411e+00, -1.7254e+00, -1.6306e+00, -2.7130e+00, -1.9600e+00, -2.5489e+00, -2.8649e+00, -2.2979e+00, -2.0866e+00]], [[ 4.5122e+00, 1.0499e+00, -6.1270e-01, -2.1849e-01, 7.0290e-02, 1.3408e+00, 8.8049e-01, 4.1796e-01, -1.3066e+00, -8.5927e-01, -8.2570e-01, 2.1114e+00, -8.7049e-01, -1.0912e+00, 1.0482e+00, 7.6802e-01]], [[-5.6519e+00, 3.8420e+00, 3.7615e+00, 2.8131e+00, 2.8730e+00, 4.2787e+00, 4.2074e+00, 3.3313e+00, 2.0060e+00, 1.8402e+00, 2.7674e+00, 3.4958e+00, 4.1692e+00, 4.5466e+00, 4.9970e+00, 4.1728e+00]], [[ 4.3454e+00, -1.0164e+00, -1.8739e+00, -1.9041e+00, -1.6047e+00, -9.1195e-01, 6.9513e-01, -3.5636e-01, -1.6097e+00, -4.6134e-02, -5.9802e-01, -7.4896e-01, -2.4263e+00, -2.3576e+00, -7.3304e-01, 4.0633e-01]], [[ 2.6194e+00, -1.1607e+00, -1.5631e+00, -7.3778e-01, -1.2332e+00, -3.0443e-01, -5.5103e-01, -8.5151e-02, -1.2755e+00, -2.3343e+00, -8.3358e-01, -9.3441e-01, -1.2694e+00, 4.8656e-01, 1.5552e+00, 5.8867e-03]], [[ 2.3448e+00, -5.8419e-01, -8.7999e-01, -3.9957e-01, -1.3110e+00, 1.1668e+00, 9.8318e-01, 2.2994e-01, -1.8668e+00, -1.2207e+00, 3.9891e-01, -8.1752e-01, -7.4297e-01, 5.2353e-01, 7.9538e-01, -1.4281e-01]]], [[[ 2.0194e+00, 9.1841e-01, -1.6214e-01, 3.2362e-01, 5.1950e-01, 8.8220e-01, 6.1406e-01, 1.1274e+00, 6.6632e-01, 5.1331e-01, 4.0794e-01, 1.1389e-01, 3.9607e-01, 6.4378e-01, 9.4696e-01, 1.2003e+00]], [[ 3.6489e+00, -5.8524e-01, -1.1049e+00, -1.3070e+00, -2.3500e-01, -4.6879e-01, -4.8483e-01, 2.8596e-01, -1.8844e-01, 2.4192e-01, 2.0750e+00, -2.2495e+00, 5.8566e-01, 5.0398e-02, 1.5132e+00, 4.2955e-01]], [[ 3.0021e+00, -4.3573e-01, -1.7041e+00, -1.9516e+00, -1.4880e+00, 7.8316e-01, 5.8738e-02, -6.7285e-01, -1.3953e+00, -9.8964e-01, -2.6629e-01, -2.0331e+00, 3.8059e-01, -8.9853e-01, 1.2017e+00, 9.8705e-04]], [[ 1.6396e+00, 4.1933e-02, -2.1123e+00, -2.0808e+00, -1.1030e+00, -4.0443e-01, 1.0172e-01, 5.7413e-02, -2.8945e+00, -2.9511e+00, -1.9389e-01, -7.5729e-01, 1.1401e+00, -6.0556e-01, 1.2827e+00, -8.3073e-01]], [[ 2.7814e+00, -1.7320e-01, -4.6616e-01, -9.3488e-01, -3.9241e-01, -3.3989e-01, -1.2828e+00, -3.6825e-01, -9.4965e-01, -3.1131e-01, -8.6362e-01, -2.5306e+00, 9.5147e-02, -2.3866e-01, 7.2185e-01, 2.8710e-01]], [[ 4.2539e+00, -1.7633e-01, -8.4719e-01, -9.0909e-01, -1.1522e+00, 1.5259e+00, 2.1351e+00, -1.5696e-01, -5.6298e-01, 1.5404e+00, 1.4292e+00, 9.9032e-01, -2.1586e-01, 1.1680e-01, 1.4111e+00, -7.5557e-02]], [[ 3.4750e+00, -1.2936e+00, -2.4923e+00, -2.0221e+00, -1.6426e+00, 1.4237e-02, -1.6713e+00, -1.4246e+00, -2.3754e+00, -1.2837e+00, -9.3222e-01, -3.6323e+00, -1.0218e+00, -1.8289e+00, -8.4764e-02, -3.3726e-01]], [[ 3.7908e+00, 9.7976e-01, 1.1522e-01, 1.4177e-01, 8.6868e-01, 1.8688e+00, -5.2247e-02, 9.1402e-01, -3.0978e-01, 5.7297e-01, 9.9785e-01, -1.6307e+00, 7.1238e-01, -1.0111e+00, 1.3520e+00, 2.1516e+00]], [[-2.2882e+00, 5.2320e+00, 5.0683e+00, 4.8640e+00, 4.0906e+00, 3.9199e+00, 3.8253e+00, 5.0036e+00, 4.3953e+00, 3.5827e+00, 1.9322e+00, 1.6636e+00, 5.9173e+00, 4.3767e+00, 6.1013e+00, 6.1137e+00]], [[ 4.0607e+00, -1.4097e+00, -3.2097e+00, -2.8181e+00, -1.9520e+00, 2.1489e-01, -5.7234e-01, -1.4852e+00, -1.2799e+00, -1.7579e+00, -1.9712e-01, -2.3680e+00, -1.0123e+00, -1.8595e+00, 5.6717e-02, -1.1992e+00]], [[ 3.4418e+00, 4.2025e-01, -9.1237e-01, -1.5660e+00, -1.3847e+00, 2.0559e+00, 6.6493e-01, 1.8848e-01, -9.8026e-01, -4.1573e-01, 6.0978e-01, -1.4156e-01, 1.9980e+00, 9.8395e-01, 2.6679e+00, 1.6959e+00]], [[ 3.8629e+00, 1.8119e-01, -1.2886e+00, -1.6275e+00, -1.0001e+00, 1.4364e+00, 3.4928e-01, -1.7155e-02, -1.6473e+00, -1.4339e+00, 3.1364e-01, -1.3424e+00, 3.1490e-01, -1.1521e+01, -3.6936e+00, 5.6599e-01]]]]) attn_weights tensor([[[[-1.4330, -4.4946, -2.4807, ..., -4.4035, -2.4886, -4.6005]], [[-2.1749, 0.1359, -3.2497, ..., -2.9430, -4.3179, 3.8754]], [[-1.6710, -3.1286, -1.9959, ..., -2.8710, -2.3985, -3.0564]], ..., [[-1.6608, -2.0319, -1.9886, ..., -2.0002, -1.9773, -1.8113]], [[-0.2153, -0.4585, -0.6434, ..., -0.4572, -0.6711, 0.1449]], [[-1.3183, -2.0765, -3.3705, ..., -2.1981, -2.8772, -1.9335]]], [[[-1.0813, -3.4512, -1.5911, ..., -3.2424, -0.1960, -3.0995]], [[-0.5663, 0.3870, -0.8293, ..., 6.5854, -1.5106, 6.6251]], [[-2.0129, -2.5436, -2.7636, ..., -2.1042, -2.8362, -2.0648]], ..., [[-1.7704, -2.1172, -2.2000, ..., -1.9908, -2.3457, -1.9278]], [[-0.3162, -0.6432, -0.6760, ..., 0.6681, -0.8257, 0.6952]], [[-1.2930, -2.1349, -3.5797, ..., -2.1425, -2.2702, -2.1384]]], [[[-1.0265, -2.0210, -2.1879, ..., -2.2764, -1.9171, -1.8539]], [[ 1.4249, 2.1485, 0.8457, ..., -0.1316, -0.0371, 10.7098]], [[-1.1628, -2.6888, -1.5432, ..., -2.7115, -1.8732, -1.8081]], ..., [[-1.9522, -2.4780, -2.8149, ..., -2.5520, -2.4980, -5.1450]], [[ 0.3606, 0.0969, -0.0645, ..., -0.0853, -0.2272, 1.4763]], [[-1.4025, -2.0899, -2.4229, ..., -2.2912, -3.0248, -1.9461]]], [[[-1.5435, -4.9174, -2.4461, ..., -3.0179, -2.5877, -4.7483]], [[-3.1776, 2.6563, -3.3428, ..., -5.0981, -3.7811, 3.5928]], [[-2.2557, -1.1290, -2.9348, ..., -4.0445, -3.7403, -0.8217]], ..., [[-1.7266, -2.0786, -2.0965, ..., -2.2443, -2.0865, -2.0040]], [[-0.2360, -0.3058, -0.4850, ..., -0.7062, -0.5579, -0.1751]], [[-1.5830, -2.2616, -3.6157, ..., -2.3760, -3.7168, -2.2038]]], [[[-1.1371, -3.5074, -2.2985, ..., -2.7474, -1.1274, -3.4446]], [[-1.4011, -0.9918, -1.6729, ..., -2.3242, -0.6097, 5.1700]], [[-2.2736, -2.5392, -2.9912, ..., -2.7694, -2.2817, -3.5902]], ..., [[-1.7500, -1.9594, -2.0348, ..., -1.8778, -1.7808, -1.8690]], [[ 0.0801, -0.1393, -0.2629, ..., -0.2508, -0.2175, 0.7372]], [[-1.4812, -2.3161, -3.6502, ..., -2.0404, -2.6307, -2.6473]]]]) attn_weights tensor([[[[-0.6718, -3.1623, -2.3505, ..., 0.0065, -0.1963, -0.3480]], [[-0.1270, -1.9005, -2.4104, ..., -0.4301, -0.5187, 0.7953]], [[-3.0802, -3.9992, -3.6775, ..., -2.5071, -2.7223, -2.0226]], ..., [[ 1.4055, -0.3802, -0.1593, ..., -0.2430, -0.3645, -0.7024]], [[-4.4362, -2.3596, -2.2263, ..., -0.9999, -0.9848, -0.5320]], [[ 0.1228, -0.7186, -1.7672, ..., -0.9421, -1.0558, -0.0763]]], [[[-1.3666, -3.7024, -3.0011, ..., -1.8725, 0.5999, -0.9548]], [[-0.9861, -2.4379, -2.7914, ..., -0.5543, 0.0552, 0.1072]], [[-3.6404, -4.3096, -4.1411, ..., -2.7927, -2.9988, -2.5781]], ..., [[ 1.3396, -0.4340, 0.0807, ..., -0.1221, -1.3755, -0.1628]], [[-4.5052, -2.7061, -2.5376, ..., -1.0983, -0.9092, -0.8996]], [[-0.4265, -0.6671, -4.5551, ..., 2.9000, -3.8688, 1.9951]]], [[[-1.4677, -3.3703, -4.3397, ..., 0.1089, 0.9954, 0.3225]], [[-0.8022, -2.4334, -2.7592, ..., -0.2285, 0.3164, -0.5786]], [[-3.4795, -4.1244, -3.9608, ..., -2.9782, -2.8977, -3.0121]], ..., [[ 1.7243, -0.1178, 0.4650, ..., -0.2695, 0.2849, -1.3716]], [[-4.7945, -2.2071, -2.1696, ..., -1.4488, -1.2387, -0.7182]], [[ 1.2111, 0.2602, -3.7221, ..., 0.4160, -1.8941, 4.5174]]], [[[-1.5404, -4.2975, -2.5167, ..., 0.4437, 0.1789, -0.6102]], [[-1.0568, -3.2958, -2.8368, ..., -0.4307, 0.0442, 0.4197]], [[-3.3654, -4.0976, -3.9010, ..., -2.9267, -2.6400, -2.1659]], ..., [[ 1.1230, -0.4751, -0.1605, ..., -0.3437, -0.7509, -1.1642]], [[-4.4505, -2.5429, -2.4302, ..., -1.3303, -0.9458, -0.8156]], [[-0.7638, -1.0977, -2.2352, ..., -2.2677, -1.9777, -0.5514]]], [[[-1.5326, -3.1765, -2.7396, ..., 0.1702, 2.1021, 1.0235]], [[-1.4316, -2.3826, -2.8152, ..., 1.0202, 1.4544, 0.6768]], [[-3.3493, -3.9788, -3.8091, ..., -2.4537, -2.7907, -2.3702]], ..., [[ 1.3442, -0.6435, 0.2642, ..., -0.4493, 0.5715, 0.3313]], [[-4.8111, -2.4582, -2.3246, ..., -1.0542, -1.0290, -1.0056]], [[-1.8428, -2.0466, -4.1983, ..., -0.8831, -2.9601, 1.5735]]]]) attn_weights tensor([[[[ -1.0900, -4.7317, -3.3841, ..., -1.0762, -1.8566, -2.3285]], [[ 1.3746, -1.1523, -2.1983, ..., -1.9016, -2.4245, -1.2953]], [[ -6.0244, -15.8362, -13.5765, ..., -5.6885, -4.5914, -4.1702]], ..., [[ -3.5663, -8.8900, -8.4793, ..., -3.2031, -2.2579, -2.5972]], [[ -1.2598, -3.8231, -3.4032, ..., -2.2242, -1.6927, -1.5080]], [[ -0.3386, -5.2673, -4.7700, ..., -3.2709, -2.6501, -2.4733]]], [[[ -2.1713, -5.3809, -4.9570, ..., -2.3378, -2.8141, -1.4050]], [[ 1.7715, -1.1242, -2.2669, ..., -1.4515, -1.7318, -2.0569]], [[ -6.2285, -17.2694, -17.0981, ..., -8.5025, -3.3561, -5.1829]], ..., [[ -4.7187, -10.1825, -9.5273, ..., -5.6710, -0.8547, -4.0252]], [[ -2.1497, -4.3208, -3.9356, ..., -2.0447, -1.4101, -1.4960]], [[ -0.7061, -5.5958, -5.3358, ..., -3.3620, -2.7470, -2.8447]]], [[[ -1.6059, -4.7835, -4.9691, ..., -1.3602, -2.7152, -3.7012]], [[ 1.1003, -1.0065, -1.3003, ..., -2.1591, -2.0548, 0.2548]], [[ -4.9196, -12.3342, -13.3226, ..., -3.9761, -3.6761, -4.7185]], ..., [[ -3.6004, -7.6638, -7.4667, ..., -3.9951, -3.8715, -2.7752]], [[ -1.6836, -3.5180, -3.3454, ..., -2.1935, -1.9004, -0.9964]], [[ -0.4556, -4.9272, -4.7814, ..., -3.3203, -2.9665, -2.4856]]], [[[ -1.6275, -6.0797, -4.2775, ..., -1.2661, -1.9638, -2.7131]], [[ 1.5739, -0.1846, -2.1705, ..., -1.7418, -3.0147, -0.9806]], [[ -8.2067, -19.2207, -15.8573, ..., -4.7630, -3.0999, -4.3153]], ..., [[ -5.0332, -11.4575, -9.7683, ..., -3.7110, -2.1445, -3.8368]], [[ -2.0402, -4.1458, -3.8282, ..., -1.7019, -1.4653, -1.7909]], [[ -0.7212, -5.9957, -5.4902, ..., -3.1198, -2.7382, -3.1011]]], [[[ -1.6225, -4.7117, -4.2135, ..., -2.1726, 0.0474, -1.8527]], [[ 1.8065, -1.9715, -0.5835, ..., -1.4029, -0.4846, -1.8999]], [[ -7.6097, -15.1196, -14.3459, ..., -6.1240, -3.7772, -5.5237]], ..., [[ -3.5359, -7.7811, -7.2357, ..., -2.4828, -2.1818, -3.2073]], [[ -1.2236, -3.3622, -3.1967, ..., -1.5830, -1.3352, -1.1398]], [[ -0.5569, -5.5247, -5.3896, ..., -3.0651, -3.1941, -2.8310]]]]) attn_weights tensor([[[[ 3.8737, -0.7513, -1.4165, ..., -2.4369, -2.9004, -0.7451]], [[ -2.7337, -4.9899, -5.2372, ..., -4.5114, -3.6195, -4.1544]], [[ -4.6197, -7.8986, -8.2852, ..., -4.9442, -4.0805, -5.7552]], ..., [[ -2.2388, -4.7989, -4.4635, ..., -6.3512, -4.9987, -3.9777]], [[ -1.1924, -5.4325, -4.7463, ..., -3.8202, -3.1546, -2.9306]], [[ -2.7941, -6.7539, -7.0905, ..., -2.9415, -1.7831, -3.5635]]], [[[ 4.3495, -1.5504, -2.8967, ..., 1.8276, -2.9182, 0.9235]], [[ -3.0059, -7.0548, -6.1442, ..., -5.2625, -6.1437, -3.9244]], [[ -5.5869, -12.9773, -13.0813, ..., -6.4193, -4.5852, -3.9039]], ..., [[ -2.2264, -6.3365, -6.7928, ..., -4.3855, -3.9109, -4.0893]], [[ -1.3930, -6.3259, -6.1112, ..., -3.0370, -2.1291, -1.6871]], [[ -3.0744, -7.7381, -8.2410, ..., -4.1727, -3.0357, -3.4419]]], [[[ 6.5525, -0.1505, -3.3120, ..., -3.2707, -0.1816, 3.7928]], [[ -2.1661, -5.3924, -5.2468, ..., -4.9873, -3.9905, -5.9190]], [[ -3.5646, -9.6899, -9.7978, ..., -1.9244, -1.6580, -4.3331]], ..., [[ -1.6627, -5.6694, -5.2463, ..., -2.3717, -3.1049, -3.2739]], [[ -0.6440, -6.5638, -6.5506, ..., -4.5192, -3.3710, -2.1359]], [[ -1.9860, -6.0235, -6.7592, ..., -1.4219, -2.6251, -3.3368]]], [[[ 3.8613, -0.1116, -0.1670, ..., -1.8569, -2.8218, -1.2432]], [[ -2.9146, -9.9416, -8.5172, ..., -3.9474, -4.8457, -4.4380]], [[ -5.2695, -15.2406, -12.6663, ..., -4.2540, -2.0752, -5.3936]], ..., [[ -2.0822, -8.3784, -5.1719, ..., -3.0541, -3.5946, -2.6424]], [[ -1.4432, -5.9619, -5.3607, ..., -3.7362, -2.5507, -2.8864]], [[ -2.9932, -9.1898, -9.7890, ..., -3.1456, -3.5042, -4.0453]]], [[[ 4.2346, -1.1697, -2.1728, ..., -0.4183, -2.6376, 0.2764]], [[ -2.3746, -6.1632, -5.8498, ..., -2.6623, -4.0538, -3.8436]], [[ -3.9665, -9.5055, -9.7561, ..., -4.5579, -3.8003, -3.1824]], ..., [[ -1.6557, -7.0077, -5.9796, ..., -4.0358, -1.3798, -2.5405]], [[ -0.6709, -6.1850, -5.8213, ..., -3.6844, -3.1411, -2.1948]], [[ -1.8227, -7.1252, -8.1625, ..., -2.1034, -2.5403, -2.3483]]]]) attn_weights tensor([[[[-2.9166e+00, -9.0216e+00, -8.3201e+00, ..., -2.3459e+00, -4.0616e+00, -4.5934e+00]], [[-1.9882e+00, -5.9504e+00, -6.7805e+00, ..., -5.4190e+00, -5.0518e+00, -3.6097e+00]], [[-1.0445e-01, -2.0806e+00, -2.5442e+00, ..., -4.2112e+00, -1.3062e+00, -2.0972e+00]], ..., [[-1.6295e+00, -3.8873e+00, -3.4549e+00, ..., -1.5959e+00, -1.7979e+00, -3.7813e+00]], [[ 1.2117e+00, -2.0110e+00, -3.0282e+00, ..., -1.8949e+00, -1.8616e+00, -1.7271e+00]], [[-8.1846e+00, -2.5569e+01, -2.0582e+01, ..., 9.6092e-03, 1.3480e+01, -3.7066e+00]]], [[[-2.8559e+00, -1.0343e+01, -1.0914e+01, ..., -6.5698e+00, -2.9214e+00, -4.4727e+00]], [[-3.0715e+00, -8.2799e+00, -7.7133e+00, ..., -5.0545e+00, -2.3655e+00, -3.2030e+00]], [[-1.3111e-01, -2.9340e+00, -3.0833e+00, ..., 4.4253e-01, -3.6804e+00, -2.5898e+00]], ..., [[-1.4780e+00, -5.5073e+00, -4.9727e+00, ..., -9.3378e-01, -2.6314e+00, -2.2118e+00]], [[ 1.2050e+00, -3.0610e+00, -3.5626e+00, ..., -2.9679e+00, -5.1793e+00, -2.8362e+00]], [[-3.8290e+00, -2.8514e+01, -4.4165e+01, ..., -2.3281e+01, 1.0069e+01, 3.9106e+00]]], [[[-2.9151e+00, -8.9112e+00, -8.7533e+00, ..., -4.3096e+00, -4.7625e+00, -4.2332e+00]], [[-2.3937e+00, -6.7804e+00, -7.0511e+00, ..., -2.7420e+00, -3.2302e+00, -4.0247e+00]], [[ 6.1480e-02, -2.6504e+00, -3.7641e+00, ..., -3.7728e+00, -4.5523e+00, -3.0757e+00]], ..., [[-8.3700e-01, -4.9464e+00, -4.4051e+00, ..., -2.6429e+00, -1.6956e+00, -2.4791e+00]], [[ 1.5590e+00, -4.2968e+00, -3.6292e+00, ..., -3.1905e+00, -3.0124e+00, -2.3119e+00]], [[-6.7419e+00, -2.3097e+01, -2.9229e+01, ..., 5.5810e+00, 1.6239e+01, -4.6001e+00]]], [[[-3.4963e+00, -1.1487e+01, -9.5037e+00, ..., -3.4088e+00, -3.4379e+00, -4.2530e+00]], [[-2.4523e+00, -9.5759e+00, -8.8695e+00, ..., -2.8007e+00, -2.6193e+00, -3.5871e+00]], [[-4.5368e-01, -3.8227e+00, -4.1967e+00, ..., -4.4704e+00, -4.0678e+00, -3.8467e+00]], ..., [[-1.2568e+00, -6.7122e+00, -6.1658e+00, ..., -2.0212e+00, -2.8508e+00, -3.9698e+00]], [[ 1.2640e+00, -2.1080e+00, -3.3313e+00, ..., -3.8853e+00, -3.5004e+00, -1.5352e+00]], [[-5.8208e+00, -3.3334e+01, -2.6828e+01, ..., -3.5007e+00, 1.3175e+01, -2.1678e+00]]], [[[-2.0257e+00, -9.3747e+00, -9.9150e+00, ..., -4.9243e+00, -1.7744e+00, -2.6219e+00]], [[-1.6744e+00, -6.7029e+00, -7.6246e+00, ..., -2.9378e+00, -3.9056e+00, -4.1801e+00]], [[ 4.4131e-01, -2.6952e+00, -2.5213e+00, ..., -1.4993e+00, -1.7955e+00, -2.0635e+00]], ..., [[-1.5382e-01, -4.8573e+00, -6.7690e+00, ..., -4.4421e+00, -3.5422e+00, -3.6122e+00]], [[ 1.5249e+00, -2.9063e+00, -2.5111e+00, ..., -1.3557e+00, -2.5605e+00, -3.0203e+00]], [[-5.3173e+00, -2.3258e+01, -2.5151e+01, ..., -4.9071e+00, 1.5611e+01, 6.6016e+00]]]]) attn_weights tensor([[[[ 2.4960e+00, -5.1427e+00, -3.5809e+00, ..., -3.7283e+00, -4.4230e+00, -2.3999e+00]], [[ 3.7147e+00, -8.8869e+00, -4.5546e+00, ..., -9.1417e+00, -7.7535e+00, -3.6431e+00]], [[-7.5923e-02, -2.5073e+00, -2.4438e+00, ..., -8.9288e-01, -2.4336e+00, -3.2722e+00]], ..., [[ 1.1505e+00, -3.0467e+00, -2.6076e+00, ..., -2.4705e+00, -3.7050e+00, -1.7922e+00]], [[ 2.0460e+00, -1.3668e-01, -1.4341e+00, ..., -1.5528e-01, -2.3457e-01, 1.9374e-02]], [[ 1.1812e+00, -2.6730e+00, -2.5658e+00, ..., -2.3339e+00, -3.5650e+00, -5.9108e-01]]], [[[ 2.4906e+00, -6.5038e+00, -5.5254e+00, ..., -5.5685e+00, -7.6653e-01, -2.4545e+00]], [[ 4.6666e+00, -1.2008e+01, -7.9345e+00, ..., -8.2830e+00, -2.6025e+00, -3.6992e+00]], [[-1.6540e-01, -4.2623e+00, -4.3249e+00, ..., -6.8687e-01, -2.0868e-01, -2.1863e+00]], ..., [[ 9.9850e-01, -3.2468e+00, -3.9450e+00, ..., -3.3850e+00, -3.0363e+00, -3.2500e+00]], [[ 1.9154e+00, -1.9119e+00, -1.5385e+00, ..., -1.1424e+00, 3.9506e-01, -1.2950e-01]], [[ 1.1517e+00, -3.1254e+00, -4.0235e+00, ..., -1.1561e+00, -2.5229e+00, 3.6460e-01]]], [[[ 2.3805e+00, -6.3686e+00, -5.6474e+00, ..., -2.3823e+00, -3.2024e+00, 8.9004e-03]], [[ 4.2893e+00, -1.4719e+01, -1.2042e+01, ..., -1.2351e+01, -1.2042e+01, -3.1329e+00]], [[ 3.7396e-01, -3.6265e+00, -4.1917e+00, ..., -3.0057e+00, -1.4566e+00, -3.5257e+00]], ..., [[ 1.4013e+00, -3.0923e+00, -5.3330e+00, ..., -6.1280e+00, -5.8128e+00, -5.7822e+00]], [[ 3.2991e+00, -6.0190e-01, -3.4931e-01, ..., -1.0293e+00, -8.1151e-01, 9.9180e-01]], [[ 8.0028e-01, -4.9907e+00, -4.1683e+00, ..., -2.9327e+00, -2.0523e+00, -1.4380e+00]]], [[[ 2.9277e+00, -7.1408e+00, -2.1869e+00, ..., -3.9768e+00, -2.0231e+00, -5.5886e-01]], [[ 5.4822e+00, -1.0348e+01, -1.1053e+00, ..., -9.9790e+00, -6.2936e+00, -3.0431e-01]], [[ 2.6724e-01, -5.6596e+00, -4.5117e+00, ..., -1.4744e+00, -9.7493e-01, -2.4501e+00]], ..., [[ 1.0217e+00, -3.4403e+00, -3.7094e+00, ..., -2.8378e+00, -4.1535e+00, -3.3237e+00]], [[ 1.7489e+00, -1.3426e+00, -1.3432e+00, ..., -2.7282e+00, -4.1225e-01, -3.6929e-01]], [[ 1.0091e+00, -1.4287e+00, -2.6677e+00, ..., -2.2946e+00, -1.5253e+00, -2.7702e-01]]], [[[ 1.9453e+00, -4.4780e+00, -5.0475e+00, ..., -4.4074e+00, -3.9577e+00, -2.6309e+00]], [[ 4.3786e+00, -1.1945e+01, -1.0445e+01, ..., -4.2203e+00, -2.6085e+00, -2.0612e+00]], [[ 1.0246e+00, -4.4743e+00, -5.8194e+00, ..., -2.7575e+00, -1.3245e+00, -2.3851e+00]], ..., [[ 9.0429e-01, -3.6525e+00, -3.3584e+00, ..., -2.8849e+00, -3.4635e+00, -3.3220e+00]], [[ 2.1800e+00, -1.4192e+00, -1.3107e+00, ..., -6.2578e-01, -1.6664e+00, -2.0247e+00]], [[ 1.1247e+00, -4.7402e+00, -4.0381e+00, ..., -2.5930e+00, -1.8376e+00, -2.3686e-01]]]]) attn_weights tensor([[[[ -0.7673, -2.9860, -2.4762, ..., -3.1064, -2.6115, -3.9962]], [[ -0.1772, -2.8150, -4.3774, ..., -4.0306, -3.0364, -3.2328]], [[ 0.2855, -2.3080, -2.8476, ..., -3.0992, -2.9847, -2.1381]], ..., [[ 4.0901, -5.6234, -0.4071, ..., -4.2456, -3.1590, -1.9288]], [[ 2.5773, -2.2660, -1.7603, ..., -1.2964, -1.3180, -1.1042]], [[ -0.1474, -1.7471, -3.8174, ..., -5.0064, -1.8631, -4.4191]]], [[[ -1.3971, -3.8696, -2.4172, ..., -1.6786, -2.6264, -4.9399]], [[ -0.8040, -2.9427, -2.4422, ..., -2.2933, -1.5344, -2.2292]], [[ 0.4297, -3.5592, -3.2521, ..., -3.9829, -4.3824, -3.9551]], ..., [[ 4.7761, -8.7043, -4.6689, ..., -4.5695, -0.4534, -5.0876]], [[ 3.2829, -3.8893, -4.0206, ..., -2.4842, -1.8885, -2.7311]], [[ -0.7775, -4.2936, -4.8930, ..., 0.7885, -2.3743, -3.1788]]], [[[ -1.1734, -5.1136, -3.3019, ..., -1.2329, -1.6125, -3.7509]], [[ 1.0211, -4.1530, -5.4943, ..., -0.8303, -3.2601, -2.2888]], [[ 0.3308, -3.2324, -3.1016, ..., -4.6264, -4.3392, -4.2695]], ..., [[ 4.2409, -11.5684, -7.1693, ..., -11.0321, -9.2594, -3.4993]], [[ 3.0397, -2.5719, -3.1916, ..., -1.6491, -2.7947, -1.5511]], [[ -0.5016, -4.3752, -5.0646, ..., -1.5046, -1.6853, -2.1858]]], [[[ -1.2340, -5.9356, -5.4214, ..., -2.0450, -1.5476, -4.4666]], [[ -1.1127, -5.9382, -3.6400, ..., -1.9690, -1.3658, -2.8265]], [[ 0.1395, -3.3523, -3.3309, ..., -3.4083, -4.2973, -3.2424]], ..., [[ 4.7489, -7.3089, 2.1010, ..., -6.0232, -4.2622, -0.5298]], [[ 3.0335, -3.2290, -1.1073, ..., -2.6409, -3.4542, -1.9736]], [[ -0.3711, -5.1573, -6.0207, ..., -2.0043, -2.7125, -4.0667]]], [[[ -0.3902, -5.8744, -6.4744, ..., -3.3631, -1.8504, -3.5056]], [[ 1.0454, -4.5834, -7.0264, ..., -5.2868, -2.6591, -2.0859]], [[ 0.3956, -3.7471, -3.9800, ..., -2.3261, -2.9453, -3.4964]], ..., [[ 3.9160, -7.6835, -5.6624, ..., -2.0982, -3.3086, -1.9379]], [[ 2.5574, -2.8547, -2.2680, ..., -2.0611, -2.8058, -3.2415]], [[ 0.0201, -3.7845, -5.5520, ..., -2.8578, -1.4504, -2.6601]]]]) attn_weights tensor([[[[ -0.3199, -7.8480, -6.5168, ..., -4.7442, -2.6506, -6.1392]], [[ 2.3697, -2.1972, -1.4845, ..., -0.4160, -0.1433, 0.2146]], [[ 5.3923, -2.5964, 0.0228, ..., -1.5779, -0.4903, -0.8873]], ..., [[ 0.7018, -2.8704, -3.8272, ..., -4.1290, -4.3021, -1.4776]], [[ 3.3715, -3.2507, -0.5294, ..., -2.4583, -1.3792, -1.8148]], [[ 2.8617, -4.0322, -2.1637, ..., -2.5072, -3.4895, -1.5598]]], [[[ 0.0243, -7.3782, -8.9313, ..., -5.8186, -3.0996, -4.8019]], [[ 2.8466, -4.6634, -3.5017, ..., -2.7988, -1.4267, -2.7091]], [[ 6.6156, -4.4804, -3.6199, ..., -1.9551, 0.5008, 0.9065]], ..., [[ 0.0923, -4.2019, -3.5449, ..., -2.0078, -3.2493, -3.6566]], [[ 3.9440, -3.7887, -3.0425, ..., -2.5361, -0.7181, 0.3788]], [[ 2.7851, -5.2140, -3.5510, ..., -3.9221, -2.6164, -3.5586]]], [[[ -0.6558, -6.5297, -6.4810, ..., -2.1399, -0.2085, -3.9447]], [[ 4.1411, -2.2573, -1.0083, ..., -1.8589, -1.8604, 0.8843]], [[ 6.4698, -6.3453, -5.6951, ..., -6.3978, -5.1426, -0.3902]], ..., [[ -0.0119, -2.5504, -2.5684, ..., -3.1289, -3.0104, -2.8257]], [[ 5.2900, -6.1033, -3.2562, ..., -8.2501, -7.1726, -0.6619]], [[ 3.1131, -3.7827, -5.2287, ..., -4.5056, -4.9315, -2.6179]]], [[[ -0.3205, -10.6534, -8.7723, ..., -2.6471, -2.1573, -6.2816]], [[ 2.9082, -3.5506, -1.1725, ..., -3.4556, 0.0507, -0.4404]], [[ 6.2156, -5.4925, -1.2652, ..., -5.6005, -1.9335, -0.6261]], ..., [[ 0.5202, -3.3988, -3.4331, ..., -1.5635, -2.1697, -2.0281]], [[ 2.9437, -5.5271, 0.0592, ..., -3.0078, -0.8015, -1.9133]], [[ 2.9252, -4.3816, 0.4593, ..., -3.0885, -1.7686, -3.7682]]], [[[ -0.0544, -6.8169, -7.9490, ..., -2.6885, -0.3661, -3.5888]], [[ 2.8966, -2.6428, -2.3397, ..., -0.5492, -1.8456, -2.0872]], [[ 6.0500, -2.9776, -5.3644, ..., -0.2194, -3.8330, -0.9968]], ..., [[ 0.5461, -3.2202, -4.0547, ..., -0.6754, -0.3501, -3.0861]], [[ 3.9867, -2.5555, -3.7938, ..., -0.9112, -2.4873, -1.6130]], [[ 3.0742, -4.0375, -5.0255, ..., -4.5197, -3.3069, -1.5478]]]]) attn_weights tensor([[[[ 1.3888, -0.8589, -1.6020, ..., -3.1586, -2.3217, -1.6525]], [[ 3.0262, -0.9170, -0.0922, ..., -0.6557, -1.0414, -1.5804]], [[ 1.5432, 0.2748, -0.4894, ..., -1.3803, -0.1646, 0.6494]], ..., [[ 1.1580, -2.4604, -2.1574, ..., -2.0809, -1.4361, -1.0075]], [[ 1.1433, -1.0853, -1.0812, ..., -1.8850, -2.0419, -0.9447]], [[ 0.5496, -3.1917, -2.9603, ..., -4.4155, -3.4610, -2.6820]]], [[[ 1.0582, -4.3191, -2.9083, ..., -1.6447, -1.8632, -1.3439]], [[ 4.5333, -2.8893, -2.7064, ..., -0.9891, 2.8806, 3.1347]], [[ 1.6048, -0.2590, -0.1975, ..., -1.1583, -1.5674, -2.4556]], ..., [[ 1.1941, -5.1218, -3.4350, ..., -1.7052, -0.1755, -2.0425]], [[ 1.1671, -3.8985, -2.5029, ..., -1.6938, -2.1917, -1.5219]], [[ 0.8766, -3.6293, -2.6965, ..., -4.4226, -3.0974, -4.5350]]], [[[ 1.3376, -2.7770, -3.5674, ..., -4.8290, -3.9247, -2.4903]], [[ 4.8037, -1.7139, -3.1050, ..., -1.1257, -1.5597, 0.4956]], [[ 2.3347, -0.4778, -1.2575, ..., -1.7626, -0.8245, -2.0316]], ..., [[ 1.3172, -3.9203, -3.2089, ..., -3.6107, -3.6042, -1.2127]], [[ 1.1541, -2.9466, -3.4028, ..., -3.8575, -3.1027, -1.8835]], [[ 1.0822, -3.5944, -4.7564, ..., -4.9777, -4.9320, -3.2515]]], [[[ 1.1520, -3.3373, -2.8170, ..., -2.9625, -4.0074, -3.1477]], [[ 1.3563, -3.4773, 0.1640, ..., 2.4708, -0.1199, -0.8174]], [[ 1.8635, -0.3548, -0.6606, ..., 0.2731, -0.3962, -0.3498]], ..., [[ 1.1095, -2.9520, -1.8883, ..., -0.7531, 0.1568, -1.4012]], [[ 1.1788, -2.7375, -2.0284, ..., -1.4454, -0.4860, -0.4529]], [[ 0.2667, -3.0743, -3.5747, ..., -4.0411, -3.2082, -4.9347]]], [[[ 1.0570, -3.2302, -3.0377, ..., -1.6504, -2.3277, -3.1144]], [[ 4.3208, -3.2583, -4.9541, ..., -0.2624, -1.5900, -0.0229]], [[ 1.6873, -1.8438, -3.3006, ..., -0.4725, -1.8314, -2.1202]], ..., [[ 0.6718, -3.3485, -2.8736, ..., -1.0827, -1.1062, -1.8399]], [[ 1.1610, -3.8414, -3.4922, ..., -2.3649, -2.2406, -1.2193]], [[ 1.0095, -2.7795, -3.9560, ..., -3.4770, -3.6688, -4.8153]]]]) attn_weights tensor([[[[ 2.0681, -1.3292, -2.8964, ..., -2.8716, -1.9688, -1.6708]], [[ 2.6727, -0.9026, -1.0688, ..., -1.7997, -1.6525, -1.0047]], [[ 1.5930, -2.7779, -2.6245, ..., -2.2992, -1.5563, -0.8315]], ..., [[ 2.7282, -2.5694, -2.5287, ..., -2.4237, -2.4220, -2.1587]], [[ 0.8167, -3.0661, -2.8812, ..., -4.9677, -3.0941, -2.5571]], [[ 3.5116, -0.5551, -0.8800, ..., -2.2959, -2.2816, -1.3161]]], [[[ 2.1467, -3.8186, -3.3882, ..., -4.3071, 0.4600, -3.5966]], [[ 5.0187, -2.5795, -4.1899, ..., -0.2551, -1.0413, 0.9920]], [[ 1.8866, -5.3404, -4.4457, ..., -3.1406, -0.5286, -3.2100]], ..., [[ 3.9980, -2.6168, -3.6007, ..., -1.3562, -0.1386, -2.0441]], [[ 1.5838, -5.9188, -6.8756, ..., -2.5260, -1.5884, -1.9679]], [[ 3.6575, -1.0495, -3.3810, ..., -1.8795, -3.3729, -4.2609]]], [[[ 2.5010, -1.9291, -1.8908, ..., -3.6979, -3.7031, 0.2820]], [[ 3.7282, -2.4924, -4.3648, ..., -2.6069, -1.7162, -2.6666]], [[ 2.6763, -2.3729, -2.7948, ..., -4.1539, -3.8476, -0.2372]], ..., [[ 5.0301, -2.4790, -2.5746, ..., -3.5869, -3.6337, 1.0063]], [[ 0.7394, -4.7683, -4.1357, ..., -0.6952, 0.3135, -1.1537]], [[ 3.8686, -0.4543, -2.6745, ..., -3.4591, -2.2425, -2.9404]]], [[[ 1.9825, -4.0363, -3.7196, ..., -3.6370, -2.6293, -4.8516]], [[ 2.1839, -1.8209, -1.2895, ..., 0.3720, -1.1575, -0.3337]], [[ 2.2150, -4.4111, -3.5503, ..., -3.5872, -0.9610, -2.6543]], ..., [[ 3.4247, -1.9823, -1.4592, ..., -2.9184, -0.8689, -2.8470]], [[ 1.2356, -5.3606, -5.4591, ..., -1.0835, -0.6074, -2.6887]], [[ 3.8990, -1.8944, 0.5859, ..., -1.2743, -2.3588, -2.2971]]], [[[ 2.2314, -2.7103, -4.2661, ..., -2.5122, -2.9205, -3.1032]], [[ 3.4185, -1.7989, -3.9058, ..., -1.3049, -1.7930, -0.3969]], [[ 1.5523, -3.3090, -3.9696, ..., -1.8364, -3.6045, -3.7103]], ..., [[ 2.9756, -2.2871, -2.5821, ..., -1.5435, -2.0190, -1.2380]], [[ 1.4430, -3.8060, -3.9916, ..., -2.2578, -0.1434, -1.6986]], [[ 3.4832, -1.0583, -3.0260, ..., -1.5848, -2.5728, -1.1448]]]]) attn_weights tensor([[[[ 1.9196, -2.9360, -4.0818, ..., -3.1556, -3.4548, -2.2135]], [[ 2.8273, -0.9425, -1.8448, ..., -1.5638, -1.3615, -0.6472]], [[ 2.5166, -0.2074, -1.1768, ..., -2.2081, -1.7978, -0.5211]], ..., [[ 0.6249, -3.3510, -1.9576, ..., -3.2161, -1.7063, -1.0805]], [[ 2.6893, -2.8709, -2.0720, ..., -3.0659, -2.3357, -2.8313]], [[ 2.6654, -1.3348, -2.1597, ..., -2.5430, -1.6793, -1.2268]]], [[[ 2.6374, -2.4447, -3.2841, ..., -3.1218, 0.6813, -2.1464]], [[ 4.3254, -2.2115, -3.1246, ..., -1.4767, 1.2107, -1.1437]], [[ 3.3635, -0.8189, -0.7364, ..., -1.7371, -0.5767, -1.8774]], ..., [[-0.0882, -3.4261, -2.0818, ..., -1.9318, -1.6996, -2.9404]], [[ 3.2643, -1.1888, -0.9378, ..., -1.2558, -1.7454, -2.2326]], [[ 4.3155, -2.7660, 0.3929, ..., -0.3764, 2.0134, 1.4281]]], [[[ 3.1134, -3.3108, -3.8650, ..., -5.4046, -4.7237, -0.5674]], [[ 4.6355, -1.7706, -3.9487, ..., -1.6782, -2.6375, 0.2301]], [[ 3.4740, -0.6936, -2.3497, ..., -2.9909, -2.0524, 0.0115]], ..., [[ 0.5282, -3.8142, -4.0806, ..., -2.0564, -0.7895, -0.0690]], [[ 3.6977, -1.3393, -2.8605, ..., -3.8437, -3.0420, -0.5704]], [[ 4.0494, -2.1927, -1.6544, ..., 0.3528, 2.3632, 1.6599]]], [[[ 2.5495, -2.5396, -3.0525, ..., -2.6737, -1.4412, -3.3351]], [[ 3.6193, -0.8462, -1.7045, ..., -0.0748, 0.8344, -0.4293]], [[ 2.9676, -0.1030, -0.3905, ..., -1.8861, -0.4951, -2.0400]], ..., [[ 0.7078, -3.1324, -0.8948, ..., -1.2156, 0.1323, -1.8994]], [[ 3.1009, -1.3772, -0.4475, ..., -2.6480, -1.4388, -2.5604]], [[ 3.5370, -2.2745, -1.1719, ..., -1.1669, 0.6736, -2.4616]]], [[[ 2.4490, -3.1043, -4.4682, ..., -1.4711, -3.4065, -3.0851]], [[ 2.7487, -1.7830, -3.6654, ..., -0.6866, -1.0036, 0.5447]], [[ 2.9193, -2.4033, -3.4943, ..., -0.9569, -2.8867, -1.9741]], ..., [[ 1.7294, -4.4550, -5.3329, ..., -1.9151, -0.8139, -2.4963]], [[ 2.9277, -2.5690, -3.0420, ..., -0.7567, -1.9612, -0.8233]], [[ 4.0051, -0.1558, -0.6372, ..., 1.7215, 2.5893, 0.4764]]]]) attn_weights tensor([[[[ 2.3547e+00, 2.2224e+00, 1.1332e+00, ..., -1.1167e-01, 6.5284e-01, 2.7200e+00]], [[ 2.9947e+00, 1.3895e-01, -1.0686e+00, ..., -5.0784e-01, 5.6188e-02, 9.5830e-01]], [[ 2.7420e+00, 2.5742e-01, -1.7873e+00, ..., -7.0755e-01, -2.1754e+00, 8.9526e-01]], ..., [[ 3.1774e+00, 1.9031e-02, -1.7884e+00, ..., -1.3393e+00, -6.1253e-01, -9.3286e-02]], [[ 3.0674e+00, 1.7918e+00, 5.4865e-01, ..., 9.5389e-01, 3.1653e-01, 2.3895e+00]], [[ 2.9224e+00, 8.6711e-01, -4.6764e-01, ..., -1.7369e-01, 3.3942e-01, 3.1882e-02]]], [[[ 1.2264e+00, 1.4757e+00, 6.3608e-01, ..., 1.2195e-01, -3.8151e-01, 1.2745e+00]], [[ 3.6285e+00, -4.8406e-01, -1.1066e+00, ..., -2.0872e-01, 8.3293e-01, -9.4962e-01]], [[ 3.2483e+00, -4.6040e-02, -2.0089e+00, ..., -1.9053e+00, -1.1102e+00, -1.8475e+00]], ..., [[ 4.3950e+00, -1.1686e+00, -1.9073e+00, ..., -5.5572e-01, 1.2988e+00, 1.0633e-04]], [[ 3.3605e+00, 2.9577e-01, 3.2088e-01, ..., -1.4539e+00, 2.5186e-02, 1.0405e+00]], [[ 3.1211e+00, 1.3861e+00, -6.4595e-01, ..., -8.2329e-01, 2.1425e+00, 2.4228e-01]]], [[[ 1.7170e+00, 2.2680e-01, -2.3883e-01, ..., -2.7376e-01, -1.1530e+00, -1.0964e-01]], [[ 3.7487e+00, -1.3480e+00, -1.1868e+00, ..., -1.5054e+00, -2.1461e+00, 8.5185e-01]], [[ 3.6367e+00, -1.5407e-01, -2.1499e+00, ..., -4.4304e+00, -4.1966e+00, -1.1980e-01]], ..., [[ 4.5779e+00, -1.2767e+00, -2.4087e+00, ..., -2.4365e+00, -3.2063e+00, 7.2863e-01]], [[ 2.5762e+00, -1.0489e+00, -1.7277e+00, ..., 4.1070e-02, 9.7974e-02, 4.2264e-01]], [[ 3.3542e+00, -5.1119e-01, -4.7165e-01, ..., 6.7778e-01, 1.3296e+00, 1.1578e+00]]], [[[ 1.4165e+00, 1.1140e+00, 9.1747e-01, ..., 8.0600e-02, 2.2658e-01, 2.7459e-01]], [[ 2.9283e+00, 1.5206e+00, 4.7533e-01, ..., 8.0595e-01, 7.3061e-01, 3.2378e-01]], [[ 2.8916e+00, 6.0880e-02, -1.3672e+00, ..., -2.5077e+00, -1.7297e+00, -2.3466e+00]], ..., [[ 3.5188e+00, 1.6365e-01, -1.2955e+00, ..., -2.4632e-01, 7.3034e-02, -5.4716e-01]], [[ 3.0455e+00, 1.0202e+00, -3.8971e-01, ..., 2.3220e-01, 5.0873e-01, 3.7781e-01]], [[ 2.2210e+00, 2.7514e-02, -1.5837e+00, ..., -1.4020e-01, -2.5168e-01, -1.9858e-01]]], [[[ 1.9653e+00, -1.3464e-01, -7.9308e-01, ..., 7.4505e-01, 5.0772e-01, 7.8145e-02]], [[ 3.2337e+00, -1.2163e+00, -1.6450e+00, ..., 9.4089e-02, -1.0744e+00, -2.6825e-01]], [[ 3.1957e+00, -1.1586e+00, -1.8844e+00, ..., -8.6940e-02, -6.3005e-01, -1.0928e+00]], ..., [[ 3.8791e+00, -1.7717e+00, -3.3825e+00, ..., -1.1392e+00, -2.9885e+00, -2.6457e+00]], [[ 3.0174e+00, -4.6741e-01, -2.3375e+00, ..., 1.7137e+00, 1.6553e+00, 3.6316e-01]], [[ 3.5499e+00, 3.1213e-01, -1.7919e+00, ..., -2.2346e+00, 9.7176e-01, 4.7751e-01]]]]) attn_weights tensor([[[[-3.1771e-01, -2.3926e+00, -3.2999e-01, ..., -5.0829e-01, -2.7441e+00, 5.6160e-01]], [[ 5.1821e-01, 1.8670e+00, 3.8237e+00, ..., -1.3062e-01, 9.9091e-01, 9.3768e+00]], [[-1.9778e+00, -2.0272e+00, -2.2301e+00, ..., -2.2097e+00, -1.0883e+00, -1.4113e+00]], ..., [[-1.8685e+00, -2.2635e+00, -2.0855e+00, ..., -2.0577e+00, -1.9307e+00, -1.6822e+00]], [[ 2.4923e-01, -1.5273e-01, 2.2069e-01, ..., -4.0147e-01, 1.2957e-01, 1.2172e+00]], [[-1.2163e+00, -2.0306e+00, -3.2854e+00, ..., -2.9310e+00, -1.7902e+00, -2.6663e+00]]], [[[-1.3265e+00, -3.4138e+00, -2.4175e+00, ..., -1.2612e+00, -2.5820e+00, -1.8315e+00]], [[-8.7723e-02, 9.6057e-02, -9.1576e-02, ..., 2.1373e-02, -5.1029e-01, 8.6090e+00]], [[-1.8719e+00, -2.4848e+00, -2.5541e+00, ..., -2.3678e+00, -2.2118e+00, -3.3203e+00]], ..., [[-2.4772e+00, -2.9648e+00, -3.0228e+00, ..., -2.6636e+00, -2.9258e+00, -3.2145e+00]], [[-2.9582e-01, -5.7738e-01, -8.4867e-01, ..., -1.1396e+00, -6.4766e-01, 1.1666e+00]], [[-1.2382e+00, -2.0847e+00, -2.6092e+00, ..., -1.8054e+00, -2.0603e+00, -2.3028e+00]]], [[[-1.2028e+00, -2.9151e+00, -2.0666e+00, ..., -2.8579e+00, -1.8088e+00, -2.9239e+00]], [[ 1.6254e+00, 1.1115e+00, -2.4584e-01, ..., -1.7381e+00, 1.1906e+00, 9.6917e+00]], [[-1.4800e+00, -2.2413e+00, -2.4714e+00, ..., -2.4617e+00, -4.1851e-01, -3.3956e+00]], ..., [[-2.2319e+00, -2.7852e+00, -2.8399e+00, ..., -2.9117e+00, -3.1685e+00, -3.0158e+00]], [[-2.5880e-01, -5.8921e-01, -7.3851e-01, ..., -8.5208e-01, -1.2055e+00, 5.3158e-01]], [[-1.1257e+00, -1.5624e+00, -2.8198e+00, ..., -3.3264e+00, -2.3827e+00, -1.3415e+00]]], [[[-1.2000e+00, -3.4701e+00, -2.2661e+00, ..., -2.6385e+00, -3.1950e+00, -2.8861e+00]], [[-6.5208e-01, -3.3467e-01, 1.6247e+00, ..., 7.4128e-01, -1.0508e+00, 6.2993e+00]], [[-1.9254e+00, -2.6604e+00, -2.3802e+00, ..., -2.2639e+00, -2.6208e+00, -3.0242e+00]], ..., [[-1.7735e+00, -2.1412e+00, -1.9907e+00, ..., -1.8627e+00, -1.9631e+00, -2.0481e+00]], [[ 3.4542e-02, -1.6027e-01, -2.1971e-03, ..., -3.0693e-01, -1.0158e-01, 1.3578e+00]], [[-1.6569e+00, -2.3514e+00, -3.5267e+00, ..., -3.8358e+00, -2.3867e+00, -2.8208e+00]]], [[[-4.5147e-01, -6.1420e-01, -1.8948e+00, ..., -1.3776e+00, -1.0472e+00, -3.7293e+00]], [[ 4.2449e+00, 2.7558e+00, 4.3406e+00, ..., 2.3492e-01, 9.3034e-02, 1.1765e+01]], [[-1.0846e+00, -2.5252e+00, -2.2663e+00, ..., -2.1212e+00, -2.2666e+00, -3.5274e+00]], ..., [[-2.2577e+00, -2.9377e+00, -3.1037e+00, ..., -2.8390e+00, -2.9791e+00, -3.3328e+00]], [[ 6.8087e-01, -1.2126e-01, -2.6975e-01, ..., -7.7498e-01, -7.0842e-01, 1.0526e+00]], [[-1.5466e+00, -1.7139e+00, -2.7514e+00, ..., -1.7213e+00, -2.2981e+00, -2.3091e+00]]]]) attn_weights tensor([[[[-3.6017e-01, -2.7511e+00, -2.8343e+00, ..., -3.7576e-01, 5.0116e-01, 2.3920e-01]], [[-1.0073e+00, -2.0395e+00, -2.7886e+00, ..., -8.1446e-01, 1.8031e+00, 3.7342e-01]], [[-3.3072e+00, -3.9464e+00, -3.7356e+00, ..., -2.9043e+00, -2.3027e+00, -2.3365e+00]], ..., [[ 1.3135e+00, -4.1037e-01, 1.7463e-01, ..., -5.4648e-03, -8.0802e-01, -1.7691e-01]], [[-4.7500e+00, -2.4401e+00, -2.2932e+00, ..., -1.0993e+00, -7.3872e-01, -6.3706e-01]], [[ 1.0569e+00, 5.6939e-01, -1.4003e+00, ..., -2.9858e+00, 1.2061e+00, 3.8350e+00]]], [[[-2.6302e+00, -5.7429e+00, -6.0552e+00, ..., -7.3376e-01, 1.8019e+00, -1.3571e+00]], [[-8.6958e-01, -2.7749e+00, -2.9878e+00, ..., -1.0934e-01, 8.6617e-01, 2.2375e-01]], [[-3.8475e+00, -4.5124e+00, -4.4300e+00, ..., -3.1628e+00, -2.7609e+00, -3.1689e+00]], ..., [[ 1.1609e+00, -3.0087e-01, 6.3977e-01, ..., -1.0341e+00, 6.5624e-02, -1.1178e+00]], [[-4.3718e+00, -2.6461e+00, -2.5816e+00, ..., -9.5845e-01, -8.6736e-01, -8.2388e-01]], [[ 7.2961e-01, 4.7185e-01, -3.6377e+00, ..., -1.5244e+00, -1.6883e+00, 4.0587e+00]]], [[[-2.1477e+00, -4.0911e+00, -4.6255e+00, ..., -1.3425e+00, -2.2044e+00, -9.5483e-01]], [[-6.0509e-01, -2.2619e+00, -3.2956e+00, ..., -2.7669e-01, 4.5275e-01, -4.3382e-01]], [[-3.3970e+00, -4.1701e+00, -3.9786e+00, ..., -2.9599e+00, -2.9791e+00, -2.6527e+00]], ..., [[ 1.4104e+00, -2.0893e-01, 2.1143e-01, ..., 3.1601e-02, -1.2600e+00, -7.4429e-01]], [[-4.4679e+00, -2.3419e+00, -2.2754e+00, ..., -1.2715e+00, -7.9071e-01, -7.0634e-01]], [[ 1.2341e+00, 5.0492e-01, -3.9456e+00, ..., -1.8113e+00, -1.8355e+00, 2.6638e+00]]], [[[-1.2835e+00, -3.3865e+00, -2.1787e+00, ..., 5.8191e-01, 7.2044e-01, 4.7438e-01]], [[-1.1178e+00, -2.6824e+00, -2.9811e+00, ..., 2.9170e-01, 1.6224e+00, 5.5729e-01]], [[-3.6676e+00, -4.3002e+00, -4.0944e+00, ..., -2.8235e+00, -2.4021e+00, -2.7169e+00]], ..., [[ 1.2473e+00, -5.3529e-01, 1.1166e-01, ..., -9.2831e-02, -9.3614e-01, 3.1296e-01]], [[-4.4044e+00, -2.6874e+00, -2.5337e+00, ..., -1.0022e+00, -8.8861e-01, -8.6631e-01]], [[-1.7931e+00, -1.2873e+00, -3.5381e+00, ..., -2.1185e+00, -2.8829e-01, 2.3846e+00]]], [[[-3.6031e+00, -4.8836e+00, -5.0492e+00, ..., 2.1719e+00, 5.6756e-01, -1.2186e+00]], [[-2.8713e+00, -4.1239e+00, -4.7657e+00, ..., -5.7945e-01, -4.9219e-01, -1.4099e+00]], [[-3.1926e+00, -3.8071e+00, -3.7492e+00, ..., -2.8972e+00, -2.6259e+00, -2.4911e+00]], ..., [[ 1.5811e+00, -1.3829e-01, 2.8958e-01, ..., -2.8562e-01, 2.8388e-01, -2.1525e+00]], [[-4.7490e+00, -2.0223e+00, -1.9345e+00, ..., -8.9415e-01, -9.0719e-01, -2.9849e-01]], [[ 2.3878e+00, 1.4297e+00, -2.4005e+00, ..., -1.1064e+00, -2.6814e+00, 4.7256e+00]]]]) attn_weights tensor([[[[ -1.2093, -4.4645, -3.7371, ..., -2.4989, -1.9297, -1.1402]], [[ 1.7934, -0.3722, -2.0333, ..., -2.0405, -0.4587, -1.0414]], [[ -5.3305, -13.5597, -12.7113, ..., -5.5520, -2.6149, -5.0977]], ..., [[ -3.0606, -7.9484, -7.1826, ..., -2.8922, -1.3759, -3.0951]], [[ -1.2886, -3.6104, -3.2965, ..., -1.6678, -1.3365, -0.9712]], [[ -0.4584, -5.2731, -4.9315, ..., -3.0606, -2.5227, -2.5434]]], [[[ -1.8559, -5.0456, -5.5304, ..., -1.8887, -0.9869, -2.8992]], [[ 2.0863, -2.2043, -3.7057, ..., -2.1486, -2.1319, -2.7103]], [[ -6.0060, -15.8319, -15.6424, ..., -3.0421, -1.7287, -3.6447]], ..., [[ -3.6106, -9.2058, -9.0685, ..., -1.7962, -3.7282, -2.3979]], [[ -1.9984, -4.1858, -3.9737, ..., -1.5507, -1.6678, -1.4264]], [[ -0.5093, -5.4784, -5.2379, ..., -2.6951, -2.6932, -2.4804]]], [[[ -1.7761, -4.5496, -4.8785, ..., -2.9920, -3.0590, -2.6048]], [[ 2.0017, -0.4200, -1.7250, ..., -2.1827, -2.4647, -1.2663]], [[ -5.0060, -13.6347, -14.1184, ..., -4.6815, -3.6728, -3.9479]], ..., [[ -3.5541, -8.1562, -7.6440, ..., -3.4380, -1.2764, -3.0993]], [[ -2.0395, -3.8289, -3.6861, ..., -2.2706, -1.3716, -1.2503]], [[ -0.5251, -4.9650, -4.8354, ..., -3.0873, -2.5997, -2.6223]]], [[[ -1.5686, -5.7318, -4.2496, ..., -1.8531, -2.2957, -1.4926]], [[ 1.9189, -0.9840, -2.6489, ..., -3.2559, -1.2956, -3.6501]], [[ -7.6207, -16.8813, -16.2277, ..., -4.2541, -3.0518, -5.1867]], ..., [[ -4.9588, -10.3930, -10.4336, ..., -2.4209, -2.7443, -2.6458]], [[ -2.4418, -4.1164, -3.9374, ..., -1.5069, -1.7024, -1.1638]], [[ -0.5603, -5.5553, -5.4434, ..., -2.7593, -2.8818, -2.4375]]], [[[ -1.5163, -4.5685, -4.0498, ..., 0.4373, -1.7472, -3.3494]], [[ 2.3078, -0.9660, -0.4900, ..., -0.7901, -1.8372, -1.4269]], [[ -6.4539, -13.1668, -13.1856, ..., 0.0783, -1.0748, -3.7769]], ..., [[ -3.5613, -7.3290, -7.2924, ..., -2.2676, -2.1430, -1.3322]], [[ -1.7600, -3.5238, -3.4326, ..., -1.6080, -1.6189, -0.6867]], [[ -0.4731, -5.1744, -5.1489, ..., -3.1496, -2.8909, -2.2962]]]]) attn_weights tensor([[[[ 4.5837, 0.2504, -1.3754, ..., -1.8698, 0.1608, 1.5022]], [[ -2.4376, -6.6811, -6.4858, ..., -5.7658, -3.0302, -4.2505]], [[ -4.4837, -8.6263, -9.6488, ..., -6.7378, -3.9805, -5.0709]], ..., [[ -1.5155, -4.8334, -5.3906, ..., -5.9665, -3.2996, -2.7583]], [[ -0.8890, -5.7346, -4.8568, ..., -4.3146, -3.0629, -2.9853]], [[ -2.3996, -7.5297, -8.7648, ..., -4.6151, -4.0336, -4.0289]]], [[[ 5.2901, -1.0733, -3.0791, ..., -2.0327, -1.9242, 0.9196]], [[ -2.6909, -7.2788, -6.6807, ..., -6.2002, -4.1173, -4.6184]], [[ -4.2787, -13.5817, -13.8684, ..., -5.1680, -2.0080, -3.3983]], ..., [[ -1.8454, -6.0202, -8.0642, ..., -2.6156, -3.8215, -2.5377]], [[ -0.9560, -7.3650, -7.8721, ..., -2.5282, -3.1536, -1.6072]], [[ -2.3219, -7.9030, -10.0586, ..., -2.6457, -2.5753, -2.7802]]], [[[ 5.0857, -0.3959, -4.7473, ..., -0.9431, -2.6834, 0.9903]], [[ -2.6769, -5.0180, -4.6784, ..., -4.5536, -5.8087, -4.9926]], [[ -4.5854, -11.2481, -10.7625, ..., -4.3335, -4.2390, -4.5760]], ..., [[ -1.6444, -5.7346, -5.0835, ..., -3.7202, -4.3964, -4.3319]], [[ -0.9135, -6.1394, -5.7448, ..., -4.1510, -3.2463, -1.9546]], [[ -2.4409, -6.6740, -8.1596, ..., -3.3030, -3.2579, -2.7023]]], [[[ 3.5397, -1.3320, -2.8716, ..., -2.0804, -1.0174, 0.4960]], [[ -2.8211, -8.8869, -8.2647, ..., -5.2558, -3.5366, -4.9789]], [[ -4.3540, -12.3996, -14.3690, ..., -5.3016, -3.0479, -4.0844]], ..., [[ -1.7550, -7.5855, -8.3053, ..., -4.3509, -3.3223, -2.8679]], [[ -1.1875, -5.5660, -5.2438, ..., -3.0493, -3.0933, -2.1537]], [[ -2.6250, -8.8526, -9.6875, ..., -4.4011, -3.6631, -3.7756]]], [[[ 5.3331, -0.2524, -1.2161, ..., -1.9294, -2.4578, 2.1176]], [[ -2.1824, -5.4591, -5.7254, ..., -4.0497, -3.7037, -4.4829]], [[ -3.8003, -7.2895, -8.8751, ..., -3.1792, -0.2669, -2.8429]], ..., [[ -1.2432, -5.4319, -5.1422, ..., 0.0427, -2.0138, -0.6407]], [[ -0.6004, -5.9585, -4.9907, ..., -3.1093, -3.0679, -1.8918]], [[ -1.6881, -7.0955, -6.9587, ..., -1.8554, -1.0389, 0.4014]]]]) attn_weights tensor([[[[-2.2322e+00, -1.0194e+01, -1.0581e+01, ..., -7.1840e+00, -4.5763e+00, -5.1106e+00]], [[-1.8459e+00, -8.6671e+00, -1.0163e+01, ..., -7.5453e+00, -3.1412e+00, -3.9487e+00]], [[ 1.6723e-01, -9.5929e-01, -1.7152e+00, ..., -7.3286e-01, -1.5865e+00, -2.4150e+00]], ..., [[-1.4759e+00, -4.2987e+00, -4.3400e+00, ..., -1.5305e+00, -2.8203e+00, -4.3744e+00]], [[ 1.3355e+00, -1.8900e+00, -3.0020e+00, ..., -2.0785e+00, -1.3560e+00, -1.4225e+00]], [[-1.0318e+01, -2.0110e+01, -2.9111e+01, ..., -1.5178e+01, 2.3505e+00, -5.3915e+00]]], [[[-2.7645e+00, -1.2078e+01, -1.2848e+01, ..., -3.9266e+00, -2.8925e+00, -3.2463e+00]], [[-2.3657e+00, -8.9904e+00, -1.0261e+01, ..., -3.7360e+00, -2.9675e+00, -2.4799e+00]], [[-6.7234e-02, -4.7308e+00, -4.1452e+00, ..., -4.2079e+00, -4.1740e+00, -4.2283e+00]], ..., [[-1.4585e+00, -5.6543e+00, -6.4992e+00, ..., -2.4108e+00, -8.5894e-01, -3.1323e+00]], [[ 1.5819e+00, -3.4835e+00, -3.6549e+00, ..., -5.3817e+00, -3.6671e+00, -4.4085e+00]], [[-8.2952e+00, -3.1889e+01, -3.9358e+01, ..., -5.0530e-01, 1.1867e+01, 4.2295e+00]]], [[[-2.7466e+00, -9.3152e+00, -1.0224e+01, ..., -4.4599e+00, -4.0217e+00, -4.3239e+00]], [[-2.0166e+00, -6.7440e+00, -6.1884e+00, ..., -4.1884e+00, -5.2158e+00, -4.1087e+00]], [[ 9.8147e-02, -2.8087e+00, -3.4229e+00, ..., -5.5990e+00, -4.3808e+00, -4.1345e+00]], ..., [[-1.1188e+00, -4.9928e+00, -4.1518e+00, ..., -2.1954e+00, -1.3521e+00, -1.4240e+00]], [[ 1.4278e+00, -2.3508e+00, -3.1967e+00, ..., -3.3902e+00, -2.7681e+00, -3.2833e+00]], [[-5.6886e+00, -2.8906e+01, -3.1858e+01, ..., -6.5298e+00, 1.2789e+01, 3.0931e+00]]], [[[-3.0679e+00, -1.1069e+01, -1.1313e+01, ..., -6.1010e+00, -4.2753e+00, -4.8802e+00]], [[-2.8308e+00, -8.3570e+00, -8.1319e+00, ..., -2.6284e+00, 2.6765e-02, -1.5907e+00]], [[-3.9798e-01, -3.2009e+00, -3.9201e+00, ..., -3.9571e+00, -3.3441e+00, -3.9645e+00]], ..., [[-1.3915e+00, -5.2765e+00, -6.4873e+00, ..., -1.4703e+00, -2.6689e+00, -3.1470e+00]], [[ 1.2558e+00, -2.8574e+00, -3.2931e+00, ..., -4.2293e+00, -2.1799e+00, -2.1932e+00]], [[-7.6964e+00, -1.8718e+01, -2.7185e+01, ..., -1.2376e+01, 9.0937e+00, 1.6436e+00]]], [[[-1.1242e+00, -8.2860e+00, -8.2646e+00, ..., -1.8985e+00, -1.2542e+00, -2.8900e+00]], [[-1.0887e+00, -4.9052e+00, -6.7508e+00, ..., -2.8327e+00, -3.3743e+00, -3.4591e+00]], [[ 4.6442e-01, -3.0563e+00, -3.7896e+00, ..., -1.8829e+00, -2.9564e+00, -1.0962e+00]], ..., [[-2.3970e-01, -4.2428e+00, -5.9849e+00, ..., -2.9465e+00, -1.6361e+00, -2.1216e+00]], [[ 1.6080e+00, -1.8076e+00, -1.2398e+00, ..., -1.7761e+00, -1.7464e+00, -2.5974e+00]], [[-7.6110e+00, -2.0081e+01, -1.4917e+01, ..., 5.9610e+00, 1.6559e+01, 1.2573e+00]]]]) attn_weights tensor([[[[ 2.3827, -2.1852, -3.2297, ..., -4.5695, -2.0020, -1.7321]], [[ 4.2855, -8.8430, -6.1491, ..., -10.6403, -9.3299, -2.7438]], [[ 0.3762, -3.1537, -3.5582, ..., -2.8500, -1.4736, -3.7504]], ..., [[ 1.1049, -3.1039, -2.6862, ..., -3.0857, -1.9210, -1.7144]], [[ 2.0234, -0.3332, -1.8342, ..., -0.2318, 0.0525, -1.9427]], [[ 1.0521, -3.5042, -2.4189, ..., -4.9041, -1.3454, 0.1260]]], [[[ 2.5170, -7.2688, -4.7106, ..., -2.7068, -3.1866, -3.2231]], [[ 4.1128, -11.5461, -10.0242, ..., -3.7899, -3.0514, -2.5964]], [[ 0.0702, -4.4323, -5.3883, ..., -0.2633, 1.5798, -1.9701]], ..., [[ 1.2169, -3.9650, -4.0044, ..., -3.0996, -2.7806, -4.6086]], [[ 2.0697, -1.6585, -2.4371, ..., -1.2399, -0.8777, -0.9423]], [[ 1.1288, -2.6693, -2.7079, ..., -3.5121, -0.9772, -0.5803]]], [[[ 2.4781, -5.3853, -6.5166, ..., -3.6506, -2.4665, -2.3453]], [[ 4.4375, -11.5164, -12.6205, ..., -11.4398, -4.4120, -2.5670]], [[ 0.1974, -5.2314, -5.1876, ..., -2.1743, -1.5564, -3.8005]], ..., [[ 1.2022, -4.0618, -4.1939, ..., -4.1847, -3.7583, -5.6066]], [[ 2.3197, -1.2808, -0.3434, ..., -1.5741, 0.6618, -0.6667]], [[ 0.9491, -4.5889, -4.2155, ..., -3.1049, -2.6024, -1.1361]]], [[[ 2.2998, -5.1547, -6.6398, ..., -1.9266, -0.3883, -2.9947]], [[ 4.1749, -11.1601, -6.9141, ..., -3.8720, -1.2194, -0.9085]], [[ 0.2101, -5.2255, -6.8026, ..., -1.6911, -1.5858, -3.1682]], ..., [[ 0.6606, -3.7207, -4.0321, ..., -1.6341, -1.4890, -3.6725]], [[ 1.5335, -2.4044, -5.3567, ..., -3.0258, -1.2961, -2.1219]], [[ 0.8164, -3.2338, -2.6414, ..., -1.8747, -1.4150, 0.9391]]], [[[ 2.9458, -3.4332, -3.0275, ..., -3.3801, -3.4259, -2.1489]], [[ 4.0171, -7.0220, -6.4812, ..., -5.7554, -8.3747, -2.9897]], [[ 0.8482, -3.0538, -4.6274, ..., -0.4163, 0.2746, -1.9203]], ..., [[ 1.0729, -3.2986, -3.5064, ..., -2.6280, -3.9257, -6.1558]], [[ 2.7474, -1.6064, -1.9431, ..., -1.1693, -2.7213, -3.1943]], [[ 1.0737, -1.0987, -2.0342, ..., -1.2403, -1.6809, -0.7254]]]]) attn_weights tensor([[[[-0.3752, -4.7714, -3.6627, ..., -4.3519, -3.8004, -3.5927]], [[-0.3688, -3.0199, -4.0356, ..., -2.1802, -2.1360, -2.2777]], [[ 0.4190, -2.7019, -2.8103, ..., -3.0402, -2.0424, -3.1443]], ..., [[ 4.5037, -5.5228, -3.5712, ..., -4.4388, -2.6376, -0.7366]], [[ 2.6774, -2.5001, -2.2659, ..., -1.9653, -1.3082, -1.8705]], [[ 0.6490, -4.4584, -6.1164, ..., -4.1338, -4.8925, -2.6070]]], [[[-1.5062, -5.6682, -5.2234, ..., -2.4510, -2.6486, -2.6133]], [[-0.5647, -3.9281, -6.1180, ..., -2.5442, -3.3251, -4.8868]], [[ 0.2652, -3.5658, -3.1749, ..., -4.6376, -3.1634, -3.6853]], ..., [[ 4.7850, -9.4367, -6.9515, ..., -0.6372, -2.8043, -0.1481]], [[ 3.1523, -3.4394, -4.1093, ..., -2.4435, -2.7542, -1.5690]], [[-0.8192, -4.0457, -5.6799, ..., -2.6893, -3.0165, -1.8254]]], [[[-1.0369, -6.0578, -5.1308, ..., -5.3387, -2.6431, -4.1343]], [[ 0.0683, -4.1149, -6.2806, ..., -4.2893, -3.7498, -3.6180]], [[ 0.4920, -3.0812, -2.6514, ..., -4.0498, -3.9430, -4.2907]], ..., [[ 4.1128, -6.4040, -5.2642, ..., -6.0534, -2.6291, -1.9484]], [[ 3.0302, -1.8537, -3.4295, ..., -2.0367, -2.5836, -1.2133]], [[-0.2228, -3.9461, -5.4994, ..., -2.8669, -2.2330, -1.8506]]], [[[-0.6047, -6.5371, -7.4660, ..., -3.4714, -4.6789, -3.9529]], [[-1.4564, -6.7631, -6.1231, ..., -1.0582, -3.3020, -2.0794]], [[ 0.3274, -3.3283, -3.1509, ..., -3.9669, -3.1321, -2.9609]], ..., [[ 3.3976, -8.9037, -6.2944, ..., -0.9856, -1.6104, -3.1817]], [[ 3.5681, -4.2726, -1.9237, ..., -3.9145, -2.5563, -0.2717]], [[-0.3169, -4.6022, -6.2408, ..., -1.8053, -1.5953, -1.4681]]], [[[ 0.3486, -5.0909, -5.0545, ..., -2.5773, -3.2370, -3.2991]], [[ 1.5431, -4.1273, -6.4907, ..., -3.1241, -1.8800, -2.8308]], [[ 0.3317, -2.8751, -2.9435, ..., -2.7519, -2.8181, -1.6203]], ..., [[ 4.6642, -5.1937, -3.1393, ..., -4.3440, -6.2122, -3.1367]], [[ 2.9146, -1.6757, -1.4612, ..., -2.5517, -2.4582, -0.2094]], [[ 0.8445, -3.5342, -5.7957, ..., -1.8003, -1.9738, 0.0723]]]]) attn_weights tensor([[[[-4.5296e-01, -7.5520e+00, -7.8308e+00, ..., -5.6643e+00, -3.2272e+00, -4.1089e+00]], [[ 3.0605e+00, -1.3273e+00, -1.4999e+00, ..., -1.8769e+00, 2.3230e-01, -6.2769e-01]], [[ 6.0762e+00, -2.5667e+00, -7.3545e-01, ..., -2.9019e+00, -2.5471e+00, 2.4883e-01]], ..., [[ 5.1789e-01, -3.4471e+00, -3.9169e+00, ..., -4.6720e+00, -1.7993e+00, -7.0547e-01]], [[ 4.3615e+00, -2.4855e+00, -1.0063e+00, ..., -1.8474e+00, -1.7057e+00, -6.5747e-01]], [[ 2.8872e+00, -1.4464e+00, -1.6061e+00, ..., -3.5859e+00, -1.5316e+00, -1.3803e-01]]], [[[-6.9297e-01, -7.6809e+00, -8.3258e+00, ..., -3.1707e+00, -3.4977e+00, -5.1302e+00]], [[ 3.3170e+00, -1.9185e+00, -2.1505e+00, ..., -7.5144e-01, -9.7616e-02, -2.9012e-01]], [[ 6.8601e+00, -6.3928e+00, -7.0357e+00, ..., -6.4308e-01, 1.9403e+00, -3.2722e-01]], ..., [[ 9.4763e-02, -2.1215e+00, -2.1256e+00, ..., -1.7699e+00, -2.0639e+00, -2.1176e+00]], [[ 4.1651e+00, -3.8831e+00, -2.7772e+00, ..., -1.3402e+00, -1.5530e-01, -7.6123e-01]], [[ 2.8173e+00, -3.3150e+00, -4.9722e+00, ..., -1.5691e+00, -1.8774e+00, -3.9179e+00]]], [[[-2.6599e-01, -9.2388e+00, -8.7755e+00, ..., -6.2574e+00, -2.9080e+00, -5.2711e+00]], [[ 3.5416e+00, -1.6038e+00, -1.2927e+00, ..., -1.4942e+00, -1.8153e+00, 1.0373e+00]], [[ 6.3891e+00, -5.1794e+00, -5.4945e+00, ..., -4.1058e+00, -8.2732e-01, 1.4011e+00]], ..., [[ 4.6046e-02, -1.8044e+00, -2.3219e+00, ..., -4.2920e+00, -2.2639e+00, -2.1828e+00]], [[ 4.0567e+00, -4.1651e+00, -2.3359e+00, ..., -4.2850e+00, -2.1380e+00, -2.6118e-01]], [[ 2.7563e+00, -2.6244e+00, -4.8047e+00, ..., -3.8962e+00, -2.9079e+00, -4.6726e-01]]], [[[-3.3512e-02, -8.0342e+00, -9.5864e+00, ..., -4.8204e+00, -3.3474e+00, -5.8611e+00]], [[ 1.9422e+00, -3.8253e+00, -4.4764e+00, ..., -1.8876e+00, -3.3257e+00, -2.3084e+00]], [[ 6.0847e+00, -5.6433e+00, -4.9494e+00, ..., -2.9095e+00, -3.1997e+00, -1.0913e+00]], ..., [[-2.7110e-02, -3.3774e+00, -5.0667e+00, ..., -2.9455e+00, -1.1417e+00, -1.9679e+00]], [[ 1.5934e+00, -5.1827e+00, -3.7860e+00, ..., -1.2596e+00, -1.7504e+00, -2.0964e+00]], [[ 2.4267e+00, -2.5532e+00, -2.8088e+00, ..., -1.5152e+00, -2.0625e+00, -2.6433e+00]]], [[[-7.1211e-03, -7.3244e+00, -6.7707e+00, ..., -2.6375e+00, -2.8774e+00, -3.6365e+00]], [[ 3.4646e+00, -1.7766e+00, -1.8230e+00, ..., -6.1922e-01, -4.5144e-01, -7.9765e-01]], [[ 6.4695e+00, -2.1111e+00, -3.1029e+00, ..., -3.3051e+00, -1.8660e+00, 4.0689e-01]], ..., [[ 1.3156e+00, -2.9702e+00, -3.3462e+00, ..., -5.1878e-02, -1.7784e+00, -1.0091e+00]], [[ 4.7693e+00, -3.0990e+00, -2.3055e+00, ..., -1.8913e+00, -3.2344e+00, -2.6363e+00]], [[ 3.0770e+00, -6.2049e-01, -3.1374e+00, ..., -1.8704e+00, -2.7216e+00, -1.4768e+00]]]]) attn_weights tensor([[[[ 1.2457, -2.0339, -1.9878, ..., -2.2430, -1.0749, -2.0343]], [[ 3.5446, -0.3155, 0.7413, ..., -1.5934, -1.8448, 0.6333]], [[ 1.7697, 0.1391, -0.1204, ..., 0.5356, 1.0650, -0.0857]], ..., [[ 1.0081, -2.5338, -1.8054, ..., -1.4150, -0.7096, -1.5351]], [[ 1.1875, -2.4115, -1.9810, ..., -1.9895, -1.9443, -1.6707]], [[ 0.9617, -3.2630, -3.4399, ..., -3.7543, -2.8781, -4.0561]]], [[[ 1.6551, -3.0103, -2.6816, ..., -4.0197, -3.5391, -3.8930]], [[ 5.8897, -3.1888, -3.2405, ..., -1.2601, -0.5619, 0.2799]], [[ 1.1275, -0.0417, -1.4892, ..., -0.5736, -2.4171, -0.9563]], ..., [[ 1.4433, -4.4978, -3.8434, ..., -0.8955, -2.9525, -2.7412]], [[ 0.9544, -3.1126, -3.0752, ..., -2.0997, -2.1762, -1.6667]], [[ 1.1297, -1.8481, -2.7742, ..., -3.4998, -3.5067, -4.8522]]], [[[ 1.5678, -2.9923, -3.6510, ..., -4.9189, -3.4207, -2.2509]], [[ 5.5360, 0.1020, -0.1470, ..., -1.7738, -1.4888, 1.4946]], [[ 1.8156, -0.1440, -1.2488, ..., -0.4978, -1.3715, -0.7737]], ..., [[ 1.0842, -3.7402, -2.6145, ..., -2.6899, -1.2931, -1.8504]], [[ 0.8362, -3.0113, -3.3002, ..., -2.9727, -2.2112, -1.0857]], [[ 1.0099, -2.6144, -3.7690, ..., -5.3623, -3.0690, -3.4918]]], [[[ 1.0117, -2.6537, -2.6819, ..., -3.3869, -3.1666, -1.4117]], [[ 1.8283, -4.4485, -3.6122, ..., -0.9629, -2.3550, -3.2144]], [[ 2.4740, -1.7242, -2.8769, ..., -2.1100, -2.3986, -2.8559]], ..., [[ 0.7941, -4.4047, -3.5496, ..., -1.0168, -1.9360, -2.5485]], [[ 1.0528, -3.9421, -3.8808, ..., -1.4127, -1.4688, -1.2833]], [[ 0.3298, -4.0311, -4.2418, ..., -5.0068, -5.2457, -4.5583]]], [[[ 1.5564, -2.5582, -3.0950, ..., -2.3832, -4.4276, -1.9838]], [[ 5.5555, -0.9579, 0.1005, ..., -0.2748, 0.3712, 0.5526]], [[ 2.0146, -0.7940, -1.7194, ..., -1.5875, -1.7353, -0.9311]], ..., [[ 1.2068, -3.8622, -3.0642, ..., -1.9951, -2.4877, -2.7525]], [[ 1.1591, -3.2011, -2.8810, ..., -1.3998, -1.0942, -1.5349]], [[ 0.8700, -3.1362, -3.8067, ..., -2.9561, -4.1943, -5.4049]]]]) attn_weights tensor([[[[ 1.9691, -1.3059, -2.3421, ..., -1.2137, -1.1541, -2.4491]], [[ 3.5637, -0.4138, -1.4883, ..., -2.5595, -0.7064, 0.6028]], [[ 1.8188, -2.1532, -2.3000, ..., -1.8054, -0.5102, -2.0696]], ..., [[ 3.3096, -2.3084, -2.9287, ..., -2.2610, -2.5352, -3.2457]], [[ 1.3860, -4.1237, -5.2740, ..., -4.2158, -0.9611, -0.5442]], [[ 3.4644, 0.6425, -0.4948, ..., -1.2228, -0.8348, -0.8385]]], [[[ 1.7608, -2.8661, -2.8601, ..., 0.2405, -4.4474, -3.0973]], [[ 3.8466, -1.0411, -2.7887, ..., -3.3374, -0.6630, -0.0913]], [[ 2.5436, -3.8802, -3.5617, ..., -0.5976, -3.4834, -2.2304]], ..., [[ 4.8117, -1.9564, -3.1712, ..., -0.6702, -2.5017, -0.6421]], [[ 0.0593, -6.0364, -5.5155, ..., -1.0734, -3.0853, -1.6879]], [[ 3.9216, -0.8471, -3.3775, ..., -4.5725, -3.1398, -1.9911]]], [[[ 1.7994, -3.0267, -3.2234, ..., -3.7748, 0.0103, -2.6251]], [[ 4.3251, -0.5936, -2.8993, ..., -0.8135, -2.8384, 0.4321]], [[ 2.7701, -2.4998, -2.9356, ..., -3.4949, -0.1079, -1.3194]], ..., [[ 4.9588, -1.2946, -2.1771, ..., -2.7936, -0.2888, 0.7788]], [[ 0.3005, -5.8643, -5.2700, ..., -1.8708, 0.3275, -0.6487]], [[ 3.7865, -0.7236, -3.4382, ..., -2.3813, -3.1882, -1.5739]]], [[[ 1.3256, -4.6370, -5.7659, ..., -2.5979, -3.7229, -3.7109]], [[ 2.6236, -2.7578, -2.6376, ..., -3.1132, -2.7980, -1.1060]], [[ 1.6706, -4.3824, -5.0885, ..., -1.0808, -2.1432, -3.4611]], ..., [[ 2.9835, -3.6573, -3.1115, ..., -1.8732, -2.8418, -1.9766]], [[ 0.7773, -4.7789, -6.0042, ..., -3.5971, -0.7862, -2.4076]], [[ 2.9761, -2.6055, -2.8662, ..., -3.5903, -3.2157, -3.1836]]], [[[ 2.4383, -2.8889, -4.3228, ..., -3.8539, -3.7595, -3.7885]], [[ 4.1256, -0.2305, -1.4468, ..., -2.3699, -0.5446, -0.9730]], [[ 2.1409, -3.6897, -2.9074, ..., -2.6412, -2.6512, -2.4579]], ..., [[ 3.4364, -2.5962, -3.0641, ..., -1.6374, -2.5370, -2.3795]], [[ 1.6812, -5.7654, -6.1745, ..., -2.0024, -1.5476, -2.3541]], [[ 4.0632, 2.0257, -1.6472, ..., -0.8414, 0.2524, -0.3444]]]]) attn_weights tensor([[[[ 2.1395e+00, -2.8504e+00, -3.6424e+00, ..., -2.7419e+00, -2.2829e+00, -3.6798e+00]], [[ 2.9499e+00, -8.1464e-01, -2.5953e+00, ..., -1.9835e+00, -8.1900e-01, -9.6709e-01]], [[ 2.4592e+00, -1.2591e+00, -1.3544e+00, ..., -1.2202e+00, -1.0453e+00, -1.6331e+00]], ..., [[ 8.4574e-01, -2.9568e+00, -2.4563e+00, ..., -2.7310e+00, -2.5148e-01, -1.6896e+00]], [[ 2.8551e+00, -2.2340e+00, -1.2932e+00, ..., -2.2542e+00, -2.6487e+00, -2.6103e+00]], [[ 2.7309e+00, -6.4875e-01, -1.5884e+00, ..., -1.4352e+00, 6.6999e-01, -1.0459e+00]]], [[[ 2.9934e+00, -2.8020e+00, -4.8157e+00, ..., -1.1362e+00, -4.5066e+00, -3.9350e+00]], [[ 4.7576e+00, -7.1547e-01, -3.0627e+00, ..., 3.9810e-01, -1.1509e+00, 8.5947e-02]], [[ 2.8212e+00, 1.3105e+00, -1.3810e+00, ..., -1.0360e+00, -2.5424e+00, -1.5450e+00]], ..., [[-1.1764e+00, -4.7363e+00, -5.3848e+00, ..., 2.1791e+00, -2.2606e+00, -6.1991e-01]], [[ 3.7996e+00, -2.1785e+00, -2.7838e+00, ..., -1.9550e+00, -4.1681e+00, -3.7748e+00]], [[ 4.3421e+00, -2.4750e+00, -1.6178e+00, ..., 8.4018e-01, 7.6447e-01, -5.0069e-03]]], [[[ 3.0169e+00, -2.4941e+00, -3.8472e+00, ..., -4.9222e+00, -1.2966e+00, -2.9678e+00]], [[ 4.9259e+00, 5.4674e-02, -1.9941e+00, ..., -2.9385e+00, 2.2335e-01, 4.8947e-01]], [[ 2.7515e+00, 2.0276e+00, -5.5449e-01, ..., -2.8607e+00, -6.7326e-01, 8.8748e-03]], ..., [[-6.2404e-01, -4.6700e+00, -4.9270e+00, ..., -3.1404e+00, 1.8536e+00, -1.5205e+00]], [[ 3.9296e+00, -1.1002e+00, -1.5389e+00, ..., -4.4106e+00, -1.6699e+00, -2.2823e+00]], [[ 4.1417e+00, -2.9390e+00, -1.7253e+00, ..., -2.3705e+00, -3.3963e-01, -1.4589e+00]]], [[[ 3.1808e+00, -4.4458e+00, -4.7618e+00, ..., -3.8162e+00, -4.6553e+00, -5.7872e+00]], [[ 3.3661e+00, -3.0251e+00, -2.5674e+00, ..., -1.1814e+00, -5.7033e-01, -2.0920e+00]], [[ 2.6031e+00, -2.1029e+00, -2.2955e+00, ..., -2.6113e+00, -2.7740e+00, -2.5448e+00]], ..., [[ 4.3844e-01, -5.0347e+00, -4.4146e+00, ..., -2.5759e+00, -3.3610e+00, -3.2803e+00]], [[ 2.7441e+00, -3.5851e+00, -2.7099e+00, ..., -3.2960e+00, -2.6596e+00, -2.0154e+00]], [[ 3.6344e+00, -3.1497e+00, -3.8907e+00, ..., -1.1857e+00, -1.2820e+00, -2.6665e+00]]], [[[ 2.3756e+00, -2.7241e+00, -3.6593e+00, ..., -2.7176e+00, -2.8006e+00, -3.6692e+00]], [[ 3.4714e+00, -1.7181e+00, -3.3882e+00, ..., -3.3553e-01, -1.8487e+00, -1.4991e+00]], [[ 2.6405e+00, -9.5804e-02, -2.0357e+00, ..., -9.5638e-01, -9.3429e-01, -1.0926e+00]], ..., [[ 4.0740e-01, -2.8675e+00, -4.0302e+00, ..., -1.2938e+00, -4.2455e-01, -9.4023e-01]], [[ 2.8378e+00, -3.2172e+00, -1.7629e+00, ..., -2.4225e+00, -1.9879e+00, -3.2337e+00]], [[ 3.6156e+00, -9.2273e-01, -5.0514e-01, ..., -1.3897e+00, -4.0655e-01, -1.2538e+00]]]]) attn_weights tensor([[[[ 1.1891, 1.6597, 1.1458, ..., 1.2702, 0.7313, 2.0323]], [[ 2.7231, 0.4146, -0.5390, ..., 0.2418, 0.9483, -0.7537]], [[ 2.5348, 0.0435, -2.0030, ..., -2.0829, 0.8372, -1.4139]], ..., [[ 3.3137, -0.2425, -1.4272, ..., -0.6183, -0.5861, -0.6703]], [[ 3.1100, 1.7172, 0.3583, ..., 0.3570, 2.3646, 1.2277]], [[ 2.9722, 0.7089, -0.7270, ..., 0.1870, -0.0881, 0.8310]]], [[[ 1.2043, 2.6413, 1.1815, ..., 0.7168, 0.6943, 2.0328]], [[ 3.9707, -0.7220, -1.2715, ..., -0.2182, -1.3065, -0.3552]], [[ 3.9087, 0.8110, -1.8998, ..., -0.8018, -2.2748, -2.0030]], ..., [[ 4.8033, -0.1155, -1.6553, ..., -0.0737, -0.8098, 0.6121]], [[ 2.6614, 0.0259, -1.1493, ..., -0.4123, 0.2450, 0.0217]], [[ 2.9123, 1.2937, -0.6154, ..., 2.7881, 0.4759, 0.4042]]], [[[ 1.1193, 2.9147, 1.3065, ..., 0.6092, -0.0106, 1.5591]], [[ 3.5688, 0.1487, -0.6526, ..., -2.2883, 0.3756, -0.2830]], [[ 3.8615, 1.0220, -1.6998, ..., -5.4103, -1.1490, -1.6768]], ..., [[ 4.8150, 0.1499, -1.0879, ..., -4.3478, -0.6508, 0.5889]], [[ 2.6170, 0.4416, -0.9004, ..., -2.2382, 0.4518, -0.4093]], [[ 2.4502, 1.1574, -0.3821, ..., -0.6589, 2.5351, 0.4337]]], [[[ 0.8635, 1.3621, 0.0847, ..., 0.4340, 0.6632, 1.0984]], [[ 3.4617, -1.3836, -1.4540, ..., -0.5663, -1.3736, -0.8073]], [[ 3.6116, -1.2033, -1.5111, ..., -2.2291, -2.5677, -4.3667]], ..., [[ 4.1529, -1.3005, -2.4623, ..., -0.9164, -0.7723, -2.2369]], [[ 2.7894, -0.4843, -1.2832, ..., -0.8482, 0.9730, 0.5924]], [[ 1.8078, 1.9393, -0.5268, ..., -0.6979, 2.2621, -0.3936]]], [[[ 1.1670, 1.4785, 0.4320, ..., 1.7537, 1.5513, 2.3486]], [[ 3.1222, 0.1273, -0.8214, ..., -0.6751, 0.6233, -0.8828]], [[ 2.7335, 0.6172, -1.5129, ..., -0.4046, -0.6337, -1.1374]], ..., [[ 3.4239, -0.7208, -2.0821, ..., -1.2730, -1.5959, -0.4416]], [[ 3.0531, 1.9925, -0.1967, ..., 1.6540, 1.3258, 0.3769]], [[ 1.8301, 2.3233, -0.7156, ..., 0.7287, 1.3242, 0.1846]]]]) attn_weights tensor([[[[-1.3061, -3.0111, -2.2333, ..., -2.6519, -0.7776, -2.7562]], [[ 1.5252, -0.2411, 0.5278, ..., -0.5295, -1.2056, 7.7632]], [[-1.6355, -2.3055, -2.1126, ..., -1.7188, -1.8078, -3.0878]], ..., [[-1.9464, -2.3010, -2.3866, ..., -2.1108, -1.9752, -2.6537]], [[ 0.1873, -0.2908, -0.3243, ..., -0.2850, -0.3563, 1.1047]], [[-0.9135, -2.3346, -3.1624, ..., -2.3710, -2.4939, -2.5560]]], [[[-1.5296, -4.6150, -2.5933, ..., -4.0476, -2.5066, -4.6282]], [[-2.3018, -0.1174, -3.5357, ..., -3.3380, -4.3804, 3.8084]], [[-1.7372, -3.2339, -2.0921, ..., -2.9165, -3.8250, -3.0870]], ..., [[-1.7432, -2.1491, -2.1019, ..., -1.9635, -2.3264, -1.8411]], [[-0.4247, -0.7078, -0.8851, ..., -0.3759, -0.9471, 0.0696]], [[-1.3079, -2.0968, -3.3681, ..., -2.2672, -2.3514, -2.0203]]], [[[-1.6401, -5.0392, -2.5576, ..., -2.4375, -2.3306, -4.7946]], [[-3.3084, 2.4146, -3.6279, ..., -5.3134, -3.5502, 3.5213]], [[-2.3238, -1.2262, -3.0335, ..., -4.6380, -2.4197, -0.8118]], ..., [[-1.8090, -2.1953, -2.2093, ..., -2.6271, -1.9648, -2.0423]], [[-0.4443, -0.5529, -0.7244, ..., -0.9732, -0.6759, -0.2745]], [[-1.5743, -2.2829, -3.6151, ..., -2.6198, -1.5339, -2.2732]]], [[[-1.0659, -3.5393, -1.9620, ..., -3.3240, -2.3774, -3.3573]], [[-1.3989, 0.7064, -2.7705, ..., 0.3153, -3.1702, 5.1491]], [[-2.0311, -2.9366, -2.7056, ..., -2.9686, -3.7306, -2.6912]], ..., [[-1.9307, -2.3442, -2.4131, ..., -2.2389, -2.3365, -2.2107]], [[-0.0664, -0.3032, -0.4505, ..., -0.2431, -0.4881, 0.1610]], [[-1.4261, -2.0613, -3.4175, ..., -2.1711, -2.8322, -2.8283]]], [[[-1.6401, -5.0392, -2.5576, ..., -3.6936, -0.5766, -4.7946]], [[-3.3084, 2.4146, -3.6279, ..., -5.5807, -5.3018, 3.5213]], [[-2.3238, -1.2262, -3.0335, ..., -4.8531, -3.6551, -0.8118]], ..., [[-1.8090, -2.1953, -2.2093, ..., -2.2091, -2.3218, -2.0423]], [[-0.4443, -0.5529, -0.7244, ..., -0.6503, -0.9066, -0.2745]], [[-1.5743, -2.2829, -3.6151, ..., -2.7145, -1.8304, -2.2732]]]]) attn_weights tensor([[[[-1.8992, -3.7117, -3.3305, ..., 0.1162, 0.8949, 0.3363]], [[-2.1067, -3.1400, -3.2701, ..., 1.2797, 1.2421, -0.1805]], [[-3.5396, -4.1584, -4.0456, ..., -2.5308, -2.6345, -2.7085]], ..., [[ 1.1607, -0.6323, -0.0549, ..., -0.9324, 0.1324, -0.0859]], [[-4.5023, -2.5145, -2.4335, ..., -0.7786, -0.6641, -0.7836]], [[ 1.0442, 0.3898, -2.9512, ..., 1.4866, -1.3344, 4.5471]]], [[[-0.3572, -3.0581, -2.1582, ..., -0.4367, -0.0668, 0.0064]], [[ 0.0422, -1.9208, -2.3697, ..., -0.5129, -0.5857, 0.9886]], [[-3.2405, -4.0762, -3.8331, ..., -2.5269, -2.7795, -2.0234]], ..., [[ 1.5410, -0.2639, 0.2894, ..., 0.0201, -0.4401, -0.5969]], [[-4.3224, -2.3705, -2.2577, ..., -0.8587, -0.8239, -0.4005]], [[-0.0907, -0.8799, -1.8882, ..., -1.4657, -1.5994, -0.1739]]], [[[-0.6839, -3.7344, -2.1057, ..., 0.1270, 0.4727, 0.0529]], [[-0.6783, -3.0703, -2.6994, ..., -0.5087, 0.1714, 0.6268]], [[-3.4721, -4.1418, -4.0045, ..., -2.9431, -2.6345, -2.2401]], ..., [[ 1.2673, -0.5364, -0.0415, ..., -1.5557, -0.3075, -1.2556]], [[-4.3622, -2.5725, -2.4691, ..., -0.8815, -0.8306, -0.7231]], [[-0.6317, -1.0075, -2.0726, ..., -3.0191, -1.8398, -0.4626]]], [[[-2.6254, -4.8987, -4.3333, ..., -0.2801, 2.1498, -0.3492]], [[-0.9138, -2.4043, -3.0196, ..., 1.6760, 1.1514, 0.5879]], [[-3.6663, -4.2611, -4.1332, ..., -2.4060, -2.8152, -2.6281]], ..., [[ 1.3379, -0.5001, 0.0065, ..., -0.9518, 0.2440, 0.1268]], [[-4.4359, -2.6173, -2.5014, ..., -0.8831, -0.8885, -0.8739]], [[-0.2488, -0.9981, -3.3896, ..., -0.1906, -2.0164, 3.0304]]], [[[-1.3768, -4.1672, -2.4185, ..., 1.0972, 0.7968, 0.2866]], [[-1.2877, -3.4431, -2.8287, ..., 0.0252, 0.2353, 0.6265]], [[-3.7143, -4.2741, -4.1625, ..., -2.8065, -2.6026, -2.2985]], ..., [[ 1.3509, -0.3800, 0.0636, ..., 0.3642, -1.3024, -1.1152]], [[-4.3939, -2.5835, -2.4644, ..., -1.1731, -0.3613, -0.6591]], [[-0.3822, -0.8641, -1.9941, ..., -0.9233, -1.7212, -0.1765]]]]) attn_weights tensor([[[[ -1.5908, -5.2378, -4.0687, ..., -2.3792, 0.3422, -1.2176]], [[ 1.6639, -1.5191, -1.3060, ..., -1.2255, -1.2498, -1.9181]], [[ -6.2208, -14.9019, -14.3591, ..., -3.9616, -2.6507, -4.9801]], ..., [[ -3.5331, -8.9881, -8.0933, ..., -1.9460, -2.5993, -2.8364]], [[ -1.9882, -3.7672, -3.7660, ..., -1.7972, -1.0878, -1.0201]], [[ -0.5776, -5.6298, -5.5217, ..., -2.9269, -2.6062, -2.5535]]], [[[ -0.8508, -4.6622, -3.0751, ..., -1.3987, -2.3714, -2.2298]], [[ 1.1436, -1.7191, -1.5285, ..., -2.9041, -1.8909, -1.6072]], [[ -5.4325, -15.6029, -13.4586, ..., -5.9918, -5.1924, -3.7566]], ..., [[ -3.1257, -8.3799, -7.8275, ..., -3.5788, -1.9913, -2.1099]], [[ -1.0256, -3.7672, -3.3215, ..., -1.8206, -1.1066, -1.3597]], [[ -0.2445, -5.2674, -4.7416, ..., -2.9769, -2.5359, -2.3554]]], [[[ -1.3133, -5.7628, -3.7996, ..., -2.8896, -1.8074, -2.6750]], [[ 1.4487, -0.4592, -1.6225, ..., -0.9316, -1.9863, -0.9787]], [[ -6.9550, -18.1130, -14.9956, ..., -4.9323, -3.3541, -3.5958]], ..., [[ -4.2583, -10.8878, -9.1094, ..., -1.7655, -1.8873, -3.4884]], [[ -1.7155, -3.8881, -3.6007, ..., -1.3980, -1.3716, -1.6234]], [[ -0.5500, -5.6070, -5.2097, ..., -2.8179, -2.8213, -2.8315]]], [[[ -1.6878, -5.6761, -5.0509, ..., -2.3542, -2.1453, -1.9865]], [[ 1.8484, -0.7110, -2.6330, ..., -0.8900, -3.2506, -2.8067]], [[ -8.2239, -18.9455, -18.8872, ..., -4.5778, -2.0256, -5.9161]], ..., [[ -5.2553, -10.9188, -11.6076, ..., -3.1194, -2.6634, -4.0054]], [[ -2.4367, -4.2455, -4.0216, ..., -1.9943, -1.2940, -1.4150]], [[ -0.5712, -5.7995, -5.4684, ..., -3.0589, -2.5372, -2.7679]]], [[[ -1.3743, -5.9900, -4.0235, ..., -1.8160, -1.4230, -2.4143]], [[ 2.1187, -1.0202, -1.2205, ..., -2.0671, -0.6304, -0.6516]], [[ -7.7535, -18.9687, -15.9226, ..., -5.3452, -4.3761, -4.4258]], ..., [[ -4.5217, -10.9057, -9.0593, ..., -3.1917, -0.5071, -3.5910]], [[ -1.4829, -3.6446, -3.4368, ..., -1.6184, -0.5420, -0.9861]], [[ -0.4992, -5.9254, -5.6648, ..., -3.2718, -2.5288, -2.7265]]]]) attn_weights tensor([[[[ 4.7961, -0.7999, -3.6184, ..., -0.5342, -3.0791, 1.8164]], [[ -2.6046, -7.5386, -7.5686, ..., -3.3245, -3.1283, -5.2998]], [[ -4.9167, -11.8322, -12.1600, ..., -5.7845, -3.1356, -5.9007]], ..., [[ -1.6731, -8.0784, -6.3480, ..., -3.5517, -2.6741, -2.5974]], [[ -1.0477, -6.6059, -5.9945, ..., -3.9399, -3.2803, -3.3839]], [[ -2.0269, -8.4819, -9.8882, ..., -3.8405, -2.4810, -3.8989]]], [[[ 3.8822, -0.7317, -1.3264, ..., -2.9335, -3.6427, -0.9614]], [[ -2.5386, -4.6535, -4.8255, ..., -4.8591, -5.4196, -3.7760]], [[ -4.3257, -7.0445, -7.6047, ..., -3.4168, -4.4462, -4.8148]], ..., [[ -2.0541, -4.3912, -4.2397, ..., -6.0802, -6.2997, -3.8977]], [[ -0.9973, -5.2919, -4.4769, ..., -3.5913, -2.7882, -2.6378]], [[ -2.5017, -6.2328, -6.4169, ..., -3.8603, -3.3330, -3.3580]]], [[[ 3.6324, -0.2002, -0.6610, ..., -2.2930, -2.9702, -0.6879]], [[ -2.7889, -7.1348, -5.5015, ..., -6.5645, -4.9782, -3.4264]], [[ -4.7629, -11.9867, -9.1303, ..., -6.5055, -4.5532, -5.5125]], ..., [[ -2.3023, -6.8628, -2.8021, ..., -5.5023, -5.8022, -3.3633]], [[ -1.1884, -6.4563, -5.1847, ..., -4.0158, -2.9049, -2.5759]], [[ -2.8683, -7.6946, -7.8368, ..., -3.2435, -2.3289, -3.6732]]], [[[ 3.6064, -1.4285, -2.3922, ..., -1.4769, -1.6384, 0.9126]], [[ -2.8753, -9.2612, -8.9102, ..., -3.8036, -5.4147, -4.6006]], [[ -4.3553, -12.6406, -14.3943, ..., -3.8795, -3.1141, -4.9308]], ..., [[ -1.5420, -7.4423, -8.7732, ..., -3.4792, -3.4569, -3.1861]], [[ -1.0806, -5.7526, -6.5614, ..., -3.4109, -3.1083, -2.2863]], [[ -2.5722, -9.0943, -10.3031, ..., -4.2293, -4.7376, -4.3553]]], [[[ 4.5276, -0.3525, -0.7196, ..., -1.3506, -2.5344, -1.2730]], [[ -2.4144, -8.5981, -6.8238, ..., -5.0458, -5.4168, -3.8442]], [[ -5.2015, -13.2770, -10.7326, ..., -3.5834, -4.4385, -5.5733]], ..., [[ -1.9054, -7.9088, -4.3705, ..., -2.8433, -0.1346, -2.6441]], [[ -0.9956, -6.4575, -5.7247, ..., -4.0153, -3.6672, -2.9545]], [[ -2.6716, -8.5085, -9.4821, ..., -2.1141, 1.5882, -2.5561]]]]) attn_weights tensor([[[[ -1.9707, -10.0948, -9.6920, ..., -5.3290, -4.2716, -4.6470]], [[ -2.0955, -8.4479, -9.3748, ..., -3.7302, -0.9883, -4.8418]], [[ 0.2255, -1.5061, -2.1828, ..., -1.4176, -1.9302, -2.3725]], ..., [[ -0.7366, -5.6185, -6.5850, ..., -3.5478, -3.2646, -4.1756]], [[ 1.5114, -1.7934, -1.4185, ..., -1.4911, -0.8207, -0.6001]], [[-10.1060, -23.3716, -18.7519, ..., -3.6999, 12.5437, -0.9598]]], [[[ -2.1402, -9.2475, -9.0514, ..., -2.7072, -3.6008, -4.4921]], [[ -1.6604, -6.0820, -7.3049, ..., -4.4361, -3.8524, -3.4783]], [[ 0.1642, -2.0174, -2.3470, ..., -3.6296, -2.7133, -1.9413]], ..., [[ -1.3913, -3.9679, -3.6773, ..., -1.4509, -3.0511, -3.6330]], [[ 1.3340, -1.9242, -2.8092, ..., -3.3061, -5.1704, -1.7648]], [[ -7.3952, -24.7773, -29.4061, ..., 5.0720, 12.7557, -4.7670]]], [[[ -3.4436, -10.7463, -9.7355, ..., -4.6164, -5.3299, -5.0683]], [[ -2.4363, -8.9300, -8.3920, ..., -4.8733, -4.4126, -4.3443]], [[ -0.3670, -2.7136, -3.3365, ..., -4.3391, -4.2332, -3.1250]], ..., [[ -1.6749, -5.6019, -4.7596, ..., -2.0588, -1.5846, -3.4463]], [[ 1.2039, -1.9526, -3.0441, ..., -2.6739, -3.8044, -2.1536]], [[ -6.9133, -38.2439, -42.2245, ..., 1.9307, 10.5055, -6.8148]]], [[[ -3.0248, -11.5363, -11.6194, ..., -5.8425, -4.6892, -4.7827]], [[ -3.1143, -7.8843, -8.6141, ..., 0.7605, -0.8855, -1.6721]], [[ -0.3730, -3.3517, -4.2562, ..., -2.7456, -3.8402, -3.9183]], ..., [[ -1.3929, -5.3096, -6.8539, ..., -2.8587, -3.0554, -3.8770]], [[ 1.2526, -3.0004, -3.6672, ..., -2.1257, -2.2899, -3.3733]], [[ -4.5397, -35.5265, -25.6192, ..., 0.8826, 15.9492, 4.8152]]], [[[ -1.9971, -10.6257, -10.3532, ..., -4.8011, -3.1502, -4.4569]], [[ -1.4712, -8.4863, -8.6285, ..., -3.6097, -1.4740, -2.7993]], [[ 0.5312, -3.8085, -3.4424, ..., -3.6525, -0.8126, -1.9959]], ..., [[ -0.7231, -5.8803, -6.9474, ..., -2.1811, 0.1653, -3.3864]], [[ 1.6753, -2.6157, -1.8419, ..., -2.5059, -3.1667, -1.2785]], [[ -6.3276, -29.5347, -32.2082, ..., -16.1991, 9.9747, -2.2810]]]]) attn_weights tensor([[[[ 2.1966, -3.7591, -3.1901, ..., -3.9410, -3.2013, -3.1878]], [[ 4.5147, -7.1046, -7.2026, ..., -8.0315, -5.6806, -3.9555]], [[ 0.6915, -4.1187, -5.2975, ..., -2.3304, -2.7524, -3.5517]], ..., [[ 0.9940, -3.6908, -3.8971, ..., -3.3093, -2.8314, -4.9726]], [[ 2.4631, -0.3993, -1.1954, ..., 0.1234, -0.5426, -0.3167]], [[ 1.0548, -4.5131, -4.1131, ..., -2.6387, -1.9789, -1.2502]]], [[[ 2.6024, -6.1534, -4.6833, ..., -3.7153, -5.4897, -2.0539]], [[ 3.8150, -12.7311, -7.7295, ..., -6.9635, -7.1602, -3.5128]], [[ 0.0430, -2.4340, -2.8604, ..., -2.2686, -3.1999, -3.5997]], ..., [[ 1.1884, -3.1199, -2.9168, ..., -2.9655, -3.7358, -1.5517]], [[ 1.9229, -0.8871, -1.1365, ..., -0.1706, -0.6394, -0.0560]], [[ 1.2601, -3.2392, -2.6023, ..., -2.3771, -5.0023, -0.2718]]], [[[ 2.5915, -7.7752, -2.5507, ..., -0.7319, -1.4241, -1.2828]], [[ 4.4452, -14.5453, -4.4181, ..., -4.4637, -5.4108, -2.4367]], [[ -0.2796, -4.8962, -4.1695, ..., -2.3431, -1.0789, -3.7736]], ..., [[ 1.0278, -3.4575, -3.3824, ..., -3.0180, -3.2073, -2.6537]], [[ 1.6371, -1.1731, -1.7411, ..., 0.2445, -0.4839, -0.8982]], [[ 0.9991, -3.1755, -3.2790, ..., -2.4383, -1.9377, -0.2431]]], [[[ 2.1602, -4.7961, -5.5652, ..., -0.4001, -1.6783, -1.2074]], [[ 4.2978, -12.8325, -9.2975, ..., -6.3245, -3.1390, 1.5271]], [[ 0.3856, -4.9424, -6.7455, ..., -1.7097, -2.0428, -4.2727]], ..., [[ 0.5874, -3.5546, -3.6916, ..., -1.4257, -2.1948, -1.8475]], [[ 1.0217, -1.7652, -4.7759, ..., -0.4352, -1.7132, -2.0659]], [[ 1.0055, -3.8583, -4.1057, ..., -2.2125, -0.7873, 1.8704]]], [[[ 2.9148, -5.6544, -1.8119, ..., -2.8007, -3.6966, -3.5981]], [[ 4.6995, -12.3512, -2.5804, ..., -7.5873, -6.3754, -2.4935]], [[ 0.6970, -4.3182, -5.1227, ..., -1.1546, -0.4676, -3.1862]], ..., [[ 1.1357, -3.6893, -2.9577, ..., -3.9338, -4.3697, -4.2295]], [[ 2.0645, -2.5554, -3.8262, ..., -2.6566, -1.3428, -2.3779]], [[ 1.1190, -2.4821, -2.8066, ..., -3.0010, -2.2350, -0.0918]]]]) attn_weights tensor([[[[-0.4405, -4.8694, -4.9234, ..., -3.5869, -2.4301, -2.8355]], [[ 0.4470, -4.3880, -5.6024, ..., -3.6797, -3.5490, -3.1775]], [[ 0.4217, -2.8471, -2.8841, ..., -1.8916, -3.0692, -2.6876]], ..., [[ 4.7271, -5.9179, -6.5985, ..., -2.9668, -4.8753, -3.5056]], [[ 2.5461, -2.9918, -1.9471, ..., -0.8138, -2.1576, -0.9532]], [[ 0.4185, -4.0792, -5.8050, ..., -4.5777, -1.3675, 0.0383]]], [[[-0.3600, -3.3482, -2.3775, ..., -5.5049, -5.6745, -4.4936]], [[-0.0388, -3.0033, -4.1600, ..., -4.7421, -4.4928, -2.8777]], [[ 0.3514, -2.6069, -2.6084, ..., -2.7816, -3.7392, -2.2347]], ..., [[ 4.2871, -8.2321, -3.3272, ..., -4.1357, -2.8492, -2.3248]], [[ 2.6747, -2.3588, -2.5117, ..., -1.9192, -1.5272, -0.5527]], [[ 0.1984, -2.1318, -4.5004, ..., -4.1337, -2.0487, -4.5100]]], [[[-1.2486, -4.3576, -4.1224, ..., -3.3290, -3.4191, -4.3120]], [[-0.5386, -5.0995, -5.3093, ..., -3.3230, -3.0544, -3.9816]], [[ 0.1902, -2.9565, -2.5394, ..., -4.4138, -4.4112, -2.9225]], ..., [[ 3.6138, -9.4380, -1.6790, ..., -2.6365, -2.3190, -1.8450]], [[ 2.8629, -2.1099, -0.3196, ..., -1.9622, -1.5313, -0.9128]], [[-0.3439, -3.9454, -5.3090, ..., -2.9132, -1.6850, -3.0379]]], [[[-1.1274, -6.9271, -6.8333, ..., -3.7954, -1.5055, -2.9378]], [[-1.5763, -6.1556, -5.4972, ..., -1.8654, -1.6531, -3.0790]], [[ 0.2200, -2.9728, -3.1347, ..., -2.7629, -3.3801, -3.7501]], ..., [[ 3.5407, -9.3331, -7.6643, ..., -5.9769, -4.9240, -1.4550]], [[ 3.3681, -4.5978, -2.9792, ..., -2.0954, -1.5231, -1.2871]], [[-0.6132, -4.9293, -6.1621, ..., -1.1912, -0.5041, -1.6218]]], [[[-0.0916, -6.3813, -5.9774, ..., -4.4917, -3.0827, -5.0130]], [[ 0.9817, -5.0803, -5.2196, ..., -4.6282, -4.1920, -4.5794]], [[ 0.3911, -3.6123, -3.9932, ..., -3.0554, -1.5359, -1.2453]], ..., [[ 4.5316, -7.3420, -1.2383, ..., -4.9899, -3.4670, 0.0974]], [[ 2.8906, -3.5782, -2.4273, ..., -2.8431, -1.4911, -0.7990]], [[ 0.0906, -4.3133, -6.6372, ..., -3.2697, 0.4887, -2.0668]]]]) attn_weights tensor([[[[-5.5201e-01, -6.5341e+00, -6.6231e+00, ..., -4.1849e+00, -1.8090e+00, -3.9113e+00]], [[ 3.7062e+00, 6.9129e-01, -2.0016e-01, ..., 2.2354e+00, -4.9350e-03, -4.7435e-01]], [[ 6.6490e+00, -3.5143e-01, -1.2251e+00, ..., -1.7710e+00, -1.4264e+00, 1.0509e+00]], ..., [[ 7.2995e-01, -3.5766e+00, -3.8355e+00, ..., -1.5611e+00, -2.9611e-01, -2.2371e+00]], [[ 5.0514e+00, -2.8897e+00, -3.5158e+00, ..., -1.8317e+00, -2.7819e+00, -2.6408e+00]], [[ 2.9914e+00, -1.5605e+00, -3.5943e+00, ..., -9.6871e-01, -2.7379e+00, -1.5851e+00]]], [[[-4.5586e-03, -7.8051e+00, -7.2475e+00, ..., -4.8249e+00, -3.3789e+00, -5.3930e+00]], [[ 3.1345e+00, -2.7968e+00, -1.6493e+00, ..., -1.5528e+00, 3.3163e-02, 5.2202e-01]], [[ 5.7865e+00, -3.7107e+00, -1.8660e+00, ..., -1.9726e-01, -1.7814e+00, -5.3672e-01]], ..., [[ 9.6241e-01, -2.9865e+00, -3.8202e+00, ..., -7.2946e+00, -5.3474e+00, -2.1885e+00]], [[ 3.9931e+00, -4.5296e+00, -2.1106e+00, ..., -2.4105e+00, -1.1236e+00, -1.7000e+00]], [[ 3.0131e+00, -3.7623e+00, -2.2971e+00, ..., -3.2866e+00, -5.1230e+00, -7.7269e-01]]], [[[-1.9988e-01, -1.0223e+01, -8.9732e+00, ..., -3.9541e+00, -3.7584e+00, -6.4914e+00]], [[ 3.2985e+00, -2.2658e+00, -6.8710e-01, ..., -7.2194e-01, 6.5496e-01, 8.5778e-01]], [[ 6.1846e+00, -6.3347e+00, -1.6163e+00, ..., -1.4970e+00, 1.3283e+00, -5.4237e-01]], ..., [[ 5.1687e-01, -1.9805e+00, -2.5557e+00, ..., -3.0315e+00, -3.9948e+00, -2.2222e+00]], [[ 3.7579e+00, -5.4080e+00, -1.0298e+00, ..., -2.5548e+00, -1.3250e+00, -2.3788e+00]], [[ 3.2755e+00, -4.2474e+00, -2.4552e-01, ..., -2.6912e+00, -1.2840e+00, -8.6079e-01]]], [[[-5.6951e-01, -7.5396e+00, -6.9155e+00, ..., -3.0404e+00, -2.6896e+00, -4.7360e+00]], [[ 1.7873e+00, -3.2088e+00, -3.6208e+00, ..., -3.4487e+00, -2.6937e+00, -3.5179e+00]], [[ 5.9648e+00, -6.6071e+00, -3.9551e+00, ..., -6.7104e+00, -4.2474e+00, -1.7289e+00]], ..., [[-4.5230e-01, -3.3649e+00, -3.9454e+00, ..., -7.9847e-01, -8.1986e-01, -2.2904e+00]], [[ 1.3656e+00, -4.9257e+00, -3.8517e+00, ..., -4.2114e+00, -3.1167e+00, -4.0809e+00]], [[ 2.0914e+00, -2.3478e+00, -2.5940e+00, ..., -3.4868e+00, -2.7977e+00, -1.6449e+00]]], [[[-2.3942e-01, -8.3599e+00, -8.3863e+00, ..., -5.9258e+00, -3.3035e+00, -4.8425e+00]], [[ 2.7456e+00, -2.4840e+00, -2.8631e+00, ..., -2.1956e+00, -1.9411e+00, -9.3104e-01]], [[ 6.2414e+00, -4.3733e+00, -8.0496e-01, ..., 1.6262e-01, 1.1996e-01, -4.9354e-01]], ..., [[ 6.2722e-01, -5.2565e+00, -5.0872e+00, ..., -1.8886e+00, -1.1764e+00, -1.2474e+00]], [[ 4.0150e+00, -4.4468e+00, -2.3099e+00, ..., -2.0308e+00, -2.2694e+00, -1.0870e+00]], [[ 3.1554e+00, -3.5627e+00, -1.1648e+00, ..., -3.0638e+00, -3.2645e+00, -1.6638e+00]]]]) attn_weights tensor([[[[ 1.3826, -1.0584, -2.0074, ..., -0.5629, -2.9018, -1.4997]], [[ 5.4184, 1.3183, 1.8679, ..., -0.5396, 0.2792, 0.6233]], [[ 1.5381, -0.2717, -1.0253, ..., 1.2738, -0.2701, -0.6352]], ..., [[ 1.3595, -2.5925, -2.2383, ..., -0.9610, -1.3882, -1.7675]], [[ 1.5795, -2.1408, -2.0065, ..., -0.5597, -1.5414, -1.0709]], [[ 1.3135, -2.9775, -3.1765, ..., -3.2021, -3.5710, -4.0277]]], [[[ 1.4662, -1.9960, -2.3046, ..., -2.7178, -4.1714, -1.9495]], [[ 3.9862, -1.9820, -0.9535, ..., -2.5717, -1.4512, -1.1279]], [[ 1.8748, 0.0146, -0.7893, ..., -1.8870, -0.9596, 0.7942]], ..., [[ 1.0806, -2.7485, -2.3922, ..., -2.7672, -1.8615, -0.7662]], [[ 1.1585, -1.8317, -1.5145, ..., -2.1564, -2.6574, -0.9510]], [[ 0.8589, -2.8027, -2.6579, ..., -4.6331, -4.9377, -2.3616]]], [[[ 1.4244, -3.8498, -2.6650, ..., -4.4465, -2.3309, -2.9047]], [[ 3.9358, -2.1943, -0.3795, ..., -1.5418, -1.1959, -1.0438]], [[ 2.0345, -0.5292, -1.2815, ..., -1.4044, -1.3659, -0.0207]], ..., [[ 0.9378, -3.4774, -2.6144, ..., -1.5235, -0.7838, -1.3384]], [[ 1.0641, -2.4366, -1.8080, ..., -1.7873, -1.0525, -1.2788]], [[ 0.8212, -2.6816, -3.7105, ..., -3.4036, -4.3304, -3.9700]]], [[[ 0.8777, -3.5952, -2.7012, ..., -3.8679, -1.8394, -1.2841]], [[ 2.6754, -3.8783, -2.5534, ..., -4.7407, -3.0823, -0.8111]], [[ 1.8323, -1.5065, -1.1753, ..., -1.2641, -1.2199, -3.2934]], ..., [[ 0.8441, -4.3575, -3.2443, ..., -2.4281, -2.6879, -2.5604]], [[ 1.0141, -3.8096, -3.5107, ..., -1.6596, -1.8138, -1.2544]], [[ 0.4750, -3.5137, -4.0492, ..., -4.7071, -3.7949, -4.4307]]], [[[ 1.2779, -3.9583, -3.3269, ..., -3.9055, -1.5638, -0.8965]], [[ 4.3559, -2.9528, -0.4603, ..., -0.3609, -0.8252, 0.5666]], [[ 1.6819, -2.1178, -1.7636, ..., -1.8442, -0.7544, -0.2328]], ..., [[ 1.1513, -3.9703, -2.8900, ..., -3.1568, -3.5861, -1.9266]], [[ 1.1078, -3.6939, -2.6009, ..., -1.2960, -2.0094, -0.5932]], [[ 0.9196, -3.0196, -2.8807, ..., -3.7911, -4.1946, -3.6063]]]]) attn_weights tensor([[[[ 2.2273, -1.0444, -2.4204, ..., -0.7315, -1.7007, -1.8561]], [[ 5.1836, 1.0557, -0.3086, ..., -0.2084, -0.6849, -0.0454]], [[ 2.7437, -2.6432, -1.7615, ..., -0.5986, -2.3431, -4.0956]], ..., [[ 4.2313, -1.3084, -2.5555, ..., -1.7195, -2.9309, -3.8265]], [[ 1.4753, -4.3899, -3.2873, ..., -2.1962, 0.0069, -1.1943]], [[ 3.8737, 0.0536, -1.2701, ..., -0.6086, -1.3924, -0.6849]]], [[[ 1.8007, -1.0817, -2.2591, ..., -4.4379, -2.4357, -1.5302]], [[ 2.9078, -1.0315, -1.5201, ..., -1.3750, -0.2007, -0.5402]], [[ 1.4083, -2.9733, -2.5513, ..., -3.3788, -2.4568, -1.1510]], ..., [[ 2.7724, -2.8137, -2.8110, ..., -3.9373, -1.5105, -2.0583]], [[ 1.2023, -3.0374, -3.0565, ..., -4.1854, -1.6772, -0.9887]], [[ 3.7624, -0.5884, -1.3234, ..., -4.0544, -3.4209, -1.3960]]], [[[ 2.0360, -3.2664, -3.0499, ..., -0.3729, -1.8681, -3.3853]], [[ 3.6486, -1.4586, -2.1873, ..., -2.1637, -1.1852, -0.8092]], [[ 2.4003, -3.1279, -2.4310, ..., -0.5394, -0.6098, -1.2938]], ..., [[ 4.2609, -2.3990, -2.7815, ..., -0.8859, -0.7969, -3.1316]], [[ 0.6881, -4.3950, -4.4463, ..., -0.3424, -0.1010, -2.0469]], [[ 3.9846, -1.9652, -0.3586, ..., -2.3568, -1.5145, -1.2617]]], [[[ 0.9736, -3.3186, -3.7761, ..., -5.2187, -3.1744, -4.0358]], [[ 2.4455, -3.4507, -2.5045, ..., -4.2931, -1.6177, -0.9534]], [[ 0.5913, -3.5788, -3.8622, ..., -2.8640, -3.0749, -3.0989]], ..., [[ 3.0391, -3.5375, -2.1225, ..., -5.0205, -2.4886, -2.4524]], [[ 0.6924, -4.2643, -3.6774, ..., -1.6971, 0.2747, -2.1057]], [[ 3.0474, -1.1269, -1.7331, ..., -4.1523, -3.7371, -1.9736]]], [[[ 2.1029, -3.6197, -4.2423, ..., -3.7066, -3.1143, -3.6043]], [[ 3.4060, -1.9253, -2.6507, ..., -1.1615, -2.3513, -0.7648]], [[ 1.3174, -3.8855, -3.4584, ..., -3.0888, -4.1579, -3.5696]], ..., [[ 2.5969, -2.5221, -2.1425, ..., -1.7256, -2.5781, -3.0300]], [[ 2.1635, -5.6641, -6.0568, ..., -2.8656, -0.3322, -2.0319]], [[ 3.8869, -0.9189, -1.5844, ..., -0.7627, -1.1497, -0.7339]]]]) attn_weights tensor([[[[ 2.9871, -3.0753, -3.3936, ..., -2.9974, -3.5821, -3.3753]], [[ 4.2252, -2.0790, -2.3440, ..., -1.2464, -2.2317, -2.0113]], [[ 3.2511, -0.6976, -1.4655, ..., 0.1368, -0.5429, -1.8979]], ..., [[ 0.9550, -2.9401, -3.2570, ..., -0.7436, -0.8309, -1.9729]], [[ 3.4592, -1.8888, -0.7299, ..., -2.2490, -1.3988, -2.6656]], [[ 3.7138, -0.1034, -0.8356, ..., 0.5093, -0.3113, -0.0972]]], [[[ 1.9863, -3.0895, -3.9679, ..., -4.3584, -3.5147, -1.7969]], [[ 2.8898, -1.6841, -2.4814, ..., -3.1505, -0.7709, -0.8789]], [[ 2.4762, -0.6921, -1.2957, ..., -3.9488, -2.8153, -0.5049]], ..., [[ 0.8551, -3.1102, -1.6116, ..., -5.1404, -3.4917, -1.0598]], [[ 2.7387, -2.7254, -1.9719, ..., -4.2036, -3.2330, -2.3881]], [[ 2.5232, -1.5642, -1.9446, ..., -2.5760, -1.4216, -0.5914]]], [[[ 2.7916, -2.7907, -3.7804, ..., -1.2188, -2.9081, -3.4741]], [[ 3.7194, -0.9669, -1.8826, ..., -1.1700, -0.0413, -1.3237]], [[ 2.7092, -0.0633, -0.8179, ..., -1.0675, -1.6175, -1.5945]], ..., [[ 0.5297, -3.4391, -2.6088, ..., -1.1036, -1.4047, -1.7148]], [[ 3.1356, -1.5284, -1.4920, ..., -1.7442, -2.5830, -2.1769]], [[ 3.2134, -2.2272, -2.3918, ..., -1.0857, -1.5035, -1.9667]]], [[[ 1.8109, -3.5399, -3.3514, ..., -4.8192, -4.6976, -4.3317]], [[ 3.4345, -3.0292, -3.2467, ..., -3.3326, -4.0705, -0.6606]], [[ 2.4981, -1.5052, -1.1090, ..., -1.8566, -1.9153, -2.4431]], ..., [[-0.2917, -2.6806, -4.1867, ..., -0.6431, -1.0178, -1.1105]], [[ 2.5533, -2.3419, -1.1937, ..., -2.8326, -1.6923, -1.1796]], [[ 2.2508, -2.3183, -2.1266, ..., -1.4135, -1.2726, -0.3615]]], [[[ 2.1426, -3.4944, -4.0431, ..., -2.9548, -3.3830, -3.5332]], [[ 2.8399, -2.3016, -3.8822, ..., -1.8014, -0.6105, -2.0347]], [[ 3.0156, -2.1553, -2.3543, ..., -1.6377, -2.2877, -1.7544]], ..., [[ 0.6871, -3.7903, -3.3470, ..., -1.7142, -1.0001, -0.3022]], [[ 2.7486, -2.2230, -1.4926, ..., -1.3189, -2.1367, -2.3841]], [[ 2.4898, -1.4483, -1.5061, ..., -1.4495, -1.5864, -0.2012]]]]) attn_weights tensor([[[[ 1.1520, 1.5052, 1.1152, ..., 0.5589, 2.4909, 1.0958]], [[ 3.3539, 0.7913, 0.2146, ..., 0.7372, -0.2808, -0.8056]], [[ 3.0650, 0.3441, -1.6058, ..., 0.1449, -1.4086, -1.8378]], ..., [[ 3.9033, 0.1807, -1.2020, ..., -0.4790, -0.4490, 0.2715]], [[ 3.3374, 2.0205, 1.0507, ..., 1.6906, 1.3920, 0.2920]], [[ 2.7511, 1.9310, 0.0082, ..., 2.0690, 1.5210, -1.1127]]], [[[ 2.4479, 2.0133, 0.8632, ..., -1.4159, 0.5864, 2.8644]], [[ 3.0384, -0.5070, -1.2706, ..., -1.5384, -0.8511, 0.9301]], [[ 2.7021, -0.1412, -1.9571, ..., -2.9912, -2.8926, 0.6056]], ..., [[ 3.1757, -0.8185, -2.0073, ..., -2.7114, -0.0481, -0.2779]], [[ 3.2306, 1.3570, 0.5293, ..., 0.0918, -0.8669, 2.3126]], [[ 2.9633, 0.6648, -0.9052, ..., -0.6282, -0.5076, -0.2398]]], [[[ 1.2905, 1.2983, 0.8965, ..., -0.3419, 1.0271, 0.7706]], [[ 2.8505, 0.0215, -0.5552, ..., -0.6090, -1.0286, -0.8934]], [[ 2.9514, -0.2114, -1.5498, ..., -0.8892, -2.3885, -1.4281]], ..., [[ 3.9510, -0.2430, -1.0573, ..., -0.3800, -0.1587, -0.8334]], [[ 2.9827, 0.5092, -0.1378, ..., -0.9649, -0.3301, 0.5458]], [[ 2.5045, -0.2628, -1.2016, ..., 0.3420, -0.1521, -0.1806]]], [[[ 1.1247, 1.5605, 1.3781, ..., 1.0712, 1.2937, 1.8644]], [[ 2.8890, 0.3348, -0.6074, ..., 0.2024, -1.3422, -0.0748]], [[ 2.4119, -0.3667, -1.4811, ..., -2.4279, -3.6759, -2.2044]], ..., [[ 3.6590, -1.9513, -3.2356, ..., -2.8000, -3.4241, -1.9827]], [[ 2.1073, 0.1150, -1.0504, ..., -0.3682, -1.8102, 0.1249]], [[ 1.9716, -0.2873, -2.3935, ..., -0.2048, -1.8717, -0.5789]]], [[[ 1.9218, 0.2133, -0.4729, ..., 0.2481, 0.8745, 0.8979]], [[ 3.3157, -0.1493, -0.8993, ..., 0.4827, -1.0917, 0.2677]], [[ 2.8214, -0.7595, -1.4271, ..., -0.4561, -1.0977, -0.0829]], ..., [[ 3.3886, -1.4899, -2.9372, ..., -1.7402, -0.7569, -1.4374]], [[ 2.9806, 0.3614, -1.3861, ..., 0.3053, 0.3997, 2.2998]], [[ 3.1494, -0.8255, -2.4128, ..., 0.4074, -0.1830, 0.9643]]]]) attn_weights tensor([[[[-1.6767, -5.1103, -2.6044, ..., -0.5220, -3.2475, -4.8470]], [[-3.3622, 2.3377, -3.7257, ..., -4.4396, -7.6351, 3.5352]], [[-2.3661, -1.2652, -3.0675, ..., -2.4037, -3.9522, -0.8187]], ..., [[-1.8588, -2.2504, -2.2559, ..., -1.7944, -2.3564, -2.0604]], [[-0.5288, -0.6522, -0.8255, ..., -0.4552, -0.9928, -0.3053]], [[-1.5693, -2.2859, -3.6153, ..., -2.6211, -2.5377, -2.2813]]], [[[-0.8410, -2.6019, -1.6409, ..., -1.4925, -2.7665, -1.4224]], [[-0.0849, 0.2221, 2.3913, ..., 0.1429, -1.6406, 9.3258]], [[-1.7556, -2.4151, -1.9010, ..., -2.2121, -1.4743, -1.3028]], ..., [[-1.9819, -2.3206, -2.1871, ..., -2.5287, -1.9063, -1.7020]], [[-0.1259, -0.2419, -0.1893, ..., -1.0414, -0.0488, 1.3920]], [[-1.7276, -2.5150, -3.6927, ..., -2.5281, -2.1860, -3.6589]]], [[[-0.9603, -3.5585, -0.9852, ..., -1.5925, -3.1978, -2.2713]], [[-1.1210, 1.6760, 1.5326, ..., 2.3324, 1.0266, 8.3293]], [[-2.5879, -2.6791, -3.0088, ..., -1.9451, -2.4822, -1.7652]], ..., [[-2.0106, -2.3939, -2.2998, ..., -2.0537, -2.1660, -2.0136]], [[-0.1536, -0.4620, -0.3498, ..., -0.2439, -0.2169, 0.6203]], [[-1.1958, -2.0337, -3.3214, ..., -1.4436, -2.2217, -1.9484]]], [[[-0.9203, -2.6159, -2.3042, ..., -2.3012, -2.5904, -3.7187]], [[ 3.1004, 1.7944, 6.7408, ..., 2.1325, -1.6293, 8.3422]], [[-1.1815, -2.0091, -2.2909, ..., -2.2091, -1.3155, -2.5920]], ..., [[-2.0435, -2.3524, -2.6856, ..., -2.3746, -2.2399, -2.5961]], [[ 0.6349, -0.0568, 1.2389, ..., -0.0469, 0.0416, 1.4899]], [[-1.4494, -2.3724, -3.7794, ..., -3.2266, -2.7516, -3.4964]]], [[[-0.5677, -2.9261, -2.1955, ..., -0.6153, -2.8657, -1.7724]], [[ 1.8251, 1.0984, 5.8694, ..., -1.3102, 0.7651, 6.3631]], [[-1.4946, -2.2749, -2.1736, ..., -2.3293, -2.2864, -2.0939]], ..., [[-1.8821, -2.2490, -2.5317, ..., -2.4326, -2.0357, -2.3018]], [[ 0.7418, -0.0428, 1.3883, ..., -0.5941, -0.0691, 1.6155]], [[-1.6939, -2.4654, -3.8051, ..., -1.6107, -2.4317, -4.0495]]]]) attn_weights tensor([[[[-1.4191e+00, -4.4606e+00, -2.5138e+00, ..., 8.4344e-01, 1.6377e+00, 1.8289e-01]], [[-1.3587e+00, -3.6317e+00, -2.8615e+00, ..., 5.4655e-01, 6.1358e-02, 3.0741e-01]], [[-3.6819e+00, -4.2233e+00, -4.1345e+00, ..., -2.7254e+00, -2.7673e+00, -2.2143e+00]], ..., [[ 1.0862e+00, -5.5233e-01, -6.3702e-02, ..., -4.9625e-02, -3.0152e-01, -1.1355e+00]], [[-4.2197e+00, -2.6220e+00, -2.5057e+00, ..., -7.4485e-01, -8.3654e-01, -6.2607e-01]], [[-3.8744e-01, -8.5269e-01, -2.1517e+00, ..., 1.4314e-01, -1.4600e+00, -1.7161e-01]]], [[[ 8.2943e-01, -1.2902e+00, -2.0257e+00, ..., 6.3669e-01, 2.1280e+00, 1.0929e+00]], [[-1.0073e+00, -2.4510e+00, -2.9220e+00, ..., -2.0328e-01, 2.2538e+00, 7.0589e-01]], [[-3.7601e+00, -4.2827e+00, -4.1941e+00, ..., -3.1428e+00, -2.4617e+00, -2.4475e+00]], ..., [[ 1.3239e+00, -4.0024e-01, 1.2761e-01, ..., -7.2651e-01, -8.3592e-01, 3.2306e-01]], [[-4.5516e+00, -2.6796e+00, -2.5486e+00, ..., -1.0395e+00, -6.2642e-01, -6.2356e-01]], [[ 1.2140e+00, 1.1779e-01, -1.4358e+00, ..., -3.4623e+00, 1.1373e+00, 3.9567e+00]]], [[[-1.8896e+00, -4.8230e+00, -3.6033e+00, ..., -1.0286e+00, -5.7157e-01, -5.7062e-01]], [[-1.3365e+00, -2.7933e+00, -3.1829e+00, ..., -2.5335e-01, 1.2035e+00, 5.4871e-01]], [[-3.5549e+00, -4.2228e+00, -4.0257e+00, ..., -2.8075e+00, -2.4329e+00, -2.3236e+00]], ..., [[ 1.2771e+00, -5.0911e-01, 2.7158e-01, ..., -3.3080e-01, -1.0578e+00, -2.5422e-01]], [[-4.3640e+00, -2.5745e+00, -2.4354e+00, ..., -9.3665e-01, -8.2808e-01, -5.2309e-01]], [[ 7.0052e-01, 2.7814e-01, -1.8948e+00, ..., -8.3422e-01, 6.9142e-01, 3.8371e+00]]], [[[-1.8238e+00, -4.1226e+00, -4.4853e+00, ..., 1.2599e+00, 1.2951e+00, -7.6913e-01]], [[-1.3627e+00, -2.8980e+00, -3.6771e+00, ..., 3.8818e-01, 1.2698e+00, 3.2493e-01]], [[-3.8822e+00, -4.3919e+00, -4.3160e+00, ..., -2.9403e+00, -2.8108e+00, -2.6206e+00]], ..., [[ 1.0814e+00, -5.4425e-01, 1.6891e-01, ..., -3.7508e-03, 2.9111e-01, -3.3617e-01]], [[-4.0899e+00, -2.6981e+00, -2.5412e+00, ..., -9.4551e-01, -9.6163e-01, -6.4851e-01]], [[-1.4536e+00, -1.0944e+00, -3.8758e-01, ..., -1.8325e+00, -2.8269e+00, 2.2800e+00]]], [[[-7.3930e-01, -3.2815e+00, -3.5616e+00, ..., 5.4094e-01, 9.5683e-01, 8.4961e-01]], [[-1.4794e+00, -2.8362e+00, -3.8716e+00, ..., 6.4322e-03, 1.6389e+00, 3.1560e-01]], [[-3.9097e+00, -4.4264e+00, -4.3206e+00, ..., -2.7462e+00, -2.4735e+00, -2.6120e+00]], ..., [[ 1.1046e+00, -6.3080e-01, -5.1164e-02, ..., -1.3234e+00, -1.0311e+00, -1.8120e-01]], [[-4.2381e+00, -2.7233e+00, -2.5601e+00, ..., -4.8721e-01, -7.7049e-01, -7.8003e-01]], [[-1.2357e+00, -1.0029e+00, 1.2769e+00, ..., -3.9133e+00, 2.0474e-02, 2.9208e+00]]]]) attn_weights tensor([[[[ -1.3827, -6.1666, -4.3563, ..., -1.4556, -0.5251, -2.6055]], [[ 1.7316, -0.7393, -1.5313, ..., -1.1507, -1.3680, -0.7357]], [[ -7.8104, -18.8652, -15.8152, ..., -4.1079, -2.4030, -3.9348]], ..., [[ -4.4573, -11.0471, -9.1521, ..., -3.8397, -2.0590, -3.5755]], [[ -1.6236, -3.8169, -3.5605, ..., -0.9604, -0.8953, -1.0904]], [[ -0.5462, -6.0497, -5.7094, ..., -2.7763, -2.6166, -2.7032]]], [[[ -1.2771, -4.7491, -3.7555, ..., -3.6641, -1.9544, -0.5222]], [[ 1.3862, -1.1700, -0.5408, ..., -1.8880, -1.3964, -1.4556]], [[ -5.4251, -14.0975, -15.0598, ..., -6.6088, -2.1723, -5.1150]], ..., [[ -2.8995, -8.2701, -8.2015, ..., -3.2075, -1.5039, -3.2411]], [[ -1.4749, -3.5797, -3.5731, ..., -1.3712, -1.5529, -1.3433]], [[ -0.5027, -5.5503, -5.3983, ..., -2.8607, -2.5471, -2.7684]]], [[[ -1.2160, -4.9701, -3.7169, ..., -1.0878, -2.5009, -1.2678]], [[ 1.3934, -0.4327, -2.0316, ..., -1.6848, -0.9561, -2.1324]], [[ -5.9566, -15.6612, -14.4495, ..., -6.1380, -2.3942, -3.8710]], ..., [[ -3.7003, -9.0955, -7.8491, ..., -2.4732, -2.4365, -3.1016]], [[ -1.8063, -3.8342, -3.5932, ..., -1.5324, -1.6265, -1.3881]], [[ -0.3984, -5.1195, -4.9462, ..., -2.8699, -2.6888, -2.7183]]], [[[ -1.8234, -5.7874, -5.1000, ..., -1.9292, -1.9175, -1.8253]], [[ 2.2395, -0.4475, -2.4586, ..., -3.9132, -3.0901, -3.9324]], [[ -7.9790, -18.5433, -19.8557, ..., -3.3593, -3.9992, -3.9865]], ..., [[ -4.9716, -11.2231, -11.2411, ..., -2.6323, -4.1561, -2.8715]], [[ -2.6730, -4.3674, -4.0934, ..., -1.4719, -1.5764, -1.2831]], [[ -0.6127, -5.8450, -5.6243, ..., -2.7843, -2.9116, -2.5379]]], [[[ -1.3836, -5.4986, -5.1387, ..., -1.4958, -1.8753, -1.0009]], [[ 1.6246, -1.0932, -1.1342, ..., 0.0401, -1.1148, -1.8978]], [[ -6.2022, -15.9230, -20.5062, ..., -5.9001, -2.8671, -5.3018]], ..., [[ -4.1789, -10.5431, -12.1323, ..., -1.9147, -2.9643, -3.4569]], [[ -2.0803, -3.8146, -3.8115, ..., -0.8027, -1.2117, -1.2020]], [[ -0.4615, -5.7737, -5.7270, ..., -2.6103, -2.6565, -2.6784]]]]) attn_weights tensor([[[[ 4.0963e+00, -4.5866e-01, -7.9213e-01, ..., -8.3983e-01, -2.2243e+00, -1.4094e+00]], [[-2.5781e+00, -9.3954e+00, -7.9277e+00, ..., -2.1617e+00, -3.6537e+00, -4.1507e+00]], [[-5.2211e+00, -1.4418e+01, -1.1392e+01, ..., -4.5787e+00, -3.6200e+00, -6.3721e+00]], ..., [[-1.8857e+00, -8.5652e+00, -4.9185e+00, ..., -2.6741e+00, -4.4977e-01, -3.5319e+00]], [[-1.1589e+00, -6.2970e+00, -5.5867e+00, ..., -3.1551e+00, -3.0205e+00, -3.0351e+00]], [[-2.4565e+00, -8.7715e+00, -1.0143e+01, ..., -3.6356e+00, -3.6791e-01, -2.8562e+00]]], [[[ 4.6031e+00, -5.1366e-02, -4.4861e-01, ..., -4.1046e+00, -4.3729e-01, 1.4946e+00]], [[-2.5134e+00, -6.3262e+00, -6.7357e+00, ..., -5.6938e+00, -2.9031e+00, -4.1628e+00]], [[-4.2431e+00, -9.5249e+00, -1.1039e+01, ..., -7.4881e+00, -4.3264e+00, -5.9537e+00]], ..., [[-1.5618e+00, -6.6591e+00, -8.1912e+00, ..., -7.2726e+00, -3.2214e+00, -3.7813e+00]], [[-9.3788e-01, -6.0095e+00, -5.1860e+00, ..., -4.0235e+00, -3.0027e+00, -3.1526e+00]], [[-2.1584e+00, -7.9113e+00, -9.0761e+00, ..., -5.5621e+00, -3.7827e+00, -4.2015e+00]]], [[[ 4.7082e+00, -7.9892e-01, -2.9352e+00, ..., -2.6475e+00, -7.2215e-01, 8.3280e-01]], [[-2.6387e+00, -7.0896e+00, -5.5537e+00, ..., -6.1205e+00, -3.5492e+00, -4.4043e+00]], [[-4.7503e+00, -1.0674e+01, -9.7344e+00, ..., -5.9848e+00, -4.0853e+00, -4.6041e+00]], ..., [[-1.9194e+00, -4.6338e+00, -3.9972e+00, ..., -3.8526e+00, -3.1201e+00, -3.8486e+00]], [[-9.4433e-01, -6.4947e+00, -5.2430e+00, ..., -2.9547e+00, -2.8707e+00, -2.7579e+00]], [[-3.0293e+00, -7.7034e+00, -7.9451e+00, ..., -2.0494e+00, -3.4693e+00, -4.1171e+00]]], [[[ 3.7143e+00, -7.9074e-01, 1.0002e+00, ..., -1.1736e+00, -2.9121e+00, 7.6092e-01]], [[-2.9347e+00, -9.9413e+00, -1.0048e+01, ..., -3.6043e+00, -4.8619e+00, -4.5500e+00]], [[-4.3521e+00, -1.4769e+01, -1.8280e+01, ..., -5.5324e+00, -4.1805e+00, -4.2655e+00]], ..., [[-2.2635e+00, -9.1445e+00, -1.0136e+01, ..., -2.2793e+00, -1.4191e+00, -2.5629e+00]], [[-1.2768e+00, -5.7798e+00, -6.4806e+00, ..., -3.2183e+00, -2.8972e+00, -1.9447e+00]], [[-2.7485e+00, -1.0180e+01, -1.1322e+01, ..., -3.2104e+00, -3.1059e+00, -2.3647e+00]]], [[[ 4.5643e+00, 3.1758e-01, 3.0851e+00, ..., -2.9285e+00, -1.5827e-02, 2.6128e+00]], [[-2.3715e+00, -8.0291e+00, -8.1745e+00, ..., -4.4216e+00, -2.8715e+00, -3.0117e+00]], [[-4.2849e+00, -1.1386e+01, -1.3781e+01, ..., -6.3218e+00, -4.1300e+00, -4.4956e+00]], ..., [[-1.3251e+00, -6.7874e+00, -7.5520e+00, ..., -8.4675e-01, -2.2508e+00, -2.5170e+00]], [[-7.7150e-01, -6.1150e+00, -5.4740e+00, ..., -4.0996e+00, -3.4241e+00, -2.4041e+00]], [[-2.2640e+00, -8.5510e+00, -9.6953e+00, ..., 1.1442e+00, -2.2687e+00, -3.4300e+00]]]]) attn_weights tensor([[[[ -2.3152, -11.1883, -9.4858, ..., -3.7701, -3.5162, -5.4821]], [[ -2.0138, -9.6517, -9.6860, ..., -2.0474, -3.9484, -4.4674]], [[ 0.0561, -2.9983, -2.5771, ..., -2.4449, -1.0359, -2.7757]], ..., [[ -0.9903, -6.3052, -6.7947, ..., -3.0705, -3.0791, -4.0379]], [[ 1.4897, -2.3815, -2.8314, ..., -1.8890, -1.3516, -0.9139]], [[ -6.8503, -26.9437, -22.7752, ..., -0.4449, 19.0769, 7.6200]]], [[[ -1.6564, -10.5064, -10.8836, ..., -8.4564, -4.6717, -4.7516]], [[ -1.8197, -7.7016, -10.2833, ..., -7.3580, -2.6494, -4.3439]], [[ 0.1575, -1.2591, -1.6753, ..., -2.8175, -0.8761, -2.6909]], ..., [[ -1.0428, -4.5284, -5.2318, ..., -3.4286, -2.9345, -4.8600]], [[ 1.2483, -2.3193, -3.0610, ..., -4.5790, -1.5514, -2.1510]], [[ -7.6494, -19.8091, -26.4775, ..., -14.0292, 4.2387, -2.9378]]], [[[ -2.8541, -9.9542, -10.4607, ..., -5.9373, -4.8379, -5.5668]], [[ -2.0828, -8.5629, -8.8996, ..., -6.3814, -3.6451, -3.2776]], [[ -0.2574, -2.0414, -3.0629, ..., -4.3068, -2.6979, -3.2815]], ..., [[ -1.6421, -5.0729, -5.3012, ..., -1.8450, -3.1324, -5.1603]], [[ 1.3802, -1.8811, -2.4536, ..., -3.2575, -1.9100, -1.1683]], [[ -9.3501, -22.6997, -32.5128, ..., -13.2055, 6.2121, -4.2813]]], [[[ -2.5535, -12.6135, -11.7364, ..., -5.1420, -4.7808, -3.9618]], [[ -2.5534, -9.2057, -8.6568, ..., -1.4814, -0.9178, -1.9273]], [[ -0.4669, -3.6632, -4.9419, ..., -4.1745, -4.2624, -5.2819]], ..., [[ -0.8766, -6.6477, -7.7958, ..., -2.9675, -4.0731, -4.9418]], [[ 1.3841, -3.1968, -4.2652, ..., -3.3956, -4.4095, -4.3623]], [[ -4.4496, -33.7322, -33.0830, ..., 2.1122, 11.6794, 4.3999]]], [[[ -1.7560, -10.8233, -11.7232, ..., -5.7752, -5.7122, -5.3639]], [[ -1.9391, -7.3531, -9.0758, ..., -2.5872, -2.4370, -3.2533]], [[ 0.5808, -3.2430, -3.7059, ..., -0.7795, -2.3708, -2.8040]], ..., [[ -0.6519, -5.7985, -7.9659, ..., -0.9268, -3.6980, -4.0908]], [[ 1.7414, -2.5124, -2.3444, ..., -3.7620, -1.8300, -1.8248]], [[ -8.8951, -21.7470, -31.4000, ..., -3.4238, 7.0877, -3.9897]]]]) attn_weights tensor([[[[ 2.6634, -6.8680, -0.6315, ..., -1.7090, -2.9324, -1.4333]], [[ 4.6049, -12.9789, -1.5270, ..., -3.7974, -6.0668, -3.2439]], [[ 0.5716, -4.1993, -5.0649, ..., -1.6896, -0.3562, -1.6069]], ..., [[ 1.0405, -3.8873, -3.4875, ..., -2.6745, -3.9977, -3.4639]], [[ 1.8588, -1.6727, -2.8184, ..., -0.9306, -1.5752, -1.2888]], [[ 1.0600, -1.8009, -2.4431, ..., -0.8533, -0.9516, -0.0219]]], [[[ 1.8405, -4.2353, -5.8985, ..., -5.1143, -1.6235, -2.4424]], [[ 4.2144, -10.9726, -8.7635, ..., -9.7893, -8.1273, -3.8936]], [[ 0.6918, -3.1385, -4.5712, ..., -3.5761, -1.5285, -3.2452]], ..., [[ 0.9835, -3.0853, -2.8684, ..., -3.1462, -1.8280, -3.0877]], [[ 1.7167, -1.8379, -1.7605, ..., -1.3057, -0.5369, -2.0814]], [[ 1.1535, -4.7950, -3.6882, ..., -6.3705, -2.0863, -0.1468]]], [[[ 2.4036, -4.1923, -3.4861, ..., -3.1419, -2.3804, -1.6688]], [[ 4.7259, -12.4269, -6.9591, ..., -9.5588, -5.7856, -1.8268]], [[ -0.0827, -3.2903, -3.0858, ..., -1.1172, -1.8744, -3.1136]], ..., [[ 0.9949, -3.6906, -3.3363, ..., -2.4735, -2.8055, -2.3403]], [[ 1.8803, -0.8673, -1.8405, ..., -0.3024, -0.6897, -2.6779]], [[ 0.8784, -4.2817, -3.8087, ..., -2.5928, -1.9623, 0.6135]]], [[[ 2.1136, -4.1893, -6.5625, ..., -2.0723, -1.4036, -2.1228]], [[ 4.6047, -6.2546, -6.5090, ..., -0.8376, 1.2545, -0.5202]], [[ 0.3366, -4.9694, -6.8539, ..., -2.4253, -1.4744, -3.8072]], ..., [[ 0.6671, -3.5535, -5.0172, ..., -2.4353, -2.5460, -4.1993]], [[ 1.7623, -1.1445, -1.6917, ..., -3.7054, -3.4905, -1.7533]], [[ 1.0617, -4.9753, -4.4682, ..., -3.2108, -2.8145, -2.0252]]], [[[ 2.4323, -3.6664, -4.2551, ..., -3.8555, -3.8627, -1.3318]], [[ 4.3840, -8.1315, -6.5807, ..., -5.1601, -5.6429, -2.2754]], [[ 0.8242, -3.7959, -6.0238, ..., -1.6123, -2.2890, -2.8168]], ..., [[ 1.0350, -3.2564, -4.3415, ..., -3.8262, -3.8355, -3.8265]], [[ 2.6988, -1.9357, -1.7054, ..., -1.9811, -1.8539, -0.0332]], [[ 1.0828, -3.2833, -2.5816, ..., -3.8531, -1.8945, -0.8216]]]]) attn_weights tensor([[[[-0.5138, -6.0974, -5.4469, ..., -2.8942, -2.2951, -3.2106]], [[ 0.7049, -6.1639, -5.6834, ..., -3.7027, -3.4748, -3.6662]], [[ 0.4382, -2.9038, -3.0331, ..., -3.6438, -2.2971, -1.9215]], ..., [[ 3.9415, -7.4810, -0.7094, ..., -0.9218, -1.5975, 0.6734]], [[ 2.8654, -3.1393, -1.4847, ..., -2.1585, -0.9588, 0.0872]], [[-0.1164, -5.2123, -6.8855, ..., -2.4049, 0.8824, -1.8012]]], [[[-0.1394, -5.0215, -5.2642, ..., -5.5244, -3.7709, -5.0503]], [[ 0.2704, -3.8452, -6.1509, ..., -4.9469, -2.9043, -3.7991]], [[ 0.3948, -3.1181, -2.9381, ..., -3.7078, -2.3215, -3.0025]], ..., [[ 4.6223, -9.0728, -6.9439, ..., -6.4451, -3.7293, -3.2885]], [[ 2.6325, -2.0253, -2.5751, ..., -2.6110, -0.9742, -2.0474]], [[ 0.3245, -3.9369, -6.7385, ..., -4.5173, -2.1458, -3.7545]]], [[[-1.0405, -4.2824, -4.7484, ..., -4.0321, -4.8909, -4.6583]], [[-0.9678, -3.4737, -4.2499, ..., -2.2897, -3.5560, -3.1190]], [[ 0.3352, -2.8521, -2.9417, ..., -4.0873, -3.1455, -2.7565]], ..., [[ 4.2624, -9.1080, -4.6434, ..., -4.8598, -3.5077, -0.3478]], [[ 2.8862, -3.0467, -2.3209, ..., -2.0490, -0.9545, -1.2485]], [[ 0.1039, -4.2168, -6.3689, ..., -4.0353, -4.0511, -2.9201]]], [[[-1.1295, -6.2879, -6.1421, ..., -2.1610, -1.4753, -3.5549]], [[-0.8671, -5.3472, -4.5607, ..., -3.0726, -2.5331, -0.7575]], [[ 0.4409, -2.4061, -2.5945, ..., -2.2395, -3.1319, -4.6212]], ..., [[ 4.5732, -6.2824, -1.6463, ..., 0.9178, 0.6255, -0.3725]], [[ 3.6741, -4.1936, -3.0387, ..., -0.7972, -0.7655, -1.6642]], [[-0.6152, -5.6105, -6.0042, ..., -0.5174, -0.4079, -4.1566]]], [[[-0.1534, -6.6388, -6.6378, ..., -3.8473, -3.9501, -2.2893]], [[ 0.5448, -5.4818, -7.0529, ..., -5.1755, -4.6684, -3.8226]], [[ 0.4080, -3.4874, -3.9256, ..., -1.5268, -1.5087, -2.3771]], ..., [[ 4.2587, -4.7029, -4.2406, ..., -1.8980, -3.4768, -1.5964]], [[ 2.8050, -3.5799, -3.8792, ..., -1.5464, -2.5212, -1.9650]], [[-0.1238, -4.2109, -7.6109, ..., 0.4869, -0.9049, -3.7981]]]]) attn_weights tensor([[[[-9.7836e-01, -8.2687e+00, -6.6677e+00, ..., -2.3058e+00, -8.5914e-01, -3.0306e+00]], [[ 3.1598e+00, -5.3508e-01, -1.4881e+00, ..., -7.5081e-01, -7.4562e-01, -3.6215e-01]], [[ 5.9876e+00, -3.5107e+00, 5.8445e-01, ..., -6.7946e-01, 1.2313e-01, 1.1512e+00]], ..., [[ 3.9304e-01, -4.2019e+00, -3.9677e+00, ..., -6.7000e-01, -2.2855e+00, -2.2861e+00]], [[ 3.9430e+00, -3.2955e+00, -1.0068e+00, ..., -2.7104e+00, -1.5832e+00, 4.0596e-01]], [[ 3.4510e+00, -3.0328e+00, 2.6896e-01, ..., -2.4944e-03, -9.5345e-01, -1.6127e+00]]], [[[-3.9230e-01, -6.9327e+00, -7.8232e+00, ..., -6.1630e+00, -1.7864e+00, -4.5708e+00]], [[ 2.5673e+00, -1.5337e+00, -2.5513e+00, ..., -6.6274e-01, 6.0886e-01, -2.2275e+00]], [[ 5.8685e+00, -3.8089e+00, -4.8784e+00, ..., -2.5996e+00, -1.8931e+00, -1.5144e+00]], ..., [[ 5.5046e-01, -2.7718e+00, -3.8881e+00, ..., -4.5999e+00, -5.4221e-01, -2.0502e+00]], [[ 4.1498e+00, -4.8671e+00, -5.1966e+00, ..., -2.4428e+00, -1.7112e+00, -3.0400e+00]], [[ 3.2991e+00, -3.8046e+00, -3.8404e+00, ..., -4.2841e+00, -2.6794e+00, -4.2931e+00]]], [[[-6.2096e-01, -5.9315e+00, -7.0142e+00, ..., -6.0266e+00, -3.1448e+00, -3.7094e+00]], [[ 2.2094e+00, -2.4391e+00, -1.6465e+00, ..., -1.4974e-01, -3.2550e-01, -1.3291e+00]], [[ 6.3718e+00, -5.0820e+00, -1.6983e+00, ..., -3.7071e+00, -4.8228e+00, -5.6843e-01]], ..., [[ 2.1307e-01, -1.8743e+00, -2.7864e+00, ..., -4.3875e+00, -2.9434e+00, -1.5709e+00]], [[ 4.0295e+00, -3.1042e+00, -9.0013e-01, ..., -3.9549e-01, -2.8016e+00, -4.9697e-01]], [[ 2.7475e+00, -2.5633e+00, -1.7699e+00, ..., -3.9275e+00, -3.4606e+00, -1.3982e+00]]], [[[-8.0735e-01, -8.4470e+00, -9.4681e+00, ..., -2.8356e+00, -9.1928e-01, -4.5092e+00]], [[ 2.0591e+00, -1.9193e+00, -2.1329e+00, ..., -1.3266e+00, -1.7266e+00, -1.1661e+00]], [[ 6.5844e+00, -2.6168e+00, -3.1436e+00, ..., -5.3112e+00, -5.5373e-01, -3.5398e-01]], ..., [[-8.3630e-02, -3.8676e+00, -4.5249e+00, ..., -1.1019e+00, -1.1932e+00, -2.2342e+00]], [[ 2.9946e+00, -2.5678e+00, -8.5566e-01, ..., -5.9719e-01, -1.8177e+00, -1.5591e+00]], [[ 2.7545e+00, -1.1146e+00, -2.8943e+00, ..., -4.7956e+00, -8.4074e-01, -2.3641e+00]]], [[[-1.2179e-01, -7.9389e+00, -9.9493e+00, ..., -4.4872e+00, -3.6196e+00, -4.6913e+00]], [[ 2.7079e+00, -1.7763e+00, -1.9145e+00, ..., -1.9415e+00, -1.0791e+00, 1.0850e+00]], [[ 6.1855e+00, -2.3612e+00, -4.1203e+00, ..., -4.2513e-02, -1.2194e+00, -1.1396e+00]], ..., [[ 6.6730e-01, -4.4363e+00, -5.2075e+00, ..., -1.5296e+00, -6.6218e-01, -1.5226e+00]], [[ 4.0660e+00, -2.4028e+00, -3.5412e+00, ..., -7.0325e-01, -6.1362e-02, -4.9651e-01]], [[ 3.2676e+00, -3.0756e+00, -4.2147e+00, ..., -2.7209e+00, -2.5306e+00, -1.2828e+00]]]]) attn_weights tensor([[[[ 1.2593, -1.8916, -2.0461, ..., -1.9408, -3.0099, -1.6854]], [[ 4.3524, -0.3517, 1.9204, ..., 0.2816, 0.4808, 1.3313]], [[ 1.3880, 0.0988, -0.5210, ..., -0.4285, -0.1871, 0.3902]], ..., [[ 1.1852, -2.3365, -1.6204, ..., -1.9680, -2.4787, -2.0451]], [[ 1.4655, -2.0096, -1.7293, ..., -1.7537, -1.3400, -0.5261]], [[ 0.8944, -2.5440, -2.6271, ..., -3.6849, -2.8883, -2.7316]]], [[[ 0.9941, -3.7350, -3.4598, ..., -2.0852, -1.6154, -2.0304]], [[ 4.4600, -3.3867, -2.6984, ..., -0.7138, -0.3279, -2.3100]], [[ 1.6713, -1.0808, -1.7767, ..., -0.7497, 1.0172, -1.5710]], ..., [[ 0.6132, -3.6238, -2.8607, ..., -1.7089, -0.2182, -1.7054]], [[ 1.1631, -3.7780, -3.2268, ..., -2.9789, -1.6578, -2.0301]], [[ 0.9855, -3.1292, -3.3802, ..., -4.6025, -1.9578, -4.0379]]], [[[ 1.1914, -3.0475, -2.7270, ..., -2.6766, -2.6069, -2.7059]], [[ 3.4321, -0.3897, 0.7221, ..., -1.0767, -2.1210, -0.8875]], [[ 1.2549, -0.1627, -0.1414, ..., -1.3069, 0.6072, -1.1341]], ..., [[ 0.8688, -3.1859, -2.1355, ..., -1.5336, -1.4949, -2.1909]], [[ 0.9693, -2.9590, -1.8236, ..., -2.2148, -2.7008, -1.3607]], [[ 1.2438, -2.1836, -2.4205, ..., -3.9460, -3.9903, -4.7711]]], [[[ 1.3541, -2.9745, -3.9173, ..., -4.0120, -2.8944, -2.4014]], [[ 4.3316, -0.9107, -0.2422, ..., -0.2544, 1.2120, 0.0658]], [[ 2.4081, -0.8650, -1.8946, ..., -0.5541, -1.1244, -2.2487]], ..., [[ 0.9264, -4.3418, -3.9924, ..., -3.3933, -3.7847, -2.0415]], [[ 0.8639, -4.2938, -4.8340, ..., -2.1573, -1.3700, -1.4833]], [[ 0.6192, -3.8050, -4.6269, ..., -4.6681, -4.9316, -4.5299]]], [[[ 1.2981, -3.3057, -2.9156, ..., -0.9881, -1.5324, -1.7074]], [[ 3.9398, -2.3952, -3.5837, ..., -1.4577, -1.4048, -1.5522]], [[ 2.1619, -1.6569, -3.0289, ..., -0.9008, -0.4473, -2.0978]], ..., [[ 1.0013, -4.2050, -3.8664, ..., -3.4637, -2.1816, -1.8085]], [[ 1.2228, -4.4923, -3.8964, ..., -2.0583, -1.5406, -1.4060]], [[ 1.2792, -2.8811, -3.8633, ..., -4.6502, -3.8078, -3.8301]]]]) attn_weights tensor([[[[ 2.1188, -0.6990, -1.9902, ..., -2.1726, -1.9769, -1.1448]], [[ 4.0151, 0.0893, -0.2191, ..., -0.9917, -0.2533, 0.5076]], [[ 2.1196, -2.1271, -1.7484, ..., -2.9180, -4.2491, -2.8929]], ..., [[ 3.3078, -1.6313, -2.7732, ..., -3.6560, -3.6729, -2.5228]], [[ 1.4392, -4.7287, -4.3483, ..., 0.0767, 0.0847, -0.9082]], [[ 4.0545, -0.8703, 0.1420, ..., -0.5609, -1.7134, 0.0563]]], [[[ 1.7339, -1.5968, -1.8879, ..., -3.0461, -0.8903, -2.9322]], [[ 3.7049, -1.5989, -3.0460, ..., -0.5614, -0.3000, -1.1142]], [[ 1.3854, -3.0441, -3.7098, ..., -2.5834, -1.1229, -4.2512]], ..., [[ 3.7499, -2.4987, -2.2594, ..., -2.0257, -1.6813, -2.6380]], [[ 1.2094, -3.3684, -4.8574, ..., -3.4627, 0.3431, -2.9992]], [[ 3.7141, -1.1801, -2.7023, ..., -1.9927, -2.0251, -3.2456]]], [[[ 1.6163, -1.7070, -2.7923, ..., -2.0070, -3.2565, -3.2094]], [[ 3.7103, -0.7360, -1.6363, ..., -0.8415, -2.1569, -0.3780]], [[ 1.4025, -1.9556, -2.0150, ..., -0.7952, -1.5462, -2.6768]], ..., [[ 3.5888, -2.1826, -2.3673, ..., -2.1064, -3.8148, -2.9872]], [[ 1.4479, -3.7417, -4.6151, ..., -2.2793, -1.5067, -0.2108]], [[ 3.5549, -0.0665, -0.8111, ..., -2.5573, -2.7116, -1.2795]]], [[[ 1.7360, -4.1219, -3.9496, ..., -4.5796, -5.1085, -3.3332]], [[ 3.6170, -0.9746, -1.8030, ..., -2.6456, -0.9994, -1.1424]], [[ 1.3613, -3.6361, -3.6088, ..., -3.8522, -3.2648, -0.8798]], ..., [[ 4.3269, -1.7608, -1.4622, ..., -2.2956, -1.1850, 0.5965]], [[ 0.8155, -5.7965, -6.5662, ..., -1.7399, 0.4818, -1.1323]], [[ 4.0323, -0.0934, -2.2093, ..., -2.7802, -1.6480, -2.7884]]], [[[ 1.6987, -2.4608, -3.7415, ..., -1.9171, -2.1600, -2.0662]], [[ 3.7206, -1.7026, -2.6220, ..., -1.4617, -0.9035, -1.5101]], [[ 1.4358, -2.8395, -3.3394, ..., -2.1672, -1.2192, -1.7520]], ..., [[ 4.1333, -1.9281, -2.3981, ..., -1.0056, -1.9009, -1.6568]], [[ 1.1510, -4.0380, -5.1209, ..., 0.4670, 0.4272, -1.2135]], [[ 3.8469, -2.3333, -3.7281, ..., -1.8776, -2.2136, -2.1542]]]]) attn_weights tensor([[[[ 2.2681, -3.2933, -3.2612, ..., -3.8046, -3.7346, -3.8258]], [[ 3.3056, -0.8964, -1.6380, ..., -1.8542, -0.5315, -0.7636]], [[ 2.8961, -1.2233, -1.1865, ..., -1.3946, -0.6603, -1.3524]], ..., [[ 0.4186, -3.8797, -3.8725, ..., -1.1409, -1.0325, -1.6866]], [[ 3.2170, -2.0996, -1.1496, ..., -2.1905, -2.0517, -2.1217]], [[ 3.3204, -0.9191, -1.1964, ..., -1.4135, 0.3668, -0.2321]]], [[[ 1.9589, -3.1050, -4.1907, ..., -3.3307, -1.2547, -2.8523]], [[ 3.7624, -2.5987, -3.5255, ..., -0.1727, -1.6961, -1.1080]], [[ 3.2307, -2.2438, -1.7268, ..., -1.6820, -0.9455, -2.5373]], ..., [[ 0.9327, -2.7902, -3.0396, ..., -4.1999, -0.4482, -2.4571]], [[ 3.1146, -2.1869, -2.1381, ..., -3.1857, -1.2914, -1.9816]], [[ 3.9298, 0.0143, -1.3259, ..., 0.0357, 2.3222, -0.7078]]], [[[ 2.1208, -2.2107, -2.9735, ..., -2.9302, -3.2091, -3.4065]], [[ 3.1831, -1.5101, -2.6262, ..., -0.5381, -2.6465, -2.4777]], [[ 2.3444, -0.6454, -0.9539, ..., -2.2435, -1.7189, -1.7733]], ..., [[ 0.4022, -2.4118, -2.1907, ..., -2.2714, -0.6174, -1.0632]], [[ 3.1201, -1.9037, -0.9574, ..., -2.8823, -3.0303, -2.8658]], [[ 1.7434, -1.4231, -1.7532, ..., -1.4460, -1.1803, -1.8202]]], [[[ 2.8023, -3.7053, -4.5054, ..., -6.2218, -4.7532, -2.7900]], [[ 3.5642, -1.7240, -3.0967, ..., -4.4612, -0.3583, -0.6809]], [[ 3.0584, -0.1584, -1.8202, ..., -3.8003, -3.6433, -2.1412]], ..., [[ 0.2714, -5.6920, -6.1863, ..., -4.2914, -2.8198, -1.3822]], [[ 3.0600, -2.5507, -1.9637, ..., -3.4045, -3.1968, -1.9320]], [[ 3.3894, -2.0491, -1.9282, ..., -1.4607, 0.1779, 0.3157]]], [[[ 3.1073, -4.6660, -4.5111, ..., -3.1323, -4.2834, -3.3511]], [[ 3.6418, -2.4315, -2.1873, ..., -0.9157, -1.8319, -0.9915]], [[ 3.3682, -2.8846, -2.7782, ..., -1.0528, -0.1558, -0.2630]], ..., [[ 1.8529, -5.3060, -5.5262, ..., -4.0853, -2.9816, -2.4619]], [[ 3.4969, -2.4593, -2.2030, ..., -2.0893, -1.6100, -1.2602]], [[ 4.2390, -1.1339, -0.8530, ..., 1.1805, 1.5540, 1.7674]]]]) attn_weights tensor([[[[ 1.3410e+00, 1.3200e+00, 9.1488e-01, ..., 1.7582e+00, 8.4173e-01, 1.5887e+00]], [[ 2.9193e+00, 8.1439e-01, 9.4958e-02, ..., -2.9518e-01, -4.7615e-01, -2.7859e-01]], [[ 2.7522e+00, -1.4850e-01, -1.4798e+00, ..., -1.7889e+00, -2.7497e+00, -8.9515e-01]], ..., [[ 3.8576e+00, 2.9227e-01, -6.7008e-01, ..., -5.3869e-01, -3.3211e-03, 2.0368e-01]], [[ 3.0353e+00, 1.5044e+00, 2.2601e-01, ..., 9.4688e-01, 4.8855e-01, 8.5932e-01]], [[ 2.9554e+00, 4.8295e-02, -5.9110e-01, ..., 7.2323e-01, -7.3047e-01, -4.1923e-01]]], [[[ 1.8161e+00, 7.8663e-01, 1.4068e-01, ..., 2.9860e-01, 7.9329e-01, 8.5293e-01]], [[ 3.6306e+00, -8.9721e-01, -1.4034e+00, ..., -8.1974e-01, 8.7800e-01, 4.7628e-01]], [[ 2.8253e+00, -6.6037e-01, -1.9365e+00, ..., -2.5279e+00, 3.3735e-01, -3.7742e-01]], ..., [[ 4.0643e+00, -1.3737e+00, -3.0648e+00, ..., -1.9240e-01, -2.7299e-01, -1.4538e+00]], [[ 3.3862e+00, 3.2440e-01, -6.8368e-01, ..., -9.6337e-01, 1.7663e+00, 1.4185e+00]], [[ 3.5555e+00, 1.9081e-01, -1.0438e+00, ..., -9.3960e-01, 9.6518e-01, 8.4953e-02]]], [[[ 1.1181e+00, 1.5796e+00, 1.4769e+00, ..., 1.3402e+00, 1.0386e+00, 2.3395e+00]], [[ 3.0127e+00, -1.7118e-01, -9.6028e-01, ..., -1.2321e+00, -1.1602e+00, -7.0136e-01]], [[ 2.7413e+00, -6.9617e-02, -1.8205e+00, ..., -2.4174e+00, -1.0609e+00, -1.4258e+00]], ..., [[ 3.5685e+00, -1.1461e+00, -2.1061e+00, ..., -9.5443e-01, -2.5078e+00, -1.7924e+00]], [[ 2.6515e+00, 1.1270e+00, 4.2931e-01, ..., -3.8724e-01, 9.9928e-01, 1.5946e+00]], [[ 2.5069e+00, 6.5799e-01, -1.2693e+00, ..., -9.2900e-01, 8.0208e-02, 1.2255e+00]]], [[[ 1.7476e+00, 5.8442e-01, -1.9878e-01, ..., -9.7190e-01, -9.4216e-01, -5.7824e-02]], [[ 3.4649e+00, -3.1958e-01, -4.2209e-01, ..., -2.3072e+00, -1.4356e+00, 6.8279e-02]], [[ 2.9730e+00, -3.6366e-01, -2.2110e+00, ..., -4.5191e+00, -2.6986e+00, -2.6076e+00]], ..., [[ 3.8481e+00, -1.5682e+00, -2.6869e+00, ..., -3.8703e+00, -1.9850e+00, -6.0819e-01]], [[ 1.8100e+00, -1.2837e+00, -2.0718e+00, ..., -3.0750e+00, -7.0277e-01, -8.9457e-01]], [[ 1.8839e+00, -1.1088e+00, -2.1909e+00, ..., -2.9416e+00, -2.2928e-01, -2.2173e-01]]], [[[ 1.8256e+00, 1.1282e-02, -7.0081e-01, ..., -1.4316e-01, -7.3967e-02, -3.6770e-03]], [[ 4.4354e+00, -1.7419e+00, -1.5696e+00, ..., -8.4205e-01, -1.4030e+00, -1.2223e+00]], [[ 3.8655e+00, -1.7758e+00, -1.9713e+00, ..., -1.8526e+00, -2.0764e+00, -9.9262e-01]], ..., [[ 4.5500e+00, -4.6147e-01, -9.8344e-01, ..., 8.2858e-01, 4.7810e-01, 5.7747e-01]], [[ 3.7285e+00, 2.7059e-01, 1.7401e+00, ..., 2.3493e-01, 6.9869e-01, 2.0805e+00]], [[ 3.1991e+00, -1.2685e+00, 3.2514e-01, ..., -5.9116e-02, -8.7916e-02, 1.6348e+00]]]]) attn_weights tensor([[[[-0.5880, -2.9639, -2.2343, ..., -2.5052, -2.8828, -1.7982]], [[ 1.7670, 0.9845, 5.8140, ..., -2.4014, 0.7088, 6.3884]], [[-1.5161, -2.3322, -2.2156, ..., -2.7066, -2.3009, -2.1188]], ..., [[-1.9227, -2.3042, -2.5862, ..., -2.4977, -2.0537, -2.3327]], [[ 0.6487, -0.1578, 1.2773, ..., -0.5968, -0.1271, 1.5626]], [[-1.7059, -2.4770, -3.8143, ..., -2.7914, -2.4253, -4.0908]]], [[[-1.0844, -3.3470, -3.9223, ..., -3.1587, -2.5230, -2.5059]], [[ 0.5143, -0.4758, -0.2528, ..., -1.0879, -0.0401, 8.5111]], [[-1.7659, -3.3962, -3.2156, ..., -2.9151, -2.5704, -3.2689]], ..., [[-2.1635, -2.8060, -2.7746, ..., -2.4254, -2.3622, -3.3392]], [[-0.1782, -0.7160, -0.7403, ..., -0.4809, -0.2293, 1.1045]], [[-0.5720, -1.8719, -2.3571, ..., -2.2679, -2.3212, -2.5543]]], [[[-0.5880, -2.9639, -2.2343, ..., -2.9144, -1.7924, -1.7982]], [[ 1.7670, 0.9845, 5.8140, ..., 0.7015, 0.0617, 6.3884]], [[-1.5161, -2.3322, -2.2156, ..., -2.3285, -1.8153, -2.1188]], ..., [[-1.9227, -2.3042, -2.5862, ..., -2.0853, -1.9207, -2.3327]], [[ 0.6487, -0.1578, 1.2773, ..., -0.1321, 0.0670, 1.5626]], [[-1.7059, -2.4770, -3.8143, ..., -2.4624, -2.4895, -4.0908]]], [[[-0.9467, -3.4942, -2.1216, ..., -2.5415, -2.4245, -2.4665]], [[ 2.3477, 1.4018, -0.3491, ..., -1.3911, -0.5154, 7.6289]], [[-2.0351, -2.8976, -1.8602, ..., -1.7732, -2.1421, -2.0131]], ..., [[-2.1480, -2.4886, -2.5260, ..., -2.2754, -2.4011, -2.5467]], [[-0.1853, -0.7664, -0.8804, ..., -0.3021, -0.6767, 0.8573]], [[-1.4788, -2.2161, -3.6659, ..., -3.3763, -3.9335, -2.4560]]], [[[-0.8465, -2.7324, -1.9131, ..., -2.5042, -1.3654, -1.8461]], [[ 0.3976, 0.2281, 0.4412, ..., -0.9460, -0.2680, 9.7894]], [[-1.6847, -3.2002, -2.3118, ..., -3.1701, -2.0313, -2.2705]], ..., [[-2.3363, -2.8584, -2.7108, ..., -2.5407, -2.3227, -2.7567]], [[-0.2027, -0.6203, -0.6330, ..., -0.4936, -0.4988, 0.9487]], [[-1.0299, -2.0017, -3.3181, ..., -2.4131, -3.8975, -1.8775]]]]) attn_weights tensor([[[[-0.6994, -3.4128, -3.6077, ..., 0.6183, 1.0252, 1.1026]], [[-1.4102, -2.7691, -3.7948, ..., 0.3363, 1.7216, 0.4899]], [[-3.8620, -4.3803, -4.2695, ..., -2.9934, -2.3999, -2.5228]], ..., [[ 1.0264, -0.6402, -0.1681, ..., 0.0300, -0.9450, -0.1150]], [[-4.1338, -2.6971, -2.5469, ..., -0.9909, -0.7155, -0.6990]], [[-1.8533, -1.4910, 0.5805, ..., -4.1289, -0.5858, 2.2632]]], [[[-3.5675, -5.1497, -4.8094, ..., -0.2358, 3.5203, -0.7942]], [[-1.6621, -3.0164, -3.0807, ..., 1.6590, 1.2824, 0.6350]], [[-3.8222, -4.3227, -4.2869, ..., -2.5640, -2.5842, -2.4895]], ..., [[ 1.3250, -0.5052, 0.7350, ..., -0.9914, 0.5054, -0.5584]], [[-4.5248, -2.5473, -2.4342, ..., -0.6379, -0.5882, -0.4250]], [[ 1.2574, 0.6325, -2.0543, ..., 1.7989, -0.7932, 4.3882]]], [[[-0.2652, -3.0180, -3.1312, ..., 0.5833, 1.8119, 1.3247]], [[-1.2479, -2.5885, -3.5430, ..., 1.2726, 1.6250, 0.6406]], [[-3.8167, -4.3726, -4.2627, ..., -2.6245, -2.5992, -2.5097]], ..., [[ 1.0909, -0.5475, -0.0528, ..., -1.0143, -0.0931, -0.0612]], [[-4.1340, -2.6865, -2.5382, ..., -0.8927, -0.6324, -0.6948]], [[-2.9297, -2.2633, -0.3063, ..., -1.0765, -2.6757, 1.2794]]], [[[-1.5699, -4.0714, -3.3993, ..., -0.0210, 0.0199, -0.5212]], [[-0.5619, -2.2392, -3.3970, ..., 0.2984, -0.5429, 0.6799]], [[-3.5762, -4.2507, -4.0633, ..., -2.7199, -2.5264, -2.1261]], ..., [[ 1.2369, -0.4490, -0.0965, ..., 0.1191, -0.3143, -0.6032]], [[-4.0245, -2.5737, -2.4497, ..., -1.0008, -0.7214, -0.1704]], [[ 0.9748, -0.0248, -1.9386, ..., -1.4709, -1.9529, 2.6042]]], [[[-3.5707, -5.1290, -3.7542, ..., -0.2939, 1.4022, -0.4896]], [[-2.0651, -3.5928, -3.7783, ..., 1.2756, 0.9619, 0.0896]], [[-3.8007, -4.2102, -4.2640, ..., -2.3884, -2.6890, -2.7230]], ..., [[ 1.0297, -0.7416, 0.2065, ..., -1.0748, 0.1172, -0.8518]], [[-4.3918, -2.5836, -2.5640, ..., -0.7861, -0.9058, -0.6252]], [[ 1.2837, 0.9907, -2.0013, ..., 1.0510, -1.9855, 5.6280]]]]) attn_weights tensor([[[[ -1.3866, -5.6990, -5.3802, ..., -1.3009, -2.2371, -1.2883]], [[ 1.4143, -0.9858, -1.9609, ..., -1.3860, -1.3433, -2.5973]], [[ -6.1724, -15.7824, -20.1797, ..., -3.8730, -2.6232, -4.7732]], ..., [[ -4.0688, -10.5930, -12.0070, ..., -2.7478, -2.9647, -3.2413]], [[ -2.2545, -4.0237, -3.9806, ..., -1.6085, -1.4552, -1.3002]], [[ -0.4511, -5.7720, -5.6807, ..., -2.8006, -2.6506, -2.5187]]], [[[ -1.6727, -5.0019, -5.0790, ..., -1.9103, 0.4526, -2.4024]], [[ 1.7126, -1.2872, -0.9602, ..., -1.6252, -1.4855, -2.0375]], [[ -6.6672, -16.1220, -17.0754, ..., -5.3704, -1.9192, -5.6125]], ..., [[ -4.0583, -8.9287, -9.2065, ..., -2.1977, -2.8987, -2.6932]], [[ -1.7121, -3.6952, -3.7080, ..., -1.6149, -1.4982, -0.3765]], [[ -0.4905, -5.8046, -5.6556, ..., -2.7733, -3.3164, -2.2095]]], [[[ -1.2843, -5.1526, -4.9515, ..., -2.6623, -0.9572, -1.3188]], [[ 1.2046, -0.9483, -1.9270, ..., -1.5525, -2.2990, -2.7792]], [[ -5.8870, -14.9325, -19.1555, ..., -3.9429, -2.9865, -4.5878]], ..., [[ -3.5671, -9.8953, -11.1611, ..., -3.6460, -3.3382, -3.0141]], [[ -2.1621, -4.0850, -3.8478, ..., -2.1162, -1.6121, -1.3349]], [[ -0.4390, -5.5138, -5.3111, ..., -3.1958, -2.7125, -2.3905]]], [[[ -0.9652, -5.2662, -3.4077, ..., -1.7246, -1.3866, -2.3680]], [[ 1.1845, -0.0842, -1.4078, ..., -2.3035, -2.3159, -0.8496]], [[ -5.6380, -16.7649, -15.7287, ..., -5.4933, -4.3133, -3.8100]], ..., [[ -3.6494, -10.0221, -10.1244, ..., -4.1018, -1.9518, -2.8150]], [[ -1.9325, -4.1589, -3.8404, ..., -1.8455, -1.3858, -1.0691]], [[ -0.2398, -5.8105, -5.2029, ..., -3.0818, -2.4579, -2.4003]]], [[[ -1.5553, -5.6015, -5.2406, ..., -2.0466, -1.2314, -1.8487]], [[ 1.4032, -1.0989, -0.9987, ..., -1.1691, -1.8034, -0.3396]], [[ -6.4233, -17.6995, -17.7753, ..., -4.0578, -2.8950, -4.7586]], ..., [[ -4.2547, -9.9829, -10.1947, ..., -2.8223, -1.8731, -2.8493]], [[ -2.1042, -3.8611, -3.9036, ..., -1.3057, -1.3114, -0.7343]], [[ -0.4932, -5.7995, -5.7527, ..., -2.9022, -2.8124, -2.4275]]]]) attn_weights tensor([[[[ 4.2949, -0.0778, 2.6816, ..., -4.0767, -0.8795, 2.0550]], [[ -2.6757, -8.7544, -9.0815, ..., -3.9137, -3.3745, -3.5944]], [[ -4.6018, -12.1066, -14.3297, ..., -4.1292, -3.9406, -4.5080]], ..., [[ -1.5856, -7.6024, -8.0911, ..., -0.5346, -3.0246, -3.0009]], [[ -1.0012, -6.1213, -5.3314, ..., -4.2454, -3.9031, -2.3882]], [[ -2.5368, -8.8406, -10.3121, ..., -0.8690, -3.2870, -3.9609]]], [[[ 4.9598, -0.7107, -2.9234, ..., -0.8774, -3.1339, 1.0574]], [[ -2.2329, -7.0677, -7.2632, ..., -3.1852, -4.2957, -6.2424]], [[ -4.1920, -10.8424, -11.8857, ..., -5.0140, -3.6704, -5.3690]], ..., [[ -1.3460, -7.3520, -6.6943, ..., -2.7253, -2.5275, -2.1714]], [[ -0.7453, -5.6462, -5.9712, ..., -3.2015, -3.2455, -2.6875]], [[ -1.5957, -7.8262, -8.9810, ..., -2.9078, -2.8574, -2.6017]]], [[[ 4.0956, -0.3970, 1.8363, ..., -0.4834, -2.1290, 0.6239]], [[ -2.6723, -6.9992, -7.5713, ..., -3.4068, -3.2548, -3.7112]], [[ -4.1686, -10.6602, -12.8752, ..., -4.6094, -3.2791, -4.5469]], ..., [[ -1.3942, -6.4234, -7.1490, ..., -4.0247, -2.1642, -3.0830]], [[ -0.8904, -5.7204, -4.8492, ..., -3.4433, -2.5225, -2.4125]], [[ -2.3169, -7.9800, -9.0820, ..., -4.2836, -1.7712, -3.7708]]], [[[ 4.2155, 0.4554, -1.2736, ..., -2.4187, -3.2857, 1.9210]], [[ -2.4930, -7.3107, -8.5335, ..., -4.8812, -4.5820, -4.1207]], [[ -4.0328, -10.3203, -11.7302, ..., -4.9064, -4.0873, -5.8197]], ..., [[ -1.5788, -5.7713, -6.4024, ..., -2.8985, -4.4408, -3.4293]], [[ -1.0195, -5.5915, -4.8046, ..., -3.5157, -2.2968, -2.6295]], [[ -2.2786, -7.9584, -8.6513, ..., -3.6533, -3.2608, -2.6550]]], [[[ 4.4976, -0.9963, -1.7863, ..., -2.0698, -2.8004, 2.2053]], [[ -2.3199, -8.9979, -8.2125, ..., -3.6866, -2.9210, -4.1842]], [[ -4.1448, -13.3502, -14.2097, ..., -5.8570, -4.7246, -5.3860]], ..., [[ -1.2692, -7.6096, -7.7579, ..., -2.9577, -2.5829, -2.7861]], [[ -0.8672, -6.9079, -6.5728, ..., -4.2495, -3.5269, -2.8448]], [[ -2.1854, -8.5712, -10.2758, ..., -3.2380, -4.3333, -4.1312]]]]) attn_weights tensor([[[[ -2.3839, -11.8606, -12.3407, ..., -5.5040, -7.1417, -5.9496]], [[ -2.7581, -8.5236, -9.9042, ..., -3.8574, -2.1210, -3.4823]], [[ -0.0555, -2.5043, -3.2237, ..., -1.6527, -2.0624, -3.2137]], ..., [[ -1.1824, -5.7391, -7.6004, ..., -2.6048, -3.5157, -3.9021]], [[ 1.5267, -2.3776, -3.3131, ..., -2.3813, -1.8420, -3.5187]], [[-10.4436, -21.5699, -29.9162, ..., 5.0986, 12.3676, 0.7906]]], [[[ -0.9934, -9.4957, -9.4715, ..., -4.4998, -2.5702, -4.7542]], [[ -1.8694, -7.0904, -8.0373, ..., -1.8558, -2.8245, -3.3632]], [[ 0.0735, -2.1600, -2.8087, ..., -1.0176, -2.8608, -2.3064]], ..., [[ -0.1502, -4.5717, -6.3602, ..., -2.6125, -2.8188, -3.9513]], [[ 1.5904, -2.9077, -2.5202, ..., -1.6267, -2.4022, -4.3172]], [[ -8.4183, -21.8376, -25.3462, ..., -5.9963, 9.4301, -2.1476]]], [[[ -2.2248, -11.3576, -11.6416, ..., -6.8667, -5.9466, -6.0305]], [[ -2.6052, -7.9144, -9.5225, ..., -3.3076, -0.9357, -3.1656]], [[ -0.1142, -2.1171, -3.4816, ..., -3.1660, -3.2736, -4.3192]], ..., [[ -1.2110, -5.3449, -6.4906, ..., -3.9832, -3.7645, -3.6995]], [[ 1.4582, -2.1100, -3.4895, ..., -2.3905, -1.8306, -3.5508]], [[ -8.1861, -22.3595, -28.4209, ..., -1.7142, 8.8813, -0.2524]]], [[[ -2.6255, -11.0767, -10.6641, ..., -4.3724, -3.4245, -5.2457]], [[ -2.1123, -7.9283, -8.3956, ..., -2.1548, -3.2176, -4.0442]], [[ -0.1741, -2.1735, -3.3173, ..., -3.9552, -4.6407, -1.8686]], ..., [[ -1.2706, -5.0701, -5.2959, ..., -2.5246, -2.3586, -2.5472]], [[ 1.3162, -1.9359, -2.5715, ..., -3.9336, -4.6329, -2.4491]], [[ -8.1205, -30.8220, -28.3421, ..., 0.2788, 8.3045, -3.4155]]], [[[ -1.0914, -11.7863, -11.3603, ..., -6.3314, -5.5920, -3.8779]], [[ -1.9479, -7.9193, -8.8167, ..., -2.7007, -2.9575, -2.8267]], [[ 0.4026, -3.6682, -3.9977, ..., -1.7939, -2.3650, -2.1582]], ..., [[ -0.5187, -5.7266, -6.4020, ..., -2.7723, -2.2899, -2.3383]], [[ 1.6255, -2.8827, -1.4203, ..., -2.4365, -1.0180, -1.7845]], [[ -6.2790, -26.5067, -15.8133, ..., -6.9951, 8.6372, 2.5179]]]]) attn_weights tensor([[[[ 2.3652, -4.1609, -4.2160, ..., -3.2424, -3.1680, -1.1192]], [[ 4.1586, -7.7163, -5.5232, ..., -7.5543, -6.8101, -2.2577]], [[ 0.5240, -3.9085, -6.4728, ..., -0.1121, -0.8781, -2.5043]], ..., [[ 0.7412, -3.2533, -4.5081, ..., -4.0551, -3.2310, -3.8284]], [[ 1.9310, -1.2259, -1.3088, ..., -1.9624, -2.1156, -0.4116]], [[ 0.9073, -2.7941, -1.5958, ..., -1.2602, -1.8146, -0.2085]]], [[[ 1.7865, -3.9211, -4.7332, ..., -0.6232, -2.9072, -3.2698]], [[ 4.0833, -10.1240, -9.8810, ..., -7.0245, -5.4219, -5.4171]], [[ 0.8477, -3.3778, -5.4037, ..., -1.6337, -0.5637, -2.5607]], ..., [[ 1.1154, -3.3403, -3.4850, ..., -2.0779, -2.6678, -5.8369]], [[ 2.3996, -1.5736, -0.2555, ..., 0.0940, -1.4085, -2.2896]], [[ 1.3317, -4.9082, -4.0888, ..., -1.8025, -1.3796, -0.0148]]], [[[ 2.1137, -4.3412, -5.6949, ..., -2.5499, -2.7972, -2.3152]], [[ 4.4128, -7.6458, -7.1003, ..., -7.9027, -6.4533, -2.6176]], [[ 0.2806, -4.2204, -5.1873, ..., -4.0785, -3.9016, -3.6133]], ..., [[ 0.6875, -2.9021, -3.7811, ..., -2.8565, -3.1543, -3.6791]], [[ 1.7604, -0.7393, -1.0832, ..., -0.9378, -1.3189, -0.7292]], [[ 0.9553, -3.6972, -2.6907, ..., -2.7484, -0.2649, -0.3938]]], [[[ 3.0518, -3.5496, -3.3460, ..., -2.3318, -4.0586, -0.6061]], [[ 4.7148, -6.8339, -5.7173, ..., -6.9072, -6.0045, -1.4831]], [[ 0.3631, -3.1986, -3.9617, ..., -1.7999, -1.3552, -2.2842]], ..., [[ 1.3605, -2.7516, -2.6101, ..., -2.5644, -2.7889, -2.0990]], [[ 1.8514, -0.6825, -0.6528, ..., -3.2440, -1.4251, -0.0540]], [[ 1.2096, -2.0196, -2.3751, ..., -2.7984, -2.5933, -0.8789]]], [[[ 2.4928, -5.4107, -5.6512, ..., -4.8932, -3.3024, -1.9145]], [[ 4.3607, -8.8405, -7.5692, ..., -5.8144, -3.9149, -3.2600]], [[ 0.9249, -4.7114, -5.7191, ..., -3.1811, -2.3826, -2.5596]], ..., [[ 1.2643, -3.7012, -4.0217, ..., -4.0182, -3.8712, -4.2649]], [[ 2.4916, -1.4340, -1.4346, ..., -2.1012, -0.5631, 0.8376]], [[ 1.0963, -4.5982, -4.5971, ..., -3.1379, -3.3174, -0.2821]]]]) attn_weights tensor([[[[-4.2570e-01, -6.2728e+00, -5.6967e+00, ..., -3.6057e+00, -3.0466e+00, -1.5473e+00]], [[ 1.7904e-01, -6.1831e+00, -7.0117e+00, ..., -3.9228e+00, -4.6904e+00, -3.7769e+00]], [[ 3.8494e-01, -3.1706e+00, -3.2904e+00, ..., -3.1500e+00, -2.4793e+00, -2.9560e+00]], ..., [[ 3.3249e+00, -4.7998e+00, -4.2341e+00, ..., -4.4421e+00, -2.9126e+00, -1.9849e+00]], [[ 2.8924e+00, -3.3593e+00, -3.3812e+00, ..., -1.1144e+00, -1.0638e+00, -1.4481e+00]], [[-1.4917e-01, -4.4108e+00, -7.5303e+00, ..., 9.5287e-01, -1.8491e-01, -2.8362e+00]]], [[[ 6.6542e-02, -4.9122e+00, -6.1645e+00, ..., -3.4772e+00, -3.3493e+00, -5.2989e+00]], [[ 9.1014e-01, -3.7486e+00, -6.6007e+00, ..., -3.5478e+00, -4.2786e+00, -6.4042e+00]], [[ 4.6603e-01, -2.4384e+00, -2.3744e+00, ..., -1.3589e+00, -2.3886e+00, -3.3986e+00]], ..., [[ 4.6080e+00, -7.2084e+00, -7.4204e+00, ..., -1.0132e+00, -2.1364e+00, -4.8004e+00]], [[ 2.2146e+00, -1.9457e+00, -1.5853e+00, ..., -6.3836e-02, -2.2323e+00, -1.3526e+00]], [[ 4.9551e-01, -4.0720e+00, -6.3483e+00, ..., -2.6890e+00, -2.2436e+00, -2.7123e+00]]], [[[-1.0249e+00, -5.5813e+00, -5.9704e+00, ..., -5.1885e+00, -3.3155e+00, -3.0416e+00]], [[-7.7874e-01, -4.5862e+00, -6.4255e+00, ..., -3.2146e+00, -2.9863e+00, -4.3025e+00]], [[ 3.1906e-01, -2.9622e+00, -2.9273e+00, ..., -2.7752e+00, -2.4569e+00, -3.0927e+00]], ..., [[ 4.0434e+00, -6.3282e+00, -5.7975e+00, ..., -4.9943e+00, -4.1095e+00, -3.7212e+00]], [[ 2.7632e+00, -3.6828e+00, -3.8297e+00, ..., -3.5726e-01, -1.4943e+00, -1.5630e+00]], [[ 1.4347e-02, -4.1083e+00, -7.7145e+00, ..., -2.9609e+00, -6.1393e-01, -3.6236e+00]]], [[[-7.1351e-01, -5.4281e+00, -5.4307e+00, ..., -3.9996e+00, -3.8481e+00, -4.4579e+00]], [[-1.3432e-01, -4.4064e+00, -5.4668e+00, ..., -3.9625e+00, -3.3613e+00, -2.7708e+00]], [[ 1.9645e-01, -2.8888e+00, -2.9335e+00, ..., -4.1832e+00, -4.6945e+00, -2.1054e+00]], ..., [[ 4.5951e+00, -3.5462e+00, -3.9335e-01, ..., -4.6163e+00, -3.6550e+00, -1.3751e+00]], [[ 2.9045e+00, -2.2411e+00, -2.1733e+00, ..., -2.0020e+00, -3.4350e+00, -7.9336e-01]], [[-8.5427e-02, -4.2211e+00, -6.6107e+00, ..., -3.8623e+00, -5.3398e+00, -3.9243e+00]]], [[[-5.8518e-01, -5.5660e+00, -3.7412e+00, ..., -3.3830e+00, -6.4758e-01, -1.7372e+00]], [[ 1.1792e+00, -5.9339e+00, -7.0560e+00, ..., -4.5668e+00, -3.9235e+00, -3.0857e+00]], [[ 4.7778e-01, -3.3193e+00, -3.8556e+00, ..., -1.6898e+00, -2.3068e+00, -2.6599e+00]], ..., [[ 4.4647e+00, -6.9415e+00, -5.4456e+00, ..., -4.7765e+00, -3.7690e+00, -2.2446e+00]], [[ 2.9537e+00, -4.4717e+00, -3.9226e+00, ..., -2.1452e+00, -1.7106e+00, -9.0146e-01]], [[ 1.4864e-03, -4.5868e+00, -6.2720e+00, ..., -1.1048e+00, -2.3465e+00, -1.6941e+00]]]]) attn_weights tensor([[[[-0.4350, -7.4721, -8.8468, ..., -2.2875, -1.5593, -3.0989]], [[ 2.7993, -0.7249, -1.2007, ..., -0.7647, -1.0108, -0.8104]], [[ 5.9587, -1.4572, -2.1772, ..., -2.0465, -0.1524, -0.0544]], ..., [[ 0.3514, -3.0398, -3.9294, ..., -1.8770, -0.3869, -1.5211]], [[ 3.5774, -1.3864, -2.7099, ..., -2.3047, 0.6008, -0.7413]], [[ 3.5030, -3.0989, -3.6593, ..., -2.8710, -2.1253, -2.3366]]], [[[ 0.1566, -6.0964, -7.7976, ..., -3.3136, -1.7256, -4.4879]], [[ 2.8495, -2.4836, -2.8556, ..., 0.3941, -2.1628, -2.1828]], [[ 6.5033, -2.7008, -5.5329, ..., -1.4483, -2.5134, -0.6586]], ..., [[ 0.7275, -3.1664, -3.7973, ..., -0.0271, -0.9732, -5.1118]], [[ 5.1103, -6.0399, -5.3895, ..., -2.0150, -1.0740, -4.7375]], [[ 3.1180, -1.4010, -3.1873, ..., -2.0202, -4.0849, -2.8472]]], [[[-0.5053, -7.1456, -9.0806, ..., -4.8628, -2.0209, -4.4917]], [[ 2.2138, -1.3509, -1.2877, ..., 1.2772, -0.1325, -0.2725]], [[ 6.0844, -2.6417, -3.1602, ..., -4.3638, -1.9335, -0.8363]], ..., [[ 0.1475, -1.9585, -2.9630, ..., -2.5935, -0.1372, -1.3056]], [[ 4.0085, -0.8492, -1.8677, ..., -1.6223, -0.1033, -1.1315]], [[ 3.1338, -2.8920, -3.1906, ..., -2.9876, -2.7022, -2.0541]]], [[[-0.4727, -8.6909, -8.0976, ..., -4.1375, -2.6498, -5.2118]], [[ 2.8456, -2.1197, -1.5184, ..., -1.6297, -0.6294, 0.6960]], [[ 5.8057, -1.9307, 0.1857, ..., -1.8851, -1.6158, 0.1760]], ..., [[ 0.7832, -4.4673, -5.1842, ..., -5.1963, -5.2186, -2.2923]], [[ 3.5149, -3.7424, -0.5003, ..., -3.8942, -2.1089, -1.4086]], [[ 2.8802, -2.7775, -2.2891, ..., -4.9654, -3.7418, -1.2890]]], [[[-0.3396, -7.8469, -7.5931, ..., -4.1767, -2.8581, -4.0612]], [[ 3.0483, -2.5989, -3.4240, ..., -2.6588, -1.5341, 0.2898]], [[ 6.7608, -3.6527, -4.3083, ..., -4.2870, -3.2353, -1.3586]], ..., [[ 0.4328, -4.2591, -4.5868, ..., -0.8715, -1.0375, -2.0417]], [[ 4.4420, -3.1099, -2.6379, ..., -1.3795, -1.4520, -0.9530]], [[ 3.1009, -3.8275, -4.3764, ..., -2.5087, -1.7896, -1.9758]]]]) attn_weights tensor([[[[ 1.2476, -1.8789, -1.8342, ..., -1.8236, -1.2302, -1.0709]], [[ 3.8400, -0.8527, -2.5143, ..., -2.3830, -1.3991, -1.1948]], [[ 1.6347, -0.2052, -1.9298, ..., -0.3092, 0.4503, -1.6276]], ..., [[ 1.2418, -2.8297, -2.7343, ..., -2.2677, -2.4112, -1.8598]], [[ 1.5680, -2.6571, -2.5230, ..., -1.8774, -1.0435, -1.3156]], [[ 1.4081, -1.8550, -3.2592, ..., -2.6265, -1.9481, -2.9478]]], [[[ 1.2802, -3.4209, -3.3523, ..., -1.1208, -2.2320, -2.2912]], [[ 4.9287, -2.0977, -2.0482, ..., 0.3025, -1.3373, -0.8655]], [[ 2.1599, -1.0249, -2.2363, ..., 1.8450, -0.1366, 0.2688]], ..., [[ 1.1583, -4.2597, -3.9784, ..., -0.7237, -2.0442, -2.4328]], [[ 1.5095, -4.0374, -3.1047, ..., -1.5348, -2.2492, -2.6094]], [[ 1.0188, -3.7773, -3.8370, ..., -2.4394, -3.2831, -4.6171]]], [[[ 1.1449, -2.7188, -2.2518, ..., -3.1693, -3.0071, -2.0834]], [[ 4.2196, -1.3849, -3.1697, ..., -2.4994, -1.7792, -2.2324]], [[ 2.0377, -1.2096, -2.5666, ..., -0.5258, -2.0713, -2.8245]], ..., [[ 0.7562, -3.7220, -3.2970, ..., -2.2355, -2.5142, -1.8612]], [[ 1.1319, -3.7167, -2.8877, ..., -2.0071, -1.1917, -1.4029]], [[ 1.4012, -2.2137, -3.3578, ..., -3.8335, -3.4222, -3.5720]]], [[[ 1.5335, -2.3830, -3.0972, ..., -4.8838, -5.5237, -2.1858]], [[ 2.9597, -2.1905, -0.8607, ..., -1.9611, -0.3333, -0.8491]], [[ 1.7845, -0.1991, -0.9524, ..., -1.6257, -2.0892, 0.8554]], ..., [[ 1.0325, -2.5513, -2.1719, ..., -2.2574, -1.9846, -1.3298]], [[ 1.0387, -2.0543, -2.4083, ..., -2.0298, -2.0539, -1.1193]], [[ 0.6370, -3.1679, -3.2661, ..., -6.0784, -3.5925, -2.3958]]], [[[ 0.9297, -3.4090, -3.8053, ..., -2.0040, -2.5184, -1.5061]], [[ 4.2452, -1.7438, -2.9692, ..., -1.9601, -1.9120, 0.0939]], [[ 1.5988, -1.5533, -2.6893, ..., -0.2117, -1.5013, -0.6467]], ..., [[ 1.1703, -4.3073, -4.0020, ..., -3.4939, -2.4476, -1.8413]], [[ 1.1273, -4.6390, -3.7697, ..., -1.6252, -1.4485, -1.3571]], [[ 0.6796, -4.5042, -4.0648, ..., -4.6629, -3.8334, -4.2228]]]]) attn_weights tensor([[[[ 2.6415e+00, 5.2410e-01, -1.7437e+00, ..., -1.6244e+00, 3.6475e-01, -1.5129e+00]], [[ 4.6868e+00, 5.6159e-01, -5.8828e-01, ..., -2.2274e+00, -2.9585e-01, -2.7012e-01]], [[ 2.7170e+00, -6.7890e-01, -1.4737e+00, ..., -2.8902e+00, -6.8286e-01, -1.3274e+00]], ..., [[ 4.8465e+00, -5.2804e-01, -2.2910e+00, ..., -3.3993e+00, -2.4671e+00, -2.7614e+00]], [[ 1.5639e+00, -3.1991e+00, -3.7362e+00, ..., 1.0594e+00, 1.0525e+00, 6.0565e-02]], [[ 3.7135e+00, -2.1686e+00, -3.0748e+00, ..., -4.4333e+00, -2.1192e+00, -3.6025e+00]]], [[[ 2.4608e+00, -3.3805e+00, -3.8163e+00, ..., -2.0874e+00, -3.5451e+00, -3.3645e+00]], [[ 4.0376e+00, -1.5596e+00, -3.0841e+00, ..., -1.4649e+00, -3.0857e+00, -2.8023e+00]], [[ 2.2397e+00, -3.1076e+00, -4.0259e+00, ..., -1.1428e-01, -2.4645e+00, -3.1676e+00]], ..., [[ 3.7662e+00, -2.8787e+00, -3.1276e+00, ..., -1.7109e+00, -2.5436e+00, -1.8004e+00]], [[ 1.8992e+00, -6.0226e+00, -6.5197e+00, ..., -2.0356e+00, -2.0518e+00, -2.2198e+00]], [[ 3.3992e+00, -1.2280e+00, -2.0576e+00, ..., -9.6870e-01, -2.2125e+00, -1.9865e+00]]], [[[ 1.5012e+00, -8.3789e-01, -2.1118e+00, ..., -1.4833e+00, -1.9519e+00, -2.4029e+00]], [[ 3.9742e+00, -3.0748e-01, -1.6094e+00, ..., -1.9429e+00, -1.3031e+00, -1.8519e+00]], [[ 1.4194e+00, -1.1652e+00, -2.4214e+00, ..., -4.1446e-01, -1.1175e+00, -1.9498e+00]], ..., [[ 4.5636e+00, -1.8004e+00, -2.4336e+00, ..., -2.7949e+00, -2.1221e+00, -2.6044e+00]], [[ 1.1193e+00, -3.7018e+00, -4.8380e+00, ..., -2.1211e+00, 5.9119e-01, -1.5898e+00]], [[ 3.6365e+00, -1.1963e+00, -2.7890e+00, ..., -3.0295e+00, -2.7928e+00, -2.5125e+00]]], [[[ 1.7076e+00, -1.4133e+00, -2.8156e+00, ..., -4.7757e+00, -3.0704e+00, -8.3484e-01]], [[ 2.4421e+00, -1.1990e+00, -1.6830e+00, ..., -2.3636e+00, -2.7752e+00, -4.0049e-01]], [[ 1.4277e+00, -2.4739e+00, -2.3725e+00, ..., -3.2464e+00, 2.0300e-02, -5.6210e-01]], ..., [[ 2.9748e+00, -2.6552e+00, -2.1987e+00, ..., -4.2688e+00, -1.2936e+00, -1.3614e+00]], [[ 5.4563e-01, -4.2069e+00, -4.6786e+00, ..., -1.4418e+00, -2.3318e+00, -1.5493e+00]], [[ 3.6688e+00, -3.1314e-03, -9.6493e-01, ..., -3.9070e+00, -3.8502e+00, 5.3712e-01]]], [[[ 2.1802e+00, -4.0734e+00, -4.0564e+00, ..., -3.1632e+00, -2.6146e+00, -2.7935e+00]], [[ 3.3416e+00, -2.1276e+00, -2.3431e+00, ..., -1.8905e+00, -1.7817e+00, -1.7909e-01]], [[ 2.0732e+00, -4.3457e+00, -3.4127e+00, ..., -3.3444e+00, -2.7871e+00, -2.1816e+00]], ..., [[ 3.8068e+00, -1.2882e+00, -1.8599e+00, ..., -1.8341e+00, -1.7325e+00, -9.6229e-01]], [[ 1.6815e+00, -5.3935e+00, -4.8015e+00, ..., -2.1037e+00, -1.8947e+00, -1.4898e+00]], [[ 3.5466e+00, -1.0334e+00, -3.2506e+00, ..., -1.7924e+00, -1.7305e+00, -2.1959e+00]]]]) attn_weights tensor([[[[ 3.2707e+00, -2.9987e+00, -3.3810e+00, ..., -5.1826e+00, -4.1198e+00, -4.0359e+00]], [[ 3.9290e+00, -1.8176e-01, 3.3241e-01, ..., -4.0362e+00, -2.1449e+00, 1.8390e-01]], [[ 3.6730e+00, -1.0270e+00, -1.9796e+00, ..., -1.9324e+00, -2.0763e+00, -1.7625e+00]], ..., [[ 2.3242e+00, -5.3920e+00, -5.3445e+00, ..., -4.8245e+00, -3.8374e+00, -3.1485e+00]], [[ 3.9271e+00, -7.8661e-01, -1.4347e+00, ..., -3.3875e+00, -1.2688e+00, -1.6683e+00]], [[ 4.6895e+00, 1.7532e-01, -5.7323e-01, ..., -1.2906e+00, -1.3135e-03, 2.0464e-01]]], [[[ 3.2605e+00, -3.4325e+00, -4.1395e+00, ..., -2.0371e+00, -3.2620e+00, -4.0405e+00]], [[ 4.4782e+00, -1.9146e+00, -3.0555e+00, ..., -7.2209e-02, -9.5721e-01, -2.0659e+00]], [[ 3.0908e+00, -9.8387e-01, -2.0520e+00, ..., -6.5929e-02, -1.9169e+00, -3.8594e+00]], ..., [[ 1.2798e+00, -5.0261e+00, -6.7977e+00, ..., -1.8274e+00, -2.4084e+00, -3.0818e+00]], [[ 3.7750e+00, -3.6250e+00, -3.2936e+00, ..., -2.9724e+00, -3.4684e+00, -4.4076e+00]], [[ 4.3808e+00, -1.6350e+00, -1.3287e+00, ..., 1.9594e-01, -1.4986e+00, -2.9508e+00]]], [[[ 2.9618e+00, -3.2650e+00, -3.5663e+00, ..., -2.8070e+00, -3.4621e+00, -3.7633e+00]], [[ 3.8503e+00, -1.6978e+00, -1.3692e+00, ..., -2.3263e+00, -2.5794e+00, -1.2756e+00]], [[ 3.1019e+00, -1.3913e+00, -2.0484e+00, ..., -2.1014e+00, -1.3819e+00, -1.8795e+00]], ..., [[ 1.8884e+00, -4.2100e+00, -3.5945e+00, ..., -3.8686e+00, -3.2842e+00, -2.4895e+00]], [[ 3.6911e+00, -1.8735e+00, -1.8314e+00, ..., -1.8270e+00, -1.8778e+00, -1.6305e+00]], [[ 3.5489e+00, -1.1300e+00, -1.2564e+00, ..., 3.5659e-01, 3.8169e-01, -7.4731e-01]]], [[[ 1.9028e+00, -2.6716e+00, -3.6056e+00, ..., -4.9198e+00, -2.8733e+00, -1.2772e+00]], [[ 2.8708e+00, -9.5526e-01, -1.8732e+00, ..., -2.6246e+00, -4.7344e-01, 9.7920e-02]], [[ 2.7492e+00, -1.1146e-01, -9.6314e-01, ..., -3.9993e+00, -2.7180e+00, 3.1734e-01]], ..., [[ 4.9330e-01, -3.6581e+00, -2.7539e+00, ..., -2.7182e+00, -9.7012e-01, -8.6308e-01]], [[ 2.6301e+00, -2.3297e+00, -1.6867e+00, ..., -3.8751e+00, -1.9016e+00, -1.7090e+00]], [[ 2.7274e+00, -1.7608e+00, -2.2800e+00, ..., -2.9981e+00, -9.2333e-01, -1.0669e+00]]], [[[ 2.5208e+00, -3.6078e+00, -4.3233e+00, ..., -4.0118e+00, -3.1093e+00, -2.9699e+00]], [[ 3.7815e+00, -3.0055e+00, -3.7983e+00, ..., -2.7580e+00, -2.6010e+00, -7.1094e-01]], [[ 3.1104e+00, -3.1322e+00, -2.7399e+00, ..., -1.8109e+00, -1.0600e+00, -8.1894e-01]], ..., [[ 7.7067e-01, -4.6139e+00, -5.0514e+00, ..., -2.1778e+00, -2.0467e+00, -1.2455e+00]], [[ 3.2130e+00, -2.4157e+00, -2.3963e+00, ..., -2.5278e+00, -1.8793e+00, -2.2715e+00]], [[ 3.1069e+00, -1.7000e+00, -1.0648e+00, ..., -1.1572e+00, 6.7325e-01, 3.7274e-02]]]]) attn_weights tensor([[[[ 1.6455, 0.5856, 0.0689, ..., 0.0312, 0.7942, 0.0309]], [[ 4.2892, -0.8553, -0.9071, ..., -2.2863, -1.8408, -1.6620]], [[ 4.2423, -0.6633, -1.6182, ..., -3.8106, -2.1881, -2.0788]], ..., [[ 5.4203, 1.3555, 0.9264, ..., -0.8355, 1.2506, 1.0853]], [[ 4.1464, 1.3833, 2.6393, ..., 0.1440, 0.9040, 2.2081]], [[ 3.7036, 0.9398, 1.7860, ..., 0.6889, 0.9889, 1.7747]]], [[[ 1.1144, 0.7119, -0.1818, ..., 0.3335, 1.2051, 1.0978]], [[ 3.7598, -1.3784, -1.6516, ..., -0.5310, -1.6998, -1.8282]], [[ 3.6199, -0.8339, -2.1528, ..., -0.9465, -2.2416, -2.9495]], ..., [[ 4.1990, -1.1992, -2.8319, ..., -0.5666, -2.4540, -0.8412]], [[ 3.5525, 0.9567, -0.3514, ..., 1.5487, -0.4159, -1.3062]], [[ 1.4369, 3.5021, 0.4808, ..., 8.1066, 0.1275, -1.3075]]], [[[ 1.3354, 1.0000, 0.9052, ..., 0.9157, 1.0774, 1.2119]], [[ 4.2969, -1.4251, -1.2655, ..., -1.4539, -1.1824, -0.8326]], [[ 3.9365, -1.4688, -1.8494, ..., -2.2255, -3.0105, -2.0834]], ..., [[ 4.6344, -0.2810, -0.5404, ..., -0.7710, -0.0304, -1.1475]], [[ 3.3331, 0.1201, 2.5481, ..., -0.0684, 0.2521, 2.5052]], [[ 3.1427, -0.8339, 1.0396, ..., -1.0941, -0.1468, 1.8169]]], [[[ 2.2689, 2.3495, 1.1801, ..., -1.6214, -0.2800, 3.0167]], [[ 2.7462, 0.5620, -0.4844, ..., -0.7436, 0.3126, 1.0299]], [[ 2.7559, 0.2851, -1.8444, ..., -3.0659, -2.5877, 0.7855]], ..., [[ 3.1895, 0.1315, -1.6694, ..., -2.4488, -1.1112, 0.4114]], [[ 3.0315, 1.7859, -0.0488, ..., -0.1941, -0.2428, 2.0778]], [[ 2.3209, 0.2663, -1.4236, ..., -0.7385, 0.3517, -0.2970]]], [[[ 1.6058, 0.6997, -0.6197, ..., 1.3775, 0.2615, 1.2530]], [[ 3.3787, -0.7819, -1.7024, ..., -0.0797, -0.7075, -0.1924]], [[ 2.8935, -0.7992, -1.6721, ..., -0.4014, -0.5836, -0.9840]], ..., [[ 3.4597, -2.0237, -3.2376, ..., -2.0376, -2.5833, -0.3175]], [[ 3.0946, 0.4448, -1.1979, ..., 2.2338, -0.5920, 1.4906]], [[ 2.6905, 0.4867, -1.7940, ..., 2.1236, -0.8712, 0.7145]]]]) attn_weights tensor([[[[-1.4785, -2.8014, -1.9321, ..., -2.6741, -1.4258, -0.7837]], [[ 0.3095, 0.3476, 0.4384, ..., -0.8321, -0.2328, 8.8559]], [[-1.1013, -2.1837, -1.6040, ..., -2.3757, -1.5911, -1.2434]], ..., [[-2.1192, -2.4997, -2.7552, ..., -2.2764, -2.4850, -2.8447]], [[ 0.1396, -0.0271, -0.0734, ..., -0.1825, -0.1623, 1.4550]], [[-0.8767, -1.8220, -3.0915, ..., -1.9182, -3.4394, -1.6975]]], [[[-1.4787, -3.7164, -2.5114, ..., -1.4963, -2.0103, -3.7893]], [[-2.2280, -0.2480, -3.1811, ..., -1.2467, -4.5806, 4.5664]], [[-2.2524, -2.7232, -3.0694, ..., -2.0679, -2.5534, -1.5234]], ..., [[-1.8561, -2.1783, -2.2192, ..., -1.5823, -2.3188, -1.6506]], [[-0.3840, -0.4730, -0.4701, ..., -0.0737, -0.7250, 0.3198]], [[-1.4982, -2.3029, -3.5771, ..., -3.2467, -2.6908, -2.4189]]], [[[-0.3740, -2.0377, -1.3123, ..., -0.9389, -0.7904, -1.0897]], [[ 2.0796, 1.8565, 1.7617, ..., 0.6332, 0.9146, 8.8162]], [[-1.3872, -2.5978, -1.8442, ..., -1.9623, -1.7904, -1.7245]], ..., [[-2.2304, -2.6528, -2.8422, ..., -2.2289, -2.5296, -2.9909]], [[ 0.1120, -0.3791, 0.3462, ..., 0.0812, 0.6103, 0.9849]], [[-1.1295, -1.8938, -3.4301, ..., -2.4465, -3.9942, -2.0423]]], [[[-1.0291, -4.1976, -1.9808, ..., -2.2338, -1.5944, -3.6334]], [[-1.3207, 0.2106, -1.8108, ..., -2.9047, -0.3229, 4.5219]], [[-1.5345, -2.7685, -1.6180, ..., -2.1866, -1.1796, -3.3408]], ..., [[-1.4201, -1.7952, -1.6780, ..., -1.7093, -1.3884, -1.1287]], [[-0.2091, -0.6977, -0.6242, ..., -0.4598, -0.1471, 0.1155]], [[-1.0499, -2.2182, -3.1941, ..., -3.5244, -2.3891, -2.0420]]], [[[-1.4787, -3.7164, -2.5114, ..., -1.7407, -2.5651, -3.7893]], [[-2.2280, -0.2480, -3.1811, ..., -3.4980, -4.5689, 4.5664]], [[-2.2524, -2.7232, -3.0694, ..., -2.8774, -2.4469, -1.5234]], ..., [[-1.8561, -2.1783, -2.2192, ..., -1.9262, -2.2419, -1.6506]], [[-0.3840, -0.4730, -0.4701, ..., -0.1805, -0.6318, 0.3198]], [[-1.4982, -2.3029, -3.5771, ..., -3.9898, -2.2768, -2.4189]]]]) attn_weights tensor([[[[-1.8731, -4.0567, -2.7117, ..., 0.6466, 2.2140, 0.1234]], [[-1.1528, -2.7475, -3.0944, ..., 1.9932, 1.6446, 0.6886]], [[-3.6692, -4.2130, -4.1796, ..., -2.2551, -2.4787, -2.7564]], ..., [[ 1.1689, -0.3611, -0.0138, ..., -0.8968, -0.2212, -0.7281]], [[-4.2517, -2.5322, -2.5018, ..., -0.7045, -0.7699, -0.9587]], [[ 0.0422, 0.0586, -0.9397, ..., 0.4564, -0.5923, 4.1182]]], [[[-1.5674, -4.4326, -3.8127, ..., 1.1829, 1.2735, -0.3027]], [[-1.1049, -2.2935, -2.5800, ..., 1.2961, 0.9796, 0.8864]], [[-3.8691, -4.2856, -4.3161, ..., -2.6897, -2.5436, -2.3435]], ..., [[ 1.3453, -0.6565, 0.3228, ..., 0.3068, -0.5101, -0.5071]], [[-4.1912, -2.6383, -2.5367, ..., -0.7155, -0.4864, -0.6331]], [[ 0.5162, -0.2971, -2.8800, ..., -1.0033, -2.2594, 2.6582]]], [[[-2.6591, -4.8884, -3.6411, ..., 0.1580, 1.3757, -0.3418]], [[-1.2015, -2.6147, -3.5403, ..., 1.2807, 0.6597, 0.1575]], [[-3.7948, -4.2364, -4.2166, ..., -2.6200, -2.6095, -2.8006]], ..., [[ 1.1304, -0.5424, -0.2897, ..., 0.0214, -0.3134, -0.7187]], [[-4.3131, -2.6854, -2.6026, ..., -0.6674, -0.8071, -0.8056]], [[-0.0318, -0.3505, -3.0806, ..., -1.9391, -2.3801, 3.4748]]], [[[ 0.4752, -1.7441, -2.0465, ..., 0.5330, 1.1021, 1.2302]], [[ 0.4613, -1.2714, -1.9407, ..., 0.6279, 2.0848, 1.8124]], [[-3.4313, -4.1421, -3.9570, ..., -2.4779, -2.2007, -2.1735]], ..., [[ 1.7240, -0.3997, 0.2731, ..., 0.2650, -0.1485, -0.0732]], [[-4.3285, -2.3100, -2.1955, ..., -0.6527, -0.1770, -0.4887]], [[ 0.8686, -0.1952, -1.7246, ..., -2.7399, 0.0885, 1.6249]]], [[[-1.9587, -5.1028, -4.2300, ..., 0.5377, 2.3306, -0.9072]], [[-0.7990, -2.3015, -2.5872, ..., 1.3438, 1.1518, 0.9941]], [[-3.9222, -4.3526, -4.3932, ..., -2.7979, -2.8920, -2.5708]], ..., [[ 1.4603, -0.6111, 0.1697, ..., -0.1685, -0.2325, -0.6861]], [[-4.1326, -2.6487, -2.5605, ..., -0.8720, -0.6716, -0.7129]], [[ 1.9013, 0.6211, -1.8036, ..., -1.0170, -2.7057, 3.9889]]]]) attn_weights tensor([[[[-1.5970e+00, -5.7065e+00, -5.5228e+00, ..., -2.0388e+00, -1.3985e+00, -1.1108e+00]], [[ 1.1583e+00, 1.2508e-01, -2.4181e+00, ..., -6.1999e-01, -3.0962e+00, -1.1536e+00]], [[-6.8778e+00, -1.8190e+01, -1.8575e+01, ..., -5.3184e+00, -3.6103e+00, -5.5073e+00]], ..., [[-3.9622e+00, -9.9794e+00, -1.0609e+01, ..., -2.8219e+00, -2.2360e+00, -3.1577e+00]], [[-2.4549e+00, -4.3123e+00, -4.2542e+00, ..., -1.6428e+00, -1.4375e+00, -1.4411e+00]], [[-4.8242e-01, -5.9141e+00, -5.7325e+00, ..., -2.8658e+00, -2.6390e+00, -2.8524e+00]]], [[[-1.9135e+00, -5.7026e+00, -5.3735e+00, ..., -3.5611e-01, -1.9204e+00, -7.0507e-01]], [[ 1.6720e+00, -1.4347e+00, -6.8056e-01, ..., -9.3011e-01, -1.0007e+00, -9.5178e-01]], [[-6.3927e+00, -1.8429e+01, -1.8219e+01, ..., -3.8694e+00, -5.3478e+00, -6.0402e+00]], ..., [[-4.2529e+00, -9.7841e+00, -9.6169e+00, ..., -3.8462e+00, -1.3864e+00, -3.7864e+00]], [[-1.6748e+00, -3.8057e+00, -3.6888e+00, ..., -1.4812e+00, -2.2874e-01, -8.8231e-01]], [[-4.8527e-01, -5.9714e+00, -5.8391e+00, ..., -3.3130e+00, -2.3412e+00, -2.5779e+00]]], [[[-1.5012e+00, -5.2332e+00, -5.2224e+00, ..., -1.3671e+00, -1.6743e+00, -2.0658e+00]], [[ 1.2115e+00, -9.7039e-01, -2.3168e+00, ..., -2.1095e+00, -3.1090e+00, -2.3689e+00]], [[-7.2312e+00, -1.7559e+01, -1.7538e+01, ..., -5.4589e+00, -3.1470e+00, -5.4197e+00]], ..., [[-4.1697e+00, -9.7917e+00, -1.0266e+01, ..., -3.4889e+00, -2.3095e+00, -3.1625e+00]], [[-2.4241e+00, -4.2346e+00, -4.0866e+00, ..., -1.7277e+00, -1.6043e+00, -1.4505e+00]], [[-5.3093e-01, -5.8609e+00, -5.5950e+00, ..., -2.8182e+00, -2.6448e+00, -2.6470e+00]]], [[[-5.9509e-01, -4.1309e+00, -2.9241e+00, ..., -1.2710e+00, -2.1765e+00, -2.1889e+00]], [[ 1.2714e+00, -1.3788e+00, -1.5630e+00, ..., -2.3010e+00, -9.8574e-01, -1.8216e+00]], [[-4.4257e+00, -1.4807e+01, -1.5291e+01, ..., -4.4213e+00, -1.3722e+00, -2.7204e+00]], ..., [[-2.5079e+00, -7.6035e+00, -8.0773e+00, ..., -1.9075e+00, -6.6023e-01, -1.7805e+00]], [[-1.5790e-01, -3.1717e+00, -2.5185e+00, ..., -6.2739e-01, -4.4161e-01, -6.1135e-01]], [[-1.6337e-01, -5.7535e+00, -5.1007e+00, ..., -2.8399e+00, -2.4758e+00, -2.2191e+00]]], [[[-2.0048e+00, -6.1312e+00, -5.8527e+00, ..., -1.7893e+00, -1.3709e+00, -8.6355e-01]], [[ 2.0957e+00, -8.0653e-01, -1.0355e+00, ..., -1.8782e+00, 9.8326e-03, 3.0245e-01]], [[-6.4183e+00, -1.9410e+01, -1.9476e+01, ..., -4.2480e+00, -3.5071e+00, -5.4234e+00]], ..., [[-4.2162e+00, -1.0542e+01, -1.0776e+01, ..., -2.4786e+00, -2.2613e+00, -3.7364e+00]], [[-1.9651e+00, -4.0116e+00, -3.9932e+00, ..., -1.4230e+00, -7.4854e-01, -9.6316e-01]], [[-4.6293e-01, -6.1026e+00, -6.0147e+00, ..., -2.9901e+00, -2.5455e+00, -2.5481e+00]]]]) attn_weights tensor([[[[ 4.7157, -0.9589, -0.2598, ..., -1.6118, -1.2507, 3.1206]], [[ -2.3654, -9.0833, -8.3149, ..., -3.3711, -2.9059, -4.5297]], [[ -4.4308, -12.6057, -12.6254, ..., -4.3353, -2.6738, -5.2582]], ..., [[ -0.9989, -6.9102, -8.0282, ..., -2.3968, -2.5642, -2.0327]], [[ -0.8996, -6.4692, -5.8996, ..., -4.5531, -2.8340, -2.8454]], [[ -2.3432, -8.6054, -10.1086, ..., -2.8850, -3.7851, -3.4095]]], [[[ 4.5358, -0.4085, -0.8247, ..., -2.6727, -3.0802, -0.4772]], [[ -2.4566, -7.6304, -7.6804, ..., -3.9478, -6.0798, -4.0116]], [[ -4.6106, -11.3497, -12.6298, ..., -4.8027, -5.2158, -5.5259]], ..., [[ -1.4832, -8.1335, -7.5308, ..., -3.7215, -1.3840, -0.9789]], [[ -0.9894, -6.4090, -6.0993, ..., -3.7246, -4.1213, -2.6318]], [[ -2.1926, -8.6330, -10.1737, ..., -3.0789, -2.5073, -2.4687]]], [[[ 4.0656, -0.8018, -0.6314, ..., -2.4676, -1.2307, 1.6160]], [[ -2.7407, -8.2114, -8.3305, ..., -3.4979, -4.0849, -4.7317]], [[ -4.1544, -11.1469, -11.9817, ..., -4.3108, -3.9556, -5.3383]], ..., [[ -1.3569, -6.7173, -7.8580, ..., -2.3563, -3.7652, -3.1367]], [[ -0.9429, -5.6796, -5.8624, ..., -3.4194, -3.2203, -2.7467]], [[ -2.4184, -8.2265, -9.6465, ..., -2.2448, -4.1470, -3.9760]]], [[[ 4.6826, 1.0932, -1.9131, ..., -3.0773, -1.2584, 2.5620]], [[ -1.9902, -5.8416, -7.2196, ..., -5.8665, -3.0051, -3.2261]], [[ -3.6015, -7.5467, -9.1334, ..., -5.7709, -4.1164, -3.9236]], ..., [[ -1.2418, -3.6425, -6.5651, ..., -7.6576, -2.8570, -4.2722]], [[ -0.8017, -5.2892, -5.4524, ..., -3.6352, -3.1388, -2.7254]], [[ -1.7010, -6.6624, -7.6711, ..., -4.7677, -3.1353, -1.7850]]], [[[ 4.8320, -0.8612, -1.3990, ..., -2.3566, -0.9236, -0.3119]], [[ -2.5545, -9.2905, -9.1256, ..., -3.7093, -4.7026, -4.5474]], [[ -5.1164, -13.9172, -14.9154, ..., -5.3862, -4.3462, -6.3117]], ..., [[ -1.7334, -8.8566, -8.9786, ..., -3.4081, -0.7604, -2.3389]], [[ -1.0746, -7.4340, -7.0901, ..., -3.8418, -3.6902, -2.4514]], [[ -2.7014, -9.5422, -11.5335, ..., -5.5635, -3.7208, -4.1923]]]]) attn_weights tensor([[[[-1.9583e+00, -1.2161e+01, -1.2345e+01, ..., -6.0078e+00, -5.3528e+00, -4.9706e+00]], [[-2.5985e+00, -8.2354e+00, -8.3747e+00, ..., -1.4280e+00, -1.9986e+00, -3.1629e+00]], [[ 1.6214e-01, -2.3718e+00, -3.2248e+00, ..., -1.7204e+00, -2.7581e+00, -2.9525e+00]], ..., [[-1.0183e+00, -5.3039e+00, -6.5506e+00, ..., -2.6040e+00, -3.0984e+00, -3.0545e+00]], [[ 1.5591e+00, -2.4213e+00, -2.9648e+00, ..., -2.1517e+00, -3.3684e+00, -2.3051e+00]], [[-6.0282e+00, -2.8351e+01, -1.1745e+01, ..., -6.6345e+00, 1.7018e+01, 5.7610e+00]]], [[[-1.1966e+00, -1.0591e+01, -9.9358e+00, ..., -3.6275e+00, -5.6627e+00, -5.1292e+00]], [[-2.0193e+00, -8.7843e+00, -8.9381e+00, ..., -2.9374e+00, -2.2004e+00, -2.9382e+00]], [[ 3.1681e-02, -1.6588e+00, -1.8185e+00, ..., -2.6434e+00, -3.4548e+00, -3.3164e+00]], ..., [[-1.6024e-01, -5.8038e+00, -7.9185e+00, ..., -3.5026e+00, -3.6306e+00, -3.8131e+00]], [[ 1.3834e+00, -2.3152e+00, -2.3882e+00, ..., -2.0139e+00, -4.3548e+00, -2.2337e+00]], [[-7.9970e+00, -2.5904e+01, -2.8685e+01, ..., -3.1324e+00, 4.7222e+00, -2.0337e+00]]], [[[-2.1221e+00, -1.1475e+01, -1.1134e+01, ..., -5.4006e+00, -5.4709e+00, -5.2406e+00]], [[-2.7123e+00, -7.6805e+00, -8.7787e+00, ..., -5.2537e-01, -2.6872e+00, -2.7658e+00]], [[-1.7021e-01, -1.6841e+00, -2.7902e+00, ..., -2.7207e+00, -3.4139e+00, -3.5818e+00]], ..., [[-1.0453e+00, -5.0893e+00, -6.4040e+00, ..., -3.1129e+00, -3.1749e+00, -3.8723e+00]], [[ 1.2260e+00, -1.7788e+00, -2.5306e+00, ..., -2.3011e+00, -2.5914e+00, -2.7924e+00]], [[-3.5173e+00, -2.9729e+01, -1.3214e+01, ..., -1.8736e+00, 1.5094e+01, 3.3576e+00]]], [[[-2.5922e+00, -7.5534e+00, -7.7821e+00, ..., -5.2656e+00, -4.1763e+00, -2.4162e+00]], [[-1.1366e+00, -7.6416e+00, -9.4493e+00, ..., -6.2434e+00, -3.3567e+00, -4.5107e+00]], [[ 4.2835e-01, -1.1829e+00, -2.4468e+00, ..., -4.2245e+00, -7.7139e-01, -1.2864e+00]], ..., [[-8.6051e-01, -3.8141e+00, -4.6453e+00, ..., -4.4522e+00, -2.4185e+00, -4.1802e+00]], [[ 1.3580e+00, -1.2150e+00, -2.0906e+00, ..., -3.4665e+00, -1.9847e+00, -1.0923e+00]], [[-8.1484e+00, -1.3754e+01, -2.0086e+01, ..., -4.2500e+00, 9.6220e+00, -9.8289e-01]]], [[[-1.3446e+00, -1.1162e+01, -1.0700e+01, ..., -4.3516e+00, -3.1618e+00, -4.5211e+00]], [[-2.3248e+00, -7.8691e+00, -8.0054e+00, ..., -2.0706e+00, -2.1995e+00, -3.0628e+00]], [[ 3.9728e-01, -3.5631e+00, -4.3844e+00, ..., -2.4206e+00, -2.0765e+00, -2.3300e+00]], ..., [[-7.9938e-01, -6.3177e+00, -6.8778e+00, ..., -2.9720e+00, -1.8015e+00, -2.2784e+00]], [[ 1.5994e+00, -3.0881e+00, -1.9227e+00, ..., -1.0625e+00, -1.6949e+00, -1.3691e+00]], [[-6.9577e+00, -3.3799e+01, -3.0882e+01, ..., -2.9133e+00, 1.1722e+01, 5.6044e+00]]]]) attn_weights tensor([[[[ 2.1687, -4.8674, -3.8788, ..., -3.4370, -2.6725, -3.0111]], [[ 4.6469, -10.8132, -8.2032, ..., -9.5673, -7.2278, -2.8567]], [[ 0.6188, -4.6259, -4.8334, ..., -1.0375, -1.4866, -3.1000]], ..., [[ 0.8817, -3.3890, -3.7918, ..., -3.0638, -3.0931, -4.4574]], [[ 2.0340, -0.8134, -0.6635, ..., -2.4996, -0.4459, -0.7466]], [[ 1.2102, -3.6412, -3.0231, ..., -3.5602, -2.6110, -1.4454]]], [[[ 1.9394, -5.9804, -6.0392, ..., -4.9412, -4.6508, -2.7048]], [[ 4.3414, -10.9543, -9.6423, ..., -6.0111, -8.0756, -0.4131]], [[ 1.0314, -3.6024, -5.4786, ..., -1.6949, -2.2850, -3.3011]], ..., [[ 1.1604, -3.6433, -3.1255, ..., -3.5501, -4.8148, -3.9837]], [[ 2.2895, -1.9523, -0.7066, ..., -1.9246, -3.1878, -1.2997]], [[ 1.3541, -4.5893, -4.2659, ..., -1.8852, -0.8120, 0.5251]]], [[[ 2.1333, -5.1113, -5.2815, ..., -1.9349, -2.8718, -3.7498]], [[ 4.6556, -9.5992, -8.0277, ..., -6.8994, -4.5748, -3.4485]], [[ 0.3770, -4.9704, -4.9335, ..., -3.7859, -2.7543, -4.4010]], ..., [[ 0.7410, -3.0943, -3.6606, ..., -2.9586, -3.6501, -4.0091]], [[ 1.5280, -0.8299, -0.4645, ..., -1.3137, -0.2713, -0.9991]], [[ 1.0133, -4.4184, -4.0492, ..., -0.5573, -2.0573, -0.3428]]], [[[ 2.9423, -2.9753, -3.9490, ..., -6.2279, -2.9071, -2.2133]], [[ 4.0395, -4.6505, -5.3698, ..., -7.9271, -4.5280, -1.8074]], [[ 0.7254, -3.1635, -4.2622, ..., -4.8876, -2.7762, -4.8819]], ..., [[ 1.3085, -2.8976, -3.3659, ..., -3.9434, -2.1354, -2.7879]], [[ 2.6908, -0.9194, -1.7374, ..., -2.1181, -0.0935, -1.4498]], [[ 1.2334, -3.0963, -2.8474, ..., -3.2073, -1.6798, -1.3948]]], [[[ 2.5636, -7.2139, -6.0350, ..., -3.7961, -2.1588, -2.2463]], [[ 4.4936, -11.0536, -8.4668, ..., -5.0920, -3.2891, -2.3024]], [[ 0.8269, -4.6493, -5.5390, ..., -2.5457, -1.5604, -3.7379]], ..., [[ 1.2789, -3.6067, -3.7615, ..., -3.9971, -3.5317, -4.1127]], [[ 2.4546, -2.0256, -1.9004, ..., -1.5186, -0.0797, -1.2470]], [[ 1.2569, -4.4336, -4.3716, ..., -3.0716, -1.8194, -0.0512]]]]) attn_weights tensor([[[[-0.5268, -5.9765, -4.3239, ..., -3.3602, -1.1887, -2.3842]], [[ 0.6332, -5.1979, -6.7249, ..., -3.1213, -3.8742, -3.5857]], [[ 0.3754, -3.6814, -3.1530, ..., -2.3530, -2.5638, -3.2482]], ..., [[ 4.5446, -7.6130, -6.4724, ..., -4.1056, -5.0266, -1.5886]], [[ 2.9352, -3.1139, -2.9823, ..., -1.9598, -1.9004, -1.0823]], [[-0.2997, -3.8086, -6.2168, ..., -0.3181, -1.9124, -1.4299]]], [[[-0.4467, -4.0680, -5.2795, ..., -2.7556, -2.7275, -3.4510]], [[ 0.9735, -4.3501, -6.6775, ..., -4.6649, -6.3700, -4.9639]], [[ 0.4203, -2.9857, -3.0681, ..., -2.7666, -3.5662, -3.1711]], ..., [[ 4.4231, -7.1622, -6.0835, ..., -3.7498, -6.0589, -0.5949]], [[ 2.6078, -2.2684, -2.6789, ..., -2.4269, -1.9542, -1.1580]], [[ 0.2365, -4.7950, -6.2961, ..., -1.8868, -1.7322, -1.9473]]], [[[-1.1715, -5.3088, -4.7353, ..., -3.3616, -1.6060, -3.1114]], [[-0.3027, -5.3738, -6.0582, ..., -3.6683, -4.0992, -4.6478]], [[ 0.1473, -2.9539, -3.0441, ..., -2.4992, -3.1292, -3.6015]], ..., [[ 4.2580, -6.5602, -5.7557, ..., -3.5416, -4.2414, -2.9411]], [[ 2.5042, -3.3800, -2.9379, ..., -1.2846, -1.3493, -1.7626]], [[-0.3782, -4.0703, -7.2026, ..., -0.8250, -3.1905, -3.6220]]], [[[ 0.4521, -4.7540, -5.2275, ..., -5.5735, -4.8508, -4.7432]], [[ 1.1278, -3.7092, -5.7126, ..., -5.6770, -3.8115, -4.0428]], [[ 0.5333, -2.8323, -3.1397, ..., -4.5400, -1.9874, -3.0935]], ..., [[ 4.4472, -2.6781, -1.7369, ..., -5.1798, -3.5471, -2.4896]], [[ 2.7032, -3.5815, -2.4250, ..., -5.5718, -3.4116, -2.5382]], [[ 0.6635, -4.4645, -7.4372, ..., -5.8395, -3.7889, -3.6412]]], [[[-0.8461, -4.9906, -4.0262, ..., -0.6777, -0.3524, -1.6283]], [[ 0.8947, -6.4900, -7.9913, ..., -5.0278, -3.2123, -3.7605]], [[ 0.5154, -3.7596, -4.4498, ..., -2.7667, -2.9009, -2.3668]], ..., [[ 4.1271, -6.7604, -4.6991, ..., -2.9533, -1.4485, -1.4762]], [[ 2.9922, -4.7821, -4.0194, ..., -2.3163, -1.2095, -1.5995]], [[-0.2834, -5.0642, -6.2781, ..., -2.3755, -1.2849, -2.0668]]]]) attn_weights tensor([[[[-0.6155, -7.0434, -5.9665, ..., -1.9898, -0.6151, -4.0029]], [[ 3.5444, -0.9501, -2.1966, ..., 0.7432, -1.3002, -1.7837]], [[ 6.2205, -5.2532, -4.4476, ..., -2.5054, -2.5124, -0.2335]], ..., [[ 0.5174, -2.9059, -3.2823, ..., -0.2922, -0.6667, -2.1679]], [[ 4.4588, -4.4590, -2.0635, ..., -0.6659, -0.6455, 0.0157]], [[ 3.5474, -4.8980, -4.4502, ..., -3.7659, -3.0619, -1.3686]]], [[[-0.5600, -6.8015, -7.3521, ..., -4.0539, -2.8717, -4.5915]], [[ 2.6659, -2.9440, -2.6999, ..., -1.8113, -3.4240, -2.2710]], [[ 5.7115, -3.8102, -5.2235, ..., -1.9980, -2.2807, -0.4234]], ..., [[ 0.4615, -3.2567, -3.4640, ..., 0.2591, -2.8932, -2.6572]], [[ 4.2347, -5.3426, -4.8805, ..., -0.9743, -3.7916, -1.1375]], [[ 2.9535, -3.6387, -4.9091, ..., -4.4599, -3.1134, -2.6097]]], [[[-0.5743, -6.9969, -6.7047, ..., -2.6795, -2.3327, -4.1008]], [[ 2.3415, -1.1764, -0.7132, ..., -0.3532, 0.0187, -2.2263]], [[ 6.1291, -3.6515, -3.8556, ..., -3.5309, -1.7341, -0.9165]], ..., [[-0.0514, -2.1014, -2.5115, ..., 0.0219, -0.4313, -1.9093]], [[ 4.0221, -2.1043, -2.2003, ..., -1.0705, -1.3496, -2.2537]], [[ 3.1337, -3.6025, -3.4769, ..., -3.7519, -3.1383, -1.9365]]], [[[ 0.1424, -7.2824, -7.8550, ..., -3.8116, -1.9730, -3.4303]], [[ 4.4966, -2.3353, -0.4352, ..., -1.8620, -0.5651, -0.8701]], [[ 6.2599, -2.5467, -2.8287, ..., -4.6432, -3.1797, -1.9502]], ..., [[ 1.9242, -6.6687, -6.0882, ..., -6.2592, -3.5830, -1.4624]], [[ 5.7615, -3.6831, -2.7624, ..., -5.6585, -4.0557, -2.9369]], [[ 3.2279, 0.1448, -2.4503, ..., -7.2888, -2.2052, -1.9240]]], [[[-0.6248, -8.1835, -8.1096, ..., -3.6304, -2.4547, -4.5152]], [[ 2.6876, -2.8159, -3.3631, ..., -1.5137, 0.6680, 0.1324]], [[ 6.5729, -5.0252, -4.8813, ..., -2.4345, -0.0351, 0.7125]], ..., [[ 0.4877, -4.4654, -4.6825, ..., -1.0481, -0.8771, -1.9286]], [[ 4.1708, -4.2222, -3.1344, ..., -1.1784, 1.2115, 0.5078]], [[ 3.0905, -4.6800, -4.6127, ..., -1.9366, -1.0050, -1.1802]]]]) attn_weights tensor([[[[ 1.3301, -2.1481, -1.8927, ..., -1.4486, -0.8153, -0.6885]], [[ 4.3737, -2.2585, -3.6594, ..., -0.6446, -2.4307, 0.9275]], [[ 1.8822, -0.3770, -1.4993, ..., 0.0301, -1.1586, -0.8312]], ..., [[ 1.0461, -1.8321, -1.7805, ..., -1.0936, -0.7872, -2.1589]], [[ 1.4938, -2.6466, -2.8984, ..., -1.1385, -1.7097, -1.2160]], [[ 1.3896, -3.0360, -4.3377, ..., -2.5559, -3.7815, -4.0795]]], [[[ 1.1750, -3.2648, -2.5671, ..., -1.8155, -1.2009, -0.1673]], [[ 4.8883, -2.0977, -3.4399, ..., -0.7291, -2.0575, 0.5817]], [[ 1.6880, -1.2251, -2.1464, ..., -0.6538, -0.1016, -0.3471]], ..., [[ 0.6611, -3.9088, -3.8083, ..., -2.9499, -3.2790, -2.5463]], [[ 1.2593, -4.3287, -3.7686, ..., -2.2503, -3.0790, -0.9853]], [[ 0.5849, -4.5846, -4.4693, ..., -4.0732, -4.8298, -4.8596]]], [[[ 1.0698, -2.9361, -2.1636, ..., -2.9682, -1.9476, -2.0136]], [[ 4.1689, -2.0722, -3.5174, ..., -1.6674, -2.8054, -3.1496]], [[ 1.7982, -1.3128, -2.3866, ..., -2.1259, -2.4154, -2.2331]], ..., [[ 0.6401, -3.0215, -2.8494, ..., -2.0596, -1.5040, -2.0310]], [[ 1.1040, -3.4359, -3.1732, ..., -1.1949, -1.6263, -1.2623]], [[ 1.1256, -3.0627, -3.8034, ..., -3.5276, -3.9957, -3.4572]]], [[[ 1.5752, -3.2235, -2.7014, ..., -5.7372, -2.6182, -1.8755]], [[ 4.9454, -2.7045, -3.9372, ..., -4.8595, -4.3424, -2.9467]], [[ 1.7644, -1.7416, -1.9846, ..., -3.9160, -0.7964, -1.2711]], ..., [[ 1.3263, -2.2949, -2.0286, ..., -4.1947, -0.9425, -1.2268]], [[ 1.1839, -1.8619, -2.8299, ..., -3.4457, -2.3688, -1.4774]], [[ 1.6710, -1.9489, -3.0822, ..., -6.3350, -3.1763, -2.6658]]], [[[ 1.0483, -3.7391, -3.2010, ..., -1.7165, -1.7957, -0.8586]], [[ 4.6990, -3.1342, -4.0582, ..., -1.9264, 0.9434, 0.7870]], [[ 1.6258, -2.0303, -3.3657, ..., -1.7742, -0.2781, -0.5712]], ..., [[ 1.1887, -4.3382, -4.5271, ..., -3.6530, -2.2202, -2.2056]], [[ 1.1509, -4.5354, -4.2650, ..., -1.7336, -1.3480, -0.6856]], [[ 0.7961, -4.1721, -4.0781, ..., -3.8070, -3.8281, -4.3299]]]]) attn_weights tensor([[[[ 2.4637, -0.9798, -1.4440, ..., -0.8554, -0.9891, -2.3538]], [[ 4.5949, -0.1340, -2.1811, ..., -0.5232, -2.2119, -1.4884]], [[ 2.3385, -1.6712, -1.6046, ..., -0.8074, -0.8227, -3.7204]], ..., [[ 4.4047, -1.5133, -3.1801, ..., -2.3013, -2.6648, -1.4153]], [[ 1.7615, -3.4602, -1.9425, ..., 0.4901, 1.4723, -0.5933]], [[ 3.6308, -2.8766, -3.1729, ..., -2.6895, -3.9220, -0.6126]]], [[[ 1.2366, -3.5759, -2.3556, ..., -4.0754, -3.9019, -2.9486]], [[ 3.7944, -1.5845, -4.0890, ..., -1.8973, -1.4320, -0.8494]], [[ 0.9883, -3.3971, -3.9355, ..., -2.9350, -3.3215, -2.5191]], ..., [[ 3.3592, -3.3184, -3.8043, ..., -2.5560, -2.6497, -1.7484]], [[ 1.9326, -4.8929, -5.4089, ..., -2.2925, -2.0998, -2.1428]], [[ 3.2975, -1.0487, -2.5583, ..., -3.0554, -2.3060, -2.4166]]], [[[ 1.7642, -1.5447, -1.3629, ..., -2.7845, -1.4009, -2.2366]], [[ 3.6624, -0.9757, -1.9756, ..., -2.0469, -2.8607, -1.6329]], [[ 1.3863, -0.7569, -1.3606, ..., -0.5734, -1.0099, -2.2592]], ..., [[ 4.5396, -1.8237, -2.1624, ..., -2.2184, -2.7829, -1.3794]], [[ 0.7042, -4.0114, -2.8077, ..., 0.6976, 0.5395, -1.3257]], [[ 3.5065, -0.9114, -2.6079, ..., -2.1787, -2.4648, -1.0760]]], [[[ 2.8217, -2.2782, -2.6258, ..., -5.2903, -1.9681, -2.8559]], [[ 3.0597, -1.9342, -3.8514, ..., -5.0735, -2.2348, -1.0482]], [[ 3.1627, -5.0140, -3.0322, ..., -2.9046, -1.7834, -2.4093]], ..., [[ 3.8526, -3.0348, -2.4762, ..., -3.0422, -3.0105, -3.3512]], [[ 1.4399, -5.0027, -4.9470, ..., -4.8326, -2.1670, -3.0214]], [[ 3.7607, 1.5131, -2.1093, ..., -3.9855, -0.0536, -1.6477]]], [[[ 1.8379, -4.1141, -3.5483, ..., -1.8072, -1.5282, -1.6896]], [[ 3.6624, -2.1625, -3.6286, ..., -2.7505, 0.2679, 0.2544]], [[ 1.7344, -3.6933, -3.4145, ..., -2.4668, -0.5127, -0.9531]], ..., [[ 4.6274, -1.8847, -2.3331, ..., -2.1741, 1.5028, 0.1284]], [[ 1.5616, -4.7561, -4.2238, ..., -1.7951, -0.5617, -1.0649]], [[ 4.0416, -1.5537, -3.2007, ..., -1.7242, -2.2495, -1.2180]]]]) attn_weights tensor([[[[ 3.7006, -2.8642, -3.3617, ..., -3.7505, -3.6768, -3.8024]], [[ 4.6034, -1.4295, -1.0487, ..., -2.0423, -1.2195, 1.0657]], [[ 3.7495, -0.2719, -1.3269, ..., -1.3448, -2.0554, -0.9990]], ..., [[ 2.2050, -4.9610, -4.5881, ..., -3.4929, -2.1381, -1.4094]], [[ 3.8611, -0.7316, -1.6333, ..., -1.0128, -1.9499, -0.7400]], [[ 5.5718, -0.4056, 1.0346, ..., -0.9072, 0.8405, 0.2556]]], [[[ 2.2546, -3.9734, -4.3340, ..., -3.0559, -3.3077, -3.3055]], [[ 3.4202, -2.4719, -3.1003, ..., -1.9929, -3.2036, -1.4674]], [[ 2.9538, -2.0268, -2.2025, ..., -2.1073, -3.8629, -2.2056]], ..., [[ 1.0599, -3.8091, -5.0711, ..., -2.9548, -3.9601, -2.4202]], [[ 3.1620, -2.5666, -2.5157, ..., -1.9893, -3.4430, -2.1491]], [[ 4.1366, -1.2856, -0.5223, ..., -2.8002, -1.3840, 0.6511]]], [[[ 2.7842, -2.7975, -3.4465, ..., -3.4362, -3.7712, -3.0703]], [[ 4.1925, -0.9078, -2.1427, ..., -2.4052, -2.9639, -1.3590]], [[ 3.1314, -0.2177, -1.3857, ..., -1.3789, -1.1067, -0.2927]], ..., [[ 1.5934, -4.3507, -3.9031, ..., -2.9856, -2.5842, -1.6879]], [[ 3.4905, -1.8025, -1.8327, ..., -2.4638, -2.1301, -1.0911]], [[ 4.2096, 0.1813, 1.8065, ..., -0.0897, 1.9755, 0.3584]]], [[[ 2.6983, -3.1603, -3.4991, ..., -3.7789, -2.8552, -2.6268]], [[ 4.1392, -2.3198, -2.5615, ..., -2.9149, -1.8458, -1.4387]], [[ 3.9556, -0.6370, -1.4288, ..., -4.4499, -1.4204, 0.6237]], ..., [[ 1.0755, -4.4967, -4.5840, ..., -3.9023, -1.7637, -1.4278]], [[ 3.1101, -1.7068, -1.8327, ..., -3.3938, -2.1301, -1.7046]], [[ 3.6893, -0.6477, -1.9309, ..., -2.2391, -0.7410, -0.9148]]], [[[ 3.1099, -4.0574, -3.9710, ..., -2.7065, -1.6065, -1.7837]], [[ 4.0184, -2.9248, -3.0587, ..., -1.8337, 0.3522, -0.0131]], [[ 3.3879, -3.1468, -2.9215, ..., -1.6711, 0.8688, -0.1462]], ..., [[ 1.0981, -5.4230, -4.8414, ..., -2.1486, -1.8702, -1.7340]], [[ 3.7118, -2.0240, -2.4976, ..., -1.4339, -0.3180, -0.4834]], [[ 4.8638, -1.1712, -0.1746, ..., 2.0634, 3.0173, 1.6708]]]]) attn_weights tensor([[[[ 1.8591, 0.3562, 0.4823, ..., 0.7479, 0.7116, 0.6197]], [[ 4.5414, 0.0368, -0.4591, ..., -0.6512, -0.6633, 0.0592]], [[ 4.1051, -0.7008, -1.0769, ..., -2.4545, -1.7294, -2.4344]], ..., [[ 5.3519, 0.8042, -0.0765, ..., 0.1890, -0.3953, 0.5831]], [[ 4.4572, 1.7064, 2.7107, ..., 0.6061, 2.3121, 2.2939]], [[ 4.4150, 1.5029, 2.6437, ..., 0.9647, 2.6718, 2.3022]]], [[[ 1.3991, -0.3162, -0.1026, ..., 0.2350, -0.8194, 0.3101]], [[ 3.7390, -1.4672, -1.3216, ..., -1.2388, -1.1441, -1.3703]], [[ 3.2367, -1.4967, -2.2576, ..., -2.1477, -2.6948, -2.6838]], ..., [[ 3.9851, -0.8576, -2.0426, ..., -0.9391, -0.4037, -0.1540]], [[ 2.9657, -0.5023, 0.3724, ..., 0.2322, -0.1994, 1.5667]], [[ 2.9070, -1.1166, 0.3920, ..., -1.5599, -0.9034, 0.9247]]], [[[ 1.2708, 1.1472, 1.1379, ..., 1.2549, 1.4759, 0.7618]], [[ 4.1261, -0.0415, -0.4143, ..., -0.6655, -0.2925, 0.0647]], [[ 3.3860, -0.7124, -1.3832, ..., -1.8625, -1.8119, -1.5123]], ..., [[ 4.8226, -0.2518, -0.2329, ..., -0.2587, -0.7181, -0.0176]], [[ 3.1690, -0.0056, 1.6974, ..., 0.4860, 1.8519, 0.6798]], [[ 3.6948, -0.5841, 1.1086, ..., 0.3016, 2.1045, 1.4803]]], [[[ 2.2387, 0.5759, -0.3385, ..., -2.5255, 1.1165, 1.6726]], [[ 3.6030, 0.1265, -1.1445, ..., -1.2117, -0.3383, -0.5891]], [[ 3.5252, -0.5673, -1.0730, ..., -2.5728, -0.8083, -0.7268]], ..., [[ 4.2276, -0.5329, -1.9581, ..., -2.2068, -0.7547, -1.3156]], [[ 4.0823, 2.1854, 0.5800, ..., -0.3988, 2.2074, 1.3796]], [[ 1.3469, 1.5706, -1.2857, ..., -1.4937, 2.6855, -0.8348]]], [[[ 1.8347, -0.5635, -1.4303, ..., -0.5948, 0.7615, 0.6718]], [[ 4.1390, -1.0433, -1.1296, ..., -0.6362, 1.0048, 0.0190]], [[ 3.5041, -1.8016, -1.6682, ..., -0.4375, 0.0120, -0.1637]], ..., [[ 4.3961, -0.6695, -1.6811, ..., -0.2046, 1.7272, 1.4271]], [[ 3.2302, -0.3313, 0.4370, ..., 0.9867, 2.5401, 1.8297]], [[ 3.3189, -1.3654, 0.0214, ..., 1.1203, 1.8891, 0.9778]]]]) attn_weights tensor([[[[-1.0424, -2.4574, -1.1821, ..., -0.5179, -1.8811, -1.8502]], [[ 0.4402, 0.0173, 0.4680, ..., -0.0525, 0.3927, 7.6543]], [[-1.4808, -2.4733, -2.2729, ..., -2.1858, -1.6772, -2.1097]], ..., [[-2.1649, -2.6982, -2.7397, ..., -2.3667, -2.6774, -2.3376]], [[-0.6056, -1.2234, -1.0287, ..., -0.5855, -0.7333, 0.5973]], [[-1.1383, -2.2635, -3.4091, ..., -4.0291, -2.5978, -2.0668]]], [[[-1.1190, -3.1450, -2.1416, ..., -2.2693, -2.9092, -2.9009]], [[-0.3226, 0.5981, 0.7414, ..., -1.3024, 0.9299, 6.7818]], [[-1.7201, -2.8997, -2.8228, ..., -2.3115, -1.1637, -2.8783]], ..., [[-2.0999, -2.5240, -2.5591, ..., -2.6681, -1.9496, -2.4866]], [[-0.2176, -0.6767, -0.7030, ..., -1.0053, -0.0162, 0.9752]], [[-1.3497, -2.2124, -3.3151, ..., -2.7697, -2.6532, -2.9011]]], [[[-0.6202, -2.5873, -1.4297, ..., -0.8078, -0.7168, -0.7695]], [[ 0.1012, 0.8892, 2.6956, ..., 2.2028, 3.2316, 11.2091]], [[-1.2144, -2.2041, -1.8905, ..., -1.8687, -1.4266, -2.4958]], ..., [[-2.1684, -2.7805, -2.7373, ..., -2.4175, -2.6764, -3.0120]], [[-0.1454, -0.6796, -0.4589, ..., -0.1982, -0.3781, 1.0034]], [[-1.1889, -2.0028, -3.0520, ..., -3.5830, -2.2633, -2.5151]]], [[[-1.0393, -4.2096, -1.9829, ..., -1.6243, -3.6851, -3.7108]], [[-1.3665, 0.1435, -1.8918, ..., -0.3808, 4.5109, 4.5543]], [[-1.5887, -2.8179, -1.6733, ..., -1.2218, -3.3900, -3.3505]], ..., [[-1.4569, -1.8533, -1.7329, ..., -1.4390, -1.1820, -1.1459]], [[-0.2838, -0.7909, -0.7235, ..., -0.2005, 0.0638, 0.0841]], [[-1.0295, -2.2149, -3.1658, ..., -2.4020, -2.0887, -2.0723]]], [[[-0.6028, -2.8403, -1.9643, ..., -1.9274, -2.5235, -1.8968]], [[ 0.8027, 1.6774, 1.6809, ..., 2.7294, 1.8931, 9.9194]], [[-1.8592, -2.9840, -2.5016, ..., -1.8996, -1.7311, -2.4630]], ..., [[-2.3954, -2.9126, -2.8624, ..., -2.6531, -2.3126, -2.7982]], [[-0.5155, -0.9996, -0.9273, ..., -0.6424, -0.1486, 0.9036]], [[-1.1241, -2.0401, -3.3750, ..., -1.9647, -2.3889, -2.2068]]]]) attn_weights tensor([[[[-3.2585e+00, -5.5098e+00, -3.5008e+00, ..., 2.2305e+00, 4.0986e+00, -4.7523e-01]], [[-1.5380e+00, -2.6835e+00, -3.0589e+00, ..., 1.6961e+00, 1.5915e+00, 5.0127e-01]], [[-4.0906e+00, -4.4681e+00, -4.5187e+00, ..., -2.8039e+00, -3.1321e+00, -2.5727e+00]], ..., [[ 1.3048e+00, -8.6782e-01, 3.2538e-02, ..., 3.8681e-03, -6.3344e-01, -1.3257e-01]], [[-3.8972e+00, -2.7946e+00, -2.6904e+00, ..., -8.3171e-01, -1.0650e+00, -4.5280e-01]], [[ 9.0990e-01, 1.0337e+00, -2.7904e+00, ..., -2.4094e+00, -1.4566e+00, 4.1082e+00]]], [[[-2.1728e+00, -4.8429e+00, -4.2099e+00, ..., 2.0523e-01, 1.9034e+00, -1.0036e+00]], [[-1.2657e+00, -2.7974e+00, -3.0254e+00, ..., 8.5892e-01, 1.2416e+00, 5.1048e-01]], [[-4.0769e+00, -4.4281e+00, -4.5239e+00, ..., -2.7084e+00, -2.5624e+00, -2.5518e+00]], ..., [[ 1.2222e+00, -7.2046e-01, 2.9706e-01, ..., -5.7280e-01, -6.3288e-01, 6.0317e-03]], [[-4.0911e+00, -2.8030e+00, -2.6673e+00, ..., -6.1673e-01, -7.9870e-01, -6.4561e-01]], [[-3.5908e-01, -7.2302e-01, -4.2176e+00, ..., -3.6092e+00, -5.8379e-01, 3.1137e+00]]], [[[-1.5307e+00, -3.8424e+00, -3.2313e+00, ..., 1.2655e+00, 2.4115e+00, 1.1272e+00]], [[-1.2425e+00, -2.6371e+00, -3.3447e+00, ..., 9.7803e-01, 1.2513e+00, 7.6441e-01]], [[-3.8742e+00, -4.2379e+00, -4.3234e+00, ..., -2.7475e+00, -2.9494e+00, -3.2099e+00]], ..., [[ 1.1889e+00, -7.4442e-01, -4.8357e-02, ..., -5.0306e-02, -3.5293e-01, -1.0815e+00]], [[-4.0843e+00, -2.7159e+00, -2.6862e+00, ..., -9.0998e-01, -9.7342e-01, -9.7562e-01]], [[ 1.1796e+00, 1.0548e+00, -1.5480e+00, ..., -2.1230e+00, -1.6863e+00, 5.1685e+00]]], [[[-1.8751e-01, -2.2138e+00, -2.4748e+00, ..., 6.2333e-01, 6.6685e-01, 7.0504e-01]], [[-2.9660e-01, -1.8854e+00, -2.5251e+00, ..., 1.4934e+00, 1.3473e+00, 1.4309e+00]], [[-3.6541e+00, -4.2762e+00, -4.1390e+00, ..., -2.3770e+00, -2.3355e+00, -2.1689e+00]], ..., [[ 1.5314e+00, -4.9302e-01, 5.4197e-02, ..., -2.6699e-01, -4.0213e-01, -5.6050e-01]], [[-4.1736e+00, -2.4345e+00, -2.3068e+00, ..., -2.5790e-01, -5.6867e-01, -4.4950e-01]], [[ 6.5980e-01, -3.4729e-01, -1.7472e+00, ..., 2.1614e-01, 1.2764e+00, 1.1161e+00]]], [[[-1.8719e+00, -4.0711e+00, -3.0802e+00, ..., 1.3044e+00, 1.8890e+00, 2.8372e-01]], [[-9.8809e-01, -2.7130e+00, -3.0184e+00, ..., 8.5748e-01, 1.0893e+00, 4.9029e-01]], [[-4.0339e+00, -4.3924e+00, -4.5213e+00, ..., -2.9930e+00, -2.7285e+00, -2.6619e+00]], ..., [[ 1.2734e+00, -5.5202e-01, 4.4924e-01, ..., -4.7604e-01, -5.7324e-01, -5.7203e-01]], [[-4.3486e+00, -2.6958e+00, -2.6235e+00, ..., -7.5458e-01, -8.3830e-01, -4.7471e-01]], [[ 1.9899e+00, 1.3435e+00, -2.4400e+00, ..., 3.7223e-01, 6.7352e-01, 5.4744e+00]]]]) attn_weights tensor([[[[-1.7782e+00, -6.0720e+00, -5.2151e+00, ..., -6.0985e-01, 3.3428e-01, -1.6498e+00]], [[ 1.7468e+00, -8.3982e-03, -2.6504e+00, ..., -3.4057e+00, -1.6693e+00, -2.5086e+00]], [[-6.4432e+00, -1.8154e+01, -1.7539e+01, ..., -1.4264e+00, -1.6158e+00, -4.5076e+00]], ..., [[-4.3053e+00, -1.1347e+01, -1.1024e+01, ..., -1.8664e+00, -2.3390e+00, -2.6600e+00]], [[-2.3013e+00, -4.2051e+00, -4.1928e+00, ..., -1.4909e+00, -1.4131e+00, -6.6925e-01]], [[-5.3181e-01, -6.2008e+00, -6.2315e+00, ..., -2.9183e+00, -3.0225e+00, -2.3257e+00]]], [[[-2.0968e+00, -5.7833e+00, -6.2409e+00, ..., -1.7967e+00, -2.4650e-01, -4.3033e+00]], [[ 1.3955e+00, -1.5342e+00, -1.5924e+00, ..., -1.4759e+00, -1.3115e+00, -2.0190e+00]], [[-6.4246e+00, -1.8476e+01, -1.7889e+01, ..., -4.9332e+00, -1.3767e+00, -5.7038e+00]], ..., [[-4.7521e+00, -1.0486e+01, -9.9919e+00, ..., -2.1167e+00, -4.2664e+00, -3.7396e+00]], [[-2.0938e+00, -4.1745e+00, -4.0920e+00, ..., -7.6307e-01, -1.1388e+00, -6.7617e-01]], [[-4.9840e-01, -6.2847e+00, -6.0316e+00, ..., -2.6182e+00, -2.7509e+00, -2.3546e+00]]], [[[-1.4897e+00, -5.0026e+00, -4.7732e+00, ..., -1.2871e+00, -1.9906e+00, -6.0360e-01]], [[ 1.2090e+00, -8.2069e-01, -2.4023e+00, ..., -3.3053e+00, -2.6117e+00, -1.8088e+00]], [[-6.1650e+00, -1.6270e+01, -1.6388e+01, ..., -2.3229e+00, -2.0795e+00, -3.9162e+00]], ..., [[-3.6706e+00, -9.7922e+00, -1.0065e+01, ..., -2.3726e+00, -2.7497e+00, -2.4773e+00]], [[-2.3101e+00, -4.1565e+00, -4.1367e+00, ..., -1.7080e+00, -1.5476e+00, -1.2155e+00]], [[-5.2183e-01, -5.8266e+00, -5.6357e+00, ..., -2.7667e+00, -2.6591e+00, -2.5089e+00]]], [[[-8.2635e-01, -4.2027e+00, -3.1365e+00, ..., -2.2604e+00, -2.4926e+00, -2.2470e+00]], [[ 1.4676e+00, -1.0614e+00, -1.3681e+00, ..., -8.5674e-01, -1.6571e+00, -1.6820e+00]], [[-4.9626e+00, -1.5732e+01, -1.5994e+01, ..., -2.0342e+00, -3.5569e+00, -3.0606e+00]], ..., [[-3.1080e+00, -8.3436e+00, -8.8219e+00, ..., -1.1520e+00, -2.3479e+00, -2.2861e+00]], [[-5.5521e-01, -3.3042e+00, -2.6769e+00, ..., -6.1431e-01, -8.8392e-01, -5.9227e-01]], [[-2.0998e-01, -5.8435e+00, -5.2888e+00, ..., -2.6676e+00, -2.5137e+00, -2.2649e+00]]], [[[-1.7984e+00, -5.7923e+00, -5.6135e+00, ..., -1.5443e+00, -1.5862e-01, -3.6738e+00]], [[ 1.6599e+00, -9.9063e-01, -2.1613e+00, ..., -5.3306e-01, -5.9600e-01, -1.4760e+00]], [[-5.4887e+00, -1.6799e+01, -1.6956e+01, ..., -3.0537e+00, -1.0188e+00, -4.0911e+00]], ..., [[-3.7799e+00, -9.7094e+00, -9.8552e+00, ..., -2.0196e+00, -3.2508e+00, -2.8943e+00]], [[-2.1443e+00, -4.1423e+00, -4.1913e+00, ..., -8.6686e-01, -1.1907e+00, -5.1686e-01]], [[-3.8003e-01, -5.9721e+00, -5.8954e+00, ..., -2.6801e+00, -2.6009e+00, -2.2709e+00]]]]) attn_weights tensor([[[[ 4.3530, -1.5702, -2.9479, ..., -3.7483, -1.6809, 1.9894]], [[ -2.2182, -9.1421, -8.3662, ..., -3.1813, -4.8434, -5.8041]], [[ -4.3911, -13.3822, -14.1507, ..., -3.8816, -4.6215, -5.8881]], ..., [[ -1.3113, -7.5630, -8.5252, ..., -3.0207, -1.3357, -4.2994]], [[ -0.7794, -7.1102, -6.0008, ..., -2.9070, -3.2360, -2.5168]], [[ -2.1728, -8.5592, -10.6322, ..., -4.3595, -3.3293, -2.4969]]], [[[ 4.2933, -1.1532, -2.0936, ..., -4.7203, -1.8115, 1.7394]], [[ -2.7209, -8.5322, -7.9660, ..., -4.9542, -3.4332, -3.8123]], [[ -4.8796, -13.2037, -13.4151, ..., -5.6321, -4.3528, -6.6072]], ..., [[ -1.7689, -8.8506, -8.3530, ..., 1.1749, -0.6585, -3.3643]], [[ -1.1105, -6.8498, -6.7806, ..., -4.5846, -5.0612, -3.2023]], [[ -2.6934, -9.3115, -10.6267, ..., -1.8501, -1.9488, -4.2423]]], [[[ 4.5154, -1.0998, -1.9001, ..., -2.7426, -3.0804, 1.8180]], [[ -2.6966, -8.2685, -8.3084, ..., -4.0547, -4.8610, -4.5914]], [[ -4.0687, -12.9312, -13.7551, ..., -5.0608, -5.4410, -5.2685]], ..., [[ -0.9577, -7.4397, -6.9172, ..., -2.7944, -1.3586, -2.3003]], [[ -0.9949, -6.1590, -6.5281, ..., -3.9335, -3.5648, -2.7317]], [[ -2.1192, -9.1728, -10.6655, ..., -4.5370, -4.0473, -2.6356]]], [[[ 4.6286, 0.8573, -1.9457, ..., -1.2443, 2.2323, 2.3813]], [[ -2.0043, -6.3162, -7.6042, ..., -2.9195, -2.9564, -3.0608]], [[ -4.0254, -8.0915, -9.8591, ..., -4.2693, -3.6114, -3.9315]], ..., [[ -1.2942, -4.3034, -6.6722, ..., -2.9232, -5.0854, -4.3550]], [[ -0.8432, -5.6250, -5.5809, ..., -3.4709, -2.8335, -2.7446]], [[ -1.8866, -7.0060, -8.2871, ..., -3.2108, -1.5813, -2.1793]]], [[[ 4.6342, -0.7253, -2.7814, ..., -1.9131, -0.8072, 2.5045]], [[ -2.4498, -9.1158, -8.5083, ..., -3.6795, -4.0650, -3.7994]], [[ -4.6755, -14.2608, -14.8605, ..., -5.4676, -5.2995, -5.4630]], ..., [[ -1.9727, -8.8902, -7.7527, ..., -1.0672, -1.9265, -5.4172]], [[ -0.9068, -7.0253, -6.2390, ..., -3.8801, -4.1117, -2.6342]], [[ -2.5157, -9.0356, -9.6576, ..., -3.5333, -3.1321, -4.0371]]]]) attn_weights tensor([[[[-1.7042e+00, -1.3199e+01, -1.2351e+01, ..., -5.7754e+00, -3.3579e+00, -4.8440e+00]], [[-2.3696e+00, -8.7010e+00, -9.1842e+00, ..., -2.4344e+00, -3.4854e+00, -4.3125e+00]], [[-2.1494e-01, -3.2870e+00, -3.3121e+00, ..., -2.5041e+00, -2.5630e+00, -2.9576e+00]], ..., [[-1.1435e+00, -5.7326e+00, -6.4840e+00, ..., -2.7916e+00, -2.0101e+00, -1.5410e+00]], [[ 1.4725e+00, -2.8104e+00, -2.6156e+00, ..., -3.1123e+00, -3.1007e+00, -2.6111e+00]], [[-5.6520e+00, -3.6370e+01, -2.7130e+01, ..., 1.2822e+00, 1.3024e+01, 5.6187e+00]]], [[[-1.2260e+00, -1.1947e+01, -1.1248e+01, ..., -5.6177e+00, -4.0590e+00, -4.8302e+00]], [[-2.6131e+00, -9.2159e+00, -9.5038e+00, ..., 7.0759e-03, -8.0099e-01, -3.2405e+00]], [[ 4.4340e-02, -2.8214e+00, -2.7807e+00, ..., -3.7212e+00, -3.8089e+00, -4.2179e+00]], ..., [[-3.5299e-01, -7.7790e+00, -8.8007e+00, ..., -4.6313e+00, -3.8061e+00, -5.9177e+00]], [[ 1.5099e+00, -2.7903e+00, -2.7842e+00, ..., -4.0239e+00, -2.4832e+00, -3.8355e+00]], [[-5.8983e+00, -2.8232e+01, -3.2566e+01, ..., 3.7880e+00, 1.7144e+01, 5.6990e+00]]], [[[-2.2235e+00, -1.2988e+01, -1.1225e+01, ..., -5.4336e+00, -4.3312e+00, -6.1957e+00]], [[-2.6606e+00, -8.7753e+00, -9.1389e+00, ..., -2.9461e+00, -2.5261e+00, -2.4708e+00]], [[-8.6441e-03, -2.2849e+00, -3.2652e+00, ..., -3.6192e+00, -3.5850e+00, -3.7904e+00]], ..., [[-5.9594e-01, -6.8227e+00, -7.2116e+00, ..., -4.3005e+00, -3.7189e+00, -2.4385e+00]], [[ 1.6104e+00, -2.4104e+00, -3.3762e+00, ..., -3.8833e+00, -4.1406e+00, -3.7098e+00]], [[-6.4062e+00, -3.3712e+01, -2.7560e+01, ..., -3.9409e+00, 7.1251e+00, -2.8592e+00]]], [[[-2.5334e+00, -7.6111e+00, -8.7699e+00, ..., -4.1390e+00, -1.4534e+00, -4.5088e+00]], [[-1.2419e+00, -7.7792e+00, -9.9758e+00, ..., -3.8815e+00, -3.8765e+00, -3.9098e+00]], [[ 4.9719e-01, -1.5336e+00, -2.2707e+00, ..., -1.0728e+00, -1.7359e+00, -1.3302e+00]], ..., [[-7.9731e-01, -3.9488e+00, -4.9083e+00, ..., -2.7915e+00, -4.0243e+00, -4.5351e+00]], [[ 1.4946e+00, -1.5573e+00, -2.0036e+00, ..., -2.4754e+00, -1.5431e+00, -1.0293e+00]], [[-9.2539e+00, -1.9190e+01, -2.4340e+01, ..., 8.6396e-01, 4.3005e+00, 5.2853e+00]]], [[[-1.1491e+00, -1.2179e+01, -1.2443e+01, ..., -4.3396e+00, -4.6460e+00, -3.3563e+00]], [[-2.3742e+00, -8.6408e+00, -8.9282e+00, ..., -2.2485e+00, -2.4221e+00, -4.5808e+00]], [[ 3.0214e-01, -3.8225e+00, -4.5461e+00, ..., -2.9381e+00, -2.5925e+00, -2.2630e+00]], ..., [[-9.7662e-01, -6.5436e+00, -6.5702e+00, ..., -1.8524e+00, -1.0697e+00, -3.4052e+00]], [[ 1.4756e+00, -3.3937e+00, -2.6483e+00, ..., -2.4288e+00, -2.0511e+00, -3.1870e+00]], [[-8.2497e+00, -3.0727e+01, -2.7328e+01, ..., 5.2669e+00, 1.4639e+01, 2.9842e+00]]]]) attn_weights tensor([[[[ 2.5202e+00, -3.7369e+00, -4.3391e+00, ..., -3.9682e+00, -1.7684e+00, -1.1141e+00]], [[ 4.6174e+00, -5.4746e+00, -4.8317e+00, ..., -8.6809e+00, -7.8346e+00, -3.9115e+00]], [[ 4.2143e-01, -4.3231e+00, -4.8433e+00, ..., -1.4369e+00, -1.3368e+00, -2.8845e+00]], ..., [[ 9.7742e-01, -2.8631e+00, -2.9727e+00, ..., -2.9715e+00, -3.2069e+00, -5.2759e+00]], [[ 1.6814e+00, -1.1552e+00, -4.5848e-01, ..., 4.6748e-01, 2.8657e-01, 2.0448e-01]], [[ 1.2761e+00, -2.9021e+00, -3.2471e+00, ..., -2.7397e+00, -2.4751e+00, -5.0247e-01]]], [[[ 2.3087e+00, -7.7451e+00, -5.7871e+00, ..., -7.1251e+00, -3.8425e+00, -3.3341e+00]], [[ 4.4607e+00, -1.3846e+01, -9.9655e+00, ..., -9.6726e+00, -3.5519e+00, -3.3812e+00]], [[ 1.0276e+00, -5.4718e+00, -7.0256e+00, ..., -3.6743e+00, -3.0499e+00, -4.9775e+00]], ..., [[ 1.0028e+00, -3.7728e+00, -4.0567e+00, ..., -4.1410e+00, -3.3817e+00, -4.6612e+00]], [[ 2.0008e+00, -2.3662e+00, -5.9580e-01, ..., -3.7019e+00, -3.0010e+00, -2.6843e+00]], [[ 1.4342e+00, -5.8483e+00, -5.2900e+00, ..., -1.6392e+00, -3.6116e-01, 4.6672e-01]]], [[[ 2.3430e+00, -4.7968e+00, -5.4749e+00, ..., -3.9381e+00, -4.7309e+00, -3.5909e+00]], [[ 4.9019e+00, -1.3049e+01, -1.0903e+01, ..., -6.2013e+00, -7.4968e+00, -2.3200e+00]], [[ 2.2903e-01, -4.9505e+00, -5.3897e+00, ..., -3.1641e+00, -3.1645e+00, -3.9081e+00]], ..., [[ 1.0926e+00, -2.8995e+00, -3.7253e+00, ..., -4.2625e+00, -4.0284e+00, -5.6865e+00]], [[ 1.7384e+00, -1.4346e+00, -6.3458e-01, ..., -5.2230e-01, -6.7465e-01, -1.2301e+00]], [[ 1.0512e+00, -4.4023e+00, -4.0407e+00, ..., -2.1994e+00, -1.9050e+00, -1.5185e+00]]], [[[ 2.5246e+00, -2.2849e+00, -4.8635e+00, ..., -4.4521e+00, -3.2487e+00, -6.0894e-01]], [[ 3.6992e+00, -7.4526e+00, -6.6490e+00, ..., -6.4817e+00, -3.6639e+00, -6.0133e-01]], [[ 9.0282e-01, -2.6075e+00, -3.5899e+00, ..., -3.7407e+00, -3.5653e+00, -4.6383e+00]], ..., [[ 1.1575e+00, -2.4867e+00, -1.9012e+00, ..., -2.4621e+00, -2.8204e+00, -2.0260e+00]], [[ 2.1916e+00, -4.6270e-01, -9.7670e-01, ..., -4.1922e-01, -2.4634e-01, -1.7828e-03]], [[ 1.2072e+00, -3.8629e+00, -3.5790e+00, ..., -2.7335e+00, -2.8815e+00, -9.4179e-01]]], [[[ 2.9317e+00, -5.9339e+00, -5.3452e+00, ..., -2.7110e+00, -2.3242e+00, -8.8171e-01]], [[ 4.8819e+00, -1.0463e+01, -8.3331e+00, ..., -8.3078e+00, -2.6740e+00, -2.9547e+00]], [[ 8.5769e-01, -4.9991e+00, -5.9899e+00, ..., -1.9169e+00, -1.7211e+00, -2.9251e+00]], ..., [[ 1.1874e+00, -4.2533e+00, -4.7513e+00, ..., -2.8863e+00, -3.3771e+00, -4.0677e+00]], [[ 1.9641e+00, -1.0526e+00, -1.3847e+00, ..., -1.2803e+00, -2.1448e+00, -9.3400e-01]], [[ 1.1303e+00, -4.1610e+00, -4.3340e+00, ..., -3.0307e+00, -2.4154e+00, -1.5069e+00]]]]) attn_weights tensor([[[[-0.9507, -5.8447, -3.5898, ..., 0.0195, -0.3997, -2.4714]], [[ 0.9422, -4.6997, -7.2187, ..., -5.0442, -3.9654, -2.5350]], [[ 0.3270, -2.5765, -2.7289, ..., -2.3757, -3.1180, -3.3455]], ..., [[ 4.5652, -3.1279, -3.2064, ..., -5.5154, -4.9017, -1.2677]], [[ 2.8070, -2.7918, -2.9172, ..., -1.0323, -1.0879, 0.0972]], [[-0.1073, -4.7646, -5.7380, ..., -0.9994, -1.1872, -2.0039]]], [[[-1.0313, -4.6654, -5.5540, ..., -2.0372, -1.9827, -3.4720]], [[ 0.5800, -5.6568, -7.3813, ..., -6.1620, -3.9525, -3.8176]], [[ 0.4204, -3.1698, -3.3962, ..., -3.2904, -3.3654, -3.9450]], ..., [[ 4.5405, -9.5230, -7.1272, ..., -7.6145, -2.1090, -3.2105]], [[ 2.5504, -3.2209, -2.3708, ..., -2.8553, -1.6568, -2.7544]], [[-0.0718, -5.2379, -6.6749, ..., -1.1882, -1.0602, -2.5250]]], [[[-1.3330, -5.7199, -4.3765, ..., -1.3488, -1.2096, -2.4257]], [[-0.3178, -4.8956, -6.0248, ..., -3.6030, -3.9737, -2.9482]], [[ 0.1672, -3.0680, -2.7352, ..., -2.7198, -3.1105, -3.5017]], ..., [[ 4.5930, -9.0528, -7.9190, ..., -5.1583, -5.1683, -1.4000]], [[ 2.8568, -3.4009, -2.7753, ..., -1.2643, -1.9557, -0.6631]], [[-0.3280, -5.4115, -6.7382, ..., -2.8433, -2.0017, -1.5189]]], [[[ 0.5665, -4.8979, -5.0071, ..., -4.7029, -3.2110, -4.1154]], [[ 0.7644, -3.6096, -5.8411, ..., -4.2771, -4.7101, -4.8245]], [[ 0.5709, -2.7374, -3.0986, ..., -1.8029, -2.8333, -1.8567]], ..., [[ 3.8403, -3.5617, -1.5286, ..., -4.2781, -1.7756, -1.7308]], [[ 2.7522, -1.7886, -0.9717, ..., -3.0649, -1.7724, -1.5351]], [[ 0.4811, -4.7460, -7.0015, ..., -3.9013, -2.0508, -3.6753]]], [[[-0.9479, -4.9707, -3.8021, ..., -0.8054, 0.3232, -2.2349]], [[ 0.9072, -6.8042, -8.3016, ..., -4.6015, -3.8606, -1.9301]], [[ 0.4010, -4.2738, -4.9166, ..., -3.1480, -3.2200, -3.9145]], ..., [[ 5.1827, -6.4471, -5.1216, ..., -3.9855, -1.4266, -2.4510]], [[ 2.8762, -4.4057, -4.3758, ..., -1.2419, -1.2413, -1.3480]], [[-0.5211, -5.7915, -6.4143, ..., -1.3896, -0.6425, -2.2668]]]]) attn_weights tensor([[[[-0.4648, -8.4718, -7.2074, ..., -1.7266, -2.9348, -3.8472]], [[ 3.5580, 0.6477, -1.0397, ..., -1.5774, -1.8751, -0.7534]], [[ 6.3884, -1.4821, -2.3603, ..., -3.4278, -3.6654, -0.1071]], ..., [[ 0.2023, -3.2160, -3.3166, ..., -0.7181, -1.7589, -2.1342]], [[ 4.1432, -1.1914, -0.7094, ..., -1.4124, -4.0563, -0.4547]], [[ 3.1826, -2.9499, -4.2943, ..., -3.5617, -3.3226, -1.5469]]], [[[-0.6413, -6.0322, -7.9522, ..., -2.8067, -2.5981, -4.3162]], [[ 2.1766, -2.9368, -3.2584, ..., -2.9744, -2.3358, -2.1301]], [[ 5.9191, -3.8051, -5.2595, ..., -4.7020, -2.5198, -3.5468]], ..., [[ 0.4248, -4.1128, -4.4105, ..., -1.6659, -1.3527, -2.4139]], [[ 3.8850, -4.6747, -4.5196, ..., -6.0790, -2.0654, -3.0490]], [[ 2.9576, -2.5971, -5.2572, ..., -3.4762, -2.1279, -2.0572]]], [[[-1.0795, -8.6677, -8.7669, ..., -4.1671, -2.5534, -4.0903]], [[ 2.0905, -2.8939, -2.1487, ..., -0.8259, -3.3290, -1.4832]], [[ 6.3004, -5.4655, -5.2176, ..., -3.7693, -4.4078, 0.8132]], ..., [[-0.1272, -3.4379, -3.3819, ..., -0.4388, -1.4203, -0.8362]], [[ 4.3241, -3.5032, -3.2892, ..., -2.4283, -3.6577, -0.7803]], [[ 3.0217, -3.2169, -3.9615, ..., -4.1557, -2.9671, -1.8602]]], [[[-0.4388, -5.8350, -6.7067, ..., -2.2061, -0.8132, -3.5120]], [[ 2.9898, -1.9727, -0.2748, ..., 0.3723, -0.3550, -1.0327]], [[ 5.2665, -1.6220, -1.4407, ..., -3.1094, -1.4230, 0.1719]], ..., [[ 1.3153, -5.7411, -5.6597, ..., -2.2468, -0.3511, -1.8345]], [[ 3.6127, -3.3680, -2.0373, ..., -3.0165, -1.4094, -2.0229]], [[ 3.0782, -3.8570, -2.5921, ..., -3.1753, -2.0898, -1.4947]]], [[[-0.4915, -8.4858, -9.0093, ..., -4.1973, -2.7976, -3.8980]], [[ 2.8387, -0.8254, -1.5917, ..., -1.0653, -0.3865, -0.3464]], [[ 6.8248, -2.9518, -4.0699, ..., -3.3837, 0.1496, -0.0836]], ..., [[ 0.0926, -4.8606, -4.9243, ..., -1.3061, -0.9407, -2.4589]], [[ 4.8463, -1.2781, -1.8609, ..., -2.8125, 0.2291, -0.7151]], [[ 3.4815, -4.4751, -5.6990, ..., -3.9863, -2.0150, -2.5346]]]]) attn_weights tensor([[[[ 1.1227, -1.9670, -2.5411, ..., -1.4471, -2.8028, -1.2811]], [[ 4.8546, 2.0580, 0.4331, ..., -1.0077, -2.4165, 0.6612]], [[ 1.4908, -0.3657, -0.7035, ..., -0.3236, -0.3074, -0.0589]], ..., [[ 1.1532, -2.1903, -1.8861, ..., -0.7081, -3.3269, -1.8037]], [[ 1.4631, -1.9551, -1.3390, ..., -0.1793, -1.4204, -0.3377]], [[ 1.3298, -2.7297, -3.2768, ..., -2.8217, -4.6880, -4.2021]]], [[[ 1.0992, -3.1770, -2.7871, ..., -2.0267, -1.4345, -1.5943]], [[ 4.8171, -2.2086, -3.4730, ..., -3.7389, -0.2337, 0.6726]], [[ 1.7858, -1.0451, -2.2056, ..., -0.0095, -0.2803, -1.6348]], ..., [[ 0.6813, -4.5071, -3.7464, ..., -3.6167, -2.7623, -1.8444]], [[ 1.2321, -4.5941, -4.7039, ..., -3.8579, -1.8708, -1.2613]], [[ 0.1978, -3.5918, -3.8834, ..., -4.3536, -4.4133, -3.4170]]], [[[ 1.0250, -3.1317, -2.8150, ..., -2.1339, -2.2038, -1.6147]], [[ 3.9438, -5.0004, -4.3645, ..., -3.9017, -3.9238, -2.0289]], [[ 2.4183, -2.0224, -2.4496, ..., -2.5830, -2.3088, -0.2510]], ..., [[ 0.2832, -3.9867, -3.4556, ..., -1.2675, -1.8522, -2.3678]], [[ 1.1108, -3.7004, -3.6481, ..., -2.0170, -1.7594, -1.6624]], [[ 0.5556, -3.4098, -4.3941, ..., -4.3735, -3.6123, -4.4486]]], [[[ 1.3846, -2.9070, -3.5016, ..., -2.5518, -3.0303, -1.3830]], [[ 3.1962, -2.4071, -1.7499, ..., -3.4520, -2.1687, -1.4982]], [[ 1.4586, -1.0286, -1.6882, ..., -0.2888, -1.0542, -0.7406]], ..., [[ 0.9409, -1.6401, -1.3541, ..., -0.4957, -1.7314, -1.1482]], [[ 1.0957, -1.1674, -1.9724, ..., -1.9975, -2.1956, -1.6608]], [[ 0.9104, -3.1788, -3.1158, ..., -2.6221, -2.2734, -2.1190]]], [[[ 0.8402, -4.5008, -4.1964, ..., -1.7572, -1.0041, -0.8835]], [[ 5.2158, -1.5283, -2.7106, ..., -0.9710, -0.5178, -0.7552]], [[ 1.9584, -1.6620, -1.9768, ..., -0.1654, -0.1262, -1.1425]], ..., [[ 1.5094, -4.3001, -4.5802, ..., -3.3741, -3.5777, -2.8721]], [[ 1.0315, -4.6320, -3.9856, ..., -1.9247, -1.4498, -1.6957]], [[ 0.7170, -3.7126, -2.7660, ..., -3.4910, -3.9187, -2.9535]]]]) attn_weights tensor([[[[ 2.3480, -0.7862, -0.9990, ..., -0.9007, -2.0015, -1.9527]], [[ 4.9897, 0.8550, -0.3333, ..., -1.1726, -2.1849, 0.3179]], [[ 2.6798, -2.3239, -1.7198, ..., -2.1169, -5.6139, -4.1767]], ..., [[ 4.0741, -0.5358, -2.4043, ..., -3.6772, -4.4317, -2.5777]], [[ 2.3271, -5.3020, -4.6747, ..., -0.9932, -1.3818, -2.1724]], [[ 3.8016, -0.9562, -1.9713, ..., -1.9843, -1.7888, -1.5300]]], [[[ 1.4369, -3.5097, -2.9387, ..., -3.9690, -2.9631, -2.5741]], [[ 3.6037, -1.8464, -4.5137, ..., -3.4478, -2.4905, -1.2128]], [[ 0.8308, -3.5292, -4.0529, ..., -4.9054, -3.8569, -3.6159]], ..., [[ 2.7682, -3.2964, -4.2199, ..., -4.3212, -3.1907, -2.3684]], [[ 1.6609, -5.6482, -6.5048, ..., -2.5733, -0.0977, -2.4964]], [[ 3.3284, -1.4050, -3.1302, ..., -2.2952, -2.2865, -1.3809]]], [[[ 1.6402, -2.6812, -2.3547, ..., -1.9687, -2.3778, -2.7366]], [[ 3.8376, -3.4082, -2.5408, ..., -3.4101, -3.1506, -0.8834]], [[ 0.9961, -2.2851, -2.5249, ..., -1.3867, -2.4709, -1.6628]], ..., [[ 3.9649, -2.4995, -2.8884, ..., -3.3805, -2.7877, -0.4923]], [[ 0.8248, -4.6272, -3.7118, ..., -0.2238, 0.7641, 0.1298]], [[ 3.2879, -1.7407, -2.9770, ..., -2.8038, -1.8920, -1.7515]]], [[[ 1.8818, -1.4418, -2.6407, ..., -0.9857, -1.9499, -0.8830]], [[ 2.5901, -0.9470, -1.9720, ..., -0.8465, -2.1392, -0.6637]], [[ 1.7243, -3.1675, -1.8384, ..., -0.5186, -1.7370, -1.1496]], ..., [[ 3.0687, -2.1574, -1.3543, ..., -1.9669, -2.5245, -1.2248]], [[ 1.2387, -3.1382, -2.9308, ..., -0.2105, -0.7172, -2.3764]], [[ 3.4821, -0.4788, -2.6225, ..., -1.0182, -1.9252, -0.7772]]], [[[ 2.4995, -4.7653, -4.2242, ..., -3.8389, -3.1196, -1.7752]], [[ 4.0420, -1.6662, -3.4391, ..., -1.4267, -0.7729, 0.5666]], [[ 2.3097, -3.7345, -3.5074, ..., -2.8525, -3.0733, -1.3595]], ..., [[ 4.1327, -1.0075, -1.4140, ..., -1.8956, -1.3713, 0.1918]], [[ 1.7662, -6.0290, -5.2975, ..., -1.8934, -0.8213, -1.4369]], [[ 3.8543, -2.3928, -4.0727, ..., -3.1757, -1.0836, -2.8868]]]]) attn_weights tensor([[[[ 3.0380, -2.3396, -2.6129, ..., -3.3353, -4.1097, -3.0184]], [[ 4.4262, -1.3099, -2.0499, ..., -3.0782, -1.5499, -1.4419]], [[ 3.5943, -0.7178, -0.4862, ..., -1.7397, -2.4520, -1.5834]], ..., [[ 0.8551, -3.6568, -5.9230, ..., -3.3870, -3.0635, -2.4603]], [[ 3.9023, -1.5881, -1.9154, ..., -3.0640, -3.1836, -2.7796]], [[ 4.0521, -0.3487, -0.9061, ..., -1.3223, -0.5204, 0.4324]]], [[[ 1.9886, -3.2831, -4.4417, ..., -4.3133, -3.4304, -3.2834]], [[ 3.1885, -2.2319, -4.3149, ..., -3.3614, -2.6566, -1.2662]], [[ 2.6411, -1.3032, -2.4819, ..., -3.1424, -2.1161, -1.6370]], ..., [[ 1.0378, -3.7523, -5.5819, ..., -4.4263, -0.7509, -0.7445]], [[ 2.9243, -2.1535, -2.5124, ..., -2.8456, -2.5199, -1.9460]], [[ 3.7216, -1.1654, 0.8140, ..., -2.2078, 1.2692, 0.5978]]], [[[ 2.4568, -3.8424, -3.8854, ..., -3.6440, -3.1525, -2.8830]], [[ 4.0474, -1.8259, -3.2716, ..., -3.5683, -2.2265, 0.2352]], [[ 3.0027, -0.7429, -1.8716, ..., -1.7862, -1.5353, 0.2121]], ..., [[ 0.7621, -5.0209, -5.7149, ..., -3.2713, -1.1751, -1.9987]], [[ 2.9627, -2.1375, -1.9390, ..., -2.0932, -1.3510, -1.0739]], [[ 4.4533, -0.1071, 2.2623, ..., 2.2395, 1.3169, 1.0186]]], [[[ 2.8008, -2.7257, -3.3200, ..., -1.5515, -2.3833, -0.5018]], [[ 3.3777, -0.9230, -1.6420, ..., -0.4760, -1.5116, -0.6426]], [[ 3.1951, 0.2276, -0.3381, ..., -0.3223, 1.3408, 1.4153]], ..., [[ 1.2689, -2.7635, -2.8395, ..., -0.3628, 0.1948, -1.0841]], [[ 2.9836, -2.4377, -1.4420, ..., -2.3305, -1.4355, -1.1797]], [[ 3.4104, -0.4489, -1.1413, ..., 0.1691, 0.0183, 0.8622]]], [[[ 2.4381, -2.6647, -3.7392, ..., -2.9897, -1.4826, -2.2157]], [[ 4.1145, -3.3599, -3.2040, ..., -1.3175, -1.5287, 0.8229]], [[ 3.2294, -2.9283, -1.9712, ..., -1.5393, -0.8529, -0.3979]], ..., [[ 0.8140, -4.7114, -4.2793, ..., -0.1331, 0.1530, -1.2227]], [[ 3.4454, -1.7779, -1.5378, ..., -2.5968, -1.9861, -1.3128]], [[ 3.9957, -1.9554, -1.0082, ..., -0.0688, 0.5064, 2.5788]]]]) attn_weights tensor([[[[ 0.8122, 1.6104, 1.1724, ..., 0.8081, -0.1138, 1.3317]], [[ 3.0922, 0.6478, -0.0767, ..., -0.2669, -1.3191, -0.6921]], [[ 2.9213, 0.2781, -1.2747, ..., -2.3040, -2.0464, -2.9032]], ..., [[ 3.9634, 0.3459, -0.9659, ..., -1.4949, -1.4449, -0.3857]], [[ 3.1751, 1.9994, 0.1349, ..., -0.6562, -1.6355, 0.4168]], [[ 1.9549, 3.3812, 0.3315, ..., -1.1441, -1.2653, -0.4460]]], [[[ 1.2633, 0.2559, 0.3375, ..., -0.7100, 0.6550, 0.5029]], [[ 3.4592, -0.9399, -1.3632, ..., -1.0349, -0.7804, -0.4865]], [[ 2.6720, -1.3982, -2.1801, ..., -2.0914, -2.3741, -2.0592]], ..., [[ 3.8993, -1.3856, -2.2739, ..., -0.6805, -0.7027, -0.8035]], [[ 2.7163, -0.4635, 0.2403, ..., -1.0467, 1.6296, 1.6894]], [[ 2.8974, -0.1164, -0.1992, ..., -1.0061, 2.1495, 1.4550]]], [[[ 0.9537, 0.9980, 0.3022, ..., 0.5909, 0.5777, 0.7231]], [[ 3.5580, -0.8799, -0.8409, ..., -1.0883, -0.7734, -0.6504]], [[ 2.8413, -1.4068, -2.1648, ..., -2.6317, -1.8846, -1.4505]], ..., [[ 4.6928, -1.1346, -1.1590, ..., -1.5655, -0.8240, 1.4155]], [[ 2.6528, -0.7773, 1.1140, ..., 1.3387, 1.0518, 0.9234]], [[ 2.8639, -1.0336, 0.7729, ..., 1.6328, 1.9714, 0.5967]]], [[[ 1.9111, 2.4940, 1.3242, ..., 2.1233, 2.4611, 2.0914]], [[ 3.4303, 1.2046, -0.1178, ..., 0.4321, 1.1233, 1.9074]], [[ 3.3601, 0.4679, -1.1241, ..., 0.2918, -0.2217, 1.2527]], ..., [[ 3.7315, 0.0638, -1.5053, ..., -0.0761, -1.1459, 0.3891]], [[ 4.0450, 2.3650, 0.9708, ..., 2.1559, 1.6148, 3.5679]], [[ 3.5184, 1.2409, -0.8090, ..., -0.1564, -10.3463, -5.6324]]], [[[ 1.4142, 0.1638, -0.7005, ..., 1.7548, 1.3848, 1.4598]], [[ 3.4800, -0.3675, -1.1281, ..., -0.2833, 0.0211, 0.5911]], [[ 2.5483, -1.0479, -1.8379, ..., -1.7228, -1.2397, -2.0703]], ..., [[ 3.4853, -1.4883, -2.6753, ..., -1.9990, -2.2215, -0.3320]], [[ 2.6764, 0.1029, -1.4687, ..., 0.3398, -0.2878, 0.2331]], [[ 3.4561, 0.3497, -1.4710, ..., 0.5137, -0.2231, 1.4765]]]]) attn_weights tensor([[[[-1.5501e+00, -3.7899e+00, -2.6004e+00, ..., -2.1986e+00, -2.2671e+00, -3.8099e+00]], [[-2.3168e+00, -4.0533e-01, -3.3498e+00, ..., -3.4768e+00, -7.5799e-01, 4.6488e+00]], [[-2.3072e+00, -2.8024e+00, -3.1566e+00, ..., -2.1487e+00, -1.8173e+00, -1.5176e+00]], ..., [[-1.9262e+00, -2.2787e+00, -2.3139e+00, ..., -2.3117e+00, -1.9000e+00, -1.6845e+00]], [[-5.1435e-01, -6.4820e-01, -6.4423e-01, ..., -4.2995e-01, -4.5835e-01, 2.6094e-01]], [[-1.4875e+00, -2.2999e+00, -3.5604e+00, ..., -2.7908e+00, -2.3246e+00, -2.4304e+00]]], [[[ 3.4084e-01, -1.6215e+00, -1.4645e+00, ..., -1.0486e+00, -1.1699e+00, -7.7674e-01]], [[ 2.6516e+00, 1.1219e+00, 1.4247e+00, ..., 9.1861e-01, 2.5611e+00, 1.1413e+01]], [[-1.3085e+00, -1.8346e+00, -1.4979e+00, ..., -2.2071e+00, -1.7665e+00, -1.2625e+00]], ..., [[-2.0352e+00, -2.5099e+00, -2.6433e+00, ..., -2.3337e+00, -2.5816e+00, -3.7256e+00]], [[ 1.3376e-01, -3.3447e-01, -6.7692e-01, ..., -1.6927e-01, -4.6239e-01, 1.6158e+00]], [[-2.0860e+00, -1.2826e+00, -3.3018e+00, ..., -2.5296e+00, -1.8863e+00, -2.8632e+00]]], [[[-8.7526e-01, -2.6185e+00, -2.0521e+00, ..., -1.4781e+00, -1.3985e+00, -2.3270e+00]], [[-1.0903e-02, -1.5084e+00, -1.0603e+00, ..., -3.5794e+00, -7.0142e-01, 7.5728e+00]], [[-1.8262e+00, -2.6996e+00, -2.4751e+00, ..., -2.1402e+00, -2.7254e+00, -2.8992e+00]], ..., [[-2.1776e+00, -2.6982e+00, -2.7447e+00, ..., -2.7376e+00, -2.7418e+00, -2.4190e+00]], [[-5.8339e-01, -1.0528e+00, -1.2076e+00, ..., -1.3901e+00, -8.1732e-01, 8.9525e-01]], [[-1.2129e+00, -2.2465e+00, -3.6740e+00, ..., -2.5221e+00, -2.4557e+00, -2.6399e+00]]], [[[-7.3684e-01, -2.2881e+00, -2.0038e+00, ..., -2.2441e+00, -2.2187e+00, -1.8442e+00]], [[ 1.5154e+00, 2.3742e+00, 6.4613e+00, ..., -2.9556e-01, -2.5769e-01, 8.2709e+00]], [[-1.5383e+00, -2.3591e+00, -2.0319e+00, ..., -2.0388e+00, -2.0295e+00, -1.7677e+00]], ..., [[-1.9942e+00, -2.4308e+00, -2.7077e+00, ..., -1.9582e+00, -1.9175e+00, -2.3314e+00]], [[ 3.3177e-01, -4.2403e-01, 8.1534e-01, ..., -1.0665e-01, -8.7946e-02, 1.6271e+00]], [[-1.2338e+00, -2.2028e+00, -3.6091e+00, ..., -2.0436e+00, -2.0318e+00, -3.1972e+00]]], [[[-1.1942e+00, -3.2038e+00, -2.8505e+00, ..., -2.4882e+00, -2.3958e+00, -2.9456e+00]], [[ 3.2941e+00, 8.3641e-02, 2.0132e+00, ..., 6.5421e-01, -1.8162e+00, 7.7841e+00]], [[-1.4450e+00, -2.5855e+00, -2.1811e+00, ..., -2.4537e+00, -3.1388e+00, -2.6389e+00]], ..., [[-2.3491e+00, -2.7712e+00, -2.8706e+00, ..., -2.5436e+00, -2.6216e+00, -4.1182e+00]], [[ 1.1118e-01, -5.5712e-01, -5.1767e-01, ..., -2.6675e-01, -8.3613e-01, 1.4167e+00]], [[-1.2607e+00, -2.1025e+00, -3.4593e+00, ..., -2.1940e+00, -2.8945e+00, -2.9305e+00]]]]) attn_weights tensor([[[[-2.0643e+00, -5.5209e+00, -4.9583e+00, ..., 3.1453e-01, 1.5344e+00, -9.9020e-01]], [[-8.5325e-01, -2.5373e+00, -2.7295e+00, ..., 6.9860e-01, 8.4647e-01, 7.0369e-01]], [[-4.0584e+00, -4.4415e+00, -4.5073e+00, ..., -3.1410e+00, -2.6916e+00, -2.4783e+00]], ..., [[ 1.3636e+00, -6.9782e-01, 1.8581e-02, ..., -5.3680e-01, -9.8723e-02, -6.2325e-01]], [[-3.8953e+00, -2.7255e+00, -2.6331e+00, ..., -1.0538e+00, -5.3536e-01, -5.4784e-01]], [[ 1.5048e+00, 3.5049e-01, -2.2851e+00, ..., -2.1241e+00, -2.2768e+00, 3.6119e+00]]], [[[-1.3149e-02, -1.8286e+00, -2.4695e+00, ..., 1.6693e+00, 3.1281e+00, 2.4703e+00]], [[-1.8483e+00, -3.4964e+00, -3.6309e+00, ..., 3.3729e-02, 3.8362e-01, -5.4538e-01]], [[-3.8217e+00, -4.2071e+00, -4.2805e+00, ..., -2.5771e+00, -2.6837e+00, -2.6119e+00]], ..., [[ 1.2341e+00, -3.5678e-01, -3.8671e-02, ..., -1.7567e-01, 3.8503e-02, -1.2531e+00]], [[-4.3969e+00, -2.3708e+00, -2.2958e+00, ..., -6.1755e-01, -5.8161e-01, -4.3984e-01]], [[-2.7664e+00, -2.9027e+00, -7.2647e+00, ..., -3.6424e+00, -4.4662e+00, 1.4712e+00]]], [[[-1.5838e+00, -4.1613e+00, -4.6117e+00, ..., 1.0264e+00, 1.2019e+00, -2.5550e-01]], [[-1.0486e+00, -2.7677e+00, -3.3374e+00, ..., 9.6873e-01, 1.0254e+00, 4.7436e-01]], [[-4.1251e+00, -4.5734e+00, -4.6269e+00, ..., -3.0937e+00, -3.2746e+00, -2.8669e+00]], ..., [[ 1.2939e+00, -8.0683e-01, 6.0393e-03, ..., -3.0067e-01, -7.9289e-01, -7.9149e-02]], [[-4.0372e+00, -2.8379e+00, -2.7236e+00, ..., -9.5542e-01, -8.9899e-01, -7.4447e-01]], [[ 2.2194e-01, 2.4543e-03, -4.4544e+00, ..., -1.5976e+00, -2.5283e+00, 3.9054e+00]]], [[[-1.6195e-01, -2.3991e+00, -3.6057e+00, ..., 1.8477e+00, 2.0559e+00, 1.4299e+00]], [[-1.1226e+00, -2.3450e+00, -3.8798e+00, ..., 2.3017e+00, 2.6887e+00, 1.4794e+00]], [[-3.7976e+00, -4.2423e+00, -4.2265e+00, ..., -2.5404e+00, -2.3690e+00, -2.4061e+00]], ..., [[ 1.2229e+00, -6.1365e-01, 3.2422e-01, ..., -8.1752e-01, -7.8348e-01, 5.7440e-01]], [[-4.1588e+00, -2.5679e+00, -2.4342e+00, ..., -7.2800e-01, -6.0945e-01, -5.4541e-01]], [[-8.5538e-01, -7.2598e-01, 1.6446e+00, ..., 1.0147e+00, 7.4772e-01, 3.5440e+00]]], [[[-1.1743e+00, -3.1914e+00, -3.7262e+00, ..., 1.0791e-03, 1.1229e+00, 6.1966e-01]], [[-1.2531e+00, -3.2886e+00, -3.4471e+00, ..., 2.1685e-01, 8.6419e-01, 9.2222e-02]], [[-3.8923e+00, -4.2796e+00, -4.3178e+00, ..., -2.7695e+00, -2.6363e+00, -2.4747e+00]], ..., [[ 1.2552e+00, -5.8790e-01, -1.4205e-01, ..., -5.0898e-01, -7.0215e-01, -3.9375e-01]], [[-4.0159e+00, -2.4789e+00, -2.3635e+00, ..., -7.5342e-01, -4.0821e-01, -4.0317e-01]], [[-1.8446e+00, -1.9197e+00, -5.9871e+00, ..., -4.1028e+00, -4.2975e+00, 2.4087e+00]]]]) attn_weights tensor([[[[ -2.1245, -6.4699, -6.1687, ..., -1.6238, -0.8447, -0.9550]], [[ 2.1850, -0.7258, -2.0992, ..., -1.6662, -2.4016, -0.4841]], [[ -6.6571, -20.3316, -20.6543, ..., -4.3495, -2.5462, -5.6884]], ..., [[ -4.2814, -10.8183, -10.8178, ..., -3.3814, -1.4890, -3.5586]], [[ -2.1976, -4.2188, -4.1030, ..., -1.3590, -0.6081, -1.0576]], [[ -0.4251, -6.1786, -6.0950, ..., -3.0419, -2.2151, -2.5691]]], [[[ -1.5108, -5.6487, -5.2963, ..., -0.5143, -3.3245, -2.2176]], [[ 1.8971, -2.1327, -2.7023, ..., -0.8351, -1.6652, -2.3562]], [[ -5.1611, -15.2111, -16.3406, ..., -2.1105, -2.4558, -2.2785]], ..., [[ -4.2496, -9.8454, -9.8109, ..., -3.1895, -2.1844, -1.9590]], [[ -2.6722, -4.0437, -4.1101, ..., -1.2426, -1.1763, -0.6190]], [[ -0.3663, -5.6341, -5.6529, ..., -2.6412, -2.6190, -2.2901]]], [[[ -1.8387, -5.5548, -5.7221, ..., -2.5957, 0.0270, -1.9446]], [[ 1.6325, -1.1730, -2.4399, ..., -2.9959, -1.2885, -1.8738]], [[ -5.9777, -17.7657, -19.1979, ..., -3.2510, -3.1160, -5.1333]], ..., [[ -3.6633, -10.0035, -9.3435, ..., -3.0735, -1.7064, -2.8018]], [[ -2.3891, -4.3225, -4.1327, ..., -1.5880, -1.0109, -1.2753]], [[ -0.4841, -5.9949, -5.7293, ..., -2.7813, -2.5032, -2.5555]]], [[[ -1.1925, -4.9266, -5.6282, ..., -2.0428, -1.8141, -0.6661]], [[ 1.3674, -0.4416, -1.1371, ..., -0.9920, -1.1368, -1.5716]], [[ -6.3623, -16.0198, -20.1095, ..., -4.5553, -3.5170, -5.1284]], ..., [[ -3.5429, -10.2872, -12.3792, ..., -2.6666, -2.4858, -3.0899]], [[ -1.8997, -3.7656, -3.6614, ..., -1.7048, -1.2883, -0.6976]], [[ -0.3585, -6.0073, -5.8513, ..., -2.9484, -2.6701, -2.3259]]], [[[ -1.2375, -5.8209, -5.2619, ..., -0.7997, -1.8762, -2.9571]], [[ 1.5713, -2.0897, -2.6564, ..., -0.8378, -1.8542, -1.6958]], [[ -5.1304, -16.1050, -18.7797, ..., -2.7352, -2.1567, -3.2823]], ..., [[ -4.0865, -9.9304, -10.1372, ..., -3.5201, -1.1318, -2.0870]], [[ -2.4980, -3.9734, -4.0764, ..., -1.3174, -0.8689, -0.7351]], [[ -0.3198, -5.9242, -5.7947, ..., -2.6420, -2.5726, -2.3972]]]]) attn_weights tensor([[[[ 4.9776, -0.3819, -1.1644, ..., -3.7568, -1.6265, 0.5181]], [[ -2.6842, -9.9929, -9.8689, ..., -4.9476, -5.7999, -5.5009]], [[ -5.1735, -14.7545, -15.6671, ..., -6.0766, -4.4467, -5.9572]], ..., [[ -2.2113, -9.9615, -9.4797, ..., -0.0644, -1.2732, -2.8694]], [[ -1.2142, -8.0594, -7.4455, ..., -4.5349, -4.3701, -2.5148]], [[ -2.9199, -10.1192, -12.5488, ..., -2.9699, -1.5194, -3.7240]]], [[[ 4.4150, 0.3036, -2.7830, ..., -0.8482, -2.0671, 3.3265]], [[ -2.5329, -8.6514, -7.7131, ..., -3.7267, -4.8384, -6.5881]], [[ -4.3647, -14.0286, -14.7227, ..., -4.0707, -2.7796, -3.6526]], ..., [[ -1.3846, -8.7404, -9.0537, ..., -2.9937, -1.9695, -4.3103]], [[ -0.9991, -6.5987, -7.8867, ..., -4.1908, -4.4117, -1.8532]], [[ -2.1774, -9.4929, -10.5447, ..., -3.0421, -3.1270, -3.7163]]], [[[ 4.4669, -0.9870, -3.6470, ..., -3.0368, -2.2177, 1.3069]], [[ -2.6630, -8.7861, -8.2975, ..., -5.4510, -3.8426, -5.6120]], [[ -4.4082, -14.3287, -15.3490, ..., -6.2348, -4.9283, -6.9192]], ..., [[ -1.3838, -7.9949, -7.6861, ..., -2.9368, -0.9116, -4.3509]], [[ -0.8146, -6.6280, -6.7721, ..., -4.3391, -3.6495, -2.7779]], [[ -2.1619, -9.3115, -10.8990, ..., -5.0057, -2.2317, -3.4006]]], [[[ 4.4992, 0.4004, 4.0320, ..., 0.6684, 0.8604, 2.1422]], [[ -2.5035, -8.3619, -10.0339, ..., -3.2635, -3.0240, -3.1874]], [[ -4.5805, -12.0116, -15.8418, ..., -4.0086, -3.6023, -4.2444]], ..., [[ -1.2995, -7.4371, -9.8411, ..., -3.8480, -3.6345, -2.4029]], [[ -0.8141, -6.4629, -5.7996, ..., -3.1219, -2.8799, -2.3518]], [[ -2.2395, -9.3222, -10.9342, ..., -2.5472, -2.5216, -3.1936]]], [[[ 4.8597, 0.5780, -1.8924, ..., -0.0541, -3.1935, 3.2630]], [[ -2.0663, -9.2757, -8.3315, ..., -3.5544, -3.4081, -4.2721]], [[ -3.5043, -15.4696, -17.8623, ..., -5.0480, -2.5194, -4.1647]], ..., [[ -0.8238, -7.8935, -8.1287, ..., -4.2936, -3.3876, -3.0485]], [[ -0.8418, -6.5424, -8.4839, ..., -4.1104, -2.9220, -2.0736]], [[ -1.7114, -10.0262, -10.8444, ..., -4.1413, -3.3602, -4.7079]]]]) attn_weights tensor([[[[ -2.0716, -12.0355, -11.2485, ..., -3.8714, -3.1611, -4.7866]], [[ -2.8645, -8.7502, -8.7624, ..., -2.8042, -4.0030, -5.2680]], [[ -0.2368, -2.4957, -3.4867, ..., -2.8232, -2.3534, -2.3913]], ..., [[ -1.3486, -5.6886, -6.2326, ..., -2.2717, -0.1042, -1.5269]], [[ 1.4772, -2.5081, -2.6104, ..., -3.5569, -2.0852, -1.7086]], [[ -7.5126, -32.9712, -38.5164, ..., -4.8049, 6.4427, 1.8101]]], [[[ -1.8698, -11.9606, -11.9650, ..., -3.8143, -0.6037, -2.4556]], [[ -2.3215, -9.7218, -9.0931, ..., -0.0800, -0.9884, -4.0714]], [[ 0.1733, -3.2632, -3.3625, ..., -2.8111, -3.4141, -3.9529]], ..., [[ -0.8712, -7.3071, -6.9304, ..., -2.4948, -2.2226, -3.5380]], [[ 1.2890, -4.6305, -4.1583, ..., -3.7361, -3.7927, -3.8192]], [[ -6.0598, -29.9385, -36.0122, ..., -3.8113, 8.1846, -5.5618]]], [[[ -2.4621, -13.4056, -11.5251, ..., -4.4277, -5.7650, -5.8939]], [[ -2.3842, -9.6151, -9.9904, ..., -3.8620, -3.5771, -4.7969]], [[ 0.1002, -3.1065, -3.3864, ..., -3.4315, -2.7319, -4.8655]], ..., [[ -0.7751, -6.3416, -6.7823, ..., -3.7938, -1.4371, -2.8955]], [[ 1.4917, -3.6773, -4.1755, ..., -4.2034, -3.7492, -4.0383]], [[ -4.4266, -38.3470, -39.8150, ..., -1.7148, 13.8601, -1.8385]]], [[[ -2.0131, -12.0000, -13.6220, ..., -4.4844, -3.6308, -4.3968]], [[ -2.4152, -8.8378, -12.0185, ..., -2.8086, -2.7333, -3.6106]], [[ 0.3215, -2.7124, -3.9438, ..., -1.7272, -1.5401, -2.0822]], ..., [[ -0.9847, -5.7395, -8.1713, ..., -3.4739, -3.5905, -4.1616]], [[ 1.4634, -1.5778, -2.5128, ..., -1.7119, -1.3447, -2.1767]], [[ -8.4609, -31.3410, -39.7980, ..., 3.6195, 4.1367, -7.8245]]], [[[ -1.5169, -11.9071, -12.7407, ..., -4.4390, -0.9711, -4.0764]], [[ -1.8152, -10.4611, -10.2962, ..., -3.5721, -2.8903, -3.6836]], [[ 0.3661, -4.3119, -4.2829, ..., -1.8594, -1.5406, -4.3479]], ..., [[ -0.5215, -7.7381, -6.4279, ..., -2.7938, -2.5656, -4.1254]], [[ 1.6021, -4.4802, -3.8039, ..., -3.7308, -3.7448, -2.9376]], [[ -6.5996, -28.9672, -36.1215, ..., -0.8835, 10.8800, 1.7591]]]]) attn_weights tensor([[[[ 2.8148, -6.0884, -4.5679, ..., -1.3616, -2.4404, -1.9479]], [[ 4.6497, -6.9637, -5.1837, ..., -5.2620, -6.6368, -1.7475]], [[ 0.6724, -4.1653, -5.0823, ..., -2.8678, -1.4357, -3.9191]], ..., [[ 1.0833, -3.2108, -3.0882, ..., -2.9714, -3.8865, -4.1681]], [[ 1.8129, -1.3089, -0.7292, ..., -1.4911, -0.7979, -1.4489]], [[ 1.3604, -2.7862, -3.0245, ..., -2.3238, -1.8744, -0.7527]]], [[[ 2.1242, -8.2583, -6.0608, ..., -2.0335, -3.0039, -0.8973]], [[ 3.7978, -10.0546, -11.1484, ..., -3.9582, -5.8075, -2.0249]], [[ 0.5867, -5.6429, -6.5581, ..., -1.5748, -1.3092, -1.8717]], ..., [[ 0.7526, -3.3405, -5.0103, ..., -3.2669, -4.2596, -2.6065]], [[ 2.6244, -1.4602, -2.6811, ..., -1.5631, -2.4234, 0.7794]], [[ 1.0462, -4.7770, -4.6522, ..., -3.4372, -5.2996, -1.8237]]], [[[ 2.4988, -5.9965, -7.1377, ..., -5.0187, -2.5784, -2.3791]], [[ 4.8838, -11.7672, -11.9758, ..., -6.9862, -0.7868, -1.1076]], [[ 0.2115, -5.5501, -5.8613, ..., -1.7968, -1.0876, -2.1797]], ..., [[ 1.0567, -2.8382, -4.5204, ..., -4.5611, -4.7464, -5.1858]], [[ 1.5584, -1.3119, -1.8798, ..., -1.2637, -0.4810, -1.6657]], [[ 1.1386, -5.0034, -4.8006, ..., -3.3130, -3.5753, -1.3120]]], [[[ 1.8256, -1.8150, -3.9280, ..., -3.3474, -2.8834, -1.3177]], [[ 3.9357, -6.2479, -7.8628, ..., -5.9217, -2.8683, -2.7721]], [[ 0.8403, -3.6271, -5.7892, ..., -0.1059, -1.0124, -2.2906]], ..., [[ 0.8181, -2.4345, -3.2265, ..., -2.6114, -2.1872, -2.2942]], [[ 2.1639, -0.9132, -0.3003, ..., 0.1785, 0.2173, 1.1477]], [[ 0.9649, -3.5264, -1.8880, ..., -3.7911, -3.1201, -0.3689]]], [[[ 1.7274, -7.9655, -6.0021, ..., -4.4894, -2.3258, -3.2769]], [[ 3.6848, -12.3919, -8.8004, ..., -4.9865, -5.5507, -4.0945]], [[ 1.0065, -6.3766, -6.0139, ..., -2.9004, -1.5246, -2.7032]], ..., [[ 0.9556, -3.4879, -4.4329, ..., -4.4018, -3.3310, -3.3864]], [[ 3.2188, -0.0561, -1.8730, ..., -2.0163, -0.8717, 1.7436]], [[ 0.8172, -4.1989, -4.0400, ..., -3.7378, -3.7174, -1.8715]]]]) attn_weights tensor([[[[-0.8083, -5.5022, -4.0867, ..., -1.2122, -1.8350, -2.0684]], [[ 0.8443, -5.9113, -8.5586, ..., -4.8138, -3.5890, -5.2712]], [[ 0.5884, -3.0741, -3.2728, ..., -3.0430, -3.6618, -2.6681]], ..., [[ 4.3604, -4.8549, -4.2591, ..., -2.3928, -2.6197, -1.4054]], [[ 3.0112, -3.4893, -3.5698, ..., -2.2101, -0.1155, -1.8102]], [[-0.1401, -5.1252, -6.5300, ..., -2.2259, -2.1053, -2.1597]]], [[[-0.8845, -4.7687, -3.7284, ..., 0.0478, 1.0302, -2.4772]], [[ 1.5910, -5.8660, -6.6628, ..., -3.5500, -5.7476, -2.1971]], [[ 0.3034, -2.8887, -3.0153, ..., -2.5420, -3.7167, -3.1935]], ..., [[ 3.9863, -8.2945, -6.7518, ..., -3.8328, -5.2414, -1.2749]], [[ 3.0618, -3.9486, -2.7033, ..., -1.4024, -2.3898, 0.0911]], [[-0.1751, -5.1056, -5.6471, ..., -0.1639, -0.5744, -2.1463]]], [[[-1.3714, -5.8365, -4.3294, ..., -0.2954, -1.2875, -3.1651]], [[ 0.1562, -5.1446, -7.1942, ..., -4.6537, -1.9154, -3.3911]], [[ 0.2397, -3.4496, -3.2119, ..., -3.7804, -3.6330, -3.7458]], ..., [[ 4.7040, -8.0833, -7.9403, ..., -4.5851, -2.3220, -2.5784]], [[ 2.9437, -3.9248, -3.0981, ..., -2.3714, -1.3690, -1.2831]], [[-0.2241, -4.7661, -5.7711, ..., -2.0645, 0.9421, -1.3773]]], [[[-0.3620, -7.0615, -7.8207, ..., -3.5520, -3.0531, -3.1016]], [[ 0.2492, -5.1728, -7.4297, ..., -3.9026, -4.3754, -3.3523]], [[ 0.3667, -2.8554, -3.3871, ..., -2.9151, -1.7716, -2.7086]], ..., [[ 3.9479, -4.4345, -4.5010, ..., -4.6351, -1.6097, -2.2737]], [[ 2.6254, -2.3481, -2.0707, ..., -1.8645, -2.5914, -1.5598]], [[ 0.0459, -5.1494, -8.7917, ..., -2.2738, -1.9248, -3.7249]]], [[[-0.4185, -5.4906, -6.4555, ..., -2.3779, -1.1506, -2.2362]], [[ 1.7174, -6.3816, -7.2905, ..., -4.1846, -3.0646, -1.2501]], [[ 0.4727, -3.5512, -3.8844, ..., -3.1766, -3.0588, -3.1218]], ..., [[ 3.7869, -8.8313, -4.7533, ..., -4.3343, -3.6203, -3.5679]], [[ 2.8849, -5.1145, -4.0086, ..., -1.9328, -2.5336, -2.3452]], [[-0.2036, -5.9843, -6.2543, ..., -2.5565, -0.1144, -3.0908]]]]) attn_weights tensor([[[[ -0.2628, -8.1685, -7.1162, ..., -4.7231, -3.7200, -4.1976]], [[ 3.3464, -0.2432, -0.5904, ..., -1.5623, -1.1694, -2.3706]], [[ 6.2074, -2.6756, -2.4275, ..., -0.3080, 1.0340, -0.0729]], ..., [[ 0.3354, -3.2098, -2.9577, ..., -1.4569, -1.3245, -1.7181]], [[ 4.0091, -2.8574, -2.4561, ..., -2.5608, -0.0149, -1.4013]], [[ 3.1052, -4.0906, -4.3214, ..., -1.7291, -0.4525, -1.6289]]], [[[ -0.5310, -7.5026, -7.7784, ..., -2.3329, 0.2099, -3.6168]], [[ 2.7274, -3.3109, -2.7731, ..., -2.3360, -1.8176, -1.4281]], [[ 6.5538, -0.9678, -4.1606, ..., -2.2137, -4.2850, -0.4733]], ..., [[ 0.4597, -4.0839, -3.8707, ..., -0.3490, -1.2892, -1.2362]], [[ 3.8386, -3.4177, -3.9452, ..., -2.2853, -2.2149, -1.1510]], [[ 3.7083, -3.1086, -4.7003, ..., -3.0478, -3.9335, -0.8252]]], [[[ -0.7073, -9.0414, -8.1101, ..., -2.3014, -0.6549, -4.2678]], [[ 2.1628, -2.8355, -3.3453, ..., -2.3239, -0.9998, -1.3006]], [[ 6.4681, -4.5487, -6.4895, ..., -4.7736, -1.7212, 0.0868]], ..., [[ -0.0349, -3.8351, -3.8108, ..., -1.1365, -0.0644, -2.0345]], [[ 3.8527, -4.6675, -5.1221, ..., -2.3482, 0.1249, -0.7093]], [[ 2.7490, -4.6487, -6.5774, ..., -6.0483, -4.9313, -3.5582]]], [[[ -0.7557, -8.0373, -10.4471, ..., -2.0343, -1.6716, -4.5865]], [[ 2.2225, -1.3525, -0.7648, ..., 0.2560, 0.1829, -0.0118]], [[ 5.3120, -0.6256, -3.2513, ..., -2.6599, 0.1287, -2.2085]], ..., [[ 0.6520, -4.2196, -5.6607, ..., -0.4241, -0.6312, -1.5745]], [[ 3.3650, -1.3731, -2.7209, ..., -1.8047, -0.6787, -1.1752]], [[ 3.0985, -2.4112, -3.6425, ..., -3.7481, -3.3870, -1.9841]]], [[[ -0.8193, -6.5839, -7.3190, ..., -3.5419, -0.9921, -3.8863]], [[ 4.0864, -4.0671, -4.3982, ..., -3.4389, -2.5405, -0.6167]], [[ 6.1518, -3.5370, -3.3255, ..., -2.4982, -2.6260, 0.2689]], ..., [[ 0.3324, -5.9807, -5.7320, ..., -1.7891, -2.0173, -2.2420]], [[ 4.6058, -4.4934, -2.2808, ..., -2.2352, -2.9679, -0.9302]], [[ 3.3696, -2.7593, -5.0709, ..., -3.6049, -3.6812, -3.0460]]]]) attn_weights tensor([[[[ 1.1366e+00, -1.4362e+00, -1.8504e+00, ..., -2.5724e+00, -5.2229e-01, 1.4145e-02]], [[ 4.6965e+00, -2.4401e-01, -1.2745e+00, ..., -2.1016e+00, 1.0135e+00, 3.9522e-01]], [[ 1.1562e+00, -5.9188e-01, -1.6625e+00, ..., 4.8877e-03, -4.3632e-01, -2.0317e-01]], ..., [[ 1.0973e+00, -1.7440e+00, -1.7874e+00, ..., -3.2857e+00, -2.3069e+00, -1.7247e+00]], [[ 1.5067e+00, -2.2909e+00, -2.4550e+00, ..., -1.7607e+00, -4.3173e-01, -8.5199e-02]], [[ 1.0586e+00, -3.5136e+00, -4.4905e+00, ..., -4.3790e+00, -3.8545e+00, -3.8824e+00]]], [[[ 1.4010e+00, -2.8220e+00, -4.6017e+00, ..., -9.5341e-01, -2.3083e+00, -5.5980e-01]], [[ 5.6926e+00, -1.4737e+00, -1.2136e+00, ..., 6.4518e-01, -4.5881e-01, 2.1523e+00]], [[ 1.7339e+00, -1.4790e+00, -2.0307e+00, ..., -3.2999e-01, -1.4630e+00, -1.9658e+00]], ..., [[ 1.5742e+00, -4.8635e+00, -4.7571e+00, ..., -2.6643e+00, -2.0523e+00, -4.0679e-01]], [[ 1.2042e+00, -4.4086e+00, -3.7918e+00, ..., -1.5282e+00, -1.8366e+00, -4.8707e-01]], [[ 1.0008e+00, -4.2548e+00, -3.8099e+00, ..., -3.6234e+00, -2.9713e+00, -3.3484e+00]]], [[[ 1.0791e+00, -3.7591e+00, -3.0462e+00, ..., -2.5795e+00, -2.6011e+00, -2.5073e+00]], [[ 4.6413e+00, -2.4158e+00, -4.1637e+00, ..., -2.8439e+00, -2.1331e+00, -6.0205e-01]], [[ 2.0876e+00, -2.0229e+00, -2.7906e+00, ..., -3.1004e+00, -1.3839e+00, -1.7927e+00]], ..., [[ 6.8536e-01, -4.4230e+00, -3.8691e+00, ..., -2.5134e+00, -2.8059e+00, -3.3584e+00]], [[ 1.1562e+00, -4.4895e+00, -5.0545e+00, ..., -2.3274e+00, -2.2484e+00, -1.3639e+00]], [[ 8.3981e-01, -3.5876e+00, -4.5939e+00, ..., -3.8117e+00, -4.4106e+00, -4.7123e+00]]], [[[ 1.1440e+00, -2.6237e+00, -2.5266e+00, ..., -1.8901e+00, -1.2227e+00, -1.4835e+00]], [[ 3.4821e+00, -1.9671e+00, -3.9477e+00, ..., -2.3728e+00, -1.5112e+00, -2.7944e+00]], [[ 1.9714e+00, -1.1451e+00, -2.9216e+00, ..., -1.1029e+00, -6.7926e-01, -2.5273e+00]], ..., [[ 8.1102e-01, -3.0722e+00, -2.8984e+00, ..., -2.4362e+00, -1.8362e+00, -1.6787e+00]], [[ 1.1176e+00, -3.2619e+00, -3.2176e+00, ..., -2.5736e+00, -2.1933e+00, -1.7422e+00]], [[ 8.3975e-01, -3.6123e+00, -4.1589e+00, ..., -3.5755e+00, -3.1224e+00, -3.7218e+00]]], [[[ 1.1148e+00, -4.0027e+00, -4.5466e+00, ..., -2.1629e+00, -2.1655e+00, -3.2068e+00]], [[ 4.9132e+00, -1.8137e+00, -2.2333e+00, ..., -8.2448e-01, -1.1566e+00, 2.3091e-01]], [[ 2.7614e+00, -2.2924e+00, -3.7612e+00, ..., -2.0640e+00, -1.8022e+00, -1.6582e+00]], ..., [[ 2.0047e+00, -4.9001e+00, -5.2222e+00, ..., -4.7795e+00, -3.7089e+00, 3.5021e-01]], [[ 1.3609e+00, -4.2117e+00, -4.1393e+00, ..., -2.2744e+00, -2.3010e+00, -1.1801e+00]], [[ 1.3800e+00, -4.0940e+00, -4.1837e+00, ..., -3.9442e+00, -1.9076e+00, -1.7155e+00]]]]) attn_weights tensor([[[[ 2.1579, 0.3470, -0.6039, ..., -1.5254, -0.4394, 0.0216]], [[ 5.0526, 0.2248, -1.6591, ..., -1.4221, 0.7034, 0.0643]], [[ 1.9777, -0.9734, -0.8586, ..., -4.9488, -2.9590, -2.0671]], ..., [[ 4.6092, -0.5154, -2.9816, ..., -4.0433, -1.4131, -2.2458]], [[ 2.0255, -3.6231, -2.8079, ..., -1.3960, -0.1611, -0.1396]], [[ 3.9335, -1.7725, -2.4147, ..., -1.0536, -2.1592, -1.5475]]], [[[ 2.6359, -4.1796, -4.4877, ..., -4.1983, -3.5513, -1.3324]], [[ 3.4658, -0.0557, -2.2825, ..., -1.7512, -1.8008, -1.6920]], [[ 2.6091, -5.0016, -4.4583, ..., -4.4694, -3.8280, -1.6882]], ..., [[ 3.9244, -2.0773, -2.8249, ..., -2.0535, -2.8079, -1.0476]], [[ 1.6764, -7.3927, -7.3187, ..., 0.3221, 1.0335, -1.0292]], [[ 3.9781, -0.0337, -2.5709, ..., -1.2319, -1.2107, -1.4846]]], [[[ 1.5577, -3.2025, -2.1308, ..., -1.8188, -2.0107, -3.8568]], [[ 4.4562, -2.8698, -4.9067, ..., -4.8933, -0.7293, -0.8771]], [[ 1.1491, -2.1232, -2.3278, ..., -2.2539, -1.8991, -2.6376]], ..., [[ 3.8369, -2.7252, -4.2847, ..., -3.6318, -0.9001, -1.5466]], [[ 0.7403, -5.3581, -5.2340, ..., -0.9081, -0.6052, -1.3427]], [[ 3.5479, -1.3584, -3.3798, ..., -2.8501, -2.9900, -3.3717]]], [[[ 1.7508, -1.4805, -3.2297, ..., -2.7267, -1.3833, -2.7682]], [[ 3.4326, -0.4567, -1.5812, ..., -2.8137, -1.1098, -1.4791]], [[ 1.3365, -2.1804, -2.6877, ..., -1.2776, -0.5570, -1.9093]], ..., [[ 3.8114, -1.7154, -2.2727, ..., -2.9527, -1.7741, -2.1609]], [[ 1.1522, -3.7477, -5.2659, ..., -2.3585, -1.2200, -2.0328]], [[ 3.5402, -0.3380, -2.6190, ..., -2.2925, -1.4535, -2.4840]]], [[[ 2.9284, -4.6951, -5.3025, ..., -3.6150, -0.4860, -0.5648]], [[ 4.2223, -4.1694, -4.6747, ..., -2.5339, -2.1412, -2.8898]], [[ 2.8750, -3.7159, -3.6598, ..., -2.4814, -0.8824, -1.1508]], ..., [[ 4.2394, -1.4691, -2.2526, ..., -1.0979, -0.2836, 0.6703]], [[ 1.4224, -5.7204, -6.0475, ..., -2.7309, 0.4240, -2.3781]], [[ 3.9804, -1.6492, -4.1191, ..., -1.9781, -3.2809, -2.2162]]]]) attn_weights tensor([[[[ 3.1481, -2.4782, -3.0111, ..., -3.5065, -1.7116, -2.4103]], [[ 4.3784, 0.1971, -0.5076, ..., 0.8227, 0.3366, 0.4530]], [[ 3.9405, -0.4044, -1.3462, ..., -1.8227, 0.8323, -0.7319]], ..., [[ 1.6691, -4.9240, -5.0771, ..., -1.8896, -2.4827, -1.6461]], [[ 4.4121, -0.4849, -1.7919, ..., -1.7398, -0.0872, -0.8778]], [[ 5.3733, 1.5212, 0.3595, ..., 0.3741, 2.9238, 0.3864]]], [[[ 2.7020, -3.2363, -3.2709, ..., -3.3261, -3.5588, -0.4911]], [[ 3.7250, -1.2089, -3.8617, ..., -2.0719, -2.3942, -0.5606]], [[ 2.7365, -0.3957, -1.1741, ..., -1.4358, -1.2256, -1.1827]], ..., [[ 0.3988, -3.4718, -3.9331, ..., -0.6344, -0.2076, 0.1190]], [[ 3.1870, -2.4899, -1.3141, ..., -3.0768, -2.7337, -1.7465]], [[ 4.3139, -2.0215, 0.1590, ..., 0.7023, 2.3032, -0.7565]]], [[[ 2.4394, -3.2780, -3.6597, ..., -3.5574, -2.8304, -3.1357]], [[ 4.0358, -1.8781, -5.1577, ..., -2.3471, -0.2117, -0.4135]], [[ 3.6539, -1.2437, -2.2206, ..., -1.3511, -0.3209, -0.8684]], ..., [[ 0.6314, -5.9389, -6.0422, ..., -1.6327, -0.9512, -1.6498]], [[ 3.3980, -2.1784, -2.7313, ..., -2.1728, -1.5264, -2.3089]], [[ 4.1582, -0.7544, 1.4711, ..., 3.5108, 3.4563, 2.4055]]], [[[ 2.5553, -3.8264, -4.1013, ..., -2.9741, -2.1940, -3.2550]], [[ 3.2415, -1.4575, -1.2489, ..., -2.7751, -1.6629, -1.4234]], [[ 3.4590, -1.9812, -2.1909, ..., -0.7011, -1.0335, -1.4803]], ..., [[ 2.1897, -5.1638, -5.0762, ..., -2.4025, -2.0083, -2.1938]], [[ 3.4462, -2.5412, -2.5501, ..., -1.7642, -1.9635, -2.3006]], [[ 4.0452, -0.7332, -1.2480, ..., -1.1880, -0.3643, -1.1301]]], [[[ 3.5683, -4.1459, -4.5081, ..., -2.7049, -1.4376, -0.8031]], [[ 4.5917, -3.8022, -4.4047, ..., -2.1512, -0.1172, 0.1424]], [[ 3.9278, -2.4417, -2.8222, ..., -0.7119, -0.6253, -0.3736]], ..., [[ 1.2557, -6.3068, -6.6808, ..., -2.4246, -0.2442, -1.5506]], [[ 3.4444, -2.8949, -2.9119, ..., -1.8265, -1.4881, -0.9298]], [[ 4.5651, -1.5126, -1.2256, ..., 1.0733, 3.4249, 1.3394]]]]) attn_weights tensor([[[[ 1.4026e+00, 5.8192e-01, 4.5063e-01, ..., -7.0201e-01, -1.9656e-01, 1.7851e-01]], [[ 3.9361e+00, -2.5069e-01, -3.7167e-01, ..., -8.7921e-01, -1.6758e-01, -1.5856e+00]], [[ 3.9525e+00, -8.1886e-01, -1.4453e+00, ..., -1.7835e+00, -1.5844e+00, -1.2557e+00]], ..., [[ 5.1285e+00, 1.5793e+00, 4.8487e-01, ..., 3.0319e-01, 1.8330e+00, 1.5043e+00]], [[ 3.8830e+00, 9.6325e-01, 1.4152e+00, ..., 1.1436e+00, 3.6776e+00, 1.9287e+00]], [[ 3.7846e+00, 2.0764e-01, 1.6904e+00, ..., 2.0795e+00, 2.0811e+00, 1.0610e+00]]], [[[ 8.7619e-01, 8.3199e-01, 5.5596e-01, ..., 1.2149e+00, 8.3851e-01, 5.3489e-01]], [[ 3.4600e+00, 1.1716e-02, -5.5820e-01, ..., 3.1497e-01, 4.4214e-01, 7.5257e-01]], [[ 2.9254e+00, 4.0358e-02, -1.5649e+00, ..., -2.3458e+00, -2.4654e+00, -3.8243e-01]], ..., [[ 3.8135e+00, -2.6933e-01, -1.6013e+00, ..., -1.8527e+00, -1.7077e+00, 5.4326e-01]], [[ 2.5715e+00, 1.0274e+00, -8.4023e-01, ..., -6.5994e-01, -2.3328e-01, 6.7638e-01]], [[ 3.2217e+00, 3.3345e+00, -1.3170e-01, ..., 7.1504e-01, 2.8063e-01, 7.5391e-01]]], [[[ 1.1530e+00, -1.1437e-03, -2.8926e-01, ..., 2.1839e-01, 2.2855e-01, -3.5501e-01]], [[ 3.4379e+00, -4.9033e-01, -7.9362e-01, ..., 3.4163e-01, 5.9129e-01, 4.4095e-01]], [[ 2.6028e+00, -1.5721e+00, -1.9733e+00, ..., -1.3474e+00, -1.0091e+00, -2.0911e+00]], ..., [[ 4.3625e+00, -1.1215e+00, -1.7324e+00, ..., -1.0263e+00, 1.3562e+00, 3.4159e-01]], [[ 2.0047e+00, -1.6849e+00, -4.9215e-01, ..., 1.4639e+00, 1.5058e+00, -3.0453e-01]], [[ 2.7724e+00, -1.0796e+00, 1.1491e-01, ..., 2.7767e+00, 2.4716e+00, 8.7822e-01]]], [[[ 1.6014e+00, 9.6175e-01, 4.4737e-01, ..., 5.8780e-01, 9.3495e-01, 7.9988e-01]], [[ 4.1665e+00, -1.1105e+00, -1.2359e+00, ..., -7.5256e-01, -9.6858e-01, -1.4705e+00]], [[ 3.8749e+00, -1.3319e+00, -2.1609e+00, ..., -1.9641e+00, -2.3497e+00, -1.8883e+00]], ..., [[ 4.5219e+00, 3.0426e-02, -5.7373e-01, ..., -1.3032e+00, -1.4825e-01, -5.1304e-01]], [[ 3.9776e+00, 7.2777e-01, 2.0862e+00, ..., -1.2483e+00, 4.2401e-01, 1.9092e+00]], [[ 3.2976e+00, -6.1895e-01, 9.3762e-01, ..., -1.1607e+01, -6.8447e+00, 1.4246e+00]]], [[[ 1.9489e+00, -1.1347e+00, -2.2496e+00, ..., 5.0653e-01, 7.0992e-01, 8.5614e-01]], [[ 4.4498e+00, -7.7282e-01, -1.5199e+00, ..., 4.5604e-01, 1.2994e+00, -3.3576e-01]], [[ 3.4829e+00, -1.3897e+00, -1.5048e+00, ..., -1.5903e-01, -8.7087e-01, -6.6106e-01]], ..., [[ 4.3329e+00, -2.3302e+00, -4.2047e+00, ..., -1.8670e+00, 2.1349e-01, -2.0677e-01]], [[ 3.1883e+00, -5.4868e-01, -1.5076e+00, ..., -6.5451e-02, 1.3539e+00, 9.7195e-01]], [[ 3.9820e+00, -4.5219e-01, -1.2086e+00, ..., 1.5335e-01, 3.0165e+00, 8.7870e-02]]]]) attn_weights tensor([[[[-0.4979, -1.8560, -1.4425, ..., -1.2980, -2.2804, -0.4057]], [[ 2.4768, 1.8874, 2.3614, ..., 1.8454, 1.6257, 11.5709]], [[-1.7945, -2.4423, -2.4607, ..., -1.7101, -1.5055, -2.3926]], ..., [[-2.4926, -3.0662, -3.0296, ..., -2.8065, -2.6188, -3.1864]], [[ 0.1032, -0.6823, -0.6320, ..., -0.3289, -0.2476, 1.1252]], [[-1.2466, -2.2415, -3.1923, ..., -1.8386, -2.0613, -2.4064]]], [[[-1.8152, -5.3141, -2.7928, ..., -3.4587, -1.0811, -4.8716]], [[-3.6072, 1.9515, -4.1670, ..., -5.7432, -7.4761, 3.5659]], [[-2.4852, -1.4561, -3.2278, ..., -3.9695, -3.9052, -0.7942]], ..., [[-2.0285, -2.4775, -2.4675, ..., -2.5585, -2.4998, -2.1137]], [[-0.9094, -1.1146, -1.2831, ..., -1.1523, -1.2228, -0.4578]], [[-1.5488, -2.2968, -3.5658, ..., -3.0273, -2.2262, -2.3826]]], [[[-0.8980, -2.1824, -2.1722, ..., -1.6331, -2.4578, -1.9169]], [[ 3.7402, 1.5112, 2.1701, ..., 2.0968, 3.6386, 11.5740]], [[-1.3527, -2.2795, -2.1743, ..., -2.9691, -2.4128, -3.5099]], ..., [[-2.2189, -2.7758, -2.8551, ..., -2.9248, -2.5583, -3.2092]], [[-0.5118, -1.2575, -1.3887, ..., -0.7493, -0.5018, 0.8587]], [[-1.6114, -2.2593, -2.8142, ..., -2.1595, -1.8445, -2.6634]]], [[[-1.4282, -2.6699, -2.5412, ..., -2.1200, -2.2055, -2.2979]], [[-0.5058, 1.0235, -0.8470, ..., -1.2056, -1.0681, 9.0963]], [[-2.2302, -2.7412, -2.1194, ..., -2.7737, -2.2517, -2.3405]], ..., [[-2.2123, -2.6948, -2.7813, ..., -2.1797, -2.3990, -2.9771]], [[-0.8043, -0.9233, -1.4065, ..., -0.4546, -1.0860, 1.0562]], [[-0.8127, -2.0101, -3.1937, ..., -2.2343, -3.1411, -2.3831]]], [[[-1.6490, -2.6913, -2.5877, ..., -2.7200, -1.3844, -0.6453]], [[ 0.4255, -0.3968, 0.1347, ..., -1.0916, -0.2753, 9.0080]], [[-1.5922, -2.7656, -2.4799, ..., -2.9652, -1.6235, -2.6958]], ..., [[-2.4443, -2.8079, -2.9181, ..., -2.9906, -1.9709, -3.8551]], [[-0.9891, -1.2300, -1.5715, ..., -1.3138, -0.9085, 1.2260]], [[-1.3470, -2.5411, -2.8552, ..., -2.8737, -3.2897, -2.1735]]]]) attn_weights tensor([[[[-3.2286e+00, -5.8753e+00, -4.4915e+00, ..., -3.8896e-01, 1.6875e+00, -4.5087e-01]], [[-1.0030e+00, -2.7521e+00, -3.2542e+00, ..., 6.9117e-01, 1.3118e+00, 4.0432e-01]], [[-4.2471e+00, -4.6177e+00, -4.6977e+00, ..., -2.7334e+00, -2.6812e+00, -2.4942e+00]], ..., [[ 1.2230e+00, -4.2013e-01, 4.0129e-01, ..., -8.9077e-02, -3.6554e-01, -7.7485e-01]], [[-4.0432e+00, -2.8085e+00, -2.7293e+00, ..., -5.7476e-01, -7.1240e-01, -3.6264e-01]], [[ 1.1365e+00, -1.1063e-02, -3.0871e+00, ..., -1.6516e+00, 8.2716e-01, 4.7359e+00]]], [[[-7.2125e-01, -4.2012e+00, -2.7291e+00, ..., 4.0838e-01, 4.6214e-01, 2.9334e-01]], [[-1.2022e+00, -3.8113e+00, -3.2295e+00, ..., -4.1463e-01, -2.7935e-01, 6.3663e-01]], [[-4.0340e+00, -4.4425e+00, -4.4768e+00, ..., -2.6835e+00, -2.5416e+00, -2.1010e+00]], ..., [[ 1.2709e+00, -5.6689e-01, 2.5724e-01, ..., -1.7037e-01, -8.8435e-01, -1.1777e+00]], [[-3.8577e+00, -2.6892e+00, -2.5829e+00, ..., -7.0142e-01, -5.1977e-01, -2.1858e-01]], [[-4.3091e-01, -8.7580e-01, -2.2978e+00, ..., -1.4617e+00, -2.8848e+00, 8.8091e-02]]], [[[-3.1783e+00, -5.7680e+00, -5.0386e+00, ..., 5.1796e-01, 2.2183e+00, -1.0487e+00]], [[-1.7238e+00, -3.3695e+00, -3.8837e+00, ..., 3.4899e-01, 4.5154e-01, -6.4322e-02]], [[-3.7968e+00, -4.0719e+00, -4.2316e+00, ..., -3.2194e+00, -2.8240e+00, -2.5527e+00]], ..., [[ 1.1667e+00, -4.7248e-01, 4.4622e-01, ..., -1.0559e+00, -7.9621e-01, -1.6150e+00]], [[-3.9328e+00, -2.5927e+00, -2.5141e+00, ..., -9.4883e-01, -9.0986e-01, -5.4909e-01]], [[ 1.7264e+00, 7.0093e-01, -4.1868e+00, ..., -1.7320e+00, -2.4780e+00, 5.2585e+00]]], [[[-1.0419e+00, -2.9181e+00, -2.1698e+00, ..., 1.3045e+00, 3.2384e+00, 3.3084e-01]], [[-2.0351e+00, -3.1368e+00, -3.6325e+00, ..., 1.5934e+00, 1.8487e+00, 6.1903e-01]], [[-4.0935e+00, -4.3436e+00, -4.5169e+00, ..., -2.5113e+00, -2.6943e+00, -2.4209e+00]], ..., [[ 1.0938e+00, -2.7742e-01, 5.0071e-01, ..., -8.1681e-01, 2.7074e-01, -1.1047e+00]], [[-4.0982e+00, -2.6686e+00, -2.5847e+00, ..., -7.4999e-01, -6.7733e-01, -4.9000e-01]], [[ 6.6034e-01, -1.0946e-02, -3.3801e+00, ..., 1.0467e+00, -2.9704e+00, 4.5560e+00]]], [[[-2.1860e+00, -3.7701e+00, -3.6987e+00, ..., 1.0088e+00, 7.0849e-01, 4.7792e-01]], [[-1.4932e+00, -3.2513e+00, -3.3863e+00, ..., 3.1775e-01, 1.1158e-01, -9.7734e-02]], [[-4.1314e+00, -4.3250e+00, -4.4852e+00, ..., -2.8023e+00, -2.5556e+00, -2.3937e+00]], ..., [[ 9.6982e-01, -3.6375e-01, 1.8131e-01, ..., -8.5276e-01, -4.1471e-03, -8.6638e-01]], [[-3.9984e+00, -2.5259e+00, -2.4959e+00, ..., -4.8380e-01, -5.0014e-01, -4.4094e-01]], [[-3.3712e+00, -3.0327e+00, -5.5291e+00, ..., -5.3231e+00, -3.3132e+00, 1.1478e+00]]]]) attn_weights tensor([[[[ -2.0306, -5.8023, -6.4774, ..., -1.6632, -0.3411, -3.3358]], [[ 1.7217, -0.6883, -2.1042, ..., -3.0112, -0.9849, -1.8787]], [[ -6.5538, -19.4903, -18.2088, ..., -6.0615, -1.7202, -5.2202]], ..., [[ -4.4622, -10.5332, -10.6670, ..., -2.8593, -3.8645, -3.6000]], [[ -2.1683, -4.2508, -4.1098, ..., -0.6740, -1.1059, -0.2951]], [[ -0.3534, -5.9833, -5.9929, ..., -2.2702, -2.5808, -2.1562]]], [[[ -1.2787, -6.6051, -4.6365, ..., -2.5850, -1.5535, -2.7342]], [[ 1.4964, -1.6670, -1.3989, ..., -2.0359, -3.2220, -1.5217]], [[ -6.6081, -20.2754, -17.9913, ..., -4.8340, -2.6464, -3.3579]], ..., [[ -4.1311, -11.9748, -10.2844, ..., -2.9566, -1.1875, -3.4789]], [[ -1.8400, -3.8902, -3.7974, ..., -1.0862, -0.4832, -0.7623]], [[ -0.3489, -6.1883, -5.9364, ..., -2.7659, -2.5000, -2.5380]]], [[[ -1.8546, -5.3066, -5.6168, ..., -0.6839, -0.4585, -2.3720]], [[ 1.2776, -1.8688, -2.1349, ..., -1.8171, -1.7094, -2.7424]], [[ -6.3423, -16.2919, -15.6233, ..., -2.8039, -0.7729, -3.1561]], ..., [[ -4.3858, -10.3528, -9.6653, ..., -2.9376, -3.5235, -3.2048]], [[ -2.5772, -4.2757, -4.2623, ..., -1.4447, -1.1842, -0.7066]], [[ -0.3394, -5.5952, -5.5897, ..., -2.7171, -2.5444, -2.2607]]], [[[ -1.2349, -5.1972, -5.0613, ..., -1.7158, -0.5056, -1.6096]], [[ 1.4069, -0.7786, -2.4019, ..., -1.4276, -3.1826, -1.3875]], [[ -6.0637, -18.2494, -18.3739, ..., -4.7569, -2.9915, -5.4996]], ..., [[ -3.9598, -10.0484, -10.8022, ..., -2.9336, -1.9704, -3.3217]], [[ -2.1352, -3.9548, -3.9567, ..., -1.3438, -0.7351, -0.6549]], [[ -0.3816, -6.2239, -6.2301, ..., -2.8054, -2.5366, -2.5339]]], [[[ -1.3023, -5.8681, -5.2785, ..., -1.6309, -1.7364, -3.1758]], [[ 1.5116, -2.5390, -3.0742, ..., -1.4573, -1.5710, -3.5291]], [[ -4.6601, -17.5949, -18.2401, ..., -3.0396, -1.5245, -2.5041]], ..., [[ -4.6256, -11.2601, -11.7611, ..., -2.2688, -1.2255, -2.5796]], [[ -2.5465, -3.9071, -3.9998, ..., -0.8799, -0.8070, -0.5956]], [[ -0.3192, -5.9643, -5.9523, ..., -2.7987, -2.6005, -2.4733]]]]) attn_weights tensor([[[[ 4.8559, -0.5587, -3.2848, ..., -2.7073, -0.9721, 2.2162]], [[ -2.6254, -9.5782, -9.2125, ..., -5.0423, -4.6893, -4.9053]], [[ -4.5674, -14.2543, -14.6690, ..., -4.9046, -4.5595, -5.9854]], ..., [[ -1.8958, -8.6845, -7.5287, ..., -2.8215, -2.2508, -3.9977]], [[ -0.9719, -7.3725, -6.8204, ..., -3.2872, -4.6831, -2.6259]], [[ -2.6487, -9.5444, -9.8592, ..., -0.8294, -2.2738, -3.5472]]], [[[ 3.8076, -0.4937, -0.5869, ..., -1.8210, -3.2517, -1.4113]], [[ -2.6525, -9.4318, -7.7876, ..., -4.9698, -5.4412, -3.6813]], [[ -5.2928, -16.4610, -14.5068, ..., -5.0023, -4.6611, -6.3149]], ..., [[ -2.1454, -9.4768, -5.6451, ..., -2.1545, -4.5698, -3.6084]], [[ -1.2256, -7.1569, -6.7388, ..., -4.0249, -2.6278, -2.7457]], [[ -2.8579, -9.8589, -10.7485, ..., -3.5981, -2.8157, -3.4673]]], [[[ 5.2543, -0.0868, -2.0376, ..., -2.9345, -1.1604, 3.5578]], [[ -2.5713, -7.7009, -7.5917, ..., -3.8382, -3.8436, -6.9033]], [[ -4.3565, -13.0538, -13.7615, ..., -5.0943, -4.5007, -5.1248]], ..., [[ -1.7288, -8.0255, -8.4401, ..., -2.1152, -3.8356, -4.2990]], [[ -0.7690, -6.8835, -7.5248, ..., -4.3705, -4.2078, -2.1220]], [[ -2.1223, -9.4876, -11.3656, ..., -1.3139, -0.0303, -3.2909]]], [[[ 5.4539, 0.1410, -1.8906, ..., -0.4868, -2.5519, 2.3238]], [[ -2.4332, -8.8096, -9.7799, ..., -2.8043, -2.1573, -4.9731]], [[ -4.2659, -13.6795, -15.2869, ..., -4.3257, -3.4401, -4.7251]], ..., [[ -0.7657, -8.1619, -9.9419, ..., -3.7283, -2.8817, -3.0711]], [[ -0.9476, -7.0280, -6.8362, ..., -3.9005, -3.2105, -2.7667]], [[ -1.9646, -9.1926, -10.0814, ..., -2.5808, -2.2508, -2.6221]]], [[[ 4.8643, 0.6983, -0.6468, ..., -3.8604, -2.0964, 3.4518]], [[ -2.4945, -9.3658, -9.1058, ..., -2.7956, -3.9683, -4.8332]], [[ -4.9509, -16.9534, -19.0424, ..., -2.7990, -3.1503, -3.3847]], ..., [[ -1.4579, -8.4948, -8.9729, ..., -3.2640, -3.4227, -4.4797]], [[ -1.1967, -7.3040, -9.1829, ..., -3.5131, -2.4630, -2.4727]], [[ -2.5810, -10.7712, -11.9744, ..., -2.3769, -3.8947, -4.2648]]]]) attn_weights tensor([[[[ -1.5675, -12.1908, -12.5230, ..., -4.8169, -4.9180, -5.2509]], [[ -2.7323, -8.8851, -9.3604, ..., -4.3251, -4.7511, -4.8594]], [[ -0.1028, -3.8462, -3.9770, ..., -2.7665, -2.4976, -1.7116]], ..., [[ -1.4516, -6.1271, -6.8221, ..., 0.7591, -0.2499, -2.0918]], [[ 1.6033, -2.8873, -3.2362, ..., -2.3354, -2.0293, -3.8871]], [[ -7.4331, -34.5372, -37.0468, ..., 5.1837, 12.2062, 1.5245]]], [[[ -2.6161, -13.3186, -12.6667, ..., -1.8459, -3.6494, -4.5002]], [[ -2.1890, -11.3261, -10.2383, ..., -3.4930, -5.2727, -3.5259]], [[ -0.0865, -3.5952, -3.6422, ..., -3.9217, -4.6188, -2.9543]], ..., [[ -1.1973, -7.8187, -7.4772, ..., -2.2364, -2.7767, -4.4204]], [[ 1.3161, -3.1446, -3.1009, ..., -4.4551, -4.3937, -1.7429]], [[ -6.7179, -42.6006, -49.9073, ..., -15.3972, 13.3260, -2.6980]]], [[[ -2.4996, -11.2552, -10.5444, ..., -5.6476, -4.4714, -1.9365]], [[ -2.4494, -8.4094, -9.0186, ..., -2.6898, -2.6850, -3.7073]], [[ -0.0869, -2.2130, -3.2339, ..., -3.2803, -3.8125, -4.0253]], ..., [[ -1.0139, -5.3143, -4.5205, ..., -1.2975, -2.1498, -1.5858]], [[ 1.4505, -3.0786, -3.9336, ..., -4.0342, -4.5874, -4.2274]], [[ -5.6695, -33.2206, -34.1826, ..., 7.3559, 15.9369, 3.5700]]], [[[ -0.9505, -12.5330, -13.6178, ..., -4.5931, -5.0024, -5.0239]], [[ -2.1565, -9.5410, -10.4347, ..., -3.8649, -2.8445, -3.4455]], [[ 0.4093, -2.7294, -3.6442, ..., -1.3864, -1.7511, -3.9930]], ..., [[ -0.4116, -5.7682, -6.5716, ..., -4.2123, -2.2313, -3.3230]], [[ 1.5879, -1.5981, -1.9711, ..., -1.6783, -2.6670, -2.4674]], [[ -4.9001, -32.2076, -18.3039, ..., -12.0894, 13.8995, -0.6011]]], [[[ -1.9537, -13.1442, -13.9165, ..., -1.8970, -4.6712, -5.4883]], [[ -2.1026, -11.8613, -12.3124, ..., -3.3540, -3.9041, -4.6423]], [[ 0.2660, -4.8493, -4.7917, ..., -1.7160, -4.0683, -4.5154]], ..., [[ -0.3221, -8.8763, -7.8410, ..., -4.1376, -4.3718, -3.9671]], [[ 1.4813, -4.4066, -3.4236, ..., -2.5908, -3.7765, -2.8508]], [[ 2.0042, -35.0677, -43.1004, ..., -5.7294, 18.8557, 7.2756]]]]) attn_weights tensor([[[[ 2.8774, -4.3608, -4.0865, ..., -3.0876, -1.3152, -0.9767]], [[ 4.3213, -7.4629, -4.8668, ..., -9.4375, -6.0282, -2.2903]], [[ 0.7898, -5.3303, -5.7033, ..., -3.6868, -2.9880, -4.2379]], ..., [[ 0.9875, -3.8283, -3.9364, ..., -2.9080, -3.7822, -4.3124]], [[ 1.4089, -0.0336, -1.1077, ..., -1.8051, -2.8534, -0.6849]], [[ 1.2263, -2.9195, -3.1095, ..., -3.1990, -2.6937, -1.6808]]], [[[ 2.3052, -8.1774, -2.7157, ..., -3.2755, -1.3503, -2.1012]], [[ 3.9642, -12.6863, -2.7865, ..., -6.0079, -4.3278, -5.1225]], [[ 0.3450, -6.6682, -6.0099, ..., 1.0972, -0.5743, -3.6114]], ..., [[ 0.7655, -3.5164, -3.2457, ..., -3.8337, -2.5415, -2.1397]], [[ 1.8195, -2.4842, -3.6097, ..., -1.1227, 0.0359, 0.5523]], [[ 1.0164, -2.9069, -2.7966, ..., -4.2326, -1.9480, 0.0918]]], [[[ 2.5434, -5.4256, -5.6401, ..., -3.6559, -2.9511, -1.5907]], [[ 4.6496, -8.5229, -8.1253, ..., -8.5743, -9.1795, -4.4034]], [[ 0.3918, -4.0031, -3.8470, ..., -1.1356, -0.4616, -2.2535]], ..., [[ 1.0961, -2.9445, -4.6610, ..., -4.4427, -4.5603, -6.6136]], [[ 1.8056, -1.0308, -1.8236, ..., -2.3886, -2.8731, 0.2543]], [[ 0.9513, -4.7536, -4.2367, ..., -4.0796, -1.2726, -1.2415]]], [[[ 2.1262, -3.8436, -3.8930, ..., -3.1657, -3.0922, -1.9924]], [[ 4.4022, -12.3407, -11.0725, ..., -3.0346, -5.1356, -5.9919]], [[ 1.2053, -5.2632, -5.6754, ..., -1.4463, -0.8041, -3.3859]], ..., [[ 1.1602, -2.1031, -3.4849, ..., -1.8597, -2.5990, -6.8361]], [[ 2.3444, -0.9411, -0.6596, ..., 0.0893, -0.2549, -0.4545]], [[ 1.0047, -3.7492, -3.3406, ..., -3.5473, -2.1024, -2.4419]]], [[[ 2.1543, -9.3112, -7.9515, ..., -3.2118, -3.8451, -1.5161]], [[ 4.4974, -19.0787, -16.0180, ..., -8.8243, -10.3194, -2.4101]], [[ 0.6240, -7.1311, -7.5307, ..., -2.8066, -0.5301, -1.8255]], ..., [[ 0.7771, -4.2366, -4.9998, ..., -4.1124, -1.5698, -2.4279]], [[ 3.0567, -2.4333, -2.9573, ..., -1.3287, -1.3799, 0.5305]], [[ 0.8502, -4.3462, -4.9973, ..., -4.1830, -1.2667, -1.3176]]]]) attn_weights tensor([[[[ -1.0490, -4.8386, -4.4005, ..., -0.9030, -0.0618, -2.2102]], [[ 0.8696, -5.9584, -7.2072, ..., -4.3367, -4.7259, -2.3017]], [[ 0.4907, -3.4663, -3.4788, ..., -3.7017, -3.1223, -3.1616]], ..., [[ 4.8073, -2.5425, -1.8783, ..., -4.0722, -3.5741, -2.1851]], [[ 3.1830, -3.0493, -2.8863, ..., -1.0421, -1.9707, -1.9671]], [[ -0.5479, -5.3458, -6.6292, ..., -1.5357, -0.6888, -1.6027]]], [[[ -0.6055, -5.6105, -5.6478, ..., -3.0284, -2.9146, -3.1372]], [[ 0.2162, -6.6005, -6.7030, ..., -4.3068, -2.6702, -3.9202]], [[ 0.2868, -3.9905, -3.9094, ..., -4.1422, -3.2058, -2.4397]], ..., [[ 3.4740, -8.4694, -2.2164, ..., -1.5674, -1.1392, -0.7326]], [[ 3.0387, -4.3509, -2.5829, ..., -2.6259, -1.8016, -0.7823]], [[ -0.1167, -5.3019, -6.3468, ..., -0.1516, -3.1232, -2.9974]]], [[[ -1.2594, -5.8486, -4.0734, ..., -1.4113, -2.3648, -2.6167]], [[ 0.1127, -5.4766, -6.9985, ..., -4.0354, -4.0987, -2.7829]], [[ 0.2836, -3.1261, -3.1851, ..., -3.7454, -4.0842, -3.9407]], ..., [[ 5.0184, -5.9315, -2.4881, ..., -6.3926, -5.5287, -3.3489]], [[ 3.0538, -2.7415, -3.0263, ..., -2.3808, -1.9220, -1.6706]], [[ -0.2586, -5.1929, -6.7811, ..., -0.0581, -0.6729, -2.5078]]], [[[ -0.0799, -7.0061, -5.8959, ..., -2.8753, -1.3887, -2.9299]], [[ 0.7553, -5.2515, -7.5270, ..., -4.3914, -3.1706, -2.5301]], [[ 0.4346, -3.2664, -3.5277, ..., -1.9716, -2.4999, -3.5903]], ..., [[ 5.4603, -9.3679, -7.3828, ..., -0.1586, -6.0253, -6.8042]], [[ 2.6898, -2.8104, -1.7082, ..., -2.7027, -1.9018, -0.8568]], [[ 0.2082, -5.6324, -7.4854, ..., -2.6977, -2.4687, -2.3638]]], [[[ -0.8425, -5.4946, -6.5532, ..., -1.5335, -1.8854, -3.7107]], [[ 1.6604, -7.6317, -7.7932, ..., -2.5714, -2.9384, -0.5072]], [[ 0.4269, -3.2455, -3.7809, ..., -3.1823, -3.0236, -3.1294]], ..., [[ 4.3990, -15.4726, -9.6599, ..., -4.0217, -5.1240, 0.3714]], [[ 2.8613, -4.0371, -3.2296, ..., -1.9553, -2.6962, 0.8866]], [[ -0.3989, -5.8670, -6.4823, ..., 0.5375, -2.7111, -2.5869]]]]) attn_weights tensor([[[[-2.5237e-01, -9.0238e+00, -9.2361e+00, ..., -5.1173e+00, -2.7347e+00, -3.9049e+00]], [[ 3.6738e+00, -7.6423e-03, -2.5001e-01, ..., -3.6122e+00, -3.8191e+00, -2.5948e+00]], [[ 6.5812e+00, 2.2334e-01, -6.1565e-01, ..., -1.6409e+00, -8.6386e-01, -6.3412e-01]], ..., [[ 4.2254e-01, -3.8012e+00, -4.0011e+00, ..., -2.6913e+00, -1.9287e+00, -2.8896e+00]], [[ 4.4242e+00, 4.8765e-01, -1.7192e+00, ..., -3.0936e+00, -2.3301e+00, -1.6398e+00]], [[ 3.5423e+00, -2.5161e+00, -4.4034e+00, ..., -3.3331e+00, -2.2983e+00, -2.4982e+00]]], [[[-2.9000e-01, -1.0663e+01, -1.0857e+01, ..., -3.8767e+00, -3.4670e+00, -4.0445e+00]], [[ 2.6664e+00, -5.1116e+00, -4.2214e+00, ..., -1.0238e+00, -2.4151e+00, -1.7342e+00]], [[ 6.4776e+00, -4.6720e+00, -8.7723e-01, ..., -1.0917e+00, -1.1331e+00, 4.9590e-01]], ..., [[ 1.6318e-01, -4.0884e+00, -4.2079e+00, ..., -2.3269e+00, -1.6769e+00, -1.2034e+00]], [[ 3.7012e+00, -4.5716e+00, -1.6900e+00, ..., -1.5460e+00, -2.6180e+00, 6.2304e-01]], [[ 3.4052e+00, -4.9353e+00, -4.4830e-01, ..., -1.8864e+00, -2.1263e+00, -1.8700e+00]]], [[[-6.7575e-01, -9.5822e+00, -8.1781e+00, ..., -1.5726e+00, -1.5155e+00, -4.3025e+00]], [[ 3.2795e+00, -1.5118e+00, -1.8267e+00, ..., -3.0522e+00, -2.4267e+00, 1.5958e-01]], [[ 6.8753e+00, -3.5624e+00, -3.9080e+00, ..., -6.1253e+00, -4.8203e+00, -1.5983e+00]], ..., [[-4.6239e-02, -3.4175e+00, -3.1032e+00, ..., -1.4097e+00, -1.7859e+00, -2.8222e+00]], [[ 4.6821e+00, -4.4877e+00, -2.7005e+00, ..., -4.7962e+00, -4.0511e+00, -1.1125e+00]], [[ 2.7412e+00, -3.2515e+00, -3.6237e+00, ..., -5.2218e+00, -4.6741e+00, -3.1733e+00]]], [[[-7.8423e-01, -8.5536e+00, -8.0735e+00, ..., -3.4218e+00, -1.9678e+00, -5.3464e+00]], [[ 3.3105e+00, -1.3973e+00, -1.7522e+00, ..., -7.5024e-01, -1.7910e+00, -2.1912e+00]], [[ 6.1570e+00, -5.6439e+00, -5.1975e+00, ..., -1.2293e+00, -4.7506e+00, -4.3477e+00]], ..., [[ 7.9790e-01, -4.5409e+00, -5.2298e+00, ..., -1.2940e+00, -6.5451e-01, -2.0198e+00]], [[ 5.2222e+00, -3.8149e+00, -3.0939e+00, ..., -8.4778e-01, -3.0894e+00, -5.7417e+00]], [[ 3.5725e+00, -4.0699e+00, -4.3398e+00, ..., -5.6198e+00, -5.3101e+00, -3.7528e+00]]], [[[-1.3490e+00, -6.2400e+00, -7.9380e+00, ..., -1.4197e-01, -1.8720e+00, -3.9808e+00]], [[ 2.8703e+00, -4.0857e+00, -4.6417e+00, ..., 2.5527e-02, -9.0290e-01, 1.3520e+00]], [[ 7.1070e+00, -6.4559e+00, -4.8609e+00, ..., -1.8785e+00, -1.2629e+00, 2.5861e+00]], ..., [[-2.8784e-02, -5.2329e+00, -4.9753e+00, ..., -6.4229e-01, -1.0734e+00, -1.7948e+00]], [[ 5.1687e+00, -7.6154e+00, -2.7668e+00, ..., -2.0454e+00, -1.4751e+00, 1.0000e+00]], [[ 3.5644e+00, -3.5367e+00, -3.5052e+00, ..., -2.3789e+00, -3.0849e+00, 1.0741e+00]]]]) attn_weights tensor([[[[ 1.2188, -3.0619, -2.4988, ..., -1.6970, -0.8871, -1.6855]], [[ 5.0779, 1.1047, -1.6347, ..., -3.6332, -2.4087, -0.2544]], [[ 1.7189, -0.2977, -0.3449, ..., -0.5073, 0.2953, -0.9116]], ..., [[ 1.0124, -2.4860, -2.2222, ..., -2.6220, -2.1927, -1.9226]], [[ 1.5784, -2.3901, -1.8994, ..., -1.3451, -0.8930, -0.2911]], [[ 1.4255, -2.4940, -3.3218, ..., -4.4920, -4.5032, -3.8619]]], [[[ 1.1645, -4.6096, -4.0034, ..., -2.1234, -1.0106, -0.6068]], [[ 5.1042, -3.7630, -1.3388, ..., 0.9510, -0.6108, 1.3174]], [[ 1.2996, -2.0178, -1.6851, ..., -1.1223, -0.4223, -0.7668]], ..., [[ 1.4452, -5.3062, -4.3780, ..., -1.9773, -0.6473, -2.3068]], [[ 1.0585, -4.8627, -3.1582, ..., -1.7989, -0.9469, -0.2081]], [[ 0.5370, -2.8834, -2.2892, ..., -3.6659, -2.6518, -3.8724]]], [[[ 1.2211, -3.4051, -3.8855, ..., -3.0315, -3.8430, -3.4086]], [[ 4.7346, -1.0450, -2.3789, ..., -3.2325, -2.7079, -0.8506]], [[ 1.9400, -1.8509, -3.0155, ..., -1.6467, -2.4448, -2.2852]], ..., [[ 1.1717, -4.5499, -3.5705, ..., -4.3850, -4.0691, -2.9042]], [[ 0.9314, -4.4801, -4.3584, ..., -3.9983, -3.2039, -1.7463]], [[ 1.1398, -3.6578, -3.8764, ..., -5.0990, -5.5109, -3.9315]]], [[[ 1.2986, -3.1302, -2.7052, ..., -1.3433, -1.7132, -3.7433]], [[ 4.1014, -1.8457, -4.3229, ..., -1.3463, -4.1025, -1.4522]], [[ 2.3274, -2.2050, -2.9618, ..., -1.2836, -2.5472, -2.6301]], ..., [[ 0.8109, -2.6087, -2.4246, ..., -1.8069, -1.3731, -2.1090]], [[ 1.3510, -2.9639, -3.1436, ..., -2.4235, -2.3629, -1.6942]], [[ 0.8046, -4.1952, -4.8115, ..., -3.1584, -3.5868, -4.5239]]], [[[ 1.2799, -4.0694, -4.7448, ..., -2.5051, -3.9183, -3.0297]], [[ 6.0823, -3.1033, -1.5079, ..., -0.2284, -0.4346, 2.6240]], [[ 1.9786, -1.0586, -2.6775, ..., -0.6278, -2.2708, -1.8211]], ..., [[ 1.9361, -4.0288, -4.3026, ..., -2.7418, 0.1327, 0.4092]], [[ 1.3127, -4.6709, -3.9781, ..., -1.7248, -1.1081, 0.1072]], [[ 1.2711, -4.3440, -4.3663, ..., -2.4112, -2.9465, -3.9014]]]]) attn_weights tensor([[[[ 3.2391, -1.0404, -2.3836, ..., -3.7423, -2.3598, -1.8611]], [[ 4.9836, 0.7549, -1.1249, ..., -1.5504, -0.9855, -0.3830]], [[ 3.1724, -1.3185, -0.6613, ..., -4.4397, -2.6356, -3.6029]], ..., [[ 4.1882, 0.1554, -2.3532, ..., -4.1839, -3.3374, -1.7684]], [[ 2.2127, -4.7263, -4.4031, ..., -1.4547, -0.1025, -1.8282]], [[ 3.5061, -0.4217, -1.9324, ..., -2.4578, -1.4381, -2.1373]]], [[[ 1.9273, -3.0833, -3.6493, ..., -2.9536, 0.5858, -3.4037]], [[ 3.5751, -1.8471, -2.5047, ..., -1.5658, -2.2447, -0.2546]], [[ 2.0678, -4.8777, -4.3714, ..., -3.0110, -0.7889, -3.1589]], ..., [[ 3.2695, -2.3709, -1.9499, ..., -2.9412, -1.0099, -1.4270]], [[ 2.3873, -6.9212, -7.3237, ..., -2.7838, -2.1314, -3.7998]], [[ 4.4009, -2.3584, -1.3528, ..., -0.6945, -2.3467, -0.6712]]], [[[ 2.7249, -2.9805, -3.2045, ..., -3.1320, -4.5223, -1.7984]], [[ 3.5329, -1.9537, -2.3009, ..., -1.9019, -2.1079, -1.7907]], [[ 2.9376, -3.2335, -3.1799, ..., -4.8049, -4.3502, -3.2716]], ..., [[ 4.7855, -1.6771, -2.1130, ..., -2.6949, -3.8634, -2.6397]], [[ 1.8658, -6.4485, -4.9061, ..., -0.3765, 0.4095, -1.1244]], [[ 3.2664, -1.0980, -3.3960, ..., -3.5887, -3.8423, -3.8130]]], [[[ 2.3581, -3.0538, -2.4329, ..., -2.9281, -1.3933, -2.3126]], [[ 3.8227, -1.9839, -2.9539, ..., -0.7316, -3.0298, -2.4143]], [[ 2.1530, -3.1475, -2.7227, ..., -1.3228, -2.0085, -2.5009]], ..., [[ 4.1693, -1.6400, -3.2419, ..., -2.3619, -3.8150, -2.7199]], [[ 1.7777, -4.6107, -3.3733, ..., -2.6234, 0.2513, -1.1780]], [[ 3.4311, -1.4751, -3.0183, ..., -1.9109, -3.1123, -1.9545]]], [[[ 3.0873, -4.8621, -5.5817, ..., -0.0957, -1.8266, -0.4202]], [[ 4.1960, -3.4765, -3.0519, ..., -1.1134, -3.3365, -2.2451]], [[ 3.0262, -3.4093, -3.6882, ..., -0.0387, -2.5288, -1.7102]], ..., [[ 4.6347, -1.5782, -0.5455, ..., 0.7201, -0.1225, -0.6494]], [[ 0.7531, -6.7647, -6.4967, ..., 1.0071, -1.9739, -1.6226]], [[ 4.6937, -1.0367, -3.8242, ..., -2.0412, -2.1593, -1.8088]]]]) attn_weights tensor([[[[ 3.0999e+00, -1.8918e+00, -2.6684e+00, ..., -3.9540e+00, -2.5489e+00, -3.5034e+00]], [[ 4.5808e+00, -2.2674e-01, -9.3124e-01, ..., -1.8127e+00, -1.7954e+00, -1.4035e+00]], [[ 3.5600e+00, 5.0203e-02, -4.6380e-01, ..., -2.4206e+00, -2.3650e+00, -1.5664e+00]], ..., [[ 1.5054e+00, -4.0283e+00, -4.7073e+00, ..., -3.1555e+00, -2.2163e+00, -3.1755e+00]], [[ 3.9786e+00, -7.0083e-01, -1.3080e+00, ..., -2.9759e+00, -2.5750e+00, -1.9672e+00]], [[ 6.2848e+00, 3.5591e-01, -9.7570e-02, ..., -1.4705e+00, -2.3205e-01, 3.2257e+00]]], [[[ 2.0607e+00, -3.5474e+00, -3.3479e+00, ..., -3.5013e+00, -1.3494e-01, -3.9512e+00]], [[ 3.1259e+00, -2.8978e+00, -2.7423e+00, ..., -2.8462e+00, -1.5572e-01, -2.6777e+00]], [[ 2.7084e+00, -2.9525e+00, -2.0161e+00, ..., -2.9455e+00, -2.2318e+00, -2.2356e+00]], ..., [[ 4.4934e-01, -5.3244e+00, -2.6050e+00, ..., -1.2006e+00, -1.1171e+00, -5.2143e-01]], [[ 2.9019e+00, -2.8930e+00, -1.2739e+00, ..., -2.6090e+00, -1.1387e+00, -3.1776e+00]], [[ 3.5622e+00, -2.6197e+00, -7.1411e-01, ..., -1.1407e+00, -8.2613e-01, -3.5132e-01]]], [[[ 3.0124e+00, -3.2563e+00, -3.4604e+00, ..., -2.7490e+00, -4.7401e+00, -3.1360e+00]], [[ 4.1828e+00, -1.4020e+00, -3.0362e+00, ..., -1.2151e+00, -1.9652e+00, 1.7784e-01]], [[ 3.0360e+00, -2.0105e-02, -1.6057e+00, ..., -1.5010e+00, -2.3729e+00, -2.7030e+00]], ..., [[ 1.0665e+00, -6.0615e+00, -6.4834e+00, ..., -2.6520e+00, -2.3745e+00, -7.0511e-01]], [[ 3.1932e+00, -2.1167e+00, -2.5567e+00, ..., -2.5998e+00, -3.4725e+00, -3.1481e+00]], [[ 5.0038e+00, -8.4830e-01, 1.5079e-01, ..., -4.7501e-01, -4.7881e-01, 1.0548e+00]]], [[[ 2.6080e+00, -3.4527e+00, -4.7791e+00, ..., -2.0904e+00, -4.2167e+00, -2.1120e+00]], [[ 3.9589e+00, -2.5048e+00, -2.9114e+00, ..., -2.8868e+00, -3.3831e+00, 6.0886e-02]], [[ 3.0632e+00, -6.5513e-01, -1.9103e+00, ..., -1.7976e+00, -2.4686e+00, -7.9635e-01]], ..., [[ 1.0688e+00, -5.5819e+00, -4.3420e+00, ..., -2.4119e+00, -8.8964e-01, -1.7717e+00]], [[ 2.9105e+00, -1.8316e+00, -2.7976e+00, ..., -1.6060e+00, -2.6800e+00, -1.8188e+00]], [[ 4.6342e+00, -1.3793e+00, -1.6093e+00, ..., -5.8395e-01, -2.2101e+00, 1.4076e+00]]], [[[ 4.1742e+00, -3.8052e+00, -4.5325e+00, ..., -1.2336e+00, -4.2443e-01, -1.4808e+00]], [[ 4.9131e+00, -2.8435e+00, -3.1699e+00, ..., 1.6064e+00, 5.5382e-02, -8.0276e-01]], [[ 3.8769e+00, -2.3529e+00, -2.5773e+00, ..., 4.4539e-01, -5.0924e-01, -3.2994e-01]], ..., [[ 3.4964e-01, -7.9056e+00, -7.2440e+00, ..., -5.5677e-01, -5.1839e-01, -1.7492e+00]], [[ 4.0595e+00, -2.9846e+00, -2.5782e+00, ..., -1.8827e+00, -7.0989e-04, -1.4355e+00]], [[ 5.8449e+00, -2.3087e+00, -8.8439e-01, ..., 4.8141e+00, -3.1239e-01, 4.0611e-01]]]]) attn_weights tensor([[[[ 1.2169, 1.5397, 1.4025, ..., 0.9398, 1.1387, 1.6329]], [[ 3.4848, 1.8195, 0.5875, ..., -0.4270, -0.1461, 1.5818]], [[ 3.1212, 0.3586, -1.2301, ..., -3.3938, -2.7289, -2.6586]], ..., [[ 4.2588, 0.2247, -1.1301, ..., -2.6867, -2.9680, -1.1474]], [[ 3.8426, 1.8507, 0.0700, ..., -0.5802, -1.4656, 0.6491]], [[ 3.5092, 3.1915, 0.5765, ..., 0.2127, -1.2029, 1.0210]]], [[[ 1.7075, 0.0316, -0.5946, ..., 0.9736, 0.5109, 0.5666]], [[ 3.4446, -0.9145, -0.8614, ..., -0.2528, 0.4207, 0.3785]], [[ 2.5380, -1.2554, -1.7211, ..., -2.5587, -1.1960, -1.5290]], ..., [[ 3.3047, -1.9709, -2.7660, ..., -3.2807, 1.0183, -1.7650]], [[ 2.9910, -0.0131, -1.1855, ..., -1.2386, 0.6311, 0.7855]], [[ 2.7394, -0.2637, -1.9531, ..., -1.7413, 0.2948, 0.1849]]], [[[ 1.4026, 0.3935, -0.1903, ..., -0.1123, -0.1384, -0.5503]], [[ 3.7954, -0.5240, -0.9297, ..., -0.7954, -1.6027, -0.0400]], [[ 3.2063, 0.0666, -1.8745, ..., -1.6137, -3.7009, -3.3504]], ..., [[ 4.4987, -0.7087, -2.6115, ..., -1.2904, -2.5451, -0.6652]], [[ 2.8439, 0.2323, -0.1834, ..., -0.8901, -1.5055, -0.3043]], [[ 2.1177, 2.2908, 0.0950, ..., -0.3445, -0.3353, -0.6806]]], [[[ 1.9100, 0.0443, 0.1749, ..., 0.6632, 0.0182, -0.6486]], [[ 4.1328, -0.7139, -0.9955, ..., -0.3919, -1.2921, -0.1777]], [[ 3.3852, -0.4019, -1.9696, ..., -1.0421, -2.1069, -1.0361]], ..., [[ 4.4115, -0.6658, -2.9335, ..., -1.0038, -3.2863, -0.8748]], [[ 4.8158, 1.4695, 1.0962, ..., 1.6304, 0.3829, -0.8234]], [[ 3.5304, 1.2051, -0.2061, ..., 3.9160, -0.0967, -0.1993]]], [[[ 1.7076, -0.4621, -1.5650, ..., 1.2774, 1.6209, 1.3910]], [[ 4.7696, -0.4042, -0.8284, ..., 1.1749, -0.0443, 0.2420]], [[ 3.4343, -0.9375, -1.5173, ..., -0.8703, 0.3493, 0.3132]], ..., [[ 4.7058, -1.5150, -2.4863, ..., 0.7686, -0.0356, -0.3064]], [[ 2.5192, -1.8807, -2.2859, ..., 0.7751, 1.1410, 0.8834]], [[ 3.7832, -0.5399, -1.2325, ..., 4.5880, 1.1164, -0.6676]]]]) attn_weights tensor([[[[-1.5431, -4.1555, -2.9113, ..., -3.9238, -1.0430, -3.4383]], [[ 1.0109, -0.9586, 0.6550, ..., -1.5426, -1.1073, 5.8596]], [[-2.0001, -3.0328, -2.5278, ..., -1.9264, -1.8057, -2.4013]], ..., [[-2.1946, -2.8056, -2.7010, ..., -2.4032, -2.5588, -2.6526]], [[-0.2260, -0.9554, -0.7583, ..., -0.3210, -0.2763, 1.3046]], [[-1.5203, -2.5553, -3.4211, ..., -2.7833, -2.7193, -3.2187]]], [[[-1.4731, -3.8484, -2.6086, ..., -0.4448, -3.2692, -2.9286]], [[-1.0429, -1.0357, 0.9131, ..., -1.9721, -1.3956, 6.3025]], [[-2.1514, -3.0035, -2.6523, ..., -2.6951, -2.6624, -3.0163]], ..., [[-2.0707, -2.5209, -2.3348, ..., -2.3961, -2.0376, -2.1401]], [[-0.6168, -0.9462, -0.7714, ..., -1.0800, -0.4042, 1.1041]], [[-1.6271, -2.3823, -3.4909, ..., -2.4845, -2.5498, -2.9763]]], [[[-1.6405, -4.0312, -2.4172, ..., -2.7115, -1.1216, -3.4562]], [[-2.0916, 0.0223, -2.2661, ..., -0.7377, -1.3136, 6.8317]], [[-1.9976, -2.7800, -3.1262, ..., -2.6205, -2.4132, -1.8667]], ..., [[-2.1552, -2.5679, -2.6078, ..., -2.1621, -2.5086, -1.9447]], [[-0.8623, -1.1373, -1.3560, ..., -0.9318, -0.8557, 0.5274]], [[-1.3933, -2.1096, -3.4317, ..., -2.7393, -3.1071, -2.3172]]], [[[-1.4022, -2.7000, -1.9465, ..., -1.1563, -1.6714, -2.6548]], [[-0.4186, 0.8061, -0.9621, ..., -1.1884, 2.3556, 7.4357]], [[-1.7038, -2.2561, -2.4874, ..., -2.1025, -1.7767, -2.3291]], ..., [[-2.0286, -2.5715, -2.6942, ..., -2.2872, -2.5615, -2.9058]], [[-0.0201, -0.4324, -0.4794, ..., -0.2510, -0.1724, 0.9640]], [[-1.2167, -1.8271, -3.2236, ..., -3.1885, -1.9067, -2.3581]]], [[[-1.4781, -3.9613, -2.7053, ..., -2.3231, -2.1426, -3.5794]], [[-1.8949, -1.8706, -2.6210, ..., -5.0124, -4.7494, 4.9518]], [[-2.5422, -2.9422, -3.3488, ..., -3.4810, -2.9241, -3.6343]], ..., [[-2.0993, -2.4149, -2.4588, ..., -2.6047, -2.5646, -1.9923]], [[-0.6959, -1.0735, -1.1814, ..., -1.4975, -1.1340, 0.4325]], [[-1.4604, -2.3688, -3.6385, ..., -2.9088, -2.3739, -2.7719]]]]) attn_weights tensor([[[[-2.1733, -4.7584, -3.2568, ..., 0.4953, 1.0628, -0.9022]], [[-1.2621, -2.9401, -3.6532, ..., 0.9696, 1.1382, 0.7673]], [[-4.2580, -4.5351, -4.5999, ..., -2.7544, -2.5895, -2.5056]], ..., [[ 0.9878, -0.7972, 0.0553, ..., -0.7191, -0.7980, 0.1365]], [[-3.5655, -2.8579, -2.6939, ..., -0.7171, -0.4295, -0.3496]], [[-0.8067, -1.0924, -3.1036, ..., -0.7903, -3.3538, 2.0830]]], [[[-0.6933, -3.4180, -2.2761, ..., 0.2837, 1.3699, 0.8721]], [[-1.1208, -3.1189, -3.4188, ..., 0.3706, 2.1731, 0.9972]], [[-4.2951, -4.5826, -4.6264, ..., -2.6661, -2.2460, -2.4832]], ..., [[ 1.4267, -0.7042, 0.5751, ..., -0.9679, -1.1086, 0.3337]], [[-3.8054, -2.8137, -2.6901, ..., -0.6237, -0.2983, -0.3834]], [[-0.0452, -0.0679, -2.0450, ..., -2.7814, 1.1630, 4.1060]]], [[[-2.7209, -5.4649, -5.7598, ..., -0.5990, 1.7028, -0.9890]], [[-0.7295, -2.5117, -2.9386, ..., 0.5836, 0.3734, 0.7981]], [[-3.9346, -4.2977, -4.4525, ..., -2.8271, -2.5848, -2.1859]], ..., [[ 1.2696, -0.8309, 0.1002, ..., 0.0261, -0.7755, -0.0269]], [[-3.9167, -2.6325, -2.5707, ..., -0.8534, -0.5710, -0.3050]], [[ 1.0677, 0.6263, -3.3577, ..., -2.0010, -1.0677, 4.2318]]], [[[-1.1940, -3.8534, -2.7641, ..., 2.3266, 4.1058, 0.6006]], [[-1.0166, -2.5300, -3.3714, ..., 1.6188, 1.2795, 0.9985]], [[-4.0046, -4.3644, -4.4873, ..., -2.6994, -2.3927, -2.7960]], ..., [[ 1.4956, -0.6374, 0.3164, ..., 0.4315, -0.6570, -0.1169]], [[-4.2035, -2.5092, -2.5285, ..., -0.7056, -0.4119, -0.8266]], [[ 0.9435, 0.0586, -2.6099, ..., -1.4504, 0.2131, 4.4000]]], [[[-1.2918, -4.1072, -4.1701, ..., -0.3896, 0.1832, 0.5531]], [[-1.0850, -3.0802, -3.5414, ..., 0.0531, 0.6621, 0.6537]], [[-4.2278, -4.5164, -4.6436, ..., -2.4990, -2.3352, -2.5883]], ..., [[ 1.2748, -0.8220, -0.0183, ..., -0.4055, -0.6325, 0.1171]], [[-3.8411, -2.7885, -2.6634, ..., -0.5075, -0.4326, -0.6181]], [[-1.5123, -1.8860, -4.3314, ..., -3.8476, -4.6203, 2.3982]]]]) attn_weights tensor([[[[ -1.8476, -6.0623, -6.3015, ..., -0.5754, -2.5002, -2.2190]], [[ 2.1616, -0.0848, -1.8886, ..., -0.7178, -1.0994, -2.9702]], [[ -5.9113, -20.1240, -22.3040, ..., -3.3300, -1.8046, -4.7000]], ..., [[ -3.9979, -11.5542, -12.8984, ..., -4.1542, -2.0552, -2.1449]], [[ -2.5796, -4.3260, -4.1348, ..., -1.3516, -0.9018, -0.7654]], [[ -0.4192, -6.1556, -6.1112, ..., -2.9013, -2.5033, -2.2544]]], [[[ -1.1607, -6.0803, -4.6351, ..., -1.4914, -2.0766, -0.9703]], [[ 1.5183, -1.6896, -1.5672, ..., -3.0349, -1.3484, -2.2335]], [[ -5.7553, -17.8641, -18.5444, ..., -3.4965, -1.6465, -4.6270]], ..., [[ -3.8570, -10.7080, -11.2817, ..., -1.6737, -1.9836, -2.0648]], [[ -2.3356, -3.9222, -3.9829, ..., -0.7193, -0.7914, -0.5176]], [[ -0.2609, -5.8707, -5.9732, ..., -2.5920, -2.3300, -2.1863]]], [[[ -1.9305, -5.6523, -5.9360, ..., -1.2452, -1.0415, -0.7403]], [[ 2.2252, -1.1758, -1.9146, ..., -1.6654, -1.5132, -0.8392]], [[ -5.3292, -17.9234, -18.2332, ..., -2.7997, -2.1387, -3.0994]], ..., [[ -3.6118, -10.1802, -9.9363, ..., -2.0727, -0.6480, -3.5096]], [[ -2.0787, -4.1095, -3.9616, ..., -1.1781, -0.7402, -0.7234]], [[ -0.3647, -5.7977, -5.7554, ..., -2.7031, -2.5709, -2.3215]]], [[[ -1.6634, -5.8447, -6.1120, ..., -1.4577, -0.8043, -1.3800]], [[ 1.5522, -0.4763, -1.5465, ..., -2.2245, -1.2805, -2.2721]], [[ -6.3427, -18.6819, -17.7551, ..., -2.0640, -2.2681, -5.4801]], ..., [[ -3.5876, -9.8783, -10.6244, ..., -1.8409, -2.0000, -3.2961]], [[ -2.4435, -4.0781, -4.0723, ..., -0.9114, -0.5444, -0.7956]], [[ -0.4393, -6.1689, -6.2351, ..., -2.7340, -2.3245, -2.4813]]], [[[ -1.5642, -5.7810, -5.7721, ..., -1.9807, -2.3309, -1.8077]], [[ 1.7401, -1.8743, -1.5102, ..., -3.3172, -3.8191, -1.9814]], [[ -5.9775, -19.9429, -20.8072, ..., -3.1187, -2.3276, -3.1460]], ..., [[ -3.6033, -11.2029, -11.8373, ..., -1.0726, -0.7666, -3.0562]], [[ -2.4740, -4.2368, -4.2628, ..., -0.8967, -0.6865, -1.0406]], [[ -0.2965, -6.0704, -6.1404, ..., -2.6433, -2.4164, -2.4044]]]]) attn_weights tensor([[[[ 4.5171, -0.9067, -2.4153, ..., -1.1128, -1.5167, 1.7947]], [[ -2.7322, -9.3266, -9.6229, ..., -4.2500, -4.8636, -4.4050]], [[ -4.9508, -16.1903, -19.4261, ..., -4.8295, -2.8299, -4.6897]], ..., [[ -2.1015, -9.1146, -9.5639, ..., -1.8120, -1.5216, -4.0962]], [[ -1.0187, -7.5261, -7.5147, ..., -4.0996, -3.0416, -2.5710]], [[ -3.1545, -9.6769, -11.6201, ..., -3.1449, -2.8473, -3.7966]]], [[[ 4.3458, -1.2011, -2.5057, ..., -3.2107, -0.9994, 1.2396]], [[ -2.4976, -9.2649, -8.4364, ..., -5.6505, -3.2031, -3.7561]], [[ -4.2824, -14.0437, -16.7077, ..., -6.5147, -3.8804, -4.9446]], ..., [[ -1.6273, -8.7574, -9.2077, ..., -4.3874, -3.5272, -2.1165]], [[ -0.9874, -6.3479, -6.1859, ..., -3.2225, -3.0145, -2.3315]], [[ -2.3972, -10.1905, -11.2599, ..., -4.4533, -3.7392, -4.1990]]], [[[ 4.5956, -1.6171, -2.0749, ..., -2.8551, -1.3982, 0.4501]], [[ -2.5429, -7.5153, -7.5027, ..., -4.8379, -7.0814, -5.5173]], [[ -4.7231, -13.5146, -13.5862, ..., -5.4329, -4.3219, -5.6319]], ..., [[ -1.9735, -8.0027, -7.9571, ..., -5.0450, -1.6671, -3.6850]], [[ -0.8315, -7.3731, -6.8247, ..., -4.2655, -2.8577, -1.5770]], [[ -2.5979, -8.7546, -10.4767, ..., -0.3513, -1.9747, -2.9519]]], [[[ 4.3122, -0.5128, -1.0445, ..., -2.7226, -1.0059, 2.1027]], [[ -2.5471, -9.6510, -9.5956, ..., -2.3281, -5.1539, -4.4572]], [[ -4.7663, -14.2623, -15.7754, ..., -4.3117, -5.6505, -5.3573]], ..., [[ -1.2117, -8.6522, -9.3998, ..., -2.2159, -2.7588, -1.8038]], [[ -0.9157, -6.8335, -6.8515, ..., -3.5603, -3.7080, -3.0700]], [[ -2.0490, -9.8415, -11.4203, ..., -3.4100, -2.6748, -3.7402]]], [[[ 4.0649, -1.2440, -2.9060, ..., -3.8019, -3.5754, 1.2348]], [[ -2.6600, -8.8979, -8.9672, ..., -4.8786, -5.1467, -3.1307]], [[ -4.7742, -18.5432, -20.6086, ..., -5.0089, -3.3664, -3.8783]], ..., [[ -2.0306, -9.5320, -9.8067, ..., -4.6024, -2.5792, -2.3732]], [[ -0.9972, -7.8243, -9.1166, ..., -2.9096, -3.1083, -1.6047]], [[ -2.3748, -11.1805, -12.6274, ..., -4.9006, -4.8132, -3.8285]]]]) attn_weights tensor([[[[-2.6029e+00, -1.2362e+01, -1.3569e+01, ..., -4.9282e+00, -1.8529e+00, -3.1929e+00]], [[-2.8439e+00, -9.0412e+00, -9.1368e+00, ..., -3.2318e+00, -4.0751e+00, -6.1603e+00]], [[ 3.1122e-02, -3.1886e+00, -4.0600e+00, ..., -1.5783e+00, -1.4859e+00, -2.4645e+00]], ..., [[-1.2950e+00, -6.3710e+00, -6.2540e+00, ..., 1.1061e+00, -7.9745e-01, -2.6006e+00]], [[ 1.5209e+00, -2.0694e+00, -3.0858e+00, ..., -1.7635e+00, -4.2588e+00, -3.1877e+00]], [[-6.1437e+00, -3.4267e+01, -4.3591e+01, ..., -4.2725e+00, 1.2446e+01, 5.7903e+00]]], [[[-2.4552e+00, -1.2963e+01, -1.3603e+01, ..., -5.7903e+00, -3.9511e+00, -4.9677e+00]], [[-2.1807e+00, -9.3260e+00, -9.5731e+00, ..., -5.8115e+00, -1.8459e+00, -2.7652e+00]], [[ 1.9771e-03, -3.1525e+00, -2.8362e+00, ..., -5.1399e+00, -2.6523e+00, -2.2037e+00]], ..., [[-1.1807e+00, -6.2172e+00, -7.6945e+00, ..., -3.1920e+00, -3.0003e+00, -3.0659e+00]], [[ 1.3496e+00, -3.3428e+00, -2.9167e+00, ..., -5.7526e+00, -2.0448e+00, -1.8102e+00]], [[-8.4861e+00, -2.7823e+01, -3.8496e+01, ..., -9.9703e+00, 7.9983e+00, -1.5317e+00]]], [[[-2.6557e+00, -1.0930e+01, -1.1395e+01, ..., -4.2459e+00, -1.4671e+00, -3.2491e+00]], [[-2.7660e+00, -9.1305e+00, -9.1405e+00, ..., -1.7254e+00, -3.1683e+00, -4.6592e+00]], [[ 2.1758e-02, -2.7835e+00, -3.2741e+00, ..., -3.7346e+00, -3.2560e+00, -3.6587e+00]], ..., [[-1.4437e+00, -5.3101e+00, -4.7356e+00, ..., -1.5762e+00, -4.9283e-01, -1.7330e+00]], [[ 1.2737e+00, -2.6969e+00, -2.5414e+00, ..., -4.0938e+00, -3.2108e+00, -2.5847e+00]], [[-5.8934e+00, -3.1329e+01, -4.3445e+01, ..., 5.1493e+00, 1.9114e+01, 8.5901e+00]]], [[[-1.5770e+00, -1.2935e+01, -1.2497e+01, ..., -3.6246e+00, -3.6158e+00, -2.2475e+00]], [[-2.2920e+00, -9.5211e+00, -1.0713e+01, ..., -2.8581e+00, -3.5034e+00, -3.6622e+00]], [[ 3.0136e-01, -3.1401e+00, -4.0917e+00, ..., -2.1619e+00, -2.8788e+00, -2.2032e+00]], ..., [[-5.1411e-01, -6.2538e+00, -7.2633e+00, ..., -2.9758e+00, -1.9744e+00, -2.0427e+00]], [[ 1.5078e+00, -1.5401e+00, -1.9176e+00, ..., -2.6923e+00, -4.0059e+00, -2.4298e+00]], [[-5.9162e+00, -3.6461e+01, -2.7968e+01, ..., 4.6013e+00, 1.5044e+01, 1.0294e+01]]], [[[-3.3651e+00, -1.3787e+01, -1.5312e+01, ..., -3.2869e+00, -2.3193e+00, -2.3963e-01]], [[-2.8164e+00, -1.1084e+01, -1.0259e+01, ..., -4.4590e+00, -5.1016e+00, -4.0675e+00]], [[ 2.1653e-01, -5.0538e+00, -4.8213e+00, ..., -4.5564e+00, -4.3891e+00, -4.6968e+00]], ..., [[-1.3357e+00, -8.1517e+00, -6.8499e+00, ..., -4.0121e+00, -4.1532e+00, -3.8268e+00]], [[ 1.4302e+00, -4.1587e+00, -3.6173e+00, ..., -4.7628e+00, -4.3627e+00, -2.3863e+00]], [[-3.9148e+00, -5.0083e+01, -5.3057e+01, ..., 9.9468e+00, 2.2224e+01, 6.9746e+00]]]]) attn_weights tensor([[[[ 2.6030, -1.6420, -2.9563, ..., -1.2718, -1.9344, -1.6950]], [[ 3.8477, -3.0843, -1.2364, ..., -4.8716, -3.0916, -1.8870]], [[ 0.4305, -4.5287, -3.9082, ..., -2.2696, -0.4184, -4.0540]], ..., [[ 1.1351, -3.7062, -3.5157, ..., -2.6249, -3.7204, -5.8975]], [[ 2.4733, -0.2113, -3.8303, ..., -3.6202, -1.9535, -0.8071]], [[ 1.0212, -1.2034, -1.8840, ..., -0.3688, -0.7630, 0.5531]]], [[[ 1.7270, -6.2883, -6.7644, ..., -2.3285, -3.7088, -3.0116]], [[ 3.3695, -13.1550, -8.5207, ..., -5.9389, -7.3200, -2.5861]], [[ 0.2665, -5.3026, -7.8093, ..., -1.4090, -1.0187, -2.7574]], ..., [[ 0.5750, -4.2469, -4.0352, ..., -2.3569, -2.0876, -3.5887]], [[ 1.5572, -2.6923, -5.3692, ..., 0.9056, 0.1531, -0.4648]], [[ 0.7681, -4.7932, -3.3430, ..., -1.5175, -0.8604, 0.7606]]], [[[ 2.5469, -7.2234, -6.1604, ..., -3.8505, -3.4997, -1.5267]], [[ 5.1922, -11.4904, -8.4684, ..., -10.2222, -7.1947, -1.5839]], [[ 0.5432, -5.0803, -5.3291, ..., -1.9344, -1.6355, -3.0323]], ..., [[ 1.1714, -2.7006, -3.9829, ..., -4.6463, -5.1540, -4.7185]], [[ 2.0098, -1.0874, -0.5204, ..., -2.6496, 1.0145, 0.6104]], [[ 1.1009, -4.2979, -4.5775, ..., -2.3449, -1.1679, 0.3070]]], [[[ 2.5142, -3.5213, -3.3340, ..., -4.1689, -4.2109, -2.0830]], [[ 4.4815, -8.8176, -9.8998, ..., -6.7057, -8.5043, -1.4823]], [[ 0.8949, -5.5378, -5.3740, ..., -1.6298, -1.1609, -1.8082]], ..., [[ 1.1899, -2.5145, -3.5376, ..., -3.1015, -4.1712, -5.1093]], [[ 2.1961, -1.1363, -0.4247, ..., 0.1078, -1.7249, -0.5068]], [[ 1.0376, -3.1624, -3.0299, ..., -2.0386, -1.8264, -0.6101]]], [[[ 2.5359, -6.8385, -7.9497, ..., -2.6343, -3.3638, -0.7426]], [[ 4.0239, -14.1920, -13.0441, ..., -7.7269, -8.1598, -2.1455]], [[ 0.7573, -6.8034, -7.4702, ..., 0.1267, -0.6120, -3.1628]], ..., [[ 0.9452, -4.0661, -4.7195, ..., -3.2324, -3.2581, -2.3984]], [[ 2.4567, -2.7390, -3.6446, ..., -0.5688, 0.3303, 0.1549]], [[ 1.0241, -4.9604, -5.3365, ..., -1.2105, -1.1112, -0.1301]]]]) attn_weights tensor([[[[ -0.6126, -4.9368, -5.9074, ..., -2.1045, -1.6223, -3.0043]], [[ 0.9703, -5.4828, -7.6385, ..., -4.4608, -2.1515, -4.8202]], [[ 0.4970, -3.7863, -3.5004, ..., -3.2404, -3.3839, -4.6249]], ..., [[ 4.2757, -1.1810, 0.1835, ..., -2.6017, -2.2043, -2.1577]], [[ 3.4738, -2.6101, -3.0861, ..., -2.5791, -2.4892, -3.0635]], [[ -0.4796, -5.8627, -5.8829, ..., -1.5912, -1.3408, -2.1822]]], [[[ -0.2994, -5.7964, -7.2690, ..., -3.0465, -2.9966, -1.7226]], [[ -0.5684, -7.5934, -6.9466, ..., -2.0301, -2.9504, -3.0937]], [[ 0.3839, -3.9308, -3.5154, ..., -3.7350, -2.6353, -3.0558]], ..., [[ 3.4543, -11.9947, -8.9165, ..., -3.1032, -4.9002, -3.5744]], [[ 2.7841, -4.9666, -4.1262, ..., -2.3192, -2.5064, -2.3957]], [[ -0.4959, -5.0710, -7.3445, ..., -2.3900, -0.8747, -1.8205]]], [[[ -1.4290, -5.0649, -3.7211, ..., -2.1701, -1.2551, -2.9826]], [[ 0.3271, -5.6810, -6.4418, ..., -4.3393, -2.6976, -2.5166]], [[ 0.1419, -3.6345, -3.7200, ..., -4.0400, -4.2149, -3.9000]], ..., [[ 4.2370, -7.1313, -3.5845, ..., -6.4208, -4.0605, -0.1434]], [[ 2.8493, -3.7683, -3.8228, ..., -2.8465, -2.2442, -1.8787]], [[ -0.7263, -5.1047, -5.9199, ..., 0.1179, -0.4207, -2.0226]]], [[[ -0.0982, -6.9298, -5.8158, ..., -0.9097, -1.5339, -2.1231]], [[ 0.7098, -4.9089, -7.1699, ..., -3.3804, -2.9900, -3.4943]], [[ 0.2885, -3.2080, -3.4752, ..., -2.8938, -3.4257, -2.6964]], ..., [[ 4.7883, -5.3517, -5.4692, ..., -6.3940, -5.7729, -0.1346]], [[ 2.6225, -2.8328, -1.7787, ..., -1.8417, -1.4738, -1.7167]], [[ 0.2573, -5.5833, -6.9286, ..., -2.2610, -1.6851, -2.0878]]], [[[ -0.8621, -7.4644, -8.5910, ..., -0.8725, -0.5007, -2.3412]], [[ 1.1158, -9.3299, -10.7221, ..., -4.3762, -2.8349, -3.8622]], [[ 0.5363, -3.9191, -4.5579, ..., -3.2335, -3.1449, -3.3049]], ..., [[ 3.9974, -10.0798, -7.4978, ..., -3.2073, -4.0980, -0.8581]], [[ 2.9654, -4.2568, -4.8738, ..., -2.5864, -0.9864, -1.1796]], [[ -0.5584, -6.0030, -6.2414, ..., -4.6720, -3.3085, -1.3383]]]]) attn_weights tensor([[[[ -0.7819, -8.3693, -8.3844, ..., -3.0305, -0.4574, -2.0379]], [[ 3.2642, 0.1118, -1.4744, ..., -3.6782, -3.0460, -2.3278]], [[ 6.7114, -0.3364, -0.4547, ..., -1.4660, -1.7430, -0.9345]], ..., [[ 0.0346, -3.3830, -3.2959, ..., -0.5303, -0.2084, -1.2115]], [[ 4.2015, -0.5487, 0.1010, ..., -1.4069, -1.6473, -1.5690]], [[ 3.3596, -1.7046, -3.6977, ..., -1.3616, -2.0931, -3.4191]]], [[[ -0.2008, -9.0950, -10.3590, ..., -5.5491, -2.4881, -4.5889]], [[ 2.2741, -4.4286, -5.6491, ..., -1.6454, -1.8503, -2.3018]], [[ 6.2923, -5.5274, -5.0008, ..., -3.0394, -2.1081, -0.5464]], ..., [[ 0.0642, -3.7554, -4.7159, ..., -2.0083, 0.3291, -1.6846]], [[ 3.2965, -5.0923, -4.0270, ..., -3.7920, 0.9106, 0.5223]], [[ 3.3938, -3.8030, -3.9983, ..., -1.6952, -3.6205, -3.8884]]], [[[ -0.9832, -8.2016, -8.5240, ..., -1.9108, -1.6576, -3.6802]], [[ 2.9636, -2.9457, -2.6341, ..., -3.0744, -1.4430, -1.1798]], [[ 6.3747, -4.8075, -2.5091, ..., -2.4236, -0.9912, 0.5526]], ..., [[ -0.5196, -3.8326, -3.6351, ..., -1.4139, -2.1512, -3.2232]], [[ 4.0911, -5.3297, -2.7879, ..., -4.8261, -1.8944, 0.5567]], [[ 2.6592, -4.8341, -4.2562, ..., -4.3289, -3.9706, -2.4673]]], [[[ -0.5493, -9.3365, -8.7897, ..., -2.8030, -3.3918, -4.2696]], [[ 3.1041, -1.1898, -1.0593, ..., -0.8833, -2.4348, -2.6786]], [[ 5.7673, -2.3818, -4.2194, ..., -4.9867, -4.4207, -0.2843]], ..., [[ 0.7345, -4.3082, -4.5833, ..., -0.5391, -1.6379, -2.3365]], [[ 3.8054, -2.2567, -1.8841, ..., -3.6242, -4.2719, -2.0285]], [[ 3.4575, -3.8359, -5.1983, ..., -4.2444, -3.3892, -1.5285]]], [[[ -0.3542, -10.8888, -11.4887, ..., -3.1909, -2.2503, -1.7739]], [[ 3.7413, -4.2099, -5.4229, ..., -2.7411, -1.4830, -0.2724]], [[ 6.6451, -5.6225, -4.8131, ..., 0.0658, 0.2479, 1.5539]], ..., [[ -0.0729, -5.6008, -5.8173, ..., -3.1035, -2.7290, -2.1854]], [[ 4.8409, -2.9667, -2.2476, ..., -1.9352, -0.0895, 4.3364]], [[ 3.1064, -4.1052, -5.1354, ..., -2.7919, -3.0301, -1.0379]]]]) attn_weights tensor([[[[ 1.2345, -2.2644, -2.4940, ..., -0.8319, -1.1687, -1.2016]], [[ 5.5281, 2.4363, 0.8559, ..., -0.9576, 0.1523, 0.0564]], [[ 1.4888, -0.0326, -0.8280, ..., 0.7056, -0.3961, -0.2850]], ..., [[ 1.1898, -4.1347, -3.6958, ..., -3.4187, -4.0264, -3.2271]], [[ 1.3911, -2.5234, -2.4951, ..., -0.5959, -1.0137, -0.8805]], [[ 1.3065, -3.2024, -3.2035, ..., -2.7082, -3.1810, -3.6022]]], [[[ 1.1571, -4.0045, -4.0056, ..., -1.8978, -2.0017, -1.4799]], [[ 4.5693, -3.6624, -4.6483, ..., -1.5532, 1.8761, 1.3644]], [[ 1.9306, -2.0502, -2.9432, ..., -1.5560, -1.2359, -1.1150]], ..., [[ 1.1802, -5.9174, -5.4613, ..., -0.7005, -1.5345, -2.1417]], [[ 1.0969, -5.2255, -4.5245, ..., -1.6249, -0.2348, -0.4699]], [[ 0.9892, -3.5873, -3.5351, ..., -3.2765, -3.4041, -3.2196]]], [[[ 0.7708, -3.7372, -3.4695, ..., -3.2150, -2.9463, -1.3747]], [[ 4.4304, -3.3609, -3.2941, ..., -3.1430, -2.5969, -0.2699]], [[ 1.1365, -0.5760, -0.9792, ..., -1.6805, -1.9987, -1.6863]], ..., [[ 0.9280, -4.8293, -3.8837, ..., -4.7780, -4.1064, -3.1181]], [[ 0.7097, -4.6484, -3.4863, ..., -3.6135, -2.0799, -1.2226]], [[ 0.5727, -3.0569, -2.9665, ..., -4.6598, -3.2418, -3.3507]]], [[[ 1.3958, -2.4918, -2.0929, ..., -1.5562, -2.3685, -1.9817]], [[ 4.1740, -2.9532, -4.0967, ..., -2.7420, -2.0413, 0.9456]], [[ 1.9644, -1.1192, -2.8600, ..., -2.1996, -2.1612, -1.6679]], ..., [[ 0.7671, -2.5080, -2.4936, ..., -1.4448, -2.7258, -2.7587]], [[ 1.4203, -3.3556, -3.6485, ..., -2.1767, -3.3697, -1.6681]], [[ 1.2974, -4.8328, -6.0276, ..., -4.8434, -4.5592, -5.0903]]], [[[ 1.1266, -3.2879, -3.6531, ..., -4.1559, -3.4173, -1.8725]], [[ 5.8448, -1.9871, -3.8043, ..., -1.1082, 0.9624, 1.1869]], [[ 2.0172, -2.2449, -4.0453, ..., -2.0940, -1.4787, -0.8152]], ..., [[ 1.6796, -4.0286, -3.1604, ..., -1.1451, -0.4713, -1.8524]], [[ 1.2947, -5.0075, -5.2976, ..., -2.2156, -1.4173, -1.1653]], [[ 0.8241, -4.0520, -5.0201, ..., -4.2036, -4.5183, -3.0549]]]]) attn_weights tensor([[[[ 2.6369, -2.0891, -3.3970, ..., -3.2640, -2.3941, -2.2871]], [[ 4.7640, -0.2560, -0.8828, ..., -0.3866, -1.6827, -0.3872]], [[ 2.3111, -2.0593, -1.0730, ..., -2.8161, -3.8677, -1.9455]], ..., [[ 4.4917, -0.5175, -2.9146, ..., -3.8554, -3.8676, -2.1934]], [[ 1.3379, -5.0515, -4.0645, ..., 0.2864, 2.1119, -0.1811]], [[ 3.7788, 0.0495, -1.5656, ..., -2.0643, -2.4469, -2.1643]]], [[[ 2.1821, -4.2548, -4.8809, ..., -1.0273, -2.3098, -1.4353]], [[ 3.6799, -2.6284, -3.4334, ..., -5.4930, -0.8137, -0.1531]], [[ 2.4785, -4.1233, -4.9582, ..., -2.1366, -0.9796, -2.4971]], ..., [[ 4.6785, -3.0970, -3.2592, ..., -2.6349, -0.2628, -0.2602]], [[ 2.1398, -5.1075, -6.8316, ..., -2.6167, 0.9009, -1.5078]], [[ 3.5472, -2.7604, -3.4783, ..., -3.7662, -2.3524, -1.8717]]], [[[ 1.3886, -2.2956, -2.4525, ..., -5.5143, -1.7321, -1.4427]], [[ 3.3601, -2.7038, -2.7845, ..., -1.3943, -1.5986, 0.4360]], [[ 1.0799, -4.0640, -3.4587, ..., -4.8086, -3.0862, -2.5339]], ..., [[ 4.0776, -2.5131, -1.6515, ..., -4.3928, -3.0276, -1.9498]], [[ 1.2467, -5.8767, -5.6708, ..., 0.3667, 0.1037, -1.3508]], [[ 3.3936, -1.6638, -3.1526, ..., -3.7508, -3.3657, -1.4003]]], [[[ 1.7105, -1.0262, -0.3021, ..., -0.2548, -3.0292, -0.0716]], [[ 4.2754, -1.2381, -4.1351, ..., -4.0819, -3.5461, 0.2998]], [[ 1.3330, -1.8364, -2.0861, ..., -1.1809, -3.6595, -1.4595]], ..., [[ 4.4941, -1.7756, -2.0291, ..., -3.0104, -1.6922, -0.3651]], [[ 1.6526, -5.8125, -4.6246, ..., -0.7986, -1.1096, 0.5667]], [[ 3.3457, -1.1463, -2.5288, ..., -2.8125, -3.8787, -2.4198]]], [[[ 2.2355, -4.6520, -5.5028, ..., -0.4413, 0.3772, -1.9985]], [[ 4.0207, -2.3811, -3.5225, ..., -2.6952, -2.4637, 0.6813]], [[ 2.1984, -1.9618, -3.0412, ..., -1.6878, -1.2559, -1.2642]], ..., [[ 4.4719, -1.6929, -2.0405, ..., -0.4937, -1.3084, 0.0303]], [[ 0.9844, -5.4616, -4.9819, ..., -1.6228, -1.2318, -1.4005]], [[ 4.0397, -2.4686, -4.0157, ..., -1.2544, -1.5136, -2.0617]]]]) attn_weights tensor([[[[ 3.1736, -3.3031, -3.3778, ..., -3.6324, -3.5587, -3.7013]], [[ 4.3615, -0.2517, -1.3428, ..., -1.1280, -1.9602, -0.5807]], [[ 3.2729, -0.3241, -1.5446, ..., -2.3551, -2.3473, -1.0202]], ..., [[ 0.6233, -4.4361, -4.5712, ..., -1.2590, 0.9615, -2.3743]], [[ 3.4463, -1.1622, -0.8657, ..., -2.3506, -2.7010, -2.5851]], [[ 4.5093, -0.5052, -1.3067, ..., -0.7386, 4.2064, 3.3083]]], [[[ 3.1546, -4.3343, -4.5145, ..., -1.3267, -4.0060, -4.1141]], [[ 3.8969, -2.8205, -1.9276, ..., -3.5577, -1.3290, 0.5459]], [[ 3.2197, -2.9010, -2.8688, ..., -3.8730, -1.1971, -2.0257]], ..., [[ 1.7902, -6.0436, -4.4319, ..., -4.6739, -3.1752, -1.3069]], [[ 3.3663, -1.6607, -2.1749, ..., -3.1678, -1.8515, -2.9582]], [[ 5.3773, -1.9078, -2.4253, ..., -2.6384, -0.3799, -0.2436]]], [[[ 1.9709, -2.9363, -3.5501, ..., -4.9595, -2.9765, -1.6675]], [[ 3.2704, -2.4052, -3.4699, ..., -3.4330, -1.6192, -0.6262]], [[ 2.7723, -1.6439, -1.7462, ..., -3.8922, -3.4622, -1.7521]], ..., [[ 0.1259, -3.1848, -4.4963, ..., -2.3444, -1.2193, -1.5736]], [[ 2.9970, -2.0145, -2.1829, ..., -3.3084, -2.3088, -1.1835]], [[ 3.4245, -1.6083, -1.9291, ..., -3.7449, -0.3464, 0.5016]]], [[[ 2.9587, -3.8628, -3.5990, ..., -3.0864, -2.6563, -2.0221]], [[ 4.2519, -1.7730, -3.0338, ..., -3.0771, -1.8811, -1.4078]], [[ 3.2224, -1.6004, -1.5969, ..., -1.6830, -2.0877, -0.6490]], ..., [[ 1.5154, -6.0570, -5.2442, ..., -2.2693, -1.1977, -2.1113]], [[ 3.5682, -2.3049, -2.0382, ..., -2.1171, -1.4684, -0.5683]], [[ 6.1254, -0.2220, 2.0859, ..., 2.1761, -0.4139, 2.3858]]], [[[ 3.0994, -3.1537, -4.5812, ..., 0.5706, -0.1613, -3.1982]], [[ 4.1286, -2.4086, -4.1053, ..., -0.5055, -1.7393, -0.1957]], [[ 3.7184, -1.9881, -3.2556, ..., -0.1437, -0.8172, -1.5551]], ..., [[ 1.2867, -6.5618, -5.6180, ..., -1.1909, -0.4927, -2.2320]], [[ 3.5009, -1.4207, -2.9149, ..., -0.1598, -1.0001, -0.5830]], [[ 5.8268, -1.5829, -0.9115, ..., 0.6542, 0.6418, 0.1186]]]]) attn_weights tensor([[[[ 1.0841, 1.8430, 0.8794, ..., 1.2628, 2.1021, 0.9764]], [[ 3.5248, 1.0537, 0.3691, ..., 0.0820, 0.6192, 1.1258]], [[ 3.1316, 0.6286, -1.2704, ..., -2.0116, -2.1302, -2.0924]], ..., [[ 4.3253, -0.1360, -1.4798, ..., -2.0011, -1.2208, -0.5577]], [[ 3.2059, 1.4909, -0.4773, ..., -0.4668, 2.0237, 1.1696]], [[ 3.5501, 2.2611, 0.4616, ..., -0.8171, 3.6068, 2.1540]]], [[[ 1.5256, 0.5924, -0.5749, ..., 0.4915, 1.2377, 0.5609]], [[ 4.2548, -1.6656, -1.4005, ..., -0.2998, -0.9469, -0.5168]], [[ 4.4494, -1.5304, -1.6558, ..., -0.8494, -2.8039, -3.2956]], ..., [[ 4.8504, -0.9693, -1.5547, ..., -1.7634, 0.0252, -0.7409]], [[ 4.5862, 0.4674, -0.2208, ..., -1.1413, 2.3618, 1.8949]], [[ 3.4377, 1.5264, 0.1303, ..., 0.0503, 2.5638, 0.2135]]], [[[ 1.5149, 1.1826, 0.0570, ..., 0.1201, -0.7978, 1.8580]], [[ 3.1321, -0.8058, -1.4748, ..., -2.6312, -0.1964, 1.0913]], [[ 2.7529, -0.3951, -1.7725, ..., -3.5524, -2.9781, 0.7131]], ..., [[ 3.5720, -1.9195, -3.6176, ..., -4.0883, -1.0242, -1.0852]], [[ 2.3894, 0.3337, -0.2839, ..., -2.5247, -0.8229, 1.9734]], [[ 3.2392, 0.2940, -1.5853, ..., -2.0139, -1.6933, 0.7691]]], [[[ 1.4828, -0.2008, 0.2828, ..., 0.6942, -0.1143, 0.3008]], [[ 3.7571, -1.5523, -0.9369, ..., -1.3478, -0.2599, -2.1541]], [[ 3.5673, -1.5836, -2.4207, ..., -2.3134, -1.6305, -2.1913]], ..., [[ 4.7908, -0.4843, -1.3386, ..., -1.5838, -0.9738, 0.6334]], [[ 3.7434, -0.6857, 0.6083, ..., 0.7257, -0.3664, 1.1998]], [[ 3.7037, -1.4447, 0.5543, ..., 0.9349, -2.1045, 1.1571]]], [[[ 1.9156, -0.6574, -1.8922, ..., 1.1923, 1.3388, 0.3209]], [[ 3.7826, -1.0846, -1.9440, ..., 0.0575, -0.0774, -0.1375]], [[ 3.1304, -1.5872, -1.8026, ..., 0.2844, -0.0404, -0.7540]], ..., [[ 4.2530, -1.0363, -2.7154, ..., 0.0894, -0.3275, -1.4394]], [[ 2.4370, -1.7061, -2.1906, ..., 0.4091, 1.5228, 0.7957]], [[ 3.1467, -1.3431, -1.8762, ..., 0.8882, 0.5416, -0.3482]]]]) attn_weights tensor([[[[-1.4281, -3.2213, -2.4366, ..., -1.0147, -1.9967, -3.5470]], [[ 0.0175, 0.2741, -1.3342, ..., 1.7276, -1.2288, 7.4261]], [[-1.9387, -2.4500, -2.3889, ..., -2.0296, -2.1393, -2.2879]], ..., [[-2.2514, -2.6092, -2.6945, ..., -2.4299, -2.0594, -2.1380]], [[-0.4266, -0.8942, -0.8926, ..., -0.6541, -0.6450, 0.8973]], [[-1.3664, -2.0862, -3.2401, ..., -2.8111, -3.2746, -2.3150]]], [[[-1.5392, -4.0947, -2.6730, ..., -3.5129, -2.7164, -3.0911]], [[-1.3296, 0.0985, -1.0148, ..., 0.1321, -0.9743, 5.8580]], [[-2.2208, -3.5322, -2.8953, ..., -3.1943, -3.2420, -2.0118]], ..., [[-2.2309, -2.6197, -2.5109, ..., -2.0886, -2.1562, -1.9428]], [[-0.8197, -1.1185, -1.0043, ..., -0.3474, -0.1060, 0.8705]], [[-1.3414, -2.1352, -3.4650, ..., -2.3939, -3.3622, -2.5302]]], [[[-1.5124, -3.6935, -1.9053, ..., -0.7209, -2.6337, -2.1151]], [[-0.6950, -0.8315, -1.1004, ..., 1.3703, -1.2708, 7.2208]], [[-1.8081, -3.0579, -2.9360, ..., -2.2716, -1.6425, -3.3241]], ..., [[-2.1647, -2.7413, -2.6654, ..., -2.6679, -2.1428, -2.4495]], [[-0.5846, -1.3282, -1.3855, ..., -0.8104, -0.7064, 0.8191]], [[-0.9023, -2.1748, -3.3946, ..., -2.4022, -2.2115, -2.7295]]], [[[-1.5429, -1.9759, -2.1253, ..., -1.1710, -2.1619, -0.6630]], [[ 0.9304, 2.0508, 2.2799, ..., 1.0832, 1.2303, 12.5128]], [[-1.1418, -2.7325, -2.6773, ..., -2.5846, -2.7449, -2.2035]], ..., [[-2.3109, -3.0874, -3.2770, ..., -3.0305, -3.3812, -4.5311]], [[-0.2442, -0.6081, -0.7997, ..., -1.1495, -0.9736, 1.3085]], [[-1.5129, -2.1443, -3.1262, ..., -2.3237, -2.4082, -2.4956]]], [[[-1.2287, -3.0366, -1.8698, ..., -1.3283, -2.0548, -1.1952]], [[-0.6675, -1.8784, -2.2643, ..., 1.4728, -1.2733, 7.6402]], [[-1.9708, -2.7500, -2.7535, ..., -1.8793, -2.5442, -3.1604]], ..., [[-2.4446, -2.9116, -2.9439, ..., -2.4979, -2.3874, -3.0700]], [[-1.0382, -1.4563, -1.7369, ..., -0.5610, -0.5635, 0.8481]], [[-0.9126, -2.5272, -2.6771, ..., -2.2186, -3.2330, -2.6060]]]]) attn_weights tensor([[[[-2.6496, -5.3657, -5.4524, ..., 1.8348, 0.3438, 0.0642]], [[-0.6269, -2.3930, -2.8621, ..., 0.8666, 1.5659, 0.8581]], [[-4.2148, -4.4953, -4.6443, ..., -2.4775, -2.5412, -2.3166]], ..., [[ 1.4284, -0.8324, 0.1296, ..., -0.5415, -0.0367, -0.2746]], [[-3.7189, -2.7611, -2.6901, ..., -0.3227, -0.3823, -0.2398]], [[ 1.1295, 0.6486, -3.7096, ..., -0.7979, -1.5376, 4.5214]]], [[[-1.7024, -4.5684, -4.4690, ..., 0.7602, 2.7770, 0.7830]], [[-0.9133, -2.7910, -3.4397, ..., 2.1323, 1.6683, 0.7596]], [[-4.3543, -4.6366, -4.7731, ..., -2.3489, -2.7650, -2.2778]], ..., [[ 1.3759, -0.7698, 0.3479, ..., -1.2261, -0.0159, -0.4313]], [[-3.7851, -2.7674, -2.6788, ..., -0.3420, -0.4861, -0.1802]], [[-0.2303, -1.0125, -2.8934, ..., 0.4002, -1.3651, 3.4159]]], [[[-2.1361, -4.9415, -5.9041, ..., -0.2583, 0.4116, -0.9579]], [[-0.7761, -2.8224, -3.3523, ..., 0.7301, 1.4436, 0.3024]], [[-4.1994, -4.5906, -4.6846, ..., -2.7782, -2.4061, -2.7136]], ..., [[ 1.0597, -0.6105, 0.3749, ..., -0.9454, -0.0145, -0.4306]], [[-3.8831, -2.8134, -2.7603, ..., -0.6065, -0.3951, -0.5781]], [[ 0.9460, 0.4181, -4.0238, ..., -0.1514, 0.1713, 4.9895]]], [[[-0.5624, -2.2131, -2.3402, ..., 1.4034, 2.6874, 1.5557]], [[-1.4745, -3.2273, -3.4098, ..., 0.9194, 1.1426, 0.5825]], [[-4.2171, -4.3954, -4.5530, ..., -2.5717, -2.9599, -2.2443]], ..., [[ 1.4364, -0.0211, 0.8933, ..., -0.8357, -0.5018, -1.7186]], [[-4.0048, -2.5467, -2.4972, ..., -0.4402, -0.8571, -0.3834]], [[ 0.9886, 1.0614, -0.5872, ..., -0.7062, -0.6683, 4.5825]]], [[[-3.1966, -5.5685, -5.6171, ..., -0.5417, 1.7381, -0.4557]], [[-2.1182, -4.2061, -4.3282, ..., -0.1687, 0.6818, 0.0322]], [[-4.2331, -4.3327, -4.6099, ..., -2.4013, -2.7940, -2.3508]], ..., [[ 0.7955, -0.8115, -0.1344, ..., -0.8668, 0.0270, -1.7518]], [[-3.9174, -2.6253, -2.6436, ..., -0.5285, -0.7876, -0.2779]], [[-0.6271, -0.5412, -3.5885, ..., -1.8429, -3.1531, 4.5034]]]]) attn_weights tensor([[[[ -1.9381, -6.3020, -6.8846, ..., -1.6967, -1.9078, -0.8772]], [[ 2.0708, -1.4903, -2.6370, ..., -1.5922, -3.0341, -2.1805]], [[ -5.2140, -18.8659, -19.8093, ..., -3.5082, -1.3965, -2.6587]], ..., [[ -3.9432, -11.1054, -11.6313, ..., -1.6745, -1.0341, -2.9843]], [[ -2.4247, -4.2109, -4.1555, ..., -0.3361, -0.6546, -0.4384]], [[ -0.2794, -6.0514, -6.1012, ..., -2.5277, -2.3103, -2.3487]]], [[[ -1.3604, -5.8919, -4.8893, ..., -2.2069, -1.5574, -1.9475]], [[ 1.3766, -1.7780, -1.1295, ..., -1.7389, -2.1109, -1.1950]], [[ -5.8538, -19.8085, -20.9071, ..., -2.9943, 0.0567, -3.1584]], ..., [[ -4.7593, -12.1026, -12.5740, ..., -2.7304, -1.8709, -3.3989]], [[ -2.3834, -4.1395, -4.2048, ..., -1.1006, -0.7965, -0.5556]], [[ -0.3438, -6.1671, -6.0592, ..., -2.7057, -2.4162, -2.3709]]], [[[ -1.9351, -5.7425, -6.2317, ..., -2.2076, -0.5901, -2.0473]], [[ 1.2994, -1.2576, -1.7788, ..., -2.1357, -1.7137, -2.0417]], [[ -4.6424, -18.5788, -20.0316, ..., -5.5358, -2.9491, -5.0278]], ..., [[ -3.2150, -10.0987, -10.3927, ..., -2.3505, -3.1304, -2.9262]], [[ -2.3465, -4.0914, -4.0347, ..., -0.9651, -1.1715, -1.1053]], [[ -0.3497, -5.9444, -5.9015, ..., -2.7177, -2.6580, -2.5192]]], [[[ -1.2946, -5.6871, -5.8585, ..., 0.7105, -0.4803, -2.8572]], [[ 1.6471, -0.1104, -2.6949, ..., -1.4442, -1.3673, -2.5544]], [[ -5.1848, -17.8155, -18.1814, ..., -3.9015, -1.7785, -4.1391]], ..., [[ -3.1098, -9.5817, -9.6549, ..., -1.4014, -2.4522, -2.5986]], [[ -2.3664, -3.9769, -4.1029, ..., -1.0721, -1.0079, -0.3386]], [[ -0.2692, -5.9739, -5.9776, ..., -2.6831, -2.7203, -2.1436]]], [[[ -1.3875, -5.5294, -5.8014, ..., -3.4354, -1.4480, -3.1977]], [[ 1.5893, -2.3173, -3.1319, ..., -2.2193, -1.5613, -1.4796]], [[ -4.7442, -18.6906, -20.4974, ..., -3.0066, -0.8622, -3.2910]], ..., [[ -3.8067, -11.4040, -12.0382, ..., -1.4069, -2.8094, -2.5740]], [[ -2.7180, -4.2504, -4.3635, ..., -0.7909, -1.2119, -0.6554]], [[ -0.2909, -5.9242, -6.0875, ..., -2.6154, -2.5766, -2.4170]]]]) attn_weights tensor([[[[ 4.7713, -0.5884, -2.7784, ..., -1.2647, -1.8660, 1.3356]], [[ -2.5874, -8.9435, -9.4873, ..., -5.0268, -3.9301, -5.8771]], [[ -4.9797, -16.2651, -16.4921, ..., -3.2867, -3.8312, -5.5295]], ..., [[ -1.5380, -8.4425, -8.3250, ..., -1.4595, -3.2564, -3.3549]], [[ -0.9631, -8.0867, -7.6376, ..., -3.3449, -2.9275, -1.9376]], [[ -2.7744, -9.5542, -11.1905, ..., -2.9893, -3.3403, -2.9909]]], [[[ 4.4007, -1.4075, -2.0864, ..., -1.6390, -1.7502, 1.6717]], [[ -2.7884, -10.0302, -9.7505, ..., -3.1947, -4.0271, -4.2752]], [[ -4.6749, -15.5843, -17.7281, ..., -4.8759, -4.2767, -5.6742]], ..., [[ -1.4257, -9.0232, -10.3753, ..., -3.6957, -2.9790, -2.4561]], [[ -1.0620, -6.1216, -7.5892, ..., -3.1889, -3.3276, -2.8194]], [[ -2.5489, -10.7447, -12.3278, ..., -4.3854, -5.0343, -3.8942]]], [[[ 4.5760, -0.6000, -3.7781, ..., -1.6902, -1.7037, 2.6663]], [[ -2.6581, -8.3546, -7.8031, ..., -6.2494, -5.4972, -4.5740]], [[ -4.0842, -15.4835, -16.6466, ..., -6.5441, -5.3143, -5.3317]], ..., [[ -1.9323, -8.4375, -8.7444, ..., -1.0937, -4.0049, -4.7078]], [[ -0.8476, -8.0948, -7.7408, ..., -3.8124, -3.8718, -2.7842]], [[ -2.2527, -9.6013, -10.7011, ..., -2.3248, -2.2965, -3.5175]]], [[[ 5.6146, -0.6726, -2.2213, ..., -6.5765, -0.9983, 1.9817]], [[ -2.3487, -9.6512, -9.7047, ..., -5.6379, -3.4066, -5.1759]], [[ -4.6008, -15.4230, -16.2595, ..., -4.8626, -2.1248, -3.3295]], ..., [[ -1.3963, -9.2642, -9.3028, ..., -3.7347, -1.8149, -2.0901]], [[ -0.8792, -7.4885, -7.4908, ..., -4.4436, -3.4826, -3.1568]], [[ -2.2693, -10.4285, -11.5629, ..., -3.4117, -2.9833, -1.9751]]], [[[ 5.1154, 0.1946, -2.4615, ..., -2.3151, -1.0002, 3.5862]], [[ -2.4535, -9.6277, -9.3324, ..., -4.5148, -2.7582, -5.4917]], [[ -4.2479, -19.0312, -20.3969, ..., -5.2387, -1.1487, -3.1581]], ..., [[ -1.8418, -9.4905, -9.1969, ..., -3.9340, -2.1953, -4.8887]], [[ -1.0560, -7.6206, -9.4815, ..., -3.0131, -3.0368, -1.9966]], [[ -2.0539, -10.8503, -12.1636, ..., -5.2969, -4.0412, -2.8199]]]]) attn_weights tensor([[[[-2.4050e+00, -1.2988e+01, -1.3540e+01, ..., -2.3977e+00, -2.1682e+00, -3.9893e+00]], [[-2.8262e+00, -1.0399e+01, -9.4414e+00, ..., -3.9046e+00, -5.4027e+00, -4.6121e+00]], [[ 3.9186e-02, -3.3360e+00, -4.1209e+00, ..., -1.0346e+00, -1.5352e+00, -3.2280e+00]], ..., [[-1.5858e+00, -6.4992e+00, -5.9765e+00, ..., -1.6795e+00, -1.5902e+00, -3.5211e+00]], [[ 1.4881e+00, -2.5255e+00, -3.0415e+00, ..., -3.7536e+00, -2.9567e+00, -2.8214e+00]], [[-7.4655e+00, -3.7763e+01, -4.1331e+01, ..., -3.9758e+00, 1.2086e+01, -3.3721e+00]]], [[[-2.6000e+00, -1.3115e+01, -1.4367e+01, ..., -4.9528e+00, -5.1863e+00, -4.6811e+00]], [[-2.5685e+00, -9.4419e+00, -1.0065e+01, ..., -1.8589e+00, -2.5195e+00, -3.1685e+00]], [[-2.0235e-01, -3.3740e+00, -2.7681e+00, ..., -2.5327e+00, -2.0055e+00, -2.4396e+00]], ..., [[-9.7220e-01, -6.8377e+00, -8.2866e+00, ..., -3.2287e+00, -3.1130e+00, -3.6570e+00]], [[ 1.1699e+00, -3.0879e+00, -2.4918e+00, ..., -1.9622e+00, -1.8925e+00, -2.6610e+00]], [[-4.2210e+00, -4.1241e+01, -3.3556e+01, ..., -6.5807e+00, 1.1310e+01, 4.2689e+00]]], [[[-2.7563e+00, -1.3149e+01, -1.4544e+01, ..., -4.5467e+00, -1.7257e+00, -5.1680e+00]], [[-2.7274e+00, -9.4419e+00, -9.9462e+00, ..., -3.7519e+00, -3.6954e+00, -4.1934e+00]], [[ 8.1528e-02, -2.8504e+00, -3.2200e+00, ..., -3.0695e+00, -2.8044e+00, -4.5030e+00]], ..., [[-1.1424e+00, -5.8553e+00, -6.0814e+00, ..., -1.0683e+00, -1.1345e+00, -3.1036e+00]], [[ 1.3776e+00, -3.0889e+00, -3.5436e+00, ..., -3.3087e+00, -3.1092e+00, -3.0104e+00]], [[-7.5291e+00, -3.8205e+01, -5.0363e+01, ..., -9.8241e+00, 7.2305e+00, -2.5528e+00]]], [[[-1.6739e+00, -1.4282e+01, -1.3143e+01, ..., -4.4875e+00, -1.6488e+00, -2.4901e+00]], [[-2.2365e+00, -1.0652e+01, -1.1025e+01, ..., -3.0042e+00, -2.4388e+00, -2.6217e+00]], [[ 4.5389e-01, -3.9328e+00, -5.3763e+00, ..., -3.1027e+00, -2.0483e+00, -3.0555e+00]], ..., [[-8.3095e-01, -7.5111e+00, -7.3094e+00, ..., -1.6503e+00, -5.7193e-01, -1.2864e+00]], [[ 1.8013e+00, -2.7413e+00, -1.9482e+00, ..., -3.1434e+00, -1.8431e+00, -4.1349e+00]], [[-6.1529e+00, -3.6488e+01, -3.5251e+01, ..., 7.6743e+00, 2.3271e+01, 1.1606e+01]]], [[[-3.1453e+00, -1.4787e+01, -1.4920e+01, ..., -3.8920e+00, -7.9819e-01, -5.5587e+00]], [[-2.4188e+00, -1.1324e+01, -1.0947e+01, ..., -4.6058e+00, -2.7929e+00, -3.8464e+00]], [[ 5.1373e-02, -5.8071e+00, -5.4699e+00, ..., -3.2851e+00, -3.3926e+00, -4.7277e+00]], ..., [[-1.0724e+00, -7.9313e+00, -7.5479e+00, ..., -3.4745e+00, -2.8131e+00, -4.0089e+00]], [[ 1.2575e+00, -5.1179e+00, -4.4075e+00, ..., -4.3542e+00, -1.8438e+00, -3.0782e+00]], [[-3.0182e+00, -4.5519e+01, -4.2038e+01, ..., -1.2749e+01, 2.0505e+01, 9.5799e+00]]]]) attn_weights tensor([[[[ 2.4630, -4.7427, -4.0786, ..., -2.4545, -3.3820, -2.2301]], [[ 4.9665, -8.5334, -3.9460, ..., -3.3348, -5.4631, -2.5225]], [[ 0.5720, -5.7907, -5.4199, ..., -2.0978, -2.8173, -3.1711]], ..., [[ 1.2126, -3.8067, -4.1388, ..., -3.8239, -5.6131, -4.1865]], [[ 1.8923, -0.4506, -2.3035, ..., -2.2882, -2.1840, 0.0781]], [[ 1.2099, -2.3016, -3.0666, ..., -2.7277, -2.2088, -0.1899]]], [[[ 2.3014, -7.1662, -7.3048, ..., -4.7482, -3.6512, -3.4551]], [[ 4.4663, -18.1899, -13.0017, ..., -10.8137, -5.5971, -2.0601]], [[ 0.7328, -5.4563, -7.4586, ..., -0.9275, -1.1243, -3.1205]], ..., [[ 0.7602, -4.3947, -4.2614, ..., -1.8608, -3.1509, -3.0578]], [[ 1.6893, -2.5188, -5.0812, ..., 0.4275, -0.5834, -0.7617]], [[ 0.9849, -5.2216, -5.1865, ..., -2.0257, -1.9496, -0.2676]]], [[[ 1.7751, -6.6430, -5.6183, ..., -2.8956, -3.0512, -1.9365]], [[ 4.6583, -10.8217, -9.0059, ..., -6.8858, -4.4146, -0.6135]], [[ 0.4474, -5.7960, -5.9515, ..., -2.8365, -2.5496, -2.6250]], ..., [[ 1.0433, -3.8553, -4.2843, ..., -3.7525, -4.1603, -3.7616]], [[ 1.5845, -0.5167, -0.4392, ..., -0.2556, -0.9907, -1.3768]], [[ 1.1035, -4.6810, -4.5536, ..., -3.1291, -2.5333, 0.3107]]], [[[ 3.5207, -4.9074, -3.9626, ..., -5.6938, -2.5436, -1.4855]], [[ 4.9635, -11.0777, -10.5866, ..., -11.0396, -6.2495, -1.8574]], [[ 1.0697, -6.6844, -6.7171, ..., -2.4295, -1.3018, -3.1946]], ..., [[ 1.3879, -3.1802, -4.5739, ..., -4.2828, -4.6268, -7.0453]], [[ 2.8183, -1.0967, -1.3722, ..., -2.8869, 0.0284, -1.4453]], [[ 1.0691, -2.2733, -3.0695, ..., -2.3530, -2.5758, -2.3564]]], [[[ 2.3700, -6.5195, -8.2288, ..., -1.6865, -2.3953, -2.4370]], [[ 4.1417, -20.7498, -18.5705, ..., -10.1283, -6.7628, -4.2875]], [[ 0.8824, -6.7615, -7.6296, ..., -1.7141, -0.6494, -2.7917]], ..., [[ 1.0158, -4.1629, -5.9047, ..., -3.7454, -3.4264, -5.1232]], [[ 2.6486, -1.5833, -3.3252, ..., -0.4425, -1.0637, 0.1334]], [[ 0.9039, -5.4087, -5.7136, ..., -2.4960, -2.3716, -2.4647]]]]) attn_weights tensor([[[[ -0.4748, -4.8102, -4.1272, ..., -0.5577, -2.2511, -3.8195]], [[ 1.5180, -6.6972, -7.2445, ..., -2.6371, -3.3984, -2.8107]], [[ 0.4394, -3.0562, -3.5402, ..., -2.1794, -2.4219, -2.0041]], ..., [[ 4.5533, -4.5443, -1.7148, ..., -1.5936, -4.3460, 0.7973]], [[ 3.3193, -3.6878, -3.1603, ..., -2.3429, -2.7433, -1.3162]], [[ -0.3179, -4.5390, -5.1441, ..., -0.5884, -0.0636, -0.9975]]], [[[ -0.7822, -6.2989, -6.5152, ..., -3.0917, -0.3806, -2.5076]], [[ -0.2011, -7.0420, -6.0895, ..., -2.7423, -3.0660, -4.1669]], [[ 0.2791, -3.9746, -3.9076, ..., -2.7883, -3.5870, -3.0827]], ..., [[ 4.3626, -11.9303, -8.7514, ..., -4.9004, -2.9670, -0.1896]], [[ 2.8786, -5.0005, -4.6205, ..., -2.9008, -2.9527, -2.3784]], [[ -0.8647, -4.9950, -6.9601, ..., -0.7496, -1.5685, -2.4903]]], [[[ -1.4637, -6.3446, -6.1097, ..., -2.1004, -1.1488, -3.7648]], [[ 0.1926, -5.4750, -6.0835, ..., -4.8716, -3.6248, -3.8851]], [[ 0.2864, -3.5262, -3.5627, ..., -3.8463, -4.0095, -4.1321]], ..., [[ 4.6807, -7.6689, -4.9480, ..., -3.8963, -2.1956, -1.0085]], [[ 2.7757, -4.1033, -3.7134, ..., -1.6901, -1.8728, -2.3520]], [[ -0.9603, -6.1414, -6.6938, ..., -0.7096, 0.1781, -2.1416]]], [[[ 0.0416, -5.6666, -5.0371, ..., -2.3019, -0.0695, -2.5374]], [[ 1.2678, -5.5886, -7.1038, ..., -3.9290, -3.7925, -3.0555]], [[ 0.6899, -3.7791, -3.7573, ..., -4.2092, -3.8566, -4.5238]], ..., [[ 5.3943, -8.5080, -6.4631, ..., -6.0746, -4.7732, -4.0125]], [[ 3.2735, -2.8467, -2.2729, ..., -3.1640, -3.2258, -2.0362]], [[ 0.4016, -7.5752, -7.8752, ..., -2.3168, -0.9625, -1.7725]]], [[[ -0.9994, -8.5576, -7.2599, ..., -1.4894, 0.7923, -2.0373]], [[ 1.3069, -8.2740, -8.4648, ..., -1.7042, -2.2579, -2.4175]], [[ 0.6164, -4.8323, -4.9175, ..., -2.8297, -3.1720, -4.0696]], ..., [[ 5.2494, -17.2545, -11.9394, ..., -8.0851, -1.8216, -2.2139]], [[ 3.0470, -4.0350, -4.6370, ..., -1.2016, -0.8923, 0.2283]], [[ -0.7351, -6.2616, -7.0518, ..., -3.5726, -0.7795, -2.8296]]]]) attn_weights tensor([[[[ -0.1440, -8.8924, -8.4532, ..., -1.9492, -1.6340, -2.1003]], [[ 3.2162, -3.0067, -1.2035, ..., -3.9296, -4.7543, -2.0017]], [[ 7.0271, -3.9012, -1.5759, ..., -2.0421, -2.2693, -0.2996]], ..., [[ 0.2991, -4.7833, -4.2541, ..., -1.0963, -2.2053, -2.1612]], [[ 4.5482, -1.8817, -1.6590, ..., -1.3505, -4.8757, 0.5423]], [[ 3.2207, -4.3508, -3.7281, ..., -1.8891, -3.2809, -1.7074]]], [[[ -0.3356, -9.7547, -9.1851, ..., -3.4635, -2.2903, -4.7659]], [[ 2.6556, -3.9456, -4.9685, ..., -1.5051, -2.2719, -2.3929]], [[ 6.3708, -6.1782, -4.8662, ..., -3.9367, -2.3197, 0.6433]], ..., [[ -0.0522, -3.4539, -3.9347, ..., 0.8468, -0.1421, -1.9242]], [[ 2.9878, -4.7488, -3.4269, ..., -0.4089, 0.2536, -0.5669]], [[ 3.1832, -3.7901, -3.9944, ..., -4.3554, -4.2825, -1.3704]]], [[[ -0.9108, -7.7502, -9.7730, ..., -3.0533, -0.6373, -2.0159]], [[ 2.0493, -2.1882, -0.7760, ..., -1.6989, -1.9026, -1.1524]], [[ 6.3273, -5.7650, -5.5699, ..., -0.8068, -0.8047, 2.2160]], ..., [[ -0.2699, -5.4177, -5.3370, ..., -2.4133, -2.1464, -2.2319]], [[ 3.4783, -4.0152, -3.2538, ..., -1.4800, -0.9814, 0.8552]], [[ 2.5995, -4.2291, -6.0391, ..., -2.5249, -2.0699, -1.9560]]], [[[ 0.3756, -10.0354, -10.8232, ..., -5.3428, -1.6888, -3.3343]], [[ 4.5863, -0.7371, -0.1727, ..., -2.2133, -3.1090, -1.5146]], [[ 7.0371, -3.4857, -4.1259, ..., -8.9965, -5.9858, -0.8197]], ..., [[ 0.8182, -5.1506, -5.1153, ..., -1.8078, -1.3412, -2.2536]], [[ 5.6551, -1.8879, -3.0579, ..., -7.0655, -5.3444, -4.7315]], [[ 3.4394, -4.3235, -5.2355, ..., -5.6744, -3.6132, -3.1480]]], [[[ -0.8121, -10.9193, -10.0819, ..., -3.9608, 1.3431, -2.6818]], [[ 4.3581, -3.7886, -5.3410, ..., -1.6167, -3.2748, -0.2185]], [[ 6.9398, -6.5505, -6.9585, ..., -2.3503, 0.0830, 1.4319]], ..., [[ 0.3133, -5.6202, -6.4323, ..., -2.7132, -0.7043, -2.7929]], [[ 5.2964, -8.7935, -7.2074, ..., -4.6453, 0.1351, -0.9269]], [[ 3.3510, -3.2333, -5.3502, ..., -1.0819, -0.7394, -0.2276]]]]) attn_weights tensor([[[[ 0.8801, -3.2981, -3.1753, ..., -2.5204, -2.0549, -1.4652]], [[ 5.4076, -1.1576, -1.5845, ..., -1.0194, -1.5231, 1.0506]], [[ 0.9848, -0.1306, -0.7278, ..., -0.9890, 0.2402, -0.7763]], ..., [[ 1.1314, -5.8858, -3.4895, ..., -5.8092, -3.9727, -2.5029]], [[ 1.3356, -4.0384, -2.7687, ..., -2.8106, -2.6884, -1.0460]], [[ 0.9077, -4.1266, -2.9965, ..., -3.1892, -3.8632, -3.5047]]], [[[ 1.1438, -4.1021, -3.6526, ..., -1.7471, -1.3496, -1.6172]], [[ 4.1964, -4.5546, -5.3347, ..., -0.6208, 0.2772, 1.0338]], [[ 1.5722, -2.4246, -2.6621, ..., -0.6230, -0.8496, -0.0283]], ..., [[ 1.2005, -5.7795, -5.2444, ..., -1.9416, -1.7892, -2.0715]], [[ 1.1188, -4.8931, -4.4701, ..., -0.5668, -0.9994, -0.3537]], [[ 0.5282, -3.7466, -3.6830, ..., -3.3009, -3.1002, -3.1452]]], [[[ 0.8432, -4.1809, -3.7906, ..., -3.3999, -1.7383, -2.1497]], [[ 4.3691, -3.4342, -3.6947, ..., -2.0871, -0.3716, 0.5150]], [[ 1.1827, -1.2453, -2.0631, ..., -0.8769, -0.6431, -0.9734]], ..., [[ 0.6784, -4.8798, -4.1122, ..., -2.7416, -1.8487, -1.6385]], [[ 0.8969, -5.1603, -5.1807, ..., -2.3475, -1.5174, -0.8731]], [[ 0.5596, -3.8176, -3.5557, ..., -2.5842, -3.6510, -2.7279]]], [[[ 1.7963, -2.8065, -2.6918, ..., -3.0205, -2.4694, -2.2128]], [[ 5.7365, -1.3410, -4.7206, ..., -4.6739, -1.8890, -2.1628]], [[ 2.1702, -1.1614, -1.4722, ..., -2.7181, -0.8846, -2.5698]], ..., [[ 1.2159, -2.5643, -1.6933, ..., -2.5051, -3.1459, -1.4556]], [[ 1.4907, -3.3047, -3.0344, ..., -3.5230, -2.1171, -2.1877]], [[ 2.0004, -3.3067, -4.1536, ..., -4.1107, -4.0601, -5.0415]]], [[[ 1.3245, -3.8960, -4.0452, ..., -2.9895, -2.0329, -2.2613]], [[ 5.4956, -2.5646, -4.2682, ..., -0.9204, 0.1330, 2.7147]], [[ 2.2678, -2.1163, -3.4272, ..., -2.4309, -0.9333, -1.8060]], ..., [[ 1.9667, -5.2614, -5.3011, ..., -1.1771, -1.3660, -0.6832]], [[ 1.2020, -4.7053, -5.4833, ..., -1.2817, -1.3293, -0.0360]], [[ 0.9085, -3.8043, -4.8359, ..., -3.8782, -2.0501, -2.4445]]]]) attn_weights tensor([[[[ 2.5752, -3.4684, -3.6712, ..., -5.2965, -4.2938, -2.3116]], [[ 4.6937, -1.5008, -1.4247, ..., -1.8481, -1.4896, 0.7126]], [[ 2.1775, -4.4806, -3.0297, ..., -5.6431, -3.9717, -2.0498]], ..., [[ 4.5311, -2.3259, -2.0000, ..., -3.9248, -3.4859, -2.0506]], [[ 2.0456, -5.7189, -4.8530, ..., -2.7508, -1.4416, -0.6981]], [[ 3.8377, -0.8027, -2.0958, ..., -2.1562, -1.7918, -1.4371]]], [[[ 2.3049, -4.0392, -4.5806, ..., -2.3531, -0.7147, -1.8396]], [[ 3.5913, -3.1931, -3.5387, ..., -1.4897, -0.7950, 0.0365]], [[ 2.5124, -3.8608, -4.4178, ..., -1.0484, -2.0671, -2.2849]], ..., [[ 4.8873, -3.0118, -3.6475, ..., -1.6305, -1.4194, -0.3992]], [[ 1.6347, -5.3816, -5.4440, ..., -0.3686, -0.4984, -2.5264]], [[ 3.5652, -2.4822, -3.1003, ..., -2.6833, -2.5226, -1.5074]]], [[[ 1.5059, -3.4242, -3.2741, ..., -2.3514, -2.2669, -3.3614]], [[ 4.0696, -2.5903, -3.5345, ..., -1.5637, -0.8486, 0.5519]], [[ 1.1113, -4.2947, -3.9602, ..., -3.2700, -2.8721, -3.7498]], ..., [[ 4.2245, -3.1750, -3.1002, ..., -2.4901, -1.7919, -0.4263]], [[ 1.4716, -5.9927, -6.9433, ..., -2.6268, -0.5821, -1.7046]], [[ 3.5621, -2.0131, -4.0940, ..., -2.6437, -1.1451, -0.9558]]], [[[ 3.5484, -1.7593, -2.6260, ..., -3.7405, -1.7185, -1.4009]], [[ 5.1750, 0.2768, -3.4800, ..., -4.8651, -1.7844, -1.4367]], [[ 3.8965, -2.7327, -2.0288, ..., -3.5165, -3.3639, -1.9386]], ..., [[ 4.3558, -1.6671, -3.5621, ..., -5.6925, -4.0363, -0.8553]], [[ 2.5802, -5.7067, -6.4480, ..., -4.3092, -0.4441, -1.5989]], [[ 3.4714, -0.9151, -1.9790, ..., -4.5803, -1.9787, -2.7990]]], [[[ 2.2159, -4.6768, -4.7673, ..., 0.0333, -1.5360, -0.2242]], [[ 4.0229, -3.0155, -4.0238, ..., -2.4948, -0.6580, -0.1021]], [[ 2.2139, -2.9440, -3.5035, ..., -1.9385, -2.1182, -0.3913]], ..., [[ 4.8873, -3.2778, -3.3276, ..., -1.6168, -0.9144, 0.6265]], [[ 1.3855, -7.3600, -6.9997, ..., -3.1057, -0.0562, -1.5469]], [[ 3.7992, -1.6822, -4.0775, ..., -0.5021, -1.2977, -0.1155]]]]) attn_weights tensor([[[[ 2.7832, -2.9751, -3.2733, ..., -4.7759, -4.2548, -2.4369]], [[ 4.1879, -2.1211, -2.7329, ..., -3.7798, -2.9822, -1.0253]], [[ 3.5063, -0.8913, -1.7540, ..., -3.5212, -2.4684, -1.0341]], ..., [[ 0.9161, -4.7194, -4.0489, ..., -0.7937, -2.3366, -0.4455]], [[ 3.6865, -1.6144, -1.4843, ..., -3.7150, -3.2897, -1.4589]], [[ 3.4332, -1.5500, -2.5516, ..., -4.0038, -2.2152, 0.8759]]], [[[ 2.8994, -3.5014, -3.2150, ..., -3.4440, -3.1017, -2.8197]], [[ 4.3922, -2.5400, -3.1361, ..., -1.9377, -0.6940, 1.1732]], [[ 3.2783, -2.0611, -2.2364, ..., -0.2387, -1.5263, -0.7225]], ..., [[ 1.0170, -5.9209, -4.3398, ..., -1.6440, 0.1011, -0.7425]], [[ 3.3598, -1.6753, -2.0781, ..., -1.1938, -2.8105, -2.0118]], [[ 5.3200, -0.4171, 0.2627, ..., 1.4642, 3.0073, 0.9873]]], [[[ 2.1859, -3.0367, -4.3632, ..., -3.3800, -2.5263, -2.7786]], [[ 3.5751, -2.7930, -3.8996, ..., -1.3575, -1.6949, -0.6037]], [[ 3.2126, -1.9185, -3.1703, ..., -3.3463, -0.9115, -0.7097]], ..., [[ 1.2836, -4.7453, -6.7324, ..., -2.7813, -0.7505, -1.7308]], [[ 3.1187, -2.3555, -2.6921, ..., -2.5120, -1.5078, -1.1809]], [[ 3.7037, -1.8387, -1.8851, ..., -0.0475, 3.8746, 2.0535]]], [[[ 3.0866, -3.1095, -3.0749, ..., -3.1801, -2.9594, -1.6669]], [[ 4.6430, -1.4185, -1.9262, ..., -0.4128, -2.2400, 0.5677]], [[ 3.4294, -0.7609, -0.7904, ..., -2.9509, -2.6887, -1.9452]], ..., [[ 1.4332, -3.8902, -7.3439, ..., -1.7526, -1.9196, -3.1932]], [[ 3.5662, -2.5330, -1.7889, ..., -1.8655, -2.7895, -1.4493]], [[ 5.9243, 0.0759, 1.1221, ..., -0.0856, 1.5063, 1.7283]]], [[[ 3.1739, -3.6296, -4.8259, ..., -1.2028, -3.5666, -1.3360]], [[ 5.0430, -2.5175, -4.1599, ..., -1.9986, -0.4288, 1.6384]], [[ 4.1871, -1.4657, -2.4774, ..., -0.5115, -0.0544, 1.3058]], ..., [[ 1.2959, -8.6599, -6.5504, ..., -1.6844, -0.2092, -2.1046]], [[ 4.2136, -2.5391, -3.7906, ..., -2.1634, -0.9944, -0.8211]], [[ 5.3961, -1.4976, -1.7342, ..., -0.0215, 3.6963, 3.1991]]]]) attn_weights tensor([[[[ 1.4957, 2.0336, 1.4084, ..., 1.1137, 0.5076, 2.1722]], [[ 3.5459, 0.3948, -1.4527, ..., -0.6490, -1.4374, 1.6051]], [[ 3.3137, 0.4961, -1.2463, ..., -2.6175, -2.7444, 0.2395]], ..., [[ 4.0111, -1.2600, -2.9249, ..., -1.7348, -2.7100, -0.8385]], [[ 3.3665, 0.9898, -0.4415, ..., -1.3561, -1.4291, 1.6676]], [[ 3.2593, 1.2006, -1.2420, ..., -1.6082, -2.0406, 0.9962]]], [[[ 1.6330, -0.5495, -1.1462, ..., 0.8483, -0.8012, 0.1300]], [[ 3.5320, -0.9848, -1.0645, ..., -0.3887, -0.2353, 0.1180]], [[ 3.4809, -1.3115, -1.4649, ..., -2.4937, -3.3284, -2.0673]], ..., [[ 4.8732, -0.7493, -1.2217, ..., -0.1376, -1.1767, 0.0897]], [[ 3.8201, -0.4793, -0.8534, ..., 0.4815, 0.1187, 0.7001]], [[ 3.3614, -0.1134, 0.4369, ..., 1.0039, 1.1066, 0.6712]]], [[[ 1.7499, -0.1765, -0.8297, ..., -0.9219, 0.4408, -0.4553]], [[ 3.7127, -1.3509, -1.8696, ..., 0.1214, 1.5132, 0.5941]], [[ 3.0528, -1.2313, -1.9537, ..., -2.4605, 0.1815, -0.9730]], ..., [[ 3.9013, -2.1512, -4.0475, ..., -1.1524, -0.8769, -0.3810]], [[ 2.7367, -0.3554, -0.7697, ..., -0.3843, 2.2083, 0.6191]], [[ 3.2340, -0.4513, -2.0524, ..., -1.6919, 1.1451, -0.1611]]], [[[ 1.1702, 0.2698, 0.1128, ..., 0.2768, 0.8163, -1.2287]], [[ 3.3702, 0.8744, 0.1897, ..., -0.2436, -0.8410, 0.2284]], [[ 2.9019, -0.2588, -1.5536, ..., -2.0740, -2.9042, -1.8297]], ..., [[ 4.3197, -0.5223, -1.6211, ..., -0.8459, -1.2204, -0.3090]], [[ 3.6783, 1.0967, 0.5478, ..., -0.1309, -1.0810, 0.0728]], [[ 3.2707, 2.0546, 0.9360, ..., 1.5539, 0.6139, 1.7231]]], [[[ 1.5435, -0.9647, -1.6972, ..., 0.7205, -0.6788, 0.2091]], [[ 4.0030, -1.2022, -2.1034, ..., -0.8276, 0.1983, -0.5546]], [[ 3.5415, -0.9038, -1.7825, ..., -0.0918, -0.0958, -0.3204]], ..., [[ 4.8647, -1.5467, -2.7443, ..., -1.0704, -1.8563, 0.0293]], [[ 2.9273, -1.5496, -1.9281, ..., 0.6416, 1.5709, 1.2521]], [[ 2.0610, -0.3603, -1.3111, ..., -0.0107, 1.2028, 0.9712]]]]) attn_weights tensor([[[[-1.7093, -4.2342, -2.9473, ..., -2.8430, -3.4111, -3.9650]], [[-2.5675, -0.9255, -3.2506, ..., -2.7049, -0.4796, 4.1244]], [[-2.7185, -3.2182, -3.3189, ..., -2.9429, -1.8400, -3.7332]], ..., [[-2.0198, -2.4630, -2.3944, ..., -1.9700, -1.8321, -1.9795]], [[-0.5847, -1.1260, -1.4852, ..., -0.8366, -0.4232, 0.2328]], [[-1.6272, -2.4178, -3.6437, ..., -3.0236, -2.6310, -2.4139]]], [[[-1.8473, -3.6602, -3.0561, ..., -2.6408, -1.8255, -2.5319]], [[ 0.7485, -0.4050, -0.2617, ..., 0.4810, -1.2199, 9.5416]], [[-1.9842, -3.3430, -2.3993, ..., -1.9861, -1.9193, -2.9835]], ..., [[-2.6641, -3.3922, -3.4101, ..., -3.0860, -2.7527, -3.2435]], [[-1.1779, -1.6784, -1.7667, ..., -1.1517, -0.8672, 0.7590]], [[-1.2542, -2.0846, -3.0266, ..., -2.2662, -3.4735, -1.9843]]], [[[-0.9819, -2.8574, -3.0683, ..., -2.2333, -2.9942, -2.1385]], [[ 3.4938, -0.4210, 2.2287, ..., -0.7886, 0.8234, 8.6073]], [[-0.8932, -2.4712, -1.6361, ..., -2.3502, -2.1084, -1.1507]], ..., [[-2.8760, -3.3481, -3.5491, ..., -3.0502, -3.3232, -4.2272]], [[-0.2279, -0.9810, -1.0297, ..., -0.6042, -0.6031, 1.2607]], [[-1.7971, -1.6729, -3.0682, ..., -2.0920, -2.6886, -3.1349]]], [[[-1.5816, -4.2140, -2.9797, ..., -2.7858, -2.0235, -3.4260]], [[ 0.9433, -1.0997, 0.4871, ..., -2.7172, -4.8113, 5.8958]], [[-2.0337, -3.0946, -2.5908, ..., -2.3714, -2.0242, -2.3967]], ..., [[-2.2511, -2.8836, -2.7793, ..., -2.7804, -2.5130, -2.6798]], [[-0.3310, -1.0977, -0.9080, ..., -0.8804, -1.2835, 1.2798]], [[-1.4951, -2.5328, -3.3594, ..., -2.6449, -2.5482, -3.2047]]], [[[-1.6625, -3.5964, -2.7439, ..., -3.0250, -2.4444, -3.5909]], [[-2.2714, 0.5130, -2.2649, ..., -3.2609, -3.7607, 5.5884]], [[-1.7306, -2.4162, -2.6983, ..., -2.7776, -2.5054, -2.1680]], ..., [[-2.0375, -2.4502, -2.5414, ..., -2.0229, -2.3264, -1.8905]], [[-0.7176, -0.8522, -1.2445, ..., -0.4096, -1.1872, 0.7615]], [[-1.6542, -2.4372, -3.5490, ..., -2.9212, -2.9006, -3.3951]]]]) attn_weights tensor([[[[-0.7997, -4.3075, -4.4826, ..., 0.3852, 1.4661, 1.3301]], [[-0.6214, -2.6510, -3.1095, ..., 0.9424, 1.0678, 0.9361]], [[-4.1490, -4.4656, -4.5725, ..., -2.4846, -2.3231, -2.5214]], ..., [[ 1.4892, -0.6431, 0.0375, ..., -0.0572, -0.2922, 0.4037]], [[-3.7787, -2.7611, -2.6831, ..., -0.3779, -0.2570, -0.5271]], [[ 0.0372, -0.6830, -3.6567, ..., -1.7808, -0.9823, 3.2822]]], [[[-2.3263, -5.0547, -5.0791, ..., 3.3893, 2.1269, 0.2476]], [[-1.1848, -3.3618, -3.6914, ..., 1.3106, 1.5575, 1.0239]], [[-4.2744, -4.4856, -4.6867, ..., -2.7641, -2.3853, -2.4214]], ..., [[ 1.0801, -0.5345, 1.0397, ..., 0.5282, -0.5718, -1.5355]], [[-3.8790, -2.6560, -2.6405, ..., -0.5540, -0.3195, -0.3454]], [[ 1.3319, 0.6291, -2.2743, ..., -1.1914, -1.3355, 5.8336]]], [[[-1.0429, -3.3451, -4.5225, ..., 0.3345, 2.0910, -0.0145]], [[-1.0498, -3.4426, -3.8401, ..., 0.5088, 0.3891, -0.4413]], [[-4.0310, -4.3853, -4.4951, ..., -2.3283, -2.7188, -2.0658]], ..., [[ 1.2423, -0.3706, 0.2271, ..., -0.7585, -0.5582, -0.1018]], [[-3.8412, -2.4389, -2.3848, ..., -0.3237, -0.5039, -0.1759]], [[-1.2971, -1.4833, -5.1704, ..., -2.8608, -3.2028, 2.7329]]], [[[-1.5783, -3.9083, -2.7409, ..., 2.0092, 1.1881, -0.4532]], [[-1.4390, -3.0372, -3.9990, ..., 0.7232, 0.9619, 0.8210]], [[-4.3708, -4.5303, -4.6704, ..., -3.0999, -2.2966, -2.4373]], ..., [[ 0.9761, -0.8803, 0.1634, ..., -0.2958, -1.6863, 0.2080]], [[-3.5444, -2.8414, -2.6902, ..., -1.0074, -0.4273, -0.3642]], [[ 0.8010, 0.0328, -1.5576, ..., -1.9277, -3.6152, 4.2152]]], [[[-2.6011, -5.5887, -6.3129, ..., 1.5167, 3.0873, -0.1563]], [[-0.8658, -2.6899, -3.1524, ..., 1.3278, 1.0778, 0.7898]], [[-4.1319, -4.3639, -4.5475, ..., -2.6764, -2.3589, -2.5855]], ..., [[ 1.2661, -0.9325, -0.0467, ..., 0.0740, -1.1892, -1.2453]], [[-3.6843, -2.7099, -2.6336, ..., -0.7553, -0.3100, -0.7171]], [[ 1.5434, 0.6108, -3.0151, ..., 0.6794, -4.1183, 3.6719]]]]) attn_weights tensor([[[[ -1.5963, -6.0630, -6.4689, ..., -1.7658, -0.2358, -2.4604]], [[ 1.4338, -1.3099, -1.7878, ..., -2.6063, -1.8545, -2.5724]], [[ -5.8466, -19.8745, -22.1640, ..., -2.9411, -0.9656, -4.2846]], ..., [[ -3.0423, -10.4067, -10.7548, ..., -1.0824, -1.7292, -2.8417]], [[ -2.2197, -4.1225, -4.0605, ..., -0.7901, -0.5843, -1.0184]], [[ -0.2411, -6.0804, -6.0618, ..., -2.4327, -2.3190, -2.4275]]], [[[ -1.4974, -5.8706, -5.3745, ..., -2.0679, -2.5172, -1.6099]], [[ 1.3406, -2.0531, -1.3469, ..., -1.7168, -0.6187, -0.2365]], [[ -6.0317, -19.3690, -19.7383, ..., -2.7827, -2.0897, -3.3997]], ..., [[ -3.8465, -11.1559, -11.4479, ..., -2.2371, -2.9841, -2.0375]], [[ -2.5931, -4.0636, -4.2344, ..., -0.8937, -0.7711, -0.5498]], [[ -0.2652, -6.0333, -6.0259, ..., -2.4667, -2.3399, -2.1534]]], [[[ -1.1502, -5.2276, -5.4031, ..., -0.6988, -0.9878, -2.6114]], [[ 1.0372, -1.8187, -2.2232, ..., -2.4849, -2.4837, -0.3680]], [[ -3.9640, -15.6447, -18.3613, ..., -3.8897, -1.8758, -3.5872]], ..., [[ -3.5407, -10.1001, -10.3161, ..., -3.4553, -1.4425, -1.8552]], [[ -2.4486, -3.9158, -3.9564, ..., -1.2106, -1.3151, -0.6087]], [[ -0.1521, -5.6306, -5.5242, ..., -2.6600, -2.5927, -2.0995]]], [[[ -1.5201, -5.8250, -6.1142, ..., -0.2622, -1.3522, -1.7256]], [[ 2.1400, 0.4330, -1.1308, ..., -1.4673, -1.1337, -2.5047]], [[ -5.9080, -20.3307, -22.0196, ..., -4.0300, -2.2958, -5.2312]], ..., [[ -4.0813, -11.5870, -13.1508, ..., -3.9976, -0.8318, -2.3643]], [[ -2.6704, -4.2721, -4.1879, ..., -1.1045, -0.4774, -0.6363]], [[ -0.3093, -6.1848, -6.2534, ..., -2.8376, -2.2626, -2.3044]]], [[[ -1.6201, -5.8172, -5.9481, ..., -1.6577, -1.0345, -0.2625]], [[ 1.7097, -1.8070, -2.1694, ..., -1.7897, -1.4113, -0.8094]], [[ -4.9576, -20.4654, -22.9035, ..., -1.9035, 0.4919, -3.2248]], ..., [[ -3.7650, -12.0977, -12.7866, ..., -3.0188, -1.4941, -3.3275]], [[ -2.5579, -4.0650, -4.3238, ..., -1.2165, -0.6033, -1.0028]], [[ -0.3195, -6.1286, -6.2705, ..., -2.5579, -2.4283, -2.4334]]]]) attn_weights tensor([[[[ 4.5153, -0.9854, -2.4402, ..., -3.9164, -2.9112, 0.9485]], [[ -2.6122, -9.0365, -9.5436, ..., -3.4561, -4.3234, -3.5572]], [[ -4.5845, -17.5363, -18.4982, ..., -6.0051, -4.3236, -5.2067]], ..., [[ -2.3198, -10.1268, -10.5598, ..., -4.6070, -2.5213, -3.3259]], [[ -1.0053, -8.8338, -8.8788, ..., -3.3110, -2.9141, -2.3431]], [[ -2.6677, -10.9591, -12.7834, ..., -3.6790, -1.7437, -3.9797]]], [[[ 4.4294, -1.4434, -3.0419, ..., -2.5641, -2.2278, 2.5128]], [[ -2.4692, -9.4049, -9.1114, ..., -2.9609, -3.6558, -3.9663]], [[ -3.9441, -15.5268, -17.8033, ..., -3.9043, -3.0311, -3.6170]], ..., [[ -1.3644, -8.7972, -10.1199, ..., -2.4510, -1.0275, -2.4094]], [[ -0.7402, -6.7212, -7.6914, ..., -3.6486, -3.8894, -2.3459]], [[ -2.0614, -9.7739, -11.6054, ..., -4.0810, -1.9621, -2.1227]]], [[[ 4.8772, 0.3921, -1.7561, ..., -2.1597, -2.0790, 2.7451]], [[ -2.4357, -8.1047, -8.0129, ..., -4.3604, -4.7439, -4.8582]], [[ -3.4914, -15.0953, -17.1029, ..., -4.9926, -2.8599, -4.6060]], ..., [[ -1.6142, -8.0526, -8.1558, ..., -3.3650, -5.2535, -3.5167]], [[ -0.8365, -7.5945, -8.1992, ..., -3.5426, -2.6473, -1.6813]], [[ -2.0278, -9.7322, -11.5762, ..., -2.0754, -1.6865, -4.1133]]], [[[ 5.0108, -0.9227, -2.1676, ..., -2.6005, -6.8824, 2.6102]], [[ -2.5591, -10.0203, -10.2851, ..., -3.3386, -5.2953, -3.9012]], [[ -5.0330, -18.0602, -22.3131, ..., -4.8423, -2.8516, -4.1540]], ..., [[ -2.3071, -10.1891, -10.8345, ..., -1.6139, 0.0505, -3.3984]], [[ -1.0714, -7.9067, -7.7625, ..., -4.4745, -2.8827, -2.2610]], [[ -2.8495, -10.4055, -12.3183, ..., -4.0186, -1.6582, -3.6632]]], [[[ 4.6167, -1.2391, -2.7869, ..., -1.4345, -0.8171, -2.0954]], [[ -2.5849, -9.6656, -10.0126, ..., -3.1896, -5.5629, -4.3042]], [[ -4.5068, -20.1241, -21.3064, ..., -1.6153, -4.5320, -5.8700]], ..., [[ -1.5537, -10.2839, -10.6916, ..., -2.3599, -5.1768, -3.1200]], [[ -0.9069, -8.9591, -9.9272, ..., -2.9650, -3.5291, -1.4644]], [[ -2.5393, -12.2295, -14.3574, ..., -3.9149, -1.6693, -4.2450]]]]) attn_weights tensor([[[[-2.8702e+00, -1.3723e+01, -1.4966e+01, ..., -3.4550e+00, -1.6580e+00, -4.2448e+00]], [[-2.7843e+00, -1.1006e+01, -1.0868e+01, ..., -5.4885e+00, -3.4661e+00, -4.3731e+00]], [[-1.8516e-01, -2.9580e+00, -3.7680e+00, ..., -2.0088e+00, -1.8663e+00, -3.3121e+00]], ..., [[-1.2878e+00, -6.9980e+00, -7.0936e+00, ..., -2.3526e+00, -2.3766e+00, -3.0936e+00]], [[ 1.3101e+00, -2.9535e+00, -2.9518e+00, ..., -2.5168e+00, -2.8450e+00, -2.0729e+00]], [[-7.4031e+00, -4.1641e+01, -5.3534e+01, ..., 5.4832e-01, 1.3276e+01, 5.6096e+00]]], [[[-1.3060e+00, -1.3562e+01, -1.3011e+01, ..., -5.4419e+00, -4.5040e+00, -4.5959e+00]], [[-2.0505e+00, -9.3319e+00, -8.7886e+00, ..., -1.8930e+00, -1.9155e+00, -2.5399e+00]], [[ 7.7174e-03, -3.7655e+00, -2.8122e+00, ..., -1.9996e+00, -2.4823e+00, -1.2011e+00]], ..., [[-6.5476e-01, -7.4258e+00, -7.8748e+00, ..., -2.5440e+00, -1.6358e+00, -3.2478e+00]], [[ 1.4518e+00, -3.4555e+00, -2.5592e+00, ..., -2.7917e+00, -2.6507e+00, -3.8610e+00]], [[-7.7824e+00, -4.2258e+01, -3.8984e+01, ..., -5.9503e-02, 9.5560e+00, 9.5760e-01]]], [[[-2.7708e+00, -1.2092e+01, -1.3262e+01, ..., -1.6498e+00, -3.7264e+00, -4.3417e+00]], [[-2.0769e+00, -1.0051e+01, -1.0026e+01, ..., -3.9534e+00, -3.5661e+00, -3.1627e+00]], [[-5.4882e-02, -2.6913e+00, -3.3352e+00, ..., -1.7731e+00, -3.9057e+00, -4.0503e+00]], ..., [[-8.4522e-01, -6.9356e+00, -6.4093e+00, ..., -1.2779e+00, -2.1456e+00, -3.6988e+00]], [[ 1.3119e+00, -4.1685e+00, -4.2038e+00, ..., -3.5086e+00, -3.1830e+00, -2.3003e+00]], [[-4.1418e+00, -3.1050e+01, -3.6698e+01, ..., 3.8736e-01, 1.2294e+01, 4.9591e+00]]], [[[-2.9920e+00, -1.3707e+01, -1.4690e+01, ..., -4.5803e+00, 7.8516e-01, -2.7641e+00]], [[-2.4811e+00, -1.0165e+01, -1.0894e+01, ..., -2.0982e+00, -4.3399e+00, -4.0274e+00]], [[ 3.6210e-01, -4.0197e+00, -5.3870e+00, ..., -2.2682e+00, -2.9503e+00, -3.4566e+00]], ..., [[-9.4336e-01, -7.5399e+00, -7.4029e+00, ..., -2.1544e+00, -5.6631e-01, -2.7160e+00]], [[ 1.7730e+00, -2.4984e+00, -3.2806e+00, ..., -3.7177e+00, -4.0784e+00, -2.9986e+00]], [[-3.3456e+00, -4.3221e+01, -5.3444e+01, ..., -5.1257e+00, 1.1378e+01, 5.8594e+00]]], [[[-3.2647e+00, -1.5557e+01, -1.5584e+01, ..., -2.0492e+00, -4.8225e+00, -4.1093e+00]], [[-2.8514e+00, -1.2193e+01, -1.1867e+01, ..., -3.2445e+00, -1.7209e+00, -4.2284e+00]], [[-1.2371e-01, -4.5661e+00, -4.9467e+00, ..., -3.4236e+00, -4.5674e+00, -3.5348e+00]], ..., [[-1.2555e+00, -7.5640e+00, -8.3342e+00, ..., -2.0883e+00, -2.9613e+00, -3.6466e+00]], [[ 1.4373e+00, -4.8608e+00, -3.6233e+00, ..., -2.1847e+00, -2.6646e+00, -1.0534e+00]], [[-4.2265e+00, -5.5827e+01, -5.6197e+01, ..., 1.3448e+01, 2.6525e+01, 1.1955e+01]]]]) attn_weights tensor([[[[ 2.2216, -6.1818, -5.5648, ..., -4.9428, -3.2651, -2.0373]], [[ 4.2310, -11.5983, -8.0570, ..., -10.2759, -7.4948, -3.3431]], [[ 0.8304, -5.6477, -6.7655, ..., -4.6066, -1.7027, -3.4616]], ..., [[ 1.0587, -4.3176, -4.4492, ..., -4.9508, -3.2979, -3.4439]], [[ 1.7592, -1.5961, -3.3251, ..., -3.6344, -1.2145, -2.1024]], [[ 0.9932, -3.6385, -3.6682, ..., -2.7613, -1.6940, 0.1077]]], [[[ 2.3583, -5.2989, -6.4304, ..., -2.7685, -4.0698, -2.7025]], [[ 5.0977, -13.0889, -12.9735, ..., -5.2173, -5.7924, -1.7479]], [[ 0.9898, -5.5360, -7.0344, ..., -1.5841, -1.4000, -3.1780]], ..., [[ 1.1203, -4.2111, -3.7809, ..., -3.3832, -3.5579, -4.7002]], [[ 2.0574, -2.4786, -2.8201, ..., -0.7981, -0.3365, -0.9212]], [[ 1.0093, -5.3784, -4.4423, ..., -2.2867, -2.0747, -2.3912]]], [[[ 2.0293, -8.1103, -5.6376, ..., -4.4926, -2.1910, -2.3644]], [[ 4.2001, -15.4920, -12.0366, ..., -8.5444, -6.0662, -3.7497]], [[ 0.6202, -4.5259, -6.8555, ..., -0.8405, -0.0944, -3.3921]], ..., [[ 1.1315, -3.5444, -4.4936, ..., -5.1328, -3.5930, -2.7812]], [[ 2.9907, 0.5801, -0.6715, ..., -1.0535, -0.9052, 2.7797]], [[ 0.7300, -4.2135, -4.3980, ..., -2.4055, -1.9747, -1.7578]]], [[[ 2.6580, -3.0645, -3.2752, ..., -3.6966, -2.5250, -2.3219]], [[ 3.6969, -5.9122, -4.8114, ..., -8.4216, -5.0984, -0.8413]], [[ 0.7238, -6.2989, -6.8203, ..., -1.8689, -1.0711, -3.4650]], ..., [[ 1.1128, -3.1794, -3.1733, ..., -3.4339, -3.6168, -5.9463]], [[ 2.1327, 0.8796, -2.5183, ..., -3.5700, -1.2049, 0.7251]], [[ 0.9693, -1.5728, -1.9431, ..., -2.1697, -2.3290, -0.3507]]], [[[ 2.4887, -6.8173, -6.6335, ..., -3.9985, -2.4551, -1.9670]], [[ 4.4762, -17.0356, -12.7114, ..., -10.6503, -5.9524, -1.9343]], [[ 0.5643, -7.6955, -8.5816, ..., 0.9738, 0.3653, -2.8510]], ..., [[ 1.0159, -4.4479, -6.3530, ..., -3.1458, -2.6302, -3.3252]], [[ 2.1654, -2.9469, -3.7106, ..., 0.5441, 1.1525, 0.3135]], [[ 1.0422, -4.9947, -5.9688, ..., -2.5343, -1.6891, -0.4442]]]]) attn_weights tensor([[[[ -0.7248, -5.9962, -7.2689, ..., -3.3592, -2.7550, -4.1218]], [[ 1.0724, -7.7386, -8.0867, ..., -5.5132, -4.0976, -4.5088]], [[ 0.4865, -3.1099, -3.8680, ..., -2.1826, -2.1090, -2.7696]], ..., [[ 3.7776, -7.0010, -3.6122, ..., -6.1235, -2.5743, -2.3449]], [[ 2.8873, -3.7225, -3.8439, ..., -3.0706, -2.0453, -1.9604]], [[ -0.8760, -6.3606, -7.5021, ..., -1.1407, -0.5714, -2.9551]]], [[[ -0.3449, -6.1459, -5.7838, ..., -2.1205, -2.3236, -2.9996]], [[ 0.5566, -5.9570, -6.9696, ..., -5.8119, -6.1092, -3.7586]], [[ 0.3686, -3.6276, -3.9111, ..., -3.1807, -3.1328, -3.1196]], ..., [[ 4.6794, -7.7544, -8.2746, ..., -1.8807, -4.3199, -0.3619]], [[ 3.0095, -4.9173, -5.0065, ..., -3.6076, -2.6315, -1.4815]], [[ -0.2524, -6.2476, -7.1885, ..., -1.3087, -1.2366, -1.8222]]], [[[ -1.0780, -6.1306, -6.5131, ..., -1.1428, -1.1601, -2.8359]], [[ 0.8447, -6.4708, -6.2343, ..., -4.5123, -1.9394, -3.3853]], [[ 0.2709, -3.3654, -3.2035, ..., -2.9241, -3.7265, -3.4572]], ..., [[ 4.6220, -12.0811, -5.7521, ..., -6.1966, -4.1452, -2.0428]], [[ 2.8447, -3.9931, -3.7385, ..., -1.8728, -2.6997, -2.0322]], [[ -0.7555, -5.2766, -6.3298, ..., -0.7215, -0.5431, -2.7492]]], [[[ -0.0328, -5.7657, -7.8947, ..., -3.2092, -3.2189, -3.0280]], [[ 1.0494, -4.2560, -7.3333, ..., -4.4336, -1.1971, -6.1352]], [[ 0.5366, -3.8607, -3.4430, ..., -4.3767, -3.6937, -4.3790]], ..., [[ 4.1995, -5.2150, -1.8680, ..., -7.3016, -4.3785, -3.5332]], [[ 3.0568, -2.2486, -1.8286, ..., -1.8854, -1.7900, -3.4934]], [[ -0.1629, -6.5202, -6.7347, ..., -1.2413, -0.2264, -2.2578]]], [[[ -1.4270, -8.4358, -7.7067, ..., 0.5893, -0.5468, -1.6242]], [[ 1.1031, -8.8614, -7.7578, ..., -2.4689, -1.4877, -2.8954]], [[ 0.4775, -4.4696, -5.0849, ..., -2.6794, -3.8489, -3.5642]], ..., [[ 4.2693, -11.5321, -7.4412, ..., -5.2562, -0.5006, -1.2279]], [[ 3.0859, -4.6975, -5.4777, ..., -2.2525, -0.3489, -0.7156]], [[ -1.0857, -7.2430, -7.1670, ..., -0.8153, -1.3147, -1.6755]]]]) attn_weights tensor([[[[ -0.2748, -8.9274, -9.8744, ..., -3.0828, -0.5250, -3.5713]], [[ 3.0087, -2.9507, -1.8707, ..., -5.6764, -3.5083, -2.0151]], [[ 6.4200, -3.7267, -2.6060, ..., -4.4689, -2.8373, -1.6661]], ..., [[ 0.3735, -5.3282, -5.3311, ..., -2.9924, -1.3534, -3.0636]], [[ 3.7700, -3.5242, -3.1435, ..., -6.8946, -1.9872, -2.4803]], [[ 3.2847, -4.7655, -4.5738, ..., -3.4831, -2.4180, -2.3787]]], [[[ -0.7615, -10.2482, -10.2658, ..., -4.2976, -2.3429, -4.3600]], [[ 3.0031, -4.3790, -4.3199, ..., -1.4241, -1.7119, -1.9899]], [[ 7.2590, -4.0395, -5.0240, ..., -1.2747, -0.4155, 3.5052]], ..., [[ 0.2478, -3.2420, -4.1170, ..., -1.1054, -2.1508, -1.6493]], [[ 4.4752, -2.8068, -3.5864, ..., 1.1269, -1.2096, 1.3238]], [[ 3.0324, -2.3306, -3.7815, ..., -3.0557, -2.7465, -0.9790]]], [[[ -0.7905, -7.5572, -9.7013, ..., -1.9007, -1.3883, -4.4667]], [[ 4.1068, -3.3629, -3.0245, ..., -1.4609, -1.3352, -0.4353]], [[ 6.1309, -6.4912, -6.1179, ..., -1.8993, -1.7794, -0.3506]], ..., [[ -0.3128, -3.3560, -3.9289, ..., -1.5804, -1.8141, -2.2228]], [[ 4.3718, -6.7318, -4.0889, ..., -1.9007, -3.0350, -2.1943]], [[ 2.7661, -3.0364, -4.7161, ..., -2.6106, -2.5668, -2.8925]]], [[[ -0.2135, -9.7210, -10.0215, ..., -2.6998, -1.9687, -3.5454]], [[ 4.5348, 0.2791, -1.3792, ..., -2.9397, -2.1204, -0.2635]], [[ 6.9189, -3.1768, -4.3860, ..., -5.0341, -1.7594, -3.3739]], ..., [[ 0.2439, -4.6765, -4.8480, ..., -1.2226, -0.4670, -3.1857]], [[ 5.1266, -3.0217, -1.9635, ..., -4.8656, -4.6908, -2.1683]], [[ 3.1220, -2.0970, -3.6171, ..., -2.1668, -2.6438, -5.2363]]], [[[ -1.0562, -11.2897, -11.0698, ..., -0.9283, -2.0356, -2.4563]], [[ 3.7884, -3.6202, -5.9355, ..., -3.8047, -0.9972, -1.2933]], [[ 6.2934, -7.0462, -5.3433, ..., -1.2431, 1.4059, 0.9000]], ..., [[ 0.0393, -6.0789, -6.2128, ..., -1.1119, -2.7367, -3.0816]], [[ 4.5725, -4.8063, -4.5282, ..., 0.5579, 1.4581, 0.1840]], [[ 3.0155, -4.0272, -5.2246, ..., -2.4910, 0.0150, -0.8288]]]]) attn_weights tensor([[[[ 0.9175, -3.2050, -2.8966, ..., -2.0532, -1.4671, -1.4707]], [[ 4.7115, -2.1962, -3.8531, ..., -3.0446, -0.1494, -1.4111]], [[ 1.3143, -0.8526, -2.1935, ..., -0.7369, -0.7676, -1.8994]], ..., [[ 0.8306, -5.2418, -3.5943, ..., -3.7070, -2.5802, -1.6501]], [[ 1.0317, -4.6311, -4.0967, ..., -3.5725, -2.1978, -1.3578]], [[ 0.6413, -4.1854, -4.4932, ..., -4.5754, -3.8495, -3.4928]]], [[[ 1.2748, -4.0037, -4.4161, ..., -2.1220, -3.0077, -2.4377]], [[ 5.6940, -2.0337, -2.7670, ..., 1.1583, -0.3301, 2.4470]], [[ 1.8129, -2.3888, -2.8359, ..., -0.8883, -0.6286, 0.3450]], ..., [[ 1.3298, -5.1313, -5.0400, ..., -2.3655, -2.8831, -2.3011]], [[ 1.1955, -4.7806, -4.1613, ..., -0.3897, -0.4320, -0.3389]], [[ 0.9420, -2.9530, -3.4041, ..., -3.0766, -3.1783, -2.1513]]], [[[ 1.4132, -3.2562, -3.9786, ..., -2.2745, -2.9835, -2.0502]], [[ 4.0537, -3.2505, -1.7853, ..., -0.8551, -1.2745, 0.1462]], [[ 1.9514, -0.3180, -1.1980, ..., -0.6073, -1.4515, -2.0512]], ..., [[ 1.3274, -4.6643, -4.4519, ..., -0.8492, -1.3995, -0.0931]], [[ 1.0257, -3.7988, -4.0468, ..., -1.0863, -1.4178, -0.3330]], [[ 1.2567, -2.8813, -4.1642, ..., -3.4453, -3.7854, -2.3064]]], [[[ 2.0333, -2.2226, -3.0823, ..., -2.5227, -1.8639, -1.6458]], [[ 5.9096, 0.9488, -2.1673, ..., -0.4066, -1.4071, -0.7703]], [[ 2.4281, -1.2554, -2.1905, ..., -1.0087, -1.7555, -2.6178]], ..., [[ 1.4300, -2.9446, -2.8452, ..., -1.3324, -1.0116, -2.1189]], [[ 1.6027, -2.3007, -2.7662, ..., -0.9095, -0.9794, -0.8988]], [[ 1.3298, -4.3486, -4.9433, ..., -3.7941, -4.0634, -3.4977]]], [[[ 0.9892, -4.0092, -4.2725, ..., -1.5233, -3.3392, -1.0684]], [[ 5.5738, -3.4783, -3.3043, ..., -0.0734, 2.2661, 1.8176]], [[ 1.6758, -2.2689, -3.1435, ..., -1.8458, -1.2834, -1.3454]], ..., [[ 1.7124, -4.5954, -4.4347, ..., -1.9275, -2.7299, -1.8560]], [[ 1.0314, -4.8269, -5.2958, ..., -1.5049, -1.0427, -0.7470]], [[ 0.7430, -3.1584, -4.1648, ..., -3.0129, -2.7591, -2.7180]]]]) attn_weights tensor([[[[ 1.8397, -3.3107, -3.4712, ..., -3.7572, -1.9863, -3.0428]], [[ 3.9492, -2.8144, -3.4828, ..., -3.4011, -0.6855, -0.5487]], [[ 1.6337, -4.2994, -3.6894, ..., -3.7770, -2.0299, -1.8250]], ..., [[ 3.8994, -3.2215, -2.8467, ..., -4.1915, -2.4258, -1.4347]], [[ 1.5871, -6.6562, -6.4177, ..., -2.6220, -0.9457, -1.6415]], [[ 3.5253, -0.3027, -2.3826, ..., -2.3294, -1.8169, -1.4184]]], [[[ 2.4304, -4.3892, -4.5327, ..., -0.6927, -1.3006, -2.3140]], [[ 4.5903, -1.1315, -1.3018, ..., -0.8202, -1.7234, 0.2851]], [[ 2.9180, -4.4095, -4.1233, ..., -2.5943, -2.6659, -1.7753]], ..., [[ 5.4245, -1.6018, -2.3114, ..., -0.8832, -1.1862, 1.3075]], [[ 1.8146, -7.2276, -7.6407, ..., -2.3317, -2.1815, -2.0247]], [[ 3.8776, -0.9560, -2.5053, ..., -2.4413, -1.4243, -0.2733]]], [[[ 2.6852, -3.8964, -5.6779, ..., -2.4857, -3.5597, -1.5790]], [[ 3.8834, -1.8911, -3.1110, ..., -0.7064, -0.4183, -2.2680]], [[ 2.6656, -3.3540, -4.1216, ..., -1.3405, -2.5140, -1.3527]], ..., [[ 4.3548, -2.7465, -3.3841, ..., -1.3012, -2.5514, -0.1784]], [[-0.1811, -6.5108, -6.5866, ..., 1.5795, 0.6883, -1.5748]], [[ 3.7079, -0.9486, -2.6535, ..., -1.1417, -1.8348, -3.3636]]], [[[ 3.5969, -2.1727, -4.1595, ..., -2.8661, -0.0474, 0.5022]], [[ 4.6230, -0.0201, -2.3892, ..., -1.2821, -2.0432, 1.7119]], [[ 3.8071, -2.6021, -2.7539, ..., -2.7029, -1.1788, -1.5076]], ..., [[ 4.7613, -1.2755, -3.8241, ..., -2.9456, -1.9839, 0.7882]], [[ 1.8875, -5.1714, -5.3114, ..., 0.5904, 4.0376, 0.4670]], [[ 3.0957, -0.6010, -2.4315, ..., -2.0169, -2.4473, -2.0883]]], [[[ 1.7745, -4.0091, -4.4462, ..., -1.7569, -0.2677, -1.3578]], [[ 3.7419, -2.4147, -3.4882, ..., 0.0383, 0.4765, 1.1230]], [[ 1.8646, -2.6919, -2.8992, ..., -2.6606, -0.3950, -1.7945]], ..., [[ 4.2133, -2.4269, -2.0995, ..., 0.1205, 1.3043, 1.3481]], [[ 1.0668, -6.5877, -6.5541, ..., -0.1865, -1.3297, -1.6314]], [[ 3.6748, -1.6112, -3.6180, ..., -1.4060, 0.4860, -1.1219]]]]) attn_weights tensor([[[[ 2.7269, -3.7511, -4.2345, ..., -4.3183, -2.9589, -2.8344]], [[ 3.8435, -2.8820, -3.5211, ..., -2.9102, -0.7868, -0.3437]], [[ 3.0623, -2.6175, -3.3078, ..., -3.4971, -1.8973, -1.2123]], ..., [[ 1.7798, -5.1633, -6.5335, ..., -3.9035, -0.8467, -1.5115]], [[ 3.4929, -3.2500, -2.8605, ..., -4.2547, -2.4610, -1.5795]], [[ 3.9335, -0.6161, -1.4586, ..., -0.4510, 4.1950, 2.4099]]], [[[ 3.4876, -3.8159, -3.6525, ..., -2.9774, -2.7954, -1.1705]], [[ 4.8147, -1.3295, -2.7369, ..., -2.2393, -1.4508, 0.5613]], [[ 3.4326, -2.0992, -2.4156, ..., -2.3950, -1.7535, 0.6086]], ..., [[ 0.5648, -7.7904, -6.4615, ..., -2.4392, -2.2714, -0.4087]], [[ 4.2776, -2.9352, -2.8724, ..., -3.8537, -3.7333, -1.7821]], [[ 4.8959, -3.2491, -1.1189, ..., 1.5938, 1.9230, 2.3288]]], [[[ 3.5221, -3.6983, -4.5853, ..., -3.2333, -4.2493, -1.2951]], [[ 4.1914, -2.0554, -3.9085, ..., 0.0938, -1.3787, -0.9203]], [[ 3.0082, 1.0806, -1.4348, ..., -0.5793, -1.8345, -1.1850]], ..., [[ 0.0230, -5.4682, -6.0225, ..., -0.3767, -0.4241, 0.1197]], [[ 3.3915, -2.4242, -2.3124, ..., -2.0478, -2.8597, -1.6833]], [[ 5.2797, -1.8357, -1.5073, ..., 1.4685, 1.0875, -0.1555]]], [[[ 3.8673, -4.4315, -4.3371, ..., -3.7413, -0.5140, -3.0698]], [[ 5.1145, -1.4678, -3.7241, ..., -1.0318, 0.1749, 0.2534]], [[ 3.2151, -0.5085, -1.6824, ..., -2.5738, -2.3231, -1.0829]], ..., [[ 1.5758, -5.5848, -7.2748, ..., -2.3614, 1.2017, -0.3154]], [[ 3.4932, -2.5196, -1.8923, ..., -2.7435, -1.8797, -3.0563]], [[ 6.6253, 0.1053, 0.8836, ..., 1.3875, 4.8563, 3.5792]]], [[[ 2.8047, -3.5364, -4.3048, ..., -3.3526, -1.1126, -2.3613]], [[ 4.3353, -2.9557, -4.2937, ..., -1.1252, 1.0094, 0.1501]], [[ 3.6959, -2.2973, -3.0444, ..., -0.6574, 0.8929, 2.5568]], ..., [[ 1.0440, -6.6192, -5.1214, ..., -1.0957, -2.3385, -1.4076]], [[ 3.6287, -2.4820, -3.4166, ..., -1.2471, -0.6475, -0.5617]], [[ 4.4755, -2.1562, -2.7390, ..., 2.3310, 1.1412, 2.6324]]]]) attn_weights tensor([[[[ 1.8653, 0.6763, -0.0887, ..., -0.4335, 0.8626, 1.5406]], [[ 3.4342, -1.3868, -2.2148, ..., -2.6884, 0.8468, 0.0082]], [[ 3.0719, -0.8857, -2.3058, ..., -3.4837, -0.2544, -0.1996]], ..., [[ 3.8964, -2.1218, -3.4217, ..., -3.5797, -0.9763, -1.4017]], [[ 2.9241, -0.5559, -1.2290, ..., -1.1493, 1.9690, 0.8876]], [[ 3.5074, -0.7497, -1.4089, ..., -1.6024, 1.6052, 0.8668]]], [[[ 1.3230, 0.6741, -0.6045, ..., 0.0701, 0.1500, 0.7435]], [[ 3.5305, -1.2435, -1.0296, ..., -0.6703, -0.7981, 0.0992]], [[ 3.6098, -0.4549, -1.5350, ..., -2.8858, -1.5756, -0.9273]], ..., [[ 4.5792, -1.0074, -1.5207, ..., -2.1229, -1.7352, 0.9126]], [[ 3.2355, -0.3172, -1.0627, ..., -1.1892, -0.6458, 1.0687]], [[ 2.5999, 2.1614, 0.0236, ..., -1.2008, -0.1022, 0.9345]]], [[[ 1.3265, 2.0267, 0.5553, ..., 1.9180, 1.0124, 0.9636]], [[ 3.9556, -0.7827, -0.5955, ..., 1.2328, 0.1789, -0.6893]], [[ 3.9412, 0.4045, -1.7278, ..., -1.0025, -2.8376, -1.0206]], ..., [[ 4.7264, -0.8288, -3.0111, ..., 0.7503, 0.2683, -0.5899]], [[ 3.1974, 0.2236, -1.2571, ..., 0.8662, -0.0903, -0.1584]], [[ 3.7300, 1.7669, -0.0920, ..., 1.3343, 1.4308, 0.5187]]], [[[ 1.1020, 0.1962, -0.3645, ..., 0.6957, -1.1495, -0.5294]], [[ 3.3961, 0.1744, 0.2392, ..., -0.2742, 0.2561, 1.2253]], [[ 3.2444, -0.4071, -1.8982, ..., -2.3995, -1.0971, -2.0823]], ..., [[ 4.2960, -0.7501, -2.0733, ..., -0.9966, 0.0579, 0.9465]], [[ 3.1627, -0.0855, -0.1228, ..., -0.5812, 3.2915, 2.7258]], [[ 2.6853, 0.1374, 0.1772, ..., 1.2126, 5.7038, 2.9768]]], [[[ 1.9260, -0.9599, -2.3319, ..., -0.2070, 0.1439, 0.9099]], [[ 3.7958, -0.7828, -1.8493, ..., 0.4737, -0.3920, 0.8950]], [[ 3.0077, -1.5697, -1.9372, ..., -0.3192, -0.7946, -0.2494]], ..., [[ 4.0857, -1.5503, -2.7814, ..., -1.2993, -0.0131, -0.3620]], [[ 2.2386, -2.1407, -2.2007, ..., 1.0343, 1.9513, 1.4435]], [[ 3.2190, -2.4937, -2.0075, ..., 1.0717, 0.9925, 1.8193]]]]) attn_weights tensor([[[[-1.3060, -3.3522, -3.0030, ..., -2.7568, -2.1061, -3.0071]], [[ 3.1453, -0.2236, 1.6908, ..., 0.4558, -1.1177, 7.7745]], [[-1.5517, -2.7311, -2.3043, ..., -2.4215, -2.5561, -2.6478]], ..., [[-2.4831, -2.9406, -3.0281, ..., -2.4685, -2.6569, -4.1462]], [[-0.1644, -0.8901, -0.8498, ..., -0.6494, -0.4860, 1.3618]], [[-1.2528, -2.1092, -3.4271, ..., -2.2801, -2.7694, -2.9697]]], [[[-1.6790, -3.9627, -2.7735, ..., -2.1628, -2.4624, -3.7856]], [[-2.5384, -0.7623, -3.7695, ..., -3.0233, -3.4887, 4.4569]], [[-2.4347, -2.9699, -3.3081, ..., -2.4523, -2.9294, -1.4913]], ..., [[-2.0711, -2.4664, -2.4898, ..., -1.9467, -2.3931, -1.7013]], [[-0.8331, -1.0290, -1.0267, ..., -0.2177, -0.7121, 0.1602]], [[-1.4751, -2.3053, -3.5170, ..., -2.5491, -2.5731, -2.4355]]], [[[-1.7337, -3.7316, -2.5896, ..., -1.9359, -1.2920, -3.6423]], [[-1.3445, 0.6588, -3.0212, ..., -2.9358, -5.6594, 7.2751]], [[-2.0387, -2.8670, -2.7559, ..., -2.9463, -3.0502, -1.7849]], ..., [[-2.1798, -2.6116, -2.6360, ..., -2.3129, -2.5161, -1.9685]], [[-0.9510, -1.1679, -1.4214, ..., -0.8249, -1.5976, 0.7059]], [[-1.5477, -2.2610, -3.6354, ..., -2.9334, -2.8978, -2.2107]]], [[[-1.7104, -4.1155, -2.5337, ..., -1.3590, -2.3378, -3.4431]], [[-2.1994, -0.1858, -2.4895, ..., -0.5488, -1.5378, 6.7535]], [[-2.0532, -2.8611, -3.2040, ..., -2.7130, -2.8007, -1.8587]], ..., [[-2.2338, -2.6748, -2.7109, ..., -2.3381, -2.0941, -1.9570]], [[-1.0224, -1.3390, -1.5672, ..., -0.8520, -0.8229, 0.4923]], [[-1.3751, -2.0950, -3.3793, ..., -2.5505, -3.2020, -2.3116]]], [[[-2.2875, -3.0999, -3.4253, ..., -2.3162, -2.6100, -2.2110]], [[ 0.3227, -0.8860, -1.3383, ..., -0.2676, -1.3775, 8.1910]], [[-1.5865, -2.6930, -2.2753, ..., -2.9787, -2.1190, -2.5972]], ..., [[-2.7073, -3.3571, -3.7077, ..., -3.1747, -2.9494, -4.7093]], [[-1.3550, -1.7454, -2.4442, ..., -1.2805, -1.0106, 0.8623]], [[-1.5152, -1.8859, -2.9539, ..., -2.5020, -3.1731, -1.6636]]]]) attn_weights tensor([[[[-1.1236e+00, -3.6404e+00, -4.5100e+00, ..., 4.3362e-01, 2.0834e+00, 8.6782e-01]], [[-9.9244e-01, -3.4134e+00, -3.5135e+00, ..., 1.1889e+00, 1.2943e+00, 3.6113e-01]], [[-4.0334e+00, -4.3922e+00, -4.4899e+00, ..., -2.4437e+00, -2.7622e+00, -2.3461e+00]], ..., [[ 1.2137e+00, -3.4745e-01, -1.3689e-01, ..., -6.1269e-01, 4.8285e-01, -2.3172e-01]], [[-3.8450e+00, -2.4311e+00, -2.3612e+00, ..., -2.3351e-01, -6.1239e-01, -3.1405e-01]], [[-4.3038e+00, -3.7210e+00, -8.1881e+00, ..., -6.0124e+00, -5.2299e+00, 1.1449e+00]]], [[[-1.6266e+00, -5.0944e+00, -4.7431e+00, ..., 1.2536e+00, 1.7280e+00, -7.7481e-02]], [[-5.7589e-01, -2.4374e+00, -2.7790e+00, ..., 1.7279e+00, 1.3434e+00, 1.3807e+00]], [[-4.4086e+00, -4.5971e+00, -4.8201e+00, ..., -2.4607e+00, -2.4895e+00, -2.3143e+00]], ..., [[ 1.2603e+00, -7.1948e-01, 3.8886e-01, ..., -1.7283e-01, -9.7600e-01, -9.0901e-01]], [[-3.6120e+00, -2.7832e+00, -2.7126e+00, ..., -3.1923e-01, -3.7876e-01, -3.8166e-01]], [[ 2.2989e-01, -5.8300e-01, -3.2325e+00, ..., -1.8366e+00, -3.0831e+00, 2.7754e+00]]], [[[-1.4757e+00, -4.0049e+00, -4.5334e+00, ..., 8.5056e-01, 9.4509e-01, 3.5772e-01]], [[-6.9729e-01, -2.8160e+00, -3.2214e+00, ..., 4.0605e-01, 6.8561e-01, 8.4789e-01]], [[-4.3101e+00, -4.5663e+00, -4.7185e+00, ..., -2.7311e+00, -2.1129e+00, -2.2729e+00]], ..., [[ 1.2453e+00, -7.6570e-01, 1.0198e-01, ..., -1.8213e-01, -4.3317e-01, -7.1063e-01]], [[-3.5964e+00, -2.7758e+00, -2.6732e+00, ..., -5.9309e-01, -2.2350e-01, -2.8779e-01]], [[ 2.0363e-01, -5.0406e-01, -4.5264e+00, ..., -4.1126e+00, -3.7521e+00, 3.2778e+00]]], [[[-2.1789e+00, -4.6941e+00, -5.6957e+00, ..., 2.2193e+00, 1.6301e+00, -3.6832e-02]], [[-7.8871e-01, -2.5759e+00, -3.2060e+00, ..., 8.9520e-01, 1.7984e+00, 1.3734e+00]], [[-4.3934e+00, -4.5410e+00, -4.7804e+00, ..., -2.3020e+00, -2.4629e+00, -2.1671e+00]], ..., [[ 1.4002e+00, -7.1253e-01, 1.9091e-01, ..., -1.3323e+00, 1.7267e-01, -1.0020e-01]], [[-3.7026e+00, -2.7477e+00, -2.6672e+00, ..., -4.5469e-01, -3.4065e-01, -2.1801e-01]], [[ 8.3784e-01, 4.5295e-01, -3.0674e+00, ..., -2.1726e+00, -1.7720e+00, 4.1315e+00]]], [[[-1.0520e+00, -2.9065e+00, -3.9952e+00, ..., 1.7046e+00, 1.9065e+00, 7.8292e-01]], [[-1.7580e+00, -3.8248e+00, -4.4884e+00, ..., 1.9307e-01, 9.0781e-01, -4.1063e-03]], [[-4.0159e+00, -4.1635e+00, -4.3624e+00, ..., -2.3561e+00, -2.5776e+00, -2.0178e+00]], ..., [[ 1.1481e+00, -4.7944e-01, 1.4510e-01, ..., -8.3947e-01, -1.0480e+00, -9.5096e-01]], [[-3.7799e+00, -2.3617e+00, -2.3729e+00, ..., -3.3382e-01, -7.4500e-01, -1.5563e-01]], [[ 9.5752e-01, -2.1685e-02, -3.4321e+00, ..., -1.0159e+00, 9.9923e-01, 4.6265e+00]]]]) attn_weights tensor([[[[ -1.1780, -5.9351, -5.8537, ..., -0.6198, -2.4858, -2.4527]], [[ 0.8598, -2.1327, -3.1938, ..., -2.3637, -2.8313, -1.5135]], [[ -4.3335, -16.8294, -19.7539, ..., -2.9500, -1.6085, -3.1622]], ..., [[ -3.1516, -9.7659, -10.2739, ..., -1.9368, -1.9839, -1.2024]], [[ -2.6240, -4.0544, -4.0518, ..., -0.8264, -1.1694, -0.4301]], [[ -0.1529, -5.9303, -5.8557, ..., -2.5239, -2.4374, -2.0998]]], [[[ -1.7986, -6.5526, -6.1724, ..., -2.6649, -1.3961, -0.4133]], [[ 1.7240, -1.8680, -1.3764, ..., -0.8394, -0.4943, -0.8948]], [[ -5.5360, -21.3825, -21.7154, ..., -2.9136, -1.2244, -3.6692]], ..., [[ -4.0775, -11.8616, -12.1537, ..., -3.8736, -1.3053, -3.8896]], [[ -2.5824, -4.4151, -4.3875, ..., -0.8244, -0.4979, -0.5580]], [[ -0.2597, -6.3567, -6.2967, ..., -2.5860, -2.3471, -2.2038]]], [[[ -1.4795, -5.9369, -6.4400, ..., -1.2016, -2.4822, -0.3356]], [[ 1.5079, -1.2629, -1.9553, ..., -1.9230, -1.2839, -1.3824]], [[ -3.8755, -18.9421, -20.7510, ..., -2.3757, -2.2012, -3.3569]], ..., [[ -3.4815, -11.2283, -11.7456, ..., -2.2200, -0.8420, -3.3091]], [[ -2.5515, -4.3947, -4.3341, ..., -1.2165, -0.4947, -0.7762]], [[ -0.2238, -5.9330, -6.0930, ..., -2.5915, -2.0821, -2.2792]]], [[[ -1.7922, -5.9734, -6.8648, ..., -1.2981, -1.3362, -0.8505]], [[ 1.9877, -0.8153, -2.8138, ..., -2.1774, -2.6760, -1.0800]], [[ -5.0057, -20.6598, -22.6165, ..., -3.4047, -2.9675, -4.4584]], ..., [[ -3.8286, -11.5913, -12.0998, ..., -1.1893, -1.1329, -3.3939]], [[ -2.4614, -4.3785, -4.2802, ..., -0.4761, -0.5596, -0.4942]], [[ -0.2743, -6.2884, -6.4329, ..., -2.4324, -2.2921, -2.2648]]], [[[ -1.2655, -5.3420, -5.6114, ..., -1.8986, -0.3039, -2.2239]], [[ 2.3488, -2.6623, -3.7207, ..., -2.0245, -0.1683, -1.9690]], [[ -3.0964, -15.9282, -18.7410, ..., -3.1341, -1.1186, -1.8875]], ..., [[ -3.5502, -10.3240, -10.9214, ..., -1.0382, -2.2063, -1.6591]], [[ -2.5473, -4.0013, -3.9281, ..., -0.8546, -1.3694, -0.2091]], [[ -0.0556, -5.6281, -5.6778, ..., -2.5189, -2.7968, -2.0972]]]]) attn_weights tensor([[[[ 4.6905, 0.3909, -1.8264, ..., -2.9500, 0.0787, 2.5969]], [[ -2.3051, -9.2672, -9.3109, ..., -3.5576, -2.9145, -5.4962]], [[ -3.6740, -17.5779, -20.2650, ..., -4.6892, -2.0214, -5.1081]], ..., [[ -1.5009, -9.1715, -10.0320, ..., -3.5117, -2.4859, -2.3036]], [[ -0.8371, -7.8966, -9.5072, ..., -3.2345, -2.8890, -1.8200]], [[ -2.1191, -11.2445, -12.5382, ..., -2.7141, -4.2274, -3.6420]]], [[[ 4.4645, -1.2253, -2.0864, ..., -1.4801, -2.4106, -0.8692]], [[ -2.6512, -10.2277, -10.2161, ..., -4.3033, -4.2433, -4.1382]], [[ -4.9059, -17.0766, -19.0756, ..., -4.3203, -3.2025, -5.1517]], ..., [[ -2.0187, -10.5982, -11.4107, ..., -1.5964, -0.3780, -2.7965]], [[ -1.1281, -7.8115, -7.9995, ..., -5.1257, -3.2891, -2.0902]], [[ -2.6869, -10.8947, -13.4401, ..., -3.8348, -1.4326, -3.3481]]], [[[ 4.9997, -0.3509, -2.5192, ..., -2.0421, -2.5214, 3.0166]], [[ -2.7358, -8.6595, -8.7201, ..., -4.7601, -5.4013, -3.9337]], [[ -4.4778, -17.2676, -18.1439, ..., -4.7070, -4.6891, -5.3313]], ..., [[ -2.4962, -8.6182, -10.6903, ..., -4.4310, -3.8304, -4.1732]], [[ -1.0292, -8.1548, -8.3762, ..., -3.4985, -3.3296, -2.1070]], [[ -2.8099, -10.3214, -12.8268, ..., -3.0102, -3.1178, -4.3145]]], [[[ 5.1985, -2.2789, -2.9004, ..., -4.5468, -2.6214, 1.4027]], [[ -2.6054, -10.7779, -11.3896, ..., -5.0881, -3.5359, -6.0244]], [[ -5.4600, -19.0006, -19.5136, ..., -3.7347, -2.2322, -6.8596]], ..., [[ -2.4066, -10.4880, -11.7754, ..., -0.2560, -3.7584, -4.7240]], [[ -1.0619, -8.9828, -8.3823, ..., -4.0535, -2.6770, -2.3418]], [[ -3.0152, -11.7482, -13.9236, ..., -0.9979, -3.8946, -3.9488]]], [[[ 5.3350, 0.2441, -2.0048, ..., -2.5601, -1.7065, 3.8885]], [[ -2.5720, -8.5269, -8.9238, ..., -5.6400, -4.2585, -5.7692]], [[ -4.3203, -16.7794, -18.1223, ..., -4.4256, -0.5117, -3.7468]], ..., [[ -1.9604, -9.7964, -9.0642, ..., -2.8405, -2.7822, -3.5433]], [[ -0.9356, -8.4055, -8.7412, ..., -3.4419, -4.3175, -1.7412]], [[ -2.2876, -10.0860, -11.0650, ..., -2.2285, -2.7962, -3.0993]]]]) attn_weights tensor([[[[ -2.4309, -13.2672, -14.9767, ..., -0.7155, -2.3763, -4.4921]], [[ -2.1569, -10.9905, -11.0755, ..., -2.8292, -2.2557, -4.2978]], [[ -0.1083, -3.3117, -3.7068, ..., -2.1793, -2.0599, -3.9180]], ..., [[ -0.7372, -7.6821, -7.2127, ..., -2.1320, -1.3047, -4.3164]], [[ 1.3326, -4.0483, -4.4424, ..., -3.1295, -1.6543, -2.0928]], [[ -4.6956, -34.0625, -40.0765, ..., -1.2039, 17.2105, 4.2007]]], [[[ -1.8588, -14.4929, -14.4199, ..., -4.9826, -4.7088, -6.1753]], [[ -2.7672, -11.2876, -10.7408, ..., -2.1826, -2.0058, -3.4113]], [[ -0.0819, -3.9890, -4.0700, ..., -3.3517, -1.4399, -2.7473]], ..., [[ -0.9941, -8.1337, -8.4204, ..., -1.7411, -2.5547, -3.2357]], [[ 1.3832, -3.6807, -2.9250, ..., -3.2204, -3.5931, -2.8750]], [[ -7.2059, -45.2029, -54.7905, ..., -6.3012, 14.7494, 1.5187]]], [[[ -3.2586, -13.7413, -14.6027, ..., -4.7864, -6.1369, -3.9035]], [[ -2.5275, -10.8670, -11.4102, ..., -1.9857, -2.1394, -4.0326]], [[ 0.0683, -3.2003, -3.5388, ..., -4.1327, -5.0572, -3.8414]], ..., [[ -1.2685, -7.3097, -7.3368, ..., -3.6147, -3.9813, -3.4684]], [[ 1.3456, -3.4105, -3.3761, ..., -4.2105, -2.9412, -2.3868]], [[ -4.9073, -48.3193, -51.3364, ..., -5.6012, 14.0468, 5.6943]]], [[[ -3.0991, -15.4151, -15.3052, ..., -0.1517, -2.4037, -3.6248]], [[ -2.5843, -11.9491, -12.0275, ..., -4.5844, -3.7592, -6.1205]], [[ 0.3649, -4.6627, -5.0066, ..., -2.4459, -2.6964, -3.1535]], ..., [[ -1.3494, -8.6136, -7.3318, ..., -0.3623, -1.1312, -3.0011]], [[ 1.7640, -3.1563, -2.9424, ..., -6.1204, -3.2677, -3.5459]], [[ -3.5739, -41.0686, -43.0294, ..., 3.6627, 20.4447, 3.7507]]], [[[ -2.8279, -13.5937, -14.7610, ..., -2.9967, -1.6811, -4.2790]], [[ -2.6068, -11.0176, -10.8374, ..., -2.2192, -3.2754, -2.9844]], [[ 0.1965, -3.9290, -4.4061, ..., -4.7932, -2.7827, -3.2324]], ..., [[ -0.9198, -7.6012, -7.4169, ..., -2.5174, -2.4732, -3.4623]], [[ 1.4957, -4.9175, -4.6894, ..., -2.3581, -2.3140, -2.3678]], [[ -5.9061, -40.9769, -44.9840, ..., -0.0910, 15.1702, -0.8607]]]]) attn_weights tensor([[[[ 1.7561, -7.7784, -6.9027, ..., -4.7388, -3.5374, -1.9265]], [[ 3.7006, -12.9017, -10.0448, ..., -6.0042, -7.1219, -2.5727]], [[ 1.0956, -5.7779, -7.0231, ..., -1.8172, -1.3619, -2.7476]], ..., [[ 0.8506, -3.9758, -4.6863, ..., -3.5019, -2.9787, -1.6856]], [[ 2.7289, -0.1902, -2.5306, ..., -1.6232, -0.2281, 1.3278]], [[ 0.7660, -4.0665, -3.9291, ..., -3.1939, -1.6743, -1.8688]]], [[[ 2.1120, -7.8772, -7.5886, ..., -3.2076, -2.1830, -2.8124]], [[ 4.3037, -12.2439, -10.7106, ..., -7.1920, -5.0092, -2.3025]], [[ 0.9043, -5.6954, -7.2578, ..., -0.8281, -1.0934, -2.6684]], ..., [[ 0.9883, -3.9680, -3.7634, ..., -3.4549, -3.1431, -3.6507]], [[ 1.7835, -1.8893, -2.7204, ..., -1.8798, -0.7723, -1.4911]], [[ 1.1112, -4.6996, -4.4392, ..., -2.6460, -3.6991, -0.7175]]], [[[ 2.0425, -6.5611, -8.5879, ..., -3.0858, -1.8404, -3.2095]], [[ 4.6620, -14.9782, -12.1241, ..., -3.9516, -2.7040, -1.1182]], [[ 0.6384, -5.9930, -7.4544, ..., -0.0926, -0.6153, -1.6394]], ..., [[ 1.2462, -4.0236, -4.5606, ..., -3.8795, -2.0780, -3.1363]], [[ 2.0887, -1.7173, -1.9723, ..., -1.9661, 0.4722, -0.3215]], [[ 0.9711, -4.5993, -5.0818, ..., -1.5711, -1.8634, 0.0550]]], [[[ 2.9091, -6.7467, -5.6752, ..., -4.3485, -2.1805, -1.9946]], [[ 4.3708, -12.3135, -7.9560, ..., -7.6254, -3.0178, -1.2653]], [[ 1.0693, -7.9746, -7.7775, ..., -0.3170, -0.4969, -2.1938]], ..., [[ 1.4010, -3.3641, -4.4333, ..., -3.9824, -4.3398, -4.3567]], [[ 2.3530, -1.5321, -2.8822, ..., -0.5217, -2.0567, -1.3696]], [[ 1.1089, -3.0659, -4.3090, ..., -3.4061, -2.7793, 0.0952]]], [[[ 2.6164, -7.7592, -6.8114, ..., -3.5478, -1.2311, -0.6948]], [[ 3.9561, -17.6206, -14.4769, ..., -7.5235, -5.6193, -1.9761]], [[ 0.5335, -5.9576, -7.5971, ..., -0.2503, -0.3257, -2.5592]], ..., [[ 1.3559, -4.1384, -5.9266, ..., -3.1036, -2.5773, -3.7285]], [[ 2.7820, -2.1204, -3.0925, ..., 0.3818, -1.0969, 1.9055]], [[ 0.6968, -4.6856, -5.2423, ..., -0.6370, -0.4535, -0.3999]]]]) attn_weights tensor([[[[ -0.2426, -5.9680, -6.6300, ..., -0.9272, -0.2467, -2.4557]], [[ 1.6361, -7.1938, -7.0909, ..., -4.5230, -3.1116, -0.8980]], [[ 0.4189, -3.2561, -3.6366, ..., -2.0689, -2.1277, -3.2309]], ..., [[ 3.9832, -11.8125, -6.2930, ..., -3.1073, -3.2937, -1.0917]], [[ 2.9238, -4.0906, -3.7435, ..., -2.7034, -2.8087, -1.0162]], [[ -0.3830, -5.5992, -6.6163, ..., -1.1251, -0.8978, -2.0304]]], [[[ -0.9091, -5.4563, -5.4065, ..., -3.0754, -1.6283, -2.2862]], [[ 0.4603, -6.2457, -8.2292, ..., -5.4218, -4.4214, -4.6971]], [[ 0.3466, -3.8914, -4.4228, ..., -3.2690, -3.1663, -2.8120]], ..., [[ 4.0255, -7.3567, -6.8344, ..., -4.2668, -2.6269, -1.0644]], [[ 2.8816, -5.9189, -5.6447, ..., -2.6556, -1.5370, -1.9327]], [[ -0.5302, -6.5266, -7.6968, ..., -1.7812, -0.9412, -2.3664]]], [[[ -1.2627, -7.4946, -6.4350, ..., -2.6488, -1.7109, -2.9500]], [[ 0.6742, -6.4447, -8.0337, ..., -2.6167, -1.5411, -4.7866]], [[ 0.4340, -3.6459, -3.6285, ..., -4.6233, -4.2507, -3.8890]], ..., [[ 4.8412, -11.6976, -7.7301, ..., -2.0746, -0.6372, -1.2664]], [[ 2.8979, -3.8443, -4.6926, ..., -3.1718, -2.6156, -2.6961]], [[ -0.7026, -6.0256, -7.9106, ..., -1.7926, -2.9724, -3.2891]]], [[[ -0.0267, -6.5267, -7.1308, ..., -2.2249, -2.5412, -4.2105]], [[ 1.2930, -6.8206, -8.9304, ..., -2.8208, -4.5892, -4.2683]], [[ 0.5635, -4.3207, -4.1895, ..., -4.6293, -4.8317, -4.7025]], ..., [[ 4.8324, -12.6884, -6.8994, ..., -7.0394, -3.4287, 0.1368]], [[ 3.2488, -3.9153, -3.1612, ..., -2.2841, -3.8290, -2.7951]], [[ -0.1484, -7.0961, -6.8409, ..., -0.1615, -1.2750, -1.1406]]], [[[ -0.9891, -8.2419, -6.2069, ..., -0.5296, -0.0767, -1.8068]], [[ 1.4101, -8.5679, -7.8269, ..., -3.5593, -2.6476, -2.2046]], [[ 0.4963, -4.7188, -4.8502, ..., -3.7578, -3.1009, -2.3994]], ..., [[ 4.6031, -12.7993, -7.9197, ..., -2.7766, -4.3771, -1.0509]], [[ 3.2874, -4.4466, -5.2726, ..., -1.1869, -1.1595, -0.9519]], [[ -0.5624, -6.8985, -7.5542, ..., -2.2159, -1.3157, -2.2203]]]]) attn_weights tensor([[[[ -0.3016, -6.8359, -7.5839, ..., -1.3742, 0.1990, -3.2332]], [[ 3.9566, -3.7523, -2.7841, ..., -2.4439, -1.6806, 0.3717]], [[ 6.4130, -3.6588, -3.6252, ..., -3.7921, -2.6219, -0.5998]], ..., [[ 0.5190, -4.4333, -4.3000, ..., -1.0718, -1.2634, -1.9946]], [[ 4.5926, -6.2342, -4.0054, ..., -3.7862, -3.4267, -0.9551]], [[ 3.4523, -4.0322, -5.2505, ..., -3.3639, -3.1408, -2.3987]]], [[[ -0.3129, -10.3096, -11.0140, ..., -4.5721, -2.8659, -4.1968]], [[ 2.3485, -4.5039, -4.4937, ..., -2.0228, -2.7321, -1.4186]], [[ 6.5561, -4.7836, -4.2827, ..., -0.8769, 2.1709, 1.5841]], ..., [[ -0.0951, -4.5799, -5.0145, ..., -2.1702, -1.3546, -1.6660]], [[ 3.9391, -3.6897, -4.1174, ..., -1.0716, -0.2138, 0.2037]], [[ 3.0826, -4.5548, -4.3008, ..., -2.9384, -0.9677, -2.1795]]], [[[ -0.6628, -9.9901, -10.8609, ..., -4.0158, -3.1030, -4.7917]], [[ 3.5345, -2.0978, -2.7305, ..., -1.5010, -0.0690, -2.1499]], [[ 6.5393, -7.8084, -6.6642, ..., 0.2184, 0.1677, 0.7042]], ..., [[ -0.5986, -5.0266, -5.4810, ..., -2.5882, -1.7777, -3.1491]], [[ 4.9247, -6.2070, -4.1026, ..., -0.7904, -0.7775, -0.9254]], [[ 2.8144, -5.0177, -5.9638, ..., -2.4292, -3.2881, -4.3086]]], [[[ 0.2177, -11.2321, -10.2846, ..., -3.9876, -3.5330, -3.5017]], [[ 4.1650, -0.5693, -0.6729, ..., -1.4470, -0.9419, -1.4933]], [[ 7.1594, -5.6402, -3.9485, ..., -1.8683, -0.8063, -0.4014]], ..., [[ 0.2744, -5.4228, -5.1048, ..., -0.7355, -3.3125, -3.7913]], [[ 5.4287, -5.3253, -2.5071, ..., -4.0879, -1.7927, -0.6029]], [[ 2.9892, -4.2679, -3.8565, ..., -1.7876, -2.7321, -2.8192]]], [[[ -0.4242, -10.6500, -11.1528, ..., -1.8758, -0.8462, -2.1383]], [[ 4.4964, -4.1220, -5.1080, ..., -2.2682, -2.2462, 0.0936]], [[ 6.7746, -8.4560, -8.0037, ..., -2.4025, -1.3031, -0.1564]], ..., [[ 0.4415, -5.6499, -5.5394, ..., -2.1801, -1.3956, -1.4250]], [[ 5.3486, -6.8776, -4.9163, ..., -2.7160, -3.4472, -1.5858]], [[ 3.1393, -4.0935, -5.2164, ..., -2.8093, -2.3935, -1.6350]]]]) attn_weights tensor([[[[ 1.1990, -3.7058, -4.1624, ..., -1.6654, -2.0231, -2.4019]], [[ 4.8781, -2.0822, -2.1514, ..., 0.1427, -0.3937, 0.0421]], [[ 2.0873, -1.0999, -2.1337, ..., -0.9852, -1.5568, -2.3499]], ..., [[ 1.5191, -5.2671, -4.5618, ..., -3.8604, -2.6671, 0.1200]], [[ 1.3633, -3.8680, -3.3521, ..., -1.6469, -1.5635, -0.4195]], [[ 1.5292, -3.7330, -4.0915, ..., -3.3613, -2.5941, -1.7715]]], [[[ 0.9863, -3.9992, -3.6761, ..., -1.7710, -1.2006, -0.3105]], [[ 5.3893, -3.2473, -4.4829, ..., -1.1294, 0.5300, 1.2264]], [[ 1.3127, -2.5388, -3.1717, ..., -0.6442, 0.5372, -0.3564]], ..., [[ 1.6490, -5.5294, -5.6597, ..., -4.0840, -3.7800, -2.9145]], [[ 1.0715, -5.7091, -4.7931, ..., -1.6572, -1.4775, 0.6255]], [[ 0.7933, -3.2829, -3.3130, ..., -3.4658, -3.0405, -3.5151]]], [[[ 0.9420, -4.2862, -3.9594, ..., -2.3394, -0.9623, -1.0056]], [[ 4.0174, -5.3851, -4.3979, ..., -1.0240, -0.0798, -1.5679]], [[ 1.2880, -1.2035, -1.0055, ..., -0.9332, -0.7364, -2.9532]], ..., [[ 0.7733, -3.7415, -2.8219, ..., -0.9224, 0.7200, -1.3316]], [[ 0.9268, -4.3292, -4.0228, ..., -1.2596, -0.0798, -1.5015]], [[ 0.7628, -3.5160, -3.2610, ..., -3.3102, -2.0012, -3.4164]]], [[[ 1.3717, -2.4882, -2.8640, ..., -1.7631, -1.8483, -1.7170]], [[ 5.5659, -1.3303, -2.4702, ..., -2.6874, -0.0173, 1.3755]], [[ 1.3249, -0.1368, -0.7173, ..., 0.1067, -0.4006, -0.7777]], ..., [[ 1.0743, -2.6890, -1.5784, ..., -3.5901, -3.7803, -4.3237]], [[ 1.2803, -3.4122, -3.0302, ..., -1.4032, -2.3102, -1.1199]], [[ 0.8447, -4.4330, -4.6134, ..., -3.1914, -3.3797, -4.3691]]], [[[ 1.4957, -3.9570, -4.6430, ..., -3.5180, -2.8456, -2.5327]], [[ 5.3766, -3.9207, -3.3064, ..., -1.3195, -0.6168, -0.6991]], [[ 1.7827, -1.7688, -2.4354, ..., -1.4490, -0.7055, -1.6796]], ..., [[ 2.1407, -4.9233, -4.6557, ..., -2.8604, -2.8929, -1.1532]], [[ 1.1646, -4.1976, -4.5124, ..., -1.9414, -1.5189, -1.7307]], [[ 1.0030, -3.9729, -4.4661, ..., -3.4785, -4.3252, -3.1379]]]]) attn_weights tensor([[[[ 3.0475, -4.4377, -5.3594, ..., -2.3740, -3.4763, -0.1296]], [[ 4.1137, -2.4922, -3.0416, ..., -1.4963, -1.7341, -2.6838]], [[ 3.1508, -3.9578, -3.6996, ..., -1.5809, -1.3912, -0.6074]], ..., [[ 4.4185, -2.3712, -2.0275, ..., -1.9677, -2.0626, 0.3964]], [[ 1.2222, -6.3252, -5.6741, ..., 0.1637, 0.9603, -1.7343]], [[ 4.0565, 0.5499, -2.1027, ..., -1.9489, -0.9171, -2.5025]]], [[[ 1.6283, -3.9833, -3.5565, ..., -2.6010, -2.7323, -1.7349]], [[ 4.1679, -1.9622, -3.3712, ..., -2.5071, 0.0691, 0.7450]], [[ 1.8301, -4.1825, -4.5601, ..., -3.3720, -1.5267, -1.6108]], ..., [[ 5.0569, -2.4320, -2.8903, ..., -0.7110, 1.6958, 1.2577]], [[ 2.4384, -6.5885, -6.8523, ..., -3.7934, -1.3888, -1.4797]], [[ 3.9653, -1.5199, -2.9211, ..., -1.6523, -0.6084, -1.6322]]], [[[ 1.5334, -3.6007, -2.5182, ..., -2.4757, -0.4815, -1.7040]], [[ 3.9884, -1.8209, -2.5647, ..., 0.9651, -1.6348, -1.4131]], [[ 1.6260, -4.5897, -3.9369, ..., -2.6854, -0.9649, -3.1929]], ..., [[ 4.6383, -1.4117, -1.8562, ..., -2.1730, -0.6129, -1.5781]], [[ 0.3675, -6.9772, -6.1611, ..., -1.7488, -1.1348, -2.9184]], [[ 3.5438, -2.6998, -3.5999, ..., -0.8483, -1.7000, -2.2247]]], [[[ 2.0736, -0.9440, -1.5196, ..., -0.9451, -0.3973, -0.7838]], [[ 4.4613, -0.7520, -3.0097, ..., -0.3000, 1.2198, 3.9566]], [[ 1.8906, -3.2081, -1.9288, ..., -2.6498, -3.2130, -2.8138]], ..., [[ 4.2664, -3.4236, -3.5462, ..., -2.7245, -1.8749, -0.7655]], [[ 1.9141, -5.6072, -6.1445, ..., -0.1107, -0.1035, 0.7694]], [[ 2.9580, -1.1296, -1.9030, ..., -2.0333, -2.4152, -2.6426]]], [[[ 3.0041, -3.9335, -5.7172, ..., -1.0945, -2.1397, -0.6369]], [[ 3.5497, -2.4312, -3.6571, ..., -1.1948, -0.0791, -0.7819]], [[ 3.1411, -3.2043, -3.1237, ..., -1.3184, -1.6553, -0.0267]], ..., [[ 4.8001, -2.5929, -3.1856, ..., -1.1642, -1.6363, -0.2788]], [[ 0.5668, -7.4073, -6.0867, ..., 0.9214, 0.2180, 0.0159]], [[ 3.8457, -1.5030, -3.6133, ..., -2.2400, -1.7242, -2.0629]]]]) attn_weights tensor([[[[ 3.6483, -4.2899, -3.4604, ..., -3.5557, -3.5832, -0.8093]], [[ 4.5771, -2.6023, -3.4275, ..., -0.4086, -1.1338, 0.5125]], [[ 3.6071, -0.9779, -1.7853, ..., -2.0104, -0.9743, 0.1076]], ..., [[ 0.5393, -4.7973, -4.7848, ..., 0.2301, 0.5132, -1.4548]], [[ 3.6446, -2.6393, -1.7061, ..., -2.2931, -1.9009, -1.0101]], [[ 4.3103, -1.3346, -1.8417, ..., 2.8611, 4.9028, 2.0989]]], [[[ 2.8559, -3.8913, -3.4216, ..., -2.5472, -1.9186, -2.2014]], [[ 3.8795, -2.3026, -2.4362, ..., -0.4644, -0.5926, 0.1050]], [[ 3.4470, -3.2466, -2.8467, ..., -1.3525, 0.6848, 0.4136]], ..., [[ 1.2071, -5.9094, -4.6971, ..., -3.4891, -1.2523, -0.9222]], [[ 3.6669, -2.1154, -2.2217, ..., -2.7691, -1.9138, -0.5554]], [[ 4.8257, -1.8321, -1.4918, ..., -1.8346, 2.2987, 1.8599]]], [[[ 2.4751, -3.1514, -4.1961, ..., -3.2676, 0.3675, -2.7068]], [[ 4.1513, -1.9270, -3.8349, ..., -1.9758, -0.6180, -1.2613]], [[ 3.2370, -1.3356, -2.3340, ..., -2.0953, -1.0499, -1.7736]], ..., [[ 0.2526, -5.3180, -5.1157, ..., -2.6956, -1.2269, -2.3909]], [[ 3.3100, -1.4121, -2.4746, ..., -2.9207, -1.3958, -1.7721]], [[ 4.7077, -1.7416, -1.7792, ..., -2.4236, 0.5229, 2.0440]]], [[[ 2.6508, -4.7289, -3.6314, ..., -2.0031, -3.4566, -2.8127]], [[ 4.6307, -2.8811, -3.3066, ..., -2.2635, -2.3740, -0.0092]], [[ 3.0065, -2.5528, -2.2082, ..., -2.5552, -0.9655, -1.2224]], ..., [[ 0.2695, -4.6035, -4.3861, ..., -2.3064, -2.9168, -2.4945]], [[ 3.2551, -3.4239, -2.0944, ..., -1.9865, -2.6001, -1.7912]], [[ 5.5388, -0.3375, 1.0701, ..., 0.9602, 2.0071, 3.4193]]], [[[ 3.5608, -3.5778, -3.9796, ..., -2.3255, -2.9242, -0.7729]], [[ 4.7438, -2.4808, -3.9939, ..., 0.3732, -0.5980, 0.5333]], [[ 3.3588, -1.1108, -2.3278, ..., -0.5674, 0.2127, 0.4823]], ..., [[ 0.2162, -6.7414, -4.7657, ..., -0.4789, 0.2317, -0.0984]], [[ 3.7524, -2.3823, -2.8715, ..., -1.8192, -1.4504, -0.6304]], [[ 5.9089, -2.8864, -1.5350, ..., 1.3245, 0.2753, 3.5786]]]]) attn_weights tensor([[[[ 1.7883, 0.7711, 0.2228, ..., 1.4518, 1.4779, 1.6728]], [[ 3.9958, -0.5354, -1.5702, ..., 0.5807, 0.0205, 0.7683]], [[ 3.5024, -0.1046, -1.4066, ..., -0.3509, -0.7140, -0.2874]], ..., [[ 4.4309, -1.6984, -3.3666, ..., -0.5553, -1.4382, -0.3101]], [[ 3.5071, 0.3271, -1.1458, ..., 1.9255, 1.7645, 1.4557]], [[ 4.2765, 0.7904, -0.6461, ..., 1.8890, 2.3551, 1.3422]]], [[[ 1.6200, -0.4966, -1.6279, ..., -0.2404, 0.4616, 0.5666]], [[ 3.7148, -1.3342, -1.0280, ..., -0.4125, 0.3847, 0.2278]], [[ 3.4033, -1.7567, -1.6220, ..., -1.5917, -1.1435, -0.9786]], ..., [[ 4.1710, -0.2121, -1.0240, ..., -0.0307, 1.7550, 2.5298]], [[ 2.7447, -0.7988, 0.4246, ..., 0.6349, 2.5257, 1.7704]], [[ 3.2117, -1.2055, 0.0878, ..., -0.4775, 1.2276, 1.7286]]], [[[ 1.5138, 0.0701, -0.2115, ..., -0.0518, 0.7472, -0.4099]], [[ 3.4512, -1.1263, -1.0002, ..., -0.1564, -0.8647, -0.8571]], [[ 3.0911, -0.9579, -1.8657, ..., -1.7905, -0.4714, -0.7672]], ..., [[ 4.2287, -1.7239, -2.6511, ..., -1.2697, -1.3828, -1.6352]], [[ 2.8933, -0.6764, -1.1789, ..., -1.3580, 0.2391, 0.4596]], [[ 2.8777, -0.0106, -1.2859, ..., -0.7143, -0.0924, 0.4317]]], [[[ 1.0540, 0.4246, -0.3211, ..., -0.5844, -0.9261, 0.3152]], [[ 2.8815, -1.2731, -1.3069, ..., -1.2376, -1.8481, -1.4377]], [[ 2.3311, -1.5123, -2.3967, ..., -1.0580, -2.9942, -2.2989]], ..., [[ 4.0922, -1.3442, -2.4798, ..., -0.6315, -1.4732, 0.7803]], [[ 2.5174, -0.9661, -0.5377, ..., 0.4877, 0.1622, 0.4434]], [[ 3.1824, -0.2058, 0.6951, ..., 1.3411, 0.8202, 1.1368]]], [[[ 1.4607, 0.5943, -0.7245, ..., -0.4770, 0.2247, 1.0145]], [[ 3.7514, -0.6563, -0.6355, ..., -0.2516, 0.0361, 0.9396]], [[ 3.9589, 0.1205, -1.3457, ..., -1.4567, -0.6574, 0.2712]], ..., [[ 4.6279, -0.3196, -1.2535, ..., 0.9386, 0.5928, 0.9678]], [[ 3.3640, -0.6458, -1.3599, ..., 1.1554, 0.6401, 1.1926]], [[ 3.6402, 0.3578, -0.5099, ..., 3.0711, 2.4927, 1.6731]]]])