In [13]:
import torch as t
import numpy as np
from torch.utils.data import DataLoader
from torch import optim
from torch import nn
from model import *
from torchnet import meter
import tqdm
from config import *
from test import *

def train():
    if Config.use_gpu:
        Config.device = t.device("cuda")
    else:
        Config.device = t.device("cpu")
    device = Config.device
    # 获取数据
    datas = np.load("tang.npz", allow_pickle=True)
    data = datas['data']
    ix2word = datas['ix2word'].item()
    word2ix = datas['word2ix'].item()
    data = t.from_numpy(data)
    dataloader = DataLoader(data,
                            batch_size=Config.batch_size,
                            shuffle=True,
                            num_workers=2)

    # 定义模型
    model = PoetryModel(len(word2ix),
                        embedding_dim=Config.embedding_dim,
                        hidden_dim = Config.hidden_dim)
    Configimizer = optim.Adam(model.parameters(),lr=Config.lr)
    criterion = nn.CrossEntropyLoss()
    if Config.model_path:
        model.load_state_dict(t.load(Config.model_path,map_location='cpu'))
    # 转移到相应计算设备上
    model.to(device)
    loss_meter = meter.AverageValueMeter()
    # 进行训练
    f = open('result.txt','w')
    for epoch in range(Config.epoch):
        loss_meter.reset()
        for li,data_ in tqdm.tqdm(enumerate(dataloader)):
            #print(data_.shape)
            data_ = data_.long().transpose(1,0).contiguous()
            # 注意这里，也转移到了计算设备上
            data_ = data_.to(device)
            Configimizer.zero_grad()
            # n个句子，前n-1句作为输入，后n-1句作为输出，二者一一对应
            input_,target = data_[:-1,:],data_[1:,:]
            output,_ = model(input_)
            #print("Here",output.shape)
            # 这里为什么view(-1)
            print(target.shape,target.view(-1).shape)
            loss = criterion(output,target.view(-1))
            loss.backward()
            Configimizer.step()
            loss_meter.add(loss.item())
            # 进行可视化
            if (1+li)%Config.plot_every == 0:
                print("训练损失为%s"%(str(loss_meter.mean)))
                f.write("训练损失为%s"%(str(loss_meter.mean)))
                for word in list(u"春江花朝秋月夜"):
                    gen_poetry = ''.join(generate(model,word,ix2word,word2ix))
                    print(gen_poetry)
                    f.write(gen_poetry)
                    f.write("\n\n\n")
                    f.flush()
        t.save(model.state_dict(),'%s_%s.pth'%(Config.model_prefix,epoch))



train()

0it [00:00, ?it/s]

torch.Size([124, 16]) torch.Size([1984])


1it [00:02,  2.87s/it]

torch.Size([124, 16]) torch.Size([1984])


2it [00:05,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3it [00:07,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


4it [00:09,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


5it [00:12,  2.35s/it]

torch.Size([124, 16]) torch.Size([1984])


6it [00:14,  2.35s/it]

torch.Size([124, 16]) torch.Size([1984])


7it [00:16,  2.35s/it]

torch.Size([124, 16]) torch.Size([1984])


8it [00:19,  2.36s/it]

torch.Size([124, 16]) torch.Size([1984])


9it [00:21,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


10it [00:23,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


11it [00:26,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


12it [00:28,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


13it [00:31,  2.37s/it]

torch.Size([124, 16]) torch.Size([1984])


14it [00:33,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


15it [00:35,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


16it [00:38,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


17it [00:40,  2.37s/it]

torch.Size([124, 16]) torch.Size([1984])


18it [00:42,  2.37s/it]

torch.Size([124, 16]) torch.Size([1984])


19it [00:45,  2.37s/it]

torch.Size([124, 16]) torch.Size([1984])


20it [00:47,  2.36s/it]

torch.Size([124, 16]) torch.Size([1984])


21it [00:50,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


22it [00:52,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


23it [00:54,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


24it [00:57,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


25it [00:59,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


26it [01:02,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


27it [01:04,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


28it [01:07,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


29it [01:10,  2.62s/it]

torch.Size([124, 16]) torch.Size([1984])


30it [01:13,  2.69s/it]

torch.Size([124, 16]) torch.Size([1984])


31it [01:15,  2.74s/it]

torch.Size([124, 16]) torch.Size([1984])


32it [01:18,  2.83s/it]

torch.Size([124, 16]) torch.Size([1984])


33it [01:23,  3.22s/it]

torch.Size([124, 16]) torch.Size([1984])


34it [01:26,  3.38s/it]

torch.Size([124, 16]) torch.Size([1984])


35it [01:30,  3.38s/it]

torch.Size([124, 16]) torch.Size([1984])


36it [01:33,  3.24s/it]

torch.Size([124, 16]) torch.Size([1984])


37it [01:36,  3.23s/it]

torch.Size([124, 16]) torch.Size([1984])


38it [01:39,  3.11s/it]

torch.Size([124, 16]) torch.Size([1984])


39it [01:42,  3.04s/it]

torch.Size([124, 16]) torch.Size([1984])


40it [01:44,  2.94s/it]

torch.Size([124, 16]) torch.Size([1984])


41it [01:47,  2.88s/it]

torch.Size([124, 16]) torch.Size([1984])


42it [01:50,  2.80s/it]

torch.Size([124, 16]) torch.Size([1984])


43it [01:52,  2.71s/it]

torch.Size([124, 16]) torch.Size([1984])


44it [01:54,  2.62s/it]

torch.Size([124, 16]) torch.Size([1984])


45it [01:57,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


46it [01:59,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


47it [02:02,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


48it [02:04,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


49it [02:07,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


50it [02:09,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


51it [02:12,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


52it [02:14,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


53it [02:17,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


54it [02:19,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


55it [02:21,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


56it [02:24,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


57it [02:26,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


58it [02:29,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


59it [02:31,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


60it [02:33,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


61it [02:36,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


62it [02:38,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


63it [02:41,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


64it [02:43,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


65it [02:46,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


66it [02:48,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


67it [02:50,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


68it [02:53,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


69it [02:55,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


70it [02:58,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


71it [03:00,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


72it [03:03,  2.60s/it]

torch.Size([124, 16]) torch.Size([1984])


73it [03:06,  2.70s/it]

torch.Size([124, 16]) torch.Size([1984])


74it [03:09,  2.78s/it]

torch.Size([124, 16]) torch.Size([1984])


75it [03:12,  2.69s/it]

torch.Size([124, 16]) torch.Size([1984])


76it [03:14,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


77it [03:16,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


78it [03:19,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


79it [03:21,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


80it [03:23,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


81it [03:26,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


82it [03:28,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


83it [03:31,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


84it [03:33,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


85it [03:35,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


86it [03:38,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


87it [03:40,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


88it [03:43,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


89it [03:45,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


90it [03:48,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


91it [03:50,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


92it [03:53,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


93it [03:55,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


94it [03:57,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


95it [04:00,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


96it [04:02,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


97it [04:05,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


98it [04:07,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


99it [04:10,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


100it [04:12,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


101it [04:15,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


102it [04:17,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


103it [04:19,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


104it [04:22,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


105it [04:24,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


106it [04:27,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


107it [04:29,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


108it [04:31,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


109it [04:34,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


110it [04:36,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


111it [04:39,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


112it [04:41,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


113it [04:44,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


114it [04:46,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


115it [04:48,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


116it [04:51,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


117it [04:53,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


118it [04:56,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


119it [04:58,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


120it [05:00,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


121it [05:03,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


122it [05:05,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


123it [05:08,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


124it [05:10,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


125it [05:13,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


126it [05:15,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


127it [05:17,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


128it [05:20,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


129it [05:22,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


130it [05:25,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


131it [05:27,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


132it [05:29,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


133it [05:32,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


134it [05:34,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


135it [05:37,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


136it [05:39,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


137it [05:41,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


138it [05:44,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


139it [05:46,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


140it [05:49,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


141it [05:51,  2.37s/it]

torch.Size([124, 16]) torch.Size([1984])


142it [05:53,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


143it [05:56,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


144it [05:58,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


145it [06:00,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


146it [06:03,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


147it [06:05,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


148it [06:08,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


149it [06:10,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


150it [06:13,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


151it [06:15,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


152it [06:17,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


153it [06:20,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


154it [06:22,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


155it [06:25,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


156it [06:27,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


157it [06:30,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


158it [06:32,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


159it [06:35,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


160it [06:37,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


161it [06:40,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


162it [06:42,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


163it [06:45,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


164it [06:47,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


165it [06:50,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


166it [06:52,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


167it [06:55,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


168it [06:57,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


169it [06:59,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


170it [07:02,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


171it [07:04,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


172it [07:07,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


173it [07:09,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


174it [07:11,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


175it [07:14,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


176it [07:16,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


177it [07:19,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


178it [07:21,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


179it [07:24,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


180it [07:26,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


181it [07:28,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


182it [07:31,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


183it [07:33,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


184it [07:36,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


185it [07:38,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


186it [07:41,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


187it [07:43,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


188it [07:45,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


189it [07:48,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


190it [07:50,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


191it [07:53,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


192it [07:55,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


193it [07:58,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


194it [08:00,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


195it [08:02,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


196it [08:05,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


197it [08:07,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


198it [08:10,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


199it [08:12,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])
训练损失为1.0008394911885259
春日扶阳柳，东南逐丽芳。摇摇舟物色，绕迳倚楼情。石藓分钩缀，风露助催鸣。风烟和羽舞，仗阁静龙程。仙鹤凌秋晚，罗浮照日荣。阴珠照宫女，静鸟避征声。乐极辞仙子，陈游厌水卿。露华芳草丽，风月紫微生。每接鸳鸞举，恭忧镂浪轻。素琴方未醉，余态已萦倾。不惜连沙眇，兼疑色在盈。绵绵牋作艇，晚棹舞长城。篱浅多芳草，皆疑遶户行。长波随作赏，几色是佳声。预忆庞篱爱，应怜过草生。
江城扶高多，南亩摘桐珠。荷花夹夹水，石路相如无。彩凤游陆抱，采芳弄阑涯。清秋数百里，曲尽丛桃花。朱楼照云屏，薄夕浃云涯。烦君自自适，遇物谁能差。烦己贯东郭，淹留亦何伤。欲开笑言笥，日夕忧心光。美人出户庭，五云不相张。或咏罗绮秀，双阙清且凉。会以东顾主，夕阳独裴回。忆昨扈轩并，鸞驾南朝来。扈步凌云阁，萧条过郊墙。华夷虽殊尚，英词尚相亡。
花界人何乐，当中鼎一封。事游纷忽起，心切气相连。簿书重禄典，世论宽国贤。十载守州域，再鸣官下禅。劳歌方冉冉，独梦何绵莲。夹水鸟雀，流萤潭屿天。风流限年少，风雨扬津前。高论惊壑动，忽感起舟禅。夜余向秋月，迎泛四山天。凫鹥起林口，山馆通云坡。日出广陵路，星辰游太清。瑶草色尚绿，仙台曙连青。因云俱结驷，独酌丝纶巾。
朝光九霄澹，暮雨三五日。秋风一惆怅，人事皆满寺。门外有一星，一道无一状。白日自无际，白云常在耳。无心伴得宿，到处无昏晓。碧幢长带绿，芳草遮成翠。持巧事操绵，从兹求道薄。智者化於生，智相饶智草。攫肉从逐稽，释思同所止。乃知鍊者子，不饮此乡岳。乾坤富毛叶，祝右藏文器。稽负明德光，英明感深昔。裴回南陌上，赋药接门出。三更见邻家，始知达於地。
秋风歘吸得灵山，终日如钩山翠云。攒珠振迅明月真，走来三驱如至君。皇帝真气无消息，当时决璧思当秋。堂陀士中争得之，地角天涯相许违。乍言骏发已流寇，貂裘貂裘染飞辔。当时白帝千门通，环楼向日万人静。清机出海真自奇，功业当时不如此。夫子相亲妇将宫，蓬莱殿前五色龙。五色青云不得迹，九华丹甲如如玉，去日昇兮磨万刻。风回未终上白沙，大夫万里犹未来。
月明江头江上来，沙头海底吴山来。欲淘波上红霞起，忽尔飞飞落秋水。适值江南多早梅，谁家凭船有新哀。政成天竺书莫论，又有笔砚称老来。不如挥手长叹嗟，何况生与子嫌丑。持此将还慰佳节，行役何

200it [08:20,  3.95s/it]

夜色尚再夜，心绪不知还。不见主人字，下车登遥山。穷春心不乐，听我曲自闲。坐臥夕阳里，雪烟冷江中。人稀臥海月，梦想在明宫。时清千里隔，心期二十年。数回不忍语，敛散已凄风。我亦愁风月，东西逢路空。赖逢瑶台友，愿作东南龙。共惜明镜主，徒闻车辙翁。微才谢时术，明主许开襟。寄病久搔首，含诗寄清风。时时屡沐时，但谓清泉。伊昔东山外，云飞横素翰。兴傥谅多期，永怀良未穷。
torch.Size([124, 16]) torch.Size([1984])


201it [08:22,  3.45s/it]

torch.Size([124, 16]) torch.Size([1984])


202it [08:24,  3.13s/it]

torch.Size([124, 16]) torch.Size([1984])


203it [08:27,  2.93s/it]

torch.Size([124, 16]) torch.Size([1984])


204it [08:29,  2.78s/it]

torch.Size([124, 16]) torch.Size([1984])


205it [08:32,  2.70s/it]

torch.Size([124, 16]) torch.Size([1984])


206it [08:34,  2.62s/it]

torch.Size([124, 16]) torch.Size([1984])


207it [08:37,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


208it [08:39,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


209it [08:41,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


210it [08:44,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


211it [08:46,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


212it [08:49,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


213it [08:51,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


214it [08:54,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


215it [08:56,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


216it [08:58,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


217it [09:01,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


218it [09:03,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


219it [09:06,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


220it [09:08,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


221it [09:11,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


222it [09:13,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


223it [09:16,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


224it [09:18,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


225it [09:21,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


226it [09:23,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


227it [09:26,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


228it [09:28,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


229it [09:31,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


230it [09:34,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


231it [09:36,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


232it [09:39,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


233it [09:41,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


234it [09:44,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


235it [09:46,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


236it [09:49,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


237it [09:52,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


238it [09:54,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


239it [09:57,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


240it [09:59,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


241it [10:02,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


242it [10:04,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


243it [10:07,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


244it [10:09,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


245it [10:12,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


246it [10:14,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


247it [10:17,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


248it [10:19,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


249it [10:22,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


250it [10:24,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


251it [10:26,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


252it [10:29,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


253it [10:31,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


254it [10:34,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


255it [10:36,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


256it [10:39,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


257it [10:41,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


258it [10:44,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


259it [10:46,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


260it [10:49,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


261it [10:51,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


262it [10:54,  2.60s/it]

torch.Size([124, 16]) torch.Size([1984])


263it [10:57,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


264it [10:59,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


265it [11:02,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


266it [11:04,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


267it [11:06,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


268it [11:09,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


269it [11:11,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


270it [11:14,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


271it [11:17,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


272it [11:19,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


273it [11:22,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


274it [11:24,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


275it [11:27,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


276it [11:30,  2.63s/it]

torch.Size([124, 16]) torch.Size([1984])


277it [11:32,  2.65s/it]

torch.Size([124, 16]) torch.Size([1984])


278it [11:35,  2.62s/it]

torch.Size([124, 16]) torch.Size([1984])


279it [11:37,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


280it [11:40,  2.60s/it]

torch.Size([124, 16]) torch.Size([1984])


281it [11:43,  2.61s/it]

torch.Size([124, 16]) torch.Size([1984])


282it [11:45,  2.60s/it]

torch.Size([124, 16]) torch.Size([1984])


283it [11:48,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


284it [11:50,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


285it [11:53,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


286it [11:55,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


287it [11:58,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


288it [12:00,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


289it [12:03,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


290it [12:06,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


291it [12:08,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


292it [12:11,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


293it [12:13,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


294it [12:15,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


295it [12:18,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


296it [12:20,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


297it [12:23,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


298it [12:25,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


299it [12:27,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


300it [12:30,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


301it [12:32,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


302it [12:35,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


303it [12:37,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


304it [12:39,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


305it [12:42,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


306it [12:44,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


307it [12:47,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


308it [12:49,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


309it [12:51,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


310it [12:54,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


311it [12:56,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


312it [12:58,  2.37s/it]

torch.Size([124, 16]) torch.Size([1984])


313it [13:01,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


314it [13:03,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


315it [13:06,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


316it [13:08,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


317it [13:10,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


318it [13:13,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


319it [13:15,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


320it [13:18,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


321it [13:20,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


322it [13:22,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


323it [13:25,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


324it [13:27,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


325it [13:30,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


326it [13:32,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


327it [13:34,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


328it [13:37,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


329it [13:39,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


330it [13:42,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


331it [13:44,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


332it [13:46,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


333it [13:49,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


334it [13:51,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


335it [13:53,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


336it [13:56,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


337it [13:58,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


338it [14:01,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


339it [14:03,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


340it [14:05,  2.37s/it]

torch.Size([124, 16]) torch.Size([1984])


341it [14:08,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


342it [14:10,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


343it [14:13,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


344it [14:15,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


345it [14:17,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


346it [14:20,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


347it [14:22,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


348it [14:25,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


349it [14:27,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


350it [14:30,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


351it [14:32,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


352it [14:35,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


353it [14:37,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


354it [14:40,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


355it [14:43,  2.61s/it]

torch.Size([124, 16]) torch.Size([1984])


356it [14:45,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


357it [14:48,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


358it [14:50,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


359it [14:53,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


360it [14:55,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


361it [14:58,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


362it [15:00,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


363it [15:03,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


364it [15:05,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


365it [15:07,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


366it [15:10,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


367it [15:12,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


368it [15:15,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


369it [15:17,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


370it [15:19,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


371it [15:22,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


372it [15:24,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


373it [15:27,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


374it [15:29,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


375it [15:31,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


376it [15:34,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


377it [15:36,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


378it [15:39,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


379it [15:41,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


380it [15:43,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


381it [15:46,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


382it [15:48,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


383it [15:50,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


384it [15:53,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


385it [15:55,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


386it [15:58,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


387it [16:00,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


388it [16:02,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


389it [16:05,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


390it [16:07,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


391it [16:10,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


392it [16:12,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


393it [16:14,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


394it [16:17,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


395it [16:19,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


396it [16:22,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


397it [16:24,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


398it [16:27,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


399it [16:29,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])
训练损失为1.1208561620116226
春色经中事，青铜照独眠。同心交手重，会面小妆妍。为问深宫里，教教小进年。自惭兼接绮，不识不通年。有恨怜顦顇，谁人似比然。列文皆駮绿，栽柳惹红鲜。渥肱何夭进，科锄易与崑。貂囊辞集地，琴瑟和高弦。异恨一三五，汤颜暗隔年。未知还守约，宛转马蹄前。密梵忘来久，登楼意绪偏。云由难驻马，猨为伴留铭。晓日乘妆雨，春寒破烛青。睡裁敲竹案，漏雍破墙墙。就笔求宽急，眠帘小柱钱。檐吟禽不语，苔暗鸟冲天。晚景连溪月，春寒
江城扶高多，桂叶碧且碧。吾欲窥天公，青冥秀江内。翠色开罗帐，春光疑波水。窈窕开四门，苍茫望三逵。羣雄望紫霄，秦风荡洪璧。白虹吼如电，红锦紫如霜。陋巷杂烟尘，抽毫换新茧。城中豪赵宅，不是喧喧悲。古貌有一空，生泪常自衰。既似血顿血，恐然呜咽脂。万事尽如此，含眉任所依。君看贞白璧，不如罗与衣。长恨短泪消，妾魂流晨头。如何摧折去，易异人已稀。共有楼上辞，歌声促秋衣。
花界人将世，龙居将莫嵬。时时无价薄，永久误君能。昨闻丞相言，知我抱遐谣。顾惟风尘外，但谓营有谋。临告慕聪明，岂惟厌王侯。生平在何处，此別岂吾哉。醉舞洛阳城，莫辞东逝销。古来诗句践，兄弟欲何骄。好是两寸血，空书中路遥。单车望春別，白首长安消。自顾汉文字，不如太常瓜。贱骨颇可贱，川平贫且遥。伯愚竟不绝，况乃投丘园。忽然高高台，但恐物我遥。
朝发西南芝，南渡月华光。朗有寒物旷，翛然有风光。兹溪杂绿湍，永嶂无停光。入山挹众植，安葺得一方。人间岁已晏，汲寂性颇长。仲夏月未白，陂洲草自黄。古泉森且壮，中庭泽未黄。东中有高树，日与新加阳。陋巷有蔬食，水深唯有香。松竹讵迅，龟潭轻负遐。清羸修坐者，盥兀松桂香。步竹清新旭，残蝉鸣晓廊。忽闻风雷动，喧臥珊瑚坊。或乏折叶数，又及白雪萎。曷如天一涯，岂必纡诸光。自无所从者，三毒无萎些。安得为时术，枣木亦
秋光古才长揭明，俊禽发腐者称兵。梓州草色马不死，每春相伴登春行。洛阳柳岸人可问，美人堂前弄新月。问人不惜妾心狂，谁令西来如昨日。今时好老风光时，胡中大妾唱胡歌。尔不识龟肠如雪，谁人能信妾中人。长歌落日魂断断，更有心情苦丁没。流湘陌上惊莺啼，怅望烟空忆沧浪。吴童傲羲君不见，女子呵香愁不绝。风号烈兮肠不衰，人在天边独往时。一人尽爱君独坐，月晚盛欢亲自衰。何人感此古长老

400it [16:37,  3.98s/it]

夜梦神仙隐一壁，白日飘飘一日魂。城头波影碧湘水，月落风高桃李园。闲冲雨露光高牖，静对松花媿故园。合得春光能变景，可怜风景似淘鲲。回廊影入凡尘暗，流水沙衔汗浪昏。飘剪芳菲成翠壁，洞天芳草锁闲园。绮罗似雾休呈丽，花里初欺景兔繁。忆昔管絃无限态，齐觞鞭罢寇侯敦。蟾蜍正好憎春忆，珠缀余英几捧繁。丽色似迎云外殿，夕阳偏向客帷微。
torch.Size([124, 16]) torch.Size([1984])


401it [16:39,  3.52s/it]

torch.Size([124, 16]) torch.Size([1984])


402it [16:41,  3.15s/it]

torch.Size([124, 16]) torch.Size([1984])


403it [16:44,  2.92s/it]

torch.Size([124, 16]) torch.Size([1984])


404it [16:46,  2.75s/it]

torch.Size([124, 16]) torch.Size([1984])


405it [16:49,  2.64s/it]

torch.Size([124, 16]) torch.Size([1984])


406it [16:51,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


407it [16:53,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


408it [16:56,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


409it [16:58,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


410it [17:01,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


411it [17:03,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


412it [17:06,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


413it [17:08,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


414it [17:11,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


415it [17:13,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


416it [17:16,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


417it [17:18,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


418it [17:21,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


419it [17:23,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


420it [17:26,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


421it [17:28,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


422it [17:31,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


423it [17:34,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


424it [17:36,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


425it [17:39,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


426it [17:41,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


427it [17:44,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


428it [17:46,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


429it [17:49,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


430it [17:51,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


431it [17:54,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


432it [17:56,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


433it [17:59,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


434it [18:02,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


435it [18:04,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


436it [18:07,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


437it [18:09,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


438it [18:12,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


439it [18:14,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


440it [18:16,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


441it [18:19,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


442it [18:21,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


443it [18:24,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


444it [18:26,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


445it [18:29,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


446it [18:31,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


447it [18:34,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


448it [18:36,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


449it [18:39,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


450it [18:41,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


451it [18:43,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


452it [18:46,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


453it [18:49,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


454it [18:51,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


455it [18:54,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


456it [18:56,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


457it [18:59,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


458it [19:01,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


459it [19:04,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


460it [19:06,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


461it [19:08,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


462it [19:11,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


463it [19:13,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


464it [19:16,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


465it [19:18,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


466it [19:21,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


467it [19:24,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


468it [19:26,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


469it [19:29,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


470it [19:31,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


471it [19:34,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


472it [19:37,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


473it [19:39,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


474it [19:42,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


475it [19:44,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


476it [19:47,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


477it [19:49,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


478it [19:52,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


479it [19:55,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


480it [19:57,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


481it [20:00,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


482it [20:02,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


483it [20:05,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


484it [20:08,  2.61s/it]

torch.Size([124, 16]) torch.Size([1984])


485it [20:10,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


486it [20:13,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


487it [20:15,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


488it [20:18,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


489it [20:20,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


490it [20:22,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


491it [20:25,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


492it [20:27,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


493it [20:30,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


494it [20:32,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


495it [20:35,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


496it [20:37,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


497it [20:40,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


498it [20:42,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


499it [20:45,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


500it [20:47,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


501it [20:50,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


502it [20:52,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


503it [20:55,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


504it [20:57,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


505it [21:00,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


506it [21:03,  2.62s/it]

torch.Size([124, 16]) torch.Size([1984])


507it [21:05,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


508it [21:07,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


509it [21:10,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


510it [21:12,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


511it [21:15,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


512it [21:17,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


513it [21:20,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


514it [21:22,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


515it [21:24,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


516it [21:27,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


517it [21:29,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


518it [21:32,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


519it [21:34,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


520it [21:36,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


521it [21:39,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


522it [21:41,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


523it [21:44,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


524it [21:46,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


525it [21:49,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


526it [21:51,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


527it [21:54,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


528it [21:56,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


529it [21:59,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


530it [22:01,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


531it [22:03,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


532it [22:06,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


533it [22:08,  2.35s/it]

torch.Size([124, 16]) torch.Size([1984])


534it [22:10,  2.34s/it]

torch.Size([124, 16]) torch.Size([1984])


535it [22:13,  2.33s/it]

torch.Size([124, 16]) torch.Size([1984])


536it [22:15,  2.33s/it]

torch.Size([124, 16]) torch.Size([1984])


537it [22:17,  2.35s/it]

torch.Size([124, 16]) torch.Size([1984])


538it [22:20,  2.32s/it]

torch.Size([124, 16]) torch.Size([1984])


539it [22:22,  2.35s/it]

torch.Size([124, 16]) torch.Size([1984])


540it [22:24,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


541it [22:27,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


542it [22:29,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


543it [22:32,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


544it [22:34,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


545it [22:37,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


546it [22:39,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


547it [22:41,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


548it [22:44,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


549it [22:46,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


550it [22:49,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


551it [22:51,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


552it [22:53,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


553it [22:56,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


554it [22:58,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


555it [23:01,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


556it [23:03,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


557it [23:05,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


558it [23:08,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


559it [23:10,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


560it [23:13,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


561it [23:15,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


562it [23:18,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


563it [23:21,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


564it [23:23,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


565it [23:26,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


566it [23:28,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


567it [23:31,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


568it [23:33,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


569it [23:36,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


570it [23:38,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


571it [23:41,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


572it [23:44,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


573it [23:46,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


574it [23:49,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


575it [23:51,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


576it [23:54,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


577it [23:56,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


578it [23:59,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


579it [24:01,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


580it [24:04,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


581it [24:06,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


582it [24:09,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


583it [24:11,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


584it [24:14,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


585it [24:16,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


586it [24:19,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


587it [24:21,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


588it [24:24,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


589it [24:26,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


590it [24:29,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


591it [24:31,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


592it [24:33,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


593it [24:36,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


594it [24:38,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


595it [24:41,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


596it [24:43,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


597it [24:46,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


598it [24:48,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


599it [24:51,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])
训练损失为1.2101642794410377
春水徧兆灵，南游漆渚宫。昔闻碧桃子，千里荡金风。荡漾遵目目，跃漫俨成藂。戏马乘天上，飞珠照海中。忽惊云雨起，还与龙潭通。可贵空窈窕，俄攀皎然功。炉芒赐马影，缤杂坠云红。清韵凌秋色，姑苏入曙空。高情极芳月，乔木涨西东。如何建容殿，从兹避简躬。云霞倏自尔，潢厦岂纤笼。冶生宗言什，恶态随时雄。羣迁从此断，抚素竟何穷。
江司冠盖之八葛，独谢荆门十围月。江城秋尽海，潇湘海日清皓。高台古墓名丘宫，西出峨嵋作神气。灵云纵纵唱吴歌引，鬼魅时时伏鼻趋。自谓明时不平主，盖轮零落满平芜。白首相逢翻不见，如何走马上天衢。夫人寡赋多骄理，愿倚门前掩朱雀。长镫本胜征路隅，龙鞍忽上珊瑚衫。八台九折俨如劒，白璧低缠无断绝。骥客留歌立地来，蜀王牋成酒多疾。醉后歌歌曲路长，罗巾掷鞚春风开。两岸二花争绽汙，菖菱含笑绿花开。
花落草萋萋，湖初冬晚稠。连波怅望处，落日复浮流。舟泊天上日，舟行沙际舟。穷冬九十地，夹地秋天秋。帝乡山海晴，春水淼茫洲。行人望海暖，野月明天游。別离家国泽，征马上扬州。忆昨金陵游，相逢一水流。重山共澄霁，帆影明如浮。浦屿逶迤路，风帆摇水沤。离魂倚楼上，千里云中流。吴岫碧云道，荆谿烟雨愁。借问从此去，故人何处游？坐厌荆州路，何时归旧楼。
朝发淇水边，十里看云天。遥见故人书，空成天地天。自从长沙熟，有食非黎然。再登四时科，刺米立小椽。攫喔毛有毒，吞胆势不全。脱足百尺弓，射缚决王权。问是有漏乐，不如火炉贤。耳缩时甚严，拔如天地坚。可以获稻粱，将锄置锥床。攫搏射猛鱼，羶毒不盈联。伉拭速受顾，详山备扶鞭。
秋天杳茫漫，青嶂含苍梧。积水含霁澜，积波照天宽。渊柔及良夕，曾为慕幽翰。哲孙文章菲，千载正相欢。朝朝共泛汎，余若萦幽蹊。曾经五月夕，兴与五峰寒。寻咏惜芳樽，揽衣满人泥。所劳见时色，坐见幽寂境。泛杖行月高，乘轩散林峦。适指岂知近，吾亦适吾宗。孙遵樊楚巅，隐隐必为邦。每兹兹山阻，忽遇至旧欢。时矣忽言放，山山忽腾抟。谐止瑶池浪，空接桂丛藂。
月出石稜稜，屹然中汉量。鳞尔吾师翊，玉编趋我婴。挺身束众节，抚心劳所施。挺身慕世世，弃置资天和。势素焕天宇，金容焕宫河。巍巍七曜尽，结构八九区。岂谓凡法中，生死杳无虞。体暗弥苍切，微然若空哗。云宫互见忝，华阁每来趋。高标有灵凤，顾密

600it [24:58,  3.87s/it]

夜梦神仙人，貌鍊药铅里。不买田舍或，因兹上持记。指着又须去，两两若脱地。牵者二个空，内前多梵地。三五六十代，五苦诸如七。所以不生色，囊中那可利。唯有母竖儿，何须礼专杼。祇言（巧作，究牵不得拟。身虽无生下，身死无过舍。佯解入口床，自现相违佛。铅宽分体长，不须乱如掌。魂魄本无疑，方元是明主。一语及今人，天外为天绿。四五打兵相，诸顿缚牙贼。一双吾师口，登山而太细。若欲有分离，如此而何歛。若能如在龙，如波
torch.Size([124, 16]) torch.Size([1984])


601it [25:00,  3.44s/it]

torch.Size([124, 16]) torch.Size([1984])


602it [25:02,  3.10s/it]

torch.Size([124, 16]) torch.Size([1984])


603it [25:05,  2.86s/it]

torch.Size([124, 16]) torch.Size([1984])


604it [25:07,  2.72s/it]

torch.Size([124, 16]) torch.Size([1984])


605it [25:09,  2.61s/it]

torch.Size([124, 16]) torch.Size([1984])


606it [25:12,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


607it [25:14,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


608it [25:17,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


609it [25:20,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


610it [25:22,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


611it [25:25,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


612it [25:27,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


613it [25:30,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


614it [25:32,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


615it [25:35,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


616it [25:37,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


617it [25:40,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


618it [25:42,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


619it [25:45,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


620it [25:48,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


621it [25:50,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


622it [25:53,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


623it [25:55,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


624it [25:58,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


625it [26:00,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


626it [26:03,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


627it [26:05,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


628it [26:07,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


629it [26:10,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


630it [26:13,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


631it [26:15,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


632it [26:17,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


633it [26:20,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


634it [26:22,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


635it [26:25,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


636it [26:27,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


637it [26:29,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


638it [26:32,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


639it [26:34,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


640it [26:37,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


641it [26:39,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


642it [26:42,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


643it [26:44,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


644it [26:47,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


645it [26:49,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


646it [26:52,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


647it [26:54,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


648it [26:56,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


649it [26:59,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


650it [27:01,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


651it [27:04,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


652it [27:06,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


653it [27:09,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


654it [27:11,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


655it [27:14,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


656it [27:16,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


657it [27:19,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


658it [27:21,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


659it [27:24,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


660it [27:26,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


661it [27:29,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


662it [27:31,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


663it [27:34,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


664it [27:37,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


665it [27:39,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


666it [27:42,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


667it [27:44,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


668it [27:47,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


669it [27:50,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


670it [27:52,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


671it [27:55,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


672it [27:57,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


673it [28:00,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


674it [28:02,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


675it [28:05,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


676it [28:07,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


677it [28:10,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


678it [28:12,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


679it [28:15,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


680it [28:17,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


681it [28:20,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


682it [28:22,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


683it [28:25,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


684it [28:27,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


685it [28:29,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


686it [28:32,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


687it [28:34,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


688it [28:37,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


689it [28:39,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


690it [28:42,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


691it [28:44,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


692it [28:47,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


693it [28:49,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


694it [28:52,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


695it [28:54,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


696it [28:56,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


697it [28:59,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


698it [29:01,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


699it [29:04,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


700it [29:06,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


701it [29:09,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


702it [29:11,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


703it [29:14,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


704it [29:16,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


705it [29:19,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


706it [29:21,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


707it [29:24,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


708it [29:26,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


709it [29:29,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


710it [29:31,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


711it [29:34,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


712it [29:36,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


713it [29:39,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


714it [29:41,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


715it [29:44,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


716it [29:47,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


717it [29:49,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


718it [29:52,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


719it [29:54,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


720it [29:57,  2.60s/it]

torch.Size([124, 16]) torch.Size([1984])


721it [30:00,  2.62s/it]

torch.Size([124, 16]) torch.Size([1984])


722it [30:02,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


723it [30:05,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


724it [30:07,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


725it [30:10,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


726it [30:12,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


727it [30:15,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


728it [30:17,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


729it [30:20,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


730it [30:22,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


731it [30:24,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


732it [30:27,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


733it [30:29,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


734it [30:32,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


735it [30:34,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


736it [30:36,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


737it [30:39,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


738it [30:42,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


739it [30:44,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


740it [30:46,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


741it [30:49,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


742it [30:51,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


743it [30:54,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


744it [30:56,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


745it [30:58,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


746it [31:01,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


747it [31:03,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


748it [31:06,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


749it [31:08,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


750it [31:11,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


751it [31:13,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


752it [31:15,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


753it [31:18,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


754it [31:20,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


755it [31:23,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


756it [31:25,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


757it [31:27,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


758it [31:30,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


759it [31:32,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


760it [31:35,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


761it [31:37,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


762it [31:40,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


763it [31:42,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


764it [31:44,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


765it [31:47,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


766it [31:49,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


767it [31:52,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


768it [31:54,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


769it [31:57,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


770it [31:59,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


771it [32:01,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


772it [32:04,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


773it [32:06,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


774it [32:09,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


775it [32:11,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


776it [32:14,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


777it [32:16,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


778it [32:18,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


779it [32:21,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


780it [32:23,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


781it [32:26,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


782it [32:28,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


783it [32:31,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


784it [32:33,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


785it [32:36,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


786it [32:39,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


787it [32:41,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


788it [32:43,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


789it [32:46,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


790it [32:49,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


791it [32:51,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


792it [32:53,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


793it [32:56,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


794it [32:58,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


795it [33:01,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


796it [33:03,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


797it [33:06,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


798it [33:08,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


799it [33:11,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])
训练损失为1.2918514982610934
春色河水微，平明照巫山。僊舟荡江水，南越随江山。岂知台峤人，邈邈不同攀。不凫亦已一，扰扰知异深。所恨武陵山，尝闻东山吟。地清四百里，春色游千寻。水流咫尺泻，水暎千峰岑。相去千载远，宁愁別馆深。东风吹暮雨，始得白云心。迳远见邻里，人来多阻闲。爱君万里道，共此十年闲。邀我共携手，还依东涧深。石门隔河汉，往往闻云禽。记余在高馆，及此涤烦襟。明月独听君，风流不盈寻。
江汉通京网，儒车谒上皇。紫霄来拜将，六始散羣郎。北陆辞天子，西山任圣哲。圣朝冠汉史，俗契出兵床。礼乐加新命，诗经笃用谈。戈鋋交驷马，仗戟亚离疆。奏命从臣说，鸣兵召战将。风云同阵象，甲日认膏桑。水木蒸禾破，山泥白璧彰。髯星照旌斾，危兽俨金骧。割厘归司死，何民稅代方。鱼龙超雾色，禾网杂泉光。败溜缘岚翠，重簷倚石墙。遥知讶奚处，不见在潇湘。谩说为荣爱，知君不算方。
花界人啼天草色，后人洲曲荅杨洲。一叶飞风洒襟思，数声清磬听鸣讴。龙笻机上知堪喜，珪组声中岂敢酬。松声震断无因见，鴈塔深期得一游。端拱猨声疎竹道，黄昏寂寞似渔矶。寻花莫忘幽源处，趣重危家近绿衣。忽尔不逢寒食去，每寻情遇似烟微。空嗟此地为君说，乡里分张局溅愁。万里不应丹志制，谿阳才就似何由。
朝发北窗津，暮啄左右还。吏时顾士戆，稅益尸盗勋。一食兵应苦，九坐寝见文。况逢富之日，或覩江湖人。情悟或自悲，乐壮固不伸。武帝竟何辜，豺虎忽在秦。城东信憧憧，不与天下宾。岂无党议说，不觉身独贫。富贵无念此，君能苦辛辛。驱车随长将，拜职赴咸秦。所以松柏使，遂媿猛武臣。嗟嗟魏王子，耻献宾鲁隣。斯文谅已久，遂使俱因陈。
秋天杳茫漫，山侣眄峥嵘。崚萌如耀雪，壮气迅飞鸣。杖轧走天地，潜飞若鸟行。四方尚奔流，百川被秋声。剧视陵邑间，濛濛大州城。阴风吹修哀，四海绕吞鲸。喷喷洪液势，击裘令吏营。一操舟檝介，麋骨同一楹。蹄拔蟹苗，爪力勿食铃。雪天泽无盐，谁是为拾盈。姦民益多故，兵血吞不平。遂为守患苦，灾患归尔并。首上天下狼，夜深兽为鸣。妇竖起清景，妇儿夸市兵。鸱鸮如何事，天下不合生。
月界三百里，星辰二宿初。直波横瑞碎，明历转三闾。玉醴晨趋槛，山川叠缀虚。焚香邀祓舞，比藻藻清虚。蚁大光觞绝，魄摇瑶圃虚。荣容长结意，荣耀几何如。壽老慙皆识，公私忝有余。南山披讲府，北

800it [33:18,  3.85s/it]

夜梦花为唤，时年眼似泥。同时知爱物，从事定能妖。本是承恩要，多因点慢朝。迎风下朱阁，带日下金堤。惊鴈栖林树，惊蝉蝴蝶雏。分忧悉芜逼，遥句笑相邀。阶废眠鹦鹉，巖虚蹋鹿泥。相逢阮有说，自笑旧知己。嬾与拋篱掷，相思碍树梢。地闲难更翫，尘事勿相携。蝉聒迎秋树，蝉声彻晓楼。旧恩君不在，又上白云桥。
torch.Size([124, 16]) torch.Size([1984])


801it [33:20,  3.39s/it]

torch.Size([124, 16]) torch.Size([1984])


802it [33:23,  3.09s/it]

torch.Size([124, 16]) torch.Size([1984])


803it [33:25,  2.88s/it]

torch.Size([124, 16]) torch.Size([1984])


804it [33:27,  2.72s/it]

torch.Size([124, 16]) torch.Size([1984])


805it [33:30,  2.62s/it]

torch.Size([124, 16]) torch.Size([1984])


806it [33:32,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


807it [33:34,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


808it [33:37,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


809it [33:39,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


810it [33:42,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


811it [33:44,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


812it [33:46,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


813it [33:49,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


814it [33:51,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


815it [33:54,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


816it [33:56,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


817it [33:59,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


818it [34:01,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


819it [34:04,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


820it [34:06,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


821it [34:08,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


822it [34:11,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


823it [34:13,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


824it [34:16,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


825it [34:18,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


826it [34:20,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


827it [34:23,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


828it [34:25,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


829it [34:28,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


830it [34:30,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


831it [34:33,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


832it [34:35,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


833it [34:38,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


834it [34:40,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


835it [34:43,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


836it [34:45,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


837it [34:48,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


838it [34:51,  2.60s/it]

torch.Size([124, 16]) torch.Size([1984])


839it [34:53,  2.60s/it]

torch.Size([124, 16]) torch.Size([1984])


840it [34:56,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


841it [34:58,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


842it [35:00,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


843it [35:03,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


844it [35:05,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


845it [35:08,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


846it [35:10,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


847it [35:13,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


848it [35:15,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


849it [35:18,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


850it [35:20,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


851it [35:23,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


852it [35:25,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


853it [35:27,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


854it [35:30,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


855it [35:32,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


856it [35:35,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


857it [35:37,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


858it [35:40,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


859it [35:42,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


860it [35:45,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


861it [35:48,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


862it [35:50,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


863it [35:53,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


864it [35:55,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


865it [35:57,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


866it [36:00,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


867it [36:02,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


868it [36:05,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


869it [36:07,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


870it [36:10,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


871it [36:12,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


872it [36:15,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


873it [36:18,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


874it [36:20,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


875it [36:23,  2.61s/it]

torch.Size([124, 16]) torch.Size([1984])


876it [36:25,  2.60s/it]

torch.Size([124, 16]) torch.Size([1984])


877it [36:28,  2.61s/it]

torch.Size([124, 16]) torch.Size([1984])


878it [36:31,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


879it [36:33,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


880it [36:36,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


881it [36:38,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


882it [36:40,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


883it [36:43,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


884it [36:46,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


885it [36:48,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


886it [36:51,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


887it [36:53,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


888it [36:55,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


889it [36:58,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


890it [37:00,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


891it [37:03,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


892it [37:05,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


893it [37:07,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


894it [37:10,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


895it [37:12,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


896it [37:15,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


897it [37:17,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


898it [37:20,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


899it [37:23,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


900it [37:25,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


901it [37:27,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


902it [37:30,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


903it [37:33,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


904it [37:35,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


905it [37:38,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


906it [37:40,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


907it [37:43,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


908it [37:45,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


909it [37:48,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


910it [37:50,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


911it [37:52,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


912it [37:55,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


913it [37:57,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


914it [38:00,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


915it [38:02,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


916it [38:04,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


917it [38:07,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


918it [38:09,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


919it [38:12,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


920it [38:14,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


921it [38:17,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


922it [38:19,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


923it [38:22,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


924it [38:24,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


925it [38:27,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


926it [38:29,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


927it [38:32,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


928it [38:34,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


929it [38:37,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


930it [38:39,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


931it [38:42,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


932it [38:44,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


933it [38:47,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


934it [38:49,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


935it [38:52,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


936it [38:54,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


937it [38:57,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


938it [39:00,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


939it [39:02,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


940it [39:05,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


941it [39:07,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


942it [39:10,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


943it [39:12,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


944it [39:15,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


945it [39:17,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


946it [39:20,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


947it [39:22,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


948it [39:25,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


949it [39:27,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


950it [39:30,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


951it [39:32,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


952it [39:35,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


953it [39:37,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


954it [39:40,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


955it [39:42,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


956it [39:44,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


957it [39:47,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


958it [39:49,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


959it [39:52,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


960it [39:54,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


961it [39:57,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


962it [40:00,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


963it [40:02,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


964it [40:04,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


965it [40:07,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


966it [40:10,  2.61s/it]

torch.Size([124, 16]) torch.Size([1984])


967it [40:12,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


968it [40:15,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


969it [40:17,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


970it [40:20,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


971it [40:22,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


972it [40:25,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


973it [40:27,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


974it [40:30,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


975it [40:32,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


976it [40:35,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


977it [40:37,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


978it [40:40,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


979it [40:42,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


980it [40:45,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


981it [40:47,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


982it [40:50,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


983it [40:52,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


984it [40:55,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


985it [40:57,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


986it [41:00,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


987it [41:02,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


988it [41:05,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


989it [41:07,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


990it [41:09,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


991it [41:12,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


992it [41:14,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


993it [41:17,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


994it [41:19,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


995it [41:22,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


996it [41:24,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


997it [41:27,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


998it [41:30,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


999it [41:32,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])
训练损失为1.3513242350220662
春风摇荡客，渭水分櫂游。野态吴舟出，风恬楚岸低。离羣失落处，劒影及徐洲。有竹畬桃种，长芜啮钓头。苍鹰惊管荇，青翠碍江楼。石镜成枯蘂，蒲津遶邓舟。荷斑难自洗，藜藿且婴忧。麴俗樵潜问，斯言笔讵刲。团圆金玉点，懒缩旧千钩。间植成三境，荣荣敌一休。一生唯一萼，直习显中州。尖襜昏天水，甲燄满长钩。万媚藏铃室，千层如雾流。如何沧海上，一见赤眉休。
江南行客行不足，门前江水波如草。舟轻荷发相及莼，舟通月中有哺书。典纳右笔攲献诫，喧呼郑葛声啾啾。闻声不及贡氏租，高歌缓步冀宜驰。山川岂厌解枯蔓，世路聚散非非斯。鲁山豪儒束寇事，遂令诸谢官脱鼻旗辟。忆昔鄱阳道士吏，莫论主人五侯子。紫駞老莱乌欲飞，胡儿饮马泪如丝。傍中大酒不解惜，长忆老翁皆一枝。
花界人，骏马鞭，荅幽筋骨动胡襟。南国业雄孰不得，闲居乐礼金门册。下士何尝驻茅茨，其公不乐主妻夫。少年百篇不复弃，心力并地非交亲。兄弟十年无外觅，眼看人，便纷纷。夜来风里梳舒放，日月照君君莫整。君心谓之不得何，道在兴亡譬中白。昔日怀仁每被伸，报恩至命如飞出。吾知醉后守清灵，此时焉及平生年。昨日江湖才子年，还应赋出颍阳篇。
朝光飞阊池，粲据金华池。高高光素晦，色霭笼琼除。中巷无人开，中路延美词。宛宛御宫君，煌煌列蓬莱。沈贞适尹闱，恭荐不可窥。起则神与祸，答和保元微。金石徒自贵，蟠玉谁与夷。对此时有赠，时哉昔所为。盛哉在春闱，三载谢希规。猜醉心自悲，升腾况追依。击筑黄鹤至，从扬东风吹。乃知清阴销，独坐或闻疑。自勒不可逃，稔悲火霏霏。安筌极其境，万室空欣期。
秋天瑟瑟夜沈机，翡翠笼烟玉蕴吹。阆苑英雄初降律，羣孙骥乐俨成丝。十陈杀德明时力，王主千官得请持。玉焰朝昏连焰落，铜壺夜坐走江旗。夫君一奏邯郸妇，负米还成赵使师。虞使王侯拥长绶，簿书征宿后康旗。昔年曾见哥沽局，今日先过李右讴。昔日霍亲名最重，乐平专被岁宵违。不知见说泾州隐，一夜一声山陇头。
月明江头江亭，落帆行雨咽。谁在楚王家，舟生骋缾逸。遥和龙山下，极目心且恻。宛无波涛际，始辨江湖丽。雄声压灵耳，烟浪随波水。方知适意便，奔放风波役。万日乘兴归，故人了无益。风云感良俗，日月思巖谷。今日空旧游，君心寄巴楚。猿啼月明月，夕落风声远。入口烟火收，入云行自足。林下人尝栗，风清鹤齐跼

1000it [41:40,  4.08s/it]

夜梦神州最，应缘此外情。惯临下堵路，不到斗牛声。影逼初惊雨，声繁彻晚声。闲将心猛猛，休教女儿名。败血浑成血，烧蛾欲有缨。忘忧为昨日，呜咽別连年。此好声吾我，凄凉耳甚清。放慵多擘点，怪日一投铛。故事烦师笑，淹留別里成。青云难换烛，明月更随缘。拔甃频看黑，封书不偶然。準应知尔恶，万事在羲然。可以烦贻分，何愁动舜篇。
torch.Size([124, 16]) torch.Size([1984])


1001it [41:42,  3.58s/it]

torch.Size([124, 16]) torch.Size([1984])


1002it [41:45,  3.25s/it]

torch.Size([124, 16]) torch.Size([1984])


1003it [41:47,  3.00s/it]

torch.Size([124, 16]) torch.Size([1984])


1004it [41:50,  2.85s/it]

torch.Size([124, 16]) torch.Size([1984])


1005it [41:52,  2.76s/it]

torch.Size([124, 16]) torch.Size([1984])


1006it [41:55,  2.68s/it]

torch.Size([124, 16]) torch.Size([1984])


1007it [41:57,  2.61s/it]

torch.Size([124, 16]) torch.Size([1984])


1008it [42:00,  2.62s/it]

torch.Size([124, 16]) torch.Size([1984])


1009it [42:02,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


1010it [42:05,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1011it [42:07,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1012it [42:10,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1013it [42:12,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1014it [42:15,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1015it [42:17,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1016it [42:20,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1017it [42:22,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1018it [42:24,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1019it [42:27,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1020it [42:29,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1021it [42:32,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1022it [42:34,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1023it [42:37,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1024it [42:39,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1025it [42:42,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1026it [42:44,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1027it [42:47,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1028it [42:50,  2.65s/it]

torch.Size([124, 16]) torch.Size([1984])


1029it [42:52,  2.62s/it]

torch.Size([124, 16]) torch.Size([1984])


1030it [42:55,  2.62s/it]

torch.Size([124, 16]) torch.Size([1984])


1031it [42:58,  2.67s/it]

torch.Size([124, 16]) torch.Size([1984])


1032it [43:00,  2.61s/it]

torch.Size([124, 16]) torch.Size([1984])


1033it [43:03,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


1034it [43:05,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


1035it [43:08,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


1036it [43:10,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1037it [43:13,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1038it [43:15,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1039it [43:18,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1040it [43:20,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1041it [43:22,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1042it [43:25,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1043it [43:27,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1044it [43:30,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1045it [43:32,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1046it [43:35,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1047it [43:37,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1048it [43:40,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1049it [43:42,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1050it [43:45,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1051it [43:47,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


1052it [43:50,  2.63s/it]

torch.Size([124, 16]) torch.Size([1984])


1053it [43:53,  2.62s/it]

torch.Size([124, 16]) torch.Size([1984])


1054it [43:55,  2.60s/it]

torch.Size([124, 16]) torch.Size([1984])


1055it [43:58,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


1056it [44:00,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1057it [44:03,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1058it [44:06,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


1059it [44:08,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1060it [44:11,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1061it [44:13,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1062it [44:16,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1063it [44:18,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1064it [44:20,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1065it [44:23,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1066it [44:25,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1067it [44:28,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1068it [44:30,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1069it [44:33,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1070it [44:35,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1071it [44:38,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1072it [44:40,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1073it [44:43,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1074it [44:45,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1075it [44:48,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1076it [44:51,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1077it [44:53,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


1078it [44:56,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1079it [44:58,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1080it [45:01,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


1081it [45:03,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


1082it [45:06,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


1083it [45:08,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


1084it [45:11,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1085it [45:14,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1086it [45:16,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1087it [45:19,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1088it [45:21,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1089it [45:24,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


1090it [45:26,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1091it [45:29,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


1092it [45:31,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1093it [45:34,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1094it [45:36,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1095it [45:39,  2.60s/it]

torch.Size([124, 16]) torch.Size([1984])


1096it [45:42,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


1097it [45:44,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1098it [45:46,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1099it [45:49,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1100it [45:51,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1101it [45:54,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1102it [45:56,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1103it [45:59,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1104it [46:01,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1105it [46:04,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1106it [46:06,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1107it [46:09,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1108it [46:11,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1109it [46:13,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1110it [46:16,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1111it [46:18,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1112it [46:21,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1113it [46:23,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1114it [46:26,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1115it [46:28,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1116it [46:31,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1117it [46:33,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1118it [46:36,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1119it [46:38,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1120it [46:41,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1121it [46:43,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1122it [46:46,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1123it [46:48,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1124it [46:50,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1125it [46:53,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1126it [46:55,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1127it [46:58,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1128it [47:00,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1129it [47:03,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1130it [47:05,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1131it [47:08,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1132it [47:10,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1133it [47:13,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1134it [47:15,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1135it [47:17,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1136it [47:20,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1137it [47:22,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1138it [47:25,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1139it [47:27,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1140it [47:30,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1141it [47:32,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1142it [47:35,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1143it [47:37,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1144it [47:39,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1145it [47:42,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1146it [47:44,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1147it [47:47,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1148it [47:49,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


1149it [47:51,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


1150it [47:54,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1151it [47:56,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1152it [47:59,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1153it [48:02,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1154it [48:04,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1155it [48:06,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1156it [48:09,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1157it [48:12,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1158it [48:14,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1159it [48:17,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1160it [48:19,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1161it [48:22,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1162it [48:24,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1163it [48:27,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1164it [48:29,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1165it [48:32,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1166it [48:34,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1167it [48:36,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1168it [48:39,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1169it [48:41,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1170it [48:44,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1171it [48:47,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1172it [48:49,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1173it [48:52,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1174it [48:54,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1175it [48:57,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1176it [48:59,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


1177it [49:02,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1178it [49:04,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


1179it [49:07,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1180it [49:09,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1181it [49:12,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1182it [49:14,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1183it [49:17,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1184it [49:19,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1185it [49:22,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1186it [49:25,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


1187it [49:27,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


1188it [49:30,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


1189it [49:32,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


1190it [49:35,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1191it [49:37,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1192it [49:40,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1193it [49:42,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1194it [49:44,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1195it [49:47,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1196it [49:49,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1197it [49:52,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1198it [49:54,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1199it [49:57,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])
训练损失为1.3922523351013647
春风摇荡客，拂日开虚扉。余芳与春草，青翠满园墀。刘尹官仍重，淇东俗幸迟。种花移上院，扫竹待新诗。爰涤江州侣，难逢宦別期。山通天竺僻，水隔越亭迟。別业曾辞本，行人自不疑。云门唯是挹，郡乙亦全奇。点检金门酒，惭资玉馔碑。常山云外竹，不忘一般碑。溪水连乡市，烟萝接舶祠。陟冈秋更晚，茶稼少春时。旧柏秋声少，邦郊数鸽危。那堪出尘虑，暂喜有时期。
江南矜论事兮文柄钱，刘安敬「奏汝边。夜女寡，唯见之，膏中死，瘴水银错森森森沈壮。开关欲尽何处说，但恐古松闻者畅。念君一何迫迁叠秦句窄，拄历庐山好偏古。我闻古人与客辈，子孙苦相埋沙水。恍惚险，无转骨。草荒松兮作路者，次揖七十之相忆。上有余杭骨与熟，自有龙泉不足濯。汝而不用长生人，耳中之号声震峋。有我一双觜子，彻于石而与手绝水文。含虚叶上雪中雪，豁以珠於山下云。或似天公使人怪，心如电激成寒文。君不见此
花萼杂花灼，花妓仕林幽。果落青山色，歌咏白云游。地肺疑祕像，荷锸抱笼舟。禊饮山木满，啸闻泉壑幽。召厕怀天藻，外使自淹留。旧井吟云马，前旌被鼓鼙。萧条下水北，淼淼望平流。岸上垂杨女，乌前长试讴。风流忽有赠，山海异游州。今日方长恸，行看万里州。山边带雨降，见见愁人愁。讬心有知音，战贼悲去头。胡为不得去，冉冉去田畴。畴昔崔谷人，邹门垂四愁。歌声促绿水，昔日泣青油。具后庙仙赠，数篇书独留。寄书同玉齿，此意
朝发淇水边，百花发青水。东风吹海雨，洞庭波浪阔。离披束锦缆，轻涟曳罗幕。忽觉西园拆，千年菊花发。梅花夹成水，红烛泻回雪。蕙柳半参差，叶栖花未开。烟深含怨践，石面厌清凉。珠翠兼香炷，䴔䴖碎网墙。总填池上酌，拢梭若趁钗。鱼龙动乳水，欹磴开银光。倒影迷船入，香香出洞房。回眸不可极，长恨惜春光。
秋天月，落浣田，凜视庚。风吹嫩，蛟龙鳞，烘竹枯槁人筋磨。怜君不知何所系，酒肉拜弟是生死。一人一回得此身，地人一回一回死。巍巍象地八十重，熊虎堆星专左尧。观机贼世乱如骨，骨肉射雕不肯死。劝君不得意气羸，我令天杀亦如斯。君但不闻人笑怪，鸟啼一事桑间噎。我愿两翁与邻女，走下嚼金翁有敌。男女男女嫁女母，母子不如嘱木肉。而今不独看桃蘂，勿令精华竟何益。江公大婆白玉浆，夜吐丹青水金碧。空闻汉水生万人，再挽梁王
月出石稜稜，云开上崇郡。舟航鼓鼙举，

1200it [50:04,  4.03s/it]

夜色在秋堂，清昼悲北堂。秋风动河汉，辇路转相望。回鴈通檐墟，夜见江上梁。去依湘水曲，夕泊东吴乡。九疑望中路，几度落星光。枕上曙光动，野中荷木香。朔风吹楚塞，大斾郁琱樯。总是平生意，俄然感旧场。迢迢沙塞日，奔走马扬尘。孟月正归去，黄云西日直。何时此思年，曾作平津角。自知身不死，飜思荆州墓。奈何不见时，非妾苦顦顇。幸乏新宠新，泰洗成灰束。结交一笑恩，不如猜妇主。
torch.Size([124, 16]) torch.Size([1984])


1201it [50:07,  3.55s/it]

torch.Size([124, 16]) torch.Size([1984])


1202it [50:09,  3.22s/it]

torch.Size([124, 16]) torch.Size([1984])


1203it [50:12,  2.98s/it]

torch.Size([124, 16]) torch.Size([1984])


1204it [50:14,  2.83s/it]

torch.Size([124, 16]) torch.Size([1984])


1205it [50:17,  2.78s/it]

torch.Size([124, 16]) torch.Size([1984])


1206it [50:19,  2.70s/it]

torch.Size([124, 16]) torch.Size([1984])


1207it [50:22,  2.63s/it]

torch.Size([124, 16]) torch.Size([1984])


1208it [50:24,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


1209it [50:27,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


1210it [50:29,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1211it [50:32,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1212it [50:34,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1213it [50:37,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1214it [50:39,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1215it [50:42,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1216it [50:44,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1217it [50:47,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1218it [50:49,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1219it [50:52,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1220it [50:54,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1221it [50:57,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1222it [50:59,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1223it [51:02,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1224it [51:04,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1225it [51:07,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


1226it [51:09,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


1227it [51:12,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


1228it [51:14,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1229it [51:17,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1230it [51:19,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1231it [51:22,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1232it [51:24,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1233it [51:27,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1234it [51:29,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1235it [51:32,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1236it [51:34,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1237it [51:36,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1238it [51:39,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1239it [51:41,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1240it [51:44,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1241it [51:46,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1242it [51:49,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1243it [51:51,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1244it [51:54,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1245it [51:56,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1246it [51:58,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1247it [52:01,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1248it [52:03,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1249it [52:06,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1250it [52:08,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1251it [52:11,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1252it [52:13,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1253it [52:16,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1254it [52:18,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1255it [52:21,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1256it [52:23,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1257it [52:26,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1258it [52:28,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1259it [52:31,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1260it [52:33,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1261it [52:36,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1262it [52:38,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1263it [52:40,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1264it [52:43,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1265it [52:45,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1266it [52:48,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1267it [52:50,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1268it [52:52,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


1269it [52:55,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1270it [52:57,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1271it [53:00,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1272it [53:02,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1273it [53:05,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1274it [53:07,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1275it [53:10,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1276it [53:12,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1277it [53:15,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1278it [53:17,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1279it [53:19,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1280it [53:22,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1281it [53:24,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1282it [53:27,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1283it [53:29,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1284it [53:32,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1285it [53:34,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1286it [53:37,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1287it [53:39,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1288it [53:42,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1289it [53:44,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1290it [53:47,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1291it [53:49,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1292it [53:52,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1293it [53:54,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1294it [53:57,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1295it [53:59,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1296it [54:01,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


1297it [54:04,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


1298it [54:06,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


1299it [54:08,  2.37s/it]

torch.Size([124, 16]) torch.Size([1984])


1300it [54:11,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


1301it [54:13,  2.37s/it]

torch.Size([124, 16]) torch.Size([1984])


1302it [54:15,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


1303it [54:18,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


1304it [54:20,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


1305it [54:23,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1306it [54:25,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1307it [54:28,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1308it [54:30,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1309it [54:33,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1310it [54:35,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1311it [54:37,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1312it [54:40,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1313it [54:42,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1314it [54:45,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1315it [54:47,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1316it [54:50,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1317it [54:52,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1318it [54:55,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


1319it [54:58,  2.60s/it]

torch.Size([124, 16]) torch.Size([1984])


1320it [55:00,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


1321it [55:03,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


1322it [55:06,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


1323it [55:08,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


1324it [55:11,  2.60s/it]

torch.Size([124, 16]) torch.Size([1984])


1325it [55:13,  2.60s/it]

torch.Size([124, 16]) torch.Size([1984])


1326it [55:16,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


1327it [55:19,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


1328it [55:21,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


1329it [55:24,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1330it [55:26,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


1331it [55:29,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


1332it [55:31,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


1333it [55:34,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


1334it [55:36,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1335it [55:39,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1336it [55:41,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1337it [55:44,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1338it [55:47,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


1339it [55:49,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


1340it [55:52,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1341it [55:54,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1342it [55:57,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1343it [55:59,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1344it [56:01,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1345it [56:04,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1346it [56:06,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1347it [56:09,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1348it [56:11,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1349it [56:14,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1350it [56:16,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1351it [56:19,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1352it [56:21,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1353it [56:24,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1354it [56:26,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1355it [56:29,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1356it [56:31,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1357it [56:34,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1358it [56:36,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


1359it [56:39,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


1360it [56:41,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1361it [56:44,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1362it [56:46,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1363it [56:49,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1364it [56:51,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


1365it [56:53,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1366it [56:56,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1367it [56:59,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1368it [57:01,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1369it [57:03,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1370it [57:06,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1371it [57:08,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1372it [57:11,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1373it [57:13,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1374it [57:16,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


1375it [57:19,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


1376it [57:21,  2.63s/it]

torch.Size([124, 16]) torch.Size([1984])


1377it [57:24,  2.63s/it]

torch.Size([124, 16]) torch.Size([1984])


1378it [57:26,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


1379it [57:29,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1380it [57:31,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1381it [57:34,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1382it [57:36,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1383it [57:39,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1384it [57:41,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1385it [57:44,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1386it [57:46,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1387it [57:49,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1388it [57:51,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1389it [57:53,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1390it [57:56,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1391it [57:58,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1392it [58:01,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1393it [58:03,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1394it [58:06,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1395it [58:08,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1396it [58:11,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1397it [58:13,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1398it [58:16,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1399it [58:18,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])
训练损失为1.4299229754294642
春风吹露草，青门对白杨。散雪先生柳，含露秀如苔。吴州十月后，越江如万艘。波涛若成黑，风俗互相依。白鸟飞孤轩，孤烟生四垓。荷带不潇洒，鱼娘亦慷洄。五具不可应，六雏互安摧。峡人梦何有，良会殊未回。萧萧柳气高，车汙无由来。色换一团扇，声声不自猜。砥行如泥汗，筋力如衰灰。饥儿醉复醉，起醉不复开。不展雀罗爵，新雏紫带开。不知此地者，为乐如死灰。
江上风暖歌草浮，君游五十无所为。少君结束慰远思，终日风流无所疑。我有一书抱琴瑟，美酒无人皆雀食。前儿啄粟头上头，因我向城有深愁。妻子来时不得语，春风日日相思啼。奈今今年是何许，随鹿焉得便无由。大之一瓢聊一失，一人复醉千载愁。我今此別为客苦，今日君生绸大丘。
花界无生地，慈宫有好人。心怀古舜则，诛拟一家真。汲乱尝今事，焚香旧几人。印林全偃落，松竹暗斜春。雪桧缘行秀，山苗可赏贫。烟花连户合，烟霭绕篱隣。断弁寒仍嫩，连泉冻更新。连瓯背鴈鹜，远寺入前邻。僧得何由著，经行不见春。呼鸡闻苦吹，看语好儿巡。墙近教安稳，逍遥不可驯。看山杂杨叶，来驾采成神。渐透阴阳照，孤愁净不匀。只愿千年后，荣教似要伸。
朝廷厌世乱，历世一斋登。服水凌云碧，甘泉溢桂苗。气圆回阁迥，景气过窗高。玉珮凝何异，金纲有不牢。又如炎瘴契，更进古风调。帝子思凭列，天文被会操。冯夷逾昼简，鲁国训为蛇。箧杂垂金钺，恩褒奏玉华。百壺朝玉陛，五灶发雕梁。斜苑疑宫燄，祥烟聚几双。恐言张筦琢，宁惜谏书单。兰芷摇斜影，金蝉续少桨。筌疲泉脉转，雪转阶墀。极境方澄起，游关自望赊。无人知得意，一夕一枝芳。
秋风歘吸吸明箭，击汗击稜轰细萤。豪豪愤足各自起，豪友如何如帝生。河边少有平安日，曾骑金鞭照瀚海。丁丁天仗欺早来，骏马连鞭来速毕。铁头鞭马控如云，照马低头照江上。拔鳞冲，正杀生，出将斫浪入两指。三峡空流四海清，胡兵合入阴丘变。一日横行万里追，戚中流胡五十万。人人尽说汉家求，势甲火德如泥锥。昨日祈君归奏罢，余颜一局何时入。惆怅长河万重烽，长沙万里何人哉。青山万里不可测，胡天不鸣蛟玉毛。
月界三伏尘，秋斋三十旬。饥鸣漏虫堕，病起语亦新。低涧穿半蜩，缘榛转苍榛。人生勤苦肠，誓岂钻虫羶。大贤不容洁，教使瞋道身。藜藿旷安寝，废坟颜果赐。牵年面万丈，置盏看新栗。白马胡马头，摧摧白露蠹

1400it [58:25,  3.75s/it]

夜梦神州宫，昨夜真仙尉。君今在鸡鸣，闻音不可越。但得山僧语，不觉夜永永。夜长哭嘤嘤，必解弹织足。况是古人情，不然长相忆。眼痛换明镜，秋堂已移隙。家酝冬夜澜，不如不如物。胡为苦不谐，犹记君子耳。那如南山疾，此意皆云覆。吾知今古人，损之颇变易。何用不平缘，一字便成寐。日暮两三人，裴回一灯酒。蝴弦一会时，不如两翁忆。
torch.Size([124, 16]) torch.Size([1984])


1401it [58:27,  3.32s/it]

torch.Size([124, 16]) torch.Size([1984])


1402it [58:30,  3.04s/it]

torch.Size([124, 16]) torch.Size([1984])


1403it [58:32,  2.82s/it]

torch.Size([124, 16]) torch.Size([1984])


1404it [58:34,  2.68s/it]

torch.Size([124, 16]) torch.Size([1984])


1405it [58:37,  2.61s/it]

torch.Size([124, 16]) torch.Size([1984])


1406it [58:39,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1407it [58:41,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1408it [58:44,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1409it [58:46,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1410it [58:49,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1411it [58:51,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1412it [58:53,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1413it [58:56,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1414it [58:58,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1415it [59:01,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1416it [59:03,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1417it [59:06,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1418it [59:08,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1419it [59:11,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1420it [59:13,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1421it [59:16,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1422it [59:18,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1423it [59:21,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1424it [59:23,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1425it [59:25,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1426it [59:28,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1427it [59:30,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1428it [59:33,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1429it [59:35,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1430it [59:38,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1431it [59:40,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1432it [59:43,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1433it [59:45,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1434it [59:47,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1435it [59:50,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1436it [59:52,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1437it [59:55,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1438it [59:57,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1439it [1:00:00,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1440it [1:00:02,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1441it [1:00:05,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1442it [1:00:07,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1443it [1:00:10,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1444it [1:00:12,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1445it [1:00:15,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1446it [1:00:17,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1447it [1:00:20,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1448it [1:00:22,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1449it [1:00:25,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1450it [1:00:27,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1451it [1:00:30,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1452it [1:00:32,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


1453it [1:00:34,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


1454it [1:00:37,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


1455it [1:00:39,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


1456it [1:00:42,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1457it [1:00:44,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1458it [1:00:46,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1459it [1:00:49,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


1460it [1:00:51,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1461it [1:00:54,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1462it [1:00:56,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


1463it [1:00:58,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1464it [1:01:01,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1465it [1:01:04,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1466it [1:01:06,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1467it [1:01:08,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1468it [1:01:11,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1469it [1:01:13,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1470it [1:01:16,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1471it [1:01:18,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1472it [1:01:21,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1473it [1:01:23,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1474it [1:01:26,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1475it [1:01:28,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1476it [1:01:31,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1477it [1:01:33,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1478it [1:01:36,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1479it [1:01:38,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1480it [1:01:41,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1481it [1:01:43,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1482it [1:01:46,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


1483it [1:01:48,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1484it [1:01:50,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1485it [1:01:53,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1486it [1:01:55,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


1487it [1:01:58,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


1488it [1:02:00,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1489it [1:02:03,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1490it [1:02:05,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1491it [1:02:07,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1492it [1:02:10,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1493it [1:02:12,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1494it [1:02:15,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1495it [1:02:17,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1496it [1:02:19,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


1497it [1:02:22,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


1498it [1:02:24,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1499it [1:02:27,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1500it [1:02:30,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1501it [1:02:32,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1502it [1:02:34,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1503it [1:02:37,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1504it [1:02:39,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1505it [1:02:42,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1506it [1:02:44,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1507it [1:02:47,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1508it [1:02:49,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


1509it [1:02:51,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1510it [1:02:54,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1511it [1:02:56,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1512it [1:02:59,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1513it [1:03:01,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1514it [1:03:04,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1515it [1:03:06,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1516it [1:03:09,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1517it [1:03:11,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1518it [1:03:14,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1519it [1:03:16,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1520it [1:03:19,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1521it [1:03:21,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1522it [1:03:24,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1523it [1:03:26,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


1524it [1:03:28,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


1525it [1:03:31,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


1526it [1:03:33,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


1527it [1:03:36,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1528it [1:03:38,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1529it [1:03:41,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


1530it [1:03:43,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


1531it [1:03:45,  2.34s/it]

torch.Size([124, 16]) torch.Size([1984])


1532it [1:03:47,  2.34s/it]

torch.Size([124, 16]) torch.Size([1984])


1533it [1:03:50,  2.34s/it]

torch.Size([124, 16]) torch.Size([1984])


1534it [1:03:52,  2.33s/it]

torch.Size([124, 16]) torch.Size([1984])


1535it [1:03:55,  2.36s/it]

torch.Size([124, 16]) torch.Size([1984])


1536it [1:03:57,  2.35s/it]

torch.Size([124, 16]) torch.Size([1984])


1537it [1:03:59,  2.34s/it]

torch.Size([124, 16]) torch.Size([1984])


1538it [1:04:01,  2.33s/it]

torch.Size([124, 16]) torch.Size([1984])


1539it [1:04:04,  2.33s/it]

torch.Size([124, 16]) torch.Size([1984])


1540it [1:04:06,  2.32s/it]

torch.Size([124, 16]) torch.Size([1984])


1541it [1:04:09,  2.35s/it]

torch.Size([124, 16]) torch.Size([1984])


1542it [1:04:11,  2.33s/it]

torch.Size([124, 16]) torch.Size([1984])


1543it [1:04:13,  2.31s/it]

torch.Size([124, 16]) torch.Size([1984])


1544it [1:04:15,  2.32s/it]

torch.Size([124, 16]) torch.Size([1984])


1545it [1:04:18,  2.31s/it]

torch.Size([124, 16]) torch.Size([1984])


1546it [1:04:20,  2.30s/it]

torch.Size([124, 16]) torch.Size([1984])


1547it [1:04:22,  2.31s/it]

torch.Size([124, 16]) torch.Size([1984])


1548it [1:04:25,  2.32s/it]

torch.Size([124, 16]) torch.Size([1984])


1549it [1:04:27,  2.32s/it]

torch.Size([124, 16]) torch.Size([1984])


1550it [1:04:29,  2.31s/it]

torch.Size([124, 16]) torch.Size([1984])


1551it [1:04:32,  2.32s/it]

torch.Size([124, 16]) torch.Size([1984])


1552it [1:04:34,  2.30s/it]

torch.Size([124, 16]) torch.Size([1984])


1553it [1:04:36,  2.31s/it]

torch.Size([124, 16]) torch.Size([1984])


1554it [1:04:39,  2.31s/it]

torch.Size([124, 16]) torch.Size([1984])


1555it [1:04:41,  2.33s/it]

torch.Size([124, 16]) torch.Size([1984])


1556it [1:04:43,  2.31s/it]

torch.Size([124, 16]) torch.Size([1984])


1557it [1:04:45,  2.31s/it]

torch.Size([124, 16]) torch.Size([1984])


1558it [1:04:48,  2.33s/it]

torch.Size([124, 16]) torch.Size([1984])


1559it [1:04:50,  2.36s/it]

torch.Size([124, 16]) torch.Size([1984])


1560it [1:04:53,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


1561it [1:04:55,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


1562it [1:04:57,  2.35s/it]

torch.Size([124, 16]) torch.Size([1984])


1563it [1:05:00,  2.36s/it]

torch.Size([124, 16]) torch.Size([1984])


1564it [1:05:02,  2.35s/it]

torch.Size([124, 16]) torch.Size([1984])


1565it [1:05:04,  2.37s/it]

torch.Size([124, 16]) torch.Size([1984])


1566it [1:05:07,  2.37s/it]

torch.Size([124, 16]) torch.Size([1984])


1567it [1:05:09,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


1568it [1:05:12,  2.37s/it]

torch.Size([124, 16]) torch.Size([1984])


1569it [1:05:14,  2.35s/it]

torch.Size([124, 16]) torch.Size([1984])


1570it [1:05:16,  2.37s/it]

torch.Size([124, 16]) torch.Size([1984])


1571it [1:05:19,  2.35s/it]

torch.Size([124, 16]) torch.Size([1984])


1572it [1:05:21,  2.35s/it]

torch.Size([124, 16]) torch.Size([1984])


1573it [1:05:23,  2.36s/it]

torch.Size([124, 16]) torch.Size([1984])


1574it [1:05:26,  2.36s/it]

torch.Size([124, 16]) torch.Size([1984])


1575it [1:05:28,  2.37s/it]

torch.Size([124, 16]) torch.Size([1984])


1576it [1:05:30,  2.35s/it]

torch.Size([124, 16]) torch.Size([1984])


1577it [1:05:33,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


1578it [1:05:35,  2.35s/it]

torch.Size([124, 16]) torch.Size([1984])


1579it [1:05:37,  2.33s/it]

torch.Size([124, 16]) torch.Size([1984])


1580it [1:05:40,  2.35s/it]

torch.Size([124, 16]) torch.Size([1984])


1581it [1:05:42,  2.37s/it]

torch.Size([124, 16]) torch.Size([1984])


1582it [1:05:45,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


1583it [1:05:47,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


1584it [1:05:50,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


1585it [1:05:52,  2.37s/it]

torch.Size([124, 16]) torch.Size([1984])


1586it [1:05:54,  2.36s/it]

torch.Size([124, 16]) torch.Size([1984])


1587it [1:05:57,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


1588it [1:05:59,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


1589it [1:06:01,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


1590it [1:06:04,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


1591it [1:06:06,  2.34s/it]

torch.Size([124, 16]) torch.Size([1984])


1592it [1:06:08,  2.35s/it]

torch.Size([124, 16]) torch.Size([1984])


1593it [1:06:11,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


1594it [1:06:13,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


1595it [1:06:16,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


1596it [1:06:18,  2.37s/it]

torch.Size([124, 16]) torch.Size([1984])


1597it [1:06:20,  2.36s/it]

torch.Size([124, 16]) torch.Size([1984])


1598it [1:06:23,  2.36s/it]

torch.Size([124, 16]) torch.Size([1984])


1599it [1:06:25,  2.35s/it]

torch.Size([124, 16]) torch.Size([1984])
训练损失为1.4625453896448002
春光生百泽，凉日东南隅。如何渊元化，睠镇粲重都。按劒下层极，乘风飞上天。层台绝崇极，览日临周旋。旷望两世纷，翳蟠出冥冥。气声出巴海，色望回秦川。奠月忽降明，葳蕤鸣寒烟。回头独踟蹰，一只千万年。自从命盛服，岂如贤哲篇。岂愿抱其所，岂云保耆连。煌煌魂眇窅，昊夏夜凝天。愔蠁光摇湧，洪洪卒若旋。是为苍生地，安得千载便。
江上风热人，我行信邀別。北风飘高树，回塘风断续。惊回颠又多，屡觉戎幕早。遥思丞相阁，遥指吴江口。瘴雾侵夜深，行吟孤月里。徘徊出关望，露白寒杉碧。向夕泪空歌，云鬟起相唤。魂飞两不见，笑荅殊未短。目极远山攒，风悲远山破。坐憩白苹花，褭褭悲霜霰。从期戎幕下，独守荆州郭。白日无由来，东堂盛名意。所悲良有志，何必中门隔。谁言山泽情，不使此何极。
花界人何烦揖，翛忽乐兮无极。循斯兮可致，愿在梁皇帝二。三十六相合，六代八音王。十上未相甲，诸侯得相向。冉冉两成墟，颠狂鼓角天。鼓声搏众木，声消怒浪烟。骧贼坤沟渺然，小下汝沙边。坏脸漏淋齿，注得翡琅船。鬼魅不灵音，则有万卷钱。恒思婴孩啄，拗穿狼扶燃。飘然涉大漠，不战非路天。不凿拗嵌难，背出蚌玲珑。此胎既有人，根同何处寻。
朝游多搆地，夜夜吟风鼓。江南人不归，客在迹连试。羁愁不自适，泪滴复滴泪。遥携青壁头，独步高僧吏。松筠两三竹，竹竹深如一。嵩室互相夸，茅茨期讵早。敝庐时徙下，岚色堪萧索。扣薪从宇宙，避缴倦秋暮。南择有知龙，彼何地皆委。山公永寂寞，台室环万岱。运稅谅难安，中原亦反寂。鱼跳竟不辍，麋鹿聊自谕。目落有时游，空思失心域。
秋天杳茫茫，夜夜百虑瘦。可能徇安得，坐在青松色。手持青莲坡，身是白云叟。冥心与凡客，何暇不作齿。下自嵇大韦，清净无异益。物王不自守，余生当自骂。雷落天宇增，龙飞世间一。苍苍八月大，隐视无四极。绵緜有大想，乃成太行路。藉兽犹未终，升吾岂相待？泪流还可解，鸞凤俄可望。杳杳随波流，腾腾出尘际。四句同一心，万虑俱销魄。唯当得无知，寻识心情里。
月出卯，立浣发，仰见浊醪亦病。半一半，杯里足。今朝见月元月生，月如照耀月明里。天子畏，牵人歌。夫子中，敲马尾。珊瑚未寒，如有杯中有冰床。冀天下车进贤公，我家裴回君上揖。天符不足后宫星，吾我独有威仪別。


1600it [1:06:32,  3.61s/it]

夜色递开短，凉风何嫋零。舟舟既稍发，潭色亦可适。将军汉主君，挟劒如白玉。前负谢安久，前逢征侠初。从容不再得，此君何所须？扪枥向白云，采桑坐何处？山寺半晴阳，金铙照江水。三桮自相忆，却忆不见面。好醉能有人，心中不容索。如今见何物，岂复闻鹧鸪。倏忽见荆州，咸期北门隔。徒伤年宪残，仁安迹何足。何日为客言，子生一枝喻。
torch.Size([124, 16]) torch.Size([1984])


1601it [1:06:34,  3.23s/it]

torch.Size([124, 16]) torch.Size([1984])


1602it [1:06:36,  2.97s/it]

torch.Size([124, 16]) torch.Size([1984])


1603it [1:06:39,  2.79s/it]

torch.Size([124, 16]) torch.Size([1984])


1604it [1:06:41,  2.69s/it]

torch.Size([124, 16]) torch.Size([1984])


1605it [1:06:43,  2.61s/it]

torch.Size([124, 16]) torch.Size([1984])


1606it [1:06:46,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


1607it [1:06:48,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1608it [1:06:51,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1609it [1:06:53,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1610it [1:06:56,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1611it [1:06:58,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1612it [1:07:01,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1613it [1:07:04,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


1614it [1:07:06,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


1615it [1:07:09,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


1616it [1:07:11,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1617it [1:07:13,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1618it [1:07:16,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


1619it [1:07:18,  2.37s/it]

torch.Size([124, 16]) torch.Size([1984])


1620it [1:07:20,  2.33s/it]

torch.Size([124, 16]) torch.Size([1984])


1621it [1:07:22,  2.34s/it]

torch.Size([124, 16]) torch.Size([1984])


1622it [1:07:25,  2.30s/it]

torch.Size([124, 16]) torch.Size([1984])


1623it [1:07:27,  2.29s/it]

torch.Size([124, 16]) torch.Size([1984])


1624it [1:07:29,  2.27s/it]

torch.Size([124, 16]) torch.Size([1984])


1625it [1:07:31,  2.27s/it]

torch.Size([124, 16]) torch.Size([1984])


1626it [1:07:34,  2.30s/it]

torch.Size([124, 16]) torch.Size([1984])


1627it [1:07:36,  2.34s/it]

torch.Size([124, 16]) torch.Size([1984])


1628it [1:07:39,  2.37s/it]

torch.Size([124, 16]) torch.Size([1984])


1629it [1:07:41,  2.36s/it]

torch.Size([124, 16]) torch.Size([1984])


1630it [1:07:43,  2.36s/it]

torch.Size([124, 16]) torch.Size([1984])


1631it [1:07:46,  2.36s/it]

torch.Size([124, 16]) torch.Size([1984])


1632it [1:07:48,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


1633it [1:07:51,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


1634it [1:07:53,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


1635it [1:07:55,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


1636it [1:07:58,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1637it [1:08:00,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1638it [1:08:03,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1639it [1:08:05,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1640it [1:08:08,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1641it [1:08:10,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1642it [1:08:13,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1643it [1:08:16,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1644it [1:08:18,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1645it [1:08:20,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1646it [1:08:23,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1647it [1:08:25,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1648it [1:08:28,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1649it [1:08:30,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1650it [1:08:33,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1651it [1:08:35,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1652it [1:08:38,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1653it [1:08:40,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1654it [1:08:43,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1655it [1:08:45,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1656it [1:08:47,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1657it [1:08:50,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1658it [1:08:52,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1659it [1:08:55,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1660it [1:08:57,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1661it [1:09:00,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1662it [1:09:02,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1663it [1:09:04,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1664it [1:09:07,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1665it [1:09:10,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1666it [1:09:12,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1667it [1:09:15,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1668it [1:09:17,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1669it [1:09:20,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1670it [1:09:22,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1671it [1:09:24,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1672it [1:09:27,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1673it [1:09:29,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1674it [1:09:32,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1675it [1:09:35,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1676it [1:09:37,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


1677it [1:09:40,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1678it [1:09:42,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1679it [1:09:45,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1680it [1:09:47,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1681it [1:09:49,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1682it [1:09:52,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1683it [1:09:54,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1684it [1:09:57,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1685it [1:09:59,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1686it [1:10:02,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1687it [1:10:04,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1688it [1:10:07,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1689it [1:10:09,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1690it [1:10:12,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1691it [1:10:14,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1692it [1:10:17,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1693it [1:10:19,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1694it [1:10:21,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1695it [1:10:24,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1696it [1:10:26,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1697it [1:10:29,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1698it [1:10:32,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1699it [1:10:34,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1700it [1:10:37,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1701it [1:10:39,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1702it [1:10:42,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1703it [1:10:44,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1704it [1:10:47,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1705it [1:10:49,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1706it [1:10:52,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1707it [1:10:54,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1708it [1:10:57,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1709it [1:10:59,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1710it [1:11:01,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1711it [1:11:04,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1712it [1:11:06,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1713it [1:11:09,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1714it [1:11:11,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1715it [1:11:14,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1716it [1:11:16,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1717it [1:11:19,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1718it [1:11:21,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1719it [1:11:24,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1720it [1:11:26,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1721it [1:11:29,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1722it [1:11:31,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1723it [1:11:34,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1724it [1:11:36,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1725it [1:11:39,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1726it [1:11:41,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1727it [1:11:44,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1728it [1:11:46,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1729it [1:11:49,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1730it [1:11:51,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1731it [1:11:54,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1732it [1:11:56,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1733it [1:11:59,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1734it [1:12:02,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1735it [1:12:04,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1736it [1:12:06,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1737it [1:12:09,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1738it [1:12:11,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1739it [1:12:14,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1740it [1:12:16,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1741it [1:12:19,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1742it [1:12:21,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1743it [1:12:24,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1744it [1:12:26,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1745it [1:12:28,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1746it [1:12:31,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1747it [1:12:33,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1748it [1:12:36,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1749it [1:12:38,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1750it [1:12:41,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1751it [1:12:43,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1752it [1:12:45,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1753it [1:12:48,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1754it [1:12:50,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1755it [1:12:53,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1756it [1:12:55,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1757it [1:12:58,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1758it [1:13:00,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1759it [1:13:03,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1760it [1:13:05,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1761it [1:13:08,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1762it [1:13:10,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1763it [1:13:13,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1764it [1:13:15,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1765it [1:13:18,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1766it [1:13:20,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1767it [1:13:23,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1768it [1:13:25,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1769it [1:13:28,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1770it [1:13:30,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1771it [1:13:33,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1772it [1:13:35,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1773it [1:13:38,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1774it [1:13:40,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1775it [1:13:42,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1776it [1:13:45,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1777it [1:13:47,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1778it [1:13:50,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1779it [1:13:52,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1780it [1:13:55,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1781it [1:13:57,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1782it [1:14:00,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1783it [1:14:02,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1784it [1:14:05,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1785it [1:14:07,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1786it [1:14:10,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1787it [1:14:12,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1788it [1:14:15,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1789it [1:14:17,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1790it [1:14:20,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1791it [1:14:22,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1792it [1:14:25,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1793it [1:14:27,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1794it [1:14:30,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1795it [1:14:32,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1796it [1:14:35,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


1797it [1:14:37,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1798it [1:14:40,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


1799it [1:14:42,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])
训练损失为1.4912432611319733
春风摇烟陌，槐叶满辰芒。春物变颜色，夜声飘舞家。葳蕤挂曙露，菡萏生晨光。凝露澹如坠，侵池露如塘。怳疑有遐旷，岂忘幽意芳。乍令幽抱久，似彼风罗裳。具言感俗态，岂谓为晶光。双阙当门序，玉女不能调。不与玉人赠，乃令朱庭傍。本是天地心，不为人网拘。惟闻粉成妙，可可比彤桑。龙驾定何讬，羽毛亦何伤。击鲸安可羨，远隔沧海长。
江上风热人不断，不能一日傍村老。念伊今夜与众木，一夜一直犹呜咽。不如目断谁问人，不谓君行不如手。一朝立举已十五，今日逢君常叹息。德貌兼为垢羽刀，文字才疎才未及。裴回十万马回头，身后错裁犹自吐。我而何事亦知贤。丈夫性外竟何足，弃取白头学小弟。或令吉诗使说闲，不知心爱在家心。
花界人兮镜如雪，君今至今君今道驰。第一君兮圣主所，能使我兮将何覩。及乎天之主妾母耶之中之有莫比。中汉之中不展君，阳之之妙不知冤。纵有一雨木於雪，君子夜夜独吹舒。月有两枝见巢尾，人间不见不能测。唯恐岁寒日迟迟，剖月濯汝潇湘波。黄叶自然木下死，巨吾不识神丹波。人人之方志有时，若不尽。
朝阳阙下悬杨棹，却忆伶郎系颜处。夜开月色当床前，悠悠野火生衣月。湘江白日明星恶，僮仆高眠出山路。蜂言碍水盘陀石，有客试来扫篱圃。粉笠霜黏染不成，银河月面如双影。宁知更有一枝桐，水精佛殿名无喧。山童历薄斸药钱热钱。镜中春雪眼何日，龙蛇寄语年年年。可怜不用探其卖，锥成造化身不停。却问李精锥宪巧，与君十载学长贤。他时果见李秋景，未必扈歌天上仙。
秋风歘吸吸月吸，霜如冰炭非膏滑。琉璃汗气生霜梧，剥摧木兰吹紫罗。卷帷掩映楼，焰焰如云灭。中林如电如有风，声若夜於月於云。孤高高标难耐覆，但有众动栖攀军。三边胡子妇不识，胡旋不言树寒兔。行者不御沟北流，不见天河月中尾。金河之下天地横，汉家重数无相营。风号神音耳咽兀，堂堂月下增嫌苦。昔人传行隸其人，孝子慈母称神亲。君能不知英强死，今人贳镜专分巾。楼下蛾眉一斗腐，枉看马上骄贵人。朝车竝将两曲随，胡儿夜坏
月出山阴明，照见青山明。烦赏共结类，得之谓何荣。翩翾大其壤，委立中天倾。骋然媚千里，照庑泻层明。吾游汝桃李，春生幼子精。平生白羽地，瞥与异姓名。点铁攒素光，飞腾撑虹茎。金虎衔镫底，赤龙鸣夜声。鬼神无穴魅，远近无纤生。填门不遭失，伍父安可轻。我何祛十方，浩荡

1800it [1:14:50,  3.95s/it]

夜梦身天湖水溢，一身行处相逢见。家家弟子能著鞭，将军骑尾生金驼。王孙留将主恩傥，我身一直还荆楚。我欲见李又知名，死生不得俱无情。君不见绮罗书里儿，使我骨肉自有髭。丈夫快步过万事，不及两日何时嗔。知君不及老大富，恶杀天下为欢琴。忽闻言行君调索，使君妇见才不如。莫言身长白骨改，不如蔓水公卿心。怕须读此身无事，百炼千金无主主。男儿长在他乡路，何许空房外来此。日夕悠悠一往还，麋鹿溺之无外事。吾闻古石老人言
torch.Size([124, 16]) torch.Size([1984])


1801it [1:14:52,  3.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1802it [1:14:54,  3.17s/it]

torch.Size([124, 16]) torch.Size([1984])


1803it [1:14:57,  2.94s/it]

torch.Size([124, 16]) torch.Size([1984])


1804it [1:14:59,  2.77s/it]

torch.Size([124, 16]) torch.Size([1984])


1805it [1:15:02,  2.69s/it]

torch.Size([124, 16]) torch.Size([1984])


1806it [1:15:04,  2.60s/it]

torch.Size([124, 16]) torch.Size([1984])


1807it [1:15:06,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1808it [1:15:09,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1809it [1:15:11,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1810it [1:15:14,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1811it [1:15:16,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1812it [1:15:19,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1813it [1:15:21,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1814it [1:15:24,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1815it [1:15:26,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1816it [1:15:29,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1817it [1:15:31,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1818it [1:15:34,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1819it [1:15:36,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1820it [1:15:39,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1821it [1:15:41,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1822it [1:15:44,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1823it [1:15:46,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1824it [1:15:49,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1825it [1:15:51,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1826it [1:15:54,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1827it [1:15:56,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1828it [1:15:59,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1829it [1:16:01,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1830it [1:16:04,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1831it [1:16:06,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1832it [1:16:09,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1833it [1:16:11,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1834it [1:16:14,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1835it [1:16:16,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1836it [1:16:19,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1837it [1:16:21,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1838it [1:16:24,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1839it [1:16:26,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1840it [1:16:29,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1841it [1:16:32,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


1842it [1:16:34,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


1843it [1:16:37,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


1844it [1:16:39,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


1845it [1:16:42,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1846it [1:16:44,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1847it [1:16:47,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1848it [1:16:49,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1849it [1:16:51,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1850it [1:16:54,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1851it [1:16:56,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1852it [1:16:59,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1853it [1:17:01,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1854it [1:17:04,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1855it [1:17:06,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1856it [1:17:09,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1857it [1:17:11,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1858it [1:17:14,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1859it [1:17:17,  2.60s/it]

torch.Size([124, 16]) torch.Size([1984])


1860it [1:17:19,  2.60s/it]

torch.Size([124, 16]) torch.Size([1984])


1861it [1:17:22,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


1862it [1:17:24,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


1863it [1:17:27,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1864it [1:17:29,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1865it [1:17:32,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1866it [1:17:34,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1867it [1:17:37,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1868it [1:17:39,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1869it [1:17:42,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1870it [1:17:44,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1871it [1:17:47,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1872it [1:17:49,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1873it [1:17:52,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1874it [1:17:54,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1875it [1:17:57,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1876it [1:17:59,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1877it [1:18:02,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


1878it [1:18:04,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1879it [1:18:07,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1880it [1:18:09,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1881it [1:18:12,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1882it [1:18:14,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1883it [1:18:17,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1884it [1:18:19,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1885it [1:18:22,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1886it [1:18:24,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1887it [1:18:27,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1888it [1:18:29,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


1889it [1:18:32,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1890it [1:18:34,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1891it [1:18:37,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1892it [1:18:39,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1893it [1:18:42,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1894it [1:18:44,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1895it [1:18:47,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1896it [1:18:49,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1897it [1:18:52,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1898it [1:18:54,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1899it [1:18:56,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1900it [1:18:59,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1901it [1:19:01,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1902it [1:19:04,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1903it [1:19:06,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1904it [1:19:09,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1905it [1:19:11,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1906it [1:19:14,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1907it [1:19:16,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1908it [1:19:19,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1909it [1:19:21,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1910it [1:19:24,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1911it [1:19:26,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1912it [1:19:28,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1913it [1:19:31,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1914it [1:19:33,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1915it [1:19:36,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1916it [1:19:38,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1917it [1:19:41,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1918it [1:19:43,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1919it [1:19:46,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1920it [1:19:48,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1921it [1:19:51,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1922it [1:19:53,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1923it [1:19:56,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1924it [1:19:58,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1925it [1:20:01,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1926it [1:20:03,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1927it [1:20:06,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1928it [1:20:08,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1929it [1:20:11,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1930it [1:20:13,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1931it [1:20:16,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1932it [1:20:18,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1933it [1:20:21,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1934it [1:20:23,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1935it [1:20:26,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1936it [1:20:28,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1937it [1:20:31,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1938it [1:20:33,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1939it [1:20:36,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1940it [1:20:38,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1941it [1:20:41,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


1942it [1:20:43,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1943it [1:20:46,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1944it [1:20:48,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1945it [1:20:50,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1946it [1:20:53,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1947it [1:20:55,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1948it [1:20:58,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1949it [1:21:00,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1950it [1:21:03,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1951it [1:21:05,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1952it [1:21:08,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1953it [1:21:10,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1954it [1:21:13,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1955it [1:21:15,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1956it [1:21:18,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1957it [1:21:20,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1958it [1:21:23,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1959it [1:21:25,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1960it [1:21:28,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1961it [1:21:30,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1962it [1:21:33,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1963it [1:21:35,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1964it [1:21:37,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1965it [1:21:40,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1966it [1:21:42,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1967it [1:21:45,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1968it [1:21:47,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1969it [1:21:50,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1970it [1:21:52,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1971it [1:21:55,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1972it [1:21:57,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1973it [1:22:00,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1974it [1:22:02,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1975it [1:22:05,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1976it [1:22:07,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1977it [1:22:09,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1978it [1:22:12,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1979it [1:22:14,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1980it [1:22:17,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1981it [1:22:19,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


1982it [1:22:22,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


1983it [1:22:24,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1984it [1:22:26,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


1985it [1:22:29,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


1986it [1:22:31,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


1987it [1:22:34,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1988it [1:22:36,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1989it [1:22:39,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1990it [1:22:41,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1991it [1:22:44,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


1992it [1:22:46,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


1993it [1:22:49,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1994it [1:22:51,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


1995it [1:22:54,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


1996it [1:22:56,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1997it [1:22:59,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


1998it [1:23:01,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


1999it [1:23:04,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])
训练损失为1.5165447815358606
春色徧渐远，凉光豔初新。幸与羣公游，所贵沅云人。云散日隐归，江山正新新。昔年病颜前，清洛桃李春。绿水荡別岸，青槐白发巾。我无济物心，乃是有目身。忽逢此中话，不愿天下人。豺狼被锋刃，可谓蒿莱薪。踟蹰恋天涯，鹤去不可攀。烟云为之別，一榻空崔嵬。明月晚归秦，松风邈苍苍。青山无不见，猨鸟自然惊。嶽鸟鸣远树，松门幽思生。
江陵通秋篠，山翠秀琉璃。奥洁古所好，丝桐释我能。遂令荣名难，一异颍阳僧。漆谈不足辨，遂为悲鸣欢。置俗日未厚，汲苔坐不援。事与时节阻，日与心事俱。榻为下郭卑，澡似新荷蔬。世情自寂寞，诗思视清澄。端居结遐迹，林籁幽贞欢。中夜促寝兴，虑清情屡牵。度尘讵再谢，此道方无偏。览罢幸兹夕，竟夕思我年。
花界年多少，黄衫死后偏。一州分旧物，千载骋前程。拔木和行骑，摩霞讶早星。月从徐鴈起，鹤逐晚风行。阃外蛮夷仰，山行礼武明。旱炎云雨霁，残月露楼明。劒路浮青气，幡场插白英。雨除山橘候，春入塞云明。刃断宽鲸队，琳容篆兕琤。摧藏知有补，雅极赖难倾。雀尾江堤变，鹰苏海峤明。摧黄鹦鹉鹢，斜退凤凰声。鬬惜书堂里，萦纡滴忆楹。心将尘本累，除病荷陶情。有论慙养质，从此污功名。
朝廷轨明祖，秀发鲁川良。六合冠盖古，万方瞻下行。焚香降从军，驰旅从孔军。陕岭色不入，谢安物或均。曝帐车马走，张书草木新。戟岭倚银阙，河乌拂平津。蹉跎不二老，车马日相亲。我自乘轩谒，却为尧仲秦。国云与时节，相见今已频。武帝猎谏猎，倜阑陵步嚬。我慙吕氏恩，慷慨寝原民。圣人配昭武，余德纵纵横。誓恳信子叹，日月赫自均。边事有谁问，何事稅功人。
秋风歘吸吹，芟画不敢干。臂牙如汗颈，日射如跳攒。始见山寸色，无间割天寒。潜腾火复迸，纤复如不盘。三毒曜曜开，万木相玲层。层延若平地，诸天镇其端。咄乃欧浑水，土木表清宽。修竹夹嵌空，酸挑百节残。扣乐哂神骨，焚弦思褊难。猛兽奔猛鬼，颠倒固为安。神威不足道，怯泰无哗哗。我愿神仙子，不知人魄腾。下士何所从，凉风满毫兰。雄雌驯驰心，不得随一盘。牵嘲问所愿，掉尾樵我寒。
月裴坐飞蓬鸣燕，凉风吹落空碧烟。玉珂零落秋山远，平王解佩如今年。忆昨逢春又相见，人间独有春冬千。白首十五自相识，纨手刻在数行船。或把山头蹋云母，钓竿不敢吹犀船。蛙裘欲落且放算，又不尽在一枝船。鲈鱼翁曹恣游

2000it [1:23:11,  3.80s/it]

夜梦劳师舍，来来安可安。三元登阁待，双履在林端。地入青山表，烟绵紫岭看。瓶陀藤带裹，滋径雪浮漫。老僧逾杖臂，缘屐看青龙。南过漆园岭，今来南固崇。丹崖尘世閟，白露冷牙冠。念往宁轻薄，非关脱辖衷。庾皇曾有武，方识霍垣安。突兀侵牛砾，兼添造象聋。旧房无旧窈，绝树是寒聋。愿得新诗否，题诗輙一从。
torch.Size([124, 16]) torch.Size([1984])


2001it [1:23:13,  3.36s/it]

torch.Size([124, 16]) torch.Size([1984])


2002it [1:23:15,  3.06s/it]

torch.Size([124, 16]) torch.Size([1984])


2003it [1:23:18,  2.84s/it]

torch.Size([124, 16]) torch.Size([1984])


2004it [1:23:20,  2.68s/it]

torch.Size([124, 16]) torch.Size([1984])


2005it [1:23:23,  2.66s/it]

torch.Size([124, 16]) torch.Size([1984])


2006it [1:23:25,  2.60s/it]

torch.Size([124, 16]) torch.Size([1984])


2007it [1:23:28,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


2008it [1:23:30,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2009it [1:23:32,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2010it [1:23:35,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2011it [1:23:37,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2012it [1:23:40,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2013it [1:23:42,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2014it [1:23:45,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2015it [1:23:47,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2016it [1:23:50,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2017it [1:23:52,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2018it [1:23:54,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2019it [1:23:57,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2020it [1:23:59,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2021it [1:24:02,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2022it [1:24:04,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2023it [1:24:07,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2024it [1:24:09,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2025it [1:24:12,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2026it [1:24:14,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


2027it [1:24:16,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2028it [1:24:19,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2029it [1:24:21,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2030it [1:24:24,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2031it [1:24:26,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


2032it [1:24:28,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


2033it [1:24:31,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2034it [1:24:33,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2035it [1:24:36,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


2036it [1:24:38,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


2037it [1:24:40,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


2038it [1:24:43,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


2039it [1:24:45,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


2040it [1:24:48,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


2041it [1:24:50,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2042it [1:24:53,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2043it [1:24:55,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


2044it [1:24:58,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


2045it [1:25:01,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


2046it [1:25:03,  2.60s/it]

torch.Size([124, 16]) torch.Size([1984])


2047it [1:25:06,  2.60s/it]

torch.Size([124, 16]) torch.Size([1984])


2048it [1:25:08,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


2049it [1:25:11,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2050it [1:25:13,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2051it [1:25:16,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2052it [1:25:18,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2053it [1:25:20,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2054it [1:25:23,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2055it [1:25:26,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2056it [1:25:28,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2057it [1:25:31,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2058it [1:25:33,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2059it [1:25:36,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2060it [1:25:38,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2061it [1:25:41,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2062it [1:25:43,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2063it [1:25:46,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2064it [1:25:48,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2065it [1:25:51,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2066it [1:25:53,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2067it [1:25:56,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2068it [1:25:58,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2069it [1:26:01,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2070it [1:26:03,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2071it [1:26:06,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2072it [1:26:08,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2073it [1:26:10,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2074it [1:26:13,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2075it [1:26:15,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2076it [1:26:18,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2077it [1:26:21,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2078it [1:26:23,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2079it [1:26:26,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2080it [1:26:28,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2081it [1:26:31,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


2082it [1:26:33,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2083it [1:26:35,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2084it [1:26:38,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2085it [1:26:40,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2086it [1:26:43,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2087it [1:26:45,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2088it [1:26:48,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2089it [1:26:50,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2090it [1:26:53,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2091it [1:26:55,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2092it [1:26:58,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2093it [1:27:00,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2094it [1:27:03,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2095it [1:27:05,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2096it [1:27:07,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2097it [1:27:10,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2098it [1:27:12,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2099it [1:27:15,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2100it [1:27:17,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2101it [1:27:20,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2102it [1:27:22,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2103it [1:27:24,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


2104it [1:27:27,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2105it [1:27:30,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2106it [1:27:32,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2107it [1:27:34,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2108it [1:27:37,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2109it [1:27:39,  2.37s/it]

torch.Size([124, 16]) torch.Size([1984])


2110it [1:27:41,  2.35s/it]

torch.Size([124, 16]) torch.Size([1984])


2111it [1:27:44,  2.34s/it]

torch.Size([124, 16]) torch.Size([1984])


2112it [1:27:46,  2.33s/it]

torch.Size([124, 16]) torch.Size([1984])


2113it [1:27:48,  2.33s/it]

torch.Size([124, 16]) torch.Size([1984])


2114it [1:27:51,  2.35s/it]

torch.Size([124, 16]) torch.Size([1984])


2115it [1:27:53,  2.37s/it]

torch.Size([124, 16]) torch.Size([1984])


2116it [1:27:56,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2117it [1:27:58,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2118it [1:28:00,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2119it [1:28:03,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2120it [1:28:05,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


2121it [1:28:08,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


2122it [1:28:10,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


2123it [1:28:12,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


2124it [1:28:15,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


2125it [1:28:17,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


2126it [1:28:19,  2.38s/it]

torch.Size([124, 16]) torch.Size([1984])


2127it [1:28:22,  2.37s/it]

torch.Size([124, 16]) torch.Size([1984])


2128it [1:28:24,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


2129it [1:28:27,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2130it [1:28:29,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2131it [1:28:32,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


2132it [1:28:34,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


2133it [1:28:36,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2134it [1:28:39,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2135it [1:28:41,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2136it [1:28:44,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2137it [1:28:46,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2138it [1:28:49,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2139it [1:28:51,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2140it [1:28:54,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2141it [1:28:56,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2142it [1:28:59,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2143it [1:29:01,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2144it [1:29:04,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2145it [1:29:06,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2146it [1:29:08,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2147it [1:29:11,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2148it [1:29:13,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2149it [1:29:16,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2150it [1:29:18,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2151it [1:29:21,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2152it [1:29:23,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2153it [1:29:26,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2154it [1:29:28,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


2155it [1:29:31,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


2156it [1:29:33,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2157it [1:29:36,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2158it [1:29:38,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2159it [1:29:41,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2160it [1:29:43,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2161it [1:29:46,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2162it [1:29:48,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2163it [1:29:51,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2164it [1:29:53,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2165it [1:29:56,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2166it [1:29:58,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2167it [1:30:01,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2168it [1:30:03,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2169it [1:30:06,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2170it [1:30:08,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2171it [1:30:10,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2172it [1:30:13,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2173it [1:30:15,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2174it [1:30:18,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2175it [1:30:20,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2176it [1:30:23,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2177it [1:30:25,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2178it [1:30:28,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2179it [1:30:30,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2180it [1:30:33,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2181it [1:30:35,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2182it [1:30:38,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2183it [1:30:40,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2184it [1:30:43,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2185it [1:30:45,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2186it [1:30:48,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2187it [1:30:50,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2188it [1:30:52,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2189it [1:30:55,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2190it [1:30:57,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2191it [1:31:00,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2192it [1:31:02,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2193it [1:31:05,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2194it [1:31:07,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2195it [1:31:09,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2196it [1:31:12,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


2197it [1:31:14,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2198it [1:31:17,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2199it [1:31:19,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])
训练损失为1.5396394640478221
春余州路晚，舟下湖常大。山上一百丈，豁与平生宅。风生斑篠丛，水壮丹穴雪。清晨垂两岸，落日泛孤掌。圆月吐如波，长河澄皎皎。石崖跻远极，凫雁参天造。云路上峰青，行人穷水甸。筠荧易成雪，摧折仍婀娜。昔果有提壺，聊烦戏不足。风云与水曲，奔厉无由赏。何意济时人，至今长在手。
江陵寻水颠狂始，意中博望瀛洲远。辛勤懽深古郢前，吴侯机府画为髠。东堂建隼征鸿至，千里青山连帝关。玉帐金炉无旧有，长裾野石驻妖音。春过战，上飞旗，身逐弓尘不相许。应是龙骧避地狼，昔时地下论唐唐。司山铁柱今夜远，脚踏河源重叠铁。汗跼顽腥粗惕偏，但应气变为谁恡。贮咽夷南绝时事，但悲野草风中起。一言遗恨何许言，白昼不过何所诫。
花前伎，春正短，一日平生拋玉树。中有別妇，落花怨心里。黄鹂啄飞不禁游，洛阳宫中人笑春。少年妇女不相许，人事皆传有此春。一言复妾亦何曲，唯有优游花下春。不分沈沈少颜色，可怜妾笑无颜水。可怜贞实须误之，争得今人一杯酒。醉他翁，妻婢倒。少年憔悴与金闺，同衾帖纬声满时。紫烟舞袖颜可惜，红颜侍女盈眼眉。莫笑百年万二千，隐不买於今日移。
朝登高台下，日夕东风起。茅屋敞华筵，秦王序崇职。曲中疑九日，宫阙映千阙。珠皐敞紫极，石泉丽通绎。乍凝汤甸署，稍视骊山顶。宝女倾数篇，金罍贮芝蕙。杉桐不见水，草木无荣古。晏辔昼昏静，疎钟闲寂历。惬物谁与邻，所希情则邈。林泉静云远，云壑深窗织。嘉声激颓阴，绝顾无累际。愿言清风昼，蠲扰从所适。
秋风歘吸吹南峡，雷雨夜没吴中裂。祸龙眼睛若有已，未见此身若应。君不独寻此乡堂与□□□，□杀万物无穷高。荡子千里不暂回，我今七十无所知。且向山中作商叟，烦我痴酒无所二。驻马幡竿下路多，白日不过衣与客。长安后口乌亦稀，犹在邻家旧城郭。五年饥翁一斗身，今人不歛霍臣人。今年襄溪为知己，可怜作死便为主。君不见此，一时满墙西，营边不见泪垂眼。
月出穿廊林，高高高崔嵬。此地古所旷，清风时叫搴。挟携披时节，粲涵静者怀。幽独坐远时，忽闻风雷栖。清晨方在梦，始悟芳景非。忆昔游御阴，䜩游循朋俦。一朝奉颜色，结念在吾俦。贞意幸得道，掉回翻不挥。时时理稅思，上览情贞游。芳讯贮佳意，羣公情独游。因将逸翮势，共结风尘钩。物役良不远，道光知讵求。


2200it [1:31:26,  3.76s/it]

夜梦神仙女，应传仙客歌。双腰拖紫绶，绛幰驻红螺。追捧夫孙令，与郎玉腕多。青骢歌白气，紫管捧琼琚。为我才几许，慙羞燕暂过。春深榆柳岸，春至杏园花。刘毅何时见，单栖不可过。嬾从纨绮诏，娇咏女儿罗。妆匣排云阁，轻蛾拂面娥。翠眉催蜡炬，弦障扑琼蛾。选困娇红郁，衔恩擘绿罗。差池信无益，雪刃痛容罗。弃置时时否，妆成忆故窠。平原非雾鸟，日夕望江河。
torch.Size([124, 16]) torch.Size([1984])


2201it [1:31:28,  3.33s/it]

torch.Size([124, 16]) torch.Size([1984])


2202it [1:31:31,  3.06s/it]

torch.Size([124, 16]) torch.Size([1984])


2203it [1:31:33,  2.88s/it]

torch.Size([124, 16]) torch.Size([1984])


2204it [1:31:36,  2.75s/it]

torch.Size([124, 16]) torch.Size([1984])


2205it [1:31:38,  2.65s/it]

torch.Size([124, 16]) torch.Size([1984])


2206it [1:31:41,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


2207it [1:31:43,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


2208it [1:31:46,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


2209it [1:31:48,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


2210it [1:31:51,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2211it [1:31:53,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2212it [1:31:56,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2213it [1:31:58,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2214it [1:32:00,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2215it [1:32:03,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2216it [1:32:05,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2217it [1:32:08,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2218it [1:32:10,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2219it [1:32:13,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2220it [1:32:15,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2221it [1:32:17,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2222it [1:32:20,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2223it [1:32:22,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2224it [1:32:25,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2225it [1:32:27,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2226it [1:32:30,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2227it [1:32:32,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2228it [1:32:35,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2229it [1:32:37,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2230it [1:32:40,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2231it [1:32:42,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2232it [1:32:44,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2233it [1:32:47,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2234it [1:32:49,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2235it [1:32:52,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2236it [1:32:54,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2237it [1:32:57,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2238it [1:32:59,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2239it [1:33:02,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2240it [1:33:04,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2241it [1:33:07,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2242it [1:33:09,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2243it [1:33:11,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2244it [1:33:14,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2245it [1:33:16,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


2246it [1:33:19,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2247it [1:33:21,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2248it [1:33:24,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


2249it [1:33:27,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


2250it [1:33:29,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2251it [1:33:31,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2252it [1:33:34,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2253it [1:33:36,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2254it [1:33:39,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


2255it [1:33:42,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2256it [1:33:44,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2257it [1:33:46,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2258it [1:33:49,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2259it [1:33:51,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2260it [1:33:54,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2261it [1:33:56,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2262it [1:33:58,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2263it [1:34:01,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


2264it [1:34:03,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2265it [1:34:06,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2266it [1:34:08,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2267it [1:34:11,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2268it [1:34:13,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2269it [1:34:16,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2270it [1:34:18,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2271it [1:34:20,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2272it [1:34:23,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2273it [1:34:25,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2274it [1:34:28,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2275it [1:34:30,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2276it [1:34:33,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2277it [1:34:35,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2278it [1:34:38,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2279it [1:34:40,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2280it [1:34:43,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2281it [1:34:45,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2282it [1:34:47,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2283it [1:34:50,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2284it [1:34:52,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2285it [1:34:55,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2286it [1:34:57,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2287it [1:35:00,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2288it [1:35:02,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2289it [1:35:05,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2290it [1:35:07,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2291it [1:35:09,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2292it [1:35:12,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2293it [1:35:14,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2294it [1:35:17,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


2295it [1:35:19,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2296it [1:35:22,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2297it [1:35:24,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2298it [1:35:26,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2299it [1:35:29,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2300it [1:35:31,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2301it [1:35:34,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2302it [1:35:36,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2303it [1:35:39,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2304it [1:35:41,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2305it [1:35:44,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2306it [1:35:46,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2307it [1:35:49,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2308it [1:35:51,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2309it [1:35:54,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2310it [1:35:56,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2311it [1:35:59,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2312it [1:36:01,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2313it [1:36:04,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2314it [1:36:06,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2315it [1:36:09,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2316it [1:36:11,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2317it [1:36:14,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


2318it [1:36:16,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2319it [1:36:19,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2320it [1:36:21,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2321it [1:36:24,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2322it [1:36:26,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2323it [1:36:29,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2324it [1:36:31,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2325it [1:36:34,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2326it [1:36:36,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2327it [1:36:39,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2328it [1:36:41,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2329it [1:36:44,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2330it [1:36:46,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


2331it [1:36:49,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


2332it [1:36:51,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2333it [1:36:54,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2334it [1:36:56,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2335it [1:36:59,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2336it [1:37:01,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2337it [1:37:04,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2338it [1:37:06,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2339it [1:37:09,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2340it [1:37:11,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2341it [1:37:14,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2342it [1:37:16,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2343it [1:37:18,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2344it [1:37:21,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2345it [1:37:24,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2346it [1:37:26,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2347it [1:37:29,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2348it [1:37:31,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2349it [1:37:34,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2350it [1:37:36,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2351it [1:37:39,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


2352it [1:37:41,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


2353it [1:37:44,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2354it [1:37:46,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2355it [1:37:49,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


2356it [1:37:52,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


2357it [1:37:54,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


2358it [1:37:57,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


2359it [1:37:59,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2360it [1:38:02,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2361it [1:38:04,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2362it [1:38:07,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2363it [1:38:09,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2364it [1:38:11,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2365it [1:38:14,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2366it [1:38:16,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2367it [1:38:19,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2368it [1:38:21,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2369it [1:38:24,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2370it [1:38:27,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


2371it [1:38:29,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2372it [1:38:32,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


2373it [1:38:34,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


2374it [1:38:37,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2375it [1:38:39,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2376it [1:38:42,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2377it [1:38:44,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2378it [1:38:47,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2379it [1:38:49,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2380it [1:38:51,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2381it [1:38:54,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2382it [1:38:56,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2383it [1:38:59,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2384it [1:39:01,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2385it [1:39:04,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2386it [1:39:07,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2387it [1:39:09,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2388it [1:39:12,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2389it [1:39:14,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2390it [1:39:16,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2391it [1:39:19,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2392it [1:39:21,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2393it [1:39:24,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2394it [1:39:26,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2395it [1:39:29,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2396it [1:39:31,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2397it [1:39:34,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2398it [1:39:36,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2399it [1:39:39,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])
训练损失为1.5568593026946003
春溪仲白禾黍，广冢青蝇上飞马。我心若水流不去，我见长在水中浴。霹雳格滑在洋池，芰荷香重琉璃枝。绛軿嵬架清神潭，我方遨游前首人。扬雄奔走人亦闻，扰扰匹车徒顾身。功名物理难得见，华山郁郁能与亲。裴回更逐长裾翼，俄惊击电何人吐。相顾坚搜掩几人，身闲不见人间死。哥来太守不归心，一片清香防不尽。君不见此心无数事，罗襦啜，徒见文公子。但见身事打贼来，世人为我向人间。
江陵郁郁苔，山谷特缁磷。邑人呼子魄，千年圣人知。天地费尧历，龙衮授雄诗。三禅承龙构，下颡如龙旗。信陵秉六愿，出入展明时。大簸刃奚掉，韬罗心所维。姦臣有邹枚，所以嗣大私。大河无千载，熊氏息中河。滔滔俯京溟，莽杳不可逃。经荒不容息，寇息何喧之。蛮卒绝美功，下军振天祇。欃兽谅茍启，霸德增难期。
花前日曈曈，明河应不返。素手耀朝云，飞珠下寥廓。清宵露帘外，清韵月帘曲。碧影笼清窗，炎光照瑶草。泠泠步騕褭，褭褭忘留讬。返节凝芳气，奇庭豔晴始。烟岚媚难辨，楼际多相映。髣髴不知留，萋萋芳草绿。清觞厌瑶爵，清明动素骨。携手从此始，下车何其盛。白马东岱戎，丹心淩天热。宁知万世事，若值千年隔。勿辞从此还，何幸待幽戚。
朝光含泰朝，朗钥启明公。弘策期登览，超符表隐邻。三台含景色，百象凑星辰。复阜千门晓，疏行四望春。仙宫映绛幄，金殿拂云闉。仰効矜神瑞，慇懃惜使臣。礼容联乐日，文盛委天真。宝镜凝仙气，花宫照夜轮。箭摇青嶂轴，梵写绮经春。谬列金门侣，旁传玉辇邻。清秋从习乐，汉祖独升晨。已得三皇赏，无劳贾战身。拥兵关猛气，横角冻奔尘。龙驾今如此，恩王在此身。
秋光靡晚天，绿叶不能映。君恩忽相剪，泾水湛其绿。万物资自然，三人不相害。家中踰千里，车马朝百里。蹭蹬或不羣，流年忽如此。诸侯竟不回，羣燕徒相悅。紫陌花未开，葳氲筑交柳。问君将陵县，且喜题诗客。別离行为将，形骸日将夕。京洛徒自劳，所与谁相见。吾君此中別，相见偶身命。若见无与依，人人未如昨。乃知天上马，不如身住贱。杀人不问谁，我独恸哭泣。去去无复情，君荣富能薄。
月落缑山海，江转褒相凑。樯沈近伍途，手醒无异色。遂令康狩至昇然，长讶途中常是息。兀然默默兮林顶，森森寒，龙枕水，波涛千古，烟霜混沌空流现。君不见此天真祐，妙元见之唐帝威。列阴山，展精洁，一万里，几留空。一双蜉

2400it [1:39:46,  4.01s/it]

夜夜坐秋馆，翛然无所思。宁知一饭掾，遂补黄庭期。昨日即杖截，秋人窥鑪驰。晨磬吼高户，佳果当啼池。松承龙符日，石转泉火池。山中有深谷，日觉无喧疑。一听不得意，下车三四师。忽闻南游者，今日加四期。清秩从礼秩，高斋空月轮。感时心已寂，经岁倦离离。不得回天道，蹉跎安久辞。若如优劣友，我亦吾吾知。无限江海人，故人江上诗。不如桃李荣，不待日光迟。
torch.Size([124, 16]) torch.Size([1984])


2401it [1:39:49,  3.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2402it [1:39:51,  3.19s/it]

torch.Size([124, 16]) torch.Size([1984])


2403it [1:39:54,  2.96s/it]

torch.Size([124, 16]) torch.Size([1984])


2404it [1:39:56,  2.79s/it]

torch.Size([124, 16]) torch.Size([1984])


2405it [1:39:58,  2.67s/it]

torch.Size([124, 16]) torch.Size([1984])


2406it [1:40:01,  2.62s/it]

torch.Size([124, 16]) torch.Size([1984])


2407it [1:40:03,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


2408it [1:40:06,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2409it [1:40:08,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2410it [1:40:11,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2411it [1:40:13,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2412it [1:40:16,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2413it [1:40:18,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2414it [1:40:21,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2415it [1:40:23,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2416it [1:40:25,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2417it [1:40:28,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2418it [1:40:30,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2419it [1:40:33,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2420it [1:40:35,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2421it [1:40:38,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2422it [1:40:40,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2423it [1:40:43,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2424it [1:40:45,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2425it [1:40:48,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2426it [1:40:50,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2427it [1:40:53,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2428it [1:40:55,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2429it [1:40:58,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2430it [1:41:00,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2431it [1:41:03,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2432it [1:41:05,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2433it [1:41:08,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2434it [1:41:10,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2435it [1:41:13,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2436it [1:41:15,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2437it [1:41:17,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2438it [1:41:20,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2439it [1:41:22,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2440it [1:41:25,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2441it [1:41:27,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2442it [1:41:30,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2443it [1:41:33,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2444it [1:41:35,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2445it [1:41:37,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2446it [1:41:40,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2447it [1:41:43,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2448it [1:41:45,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2449it [1:41:48,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2450it [1:41:50,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2451it [1:41:53,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2452it [1:41:55,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2453it [1:41:57,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2454it [1:42:00,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2455it [1:42:02,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2456it [1:42:05,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2457it [1:42:07,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2458it [1:42:10,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2459it [1:42:12,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2460it [1:42:15,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2461it [1:42:17,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2462it [1:42:20,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2463it [1:42:22,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2464it [1:42:24,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2465it [1:42:27,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2466it [1:42:29,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2467it [1:42:32,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2468it [1:42:34,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2469it [1:42:37,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2470it [1:42:39,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2471it [1:42:42,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2472it [1:42:44,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2473it [1:42:47,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2474it [1:42:49,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2475it [1:42:52,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2476it [1:42:54,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2477it [1:42:56,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2478it [1:42:59,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2479it [1:43:01,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2480it [1:43:04,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2481it [1:43:06,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2482it [1:43:09,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2483it [1:43:11,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2484it [1:43:14,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2485it [1:43:16,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2486it [1:43:19,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2487it [1:43:22,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


2488it [1:43:24,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


2489it [1:43:27,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2490it [1:43:29,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2491it [1:43:32,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2492it [1:43:34,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2493it [1:43:37,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2494it [1:43:39,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2495it [1:43:41,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2496it [1:43:44,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2497it [1:43:46,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2498it [1:43:49,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2499it [1:43:51,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2500it [1:43:54,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2501it [1:43:56,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2502it [1:43:59,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2503it [1:44:01,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2504it [1:44:04,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2505it [1:44:06,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2506it [1:44:09,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2507it [1:44:11,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2508it [1:44:14,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2509it [1:44:16,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2510it [1:44:19,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2511it [1:44:21,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2512it [1:44:24,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2513it [1:44:26,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2514it [1:44:29,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2515it [1:44:31,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2516it [1:44:33,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2517it [1:44:36,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2518it [1:44:38,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2519it [1:44:41,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2520it [1:44:43,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2521it [1:44:46,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2522it [1:44:48,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2523it [1:44:50,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2524it [1:44:53,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2525it [1:44:55,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2526it [1:44:58,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2527it [1:45:00,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2528it [1:45:03,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2529it [1:45:05,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2530it [1:45:07,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2531it [1:45:10,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


2532it [1:45:12,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


2533it [1:45:15,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2534it [1:45:17,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2535it [1:45:20,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2536it [1:45:22,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2537it [1:45:25,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2538it [1:45:27,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2539it [1:45:29,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2540it [1:45:32,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2541it [1:45:34,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2542it [1:45:37,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2543it [1:45:39,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2544it [1:45:42,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2545it [1:45:44,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2546it [1:45:47,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2547it [1:45:49,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2548it [1:45:52,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2549it [1:45:54,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2550it [1:45:57,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2551it [1:45:59,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2552it [1:46:02,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2553it [1:46:04,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2554it [1:46:07,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2555it [1:46:09,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2556it [1:46:12,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2557it [1:46:14,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2558it [1:46:17,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2559it [1:46:19,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2560it [1:46:22,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2561it [1:46:24,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2562it [1:46:27,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2563it [1:46:29,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2564it [1:46:32,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2565it [1:46:34,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2566it [1:46:37,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2567it [1:46:39,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2568it [1:46:41,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2569it [1:46:44,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2570it [1:46:47,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2571it [1:46:49,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2572it [1:46:52,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2573it [1:46:54,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2574it [1:46:57,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2575it [1:46:59,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2576it [1:47:02,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2577it [1:47:04,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2578it [1:47:07,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2579it [1:47:09,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2580it [1:47:12,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2581it [1:47:14,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2582it [1:47:17,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2583it [1:47:19,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2584it [1:47:22,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2585it [1:47:24,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2586it [1:47:27,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2587it [1:47:29,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2588it [1:47:32,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2589it [1:47:34,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2590it [1:47:37,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2591it [1:47:39,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2592it [1:47:42,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


2593it [1:47:45,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


2594it [1:47:47,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2595it [1:47:50,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2596it [1:47:52,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


2597it [1:47:55,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2598it [1:47:57,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2599it [1:47:59,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])
训练损失为1.5760820414240553
春色递待轩，春生一阶草。西风起南原，波上无俦侣。旷荡送商谢，扁舟入高宴。寂寞坐中天，相思在瑶席。玉英摇素色，金翠亮相见。清露袭藂埃，圆流澹如素。寒云度飞沙，夏日疑白日。照耀星汉低，呵香贶金煦。靡靡炎方起，谅值微霞玩。林间袭诗棹，浦北逢鱼鹄。湖田水冻穿，人远人还鬬。纷纷慕朋侣，始觉风尘役。山下恣依稀，风前趣何夭。
江源气产苍苍，出山啸石皆遐。出士阅石以堪吁，侬家不敢匡君因。见人不肯识天子，不肯言之百般命。阴云直上天道明，涵星半夜涵河火。大鹏高飞万万回，诡踏百步双双来。去人钻浊蹶兀朝月，一片蒙躯土中火。曾闻野童舁钓子，今日米笔论便力。末中直至惟今夕，装纸还家尽日立。剧击唾乘排部前，满头吐镜红还黄。今年花落花自开，萋萋草色无尘埃。
花界人已行，马羸马屡忙。出没见商山，一身在蓬蒿。青青昨夜泪，惨涕不可知。顾叹圣明月，明晨天上辞。丈夫在何掾，富贵皆十丝。丈夫不退事，坐食有奇姿。片言足风雅，天下为妻儿。可以学安得，轗轲不磷磷。丈人充其道，饮骨无柴池。白瘴践郡郭，苍苍山水祠。我友多逸志，谈笑常自持。何况荣辱利，孰知我安知。
朝廷壮气异，历览伊水湄。区区奉斋宪，贾谊不足脂。四时皆迁稔，今春或成悲。盛时无此志，出户多高词。朝廷秉庶易，诏信文章姿。文命出门別，斯言良未私。重见范叔辈，依风望嵩池。膝穿瓜棘坞，坟绽桃花池。适因赏盛衰，今夕招淹炊。嗜慾非异草，缉年讵可知。榻屧呌枉渔，涉涧贪冻澌。搔首令我憎，昼夜视山陂。酿橡非为薪，穴虫不乱枝。遭乱懵已远，阴德谅不移。
秋光歘溢大八书，大君此地纵为余。汹汹汹湧孕其虚，鳣蹙柄严乐金乌。舜之祠乎孕世居，唐皇俯谷予不居。盗鲸溺穴若崩槎，此中表魄如辟且。是时得足圣明年，吾罕尽遇神仙株。凿稻嵌源结流水，钓羊横去疑远凌。左王右右极溟渤，巨壑喷鼋喷成崖。瀑崖峥嵘标丽色，晴霞冪洒沧溟夕。因君握茗看不得，忽似桑田长瀑色。露浓花色覆桑蕤，夜雨萧萧寒雨滴。
月出石稜稜，崎岖上阳。东流万里道，路入丈夫霜。挥毫换异浦，御角破孤塘。鱼挂桂舟牖，鼍喧红斾香。山暗练半点，岸绿垂莲光。峭干见石色，幽幽通远遐。沫孤凫动径，岸静波摇沙。塍浪钏不喧，风雷怒蒸疥。窈蜒鳞迹殊众吸，光碍远疑凝。有恨洗物中，有心难并忘。时节不足极，欢言涤烦烦。悅欢默冥间，轸酌何由

2600it [1:48:07,  3.89s/it]

夜月如芙蓉，羣巢难停棹。诸代值奇寻，须求三略缚。钱禽比眼看，取食攫来早。拾古笋虽就，缉折言空冪。湓城隔丈墟，是时多趾渡。论诗习机草，藉酒寻清境。竹迳草藓生，门廊冈掩翳。新诗一杯酒，今日鍊幽屐。紫绶截青门，庭槐盖眼影。自言白云操，日夕不生力。云路走天寒，天台近祠境。愿陪青鸟翔，俯眄紫驺祕。严冬有才调，气象无由见。不惧冷如颜，何由动妖孽。空知葵藿妨，可以不可进。
torch.Size([124, 16]) torch.Size([1984])


2601it [1:48:09,  3.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2602it [1:48:11,  3.13s/it]

torch.Size([124, 16]) torch.Size([1984])


2603it [1:48:14,  2.93s/it]

torch.Size([124, 16]) torch.Size([1984])


2604it [1:48:16,  2.79s/it]

torch.Size([124, 16]) torch.Size([1984])


2605it [1:48:19,  2.71s/it]

torch.Size([124, 16]) torch.Size([1984])


2606it [1:48:21,  2.61s/it]

torch.Size([124, 16]) torch.Size([1984])


2607it [1:48:24,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


2608it [1:48:26,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2609it [1:48:29,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2610it [1:48:31,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2611it [1:48:33,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2612it [1:48:36,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2613it [1:48:38,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2614it [1:48:41,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2615it [1:48:43,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2616it [1:48:46,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2617it [1:48:48,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2618it [1:48:51,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2619it [1:48:53,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2620it [1:48:55,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2621it [1:48:58,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2622it [1:49:01,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2623it [1:49:03,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2624it [1:49:06,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2625it [1:49:08,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2626it [1:49:10,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2627it [1:49:13,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2628it [1:49:15,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2629it [1:49:18,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2630it [1:49:20,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2631it [1:49:23,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2632it [1:49:25,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2633it [1:49:28,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2634it [1:49:30,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2635it [1:49:32,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2636it [1:49:35,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2637it [1:49:38,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2638it [1:49:40,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2639it [1:49:43,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2640it [1:49:45,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2641it [1:49:48,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


2642it [1:49:50,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


2643it [1:49:53,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


2644it [1:49:56,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


2645it [1:49:58,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


2646it [1:50:01,  2.62s/it]

torch.Size([124, 16]) torch.Size([1984])


2647it [1:50:04,  2.74s/it]

torch.Size([124, 16]) torch.Size([1984])


2648it [1:50:07,  2.87s/it]

torch.Size([124, 16]) torch.Size([1984])


2649it [1:50:10,  2.79s/it]

torch.Size([124, 16]) torch.Size([1984])


2650it [1:50:12,  2.66s/it]

torch.Size([124, 16]) torch.Size([1984])


2651it [1:50:14,  2.60s/it]

torch.Size([124, 16]) torch.Size([1984])


2652it [1:50:17,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


2653it [1:50:19,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2654it [1:50:22,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2655it [1:50:24,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2656it [1:50:27,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2657it [1:50:29,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2658it [1:50:32,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2659it [1:50:34,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2660it [1:50:36,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2661it [1:50:39,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2662it [1:50:41,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2663it [1:50:44,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2664it [1:50:46,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2665it [1:50:49,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2666it [1:50:51,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2667it [1:50:54,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2668it [1:50:56,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2669it [1:50:58,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2670it [1:51:01,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2671it [1:51:04,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2672it [1:51:06,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2673it [1:51:09,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2674it [1:51:11,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2675it [1:51:13,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2676it [1:51:16,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2677it [1:51:18,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


2678it [1:51:20,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


2679it [1:51:23,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


2680it [1:51:25,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


2681it [1:51:28,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


2682it [1:51:30,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2683it [1:51:33,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2684it [1:51:35,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2685it [1:51:37,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2686it [1:51:40,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2687it [1:51:42,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


2688it [1:51:45,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2689it [1:51:47,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2690it [1:51:50,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2691it [1:51:52,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2692it [1:51:55,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2693it [1:51:57,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2694it [1:52:00,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2695it [1:52:02,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2696it [1:52:05,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2697it [1:52:07,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2698it [1:52:10,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2699it [1:52:12,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2700it [1:52:15,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2701it [1:52:17,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2702it [1:52:20,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2703it [1:52:22,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2704it [1:52:24,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2705it [1:52:27,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


2706it [1:52:29,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2707it [1:52:32,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


2708it [1:52:34,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


2709it [1:52:37,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2710it [1:52:39,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2711it [1:52:41,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


2712it [1:52:44,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2713it [1:52:46,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2714it [1:52:49,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2715it [1:52:51,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2716it [1:52:54,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2717it [1:52:56,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2718it [1:52:58,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2719it [1:53:01,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2720it [1:53:03,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2721it [1:53:06,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2722it [1:53:08,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2723it [1:53:11,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2724it [1:53:13,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2725it [1:53:15,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


2726it [1:53:18,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


2727it [1:53:20,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


2728it [1:53:23,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2729it [1:53:25,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2730it [1:53:28,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2731it [1:53:30,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2732it [1:53:33,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2733it [1:53:35,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2734it [1:53:38,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2735it [1:53:40,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2736it [1:53:43,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2737it [1:53:45,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2738it [1:53:48,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2739it [1:53:50,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2740it [1:53:53,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2741it [1:53:55,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2742it [1:53:58,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2743it [1:54:00,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2744it [1:54:03,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2745it [1:54:05,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2746it [1:54:07,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2747it [1:54:10,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2748it [1:54:12,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2749it [1:54:15,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2750it [1:54:18,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2751it [1:54:20,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2752it [1:54:22,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2753it [1:54:25,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2754it [1:54:28,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2755it [1:54:30,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2756it [1:54:32,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2757it [1:54:35,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2758it [1:54:38,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


2759it [1:54:40,  2.63s/it]

torch.Size([124, 16]) torch.Size([1984])


2760it [1:54:43,  2.66s/it]

torch.Size([124, 16]) torch.Size([1984])


2761it [1:54:46,  2.63s/it]

torch.Size([124, 16]) torch.Size([1984])


2762it [1:54:48,  2.60s/it]

torch.Size([124, 16]) torch.Size([1984])


2763it [1:54:51,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


2764it [1:54:53,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


2765it [1:54:56,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


2766it [1:54:59,  2.61s/it]

torch.Size([124, 16]) torch.Size([1984])


2767it [1:55:01,  2.68s/it]

torch.Size([124, 16]) torch.Size([1984])


2768it [1:55:04,  2.68s/it]

torch.Size([124, 16]) torch.Size([1984])


2769it [1:55:07,  2.68s/it]

torch.Size([124, 16]) torch.Size([1984])


2770it [1:55:09,  2.64s/it]

torch.Size([124, 16]) torch.Size([1984])


2771it [1:55:12,  2.64s/it]

torch.Size([124, 16]) torch.Size([1984])


2772it [1:55:14,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


2773it [1:55:17,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


2774it [1:55:20,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


2775it [1:55:22,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2776it [1:55:25,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


2777it [1:55:27,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2778it [1:55:30,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2779it [1:55:32,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2780it [1:55:35,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2781it [1:55:37,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


2782it [1:55:40,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2783it [1:55:42,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2784it [1:55:45,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2785it [1:55:47,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2786it [1:55:49,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2787it [1:55:52,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2788it [1:55:54,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2789it [1:55:57,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2790it [1:55:59,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2791it [1:56:02,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2792it [1:56:04,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2793it [1:56:07,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2794it [1:56:09,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2795it [1:56:12,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2796it [1:56:14,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2797it [1:56:16,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2798it [1:56:19,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2799it [1:56:21,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])
训练损失为1.5940058152377603
春色徧九阴，南国信不闻。五陵遥望君，千里一万里。君见长安陌，明年未归者。一日一日逢，不见俱如此。皇皇旧赐承，屈原苦板藜。嗟我旷怀远，盛时輙黯忽。扁舟下故乡，徙別梦初醒。白首见妇人，丹台拾灵水。竹柏落何时，日华方自洗。荆臯岂云养，而我空无际。本待红尘中，抽心紫霄上。风候忽不保，徒嗟此何夕。岁久沧洲云，秋光尚咫变。
江上昔闻饷，燕山隘金鞍。有美甚风雅，万物不可踰。惨於平生志，胸浪生蔓兰。橡栗窜嘉水，石桥贮神僊。高踪绝真道，何处寻真言。嶽色咽我风，风雨醉童童。浩酣不语勉，引态思无援。此老吾所怯，所以久念然。譬如西风下，唧唧飞飞天。尔来慕商娘，停噪聊详煎。今日一杯病，相劝三十年。书题忽无间，所贵在此言。今日同心骨，相忆松与岑。
花屏次第时，骄王入上门。朝光动沟海，豔豔随霓门。揭角饮醇水，持盃如玉盆。三月舞中劒，双双飞上门。厌闻大姊说，便有新诗恩。虽无金张籍，几许精且员。不如金与泥玉君，珠履不尽亦有言。一片白莲生佛骨，三十年来醉中孙。几日不厌李氏言，不得一事同飞猨。欲知死后心难错，时时注马惊相参。为文顦顇趁泪足，醒醉醉倒醉二头。笑我心事无远绝，崎穉长洲步长绿。
朝光九原大，出见五湖出。故山来二八，扰扰荆棘白。放旷登甸州，精华来累日。三军昔城观，三十期一状。大道诚七年，英材如可惜。风沙簸的气，剑木潜霆竞。痛美赖今邦，功夫浑敢向。炎州方自薄，曷欲无他策。故人在忠贞，感激心自挹。自非贤哲事，窃使空寥廓。壮士窜重茨，谋邦事颓昧。分明清禁下，岂复垂二月。望海方九州，箫鼓何时啸。
秋光滉卓王关碧，扬明怀遐意超武。王孙留年向十载，我言君行乐我弟。丈夫不御此下名，哭別谁论心不平。胡姬美人笑歌笑，笑笑梁王翁姓笙。商人结绶出朝夕，承恩拜下如拾丁。蹉跎山头暮霜白，谢公此时伤山顶。山花落尽春寂寥，江花漠漠开春景。淮中好日无闲声，因君忝献还伫宁。丈夫贵贱能几日，玉徽玉匣无人争。秋鹰有斧啄欲落，青溪脱辔沧海碧。自君眷乎不可删，此翁死人同涕条。
月出山阴明，西陵水汽白。过君独携手，始见南风来。佳期浩浩浩，清夜沈襟瑟。物情从此闲，谁为比芳意。淫和悅曩趣，偶此於巖崿。舍岸横云岑，登崖眄标禹。岂言此中志，感此心方适。道侣废文墨，俗足谋机役。嬾慢鲈鲙姿，犹悲满牕月。故人昨为客，白日未休

2800it [1:56:29,  3.85s/it]

夜月今夜兮青天清，月含冷漾兮洞房开。其中闻轸尔者笑，一声月剪翻双鸣。谁言愁人心结根，惜闲声兮於伊湘。朝朝候道兮神羞，念此別兮晨昏。巫山之之澶漫，有雨僵以樵。彼风气兮难噬食，隐不遑弔兮怆懽趣。永愿君兮盃秋涕，䜩成恩兮怀奈何。澧河流，刷丝紫阴兮如雪，自此劳兮稚尔。径婴兮不来，蓄美兮酸尔往。及嘉人兮使尔，视嘉父兮吾不得。愿言我兮神齿生，与君之难可论，欲进返而思深也是无。若可言以知所非，孕之冶而无良。伊吕
torch.Size([124, 16]) torch.Size([1984])


2801it [1:56:31,  3.41s/it]

torch.Size([124, 16]) torch.Size([1984])


2802it [1:56:33,  3.12s/it]

torch.Size([124, 16]) torch.Size([1984])


2803it [1:56:36,  2.90s/it]

torch.Size([124, 16]) torch.Size([1984])


2804it [1:56:38,  2.77s/it]

torch.Size([124, 16]) torch.Size([1984])


2805it [1:56:41,  2.68s/it]

torch.Size([124, 16]) torch.Size([1984])


2806it [1:56:43,  2.60s/it]

torch.Size([124, 16]) torch.Size([1984])


2807it [1:56:46,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


2808it [1:56:48,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


2809it [1:56:51,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


2810it [1:56:53,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2811it [1:56:56,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2812it [1:56:58,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2813it [1:57:01,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2814it [1:57:03,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2815it [1:57:06,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2816it [1:57:08,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2817it [1:57:11,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2818it [1:57:13,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2819it [1:57:16,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2820it [1:57:18,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2821it [1:57:21,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2822it [1:57:23,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2823it [1:57:25,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2824it [1:57:28,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2825it [1:57:30,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2826it [1:57:33,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2827it [1:57:35,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2828it [1:57:38,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2829it [1:57:40,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2830it [1:57:43,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2831it [1:57:46,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2832it [1:57:48,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2833it [1:57:51,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2834it [1:57:53,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2835it [1:57:55,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2836it [1:57:58,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2837it [1:58:00,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2838it [1:58:03,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2839it [1:58:05,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2840it [1:58:08,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2841it [1:58:10,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2842it [1:58:13,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2843it [1:58:15,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2844it [1:58:17,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2845it [1:58:20,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2846it [1:58:22,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2847it [1:58:25,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2848it [1:58:27,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2849it [1:58:30,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2850it [1:58:32,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2851it [1:58:35,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2852it [1:58:37,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2853it [1:58:40,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2854it [1:58:42,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2855it [1:58:45,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


2856it [1:58:47,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


2857it [1:58:50,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2858it [1:58:52,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2859it [1:58:55,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2860it [1:58:57,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2861it [1:59:00,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2862it [1:59:02,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2863it [1:59:05,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2864it [1:59:07,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2865it [1:59:10,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2866it [1:59:12,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2867it [1:59:15,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2868it [1:59:17,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2869it [1:59:19,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2870it [1:59:22,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2871it [1:59:24,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


2872it [1:59:27,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


2873it [1:59:29,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


2874it [1:59:32,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2875it [1:59:34,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2876it [1:59:36,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2877it [1:59:39,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2878it [1:59:41,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2879it [1:59:44,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2880it [1:59:46,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2881it [1:59:49,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2882it [1:59:51,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2883it [1:59:53,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2884it [1:59:56,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2885it [1:59:58,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2886it [2:00:01,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2887it [2:00:03,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2888it [2:00:06,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2889it [2:00:08,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2890it [2:00:11,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2891it [2:00:13,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2892it [2:00:15,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2893it [2:00:18,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2894it [2:00:20,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2895it [2:00:23,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


2896it [2:00:25,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2897it [2:00:28,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2898it [2:00:30,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2899it [2:00:32,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2900it [2:00:35,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2901it [2:00:37,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2902it [2:00:40,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2903it [2:00:42,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2904it [2:00:45,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2905it [2:00:47,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2906it [2:00:50,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2907it [2:00:52,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2908it [2:00:54,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2909it [2:00:57,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2910it [2:00:59,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2911it [2:01:02,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2912it [2:01:04,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2913it [2:01:07,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2914it [2:01:09,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2915it [2:01:11,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2916it [2:01:14,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2917it [2:01:16,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2918it [2:01:19,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2919it [2:01:21,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2920it [2:01:24,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2921it [2:01:26,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2922it [2:01:28,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


2923it [2:01:31,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2924it [2:01:34,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2925it [2:01:36,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


2926it [2:01:39,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2927it [2:01:41,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2928it [2:01:44,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2929it [2:01:46,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2930it [2:01:48,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2931it [2:01:51,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2932it [2:01:53,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2933it [2:01:56,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2934it [2:01:58,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2935it [2:02:01,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2936it [2:02:03,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2937it [2:02:06,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2938it [2:02:08,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2939it [2:02:11,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2940it [2:02:13,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2941it [2:02:16,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2942it [2:02:18,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2943it [2:02:21,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2944it [2:02:23,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2945it [2:02:26,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2946it [2:02:28,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2947it [2:02:31,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2948it [2:02:33,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2949it [2:02:36,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2950it [2:02:38,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2951it [2:02:41,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2952it [2:02:43,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2953it [2:02:45,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2954it [2:02:48,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2955it [2:02:50,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2956it [2:02:53,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2957it [2:02:55,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2958it [2:02:58,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2959it [2:03:00,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2960it [2:03:03,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


2961it [2:03:05,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


2962it [2:03:08,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2963it [2:03:10,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2964it [2:03:13,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2965it [2:03:15,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


2966it [2:03:18,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


2967it [2:03:20,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


2968it [2:03:23,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


2969it [2:03:25,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2970it [2:03:28,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2971it [2:03:30,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


2972it [2:03:33,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2973it [2:03:35,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2974it [2:03:37,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2975it [2:03:40,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2976it [2:03:42,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2977it [2:03:45,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2978it [2:03:47,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


2979it [2:03:50,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2980it [2:03:52,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2981it [2:03:54,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2982it [2:03:57,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2983it [2:03:59,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2984it [2:04:02,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


2985it [2:04:04,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


2986it [2:04:06,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


2987it [2:04:09,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2988it [2:04:11,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2989it [2:04:14,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2990it [2:04:16,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


2991it [2:04:19,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2992it [2:04:21,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


2993it [2:04:23,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


2994it [2:04:26,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2995it [2:04:28,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2996it [2:04:31,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


2997it [2:04:33,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


2998it [2:04:36,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


2999it [2:04:38,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])
训练损失为1.6111197256843242
春日仲盛雨，槿花逞佳芳。懿尔墨物枢，外壮播飞扬。曜中摄英出，匿覆何不常。弱龄不如此，羽翼那以尝。赵母虽自惑，剪锦媿不藏。有时农所才，颇顾无所当。君生茍不轻，谁能轻去乡。将妇不得意，女妾不成黄。惟今白云上，与我同且廉。我来有酒食，卖取苍生怀。其富不茍取，莫诉生死旁。饮之心丧泥，永伤心神伤。但愿死尔辈，他人贵为长。但令尔何辜，我受生命伤。岂无沟塍汚，唯畏犹自煎。
江城郁郁春芳时，金铺豔吐浮华滋。素帘低檝娇且发，文发丛花交裴回。纷纷唤转楚天曙，飒飒飒飒秋风来。潏河波澜漂凌烟，又如流水谪江霞。夫君昔在吴王宫，峨峨峰头照天外。万国皆成穆王事，翛然夜里灞林前。落花满地红氍茸，座中笑杀胡欲弦。独歌一曲歌歌舞，曲终不救青铜梯。朝妆拂柳摇袖席，花态荐衣开御筵。乐府麟茸如可笑，乌鹊走马惊千门。古人今事复如此，人事难传赵相国。位重闺山不得归，金陵江海不相识。独有千金谁与同？
花落真太灵，精灵与仙渊。隋皇二十年，毛象论其宣。曾为天子神，使君书孝诚。天堂刻堂堂，玉露霑锦缠。挥手覩天书，一言光莫宣。大君若悬华，飞腾千万年。我非天之平，神在大与千。超遥瑯琊山，下视百尺泉。下唯龙螭窟，拔之以飞虹。腾逐雷霆震，亘若万虑全。我耕培本者，蹶给三秋天。山鬼不敢买，霹雳升空田。流血乱消息，浮生安可全。斯图出麟阁，历识如虚烟。万事死皆戒，一言安可怜。脚头见遇盛，古来谁能全。
朝见天气明，夜半西风鸣。天风潇洒里，不及南山平。无事不可说，永日无停情。至今北京里，逮此方依横。羁旅默中说，恻恻在中生。晨趋日没雾，复值城东城。羇雌悲逝水，车马辞咸城。我有辞司隸，关山自有情。羞驰马蹄疾，乌头满路迎。鞭鸡夜先起，交游洛下行。行营试宾陟，白马满肩鸣。簪绂傥相顾，恩交不可听。岂知天地绿，明灭未成形。愿荐三光气，同游万国平。
秋风歘吸吹双壳，少是光阴龙骨薄。人生赪骝汉宫阙，天袭第贵胡貙在。貂刀盘，六龙撞，请撞东方百斧肆。华轩洞围无冻来，天河阴碧河开溢。丹青横弓六十尘，壮形筋骨惟霜霜。洗心一志与昏昧，姹女啼喉泪涂色。双双掷骨埋滹鼈，截鳞运龙同众态。两危九重四五人，上王渡头几时有。君子欲历二十年，一进之表如砥星。周臣虽欲行且子，猛者恐是埋铅田。或财用财实，知己自有边。风尘遍浪出，死者无忧缘。顽鼠不死门，寂

3000it [2:04:46,  4.00s/it]

夜色浣花堦，凉风吹柳色。我行多秋草，分如照我丑。但恐芳菲歇，枉与萧郎至。不知年已衰，所以迹可惜。后遭山兰草，水缩鱼龙死。身心不在鱼，岂是随人劝。昨来还相许，此地乐于此。喧喧多苦辛，词敌颇如竞。所以事前生，不如不死意。茫茫恶时进，而我中路役。悭得任他人，不能听叩袴。请君说此路，无味桮中味。此情无处待，唯记翻飱帖。
torch.Size([124, 16]) torch.Size([1984])


3001it [2:04:48,  3.52s/it]

torch.Size([124, 16]) torch.Size([1984])


3002it [2:04:51,  3.20s/it]

torch.Size([124, 16]) torch.Size([1984])


3003it [2:04:53,  2.95s/it]

torch.Size([124, 16]) torch.Size([1984])


3004it [2:04:55,  2.79s/it]

torch.Size([124, 16]) torch.Size([1984])


3005it [2:04:58,  2.67s/it]

torch.Size([124, 16]) torch.Size([1984])


3006it [2:05:00,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


3007it [2:05:03,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


3008it [2:05:05,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3009it [2:05:07,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3010it [2:05:10,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3011it [2:05:12,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3012it [2:05:15,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3013it [2:05:17,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3014it [2:05:20,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3015it [2:05:22,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3016it [2:05:25,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3017it [2:05:27,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3018it [2:05:30,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3019it [2:05:32,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3020it [2:05:34,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


3021it [2:05:37,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


3022it [2:05:39,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3023it [2:05:42,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3024it [2:05:44,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3025it [2:05:46,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3026it [2:05:49,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3027it [2:05:51,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


3028it [2:05:54,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


3029it [2:05:56,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3030it [2:05:58,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3031it [2:06:01,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


3032it [2:06:03,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


3033it [2:06:06,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3034it [2:06:08,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3035it [2:06:11,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3036it [2:06:13,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3037it [2:06:16,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3038it [2:06:18,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


3039it [2:06:21,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3040it [2:06:23,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3041it [2:06:26,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3042it [2:06:28,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3043it [2:06:31,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3044it [2:06:33,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3045it [2:06:35,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3046it [2:06:38,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3047it [2:06:41,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


3048it [2:06:43,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


3049it [2:06:46,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3050it [2:06:48,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3051it [2:06:51,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3052it [2:06:53,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3053it [2:06:56,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3054it [2:06:58,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3055it [2:07:01,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3056it [2:07:03,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3057it [2:07:06,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3058it [2:07:08,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3059it [2:07:11,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3060it [2:07:13,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3061it [2:07:15,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3062it [2:07:18,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3063it [2:07:20,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3064it [2:07:23,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3065it [2:07:25,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3066it [2:07:28,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3067it [2:07:30,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3068it [2:07:33,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3069it [2:07:35,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3070it [2:07:38,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3071it [2:07:40,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3072it [2:07:43,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3073it [2:07:45,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3074it [2:07:47,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3075it [2:07:50,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3076it [2:07:52,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3077it [2:07:55,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3078it [2:07:57,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3079it [2:08:00,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3080it [2:08:02,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3081it [2:08:05,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3082it [2:08:07,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3083it [2:08:10,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3084it [2:08:12,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3085it [2:08:15,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3086it [2:08:17,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


3087it [2:08:20,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


3088it [2:08:22,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3089it [2:08:25,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3090it [2:08:27,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


3091it [2:08:30,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


3092it [2:08:32,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3093it [2:08:35,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3094it [2:08:37,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


3095it [2:08:40,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


3096it [2:08:43,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


3097it [2:08:45,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


3098it [2:08:48,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


3099it [2:08:50,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3100it [2:08:52,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3101it [2:08:55,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3102it [2:08:57,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3103it [2:09:00,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3104it [2:09:02,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3105it [2:09:04,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3106it [2:09:07,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3107it [2:09:09,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3108it [2:09:12,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3109it [2:09:14,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3110it [2:09:17,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


3111it [2:09:19,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


3112it [2:09:21,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3113it [2:09:24,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


3114it [2:09:26,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3115it [2:09:29,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3116it [2:09:31,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3117it [2:09:34,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3118it [2:09:36,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3119it [2:09:38,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3120it [2:09:41,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3121it [2:09:43,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3122it [2:09:46,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3123it [2:09:48,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3124it [2:09:51,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3125it [2:09:53,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3126it [2:09:56,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3127it [2:09:58,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3128it [2:10:01,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3129it [2:10:03,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3130it [2:10:06,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3131it [2:10:08,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3132it [2:10:11,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3133it [2:10:13,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3134it [2:10:15,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3135it [2:10:18,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3136it [2:10:20,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3137it [2:10:23,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3138it [2:10:25,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3139it [2:10:28,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3140it [2:10:30,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3141it [2:10:33,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3142it [2:10:35,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3143it [2:10:37,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3144it [2:10:40,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3145it [2:10:42,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3146it [2:10:45,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3147it [2:10:47,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3148it [2:10:50,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3149it [2:10:52,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3150it [2:10:54,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3151it [2:10:57,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3152it [2:10:59,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3153it [2:11:02,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3154it [2:11:04,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3155it [2:11:07,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3156it [2:11:09,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3157it [2:11:11,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3158it [2:11:14,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3159it [2:11:16,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3160it [2:11:19,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3161it [2:11:21,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3162it [2:11:24,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3163it [2:11:26,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3164it [2:11:29,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3165it [2:11:31,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3166it [2:11:33,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3167it [2:11:36,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3168it [2:11:38,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3169it [2:11:41,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3170it [2:11:43,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3171it [2:11:46,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3172it [2:11:48,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3173it [2:11:51,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


3174it [2:11:53,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


3175it [2:11:56,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3176it [2:11:58,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3177it [2:12:01,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3178it [2:12:03,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3179it [2:12:06,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3180it [2:12:08,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3181it [2:12:11,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3182it [2:12:13,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3183it [2:12:16,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3184it [2:12:18,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3185it [2:12:21,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3186it [2:12:23,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3187it [2:12:26,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3188it [2:12:28,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3189it [2:12:31,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3190it [2:12:33,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3191it [2:12:35,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3192it [2:12:38,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3193it [2:12:40,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3194it [2:12:43,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3195it [2:12:45,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3196it [2:12:47,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3197it [2:12:50,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3198it [2:12:52,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3199it [2:12:55,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])
训练损失为1.6243598704226307
春风吹花谷，绿树拂春阶。美人结芳岁，一日垂桃花。昨日梅花骢，春来特所嗟。秾荑拂罗幕，素衣步金沙。怳如悬环风，四面嚬嚬娇。罥飞双鸳鸯，戴影遶鸳鸯。红颜不可发，玉指如嚬腰。小女真织女，清歌弄双蛾。将欢舞中笑，复此欢情赊。笑语且含月，妆成春色斜。一双不襞泪，一片红炉花。妾有玉颜发，今朝照宝芽。
江陵台下春风时，十株万株柳丝丝。游女一曲涧花春，美人歌妍歌玉枝。毵毵玉佩摇碧树，皎湛绮罗红桃枝。荆之舞袖繁霜烂，秦风飒飒飘金琐。舞裙荡罢商鸿散，玉筯未倾工刻肃。婵娟不成风雨清，清秋一览生春水。玉皇已扣金樽裙，天子未成宫女尊。何幸一杯揜渌水，胡骑琵琶杂金络。自言妾身劳此心，今朝使君能几人。君不见昔时冶颜月，使君见死无穷春。
花前桂树皆种栗，仲有青田瓜十旬。君心不知在穷始，身士毂蹄何足比。天地七年不自弃，身轻出入如千里。完年不到泰明存，攻儿见物无穷策。男儿不敢笑羞军，不学老翁论姓谷。君今见我不见来，使君为报剧肆水。一畦半闭勑书开，敕赐荷衣不敢比。岳兵高冢路，马上呌戍燕支州。死人不知此理遂，委俗翻然不可度。君意便为天上物，养余且是开门格。我年试谒从公进，颇领铜骝翅布书。风递草霑山脚冻，尺衣牋屑马蹄迷。山前水小山花好，白眼
朝廷无一顿，既进名与尉。不知舍民长，不为人民瘼。揆予久贫贱，所以谋所便。请君与我来，置酒或可保。故交弃簪舟，季子建安德。相公邺阙外，万古无能免。杖藜出高下，逸翮入巖壑。大唐三峰秀，突兀千山尖。寤醉忽止归，养为沈忧翰。迩来羣禽集，濩落同所适。栈邑多绝嚣，枣庐有余隙。北郊暑气浓，故主人多庆。宾御尚雕隐，科文信沦博。自古限拘修，往年长叹息。
秋光滉窈峨云暮，相望云容皓转红。乍吐楼船浮杨柳，逗含灯幕入宫丛。兰釭飞出朱丝发，彩片红盈玉珮笼。玉管为谈光触耳，玉盘承露诵衔丛。初惊绮陌遮犹重，渐透禁垣疑梦中。玉笼山馆红笼士，春窗一迳思鸿冲。蚁堆络马马如汗，绿渚风轻杨子雄。金羁绰约漳阴路，月映青芜一片风。绮席迢遰金山上，路远无人迷冶通。惆怅佳人应寂寂，一双双泪坠阑濛。绮罗无色无光露，暗度情情感晓风。
月下海水远，海上独回春。悲风渡漕关，谁见无此巡。忆昔边城月，蒲衣骄战云。娟娟寒不至，苍苍下桑茎。楼台五百万，窟子但不平。十丈目断肠，千山去不行。五月不复飞，一心自

3200it [2:13:02,  3.83s/it]

夜色满天津，凉风催马幕。家人饮酒病，颜色寇心绪。相逢棘窗下，不肯死草屦。相逢多悲悲，其如泪焦漆。十年不足主，徒旅无由见。君今见汝官，容名复离別。裴回不忍顾，望妾劳相顾。闻哭不语心，相逢不欢趣。杭州渭水水，奴仆家垆扫。忆昔別家星州旧迎，无处不知谁是迹。少年曾忝庾公孙，梁氏不为人不言。一水东西种樱茧，竞引红颜堕衣泪。相思谁道不成空，更有怀君一时阕。
torch.Size([124, 16]) torch.Size([1984])


3201it [2:13:04,  3.38s/it]

torch.Size([124, 16]) torch.Size([1984])


3202it [2:13:07,  3.08s/it]

torch.Size([124, 16]) torch.Size([1984])


3203it [2:13:09,  2.88s/it]

torch.Size([124, 16]) torch.Size([1984])


3204it [2:13:11,  2.73s/it]

torch.Size([124, 16]) torch.Size([1984])


3205it [2:13:14,  2.65s/it]

torch.Size([124, 16]) torch.Size([1984])


3206it [2:13:16,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


3207it [2:13:19,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


3208it [2:13:21,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3209it [2:13:23,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3210it [2:13:26,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3211it [2:13:28,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3212it [2:13:31,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3213it [2:13:33,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3214it [2:13:36,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3215it [2:13:38,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3216it [2:13:41,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3217it [2:13:43,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3218it [2:13:46,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3219it [2:13:48,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3220it [2:13:51,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3221it [2:13:53,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3222it [2:13:56,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3223it [2:13:58,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3224it [2:14:01,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3225it [2:14:03,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3226it [2:14:05,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3227it [2:14:08,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3228it [2:14:10,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


3229it [2:14:13,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3230it [2:14:15,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3231it [2:14:17,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3232it [2:14:20,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3233it [2:14:22,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3234it [2:14:25,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3235it [2:14:27,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3236it [2:14:30,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3237it [2:14:32,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3238it [2:14:35,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3239it [2:14:37,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3240it [2:14:40,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3241it [2:14:42,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


3242it [2:14:45,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


3243it [2:14:47,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3244it [2:14:50,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3245it [2:14:52,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3246it [2:14:55,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3247it [2:14:57,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3248it [2:15:00,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3249it [2:15:02,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3250it [2:15:04,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3251it [2:15:07,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3252it [2:15:09,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3253it [2:15:12,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3254it [2:15:14,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3255it [2:15:17,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3256it [2:15:19,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3257it [2:15:22,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3258it [2:15:24,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3259it [2:15:26,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3260it [2:15:29,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3261it [2:15:31,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3262it [2:15:34,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3263it [2:15:36,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3264it [2:15:39,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3265it [2:15:41,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3266it [2:15:44,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3267it [2:15:46,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3268it [2:15:48,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3269it [2:15:51,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3270it [2:15:53,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3271it [2:15:56,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3272it [2:15:58,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3273it [2:16:01,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3274it [2:16:03,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3275it [2:16:06,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3276it [2:16:08,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3277it [2:16:11,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3278it [2:16:13,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3279it [2:16:15,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3280it [2:16:18,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3281it [2:16:20,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3282it [2:16:23,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3283it [2:16:25,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3284it [2:16:28,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3285it [2:16:30,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3286it [2:16:33,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3287it [2:16:35,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3288it [2:16:38,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3289it [2:16:40,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3290it [2:16:42,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3291it [2:16:45,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3292it [2:16:47,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3293it [2:16:50,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3294it [2:16:52,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3295it [2:16:55,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3296it [2:16:57,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3297it [2:17:00,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


3298it [2:17:02,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3299it [2:17:05,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3300it [2:17:07,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3301it [2:17:10,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3302it [2:17:12,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3303it [2:17:14,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


3304it [2:17:17,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


3305it [2:17:19,  2.39s/it]

torch.Size([124, 16]) torch.Size([1984])


3306it [2:17:22,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


3307it [2:17:24,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


3308it [2:17:27,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3309it [2:17:29,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3310it [2:17:31,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3311it [2:17:34,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3312it [2:17:37,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


3313it [2:17:39,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3314it [2:17:42,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3315it [2:17:44,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3316it [2:17:47,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3317it [2:17:49,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3318it [2:17:51,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3319it [2:17:54,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3320it [2:17:57,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


3321it [2:17:59,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


3322it [2:18:02,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3323it [2:18:04,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3324it [2:18:07,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3325it [2:18:09,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3326it [2:18:11,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3327it [2:18:14,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3328it [2:18:16,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3329it [2:18:19,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3330it [2:18:21,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3331it [2:18:23,  2.40s/it]

torch.Size([124, 16]) torch.Size([1984])


3332it [2:18:26,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


3333it [2:18:28,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3334it [2:18:31,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3335it [2:18:34,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


3336it [2:18:36,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


3337it [2:18:39,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3338it [2:18:41,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3339it [2:18:43,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3340it [2:18:46,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3341it [2:18:48,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3342it [2:18:51,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3343it [2:18:53,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3344it [2:18:56,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3345it [2:18:58,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


3346it [2:19:01,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


3347it [2:19:03,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3348it [2:19:06,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3349it [2:19:08,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3350it [2:19:11,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3351it [2:19:13,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3352it [2:19:16,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3353it [2:19:18,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3354it [2:19:21,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3355it [2:19:23,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3356it [2:19:26,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3357it [2:19:28,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3358it [2:19:31,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3359it [2:19:33,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3360it [2:19:36,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3361it [2:19:38,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3362it [2:19:41,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3363it [2:19:43,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3364it [2:19:46,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3365it [2:19:48,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3366it [2:19:51,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3367it [2:19:53,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3368it [2:19:56,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3369it [2:19:58,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3370it [2:20:01,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3371it [2:20:03,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3372it [2:20:06,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3373it [2:20:08,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3374it [2:20:10,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3375it [2:20:13,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3376it [2:20:15,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3377it [2:20:18,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3378it [2:20:20,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3379it [2:20:23,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3380it [2:20:25,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3381it [2:20:28,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3382it [2:20:30,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3383it [2:20:33,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3384it [2:20:35,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3385it [2:20:38,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3386it [2:20:40,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3387it [2:20:42,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3388it [2:20:45,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3389it [2:20:47,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3390it [2:20:50,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3391it [2:20:52,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3392it [2:20:55,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3393it [2:20:57,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3394it [2:21:00,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3395it [2:21:02,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3396it [2:21:05,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3397it [2:21:07,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3398it [2:21:09,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3399it [2:21:12,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])
训练损失为1.6348614937242334
春风吹落梅花绽，银河悠悠落江色。长安鄂君湘水边，粲拂花屏春到晓。洛阳宫吏夜归来，青楼玉阙空相望。辇外花枝花正开，柳堤花谢年来来。水淹独倚平阳鴈，柳里年年照仙信。倡楼二月笳，飘曳玉山落。君王镜席快奉颜，比翼为君倾国律。鸣环拂拂绣鸳绮，捍辔鸣珂伤袖力。壽留天下不相思，可惜胡莺何处说。始知绝顶古来高，莫使人间弃离別。但令出没汗云鬟，还似他人赠如昨。君恩未尽不知深，粉扫南楼那复寻。
江海年暮春天流，我今见君卢武君。当年为爱青天宫，能在王王乐清寰。忆君二八豔天子，君家献珍不封叔。今年敕赐丞相故，天爵英雄皆可在。愿言得似长鸣钟，却是皇时不知暮。自言天下无此身，唯君此別为欢乐。请君写诉君谓知，日夕悲欢信为此。君不见西南城邑重生子来白头，健步不复依青冥。中原旧路人皆羨，哀岐孰能皆苦辛。君看长安西北来，倜傥郎身赐天殿。我来撰士心伯词，我本太守还侯资。念君高歌盛才遇，尧年可在胡生路。胡人
花界人不知，贤人相对设。请君西舍欢，慰我心欲矣。始尝入鄱阳，仁尚美神薛。胡马集锋罗，羣公亦攀薄。遂耕二贤盛，筑宅无愧讳。或临墨鬼虚，莫遣麾藏奴。下策诛大夫，杀戮肝嫂掉。眼昏猛虎怒，健阵还逦迤。最深何由危，万里无乾坤。突兀九江湄，然后几回矣。下视平原水，蹴鞠擒飞鸟。附掾不敢论，敢望新嘘陇。日夜施御躯，使人锋镝多。谁能报明代，斩虏咸百万。
朝阳冬夜雨，北望孤云暮。南山值秋夜，风水清如朴。何言最此中，终日在林薮。大哉龙蛇出，九陌花亭上。弱龄晼虚皇，神色无时见。岂无区中友，投地可承手。往往聆时词，养生不盈担。慈恩茍不染，跼视终身橐。万禄不可驰，谁能知雅量。踌蹰讵可量，拱舜恩不辍。所以万壽恩，不得万壽悅。是非不得意，返为生廉旷。吾欲喻元戎，授然宣大职。圣皇情睿道，中使资所系。伊昔挺翘丹，永焉挹至理。
秋光重卷皓光浮，佩鼎刀刀软缊衣。乍绕槛边分卷仄，碎轻冰焰上轻肥。斜花上阁看如鸟，带水夫人旋解衣。半醉傍人欹枕臥，远山先拂冻光飞。西园晚色如风起，灩灩愁红半掩扉。胡为夜眠空阔杵，几回衽幰冻霏霏。烟欺帐院空行隐，满院花阴半掩扉。红树又逢新月落，一枝闲倚晚风归。我今又见三年別，旧业新年又在秋。岁月各为霑照瓦，争知只合鹊南飞。
月胧濛，潮色浅，露月青枫塞天吼。虫声萧萧萧萧吹，草色萋萋长安道。人家

3400it [2:21:19,  3.88s/it]

夜月如溪月，青松有百场。低枝妬小戏，豔叶鲜相藏。朵落无瑕股，圆分同丈蜂。巧来不状味，渴鸟来相溅。整翼助新文，罗奁飜夜床。救鳞状挟炮，持斧不敢尝。箭啮丈人怜，跳爪鲛者呶。尖罅惹阴禽，叉爪承软噫。憨处若为患，顺此稷与筐。隐视万木余，蹶贯五色光。吾欲任玄祸，毒风以为萌。超遥指蕃壑，庶几心莫量。若不聋朽言，不可死自伤。
torch.Size([124, 16]) torch.Size([1984])


3401it [2:21:21,  3.41s/it]

torch.Size([124, 16]) torch.Size([1984])


3402it [2:21:24,  3.09s/it]

torch.Size([124, 16]) torch.Size([1984])


3403it [2:21:26,  2.88s/it]

torch.Size([124, 16]) torch.Size([1984])


3404it [2:21:29,  2.75s/it]

torch.Size([124, 16]) torch.Size([1984])


3405it [2:21:31,  2.68s/it]

torch.Size([124, 16]) torch.Size([1984])


3406it [2:21:34,  2.64s/it]

torch.Size([124, 16]) torch.Size([1984])


3407it [2:21:36,  2.60s/it]

torch.Size([124, 16]) torch.Size([1984])


3408it [2:21:39,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


3409it [2:21:41,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


3410it [2:21:44,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3411it [2:21:46,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3412it [2:21:48,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3413it [2:21:51,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3414it [2:21:53,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3415it [2:21:56,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3416it [2:21:58,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3417it [2:22:01,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3418it [2:22:03,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3419it [2:22:06,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3420it [2:22:08,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3421it [2:22:11,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3422it [2:22:13,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3423it [2:22:15,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3424it [2:22:18,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3425it [2:22:20,  2.41s/it]

torch.Size([124, 16]) torch.Size([1984])


3426it [2:22:23,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


3427it [2:22:25,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3428it [2:22:27,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3429it [2:22:30,  2.42s/it]

torch.Size([124, 16]) torch.Size([1984])


3430it [2:22:32,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3431it [2:22:35,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3432it [2:22:37,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3433it [2:22:40,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3434it [2:22:42,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3435it [2:22:45,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3436it [2:22:47,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3437it [2:22:50,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3438it [2:22:52,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3439it [2:22:55,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3440it [2:22:57,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3441it [2:23:00,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3442it [2:23:02,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3443it [2:23:05,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3444it [2:23:07,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3445it [2:23:10,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3446it [2:23:12,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3447it [2:23:15,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3448it [2:23:17,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3449it [2:23:19,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3450it [2:23:22,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3451it [2:23:24,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3452it [2:23:27,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3453it [2:23:29,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3454it [2:23:32,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3455it [2:23:34,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3456it [2:23:37,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3457it [2:23:39,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3458it [2:23:42,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3459it [2:23:44,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3460it [2:23:47,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3461it [2:23:49,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3462it [2:23:52,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3463it [2:23:54,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3464it [2:23:56,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3465it [2:23:59,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3466it [2:24:01,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3467it [2:24:04,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3468it [2:24:07,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3469it [2:24:09,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3470it [2:24:11,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3471it [2:24:14,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3472it [2:24:16,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3473it [2:24:19,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3474it [2:24:21,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3475it [2:24:24,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3476it [2:24:26,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3477it [2:24:29,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3478it [2:24:31,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3479it [2:24:33,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3480it [2:24:36,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


3481it [2:24:38,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3482it [2:24:41,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


3483it [2:24:44,  2.66s/it]

torch.Size([124, 16]) torch.Size([1984])


3484it [2:24:47,  2.60s/it]

torch.Size([124, 16]) torch.Size([1984])


3485it [2:24:49,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


3486it [2:24:52,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


3487it [2:24:54,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


3488it [2:24:57,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


3489it [2:24:59,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3490it [2:25:01,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3491it [2:25:04,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3492it [2:25:06,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3493it [2:25:09,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3494it [2:25:11,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3495it [2:25:14,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3496it [2:25:16,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3497it [2:25:19,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3498it [2:25:21,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3499it [2:25:24,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3500it [2:25:26,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3501it [2:25:29,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3502it [2:25:31,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3503it [2:25:34,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3504it [2:25:36,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3505it [2:25:39,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3506it [2:25:41,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3507it [2:25:43,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3508it [2:25:46,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3509it [2:25:48,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3510it [2:25:51,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3511it [2:25:53,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3512it [2:25:56,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3513it [2:25:58,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3514it [2:26:01,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


3515it [2:26:03,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


3516it [2:26:06,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3517it [2:26:08,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3518it [2:26:11,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3519it [2:26:13,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3520it [2:26:16,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3521it [2:26:18,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3522it [2:26:21,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


3523it [2:26:23,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3524it [2:26:26,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


3525it [2:26:28,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


3526it [2:26:31,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


3527it [2:26:33,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


3528it [2:26:36,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


3529it [2:26:38,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


3530it [2:26:41,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


3531it [2:26:43,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


3532it [2:26:46,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


3533it [2:26:49,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


3534it [2:26:51,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


3535it [2:26:54,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


3536it [2:26:56,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


3537it [2:26:59,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


3538it [2:27:01,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


3539it [2:27:04,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


3540it [2:27:06,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


3541it [2:27:09,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


3542it [2:27:11,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


3543it [2:27:14,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


3544it [2:27:17,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


3545it [2:27:19,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


3546it [2:27:22,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


3547it [2:27:24,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


3548it [2:27:27,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


3549it [2:27:29,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


3550it [2:27:32,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


3551it [2:27:34,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3552it [2:27:37,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


3553it [2:27:39,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3554it [2:27:42,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3555it [2:27:44,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3556it [2:27:47,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3557it [2:27:49,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3558it [2:27:52,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3559it [2:27:54,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3560it [2:27:57,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


3561it [2:28:00,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


3562it [2:28:02,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


3563it [2:28:05,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


3564it [2:28:07,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3565it [2:28:10,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


3566it [2:28:12,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


3567it [2:28:15,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


3568it [2:28:17,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3569it [2:28:20,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3570it [2:28:22,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3571it [2:28:25,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3572it [2:28:27,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3573it [2:28:29,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3574it [2:28:32,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


3575it [2:28:34,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3576it [2:28:37,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


3577it [2:28:39,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3578it [2:28:42,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


3579it [2:28:45,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


3580it [2:28:47,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


3581it [2:28:50,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


3582it [2:28:52,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


3583it [2:28:55,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


3584it [2:28:57,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


3585it [2:29:00,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


3586it [2:29:02,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


3587it [2:29:05,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


3588it [2:29:07,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


3589it [2:29:10,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


3590it [2:29:13,  2.62s/it]

torch.Size([124, 16]) torch.Size([1984])


3591it [2:29:15,  2.61s/it]

torch.Size([124, 16]) torch.Size([1984])


3592it [2:29:18,  2.60s/it]

torch.Size([124, 16]) torch.Size([1984])


3593it [2:29:21,  2.61s/it]

torch.Size([124, 16]) torch.Size([1984])


3594it [2:29:23,  2.60s/it]

torch.Size([124, 16]) torch.Size([1984])


3595it [2:29:26,  2.61s/it]

torch.Size([124, 16]) torch.Size([1984])


3596it [2:29:28,  2.61s/it]

torch.Size([124, 16]) torch.Size([1984])


3597it [2:29:31,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


3598it [2:29:33,  2.58s/it]

torch.Size([124, 12]) torch.Size([1488])


3599it [2:29:36,  2.49s/it]
0it [00:00, ?it/s]

torch.Size([124, 16]) torch.Size([1984])


1it [00:03,  3.27s/it]

torch.Size([124, 16]) torch.Size([1984])


2it [00:05,  2.88s/it]

torch.Size([124, 16]) torch.Size([1984])


3it [00:08,  2.74s/it]

torch.Size([124, 16]) torch.Size([1984])


4it [00:11,  2.68s/it]

torch.Size([124, 16]) torch.Size([1984])


5it [00:13,  2.64s/it]

torch.Size([124, 16]) torch.Size([1984])


6it [00:16,  2.63s/it]

torch.Size([124, 16]) torch.Size([1984])


7it [00:18,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


8it [00:21,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


9it [00:23,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


10it [00:26,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


11it [00:28,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


12it [00:31,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


13it [00:34,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


14it [00:36,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


15it [00:39,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


16it [00:41,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


17it [00:44,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


18it [00:46,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


19it [00:49,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


20it [00:51,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


21it [00:54,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


22it [00:56,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


23it [00:59,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


24it [01:01,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


25it [01:03,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


26it [01:06,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


27it [01:08,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


28it [01:11,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


29it [01:13,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


30it [01:16,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


31it [01:18,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


32it [01:21,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


33it [01:23,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


34it [01:26,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


35it [01:28,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


36it [01:31,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


37it [01:33,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


38it [01:36,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


39it [01:38,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


40it [01:41,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


41it [01:44,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


42it [01:46,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


43it [01:49,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


44it [01:51,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


45it [01:53,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


46it [01:56,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


47it [01:58,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


48it [02:01,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


49it [02:03,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


50it [02:06,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


51it [02:08,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


52it [02:11,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


53it [02:13,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


54it [02:16,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


55it [02:18,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


56it [02:21,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


57it [02:23,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


58it [02:26,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


59it [02:28,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


60it [02:31,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


61it [02:33,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


62it [02:35,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


63it [02:38,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


64it [02:40,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


65it [02:43,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


66it [02:45,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


67it [02:48,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


68it [02:50,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


69it [02:53,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


70it [02:55,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


71it [02:58,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


72it [03:00,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


73it [03:03,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


74it [03:05,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


75it [03:08,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


76it [03:10,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


77it [03:13,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


78it [03:15,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


79it [03:18,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


80it [03:20,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


81it [03:23,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


82it [03:25,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


83it [03:28,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


84it [03:30,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


85it [03:33,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


86it [03:35,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


87it [03:38,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


88it [03:40,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


89it [03:43,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


90it [03:45,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


91it [03:48,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


92it [03:50,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


93it [03:53,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


94it [03:55,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


95it [03:57,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


96it [04:00,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


97it [04:02,  2.46s/it]

torch.Size([124, 16]) torch.Size([1984])


98it [04:05,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


99it [04:07,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


100it [04:10,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


101it [04:12,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


102it [04:15,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


103it [04:17,  2.48s/it]

torch.Size([124, 16]) torch.Size([1984])


104it [04:20,  2.47s/it]

torch.Size([124, 16]) torch.Size([1984])


105it [04:22,  2.45s/it]

torch.Size([124, 16]) torch.Size([1984])


106it [04:25,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


107it [04:27,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


108it [04:29,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


109it [04:32,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


110it [04:34,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


111it [04:37,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


112it [04:39,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


113it [04:42,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


114it [04:44,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


115it [04:47,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


116it [04:49,  2.43s/it]

torch.Size([124, 16]) torch.Size([1984])


117it [04:51,  2.44s/it]

torch.Size([124, 16]) torch.Size([1984])


118it [04:54,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


119it [04:57,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


120it [04:59,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


121it [05:02,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


122it [05:04,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


123it [05:07,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


124it [05:09,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


125it [05:12,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


126it [05:14,  2.53s/it]

torch.Size([124, 16]) torch.Size([1984])


127it [05:17,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


128it [05:20,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


129it [05:22,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


130it [05:25,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


131it [05:27,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


132it [05:30,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


133it [05:32,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


134it [05:35,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


135it [05:38,  2.58s/it]

torch.Size([124, 16]) torch.Size([1984])


136it [05:40,  2.59s/it]

torch.Size([124, 16]) torch.Size([1984])


137it [05:43,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


138it [05:45,  2.57s/it]

torch.Size([124, 16]) torch.Size([1984])


139it [05:48,  2.55s/it]

torch.Size([124, 16]) torch.Size([1984])


140it [05:50,  2.52s/it]

torch.Size([124, 16]) torch.Size([1984])


141it [05:53,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


142it [05:55,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


143it [05:58,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


144it [06:00,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


145it [06:03,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


146it [06:05,  2.51s/it]

torch.Size([124, 16]) torch.Size([1984])


147it [06:08,  2.49s/it]

torch.Size([124, 16]) torch.Size([1984])


148it [06:10,  2.50s/it]

torch.Size([124, 16]) torch.Size([1984])


149it [06:13,  2.54s/it]

torch.Size([124, 16]) torch.Size([1984])


150it [06:15,  2.56s/it]

torch.Size([124, 16]) torch.Size([1984])


150it [06:18,  2.52s/it]
ERROR:root:Internal Python error in the inspect module.
Below is the traceback from this internal error.



Traceback (most recent call last):
  File "C:\anaconda3\lib\site-packages\IPython\core\interactiveshell.py", line 3437, in run_code
    exec(code_obj, self.user_global_ns, self.user_ns)
  File "<ipython-input-13-4c5cbcc49fcb>", line 74, in <module>
    train()
  File "<ipython-input-13-4c5cbcc49fcb>", line 57, in train
    loss.backward()
  File "C:\anaconda3\lib\site-packages\torch\tensor.py", line 245, in backward
    torch.autograd.backward(self, gradient, retain_graph, create_graph, inputs=inputs)
  File "C:\anaconda3\lib\site-packages\torch\autograd\__init__.py", line 145, in backward
    Variable._execution_engine.run_backward(
KeyboardInterrupt

During handling of the above exception, another exception occurred:

Traceback (most recent call last):
  File "C:\anaconda3\lib\site-packages\IPython\core\interactiveshell.py", line 2061, in showtraceback
    stb = value._render_traceback_()
AttributeError: 'KeyboardInterrupt' object has no attribute '_render_traceback_'

During handlin

TypeError: object of type 'NoneType' has no len()