# 读取和存储

## 读写Tensor

In [6]:
import torch
from torch import nn

# 单个Tensor写
x = torch.ones(3)
torch.save(x, 'x.pt')
# 单个Tensor读
x2 = torch.load('x.pt')
x2


  x2 = torch.load('x.pt')


tensor([1., 1., 1.])

In [7]:
# Tensor列表写
y = torch.zeros(4)
torch.save([x, y], 'x.pt')
# Tensor列表读
xy_list = torch.load('x.pt')
xy_list



  xy_list = torch.load('x.pt')


[tensor([1., 1., 1.]), tensor([0., 0., 0., 0.])]

In [8]:
# Tensor字典写
torch.save({'x': x, 'y': y}, 'x_dict.pt')
# Tensor字典读
xy = torch.load('x_dict.pt')
xy


  xy = torch.load('x_dict.pt')


{'x': tensor([1., 1., 1.]), 'y': tensor([0., 0., 0., 0.])}

## 读写模型

In [9]:
# net.state_dict()用来获取模型的参数和缓冲区（比如权重、偏置）组成的字典
class MLP(nn.Module):
    def __init__(self):
        super(MLP, self).__init__()
        self.hidden = nn.Linear(3, 2)
        self.act = nn.ReLU()
        self.output = nn.Linear(2, 1)

    def forward(self, x):
        a = self.act(self.hidden(x))
        return self.output(a)

net = MLP()
net.state_dict()


OrderedDict([('hidden.weight',
              tensor([[-0.0391, -0.0036,  0.3501],
                      [ 0.3094, -0.0750, -0.1477]])),
             ('hidden.bias', tensor([ 0.3402, -0.5161])),
             ('output.weight', tensor([[-0.0817, -0.0907]])),
             ('output.bias', tensor([-0.2088]))])

In [10]:
# 模型中，只有含可学习参数的层才有status_dict
# optimizer也有status_dict
optimizer = torch.optim.SGD(net.parameters(), lr=0.001, momentum=0.9)
optimizer.state_dict()


{'state': {},
 'param_groups': [{'lr': 0.001,
   'momentum': 0.9,
   'dampening': 0,
   'weight_decay': 0,
   'nesterov': False,
   'maximize': False,
   'foreach': None,
   'differentiable': False,
   'fused': None,
   'params': [0, 1, 2, 3]}]}

In [11]:
# # 模型保存
# torch.save(model.state_dict(), PATH) # 推荐的文件后缀名是pt或pth
# # 模型加载
# model = TheModelClass(*args, **kwargs)
# model.load_state_dict(torch.load(PATH))

X = torch.randn(2, 3)
Y = net(X)

PATH = "./net.pt"
torch.save(net.state_dict(), PATH)

net2 = MLP()
net2.load_state_dict(torch.load(PATH))
Y2 = net2(X)
Y2 == Y


  net2.load_state_dict(torch.load(PATH))


tensor([[True],
        [True]])