In [5]:
# %matplotlib inline
import torch
import torchvision
from torch.utils import data
from torchvision import transforms
from d2l import torch as d2l

# Ask d2l to display figures as SVG.
d2l.use_svg_display()

In [6]:
# Use SVG to display figures.
# NOTE(review): this repeats the call already made at the end of the import cell.
d2l.use_svg_display()

In [11]:
# Transform applied to every sample: convert the image to a tensor.
trans = transforms.ToTensor()

# Training split of Fashion-MNIST, stored under ./data (download requested).
mnist_train = torchvision.datasets.FashionMNIST(
    root='./data',
    train=True,
    download=True,
    transform=trans,
)

In [7]:
# Transform applied to every sample: convert the image to a tensor.
trans = transforms.ToTensor()

# Training split, read from ./data without requesting a download.
mnist_train = torchvision.datasets.FashionMNIST(
    root='./data',
    train=True,
    download=False,
    transform=trans,
)

# Test split, read from the same directory with the same transform.
mnist_test = torchvision.datasets.FashionMNIST(
    root='./data',
    train=False,
    download=False,
    transform=trans,
)

# Cell output: number of samples in each split.
(len(mnist_train), len(mnist_test))

(60000, 10000)

In [45]:
# Shape of the first element of the first training sample
# (the recorded output below shows torch.Size([1, 28, 28])).
mnist_train[0][0].shape

torch.Size([1, 28, 28])

In [46]:
def get_fashion_mnist_labels(labels):
    """Translate numeric Fashion-MNIST class indices into text labels.

    Args:
        labels: Iterable of class indices. Each element is converted with
            ``int()`` before it is used as an index.

    Returns:
        A list of label strings in the same order as ``labels``.
    """
    class_names = [
        't-shirt', 'trouser', 'pullover', 'dress', 'coat',
        'sandal', 'shirt', 'sneaker', 'bag', 'ankle boot',
    ]
    names = []
    for label in labels:
        names.append(class_names[int(label)])
    return names

In [47]:
def show_images(imgs, num_rows, num_cols, titles=None, scale=1.5):
    """Plot a list of images on a ``num_rows`` x ``num_cols`` grid.

    Args:
        imgs: Sequence of images. Torch tensors are converted with
            ``.numpy()`` before plotting; anything else (e.g. a PIL image)
            is handed to ``imshow`` unchanged.
        num_rows: Number of grid rows.
        num_cols: Number of grid columns.
        titles: Optional sequence of titles, indexed in parallel with ``imgs``.
        scale: Per-cell size factor; the figure size is
            ``(num_cols * scale, num_rows * scale)``.

    Returns:
        The flattened array of axes, one entry per grid cell.
    """
    figsize = (num_cols * scale, num_rows * scale)
    # squeeze=False always returns a 2-D array of axes, so flatten() also
    # works for a 1x1 grid (where subplots would otherwise return a bare Axes).
    _, axes = d2l.plt.subplots(num_rows, num_cols, figsize=figsize, squeeze=False)
    axes = axes.flatten()
    for i, (ax, img) in enumerate(zip(axes, imgs)):
        if torch.is_tensor(img):
            # Image given as a tensor
            ax.imshow(img.numpy())
        else:
            # PIL image
            ax.imshow(img)
        # Hide both axes; the method is `set_visible` (there is no `setvisible`).
        ax.axes.get_xaxis().set_visible(False)
        ax.axes.get_yaxis().set_visible(False)
        if titles:
            ax.set_title(titles[i])
    return axes

In [48]:
# Take the first batch (batch_size=18) from a loader over the training set.
x, y = next(iter(data.DataLoader(mnist_train, batch_size=18)))
# Disabled preview of that batch as a 2x9 grid titled with the text labels:
# show_images(x.reshape(18, 28, 28), 2, 9, titles=get_fashion_mnist_labels(y));

In [49]:
# Mini-batch size for the training loader built below.
batch_size = 256


def get_dataloader_workers():
    """Return the worker count passed as ``num_workers`` to the data loaders."""
    worker_count = 4
    return worker_count

# Shuffled loader over the training set, using the configured worker count.
train_iter = data.DataLoader(
    dataset=mnist_train,
    batch_size=batch_size,
    shuffle=True,
    num_workers=get_dataloader_workers(),
)

# Time one full pass over the loader; the batches themselves are not used.
timer = d2l.Timer()
for x, y in train_iter:
    pass
f'{timer.stop():.2f} sec'

'4.54 sec'

In [50]:
def load_data_fashion_mnist(batch_size, resize=None):
    """Download the Fashion-MNIST dataset and wrap both splits in data loaders.

    Args:
        batch_size: Batch size used for both the training and test loaders.
        resize: Optional size passed to ``transforms.Resize``; when given,
            images are resized before being converted to tensors.

    Returns:
        A ``(train_loader, test_loader)`` tuple of ``DataLoader`` objects.
        The training loader is shuffled; the test loader is not.
    """
    # Resize (if requested) must run before ToTensor, hence it goes first.
    steps = [transforms.ToTensor()]
    if resize:
        steps.insert(0, transforms.Resize(resize))
    trans = transforms.Compose(steps)

    mnist_train = torchvision.datasets.FashionMNIST(
        root='./data',
        train=True,
        transform=trans,
        download=True,
    )
    # The dataset directory keyword is `root`; passing `data=` raises a
    # TypeError for an unexpected keyword argument.
    mnist_test = torchvision.datasets.FashionMNIST(
        root='./data',
        train=False,
        transform=trans,
        download=True,
    )

    num_workers = get_dataloader_workers()
    train_loader = data.DataLoader(
        mnist_train, batch_size, shuffle=True, num_workers=num_workers
    )
    # Evaluation does not need a random order, so the test split is not shuffled.
    test_loader = data.DataLoader(
        mnist_test, batch_size, shuffle=False, num_workers=num_workers
    )
    return train_loader, test_loader