In [None]:
import torch
import torch.nn as nn
import torch.optim as optim
import torchvision
import torchvision.transforms as transforms

# 1. Data loading and preprocessing
# Convert each image to a tensor, then normalise its single channel with
# mean 0.5 and std 0.5.
transform = transforms.Compose([
    transforms.ToTensor(),
    transforms.Normalize(mean=(0.5,), std=(0.5,)),
])

# Training split (download=True stores it under ./data); batches of 32, shuffled.
trainset = torchvision.datasets.MNIST(
    root='./data',
    train=True,
    download=True,
    transform=transform,
)
trainloader = torch.utils.data.DataLoader(dataset=trainset, batch_size=32, shuffle=True)

# Test split; same preprocessing, batches of 32, fixed order.
testset = torchvision.datasets.MNIST(
    root='./data',
    train=False,
    download=True,
    transform=transform,
)
testloader = torch.utils.data.DataLoader(dataset=testset, batch_size=32, shuffle=False)

# 2. Define the neural network model
class MNISTNet(nn.Module):
    """Two-layer fully connected classifier whose first layer is frozen.

    ``fc1`` maps 784 -> 784 features; its weight is re-initialised with
    Xavier-uniform values and both its weight and bias are excluded from
    gradient updates. ``fc2`` maps 784 -> 10 and is the only trainable layer.
    """

    def __init__(self):
        super().__init__()
        self.fc1 = nn.Linear(784, 784)
        nn.init.xavier_uniform_(self.fc1.weight)  # re-initialise the first layer's weight
        self.fc2 = nn.Linear(784, 10)

        # Freeze the first layer: every parameter of fc1 (weight AND bias)
        # stops receiving gradients.
        for param in self.fc1.parameters():
            param.requires_grad = False

    def forward(self, x):
        """Flatten ``x`` into rows of 784 values and return a 10-column output.

        Args:
            x: tensor whose total number of elements is a multiple of 784.

        Returns:
            Tensor of shape ``(N, 10)`` where ``N = x.numel() // 784``.
        """
        # reshape (rather than view) also accepts non-contiguous inputs,
        # e.g. a transposed batch, instead of raising a RuntimeError.
        x = x.reshape(-1, 784)
        x = torch.relu(self.fc1(x))
        return self.fc2(x)

model = MNISTNet()

# 3. Define the loss function and optimizer
criterion = nn.CrossEntropyLoss()
# Only parameters that still require gradients are handed to the optimizer,
# so the frozen first layer is never updated.
optimizer = optim.SGD(filter(lambda p: p.requires_grad, model.parameters()), lr=0.01)

# 4. Train the model
for epoch in range(10):
    # The evaluation pass below switches to eval mode, so restore training
    # mode at the start of every epoch.
    model.train()
    running_loss = 0.0
    for inputs, labels in trainloader:
        optimizer.zero_grad()

        outputs = model(inputs)
        loss = criterion(outputs, labels)
        loss.backward()
        optimizer.step()

        running_loss += loss.item()
    # Mean of the per-batch losses over the epoch.
    print(f"Epoch {epoch+1}, Loss: {running_loss/len(trainloader)}")

    # Compute accuracy on the test set
    model.eval()
    correct = 0
    total = 0
    with torch.no_grad():
        for images, labels in testloader:
            outputs = model(images)
            # Predicted class = index of the largest output per row.
            predicted = outputs.argmax(dim=1)
            total += labels.size(0)
            correct += (predicted == labels).sum().item()

    print(f"Accuracy on test set: {100 * correct / total}%")

print("Finished Training")

In [1]:
import torch
import torch.nn as nn
import torch.optim as optim
import torchvision
import torchvision.transforms as transforms
# Select GPU index 5 only when CUDA is available AND that index actually
# exists on this machine; otherwise fall back to the CPU.
device = torch.device(
    "cuda:5" if torch.cuda.is_available() and torch.cuda.device_count() > 5 else "cpu"
)

  warn(f"Failed to load image Python extension: {e}")


In [2]:
# 1. Data loading and preprocessing
# Convert each image to a tensor, then normalise its single channel with
# mean 0.5 and std 0.5.
transform = transforms.Compose([
    transforms.ToTensor(),
    transforms.Normalize(mean=(0.5,), std=(0.5,)),
])

# Training split (download=True stores it under ./data); batches of 32, shuffled.
trainset = torchvision.datasets.MNIST(
    root='./data',
    train=True,
    download=True,
    transform=transform,
)
trainloader = torch.utils.data.DataLoader(dataset=trainset, batch_size=32, shuffle=True)

# Test split; same preprocessing, batches of 32, fixed order.
testset = torchvision.datasets.MNIST(
    root='./data',
    train=False,
    download=True,
    transform=transform,
)
testloader = torch.utils.data.DataLoader(dataset=testset, batch_size=32, shuffle=False)


In [3]:
# 2. Define the neural network model
class MNISTNet(nn.Module):
    """Two-layer fully connected classifier whose first layer is frozen.

    ``fc1`` maps 784 -> 784 features; its weight is re-initialised with
    Xavier-uniform values and both its weight and bias are excluded from
    gradient updates. ``fc2`` maps 784 -> 10 and is the only trainable layer.
    """

    def __init__(self):
        super().__init__()
        self.fc1 = nn.Linear(784, 784)
        nn.init.xavier_uniform_(self.fc1.weight)  # re-initialise the first layer's weight
        self.fc2 = nn.Linear(784, 10)

        # Freeze the first layer: every parameter of fc1 (weight AND bias)
        # stops receiving gradients.
        for param in self.fc1.parameters():
            param.requires_grad = False

    def forward(self, x):
        """Flatten ``x`` into rows of 784 values and return a 10-column output.

        Args:
            x: tensor whose total number of elements is a multiple of 784.

        Returns:
            Tensor of shape ``(N, 10)`` where ``N = x.numel() // 784``.
        """
        # reshape (rather than view) also accepts non-contiguous inputs,
        # e.g. a transposed batch, instead of raising a RuntimeError.
        x = x.reshape(-1, 784)
        x = torch.relu(self.fc1(x))
        return self.fc2(x)

model = MNISTNet()

In [4]:
# 3. Define the loss function and optimizer
criterion = nn.CrossEntropyLoss()
# Only parameters that still require gradients are handed to the optimizer,
# so the frozen first layer is never updated.
optimizer = optim.SGD(filter(lambda p: p.requires_grad, model.parameters()), lr=0.01)

# NOTE(review): `device` is defined in the imports cell but is not used here;
# the model and the batches are never moved to it. Confirm whether that is
# intended before wiring in `.to(device)`.

# 4. Train the model
for epoch in range(10):
    # The evaluation pass below switches to eval mode, so restore training
    # mode at the start of every epoch.
    model.train()
    running_loss = 0.0
    for inputs, labels in trainloader:
        optimizer.zero_grad()

        outputs = model(inputs)
        loss = criterion(outputs, labels)
        loss.backward()
        optimizer.step()

        running_loss += loss.item()
    # Mean of the per-batch losses over the epoch.
    print(f"Epoch {epoch+1}, Loss: {running_loss/len(trainloader)}")

    # Compute accuracy on the test set
    model.eval()
    correct = 0
    total = 0
    with torch.no_grad():
        for images, labels in testloader:
            outputs = model(images)
            # Predicted class = index of the largest output per row.
            predicted = outputs.argmax(dim=1)
            total += labels.size(0)
            correct += (predicted == labels).sum().item()

    print(f"Accuracy on test set: {100 * correct / total}%")

print("Finished Training")

Epoch 1, Loss: 0.6496705929756165
Accuracy on test set: 89.27%
Epoch 2, Loss: 0.3982198082089424
Accuracy on test set: 90.3%
Epoch 3, Loss: 0.3558166202902794
Accuracy on test set: 90.86%
Epoch 4, Loss: 0.33314823386669157
Accuracy on test set: 91.44%
Epoch 5, Loss: 0.3168796214501063
Accuracy on test set: 91.54%
Epoch 6, Loss: 0.3049309025088946
Accuracy on test set: 91.56%
Epoch 7, Loss: 0.2954294763863087
Accuracy on test set: 92.07%
Epoch 8, Loss: 0.2875973941385746
Accuracy on test set: 92.19%
Epoch 9, Loss: 0.28053308519323666
Accuracy on test set: 92.49%
Epoch 10, Loss: 0.27475158662796023
Accuracy on test set: 92.49%
Finished Training
