In [None]:
import torch
import torchvision.models as models

# Build both pre-trained classifiers and put each one straight into
# evaluation mode (Module.eval() returns the module itself, so the call
# can be chained onto the constructor).
# NOTE(review): newer torchvision releases replace `pretrained=True` with a
# `weights=` argument — confirm against the installed version before changing.
alexnet = models.alexnet(pretrained=True).eval()
vgg16 = models.vgg16(pretrained=True).eval()

# Dump the layer structure of each network
print("AlexNet:", alexnet)
print("\nVGG16:", vgg16)


Downloading: "https://download.pytorch.org/models/alexnet-owt-7be5be79.pth" to /root/.cache/torch/hub/checkpoints/alexnet-owt-7be5be79.pth
100%|██████████| 233M/233M [00:03<00:00, 69.4MB/s]
Downloading: "https://download.pytorch.org/models/vgg16-397923af.pth" to /root/.cache/torch/hub/checkpoints/vgg16-397923af.pth
100%|██████████| 528M/528M [00:06<00:00, 82.7MB/s]


AlexNet: AlexNet(
  (features): Sequential(
    (0): Conv2d(3, 64, kernel_size=(11, 11), stride=(4, 4), padding=(2, 2))
    (1): ReLU(inplace=True)
    (2): MaxPool2d(kernel_size=3, stride=2, padding=0, dilation=1, ceil_mode=False)
    (3): Conv2d(64, 192, kernel_size=(5, 5), stride=(1, 1), padding=(2, 2))
    (4): ReLU(inplace=True)
    (5): MaxPool2d(kernel_size=3, stride=2, padding=0, dilation=1, ceil_mode=False)
    (6): Conv2d(192, 384, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
    (7): ReLU(inplace=True)
    (8): Conv2d(384, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
    (9): ReLU(inplace=True)
    (10): Conv2d(256, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
    (11): ReLU(inplace=True)
    (12): MaxPool2d(kernel_size=3, stride=2, padding=0, dilation=1, ceil_mode=False)
  )
  (avgpool): AdaptiveAvgPool2d(output_size=(6, 6))
  (classifier): Sequential(
    (0): Dropout(p=0.5, inplace=False)
    (1): Linear(in_features=9216, out_features=4096, bia

In [None]:
from torchvision import transforms
from PIL import Image
import urllib.request

In [None]:
# Preprocessing pipeline applied to every image before it is fed to a model:
# resize, centre-crop to 224x224, convert to a tensor, then normalise each
# channel (presumably with the ImageNet channel statistics — confirm).
resize_step = transforms.Resize(256)
crop_step = transforms.CenterCrop(224)
to_tensor_step = transforms.ToTensor()
normalize_step = transforms.Normalize(
    mean=[0.485, 0.456, 0.406],
    std=[0.229, 0.224, 0.225],
)

transform = transforms.Compose(
    [resize_step, crop_step, to_tensor_step, normalize_step]
)


In [None]:
def predict_image(model, image_path, transform):
    """Classify a single image file and return the winning class index.

    Args:
        model: Callable (e.g. a torch ``nn.Module``) that maps a batched
            image tensor to a 2-D score tensor of shape (batch, classes).
            This function does not change the model's train/eval mode; the
            caller is responsible for that.
        image_path: Path (or file object) handed to ``Image.open``.
        transform: Callable that turns a PIL image into a tensor; a batch
            dimension is added to its result before calling ``model``.

    Returns:
        int: Index of the highest score along dimension 1 for the image.
    """
    # Open inside a context manager so the underlying file handle is released,
    # and force three colour channels: grayscale, palette or RGBA files would
    # otherwise produce 1- or 4-channel tensors that do not match a 3-channel
    # normalisation step or a model expecting RGB input.
    with Image.open(image_path) as source_image:
        rgb_image = source_image.convert("RGB")

    batch = transform(rgb_image).unsqueeze(0)  # Add batch dimension

    # Inference only: no gradients need to be tracked.
    with torch.no_grad():
        outputs = model(batch)

    return outputs.argmax(dim=1).item()


In [None]:
# Location of the image to classify; it is passed to predict_image() for both
# models, so the file must exist at this absolute path before those calls run.
image_path = "/content/Tree.jpg"

In [None]:
# Classify the image with AlexNet and report the raw class index
alexnet_prediction = predict_image(
    model=alexnet,
    image_path=image_path,
    transform=transform,
)
print("AlexNet prediction:", alexnet_prediction)

# Same image, same preprocessing, this time through VGG16
vgg16_prediction = predict_image(
    model=vgg16,
    image_path=image_path,
    transform=transform,
)
print("VGG16 prediction:", vgg16_prediction)

AlexNet prediction: 912
VGG16 prediction: 975


In [None]:
def parse_class_labels(lines):
    """Return a list in which position ``i`` holds the label of class ``i``.

    Two line formats are handled:

    * ``"<index>, <label>"`` — the embedded index decides where the label is
      stored, so extra header or blank lines in the file cannot shift the
      mapping. Lines without such a prefix are ignored in this mode, and
      class ids that never appear are filled with ``None``.
    * plain ``"<label>"`` lines — used only when no line carries an index;
      the stripped lines are returned unchanged, so the line position is the
      class index.

    Args:
        lines: Iterable of text lines (e.g. an open text file).

    Returns:
        list: Labels addressable by integer class index.
    """
    stripped = [line.strip() for line in lines]

    indexed = {}
    for entry in stripped:
        prefix, comma, name = entry.partition(",")
        prefix = prefix.strip()
        if comma and prefix.isdecimal():
            indexed[int(prefix)] = name.strip()

    if not indexed:
        # No embedded indices: fall back to purely positional labels.
        return stripped

    return [indexed.get(class_id) for class_id in range(max(indexed) + 1)]


# Load class labels.
# Indexing the raw lines by position gave misaligned results with this file:
# model index 912 printed the line "908, wing". Each line carries its own
# class index, so the labels are keyed on that index instead of on the line
# number.
with open("imagenet_classes.txt") as f:
    class_labels = parse_class_labels(f)

# Print predicted labels
print("AlexNet prediction:", class_labels[alexnet_prediction])
print("VGG16 prediction:", class_labels[vgg16_prediction])


AlexNet prediction: 908, wing
VGG16 prediction: 971, bubble
