# Entrenamiento del modelo

In [2]:
import torch
from torchvision import datasets, models, transforms
from torch.utils.data import DataLoader
import os

# Preprocessing pipelines, keyed by dataset split.
# Both splits share the same per-channel mean/std normalization
# (presumably the ImageNet statistics expected by the pretrained
# backbone -- TODO confirm).
normalize = transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225])

data_transforms = {
    # Training: random crop + random horizontal flip as augmentation.
    'train': transforms.Compose([
        transforms.RandomResizedCrop(224),
        transforms.RandomHorizontalFlip(),
        transforms.ToTensor(),
        normalize,
    ]),
    # Validation: deterministic resize + center crop, no augmentation.
    'val': transforms.Compose([
        transforms.Resize(256),
        transforms.CenterCrop(224),
        transforms.ToTensor(),
        normalize,
    ]),
}

# Root folder; it must contain one sub-folder per split ('train', 'val').
data_dir = 'directorio_datos'
batch_size = 32

# One ImageFolder dataset per split, read from <data_dir>/<split>.
image_datasets = {
    split: datasets.ImageFolder(os.path.join(data_dir, split), data_transforms[split])
    for split in ('train', 'val')
}

# Only the training split is shuffled. Validation metrics do not depend on
# sample order, so shuffling there only makes evaluation non-reproducible.
dataloaders = {
    split: DataLoader(
        image_datasets[split],
        batch_size=batch_size,
        shuffle=(split == 'train'),
        num_workers=4,
    )
    for split in ('train', 'val')
}

# Sample counts per split, used to average the running loss and accuracy.
dataset_sizes = {split: len(image_datasets[split]) for split in ('train', 'val')}
# Class labels as discovered by ImageFolder on the training split.
class_names = image_datasets['train'].classes

In [None]:
from torch import nn

# Use ResNet50 with pretrained weights as the backbone.
model = models.resnet50(pretrained=True)

# Replace the final fully connected layer with a 5-class head whose input
# width matches the backbone's existing feature size.
num_ftrs = model.fc.in_features
model.fc = nn.Linear(in_features=num_ftrs, out_features=5)


In [4]:
from torch import optim

# Run on the first CUDA device when one is available, otherwise on the CPU.
if torch.cuda.is_available():
    device = torch.device("cuda:0")
else:
    device = torch.device("cpu")

# Move the model before building the optimizer so that the optimizer is
# created over the parameters of the model living on the target device.
model = model.to(device)

# Multi-class classification loss and an Adam optimizer over all parameters.
criterion = nn.CrossEntropyLoss()
optimizer = optim.Adam(params=model.parameters(), lr=1e-3)


In [None]:
num_epochs = 12  # Or any desired number of epochs

for epoch in range(num_epochs):
    # Each epoch runs a training pass followed by a validation pass.
    for phase in ['train', 'val']:
        training = phase == 'train'
        if training:
            model.train()  # Put the model in training mode
        else:
            model.eval()   # Put the model in evaluation mode

        # Accumulate plain Python numbers so the statistics never hold on to
        # device tensors and remain valid even if a loader yields no batches.
        running_loss = 0.0
        running_corrects = 0

        # Iterate over the batches of the current split.
        for inputs, labels in dataloaders[phase]:
            inputs = inputs.to(device)
            labels = labels.to(device)

            # Gradients only need clearing when a backward pass will follow.
            if training:
                optimizer.zero_grad()

            # Forward pass; autograd history is tracked only while training.
            with torch.set_grad_enabled(training):
                outputs = model(inputs)
                loss = criterion(outputs, labels)
                _, preds = torch.max(outputs, 1)

                # Backward pass and parameter update only while training.
                if training:
                    loss.backward()
                    optimizer.step()

            # Statistics: the criterion returns a batch mean, so weight it by
            # the batch size to obtain a per-sample average at the end.
            running_loss += loss.item() * inputs.size(0)
            running_corrects += (preds == labels).sum().item()

        epoch_loss = running_loss / dataset_sizes[phase]
        epoch_acc = running_corrects / dataset_sizes[phase]

        print(f'{phase} Epoch {epoch}/{num_epochs - 1}, Loss: {epoch_loss:.4f}, Acc: {epoch_acc:.4f}')


# Guarda el modelo

In [6]:
# Persist only the model's parameters (its state_dict) to disk.
# NOTE(review): the filename says "wide_resnet", but the model built earlier
# in this file is models.resnet50 -- confirm before renaming, since other
# code may load from this exact path.
torch.save(obj=model.state_dict(), f='wide_resnet_model.pth')


# Matriz de confusión

In [None]:
import torch
from torchvision import datasets, transforms, models
from torch.utils.data import DataLoader
import numpy as np
# recall_score is used below; it was previously missing from this import,
# which made the cell fail with NameError.
from sklearn.metrics import confusion_matrix, recall_score

# Evaluation mode for inference.
model.eval()

# Deterministic evaluation preprocessing: resize, center crop, normalize.
transform = transforms.Compose([
    transforms.Resize(256),
    transforms.CenterCrop(224),
    transforms.ToTensor(),
    transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225])
])

# Device (GPU or CPU)
device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
model.to(device)

# Path to the test dataset
data_dir = 'directorio_datos_test'

# Load the test dataset; order is kept fixed (shuffle=False).
dataset = datasets.ImageFolder(root=data_dir, transform=transform)
dataloader = DataLoader(dataset, batch_size=64, shuffle=False, num_workers=4)
class_names = dataset.classes

y_pred = []
y_true = []

# Disable gradient tracking during inference.
with torch.no_grad():
    for images, labels in dataloader:
        # Only the images are needed on the device; labels are consumed on
        # the CPU, so they are left where the loader produced them.
        images = images.to(device)
        outputs = model(images)
        _, predicted = torch.max(outputs, 1)
        y_pred.extend(predicted.cpu().numpy())
        y_true.extend(labels.cpu().numpy())

# Compute the confusion matrix and the macro-averaged recall.
confusion_mat = confusion_matrix(y_true, y_pred)
recall = recall_score(y_true, y_pred, average='macro')

print(confusion_mat)
print(f'Recall del modelo: {recall}')