<h2 align="center">Codebasics DL Course: Optuna Hyperparameter Tunning</h2>

In [2]:
import torch
import torch.nn as nn
import torch.optim as optim
import torch.nn.functional as F
from torch.utils.data import DataLoader, TensorDataset
import optuna
from sklearn.datasets import make_classification
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler

### Load Syntetically Generated Dataset

In [3]:
# 1. Generate synthetic dataset
X, y = make_classification(n_samples=1000, n_features=20, n_classes=2, random_state=42)
X_train, X_val, y_train, y_val = train_test_split(X, y, test_size=0.2, random_state=42)

In [4]:
X_train.shape

(800, 20)

In [5]:
X_train[0]

array([ 0.50363664, -1.51368248, -0.46907062,  1.90176571, -0.87064279,
        1.82004715,  1.66291365,  1.29105223, -0.16713608, -1.04718436,
        1.43003039,  0.20104766,  1.27577182, -1.13260729,  1.75008532,
       -1.4089039 ,  0.03301588, -0.80340946, -1.31410638,  1.41209637])

In [6]:
y_train[0]

1

In [7]:
# Convert to PyTorch tensors
X_train, y_train = torch.tensor(X_train, dtype=torch.float32), torch.tensor(y_train, dtype=torch.long)
X_val, y_val = torch.tensor(X_val, dtype=torch.float32), torch.tensor(y_val, dtype=torch.long)

### Define a Neural Network

In [8]:
class SimpleNN(nn.Module):
    def __init__(self, input_dim, hidden_dim):
        super().__init__()
        self.network = nn.Sequential(
            nn.Linear(input_dim, hidden_dim),
            nn.ReLU(),
            nn.Linear(hidden_dim, 2)  # Output layer for binary classification
        )
        
    def forward(self, x):
        return self.network(x)

In [None]:
def objective(trial):
    
    learning_rate=trial.suggest_loguniform('learning_rate',1e-4,1e-1)
    hidden_dim=trial.suggest_int('hidden_dim',16,128)
    model=SimpleNN(input_dim=20,hidden_dim=hidden_dim)
    

### Perform Hyperparameter Tunning

In [10]:
# 3. Define the objective function for Optuna
def objective(trial):
    # Suggest values for the hyperparameters
    learning_rate = trial.suggest_loguniform('learning_rate', 1e-4, 1e-1)
    hidden_dim = trial.suggest_int('hidden_dim', 16, 128)

    # Model, loss, optimizer
    model = SimpleNN(input_dim=20, hidden_dim=hidden_dim)
    criterion = nn.CrossEntropyLoss()
    optimizer = optim.Adam(model.parameters(), lr=learning_rate)

    # Training loop
    epochs = 20
    batch_size = 32
    train_loader = DataLoader(TensorDataset(X_train, y_train), batch_size=batch_size, shuffle=True)
    val_loader = DataLoader(TensorDataset(X_val, y_val), batch_size=batch_size)

    for epoch in range(epochs):
        model.train()
        for batch_X, batch_y in train_loader:
            optimizer.zero_grad()
            outputs = model(batch_X)
            loss = criterion(outputs, batch_y)
            loss.backward()
            optimizer.step()

    # Validation accuracy
    model.eval()
    correct = 0
    total = 0
    with torch.no_grad():
        for batch_X, batch_y in val_loader:
            outputs = model(batch_X)
            _, predicted = torch.max(outputs, 1)
            total += batch_y.size(0)
            correct += (predicted == batch_y).sum().item()

    accuracy = correct / total
    return accuracy

# 4. Run the Optuna optimization
study = optuna.create_study(direction="maximize")
study.optimize(objective, n_trials=20)

# 5. Print the best hyperparameters
print("Best hyperparameters found:")
print(study.best_params)            

[I 2024-11-13 16:53:47,629] A new study created in memory with name: no-name-0db8ba0c-2516-4d57-8815-f775214dfb44
  learning_rate = trial.suggest_loguniform('learning_rate', 1e-4, 1e-1)
[I 2024-11-13 16:53:49,280] Trial 0 finished with value: 0.805 and parameters: {'learning_rate': 0.09265199617049812, 'hidden_dim': 68}. Best is trial 0 with value: 0.805.
[I 2024-11-13 16:53:50,989] Trial 1 finished with value: 0.83 and parameters: {'learning_rate': 0.01248371004211226, 'hidden_dim': 120}. Best is trial 1 with value: 0.83.
[I 2024-11-13 16:53:52,362] Trial 2 finished with value: 0.87 and parameters: {'learning_rate': 0.00028991853281172623, 'hidden_dim': 62}. Best is trial 2 with value: 0.87.
[I 2024-11-13 16:53:53,842] Trial 3 finished with value: 0.855 and parameters: {'learning_rate': 0.0002374400309515563, 'hidden_dim': 48}. Best is trial 2 with value: 0.87.
[I 2024-11-13 16:53:55,518] Trial 4 finished with value: 0.855 and parameters: {'learning_rate': 0.0003483451090663494, 'hidd

Best hyperparameters found:
{'learning_rate': 0.00028991853281172623, 'hidden_dim': 62}
