In [1]:
import torch
import torch.nn as nn
import torch.optim as optim
from sklearn.datasets import fetch_california_housing
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler

In [2]:
# 1. Fetch the California housing data and pull out features / targets
data = fetch_california_housing()
X = data.data
y = data.target

# 2. Hold out 20% of the rows for testing (fixed random_state keeps the split repeatable)
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# 3. Standardize features: the scaler is fitted on the training rows only,
#    then the same fitted transform is applied to both splits
scaler = StandardScaler().fit(X_train)
X_train = scaler.transform(X_train)
X_test = scaler.transform(X_test)

In [9]:
X_train.shape
# Largest and smallest scaled feature value in the first training row
print(max(X_train[0]), min(X_train[0]))

1.2725865624711816 -1.3728111990668923


In [12]:
# Peek at the first target value of the full (pre-split) target array
y[0]

np.float64(4.526)

In [15]:
# 4. Convert the NumPy arrays to float32 PyTorch tensors
# Feature matrices keep their 2-D layout as-is
X_train_tensor, X_test_tensor = (
    torch.tensor(features, dtype=torch.float32)
    for features in (X_train, X_test)
)
# Targets are reshaped into a single column so they line up with the
# model's one-unit output when the loss is computed
y_train_tensor, y_test_tensor = (
    torch.tensor(targets, dtype=torch.float32).reshape(-1, 1)
    for targets in (y_train, y_test)
)

# 5. Define the regression model (a small MLP, despite the class name)
class LinearRegressionModel(nn.Module):
    """Feed-forward regressor mapping ``in_features`` inputs to one output.

    The layer stack, stored in ``self.network``, is
    Linear(in_features, 64) -> ReLU -> Linear(64, 32) -> ReLU
    -> Linear(32, 16) -> ReLU -> Linear(16, 1).
    """

    def __init__(self, in_features):
        """Build the layer stack for inputs with ``in_features`` columns."""
        super().__init__()
        layers = []
        fan_in = in_features
        # Each hidden stage is a Linear layer followed by a ReLU
        for width in (64, 32, 16):
            layers.append(nn.Linear(fan_in, width))
            layers.append(nn.ReLU())
            fan_in = width
        layers.append(nn.Linear(fan_in, 1))  # Output layer
        self.network = nn.Sequential(*layers)

    def forward(self, x):
        """Pass ``x`` through the layer stack and return its output."""
        return self.network(x)

# Seed PyTorch's RNG before the model is built so the randomly initialised
# weights -- and therefore every loss printed below -- are the same on each
# Restart & Run All (42 matches the random_state used for the data split).
torch.manual_seed(42)
model = LinearRegressionModel(X_train.shape[1])


# 6. Loss function and optimizer
criterion = nn.MSELoss()
optimizer = optim.SGD(model.parameters(), lr=0.01)

# 7. Training loop (full batch: every step uses the whole training tensor)
epochs = 1000
model.train()  # explicit counterpart to the model.eval() call in step 8
for epoch in range(epochs):
    # Forward pass
    outputs = model(X_train_tensor)
    loss = criterion(outputs, y_train_tensor)

    # Backward pass
    optimizer.zero_grad()
    loss.backward()
    optimizer.step()

    if (epoch+1) % 100 == 0:
        # The figure logged as "Loss" is the RMSE (square root of the MSE that
        # is actually optimised). It is only needed for logging, so it is
        # computed here, detached from the autograd graph, instead of on
        # every epoch.
        rmse_loss = torch.sqrt(loss.detach())
        print(f"Epoch [{epoch+1}/{epochs}], Loss: {rmse_loss.item():.4f}")

# 8. Evaluation
model.eval()
with torch.no_grad():  # no gradients are needed to score the held-out split
    y_pred = model(X_test_tensor)
    # Note: this is the plain MSE, whereas the training log above shows RMSE
    test_loss = criterion(y_pred, y_test_tensor)
    print(f"\nTest MSE: {test_loss.item():.4f}")

Epoch [100/1000], Loss: 0.8930
Epoch [200/1000], Loss: 0.8016
Epoch [300/1000], Loss: 0.7659
Epoch [400/1000], Loss: 0.7363
Epoch [500/1000], Loss: 0.7118
Epoch [600/1000], Loss: 0.6930
Epoch [700/1000], Loss: 0.6793
Epoch [800/1000], Loss: 0.6694
Epoch [900/1000], Loss: 0.6617
Epoch [1000/1000], Loss: 0.6553

Test MSE: 0.4513


In [14]:
# Test RMSE: square root of the held-out MSE stored in `test_loss`.
# `** 0.5` is used because no `sqrt` function is imported in this notebook.
test_loss.item() ** 0.5