In [8]:
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import LabelEncoder, StandardScaler
import tensorflow as tf
from tensorflow.keras import layers, models, optimizers, regularizers


In [9]:
# Load and preprocess the dataset
def load_and_preprocess_data(file_path):
    # Load the dataset
    data = pd.read_csv(file_path)

    # Drop the 'id' column
    data = data.drop(columns=['id'])

    # Encode the target variable ('species') using LabelEncoder
    label_encoder = LabelEncoder()
    data['species'] = label_encoder.fit_transform(data['species'])

    # Separate features and target
    X = data.drop(columns=['species'])
    y = data['species']

    # Normalize the features
    scaler = StandardScaler()
    X = scaler.fit_transform(X)

    # Split the data into training and validation sets (80% train, 20% validation)
    X_train, X_val, y_train, y_val = train_test_split(X, y, test_size=0.2, random_state=42)

    return X_train, X_val, y_train, y_val, label_encoder


In [10]:
def build_mlp_model(input_dim, hidden_size, dropout_rate, l2_reg):
    model = models.Sequential([
        layers.Input(shape=(input_dim,)),
        layers.Dense(hidden_size, activation='tanh',
                     kernel_regularizer=regularizers.l2(l2_reg)),
        layers.Dropout(dropout_rate),
        layers.Dense(len(set(y_train)), activation='softmax')
    ])
    return model

In [11]:
# Function to train the model and evaluate performance
def train_and_evaluate_model(X_train, X_val, y_train, y_val, hidden_size, dropout_rate, l2_reg, optimizer, learning_rate, batch_size, epochs):
    # Build the model
    model = build_mlp_model(input_dim=X_train.shape[1],
                            hidden_size=hidden_size,
                            dropout_rate=dropout_rate,
                            l2_reg=l2_reg)

    # Compile the model
    opt = optimizer(learning_rate=learning_rate)
    model.compile(optimizer=opt,
                  loss='sparse_categorical_crossentropy',
                  metrics=['accuracy'])

    # Train the model
    history = model.fit(X_train, y_train,
                        validation_data=(X_val, y_val),
                        batch_size=batch_size,
                        epochs=epochs,
                        verbose=1)

    # Evaluate the model
    val_loss, val_accuracy = model.evaluate(X_val, y_val, verbose=0)
    print(f"Validation Loss: {val_loss:.4f}, Validation Accuracy: {val_accuracy:.4f}")
    return history, val_loss, val_accuracy

In [13]:
file_path = '/content/train.csv'
# Load and preprocess data
X_train, X_val, y_train, y_val, label_encoder = load_and_preprocess_data(file_path)

In [14]:
def main():

    # Example hyperparameters
    hidden_size = 64
    dropout_rate = 0.5
    l2_reg = 0.01
    optimizer = optimizers.Adam
    learning_rate = 0.001
    batch_size = 32
    epochs = 20

    # Train and evaluate the model
    history, val_loss, val_accuracy = train_and_evaluate_model(
        X_train, X_val, y_train, y_val,
        hidden_size=hidden_size,
        dropout_rate=dropout_rate,
        l2_reg=l2_reg,
        optimizer=optimizer,
        learning_rate=learning_rate,
        batch_size=batch_size,
        epochs=epochs
    )

if __name__ == "__main__":
    main()


Epoch 1/20
[1m25/25[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m2s[0m 15ms/step - accuracy: 0.0106 - loss: 5.6480 - val_accuracy: 0.0909 - val_loss: 5.0080
Epoch 2/20
[1m25/25[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 4ms/step - accuracy: 0.0667 - loss: 5.0217 - val_accuracy: 0.2172 - val_loss: 4.5251
Epoch 3/20
[1m25/25[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 3ms/step - accuracy: 0.2065 - loss: 4.4521 - val_accuracy: 0.3586 - val_loss: 4.1372
Epoch 4/20
[1m25/25[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 4ms/step - accuracy: 0.3604 - loss: 3.9078 - val_accuracy: 0.4444 - val_loss: 3.8044
Epoch 5/20
[1m25/25[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 4ms/step - accuracy: 0.4324 - loss: 3.6171 - val_accuracy: 0.5707 - val_loss: 3.4994
Epoch 6/20
[1m25/25[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 6ms/step - accuracy: 0.5438 - loss: 3.2665 - val_accuracy: 0.6414 - val_loss: 3.2274
Epoch 7/20
[1m25/25[0m [32m━━━━━━━━━