# Experiment Notebook

This notebook is used for conducting experiments related to the machine learning project. It includes data exploration, model training, and evaluation.

In [None]:
# Import necessary libraries
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns

# Set visualization style.
# set_theme() is the documented name; sns.set() is only a legacy alias for it.
sns.set_theme(style='whitegrid')

# Load dataset.
# The location is kept in one named variable so it is easy to update.
DATA_PATH = '../data/dataset.csv'  # Update the path as necessary
data = pd.read_csv(DATA_PATH)

# Display the first few rows of the dataset.
# This must remain the last expression in the cell for the notebook to render it.
data.head()

In [None]:
# Data exploration
# info() prints its report directly. describe() only *returns* a DataFrame, and
# by default a notebook cell echoes just its final expression, so the summary
# statistics must be printed explicitly or they are silently discarded.
data.info()
print(data.describe())

# Visualize data distribution of the target column as a 30-bin histogram
plt.figure(figsize=(10, 6))
sns.histplot(data['target_variable'], bins=30)
plt.title('Distribution of Target Variable')
plt.xlabel('Target Variable')
plt.ylabel('Frequency')
plt.show()

In [None]:
# Model training
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import accuracy_score

# One seed shared by the split and the model. Seeding only the split would
# still leave the forest's bootstrap/feature sampling random, so the reported
# accuracy would change on every rerun.
RANDOM_STATE = 42

# Split the data into training and testing sets (80% train / 20% test).
# NOTE(review): assumes every column other than 'target_variable' is a
# model-ready feature (numeric, no missing values) -- TODO confirm.
X = data.drop(columns='target_variable')
y = data['target_variable']
# NOTE(review): if the classes are imbalanced, consider passing stratify=y here
# so both splits keep the same class proportions -- verify against the data.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=RANDOM_STATE
)

# Train the model
model = RandomForestClassifier(random_state=RANDOM_STATE)
model.fit(X_train, y_train)

# Make predictions on the held-out test set
predictions = model.predict(X_test)

# Evaluate the model: fraction of test rows whose label was predicted exactly
accuracy = accuracy_score(y_test, predictions)
print(f'Model Accuracy: {accuracy:.2f}')