In [3]:
import pandas as pd
import seaborn as sns
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import accuracy_score

# 1. Load the Titanic dataset (simpler alternative)
# NOTE: sns.load_dataset pulls the CSV from seaborn's online example-data
# repository, so the first run needs network access.
df = sns.load_dataset('titanic')
print(df.head())
# DataFrame.info() prints its own report and returns None, so it must not be
# wrapped in print() -- doing so emits a stray "None" line after the summary.
df.info()  # Check columns & missing values
print(df.describe())

# 2. Preprocessing (minimal example)
# Drop rows with missing 'age' or 'embarked', then convert the categorical
# features to numeric codes. Written as one chained expression (no
# inplace=True) so the cleaned frame is produced in a single visible step.
df = (
    df
    .dropna(subset=['age', 'embarked'])
    .assign(
        sex=lambda frame: frame['sex'].map({'male': 1, 'female': 0}),
        embarked=lambda frame: frame['embarked'].map({'S': 0, 'C': 1, 'Q': 2}),
    )
)

# 3. Define features (X) and target (y)
X = df[['pclass', 'sex', 'age', 'fare', 'embarked']]  # Features
y = df['survived']  # Target (what we want to predict)

# Series.map turns any label missing from the mapping dict into NaN without
# warning; fail loudly here instead of training on silently corrupted features.
assert X.notna().all().all(), "feature matrix contains missing values after preprocessing"

# 4. Split data into training and testing sets
# 80/20 split; the fixed random_state keeps the partition reproducible across runs.
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# 5. Train the model
# Default hyperparameters; random_state is fixed so the fitted forest is reproducible.
model = RandomForestClassifier(random_state=42)
model.fit(X_train, y_train)

# 6. Evaluate
# Accuracy on the held-out 20% of rows.
y_pred = model.predict(X_test)
print("Accuracy:", accuracy_score(y_test, y_pred))



   survived  pclass     sex   age  sibsp  parch     fare embarked  class  \
0         0       3    male  22.0      1      0   7.2500        S  Third   
1         1       1  female  38.0      1      0  71.2833        C  First   
2         1       3  female  26.0      0      0   7.9250        S  Third   
3         1       1  female  35.0      1      0  53.1000        S  First   
4         0       3    male  35.0      0      0   8.0500        S  Third   

     who  adult_male deck  embark_town alive  alone  
0    man        True  NaN  Southampton    no  False  
1  woman       False    C    Cherbourg   yes  False  
2  woman       False  NaN  Southampton   yes   True  
3  woman       False    C  Southampton   yes  False  
4    man        True  NaN  Southampton    no   True  
<class 'pandas.core.frame.DataFrame'>
RangeIndex: 891 entries, 0 to 890
Data columns (total 15 columns):
 #   Column       Non-Null Count  Dtype   
---  ------       --------------  -----   
 0   survived     891 non-nu

In [6]:
# Snapshot the installed packages into requirements.txt.
# - %pip (rather than !pip) runs pip with the same interpreter as this kernel,
#   so the snapshot describes the environment the notebook actually uses.
# - Keep comments on their own line: text after the command on the same line is
#   handed to the system shell, and not every shell (e.g. Windows cmd.exe)
#   treats '#' as a comment marker.
%pip freeze > requirements.txt

In [7]:
import os
# Report the kernel's current working directory.
# NOTE(review): presumably this is where the requirements.txt written by the
# earlier shell redirect landed -- confirm if the kernel's cwd was changed in between.
current_dir = os.getcwd()
print("File is saved in:", current_dir)

File is saved in: C:\Users\ssswa
