# In [None]:
import pandas as pd
import numpy as np
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LogisticRegression
import joblib

# Train a loan-eligibility classifier on a simulated dataset and persist it.
#
# Steps: generate random applicant records, label them with a simple
# deterministic rule, encode the categorical column, fit a logistic
# regression on an 80/20 split and dump the fitted model to 'model.pkl'.

# A single fixed seed makes the synthetic data, the train/test split and
# therefore the saved model reproducible from one run to the next.
SEED = 42
N_SAMPLES = 500
rng = np.random.default_rng(SEED)

# Simulated dataset (upper bounds are exclusive, as with np.random.randint)
data = {
    'age': rng.integers(20, 60, N_SAMPLES),
    'income': rng.integers(20000, 150000, N_SAMPLES),
    'employment_status': rng.choice(
        ['Employed', 'Unemployed', 'Self-employed'], N_SAMPLES
    ),
    'credit_score': rng.integers(300, 850, N_SAMPLES),
    'existing_loans': rng.integers(0, 5, N_SAMPLES),
}

df = pd.DataFrame(data)

# Simple rule for eligibility: sufficient income AND credit score, and the
# applicant must not be unemployed. Age and existing loans do not affect
# the label.
df['eligible'] = np.where(
    (df['income'] > 50000)
    & (df['credit_score'] > 600)
    & (df['employment_status'] != 'Unemployed'),
    1, 0
)

# Encoding employment_status manually. Any category missing from this
# mapping would become NaN; all three generated categories are covered.
df['employment_status_encoded'] = df['employment_status'].map({
    'Employed': 0,
    'Self-employed': 1,
    'Unemployed': 2
})

# Features and target
X = df[['age', 'income', 'employment_status_encoded', 'credit_score', 'existing_loans']]
y = df['eligible']

# Train-test split. The rule above yields an imbalanced target, so stratify
# to keep the same class ratio in both partitions; random_state pins the
# shuffle.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=SEED, stratify=y
)

# Model. The raw features sit on very different scales (income in the tens
# of thousands, existing_loans below 5), so the solver may need more than
# its default iteration budget to converge; raise the cap rather than
# changing the input representation the saved model expects.
model = LogisticRegression(max_iter=1000)
model.fit(X_train, y_train)

# Save model
joblib.dump(model, 'model.pkl')
print("Model saved successfully!")
