## 1. Import libraries and read the data

To begin, we import the following libraries.

In [None]:
import pandas as pd
import numpy as np

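Next, we train a logistic regression model on the training data and predict the placement status for each row of the test data. The predictions (ID and predicted status) are saved as a CSV file named 'sample_submission.csv'.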


In [None]:
# Train a logistic regression on the campus-recruitment training set and
# predict the placement status of every row in the test set.
#
# The cell leaves these names defined for later cells: df_train, df_test,
# X_train, y_train, X_test, model, features and weights.
from sklearn.linear_model import LogisticRegression

train_path = "train_campusrecruit.csv"
test_path = "test_campusrecruit.csv"

# Text-to-integer encodings. Train and test share these tables so the two
# frames can never be encoded differently by accident.
status_codes = {'Placed': 1, 'Not Placed': 0}
category_codes = {
    'gender': {'M': 1, 'F': 0},
    'ssc_b': {'Central': 1, 'Others': 0},
    'hsc_b': {'Central': 1, 'Others': 0},
    'workex': {'Yes': 1, 'No': 0},
}

# Select relevant features with weights based on correlation.
# A weight of 0 zeroes the column, so 'mba_p' carries no signal into the model.
features = ['gender', 'ssc_p', 'ssc_b', 'hsc_p', 'hsc_b', 'degree_p', 'workex', 'etest_p', 'mba_p']
weights = {'gender': -0.05, 'ssc_p': 0.35, 'ssc_b': 0.01, 'hsc_p': 0.26, 'hsc_b': 0.06,
           'degree_p': 0.32, 'workex': 0.02, 'etest_p': 0.07, 'mba_p': 0}


def _encode_column(frame, col, codes):
    """Return ``frame[col]`` translated through ``codes``.

    ``Series.map`` turns every value without an entry in ``codes`` (including
    missing values) into NaN. Those NaNs would otherwise only surface later as
    an opaque error inside scikit-learn, so they are reported here instead.

    Raises:
        ValueError: if any value in the column has no entry in ``codes``.
    """
    encoded = frame[col].map(codes)
    unmapped = encoded.isna()
    if unmapped.any():
        offenders = frame.loc[unmapped, col].unique().tolist()
        raise ValueError(
            f"Column '{col}' contains values with no encoding: {offenders}; "
            f"expected one of {list(codes)}"
        )
    return encoded


def _encode_categoricals(frame):
    """Return a copy of ``frame`` with each column in ``category_codes`` encoded."""
    encoded = frame.copy()
    for col, codes in category_codes.items():
        encoded[col] = _encode_column(frame, col, codes)
    return encoded


def _weighted_features(frame):
    """Return the ``features`` columns of ``frame`` scaled by ``weights``."""
    # Index the weights by `features` so their order matches the columns exactly.
    return frame[features] * pd.Series(weights)[features]


# Load the training data and drop rows without a label.
# The explicit copy keeps the later column assignments off a derived frame.
df_train = pd.read_csv(train_path).dropna(subset=['status']).copy()
df_train['status'] = _encode_column(df_train, 'status', status_codes)
df_train = _encode_categoricals(df_train)

X_train = _weighted_features(df_train)
y_train = df_train['status']

# Train a simple Logistic Regression model
model = LogisticRegression()
model.fit(X_train, y_train)

# Load the test data and process it exactly like the training data
df_test = _encode_categoricals(pd.read_csv(test_path))
X_test = _weighted_features(df_test)

# Predict placement status and translate the 0/1 predictions back to labels
status_labels = {code: label for label, code in status_codes.items()}
df_test['status'] = pd.Series(model.predict(X_test), index=df_test.index).map(status_labels)






In [None]:
# Write the submission file: one row per test record, holding only the
# record id and its predicted status, without the DataFrame index.
df_test.to_csv("sample_submission.csv", columns=['id', 'status'], index=False)

print("Predictions saved to sample_submission.csv")