In [13]:
import pandas as pd
import numpy as np
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import LabelEncoder, StandardScaler
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import accuracy_score, classification_report

In [3]:
# Load the dataset CSV; the path is relative, so it is resolved against the
# kernel's current working directory.
df = pd.read_csv(filepath_or_buffer='careermitra_dataset.csv')

In [11]:
# Column holding the label to predict; every remaining column is a feature.
target_column = "Suggested Job Role"

# Labels (raw, un-encoded values of the target column).
y = df[target_column]

# Feature frame: a new DataFrame without the target column (df is not modified).
X = df.drop(target_column, axis=1)

In [14]:
# Encode target variable.
# The encoder is always fitted on the raw column taken from `df` rather than on
# `y` itself, so re-running this cell never re-fits it on already-encoded
# integers (which would replace the class names in `label_encoder.classes_`).
label_encoder = LabelEncoder()
y = label_encoder.fit_transform(df[target_column])

# Identify categorical and numerical columns
categorical_cols = X.select_dtypes(include=['object']).columns
numerical_cols = X.select_dtypes(include=['int64', 'float64']).columns

# Encode categorical columns as integer codes (one independent encoder per column).
X_encoded = X.copy()
for col in categorical_cols:
    X_encoded[col] = LabelEncoder().fit_transform(X[col])

# Split data into train and test sets BEFORE scaling, so that the scaler's
# statistics are computed from the training rows only and nothing about the
# test rows leaks into preprocessing.
X_train, X_test, y_train, y_test = train_test_split(X_encoded, y, test_size=0.2, random_state=42)

# Work on explicit copies so the column assignments below do not write into
# (or warn about) views of X_encoded.
X_train = X_train.copy()
X_test = X_test.copy()

# Scale numerical features: fit on the training split, then apply the same
# transformation to the test split. Skipped when there are no numerical
# columns, because the scaler cannot be fitted on an empty selection.
# NOTE(review): X_encoded itself is no longer scaled; confirm no later cell
# relies on a scaled X_encoded.
scaler = StandardScaler()
if len(numerical_cols) > 0:
    X_train[numerical_cols] = scaler.fit_transform(X_train[numerical_cols])
    X_test[numerical_cols] = scaler.transform(X_test[numerical_cols])

In [15]:
# Build a 100-tree random forest with a fixed seed and fit it on the training
# split; fit() returns the estimator itself, so `model` is the trained forest.
model = RandomForestClassifier(n_estimators=100, random_state=42).fit(X_train, y_train)

# Predicted (integer-encoded) labels for the held-out test split.
y_pred = model.predict(X_test)

In [16]:
# Share of test samples whose predicted label equals the true label.
accuracy = accuracy_score(y_true=y_test, y_pred=y_pred)

# Report the score rounded to two decimals.
print(f"Model Accuracy: {accuracy:.2f}")

Model Accuracy: 0.03


In [17]:
# Per-class precision / recall / F1 on the test split.
# `labels` is passed explicitly (the integer code of every class the encoder
# knows) so that it always lines up one-to-one with `target_names`. Without it,
# the report derives the label set from y_test/y_pred and fails when a class
# happens to be missing from both.
report_labels = label_encoder.transform(label_encoder.classes_)

print("Classification Report:")
print(
    classification_report(
        y_test,
        y_pred,
        labels=report_labels,
        target_names=label_encoder.classes_,
    )
)

Classification Report:
                                           precision    recall  f1-score   support

                   Applications Developer       0.05      0.05      0.05       115
            Business Intelligence Analyst       0.02      0.02      0.02        97
                 Business Systems Analyst       0.01      0.02      0.01       123
                     CRM Business Analyst       0.02      0.03      0.02       104
                  CRM Technical Developer       0.01      0.01      0.01       100
                           Data Architect       0.05      0.05      0.05       115
                   Database Administrator       0.02      0.02      0.02       122
                       Database Developer       0.03      0.04      0.03       112
                         Database Manager       0.03      0.02      0.03       122
                              Design & UX       0.04      0.04      0.04       122
                       E-Commerce Analyst       0.02      0.02 