In [2]:
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler, LabelEncoder
from sklearn.pipeline import Pipeline
from sklearn.linear_model import LogisticRegression
from sklearn.metrics import classification_report
import joblib


In [3]:
def encode_binary_labels(labels, mapping):
    """Map a two-valued text column to integers, failing loudly on unknown labels.

    ``Series.map`` silently converts any value that is not a key of ``mapping``
    (different casing, stray whitespace, missing cells) into NaN. Left unchecked,
    that NaN only shows up later as an opaque error inside the estimator, so the
    unmapped values are reported here instead.

    Parameters
    ----------
    labels : pandas.Series
        Raw text labels.
    mapping : dict
        Raw label -> integer code.

    Returns
    -------
    pandas.Series
        Integer-coded labels (int64).

    Raises
    ------
    ValueError
        If any value in ``labels`` is not a key of ``mapping``.
    """
    encoded = labels.map(mapping)
    unmapped = labels[encoded.isna()].unique()
    if len(unmapped) > 0:
        raise ValueError(
            f"Unexpected values in column {labels.name!r}: {list(unmapped)}; "
            f"expected one of {list(mapping)}"
        )
    return encoded.astype('int64')


df = pd.read_csv('car rental dataset.csv')

# Preprocessing: binary text flags -> 0/1
df['Company Verified'] = encode_binary_labels(df['Company Verified'], {'YES': 1, 'NO': 0})
df['Target'] = encode_binary_labels(df['Target'], {'Verified': 1, 'Not Verified': 0})

# 'Followers' may contain thousands separators (e.g. "19,356"); strip them and
# convert to integers with vectorized string ops rather than a per-row lambda.
df['Followers'] = (
    df['Followers']
    .astype(str)
    .str.replace(',', '', regex=False)
    .astype('int64')
)


In [4]:
# Integer-encode the two free-text columns. The fitted encoders are kept in named
# variables (instead of being created inline and thrown away) because their
# `classes_` attribute is the only record of which string became which integer;
# without it the encoding used for training cannot be reproduced or inverted.
# NOTE: this cell overwrites the columns in place, so re-running it without
# reloading `df` would refit the encoders on the already-encoded integers.
# NOTE(review): LabelEncoder assigns codes in sorted order of the labels, which
# imposes an arbitrary ordering on nominal text -- confirm this is acceptable for
# the downstream linear model.
headline_encoder = LabelEncoder()
job_title_encoder = LabelEncoder()

df['Headline'] = headline_encoder.fit_transform(df['Headline'])
df['JOB Title'] = job_title_encoder.fit_transform(df['JOB Title'])


In [5]:
# Preview the first five rows of the preprocessed frame to sanity-check the
# encoded columns before building the feature matrix.
df.head()

Unnamed: 0,username,Headline,no of License and Cetificate,JOB Title,Company Verified,no of companies worked,Followers,Target
0,Vin Vashishta,0,2,2,1,6,190865,1
1,Rob Gonda,3,2,3,1,4,19356,1
2,Shahmir Qureshi,5,0,1,0,30,59,0
3,Sanaullah Mehran,4,8,4,1,4,500,1
4,Uzair Ahmed,6,20,5,0,10,210,0


In [6]:
# Build the feature matrix.
# - 'username' is an identifier and 'Target' is the label, so neither is a feature.
# - 'Unnamed: 0' is the row index that was saved into the CSV and read back as an
#   ordinary column (it appears in the df.head() preview). Leaving it in would feed
#   the row number to the model as if it were a signal, so it is dropped as well;
#   errors='ignore' keeps this cell working if the CSV is later loaded without it.
X = (
    df.drop(columns=['username', 'Target'])
      .drop(columns=['Unnamed: 0'], errors='ignore')
)
y = df['Target']

# Hold out 20% of the rows for evaluation; the fixed seed makes the split reproducible.
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)


In [7]:
# Two-stage estimator: every feature column is standardized, then the scaled
# features are passed to a logistic-regression classifier. The step names
# ('scaler', 'clf') are how the stages are addressed on the fitted pipeline.
pipeline = Pipeline(
    steps=[
        ('scaler', StandardScaler()),
        ('clf', LogisticRegression()),
    ]
)

In [8]:
# Fit on the training split, then predict the held-out rows. Pipeline.fit returns
# the fitted pipeline itself, so the two calls can be chained.
y_pred = pipeline.fit(X_train, y_train).predict(X_test)

# Per-class precision / recall / F1 on the held-out split.
print("Classification Report:\n", classification_report(y_test, y_pred))


Classification Report:
               precision    recall  f1-score   support

           0       1.00      1.00      1.00         1
           1       1.00      1.00      1.00         1

    accuracy                           1.00         2
   macro avg       1.00      1.00      1.00         2
weighted avg       1.00      1.00      1.00         2



In [9]:
# Single source of truth for the output path, so the confirmation message cannot
# drift away from the file that is actually written.
MODEL_PATH = 'profile_verification_model.pkl'

# Persist the fitted pipeline (scaler + classifier) to disk.
# NOTE(review): the text columns were integer-encoded outside the pipeline, so the
# saved file does not contain that encoding step -- anything loading this model
# must supply features already encoded the same way.
joblib.dump(pipeline, MODEL_PATH)
print(f"Model saved as '{MODEL_PATH}'")

Model saved as 'profile_verification_model.pkl'
