In [16]:
# Import required libraries
import pandas as pd
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.metrics.pairwise import cosine_similarity
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import accuracy_score

In [17]:
# Load job listings data
job_data = pd.read_csv('job_data_naukri.csv')

# Preprocess data
job_data.drop_duplicates(inplace=True)
job_data.dropna(inplace=True)

# Define features
features = ['Company', 'Education', 'Experience', 'Industry', 'Job Description', 'Job Location', 'Job Title', 'Pay Rate', 'Shift Type']
job_data['Experience'] = job_data['Experience'].astype(str)

# Get user inputs
user_job_title = 'software developer'
user_shift_type = 'part time'
#user_skills = 'java'
user_experience = '4'

# Filter job data by shift type
#job_data = job_data[job_data['Shift Type'] == user_shift_type]

# Filter job data by experience
job_data = job_data[job_data['Experience'] <= user_experience]

In [18]:
# Vectorize features
vectorizer = TfidfVectorizer(stop_words='english')
job_features = vectorizer.fit_transform(job_data[features].apply(lambda x: ' '.join(x), axis=1))
user_features = vectorizer.transform([user_job_title])
#user_features = vectorizer.transform([user_shift_type])
#user_features = vectorizer.transform([user_skills])

In [20]:
# Train machine learning model
X_train, X_test, y_train, y_test = train_test_split(job_features, job_data['Industry'], test_size=0.2, random_state=42)
model = RandomForestClassifier(n_estimators=100, random_state=42)
model.fit(X_train, y_train)

# Evaluate model
y_pred = model.predict(X_test)
print('Accuracy:', accuracy_score(y_test, y_pred))

# Get job recommendations for user
user_similarity = cosine_similarity(user_features, job_features).flatten()
job_data['similarity'] = user_similarity
job_data = job_data.sort_values('similarity', ascending=False)
recommendations = job_data.head(10)[['Job Title', 'Shift Type', 'Experience']].values.tolist()
print('Recommended jobs:', recommendations)

Accuracy: 0.8340026773761714
Recommended jobs: [['C++ Developer - Bangalore / Hyderabad / Pune', 'Full Time', '2'], ['Biztalk Developer-', 'Full Time', '3'], ['PHP Developer', 'Full Time', '2'], ['Informatica Developer', 'Part Time', '11'], ['Tibco Developer', 'Part Time', '12'], ['Informatica Developer', 'Full Time', '3'], ['UI/ Front End Developer - Javascript', 'Work From Home', '4'], ['Informatica Developer', 'Work From Home', '2'], ['Plsql Developer', 'Full Time', '2'], ['Urgent Freshers Software Engineer/software Developer Java All India', 'Work From Home', '4']]
