In [1]:
from joblib import load

In [2]:
# Deserialize the persisted model from the working directory.
# NOTE: joblib.load is pickle-based and can execute arbitrary code while
# loading, so only point this at a model file from a trusted source.
MODEL_PATH = 'SVC_tfidf_model.joblib'
loaded_model = load(MODEL_PATH)

In [4]:
import pandas as pd

# Example job posts: one dict per posting, all sharing the same five keys.
# Descriptions are supplied as lower-case, space-separated keyword text.
data = [
    dict(
        Category="Sales",
        Title="Sales Representative - Regional Accounts",
        Webindex="72635563",
        Company="National Sales Corp",
        Description="sales representative regional accounts client relationship management territory sales target achievement lead generation product demonstrations customer feedback market analysis sales strategy teamwork communication skills minimum bachelor business administration bba proven sales track record regional sales national sales corp career opportunity benefits package apply send resume visit website url removed",
    ),
    dict(
        Category="Engineering",
        Title="Mechanical Design Engineer",
        Webindex="72635560",
        Company="Innovative Engineering Solutions",
        Description="mechanical design engineer responsible developing innovative mechanical systems solutions collaborate cross functional teams ensure product quality efficiency extensive knowledge cad software solidworks autocad experience mechanical design analysis simulation stress testing required minimum bachelor's degree mechanical engineering strong problem solving communication skills competitive salary benefits package apply send resume company email visit website",
    ),
    dict(
        Category="Accounting_Finance",
        Title="Senior Financial Analyst",
        Webindex="72635562",
        Company="Global Financial Services",
        Description="senior financial analyst budgeting forecasting financial planning reporting financial statements variance analysis accounting gaap regulations financial modeling investment analysis strategic planning teamwork leadership skills excel sap minimum cpa mba preferred financial services global company structured benefits package send resume apply position online visit website url removed",
    ),
    dict(
        Category="Healthcare_Nursing",
        Title="Registered Nurse - Intensive Care Unit",
        Webindex="72635561",
        Company="Healthcare Professionals",
        Description="registered nurse icu intensive care unit critical patient monitoring vital signs administering medications patient care plans healthcare professionals team environment shift rotations extensive benefits experience icu nursing registered nurse license state requirements minimum bachelor nursing bsn apply position send cv email website contact online healthcare professionals url removed",
    ),
]

# Build the frame: one row per posting, one column per dict key.
df_examples = pd.DataFrame(data=data)

# Leave the frame as the cell's last expression so the notebook renders it.
df_examples

Unnamed: 0,Category,Title,Webindex,Company,Description
0,Sales,Sales Representative - Regional Accounts,72635563,National Sales Corp,sales representative regional accounts client ...
1,Engineering,Mechanical Design Engineer,72635560,Innovative Engineering Solutions,mechanical design engineer responsible develop...
2,Accounting_Finance,Senior Financial Analyst,72635562,Global Financial Services,senior financial analyst budgeting forecasting...
3,Healthcare_Nursing,Registered Nurse - Intensive Care Unit,72635561,Healthcare Professionals,registered nurse icu intensive care unit criti...


In [5]:
import spacy

# Load spaCy's small English pipeline once; the preprocessing helpers in this
# notebook all call this shared `nlp` object.
SPACY_MODEL_NAME = "en_core_web_sm"
nlp = spacy.load(SPACY_MODEL_NAME)

def preprocess(text):
    """Return `text` reduced to the lemmas of its content tokens.

    The text is parsed with the module-level spaCy pipeline `nlp`. Tokens that
    spaCy flags as stop words or punctuation are discarded; the lemma of every
    remaining token is kept exactly as spaCy returns it (no extra lower-casing
    here) and the lemmas are joined with single spaces.
    """
    lemmas = [
        tok.lemma_
        for tok in nlp(text)
        if not (tok.is_stop or tok.is_punct)
    ]
    return " ".join(lemmas)

In [6]:
def preprocess_title(text):
    """Return a title reduced to the lower-cased lemmas of its content tokens.

    Works like `preprocess` (stop words and punctuation are dropped after
    parsing with the module-level `nlp` pipeline), except that each kept lemma
    is additionally lower-cased before the lemmas are joined with single spaces.
    """
    content_tokens = filter(
        lambda tok: not tok.is_stop and not tok.is_punct,
        nlp(text),
    )
    return " ".join(tok.lemma_.lower() for tok in content_tokens)

In [7]:
# Run every description through `preprocess` and keep the result as a new column.
df_examples['Preprocessed_Description'] = df_examples['Description'].map(preprocess)

In [8]:
# Run every title through `preprocess_title` (lower-cased lemmas) and keep the result as a new column.
df_examples['Preprocessed_Title'] = df_examples['Title'].map(preprocess_title)

In [9]:
# Combine the cleaned title and cleaned description, separated by one space,
# into the single text column that is later passed to the model.
df_examples['Preprocessed_Title_Description'] = df_examples['Preprocessed_Title'].str.cat(
    df_examples['Preprocessed_Description'], sep=" "
)

In [10]:
# Show the frame again, now including the three derived preprocessing columns.
df_examples

Unnamed: 0,Category,Title,Webindex,Company,Description,Preprocessed_Description,Preprocessed_Title,Preprocessed_Title_Description
0,Sales,Sales Representative - Regional Accounts,72635563,National Sales Corp,sales representative regional accounts client ...,sale representative regional account client re...,sale representative regional accounts,sale representative regional accounts sale rep...
1,Engineering,Mechanical Design Engineer,72635560,Innovative Engineering Solutions,mechanical design engineer responsible develop...,mechanical design engineer responsible develop...,mechanical design engineer,mechanical design engineer mechanical design e...
2,Accounting_Finance,Senior Financial Analyst,72635562,Global Financial Services,senior financial analyst budgeting forecasting...,senior financial analyst budgeting forecast fi...,senior financial analyst,senior financial analyst senior financial anal...
3,Healthcare_Nursing,Registered Nurse - Intensive Care Unit,72635561,Healthcare Professionals,registered nurse icu intensive care unit criti...,register nurse icu intensive care unit critica...,registered nurse intensive care unit,registered nurse intensive care unit register ...


In [11]:
# Feed the combined title+description text to the loaded model.
# NOTE(review): the model is given raw strings, so it presumably bundles its
# own vectorizer (e.g. a TF-IDF pipeline) — confirm against the training code.
combined_text = df_examples['Preprocessed_Title_Description']
y_pred_examples = loaded_model.predict(combined_text)

In [12]:
# Inspect the raw predictions: integer class labels, one per example posting.
y_pred_examples

array([3, 0, 2, 1], dtype=int64)

In [13]:
# Lookup table from the model's integer class label to a readable category name.
# The position of each name in the list is its label (0, 1, 2, 3).
# NOTE(review): this order presumably mirrors the label encoding used when the
# model was trained — confirm against the training notebook.
category_mapping = dict(enumerate([
    'Engineering',
    'Healthcare_Nursing',
    'Accounting_Finance',
    'Sales',
]))

In [14]:
# Report each prediction by name; a label that is missing from
# `category_mapping` is reported as 'Unknown' instead of raising.
for y_pred in y_pred_examples:
    try:
        category_name = category_mapping[y_pred]
    except KeyError:
        category_name = 'Unknown'
    print('Predicted Category: ', category_name)

Predicted Category:  Sales
Predicted Category:  Engineering
Predicted Category:  Accounting_Finance
Predicted Category:  Healthcare_Nursing
