In [12]:
# Load packages
import pandas as pd 
import numpy as np
import pickle
from mlflow.tracking import MlflowClient
from matplotlib import pyplot as plt
import json

In [13]:
# --- Notebook configuration -------------------------------------------------
# Name of the MLflow experiment this notebook relates to.
EXPERIMENT_NAME = "job-profile-prediction"
# Identifier of the MLflow run whose artifacts (model + data details) are loaded.
RUN_ID = "92ed66d742664ef78606066f1ed74a8c"
# Tracking store location, given relative to the notebook's working directory.
TRACKING_URI = "../mlflow"


In [14]:

# Create a client bound to the tracking store configured above
client = MlflowClient(tracking_uri=TRACKING_URI)

# Fetch the run so its metadata stays available to later cells
run = client.get_run(run_id=RUN_ID)

# Resolve both artifacts to local file paths through the client instead of
# concatenating onto `run.info.artifact_uri`: that URI may carry a scheme
# (e.g. file://) or point at remote storage, neither of which `open()` accepts.
# The variable names are kept because later cells read `data_artifact_uri`.
data_artifact_uri = client.download_artifacts(run.info.run_id, "data/data_details")
model_artifact_uri = client.download_artifacts(run.info.run_id, "model/model.pkl")

# Load the fitted pipeline from the pickle file (the data details are read in
# a later cell).
# NOTE: pickle.load can execute arbitrary code while deserialising; only load
# artifacts produced by runs you trust.
with open(model_artifact_uri, 'rb') as file:
    classifier = pickle.load(file)

# Display the loaded estimator
classifier

In [15]:


# Load the data-details JSON that was logged alongside the model; it supplies
# the column names under 'features_names' and 'targets_names'.
with open(data_artifact_uri, "r") as details_file:
    data = json.load(details_file)

# Build one single-row, all-zero integer frame per name list:
# `features` is the model input row, `target` the row that receives the output.
features, target = (
    pd.DataFrame(
        data=np.zeros((1, len(data[names_key]))),
        columns=data[names_key],
        dtype=int,
    )
    for names_key in ('features_names', 'targets_names')
)




In [16]:
# Skills to switch on in the single-row feature vector
skills = ['ASP.NET','ASP.NET CORE', 'C#', 'Visual Basic (.Net)', 'Microsoft SQL Server']

# Fail fast on names that are not feature columns: assigning to a list of
# column labels that includes an unknown one would add a new column rather
# than raise, silently changing the width of the model input.
unknown_skills = [skill for skill in skills if skill not in features.columns]
if unknown_skills:
    raise KeyError(f"Skills not present in the feature columns: {unknown_skills}")

# Clear the row first so re-running this cell with a different skill list
# does not leave previously selected skills switched on.
features.loc[:, :] = 0
features.loc[:, skills] = 1

# Show only the selected columns as a sanity check
features[skills]

Unnamed: 0,ASP.NET,ASP.NET CORE,C#,Visual Basic (.Net),Microsoft SQL Server
0,1,1,1,1,1


In [17]:
# List every feature column name, one per line, to see which skills can be set
for column_name in features.columns:
    print(column_name)

APL
Ada
Apex
Assembly
Bash/Shell (all shells)
C
C#
C++
Clojure
Cobol
Crystal
Dart
Delphi
Elixir
Erlang
F#
Flow
Fortran
GDScript
Go
Groovy
HTML/CSS
Haskell
Java
JavaScript
Julia
Kotlin
Lisp
Lua
MATLAB
Nim
OCaml
Objective-C
PHP
Perl
PowerShell
Prolog
Python
R
Raku
Ruby
Rust
SAS
SQL
Scala
Solidity
Swift
TypeScript
VBA
Visual Basic (.Net)
Zig
BigQuery
Cassandra
Clickhouse
Cloud Firestore
Cockroachdb
Cosmos DB
Couch DB
Couchbase
Datomic
DuckDB
Dynamodb
Elasticsearch
Firebase Realtime Database
Firebird
H2
IBM DB2
InfluxDB
MariaDB
Microsoft Access
Microsoft SQL Server
MongoDB
MySQL
Neo4J
Oracle
PostgreSQL
RavenDB
Redis
SQLite
Snowflake
Solr
Supabase
TiDB
Amazon Web Services (AWS)
Cloudflare
Colocation
Digital Ocean
Firebase
Fly.io
Google Cloud
Heroku
Hetzner
IBM Cloud Or Watson
Linode, now Akamai
Managed Hosting
Microsoft Azure
Netlify
OVH
OpenShift
OpenStack
Oracle Cloud Infrastructure (OCI)
Render
Scaleway
VMware
Vercel
Vultr
ASP.NET
ASP.NET CORE
Angular
AngularJS
Blazor
CodeIgniter
Deno
Dj

In [18]:
# Class probabilities for the single feature row
prediction = classifier.predict_proba(features.to_numpy())

# `target` was created with an integer dtype; cast it explicitly before
# writing fractional percentages instead of relying on pandas' silent
# upcasting on assignment (deprecated in recent pandas releases).
target = target.astype(float)

# Store the probabilities as percentages.
# NOTE(review): assumes the order of `target` columns matches the order of the
# classifier's output classes — confirm against the training code.
target.iloc[0] = prediction[0] * 100

# Most likely job profiles first
target.iloc[0].sort_values(ascending=False)


.NET back-end                                    70.304581
Developer, desktop or enterprise applications     7.019199
.NET full-stack                                   4.511171
Scientest/Researcher                              1.162103
Developer, embedded applications or devices       1.046178
Developer, front-end                              0.436693
Developer, QA or test                             0.270824
Engineer, data                                    0.095674
Data or business analyst                          0.067924
Cloud infrastructure engineer                     0.045940
DevOps specialist                                 0.033345
Python full-stack                                 0.032430
Research & Development role                       0.029963
Developer, mobile                                 0.029522
Python back-end                                   0.023169
Data scientist or machine learning specialist     0.022178
Hardware Engineer                                 0.0114