In [9]:
# Structured resume data for John Anderson: contact details, summary, skills,
# experience, projects, open-source contributions, education, certifications,
# publications/talks, volunteer work, technical proficiencies and references.
# NOTE(review): no cell visible here reads `json_data`; the PDF cell passes
# `updated_json` instead — confirm how the two are related.
json_data = {
  "name": "John Anderson",
  "contact": {
    "email": "john.anderson@gmail.com",
    "linkedin": "linkedin.com/in/johnanderson",
    "github": "github.com/johndevml",
    "phone": "(555) 555-1234",
    "location": "San Francisco, CA"
  },
  "summary": "MLOps Engineer with 2+ years of experience in deploying and managing machine learning models, computer vision systems, and generative AI models in production. Proficient in automating end-to-end machine learning pipelines and integrating advanced AI solutions using cutting-edge tools like Docker, Kubernetes, TensorFlow, PyTorch, and MLflow. Strong expertise in scaling AI systems using cloud platforms (AWS, GCP), and optimizing deep learning models for real-time inference. Adept at integrating MLOps best practices, such as CI/CD pipelines and monitoring frameworks, to improve model robustness and scalability in production environments. Experienced in working with GANs and other generative models for various applications in image synthesis and data augmentation.",
  "skills": {
    "mlops_tools": [
      "Docker",
      "Kubernetes",
      "Jenkins",
      "MLflow",
      "Airflow",
      "TensorBoard",
      "Argo Workflows"
    ],
    "machine_learning": [
      "Supervised/Unsupervised Learning",
      "Model Deployment",
      "Hyperparameter Tuning"
    ],
    "computer_vision": [
      "OpenCV",
      "TensorFlow",
      "PyTorch",
      "YOLO",
      "Faster R-CNN",
      "Mask R-CNN"
    ],
    "generative_ai": [
      "GANs",
      "Variational Autoencoders (VAEs)",
      "DALL-E",
      "Stable Diffusion"
    ],
    "cloud_platforms": [
      "AWS (EC2, S3, Lambda, SageMaker)",
      "GCP (AI Platform, Compute Engine)"
    ],
    "programming_languages": [
      "Python",
      "Bash",
      "SQL",
      "C++"
    ],
    "version_control_ci_cd": [
      "Git",
      "GitLab CI",
      "Jenkins",
      "CircleCI",
      "GitHub Actions"
    ],
    "containerization_orchestration": [
      "Docker",
      "Kubernetes"
    ],
    "data_engineering": [
      "Apache Kafka",
      "Apache Spark",
      "Hadoop"
    ],
    "monitoring_logging": [
      "Prometheus",
      "Grafana",
      "ELK Stack"
    ]
  },
  "experience": [
    {
      "title": "MLOps Engineer",
      "company": "XYZ Corp",
      "location": "San Francisco, CA",
      "duration": "June 2022 – Present",
      "responsibilities": [
        "Architected and deployed real-time object detection models for autonomous vehicle systems, using TensorFlow and YOLOv5, enabling the detection of pedestrians and vehicles with 95% accuracy.",
        "Built and optimized deep learning pipelines for computer vision tasks, including image classification and segmentation, using Kubernetes for large-scale deployment on AWS.",
        "Automated the deployment and retraining of generative models, such as GANs for synthetic image generation, improving the model development lifecycle by 30%.",
        "Developed a CI/CD framework using Jenkins and MLflow to automate the training and deployment of computer vision models, reducing deployment time from weeks to days.",
        "Implemented GPU acceleration in model inference pipelines on AWS SageMaker, leading to a 50% reduction in processing time for complex computer vision models.",
        "Integrated TensorBoard and Prometheus for real-time model performance monitoring, ensuring model accuracy and reducing drift in production by 20%."
      ]
    },
    {
      "title": "Junior MLOps Engineer",
      "company": "DataTech Solutions",
      "location": "Los Angeles, CA",
      "duration": "August 2021 – June 2022",
      "responsibilities": [
        "Designed and maintained automated pipelines for the deployment of generative AI models (e.g., DCGANs) to enhance datasets through synthetic data generation.",
        "Containerized machine learning models for natural language processing (NLP) tasks such as text classification and summarization using Docker and Kubernetes.",
        "Led the deployment of computer vision models for image recognition in retail environments, which improved product identification accuracy by 15%.",
        "Collaborated with data science teams to implement transfer learning for custom object detection tasks, shortening the model development cycle by 40%.",
        "Created TensorFlow Serving pipelines for seamless model deployment across development and production environments, ensuring consistent API responses.",
        "Implemented logging and error-handling mechanisms in real-time NLP systems using ELK Stack, reducing system downtime by 25%."
      ]
    }
  ],
  "projects": [
    {
      "name": "Automated ML Pipeline for Predictive Maintenance in Autonomous Vehicles",
      "company": "XYZ Corp",
      "description": "Developed a real-time object detection pipeline for predicting maintenance issues in autonomous vehicles using YOLOv5 and TensorFlow. Integrated Airflow for orchestrating tasks such as model training, validation, and deployment on AWS Lambda, enabling real-time updates to the model with minimal downtime. Monitored model drift and performance using Prometheus and automated retraining when accuracy dropped, ensuring model precision stayed above 90%."
    },
    {
      "name": "Real-time Fraud Detection System Using Generative AI",
      "company": "DataTech Solutions",
      "description": "Built a fraud detection system that utilized variational autoencoders (VAEs) to detect anomalies in real-time transaction data streams. Deployed the model as a microservice on Kubernetes, leveraging horizontal scaling to support high-traffic environments. Used MLflow for model versioning and Jenkins to automate CI/CD workflows for model updates. The system achieved a fraud detection rate of 97%, significantly improving upon existing rule-based systems."
    },
    {
      "name": "Generative Image Synthesis Pipeline",
      "company": "XYZ Corp",
      "description": "Developed a GAN-based image synthesis pipeline for augmenting training datasets in computer vision projects, leading to a 15% improvement in model performance. Deployed the pipeline on GCP AI Platform with TensorFlow and Kubernetes, allowing on-demand image generation to reduce model training times. Used Argo Workflows for orchestrating multi-step data preprocessing, model training, and deployment, ensuring a seamless integration into existing MLOps infrastructure."
    }
  ],
  "open_source_contributions": [
    {
      "project": "Kubeflow",
      "contribution": "Contributed to the development of custom operators for scaling computer vision pipelines on Kubernetes. These contributions improved model training times by 20% in distributed environments."
    },
    {
      "project": "MLflow",
      "contribution": "Developed extensions for tracking and visualizing GAN training metrics, including loss curves and image quality metrics like FID scores."
    },
    {
      "project": "TensorFlow Hub",
      "contribution": "Created custom pre-trained models for image classification and segmentation, available for public use. These models have been downloaded over 5,000 times and are actively used in the open-source community."
    }
  ],
  "education": {
    "degree": "Bachelor of Science in Computer Science",
    "institution": "University of California, Berkeley",
    "graduation_year": "2020",
    "relevant_courses": [
      "Machine Learning",
      "Deep Learning",
      "Computer Vision",
      "Cloud Computing",
      "Distributed Systems"
    ],
    "extracurriculars": [
      "Machine Learning Club",
      "Generative AI Research Group",
      "Hackathons"
    ]
  },
  "certifications": [
    {
      "name": "AWS Certified Solutions Architect – Associate",
      "issued": "May 2023"
    },
    {
      "name": "Certified Kubernetes Administrator (CKA)",
      "issued": "September 2022"
    },
    {
      "name": "TensorFlow Developer Certification",
      "issued": "March 2022"
    },
    {
      "name": "Google Cloud Professional Data Engineer",
      "issued": "February 2024"
    },
    {
      "name": "NVIDIA Deep Learning Institute – Computer Vision with PyTorch",
      "issued": "August 2023"
    }
  ],
  "publications_talks": [
    {
      "title": "Building and Deploying Computer Vision Models at Scale with TensorFlow and Kubernetes",
      "event": "O'Reilly AI Conference",
      "year": "2023"
    },
    {
      "title": "Generative AI in Real-World Applications: Challenges and Solutions",
      "platform": "Medium",
      "views": "20,000+"
    },
    {
      "title": "Optimizing Deep Learning Workflows with Airflow and MLflow",
      "event": "PyData Conference",
      "year": "2023"
    }
  ],
  "volunteer_experience": [
    {
      "organization": "AI for Good Hackathon",
      "role": "Mentor",
      "description": "Mentored teams in designing and deploying computer vision models for healthcare applications, including X-ray image classification for COVID-19 detection."
    },
    {
      "organization": "Women Who Code",
      "role": "Workshop Leader",
      "description": "Conducted workshops on Generative AI with a focus on using GANs and VAEs for image synthesis."
    }
  ],
  "technical_proficiencies": {
    "operating_systems": ["Linux (Ubuntu, CentOS)", "Windows"],
    "databases": ["MySQL", "PostgreSQL", "MongoDB"],
    "version_control": ["Git", "Bitbucket"]
  },
  "references": "Available upon request."
}

In [7]:
import pandas as pd
# Load the scraped MLOps job postings; the scoring cells add their
# relevancy-score columns to this frame.
jobs_csv_path = "Scraped Jobs MLOps.csv"
df = pd.read_csv(jobs_csv_path)

In [16]:
# Render the updated resume JSON to a PDF held in a buffer.
# NOTE(review): `generate_resume_from_json` and `updated_json` are not defined
# in the cells visible here — confirm they exist before this cell runs.
pdf_buffer = generate_resume_from_json(updated_json)

# Write the buffer's contents to disk; binary mode because the payload is the
# raw PDF content returned by getvalue().
output_filename = "Generated_Resume_Updated.pdf"
with open(output_filename, "wb") as pdf_file:
    pdf_bytes = pdf_buffer.getvalue()
    pdf_file.write(pdf_bytes)

In [1]:
# Misc

In [15]:
# Plain-text copy of the earlier resume; the scoring cell uses it to fill the
# 'Old Resume Relevancy Score' column.
# NOTE(review): the text begins with a lone "1" line and stops right after the
# third project's company line ("XYZ Corp") with no description or later
# sections — it looks like truncated extracted text; confirm this is the
# intended baseline.
old_resume = """
1
John Anderson

Email: john.anderson@gmail.com | Phone: (555) 555-1234 | LinkedIn: linkedin.com/in/johnanderson |
GitHub: github.com/johndevml | Location: San Francisco, CA

Professional Summary

MLOps Engineer with 2+ years of experience in deploying and managing machine learning models,
computer vision systems, and generative AI models in production. Proficient in automating end-to-end
machine learning pipelines and integrating advanced AI solutions using cutting-edge tools like Docker,
Kubernetes, TensorFlow, PyTorch, and MLflow. Strong expertise in scaling AI systems using cloud
platforms (AWS, GCP), and optimizing deep learning models for real-time inference. Adept at
integrating MLOps best practices, such as CI/CD pipelines and monitoring frameworks, to improve
model robustness and scalability in production environments. Experienced in working with GANs and
other generative models for various applications in image synthesis and data augmentation.

Skills

Mlops tools:

Docker, Kubernetes, Jenkins, MLflow, Airflow, TensorBoard, Argo Workflows

Machine learning:

Supervised/Unsupervised Learning, Model Deployment, Hyperparameter Tuning

Computer vision:

OpenCV, TensorFlow, PyTorch, YOLO, Faster R-CNN, Mask R-CNN

Generative ai:

GANs, Variational Autoencoders (VAEs), DALL-E, Stable Diffusion

Cloud platforms:

AWS (EC2, S3, Lambda, SageMaker), GCP (AI Platform, Compute Engine)

Programming languages:

Python, Bash, SQL, C++

Version control ci cd:

Git, GitLab CI, Jenkins, CircleCI, GitHub Actions

Containerization orchestration:

Docker, Kubernetes

Data engineering:

Apache Kafka, Apache Spark, Hadoop

Monitoring logging:

Prometheus, Grafana, ELK Stack

Professional Experience

MLOps Engineer

XYZ Corp – San Francisco, CA

June 2022 – Present

• Architected and deployed real-time object detection models for autonomous vehicle systems, using
TensorFlow and YOLOv5, enabling the detection of pedestrians and vehicles with 95% accuracy.

• Built and optimized deep learning pipelines for computer vision tasks, including image classification
and segmentation, using Kubernetes for large-scale deployment on AWS.
• Automated the deployment and retraining of generative models, such as GANs for synthetic image
generation, improving the model development lifecycle by 30%.

• Developed a CI/CD framework using Jenkins and MLflow to automate the training and deployment of
computer vision models, reducing deployment time from weeks to days.

• Implemented GPU acceleration in model inference pipelines on AWS SageMaker, leading to a 50%
reduction in processing time for complex computer vision models.

• Integrated TensorBoard and Prometheus for real-time model performance monitoring, ensuring model
accuracy and reducing drift in production by 20%.

Junior MLOps Engineer

DataTech Solutions – Los Angeles, CA

August 2021 – June 2022

• Designed and maintained automated pipelines for the deployment of generative AI models (e.g.,
DCGANs) to enhance datasets through synthetic data generation.

• Containerized machine learning models for natural language processing (NLP) tasks such as text
classification and summarization using Docker and Kubernetes.

• Led the deployment of computer vision models for image recognition in retail environments, which
improved product identification accuracy by 15%.

• Collaborated with data science teams to implement transfer learning for custom object detection
tasks, shortening the model development cycle by 40%.

• Created TensorFlow Serving pipelines for seamless model deployment across development and
production environments, ensuring consistent API responses.

• Implemented logging and error-handling mechanisms in real-time NLP systems using ELK Stack,
reducing system downtime by 25%.

Projects

Automated ML Pipeline for Predictive Maintenance in Autonomous Vehicles

XYZ Corp

Developed a real-time object detection pipeline for predicting maintenance issues in autonomous
vehicles using YOLOv5 and TensorFlow. Integrated Airflow for orchestrating tasks such as model
training, validation, and deployment on AWS Lambda, enabling real-time updates to the model with
minimal downtime. Monitored model drift and performance using Prometheus and automated retraining
when accuracy dropped, ensuring model precision stayed above 90%.

Real-time Fraud Detection System Using Generative AI

DataTech Solutions

Built a fraud detection system that utilized variational autoencoders (VAEs) to detect anomalies in
real-time transaction data streams. Deployed the model as a microservice on Kubernetes, leveraging
horizontal scaling to support high-traffic environments. Used MLflow for model versioning and Jenkins
to automate CI/CD workflows for model updates. The system achieved a fraud detection rate of 97%,
significantly improving upon existing rule-based systems.

Generative Image Synthesis Pipeline

XYZ Corp
"""

In [9]:
# Plain-text copy of the revised resume; the scoring cell uses it to fill the
# 'Resume Relevancy Score' column.
# NOTE(review): the text opens with "Ralf Kendal" and a lone "1" before the
# actual name "John Anderson" — presumably leftovers from text extraction.
# They are part of the string passed to the scorer, so confirm whether they
# should stay.
resume = """Ralf Kendal

1
John Anderson

Email: john.anderson@gmail.com | Phone: (555) 555-1234 | LinkedIn: linkedin.com/in/johnanderson |
GitHub: github.com/johndevml | Location: India

Professional Summary

Senior MLOps Engineer with 7+ years of experience in deploying, managing, and optimizing machine
learning pipelines and systems at scale. Expertise in building and scaling AI solutions using Docker,
Kubernetes, and cloud platforms like AWS and GCP. Skilled in automating end-to-end MLOps
workflows, implementing CI/CD pipelines, and leveraging advanced AI tools including TensorFlow and
PyTorch. Proven track record in ensuring model performance and reliability through real-time
monitoring and optimization, with a focus on problem-solving and continuous improvement.

Skills

Mlops tools:

Docker, Kubernetes, Jenkins, MLflow, Airflow, Argo Workflows, Terraform, Ansible

Machine learning:

Supervised/Unsupervised Learning, Model Deployment, Model Performance Monitoring

Cloud platforms:

AWS (EC2, S3, Lambda, SageMaker, EMR, Kinesis, SQS, SNS), GCP (AI Platform, Compute Engine)

Programming languages:

Python, SQL

Version control ci cd:

Git, Jenkins, GitHub Actions, TravisCI, Bamboo

Data engineering:

Apache Spark, Airflow

Professional Experience

MLOps Engineer

XYZ Corp – India

June 2022 – Present

• Architected and deployed real-time object detection models for autonomous vehicle systems, using
TensorFlow and YOLOv5, with a focus on scalability and performance.

• Built and optimized deep learning pipelines on AWS using Kubernetes, enhancing model deployment
efficiency and scalability.

• Automated deployment and retraining of generative models, including GANs, improving the model
development lifecycle.

• Developed CI/CD frameworks with Jenkins and MLflow, reducing deployment times and ensuring
reliable and maintainable production systems.

• Implemented GPU acceleration in model inference pipelines on AWS SageMaker, optimizing
processing times and model performance.

• Integrated TensorBoard and Prometheus for real-time performance monitoring, ensuring model
accuracy and operational reliability.
Junior MLOps Engineer

DataTech Solutions – India

August 2021 – June 2022

• Designed and managed automated pipelines for deploying generative AI models, enhancing datasets
through synthetic data generation.

• Containerized NLP models using Docker and Kubernetes for scalable deployment.

• Led deployment of computer vision models, improving accuracy and operational efficiency.

• Implemented transfer learning for object detection tasks, accelerating the model development
process.

• Created TensorFlow Serving pipelines for consistent and scalable model deployment.

• Implemented logging and error-handling mechanisms using ELK Stack, reducing system downtime.

Projects

Automated ML Pipeline for Predictive Maintenance in Autonomous Vehicles

XYZ Corp

Developed a real-time object detection pipeline using YOLOv5 and TensorFlow for predicting
maintenance issues. Integrated Airflow for orchestrating model training and deployment on AWS
Lambda, ensuring high availability and minimal downtime.

Real-time Fraud Detection System Using Generative AI

DataTech Solutions

Built a fraud detection system utilizing VAEs for real-time anomaly detection. Deployed on Kubernetes
with CI/CD automation using Jenkins, achieving high accuracy and scalability.

Generative Image Synthesis Pipeline

XYZ Corp

Developed a GAN-based image synthesis pipeline to augment training datasets, deployed on GCP AI
Platform with TensorFlow and Kubernetes, improving model performance and training efficiency.

Open Source Contributions

Kubeflow

Developed custom operators for scaling computer vision pipelines on Kubernetes.

MLflow

Created extensions for tracking and visualizing GAN training metrics.

TensorFlow Hub

Developed pre-trained models for image classification and segmentation.

"""

In [10]:
from resumeRelevancyScore import RelevanceScorer
# Single scorer instance reused by the scoring cells that follow.
# NOTE(review): "relevence" is a misspelling of "relevance", but the scoring
# cells reference this exact name, so it is left unchanged here.
resume_relevence_scorer = RelevanceScorer()



In [13]:
%%time
def _score_against_resume(job_description):
    """Return the scorer's relevance score for `resume` versus one job description."""
    return resume_relevence_scorer.calculate_relevance_score(resume, job_description)


# One score per posting, stored next to the posting it belongs to.
df['Resume Relevancy Score'] = df['Job Descriptions'].apply(_score_against_resume)

CPU times: total: 12 s
Wall time: 3.69 s


In [16]:
%%time
def _score_against_old_resume(job_description):
    """Return the scorer's relevance score for `old_resume` versus one job description."""
    return resume_relevence_scorer.calculate_relevance_score(old_resume, job_description)


# Baseline score per posting, for comparison with 'Resume Relevancy Score'.
df['Old Resume Relevancy Score'] = df['Job Descriptions'].apply(_score_against_old_resume)

CPU times: total: 12.3 s
Wall time: 3.58 s


In [17]:
# Display the postings together with the two relevancy-score columns added by
# the scoring cells.
df

Unnamed: 0,Job Title,Job Post Url,Company Name,Location,Job ID,Job Descriptions,Resume Relevancy Score,Old Resume Relevancy Score
0,Senior Machine Learning Engineer,https://www.linkedin.com/jobs/view/4007688246/...,Andela,India (Remote),4007688246,Senior MLOps Engineer\nAndela\nLocation Requir...,71.73,68.06
1,Generative AI Engineer,https://www.linkedin.com/jobs/view/4009701610/...,Deloitte,"Bengaluru, Karnataka, India (Hybrid)",4009701610,"Hi, We are looking for Candidates who are havi...",74.05,73.45
2,"Applied Scientist, International Machine Learning",https://www.linkedin.com/jobs/view/3877288573/...,Amazon,"Bengaluru, Karnataka, India",3877288573,Description\n\nDo you want to join an innovati...,73.64,75.78
3,Machine Learning Specialist,https://www.linkedin.com/jobs/view/4012120273/...,Cloud4C Services,"Hyderabad, Telangana, India (On-site)",4012120273,DevOPs / MLOPs engineer\nKey Responsibilities\...,78.54,75.79
4,"Machine Learning Engineer, AI/ML, Search & Dis...",https://www.linkedin.com/jobs/view/4023072153/...,Uplers,India (Remote),4023072153,Experience: 3.00 + years\n\nSalary: INR 629439...,69.11,63.76
5,Data and Applied Scientist II,https://www.linkedin.com/jobs/view/4011475232/...,Microsoft,"Jammu & Kashmir, India (Hybrid)",4011475232,Microsoft’s Cloud business is experiencing exp...,70.38,68.06
6,MLOps Engineer,https://www.linkedin.com/jobs/view/3991631201/...,C5i,"Bengaluru, Karnataka, India (On-site)",3991631201,C5i\nC5i is a pure-play AI & Analytics provide...,62.34,63.77
7,Cloud Ops with AI/ML,https://www.linkedin.com/jobs/view/3959690795/...,Siemens,"Bengaluru, Karnataka, India (On-site)",3959690795,Hello Visionary!\n\nWe empower our people to s...,75.54,72.15
8,"Manager II- ML Data Operations, GO-AI",https://www.linkedin.com/jobs/view/4010115141/...,Amazon,"Hyderabad, Telangana, India",4010115141,Description\n\nWant to join the Earth’s most c...,71.39,70.33
9,Senior Machine Learning (ML) Engineer,https://www.linkedin.com/jobs/view/3754623735/...,Clario,"Bengaluru, Karnataka, India (Hybrid)",3754623735,ML Engineer having 5+ years Experience with Ma...,79.83,84.82
