In [3]:
from io import BytesIO
from xml.sax.saxutils import escape

from reportlab.lib import colors
from reportlab.lib.pagesizes import LETTER
from reportlab.lib.styles import getSampleStyleSheet
from reportlab.platypus import SimpleDocTemplate, Paragraph, Spacer

In [8]:
def generate_resume_from_json(json_data, allow_markup=False):
    """Render a resume dictionary as a PDF and return it as an in-memory buffer.

    Sections are written in a fixed order: name, contact line, summary,
    skills, experience, projects, open source contributions, education,
    certifications, technical proficiencies, publications & talks, volunteer
    experience and references. Every section heading is always emitted; a
    missing or ``None`` section simply has no entries (or a placeholder where
    one is defined below).

    Args:
        json_data: Mapping with the optional keys ``name``, ``contact``,
            ``summary``, ``skills``, ``experience``, ``projects``,
            ``open_source_contributions``, ``education``, ``certifications``,
            ``technical_proficiencies``, ``publications_talks``,
            ``volunteer_experience`` and ``references``.
        allow_markup: When False (the default) every value taken from
            ``json_data`` is XML-escaped before it is placed inside a
            ``Paragraph``, so characters such as ``&`` and ``<`` are rendered
            literally instead of being parsed as paragraph markup. Pass True
            only if the data intentionally contains paragraph markup tags.

    Returns:
        The ``BytesIO`` buffer the document was built into, rewound to
        offset 0.
    """
    buffer = BytesIO()
    pdf = SimpleDocTemplate(buffer, pagesize=LETTER)
    styles = getSampleStyleSheet()
    content = []

    def text(value, default=''):
        """Return ``value`` (or ``default`` when it is None) as paragraph-safe text."""
        if value is None:
            value = default
        value = str(value)
        return value if allow_markup else escape(value)

    def joined(values):
        """Comma-join a list of values; a lone string counts as one item."""
        if values is None:
            return ''
        if isinstance(values, str):
            # Joining a bare string would split it into single characters.
            values = [values]
        return ", ".join(text(item) for item in values)

    def label(key):
        """Turn a snake_case key such as ``mlops_tools`` into ``Mlops tools``."""
        return text(str(key).replace('_', ' ').capitalize())

    def add(markup, style='Normal'):
        content.append(Paragraph(markup, styles[style]))

    def heading(title):
        add(f"<b>{title}</b>", 'Heading2')

    def gap():
        content.append(Spacer(1, 12))

    def publication_line(pub):
        """Format ``title, venue (detail)``, leaving out whichever parts are absent."""
        line = text(pub.get('title'))
        # Talks carry event/year; articles carry platform/views instead.
        venue = pub.get('event') or pub.get('platform')
        if venue:
            line += f", {text(venue)}"
        if pub.get('year'):
            line += f" ({text(pub['year'])})"
        elif pub.get('views'):
            line += f" ({text(pub['views'])} views)"
        return line

    # Add Name
    add(f"<b>{text(json_data.get('name'), 'Your Name')}</b>", 'Title')

    # Add Contact Info (only the fields that are actually present)
    contact = json_data.get('contact') or {}
    contact_fields = (
        ('Email', 'email'),
        ('Phone', 'phone'),
        ('LinkedIn', 'linkedin'),
        ('GitHub', 'github'),
        ('Location', 'location'),
    )
    add(" | ".join(
        f"{field_label}: {text(contact[key])}"
        for field_label, key in contact_fields
        if contact.get(key)
    ))
    gap()

    # Add Summary
    heading("Professional Summary")
    add(text(json_data.get('summary'), 'Summary not provided'))
    gap()

    # Add Skills
    heading("Skills")
    for skill_category, skill_list in (json_data.get('skills') or {}).items():
        add(f"<b>{label(skill_category)}:</b>")
        add(joined(skill_list))
    gap()

    # Add Experience
    heading("Professional Experience")
    for job in json_data.get('experience') or []:
        add(f"<b>{text(job.get('title'))}</b>", 'Heading3')
        add(f"{text(job.get('company'))} – {text(job.get('location'))}")
        add(text(job.get('duration')))
        for responsibility in job.get('responsibilities') or []:
            add(f"• {text(responsibility)}")
        gap()

    # Add Projects
    heading("Projects")
    for project in json_data.get('projects') or []:
        add(f"<b>{text(project.get('name'))}</b>", 'Heading3')
        add(text(project.get('company')))
        add(text(project.get('description')))
        gap()

    # Add Open Source Contributions
    heading("Open Source Contributions")
    for contrib in json_data.get('open_source_contributions') or []:
        add(f"<b>{text(contrib.get('project'))}</b>", 'Heading3')
        add(text(contrib.get('contribution')))
        gap()

    # Add Education
    heading("Education")
    education = json_data.get('education') or {}
    add(text(education.get('degree'), 'Degree not provided'), 'Heading3')
    add(text(education.get('institution'), 'Institution not provided'))
    add(f"Graduation Year: {text(education.get('graduation_year'))}")
    add(f"Relevant Courses: {joined(education.get('relevant_courses'))}")
    if education.get('extracurriculars'):
        add(f"Extracurriculars: {joined(education['extracurriculars'])}")
    gap()

    # Add Certifications
    heading("Certifications")
    for cert in json_data.get('certifications') or []:
        add(f"{text(cert.get('name'))}, Issued: {text(cert.get('issued'))}")
    gap()

    # Add Technical Proficiencies
    heading("Technical Proficiencies")
    for category, profs in (json_data.get('technical_proficiencies') or {}).items():
        add(f"{label(category)}: {joined(profs)}")
    gap()

    # Add Publications & Talks (the ampersand must be an entity inside markup)
    heading("Publications &amp; Talks")
    for pub in json_data.get('publications_talks') or []:
        add(publication_line(pub))
    gap()

    # Add Volunteer Experience
    heading("Volunteer Experience")
    for exp in json_data.get('volunteer_experience') or []:
        add(f"{text(exp.get('organization'))} - {text(exp.get('role'))}")
        add(text(exp.get('description')))
    gap()

    # Add References
    heading("References")
    add(text(json_data.get('references'), 'Available upon request.'))

    # Build PDF
    pdf.build(content)

    # Rewind so callers can read the PDF from the start.
    buffer.seek(0)
    return buffer

In [9]:
# Sample resume payload; the following cell passes it to
# generate_resume_from_json() and saves the result as "Generated_Resume.pdf".
# Top-level keys: name, contact, summary, skills, experience, projects,
# open_source_contributions, education, certifications, publications_talks,
# volunteer_experience, technical_proficiencies, references.
json_data = {
  "name": "John Anderson",
  "contact": {
    "email": "john.anderson@gmail.com",
    "linkedin": "linkedin.com/in/johnanderson",
    "github": "github.com/johndevml",
    "phone": "(555) 555-1234",
    "location": "San Francisco, CA"
  },
  "summary": "MLOps Engineer with 2+ years of experience in deploying and managing machine learning models, computer vision systems, and generative AI models in production. Proficient in automating end-to-end machine learning pipelines and integrating advanced AI solutions using cutting-edge tools like Docker, Kubernetes, TensorFlow, PyTorch, and MLflow. Strong expertise in scaling AI systems using cloud platforms (AWS, GCP), and optimizing deep learning models for real-time inference. Adept at integrating MLOps best practices, such as CI/CD pipelines and monitoring frameworks, to improve model robustness and scalability in production environments. Experienced in working with GANs and other generative models for various applications in image synthesis and data augmentation.",
  "skills": {
    "mlops_tools": [
      "Docker",
      "Kubernetes",
      "Jenkins",
      "MLflow",
      "Airflow",
      "TensorBoard",
      "Argo Workflows"
    ],
    "machine_learning": [
      "Supervised/Unsupervised Learning",
      "Model Deployment",
      "Hyperparameter Tuning"
    ],
    "computer_vision": [
      "OpenCV",
      "TensorFlow",
      "PyTorch",
      "YOLO",
      "Faster R-CNN",
      "Mask R-CNN"
    ],
    "generative_ai": [
      "GANs",
      "Variational Autoencoders (VAEs)",
      "DALL-E",
      "Stable Diffusion"
    ],
    "cloud_platforms": [
      "AWS (EC2, S3, Lambda, SageMaker)",
      "GCP (AI Platform, Compute Engine)"
    ],
    "programming_languages": [
      "Python",
      "Bash",
      "SQL",
      "C++"
    ],
    "version_control_ci_cd": [
      "Git",
      "GitLab CI",
      "Jenkins",
      "CircleCI",
      "GitHub Actions"
    ],
    "containerization_orchestration": [
      "Docker",
      "Kubernetes"
    ],
    "data_engineering": [
      "Apache Kafka",
      "Apache Spark",
      "Hadoop"
    ],
    "monitoring_logging": [
      "Prometheus",
      "Grafana",
      "ELK Stack"
    ]
  },
  "experience": [
    {
      "title": "MLOps Engineer",
      "company": "XYZ Corp",
      "location": "San Francisco, CA",
      "duration": "June 2022 – Present",
      "responsibilities": [
        "Architected and deployed real-time object detection models for autonomous vehicle systems, using TensorFlow and YOLOv5, enabling the detection of pedestrians and vehicles with 95% accuracy.",
        "Built and optimized deep learning pipelines for computer vision tasks, including image classification and segmentation, using Kubernetes for large-scale deployment on AWS.",
        "Automated the deployment and retraining of generative models, such as GANs for synthetic image generation, improving the model development lifecycle by 30%.",
        "Developed a CI/CD framework using Jenkins and MLflow to automate the training and deployment of computer vision models, reducing deployment time from weeks to days.",
        "Implemented GPU acceleration in model inference pipelines on AWS SageMaker, leading to a 50% reduction in processing time for complex computer vision models.",
        "Integrated TensorBoard and Prometheus for real-time model performance monitoring, ensuring model accuracy and reducing drift in production by 20%."
      ]
    },
    {
      "title": "Junior MLOps Engineer",
      "company": "DataTech Solutions",
      "location": "Los Angeles, CA",
      "duration": "August 2021 – June 2022",
      "responsibilities": [
        "Designed and maintained automated pipelines for the deployment of generative AI models (e.g., DCGANs) to enhance datasets through synthetic data generation.",
        "Containerized machine learning models for natural language processing (NLP) tasks such as text classification and summarization using Docker and Kubernetes.",
        "Led the deployment of computer vision models for image recognition in retail environments, which improved product identification accuracy by 15%.",
        "Collaborated with data science teams to implement transfer learning for custom object detection tasks, shortening the model development cycle by 40%.",
        "Created TensorFlow Serving pipelines for seamless model deployment across development and production environments, ensuring consistent API responses.",
        "Implemented logging and error-handling mechanisms in real-time NLP systems using ELK Stack, reducing system downtime by 25%."
      ]
    }
  ],
  "projects": [
    {
      "name": "Automated ML Pipeline for Predictive Maintenance in Autonomous Vehicles",
      "company": "XYZ Corp",
      "description": "Developed a real-time object detection pipeline for predicting maintenance issues in autonomous vehicles using YOLOv5 and TensorFlow. Integrated Airflow for orchestrating tasks such as model training, validation, and deployment on AWS Lambda, enabling real-time updates to the model with minimal downtime. Monitored model drift and performance using Prometheus and automated retraining when accuracy dropped, ensuring model precision stayed above 90%."
    },
    {
      "name": "Real-time Fraud Detection System Using Generative AI",
      "company": "DataTech Solutions",
      "description": "Built a fraud detection system that utilized variational autoencoders (VAEs) to detect anomalies in real-time transaction data streams. Deployed the model as a microservice on Kubernetes, leveraging horizontal scaling to support high-traffic environments. Used MLflow for model versioning and Jenkins to automate CI/CD workflows for model updates. The system achieved a fraud detection rate of 97%, significantly improving upon existing rule-based systems."
    },
    {
      "name": "Generative Image Synthesis Pipeline",
      "company": "XYZ Corp",
      "description": "Developed a GAN-based image synthesis pipeline for augmenting training datasets in computer vision projects, leading to a 15% improvement in model performance. Deployed the pipeline on GCP AI Platform with TensorFlow and Kubernetes, allowing on-demand image generation to reduce model training times. Used Argo Workflows for orchestrating multi-step data preprocessing, model training, and deployment, ensuring a seamless integration into existing MLOps infrastructure."
    }
  ],
  "open_source_contributions": [
    {
      "project": "Kubeflow",
      "contribution": "Contributed to the development of custom operators for scaling computer vision pipelines on Kubernetes. These contributions improved model training times by 20% in distributed environments."
    },
    {
      "project": "MLflow",
      "contribution": "Developed extensions for tracking and visualizing GAN training metrics, including loss curves and image quality metrics like FID scores."
    },
    {
      "project": "TensorFlow Hub",
      "contribution": "Created custom pre-trained models for image classification and segmentation, available for public use. These models have been downloaded over 5,000 times and are actively used in the open-source community."
    }
  ],
  "education": {
    "degree": "Bachelor of Science in Computer Science",
    "institution": "University of California, Berkeley",
    "graduation_year": "2020",
    "relevant_courses": [
      "Machine Learning",
      "Deep Learning",
      "Computer Vision",
      "Cloud Computing",
      "Distributed Systems"
    ],
    "extracurriculars": [
      "Machine Learning Club",
      "Generative AI Research Group",
      "Hackathons"
    ]
  },
  "certifications": [
    {
      "name": "AWS Certified Solutions Architect – Associate",
      "issued": "May 2023"
    },
    {
      "name": "Certified Kubernetes Administrator (CKA)",
      "issued": "September 2022"
    },
    {
      "name": "TensorFlow Developer Certification",
      "issued": "March 2022"
    },
    {
      "name": "Google Cloud Professional Data Engineer",
      "issued": "February 2024"
    },
    {
      "name": "NVIDIA Deep Learning Institute – Computer Vision with PyTorch",
      "issued": "August 2023"
    }
  ],
  # NOTE: entries here are not uniform -- the second one carries
  # "platform"/"views" where the others carry "event"/"year".
  "publications_talks": [
    {
      "title": "Building and Deploying Computer Vision Models at Scale with TensorFlow and Kubernetes",
      "event": "O'Reilly AI Conference",
      "year": "2023"
    },
    {
      "title": "Generative AI in Real-World Applications: Challenges and Solutions",
      "platform": "Medium",
      "views": "20,000+"
    },
    {
      "title": "Optimizing Deep Learning Workflows with Airflow and MLflow",
      "event": "PyData Conference",
      "year": "2023"
    }
  ],
  "volunteer_experience": [
    {
      "organization": "AI for Good Hackathon",
      "role": "Mentor",
      "description": "Mentored teams in designing and deploying computer vision models for healthcare applications, including X-ray image classification for COVID-19 detection."
    },
    {
      "organization": "Women Who Code",
      "role": "Workshop Leader",
      "description": "Conducted workshops on Generative AI with a focus on using GANs and VAEs for image synthesis."
    }
  ],
  "technical_proficiencies": {
    "operating_systems": ["Linux (Ubuntu, CentOS)", "Windows"],
    "databases": ["MySQL", "PostgreSQL", "MongoDB"],
    "version_control": ["Git", "Bitbucket"]
  },
  "references": "Available upon request."
}

In [None]:
# Render the sample resume into an in-memory PDF buffer
pdf_buffer = generate_resume_from_json(json_data)

# Persist the buffer to disk; binary mode because the payload is raw PDF bytes
output_filename = "Generated_Resume.pdf"
with open(output_filename, mode="wb") as f:
    f.write(pdf_buffer.getvalue())

In [12]:
# Load "Scraped Jobs MLOps.csv" (path is relative to the kernel's working
# directory) into a DataFrame -- presumably scraped MLOps job postings,
# judging by the file name; confirm against the data source.
# NOTE(review): no later cell visible here reads `df`; confirm it is still needed.
import pandas as pd
df = pd.read_csv("Scraped Jobs MLOps.csv")

In [15]:
# Revised resume payload with the same top-level keys as `json_data`; the
# following cell renders it to "Generated_Resume_Updated.pdf".
# NOTE(review): presumably tailored to the scraped job postings loaded
# earlier -- the notebook does not show how this variant was derived; confirm.
updated_json = {
  "name": "John Anderson",
  "contact": {
    "email": "john.anderson@gmail.com",
    "linkedin": "linkedin.com/in/johnanderson",
    "github": "github.com/johndevml",
    "phone": "(555) 555-1234",
    "location": "India"
  },
  "summary": "Senior MLOps Engineer with 7+ years of experience in deploying, managing, and optimizing machine learning pipelines and systems at scale. Expertise in building and scaling AI solutions using Docker, Kubernetes, and cloud platforms like AWS and GCP. Skilled in automating end-to-end MLOps workflows, implementing CI/CD pipelines, and leveraging advanced AI tools including TensorFlow and PyTorch. Proven track record in ensuring model performance and reliability through real-time monitoring and optimization, with a focus on problem-solving and continuous improvement.",
  "skills": {
    "mlops_tools": [
      "Docker",
      "Kubernetes",
      "Jenkins",
      "MLflow",
      "Airflow",
      "Argo Workflows",
      "Terraform",
      "Ansible"
    ],
    "machine_learning": [
      "Supervised/Unsupervised Learning",
      "Model Deployment",
      "Model Performance Monitoring"
    ],
    "cloud_platforms": [
      "AWS (EC2, S3, Lambda, SageMaker, EMR, Kinesis, SQS, SNS)",
      "GCP (AI Platform, Compute Engine)"
    ],
    "programming_languages": [
      "Python",
      "SQL"
    ],
    "version_control_ci_cd": [
      "Git",
      "Jenkins",
      "GitHub Actions",
      "TravisCI",
      "Bamboo"
    ],
    "data_engineering": [
      "Apache Spark",
      "Airflow"
    ]
  },
  "experience": [
    {
      "title": "MLOps Engineer",
      "company": "XYZ Corp",
      "location": "India",
      "duration": "June 2022 – Present",
      "responsibilities": [
        "Architected and deployed real-time object detection models for autonomous vehicle systems, using TensorFlow and YOLOv5, with a focus on scalability and performance.",
        "Built and optimized deep learning pipelines on AWS using Kubernetes, enhancing model deployment efficiency and scalability.",
        "Automated deployment and retraining of generative models, including GANs, improving the model development lifecycle.",
        "Developed CI/CD frameworks with Jenkins and MLflow, reducing deployment times and ensuring reliable and maintainable production systems.",
        "Implemented GPU acceleration in model inference pipelines on AWS SageMaker, optimizing processing times and model performance.",
        "Integrated TensorBoard and Prometheus for real-time performance monitoring, ensuring model accuracy and operational reliability."
      ]
    },
    {
      "title": "Junior MLOps Engineer",
      "company": "DataTech Solutions",
      "location": "India",
      "duration": "August 2021 – June 2022",
      "responsibilities": [
        "Designed and managed automated pipelines for deploying generative AI models, enhancing datasets through synthetic data generation.",
        "Containerized NLP models using Docker and Kubernetes for scalable deployment.",
        "Led deployment of computer vision models, improving accuracy and operational efficiency.",
        "Implemented transfer learning for object detection tasks, accelerating the model development process.",
        "Created TensorFlow Serving pipelines for consistent and scalable model deployment.",
        "Implemented logging and error-handling mechanisms using ELK Stack, reducing system downtime."
      ]
    }
  ],
  "projects": [
    {
      "name": "Automated ML Pipeline for Predictive Maintenance in Autonomous Vehicles",
      "company": "XYZ Corp",
      "description": "Developed a real-time object detection pipeline using YOLOv5 and TensorFlow for predicting maintenance issues. Integrated Airflow for orchestrating model training and deployment on AWS Lambda, ensuring high availability and minimal downtime."
    },
    {
      "name": "Real-time Fraud Detection System Using Generative AI",
      "company": "DataTech Solutions",
      "description": "Built a fraud detection system utilizing VAEs for real-time anomaly detection. Deployed on Kubernetes with CI/CD automation using Jenkins, achieving high accuracy and scalability."
    },
    {
      "name": "Generative Image Synthesis Pipeline",
      "company": "XYZ Corp",
      "description": "Developed a GAN-based image synthesis pipeline to augment training datasets, deployed on GCP AI Platform with TensorFlow and Kubernetes, improving model performance and training efficiency."
    }
  ],
  "open_source_contributions": [
    {
      "project": "Kubeflow",
      "contribution": "Developed custom operators for scaling computer vision pipelines on Kubernetes."
    },
    {
      "project": "MLflow",
      "contribution": "Created extensions for tracking and visualizing GAN training metrics."
    },
    {
      "project": "TensorFlow Hub",
      "contribution": "Developed pre-trained models for image classification and segmentation."
    }
  ],
  "education": {
    "degree": "Bachelor of Science in Computer Science",
    "institution": "University of California, Berkeley",
    "graduation_year": "2020",
    "relevant_courses": [
      "Machine Learning",
      "Deep Learning",
      "Cloud Computing",
      "Distributed Systems"
    ]
  },
  "certifications": [
    {
      "name": "AWS Certified Solutions Architect – Associate",
      "issued": "May 2023"
    },
    {
      "name": "Certified Kubernetes Administrator (CKA)",
      "issued": "September 2022"
    },
    {
      "name": "TensorFlow Developer Certification",
      "issued": "March 2022"
    },
    {
      "name": "Google Cloud Professional Data Engineer",
      "issued": "February 2024"
    }
  ],
  "publications_talks": [
    {
      "title": "Building and Deploying Computer Vision Models at Scale with TensorFlow and Kubernetes",
      "event": "O'Reilly AI Conference",
      "year": "2023"
    },
    {
      "title": "Generative AI in Real-World Applications: Challenges and Solutions",
      "platform": "Medium",
      "views": "20,000+"
    },
    {
      "title": "Optimizing Deep Learning Workflows with Airflow and MLflow",
      "event": "PyData Conference",
      "year": "2023"
    }
  ],
  "volunteer_experience": [
    {
      "organization": "AI for Good Hackathon",
      "role": "Mentor",
      "description": "Mentored teams in designing and deploying computer vision models for healthcare applications."
    },
    {
      "organization": "Women Who Code",
      "role": "Workshop Leader",
      "description": "Conducted workshops on Generative AI with a focus on using GANs and VAEs for image synthesis."
    }
  ],
  "technical_proficiencies": {
    "operating_systems": ["Linux (Ubuntu, CentOS)", "Windows"],
    "databases": ["MySQL", "PostgreSQL"],
    "version_control": ["Git"]
  },
  "references": "Available upon request."
}


In [16]:
# Render the revised resume payload into an in-memory PDF buffer
pdf_buffer = generate_resume_from_json(updated_json)

# Persist the buffer to disk; binary mode because the payload is raw PDF bytes
output_filename = "Generated_Resume_Updated.pdf"
with open(output_filename, mode="wb") as f:
    f.write(pdf_buffer.getvalue())