In [None]:
# imports

import os
import requests
from dotenv import load_dotenv
from bs4 import BeautifulSoup
from IPython.display import Markdown, display
from openai import OpenAI

# If you get an error running this cell, then please head over to the troubleshooting notebook!

In [None]:
# Load environment variables from a file called .env
# (override=True lets values from .env replace ones already set in the process environment)

load_dotenv(override=True)
api_key = os.getenv('OPENAI_API_KEY')

# Check the key.
# The whitespace check runs BEFORE the prefix check: a key with leading spaces or tabs
# would otherwise fail startswith("sk-proj-") and be reported as a wrong-prefix problem,
# hiding the real cause.

if not api_key:
    print("No API key was found - please head over to the troubleshooting notebook in this folder to identify & fix!")
elif api_key.strip() != api_key:
    print("An API key was found, but it looks like it might have space or tab characters at the start or end - please remove them - see troubleshooting notebook")
elif not api_key.startswith("sk-proj-"):
    print("An API key was found, but it doesn't start sk-proj-; please check you're using the right key - see troubleshooting notebook")
else:
    print("API key found and looks good so far!")


In [None]:
# Create the OpenAI client used by the cells below; no arguments are passed explicitly.
# NOTE(review): presumably the client reads OPENAI_API_KEY from the environment loaded earlier - confirm against the OpenAI client docs.
openai = OpenAI()

# If this doesn't work, try Kernel menu >> Restart Kernel and Clear Outputs Of All Cells, then run the cells from the top of this notebook down.
# If it STILL doesn't work (horrors!) then please see the Troubleshooting notebook in this folder for full instructions

In [None]:
# Define our system prompt - you can experiment with this later, e.g. by appending a
# sentence such as "Respond in markdown in Spanish."

system_prompt = (
    "You are a high profile professional resume analyst and assist users with highlighting gaps "
    "in a very formed resume and provide direction to make the resume eye catching to the recruiters "
    "and employers."
)

# The user prompt is the task instructions followed by the raw resume text.
# The instructions are joined with explicit string concatenation rather than backslash
# line continuations inside the triple-quoted string: a continuation silently breaks if
# any whitespace follows the backslash, leaving a literal "\" in the prompt.

user_prompt = (
    "Analyze the resume details to do the following: "
    "1. Assess the resume to highlight areas of improvement. "
    "2. Create a well formed resume.\n"
    """
Name: Sam Burns

PROFESSIONAL SUMMARY
Experienced Data and AI Architect with over 10 years of expertise designing scalable data platforms, integrating cloud-native solutions, and deploying AI/ML systems across enterprise environments. Proven track record of aligning data architecture with business strategy, leading cross-functional teams, and delivering high-impact AI-driven insights.

CORE SKILLS

Data Architecture: Lakehouse, Data Mesh, Delta Lake, Data Vault

Cloud Platforms: Azure (Data Factory, Synapse, ML Studio), AWS (S3, Glue, SageMaker), Databricks

Big Data & Streaming: Spark, Kafka, Hive, Hadoop

ML/AI Tooling: MLflow, TensorFlow, Scikit-learn, Hugging Face Transformers

Programming: Python, SQL, PySpark, Scala, Terraform

DevOps: CI/CD (GitHub Actions, Azure DevOps), Docker, Kubernetes

Governance: Data Lineage, Cataloging, RBAC, GDPR, Responsible AI

PROFESSIONAL EXPERIENCE

Senior Data & AI Architect
ABC Tech Solutions — New York, NY
Jan 2021 – Present

Designed and implemented a company-wide lakehouse architecture on Databricks, integrating AWS S3, Redshift, and real-time ingestion from Kafka.

Led architecture for a predictive maintenance platform using sensor data (IoT), Spark streaming, and MLflow-managed experiments.

Developed enterprise ML governance framework ensuring reproducibility, fairness, and compliance with GDPR.

Mentored 6 data engineers and ML engineers; led architectural reviews and technical roadmap planning.

Data Architect / AI Specialist
Global Insights Inc. — Boston, MA
Jun 2017 – Dec 2020

Modernized legacy data warehouse to Azure Synapse-based analytics platform, reducing ETL latency by 40%.

Built MLOps pipelines for customer churn prediction models using Azure ML and ADF.

Collaborated with business units to define semantic layers for self-service analytics in Power BI.

Data Engineer
NextGen Analytics — Remote
Jul 2013 – May 2017

Developed ETL pipelines in PySpark to transform raw web traffic into structured analytics dashboards.

Integrated NLP models into customer support workflows using spaCy and early versions of Hugging Face.

Contributed to open-source tools for Jupyter-based analytics and data catalog integration.

EDUCATION
M.S. in Computer Science – Carnegie Mellon University
B.S. in Information Systems – Rutgers University

CERTIFICATIONS

Databricks Certified Data Engineer Professional

Azure Solutions Architect Expert

AWS Certified Machine Learning – Specialty

PROJECTS & CONTRIBUTIONS

llm_engineering (GitHub): Developed and maintained hands-on LLM course materials and community contributions framework.

Real-time AI PoC: Designed Kafka-Spark pipeline with Azure OpenAI Service for anomaly detection on IoT streams.

Contributor to Hugging Face Transformers – integration examples for inference pipelines
"""
)

In [None]:
# Chat history sent to the model: the system instructions first, then the user's request
messages = [
    dict(role="system", content=system_prompt),
    dict(role="user", content=user_prompt),
]

In [None]:
# Preview: send the system and user messages to OpenAI and keep the returned response

response = openai.chat.completions.create(
    messages=messages,
    model="gpt-4o-mini",
)

In [None]:
# Render the text of the first choice in the response as markdown in the Jupyter output

reply_markdown = response.choices[0].message.content
display(Markdown(reply_markdown))

# Sharing your code

I'd love it if you share your code afterwards so I can share it with others! You'll notice that some students have already made changes (including a Selenium implementation) which you will find in the community-contributions folder. If you'd like to add your changes to that folder, submit a Pull Request with your new versions in that folder and I'll merge your changes.

If you're not an expert with git (and I am not!) then GPT has given some nice instructions on how to submit a Pull Request. It's a bit of an involved process, but once you've done it once it's pretty clear. As a pro-tip: it's best if you clear the outputs of your Jupyter notebooks (Edit >> Clear Outputs of All Cells, and then Save) for clean notebooks.

Here are good instructions courtesy of an AI friend:  
https://chatgpt.com/share/677a9cb5-c64c-8012-99e0-e06e88afd293