In [1]:
# ✅ Load functions
from keyword_matcher import extract_keywords, compute_keyword_match
from parsing_module import extract_text_pdfplumber, split_resume_into_sections
from llm_enhancer import enhance_summary_with_gpt, enhance_skills_with_gpt, enhance_experience_job, build_experience_prompt
from experience_splitter import split_experience_section, parse_job_entry


In [2]:
# ✅ Load and parse resume PDF
resume_text = extract_text_pdfplumber("docs/sample_resume.pdf")
sections = split_resume_into_sections(resume_text)
summary_text = sections.get("summary", "")
full_resume_text = resume_text.lower()  # for keyword matching


In [3]:
# ✅ Sample job description (paste your real one if needed)
job_posting = """
People Data Analyst:

As a People Data Analyst, you will play a critical role in CAVA’s People & Culture function, specifically within the Total Rewards team. This role is responsible for producing regular reporting and data analysis, key in supporting strategic decision-making across People & Culture, while also collaborating with cross-functional teams across the organization. Your insights will help drive equitable, data-driven, and competitive strategies to attract and retain top talent. This role will provide data backed recommendations to help drive workforce strategy and support industry best practices.



What You’ll Do: 

Develop Periodic Reporting: Assist in creating and enhancing daily reporting to support various business areas.
Audit our People Data: Transform raw data so that it can be used in creating reports, maintaining reports, and summarizing results associated with our audits.
Interpret our People Data: Identify trends in data, comparing to both internal and external benchmarks.
Collaborate with Talent Acquisition & HR: Partner with recruiting and HR teams to merge data from outside of our HRIS systems to provide new insights and assist in creating new metrics.
Assist in Cross-Functional Analysis: Develop expertise in the organization’s people data and how it can be leveraged across other areas of the organization.
Maintain People Analytics Dashboards: Assist in dashboard maintenance and development.
Measure and Track Impact: Identify dates associated with initiatives to inform the business of the results of initiatives.


The Qualifications:

Bachelor’s degree in Human Resources, Business, Finance, Statistics, or a related field.
2+ years of experience in HR analytics, or data analysis in a corporate environment.
Proficiency in Excel (advanced), HRIS systems, and data visualization tools (e.g., Tableau, Power BI).
Experience working with SQL, Python, or another programming language preferred.
"""

# ✅ Compute match result and extract missing keywords
match_result = compute_keyword_match(full_resume_text, job_posting)
missing_keywords = match_result["missing_keywords"]
print("🧩 Missing Keywords:", missing_keywords)


🧩 Missing Keywords: ['acquisition', 'audit', 'benchmark', 'collaborate', 'competitive', 'corporate', 'degree', 'hris', 'maintain', 'maintenance', 'recruiting', 'strategy', 'talent', 'tool']


In [4]:
# ✅ Run Summary Enhancement
print("\n🧠 Original Summary:\n", summary_text)

enhanced_summary = enhance_summary_with_gpt(summary_text, missing_keywords)

print("\n✨ Enhanced Summary:\n", enhanced_summary)



🧠 Original Summary:
 Federal Data Analyst with 4+ years in human capital analytics, data-driven decision-making, and workforce planning. Skilled
in SQL, Python, Tableau, and Power BI, with a track record of optimizing HR processes through data analysis, reporting
automation, and visualization.

✨ Enhanced Summary:
 Corporate Federal Data Analyst with a degree and 4+ years of experience in human capital analytics, talent acquisition, and workforce strategy. Proficient in SQL, Python, HRIS, Tableau, and Power BI. Demonstrated ability to collaborate on audits, maintain benchmark standards, and enhance competitive recruiting through data-driven decision-making, reporting automation, and visualization tool maintenance.


In [5]:
# ✅ Run Skills Enhancement
skills_text = sections.get("skills", "")
print("\n📋 Original Skills:\n", skills_text)

enhanced_skills = enhance_skills_with_gpt(skills_text, missing_keywords)

print("\n🚀 Enhanced Skills:\n", enhanced_skills)



📋 Original Skills:
 ● Data Analytics & Visualization: SQL · Python · Tableau · Power BI · Advanced Excel · Advanced MS Office Suite
● Human Capital & Workforce Analytics: HR Metrics · Hiring Pipeline Analytics · Employee Retention Analysis ·
Workforce Planning
● Data Management & Integrity: Data Mining · Data Cleaning · Quality Assurance · Database Management · Process
Optimization
● Reporting & Decision Support: Ad Hoc Reporting · Dashboard Development · Executive Presentations · Stakeholder
Communication
● Process Automation & Compliance: Workflow Automation · Data Privacy & Security · Federal HR Policy Compliance
● Strategic Insights & Decision Making: Data-Driven Recommendations · Trend Analysis · Large Dataset Processing ·
Proactive Problem-Solving

🚀 Enhanced Skills:
 ---
● Data Analytics & Visualization Tools: SQL · Python · Tableau · Power BI · Advanced Excel · Advanced MS Office Suite · HRIS
● Talent Acquisition & Workforce Strategy: HR Metrics · Hiring Pipeline Analytics · E

In [6]:
from llm_enhancer import enhance_experience_job, build_experience_prompt

# Grab one parsed job entry (assuming you already split it earlier)
from experience_splitter import split_experience_section, parse_job_entry

# Pull and parse the experience section
experience_text = sections.get("experience", "")
experience_chunks = split_experience_section(experience_text)

# Choose one job to test
sample_job_chunk = experience_chunks[0]
parsed_job = parse_job_entry(sample_job_chunk)

# Enhance the parsed job
enhanced_job = enhance_experience_job(parsed_job, missing_keywords, job_posting)

# Print result
from pprint import pprint
print("\n✨ Enhanced Experience Entry:\n")
pprint(enhanced_job)



✨ Enhanced Experience Entry:

{'bullets': ['Leveraged data mining to extract critical human capital '
             'information, supporting strategic decision-making and talent '
             'acquisition strategies across various divisions.',
             'Designed an Excel VBA-based incentive tracking tool, integrating '
             'engagement analysis to assess award effectiveness, improving '
             'data accuracy by 85% and enhancing data-driven decision-making.',
             'Developed a Python-based payroll tracking system, integrating '
             'multiple fund sources and leveraging SQL for data extraction, '
             'reducing reconciliation time by ~2 hours/month and improving '
             'payroll forecasting accuracy.',
             'Collaborated with cross-functional teams to optimize '
             'SharePoint-based data management processes, enhancing workflow '
             'automation and document version control for financial reporting.',
         

In [7]:
# Parse and enhance each job entry
enhanced_jobs = []
for chunk in experience_chunks:
    parsed_job = parse_job_entry(chunk)
    enhanced_job = enhance_experience_job(parsed_job, missing_keywords, job_posting)
    enhanced_jobs.append(enhanced_job)

# Preview results
from pprint import pprint
for job in enhanced_jobs:
    print("\n📌", job["title"], "at", job["company"], job["date_range"])
    pprint(job["bullets"])


📌 Budget Analyst at Substance Abuse and Mental Health Administration, Department of HHS Dec '23 - Mar '25
['Leveraged data mining to extract critical human capital information, '
 'supporting strategic decision-making and talent acquisition evaluations '
 'across divisions; enhanced workforce planning through comprehensive data '
 'analysis.',
 'Designed an Excel VBA-based tool for tracking incentives, integrating '
 'engagement analysis and survey design to evaluate award effectiveness; '
 'automated validation checks and dynamic data processing workflows increased '
 'data accuracy by 85%.',
 'Developed a real-time Python-based payroll tracking system, integrating '
 'multiple fund sources and lines of accounting; utilized SQL for data '
 'extraction and pandas for analysis, reducing reconciliation time and '
 'improving payroll forecasting accuracy.',
 'Optimized SharePoint-based data management processes, enhancing workflow '
 'automation and document version control for financial

In [8]:
# Import the formatter utilities
from resume_formatter import format_experience_section, assemble_resume

# Format the experience section using your enhanced jobs
formatted_experience = format_experience_section(enhanced_jobs)

# Assemble the full resume using enhanced summary, skills, experience, and education
final_resume = assemble_resume(
    summary=enhanced_summary,
    skills=enhanced_skills,
    experience=formatted_experience,
    education=sections.get("education", "Available upon request")  # fallback if missing
)

# Print the final resume for review
print(final_resume)



SUMMARY
-------
Corporate Federal Data Analyst with a degree and 4+ years of experience in human capital analytics, talent acquisition, and workforce strategy. Proficient in SQL, Python, HRIS, Tableau, and Power BI. Demonstrated ability to collaborate on audits, maintain benchmark standards, and enhance competitive recruiting through data-driven decision-making, reporting automation, and visualization tool maintenance.

SKILLS
------
---
● Data Analytics & Visualization Tools: SQL · Python · Tableau · Power BI · Advanced Excel · Advanced MS Office Suite · HRIS
● Talent Acquisition & Workforce Strategy: HR Metrics · Hiring Pipeline Analytics · Employee Retention Analysis · Workforce Planning · Recruiting · Benchmarking
● Data Management, Integrity & Maintenance: Data Mining · Data Cleaning · Quality Assurance · Database Management · Process Optimization · Audit
● Reporting, Decision Support & Competitive Insights: Ad Hoc Reporting · Dashboard Development · Executive Presentations · Stak