In [None]:
%pip install pdfplumber

In [5]:
import pdfplumber
import re
import pandas as pd
import nltk
from nltk import word_tokenize, pos_tag, ne_chunk
from nltk.tree import Tree

# Ensure NLTK corpora are downloaded
nltk.download('punkt')
nltk.download('averaged_perceptron_tagger')
nltk.download('maxent_ne_chunker')
nltk.download('words')

def extract_name(text):
    """Extract name using Named Entity Recognition."""
    sentences = nltk.sent_tokenize(text)
    print(sentences)
    for sentence in sentences:
        tokens = nltk.word_tokenize(sentence)
        print(tokens)
        tags = nltk.pos_tag(tokens)
        print(tags)
        chunks = ne_chunk(tags)
        print(chunks)
        for chunk in chunks:
            if isinstance(chunk, Tree) and chunk.label() == 'PERSON':
                return " ".join(c[0] for c in chunk)
    return "Not Found"

def extract_email(text):
    """Extract email using regex."""
    email_match = re.search(r'[a-zA-Z0-9_.+-]+@[a-zA-Z0-9-]+\.[a-zA-Z0-9-.]+', text)
    print(email_match)
    print(email_match.group(0))
    return email_match.group(0) if email_match else "Not Found"

def extract_qualification(text):
    """Extract qualifications by matching common degree terms."""
    qualifications = re.findall(r'\b(B(?:\.|achelor)?|M(?:\.|aster)?|Ph\.?D|Diploma|High School|HSC|UG|PG|CS|Engineering|Science)\b', text, re.IGNORECASE)
    print(qualifications)
    return ", ".join(set(qualifications)) if qualifications else "Not Found"

def extract_resume_details_nltk(file_path):
    """Extract details using pdfplumber and NLTK."""
    with pdfplumber.open(file_path) as pdf:
        text = ""
        for page in pdf.pages:
            text += page.extract_text()
        print(text)
    
    name = extract_name(text)
    print(name)
    email = extract_email(text)
    print(email)
    qualification = extract_qualification(text)
    print(qualification)
    
    print({"Name": name, "Qualification": qualification, "Email": email})
    return {"Name": name, "Qualification": qualification, "Email": email}

# Process all resumes
resume_files = ["Resume01.pdf","Resume02.pdf"]  # List of resume file paths
resume_data = []
print(resume_files)
print(resume_data)

for file in resume_files:
    details = extract_resume_details_nltk(file)
    print(details)
    resume_data.append(details)
    print(resume_data)

print(resume_data)
# Convert to DataFrame and save as CSV
df = pd.DataFrame(resume_data)
print(df)
output_path = "extracted_resume_data_nltk.csv"
df.to_csv(output_path, index=False)

print(f"Data saved to {output_path}")


[nltk_data] Downloading package punkt to
[nltk_data]     C:\Users\DELL\AppData\Roaming\nltk_data...
[nltk_data]   Package punkt is already up-to-date!
[nltk_data] Downloading package averaged_perceptron_tagger to
[nltk_data]     C:\Users\DELL\AppData\Roaming\nltk_data...
[nltk_data]   Package averaged_perceptron_tagger is already up-to-
[nltk_data]       date!
[nltk_data] Downloading package maxent_ne_chunker to
[nltk_data]     C:\Users\DELL\AppData\Roaming\nltk_data...
[nltk_data]   Package maxent_ne_chunker is already up-to-date!
[nltk_data] Downloading package words to
[nltk_data]     C:\Users\DELL\AppData\Roaming\nltk_data...
[nltk_data]   Package words is already up-to-date!


['Resume01.pdf', 'Resume02.pdf']
[]
Dhanvand Srinivasan
Ux|Ui Designer
Education
Hsc
Daniel Thomas (2017 - 19)
61%
BSC - Cs
SRM University (2019 - 22)
First Class
About Me
Experience
A Creative Ux|Ui Designer In Creating
Intuitive And Visually Appealing User UX UI Designer Trainee
Experiences.Passionate About Designing Phygitalz advisory and solutions (Apr24 - Jly24)
Innovative Solutions. That Enhance User Oversaw all major Ai plants automation design & icons.
Engagement And Satisfaction. Seeking A
* OEE 4.0 * Traceabillty 4.0 * TLM 4.0
Challenging Position Where I Can Apply My
* PredictM 4.0 * ZeDQual 4.0 * Energy 4.0
Expertise And Contribute To Creating
Skills
Exceptional Digital Products.
* User Research
Course
* Persona Creation
* Write User Stories
Advanced Ux|Ui Designer
* Prepare Scope Document
* Create User Flow
Jan - May (2023)
* Build Information Architecture
* Paper & Digital Prototypes
Contact * Usability Testing
* Ui Design
9080146466
Software Skills
dhanvand333@gmail.com


In [1]:
x ="""
Dhanvand Srinivasan
Ux|Ui Designer
Contact
Course
A Creative Ux|Ui Designer In Creating
Intuitive And Visually Appealing User
Experiences.Passionate About Designing
Innovative Solutions. That Enhance User
Engagement And Satisfaction. Seeking A
Challenging Position Where I Can Apply My
Expertise And Contribute To Creating
Exceptional Digital Products.
About Me
9080146466
Jan - May (2023)
Advanced Ux|Ui Designer
dhanvand333@gmail.com
behance.net/dhanvand
linkedin.com/in/dhanvand-srinivasan-65530b275
Education
Hsc
BSC - Cs
UX UI Designer Trainee
61%
First Class
User Research
Oversaw all major Ai plants automation design & icons.
OEE 4.0
PredictM 4.0
Traceabillty 4.0
ZeDQual 4.0
TLM 4.0
Energy 4.0
Persona Creation
Write User Stories
Prepare Scope Document
Create User Flow
Build Information Architecture
Paper & Digital Prototypes
Usability Testing
Ui Design
Figma
Prottapp Maze.Desgin
Invision Zeplin
Daniel Thomas (2017 - 19)
SRM University (2019 - 22)
Skills
Software Skills
Experience
Phygitalz advisory and solutions (Apr24 - Jly24)
*
*
*
*
*
*
*
*
*
*
*
*
*
*
*
"""

In [3]:
print(x)


Dhanvand Srinivasan
Ux|Ui Designer
Contact
Course
A Creative Ux|Ui Designer In Creating
Intuitive And Visually Appealing User
Experiences.Passionate About Designing
Innovative Solutions. That Enhance User
Engagement And Satisfaction. Seeking A
Challenging Position Where I Can Apply My
Expertise And Contribute To Creating
Exceptional Digital Products.
About Me
9080146466
Jan - May (2023)
Advanced Ux|Ui Designer
dhanvand333@gmail.com
behance.net/dhanvand
linkedin.com/in/dhanvand-srinivasan-65530b275
Education
Hsc
BSC - Cs
UX UI Designer Trainee
61%
First Class
User Research
Oversaw all major Ai plants automation design & icons.
OEE 4.0
PredictM 4.0
Traceabillty 4.0
ZeDQual 4.0
TLM 4.0
Energy 4.0
Persona Creation
Write User Stories
Prepare Scope Document
Create User Flow
Build Information Architecture
Paper & Digital Prototypes
Usability Testing
Ui Design
Figma
Prottapp Maze.Desgin
Invision Zeplin
Daniel Thomas (2017 - 19)
SRM University (2019 - 22)
Skills
Software Skills
Experience
Phyg