In [1]:
# Resume_Analysis.ipynb

import pandas as pd
import matplotlib.pyplot as plt
from wordcloud import WordCloud
import os

# Load all resume data from /output
folder = 'output'

# os.listdir() returns entries in arbitrary order; sorting makes the row order
# of the combined frame identical on every Restart & Run All.
csv_files = sorted(name for name in os.listdir(folder) if name.endswith('.csv'))
if not csv_files:
    # Without this guard pd.concat([]) fails with an opaque
    # "No objects to concatenate" error that hides the real cause.
    raise FileNotFoundError(f"No .csv files found in '{folder}'")

# Read every CSV and tag its rows with the file they came from.
dfs = [
    pd.read_csv(os.path.join(folder, name)).assign(Source=name)
    for name in csv_files
]

# Combine all resumes
data = pd.concat(dfs, ignore_index=True)
print("Combined Resume Data:")
print(f"{len(data)} rows from {len(csv_files)} file(s)")
# Show a preview only: dumping the whole frame bloats the notebook and puts
# every resume row into the saved output.
display(data.head())

def _split_listed_values(frame: pd.DataFrame, column: str) -> pd.Series:
    """Return one cleaned entry per comma-separated item in ``frame[column]``.

    Missing cells are dropped, each remaining cell is split on ',', and every
    item is stripped of surrounding whitespace. Items that are empty after
    stripping (e.g. from "A, ,B" or a trailing comma) are discarded so they
    are not counted as a real value.

    Raises:
        KeyError: if ``column`` is not present in ``frame``.
    """
    # astype(str) keeps the .str accessor usable even when the column holds no
    # strings at all (an all-NaN column is not string-typed).
    items = frame[column].dropna().astype(str).str.split(',').explode().str.strip()
    return items[items != '']


def _plot_top_counts(counts: pd.Series, title: str, top_n: int = 10, **bar_kwargs):
    """Draw a bar chart of the first ``top_n`` entries of ``counts``.

    ``counts`` is plotted in the order given (``value_counts()`` output is
    already sorted by frequency). Extra keyword arguments are forwarded to
    ``Series.plot``. Returns the Axes, or ``None`` when there is nothing to
    plot.
    """
    top = counts.head(top_n)
    if top.empty:
        # Nothing to chart; report it instead of attempting to draw zero bars.
        print(f"{title}: no data to plot")
        return None

    fig, ax = plt.subplots(figsize=(10, 5))
    top.plot(kind='bar', ax=ax, rot=45, **bar_kwargs)
    ax.set_title(title)
    ax.set_ylabel("Frequency")
    fig.tight_layout()
    plt.show()
    return ax


# 🔍 Analyze common organizations
orgs = _split_listed_values(data, 'Organizations')
org_counts = orgs.value_counts()
_plot_top_counts(org_counts, "Top Organizations Mentioned in Resumes")

# 🌍 Analyze common locations
locs = _split_listed_values(data, 'Locations')
loc_counts = locs.value_counts()
_plot_top_counts(loc_counts, "Top Locations Mentioned", color='green')

# ☁️ Word Cloud for Names (just for visual fun)
# NOTE(review): names are likely personal data — consider clearing this output
# before sharing the notebook.
# astype(str) guards against non-string cells, which would make join() raise.
names_text = ' '.join(data['Name'].dropna().astype(str))

if names_text.strip():
    # A fixed random_state makes the word layout reproducible across runs.
    wordcloud = WordCloud(
        width=800,
        height=400,
        background_color='white',
        random_state=42,
    ).generate(names_text)

    plt.figure(figsize=(10, 5))
    plt.imshow(wordcloud, interpolation='bilinear')
    plt.axis("off")
    plt.title("Word Cloud of Names")
    plt.show()
else:
    # WordCloud.generate() raises ValueError when the text contains no words.
    print("No names available; skipping word cloud.")


ModuleNotFoundError: No module named 'pandas'