Task 2: Explore the geographical distribution of software engineering job opportunities.

In [None]:
import pandas as pd
import matplotlib.pyplot as plt

In [None]:
# Load the job listings and the postings tables.
# Forward slashes are used as the path separator: they work on Windows, Linux
# and macOS alike, whereas a backslash inside a normal string literal
# (e.g. "\j", "\p") is an invalid escape sequence and only resolves on Windows.
jobs_df = pd.read_csv('data/jobs.csv')
postings_df = pd.read_csv('data/postings.csv')

# Keep only the rows whose 'Job function' mentions software engineering
# (case-insensitive, plain substring match).
# na=False treats rows with a missing 'Job function' as non-matching; without
# it the mask contains NaN and boolean indexing raises an error.
is_software_engineering = jobs_df['Job function'].str.contains(
    'Software Engineering', case=False, na=False, regex=False
)
software_engineering_jobs = jobs_df[is_software_engineering]

# Left-join the postings onto the software engineering jobs by company name,
# so every selected job row is kept even when no posting matches.
# NOTE(review): if a company appears several times in postings.csv, each of its
# job rows is repeated once per posting, which inflates the counts below --
# confirm this is the intended join key.
merged_df = pd.merge(software_engineering_jobs, postings_df, how='left', left_on='company', right_on='company')

# Number of rows (job opportunities) per distinct location
location_distribution = merged_df['location'].value_counts()

# Per country: median wage and number of rows with a non-missing location
country_stats = merged_df.groupby('country').agg({'wage': 'median', 'location': 'count'})

# Illustration: two bar charts side by side on one 12x6 figure
fig, axes = plt.subplots(1, 2, figsize=(12, 6))

# One entry per panel: (column in country_stats, bar colour, title, y-axis label)
panels = [
    ('wage', 'skyblue', 'Median Wage by Country', 'Median Wage'),
    ('location', 'salmon', 'Job Vacancies by Country', 'Job Vacancies'),
]

for ax, (column, colour, title, y_label) in zip(axes, panels):
    country_stats[column].plot(kind='bar', color=colour, ax=ax)
    ax.set_title(title)
    ax.set_ylabel(y_label)
    ax.set_xlabel('Country')

# Avoid overlapping labels between the two panels, then render the figure
fig.tight_layout()
plt.show()

# Text summary: number of job opportunities per location
print(location_distribution)