<a href="https://colab.research.google.com/github/cbonnin88/starfield_industries/blob/main/hire_date_analysis.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [3]:
import polars as pl
import plotly.express as px
import gdown as gd

In [4]:
# Download the HR CSV from Google Drive into the working directory,
# then load it into a polars DataFrame.
url = 'https://drive.google.com/uc?id=1pAE3Knjo4JSSY4vVi8DwBFkIEU6vlRDT'
gd.download(url=url, output='starfield_HR.csv', quiet=True)

df_starfield = pl.read_csv(source='starfield_HR.csv')

In [5]:
# List the column names to see which fields the dataset provides.
df_starfield.columns

['ID',
 'Name',
 'Surname',
 'Age',
 'Tenure',
 'Hire Date',
 'Gender',
 'Region',
 'Job Title',
 'Department',
 'Manager',
 'Hours',
 'Salary Band',
 'Salary',
 'Performance',
 'Satisfaction']

In [6]:
# Parse the string "Hire Date" column into a datetime column (no explicit
# format is passed). The result is stored under a new name so the raw frame
# stays untouched and this cell can be re-run safely.
df_starfield_new = df_starfield.with_columns(
    pl.col("Hire Date").str.to_datetime().alias("Hire Date")
)

In [7]:
# Inspect the dtypes to confirm "Hire Date" is now a Datetime column.
df_starfield_new.dtypes

[Int64,
 String,
 String,
 Int64,
 Int64,
 Datetime(time_unit='us', time_zone=None),
 String,
 String,
 String,
 String,
 String,
 Int64,
 String,
 Int64,
 String,
 Float64]

In [8]:
# Preview the first five rows of the parsed frame.
df_starfield_new.head(n=5)

ID,Name,Surname,Age,Tenure,Hire Date,Gender,Region,Job Title,Department,Manager,Hours,Salary Band,Salary,Performance,Satisfaction
i64,str,str,i64,i64,datetime[μs],str,str,str,str,str,i64,str,i64,str,f64
4045,"""Gwendolyn""","""Turner""",18,0,2025-05-07 00:00:00,"""Female""","""ile-de-France""","""Automation Engineer""","""Engineering""","""no""",8,"""T5""",13600,"""Average""",3.0
5780,"""Jason""","""Peterson""",20,1,2024-09-01 00:00:00,"""Male""","""ile-de-France""","""Release Engineer""","""Engineering""","""no""",8,"""T5""",14688,"""Average""",5.0
9231,"""Max""","""Hopkins""",19,1,2024-02-03 00:00:00,"""Male""","""ile-de-France""","""Support Engineer""","""Engineering""","""no""",8,"""T5""",14786,"""Average""",3.0
11163,"""Vanesa""","""Saldaña""",18,0,2025-06-17 00:00:00,"""Male""","""ile-de-France""","""Quantum Engineer""","""Engineering""","""no""",8,"""T5""",15439,"""Average""",0.0
7851,"""Amador""","""Roybal""",54,2,2023-02-11 00:00:00,"""Male""","""ile-de-France""","""Financial Planning & Analysis …","""Finance""","""no""",8,"""T5""",22427,"""Average""",5.0


# **Employees Hired per Year**

In [11]:
# Hires per calendar year: group on the year extracted from "Hire Date",
# count the rows in each group, and order the result chronologically.
hiring_trends = (
    df_starfield_new
    .group_by(pl.col('Hire Date').dt.year().alias('hiring_year'))
    .agg(employees_hired=pl.len())
    .sort('hiring_year')
)

In [12]:
# Bar chart of the yearly hire counts; `labels` maps the raw column names
# to human-readable axis titles.
fig = px.bar(
    data_frame=hiring_trends,
    x='hiring_year',
    y='employees_hired',
    labels=dict(
        hiring_year='Hiring Year',
        employees_hired='Number of Employees Hired',
    ),
    color_discrete_sequence=px.colors.qualitative.Pastel,
    title='Employees Hired Per Year',
)

fig.show()