In [1]:
import pandas as pd

# Read the CPI export into a DataFrame (path is relative to the working directory)
df = pd.read_csv(filepath_or_buffer='Resources/CPI_Tech2018-2024.csv')

# Preview the top of the table to see which columns the file provides
print(df.head(n=5))

       Series ID  Year Period     Label   Value
0  CUUR0000SEEEC  2018    M01  2018 Jan  56.343
1  CUUR0000SEEEC  2018    M02  2018 Feb  56.001
2  CUUR0000SEEEC  2018    M03  2018 Mar  55.699
3  CUUR0000SEEEC  2018    M04  2018 Apr  55.804
4  CUUR0000SEEEC  2018    M05  2018 May  55.537


In [2]:
# Convert 'Year' and 'Period' into a proper datetime index.
# 'Period' values look like 'M01', 'M02', ...; dropping the first character
# leaves the zero-padded month number. The vectorized .str accessor does this
# for the whole column at once instead of calling a lambda per row.
df['Month'] = df['Period'].str[1:]

# pd.to_datetime assembles a date from year / month / day columns; DAY=1 pins
# every observation to the first day of its month.
df['Date'] = pd.to_datetime(df[['Year', 'Month']].assign(DAY=1))

# 'Year', 'Period' and 'Label' are now redundant with 'Date'. Drop them and
# index by 'Date' in one chained expression (no inplace mutation).
# 'Month' is intentionally kept here; it is removed in a later step.
df = df.drop(columns=['Year', 'Period', 'Label']).set_index('Date')

# Check the first few rows to verify changes
print(df.head())


                Series ID   Value Month
Date                                   
2018-01-01  CUUR0000SEEEC  56.343    01
2018-02-01  CUUR0000SEEEC  56.001    02
2018-03-01  CUUR0000SEEEC  55.699    03
2018-04-01  CUUR0000SEEEC  55.804    04
2018-05-01  CUUR0000SEEEC  55.537    05


In [3]:
# The 'Date' index already carries year and month, so the 'Month' column is redundant
df = df.drop(labels='Month', axis='columns')

# Preview the leading rows to confirm the final layout
print(df.head(n=5))


                Series ID   Value
Date                             
2018-01-01  CUUR0000SEEEC  56.343
2018-02-01  CUUR0000SEEEC  56.001
2018-03-01  CUUR0000SEEEC  55.699
2018-04-01  CUUR0000SEEEC  55.804
2018-05-01  CUUR0000SEEEC  55.537


In [4]:
# Keep only the rows of the "Information Technology Commodities" series
is_it_commodities = df['Series ID'].eq('CUUR0000SEEEC')
it_commodities_df = df.loc[is_it_commodities]

# Preview the leading rows of the selection
print(it_commodities_df.head(n=5))


                Series ID   Value
Date                             
2018-01-01  CUUR0000SEEEC  56.343
2018-02-01  CUUR0000SEEEC  56.001
2018-03-01  CUUR0000SEEEC  55.699
2018-04-01  CUUR0000SEEEC  55.804
2018-05-01  CUUR0000SEEEC  55.537


In [5]:
import matplotlib.pyplot as plt

# Plot the CPI trend over time
cpi_fig, cpi_ax = plt.subplots(figsize=(10, 6))
cpi_ax.plot(it_commodities_df.index, it_commodities_df['Value'], label='CPI - IT Commodities')
cpi_ax.set_title('CPI Over Time - IT Commodities')
cpi_ax.set_xlabel('Date')
cpi_ax.set_ylabel('CPI Value')
cpi_ax.legend()
plt.show()

# The filtered frame only has 'Series ID' and 'Value'; there is no
# 'Inflation Rate' column, so looking one up raises KeyError. Derive the rate
# here instead, as the percent change of the index versus the value 12 rows
# earlier (year-over-year for monthly data). It is kept as a separate Series
# so the filtered frame is not modified.
# NOTE(review): assumes one row per month with no gaps once sorted by date, and
# that a 12-month (not month-over-month) rate is what is wanted - confirm.
cpi_values = it_commodities_df['Value'].sort_index()
inflation_rate = (cpi_values / cpi_values.shift(12) - 1) * 100  # first 12 rows are NaN

# Plot the inflation rate over time (NaN points are simply not drawn)
rate_fig, rate_ax = plt.subplots(figsize=(10, 6))
rate_ax.plot(inflation_rate.index, inflation_rate, label='Inflation Rate - IT Commodities', color='orange')
rate_ax.set_title('Inflation Rate Over Time - IT Commodities')
rate_ax.set_xlabel('Date')
rate_ax.set_ylabel('Inflation Rate (%)')
rate_ax.legend()
plt.show()


ImportError: DLL load failed while importing _multiarray_umath: The specified module could not be found.

ImportError: numpy.core.multiarray failed to import