In [None]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
%matplotlib inline 
# This line ensures plots are displayed directly in the notebook

In [None]:
# Load the Brent oil price CSV into `df`, on Google Colab or on a local machine.
try:
    # google.colab can only be imported inside a Colab runtime; anywhere else
    # this import raises ImportError, which selects the local branch below.
    from google.colab import drive
except ImportError:
    # Local run: a path relative to the working directory is enough.
    file_path = 'data/raw/BrentOilPrices.csv'
else:
    # Colab run: make Google Drive visible under /content/drive.
    drive.mount('/content/drive')

    # Files stored in "My Drive" appear beneath <mount point>/MyDrive.
    # NOTE(review): the folder layout inside Drive is an assumption; adjust
    # the part after MyDrive/ to wherever the CSV actually lives.
    file_path = '/content/drive/MyDrive/data/raw/BrentOilPrices.csv'

df = pd.read_csv(file_path)

In [None]:
# Preview the first 5 rows to see what the data looks like.
print(df.head())

# Summarise the dataframe: column dtypes and non-null counts.
# DataFrame.info() writes its report to stdout itself and returns None, so it
# is called directly; wrapping it in print() would append a stray "None" line.
df.info()

In [None]:
# Parse the 'Date' column and promote it to the DataFrame index.
# The guard keeps this cell safe to re-run: once 'Date' has become the index
# it is no longer a column, and an unguarded df['Date'] lookup would raise
# KeyError on the second execution.
if 'Date' in df.columns:
    # The explicit format expects values such as 20-May-87. Any row written
    # differently makes to_datetime raise ValueError (errors='raise' is the
    # default), so a failure here means the file mixes date formats.
    df['Date'] = pd.to_datetime(df['Date'], format='%d-%b-%y')

    # Use the parsed dates as the DataFrame index.
    df = df.set_index('Date')

# Check the data types again to confirm the change. info() prints its own
# report and returns None, so it is not wrapped in print().
df.info()

In [None]:
# Count the missing entries in each column and show the totals.
missing_per_column = df.isna().sum()
print(missing_per_column)

# How to treat gaps depends on how many there are. A small number can be
# filled from the previous row (ffill) or from the following row (bfill).
# df.ffill(inplace=True)

In [None]:
# Line chart of the 'Price' column against the DataFrame index,
# drawn on a 15 x 7 inch figure with a background grid.
fig, ax = plt.subplots(figsize=(15, 7))
ax.plot(df['Price'])
ax.set_title('Brent Oil Prices Over Time')
ax.set_xlabel('Date')
ax.set_ylabel('Price (USD)')
ax.grid(True)
plt.show()

In [None]:
# Log return of each row: natural log of the price divided by the price in
# the preceding row. The first row has no predecessor, so its value is NaN.
prices = df['Price']
df['Log_Returns'] = np.log(prices / prices.shift(1))

# Plot the resulting series on a 15 x 7 inch figure with a background grid.
fig, ax = plt.subplots(figsize=(15, 7))
ax.plot(df['Log_Returns'])
ax.set_title('Daily Log Returns of Brent Oil Prices')
ax.set_xlabel('Date')
ax.set_ylabel('Log Return')
ax.grid(True)
plt.show()