# 📈 Coca-Cola Stock Analysis

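Exploratory analysis of historical Coca-Cola (KO) stock data — price trends, daily returns, moving averages, and yearly summaries — to surface insights that can inform strategy.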

In [None]:

import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# Read the raw price history and parse the 'date' column into timezone-aware
# UTC timestamps in a single chained step.
df = pd.read_csv("Coca-Cola Project.csv").assign(
    date=lambda frame: pd.to_datetime(frame["date"], utc=True)
)


In [None]:

# Derive calendar fields, day-over-day returns and moving averages from the
# parsed 'date' and 'close' columns. New columns are appended in the order
# listed below.
df = df.assign(
    # Calendar components of each timestamp.
    year=lambda frame: frame["date"].dt.year,
    month=lambda frame: frame["date"].dt.month,
    day=lambda frame: frame["date"].dt.day,
    day_of_week=lambda frame: frame["date"].dt.day_name(),
    # Fractional change in close versus the previous row (first row is NaN).
    daily_return=lambda frame: frame["close"].pct_change(),
    # Trailing moving averages over 30 and 90 rows; rows without a full
    # window are NaN.
    ma_30=lambda frame: frame["close"].rolling(window=30).mean(),
    ma_90=lambda frame: frame["close"].rolling(window=90).mean(),
)


In [None]:

# Pairwise Pearson correlation between every numeric column currently in df;
# non-numeric columns are skipped.
correlation_matrix = df.corr(method="pearson", numeric_only=True)
correlation_matrix


In [None]:

# Apply the seaborn grid theme; it stays in effect for later figures too.
sns.set(style="whitegrid")

# Figure 1: closing price as a time series.
plt.figure(figsize=(14, 6))
price_ax = sns.lineplot(x='date', y='close', data=df)
price_ax.set(
    title='Coca-Cola Stock Closing Price Over Time',
    xlabel='Date',
    ylabel='Closing Price',
)
plt.tight_layout()
plt.show()

# Figure 2: histogram (100 bins) of daily returns with a KDE overlay.
# Missing returns are dropped before plotting.
plt.figure(figsize=(10, 5))
valid_returns = df['daily_return'].dropna()
returns_ax = sns.histplot(valid_returns, bins=100, kde=True)
returns_ax.set(
    title='Distribution of Daily Returns',
    xlabel='Daily Return',
    ylabel='Frequency',
)
plt.tight_layout()
plt.show()

# Figure 3: annotated heatmap of the previously computed correlation matrix,
# with each cell labelled to two decimal places.
plt.figure(figsize=(10, 6))
heatmap_ax = sns.heatmap(
    correlation_matrix,
    annot=True,
    fmt=".2f",
    cmap='coolwarm',
)
heatmap_ax.set_title('Correlation Matrix of Stock Metrics')
plt.tight_layout()
plt.show()


In [None]:

# Per-year mean, maximum and minimum of the price and volume columns.
# The result has one row per year and (column, statistic) MultiIndex columns.
annual_summary = (
    df.groupby('year')[['open', 'high', 'low', 'close', 'volume']]
    .agg(['mean', 'max', 'min'])
)

# Show the five most recent years in the summary.
annual_summary.tail(5)


In [None]:

def _compound_return(periodic_returns):
    """Return the compounded return of a series of periodic returns.

    Computes prod(1 + r) - 1, skipping NaN entries. ``min_count=1`` makes the
    result NaN (rather than a spurious 0.0) when there is no valid return.
    """
    return (1 + periodic_returns).prod(min_count=1) - 1


# Realized return for each calendar year, compounded from the daily returns.
# The mean of daily returns is an average *daily* figure, not an annual
# return, so it must not be stored under an "annual return" name.
# NOTE(review): years only partially covered by the data yield partial-year
# returns -- confirm whether the first/last year should be excluded.
returns_by_year = df.groupby('year')['daily_return']

# Broadcast each year's compounded return onto every row of that year.
df['annual_return'] = returns_by_year.transform(_compound_return)

# One value per year, ranked from best to worst year.
annual_returns = returns_by_year.agg(_compound_return).sort_values(ascending=False)

# Five largest single-day gains and five largest single-day losses.
top_gains = df.sort_values(by='daily_return', ascending=False).head(5)
top_losses = df.sort_values(by='daily_return').head(5)

annual_returns.head(), top_gains[['date', 'daily_return']], top_losses[['date', 'daily_return']]
