In [None]:
# Import pustaka yang dibutuhkan
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
from sklearn.linear_model import LinearRegression

# 1. Read the case data from the CSV file into a DataFrame,
#    then preview its first five rows as the cell output.
df = pd.read_csv(filepath_or_buffer='cases.csv')
df.head(n=5)

In [None]:
# Fit a simple linear regression of new_confirmed on acc_confirmed.
#
# Rows where either column is missing are dropped instead of zero-filled:
# zero is a legitimate value for both columns, so imputing it adds fabricated
# points that bias the slope and intercept. It would also make the statistics
# below disagree with seaborn's regplot, which drops missing rows by default
# before fitting its own line.
reg_data = df[['acc_confirmed', 'new_confirmed']].dropna()
if reg_data.empty:
    # Fail with a clear message rather than an opaque scikit-learn error.
    raise ValueError(
        "No rows have both 'acc_confirmed' and 'new_confirmed' present; "
        "cannot fit the regression."
    )

X = reg_data[['acc_confirmed']]  # 2-D feature matrix (single column)
y = reg_data['new_confirmed']    # 1-D target

model = LinearRegression()
model.fit(X, y)

# R² is computed on the same rows used for fitting (in-sample score).
r2 = model.score(X, y)
coef = model.coef_[0]  # single feature, so a single coefficient
intercept = model.intercept_

print(f"Coef: {coef}")
print(f"Intercept: {intercept}")
print(f"\nRegresi Linier: new_confirmed = {coef:.2f} * acc_confirmed + {intercept:.2f}")
print(f"R² Score: {r2:.4f}")

In [None]:
# Build a three-panel infographic: two distribution plots share the top row
# and the regression scatter spans the whole bottom row.
fig = plt.figure(figsize=(14, 10))
fig.suptitle('Infografis COVID-19 Indonesia\nStatistik & Regresi Linier', fontsize=16, weight='bold')

# Top-left: histogram of new cases (missing values excluded)
ax_hist = fig.add_subplot(2, 2, 1)
new_cases = df['new_confirmed'].dropna()
sns.histplot(new_cases, bins=30, color='#fa8c16', ax=ax_hist)
ax_hist.set_title('Distribusi Kasus Baru (new_confirmed)')

# Top-right: boxplot of new deaths (missing values excluded)
ax_box = fig.add_subplot(2, 2, 2)
new_deaths = df['new_deceased'].dropna()
sns.boxplot(y=new_deaths, color='#ff4d4f', ax=ax_box)
ax_box.set_title('Sebaran Kematian Baru (new_deceased)')

# Bottom row: scatter plot with seaborn's fitted regression line; the title
# reports the statistics computed in the regression cell.
ax_reg = fig.add_subplot(2, 1, 2)
sns.regplot(
    data=df,
    x='acc_confirmed',
    y='new_confirmed',
    scatter_kws={'s': 10},
    line_kws={'color': 'blue'},
    ax=ax_reg,
)
ax_reg.set_title(f'Regresi: new_confirmed vs acc_confirmed\nR² = {r2:.3f}, y = {coef:.2f}x + {intercept:.2f}')
ax_reg.set_xlabel('Total Kasus Terkonfirmasi (acc_confirmed)')
ax_reg.set_ylabel('Kasus Baru Harian (new_confirmed)')

# Keep the top 7% of the figure free so the suptitle does not overlap the panels.
fig.tight_layout(rect=[0, 0, 1, 0.93])
plt.show()