In [None]:
import pandas as pd
import sqlite3
import matplotlib.pyplot as plt
import seaborn as sns

# Connect to the SQLite database.
DATABASE_NAME = "../anime.db"  # Relative path from the notebooks folder
conn = sqlite3.connect(DATABASE_NAME)

# Load the whole `anime` table into a pandas DataFrame. The try/finally
# guarantees the connection is closed even when the query raises (for
# example if the table does not exist), instead of leaking the handle.
try:
    df = pd.read_sql_query("SELECT * FROM anime", conn)
finally:
    conn.close()

# --- Exploration 1: Top 10 Anime by Score ---
# Keep the ten rows with the highest `score`, ordered from highest to lowest.
top_10_scored = df.nlargest(n=10, columns='score')

# Horizontal bar chart of score by title, drawn on an explicitly created axes.
# NOTE(review): recent seaborn releases warn when `palette` is passed without
# `hue` — confirm against the installed seaborn version.
score_fig, score_ax = plt.subplots(figsize=(10, 6))
sns.barplot(
    data=top_10_scored,
    x='score',
    y='title',
    palette='viridis',
    ax=score_ax,
)
score_ax.set_title('Top 10 Anime by Score')
score_ax.set_xlabel('Score')
score_ax.set_ylabel('Anime Title')
plt.show()


# --- Exploration 2: Most Prolific Studios ---
# The `studio` column may hold several studios in one comma-separated string,
# so split each value into one row per studio before counting. Splitting on a
# bare ',' and stripping afterwards handles both "A, B" and "A,B".
studios = df['studio'].str.split(',').explode().str.strip()
# Drop blank fragments (empty strings, stray trailing commas) so they cannot
# show up as a nameless studio. Missing values are removed here too; they
# would be ignored by value_counts() anyway.
studios = studios[studios.str.len() > 0]
# Count productions per studio and keep the ten most frequent.
top_10_studios = studios.value_counts().nlargest(10)

# Horizontal bar chart: studio names on the y-axis, production counts on x.
plt.figure(figsize=(10, 6))
sns.barplot(x=top_10_studios.values, y=top_10_studios.index, palette='mako')
plt.title('Top 10 Studios by Number of Productions (in Top 100)')
plt.xlabel('Number of Productions')
plt.ylabel('Studio')
plt.show()