In [None]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
import sys
import os

# Make the project's src/ directory importable. The path is resolved to an
# absolute one up front so it does not depend on later working-directory
# changes, and the membership check keeps re-running this cell from appending
# the same entry again.
_src_dir = os.path.abspath('../src')
if _src_dir not in sys.path:
    sys.path.append(_src_dir)

from data_processing import get_processed_data
from visualization import *
from analysis import *

# Announce the notebook and the load step before any data is touched.
print("Video Game Success Predictor - Interactive Analysis")
print("Loading data...")

# get_processed_data is imported from the project's data_processing module;
# the rest of this notebook works off the frame it returns.
df = get_processed_data()

# Orientation summary: dimensions, column names, and the span of release years.
column_names = list(df.columns)
release_years = df['Year_of_Release']
print(f"Dataset shape: {df.shape}")
print(f"Columns: {column_names}")
print(f"Time period: {release_years.min()} - {release_years.max()}")

# Last expression of the cell: rendered as the cell's rich output.
df.head()

In [None]:
# Tally the Is_Successful flag. value_counts() only lists values that actually
# occur in the column, so each class is read with .get(..., 0): a dataset (or a
# filtered slice) with no successful or no unsuccessful rows reports 0 instead
# of raising KeyError.
success_count = df['Is_Successful'].value_counts()
successful_games = success_count.get(True, 0)
unsuccessful_games = success_count.get(False, 0)

# The rate is taken over every row of df (same denominator as before); the
# guard avoids dividing by zero on an empty frame.
row_count = len(df)
success_rate_pct = successful_games / row_count * 100 if row_count else 0.0

print("Success Distribution:")
print(f"Successful games (>1M sales): {successful_games:,}")
print(f"Unsuccessful games: {unsuccessful_games:,}")
print(f"Success rate: {success_rate_pct:.1f}%")

# Ten rows with the highest Global_Sales, trimmed to the identifying columns.
top_games = df.nlargest(10, 'Global_Sales')[['Name', 'Platform', 'Genre', 'Publisher', 'Global_Sales']]
print("\nTop 10 Games by Global Sales:")
# Last expression of the cell: rendered as the cell's rich output.
top_games

In [None]:
# Run each plot_* helper on the full frame, in a fixed order, and bind whatever
# it returns to names in the notebook namespace. The helpers arrive via the
# star imports at the top of the notebook; presumably each one also draws its
# figures as a side effect -- confirm against the modules in ../src.

# Genre analysis: three return values.
(
    genre_sales,
    total_sales,
    success_rate,
) = plot_genre_analysis(df)

# Critic analysis: a single return value.
correlation_matrix = plot_critic_analysis(df)

# Publisher analysis: two return values.
(
    publisher_total_sales,
    success_by_company,
) = plot_publisher_analysis(df)

# Platform analysis: two return values.
(
    platform_sales,
    platform_success,
) = plot_platform_analysis(df)

# Regional analysis: a single return value.
region_genre_pref = plot_regional_analysis(df)

# Temporal analysis: four return values.
(
    games_per_year,
    sales_per_year,
    success_per_year,
    critic_per_year,
) = plot_temporal_analysis(df)