# PowerBI Export
Exports the PowerBI-ready CSVs to the project's `dashboards/` folder on Drive and writes the project `README.md` to the project root.
Requires `gtd_cleaned.csv` to exist in `data/`.

In [None]:
import pandas as pd
import os

# Project root; every input and output path below is built from it.
# NOTE(review): the path looks like a Colab-mounted Google Drive — confirm
# the drive is mounted before running this cell.
base_path = '/content/drive/MyDrive/LABS/Project-1-GTD-Analytics'

# Load the cleaned dataset and report its (rows, columns) shape.
cleaned_csv = f'{base_path}/data/gtd_cleaned.csv'
df_clean = pd.read_csv(cleaned_csv)
print('Loaded cleaned data:', df_clean.shape)

In [None]:
# FINAL POWERBI EXPORT
# Create the output folder up front: to_csv does not create missing
# directories and would fail on a fresh project tree.
dashboards_dir = f'{base_path}/dashboards'
os.makedirs(dashboards_dir, exist_ok=True)

# Full cleaned dataset, written without the pandas index column.
df_clean.to_csv(f'{dashboards_dir}/gtd_powerbi.csv', index=False)

# PowerBI-ready summary table: one row per (region, attack type) pair with
# the count of event ids plus the summed casualties and fatalities.
powerbi_summary = df_clean.groupby(['region_txt', 'attacktype1_txt']).agg({
    'eventid': 'count',
    'casualties': 'sum',
    'nkill': 'sum'
}).round(2).reset_index()
# Rename to presentation-friendly headers; order matches the groupby keys
# followed by the aggregated columns above.
powerbi_summary.columns = ['Region', 'Attack_Type', 'Attack_Count', 'Total_Casualties', 'Fatalities']
powerbi_summary.to_csv(f'{dashboards_dir}/gtd_powerbi_summary.csv', index=False)

# CREATE README
# A triple-quoted f-string is required here: a single-quoted literal cannot
# span multiple lines. The text keeps its leading and trailing newline.
# NOTE(review): the "1970-2020" range is hard-coded text, not derived from
# the data — confirm it matches the dataset.
readme_content = f"""
GTD TERRORISM ANALYTICS PIPELINE - COMPLETE
=========================================
Processed: {len(df_clean):,} attacks (1970-2020)
Severity: {df_clean['severity'].value_counts().to_dict()}

POWERBI FILES (Drag to PowerBI Desktop):
├── gtd_powerbi.csv              (Main dataset)
├── gtd_powerbi_summary.csv      (Aggregated KPIs)
├── gtd_analytics.db             (3 SQLite tables)
├── master_dashboard.html        (Interactive charts)
├── feature_importance.png       (ML insights)
└── severity_chart.html          (Distribution)

POWERBI DASHBOARD SETUP (5 minutes):
1. Get Data → Text/CSV → gtd_powerbi.csv
2. Get Data → Database → SQLite → gtd_analytics.db
3. Create visuals: line/year, map (lat/lon), bars, pies, cards

ML MODEL: Random Forest (saved: gtd_model.pkl)
"""
# Explicit UTF-8: the text contains box-drawing characters and arrows that
# a non-UTF-8 platform default encoding could not write.
with open(f'{base_path}/README.md', 'w', encoding='utf-8') as f:
    f.write(readme_content)

print("PROJECT EXPORT COMPLETE!")
print(f"All files in: {base_path}/dashboards")
print('\nPOWERBI READY FILES:')
print('   - gtd_powerbi.csv (Main)')
print('   - gtd_analytics.db (Database)')
print('   - feature_importance.png (ML)')
print('   - master_dashboard.html (Charts)')