In [1]:
import pandas as pd
import numpy as np

# Sanity-check cell: load the processed parquet file and print a quick report
# on the table as a whole and on its POI columns (summary stats + NaN counts).
output_file = 'data/processed/parking_predictions_with_pois.parquet'

try:
    df = pd.read_parquet(output_file)

    # Overview of the whole table.
    print("--- DataFrame Info ---")
    df.info()
    print("\n--- DataFrame Head ---")
    print(df.head())

    # POI columns are recognised purely by name: a 'poi_' prefix and a
    # trailing 'm' (presumably a distance suffix such as '500m' -- confirm
    # against the producing pipeline and adjust if the convention differs).
    poi_cols = [
        name for name in df.columns
        if name.startswith('poi_') and name.endswith('m')
    ]

    if not poi_cols:
        print("\n--- No POI columns (matching 'poi_*_...m') found! ---")
    else:
        print(f"\n--- Found {len(poi_cols)} POI columns: ---")
        print(poi_cols)

        print("\n--- POI Columns Describe ---")
        # Cast to float before describe() so numeric statistics are reported
        # even when NaNs are present; if the bulk cast fails, retry one
        # column at a time so a single bad column does not hide the rest.
        try:
            poi_as_float = df[poi_cols].astype(float)
            print(poi_as_float.describe())
        except Exception as bulk_error:
            print(f"Could not describe POI columns directly, attempting column by column. Error: {bulk_error}")
            for col in poi_cols:
                try:
                    print(f"\nDescribing column: {col}")
                    column_as_float = df[col].astype(float)
                    print(column_as_float.describe())
                except Exception as column_error:
                    print(f"Could not describe column {col}: {column_error}")

        print("\n--- POI Columns NaN Counts ---")
        missing_per_column = df[poi_cols].isnull().sum()
        print(missing_per_column)

except FileNotFoundError:
    # Reported separately so a wrong path is obvious at a glance.
    print(f"ERROR: Output file not found at {output_file}")
except Exception as report_error:
    # Top-level boundary of the cell: report any other failure, do not raise.
    print(f"An error occurred: {report_error}")


ERROR: Output file not found at data/processed/parking_predictions_with_pois.parquet
