In [1]:
import pandas as pd
import zipfile

# --- CONFIGURE THIS ---
# Path to the zip archive whose first CSV member will be inspected.
ZIP_FILE_PATH = "data/raw/wbat.zip"

# --- RUN THE TEST ---
# Diagnostic: print the column names of the first CSV found inside the archive
# in several representations, so that unexpected characters in a header name
# become visible.
print(f"--- Inspecting headers in: {ZIP_FILE_PATH} ---")

with zipfile.ZipFile(ZIP_FILE_PATH, "r") as zip_ref:
    for internal_filepath in zip_ref.namelist():
        # Skip every archive member that is not a CSV (case-insensitive).
        if not internal_filepath.lower().endswith('.csv'):
            continue

        print(f"\n--- Reading internal file: {internal_filepath} ---")
        # Only the parse needs the open handle; release it right afterwards.
        with zip_ref.open(internal_filepath) as internal_file:
            df = pd.read_csv(internal_file, nrows=10)  # Read a few rows

        print(f"df.columns: {list(df.columns)}")

        # The critical test: show the raw representation of the columns.
        print(f"Raw repr(df.columns): {df.columns!r}")

        # Find every column whose name contains 'SALE' and inspect it.
        for col in df.columns:
            if 'SALE' in col.upper():
                print(f"\nInspecting column '{col}':")
                # Pair each character with its Unicode code point.
                char_analysis = [(char, ord(char)) for char in col]
                print(f"Character Analysis (char, unicode_point): {char_analysis}")

        break  # Stop after the first CSV
    else:
        # Reached only when the loop never hit `break`, i.e. the archive
        # contains no member ending in '.csv'. Say so instead of exiting
        # silently after the banner.
        print("\n--- No CSV file found inside the archive ---")

--- Inspecting headers in: data/raw/wbat.zip ---

--- Reading internal file: wbat.csv ---
df.columns: ['UPC', 'STORE', 'WEEK', 'MOVE', 'QTY', 'PRICE', 'SALE', 'PROFIT', 'OK', 'PRICE_HEX', 'PROFIT_HEX']
Raw repr(df.columns): Index(['UPC', 'STORE', 'WEEK', 'MOVE', 'QTY', 'PRICE', 'SALE', 'PROFIT', 'OK',
       'PRICE_HEX', 'PROFIT_HEX'],
      dtype='object')

Inspecting column 'SALE':
Character Analysis (char, unicode_point): [('S', 83), ('A', 65), ('L', 76), ('E', 69)]
