# Inspect `columns_to_drop.pickle`

This notebook loads `SWAN/databases/columns_to_drop.pickle` and prints a readable summary of its contents (type, size, and the stored values).

In [7]:
from pathlib import Path
import pickle

# Location of the pickled object, relative to the notebook's working directory.
path = Path("SWAN/databases/columns_to_drop.pickle")

# NOTE: unpickling can execute arbitrary code -- only load files you trust.
obj = pickle.loads(path.read_bytes())

print("Loaded:", path)
print("Type:", type(obj))


Loaded: SWAN/databases/columns_to_drop.pickle
Type: <class 'dict'>


In [9]:
import pprint

# Rich display is optional: start from "unavailable" and override it only
# when IPython can actually be imported.
display = None
try:
    from IPython.display import display
except Exception:
    pass


def summarize(o) -> None:
    """Print a human-readable summary of ``o`` to stdout.

    The summary depends on the kind of object:

    * ``dict`` -- the number of keys, the list of keys, then every value.
    * ``list`` / ``tuple`` / ``set`` / ``frozenset`` -- the item count, the
      items, and (when every item is a string) the number of unique items.
      Sets are shown in sorted order when their items are orderable, so the
      output is stable between runs.
    * table-like objects (anything exposing ``shape`` and ``head``) -- the
      shape, the column names when they can be read, and the first 20 rows.
    * anything else -- pretty-printed as is.

    Args:
        o: The object to describe.

    Returns:
        None. Everything is written to stdout, except the head of a
        table-like object, which goes through the module-level ``display``
        callable when that name is not ``None``.
    """
    if isinstance(o, dict):
        print(f"dict with {len(o)} keys")
        keys = list(o.keys())
        print("First keys:")
        pprint.pprint(keys)
        for k in keys:
            print(f"- {k!r}:")
            pprint.pprint(o[k])
        return

    # No ``else: raise`` here: non-dict inputs must fall through to the
    # branches below instead of being rejected outright.
    if isinstance(o, (list, tuple, set, frozenset)):
        if isinstance(o, (set, frozenset)):
            # Set iteration order is arbitrary; sort when the items allow it.
            try:
                seq = sorted(o)
            except TypeError:
                seq = list(o)
        else:
            seq = list(o)
        print(f"{type(o).__name__} with {len(seq)} items")
        print("First items:")
        pprint.pprint(seq)
        if seq and all(isinstance(x, str) for x in seq):
            print("\nUnique items:", len(set(seq)))
        return

    if hasattr(o, "shape") and hasattr(o, "head"):
        print("table-like object")
        print("Shape:", o.shape)
        # Column listing is best-effort: report a failure rather than hiding it.
        try:
            columns = list(getattr(o, "columns", []))
        except Exception as exc:
            print(f"Columns: <unavailable: {exc!r}>")
        else:
            print("Columns:")
            pprint.pprint(columns)
        head = o.head(20)
        if display is not None:
            display(head)
        else:
            print(head)
        return

    pprint.pprint(o)


# Print a summary of the object unpickled earlier in this notebook.
summarize(obj)


dict with 4 keys
First keys:
['california_schools', 'formula_1', 'european_football_2', 'superhero']
- 'california_schools':
['fprm.`County Name`',
 'fprm.`County Code`',
 'fprm.`Educational Option Type`',
 'fprm.`Charter School (Y/N)`',
 'fprm.`Charter School Number`',
 'fprm.`Charter Funding Type`',
 'satscores.cname',
 'schools.`Country`',
 'schools.`City`',
 'schools.`MailCity`',
 'schools.`Magnet`',
 'schools.`Website`']
- 'formula_1':
['circuits.`country`',
 'circuits.`url`',
 'circuits.`lat`',
 'circuits.`lng`',
 'constructors.`nationality`',
 'constructors.`url`',
 'drivers.`nationality`',
 'drivers.`dob`',
 'drivers.`url`',
 'drivers.`code`',
 'races.date',
 'races.url']
- 'european_football_2':
['league.`country_id`',
 'league.`name`',
 'Country.`name`match.`league_id`',
 'match.`country_id`',
 'match.`home_team_goal`',
 'match.`away_team_goal`',
 'match.`goal`',
 'Team.`team_short_name`',
 'Player.`birthday`',
 'Player.`height`',
 'Player_Attributes.`preferred_foot`']
- 'sup