# 00 — Quick Start

This notebook verifies that the project environment is set up correctly.

## How to run

```bash
# From the project root:
python -m venv .venv
source .venv/bin/activate          # Linux/macOS
# .venv\Scripts\activate            # Windows PowerShell
pip install --upgrade pip
pip install -r requirements.txt
python -m pytest tests/ -v
```

Or run everything at once:
```bash
bash run_env_check.sh
```

In [None]:
# Cell 1 — Print installed package versions
#
# Each package is actually imported (not just looked up in metadata), so this
# cell also confirms that the package loads in the current kernel.
import importlib
import sys

print(f"Python {sys.version}\n")

# Importable module names (note: "sklearn", not the "scikit-learn" dist name).
packages = [
    "pandas", "numpy", "sklearn", "xgboost", "lightgbm",
    "matplotlib", "seaborn", "plotly", "shap", "joblib",
    "pyarrow", "fastparquet", "tensorflow", "mlflow",
]


def describe_package(pkg):
    """Return a short status string for the importable module name ``pkg``.

    Returns:
        * the module's ``__version__`` when the import succeeds and the
          attribute exists,
        * ``"installed (no __version__)"`` when the import succeeds but the
          module exposes no ``__version__``,
        * ``"*** NOT INSTALLED ***"`` when the import raises ``ImportError``,
        * ``"*** IMPORT FAILED (<ExcType>: <message>) ***"`` when the import
          raises any other exception.
    """
    try:
        mod = importlib.import_module(pkg)
    except ImportError:
        return "*** NOT INSTALLED ***"
    except Exception as exc:
        # A broken install can raise something other than ImportError while
        # the module body executes. Report it and let the caller continue, so
        # one bad package does not hide the status of the remaining ones.
        return f"*** IMPORT FAILED ({type(exc).__name__}: {exc}) ***"
    return getattr(mod, "__version__", "installed (no __version__)")


for pkg in packages:
    print(f"  {pkg:20s} {describe_package(pkg)}")

In [None]:
# Cell 2 — Run the skeleton tests from inside the notebook
#
# pytest is launched with the kernel's own interpreter (sys.executable) so the
# tests run against the same environment the notebook is using.
import subprocess
import sys
from pathlib import Path

# Test file path, relative to the project root.
SKELETON_TEST = "tests/test_skeleton.py"


def find_project_root(test_path, start=None):
    """Return the directory from which ``test_path`` can be resolved.

    Checks ``start`` (default: the current working directory) and then its
    parent, so the cell works whether the kernel was started in the project
    root or in a direct sub-directory of it.

    Args:
        test_path: Path of the test file relative to the project root.
        start: Directory to search from; defaults to ``Path.cwd()``.

    Returns:
        The first of ``start`` / ``start.parent`` (both resolved) that
        contains ``test_path``. If neither does, the resolved ``start`` is
        returned so pytest itself reports the missing file.
    """
    start = (Path.cwd() if start is None else Path(start)).resolve()
    for candidate in (start, start.parent):
        if (candidate / test_path).exists():
            return candidate
    return start


result = subprocess.run(
    [sys.executable, "-m", "pytest", SKELETON_TEST, "-v", "--tb=short"],
    capture_output=True, text=True,
    # Run from the project root so the relative test path resolves.
    cwd=find_project_root(SKELETON_TEST),
)
print(result.stdout)
# stderr is only shown on failure to keep a passing run's output short.
if result.returncode != 0:
    print(result.stderr)

In [None]:
# Cell 3 — Quick peek at available data files
#
# Lists every *.csv directly inside the data directory with its size in MB.
from pathlib import Path

# Prefer the parent's data/ folder when it exists; otherwise fall back to a
# data/ folder in the current working directory.
data_dir = Path("data")
parent_data_dir = Path("../data")
if parent_data_dir.exists():
    data_dir = parent_data_dir

# Sorted so the listing order is stable between runs.
csv_files = list(data_dir.glob("*.csv"))
csv_files.sort()

print(f"Found {len(csv_files)} CSV file(s) in {data_dir.resolve()}:\n")

BYTES_PER_MB = 1024 * 1024
for csv_path in csv_files:
    size_mb = csv_path.stat().st_size / BYTES_PER_MB
    print(f"  {csv_path.name:45s}  {size_mb:8.2f} MB")