# Train ViT-Base on Colab

This notebook is designed to run the VLM-arch training pipeline on Google Colab's GPU runtime.

In [None]:
# 1. Setup Environment
import os
import shutil

# FORCE CLEANUP: Remove existing repo to ensure fresh clone
if os.path.exists('VLM-arch'):
    shutil.rmtree('VLM-arch')

# Clone the repository
!git clone https://github.com/cronenberg64/VLM-arch.git
%cd VLM-arch

# Install dependencies
!pip install -r requirements.txt
!pip install hydra-core omegaconf wandb timm

# VERIFICATION: Check if the fix is present
print("\n--- Verifying src/data/transforms.py ---")
!cat src/data/transforms.py
print("\n----------------------------------------")

In [None]:
# 2. Verify GPU
# Runs the `nvidia-smi` command in a shell and shows its output in the cell.
# If the command is missing or reports no device, the runtime most likely has
# no GPU attached (in Colab: Runtime > Change runtime type) -- fix that before
# starting training.
!nvidia-smi

In [None]:
# 3. Run Training (ViT-Base)
# Launches scripts/train.py with key=value overrides on the command line.
# The script path is relative, so the setup cell must have run first (it ends
# with `%cd VLM-arch`).
# Note: We resize images to 224x224 for ViT (dataset.image_size=224).
# NOTE(review): the overrides look like Hydra syntax (the setup cell installs
# hydra-core/omegaconf) -- confirm against scripts/train.py.
# NOTE(review): debug=true is passed together with training.epochs=100; check
# what the debug flag changes before relying on this as a full-length run.
!python scripts/train.py \
    model=vit_base \
    dataset=cifar10 \
    dataset.subset=5000 \
    dataset.image_size=224 \
    training.epochs=100 \
    training.lr=0.0001 \
    training.batch_size=128 \
    debug=true

In [None]:
# 4. (Optional) Zip and Download Results
# Packs the results/ directory (relative to the current working directory)
# into results.zip and sends it to the browser via Colab's download helper.
import os
import shutil

# Colab-only helper; imported here so the rest of the notebook does not depend on it.
from google.colab import files

# Fail early with a clear message instead of an indirect "file not found" from
# the download step when there is nothing to archive.
if not os.path.isdir('results'):
    raise FileNotFoundError(
        "No 'results/' directory found in " + os.getcwd() + "; run the training cell first."
    )

# make_archive rewrites results.zip from scratch. `zip -r` on an existing
# archive only adds/updates entries, so files removed from results/ since an
# earlier run of this cell would otherwise linger in the download.
shutil.make_archive('results', 'zip', root_dir='.', base_dir='results')
files.download('results.zip')