# 04 - Mobile Optimization

Optimize models for mobile deployment:
- Quantization (dynamic, static, QAT)
- CoreML / TFLite export
- Benchmark inference latency
- Verify mobile readiness constraints

In [None]:
import torch
from src.models import build_model
from src.utils.config import load_config
from src.mobile.quantize import quantize_dynamic, compare_model_sizes
from src.mobile.benchmark import benchmark_pytorch, check_mobile_readiness

# Load the tiny-model configuration and build the model from its `model` section.
config = load_config('configs/model_tiny.yaml')
model = build_model(config.model)

# Print every entry of the size comparison, one "label: value" line each.
# NOTE(review): presumably keyed by model variant (e.g. original vs. quantized)
# — confirm against src.mobile.quantize.compare_model_sizes.
sizes = compare_model_sizes(model)
for label, size in sizes.items():
    print(f'{label}: {size}')

In [None]:
# Benchmark: run the PyTorch benchmark with num_runs=200 and print each
# reported metric to three decimal places.
# NOTE(review): assumes every value in the result is numeric — the `.3f`
# format spec would raise on anything else.
bench = benchmark_pytorch(model, num_runs=200)
for metric, value in bench.items():
    print(f'{metric}: {value:.3f}')

In [None]:
# Mobile readiness check: evaluate the model against the size and latency
# limits below. Kept as the cell's last expression so the notebook displays
# whatever the checker returns.
check_mobile_readiness(
    model,
    max_size_mb=5.0,      # size limit (MB, per the parameter name)
    max_latency_ms=10.0,  # latency limit (ms, per the parameter name)
)