# Implementation: Mock INT8 Quantization

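**Goal**: Compress 32-bit floating-point (FP32) weights into 8-bit integers (INT8) using a single scale factor, then reconstruct them to measure how much precision is lost.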

In [None]:
import torch

# Largest magnitude used for symmetric signed 8-bit quantization. Values are
# clamped to [-INT8_MAX, INT8_MAX] so the range is symmetric about zero.
INT8_MAX = 127


def quantize_int8(weights: torch.Tensor):
    """Quantize a float tensor to int8 with one symmetric per-tensor scale.

    The scale maps the largest absolute weight onto ``INT8_MAX``.

    Args:
        weights: Non-empty floating-point tensor to compress.

    Returns:
        A ``(quantized, scale)`` pair: ``quantized`` is an int8 tensor with
        the same shape as ``weights``; ``scale`` is the 0-d tensor multiplier
        that was applied (divide by it to de-quantize).
    """
    max_val = weights.abs().max()
    if max_val == 0:
        # All-zero input: 127 / 0 would give an infinite scale and 0 * inf
        # is NaN, so fall back to a neutral scale of 1.
        scale = torch.ones_like(max_val)
    else:
        scale = INT8_MAX / max_val
    quantized = (weights * scale).round().clamp(-INT8_MAX, INT8_MAX).char()
    return quantized, scale


def dequantize_int8(quantized: torch.Tensor, scale) -> torch.Tensor:
    """Map int8 values back to floats by undoing the quantization scale."""
    return quantized.float() / scale


# 1. Original Weights (FP32)
weights_fp32 = torch.tensor([0.15, -0.85, 2.30, -1.20])

# 2. Determine Scale and 3. Quantize
max_val = weights_fp32.abs().max()
weights_int8, scale = quantize_int8(weights_fp32)
print(f"Scale Factor: {scale:.2f}")

# 4. De-quantize (During Inference)
weights_recon = dequantize_int8(weights_int8, scale)

print(f"Original: {weights_fp32}")
print(f"Int8 Rep: {weights_int8}")
print(f"Restored: {weights_recon}")
# Mean absolute difference between the original and the round-tripped weights.
print(f"Error: {(weights_fp32 - weights_recon).abs().mean():.4f}")

## Conclusion
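The mean reconstruction error is small relative to the magnitude of the weights, which is why an LLM's output quality usually changes very little after INT8 quantization.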