Showing 2 changed files with 124 additions and 0 deletions.
@@ -0,0 +1,123 @@
import os

import torch
from simple_parsing import ArgumentParser

from sae_lens.config import LanguageModelTranscoderRunnerConfig
from sae_lens.sae_training_runner import TranscoderTrainingRunner


def setup_env_vars():
    # Disable tokenizer parallelism to avoid fork-related warnings from
    # HuggingFace tokenizers in dataloader workers.
    os.environ["TOKENIZERS_PARALLELISM"] = "false"


def get_default_config():
    # Prefer CUDA, then Apple Silicon (MPS), then fall back to CPU.
    if torch.cuda.is_available():
        device = "cuda"
    elif torch.backends.mps.is_available():
        device = "mps"
    else:
        device = "cpu"

    # total_training_steps = 20_000
    total_training_steps = 500
    batch_size = 4096
    total_training_tokens = total_training_steps * batch_size
    print(f"Total Training Tokens: {total_training_tokens}")

    lr_warm_up_steps = 0
    lr_decay_steps = 40_000
    print(f"lr_decay_steps: {lr_decay_steps}")
    l1_warmup_steps = 10_000
    print(f"l1_warmup_steps: {l1_warmup_steps}")

    return LanguageModelTranscoderRunnerConfig(
        # Pick a tiny model to make this easier.
        model_name="gelu-1l",
        ## MLP Layer 0 ##
        hook_name="blocks.0.ln2.hook_normalized",
        hook_name_out="blocks.0.hook_mlp_out",  # A valid hook point (see more details here: https://neelnanda-io.github.io/TransformerLens/generated/demos/Main_Demo.html#Hook-Points)
        hook_layer=0,  # Only one layer in the model.
        hook_layer_out=0,  # Only one layer in the model.
        d_in=512,  # The width of the MLP input.
        d_out=512,  # The width of the MLP output.
        dataset_path="NeelNanda/c4-tokenized-2b",
        context_size=256,
        is_dataset_tokenized=True,
        prepend_bos=True,  # I used to train GPT2 SAEs with a prepended BOS but no longer think we should do this.
        # How big do we want our SAE to be?
        expansion_factor=16,
        # Dataset / Activation Store
        # When we do a proper test:
        # training_tokens=820_000_000,  # 200k steps * 4096 batch size ~ 820M tokens (doable overnight on an A100)
        # For now:
        training_tokens=total_training_tokens,  # For initial testing I think this is a good number.
        train_batch_size_tokens=4096,
        # Loss Function
        ## Reconstruction Coefficient.
        mse_loss_normalization=None,  # MSE loss normalization is not mentioned (so we use standard MSE loss), but note that we take an average over the batch.
        ## Anthropic does not mention using an Lp norm other than L1.
        l1_coefficient=5,
        lp_norm=1.0,
        # Instead, they multiply the L1 loss contribution
        # from each feature of the activations by the decoder norm of the corresponding feature.
        scale_sparsity_penalty_by_decoder_norm=True,
        # Learning Rate
        lr_scheduler_name="constant",  # We set this independently of warmup and decay steps.
        l1_warm_up_steps=l1_warmup_steps,
        lr_warm_up_steps=lr_warm_up_steps,
        lr_decay_steps=lr_decay_steps,
        ## No ghost grad term.
        use_ghost_grads=False,
        # Initialization / Architecture
        apply_b_dec_to_input=False,
        # Encoder bias zeros (I'm not sure what the default is now).
        # Decoder bias zeros.
        b_dec_init_method="zeros",
        normalize_sae_decoder=False,
        decoder_heuristic_init=True,
        init_encoder_as_decoder_transpose=True,
        # Optimizer
        lr=4e-5,
        ## The Adam optimizer has no weight decay by default, so don't worry about this.
        adam_beta1=0.9,
        adam_beta2=0.999,
        # Buffer details won't matter if we cache / shuffle our activations ahead of time.
        n_batches_in_buffer=64,
        store_batch_size_prompts=16,
        normalize_activations="constant_norm_rescale",
        # Feature Store
        feature_sampling_window=1000,
        dead_feature_window=1000,
        dead_feature_threshold=1e-4,
        # Performance enhancement:
        compile_sae=True,
        # WANDB
        log_to_wandb=True,  # Always use wandb unless you are just testing code.
        wandb_project="benchmark",
        wandb_log_frequency=100,
        # Misc
        device=device,
        seed=42,
        n_checkpoints=0,
        checkpoint_path="checkpoints",
        dtype="float32",
    )


def run_training(cfg: LanguageModelTranscoderRunnerConfig):
    sae = TranscoderTrainingRunner(cfg).run()
    assert sae is not None
    # We know whether or not this works by looking at the dashboard!


if __name__ == "__main__":
    parser = ArgumentParser()
    parser.add_arguments(
        LanguageModelTranscoderRunnerConfig, "cfg", default=get_default_config()
    )
    args = parser.parse_args()
    setup_env_vars()
    run_training(args.cfg)
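
For quick experiments it can also be handy to drive the same pipeline from Python rather than through the CLI. A minimal sketch, assuming LanguageModelTranscoderRunnerConfig is a dataclass (as sae_lens runner configs generally are) so that dataclasses.replace applies; the override values below are hypothetical smoke-test numbers:

from dataclasses import replace

cfg = get_default_config()
# Hypothetical smoke-test overrides: fewer training tokens, no wandb logging.
cfg = replace(cfg, training_tokens=4096 * 100, log_to_wandb=False)
setup_env_vars()
run_training(cfg)

Equivalently, because the config is registered with simple_parsing, individual config fields can be overridden as command-line flags when invoking the script directly.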