diff --git a/tinker_cookbook/recipes/chat_sl/README.md b/tinker_cookbook/recipes/chat_sl/README.md index 42d49df..6d8e90e 100644 --- a/tinker_cookbook/recipes/chat_sl/README.md +++ b/tinker_cookbook/recipes/chat_sl/README.md @@ -3,7 +3,7 @@ ## SFT on NoRobots ```bash -python -m tinker_cookbook.recipes.chat_sl.train +python -m tinker_cookbook.recipes.chat_sl.train \ model_name=Qwen/Qwen3-8B-Base \ dataset=no_robots \ learning_rate=5e-4 \ @@ -19,7 +19,7 @@ After 140 steps of training, `test/nll` decreases to 1.788. ## SFT on Tulu3 dataset ```bash -python -m tinker_cookbook.recipes.chat_sl.train +python -m tinker_cookbook.recipes.chat_sl.train \ model_name=Qwen/Qwen3-8B-Base \ dataset=tulu3 \ learning_rate=5e-4 \