From 99ea899a850f9c967334a22f51f8e8b3e88c1bf7 Mon Sep 17 00:00:00 2001
From: Jack <32371937+jackzhxng@users.noreply.github.com>
Date: Wed, 24 Sep 2025 13:12:06 -0400
Subject: [PATCH 1/2] Update Voxtral README.md

---
 examples/models/voxtral/README.md | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/examples/models/voxtral/README.md b/examples/models/voxtral/README.md
index a9bd5c9b1af..4fdd4f7ba2a 100644
--- a/examples/models/voxtral/README.md
+++ b/examples/models/voxtral/README.md
@@ -28,7 +28,9 @@ optimum-cli export executorch \
   --use_custom_sdpa \
   --use_custom_kv_cache \
   --qlinear 8da4w \
+  --qlinear_encoder 8da4w \
   --qembedding 4w \
+  --qembedding_group_size 32 \
   --output_dir="voxtral"
 ```
 

From 122fa3646e86266c925175a7228f39de68afd4b0 Mon Sep 17 00:00:00 2001
From: Jack <32371937+jackzhxng@users.noreply.github.com>
Date: Wed, 24 Sep 2025 13:15:42 -0400
Subject: [PATCH 2/2] Update README.md

---
 examples/models/voxtral/README.md | 1 +
 1 file changed, 1 insertion(+)

diff --git a/examples/models/voxtral/README.md b/examples/models/voxtral/README.md
index 4fdd4f7ba2a..c6749c00b38 100644
--- a/examples/models/voxtral/README.md
+++ b/examples/models/voxtral/README.md
@@ -27,6 +27,7 @@ optimum-cli export executorch \
   --recipe "xnnpack" \
   --use_custom_sdpa \
   --use_custom_kv_cache \
+  --max_seq_len 2048 \
   --qlinear 8da4w \
   --qlinear_encoder 8da4w \
   --qembedding 4w \