From 7d873df32ad9c73f1d4132342ab4cd01d63cef26 Mon Sep 17 00:00:00 2001
From: leejet
Date: Sat, 30 May 2026 22:09:57 +0800
Subject: [PATCH] fix: correct Gemma3 rope settings and vram limit propagation

---
 src/conditioner.hpp | 5 +++++
 src/llm.hpp | 8 ++++----
 2 files changed, 9 insertions(+), 4 deletions(-)

diff --git a/src/conditioner.hpp b/src/conditioner.hpp
index 0347a5258..f7037bc69 100644
--- a/src/conditioner.hpp
+++ b/src/conditioner.hpp
@@ -2290,6 +2290,11 @@ struct LTXAVEmbedder : public Conditioner {
 projector->set_flash_attention_enabled(enabled);
 }
 
+ void set_max_graph_vram_bytes(size_t max_vram_bytes) override {
+ llm->set_max_graph_vram_bytes(max_vram_bytes);
+ projector->set_max_graph_vram_bytes(max_vram_bytes);
+ }
+
 void set_weight_adapter(const std::shared_ptr& adapter) override {
 llm->set_weight_adapter(adapter);
 projector->set_weight_adapter(adapter);
diff --git a/src/llm.hpp b/src/llm.hpp
index ec510e875..9c36be4bb 100644
--- a/src/llm.hpp
+++ b/src/llm.hpp
@@ -879,8 +879,8 @@ namespace LLM {
 input_pos,
 nullptr,
 head_dim,
- GGML_ROPE_TYPE_NORMAL,
- 0,
+ GGML_ROPE_TYPE_NEOX,
+ 131072,
 rope_theta,
 freq_scale,
 0.f,
@@ -892,8 +892,8 @@ namespace LLM {
 input_pos,
 nullptr,
 head_dim,
- GGML_ROPE_TYPE_NORMAL,
- 0,
+ GGML_ROPE_TYPE_NEOX,
+ 131072,
 rope_theta,
 freq_scale,
 0.f,