Skip to content

Commit 937f992

Browse files
committed
request prealloc_y sync after quantization
1 parent 6e24c33 commit 937f992

File tree

1 file changed

+3
-3
lines changed

1 file changed

+3
-3
lines changed

ggml/src/ggml-vulkan/ggml-vulkan.cpp

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -7478,7 +7478,7 @@ static void ggml_vk_mul_mat_id_q_f16(ggml_backend_vk_context * ctx, vk_context&
     if (x_non_contig || qx_needs_dequant) {
         ctx->prealloc_x_need_sync = true;
     }
-    if (y_non_contig) {
+    if (y_non_contig || quantize_y) {
         ctx->prealloc_y_need_sync = true;
     }
 }
@@ -7504,7 +7504,7 @@ static void ggml_vk_mul_mat_vec_id_q_f16(ggml_backend_vk_context * ctx, vk_conte
 
     const uint64_t ne10 = src1->ne[0];
     const uint64_t ne11 = src1->ne[1];
-    // const uint64_t ne12 = src1->ne[2];
+    const uint64_t ne12 = src1->ne[2];
     // const uint64_t ne13 = src1->ne[3];
 
     const uint64_t nei0 = ids->ne[0];
@@ -7700,7 +7700,7 @@ static void ggml_vk_mul_mat_vec_id_q_f16(ggml_backend_vk_context * ctx, vk_conte
     if (x_non_contig) {
         ctx->prealloc_x_need_sync = true;
     }
-    if (y_non_contig) {
+    if (y_non_contig || quantize_y) {
         ctx->prealloc_y_need_sync = true;
     }
 }

0 commit comments

Comments
 (0)