Skip to content

Commit 1b78909

Browse files
committed
request prealloc_y sync after quantization
1 parent 434c6d3 commit 1b78909

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

ggml/src/ggml-vulkan/ggml-vulkan.cpp

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -7502,7 +7502,7 @@ static void ggml_vk_mul_mat_id_q_f16(ggml_backend_vk_context * ctx, vk_context&
7502 7502       if (x_non_contig || qx_needs_dequant) {
7503 7503           ctx->prealloc_x_need_sync = true;
7504 7504       }
7505      -     if (y_non_contig) {
     7505 +     if (y_non_contig || quantize_y) {
7506 7506           ctx->prealloc_y_need_sync = true;
7507 7507       }
7508 7508   }
@@ -7803,7 +7803,7 @@ static void ggml_vk_mul_mat_vec_id_q_f16(ggml_backend_vk_context * ctx, vk_conte
7803 7803       if (x_non_contig) {
7804 7804           ctx->prealloc_x_need_sync = true;
7805 7805       }
7806      -     if (y_non_contig) {
     7806 +     if (y_non_contig || quantize_y) {
7807 7807           ctx->prealloc_y_need_sync = true;
7808 7808       }
7809 7809   }

0 commit comments

Comments
 (0)