Skip to content

Commit 2ea0e00

Browse files
committed
opencl: use q8_0 mm for larger matrix
1 parent 28d3073 commit 2ea0e00

File tree

1 file changed

+3
-0
lines changed

1 file changed

+3
-0
lines changed

ggml/src/ggml-opencl/ggml-opencl.cpp

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -6975,6 +6975,9 @@ static void ggml_cl_mul_mat(ggml_backend_t backend, const ggml_tensor * src0, co
6975 6975
return;
6976 6976
}
6977 6977
case GGML_TYPE_Q8_0: {
6978 +
if (ne11 < 32) {
6979 +
break;
6980 +
}
6978 6981
kernel = backend_ctx->kernel_mul_mm_q8_0_f32_l4_lm;
6979 6982
nth0 = 128; // calculated as (BM*BN)/(TM*TN)
6980 6983

0 commit comments

Comments
 (0)