summary | refs | log | tree | commit | diff
path: root/ggml.c
diff options
context:
space:
mode:
author: shibe2 <shibe@tuta.io> 2023-10-02 23:26:15 +0400
committer: GitHub <noreply@github.com> 2023-10-02 21:26:15 +0200
commit: 665018c749101e81c816675198e731e47d6b1dbe (patch)
tree: 4486f9b1484367d04d2609b57453af30cf0c8453 /ggml.c
parent: 29a404a951fb0b3f9c3b6ab8c4c9c76ac50d2bb3 (diff)
CLBlast: Add broadcast support for matrix multiplication (#3402)
Broadcast src0 into src1 across dimensions 2 and 3 when needed. This is required for models that use GQA.
Diffstat (limited to 'ggml.c')
-rw-r--r-- ggml.c 5
1 file changed, 0 insertions, 5 deletions
diff --git a/ggml.c b/ggml.c
index 820fe2e7..bf1426d2 100644
--- a/ggml.c
+++ b/ggml.c
@@ -11621,11 +11621,6 @@ static void ggml_compute_forward_mul_mat(
#if defined(GGML_USE_CLBLAST)
if (ggml_cl_can_mul_mat(src0, src1, dst)) {
- // TODO: handle case when src0 is broadcast-able into src1 across 2nd,3rd dimension
- // ref: https://github.com/ggerganov/ggml/pull/224
- GGML_ASSERT(ne02 == ne12);
- GGML_ASSERT(ne03 == ne13);
-
if (params->ith == 0 && params->type == GGML_TASK_COMPUTE) {
ggml_cl_mul_mat(src0, src1, dst, params->wdata, params->wsize);
}