summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
author Georgi Gerganov <ggerganov@gmail.com> 2023-12-14 10:35:29 +0200
committer Georgi Gerganov <ggerganov@gmail.com> 2023-12-14 10:35:29 +0200
commit 55e87c3749cb4985c3b316984d40e00e4df4a5d0 (patch)
tree 492a10dc18935136397da89c1a14fe992d535b1b
parent 873637afc7924f435ac44c067630a28e82eefa7b (diff)
ggml : fix OpenCL broadcast requirement for ggml_mul (close #4453)
-rw-r--r-- ggml.c 4
1 file changed, 2 insertions, 2 deletions
diff --git a/ggml.c b/ggml.c
index 29e18a24..7e127281 100644
--- a/ggml.c
+++ b/ggml.c
@@ -7759,10 +7759,10 @@ static void ggml_compute_forward_mul_f32(
const int ith = params->ith;
const int nth = params->nth;
-// TODO: OpenCL kernel support broadcast
#ifdef GGML_USE_CLBLAST
if (src1->backend == GGML_BACKEND_GPU) {
- GGML_ASSERT(ggml_are_same_shape(src0, src1));
+ // TODO: OpenCL kernel support full broadcast
+ GGML_ASSERT(ggml_can_repeat_rows(src1, src0));
if (ith == 0) {
ggml_cl_mul(src0, src1, dst);
}