summary | refs | log | tree | commit | diff
path: root/ggml.c
diff options
context:
space:
mode:
Diffstat (limited to 'ggml.c')
-rw-r--r-- ggml.c | 11
1 files changed, 11 insertions, 0 deletions
diff --git a/ggml.c b/ggml.c
index ef6fd8ca..8f57003e 100644
--- a/ggml.c
+++ b/ggml.c
@@ -7207,6 +7207,17 @@ static void ggml_compute_forward_add_f32(
const int ith = params->ith;
const int nth = params->nth;
+#ifdef GGML_USE_CLBLAST
+ if (src1->backend == GGML_BACKEND_GPU) {
+ // TODO: OpenCL kernel support full broadcast
+ GGML_ASSERT(ggml_can_repeat_rows(src1, src0));
+ if (ith == 0) {
+ ggml_cl_add(src0, src1, dst);
+ }
+ return;
+ }
+#endif
+
const int nr = ggml_nrows(src0);
GGML_TENSOR_BINARY_OP_LOCALS