summary | refs | log | tree | commit | diff
path: root/ggml-cuda.cu
diff options
context:
space:
mode:
author: Georgi Gerganov <ggerganov@gmail.com> 2024-01-03 13:01:44 +0200
committer: Georgi Gerganov <ggerganov@gmail.com> 2024-01-03 14:38:38 +0200
commit: d55356d3baa58a6c3a9171cb67a67094b9aa9dff (patch)
tree: 02a6cc74b2056ff2637154ab9d47a683a6aee79c /ggml-cuda.cu
parent: 75e3fd85814c367b55aea11e7bb38cb7b82c6aa0 (diff)
cuda : mark I16 and I32 ops as unsupported
ggml-ci
Diffstat (limited to 'ggml-cuda.cu')
-rw-r--r-- ggml-cuda.cu 13
1 files changed, 10 insertions, 3 deletions
diff --git a/ggml-cuda.cu b/ggml-cuda.cu
index 8c271230..2e759d43 100644
--- a/ggml-cuda.cu
+++ b/ggml-cuda.cu
@@ -10039,14 +10039,22 @@ static bool ggml_backend_cuda_supports_op(ggml_backend_t backend, const ggml_ten
}
return false;
} break;
+ case GGML_OP_DUP:
+ case GGML_OP_REPEAT:
+ case GGML_OP_CONCAT:
+ {
+ ggml_type src0_type = op->src[0]->type;
+ if (src0_type != GGML_TYPE_I32 && src0_type != GGML_TYPE_I16) {
+ return true;
+ }
+ return false;
+ } break;
case GGML_OP_NONE:
case GGML_OP_RESHAPE:
case GGML_OP_VIEW:
case GGML_OP_PERMUTE:
case GGML_OP_TRANSPOSE:
case GGML_OP_NORM:
- case GGML_OP_REPEAT:
- case GGML_OP_DUP:
case GGML_OP_ADD:
case GGML_OP_MUL:
case GGML_OP_DIV:
@@ -10063,7 +10071,6 @@ static bool ggml_backend_cuda_supports_op(ggml_backend_t backend, const ggml_ten
case GGML_OP_SUM_ROWS:
case GGML_OP_ARGSORT:
case GGML_OP_ACC:
- case GGML_OP_CONCAT:
case GGML_OP_GROUP_NORM:
case GGML_OP_UPSCALE:
case GGML_OP_PAD: