summary | refs | log | tree | commit | diff
path: root/ggml-cuda/softmax.cuh
diff options
context:
space:
mode:
author: slaren <slarengh@gmail.com>, 2024-03-25 13:50:23 +0100
committer: GitHub <noreply@github.com>, 2024-03-25 13:50:23 +0100
commit: ae1f211ce2138448b47ebb148e25c58406845278 (patch)
tree: a18f5712eaee64d7d0ad1a3b3a097591ec10277e /ggml-cuda/softmax.cuh
parent: ad3a0505e3b6cd777259ee35e61d428357ffc565 (diff)
cuda : refactor into multiple files (#6269)
Diffstat (limited to 'ggml-cuda/softmax.cuh')
-rw-r--r-- ggml-cuda/softmax.cuh 5
1 files changed, 5 insertions, 0 deletions
diff --git a/ggml-cuda/softmax.cuh b/ggml-cuda/softmax.cuh
new file mode 100644
index 00000000..4ef4ff86
--- /dev/null
+++ b/ggml-cuda/softmax.cuh
@@ -0,0 +1,5 @@
+#include "common.cuh"
+
+#define CUDA_SOFT_MAX_BLOCK_SIZE 1024
+
+void ggml_cuda_op_soft_max(ggml_backend_cuda_context & ctx, ggml_tensor * dst);