summaryrefslogtreecommitdiff
path: root/ggml.h
diff options
context:
space:
mode:
Diffstat (limited to 'ggml.h')
-rw-r--r--ggml.h13
1 files changed, 9 insertions, 4 deletions
diff --git a/ggml.h b/ggml.h
index 27001818..6c195677 100644
--- a/ggml.h
+++ b/ggml.h
@@ -1383,13 +1383,17 @@ extern "C" {
struct ggml_context * ctx,
struct ggml_tensor * a);
- // fused soft_max(a*scale + mask)
+ // fused soft_max(a*scale + mask + pos[i]*(ALiBi slope))
// mask is optional
+ // pos is required when max_bias > 0.0f
+ // max_bias = 0.0f for no ALiBi
GGML_API struct ggml_tensor * ggml_soft_max_ext(
struct ggml_context * ctx,
struct ggml_tensor * a,
struct ggml_tensor * mask,
- float scale);
+ struct ggml_tensor * pos,
+ float scale,
+ float max_bias);
GGML_API struct ggml_tensor * ggml_soft_max_back(
struct ggml_context * ctx,
@@ -1491,12 +1495,13 @@ extern "C" {
// alibi position embedding
// in-place, returns view(a)
- GGML_API struct ggml_tensor * ggml_alibi(
+ GGML_DEPRECATED(GGML_API struct ggml_tensor * ggml_alibi(
struct ggml_context * ctx,
struct ggml_tensor * a,
int n_past,
int n_head,
- float bias_max);
+ float bias_max),
+ "use ggml_soft_max_ext instead (will be removed in Mar 2024)");
// clamp
// in-place, returns view(a)