diff options
author | Georgi Gerganov <ggerganov@gmail.com> | 2024-05-23 10:00:44 +0300 |
---|---|---|
committer | GitHub <noreply@github.com> | 2024-05-23 10:00:44 +0300 |
commit | d48c88cbd563b6cf0ce972e2f56796896e240736 (patch) | |
tree | 14574b8ddc14145b093f6ab531f1e2968bbd6d85 /ggml.h | |
parent | e84b71c2c6da6e69c8f815168ea836f9716a325e (diff) |
ggml : remove ggml_flash_attn and ggml_flash_ff (#7463)
ggml-ci
Diffstat (limited to 'ggml.h')
-rw-r--r-- | ggml.h | 18 |
1 file changed, 1 insertion, 17 deletions
```diff
@@ -481,9 +481,7 @@ extern "C" {
         GGML_OP_ARGSORT,
         GGML_OP_LEAKY_RELU,
 
-        GGML_OP_FLASH_ATTN,
         GGML_OP_FLASH_ATTN_EXT,
-        GGML_OP_FLASH_FF,
         GGML_OP_FLASH_ATTN_BACK,
         GGML_OP_SSM_CONV,
         GGML_OP_SSM_SCAN,
@@ -1761,13 +1759,6 @@ extern "C" {
             struct ggml_tensor  * a,
             int                   k);
 
-    GGML_API struct ggml_tensor * ggml_flash_attn(
-            struct ggml_context * ctx,
-            struct ggml_tensor  * q,
-            struct ggml_tensor  * k,
-            struct ggml_tensor  * v,
-            bool                  masked);
-
 #define GGML_KQ_MASK_PAD 32
 
     // q:    [n_embd, n_batch,     n_head,    1]
@@ -1788,6 +1779,7 @@ extern "C" {
             struct ggml_tensor * a,
             enum ggml_prec       prec);
 
+    // TODO: needs to be adapted to ggml_flash_attn_ext
     GGML_API struct ggml_tensor * ggml_flash_attn_back(
            struct ggml_context * ctx,
            struct ggml_tensor  * q,
@@ -1796,14 +1788,6 @@ extern "C" {
            struct ggml_tensor  * d,
            bool                  masked);
 
-    GGML_API struct ggml_tensor * ggml_flash_ff(
-            struct ggml_context * ctx,
-            struct ggml_tensor  * a,
-            struct ggml_tensor  * b0,
-            struct ggml_tensor  * b1,
-            struct ggml_tensor  * c0,
-            struct ggml_tensor  * c1);
-
     GGML_API struct ggml_tensor * ggml_ssm_conv(
             struct ggml_context * ctx,
             struct ggml_tensor  * s,
```