summary refs log tree commit diff
path: root/ggml/src/iqk/iqk_flash_impl.h
diff options
context:
space:
mode:
Diffstat (limited to 'ggml/src/iqk/iqk_flash_impl.h')
-rw-r--r-- ggml/src/iqk/iqk_flash_impl.h 4
1 files changed, 4 insertions, 0 deletions
diff --git a/ggml/src/iqk/iqk_flash_impl.h b/ggml/src/iqk/iqk_flash_impl.h
index 68802927..6f62e56b 100644
--- a/ggml/src/iqk/iqk_flash_impl.h
+++ b/ggml/src/iqk/iqk_flash_impl.h
@@ -6,6 +6,8 @@
#pragma once
+#include <cstdint>
+
bool iqk_flash_attn_impl(int type_k, // type of k
int type_v, // type of v
int Dk, // K head size
@@ -27,3 +29,5 @@ bool iqk_flash_attn_impl(int type_k, // type of k
float * M,
float * S);
+void * iqk_repack_k(int type_k, int nek0, int nek1, int nek2, int nek3, long nbk1, long nbk2, long nbk3,
+ const void * k, void * work, int ith, int nth, int& repacked_type, uint64_t& row_size);