diff options
Diffstat (limited to 'ggml/include')
-rw-r--r-- | ggml/include/ggml-backend.h | 6 | ||||
-rw-r--r-- | ggml/include/ggml.h | 7 |
2 files changed, 13 insertions, 0 deletions
diff --git a/ggml/include/ggml-backend.h b/ggml/include/ggml-backend.h
index 5f3f1e28..621620bc 100644
--- a/ggml/include/ggml-backend.h
+++ b/ggml/include/ggml-backend.h
@@ -232,6 +232,12 @@ extern "C" {
     GGML_API void ggml_backend_tensor_alloc(ggml_backend_buffer_t buffer, struct ggml_tensor * tensor, void * addr);
     GGML_API void ggml_backend_view_init(struct ggml_tensor * tensor);
 
+    // Utility to query whether cached GGML graph is in use
+    GGML_API bool ggml_use_cached_graph(ggml_backend_sched_t sched);
+
+    // Set whether or not to use GGML graph caching
+    GGML_API void ggml_set_cached_graph(ggml_backend_sched_t sched, bool set_value);
+
 
 #ifdef __cplusplus
 }
diff --git a/ggml/include/ggml.h b/ggml/include/ggml.h
index a467c297..a99dc6b5 100644
--- a/ggml/include/ggml.h
+++ b/ggml/include/ggml.h
@@ -597,6 +597,13 @@ extern "C" {
         GGML_TENSOR_FLAG_PARAM = 4,
     };
 
+    // Flag (used on GGML_OP_CPY nodes) on whether node is associated with K or V cache
+    enum ggml_kv_cache_flag {
+        GGML_KV_CACHE_FLAG_NONE = 0,
+        GGML_KV_CACHE_FLAG_K = 1,
+        GGML_KV_CACHE_FLAG_V = 2
+    };
+
     // ggml object
     struct ggml_object {
         size_t offs;