summary | refs | log | tree | commit | diff
path: root/utils.h
diff options
context:
space:
mode:
author Erik Scholz <Green-Sky@users.noreply.github.com> 2023-03-19 18:57:00 +0100
committer GitHub <noreply@github.com> 2023-03-19 19:57:00 +0200
commit 0b366e735729327476ec31da02de3c9c9771ddfb (patch)
tree 84022e2ae4d512f44e430a0fb8b49acf3c4a6f72 /utils.h
parent 160bfb217da5038ccbd74438f9f16a16012d7866 (diff)
Command line switch to use F16 for memory_k and memory_v (refactor of #154) (#294)
* Use F16 for memory_k and memory_v
* add command line switch to use f16 instead of f32 for memory k+v
---------
Co-authored-by: Ty Everett <ty@tyweb.us>
Diffstat (limited to 'utils.h')
-rw-r--r-- utils.h 1
1 files changed, 1 insertions, 0 deletions
diff --git a/utils.h b/utils.h
index e329ba16..c68e4cba 100644
--- a/utils.h
+++ b/utils.h
@@ -18,6 +18,7 @@ struct gpt_params {
int32_t n_predict = 128; // new tokens to predict
int32_t repeat_last_n = 64; // last n tokens to penalize
int32_t n_ctx = 512; //context size
+ bool memory_f16 = false; // use f16 instead of f32 for memory kv
// sampling parameters
int32_t top_k = 40;