diff options
author | Stephan Walter <stephan@walter.name> | 2023-04-12 15:06:16 +0000 |
---|---|---|
committer | GitHub <noreply@github.com> | 2023-04-12 15:06:16 +0000 |
commit | e7f6997f897a18b6372a6460e25c5f89e1469f1d (patch) | |
tree | 78139653d351b37cd045d951814b3ec7b2ca1412 /llama.h | |
parent | f76cb3a34d6a6b03afb96650e39495f201eac042 (diff) |
Don't crash on ftype (formerly f16) == 4 (#917)
Diffstat (limited to 'llama.h')
-rw-r--r-- | llama.h | 1 |
1 file changed, 1 insertion, 0 deletions
@@ -71,6 +71,7 @@ extern "C" {
 LLAMA_FTYPE_MOSTLY_F16 = 1, // except 1d tensors
 LLAMA_FTYPE_MOSTLY_Q4_0 = 2, // except 1d tensors
 LLAMA_FTYPE_MOSTLY_Q4_1 = 3, // except 1d tensors
+LLAMA_FTYPE_MOSTLY_Q4_1_SOME_F16 = 4, // tok_embeddings.weight and output.weight are F16
 };
 
 LLAMA_API struct llama_context_params llama_context_default_params();