diff options
Diffstat (limited to 'src/llama.cpp')
-rw-r--r-- | src/llama.cpp | 6 |
1 files changed, 5 insertions, 1 deletions
diff --git a/src/llama.cpp b/src/llama.cpp index 5777689e..ac02abf6 100644 --- a/src/llama.cpp +++ b/src/llama.cpp @@ -116,7 +116,7 @@ // bump if necessary #define LLAMA_MAX_LAYERS 512 -#define LLAMA_MAX_EXPERTS 256 // DeepSeekV2 +#define LLAMA_MAX_EXPERTS 384 // Kimi-K2 // // helpers @@ -6402,6 +6402,10 @@ static void llm_load_vocab( tokenizer_pre == "hunyuan") { vocab.type_pre = LLAMA_VOCAB_PRE_TYPE_HUNYUAN; vocab.tokenizer_clean_spaces = false; + } else if ( + tokenizer_pre == "kimi-k2") { + vocab.type_pre = LLAMA_VOCAB_PRE_TYPE_KIMI_K2; + vocab.tokenizer_clean_spaces = false; } else { throw std::runtime_error(format("unknown pre-tokenizer type: '%s'", tokenizer_pre.c_str())); } |