summary | refs | log | tree | commit | diff
path: root/llama.cpp
diff options
context:
space:
mode:
author: Georgi Gerganov <ggerganov@gmail.com> 2024-02-26 08:30:17 +0200
committer: Georgi Gerganov <ggerganov@gmail.com> 2024-02-26 08:30:17 +0200
commit: 269de86ba073b5dc9ce687c11a3bc4d7d873b962 (patch)
tree: 130f3ef657bceb51793258e39b0759b7c637dfd9 /llama.cpp
parent: c39373398803c669056304090050fe3f44b41bf9 (diff)
llama : fix Gemma rope type (#5691)
Diffstat (limited to 'llama.cpp')
-rw-r--r-- llama.cpp 2
1 file changed, 1 insertion, 1 deletion
diff --git a/llama.cpp b/llama.cpp
index 3424b199..28430254 100644
--- a/llama.cpp
+++ b/llama.cpp
@@ -12089,7 +12089,6 @@ enum llama_rope_type llama_rope_type(const struct llama_model * model) {
case LLM_ARCH_ORION:
case LLM_ARCH_INTERNLM2:
case LLM_ARCH_MINICPM:
- case LLM_ARCH_GEMMA:
return LLAMA_ROPE_TYPE_NORM;
// the pairs of head values are offset by n_rot/2
@@ -12101,6 +12100,7 @@ enum llama_rope_type llama_rope_type(const struct llama_model * model) {
case LLM_ARCH_QWEN:
case LLM_ARCH_QWEN2:
case LLM_ARCH_PHI2:
+ case LLM_ARCH_GEMMA:
return LLAMA_ROPE_TYPE_NEOX;
// all model arches should be listed explicitly here