diff options
author | chiranko <96988916+chiranko@users.noreply.github.com> | 2024-01-19 17:07:27 +0800 |
---|---|---|
committer | GitHub <noreply@github.com> | 2024-01-19 11:07:27 +0200 |
commit | 2b3b999cacc7ad1207c32fbdf3479a19c06e1a34 (patch) | |
tree | be2adbdfb73eb5d24ab9bcbb6f53671b9bb88ffa /gguf-py/gguf/tensor_mapping.py | |
parent | 993fba81807e55d27b570945af8e416d535eced1 (diff) |
llama : add CodeShell support (#5016)
* llama: add codeshell support
* llama.cpp: fix codeshell with NeoX rope
Co-authored-by: Georgi Gerganov <ggerganov@gmail.com>
---------
Co-authored-by: Georgi Gerganov <ggerganov@gmail.com>
Diffstat (limited to 'gguf-py/gguf/tensor_mapping.py')
-rw-r--r-- | gguf-py/gguf/tensor_mapping.py | 1 |
1 file changed, 1 insertion, 0 deletions
```diff
diff --git a/gguf-py/gguf/tensor_mapping.py b/gguf-py/gguf/tensor_mapping.py
index e5b14610..de177af1 100644
--- a/gguf-py/gguf/tensor_mapping.py
+++ b/gguf-py/gguf/tensor_mapping.py
@@ -154,6 +154,7 @@ class TensorNameMap:
             "model.layers.{bid}.self_attn.rotary_emb.inv_freq", # llama-hf
             "layers.{bid}.attention.inner_attention.rope.freqs", # llama-pth
             "model.layers.layers.{bid}.self_attn.rotary_emb.inv_freq", # plamo
+            "transformer.h.{bid}.attn.rotary_emb.inv_freq", # codeshell
         ),
 
         # Feed-forward norm
```