From bb43cf7e9d86d69ffd9c7f008f75db890a35b45a Mon Sep 17 00:00:00 2001
From: bryanSwk <93190252+bryanSwk@users.noreply.github.com>
Date: Thu, 4 Apr 2024 02:05:10 +0800
Subject: llama : add SEA-LION support (#6448)

* initial commit for sealion support

* add sealion support

* minor fix

* q/k ln and pos_embd only if required

* Apply suggestions from code review

Co-authored-by: Georgi Gerganov

* minor : clear whitespaces

---------

Co-authored-by: bryan
Co-authored-by: Georgi Gerganov
---
 gguf-py/gguf/tensor_mapping.py | 2 ++
 1 file changed, 2 insertions(+)

(limited to 'gguf-py/gguf/tensor_mapping.py')

diff --git a/gguf-py/gguf/tensor_mapping.py b/gguf-py/gguf/tensor_mapping.py
index 93a5a455..345b1b0c 100644
--- a/gguf-py/gguf/tensor_mapping.py
+++ b/gguf-py/gguf/tensor_mapping.py
@@ -285,11 +285,13 @@ class TensorNameMap:
         MODEL_TENSOR.ATTN_Q_NORM: (
             "language_model.encoder.layers.{bid}.self_attention.q_layernorm",
             "model.layers.{bid}.self_attn.q_layernorm", # persimmon
+            "transformer.blocks.{bid}.attn.q_ln", # sea-lion
         ),
 
         MODEL_TENSOR.ATTN_K_NORM: (
             "language_model.encoder.layers.{bid}.self_attention.k_layernorm",
             "model.layers.{bid}.self_attn.k_layernorm", # persimmon
+            "transformer.blocks.{bid}.attn.k_ln", # sea-lion
         ),
 
         MODEL_TENSOR.ROPE_FREQS: (
-- 
cgit v1.2.3