llama : add phi3 support (#6852)

* add explicit phi3 support
* add explicit phi3 support
* remove unused code
* convert : add BOS token
* llama : match EOT token <|end|>
* llama : minor / style
* llama : tabs -> spaces
* convert : fix lint checks

---------

Co-authored-by: Georgi Gerganov <ggerganov@gmail.com>
author: liuwei-git <14815172+liuwei-git@users.noreply.github.com> 2024-04-24 15:00:37 +0800
committer: GitHub <noreply@github.com> 2024-04-24 10:00:37 +0300
commit: c8297c6af5693555652c40b95974b95d49d2674d (patch)
tree: 403d5e80233b90b3a03a7283c297c679400ccf6a /gguf-py/gguf/tensor_mapping.py
parent: 4e96a812b3ce7322a29a3008db2ed73d9087b176 (diff)
1 files changed, 2 insertions, 0 deletions
diff --git a/gguf-py/gguf/tensor_mapping.py b/gguf-py/gguf/tensor_mapping.py
index 10de36fa..e5750d41 100644
--- a/gguf-py/gguf/tensor_mapping.py
+++ b/gguf-py/gguf/tensor_mapping.py
@@ -117,6 +117,7 @@ class TensorNameMap:
             "h.{bid}.attn.c_attn",                                                 # gpt2
             "transformer.h.{bid}.mixer.Wqkv",                                      # phi2
             "encoder.layers.{bid}.attn.Wqkv",                                      # nomic-bert
+            "model.layers.{bid}.self_attn.qkv_proj"                                # phi3
         ),
 
         # Attention query
@@ -234,6 +235,7 @@ class TensorNameMap:
             "h.{bid}.mlp.c_fc",                                       # gpt2
             "transformer.h.{bid}.mlp.fc1",                            # phi2
             "model.layers.{bid}.mlp.fc1",                             # phi2
+            "model.layers.{bid}.mlp.gate_up_proj",                    # phi3
             "model.layers.layers.{bid}.mlp.up_proj",                  # plamo
             "model.layers.{bid}.feed_forward.w3",                     # internlm2
             "encoder.layers.{bid}.mlp.fc11",                          # nomic-bert
author	liuwei-git <14815172+liuwei-git@users.noreply.github.com>	2024-04-24 15:00:37 +0800
committer	GitHub <noreply@github.com>	2024-04-24 10:00:37 +0300
commit	c8297c6af5693555652c40b95974b95d49d2674d (patch)
tree	403d5e80233b90b3a03a7283c297c679400ccf6a /gguf-py/gguf/tensor_mapping.py
parent	4e96a812b3ce7322a29a3008db2ed73d9087b176 (diff)