Support for dots.llm1 models (#573)

* Add llama.cpp changes for dots1 support
* Add python changes for dots1 support
* Fix to make it convert
* Remove V reshaping, remove BOS by default for dots1 and fix warmup to handle models without BOS
* Minor fix
* Remove commented lines
author: saood06 <saood05@gmail.com> 2025-07-10 02:37:36 -0500
committer: GitHub <noreply@github.com> 2025-07-10 02:37:36 -0500
commit: c53cb65251168006b29da91fea7e5e42d815af15 (patch)
tree: 0afdec44454a7e3dc379102de8346bbe6c92cd91 /gguf-py/gguf/tensor_mapping.py
parent: 283753cabcabd30eb2cfb93739d9c1679200bf1f (diff)
1 files changed, 1 insertions, 1 deletions
diff --git a/gguf-py/gguf/tensor_mapping.py b/gguf-py/gguf/tensor_mapping.py
index 9688b02c..d507725c 100644
--- a/gguf-py/gguf/tensor_mapping.py
+++ b/gguf-py/gguf/tensor_mapping.py
@@ -257,7 +257,7 @@ class TensorNameMap:
         ),
 
         MODEL_TENSOR.FFN_EXP_PROBS_B: (
-            "model.layers.{bid}.mlp.gate.e_score_correction", # deepseek-v3
+            "model.layers.{bid}.mlp.gate.e_score_correction", # deepseek-v3 dots1
         ),
 
         # Feed-forward up
author	saood06 <saood05@gmail.com>	2025-07-10 02:37:36 -0500
committer	GitHub <noreply@github.com>	2025-07-10 02:37:36 -0500
commit	c53cb65251168006b29da91fea7e5e42d815af15 (patch)
tree	0afdec44454a7e3dc379102de8346bbe6c92cd91 /gguf-py/gguf/tensor_mapping.py
parent	283753cabcabd30eb2cfb93739d9c1679200bf1f (diff)