summary | refs | log | tree | commit | diff
path: root/gguf.py
diff options
context:
space:
mode:
author: slaren <slarengh@gmail.com> 2023-08-24 20:04:05 +0200
committer: GitHub <noreply@github.com> 2023-08-24 21:04:05 +0300
commit: 0d3094f0c742ce61f84feb6e4f0b59beee6194d7 (patch)
tree: 5e8dba2a55440524f2cefdef72479eea9db93842 /gguf.py
parent: 01f2224682b08185af609b28b1268b95c8b4cfa2 (diff)
gguf : add rope_freq_base parameter for CodeLlama (#2769)
Diffstat (limited to 'gguf.py')
-rwxr-xr-x gguf.py 6
1 file changed, 5 insertions, 1 deletion
diff --git a/gguf.py b/gguf.py
index 5c37f0f0..f4db7001 100755
--- a/gguf.py
+++ b/gguf.py
@@ -47,6 +47,7 @@ KEY_ATTENTION_LAYERNORM_RMS_EPS = "{arch}.attention.layer_norm_rms_epsilon"
# RoPE
KEY_ROPE_DIMENSION_COUNT = "{arch}.rope.dimension_count"
+KEY_ROPE_FREQ_BASE = "{arch}.rope.freq_base"
KEY_ROPE_SCALE_LINEAR = "{arch}.rope.scale_linear"
# tokenization
@@ -663,7 +664,10 @@ class GGUFWriter:
self.add_uint32(
KEY_ROPE_DIMENSION_COUNT.format(arch=self.arch), count)
- def add_rope_scale_linear(self, value: float):
+ def add_rope_freq_base(self, value: float):
+ self.add_float32(KEY_ROPE_FREQ_BASE.format(arch=self.arch), value)
+
+ def add_rope_scale_linear(self, value: float):
self.add_float32(KEY_ROPE_SCALE_LINEAR.format(arch=self.arch), value)
def add_tokenizer_model(self, model: str):