summary | refs | log | tree | commit | diff
path: root/examples/train-text-from-scratch/train-text-from-scratch.cpp
diff options
context:
space:
mode:
author cebtenzzre <cebtenzzre@gmail.com> 2023-11-01 18:04:33 -0400
committer GitHub <noreply@github.com> 2023-11-01 18:04:33 -0400
commit 898aeca90a9bb992f506234cf3b8b7f7fa28a1df (patch)
tree 125f8a9b466efd4534ecd3e64419ece001c86a7d /examples/train-text-from-scratch/train-text-from-scratch.cpp
parent c43c2da8afacaddfe51c09b21dbd9922cd0ea46b (diff)
llama : implement YaRN RoPE scaling (#2268)
Co-authored-by: cebtenzzre <cebtenzzre@gmail.com> Co-authored-by: Jeffrey Quesnelle <jquesnelle@gmail.com>
Diffstat (limited to 'examples/train-text-from-scratch/train-text-from-scratch.cpp')
-rw-r--r-- examples/train-text-from-scratch/train-text-from-scratch.cpp 6
1 files changed, 3 insertions, 3 deletions
diff --git a/examples/train-text-from-scratch/train-text-from-scratch.cpp b/examples/train-text-from-scratch/train-text-from-scratch.cpp
index 1ce6cef2..2a257e63 100644
--- a/examples/train-text-from-scratch/train-text-from-scratch.cpp
+++ b/examples/train-text-from-scratch/train-text-from-scratch.cpp
@@ -349,9 +349,9 @@ static struct ggml_tensor * llama_build_train_graphs(
// not capturing these, to silence warnings
const int rope_mode = 0;
- return ggml_rope_custom(ctx,
- t, KQ_pos, n_rot, rope_mode, n_ctx,
- rope_freq_base, rope_freq_scale);
+ return ggml_rope_custom(
+ ctx, t, KQ_pos, n_rot, rope_mode, n_ctx, 0, rope_freq_base, rope_freq_scale, 0.0f, 1.0f, 0.0f, 0.0f
+ );
};
set_name(tokens_input, "tokens_input");