summary | refs | log | tree | commit | diff
path: root/src/llama.cpp
diff options
context:
space:
mode:
author: Kawrakow <48489457+ikawrakow@users.noreply.github.com>, 2024-08-21 13:00:09 +0300
committer: GitHub <noreply@github.com>, 2024-08-21 13:00:09 +0300
commit: bd99ed7d0afd2b12c0f5ff5c17b58486396dfe7e (patch)
tree: 2b209a3a58ee6462fedafd538b0fd80f737977ed /src/llama.cpp
parent: d259a50ca6fd3a0821abe6a16b73c0b19c5b4651 (diff)
softcap: minor improvement (#24)
Co-authored-by: Iwan Kawrakow <iwan.kawrakow@gmail.com>
Diffstat (limited to 'src/llama.cpp')
-rw-r--r-- src/llama.cpp 3
1 files changed, 0 insertions, 3 deletions
diff --git a/src/llama.cpp b/src/llama.cpp
index 4aee41a4..831f98dc 100644
--- a/src/llama.cpp
+++ b/src/llama.cpp
@@ -8325,9 +8325,6 @@ static struct ggml_tensor * llm_build_kqv(
if (hparams.attn_soft_cap) {
kq = ggml_softcap(ctx, kq, 1.0f / hparams.f_attn_logit_softcapping, hparams.f_attn_logit_softcapping);
- //kq = ggml_scale(ctx, kq, 1.0f / hparams.f_attn_logit_softcapping);
- //kq = ggml_tanh(ctx, kq);
- //kq = ggml_scale(ctx, kq, hparams.f_attn_logit_softcapping);
}
kq = ggml_soft_max_ext(ctx, kq, kq_mask, kq_scale, hparams.f_max_alibi_bias);