summary | refs | log | tree | commit | diff
path: root/src/llama.cpp
diff options
context:
space:
mode:
author: Kawrakow <iwankawrakow@gmail.com> 2025-07-03 15:36:52 +0200
committer: GitHub <noreply@github.com> 2025-07-03 15:36:52 +0200
commit: 9534461c01e132672821e53ce6e5e560dc58e829 (patch)
tree: 18d4487dece1ae25d0a44e02cc44260f94a91697 /src/llama.cpp
parent: db8dee50516d1437f94017de196f87dcf54be12d (diff)
Vulkan: fused rms norm (#577)
Co-authored-by: Iwan Kawrakow <iwan.kawrakow@gmail.com>
Diffstat (limited to 'src/llama.cpp')
-rw-r--r-- src/llama.cpp 7
1 file changed, 1 insertion, 6 deletions
diff --git a/src/llama.cpp b/src/llama.cpp
index c2769e32..794dcca6 100644
--- a/src/llama.cpp
+++ b/src/llama.cpp
@@ -9597,12 +9597,7 @@ static struct ggml_tensor * llm_build_norm(
const llm_build_cb & cb,
int il, float scale_eps = 1) {
-#ifdef GGML_USE_VULKAN
- constexpr bool use_fused_rms_norm = false;
-#else
- constexpr bool use_fused_rms_norm = true;
-#endif
- if (use_fused_rms_norm && type == LLM_NORM_RMS && mw) {
+ if (type == LLM_NORM_RMS && mw) {
cur = ggml_fused_rms_norm(ctx, cur, mw, scale_eps * hparams.f_norm_rms_eps);
if (mb) {
cb(cur, "fused_norm", il);