diff options
author | Kawrakow <iwankawrakow@gmail.com> | 2025-07-03 15:36:52 +0200 |
---|---|---|
committer | GitHub <noreply@github.com> | 2025-07-03 15:36:52 +0200 |
commit | 9534461c01e132672821e53ce6e5e560dc58e829 (patch) | |
tree | 18d4487dece1ae25d0a44e02cc44260f94a91697 /src/llama.cpp | |
parent | db8dee50516d1437f94017de196f87dcf54be12d (diff) |
Vulkan: fused rms norm (#577)
Co-authored-by: Iwan Kawrakow <iwan.kawrakow@gmail.com>
Diffstat (limited to 'src/llama.cpp')
-rw-r--r-- | src/llama.cpp | 7 |
1 file changed, 1 insertion, 6 deletions
diff --git a/src/llama.cpp b/src/llama.cpp
index c2769e32..794dcca6 100644
--- a/src/llama.cpp
+++ b/src/llama.cpp
@@ -9597,12 +9597,7 @@ static struct ggml_tensor * llm_build_norm(
         const llm_build_cb & cb,
         int il,
         float scale_eps = 1) {
-#ifdef GGML_USE_VULKAN
-    constexpr bool use_fused_rms_norm = false;
-#else
-    constexpr bool use_fused_rms_norm = true;
-#endif
-    if (use_fused_rms_norm && type == LLM_NORM_RMS && mw) {
+    if (type == LLM_NORM_RMS && mw) {
         cur = ggml_fused_rms_norm(ctx, cur, mw, scale_eps * hparams.f_norm_rms_eps);
         if (mb) {
             cb(cur, "fused_norm", il);