Vulkan: add GGML_OP_FUSED_MUL_UNARY (#580)

Co-authored-by: Iwan Kawrakow <iwan.kawrakow@gmail.com>
author: Kawrakow <iwankawrakow@gmail.com> 2025-07-03 18:03:23 +0200
committer: GitHub <noreply@github.com> 2025-07-03 18:03:23 +0200
commit: 8a0c38f496f60bb0f627521823de604ce10fdc16 (patch)
tree: 646fa2f21c7436dcae8214d382dda1a2e4b5f994 /src/llama.cpp
parent: 9534461c01e132672821e53ce6e5e560dc58e829 (diff)
1 file changed, 1 insertion, 7 deletions
diff --git a/src/llama.cpp b/src/llama.cpp
index 794dcca6..11a7060c 100644
--- a/src/llama.cpp
+++ b/src/llama.cpp
@@ -9688,13 +9688,7 @@ static struct ggml_tensor * llm_build_ffn(
         cur = tmp;
     }
 
-#ifdef GGML_USE_VULKAN
-    constexpr bool use_fused_mul_unary = false;
-#else
-    constexpr bool use_fused_mul_unary = true;
-#endif
-
-    if (use_fused_mul_unary && type_gate == LLM_FFN_PAR &&
+    if (type_gate == LLM_FFN_PAR &&
        (type_op == LLM_FFN_SILU || type_op == LLM_FFN_RELU || (type_op == LLM_FFN_GELU && !act_scales))) {
         cur = ggml_fused_mul_unary(ctx, cur, tmp, type_op == LLM_FFN_SILU ? GGML_UNARY_OP_SILU :
                                                   type_op == LLM_FFN_RELU ? GGML_UNARY_OP_RELU : GGML_UNARY_OP_GELU);
author	Kawrakow <iwankawrakow@gmail.com>	2025-07-03 18:03:23 +0200
committer	GitHub <noreply@github.com>	2025-07-03 18:03:23 +0200
commit	8a0c38f496f60bb0f627521823de604ce10fdc16 (patch)
tree	646fa2f21c7436dcae8214d382dda1a2e4b5f994 /src/llama.cpp
parent	9534461c01e132672821e53ce6e5e560dc58e829 (diff)