summary | refs | log | tree | commit | diff
path: root/src
diff options
context:
space:
mode:
Diffstat (limited to 'src')
-rw-r--r-- src/llama.cpp 12
1 files changed, 2 insertions, 10 deletions
diff --git a/src/llama.cpp b/src/llama.cpp
index 2cca5099..d52590a6 100644
--- a/src/llama.cpp
+++ b/src/llama.cpp
@@ -8111,16 +8111,8 @@ static struct ggml_tensor * llm_build_ffn(
} break;
case LLM_FFN_SWIGLU:
{
- // Project to 4h. If using swiglu double the output width, see https://arxiv.org/pdf/2002.05202.pdf
- int64_t split_point = cur->ne[0] / 2;
- struct ggml_tensor * x0 = ggml_cont(ctx, ggml_view_2d(ctx, cur, split_point, cur->ne[1], cur->nb[1], 0));
- struct ggml_tensor * x1 = ggml_cont(ctx, ggml_view_2d(ctx, cur, split_point, cur->ne[1], cur->nb[1], split_point * ggml_element_size(cur)));
-
- x0 = ggml_silu(ctx, x0);
- cb(cur, "ffn_silu", il);
-
- cur = ggml_mul(ctx, x0, x1);
- cb(cur, "ffn_mul", il);
+ cur = ggml_swiglu(ctx, cur);
+ cb(cur, "ffn_swiglu", il);
} break;
}