From f8c90cdbaa729e64493164c1aba7ea80da7b716f Mon Sep 17 00:00:00 2001
From: ds5t5 <145942675+ds5t5@users.noreply.github.com>
Date: Wed, 4 Oct 2023 06:23:39 -0700
Subject: llm : add Refact model (#3329)

* add refact model

* resolve comments

* rebase to the latest

* solve alibi cpu error

---------

Co-authored-by: Georgi Gerganov
---
 ggml.c | 2 --
 1 file changed, 2 deletions(-)

(limited to 'ggml.c')

diff --git a/ggml.c b/ggml.c
index 4a94b0f3..f56d6ac7 100644
--- a/ggml.c
+++ b/ggml.c
@@ -13082,7 +13082,6 @@ static void ggml_compute_forward_alibi_f32(
         return;
     }
 
-    const int n_past = ((int32_t *) dst->op_params)[0];
     const int n_head = ((int32_t *) dst->op_params)[1];
     float max_bias;
     memcpy(&max_bias, (int32_t *) dst->op_params + 2, sizeof(float));
@@ -13103,7 +13102,6 @@ static void ggml_compute_forward_alibi_f32(
     //const int nb3 = src0->nb[3];
 
     GGML_ASSERT(nb0 == sizeof(float));
-    GGML_ASSERT(ne1 + n_past == ne0);
     GGML_ASSERT(n_head == ne2);
 
     // add alibi to src0 (KQ_scaled)
-- 
cgit v1.2.3