diff options
author | ds5t5 <145942675+ds5t5@users.noreply.github.com> | 2023-10-04 06:23:39 -0700 |
---|---|---|
committer | GitHub <noreply@github.com> | 2023-10-04 16:23:39 +0300 |
commit | f8c90cdbaa729e64493164c1aba7ea80da7b716f (patch) | |
tree | d5d15cafc28bd2d982705c92bad32a8ea9b90e4b /ggml.c | |
parent | f93af02488179b9c52d0d391b08ae4c4d891b8d3 (diff) |
llm : add Refact model (#3329)
* add refact model
* resolve comments
* rebase to the latest
* solve alibi cpu error
---------
Co-authored-by: Georgi Gerganov <ggerganov@gmail.com>
Diffstat (limited to 'ggml.c')
-rw-r--r-- | ggml.c | 2 |
1 files changed, 0 insertions, 2 deletions
@@ -13082,7 +13082,6 @@ static void ggml_compute_forward_alibi_f32(
         return;
     }
 
-    const int n_past = ((int32_t *) dst->op_params)[0];
     const int n_head = ((int32_t *) dst->op_params)[1];
     float max_bias;
     memcpy(&max_bias, (int32_t *) dst->op_params + 2, sizeof(float));
@@ -13103,7 +13102,6 @@ static void ggml_compute_forward_alibi_f32(
     //const int nb3 = src0->nb[3];
 
     GGML_ASSERT(nb0 == sizeof(float));
-    GGML_ASSERT(ne1 + n_past == ne0);
     GGML_ASSERT(n_head == ne2);
 
     // add alibi to src0 (KQ_scaled)