diff options
author | Kawrakow <iwankawrakow@gmail.com> | 2025-04-01 13:48:20 +0200 |
---|---|---|
committer | GitHub <noreply@github.com> | 2025-04-01 13:48:20 +0200 |
commit | 21a5b8bd2820c097c1aa03d85cb83658609c7a12 (patch) | |
tree | 5d59f731510aea90f18012f4e1f4efb12e446c24 | |
parent | 190e7866db1d87a5da8b2d2b8d6619092b2ec72c (diff) |
Fix ARM_NEON build failure due to q8_2 (#303)
Co-authored-by: Iwan Kawrakow <iwan.kawrakow@gmail.com>
-rw-r--r-- | ggml/src/ggml-alloc.c | 4 | ||||
-rw-r--r-- | ggml/src/iqk/iqk_quantize.cpp | 4 |
2 files changed, 4 insertions, 4 deletions
```diff
diff --git a/ggml/src/ggml-alloc.c b/ggml/src/ggml-alloc.c
index d811dee6..3f2d2023 100644
--- a/ggml/src/ggml-alloc.c
+++ b/ggml/src/ggml-alloc.c
@@ -174,8 +174,8 @@ static size_t ggml_dyn_tallocr_alloc(struct ggml_dyn_tallocr * alloc, size_t siz
             // this should never happen
             fprintf(stderr, "%s: not enough space in the buffer to allocate %zu bytes, largest block available %zu bytes\n",
                     __func__, size, max_avail);
-            fprintf(stderr, "%s: tensor was %s with %zu elements and %zu bytes\n", __func__, tensor->name,
-                    ggml_nelements(tensor), ggml_nbytes(tensor));
+            fprintf(stderr, "%s: tensor was %s with %g elements and %zu bytes\n", __func__, tensor->name,
+                    1.*ggml_nelements(tensor), ggml_nbytes(tensor));
             GGML_ABORT("not enough space in the buffer");
         }
     }
diff --git a/ggml/src/iqk/iqk_quantize.cpp b/ggml/src/iqk/iqk_quantize.cpp
index e2cea7df..7873d3fe 100644
--- a/ggml/src/iqk/iqk_quantize.cpp
+++ b/ggml/src/iqk/iqk_quantize.cpp
@@ -860,9 +860,9 @@ void quantize_row_q8_1_x4_T(const float * x, Block * y, int64_t k) {
             }
         } else {
             if (i < nb4) {
-                y4[i4].s[ir] = vaddvq_s32(accv);
+                y4[i4].d[ir+4] = GGML_FP32_TO_BF16(d * vaddvq_s32(accv)).bits;
             } else {
-                y[i].s = vaddvq_s32(accv);
+                y[i].s = GGML_FP32_TO_BF16(d * vaddvq_s32(accv)).bits;
             }
         }
     }
```