diff options
author | Iwan Kawrakow <iwan.kawrakow@gmail.com> | 2024-06-10 17:56:55 +0200 |
---|---|---|
committer | Iwan Kawrakow <iwan.kawrakow@gmail.com> | 2024-06-22 12:02:50 +0300 |
commit | 3593891f390b376f7127efe3bd7eda9baffe6609 (patch) | |
tree | 7028f8a8e95c542b49421d21f39bfac51f66758f | |
parent | 9593e163db41f60b8d6598a443fec1740e97eb67 (diff) |
Fix nb4
-rw-r--r-- | ggml-quants.c | 5 |
1 file changed, 2 insertions, 3 deletions
```diff
diff --git a/ggml-quants.c b/ggml-quants.c
index 684fdf7d..d80fc2a6 100644
--- a/ggml-quants.c
+++ b/ggml-quants.c
@@ -870,13 +870,13 @@ void quantize_row_q8_0(const float * restrict x, void * restrict vy, int64_t k)
 
     block_q8_0 * restrict y = vy;
 
-#if defined(__ARM_NEON)
-    block_q8_0_x4 * y4 = (block_q8_0_x4 *)vy;
 #if GGML_USE_IQK_MULMAT
     const int nb4 = 4*(nb/4);
 #else
     const int nb4 = -1;
 #endif
+#if defined(__ARM_NEON)
+    block_q8_0_x4 * y4 = (block_q8_0_x4 *)vy;
     for (int i = 0; i < nb; i++) {
         int i4 = i/4, ir = i%4;
         float32x4_t srcv [8];
@@ -953,7 +953,6 @@ void quantize_row_q8_0(const float * restrict x, void * restrict vy, int64_t k)
     }
 #elif defined(__AVX2__) || defined(__AVX__)
     block_q8_0_x4 * y4 = (block_q8_0_x4 *)vy;
-    int nb4 = 4*(nb/4);
 #ifdef __AVX2__
     const bool pack = true;
 #else
```