From 4fcfcd05d1b2b01b2f2224406d96a6ea9831ddcb Mon Sep 17 00:00:00 2001 From: Iwan Kawrakow Date: Sun, 16 Jun 2024 17:27:18 +0300 Subject: bitnet: scale is per row, not per tensor --- ggml-quants.c | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) (limited to 'ggml-quants.c') diff --git a/ggml-quants.c b/ggml-quants.c index 552d6198..fc3155ef 100644 --- a/ggml-quants.c +++ b/ggml-quants.c @@ -3731,7 +3731,7 @@ void quantize_row_q8_K64_reference(const float * restrict x, block_q8_K64 * rest for (int j = 0; j < 64; ++j) { float ax = fabsf(x[j]); if (ax > amax) { - amax = ax; max = x[j]; + amax = ax; max = x[j]; } } if (!amax) { -- cgit v1.2.3