summary refs log tree commit diff
path: root/ggml-quants.c
diff options
context:
space:
mode:
author Georgi Gerganov <ggerganov@gmail.com> 2024-02-18 22:39:30 +0200
committer GitHub <noreply@github.com> 2024-02-18 22:39:30 +0200
commit b1de96824bdbeb91ea458abcb3e5478690ad0727 (patch)
tree c0ab39ccee911245158973dd6280f8959024381a /ggml-quants.c
parent 7ad554f90e735cf2a0f612ce44f9aa4fad6ae46a (diff)
ci : fix wikitext url + compile warnings (#5569)
ggml-ci
Diffstat (limited to 'ggml-quants.c')
-rw-r--r-- ggml-quants.c 6
1 files changed, 3 insertions, 3 deletions
diff --git a/ggml-quants.c b/ggml-quants.c
index 48f5294e..43a8f1de 100644
--- a/ggml-quants.c
+++ b/ggml-quants.c
@@ -1837,9 +1837,9 @@ static void quantize_row_q2_K_impl(const float * restrict x, block_q2_K * restri
float sigma2 = sumx2/QK_K;
for (int j = 0; j < QK_K/16; ++j) {
const float * restrict qw = quant_weights + QK_K * i + 16*j;
- for (int l = 0; l < 16; ++l) weight[l] = qw[l] * sqrtf(sigma2 + x[16*j + l]*x[16*j + l]);
- for (int l = 0; l < 16; ++l) sw[j] += weight[l];
- scales[j] = make_qkx3_quants(16, 3, x + 16*j, weight, L + 16*j, &mins[j], Laux, -0.9f, 0.05f, 36, false);
+ for (int l = 0; l < QK_K/16; ++l) weight[l] = qw[l] * sqrtf(sigma2 + x[16*j + l]*x[16*j + l]);
+ for (int l = 0; l < QK_K/16; ++l) sw[j] += weight[l];
+ scales[j] = make_qkx3_quants(QK_K/16, 3, x + 16*j, weight, L + 16*j, &mins[j], Laux, -0.9f, 0.05f, 36, false);
}
float dm = make_qp_quants(QK_K/16, 15, scales, Ls, sw);