summary | refs | log | tree | commit | diff
path: root/ggml.c
diff options
context:
space:
mode:
author: Georgi Gerganov <ggerganov@gmail.com> 2023-04-22 16:31:56 +0300
committer: Georgi Gerganov <ggerganov@gmail.com> 2023-04-22 16:32:07 +0300
commit: 0e018fe008eacebdbcfa2d61b6c988c245c961cd (patch)
tree: 5a2051e9896f120527484732b9a9a14f0107f547 /ggml.c
parent: 857308d1e8fb6afe33edb481d48560eee8fe7d7c (diff)
ggml : fix Q4_3 cuBLAS
Diffstat (limited to 'ggml.c')
-rw-r--r-- ggml.c 3
1 files changed, 3 insertions, 0 deletions
diff --git a/ggml.c b/ggml.c
index d9a95af8..281b2028 100644
--- a/ggml.c
+++ b/ggml.c
@@ -7992,6 +7992,9 @@ static void ggml_compute_forward_mul_mat_q_f32(
else if (type == GGML_TYPE_Q4_2) {
dequantize_row_q_cuda = dequantize_row_q4_2_cuda;
}
+ else if (type == GGML_TYPE_Q4_3) {
+ dequantize_row_q_cuda = dequantize_row_q4_3_cuda;
+ }
else {
GGML_ASSERT(false);
}