summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorAbhilash Majumder <30946547+abhilash1910@users.noreply.github.com>2024-04-08 13:56:01 +0530
committerGitHub <noreply@github.com>2024-04-08 16:26:01 +0800
commit87fb5b4234d4b9c56ac94cf7aa229c8fd7defdb0 (patch)
tree2d2c684dd680f225494889cdabae7dfabda7e923
parentd752327c3338d5b9634121d651c0105f2c933f9b (diff)
remove row=1 cond (#6532)
-rw-r--r--ggml-sycl.cpp3
1 files changed, 1 insertions, 2 deletions
diff --git a/ggml-sycl.cpp b/ggml-sycl.cpp
index b8388149..55a1eedb 100644
--- a/ggml-sycl.cpp
+++ b/ggml-sycl.cpp
@@ -15776,7 +15776,7 @@ static void ggml_sycl_mul_mat(const ggml_tensor * src0, const ggml_tensor * src1
#ifdef GGML_SYCL_FORCE_DMMV
const bool use_mul_mat_vec_q = false;
#else
- bool use_mul_mat_vec_q = min_compute_capability >= VER_4VEC && ggml_is_quantized(src0->type) && ggml_nrows(src1) == 1;
+ bool use_mul_mat_vec_q = min_compute_capability >= VER_4VEC && ggml_is_quantized(src0->type);
use_mul_mat_vec_q = use_mul_mat_vec_q ||
(src0->type == GGML_TYPE_IQ2_XXS) || (src0->type == GGML_TYPE_IQ2_XS) || (src0->type == GGML_TYPE_IQ2_S) ||
(src0->type == GGML_TYPE_IQ3_XXS) || (src0->type == GGML_TYPE_IQ3_S) ||
@@ -15787,7 +15787,6 @@ static void ggml_sycl_mul_mat(const ggml_tensor * src0, const ggml_tensor * src1
#endif // GGML_SYCL_FORCE_DMMV
if (use_mul_mat_vec_q) {
- // NOTE: this kernel does not support ggml_nrows(src1) > 1
// GGML_SYCL_DEBUG("ggml_sycl_mul_mat ggml_sycl_op_mul_mat_vec_q path\n");
ggml_sycl_op_mul_mat(src0, src1, dst, ggml_sycl_op_mul_mat_vec_q, true);
} else {