summary | refs | log | tree | commit | diff
path: root/iqk_mul_mat.cpp
diff options
context:
space:
mode:
author: Iwan Kawrakow <iwan.kawrakow@gmail.com>, 2024-07-22 12:28:18 +0200
committer: Iwan Kawrakow <iwan.kawrakow@gmail.com>, 2024-07-24 08:04:47 +0200
commit: abb740c9a4b65dd6b2facc4780a1e9f2f515bd86 (patch)
tree: 5ca4927d37eef3d0265e378cca8240752d7f9a55 /iqk_mul_mat.cpp
parent: 0117e386b3ee8de4d05e0c94448e573eda61f359 (diff)
Fix "make it work for row sizes that are multiple of 4 on NEON"
Diffstat (limited to 'iqk_mul_mat.cpp')
-rw-r--r-- iqk_mul_mat.cpp 2
1 files changed, 1 insertions, 1 deletions
diff --git a/iqk_mul_mat.cpp b/iqk_mul_mat.cpp
index 45d7816b..c83d2d84 100644
--- a/iqk_mul_mat.cpp
+++ b/iqk_mul_mat.cpp
@@ -4231,7 +4231,7 @@ template <int nrc> struct QF16 final : public QF16Base {
for (int iy = 0; iy < nrc_y; ++iy) y[iy] = (const __fp16 *)(cx + iy*bx);
}
IQK_ALWAYS_INLINE Data load1(int iy, int i) const { return load(y[iy] + k_step*i); }
- IQK_ALWAYS_INLINE Data load_tail(int iy, int i) const { return load4(y[iy] + k_step*i); }
+ IQK_ALWAYS_INLINE Data load_tail(int iy, int i) const { return load4(y[iy] + 4*i); }
const __fp16 * y[nrc_y];
};