diff options
author | Iwan Kawrakow <iwan.kawrakow@gmail.com> | 2024-07-22 12:28:18 +0200 |
---|---|---|
committer | Iwan Kawrakow <iwan.kawrakow@gmail.com> | 2024-07-24 08:04:47 +0200 |
commit | abb740c9a4b65dd6b2facc4780a1e9f2f515bd86 (patch) | |
tree | 5ca4927d37eef3d0265e378cca8240752d7f9a55 | |
parent | 0117e386b3ee8de4d05e0c94448e573eda61f359 (diff) |
Fix "make it work for row sizes that are multiple of 4 on NEON"
-rw-r--r-- | iqk_mul_mat.cpp | 2 |
1 file changed, 1 insertion, 1 deletion
diff --git a/iqk_mul_mat.cpp b/iqk_mul_mat.cpp
index 45d7816b..c83d2d84 100644
--- a/iqk_mul_mat.cpp
+++ b/iqk_mul_mat.cpp
@@ -4231,7 +4231,7 @@ template <int nrc> struct QF16 final : public QF16Base {
         for (int iy = 0; iy < nrc_y; ++iy) y[iy] = (const __fp16 *)(cx + iy*bx);
     }
     IQK_ALWAYS_INLINE Data load1(int iy, int i) const { return load(y[iy] + k_step*i); }
-    IQK_ALWAYS_INLINE Data load_tail(int iy, int i) const { return load4(y[iy] + k_step*i); }
+    IQK_ALWAYS_INLINE Data load_tail(int iy, int i) const { return load4(y[iy] + 4*i); }
     const __fp16 * y[nrc_y];
 };