diff --git a/CHANGELOG.md b/CHANGELOG.md index 10a4d450d30db4f6375cfde95267dc9f05bfcee4..e430695dd7f3e6fe691e8f0e97ca58521ccdce6f 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -24,6 +24,10 @@ KleidiAI follows the [Semantic Versioning](https://semver.org/) specification fo - Matrix multiplication (MxN) Micro-kernels of QSI8D32 LHS and QAI4C32 RHS with F16 output, optimized for FEAT_DotProd. - Optimized version of kai_rhs_pack_nxk_qsi4c32p_qsu4c32s1s0 kernel for block depth of 8 bytes (`kai_rhs_pack_nxk_qsi4c32pnrx8_qsu4c32s1s0_neon`) - Added Convolution example using SME Indirect Matmul Kernels +- Fixes: + - Fix issue where kai_get_m_step() returns an incorrect value for the following kernels: + - matmul_clamp_f32_f32_f32p16vlx1b_1x16vl_sme2_mla + - matmul_clamp_f32_f32_f32p2vlx1b_1x16vl_sme2_mla ## v1.9.0 diff --git a/kai/ukernels/matmul/matmul_clamp_f32_f32_f32p/kai_matmul_clamp_f32_f32_f32p16vlx1b_1x16vl_sme2_mla.c b/kai/ukernels/matmul/matmul_clamp_f32_f32_f32p/kai_matmul_clamp_f32_f32_f32p16vlx1b_1x16vl_sme2_mla.c index 627ab6884a57899716fe5a09e2189b9b10938175..df4be133d862a1414827f646ed3b9b40c9f07a32 100644 --- a/kai/ukernels/matmul/matmul_clamp_f32_f32_f32p/kai_matmul_clamp_f32_f32_f32p16vlx1b_1x16vl_sme2_mla.c +++ b/kai/ukernels/matmul/matmul_clamp_f32_f32_f32p/kai_matmul_clamp_f32_f32_f32p16vlx1b_1x16vl_sme2_mla.c @@ -18,13 +18,14 @@ #include "kai/kai_common.h" +static const size_t kai_m_step = 1; static const size_t kai_mr = 1; static const size_t kai_nr = 16; static const size_t kai_kr = 1; static const size_t kai_sr = 1; size_t kai_get_m_step_matmul_clamp_f32_f32_f32p16vlx1b_1x16vl_sme2_mla(void) { - return kai_mr * kai_get_sme_vector_length_u32(); + return kai_m_step; } size_t kai_get_n_step_matmul_clamp_f32_f32_f32p16vlx1b_1x16vl_sme2_mla(void) { diff --git a/kai/ukernels/matmul/matmul_clamp_f32_f32_f32p/kai_matmul_clamp_f32_f32_f32p2vlx1b_1x16vl_sme2_mla.c b/kai/ukernels/matmul/matmul_clamp_f32_f32_f32p/kai_matmul_clamp_f32_f32_f32p2vlx1b_1x16vl_sme2_mla.c index 
cf0608401658f78884c6bdb67d31ec7a57bd86cb..2cadd759d26d1c9e89febd948c69537c405b0293 100644 --- a/kai/ukernels/matmul/matmul_clamp_f32_f32_f32p/kai_matmul_clamp_f32_f32_f32p2vlx1b_1x16vl_sme2_mla.c +++ b/kai/ukernels/matmul/matmul_clamp_f32_f32_f32p/kai_matmul_clamp_f32_f32_f32p2vlx1b_1x16vl_sme2_mla.c @@ -25,7 +25,7 @@ static const size_t kai_kr = 1; static const size_t kai_sr = 1; size_t kai_get_m_step_matmul_clamp_f32_f32_f32p2vlx1b_1x16vl_sme2_mla(void) { - return kai_m_step * kai_get_sme_vector_length_u32(); + return kai_m_step; } size_t kai_get_n_step_matmul_clamp_f32_f32_f32p2vlx1b_1x16vl_sme2_mla(void) {