@@ -51,11 +51,10 @@ static ggml_kleidiai_kernels gemm_gemv_kernels[] = {
51
51
/* .run_kernel = */ kai_run_matmul_clamp_f32_qsi8d32p1x4_qsi4c32p4vlx4_1x4vl_sme2_sdot,
52
52
},
53
53
/* .lhs_info = */ {
54
- /* .get_offset = */ kai_get_lhs_offset_lhs_quant_pack_qsi8d32p_f32 ,
55
- /* .get_packed_offset = */ kai_get_lhs_packed_offset_lhs_quant_pack_qsi8d32p_f32 ,
54
+ /* .get_offset = */ kai_get_lhs_offset_lhs_quant_pack_qsi8d32p_f32_neon ,
55
+ /* .get_packed_offset = */ kai_get_lhs_packed_offset_lhs_quant_pack_qsi8d32p_f32_neon ,
56
56
/* .packed_size = */ kai_get_lhs_packed_size_lhs_quant_pack_qsi8d32p_f32_neon,
57
57
/* .pack_func = */ kai_run_lhs_quant_pack_qsi8d32p_f32_neon,
58
- /* .require_aligned_m_idx = */ true ,
59
58
},
60
59
/* .rhs_info = */ {
61
60
/* .packed_size = */ kai_get_rhs_packed_size_rhs_pack_nxk_qsi4c32ps1s0scalef16_qsu4c32s16s0_neon,
@@ -100,7 +99,6 @@ static ggml_kleidiai_kernels gemm_gemv_kernels[] = {
100
99
/* .get_packed_offset = */ kai_get_lhs_packed_offset_lhs_quant_pack_qsi8d32p_f32,
101
100
/* .packed_size = */ kai_get_lhs_packed_size_lhs_quant_pack_qsi8d32p_f32,
102
101
/* .pack_func = */ kai_run_lhs_quant_pack_qsi8d32p_f32,
103
- /* .require_aligned_m_idx = */ false ,
104
102
},
105
103
/* .rhs_info = */ {
106
104
/* .packed_size = */ kai_get_rhs_packed_size_rhs_pack_nxk_qsi4c32pscalef16_qsu4c32s16s0,
@@ -144,7 +142,6 @@ static ggml_kleidiai_kernels gemm_gemv_kernels[] = {
144
142
/* .get_packed_offset = */ kai_get_lhs_packed_offset_lhs_quant_pack_qsi8d32p_f32,
145
143
/* .packed_size = */ kai_get_lhs_packed_size_lhs_quant_pack_qsi8d32p_f32,
146
144
/* .pack_func = */ kai_run_lhs_quant_pack_qsi8d32p_f32,
147
- /* .require_aligned_m_idx = */ false ,
148
145
},
149
146
/* .rhs_info = */ {
150
147
/* .packed_size = */ kai_get_rhs_packed_size_rhs_pack_nxk_qsi4c32pscalef16_qsu4c32s16s0,
@@ -189,7 +186,6 @@ static ggml_kleidiai_kernels gemm_gemv_kernels[] = {
189
186
/* .get_packed_offset = */ kai_get_lhs_packed_offset_lhs_quant_pack_qsi8d32p_f32,
190
187
/* .packed_size = */ kai_get_lhs_packed_size_lhs_quant_pack_qsi8d32p_f32,
191
188
/* .pack_func = */ kai_run_lhs_quant_pack_qsi8d32p_f32,
192
- /* .require_aligned_m_idx = */ false ,
193
189
},
194
190
/* .rhs_info = */ {
195
191
/* .packed_size = */ kai_get_rhs_packed_size_rhs_pack_nxk_qsi4c32pscalef16_qsu4c32s16s0,
@@ -233,7 +229,6 @@ static ggml_kleidiai_kernels gemm_gemv_kernels[] = {
233
229
/* .get_packed_offset = */ kai_get_lhs_packed_offset_lhs_quant_pack_qsi8d32p_f32,
234
230
/* .packed_size = */ kai_get_lhs_packed_size_lhs_quant_pack_qsi8d32p_f32,
235
231
/* .pack_func = */ kai_run_lhs_quant_pack_qsi8d32p_f32,
236
- /* .require_aligned_m_idx = */ false ,
237
232
},
238
233
/* .rhs_info = */ {
239
234
/* .packed_size = */ kai_get_rhs_packed_size_rhs_pack_nxk_qsi4c32pscalef16_qsu4c32s16s0,
0 commit comments