about | summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author Frank Barchard <fbarchard@google.com> 2021-03-10 16:55:54 -0800
committer XNNPACK Team <xnnpack-github-robot@google.com> 2021-03-10 16:56:29 -0800
commit 46108547da415a7859ddb69a4afecc816703dfb9 (patch)
tree 177ba36aeb27800d628fe8f42ab6b7f9f1fd6777
parent 3522c0a6133873558e1509ad514fbb6826fd2039 (diff)
download XNNPACK-46108547da415a7859ddb69a4afecc816703dfb9.tar.gz
Disable QS8 1x16c4-aarch64-neondot-ld64 IGEMM microkernel
GEMM use intrinsics for 1x16

PiperOrigin-RevId: 362173993
-rw-r--r-- src/init.c 6
1 files changed, 3 insertions, 3 deletions
diff --git a/src/init.c b/src/init.c
index 9fe2e455a..bd7b130b6 100644
--- a/src/init.c
+++ b/src/init.c
@@ -809,7 +809,7 @@ static void init(void) {
#if XNN_ENABLE_ASSEMBLY
if (cpuinfo_has_arm_neon_dot()) {
xnn_params.qs8.gemm.minmax.gemm = xnn_init_hmp_gemm_ukernel((xnn_gemm_ukernel_function) xnn_qs8_gemm_minmax_ukernel_4x16c4__aarch64_neondot_ld64);
- xnn_params.qs8.gemm.minmax.gemm1 = xnn_init_hmp_gemm_ukernel((xnn_gemm_ukernel_function) xnn_qs8_gemm_minmax_ukernel_1x16c4__aarch64_neondot_ld64);
+ xnn_params.qs8.gemm.minmax.gemm1 = xnn_init_hmp_gemm_ukernel((xnn_gemm_ukernel_function) xnn_qs8_gemm_minmax_ukernel_1x16c4__neondot);
xnn_params.qs8.gemm.minmax.igemm = xnn_init_hmp_igemm_ukernel((xnn_igemm_ukernel_function) xnn_qs8_igemm_minmax_ukernel_4x16c4__aarch64_neondot_ld64);
xnn_params.qs8.gemm.minmax.igemm1 = xnn_init_hmp_igemm_ukernel((xnn_igemm_ukernel_function) xnn_qs8_igemm_minmax_ukernel_1x16c4__neondot);
xnn_params.qs8.gemm.mr = 4;
@@ -856,7 +856,7 @@ static void init(void) {
xnn_params.qs8.gemm.minmax.igemm = xnn_init_hmp_igemm_ukernel((xnn_igemm_ukernel_function) xnn_qs8_igemm_minmax_ukernel_4x16c4__aarch64_neondot_ld64);
break;
}
- xnn_params.qs8.gemm.minmax.gemm1 = xnn_init_hmp_gemm_ukernel((xnn_gemm_ukernel_function) xnn_qs8_gemm_minmax_ukernel_1x16c4__aarch64_neondot_ld64);
+ xnn_params.qs8.gemm.minmax.gemm1 = xnn_init_hmp_gemm_ukernel((xnn_gemm_ukernel_function) xnn_qs8_gemm_minmax_ukernel_1x16c4__neondot);
xnn_params.qs8.gemm.minmax.igemm1 = xnn_init_hmp_igemm_ukernel((xnn_igemm_ukernel_function) xnn_qs8_igemm_minmax_ukernel_1x16c4__neondot);
xnn_params.qs8.gemm.mr = 4;
xnn_params.qs8.gemm.nr = 16;
@@ -888,7 +888,7 @@ static void init(void) {
if (mr == 4 && nr == 16 && log2_kr == 2) {
xnn_params.qs8.gemm.minmax.gemm.function[i] = (xnn_gemm_ukernel_function) xnn_qs8_gemm_minmax_ukernel_4x16c4__aarch64_neondot_cortex_a55;
xnn_params.qs8.gemm.minmax.igemm.function[i] = (xnn_igemm_ukernel_function) xnn_qs8_igemm_minmax_ukernel_4x16c4__aarch64_neondot_cortex_a55;
- xnn_params.qs8.gemm.minmax.gemm1.function[i] = (xnn_gemm_ukernel_function) xnn_qs8_gemm_minmax_ukernel_1x16c4__aarch64_neondot_ld64;
+ xnn_params.qs8.gemm.minmax.gemm1.function[i] = (xnn_gemm_ukernel_function) xnn_qs8_gemm_minmax_ukernel_1x16c4__neondot;
xnn_params.qs8.gemm.minmax.igemm1.function[i] = (xnn_igemm_ukernel_function) xnn_qs8_igemm_minmax_ukernel_1x16c4__neondot;
}
break;