aboutsummaryrefslogtreecommitdiff
path: root/scripts/generate-qs8-igemm.sh
diff options
context:
space:
mode:
author Frank Barchard <fbarchard@google.com> 2020-10-13 13:38:54 -0700
committer XNNPACK Team <xnnpack-github-robot@google.com> 2020-10-13 13:39:27 -0700
commit 146e999aa302a0f4fce5b0bbda0692d403ad84ef (patch)
tree 52131166137778b7dbe6e4cc6b06b91a6dc1b822 /scripts/generate-qs8-igemm.sh
parent 1e8590e3c7d39a9cf7a6ab3757cad801c000d839 (diff)
download XNNPACK-146e999aa302a0f4fce5b0bbda0692d403ad84ef.tar.gz
Replace QS8 4x8 with 2x8 neon microkernel.
Improves performance for aarch32. PiperOrigin-RevId: 336945809
Diffstat (limited to 'scripts/generate-qs8-igemm.sh')
-rwxr-xr-x scripts/generate-qs8-igemm.sh 2
1 files changed, 1 insertions, 1 deletions
diff --git a/scripts/generate-qs8-igemm.sh b/scripts/generate-qs8-igemm.sh
index bef4520c9..215976a61 100755
--- a/scripts/generate-qs8-igemm.sh
+++ b/scripts/generate-qs8-igemm.sh
@@ -16,7 +16,7 @@ tools/xngen src/qs8-igemm/MRx4c8-wasmsimd.c.in -D MR=3 -D VARIANT=LD128 -o src/q
################################### ARM NEON ##################################
tools/xngen src/qs8-igemm/neon-mlal-lane.c.in -D MR=1 -D NR=8 -o src/qs8-igemm/gen/1x8-minmax-neon-mlal-lane.c
-tools/xngen src/qs8-igemm/neon-mlal-lane.c.in -D MR=4 -D NR=8 -o src/qs8-igemm/gen/4x8-minmax-neon-mlal-lane.c
+tools/xngen src/qs8-igemm/neon-mlal-lane.c.in -D MR=2 -D NR=8 -o src/qs8-igemm/gen/2x8-minmax-neon-mlal-lane.c
tools/xngen src/qs8-igemm/neon-mlal-lane.c.in -D MR=1 -D NR=16 -o src/qs8-igemm/gen/1x16-minmax-neon-mlal-lane.c
tools/xngen src/qs8-igemm/neon-mlal-lane.c.in -D MR=2 -D NR=16 -o src/qs8-igemm/gen/2x16-minmax-neon-mlal-lane.c