aboutsummaryrefslogtreecommitdiff
path: root/scripts/generate-f32-dwconv2d-chw.sh
diff options
context:
space:
mode:
author Marat Dukhan <maratek@google.com> 2020-10-24 12:02:51 -0700
committer XNNPACK Team <xnnpack-github-robot@google.com> 2020-10-24 12:03:24 -0700
commit 91249d2c849ddde599c8270716bfe05f40d14603 (patch)
tree 8601a0037ac1488df8db130f591828dc8fae02fd /scripts/generate-f32-dwconv2d-chw.sh
parent c581e480af4cffadcd62a1264cf26e9d66a960b1 (diff)
download XNNPACK-91249d2c849ddde599c8270716bfe05f40d14603.tar.gz
Auto-generate scalar versions of DWCONV2D CHW 3x3p1 micro-kernels
PiperOrigin-RevId: 338847524
Diffstat (limited to 'scripts/generate-f32-dwconv2d-chw.sh')
-rwxr-xr-x scripts/generate-f32-dwconv2d-chw.sh 13
1 files changed, 13 insertions, 0 deletions
diff --git a/scripts/generate-f32-dwconv2d-chw.sh b/scripts/generate-f32-dwconv2d-chw.sh
index 06a758248..a6623ece1 100755
--- a/scripts/generate-f32-dwconv2d-chw.sh
+++ b/scripts/generate-f32-dwconv2d-chw.sh
@@ -54,5 +54,18 @@ tools/xngen src/f32-dwconv2d-chw/3x3p1-ssse3.c.in -D ROW_TILE=1 -D ACCUMULATORS=
tools/xngen src/f32-dwconv2d-chw/3x3p1-ssse3.c.in -D ROW_TILE=1 -D ACCUMULATORS=4 -o src/f32-dwconv2d-chw/gen/3x3p1-minmax-ssse3-1x4-acc4.c
tools/xngen src/f32-dwconv2d-chw/3x3p1-ssse3.c.in -D ROW_TILE=2 -D ACCUMULATORS=2 -o src/f32-dwconv2d-chw/gen/3x3p1-minmax-ssse3-2x4-acc2.c
+################################### Scalar ####################################
+tools/xngen src/f32-dwconv2d-chw/3x3p1-scalar.c.in -D ROW_TILE=1 -D ACCUMULATORS=1 -o src/f32-dwconv2d-chw/gen/3x3p1-minmax-scalar-1x1.c
+tools/xngen src/f32-dwconv2d-chw/3x3p1-scalar.c.in -D ROW_TILE=2 -D ACCUMULATORS=1 -o src/f32-dwconv2d-chw/gen/3x3p1-minmax-scalar-2x1.c
+tools/xngen src/f32-dwconv2d-chw/3x3p1-scalar.c.in -D ROW_TILE=3 -D ACCUMULATORS=1 -o src/f32-dwconv2d-chw/gen/3x3p1-minmax-scalar-3x1.c
+tools/xngen src/f32-dwconv2d-chw/3x3p1-scalar.c.in -D ROW_TILE=4 -D ACCUMULATORS=1 -o src/f32-dwconv2d-chw/gen/3x3p1-minmax-scalar-4x1.c
+tools/xngen src/f32-dwconv2d-chw/3x3p1-scalar.c.in -D ROW_TILE=5 -D ACCUMULATORS=1 -o src/f32-dwconv2d-chw/gen/3x3p1-minmax-scalar-5x1.c
+tools/xngen src/f32-dwconv2d-chw/3x3p1-scalar.c.in -D ROW_TILE=6 -D ACCUMULATORS=1 -o src/f32-dwconv2d-chw/gen/3x3p1-minmax-scalar-6x1.c
+
+tools/xngen src/f32-dwconv2d-chw/3x3p1-scalar.c.in -D ROW_TILE=1 -D ACCUMULATORS=2 -o src/f32-dwconv2d-chw/gen/3x3p1-minmax-scalar-1x1-acc2.c
+tools/xngen src/f32-dwconv2d-chw/3x3p1-scalar.c.in -D ROW_TILE=1 -D ACCUMULATORS=3 -o src/f32-dwconv2d-chw/gen/3x3p1-minmax-scalar-1x1-acc3.c
+tools/xngen src/f32-dwconv2d-chw/3x3p1-scalar.c.in -D ROW_TILE=1 -D ACCUMULATORS=4 -o src/f32-dwconv2d-chw/gen/3x3p1-minmax-scalar-1x1-acc4.c
+tools/xngen src/f32-dwconv2d-chw/3x3p1-scalar.c.in -D ROW_TILE=2 -D ACCUMULATORS=2 -o src/f32-dwconv2d-chw/gen/3x3p1-minmax-scalar-2x1-acc2.c
+
################################## Unit tests #################################
tools/generate-dwconv2d-chw-test.py --spec test/f32-dwconv2d-chw.yaml --output test/f32-dwconv2d-chw.cc