diff options
Diffstat (limited to 'bench')
-rw-r--r-- | bench/f32-dwconv2d-chw.cc | 28 |
1 files changed, 28 insertions, 0 deletions
diff --git a/bench/f32-dwconv2d-chw.cc b/bench/f32-dwconv2d-chw.cc index 6a30b25bc..d4b03c84e 100644 --- a/bench/f32-dwconv2d-chw.cc +++ b/bench/f32-dwconv2d-chw.cc @@ -223,9 +223,30 @@ static void DWConv2DBenchmark(benchmark::State& state, DWConv2DBenchmark(state, xnn_f32_dwconv2d_chw_ukernel_3x3p1__neonfma_2x4_acc2, 3, 3, 1, 1); } + static void dwconv2d_chw_3x3s2p1__neonfma_1x4(benchmark::State& state, const char* net) { + DWConv2DBenchmark(state, xnn_f32_dwconv2d_chw_ukernel_3x3s2p1__neonfma_1x4, 3, 3, 1, 2); + } + static void dwconv2d_chw_3x3s2p1__neonfma_2x4(benchmark::State& state, const char* net) { + DWConv2DBenchmark(state, xnn_f32_dwconv2d_chw_ukernel_3x3s2p1__neonfma_2x4, 3, 3, 1, 2); + } + static void dwconv2d_chw_3x3s2p1__neonfma_3x4(benchmark::State& state, const char* net) { + DWConv2DBenchmark(state, xnn_f32_dwconv2d_chw_ukernel_3x3s2p1__neonfma_3x4, 3, 3, 1, 2); + } + static void dwconv2d_chw_3x3s2p1__neonfma_4x4(benchmark::State& state, const char* net) { + DWConv2DBenchmark(state, xnn_f32_dwconv2d_chw_ukernel_3x3s2p1__neonfma_4x4, 3, 3, 1, 2); + } + static void dwconv2d_chw_3x3s2p1__neonfma_1x4_acc2(benchmark::State& state, const char* net) { + DWConv2DBenchmark(state, xnn_f32_dwconv2d_chw_ukernel_3x3s2p1__neonfma_1x4_acc2, 3, 3, 1, 2); + } static void dwconv2d_chw_3x3s2p1__neonfma_1x4_acc3(benchmark::State& state, const char* net) { DWConv2DBenchmark(state, xnn_f32_dwconv2d_chw_ukernel_3x3s2p1__neonfma_1x4_acc3, 3, 3, 1, 2); } + static void dwconv2d_chw_3x3s2p1__neonfma_1x4_acc4(benchmark::State& state, const char* net) { + DWConv2DBenchmark(state, xnn_f32_dwconv2d_chw_ukernel_3x3s2p1__neonfma_1x4_acc4, 3, 3, 1, 2); + } + static void dwconv2d_chw_3x3s2p1__neonfma_2x4_acc2(benchmark::State& state, const char* net) { + DWConv2DBenchmark(state, xnn_f32_dwconv2d_chw_ukernel_3x3s2p1__neonfma_2x4_acc2, 3, 3, 1, 2); + } static void dwconv2d_chw_5x5p2__neonfma_3x4(benchmark::State& state, const char* net) { DWConv2DBenchmark(state, xnn_f32_dwconv2d_chw_ukernel_5x5p2__neonfma_3x4, 5, 5, 2, 1); @@ -246,7 +267,14 @@ static void DWConv2DBenchmark(benchmark::State& state, BENCHMARK_DWCONV(dwconv2d_chw_3x3p1__neonfma_1x4_acc4) BENCHMARK_DWCONV(dwconv2d_chw_3x3p1__neonfma_2x4_acc2) + BENCHMARK_DWCONV(dwconv2d_chw_3x3s2p1__neonfma_1x4) + BENCHMARK_DWCONV(dwconv2d_chw_3x3s2p1__neonfma_2x4) + BENCHMARK_DWCONV(dwconv2d_chw_3x3s2p1__neonfma_3x4) + BENCHMARK_DWCONV(dwconv2d_chw_3x3s2p1__neonfma_4x4) + BENCHMARK_DWCONV(dwconv2d_chw_3x3s2p1__neonfma_1x4_acc2) BENCHMARK_DWCONV(dwconv2d_chw_3x3s2p1__neonfma_1x4_acc3) + BENCHMARK_DWCONV(dwconv2d_chw_3x3s2p1__neonfma_1x4_acc4) + BENCHMARK_DWCONV(dwconv2d_chw_3x3s2p1__neonfma_2x4_acc2) BENCHMARK_DWCONV(dwconv2d_chw_5x5p2__neonfma_3x4) |