// Copyright 2019 Google LLC // // This source code is licensed under the BSD-style license found in the // LICENSE file in the root directory of this source tree. #include #include #include #include #include "xnnpack.h" #include "xnnpack/config.h" #include "argmax-pooling-operator-tester.h" static uint32_t FindMaxSinglePassPoolingSize(const xnn_argmaxpool_config* ukernel) { uint32_t first_pass_tile_size = 0; while (ukernel->remainder_pass_tile_size == 0) { first_pass_tile_size = std::max(first_pass_tile_size, ukernel->first_pass_tile_size); ukernel++; } return first_pass_tile_size; } static xnn_argmaxpool_config FindMultiPassMicroKernel(const xnn_argmaxpool_config* ukernel) { while (ukernel->remainder_pass_tile_size == 0) { ukernel++; } return *ukernel; } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_small_1xM_pool) { const struct xnn_argmaxpool_config* argmaxpool_config = xnn_init_f32_argmaxpool_config(); ASSERT_NE(argmaxpool_config, nullptr); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = 2; pool_size <= FindMaxSinglePassPoolingSize(argmaxpool_config); pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(2) .input_width(pool_size + 2) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_small_1xM_pool_with_padding) { const struct xnn_argmaxpool_config* argmaxpool_config = xnn_init_f32_argmaxpool_config(); ASSERT_NE(argmaxpool_config, nullptr); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = 3; pool_size <= FindMaxSinglePassPoolingSize(argmaxpool_config); pool_size++) { for (size_t padding_left = 0; padding_left <= 1; padding_left++) { for (size_t padding_right = 0; padding_right <= 1; padding_right++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(2) .input_width(pool_size + 2) .padding_left(padding_left) .padding_right(padding_right) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .TestF32(); } } } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_small_1xM_pool_with_tf_same_padding) { const struct xnn_argmaxpool_config* argmaxpool_config = xnn_init_f32_argmaxpool_config(); ASSERT_NE(argmaxpool_config, nullptr); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = 3; pool_size <= FindMaxSinglePassPoolingSize(argmaxpool_config); pool_size++) { for (size_t input_width = pool_size + 1; input_width <= pool_size; input_width++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(2) .input_width(input_width) .padding_tf_same(true) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .TestF32(); } } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_small_Mx1_pool) { const struct xnn_argmaxpool_config* argmaxpool_config = xnn_init_f32_argmaxpool_config(); ASSERT_NE(argmaxpool_config, nullptr); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = 2; pool_size <= FindMaxSinglePassPoolingSize(argmaxpool_config); pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(pool_size + 1) .input_width(3) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_small_Mx1_pool_with_padding) { const struct xnn_argmaxpool_config* argmaxpool_config = xnn_init_f32_argmaxpool_config(); ASSERT_NE(argmaxpool_config, nullptr); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = 2; pool_size <= FindMaxSinglePassPoolingSize(argmaxpool_config); pool_size++) { for (size_t padding_top = 0; padding_top <= 1; padding_top++) { for (size_t padding_bottom = 0; padding_bottom <= 1; padding_bottom++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(pool_size + 1) .input_width(3) .padding_top(padding_top) .padding_bottom(padding_bottom) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .TestF32(); } } } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_small_Mx1_pool_with_tf_same_padding) { const struct xnn_argmaxpool_config* argmaxpool_config = xnn_init_f32_argmaxpool_config(); ASSERT_NE(argmaxpool_config, nullptr); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = 2; pool_size <= FindMaxSinglePassPoolingSize(argmaxpool_config); pool_size++) { for (size_t input_height = pool_size + 1; input_height <= pool_size * 2; input_height++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(input_height) .input_width(3) .padding_tf_same(true) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .TestF32(); } } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_small_pool_with_input_stride) { const struct xnn_argmaxpool_config* argmaxpool_config = xnn_init_f32_argmaxpool_config(); ASSERT_NE(argmaxpool_config, nullptr); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = 2; pool_size <= FindMaxSinglePassPoolingSize(argmaxpool_config); pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(pool_size + 1) .input_width(3) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .input_pixel_stride(5 * channels) .TestF32(); ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(2) .input_width(pool_size + 2) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .input_pixel_stride(5 * channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_small_pool_with_output_stride) { const struct xnn_argmaxpool_config* argmaxpool_config = xnn_init_f32_argmaxpool_config(); ASSERT_NE(argmaxpool_config, nullptr); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = 2; pool_size <= FindMaxSinglePassPoolingSize(argmaxpool_config); pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(pool_size + 1) .input_width(3) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .output_pixel_stride(5 * channels) .TestF32(); ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(2) .input_width(pool_size + 2) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .output_pixel_stride(5 * channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_large_1xM_pool) { const struct xnn_argmaxpool_config* argmaxpool_config = xnn_init_f32_argmaxpool_config(); ASSERT_NE(argmaxpool_config, nullptr); const auto multipass = FindMultiPassMicroKernel(argmaxpool_config); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = multipass.first_pass_tile_size + 1; pool_size <= multipass.first_pass_tile_size + multipass.remainder_pass_tile_size; pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(2) .input_width(pool_size + 2) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_large_1xM_pool_with_padding) { const struct xnn_argmaxpool_config* argmaxpool_config = xnn_init_f32_argmaxpool_config(); ASSERT_NE(argmaxpool_config, nullptr); const auto multipass = FindMultiPassMicroKernel(argmaxpool_config); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = multipass.first_pass_tile_size + 1; pool_size <= multipass.first_pass_tile_size + multipass.remainder_pass_tile_size; pool_size++) { for (size_t padding_left = 0; padding_left <= 1; padding_left++) { for (size_t padding_right = 0; padding_right <= 1; padding_right++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(2) .input_width(pool_size + 2) .padding_left(padding_left) .padding_right(padding_right) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .TestF32(); } } } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_large_1xM_pool_with_tf_same_padding) { const struct xnn_argmaxpool_config* argmaxpool_config = xnn_init_f32_argmaxpool_config(); ASSERT_NE(argmaxpool_config, nullptr); const auto multipass = FindMultiPassMicroKernel(argmaxpool_config); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = multipass.first_pass_tile_size + 1; pool_size <= multipass.first_pass_tile_size + multipass.remainder_pass_tile_size; pool_size++) { for (size_t input_width = pool_size + 1; input_width <= pool_size * 2; input_width++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(2) .input_width(input_width) .padding_tf_same(true) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .TestF32(); } } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_large_Mx1_pool) { const struct xnn_argmaxpool_config* argmaxpool_config = xnn_init_f32_argmaxpool_config(); ASSERT_NE(argmaxpool_config, nullptr); const auto multipass = FindMultiPassMicroKernel(argmaxpool_config); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = multipass.first_pass_tile_size + 1; pool_size <= multipass.first_pass_tile_size + multipass.remainder_pass_tile_size; pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(pool_size + 1) .input_width(3) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_large_Mx1_pool_with_padding) { const struct xnn_argmaxpool_config* argmaxpool_config = xnn_init_f32_argmaxpool_config(); ASSERT_NE(argmaxpool_config, nullptr); const auto multipass = FindMultiPassMicroKernel(argmaxpool_config); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = multipass.first_pass_tile_size + 1; pool_size <= multipass.first_pass_tile_size + multipass.remainder_pass_tile_size; pool_size++) { for (size_t padding_top = 0; padding_top <= 1; padding_top++) { for (size_t padding_bottom = 0; padding_bottom <= 1; padding_bottom++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(pool_size + 1) .input_width(3) .padding_top(padding_top) .padding_bottom(padding_bottom) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .TestF32(); } } } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_large_Mx1_pool_with_tf_same_padding) { const struct xnn_argmaxpool_config* argmaxpool_config = xnn_init_f32_argmaxpool_config(); ASSERT_NE(argmaxpool_config, nullptr); const auto multipass = FindMultiPassMicroKernel(argmaxpool_config); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = multipass.first_pass_tile_size + 1; pool_size <= multipass.first_pass_tile_size + multipass.remainder_pass_tile_size; pool_size++) { for (size_t input_height = pool_size + 2; input_height <= pool_size * 2; input_height++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(input_height) .input_width(3) .padding_tf_same(true) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .TestF32(); } } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_large_pool_with_input_stride) { const struct xnn_argmaxpool_config* argmaxpool_config = xnn_init_f32_argmaxpool_config(); ASSERT_NE(argmaxpool_config, nullptr); const auto multipass = FindMultiPassMicroKernel(argmaxpool_config); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = multipass.first_pass_tile_size + 1; pool_size <= multipass.first_pass_tile_size + multipass.remainder_pass_tile_size; pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(pool_size + 1) .input_width(3) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .input_pixel_stride(5 * channels) .TestF32(); ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(2) .input_width(pool_size + 2) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .input_pixel_stride(5 * channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_large_pool_with_output_stride) { const struct xnn_argmaxpool_config* argmaxpool_config = xnn_init_f32_argmaxpool_config(); ASSERT_NE(argmaxpool_config, nullptr); const auto multipass = FindMultiPassMicroKernel(argmaxpool_config); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = multipass.first_pass_tile_size + 1; pool_size <= multipass.first_pass_tile_size + multipass.remainder_pass_tile_size; pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(pool_size + 1) .input_width(3) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .output_pixel_stride(5 * channels) .TestF32(); ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(2) .input_width(pool_size + 2) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .output_pixel_stride(5 * channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, small_batch_small_pool) { const struct xnn_argmaxpool_config* argmaxpool_config = xnn_init_f32_argmaxpool_config(); ASSERT_NE(argmaxpool_config, nullptr); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = 2; pool_size <= FindMaxSinglePassPoolingSize(argmaxpool_config); pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(pool_size + 1) .input_width(3) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .TestF32(); ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(2) .input_width(pool_size + 2) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, small_batch_small_pool_with_input_stride) { const struct xnn_argmaxpool_config* argmaxpool_config = xnn_init_f32_argmaxpool_config(); ASSERT_NE(argmaxpool_config, nullptr); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = 2; pool_size <= FindMaxSinglePassPoolingSize(argmaxpool_config); pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(pool_size + 1) .input_width(3) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .input_pixel_stride(5 * channels) .TestF32(); ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(2) .input_width(pool_size + 2) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .input_pixel_stride(5 * channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, small_batch_small_pool_with_output_stride) { const struct xnn_argmaxpool_config* argmaxpool_config = xnn_init_f32_argmaxpool_config(); ASSERT_NE(argmaxpool_config, nullptr); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = 2; pool_size <= FindMaxSinglePassPoolingSize(argmaxpool_config); pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(pool_size + 1) .input_width(3) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .output_pixel_stride(5 * channels) .TestF32(); ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(2) .input_width(pool_size + 2) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .output_pixel_stride(5 * channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, small_batch_large_pool) { const struct xnn_argmaxpool_config* argmaxpool_config = xnn_init_f32_argmaxpool_config(); ASSERT_NE(argmaxpool_config, nullptr); const auto multipass = FindMultiPassMicroKernel(argmaxpool_config); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = multipass.first_pass_tile_size + 1; pool_size <= multipass.first_pass_tile_size + multipass.remainder_pass_tile_size; pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(pool_size + 1) .input_width(3) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .TestF32(); ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(2) .input_width(pool_size + 2) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, small_batch_large_pool_with_input_stride) { const struct xnn_argmaxpool_config* argmaxpool_config = xnn_init_f32_argmaxpool_config(); ASSERT_NE(argmaxpool_config, nullptr); const auto multipass = FindMultiPassMicroKernel(argmaxpool_config); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = multipass.first_pass_tile_size + 1; pool_size <= multipass.first_pass_tile_size + multipass.remainder_pass_tile_size; pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(pool_size + 1) .input_width(3) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .input_pixel_stride(5 * channels) .TestF32(); ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(2) .input_width(pool_size + 2) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .input_pixel_stride(5 * channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, small_batch_large_pool_with_output_stride) { const struct xnn_argmaxpool_config* argmaxpool_config = xnn_init_f32_argmaxpool_config(); ASSERT_NE(argmaxpool_config, nullptr); const auto multipass = FindMultiPassMicroKernel(argmaxpool_config); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = multipass.first_pass_tile_size + 1; pool_size <= multipass.first_pass_tile_size + multipass.remainder_pass_tile_size; pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(pool_size + 1) .input_width(3) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .output_pixel_stride(5 * channels) .TestF32(); ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(2) .input_width(pool_size + 2) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .output_pixel_stride(5 * channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, small_batch_large_pool_multithreaded) { const struct xnn_argmaxpool_config* argmaxpool_config = xnn_init_f32_argmaxpool_config(); ASSERT_NE(argmaxpool_config, nullptr); const auto multipass = FindMultiPassMicroKernel(argmaxpool_config); ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(multipass.first_pass_tile_size + 2) .input_width(3) .pooling_height(multipass.first_pass_tile_size + 1) .pooling_width(1) .channels(15) .multithreaded(true) .TestF32(); } TEST(ARGMAX_POOLING_NHWC_F32, setup_increasing_batch) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); ArgmaxPoolingOperatorTester() .batch_size(3) .next_batch_size(5) .input_height(8) .input_width(8) .pooling_height(5) .pooling_width(3) .channels(24) .TestSetupF32(); } TEST(ARGMAX_POOLING_NHWC_F32, setup_decreasing_batch) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); ArgmaxPoolingOperatorTester() .batch_size(5) .next_batch_size(3) .input_height(8) .input_width(8) .pooling_height(5) .pooling_width(3) .channels(24) .TestSetupF32(); } TEST(ARGMAX_POOLING_NHWC_F32, setup_changing_height) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(8) .input_width(8) .next_input_height(9) .pooling_height(5) .pooling_width(3) .channels(24) .TestSetupF32(); ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(8) .input_width(8) .next_input_height(7) .pooling_height(5) .pooling_width(3) .channels(24) .TestSetupF32(); } TEST(ARGMAX_POOLING_NHWC_F32, setup_changing_width) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(8) .input_width(8) .next_input_width(9) .pooling_height(5) .pooling_width(3) .channels(24) .TestSetupF32(); ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(8) .input_width(8) .next_input_width(7) .pooling_height(5) .pooling_width(3) .channels(24) .TestSetupF32(); } TEST(ARGMAX_POOLING_NHWC_F32, setup_swap_height_and_width) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(9) .input_width(8) .next_input_height(8) .next_input_width(9) .pooling_height(5) .pooling_width(3) .channels(24) .TestSetupF32(); }