// Copyright 2019 Google LLC // // This source code is licensed under the BSD-style license found in the // LICENSE file in the root directory of this source tree. #include #include "argmax-pooling-operator-tester.h" #include static uint32_t FindMaxSinglePassPoolingSize(const argmaxpool_parameters* ukernel) { uint32_t mr = 0; while (ukernel->qr == 0) { mr = std::max(mr, ukernel->mr); ukernel++; } return mr; } static argmaxpool_parameters FindMultiPassMicroKernel(const argmaxpool_parameters* ukernel) { while (ukernel->qr == 0) { ukernel++; } return *ukernel; } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_small_1xM_pool) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = 2; pool_size <= FindMaxSinglePassPoolingSize(xnn_params.f32.argmaxpool); pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(2) .input_width(pool_size + 2) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_small_1xM_pool_with_padding) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = 3; pool_size <= FindMaxSinglePassPoolingSize(xnn_params.f32.argmaxpool); pool_size++) { for (size_t padding_left = 0; padding_left <= 1; padding_left++) { for (size_t padding_right = 0; padding_right <= 1; padding_right++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(2) .input_width(pool_size + 2) .padding_left(padding_left) .padding_right(padding_right) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .TestF32(); } } } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_small_1xM_pool_with_tf_same_padding) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = 3; pool_size <= FindMaxSinglePassPoolingSize(xnn_params.f32.argmaxpool); pool_size++) { for (size_t input_width = pool_size + 1; input_width <= pool_size; input_width++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(2) .input_width(input_width) .padding_tf_same(true) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .TestF32(); } } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_small_Mx1_pool) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = 2; pool_size <= FindMaxSinglePassPoolingSize(xnn_params.f32.argmaxpool); pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(pool_size + 1) .input_width(3) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_small_Mx1_pool_with_padding) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = 2; pool_size <= FindMaxSinglePassPoolingSize(xnn_params.f32.argmaxpool); pool_size++) { for (size_t padding_top = 0; padding_top <= 1; padding_top++) { for (size_t padding_bottom = 0; padding_bottom <= 1; padding_bottom++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(pool_size + 1) .input_width(3) .padding_top(padding_top) .padding_bottom(padding_bottom) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .TestF32(); } } } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_small_Mx1_pool_with_tf_same_padding) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = 2; pool_size <= FindMaxSinglePassPoolingSize(xnn_params.f32.argmaxpool); pool_size++) { for (size_t input_height = pool_size + 1; input_height <= pool_size * 2; input_height++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(input_height) .input_width(3) .padding_tf_same(true) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .TestF32(); } } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_small_pool_with_input_stride) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = 2; pool_size <= FindMaxSinglePassPoolingSize(xnn_params.f32.argmaxpool); pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(pool_size + 1) .input_width(3) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .input_pixel_stride(5 * channels) .TestF32(); ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(2) .input_width(pool_size + 2) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .input_pixel_stride(5 * channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_small_pool_with_output_stride) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = 2; pool_size <= FindMaxSinglePassPoolingSize(xnn_params.f32.argmaxpool); pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(pool_size + 1) .input_width(3) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .output_pixel_stride(5 * channels) .TestF32(); ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(2) .input_width(pool_size + 2) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .output_pixel_stride(5 * channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_large_1xM_pool) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); const auto multipass = FindMultiPassMicroKernel(xnn_params.f32.argmaxpool); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = multipass.mr + 1; pool_size <= multipass.mr + multipass.qr; pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(2) .input_width(pool_size + 2) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_large_1xM_pool_with_padding) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); const auto multipass = FindMultiPassMicroKernel(xnn_params.f32.argmaxpool); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = multipass.mr + 1; pool_size <= multipass.mr + multipass.qr; pool_size++) { for (size_t padding_left = 0; padding_left <= 1; padding_left++) { for (size_t padding_right = 0; padding_right <= 1; padding_right++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(2) .input_width(pool_size + 2) .padding_left(padding_left) .padding_right(padding_right) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .TestF32(); } } } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_large_1xM_pool_with_tf_same_padding) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); const auto multipass = FindMultiPassMicroKernel(xnn_params.f32.argmaxpool); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = multipass.mr + 1; pool_size <= multipass.mr + multipass.qr; pool_size++) { for (size_t input_width = pool_size + 1; input_width <= pool_size * 2; input_width++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(2) .input_width(input_width) .padding_tf_same(true) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .TestF32(); } } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_large_Mx1_pool) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); const auto multipass = FindMultiPassMicroKernel(xnn_params.f32.argmaxpool); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = multipass.mr + 1; pool_size <= multipass.mr + multipass.qr; pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(pool_size + 1) .input_width(3) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_large_Mx1_pool_with_padding) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); const auto multipass = FindMultiPassMicroKernel(xnn_params.f32.argmaxpool); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = multipass.mr + 1; pool_size <= multipass.mr + multipass.qr; pool_size++) { for (size_t padding_top = 0; padding_top <= 1; padding_top++) { for (size_t padding_bottom = 0; padding_bottom <= 1; padding_bottom++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(pool_size + 1) .input_width(3) .padding_top(padding_top) .padding_bottom(padding_bottom) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .TestF32(); } } } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_large_Mx1_pool_with_tf_same_padding) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); const auto multipass = FindMultiPassMicroKernel(xnn_params.f32.argmaxpool); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = multipass.mr + 1; pool_size <= multipass.mr + multipass.qr; pool_size++) { for (size_t input_height = pool_size + 2; input_height <= pool_size * 2; input_height++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(input_height) .input_width(3) .padding_tf_same(true) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .TestF32(); } } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_large_pool_with_input_stride) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); const auto multipass = FindMultiPassMicroKernel(xnn_params.f32.argmaxpool); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = multipass.mr + 1; pool_size <= multipass.mr + multipass.qr; pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(pool_size + 1) .input_width(3) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .input_pixel_stride(5 * channels) .TestF32(); ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(2) .input_width(pool_size + 2) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .input_pixel_stride(5 * channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, unit_batch_large_pool_with_output_stride) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); const auto multipass = FindMultiPassMicroKernel(xnn_params.f32.argmaxpool); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = multipass.mr + 1; pool_size <= multipass.mr + multipass.qr; pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(pool_size + 1) .input_width(3) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .output_pixel_stride(5 * channels) .TestF32(); ArgmaxPoolingOperatorTester() .batch_size(1) .input_height(2) .input_width(pool_size + 2) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .output_pixel_stride(5 * channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, small_batch_small_pool) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = 2; pool_size <= FindMaxSinglePassPoolingSize(xnn_params.f32.argmaxpool); pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(pool_size + 1) .input_width(3) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .TestF32(); ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(2) .input_width(pool_size + 2) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, small_batch_small_pool_with_input_stride) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = 2; pool_size <= FindMaxSinglePassPoolingSize(xnn_params.f32.argmaxpool); pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(pool_size + 1) .input_width(3) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .input_pixel_stride(5 * channels) .TestF32(); ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(2) .input_width(pool_size + 2) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .input_pixel_stride(5 * channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, small_batch_small_pool_with_output_stride) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = 2; pool_size <= FindMaxSinglePassPoolingSize(xnn_params.f32.argmaxpool); pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(pool_size + 1) .input_width(3) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .output_pixel_stride(5 * channels) .TestF32(); ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(2) .input_width(pool_size + 2) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .output_pixel_stride(5 * channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, small_batch_large_pool) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); const auto multipass = FindMultiPassMicroKernel(xnn_params.f32.argmaxpool); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = multipass.mr + 1; pool_size <= multipass.mr + multipass.qr; pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(pool_size + 1) .input_width(3) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .TestF32(); ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(2) .input_width(pool_size + 2) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, small_batch_large_pool_with_input_stride) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); const auto multipass = FindMultiPassMicroKernel(xnn_params.f32.argmaxpool); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = multipass.mr + 1; pool_size <= multipass.mr + multipass.qr; pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(pool_size + 1) .input_width(3) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .input_pixel_stride(5 * channels) .TestF32(); ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(2) .input_width(pool_size + 2) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .input_pixel_stride(5 * channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, small_batch_large_pool_with_output_stride) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); const auto multipass = FindMultiPassMicroKernel(xnn_params.f32.argmaxpool); for (size_t channels = 1; channels <= 100; channels += 15) { for (size_t pool_size = multipass.mr + 1; pool_size <= multipass.mr + multipass.qr; pool_size++) { ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(pool_size + 1) .input_width(3) .pooling_height(pool_size) .pooling_width(1) .channels(channels) .output_pixel_stride(5 * channels) .TestF32(); ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(2) .input_width(pool_size + 2) .pooling_height(1) .pooling_width(pool_size) .channels(channels) .output_pixel_stride(5 * channels) .TestF32(); } } } TEST(ARGMAX_POOLING_NHWC_F32, setup_increasing_batch) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); ArgmaxPoolingOperatorTester() .batch_size(3) .next_batch_size(5) .input_height(8) .input_width(8) .pooling_height(5) .pooling_width(3) .channels(24) .TestSetupF32(); } TEST(ARGMAX_POOLING_NHWC_F32, setup_decreasing_batch) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); ArgmaxPoolingOperatorTester() .batch_size(5) .next_batch_size(3) .input_height(8) .input_width(8) .pooling_height(5) .pooling_width(3) .channels(24) .TestSetupF32(); } TEST(ARGMAX_POOLING_NHWC_F32, setup_changing_height) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(8) .input_width(8) .next_input_height(9) .pooling_height(5) .pooling_width(3) .channels(24) .TestSetupF32(); ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(8) .input_width(8) .next_input_height(7) .pooling_height(5) .pooling_width(3) .channels(24) .TestSetupF32(); } TEST(ARGMAX_POOLING_NHWC_F32, setup_changing_width) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(8) .input_width(8) .next_input_width(9) .pooling_height(5) .pooling_width(3) .channels(24) .TestSetupF32(); ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(8) .input_width(8) .next_input_width(7) .pooling_height(5) .pooling_width(3) .channels(24) .TestSetupF32(); } TEST(ARGMAX_POOLING_NHWC_F32, setup_swap_height_and_width) { ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */)); ArgmaxPoolingOperatorTester() .batch_size(3) .input_height(9) .input_width(8) .next_input_height(8) .next_input_width(9) .pooling_height(5) .pooling_width(3) .channels(24) .TestSetupF32(); }