blob: e910559b101c7768bd6725ab969ba73689467a93 [file] [log] [blame] [edit]
// Copyright 2019 Google LLC
//
// This source code is licensed under the BSD-style license found in the
// LICENSE file in the root directory of this source tree.
#include <gtest/gtest.h>
#include <xnnpack/params.h>
#include "prelu-operator-tester.h"
TEST(PRELU_NC_F16, unit_batch) {
ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */));
for (size_t channels = 1; channels < xnn_params.f16.prelu.channel_tile * 10; channels += std::max<size_t>(1, xnn_params.f16.prelu.channel_tile - 1)) {
PReLUOperatorTester()
.batch_size(1)
.channels(channels)
.iterations(3)
.TestF16();
}
}
TEST(PRELU_NC_F16, small_batch) {
ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */));
for (size_t channels = 1; channels < xnn_params.f16.prelu.channel_tile * 10; channels += std::max<size_t>(1, xnn_params.f16.prelu.channel_tile - 1)) {
PReLUOperatorTester()
.batch_size(xnn_params.f16.prelu.row_tile)
.channels(channels)
.iterations(3)
.TestF16();
}
}
TEST(PRELU_NC_F16, small_batch_with_x_stride) {
ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */));
for (size_t channels = 1; channels < xnn_params.f16.prelu.channel_tile * 10; channels += std::max<size_t>(1, xnn_params.f16.prelu.channel_tile - 1)) {
PReLUOperatorTester()
.batch_size(xnn_params.f16.prelu.row_tile)
.channels(channels)
.x_stride(337)
.iterations(3)
.TestF16();
}
}
TEST(PRELU_NC_F16, small_batch_with_y_stride) {
ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */));
for (size_t channels = 1; channels < xnn_params.f16.prelu.channel_tile * 10; channels += std::max<size_t>(1, xnn_params.f16.prelu.channel_tile - 1)) {
PReLUOperatorTester()
.batch_size(xnn_params.f16.prelu.row_tile)
.channels(channels)
.y_stride(347)
.iterations(3)
.TestF16();
}
}
TEST(PRELU_NC_F16, small_batch_with_x_stride_and_y_stride) {
ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */));
for (size_t channels = 1; channels < xnn_params.f16.prelu.channel_tile * 10; channels += std::max<size_t>(1, xnn_params.f16.prelu.channel_tile - 1)) {
PReLUOperatorTester()
.batch_size(xnn_params.f16.prelu.row_tile)
.channels(channels)
.x_stride(337)
.y_stride(347)
.iterations(3)
.TestF16();
}
}
TEST(PRELU_NC_F16, large_batch) {
ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */));
for (size_t channels = 1; channels < xnn_params.f16.prelu.channel_tile * 10; channels += std::max<size_t>(1, xnn_params.f16.prelu.channel_tile - 1)) {
PReLUOperatorTester()
.batch_size(3 * xnn_params.f16.prelu.row_tile + 1)
.channels(channels)
.iterations(1)
.TestF16();
}
}
TEST(PRELU_NC_F16, large_batch_with_x_stride) {
ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */));
for (size_t channels = 1; channels < xnn_params.f16.prelu.channel_tile * 10; channels += std::max<size_t>(1, xnn_params.f16.prelu.channel_tile - 1)) {
PReLUOperatorTester()
.batch_size(3 * xnn_params.f16.prelu.row_tile + 1)
.channels(channels)
.x_stride(337)
.iterations(1)
.TestF16();
}
}
TEST(PRELU_NC_F16, large_batch_with_y_stride) {
ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */));
for (size_t channels = 1; channels < xnn_params.f16.prelu.channel_tile * 10; channels += std::max<size_t>(1, xnn_params.f16.prelu.channel_tile - 1)) {
PReLUOperatorTester()
.batch_size(3 * xnn_params.f16.prelu.row_tile + 1)
.channels(channels)
.y_stride(347)
.iterations(1)
.TestF16();
}
}
TEST(PRELU_NC_F16, large_batch_with_x_stride_and_y_stride) {
ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */));
for (size_t channels = 1; channels < xnn_params.f16.prelu.channel_tile * 10; channels += std::max<size_t>(1, xnn_params.f16.prelu.channel_tile - 1)) {
PReLUOperatorTester()
.batch_size(3 * xnn_params.f16.prelu.row_tile + 1)
.channels(channels)
.x_stride(337)
.y_stride(347)
.iterations(1)
.TestF16();
}
}
TEST(PRELU_NC_F16, fp32_weights) {
ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */));
for (size_t channels = 1; channels < xnn_params.f16.prelu.channel_tile * 10; channels += std::max<size_t>(1, xnn_params.f16.prelu.channel_tile - 1)) {
PReLUOperatorTester()
.batch_size(3 * xnn_params.f16.prelu.row_tile + 1)
.channels(channels)
.x_stride(337)
.y_stride(347)
.weights_type(PReLUOperatorTester::WeightsType::FP32)
.iterations(1)
.TestF16();
}
}
TEST(PRELU_NC_F16, weights_cache_unit_batch) {
ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */));
for (size_t channels = 1; channels < xnn_params.f16.prelu.channel_tile * 10; channels += std::max<size_t>(1, xnn_params.f16.prelu.channel_tile - 1)) {
PReLUOperatorTester()
.batch_size(1)
.channels(channels)
.use_weights_cache(true)
.iterations(3)
.TestF16();
}
}
TEST(PRELU_NC_F16, weights_cache_fp32_weights) {
ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */));
for (size_t channels = 1; channels < xnn_params.f16.prelu.channel_tile * 10; channels += std::max<size_t>(1, xnn_params.f16.prelu.channel_tile - 1)) {
PReLUOperatorTester()
.batch_size(3 * xnn_params.f16.prelu.row_tile + 1)
.channels(channels)
.x_stride(345)
.y_stride(347)
.weights_type(PReLUOperatorTester::WeightsType::FP32)
.use_weights_cache(true)
.iterations(1)
.TestF16();
}
}
TEST(PRELU_NC_F32, unit_batch) {
ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */));
for (size_t channels = 1; channels < xnn_params.f32.prelu.channel_tile * 10; channels += std::max<size_t>(1, xnn_params.f32.prelu.channel_tile - 1)) {
PReLUOperatorTester()
.batch_size(1)
.channels(channels)
.iterations(3)
.TestF32();
}
}
TEST(PRELU_NC_F32, small_batch) {
ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */));
for (size_t channels = 1; channels < xnn_params.f32.prelu.channel_tile * 10; channels += std::max<size_t>(1, xnn_params.f32.prelu.channel_tile - 1)) {
PReLUOperatorTester()
.batch_size(xnn_params.f32.prelu.row_tile)
.channels(channels)
.iterations(3)
.TestF32();
}
}
TEST(PRELU_NC_F32, small_batch_with_x_stride) {
ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */));
for (size_t channels = 1; channels < xnn_params.f32.prelu.channel_tile * 10; channels += std::max<size_t>(1, xnn_params.f32.prelu.channel_tile - 1)) {
PReLUOperatorTester()
.batch_size(xnn_params.f32.prelu.row_tile)
.channels(channels)
.x_stride(337)
.iterations(3)
.TestF32();
}
}
TEST(PRELU_NC_F32, small_batch_with_y_stride) {
ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */));
for (size_t channels = 1; channels < xnn_params.f32.prelu.channel_tile * 10; channels += std::max<size_t>(1, xnn_params.f32.prelu.channel_tile - 1)) {
PReLUOperatorTester()
.batch_size(xnn_params.f32.prelu.row_tile)
.channels(channels)
.y_stride(347)
.iterations(3)
.TestF32();
}
}
TEST(PRELU_NC_F32, small_batch_with_x_stride_and_y_stride) {
ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */));
for (size_t channels = 1; channels < xnn_params.f32.prelu.channel_tile * 10; channels += std::max<size_t>(1, xnn_params.f32.prelu.channel_tile - 1)) {
PReLUOperatorTester()
.batch_size(xnn_params.f32.prelu.row_tile)
.channels(channels)
.x_stride(337)
.y_stride(347)
.iterations(3)
.TestF32();
}
}
TEST(PRELU_NC_F32, large_batch) {
ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */));
for (size_t channels = 1; channels < xnn_params.f32.prelu.channel_tile * 10; channels += std::max<size_t>(1, xnn_params.f32.prelu.channel_tile - 1)) {
PReLUOperatorTester()
.batch_size(3 * xnn_params.f32.prelu.row_tile + 1)
.channels(channels)
.iterations(1)
.TestF32();
}
}
TEST(PRELU_NC_F32, large_batch_with_x_stride) {
ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */));
for (size_t channels = 1; channels < xnn_params.f32.prelu.channel_tile * 10; channels += std::max<size_t>(1, xnn_params.f32.prelu.channel_tile - 1)) {
PReLUOperatorTester()
.batch_size(3 * xnn_params.f32.prelu.row_tile + 1)
.channels(channels)
.x_stride(337)
.iterations(1)
.TestF32();
}
}
TEST(PRELU_NC_F32, large_batch_with_y_stride) {
ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */));
for (size_t channels = 1; channels < xnn_params.f32.prelu.channel_tile * 10; channels += std::max<size_t>(1, xnn_params.f32.prelu.channel_tile - 1)) {
PReLUOperatorTester()
.batch_size(3 * xnn_params.f32.prelu.row_tile + 1)
.channels(channels)
.y_stride(347)
.iterations(1)
.TestF32();
}
}
TEST(PRELU_NC_F32, large_batch_with_x_stride_and_y_stride) {
ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */));
for (size_t channels = 1; channels < xnn_params.f32.prelu.channel_tile * 10; channels += std::max<size_t>(1, xnn_params.f32.prelu.channel_tile - 1)) {
PReLUOperatorTester()
.batch_size(3 * xnn_params.f32.prelu.row_tile + 1)
.channels(channels)
.x_stride(337)
.y_stride(347)
.iterations(1)
.TestF32();
}
}
TEST(PRELU_NC_F32, weights_cache_unit_batch) {
ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */));
for (size_t channels = 1; channels < xnn_params.f32.prelu.channel_tile * 10; channels += std::max<size_t>(1, xnn_params.f32.prelu.channel_tile - 1)) {
PReLUOperatorTester()
.batch_size(1)
.channels(channels)
.use_weights_cache(true)
.iterations(3)
.TestF32();
}
}