common/operations/Reduce.cpp - platform/packages/modules/NeuralNetworks - Git at Google

 /*
  * Copyright (C) 2018 The Android Open Source Project
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
  * You may obtain a copy of the License at
  *
  *      http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */

 #define LOG_TAG "Operations"

 #include <algorithm>
 #include <limits>
 #include <vector>

 #include "OperationResolver.h"
 #include "OperationsUtils.h"
 #include "Tracing.h"

 #ifdef NN_INCLUDE_CPU_IMPLEMENTATION
 #include <tensorflow/lite/kernels/internal/reference/reference_ops.h>
 #endif  // NN_INCLUDE_CPU_IMPLEMENTATION

 namespace android {
 namespace nn {
 namespace reduce {

 constexpr uint32_t kNumInputs = 3;
 constexpr uint32_t kInputTensor = 0;
 constexpr uint32_t kInputAxes = 1;
 constexpr uint32_t kInputKeepDims = 2;

 constexpr uint32_t kNumOutputs = 1;
 constexpr uint32_t kOutputTensor = 0;

 // Values from
 // https://en.wikipedia.org/wiki/Half-precision_floating-point_format#IEEE_754_half-precision_binary_floating-point_format:_binary16
 constexpr _Float16 kFloat16Max = 65504;
 constexpr _Float16 kFloat16Lowest = -kFloat16Max;

 #ifdef NN_INCLUDE_CPU_IMPLEMENTATION
 namespace {

 template <typename T>
 inline bool compute(IOperationExecutionContext* context, T init, T func(T, T)) {
     const Shape inputShape = context->getInputShape(kInputTensor);
     const Shape axesShape = context->getInputShape(kInputAxes);
     const Shape outputShape = context->getOutputShape(kOutputTensor);
     const uint32_t inputRank = getNumberOfDimensions(inputShape);
     const uint32_t numAxes = getNumberOfElements(axesShape);
     std::vector<int> tempIndex(inputShape.dimensions.size());
     std::vector<int> tempAxes(numAxes);
     return tflite::reference_ops::ReduceGeneric<T>(
             context->getInputBuffer<T>(kInputTensor),
             reinterpret_cast<const int32_t*>(inputShape.dimensions.data()), inputRank,
             context->getOutputBuffer<T>(kOutputTensor),
             reinterpret_cast<const int32_t*>(outputShape.dimensions.data()),
             outputShape.dimensions.size(), context->getInputBuffer<int32_t>(kInputAxes), numAxes,
             context->getInputValue<bool8>(kInputKeepDims), tempIndex.data(), tempAxes.data(), init,
             func);
 }

 }  // namespace
 #endif  // NN_INCLUDE_CPU_IMPLEMENTATION

 Result<Version> validateProdSum(const IOperationValidationContext* context) {
     NN_RET_CHECK_EQ(context->getNumInputs(), kNumInputs);
     NN_RET_CHECK_EQ(context->getNumOutputs(), kNumOutputs);
     OperandType inputType = context->getInputType(kInputTensor);
     NN_RET_CHECK(inputType == OperandType::TENSOR_FLOAT16 ||
                  inputType == OperandType::TENSOR_FLOAT32)
             << "Unsupported tensor type for REDUCE_PROD or REDUCE_SUM";
     NN_RET_CHECK(
             validateInputTypes(context, {inputType, OperandType::TENSOR_INT32, OperandType::BOOL}));
     NN_RET_CHECK(validateOutputTypes(context, {inputType}));
     const Shape& input = context->getInputShape(kInputTensor);
     if (hasKnownRank(input)) {
         NN_RET_CHECK_LE(getNumberOfDimensions(input), 4);
     }
     return Version::ANDROID_Q;
 }

 Result<Version> validateMaxMin(const IOperationValidationContext* context) {
     NN_RET_CHECK_EQ(context->getNumInputs(), kNumInputs);
     NN_RET_CHECK_EQ(context->getNumOutputs(), kNumOutputs);
     OperandType inputType = context->getInputType(kInputTensor);
     NN_RET_CHECK(inputType == OperandType::TENSOR_FLOAT16 ||
                  inputType == OperandType::TENSOR_FLOAT32 ||
                  inputType == OperandType::TENSOR_QUANT8_ASYMM ||
                  inputType == OperandType::TENSOR_QUANT8_ASYMM_SIGNED)
             << "Unsupported tensor type for REDUCE_MAX or REDUCE_MIN";
     NN_RET_CHECK(
             validateInputTypes(context, {inputType, OperandType::TENSOR_INT32, OperandType::BOOL}));
     NN_RET_CHECK(validateOutputTypes(context, {inputType}));
     auto minVersion = Version::ANDROID_Q;
     if (inputType == OperandType::TENSOR_QUANT8_ASYMM_SIGNED) {
         minVersion = Version::ANDROID_R;
     }
     const Shape& input = context->getInputShape(kInputTensor);
     if (hasKnownRank(input)) {
         NN_RET_CHECK_LE(getNumberOfDimensions(input), 4);
     }
     return minVersion;
 }

 Result<Version> validateLogical(const IOperationValidationContext* context) {
     NN_RET_CHECK_EQ(context->getNumInputs(), kNumInputs);
     NN_RET_CHECK_EQ(context->getNumOutputs(), kNumOutputs);
     OperandType inputType = context->getInputType(kInputTensor);
     NN_RET_CHECK(inputType == OperandType::TENSOR_BOOL8)
             << "Unsupported tensor type for REDUCE_ANY or REDUCE_ALL";
     NN_RET_CHECK(
             validateInputTypes(context, {inputType, OperandType::TENSOR_INT32, OperandType::BOOL}));
     NN_RET_CHECK(validateOutputTypes(context, {inputType}));
     const Shape& input = context->getInputShape(kInputTensor);
     if (hasKnownRank(input)) {
         NN_RET_CHECK_LE(getNumberOfDimensions(input), 4);
     }
     return Version::ANDROID_Q;
 }

 #ifdef NN_INCLUDE_CPU_IMPLEMENTATION
 bool prepare(IOperationExecutionContext* context) {
     Shape inputShape = context->getInputShape(kInputTensor);
     const uint32_t inputRank = getNumberOfDimensions(inputShape);
     NN_RET_CHECK_LE(inputRank, 4);

     std::vector<bool> shouldReduce(inputRank);
     const int32_t* axes = context->getInputBuffer<int32_t>(kInputAxes);
     Shape axesShape = context->getInputShape(kInputAxes);
     NN_RET_CHECK_EQ(getNumberOfDimensions(axesShape), 1u);
     const uint32_t numAxes = getNumberOfElements(axesShape);
     for (uint32_t i = 0; i < numAxes; ++i) {
         int32_t axis = axes[i];
         NN_RET_CHECK(handleNegativeAxis(inputRank, &axis));
         shouldReduce[axis] = true;
     }

     // Input and output must have the same quantization parameters, etc.
     Shape outputShape = inputShape;
     outputShape.dimensions.clear();
     bool keepDims = context->getInputValue<bool8>(kInputKeepDims);
     for (uint32_t axis = 0; axis < inputRank; ++axis) {
         if (shouldReduce[axis]) {
             if (keepDims) {
                 outputShape.dimensions.push_back(1);
             }
         } else {
             outputShape.dimensions.push_back(getSizeOfDimension(inputShape, axis));
         }
     }

     // Handle the case when all dimensions are removed
     if (outputShape.dimensions.empty()) {
         outputShape.dimensions.push_back(1);
     }

     return context->setOutputShape(kOutputTensor, outputShape);
 }

 bool executeProd(IOperationExecutionContext* context) {
     switch (context->getInputType(kInputTensor)) {
         case OperandType::TENSOR_FLOAT16:
             return compute<_Float16>(context, 1, [](_Float16 a, _Float16 b) -> _Float16 {
                 // Handle the zero case because 0 * inf evaluates to nan.
                 if (a == 0 || b == 0) return 0;
                 return a * b;
             });
         case OperandType::TENSOR_FLOAT32:
             return compute<float>(context, 1, [](float a, float b) -> float {
                 // Handle the zero case because 0 * inf evaluates to nan.
                 if (a == 0 || b == 0) return 0;
                 return a * b;
             });
         default:
             NN_RET_CHECK_FAIL() << "Unsupported tensor type for operation REDUCE_PROD";
     }
 }

 bool executeSum(IOperationExecutionContext* context) {
     switch (context->getInputType(kInputTensor)) {
         case OperandType::TENSOR_FLOAT16:
             return compute<_Float16>(context, 0, [](_Float16 a, _Float16 b) { return a + b; });
         case OperandType::TENSOR_FLOAT32:
             return compute<float>(context, 0, [](float a, float b) { return a + b; });
         default:
             NN_RET_CHECK_FAIL() << "Unsupported tensor type for operation REDUCE_SUM";
     }
 }

 bool executeMax(IOperationExecutionContext* context) {
     switch (context->getInputType(kInputTensor)) {
         case OperandType::TENSOR_FLOAT16:
             return compute<_Float16>(context, kFloat16Lowest,
                                      [](_Float16 a, _Float16 b) { return std::max(a, b); });
         case OperandType::TENSOR_FLOAT32:
             return compute<float>(context, std::numeric_limits<float>::lowest(),
                                   [](float a, float b) { return std::max(a, b); });
         case OperandType::TENSOR_QUANT8_ASYMM:
             return compute<uint8_t>(context, std::numeric_limits<uint8_t>::lowest(),
                                     [](uint8_t a, uint8_t b) { return std::max(a, b); });
         case OperandType::TENSOR_QUANT8_ASYMM_SIGNED:
             return compute<int8_t>(context, std::numeric_limits<int8_t>::lowest(),
                                    [](int8_t a, int8_t b) { return std::max(a, b); });
         default:
             NN_RET_CHECK_FAIL() << "Unsupported tensor type for operation REDUCE_MAX";
     }
 }

 bool executeMin(IOperationExecutionContext* context) {
     switch (context->getInputType(kInputTensor)) {
         case OperandType::TENSOR_FLOAT16:
             return compute<_Float16>(context, kFloat16Max,
                                      [](_Float16 a, _Float16 b) { return std::min(a, b); });
         case OperandType::TENSOR_FLOAT32:
             return compute<float>(context, std::numeric_limits<float>::max(),
                                   [](float a, float b) { return std::min(a, b); });
         case OperandType::TENSOR_QUANT8_ASYMM:
             return compute<uint8_t>(context, std::numeric_limits<uint8_t>::max(),
                                     [](uint8_t a, uint8_t b) { return std::min(a, b); });
         case OperandType::TENSOR_QUANT8_ASYMM_SIGNED:
             return compute<int8_t>(context, std::numeric_limits<int8_t>::max(),
                                    [](int8_t a, int8_t b) { return std::min(a, b); });
         default:
             NN_RET_CHECK_FAIL() << "Unsupported tensor type for operation REDUCE_MIN";
     }
 }

 bool executeAny(IOperationExecutionContext* context) {
     switch (context->getInputType(kInputTensor)) {
         case OperandType::TENSOR_BOOL8:
             return compute<bool8>(context, false,
                                   [](bool8 a, bool8 b) { return static_cast<bool8>(a || b); });
         default:
             NN_RET_CHECK_FAIL() << "Unsupported tensor type for operation REDUCE_ANY";
     }
 }

 bool executeAll(IOperationExecutionContext* context) {
     switch (context->getInputType(kInputTensor)) {
         case OperandType::TENSOR_BOOL8:
             return compute<bool8>(context, true,
                                   [](bool8 a, bool8 b) { return static_cast<bool8>(a && b); });
         default:
             NN_RET_CHECK_FAIL() << "Unsupported tensor type for operation REDUCE_ALL";
     }
 }
 #endif  // NN_INCLUDE_CPU_IMPLEMENTATION

 }  // namespace reduce

 NN_REGISTER_OPERATION(REDUCE_PROD, "REDUCE_PROD", reduce::validateProdSum, reduce::prepare,
                       reduce::executeProd);
 NN_REGISTER_OPERATION(REDUCE_SUM, "REDUCE_SUM", reduce::validateProdSum, reduce::prepare,
                       reduce::executeSum);
 NN_REGISTER_OPERATION(REDUCE_MAX, "REDUCE_MAX", reduce::validateMaxMin, reduce::prepare,
                       reduce::executeMax);
 NN_REGISTER_OPERATION(REDUCE_MIN, "REDUCE_MIN", reduce::validateMaxMin, reduce::prepare,
                       reduce::executeMin);
 NN_REGISTER_OPERATION(REDUCE_ANY, "REDUCE_ANY", reduce::validateLogical, reduce::prepare,
                       reduce::executeAny);
 NN_REGISTER_OPERATION(REDUCE_ALL, "REDUCE_ALL", reduce::validateLogical, reduce::prepare,
                       reduce::executeAll);

 }  // namespace nn
 }  // namespace android
	/*
	* Copyright (C) 2018 The Android Open Source Project
	*
	* Licensed under the Apache License, Version 2.0 (the "License");
	* you may not use this file except in compliance with the License.
	* You may obtain a copy of the License at
	*
	* http://www.apache.org/licenses/LICENSE-2.0
	*
	* Unless required by applicable law or agreed to in writing, software
	* distributed under the License is distributed on an "AS IS" BASIS,
	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	* See the License for the specific language governing permissions and
	* limitations under the License.
	*/

	#define LOG_TAG "Operations"

	#include <algorithm>
	#include <limits>
	#include <vector>

	#include "OperationResolver.h"
	#include "OperationsUtils.h"
	#include "Tracing.h"

	#ifdef NN_INCLUDE_CPU_IMPLEMENTATION
	#include <tensorflow/lite/kernels/internal/reference/reference_ops.h>
	#endif // NN_INCLUDE_CPU_IMPLEMENTATION

	namespace android {
	namespace nn {
	namespace reduce {

	constexpr uint32_t kNumInputs = 3;
	constexpr uint32_t kInputTensor = 0;
	constexpr uint32_t kInputAxes = 1;
	constexpr uint32_t kInputKeepDims = 2;

	constexpr uint32_t kNumOutputs = 1;
	constexpr uint32_t kOutputTensor = 0;

	// Values from
	// https://en.wikipedia.org/wiki/Half-precision_floating-point_format#IEEE_754_half-precision_binary_floating-point_format:_binary16
	constexpr _Float16 kFloat16Max = 65504;
	constexpr _Float16 kFloat16Lowest = -kFloat16Max;

	#ifdef NN_INCLUDE_CPU_IMPLEMENTATION
	namespace {

	template <typename T>
	inline bool compute(IOperationExecutionContext* context, T init, T func(T, T)) {
	const Shape inputShape = context->getInputShape(kInputTensor);
	const Shape axesShape = context->getInputShape(kInputAxes);
	const Shape outputShape = context->getOutputShape(kOutputTensor);
	const uint32_t inputRank = getNumberOfDimensions(inputShape);
	const uint32_t numAxes = getNumberOfElements(axesShape);
	std::vector<int> tempIndex(inputShape.dimensions.size());
	std::vector<int> tempAxes(numAxes);
	return tflite::reference_ops::ReduceGeneric<T>(
	context->getInputBuffer<T>(kInputTensor),
	reinterpret_cast<const int32_t*>(inputShape.dimensions.data()), inputRank,
	context->getOutputBuffer<T>(kOutputTensor),
	reinterpret_cast<const int32_t*>(outputShape.dimensions.data()),
	outputShape.dimensions.size(), context->getInputBuffer<int32_t>(kInputAxes), numAxes,
	context->getInputValue<bool8>(kInputKeepDims), tempIndex.data(), tempAxes.data(), init,
	func);
	}

	} // namespace
	#endif // NN_INCLUDE_CPU_IMPLEMENTATION

	Result<Version> validateProdSum(const IOperationValidationContext* context) {
	NN_RET_CHECK_EQ(context->getNumInputs(), kNumInputs);
	NN_RET_CHECK_EQ(context->getNumOutputs(), kNumOutputs);
	OperandType inputType = context->getInputType(kInputTensor);
	NN_RET_CHECK(inputType == OperandType::TENSOR_FLOAT16 \|\|
	inputType == OperandType::TENSOR_FLOAT32)
	<< "Unsupported tensor type for REDUCE_PROD or REDUCE_SUM";
	NN_RET_CHECK(
	validateInputTypes(context, {inputType, OperandType::TENSOR_INT32, OperandType::BOOL}));
	NN_RET_CHECK(validateOutputTypes(context, {inputType}));
	const Shape& input = context->getInputShape(kInputTensor);
	if (hasKnownRank(input)) {
	NN_RET_CHECK_LE(getNumberOfDimensions(input), 4);
	}
	return Version::ANDROID_Q;
	}

	Result<Version> validateMaxMin(const IOperationValidationContext* context) {
	NN_RET_CHECK_EQ(context->getNumInputs(), kNumInputs);
	NN_RET_CHECK_EQ(context->getNumOutputs(), kNumOutputs);
	OperandType inputType = context->getInputType(kInputTensor);
	NN_RET_CHECK(inputType == OperandType::TENSOR_FLOAT16 \|\|
	inputType == OperandType::TENSOR_FLOAT32 \|\|
	inputType == OperandType::TENSOR_QUANT8_ASYMM \|\|
	inputType == OperandType::TENSOR_QUANT8_ASYMM_SIGNED)
	<< "Unsupported tensor type for REDUCE_MAX or REDUCE_MIN";
	NN_RET_CHECK(
	validateInputTypes(context, {inputType, OperandType::TENSOR_INT32, OperandType::BOOL}));
	NN_RET_CHECK(validateOutputTypes(context, {inputType}));
	auto minVersion = Version::ANDROID_Q;
	if (inputType == OperandType::TENSOR_QUANT8_ASYMM_SIGNED) {
	minVersion = Version::ANDROID_R;
	}
	const Shape& input = context->getInputShape(kInputTensor);
	if (hasKnownRank(input)) {
	NN_RET_CHECK_LE(getNumberOfDimensions(input), 4);
	}
	return minVersion;
	}

	Result<Version> validateLogical(const IOperationValidationContext* context) {
	NN_RET_CHECK_EQ(context->getNumInputs(), kNumInputs);
	NN_RET_CHECK_EQ(context->getNumOutputs(), kNumOutputs);
	OperandType inputType = context->getInputType(kInputTensor);
	NN_RET_CHECK(inputType == OperandType::TENSOR_BOOL8)
	<< "Unsupported tensor type for REDUCE_ANY or REDUCE_ALL";
	NN_RET_CHECK(
	validateInputTypes(context, {inputType, OperandType::TENSOR_INT32, OperandType::BOOL}));
	NN_RET_CHECK(validateOutputTypes(context, {inputType}));
	const Shape& input = context->getInputShape(kInputTensor);
	if (hasKnownRank(input)) {
	NN_RET_CHECK_LE(getNumberOfDimensions(input), 4);
	}
	return Version::ANDROID_Q;
	}

	#ifdef NN_INCLUDE_CPU_IMPLEMENTATION
	bool prepare(IOperationExecutionContext* context) {
	Shape inputShape = context->getInputShape(kInputTensor);
	const uint32_t inputRank = getNumberOfDimensions(inputShape);
	NN_RET_CHECK_LE(inputRank, 4);

	std::vector<bool> shouldReduce(inputRank);
	const int32_t* axes = context->getInputBuffer<int32_t>(kInputAxes);
	Shape axesShape = context->getInputShape(kInputAxes);
	NN_RET_CHECK_EQ(getNumberOfDimensions(axesShape), 1u);
	const uint32_t numAxes = getNumberOfElements(axesShape);
	for (uint32_t i = 0; i < numAxes; ++i) {
	int32_t axis = axes[i];
	NN_RET_CHECK(handleNegativeAxis(inputRank, &axis));
	shouldReduce[axis] = true;
	}

	// Input and output must have the same quantization parameters, etc.
	Shape outputShape = inputShape;
	outputShape.dimensions.clear();
	bool keepDims = context->getInputValue<bool8>(kInputKeepDims);
	for (uint32_t axis = 0; axis < inputRank; ++axis) {
	if (shouldReduce[axis]) {
	if (keepDims) {
	outputShape.dimensions.push_back(1);
	}
	} else {
	outputShape.dimensions.push_back(getSizeOfDimension(inputShape, axis));
	}
	}

	// Handle the case when all dimensions are removed
	if (outputShape.dimensions.empty()) {
	outputShape.dimensions.push_back(1);
	}

	return context->setOutputShape(kOutputTensor, outputShape);
	}

	bool executeProd(IOperationExecutionContext* context) {
	switch (context->getInputType(kInputTensor)) {
	case OperandType::TENSOR_FLOAT16:
	return compute<_Float16>(context, 1, [](_Float16 a, _Float16 b) -> _Float16 {
	// Handle the zero case because 0 * inf evaluates to nan.
	if (a == 0 \|\| b == 0) return 0;
	return a * b;
	});
	case OperandType::TENSOR_FLOAT32:
	return compute<float>(context, 1, [](float a, float b) -> float {
	// Handle the zero case because 0 * inf evaluates to nan.
	if (a == 0 \|\| b == 0) return 0;
	return a * b;
	});
	default:
	NN_RET_CHECK_FAIL() << "Unsupported tensor type for operation REDUCE_PROD";
	}
	}

	bool executeSum(IOperationExecutionContext* context) {
	switch (context->getInputType(kInputTensor)) {
	case OperandType::TENSOR_FLOAT16:
	return compute<_Float16>(context, 0, [](_Float16 a, _Float16 b) { return a + b; });
	case OperandType::TENSOR_FLOAT32:
	return compute<float>(context, 0, [](float a, float b) { return a + b; });
	default:
	NN_RET_CHECK_FAIL() << "Unsupported tensor type for operation REDUCE_SUM";
	}
	}

	bool executeMax(IOperationExecutionContext* context) {
	switch (context->getInputType(kInputTensor)) {
	case OperandType::TENSOR_FLOAT16:
	return compute<_Float16>(context, kFloat16Lowest,
	[](_Float16 a, _Float16 b) { return std::max(a, b); });
	case OperandType::TENSOR_FLOAT32:
	return compute<float>(context, std::numeric_limits<float>::lowest(),
	[](float a, float b) { return std::max(a, b); });
	case OperandType::TENSOR_QUANT8_ASYMM:
	return compute<uint8_t>(context, std::numeric_limits<uint8_t>::lowest(),
	[](uint8_t a, uint8_t b) { return std::max(a, b); });
	case OperandType::TENSOR_QUANT8_ASYMM_SIGNED:
	return compute<int8_t>(context, std::numeric_limits<int8_t>::lowest(),
	[](int8_t a, int8_t b) { return std::max(a, b); });
	default:
	NN_RET_CHECK_FAIL() << "Unsupported tensor type for operation REDUCE_MAX";
	}
	}

	bool executeMin(IOperationExecutionContext* context) {
	switch (context->getInputType(kInputTensor)) {
	case OperandType::TENSOR_FLOAT16:
	return compute<_Float16>(context, kFloat16Max,
	[](_Float16 a, _Float16 b) { return std::min(a, b); });
	case OperandType::TENSOR_FLOAT32:
	return compute<float>(context, std::numeric_limits<float>::max(),
	[](float a, float b) { return std::min(a, b); });
	case OperandType::TENSOR_QUANT8_ASYMM:
	return compute<uint8_t>(context, std::numeric_limits<uint8_t>::max(),
	[](uint8_t a, uint8_t b) { return std::min(a, b); });
	case OperandType::TENSOR_QUANT8_ASYMM_SIGNED:
	return compute<int8_t>(context, std::numeric_limits<int8_t>::max(),
	[](int8_t a, int8_t b) { return std::min(a, b); });
	default:
	NN_RET_CHECK_FAIL() << "Unsupported tensor type for operation REDUCE_MIN";
	}
	}

	bool executeAny(IOperationExecutionContext* context) {
	switch (context->getInputType(kInputTensor)) {
	case OperandType::TENSOR_BOOL8:
	return compute<bool8>(context, false,
	[](bool8 a, bool8 b) { return static_cast<bool8>(a \|\| b); });
	default:
	NN_RET_CHECK_FAIL() << "Unsupported tensor type for operation REDUCE_ANY";
	}
	}

	bool executeAll(IOperationExecutionContext* context) {
	switch (context->getInputType(kInputTensor)) {
	case OperandType::TENSOR_BOOL8:
	return compute<bool8>(context, true,
	[](bool8 a, bool8 b) { return static_cast<bool8>(a && b); });
	default:
	NN_RET_CHECK_FAIL() << "Unsupported tensor type for operation REDUCE_ALL";
	}
	}
	#endif // NN_INCLUDE_CPU_IMPLEMENTATION

	} // namespace reduce

	NN_REGISTER_OPERATION(REDUCE_PROD, "REDUCE_PROD", reduce::validateProdSum, reduce::prepare,
	reduce::executeProd);
	NN_REGISTER_OPERATION(REDUCE_SUM, "REDUCE_SUM", reduce::validateProdSum, reduce::prepare,
	reduce::executeSum);
	NN_REGISTER_OPERATION(REDUCE_MAX, "REDUCE_MAX", reduce::validateMaxMin, reduce::prepare,
	reduce::executeMax);
	NN_REGISTER_OPERATION(REDUCE_MIN, "REDUCE_MIN", reduce::validateMaxMin, reduce::prepare,
	reduce::executeMin);
	NN_REGISTER_OPERATION(REDUCE_ANY, "REDUCE_ANY", reduce::validateLogical, reduce::prepare,
	reduce::executeAny);
	NN_REGISTER_OPERATION(REDUCE_ALL, "REDUCE_ALL", reduce::validateLogical, reduce::prepare,
	reduce::executeAll);

	} // namespace nn
	} // namespace android