driver/sample/LimitedSupportDevice.cpp - platform/packages/modules/NeuralNetworks - Git at Google

 /*
  * Copyright (C) 2021 The Android Open Source Project
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
  * You may obtain a copy of the License at
  *
  *      http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */

 #include "LimitedSupportDevice.h"

 #include <android-base/logging.h>
 #include <nnapi/IBuffer.h>
 #include <nnapi/IDevice.h>
 #include <nnapi/IPreparedModel.h>
 #include <nnapi/OperandTypes.h>
 #include <nnapi/Result.h>
 #include <nnapi/TypeUtils.h>
 #include <nnapi/Types.h>
 #include <nnapi/Validation.h>

 #include <algorithm>
 #include <any>
 #include <chrono>
 #include <functional>
 #include <iterator>
 #include <memory>
 #include <optional>
 #include <set>
 #include <string>
 #include <utility>
 #include <vector>

 #include "CanonicalDevice.h"

 namespace android::nn::sample {
 namespace {

 Capabilities makeCapabilitiesFloatFast() {
     const Capabilities::PerformanceInfo defaultInfo = {.execTime = 1.0f, .powerUsage = 1.0f};
     const Capabilities::PerformanceInfo float32Info = {.execTime = 0.8f, .powerUsage = 1.2f};
     const Capabilities::PerformanceInfo relaxedInfo = {.execTime = 0.7f, .powerUsage = 1.1f};
     return makeCapabilities(defaultInfo, float32Info, relaxedInfo);
 }

 Capabilities makeCapabilitiesFloatSlow() {
     const Capabilities::PerformanceInfo defaultInfo = {.execTime = 1.0f, .powerUsage = 1.0f};
     const Capabilities::PerformanceInfo float32Info = {.execTime = 1.3f, .powerUsage = 0.7f};
     const Capabilities::PerformanceInfo relaxedInfo = {.execTime = 1.2f, .powerUsage = 0.6f};
     return makeCapabilities(defaultInfo, float32Info, relaxedInfo);
 }

 Capabilities makeCapabilitiesMinimal() {
     const Capabilities::PerformanceInfo defaultInfo = {.execTime = 1.0f, .powerUsage = 1.0f};
     const Capabilities::PerformanceInfo float32Info = {.execTime = 0.4f, .powerUsage = 0.5f};
     const Capabilities::PerformanceInfo relaxedInfo = {.execTime = 0.4f, .powerUsage = 0.5f};
     return makeCapabilities(defaultInfo, float32Info, relaxedInfo);
 }

 Capabilities makeCapabilitiesQuant() {
     const Capabilities::PerformanceInfo info = {.execTime = 50.0f, .powerUsage = 1.0f};
     return makeCapabilities(info, info, info);
 }

 GeneralResult<std::vector<bool>> getSupportedOperationsFloat(const Model& model) {
     const size_t count = model.main.operations.size();
     std::vector<bool> supported(count);
     for (size_t i = 0; i < count; i++) {
         const Operation& operation = model.main.operations[i];
         if (!isExtension(operation.type) && !operation.inputs.empty()) {
             const Operand& firstOperand = model.main.operands[operation.inputs[0]];
             supported[i] = firstOperand.type == OperandType::TENSOR_FLOAT32;
         }
     }
     return supported;
 }

 GeneralResult<std::vector<bool>> getSupportedOperationsMinimal(const Model& model) {
     const size_t count = model.main.operations.size();
     std::vector<bool> supported(count);
     // Simulate supporting just a few ops
     for (size_t i = 0; i < count; i++) {
         supported[i] = false;
         const Operation& operation = model.main.operations[i];
         switch (operation.type) {
             case OperationType::ADD:
             case OperationType::CONCATENATION:
             case OperationType::CONV_2D: {
                 const Operand& firstOperand = model.main.operands[operation.inputs[0]];
                 if (firstOperand.type == OperandType::TENSOR_FLOAT32) {
                     supported[i] = true;
                 }
                 break;
             }
             default:
                 break;
         }
     }
     return supported;
 }

 bool isQuantized(OperandType opType) {
     return opType == OperandType::TENSOR_QUANT8_ASYMM ||
            opType == OperandType::TENSOR_QUANT8_ASYMM_SIGNED;
 }

 GeneralResult<std::vector<bool>> getSupportedOperationsQuant(const Model& model) {
     const size_t count = model.main.operations.size();
     std::vector<bool> supported(count);
     for (size_t i = 0; i < count; i++) {
         const Operation& operation = model.main.operations[i];
         if (!isExtension(operation.type) && !operation.inputs.empty()) {
             const Operand& firstOperand = model.main.operands[operation.inputs[0]];
             supported[i] = isQuantized(firstOperand.type);
             if (operation.type == OperationType::SELECT) {
                 const Operand& secondOperand = model.main.operands[operation.inputs[1]];
                 supported[i] = isQuantized(secondOperand.type);
             }
         }
     }
     return supported;
 }

 SharedDevice makeDevice(std::string name, Capabilities capabilities,
                         LimitedSupportDevice::SupportedOperationsFunction getSupportedOperations) {
     auto device = std::make_shared<const Device>(std::move(name));
     auto limitedDevice = std::make_shared<const LimitedSupportDevice>(
             std::move(device), std::move(capabilities), std::move(getSupportedOperations));
     return limitedDevice;
 }

 }  // namespace

 LimitedSupportDevice::LimitedSupportDevice(SharedDevice device, Capabilities capabilities,
                                            SupportedOperationsFunction supportedOperationsFunction)
     : kDevice(std::move(device)),
       kCapabilities(std::move(capabilities)),
       kSupportedOperationsFunction(std::move(supportedOperationsFunction)) {
     CHECK(kDevice != nullptr);
     CHECK(kSupportedOperationsFunction != nullptr);
     const auto result = validate(kCapabilities);
     CHECK(result.has_value()) << result.error();
 }

 const std::string& LimitedSupportDevice::getName() const {
     return kDevice->getName();
 }

 const std::string& LimitedSupportDevice::getVersionString() const {
     return kDevice->getVersionString();
 }

 Version LimitedSupportDevice::getFeatureLevel() const {
     return kDevice->getFeatureLevel();
 }

 DeviceType LimitedSupportDevice::getType() const {
     return kDevice->getType();
 }

 const std::vector<Extension>& LimitedSupportDevice::getSupportedExtensions() const {
     return kDevice->getSupportedExtensions();
 }

 const Capabilities& LimitedSupportDevice::getCapabilities() const {
     return kCapabilities;
 }

 std::pair<uint32_t, uint32_t> LimitedSupportDevice::getNumberOfCacheFilesNeeded() const {
     return kDevice->getNumberOfCacheFilesNeeded();
 }

 GeneralResult<void> LimitedSupportDevice::wait() const {
     return kDevice->wait();
 }

 GeneralResult<std::vector<bool>> LimitedSupportDevice::getSupportedOperations(
         const Model& model) const {
     return kSupportedOperationsFunction(model);
 }

 GeneralResult<SharedPreparedModel> LimitedSupportDevice::prepareModel(
         const Model& model, ExecutionPreference preference, Priority priority,
         OptionalTimePoint deadline, const std::vector<SharedHandle>& modelCache,
         const std::vector<SharedHandle>& dataCache, const CacheToken& token,
         const std::vector<TokenValuePair>& /*hints*/,
         const std::vector<ExtensionNameAndPrefix>& /*extensionNameToPrefix*/) const {
     const auto supportedOperations = NN_TRY(kSupportedOperationsFunction(model));
     constexpr auto id = [](auto v) { return v; };
     if (!std::all_of(supportedOperations.begin(), supportedOperations.end(), id)) {
         return NN_ERROR(nn::ErrorStatus::INVALID_ARGUMENT) << "Not all operations are supported";
     }
     return kDevice->prepareModel(model, preference, priority, deadline, modelCache, dataCache,
                                  token, {}, {});
 }

 GeneralResult<SharedPreparedModel> LimitedSupportDevice::prepareModelFromCache(
         OptionalTimePoint deadline, const std::vector<SharedHandle>& modelCache,
         const std::vector<SharedHandle>& dataCache, const CacheToken& token) const {
     return kDevice->prepareModelFromCache(deadline, modelCache, dataCache, token);
 }

 GeneralResult<SharedBuffer> LimitedSupportDevice::allocate(
         const BufferDesc& desc, const std::vector<SharedPreparedModel>& preparedModels,
         const std::vector<BufferRole>& inputRoles,
         const std::vector<BufferRole>& outputRoles) const {
     return kDevice->allocate(desc, preparedModels, inputRoles, outputRoles);
 }

 std::vector<SharedDevice> getExampleLimitedDevices() {
     SharedDevice device;
     std::vector<SharedDevice> devices;
     devices.reserve(4);

     device = makeDevice("nnapi-sample_float_fast", makeCapabilitiesFloatFast(),
                         getSupportedOperationsFloat);
     devices.push_back(std::move(device));

     device = makeDevice("nnapi-sample_float_slow", makeCapabilitiesFloatSlow(),
                         getSupportedOperationsFloat);
     devices.push_back(std::move(device));

     device = makeDevice("nnapi-sample_minimal", makeCapabilitiesMinimal(),
                         getSupportedOperationsMinimal);
     devices.push_back(std::move(device));

     device = makeDevice("nnapi-sample_quant", makeCapabilitiesQuant(), getSupportedOperationsQuant);
     devices.push_back(std::move(device));

     return devices;
 }

 }  // namespace android::nn::sample
	/*
	* Copyright (C) 2021 The Android Open Source Project
	*
	* Licensed under the Apache License, Version 2.0 (the "License");
	* you may not use this file except in compliance with the License.
	* You may obtain a copy of the License at
	*
	* http://www.apache.org/licenses/LICENSE-2.0
	*
	* Unless required by applicable law or agreed to in writing, software
	* distributed under the License is distributed on an "AS IS" BASIS,
	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	* See the License for the specific language governing permissions and
	* limitations under the License.
	*/

	#include "LimitedSupportDevice.h"

	#include <android-base/logging.h>
	#include <nnapi/IBuffer.h>
	#include <nnapi/IDevice.h>
	#include <nnapi/IPreparedModel.h>
	#include <nnapi/OperandTypes.h>
	#include <nnapi/Result.h>
	#include <nnapi/TypeUtils.h>
	#include <nnapi/Types.h>
	#include <nnapi/Validation.h>

	#include <algorithm>
	#include <any>
	#include <chrono>
	#include <functional>
	#include <iterator>
	#include <memory>
	#include <optional>
	#include <set>
	#include <string>
	#include <utility>
	#include <vector>

	#include "CanonicalDevice.h"

	namespace android::nn::sample {
	namespace {

	Capabilities makeCapabilitiesFloatFast() {
	const Capabilities::PerformanceInfo defaultInfo = {.execTime = 1.0f, .powerUsage = 1.0f};
	const Capabilities::PerformanceInfo float32Info = {.execTime = 0.8f, .powerUsage = 1.2f};
	const Capabilities::PerformanceInfo relaxedInfo = {.execTime = 0.7f, .powerUsage = 1.1f};
	return makeCapabilities(defaultInfo, float32Info, relaxedInfo);
	}

	Capabilities makeCapabilitiesFloatSlow() {
	const Capabilities::PerformanceInfo defaultInfo = {.execTime = 1.0f, .powerUsage = 1.0f};
	const Capabilities::PerformanceInfo float32Info = {.execTime = 1.3f, .powerUsage = 0.7f};
	const Capabilities::PerformanceInfo relaxedInfo = {.execTime = 1.2f, .powerUsage = 0.6f};
	return makeCapabilities(defaultInfo, float32Info, relaxedInfo);
	}

	Capabilities makeCapabilitiesMinimal() {
	const Capabilities::PerformanceInfo defaultInfo = {.execTime = 1.0f, .powerUsage = 1.0f};
	const Capabilities::PerformanceInfo float32Info = {.execTime = 0.4f, .powerUsage = 0.5f};
	const Capabilities::PerformanceInfo relaxedInfo = {.execTime = 0.4f, .powerUsage = 0.5f};
	return makeCapabilities(defaultInfo, float32Info, relaxedInfo);
	}

	Capabilities makeCapabilitiesQuant() {
	const Capabilities::PerformanceInfo info = {.execTime = 50.0f, .powerUsage = 1.0f};
	return makeCapabilities(info, info, info);
	}

	GeneralResult<std::vector<bool>> getSupportedOperationsFloat(const Model& model) {
	const size_t count = model.main.operations.size();
	std::vector<bool> supported(count);
	for (size_t i = 0; i < count; i++) {
	const Operation& operation = model.main.operations[i];
	if (!isExtension(operation.type) && !operation.inputs.empty()) {
	const Operand& firstOperand = model.main.operands[operation.inputs[0]];
	supported[i] = firstOperand.type == OperandType::TENSOR_FLOAT32;
	}
	}
	return supported;
	}

	GeneralResult<std::vector<bool>> getSupportedOperationsMinimal(const Model& model) {
	const size_t count = model.main.operations.size();
	std::vector<bool> supported(count);
	// Simulate supporting just a few ops
	for (size_t i = 0; i < count; i++) {
	supported[i] = false;
	const Operation& operation = model.main.operations[i];
	switch (operation.type) {
	case OperationType::ADD:
	case OperationType::CONCATENATION:
	case OperationType::CONV_2D: {
	const Operand& firstOperand = model.main.operands[operation.inputs[0]];
	if (firstOperand.type == OperandType::TENSOR_FLOAT32) {
	supported[i] = true;
	}
	break;
	}
	default:
	break;
	}
	}
	return supported;
	}

	bool isQuantized(OperandType opType) {
	return opType == OperandType::TENSOR_QUANT8_ASYMM \|\|
	opType == OperandType::TENSOR_QUANT8_ASYMM_SIGNED;
	}

	GeneralResult<std::vector<bool>> getSupportedOperationsQuant(const Model& model) {
	const size_t count = model.main.operations.size();
	std::vector<bool> supported(count);
	for (size_t i = 0; i < count; i++) {
	const Operation& operation = model.main.operations[i];
	if (!isExtension(operation.type) && !operation.inputs.empty()) {
	const Operand& firstOperand = model.main.operands[operation.inputs[0]];
	supported[i] = isQuantized(firstOperand.type);
	if (operation.type == OperationType::SELECT) {
	const Operand& secondOperand = model.main.operands[operation.inputs[1]];
	supported[i] = isQuantized(secondOperand.type);
	}
	}
	}
	return supported;
	}

	SharedDevice makeDevice(std::string name, Capabilities capabilities,
	LimitedSupportDevice::SupportedOperationsFunction getSupportedOperations) {
	auto device = std::make_shared<const Device>(std::move(name));
	auto limitedDevice = std::make_shared<const LimitedSupportDevice>(
	std::move(device), std::move(capabilities), std::move(getSupportedOperations));
	return limitedDevice;
	}

	} // namespace

	LimitedSupportDevice::LimitedSupportDevice(SharedDevice device, Capabilities capabilities,
	SupportedOperationsFunction supportedOperationsFunction)
	: kDevice(std::move(device)),
	kCapabilities(std::move(capabilities)),
	kSupportedOperationsFunction(std::move(supportedOperationsFunction)) {
	CHECK(kDevice != nullptr);
	CHECK(kSupportedOperationsFunction != nullptr);
	const auto result = validate(kCapabilities);
	CHECK(result.has_value()) << result.error();
	}

	const std::string& LimitedSupportDevice::getName() const {
	return kDevice->getName();
	}

	const std::string& LimitedSupportDevice::getVersionString() const {
	return kDevice->getVersionString();
	}

	Version LimitedSupportDevice::getFeatureLevel() const {
	return kDevice->getFeatureLevel();
	}

	DeviceType LimitedSupportDevice::getType() const {
	return kDevice->getType();
	}

	const std::vector<Extension>& LimitedSupportDevice::getSupportedExtensions() const {
	return kDevice->getSupportedExtensions();
	}

	const Capabilities& LimitedSupportDevice::getCapabilities() const {
	return kCapabilities;
	}

	std::pair<uint32_t, uint32_t> LimitedSupportDevice::getNumberOfCacheFilesNeeded() const {
	return kDevice->getNumberOfCacheFilesNeeded();
	}

	GeneralResult<void> LimitedSupportDevice::wait() const {
	return kDevice->wait();
	}

	GeneralResult<std::vector<bool>> LimitedSupportDevice::getSupportedOperations(
	const Model& model) const {
	return kSupportedOperationsFunction(model);
	}

	GeneralResult<SharedPreparedModel> LimitedSupportDevice::prepareModel(
	const Model& model, ExecutionPreference preference, Priority priority,
	OptionalTimePoint deadline, const std::vector<SharedHandle>& modelCache,
	const std::vector<SharedHandle>& dataCache, const CacheToken& token,
	const std::vector<TokenValuePair>& /hints/,
	const std::vector<ExtensionNameAndPrefix>& /extensionNameToPrefix/) const {
	const auto supportedOperations = NN_TRY(kSupportedOperationsFunction(model));
	constexpr auto id = [](auto v) { return v; };
	if (!std::all_of(supportedOperations.begin(), supportedOperations.end(), id)) {
	return NN_ERROR(nn::ErrorStatus::INVALID_ARGUMENT) << "Not all operations are supported";
	}
	return kDevice->prepareModel(model, preference, priority, deadline, modelCache, dataCache,
	token, {}, {});
	}

	GeneralResult<SharedPreparedModel> LimitedSupportDevice::prepareModelFromCache(
	OptionalTimePoint deadline, const std::vector<SharedHandle>& modelCache,
	const std::vector<SharedHandle>& dataCache, const CacheToken& token) const {
	return kDevice->prepareModelFromCache(deadline, modelCache, dataCache, token);
	}

	GeneralResult<SharedBuffer> LimitedSupportDevice::allocate(
	const BufferDesc& desc, const std::vector<SharedPreparedModel>& preparedModels,
	const std::vector<BufferRole>& inputRoles,
	const std::vector<BufferRole>& outputRoles) const {
	return kDevice->allocate(desc, preparedModels, inputRoles, outputRoles);
	}

	std::vector<SharedDevice> getExampleLimitedDevices() {
	SharedDevice device;
	std::vector<SharedDevice> devices;
	devices.reserve(4);

	device = makeDevice("nnapi-sample_float_fast", makeCapabilitiesFloatFast(),
	getSupportedOperationsFloat);
	devices.push_back(std::move(device));

	device = makeDevice("nnapi-sample_float_slow", makeCapabilitiesFloatSlow(),
	getSupportedOperationsFloat);
	devices.push_back(std::move(device));

	device = makeDevice("nnapi-sample_minimal", makeCapabilitiesMinimal(),
	getSupportedOperationsMinimal);
	devices.push_back(std::move(device));

	device = makeDevice("nnapi-sample_quant", makeCapabilitiesQuant(), getSupportedOperationsQuant);
	devices.push_back(std::move(device));

	return devices;
	}

	} // namespace android::nn::sample