241 lines
9.1 KiB
C++
241 lines
9.1 KiB
C++
/*
|
|
* Copyright (C) 2021 The Android Open Source Project
|
|
*
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*/
|
|
|
|
#include "LimitedSupportDevice.h"
|
|
|
|
#include <android-base/logging.h>
|
|
#include <nnapi/IBuffer.h>
|
|
#include <nnapi/IDevice.h>
|
|
#include <nnapi/IPreparedModel.h>
|
|
#include <nnapi/OperandTypes.h>
|
|
#include <nnapi/Result.h>
|
|
#include <nnapi/TypeUtils.h>
|
|
#include <nnapi/Types.h>
|
|
#include <nnapi/Validation.h>
|
|
|
|
#include <algorithm>
|
|
#include <any>
|
|
#include <chrono>
|
|
#include <functional>
|
|
#include <iterator>
|
|
#include <memory>
|
|
#include <optional>
|
|
#include <set>
|
|
#include <string>
|
|
#include <utility>
|
|
#include <vector>
|
|
|
|
#include "CanonicalDevice.h"
|
|
|
|
namespace android::nn::sample {
|
|
namespace {
|
|
|
|
Capabilities makeCapabilitiesFloatFast() {
|
|
const Capabilities::PerformanceInfo defaultInfo = {.execTime = 1.0f, .powerUsage = 1.0f};
|
|
const Capabilities::PerformanceInfo float32Info = {.execTime = 0.8f, .powerUsage = 1.2f};
|
|
const Capabilities::PerformanceInfo relaxedInfo = {.execTime = 0.7f, .powerUsage = 1.1f};
|
|
return makeCapabilities(defaultInfo, float32Info, relaxedInfo);
|
|
}
|
|
|
|
Capabilities makeCapabilitiesFloatSlow() {
|
|
const Capabilities::PerformanceInfo defaultInfo = {.execTime = 1.0f, .powerUsage = 1.0f};
|
|
const Capabilities::PerformanceInfo float32Info = {.execTime = 1.3f, .powerUsage = 0.7f};
|
|
const Capabilities::PerformanceInfo relaxedInfo = {.execTime = 1.2f, .powerUsage = 0.6f};
|
|
return makeCapabilities(defaultInfo, float32Info, relaxedInfo);
|
|
}
|
|
|
|
Capabilities makeCapabilitiesMinimal() {
|
|
const Capabilities::PerformanceInfo defaultInfo = {.execTime = 1.0f, .powerUsage = 1.0f};
|
|
const Capabilities::PerformanceInfo float32Info = {.execTime = 0.4f, .powerUsage = 0.5f};
|
|
const Capabilities::PerformanceInfo relaxedInfo = {.execTime = 0.4f, .powerUsage = 0.5f};
|
|
return makeCapabilities(defaultInfo, float32Info, relaxedInfo);
|
|
}
|
|
|
|
Capabilities makeCapabilitiesQuant() {
|
|
const Capabilities::PerformanceInfo info = {.execTime = 50.0f, .powerUsage = 1.0f};
|
|
return makeCapabilities(info, info, info);
|
|
}
|
|
|
|
GeneralResult<std::vector<bool>> getSupportedOperationsFloat(const Model& model) {
|
|
const size_t count = model.main.operations.size();
|
|
std::vector<bool> supported(count);
|
|
for (size_t i = 0; i < count; i++) {
|
|
const Operation& operation = model.main.operations[i];
|
|
if (!isExtension(operation.type) && !operation.inputs.empty()) {
|
|
const Operand& firstOperand = model.main.operands[operation.inputs[0]];
|
|
supported[i] = firstOperand.type == OperandType::TENSOR_FLOAT32;
|
|
}
|
|
}
|
|
return supported;
|
|
}
|
|
|
|
GeneralResult<std::vector<bool>> getSupportedOperationsMinimal(const Model& model) {
|
|
const size_t count = model.main.operations.size();
|
|
std::vector<bool> supported(count);
|
|
// Simulate supporting just a few ops
|
|
for (size_t i = 0; i < count; i++) {
|
|
supported[i] = false;
|
|
const Operation& operation = model.main.operations[i];
|
|
switch (operation.type) {
|
|
case OperationType::ADD:
|
|
case OperationType::CONCATENATION:
|
|
case OperationType::CONV_2D: {
|
|
const Operand& firstOperand = model.main.operands[operation.inputs[0]];
|
|
if (firstOperand.type == OperandType::TENSOR_FLOAT32) {
|
|
supported[i] = true;
|
|
}
|
|
break;
|
|
}
|
|
default:
|
|
break;
|
|
}
|
|
}
|
|
return supported;
|
|
}
|
|
|
|
bool isQuantized(OperandType opType) {
|
|
return opType == OperandType::TENSOR_QUANT8_ASYMM ||
|
|
opType == OperandType::TENSOR_QUANT8_ASYMM_SIGNED;
|
|
}
|
|
|
|
GeneralResult<std::vector<bool>> getSupportedOperationsQuant(const Model& model) {
|
|
const size_t count = model.main.operations.size();
|
|
std::vector<bool> supported(count);
|
|
for (size_t i = 0; i < count; i++) {
|
|
const Operation& operation = model.main.operations[i];
|
|
if (!isExtension(operation.type) && !operation.inputs.empty()) {
|
|
const Operand& firstOperand = model.main.operands[operation.inputs[0]];
|
|
supported[i] = isQuantized(firstOperand.type);
|
|
if (operation.type == OperationType::SELECT) {
|
|
const Operand& secondOperand = model.main.operands[operation.inputs[1]];
|
|
supported[i] = isQuantized(secondOperand.type);
|
|
}
|
|
}
|
|
}
|
|
return supported;
|
|
}
|
|
|
|
SharedDevice makeDevice(std::string name, Capabilities capabilities,
|
|
LimitedSupportDevice::SupportedOperationsFunction getSupportedOperations) {
|
|
auto device = std::make_shared<const Device>(std::move(name));
|
|
auto limitedDevice = std::make_shared<const LimitedSupportDevice>(
|
|
std::move(device), std::move(capabilities), std::move(getSupportedOperations));
|
|
return limitedDevice;
|
|
}
|
|
|
|
} // namespace
|
|
|
|
LimitedSupportDevice::LimitedSupportDevice(SharedDevice device, Capabilities capabilities,
|
|
SupportedOperationsFunction supportedOperationsFunction)
|
|
: kDevice(std::move(device)),
|
|
kCapabilities(std::move(capabilities)),
|
|
kSupportedOperationsFunction(std::move(supportedOperationsFunction)) {
|
|
CHECK(kDevice != nullptr);
|
|
CHECK(kSupportedOperationsFunction != nullptr);
|
|
const auto result = validate(kCapabilities);
|
|
CHECK(result.has_value()) << result.error();
|
|
}
|
|
|
|
const std::string& LimitedSupportDevice::getName() const {
|
|
return kDevice->getName();
|
|
}
|
|
|
|
const std::string& LimitedSupportDevice::getVersionString() const {
|
|
return kDevice->getVersionString();
|
|
}
|
|
|
|
Version LimitedSupportDevice::getFeatureLevel() const {
|
|
return kDevice->getFeatureLevel();
|
|
}
|
|
|
|
DeviceType LimitedSupportDevice::getType() const {
|
|
return kDevice->getType();
|
|
}
|
|
|
|
const std::vector<Extension>& LimitedSupportDevice::getSupportedExtensions() const {
|
|
return kDevice->getSupportedExtensions();
|
|
}
|
|
|
|
const Capabilities& LimitedSupportDevice::getCapabilities() const {
|
|
return kCapabilities;
|
|
}
|
|
|
|
std::pair<uint32_t, uint32_t> LimitedSupportDevice::getNumberOfCacheFilesNeeded() const {
|
|
return kDevice->getNumberOfCacheFilesNeeded();
|
|
}
|
|
|
|
GeneralResult<void> LimitedSupportDevice::wait() const {
|
|
return kDevice->wait();
|
|
}
|
|
|
|
GeneralResult<std::vector<bool>> LimitedSupportDevice::getSupportedOperations(
|
|
const Model& model) const {
|
|
return kSupportedOperationsFunction(model);
|
|
}
|
|
|
|
GeneralResult<SharedPreparedModel> LimitedSupportDevice::prepareModel(
|
|
const Model& model, ExecutionPreference preference, Priority priority,
|
|
OptionalTimePoint deadline, const std::vector<SharedHandle>& modelCache,
|
|
const std::vector<SharedHandle>& dataCache, const CacheToken& token,
|
|
const std::vector<TokenValuePair>& /*hints*/,
|
|
const std::vector<ExtensionNameAndPrefix>& /*extensionNameToPrefix*/) const {
|
|
const auto supportedOperations = NN_TRY(kSupportedOperationsFunction(model));
|
|
constexpr auto id = [](auto v) { return v; };
|
|
if (!std::all_of(supportedOperations.begin(), supportedOperations.end(), id)) {
|
|
return NN_ERROR(nn::ErrorStatus::INVALID_ARGUMENT) << "Not all operations are supported";
|
|
}
|
|
return kDevice->prepareModel(model, preference, priority, deadline, modelCache, dataCache,
|
|
token, {}, {});
|
|
}
|
|
|
|
GeneralResult<SharedPreparedModel> LimitedSupportDevice::prepareModelFromCache(
|
|
OptionalTimePoint deadline, const std::vector<SharedHandle>& modelCache,
|
|
const std::vector<SharedHandle>& dataCache, const CacheToken& token) const {
|
|
return kDevice->prepareModelFromCache(deadline, modelCache, dataCache, token);
|
|
}
|
|
|
|
GeneralResult<SharedBuffer> LimitedSupportDevice::allocate(
|
|
const BufferDesc& desc, const std::vector<SharedPreparedModel>& preparedModels,
|
|
const std::vector<BufferRole>& inputRoles,
|
|
const std::vector<BufferRole>& outputRoles) const {
|
|
return kDevice->allocate(desc, preparedModels, inputRoles, outputRoles);
|
|
}
|
|
|
|
std::vector<SharedDevice> getExampleLimitedDevices() {
|
|
SharedDevice device;
|
|
std::vector<SharedDevice> devices;
|
|
devices.reserve(4);
|
|
|
|
device = makeDevice("nnapi-sample_float_fast", makeCapabilitiesFloatFast(),
|
|
getSupportedOperationsFloat);
|
|
devices.push_back(std::move(device));
|
|
|
|
device = makeDevice("nnapi-sample_float_slow", makeCapabilitiesFloatSlow(),
|
|
getSupportedOperationsFloat);
|
|
devices.push_back(std::move(device));
|
|
|
|
device = makeDevice("nnapi-sample_minimal", makeCapabilitiesMinimal(),
|
|
getSupportedOperationsMinimal);
|
|
devices.push_back(std::move(device));
|
|
|
|
device = makeDevice("nnapi-sample_quant", makeCapabilitiesQuant(), getSupportedOperationsQuant);
|
|
devices.push_back(std::move(device));
|
|
|
|
return devices;
|
|
}
|
|
|
|
} // namespace android::nn::sample
|