mirror of
https://github.com/Evolution-X/hardware_interfaces
synced 2026-02-01 15:58:43 +00:00
This change is part of a larger chain of changes to remove HIDL and AIDL libraries from neuralnetworks_utils_hal_common. Bug: N/A Test: mma Change-Id: Iae9f692ffc72700294aae694c256e75c7e353fef
235 lines
9.1 KiB
C++
235 lines
9.1 KiB
C++
/*
|
|
* Copyright (C) 2020 The Android Open Source Project
|
|
*
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*/
|
|
|
|
#include "CommonUtils.h"
|
|
|
|
#include <android-base/logging.h>
|
|
#include <nnapi/Result.h>
|
|
#include <nnapi/SharedMemory.h>
|
|
#include <nnapi/TypeUtils.h>
|
|
#include <nnapi/Types.h>
|
|
#include <nnapi/Validation.h>
|
|
|
|
#include <algorithm>
|
|
#include <any>
|
|
#include <functional>
|
|
#include <optional>
|
|
#include <variant>
|
|
#include <vector>
|
|
|
|
namespace android::hardware::neuralnetworks::utils {
|
|
namespace {
|
|
|
|
bool hasNoPointerData(const nn::Operand& operand);
|
|
bool hasNoPointerData(const nn::Model::Subgraph& subgraph);
|
|
bool hasNoPointerData(const nn::Request::Argument& argument);
|
|
|
|
template <typename Type>
|
|
bool hasNoPointerData(const std::vector<Type>& objects) {
|
|
return std::all_of(objects.begin(), objects.end(),
|
|
[](const auto& object) { return hasNoPointerData(object); });
|
|
}
|
|
|
|
bool hasNoPointerData(const nn::DataLocation& location) {
|
|
return std::visit([](auto ptr) { return ptr == nullptr; }, location.pointer);
|
|
}
|
|
|
|
bool hasNoPointerData(const nn::Operand& operand) {
|
|
return hasNoPointerData(operand.location);
|
|
}
|
|
|
|
bool hasNoPointerData(const nn::Model::Subgraph& subgraph) {
|
|
return hasNoPointerData(subgraph.operands);
|
|
}
|
|
|
|
bool hasNoPointerData(const nn::Request::Argument& argument) {
|
|
return hasNoPointerData(argument.location);
|
|
}
|
|
|
|
void copyPointersToSharedMemory(nn::Operand* operand, nn::ConstantMemoryBuilder* memoryBuilder) {
|
|
CHECK(operand != nullptr);
|
|
CHECK(memoryBuilder != nullptr);
|
|
|
|
if (operand->lifetime != nn::Operand::LifeTime::POINTER) {
|
|
return;
|
|
}
|
|
|
|
const void* data = std::visit([](auto ptr) { return static_cast<const void*>(ptr); },
|
|
operand->location.pointer);
|
|
CHECK(data != nullptr);
|
|
operand->lifetime = nn::Operand::LifeTime::CONSTANT_REFERENCE;
|
|
operand->location = memoryBuilder->append(data, operand->location.length);
|
|
}
|
|
|
|
void copyPointersToSharedMemory(nn::Model::Subgraph* subgraph,
|
|
nn::ConstantMemoryBuilder* memoryBuilder) {
|
|
CHECK(subgraph != nullptr);
|
|
std::for_each(subgraph->operands.begin(), subgraph->operands.end(),
|
|
[memoryBuilder](auto& operand) {
|
|
copyPointersToSharedMemory(&operand, memoryBuilder);
|
|
});
|
|
}
|
|
|
|
} // anonymous namespace
|
|
|
|
nn::Capabilities::OperandPerformanceTable makeQuantized8PerformanceConsistentWithP(
|
|
const nn::Capabilities::PerformanceInfo& float32Performance,
|
|
const nn::Capabilities::PerformanceInfo& quantized8Performance) {
|
|
// In Android P, most data types are treated as having the same performance as
|
|
// TENSOR_QUANT8_ASYMM. This collection must be in sorted order.
|
|
std::vector<nn::Capabilities::OperandPerformance> operandPerformances = {
|
|
{.type = nn::OperandType::FLOAT32, .info = float32Performance},
|
|
{.type = nn::OperandType::INT32, .info = quantized8Performance},
|
|
{.type = nn::OperandType::UINT32, .info = quantized8Performance},
|
|
{.type = nn::OperandType::TENSOR_FLOAT32, .info = float32Performance},
|
|
{.type = nn::OperandType::TENSOR_INT32, .info = quantized8Performance},
|
|
{.type = nn::OperandType::TENSOR_QUANT8_ASYMM, .info = quantized8Performance},
|
|
{.type = nn::OperandType::OEM, .info = quantized8Performance},
|
|
{.type = nn::OperandType::TENSOR_OEM_BYTE, .info = quantized8Performance},
|
|
};
|
|
return nn::Capabilities::OperandPerformanceTable::create(std::move(operandPerformances))
|
|
.value();
|
|
}
|
|
|
|
bool hasNoPointerData(const nn::Model& model) {
|
|
return hasNoPointerData(model.main) && hasNoPointerData(model.referenced);
|
|
}
|
|
|
|
bool hasNoPointerData(const nn::Request& request) {
|
|
return hasNoPointerData(request.inputs) && hasNoPointerData(request.outputs);
|
|
}
|
|
|
|
nn::GeneralResult<std::reference_wrapper<const nn::Model>> flushDataFromPointerToShared(
|
|
const nn::Model* model, std::optional<nn::Model>* maybeModelInSharedOut) {
|
|
CHECK(model != nullptr);
|
|
CHECK(maybeModelInSharedOut != nullptr);
|
|
|
|
if (hasNoPointerData(*model)) {
|
|
return *model;
|
|
}
|
|
|
|
// Make a copy of the model in order to make modifications. The modified model is returned to
|
|
// the caller through `maybeModelInSharedOut` if the function succeeds.
|
|
nn::Model modelInShared = *model;
|
|
|
|
nn::ConstantMemoryBuilder memoryBuilder(modelInShared.pools.size());
|
|
copyPointersToSharedMemory(&modelInShared.main, &memoryBuilder);
|
|
std::for_each(modelInShared.referenced.begin(), modelInShared.referenced.end(),
|
|
[&memoryBuilder](auto& subgraph) {
|
|
copyPointersToSharedMemory(&subgraph, &memoryBuilder);
|
|
});
|
|
|
|
if (!memoryBuilder.empty()) {
|
|
auto memory = NN_TRY(memoryBuilder.finish());
|
|
modelInShared.pools.push_back(std::move(memory));
|
|
}
|
|
|
|
*maybeModelInSharedOut = modelInShared;
|
|
return **maybeModelInSharedOut;
|
|
}
|
|
|
|
template <>
|
|
void InputRelocationTracker::flush() const {
|
|
// Copy from pointers to shared memory.
|
|
uint8_t* memoryPtr = static_cast<uint8_t*>(std::get<void*>(kMapping.pointer));
|
|
for (const auto& [data, length, offset] : kRelocationInfos) {
|
|
std::memcpy(memoryPtr + offset, data, length);
|
|
}
|
|
}
|
|
|
|
template <>
|
|
void OutputRelocationTracker::flush() const {
|
|
// Copy from shared memory to pointers.
|
|
const uint8_t* memoryPtr = static_cast<const uint8_t*>(
|
|
std::visit([](auto ptr) { return static_cast<const void*>(ptr); }, kMapping.pointer));
|
|
for (const auto& [data, length, offset] : kRelocationInfos) {
|
|
std::memcpy(data, memoryPtr + offset, length);
|
|
}
|
|
}
|
|
|
|
nn::GeneralResult<std::reference_wrapper<const nn::Request>> convertRequestFromPointerToShared(
|
|
const nn::Request* request, uint32_t alignment, uint32_t padding,
|
|
std::optional<nn::Request>* maybeRequestInSharedOut, RequestRelocation* relocationOut) {
|
|
CHECK(request != nullptr);
|
|
CHECK(maybeRequestInSharedOut != nullptr);
|
|
CHECK(relocationOut != nullptr);
|
|
|
|
if (hasNoPointerData(*request)) {
|
|
return *request;
|
|
}
|
|
|
|
// Make a copy of the request in order to make modifications. The modified request is returned
|
|
// to the caller through `maybeRequestInSharedOut` if the function succeeds.
|
|
nn::Request requestInShared = *request;
|
|
|
|
RequestRelocation relocation;
|
|
|
|
// Change input pointers to shared memory.
|
|
nn::MutableMemoryBuilder inputBuilder(requestInShared.pools.size());
|
|
std::vector<InputRelocationInfo> inputRelocationInfos;
|
|
for (auto& input : requestInShared.inputs) {
|
|
const auto& location = input.location;
|
|
if (input.lifetime != nn::Request::Argument::LifeTime::POINTER) {
|
|
continue;
|
|
}
|
|
|
|
input.lifetime = nn::Request::Argument::LifeTime::POOL;
|
|
const void* data = std::visit([](auto ptr) { return static_cast<const void*>(ptr); },
|
|
location.pointer);
|
|
CHECK(data != nullptr);
|
|
input.location = inputBuilder.append(location.length, alignment, padding);
|
|
inputRelocationInfos.push_back({data, input.location.length, input.location.offset});
|
|
}
|
|
|
|
// Allocate input memory.
|
|
if (!inputBuilder.empty()) {
|
|
auto memory = NN_TRY(inputBuilder.finish());
|
|
requestInShared.pools.push_back(memory);
|
|
relocation.input = NN_TRY(
|
|
InputRelocationTracker::create(std::move(inputRelocationInfos), std::move(memory)));
|
|
}
|
|
|
|
// Change output pointers to shared memory.
|
|
nn::MutableMemoryBuilder outputBuilder(requestInShared.pools.size());
|
|
std::vector<OutputRelocationInfo> outputRelocationInfos;
|
|
for (auto& output : requestInShared.outputs) {
|
|
const auto& location = output.location;
|
|
if (output.lifetime != nn::Request::Argument::LifeTime::POINTER) {
|
|
continue;
|
|
}
|
|
|
|
output.lifetime = nn::Request::Argument::LifeTime::POOL;
|
|
void* data = std::get<void*>(location.pointer);
|
|
CHECK(data != nullptr);
|
|
output.location = outputBuilder.append(location.length, alignment, padding);
|
|
outputRelocationInfos.push_back({data, output.location.length, output.location.offset});
|
|
}
|
|
|
|
// Allocate output memory.
|
|
if (!outputBuilder.empty()) {
|
|
auto memory = NN_TRY(outputBuilder.finish());
|
|
requestInShared.pools.push_back(memory);
|
|
relocation.output = NN_TRY(OutputRelocationTracker::create(std::move(outputRelocationInfos),
|
|
std::move(memory)));
|
|
}
|
|
|
|
*maybeRequestInSharedOut = requestInShared;
|
|
*relocationOut = std::move(relocation);
|
|
return **maybeRequestInSharedOut;
|
|
}
|
|
|
|
} // namespace android::hardware::neuralnetworks::utils
|