Added SubGraphContext to manage creating SubGraph Flatbuffers
Bug: 237410741
Test: Built libneuralnetworks_v2 properly
Change-Id: I0be19a8d7827fd6e3cf6c597ce0f81b420ae6b51
diff --git a/runtime/Android.bp b/runtime/Android.bp
index bfc8194..29815ea 100644
--- a/runtime/Android.bp
+++ b/runtime/Android.bp
@@ -174,6 +174,9 @@
cc_defaults {
name: "libneuralnetworks_v2_defaults",
defaults: ["libneuralnetworks_defaults"],
+ srcs: [
+ "operation_converters/SubGraphContext.cpp",
+ ],
static_libs: [
"libtflite_static",
diff --git a/runtime/FlatbufferModelBuilderUtils.h b/runtime/FlatbufferModelBuilderUtils.h
index edd1eaf..05f311d 100644
--- a/runtime/FlatbufferModelBuilderUtils.h
+++ b/runtime/FlatbufferModelBuilderUtils.h
@@ -31,6 +31,7 @@
using SubGraphFlatbuffer = flatbuffers::Offset<tflite::SubGraph>;
using SubGraphsFlatbuffer = flatbuffers::Offset<flatbuffers::Vector<SubGraphFlatbuffer>>;
+using OperatorCodeFlatbuffer = flatbuffers::Offset<tflite::OperatorCode>;
using OperatorFlatbuffer = flatbuffers::Offset<tflite::Operator>;
using OperatorsFlatbuffer = flatbuffers::Offset<flatbuffers::Vector<OperatorFlatbuffer>>;
@@ -75,6 +76,20 @@
}
}
+// Referenced from external/tensorflow/tensorflow/lite/tools/versioning/op_version.cc
+inline int32_t getMaxOperatorVersionCode(tflite::BuiltinOperator builtinCode) {
+ // TODO: Add more builtin_codes
+ switch (builtinCode) {
+ case tflite::BuiltinOperator::BuiltinOperator_CONV_2D:
+ return 5;
+ case tflite::BuiltinOperator::BuiltinOperator_PAD:
+ return 4;
+ default:
+ LOG(FATAL) << "BuiltinOperator not supported: " << builtinCode;
+ return {};
+ }
+}
+
} // namespace nn
} // namespace android
diff --git a/runtime/operation_converters/SubGraphContext.cpp b/runtime/operation_converters/SubGraphContext.cpp
new file mode 100644
index 0000000..4ecd4ed
--- /dev/null
+++ b/runtime/operation_converters/SubGraphContext.cpp
@@ -0,0 +1,190 @@
+/*
+ * Copyright (C) 2022 The Android Open Source Project
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+#define LOG_TAG "SubGraphContext"
+
+#include "SubGraphContext.h"
+
+#include "FlatbufferModelBuilderUtils.h"
+
+namespace android {
+namespace nn {
+
+SubGraphContext::SubGraphContext(const Model* model, const Model::Subgraph* subgraph,
+ flatbuffers::FlatBufferBuilder* builder,
+                                 std::vector<OperatorCodeFlatbuffer>* opCodesVector,
+ std::vector<int>* opCodeIndexForOperationType,
+ std::vector<BufferFlatbuffer>* bufferVector)
+ : mModel(model),
+ mSubgraph(subgraph),
+ mBuilder(builder),
+ mOpCodesVector(opCodesVector),
+ mOpCodeIndexForOperationType(opCodeIndexForOperationType),
+ mBufferVector(bufferVector) {
+ CHECK(model != nullptr);
+ CHECK(subgraph != nullptr);
+ CHECK(opCodesVector != nullptr);
+ CHECK(opCodeIndexForOperationType != nullptr);
+ CHECK(bufferVector != nullptr);
+
+ mOperandToTensorIdx.resize(subgraph->operands.size(), -1);
+ mMappings.resize(model->pools.size());
+}
+
+SubGraphFlatbuffer SubGraphContext::finish() {
+ return tflite::CreateSubGraphDirect(*mBuilder, &mTensorVector, &mInputTensors, &mOutputTensors,
+ &mOperatorVector);
+}
+
+int SubGraphContext::addTensorFlatbuffer(TensorFlatbuffer tensor, int32_t operandIdx) {
+ mTensorVector.push_back(tensor);
+
+ int tensorIdx = mTensorVector.size() - 1;
+ if (operandIdx >= 0) {
+ CHECK(mOperandToTensorIdx[operandIdx] == -1);
+ mOperandToTensorIdx[operandIdx] = tensorIdx;
+ }
+ return tensorIdx;
+}
+
+void SubGraphContext::addOperatorFlatbuffer(OperatorFlatbuffer opFlatbuffer) {
+ mOperatorVector.push_back(opFlatbuffer);
+}
+
+void SubGraphContext::addSubGraphInput(int32_t operandIdx) {
+ CHECK(mOperandToTensorIdx[operandIdx] != -1);
+ mInputTensors.push_back(mOperandToTensorIdx[operandIdx]);
+}
+
+void SubGraphContext::addSubGraphOutput(int32_t operandIdx) {
+ CHECK(mOperandToTensorIdx[operandIdx] != -1);
+ mOutputTensors.push_back(mOperandToTensorIdx[operandIdx]);
+}
+
+uint32_t SubGraphContext::getOpCodeIndex(OperationType operationType) const {
+ uint32_t idx = static_cast<uint32_t>(operationType);
+ CHECK(mOpCodeIndexForOperationType->at(idx) != -1);
+ return (*mOpCodeIndexForOperationType)[idx];
+}
+
+void SubGraphContext::addOpCode(OperationType operationType) {
+ uint32_t idx = static_cast<uint32_t>(operationType);
+ if (mOpCodeIndexForOperationType->at(idx) != -1) {
+ return;
+ }
+
+ OperatorCodeFlatbuffer opCode;
+
+ tflite::BuiltinOperator builtinCode = getFlatbufferOperator(operationType);
+ if (builtinCode < tflite::BuiltinOperator::BuiltinOperator_PLACEHOLDER_FOR_GREATER_OP_CODES)
+ opCode = tflite::CreateOperatorCode(
+ *mBuilder, static_cast<int8_t>(builtinCode) /* deprecated_builtin_code */,
+ 0 /* custom_code */, getMaxOperatorVersionCode(builtinCode) /* version */);
+ else
+ opCode = tflite::CreateOperatorCode(*mBuilder, 0 /* deprecated_builtin_code */,
+ 0 /* custom_code */,
+ getMaxOperatorVersionCode(builtinCode) /* version */,
+ builtinCode /* builtin_code */);
+
+ mOpCodesVector->push_back(opCode);
+ (*mOpCodeIndexForOperationType)[idx] = mOpCodesVector->size() - 1;
+}
+
+int SubGraphContext::getTensorIdxFromOperandIdx(int operandIdx) const {
+ return mOperandToTensorIdx[operandIdx];
+}
+
+const Mapping& SubGraphContext::getMapping(uint32_t poolIndex) {
+ if (mMappings[poolIndex].size > 0) {
+ return mMappings[poolIndex];
+ }
+
+ SharedMemory memory = mModel->pools[poolIndex];
+ GeneralResult<Mapping> mapping = map(memory);
+ CHECK(mapping.has_value()) << "CONSTANT_REFERENCE memory mapping error: "
+ << mapping.error().message;
+
+ mMappings[poolIndex] = std::move(mapping).value();
+ return mMappings[poolIndex];
+}
+
+std::pair<const uint8_t*, uint32_t> SubGraphContext::getConstantPointerAndLength(
+ const Operand& operand) {
+ CHECK(operand.lifetime == Operand::LifeTime::CONSTANT_COPY ||
+ operand.lifetime == Operand::LifeTime::CONSTANT_REFERENCE);
+
+ if (operand.lifetime == Operand::LifeTime::CONSTANT_COPY) {
+ return std::make_pair(mModel->operandValues.data() + operand.location.offset,
+ operand.location.length);
+ }
+
+ const Mapping& mapping = getMapping(operand.location.poolIndex);
+ const uint8_t* memoryPtr = static_cast<const uint8_t*>(
+ std::visit([](auto ptr) { return static_cast<const void*>(ptr); }, mapping.pointer));
+
+ return std::make_pair(memoryPtr + operand.location.offset, operand.location.length);
+}
+
+uint32_t SubGraphContext::addBufferFromData(const uint8_t* data, uint32_t length) {
+ auto dataVectorFlatbuffer = mBuilder->CreateVector(data, length);
+
+ auto buffer = tflite::CreateBuffer(*mBuilder, dataVectorFlatbuffer);
+ mBufferVector->push_back(buffer);
+
+ return mBufferVector->size() - 1;
+}
+
+void SubGraphContext::createTensorFlatbufferFromOperand(uint32_t operandIdx) {
+ // An output Operand to one Operation can be an input Operand to
+ // another Operation, so this function can be run more than once.
+ // We simply return if the Tensor for the Operand is already created.
+ if (mOperandToTensorIdx[operandIdx] != -1) return;
+
+ const Operand& operand = mSubgraph->operands[operandIdx];
+
+ bool isConstant = operand.lifetime == Operand::LifeTime::CONSTANT_COPY ||
+ operand.lifetime == Operand::LifeTime::CONSTANT_REFERENCE;
+
+ std::vector<float> scaleVector{operand.scale};
+ std::vector<int64_t> zeroPointVector{operand.zeroPoint};
+
+ // build quantization parameters
+ auto quantizationParams = tflite::CreateQuantizationParametersDirect(
+ *mBuilder, 0 /* min */, 0 /* max */, &scaleVector /* scale */,
+ &zeroPointVector /* zero_point */,
+ tflite::QuantizationDetails::QuantizationDetails_NONE /* details_type */);
+
+ // add buffer if constant operand
+ // buffer at index 0 is reserved for tensors without a buffer
+ uint32_t bufferIdx = 0;
+ if (isConstant) {
+ auto [data, dataLength] = getConstantPointerAndLength(operand);
+ bufferIdx = addBufferFromData(data, dataLength);
+ }
+
+ // shape of tensor
+ std::vector<int32_t> shape(operand.dimensions.begin(), operand.dimensions.end());
+ std::replace(shape.begin(), shape.end(), 0, -1);
+
+ // build tensor
+ TensorFlatbuffer tensor = tflite::CreateTensorDirect(
+ *mBuilder, &shape, getTensorFlatbufferOperandType(operand.type) /* type */,
+ bufferIdx /* buffer */, 0 /* name */, quantizationParams /* quantization */);
+ addTensorFlatbuffer(tensor, operandIdx);
+}
+
+} // namespace nn
+} // namespace android
\ No newline at end of file
diff --git a/runtime/operation_converters/SubGraphContext.h b/runtime/operation_converters/SubGraphContext.h
new file mode 100644
index 0000000..55bda8a
--- /dev/null
+++ b/runtime/operation_converters/SubGraphContext.h
@@ -0,0 +1,100 @@
+/*
+ * Copyright (C) 2022 The Android Open Source Project
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+#ifndef ANDROID_PACKAGES_MODULES_NEURALNETWORKS_RUNTIME_OPERATION_CONVERTERS_SUBGRAPH_CONTEXT_H
+#define ANDROID_PACKAGES_MODULES_NEURALNETWORKS_RUNTIME_OPERATION_CONVERTERS_SUBGRAPH_CONTEXT_H
+
+#include <utility>
+#include <vector>
+
+#include "FlatbufferModelBuilderUtils.h"
+#include "NeuralNetworks.h"
+
+namespace android {
+namespace nn {
+
+// This keeps track of all the data needed to convert NNAPI subgraphs to TFLite subgraphs
+// This also provides information needed to convert NNAPI Operations to TFLite Operators
+// Once the subgraph is done building, call finish() to return the flatbuffer
+class SubGraphContext {
+ public:
+ SubGraphContext(const Model* model, const Model::Subgraph* subgraph,
+ flatbuffers::FlatBufferBuilder* builder,
+                    std::vector<OperatorCodeFlatbuffer>* opCodesVector,
+ std::vector<int>* opCodeIndexForOperationType,
+ std::vector<BufferFlatbuffer>* bufferVector);
+
+ SubGraphFlatbuffer finish();
+
+ // If the operandIdx is -1, it suggests that the tensor being added doesn't have a
+ // corresponding Operand from the NNAPI NDK model.
+ // Returns index of Tensor being added.
+ int addTensorFlatbuffer(TensorFlatbuffer tensor, int32_t operandIdx = -1);
+ void addOperatorFlatbuffer(OperatorFlatbuffer opFlatbuffer);
+ void addSubGraphInput(int32_t operandIdx);
+ void addSubGraphOutput(int32_t operandIdx);
+
+ void addOpCode(OperationType operationType);
+
+ const Model::Subgraph* getSubgraph() const { return mSubgraph; }
+ // Returns -1 if there is no corresponding tensor index
+ int getTensorIdxFromOperandIdx(int operandIdx) const;
+ uint32_t getOpCodeIndex(OperationType operationType) const;
+ flatbuffers::FlatBufferBuilder* getBuilder() { return mBuilder; }
+
+ // OperandLifeTime must be CONSTANT_COPY or CONSTANT_REFERENCE
+ // Will crash if OperandLifeTime is not either of the two.
+ // dataSize is the size of value in bytes.
+ template <typename Type>
+ void copyConstantValueToData(const Operand& operand, Type* data, size_t dataSize);
+
+ // Returns Buffer index
+ uint32_t addBufferFromData(const uint8_t* data, uint32_t length);
+ void createTensorFlatbufferFromOperand(uint32_t operandIdx);
+
+ private:
+ const Mapping& getMapping(uint32_t poolIndex);
+ std::pair<const uint8_t*, uint32_t> getConstantPointerAndLength(const Operand& operand);
+
+ const Model* mModel;
+ const Model::Subgraph* mSubgraph;
+ flatbuffers::FlatBufferBuilder* mBuilder;
+
+    std::vector<OperatorCodeFlatbuffer>* mOpCodesVector;
+ std::vector<int>* mOpCodeIndexForOperationType;
+ std::vector<BufferFlatbuffer>* mBufferVector;
+
+ std::vector<OperatorFlatbuffer> mOperatorVector;
+ std::vector<TensorFlatbuffer> mTensorVector;
+ std::vector<int32_t> mInputTensors;
+ std::vector<int32_t> mOutputTensors;
+ std::vector<int> mOperandToTensorIdx;
+ // Each index corresponds to the pool index of shared memory
+ std::vector<Mapping> mMappings;
+};
+
+template <typename Type>
+void SubGraphContext::copyConstantValueToData(const Operand& operand, Type* data, size_t dataSize) {
+ auto [pointer, length] = getConstantPointerAndLength(operand);
+ CHECK_GE(dataSize, length);
+
+ std::memcpy(data, pointer, length);
+}
+
+} // namespace nn
+} // namespace android
+
+#endif // ANDROID_PACKAGES_MODULES_NEURALNETWORKS_RUNTIME_OPERATION_CONVERTERS_SUBGRAPH_CONTEXT_H
\ No newline at end of file