ArmNN
 25.11
Loading...
Searching...
No Matches
Deserializer.hpp
Go to the documentation of this file.
1//
2// Copyright © 2017,2019-2024 Arm Ltd and Contributors. All rights reserved.
3// SPDX-License-Identifier: MIT
4//
5
6#pragma once
7
8#include <armnn/INetwork.hpp>
10#include <ArmnnSchema_generated.h>
11
12#include <unordered_map>
13
14namespace armnnDeserializer
15{
16
17// Shorthands for deserializer types
18using ConstTensorRawPtr = const armnnSerializer::ConstTensor *;
19using GraphPtr = const armnnSerializer::SerializedGraph *;
20using TensorRawPtr = const armnnSerializer::TensorInfo *;
21using Pooling2dDescriptor = const armnnSerializer::Pooling2dDescriptor *;
22using Pooling3dDescriptor = const armnnSerializer::Pooling3dDescriptor *;
23using NormalizationDescriptorPtr = const armnnSerializer::NormalizationDescriptor *;
24using LstmDescriptorPtr = const armnnSerializer::LstmDescriptor *;
25using LstmInputParamsPtr = const armnnSerializer::LstmInputParams *;
26using QLstmDescriptorPtr = const armnnSerializer::QLstmDescriptor *;
27using QunatizedLstmInputParamsPtr = const armnnSerializer::QuantizedLstmInputParams *;
28using TensorRawPtrVector = std::vector<TensorRawPtr>;
29using LayerRawPtr = const armnnSerializer::LayerBase *;
30using LayerBaseRawPtr = const armnnSerializer::LayerBase *;
31using LayerBaseRawPtrVector = std::vector<LayerBaseRawPtr>;
32using UnidirectionalSequenceLstmDescriptorPtr = const armnnSerializer::UnidirectionalSequenceLstmDescriptor *;
33
35{
36public:
37
38 /// Create an input network from binary file contents
39 armnn::INetworkPtr CreateNetworkFromBinary(const std::vector<uint8_t>& binaryContent);
40
41 /// Create an input network from a binary input stream
42 armnn::INetworkPtr CreateNetworkFromBinary(std::istream& binaryContent);
43
44 /// Retrieve binding info (layer id and tensor info) for the network input identified by the given layer name
45 BindingPointInfo GetNetworkInputBindingInfo(unsigned int layerId, const std::string& name) const;
46
47 /// Retrieve binding info (layer id and tensor info) for the network output identified by the given layer name
48 BindingPointInfo GetNetworkOutputBindingInfo(unsigned int layerId, const std::string& name) const;
49
51 ~DeserializerImpl() = default;
52
53 // No copying allowed until it is wanted and properly implemented
56
57 // testable helpers
58 static GraphPtr LoadGraphFromBinary(const uint8_t* binaryContent, size_t len);
59 static TensorRawPtrVector GetInputs(const GraphPtr& graph, unsigned int layerIndex);
60 static TensorRawPtrVector GetOutputs(const GraphPtr& graph, unsigned int layerIndex);
61 static LayerBaseRawPtr GetBaseLayer(const GraphPtr& graphPtr, unsigned int layerIndex);
62 static int32_t GetBindingLayerInfo(const GraphPtr& graphPtr, unsigned int layerIndex);
63 static std::string GetLayerName(const GraphPtr& graph, unsigned int index);
65 unsigned int layerIndex);
67 unsigned int layerIndex);
69 NormalizationDescriptorPtr normalizationDescriptor, unsigned int layerIndex);
72 LstmInputParamsPtr lstmInputParams);
76 static armnn::TensorInfo OutputShapeOfReshape(const armnn::TensorInfo & inputTensorInfo,
77 const std::vector<uint32_t> & targetDimsIn);
78
79private:
80 /// Create the network from an already loaded flatbuffers graph
81 armnn::INetworkPtr CreateNetworkFromGraph(GraphPtr graph);
82
83 // signature for the parser functions
84 using LayerParsingFunction = void(DeserializerImpl::*)(GraphPtr graph, unsigned int layerIndex);
85
86 void ParseUnsupportedLayer(GraphPtr graph, unsigned int layerIndex);
87 void ParseAbs(GraphPtr graph, unsigned int layerIndex);
88 void ParseActivation(GraphPtr graph, unsigned int layerIndex);
89 void ParseAdd(GraphPtr graph, unsigned int layerIndex);
90 void ParseArgMinMax(GraphPtr graph, unsigned int layerIndex);
91 void ParseBatchMatMul(GraphPtr graph, unsigned int layerIndex);
92 void ParseBatchToSpaceNd(GraphPtr graph, unsigned int layerIndex);
93 void ParseBatchNormalization(GraphPtr graph, unsigned int layerIndex);
94 void ParseCast(GraphPtr graph, unsigned int layerIndex);
95 void ParseChannelShuffle(GraphPtr graph, unsigned int layerIndex);
96 void ParseComparison(GraphPtr graph, unsigned int layerIndex);
97 void ParseConcat(GraphPtr graph, unsigned int layerIndex);
98 void ParseConstant(GraphPtr graph, unsigned int layerIndex);
99 void ParseConvolution2d(GraphPtr graph, unsigned int layerIndex);
100 void ParseConvolution3d(GraphPtr graph, unsigned int layerIndex);
101 void ParseDepthToSpace(GraphPtr graph, unsigned int layerIndex);
102 void ParseDepthwiseConvolution2d(GraphPtr graph, unsigned int layerIndex);
103 void ParseDequantize(GraphPtr graph, unsigned int layerIndex);
104 void ParseDetectionPostProcess(GraphPtr graph, unsigned int layerIndex);
105 void ParseDivision(GraphPtr graph, unsigned int layerIndex);
106 void ParseElementwiseBinary(GraphPtr graph, unsigned int layerIndex);
107 void ParseElementwiseUnary(GraphPtr graph, unsigned int layerIndex);
108 void ParseEqual(GraphPtr graph, unsigned int layerIndex);
109 void ParseFill(GraphPtr graph, unsigned int layerIndex);
110 void ParseFloor(GraphPtr graph, unsigned int layerIndex);
111 void ParseFullyConnected(GraphPtr graph, unsigned int layerIndex);
112 void ParseGather(GraphPtr graph, unsigned int layerIndex);
113 void ParseGatherNd(GraphPtr graph, unsigned int layerIndex);
114 void ParseGreater(GraphPtr graph, unsigned int layerIndex);
115 void ParseInstanceNormalization(GraphPtr graph, unsigned int layerIndex);
116 void ParseL2Normalization(GraphPtr graph, unsigned int layerIndex);
117 void ParseLogicalBinary(GraphPtr graph, unsigned int layerIndex);
118 void ParseLogSoftmax(GraphPtr graph, unsigned int layerIndex);
119 void ParseMaximum(GraphPtr graph, unsigned int layerIndex);
120 void ParseMean(GraphPtr graph, unsigned int layerIndex);
121 void ParseMinimum(GraphPtr graph, unsigned int layerIndex);
122 void ParseMerge(GraphPtr graph, unsigned int layerIndex);
123 void ParseMultiplication(GraphPtr graph, unsigned int layerIndex);
124 void ParseNormalization(GraphPtr graph, unsigned int layerIndex);
125 void ParseLstm(GraphPtr graph, unsigned int layerIndex);
126 void ParseQuantizedLstm(GraphPtr graph, unsigned int layerIndex);
127 void ParsePad(GraphPtr graph, unsigned int layerIndex);
128 void ParsePermute(GraphPtr graph, unsigned int layerIndex);
129 void ParsePooling2d(GraphPtr graph, unsigned int layerIndex);
130 void ParsePooling3d(GraphPtr graph, unsigned int layerIndex);
131 void ParsePrelu(GraphPtr graph, unsigned int layerIndex);
132 void ParseQLstm(GraphPtr graph, unsigned int layerIndex);
133 void ParseQuantize(GraphPtr graph, unsigned int layerIndex);
134 void ParseRank(GraphPtr graph, unsigned int layerIndex);
135 void ParseReduce(GraphPtr graph, unsigned int layerIndex);
136 void ParseReshape(GraphPtr graph, unsigned int layerIndex);
137 void ParseResize(GraphPtr graph, unsigned int layerIndex);
138 void ParseResizeBilinear(GraphPtr graph, unsigned int layerIndex);
139 void ParseReverseV2(GraphPtr graph, unsigned int layerIndex);
140 void ParseRsqrt(GraphPtr graph, unsigned int layerIndex);
141 void ParseScatterNd(GraphPtr graph, unsigned int layerIndex);
142 void ParseShape(GraphPtr graph, unsigned int layerIndex);
143 void ParseSlice(GraphPtr graph, unsigned int layerIndex);
144 void ParseSoftmax(GraphPtr graph, unsigned int layerIndex);
145 void ParseSpaceToBatchNd(GraphPtr graph, unsigned int layerIndex);
146 void ParseSpaceToDepth(GraphPtr graph, unsigned int layerIndex);
147 void ParseSplitter(GraphPtr graph, unsigned int layerIndex);
148 void ParseStack(GraphPtr graph, unsigned int layerIndex);
149 void ParseStandIn(GraphPtr graph, unsigned int layerIndex);
150 void ParseStridedSlice(GraphPtr graph, unsigned int layerIndex);
151 void ParseSubtraction(GraphPtr graph, unsigned int layerIndex);
152 void ParseSwitch(GraphPtr graph, unsigned int layerIndex);
153 void ParseTile(GraphPtr graph, unsigned int layerIndex);
154 void ParseTranspose(GraphPtr graph, unsigned int layerIndex);
155 void ParseTransposeConvolution2d(GraphPtr graph, unsigned int layerIndex);
156 void ParseUnidirectionalSequenceLstm(GraphPtr graph, unsigned int layerIndex);
157
158 void RegisterInputSlots(GraphPtr graph,
159 uint32_t layerIndex,
161 std::vector<unsigned int> ignoreSlots = {});
162 void RegisterOutputSlots(GraphPtr graph,
163 uint32_t layerIndex,
165
166 // NOTE index here must be from flatbuffer object index property
167 void RegisterOutputSlotOfConnection(uint32_t sourceLayerIndex, uint32_t outputSlotIndex, armnn::IOutputSlot* slot);
168 void RegisterInputSlotOfConnection(uint32_t sourceLayerIndex, uint32_t outputSlotIndex, armnn::IInputSlot* slot);
169
170 void ResetParser();
171
172 void SetupInputLayers(GraphPtr graphPtr);
173 void SetupOutputLayers(GraphPtr graphPtr);
174
175 /// Helper to get the index of the layer in the flatbuffer vector from its bindingId property
176 unsigned int GetInputLayerInVector(GraphPtr graph, int targetId);
177 unsigned int GetOutputLayerInVector(GraphPtr graph, int targetId);
178
179 /// Helper to get the index of the layer in the flatbuffer vector from its index property
180 unsigned int GetLayerIndexInVector(GraphPtr graph, unsigned int index);
181
182 struct FeatureVersions
183 {
184 // Version of the binding id scheme; defaults to zero for backward compatibility
185 unsigned int m_BindingIdScheme = 0;
186
187 // Version of the weights layout scheme; defaults to zero for backward compatibility
188 unsigned int m_WeightsLayoutScheme = 0;
189
190 // Version of the const-tensors-as-inputs feature; defaults to zero for backward compatibility
191 unsigned int m_ConstTensorsAsInputs = 0;
192 };
193
194 FeatureVersions GetFeatureVersions(GraphPtr graph);
195
196 /// The network we're building. Gets cleared after it is passed to the user
197 armnn::INetworkPtr m_Network;
198 std::vector<LayerParsingFunction> m_ParserFunctions;
199
200 using NameToBindingInfo = std::pair<std::string, BindingPointInfo >;
201 std::vector<NameToBindingInfo> m_InputBindings;
202 std::vector<NameToBindingInfo> m_OutputBindings;
203
204 /// Describes the connections of a single layer: its output slots and the input slots they feed
205 struct Connections
206 {
207 // Maps output slot index (property in flatbuffer object) to IOutputSlot pointer
208 std::unordered_map<unsigned int, armnn::IOutputSlot*> outputSlots;
209
210 // Maps output slot index to the IInputSlot pointers that the output slot should be connected to
211 std::unordered_map<unsigned int, std::vector<armnn::IInputSlot*>> inputSlots;
212 };
213
214 /// Maps layer index (index property in flatbuffer object) to Connections for each layer
215 std::unordered_map<unsigned int, Connections> m_GraphConnections;
216};
217
218} // namespace armnnDeserializer
Interface for a layer that is connectable to other layers via InputSlots and OutputSlots.
Definition INetwork.hpp:81
An input connection slot for a layer.
Definition INetwork.hpp:26
An output connection slot for a layer.
Definition INetwork.hpp:54
static GraphPtr LoadGraphFromBinary(const uint8_t *binaryContent, size_t len)
static armnn::Pooling3dDescriptor GetPooling3dDescriptor(Pooling3dDescriptor pooling3dDescriptor, unsigned int layerIndex)
BindingPointInfo GetNetworkOutputBindingInfo(unsigned int layerId, const std::string &name) const
Retrieve binding info (layer id and tensor info) for the network output identified by the given layer name.
static armnn::LstmInputParams GetLstmInputParams(LstmDescriptorPtr lstmDescriptor, LstmInputParamsPtr lstmInputParams)
armnn::INetworkPtr CreateNetworkFromBinary(const std::vector< uint8_t > &binaryContent)
Create an input network from binary file contents.
static armnn::QLstmDescriptor GetQLstmDescriptor(QLstmDescriptorPtr qLstmDescriptorPtr)
BindingPointInfo GetNetworkInputBindingInfo(unsigned int layerId, const std::string &name) const
Retrieve binding info (layer id and tensor info) for the network input identified by the given layer name.
DeserializerImpl(const DeserializerImpl &)=delete
static armnn::TensorInfo OutputShapeOfReshape(const armnn::TensorInfo &inputTensorInfo, const std::vector< uint32_t > &targetDimsIn)
static TensorRawPtrVector GetOutputs(const GraphPtr &graph, unsigned int layerIndex)
static armnn::NormalizationDescriptor GetNormalizationDescriptor(NormalizationDescriptorPtr normalizationDescriptor, unsigned int layerIndex)
static LayerBaseRawPtr GetBaseLayer(const GraphPtr &graphPtr, unsigned int layerIndex)
static armnn::Pooling2dDescriptor GetPooling2dDescriptor(Pooling2dDescriptor pooling2dDescriptor, unsigned int layerIndex)
static TensorRawPtrVector GetInputs(const GraphPtr &graph, unsigned int layerIndex)
static armnn::UnidirectionalSequenceLstmDescriptor GetUnidirectionalSequenceLstmDescriptor(UnidirectionalSequenceLstmDescriptorPtr descriptor)
DeserializerImpl & operator=(const DeserializerImpl &)=delete
static std::string GetLayerName(const GraphPtr &graph, unsigned int index)
static armnn::LstmDescriptor GetLstmDescriptor(LstmDescriptorPtr lstmDescriptor)
static int32_t GetBindingLayerInfo(const GraphPtr &graphPtr, unsigned int layerIndex)
const armnnSerializer::LstmDescriptor * LstmDescriptorPtr
const armnnSerializer::NormalizationDescriptor * NormalizationDescriptorPtr
const armnnSerializer::SerializedGraph * GraphPtr
const armnnSerializer::LayerBase * LayerRawPtr
const armnnSerializer::QLstmDescriptor * QLstmDescriptorPtr
const armnnSerializer::Pooling3dDescriptor * Pooling3dDescriptor
const armnnSerializer::ConstTensor * ConstTensorRawPtr
const armnnSerializer::QuantizedLstmInputParams * QunatizedLstmInputParamsPtr
const armnnSerializer::Pooling2dDescriptor * Pooling2dDescriptor
const armnnSerializer::TensorInfo * TensorRawPtr
const armnnSerializer::LayerBase * LayerBaseRawPtr
const armnnSerializer::LstmInputParams * LstmInputParamsPtr
const armnnSerializer::UnidirectionalSequenceLstmDescriptor * UnidirectionalSequenceLstmDescriptorPtr
std::vector< LayerBaseRawPtr > LayerBaseRawPtrVector
std::vector< TensorRawPtr > TensorRawPtrVector
LstmDescriptor UnidirectionalSequenceLstmDescriptor
std::unique_ptr< INetwork, void(*)(INetwork *network)> INetworkPtr
Definition INetwork.hpp:339
An LstmDescriptor for the LstmLayer.
A NormalizationDescriptor for the NormalizationLayer.
A Pooling2dDescriptor for the Pooling2dLayer.
A Pooling3dDescriptor for the Pooling3dLayer.
A QLstmDescriptor for the QLstmLayer.