12 const std::vector<const TensorInfo*>& inputs,
13 const std::vector<const TensorInfo*>& outputs,
16 std::vector<std::string> inputNames;
17 std::string outputName = std::string(
"output0_");
20 DType inputDType0 =
ArmNNToDType(inputs[0]->GetDataType());
21 DType outputDType0 =
ArmNNToDType(outputs[0]->GetDataType());
26 inputNames.emplace_back(
"input_0");
27 inputNames.emplace_back(
"input_1");
30 inputNames.emplace_back(
"input_2");
39 for (uint32_t i = 0; i < inputs.size(); ++i)
42 inputNames.push_back(inputName);
49 std::vector<TosaSerializationTensor*> tensors;
50 std::vector<TosaSerializationOperator*> operators;
57 if(inputNames[0].find(
"input_") != std::string::npos)
59 tensors.push_back(
new TosaSerializationTensor(inputNames[0], inputShape0, inputDType0, {}));
65 if(!inputs[1]->IsConstant() || layer ==
nullptr)
67 int32_t multiplier = inputShape1[3]/inputShape0[3];
70 std::vector<int32_t> inputShapeHWCM = {
71 inputShape1[1], inputShape1[2], inputShape0[3], multiplier
74 DType inputDType1 =
ArmNNToDType(inputs[1]->GetDataType());
76 tensors.push_back(
new TosaSerializationTensor(inputNames[1], inputShapeHWCM, inputDType1, {}));
81 if(!inputs[2]->IsConstant() || layer ==
nullptr)
84 DType inputDType2 =
ArmNNToDType(inputs[2]->GetDataType());
86 tensors.push_back(
new TosaSerializationTensor(inputNames[2], inputShape2, inputDType2, {}));
94 operators.push_back(
new TosaSerializationOperator(Op_CONST, Attribute_NONE,
nullptr, {}, {constantName}));
97 unsigned int index = (conv2dDescriptor->
m_DataLayout == DataLayout::NHWC) ? 3 : 1;
99 const DType dType = (inputDType0 == DType_INT8) ? DType_INT32 : outputDType0;
100 std::vector<float> data(outputs[0]->GetShape()[index], 0);
102 std::vector<uint8_t> uint8Data;
103 TosaSerializationHandler::ConvertF32toU8(data, uint8Data);
105 tensors.push_back(
new TosaSerializationTensor(constantName,
106 {
static_cast<int32_t
>(outputs[0]->GetShape()[index])},
109 inputNames.emplace_back(constantName);
114 std::string outputConv2dName;
115 bool isInputInt8 = (inputDType0 == DType_INT8);
119 tensors.push_back(
new TosaSerializationTensor(outputConv2dName, outputShape0, DType_INT32, {}));
123 tensors.push_back(
new TosaSerializationTensor(outputName, outputShape0, outputDType0, {}));
127 std::vector<int> pad = {
static_cast<int>(conv2dDescriptor->
m_PadTop),
129 static_cast<int>(conv2dDescriptor->
m_PadLeft),
130 static_cast<int>(conv2dDescriptor->
m_PadRight)};
131 std::vector<int> stride = {
static_cast<int>(conv2dDescriptor->
m_StrideY),
132 static_cast<int>(conv2dDescriptor->
m_StrideX)};
133 std::vector<int> dilation = {
static_cast<int>(conv2dDescriptor->
m_DilationY),
135 TosaConvAttribute attribute(pad, stride, dilation,
136 inputs[0]->GetQuantizationOffset(),
137 inputs[1]->GetQuantizationOffset(),
151 std::string& convOutStr = isInputInt8 ? outputConv2dName : outputName;
152 auto* conv2d_op =
new TosaSerializationOperator(Op_DEPTHWISE_CONV2D,
153 Attribute_ConvAttribute,
155 {sliceOutputName, inputNames[1], inputNames[2]},
157 operators.push_back(conv2d_op);
161 int32_t output_zp = outputs[0]->GetQuantizationOffset();
162 double output_scale = outputs[0]->GetQuantizationScales()[0];
163 double input_scale = inputs[0]->GetQuantizationScales()[0];
164 const std::vector<float>& weight_scales = inputs[1]->GetQuantizationScales();
166 TosaSerializationOperator* rescaleOp =
nullptr;
179 operators.push_back(rescaleOp);
180 tensors.push_back(
new TosaSerializationTensor(outputName,
187 return new TosaSerializationBasicBlock(blockName,
std::string GetInputSlicedToItsUsedSize(const std::vector< int32_t > &inputShape, const std::string &inputName, const DataLayout layout, const DType datatype, const std::vector< int32_t > &kernel, const std::vector< int32_t > &pad, const std::vector< int32_t > &stride, const std::vector< int32_t > &dilations, std::vector< TosaSerializationTensor * > &tensors, std::vector< TosaSerializationOperator * > &operators, const bool isPoolingOp=false)
void CreateRescaleTosaOperatorForWeights(const std::string &inputName, const std::string &outputName, int32_t input_zp, int32_t output_zp, bool input_unsigned, bool output_unsigned, bool double_round, bool scale32, double input_scale, double output_scale, const std::vector< float > &weight_scales, TosaSerializationOperator **op)
Creates a TOSA rescale operator for weight tensors.