armnn/latest/_lstm_8cpp_source.html

 //

 // Copyright © 2021 Arm Ltd and Contributors. All rights reserved.

 // SPDX-License-Identifier: MIT

 //


 #include "Activation.hpp"

 #include "Lstm.hpp"

 #include "LstmUtils.hpp"


 namespace armnn

 {


 /// Evaluates one LSTM cell step on float data accessed through Decoder/Encoder iterators.
 ///
 /// Dimensions are taken from the arguments as follows:
 ///   - nBatch  = inputInfo.GetShape()[0]
 ///   - nInput  = inputInfo.GetShape()[1]
 ///   - nCell   = inputToOutputWeightsShape[0]
 ///   - nOutput = recurrentToOutputWeightsShape[1]
 ///
 /// Optional tensors are only dereferenced when the matching descriptor flag requires them:
 ///   - inputToInputWeightsTensor, recurrentToInputWeightsTensor, inputGateBiasTensor,
 ///     cellToInputWeightsTensor, inputLayerNormWeights and the input gate scratch pair:
 ///     only when descriptor.m_CifgEnabled is false.
 ///   - cellTo*WeightsTensor: only when descriptor.m_PeepholeEnabled is true.
 ///   - *LayerNormWeights: only when descriptor.m_LayerNormEnabled is true.
 ///   - projectionWeightsTensor: only when descriptor.m_ProjectionEnabled is true.
 ///   - projectionBiasTensor: may be null even when projection is enabled.
 ///
 /// Each "*Scratch" encoder is written and then read back through the matching "*ScratchDecoder";
 /// likewise cellStateOut/cellStateOutDecoder and output/outputDecoder. They are therefore expected
 /// to be views of the same underlying buffer (NOTE(review): confirm against the calling workload).
 ///
 /// @param descriptor        LSTM configuration (CIFG, peephole, layer norm, projection, clipping,
 ///                          activation function).
 /// @param inputInfo         Tensor info of the input; supplies nBatch and nInput.
 /// @param outputInfo        Tensor info of the output; supplies the data type used for the
 ///                          TensorInfo passed to Activation().
 /// @param layerNormEpsilon  Epsilon forwarded to MeanStddevNormalization().
 void LstmImpl(const LstmDescriptor& descriptor,
               const TensorInfo& inputInfo,
               const TensorInfo& outputInfo,
               const TensorShape& inputToOutputWeightsShape,
               const TensorShape& recurrentToOutputWeightsShape,
               std::unique_ptr<Decoder<float>>& inputData,
               std::unique_ptr<Decoder<float>>& outputStateIn,
               std::unique_ptr<Decoder<float>>& cellStateIn,
               std::unique_ptr<Encoder<float>>& outputStateOut,
               std::unique_ptr<Encoder<float>>& cellStateOut,
               std::unique_ptr<Encoder<float>>& output,
               std::unique_ptr<Decoder<float>>& cellStateOutDecoder,
               std::unique_ptr<Decoder<float>>& outputDecoder,
               std::unique_ptr<Decoder<float>>& inputToInputWeightsTensor,
               std::unique_ptr<Decoder<float>>& inputToForgetWeightsTensor,
               std::unique_ptr<Decoder<float>>& inputToCellWeightsTensor,
               std::unique_ptr<Decoder<float>>& inputToOutputWeightsTensor,
               std::unique_ptr<Decoder<float>>& recurrentToInputWeightsTensor,
               std::unique_ptr<Decoder<float>>& recurrentToForgetWeightsTensor,
               std::unique_ptr<Decoder<float>>& recurrentToCellWeightsTensor,
               std::unique_ptr<Decoder<float>>& recurrentToOutputWeightsTensor,
               std::unique_ptr<Decoder<float>>& cellToInputWeightsTensor,
               std::unique_ptr<Decoder<float>>& cellToForgetWeightsTensor,
               std::unique_ptr<Decoder<float>>& cellToOutputWeightsTensor,
               std::unique_ptr<Decoder<float>>& inputGateBiasTensor,
               std::unique_ptr<Decoder<float>>& forgetGateBiasTensor,
               std::unique_ptr<Decoder<float>>& cellBiasTensor,
               std::unique_ptr<Decoder<float>>& outputGateBiasTensor,
               std::unique_ptr<Decoder<float>>& projectionWeightsTensor,
               std::unique_ptr<Decoder<float>>& projectionBiasTensor,
               std::unique_ptr<Decoder<float>>& inputLayerNormWeights,
               std::unique_ptr<Decoder<float>>& forgetLayerNormWeights,
               std::unique_ptr<Decoder<float>>& cellLayerNormWeights,
               std::unique_ptr<Decoder<float>>& outputLayerNormWeights,
               std::unique_ptr<Encoder<float>>& inputGateScratch,
               std::unique_ptr<Encoder<float>>& cellScratch,
               std::unique_ptr<Encoder<float>>& forgetGateScratch,
               std::unique_ptr<Encoder<float>>& outputGateScratch,
               std::unique_ptr<Decoder<float>>& inputGateScratchDecoder,
               std::unique_ptr<Decoder<float>>& cellScratchDecoder,
               std::unique_ptr<Decoder<float>>& forgetGateScratchDecoder,
               std::unique_ptr<Decoder<float>>& outputGateScratchDecoder,
               float layerNormEpsilon)
 {
     // This is a port of the LSTM::Eval() method in the Android code base.
     // Refer to: android/frameworks/ml/nn/common/operations/LSTM.cpp

     const TensorShape& inputShape = inputInfo.GetShape();
     // GetDataType() returns by value, so hold the result by value as well.
     const DataType outputType = outputInfo.GetDataType();

     const uint32_t nBatch = inputShape[0];
     const uint32_t nInput = inputShape[1];

     const uint32_t nCell   = inputToOutputWeightsShape[0];
     const uint32_t nOutput = recurrentToOutputWeightsShape[1];

     // Element counts of the flat [batch x cell] and [batch x output] buffers.
     const uint32_t nCellElements   = nBatch * nCell;
     const uint32_t nOutputElements = nBatch * nOutput;

     const bool useCifg      = descriptor.m_CifgEnabled;
     const bool usePeephole  = descriptor.m_PeepholeEnabled;
     const bool useLayerNorm = descriptor.m_LayerNormEnabled;

     // Tensor info handed to every Activation() call on a gate/cell scratch buffer.
     const TensorInfo gateInfo({nCell, nBatch}, outputType);

     // Seed the scratch buffers: the matrix products below accumulate into them.
     // With layer normalisation the bias is added after normalising, so start from zero instead.
     if (useLayerNorm)
     {
         if (!useCifg)
         {
             ZeroVector(*inputGateScratch, nCellElements);
         }
         ZeroVector(*forgetGateScratch, nCellElements);
         ZeroVector(*cellScratch,       nCellElements);
         ZeroVector(*outputGateScratch, nCellElements);
     }
     else
     {
         if (!useCifg)
         {
             VectorBatchVectorAssign(*inputGateBiasTensor, nCell, nBatch, *inputGateScratch);
         }
         VectorBatchVectorAssign(*forgetGateBiasTensor, nCell, nBatch, *forgetGateScratch);
         VectorBatchVectorAssign(*cellBiasTensor,       nCell, nBatch, *cellScratch);
         VectorBatchVectorAssign(*outputGateBiasTensor, nCell, nBatch, *outputGateScratch);
     }

     // For each batch and cell: compute input_weight * input.
     if (!useCifg)
     {
         MatrixBatchVectorMultiplyAccumulate(*inputToInputWeightsTensor,
                                             nCell, nInput, *inputData, nBatch, *inputGateScratch);
     }
     MatrixBatchVectorMultiplyAccumulate(*inputToForgetWeightsTensor,
                                         nCell, nInput, *inputData, nBatch, *forgetGateScratch);
     MatrixBatchVectorMultiplyAccumulate(*inputToCellWeightsTensor,
                                         nCell, nInput, *inputData, nBatch, *cellScratch);
     MatrixBatchVectorMultiplyAccumulate(*inputToOutputWeightsTensor,
                                         nCell, nInput, *inputData, nBatch, *outputGateScratch);

     // For each batch and cell: compute recurrent_weight * output_state.
     if (!useCifg)
     {
         MatrixBatchVectorMultiplyAccumulate(*recurrentToInputWeightsTensor,
                                             nCell, nOutput, *outputStateIn, nBatch, *inputGateScratch);
     }
     MatrixBatchVectorMultiplyAccumulate(*recurrentToForgetWeightsTensor,
                                         nCell, nOutput, *outputStateIn, nBatch, *forgetGateScratch);
     MatrixBatchVectorMultiplyAccumulate(*recurrentToCellWeightsTensor,
                                         nCell, nOutput, *outputStateIn, nBatch, *cellScratch);
     MatrixBatchVectorMultiplyAccumulate(*recurrentToOutputWeightsTensor,
                                         nCell, nOutput, *outputStateIn, nBatch, *outputGateScratch);

     // For each batch and cell: update input gate.
     if (!useCifg)
     {
         if (usePeephole)
         {
             VectorBatchVectorCwiseProductAccumulate(*cellToInputWeightsTensor,
                                                     nCell, *cellStateIn, nBatch, *inputGateScratch);
         }
         if (useLayerNorm)
         {
             MeanStddevNormalization(*inputGateScratchDecoder,
                                     *inputGateScratch, nCell, nBatch, layerNormEpsilon);
             VectorBatchVectorCwiseProduct(*inputLayerNormWeights,
                                           nCell, *inputGateScratchDecoder, nBatch, *inputGateScratch);
             VectorBatchVectorAdd(*inputGateBiasTensor,
                                  nCell, *inputGateScratchDecoder, nBatch, *inputGateScratch);
         }
         Activation(*inputGateScratchDecoder, *inputGateScratch,
                    gateInfo,
                    ActivationFunction::Sigmoid, 0, 0);
     }

     // For each batch and cell: update forget gate.
     if (usePeephole)
     {
         VectorBatchVectorCwiseProductAccumulate(*cellToForgetWeightsTensor, nCell,
                                                 *cellStateIn, nBatch, *forgetGateScratch);
     }
     if (useLayerNorm)
     {
         MeanStddevNormalization(*forgetGateScratchDecoder,
                                 *forgetGateScratch, nCell, nBatch, layerNormEpsilon);
         VectorBatchVectorCwiseProduct(*forgetLayerNormWeights,
                                       nCell, *forgetGateScratchDecoder, nBatch, *forgetGateScratch);
         VectorBatchVectorAdd(*forgetGateBiasTensor,
                              nCell, *forgetGateScratchDecoder, nBatch, *forgetGateScratch);
     }
     Activation(*forgetGateScratchDecoder, *forgetGateScratch,
                gateInfo,
                ActivationFunction::Sigmoid, 0, 0);

     // For each batch and cell: update the cell.
     if (useLayerNorm)
     {
         MeanStddevNormalization(*cellScratchDecoder,
                                 *cellScratch, nCell, nBatch, layerNormEpsilon);
         VectorBatchVectorCwiseProduct(*cellLayerNormWeights,
                                       nCell, *cellScratchDecoder, nBatch, *cellScratch);
         VectorBatchVectorAdd(*cellBiasTensor,
                              nCell, *cellScratchDecoder, nBatch, *cellScratch);
     }

     // cellStateOut = forgetGate * cellStateIn. This must run before the CIFG branch below
     // overwrites the forget gate scratch buffer.
     VectorVectorCwiseProduct(*forgetGateScratchDecoder, *cellStateIn, nCellElements, *cellStateOut);

     // Translate the descriptor's activation id into an ArmNN activation function and its parameters.
     ActivationFunction armnnActivationFunc = ActivationFunction::Sigmoid;
     float a = 0;
     float b = 0;
     SetActivationParameters(descriptor.m_ActivationFunc, armnnActivationFunc, a, b);

     if (descriptor.m_ActivationFunc > 0)
     {
         Activation(*cellScratchDecoder, *cellScratch,
                    gateInfo,
                    armnnActivationFunc, a, b);
     }
     if (useCifg)
     {
         // With CIFG there is no separate input gate: it is derived from the forget gate via
         // Sub1Vector, reusing the forget gate scratch buffer.
         Sub1Vector(*forgetGateScratchDecoder, nCellElements, *forgetGateScratch);
         VectorVectorCwiseProductAccumulate(
             *cellScratchDecoder, *forgetGateScratchDecoder, nCellElements, *cellStateOut);
     }
     else
     {
         VectorVectorCwiseProductAccumulate(
             *cellScratchDecoder, *inputGateScratchDecoder, nCellElements, *cellStateOut);
     }
     if (descriptor.m_ClippingThresCell > 0.0f)
     {
         ClipVector(*cellStateOutDecoder, nCellElements, descriptor.m_ClippingThresCell, *cellStateOut);
     }

     // For each batch and cell: update the output gate.
     if (usePeephole)
     {
         VectorBatchVectorCwiseProductAccumulate(*cellToOutputWeightsTensor,
                                                 nCell, *cellStateOutDecoder, nBatch, *outputGateScratch);
     }
     if (useLayerNorm)
     {
         MeanStddevNormalization(*outputGateScratchDecoder,
                                 *outputGateScratch, nCell, nBatch, layerNormEpsilon);
         VectorBatchVectorCwiseProduct(*outputLayerNormWeights,
                                       nCell, *outputGateScratchDecoder, nBatch, *outputGateScratch);
         VectorBatchVectorAdd(*outputGateBiasTensor,
                              nCell, *outputGateScratchDecoder, nBatch, *outputGateScratch);
     }
     Activation(*outputGateScratchDecoder, *outputGateScratch,
                gateInfo,
                ActivationFunction::Sigmoid, 0, 0);

     // NOTE(review): when m_ActivationFunc is 0 this step is skipped, so cellScratch still holds the
     // cell input computed above rather than the new cell state when it is multiplied with the
     // output gate. This mirrors the code as ported; confirm whether it is intended.
     if (descriptor.m_ActivationFunc > 0)
     {
         Activation(*cellStateOutDecoder, *cellScratch,
                    gateInfo,
                    armnnActivationFunc, a, b);
     }

     VectorVectorCwiseProduct(*outputGateScratchDecoder, *cellScratchDecoder, nCellElements, *outputGateScratch);

     // For each batch: update the projection and output_state.
     if (descriptor.m_ProjectionEnabled)
     {
         // The projection product below accumulates into 'output' (the gate scratch buffers above
         // are seeded with bias/zero for the same reason). Seed it with the projection bias when
         // one is supplied and with zeroes otherwise, so stale buffer contents never leak into
         // the result.
         if (projectionBiasTensor)
         {
             VectorBatchVectorAssign(*projectionBiasTensor,
                                     nOutput, nBatch, *output);
         }
         else
         {
             ZeroVector(*output, nOutputElements);
         }
         MatrixBatchVectorMultiplyAccumulate(*projectionWeightsTensor,
                                             nOutput, nCell, *outputGateScratchDecoder, nBatch, *output);

         if (descriptor.m_ClippingThresProj > 0.0f)
         {
             ClipVector(*outputDecoder, nOutputElements, descriptor.m_ClippingThresProj, *output);
         }
     }
     else
     {
         CopyVector(*outputGateScratchDecoder, nOutputElements, *output);
     }

     // The new output state is a copy of the output just produced.
     CopyVector(*outputDecoder, nOutputElements, *outputStateOut);
 }


 } //namespace armnn

Activation.hpp

Lstm.hpp

CopyVector
void CopyVector(armnn::Decoder< float > &vector, uint32_t vSize, armnn::Encoder< float > &outResult)
Definition: LstmUtils.cpp:244

MeanStddevNormalization
void MeanStddevNormalization(armnn::Decoder< float > &input_vector, armnn::Encoder< float > &output_vector, uint32_t v_size, uint32_t n_batch, float normalization_epsilon)
Definition: LstmUtils.cpp:40

ClipVector
void ClipVector(armnn::Decoder< float > &vector, uint32_t vSize, float absLimit, armnn::Encoder< float > &outResult)
Definition: LstmUtils.cpp:229

VectorBatchVectorCwiseProduct
void VectorBatchVectorCwiseProduct(armnn::Decoder< float > &vector, uint32_t vSize, armnn::Decoder< float > &batchVector, uint32_t nBatch, armnn::Encoder< float > &outResult)
Definition: LstmUtils.cpp:152

VectorVectorCwiseProductAccumulate
void VectorVectorCwiseProductAccumulate(armnn::Decoder< float > &vector1, armnn::Decoder< float > &vector2, uint32_t vSize, armnn::Encoder< float > &outResult)
Definition: LstmUtils.cpp:204

VectorBatchVectorAdd
void VectorBatchVectorAdd(armnn::Decoder< float > &vector, uint32_t vSize, armnn::Decoder< float > &batchVector, uint32_t nBatch, armnn::Encoder< float > &outResult)
Definition: LstmUtils.cpp:16

ZeroVector
void ZeroVector(armnn::Encoder< float > &vector, uint32_t vSize)
Definition: LstmUtils.cpp:76

VectorVectorCwiseProduct
void VectorVectorCwiseProduct(armnn::Decoder< float > &vector1, armnn::Decoder< float > &vector2, uint32_t vSize, armnn::Encoder< float > &outResult)
Definition: LstmUtils.cpp:187

VectorBatchVectorCwiseProductAccumulate
void VectorBatchVectorCwiseProductAccumulate(armnn::Decoder< float > &vector, uint32_t vSize, armnn::Decoder< float > &batchVector, uint32_t nBatch, armnn::Encoder< float > &outResult)
Definition: LstmUtils.cpp:131

VectorBatchVectorAssign
void VectorBatchVectorAssign(armnn::Decoder< float > &vector, uint32_t vSize, uint32_t nBatch, armnn::Encoder< float > &outBatchVector)
Definition: LstmUtils.cpp:113

MatrixBatchVectorMultiplyAccumulate
void MatrixBatchVectorMultiplyAccumulate(armnn::Decoder< float > &matrix, uint32_t mRows, uint32_t mCols, armnn::Decoder< float > &vector, uint32_t nBatch, armnn::Encoder< float > &outResult)
Definition: LstmUtils.cpp:87

Sub1Vector
void Sub1Vector(armnn::Decoder< float > &vector, uint32_t vSize, armnn::Encoder< float > &result)
Definition: LstmUtils.cpp:173

SetActivationParameters
void SetActivationParameters(uint32_t activation, armnn::ActivationFunction &outArmnnActivation, float &outA, float &outB)
Definition: LstmUtils.cpp:258

LstmUtils.hpp

armnn::Decoder< float >

armnn::Encoder< float >

armnn::TensorInfo
Definition: Tensor.hpp:153

armnn::TensorInfo::GetShape
const TensorShape & GetShape() const
Definition: Tensor.hpp:193

armnn::TensorInfo::GetDataType
DataType GetDataType() const
Definition: Tensor.hpp:200

armnn::TensorShape
Definition: Tensor.hpp:21

armnn
Copyright (c) 2021 ARM Limited and Contributors.
Definition: 01_00_quick_start.dox:7

armnn::ActivationFunction
ActivationFunction
Definition: Types.hpp:87

armnn::ActivationFunction::Sigmoid
@ Sigmoid

armnn::Activation
float Activation(float in, ActivationFunction function, float a, float b)
Definition: Activation.cpp:13

armnn::LstmImpl
void LstmImpl(const LstmDescriptor &descriptor, const TensorInfo &inputInfo, const TensorInfo &outputInfo, const TensorShape &inputToOutputWeightsShape, const TensorShape &recurrentToOutputWeightsShape, std::unique_ptr< Decoder< float >> &inputData, std::unique_ptr< Decoder< float >> &outputStateIn, std::unique_ptr< Decoder< float >> &cellStateIn, std::unique_ptr< Encoder< float >> &outputStateOut, std::unique_ptr< Encoder< float >> &cellStateOut, std::unique_ptr< Encoder< float >> &output, std::unique_ptr< Decoder< float >> &cellStateOutDecoder, std::unique_ptr< Decoder< float >> &outputDecoder, std::unique_ptr< Decoder< float >> &inputToInputWeightsTensor, std::unique_ptr< Decoder< float >> &inputToForgetWeightsTensor, std::unique_ptr< Decoder< float >> &inputToCellWeightsTensor, std::unique_ptr< Decoder< float >> &inputToOutputWeightsTensor, std::unique_ptr< Decoder< float >> &recurrentToInputWeightsTensor, std::unique_ptr< Decoder< float >> &recurrentToForgetWeightsTensor, std::unique_ptr< Decoder< float >> &recurrentToCellWeightsTensor, std::unique_ptr< Decoder< float >> &recurrentToOutputWeightsTensor, std::unique_ptr< Decoder< float >> &cellToInputWeightsTensor, std::unique_ptr< Decoder< float >> &cellToForgetWeightsTensor, std::unique_ptr< Decoder< float >> &cellToOutputWeightsTensor, std::unique_ptr< Decoder< float >> &inputGateBiasTensor, std::unique_ptr< Decoder< float >> &forgetGateBiasTensor, std::unique_ptr< Decoder< float >> &cellBiasTensor, std::unique_ptr< Decoder< float >> &outputGateBiasTensor, std::unique_ptr< Decoder< float >> &projectionWeightsTensor, std::unique_ptr< Decoder< float >> &projectionBiasTensor, std::unique_ptr< Decoder< float >> &inputLayerNormWeights, std::unique_ptr< Decoder< float >> &forgetLayerNormWeights, std::unique_ptr< Decoder< float >> &cellLayerNormWeights, std::unique_ptr< Decoder< float >> &outputLayerNormWeights, std::unique_ptr< Encoder< float >> &inputGateScratch, std::unique_ptr< Encoder< float >> &cellScratch, 
std::unique_ptr< Encoder< float >> &forgetGateScratch, std::unique_ptr< Encoder< float >> &outputGateScratch, std::unique_ptr< Decoder< float >> &inputGateScratchDecoder, std::unique_ptr< Decoder< float >> &cellScratchDecoder, std::unique_ptr< Decoder< float >> &forgetGateScratchDecoder, std::unique_ptr< Decoder< float >> &outputGateScratchDecoder, float layerNormEpsilon)
Definition: Lstm.cpp:13

armnn::DataType
DataType
Definition: Types.hpp:49

armnn::LstmDescriptor
An LstmDescriptor for the LstmLayer.
Definition: Descriptors.hpp:1103

armnn::LstmDescriptor::m_PeepholeEnabled
bool m_PeepholeEnabled
Enable/disable peephole.
Definition: Descriptors.hpp:1148

armnn::LstmDescriptor::m_LayerNormEnabled
bool m_LayerNormEnabled
Enable/disable layer normalization.
Definition: Descriptors.hpp:1152

armnn::LstmDescriptor::m_ClippingThresCell
float m_ClippingThresCell
Clipping threshold value for the cell state.
Definition: Descriptors.hpp:1142

armnn::LstmDescriptor::m_ProjectionEnabled
bool m_ProjectionEnabled
Enable/disable the projection layer.
Definition: Descriptors.hpp:1150

armnn::LstmDescriptor::m_ClippingThresProj
float m_ClippingThresProj
Clipping threshold value for the projection.
Definition: Descriptors.hpp:1144

armnn::LstmDescriptor::m_CifgEnabled
bool m_CifgEnabled
Enable/disable cifg (coupled input & forget gate).
Definition: Descriptors.hpp:1146

armnn::LstmDescriptor::m_ActivationFunc
uint32_t m_ActivationFunc
The activation function to use.
Definition: Descriptors.hpp:1140