ArmNN 25.11
TosaRefLayerSupport.cpp
//
// Copyright © 2022-2025 Arm Ltd and Contributors. All rights reserved.
// SPDX-License-Identifier: MIT
//

#include "TosaRefLayerSupport.hpp"

#include <tosaCommon/TosaMappings.hpp>

#include <armnn/Types.hpp>
#include <armnn/utility/IgnoreUnused.hpp>
#include <armnn/utility/PolymorphicDowncast.hpp>

#include <graph_status.h>
#include <model_runner.h>

#include <vector>

namespace armnn
{

bool TosaRefLayerSupport::IsLayerSupported(const LayerType& type,
                                           const std::vector<TensorInfo>& infos,
                                           const BaseDescriptor& descriptor,
                                           const Optional<LstmInputParamsInfo>& lstmParamsInfo,
                                           const Optional<QuantizedLstmInputParamsInfo>& quantizedLstmInputParamsInfo,
                                           Optional<std::string&> reasonIfUnsupported) const
{
    for (const auto& info : infos)
    {
        if (info.GetDataType() == DataType::Signed64)
        {
            reasonIfUnsupported.value() = "TOSA does not have INT64 support for TOSARef backend";
            return false;
        }

        // ArmNN U8 tensors are supported for TOSA if they are followed or preceded by a Quantize layer
        if (info.GetDataType() == DataType::QAsymmU8 &&
            type != LayerType::Input &&
            type != LayerType::Quantize &&
            type != LayerType::Output)
        {
            reasonIfUnsupported.value() = "Must use a Quantize layer to/from unsigned INT for TOSARef backend";
            return false;
        }
    }
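    // The check above means, for example, that a QAsymmU8 tensor feeding a Convolution2d
    // directly is rejected; only Input, Quantize and Output layers may carry unsigned
    // 8-bit data on this backend.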

    IgnoreUnused(lstmParamsInfo);
    IgnoreUnused(quantizedLstmInputParamsInfo);
    IgnoreUnused(reasonIfUnsupported);

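    // Pointers to the operand TensorInfos for this layer; the switch below populates
    // them according to each layer type's input/output pattern.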
    std::vector<const TensorInfo*> inputInfos;
    std::vector<const TensorInfo*> outputInfos;

    switch (type)
    {
        case LayerType::Input:
        case LayerType::Output:
            return true;
        // Two-input, one-output layers, e.g. ElementwiseBinary (the other case labels
        // here were lost from this listing).
        case LayerType::ElementwiseBinary:
            // Setup inputs and outputs
            inputInfos.push_back(&infos[0]);
            inputInfos.push_back(&infos[1]);
            outputInfos.push_back(&infos[2]);
            break;
        case LayerType::Concat:
            for (unsigned int i = 0; i < infos.size() - 1; ++i)
            {
                inputInfos.push_back(&infos[i]);
            }
            outputInfos.push_back(&infos.back());
            break;
        case LayerType::Constant:
            outputInfos.push_back(&infos[0]);
            break;
        case LayerType::Convolution2d:
        {
            inputInfos.push_back(&infos[0]);  // input
            outputInfos.push_back(&infos[1]); // output
            inputInfos.push_back(&infos[2]);  // weights

            auto conv2dDesc = PolymorphicDowncast<const Convolution2dDescriptor*>(&descriptor);
            if(conv2dDesc->m_BiasEnabled)
            {
                inputInfos.push_back(&infos[3]); // bias
            }
            break;
        }
        case LayerType::Convolution3d:
        {
            inputInfos.push_back(&infos[0]);  // input
            outputInfos.push_back(&infos[1]); // output
            inputInfos.push_back(&infos[2]);  // weights

            auto conv3dDesc = PolymorphicDowncast<const Convolution3dDescriptor*>(&descriptor);
            if(conv3dDesc->m_BiasEnabled)
            {
                inputInfos.push_back(&infos[3]); // bias
            }
            break;
        }
        case LayerType::DepthwiseConvolution2d:
        {
            inputInfos.push_back(&infos[0]);  // input
            outputInfos.push_back(&infos[1]); // output
            inputInfos.push_back(&infos[2]);  // weights

            auto conv2dDesc = PolymorphicDowncast<const DepthwiseConvolution2dDescriptor*>(&descriptor);
            if(conv2dDesc->m_BiasEnabled)
            {
                inputInfos.push_back(&infos[3]); // bias
            }
            break;
        }
        case LayerType::FullyConnected:
        {
            inputInfos.push_back(&infos[0]);  // input
            outputInfos.push_back(&infos[1]); // output
            inputInfos.push_back(&infos[2]);  // weights
            auto fullyConnectedDesc = PolymorphicDowncast<const FullyConnectedDescriptor*>(&descriptor);
            if(fullyConnectedDesc->m_BiasEnabled)
            {
                inputInfos.push_back(&infos[3]); // bias
            }
            break;
        }
        // Single-input, single-output layers (some case labels here were lost
        // from this listing; Pad, Mean and Slice survive).
        case LayerType::Pad:
        case LayerType::Mean:
        case LayerType::Slice:
        {
            inputInfos.push_back(&infos[0]);
            outputInfos.push_back(&infos[1]);
            break;
        }
        case LayerType::Splitter:
        {
            inputInfos.push_back(&infos[0]);
            for (unsigned int i = 1; i < infos.size(); ++i)
            {
                outputInfos.push_back(&infos[i]);
            }
            break;
        }
        case LayerType::TransposeConvolution2d:
        {
            inputInfos.push_back(&infos[0]);  // input
            outputInfos.push_back(&infos[1]); // output
            inputInfos.push_back(&infos[2]);  // weights

            auto conv2dDesc = PolymorphicDowncast<const TransposeConvolution2dDescriptor*>(&descriptor);
            if(conv2dDesc->m_BiasEnabled)
            {
                inputInfos.push_back(&infos[3]); // bias
            }
            break;
        }
        case LayerType::Stack:
        {
            auto stackDesc = PolymorphicDowncast<const StackDescriptor*>(&descriptor);
            for (unsigned int i = 0; i < stackDesc->m_NumInputs; ++i)
            {
                inputInfos.emplace_back(&infos[i]);
            }
            outputInfos.emplace_back(&infos[stackDesc->m_NumInputs]);
            break;
        }
        default:
            // Default to false for all unsupported layers.
            return false;
    }

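    // Build the TOSA mapping for this single layer. There is no Layer object in this
    // context, so nullptr is passed; the tensor infos and descriptor are sufficient.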
    auto mappings = GetTosaMapping(nullptr, type, inputInfos, outputInfos, descriptor);
    if (mappings->GetName() == "")
    {
        // There currently isn't a TOSA mapping for this layer, as the default was returned.
        return false;
    }

    TosaSerializationHandler handler;

    // Add all mappings to main block.
    auto* block = new TosaSerializationBasicBlock("main",
                                                  "main",
                                                  mappings->GetOperators(),
                                                  mappings->GetTensors(),
                                                  mappings->GetInputs(),
                                                  mappings->GetOutputs());

    std::vector<TosaSerializationBasicBlock*> blocks;
    blocks.emplace_back(block);

    // Add blocks to the main region.
    auto* region = new TosaSerializationRegion("main", blocks);
    handler.GetRegions().emplace_back(region);

    GraphStatus status;
    TosaReference::IModelRunner runner;

#if !defined(TOSA_REFERENCE_MODEL_OUTPUT)
    // There currently isn't a way to disable the output from the TOSA Reference Model, but it does have a file pointer
    // to write debug output to, so set this to /dev/null (if it exists on the system) to hide the output.
    func_debug_t funcDebug;

    FILE* file = fopen("/dev/null", "w");
    funcDebug.func_debug_file = (file == nullptr) ? stderr : file;

    runner.setFuncDebug(funcDebug);
#endif

    // Initialise the model runner with the TosaSerializationHandler, which runs validation on the mapping.
    status = runner.initialize(handler);

#if !defined(TOSA_REFERENCE_MODEL_OUTPUT)
    // Reset FuncDebug, as its settings can persist across multiple IModelRunner instances.
    funcDebug.func_debug_file = stderr;
    runner.setFuncDebug(funcDebug);
#endif

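    // Initialisation succeeds only if the serialized graph validates: TOSA_ERROR and
    // TOSA_UNPREDICTABLE both mean the layer cannot be run on the TOSA reference model.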
    if(status == GraphStatus::TOSA_ERROR || status == GraphStatus::TOSA_UNPREDICTABLE)
    {
        return false;
    }
    else
    {
        return true;
    }
}

} // namespace armnn
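
The following is a minimal usage sketch, not part of the file above: it shows how IsLayerSupported might be queried directly for a single two-input layer. The tensor shapes, the ElementwiseBinary addition descriptor, and the assumption that this is compiled inside the tosaReference backend source tree (and linked against Arm NN and the TOSA reference model) are all illustrative.

// Hypothetical standalone check of one layer against the TosaRef backend.
#include "TosaRefLayerSupport.hpp" // assumed reachable on the include path

#include <armnn/Descriptors.hpp>
#include <armnn/Tensor.hpp>

#include <iostream>
#include <string>

int main()
{
    armnn::TosaRefLayerSupport support;

    // Two FP32 inputs and one output, matching the two-input pattern handled above.
    armnn::TensorInfo in0({1, 2, 2, 3}, armnn::DataType::Float32);
    armnn::TensorInfo in1({1, 2, 2, 3}, armnn::DataType::Float32);
    armnn::TensorInfo out({1, 2, 2, 3}, armnn::DataType::Float32);

    armnn::ElementwiseBinaryDescriptor desc(armnn::BinaryOperation::Add);

    std::string reason;
    bool supported = support.IsLayerSupported(armnn::LayerType::ElementwiseBinary,
                                              {in0, in1, out},
                                              desc,
                                              armnn::EmptyOptional(), // no LSTM params
                                              armnn::EmptyOptional(), // no quantized LSTM params
                                              armnn::Optional<std::string&>(reason));

    if (supported)
    {
        std::cout << "Layer is supported by the TosaRef backend" << std::endl;
    }
    else
    {
        std::cout << "Not supported: " << reason << std::endl;
    }
    return 0;
}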