armnn/latest/_convert_fp32_network_to_fp16_8hpp_source.html

//

// Copyright © 2017 Arm Ltd. All rights reserved.

// SPDX-License-Identifier: MIT

//

#pragma once


#include "Optimization.hpp"

#include "NetworkUtils.hpp"


namespace armnn

{

namespace optimizations

{


class ConvertFp32NetworkToFp16Impl

{

public:


    void Run(Graph& graph, Layer& layer) const

    {

        if(layer.GetType() == LayerType::Input)

        {

            // if the outputs of this layer are DataType::Float32

            // add a ConvertFloat32ToFloat16 layer after each of the outputs

            if (layer.GetDataType() == DataType::Float32)

            {

                InsertConvertFp32ToFp16LayersAfter(graph, layer);

            }

        }

        else if (layer.GetType() == LayerType::Output)

        {

            // For DetectionPostProcess Layer output is always Float32 regardless of input type

            Layer& connectedLayer = layer.GetInputSlots()[0].GetConnectedOutputSlot()->GetOwningLayer();

            if (connectedLayer.GetType() != LayerType::DetectionPostProcess)

            {

                // if the inputs of this layer are DataType::Float32

                // add a ConvertFloat16ToFloat32 layer before each of the inputs

                if (layer.GetDataType() == DataType::Float32)

                {

                    // NOTE: We need to call InsertConvertFp16ToFp32LayersBefore with expectCorrectInputType = false

                    // here, otherwise it will expect the inputs to be DataType::Float16

                    InsertConvertFp16ToFp32LayersBefore(graph, layer, false);

                }

            }

        }

        else if (layer.GetType() != LayerType::ConvertFp32ToFp16 && layer.GetType() != LayerType::ConvertFp16ToFp32)

        {

            // if the inputs/outputs of this layer are DataType::Float32

            // change the data type for all inputs and outputs to DataType::Float16

            for (auto&& input = layer.BeginInputSlots(); input != layer.EndInputSlots(); ++input)

            {

                // if it is connected to OutputSlot of the InputLayer do not change the DataType of connection

                // InputSlots of the current layer will be updated when conversion layer is inserted after InputLayer

                Layer& base = input->GetConnectedOutputSlot()->GetOwningLayer();

                if (base.GetType() != LayerType::Input)

                {

                    TensorInfo convertInfo = input->GetConnection()->GetTensorInfo();

                    if (convertInfo.GetDataType() == DataType::Float32)

                    {

                        convertInfo.SetDataType(DataType::Float16);

                        input->GetConnection()->SetTensorInfo(convertInfo);

                    }

                }

            }


            // For DetectionPostProcess Layer output is always Float32 regardless of input type

            if (layer.GetType() != LayerType::DetectionPostProcess)

            {

                // change outputs to DataType::Float16

                for (auto&& output = layer.BeginOutputSlots(); output != layer.EndOutputSlots(); ++output)

                {

                    TensorInfo convertInfo = output->GetTensorInfo();

                    if (convertInfo.GetDataType() == DataType::Float32)

                    {

                        convertInfo.SetDataType(DataType::Float16);

                        output->SetTensorInfo(convertInfo);

                    }

                }

            }

        }

    }


protected:

    ConvertFp32NetworkToFp16Impl() = default;

    ~ConvertFp32NetworkToFp16Impl() = default;

};


/// Optimization type that plugs ConvertFp32NetworkToFp16Impl into the OptimizeForType adaptor,
/// parameterised on the base Layer type.
/// NOTE(review): presumably this makes Run() get offered every layer in the graph rather than one
/// specific layer class - confirm against OptimizeForType in Optimization.hpp.
using Fp32NetworkToFp16Converter = OptimizeForType<Layer, ConvertFp32NetworkToFp16Impl>;


} // namespace optimizations

} // namespace armnn

NetworkUtils.hpp

Optimization.hpp

armnn::Graph
Definition Graph.hpp:31

armnn::Layer
Definition Layer.hpp:231

armnn::Layer::EndInputSlots
std::vector< InputSlot >::iterator EndInputSlots()
Definition Layer.hpp:263

armnn::Layer::GetInputSlots
const std::vector< InputSlot > & GetInputSlots() const
Definition Layer.hpp:258

armnn::Layer::BeginOutputSlots
std::vector< OutputSlot >::iterator BeginOutputSlots()
Definition Layer.hpp:266

armnn::Layer::GetType
LayerType GetType() const override
Returns the armnn::LayerType of this layer.
Definition Layer.hpp:286

armnn::Layer::BeginInputSlots
std::vector< InputSlot >::iterator BeginInputSlots()
Definition Layer.hpp:262

armnn::Layer::GetDataType
DataType GetDataType() const
Definition Layer.cpp:345

armnn::Layer::EndOutputSlots
std::vector< OutputSlot >::iterator EndOutputSlots()
Definition Layer.hpp:267

armnn::OptimizeForType
Definition Optimization.hpp:68

armnn::TensorInfo
Definition Tensor.hpp:153

armnn::TensorInfo::SetDataType
void SetDataType(DataType type)
Definition Tensor.hpp:201

armnn::TensorInfo::GetDataType
DataType GetDataType() const
Definition Tensor.hpp:200

armnn::optimizations::ConvertFp32NetworkToFp16Impl::~ConvertFp32NetworkToFp16Impl
~ConvertFp32NetworkToFp16Impl()=default

armnn::optimizations::ConvertFp32NetworkToFp16Impl::ConvertFp32NetworkToFp16Impl
ConvertFp32NetworkToFp16Impl()=default

armnn::optimizations::ConvertFp32NetworkToFp16Impl::Run
void Run(Graph &graph, Layer &layer) const
Definition ConvertFp32NetworkToFp16.hpp:18

armnn::optimizations
Definition AddBroadcastReshapeLayer.hpp:15

armnn::optimizations::Fp32NetworkToFp16Converter
OptimizeForType< Layer, ConvertFp32NetworkToFp16Impl > Fp32NetworkToFp16Converter
Definition ConvertFp32NetworkToFp16.hpp:87

armnn
Copyright (c) 2021 ARM Limited and Contributors.
Definition 01_00_quick_start.dox:7

armnn::LayerType::DetectionPostProcess
@ DetectionPostProcess
Definition Types.hpp:496

armnn::LayerType::Output
@ Output
Definition Types.hpp:496

armnn::LayerType::Input
@ Input
Definition Types.hpp:496

armnn::LayerType::ConvertFp16ToFp32
@ ConvertFp16ToFp32
Definition Types.hpp:496

armnn::LayerType::ConvertFp32ToFp16
@ ConvertFp32ToFp16
Definition Types.hpp:496

armnn::InsertConvertFp32ToFp16LayersAfter
std::vector< ConvertFp32ToFp16Layer * > InsertConvertFp32ToFp16LayersAfter(Graph &graph, Layer &layer)
Definition NetworkUtils.cpp:79

armnn::InsertConvertFp16ToFp32LayersBefore
std::vector< ConvertFp16ToFp32Layer * > InsertConvertFp16ToFp32LayersBefore(Graph &graph, Layer &layer, bool expectCorrectInputType)
Definition NetworkUtils.cpp:40

armnn::DataType::Float32
@ Float32
Definition Types.hpp:51

armnn::DataType::Float16
@ Float16
Definition Types.hpp:50