ArmNN 25.02 — Doxygen reference page for LoadedNetwork.hpp.
Navigation: All Classes | Namespaces | Files | Functions | Variables | Typedefs | Enumerations | Enumerator | Friends | Macros | Pages
LoadedNetwork.hpp
Go to the documentation of this file.
1 //
2 // Copyright © 2017, 2024 Arm Ltd and Contributors. All rights reserved.
3 // SPDX-License-Identifier: MIT
4 //
5 #pragma once
6 
7 #include "Network.hpp"
8 #include "LayerFwd.hpp"
9 #include "Profiling.hpp"
10 
11 #include <armnn/Tensor.hpp>
12 
17 
22 
23 #include <client/include/IProfilingService.hpp>
24 #include <client/include/TimelineUtilityMethods.hpp>
25 
26 #include <common/include/LabelsAndEventClasses.hpp>
27 
28 #include <mutex>
29 #include <condition_variable>
30 #include <unordered_map>
31 
// Forward declarations of OpenCL C++ wrapper types (cl::Context et al.) so
// this header can mention them without pulling in the OpenCL headers.
namespace cl
{
class Context;
class CommandQueue;
class Device;
}
38 
39 namespace armnn
40 {
41 
43 {
44 public:
45  using WorkloadQueue = std::vector<std::unique_ptr<IWorkload>>;
46 
48  {
50  }
51 
54 
55  std::vector<ImportedInputId> ImportInputs(const InputTensors& inputTensors,
56  MemorySource forceImportMemorySource = MemorySource::Undefined);
57  std::vector<ImportedOutputId> ImportOutputs(const OutputTensors& outputTensors,
58  MemorySource forceImportMemorySource = MemorySource::Undefined);
59 
60  void ClearImportedInputs(const std::vector<ImportedInputId> inputIds);
61  void ClearImportedOutputs(const std::vector<ImportedOutputId> outputIds);
62 
63  /// Single thread execution of the loaded network
64  Status EnqueueWorkload(const InputTensors& inputTensors, const OutputTensors& outputTensors,
65  std::vector<ImportedInputId> preImportedInputIds = {},
66  std::vector<ImportedOutputId> preImportedOutputIds = {});
67 
68  static std::unique_ptr<LoadedNetwork> MakeLoadedNetwork(std::unique_ptr<IOptimizedNetwork> net,
69  std::string& errorMessage,
70  const INetworkProperties& networkProperties,
71  arm::pipe::IProfilingService* profilingService);
72 
73  // NOTE we return by reference as the purpose of this method is only to provide
74  // access to the private m_Profiler and in theory we should not need to increment
75  // the shared_ptr's reference counter
76  const std::shared_ptr<IProfiler>& GetProfiler() const { return m_OptimizedNetwork->GetProfiler(); }
77 
78  void FreeWorkingMemory();
79 
81 
82  void SendNetworkStructure(arm::pipe::IProfilingService& profilingService);
83 
84  arm::pipe::ProfilingGuid GetNetworkGuid();
85 
86 private:
87 
88 
89  void AllocateWorkingMemory(
90 #if !defined(ARMNN_DISABLE_THREADS)
91  std::lock_guard<std::mutex>& lock
92 #endif
93  );
94  void AllocateAndExecuteConstantWorkloads();
95 
96  std::unordered_map<LayerGuid, std::unique_ptr<IWorkload>> m_ConstantWorkloads;
97  std::unordered_map<LayerGuid, ITensorHandle*> m_ConstantTensorHandles;
98 
99  std::unique_ptr<IMemoryOptimizerStrategy> m_ConstantStrategy = std::make_unique<SingleAxisPriorityList>();
100 
101  LoadedNetwork(std::unique_ptr<IOptimizedNetwork> net,
102  const INetworkProperties& networkProperties,
103  arm::pipe::IProfilingService* profilingService);
104 
105  void EnqueueInput(const BindableLayer& layer, ITensorHandle* tensorHandle, const TensorInfo& tensorInfo);
106 
107  void EnqueueOutput(const BindableLayer& layer, ITensorHandle* tensorHandle, const TensorInfo& tensorInfo);
108 
109  void EnqueueInput(const ConstTensor& inputTensor, ITensorHandle* inputTensorHandle);
110 
111  void ImportOutputTensor(const Tensor& outputTensor, ITensorHandle* outputTensorHandle);
112 
113  bool Execute(std::unique_ptr<arm::pipe::TimelineUtilityMethods>& timelineUtils,
114  arm::pipe::ProfilingGuid inferenceGuid);
115 
116  const IWorkloadFactory& GetWorkloadFactory(const Layer& layer) const;
117 
118  inline LayerBindingId ValidateImportedInputID(ImportedInputId id);
119  inline LayerBindingId ValidateImportedOutputID(ImportedOutputId id);
120 
121  void CreateMemoryProfile();
122 
123  std::unique_ptr<MemoryManager> CreateExternalMemoryManger(
124  std::vector<std::pair<std::shared_ptr<TensorMemory>, MemorySource>>& tensorMemory);
125 
126  using BackendPtrMap = std::unordered_map<BackendId, IBackendInternalUniquePtr>;
127 
128  BackendPtrMap m_Backends;
129  std::vector<IBackendInternal::IMemoryManagerSharedPtr> m_BackendMemoryMangers;
130 
131  using WorkloadFactoryMap = std::unordered_map<BackendId, IBackendInternal::IWorkloadFactoryPtr>;
132  WorkloadFactoryMap m_WorkloadFactories;
133 
134  std::unique_ptr<IOptimizedNetwork> m_OptimizedNetwork;
135 
136  WorkloadQueue m_InputQueue;
137  WorkloadQueue m_WorkloadQueue;
138  WorkloadQueue m_OutputQueue;
139 
140 #if !defined(ARMNN_DISABLE_THREADS)
141  mutable std::mutex m_WorkingMemMutex;
142 #endif
143 
144  bool m_IsWorkingMemAllocated = false;
145 
146  INetworkProperties m_NetworkProperties;
147 
148  TensorHandleFactoryRegistry m_TensorHandleFactoryRegistry;
149 
150  // NOTE: raw pointer because the profiling service is controlled by the Runtime
151  arm::pipe::IProfilingService* m_ProfilingService;
152 
153  struct ImportedTensorHandlePin
154  {
155  ImportedTensorHandlePin()
156  {}
157 
158  ImportedTensorHandlePin(LayerBindingId layerBindingId,
159  std::unique_ptr<ITensorHandle> tensorHandle)
160  : m_LayerBindingId(layerBindingId)
161  , m_TensorHandle(std::move(tensorHandle))
162  {}
163 
164  ImportedTensorHandlePin(ImportedTensorHandlePin&&) = default;
165 
166  ~ImportedTensorHandlePin()
167  {
168  if (m_TensorHandle)
169  {
170  m_TensorHandle->Unimport();
171  }
172  }
173 
174  LayerBindingId m_LayerBindingId;
175  std::unique_ptr<ITensorHandle> m_TensorHandle;
176  };
177 
178  std::vector<ImportedTensorHandlePin> m_PreImportedInputHandles;
179  std::vector<ImportedTensorHandlePin> m_PreImportedOutputHandles;
180 
181  std::unordered_map<BackendId, std::vector<MemBlock>> m_MemBlockMap;
182  std::unordered_map<BackendId, std::vector<MemBin>> m_MemBinMap;
183 
184  std::vector<ITensorHandle*> m_Tensorhandles;
185 
186  std::vector<std::pair<std::shared_ptr<TensorMemory>, MemorySource>> m_TensorMemory;
187 
188  std::unique_ptr<MemoryManager> m_ExternalMemoryManager;
189 
190  std::unordered_map<BackendId, bool> m_SupportsExternallyManagedMemory;
191 
192  // A set of vectors to record the workload queue indexes and their corresponding Input/Output Slot indexes
193  // which are connected to Inputs and Outputs for the network.
194  struct WorkloadIndices
195  {
196  unsigned int m_WorkloadIndex;
197  unsigned int m_SlotIndex;
198  };
199 
200  struct OutputWorkloadIndices
201  {
202  WorkloadIndices m_OutputSlotIndices;
203  std::vector<WorkloadIndices> m_InputSlotIndices;
204  };
205  std::unordered_map<LayerBindingId, std::vector<WorkloadIndices>> m_InputWorkloadSlotPairs;
206  std::unordered_map<LayerBindingId, OutputWorkloadIndices> m_OutputWorkloadSlotPairs;
207  std::vector<bool> m_IsInputImported;
208  std::vector<bool> m_IsOutputImported;
209 
210 };
211 
212 }
A tensor defined by a TensorInfo (shape and data type) and an immutable backing store.
Definition: Tensor.hpp:330
void RegisterDebugCallback(const DebugCallbackFunction &func)
TensorInfo GetOutputTensorInfo(LayerBindingId layerId) const
std::vector< std::unique_ptr< IWorkload > > WorkloadQueue
std::vector< ImportedInputId > ImportInputs(const InputTensors &inputTensors, MemorySource forceImportMemorySource=MemorySource::Undefined)
Status EnqueueWorkload(const InputTensors &inputTensors, const OutputTensors &outputTensors, std::vector< ImportedInputId > preImportedInputIds={}, std::vector< ImportedOutputId > preImportedOutputIds={})
Single thread execution of the loaded network.
void ClearImportedInputs(const std::vector< ImportedInputId > inputIds)
std::vector< ImportedOutputId > ImportOutputs(const OutputTensors &outputTensors, MemorySource forceImportMemorySource=MemorySource::Undefined)
arm::pipe::ProfilingGuid GetNetworkGuid()
void SendNetworkStructure(arm::pipe::IProfilingService &profilingService)
const std::shared_ptr< IProfiler > & GetProfiler() const
void ClearImportedOutputs(const std::vector< ImportedOutputId > outputIds)
TensorInfo GetInputTensorInfo(LayerBindingId layerId) const
static std::unique_ptr< LoadedNetwork > MakeLoadedNetwork(std::unique_ptr< IOptimizedNetwork > net, std::string &errorMessage, const INetworkProperties &networkProperties, arm::pipe::IProfilingService *profilingService)
A tensor defined by a TensorInfo (shape and data type) and a mutable backing store.
Definition: Tensor.hpp:322
Copyright (c) 2021 ARM Limited and Contributors.
MemorySource
Define the Memory Source to reduce copies.
Definition: Types.hpp:246
std::function< void(LayerGuid guid, unsigned int slotIndex, ITensorHandle *tensorHandle)> DebugCallbackFunction
Define the type of callback for the Debug layer to call.
Definition: Types.hpp:400
std::vector< std::unique_ptr< IWorkload > > WorkloadQueue
unsigned int ImportedInputId
Definition: Types.hpp:312
Status — enumeration.
Definition: Types.hpp:43
std::vector< std::pair< LayerBindingId, class Tensor > > OutputTensors
Definition: Tensor.hpp:395
std::vector< std::pair< LayerBindingId, class ConstTensor > > InputTensors
Definition: Tensor.hpp:394
int LayerBindingId
Type of identifiers for bindable layers (inputs, outputs).
Definition: Types.hpp:311
unsigned int ImportedOutputId
Definition: Types.hpp:313