Compute Library
 19.08
NERNNLayer Class Reference

Basic function to run NERNNLayer. More...

#include <NERNNLayer.h>

Collaboration diagram for NERNNLayer:

Public Member Functions

 NERNNLayer (std::shared_ptr< IMemoryManager > memory_manager=nullptr)
 Default constructor. More...
 
 NERNNLayer (const NERNNLayer &)=delete
 Prevent instances of this class from being copied (As this class contains pointers) More...
 
 NERNNLayer (NERNNLayer &&)=default
 Default move constructor. More...
 
NERNNLayer & operator= (const NERNNLayer &)=delete
 Prevent instances of this class from being copied (As this class contains pointers) More...
 
NERNNLayer & operator= (NERNNLayer &&)=default
 Default move assignment operator. More...
 
void configure (const ITensor *input, const ITensor *weights, const ITensor *recurrent_weights, const ITensor *bias, ITensor *hidden_state, ITensor *output, ActivationLayerInfo &info)
 Initialize the function. More...
 
void run () override
 Run the kernels contained in the function. More...
 
void prepare () override
 Prepare the function for executing. More...
 
- Public Member Functions inherited from IFunction
virtual ~IFunction ()=default
 Destructor. More...
 

Static Public Member Functions

static Status validate (const ITensorInfo *input, const ITensorInfo *weights, const ITensorInfo *recurrent_weights, const ITensorInfo *bias, const ITensorInfo *hidden_state, const ITensorInfo *output, const ActivationLayerInfo &info)
 Initialize the function. More...
 

Detailed Description

Basic function to run NERNNLayer.

Definition at line 41 of file NERNNLayer.h.
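For orientation, the computation this function stages (fully connected layer on the input, GEMM on the state, saturating add, activation, copy to the output) amounts to one step of a vanilla RNN. A plain, library-independent C++ reference of that step (all names here are illustrative, not part of the library's API; batch_size = 1 and a TANH activation are assumed for brevity):

```cpp
#include <cassert>
#include <cmath>
#include <vector>

// One RNN step: hidden = tanh(W^T * x + R^T * hidden + b); the output is a
// copy of the updated hidden state. Shapes follow the parameter docs below:
// x[input_size], W[input_size x num_units], R[num_units x num_units], b[num_units].
std::vector<float> rnn_step(const std::vector<float>              &x,
                            const std::vector<std::vector<float>> &W,
                            const std::vector<std::vector<float>> &R,
                            const std::vector<float>              &b,
                            std::vector<float>                    &hidden)
{
    const size_t num_units = b.size();
    std::vector<float> acc(num_units, 0.f);
    for(size_t u = 0; u < num_units; ++u)
    {
        for(size_t i = 0; i < x.size(); ++i)  // fully connected part: W * x
        {
            acc[u] += W[i][u] * x[i];
        }
        for(size_t j = 0; j < num_units; ++j) // GEMM on the previous state: R * hidden
        {
            acc[u] += R[j][u] * hidden[j];
        }
        acc[u] += b[u];                       // bias add
    }
    for(size_t u = 0; u < num_units; ++u)     // activation, applied after the full add
    {
        hidden[u] = std::tanh(acc[u]);
    }
    return hidden;                            // output tensor receives a copy of hidden_state
}
```

Note that the accumulation is completed for every unit before the hidden state is overwritten, mirroring how the function keeps the add result in an intermediate buffer (`_add_output`) before the activation writes back into `hidden_state`.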

Constructor & Destructor Documentation

◆ NERNNLayer() [1/3]

NERNNLayer ( std::shared_ptr< IMemoryManager > memory_manager = nullptr)

Default constructor.

Definition at line 36 of file NERNNLayer.cpp.

37  : _memory_group(std::move(memory_manager)), _gemm_state_f(), _add_kernel(), _activation_kernel(), _fully_connected_kernel(), _copy_kernel(), _fully_connected_out(), _gemm_output(), _add_output(),
38  _is_prepared(false)
39 {
40 }

◆ NERNNLayer() [2/3]

NERNNLayer ( const NERNNLayer & )
delete

Prevent instances of this class from being copied (As this class contains pointers)

◆ NERNNLayer() [3/3]

NERNNLayer ( NERNNLayer && )
default

Default move constructor.

Member Function Documentation

◆ configure()

void configure ( const ITensor * input,
const ITensor * weights,
const ITensor * recurrent_weights,
const ITensor * bias,
ITensor * hidden_state,
ITensor * output,
ActivationLayerInfo & info 
)

Initialize the function.

Parameters
[in]      input              Input is a 2-D tensor of shape [input_size, batch_size]. Data types supported: F16/F32
[in]      weights            Weights tensor of shape [input_size, num_units] that multiplies the input. Data types supported: Same as input
[in]      recurrent_weights  Weights tensor of shape [num_units, num_units] that multiplies the current 'state'. Data types supported: Same as input
[in]      bias               Bias vector of shape [num_units]. Data types supported: Same as input
[out]     output             Output tensor of shape [num_units, batch_size]. Data types supported: Same as input
[in,out]  hidden_state       Output tensor of shape [num_units, batch_size]. Data types supported: Same as input
[in]      info               Activation layer parameter.

Definition at line 67 of file NERNNLayer.cpp.

69 {
70  ARM_COMPUTE_ERROR_ON_NULLPTR(input, weights, recurrent_weights, bias, hidden_state, output);
71  ARM_COMPUTE_ERROR_THROW_ON(NERNNLayer::validate(input->info(), weights->info(), recurrent_weights->info(), bias->info(), hidden_state->info(), output->info(), info));
72 
73  const int idx_height = get_data_layout_dimension_index(input->info()->data_layout(), DataLayoutDimension::HEIGHT);
74  TensorShape shape = misc::shape_calculator::compute_rnn_shape(recurrent_weights->info(), hidden_state->info()->dimension(idx_height));
75 
76  _is_prepared = false;
77 
78  // Manage intermediate buffers and configure
79  _fully_connected_out.allocator()->init(TensorInfo(shape, 1, input->info()->data_type()));
80  _gemm_output.allocator()->init(TensorInfo(shape, 1, input->info()->data_type()));
81 
82  // Manage intermediate buffers and configure
83  _memory_group.manage(&_fully_connected_out);
84  _fully_connected_kernel.configure(input, weights, bias, &_fully_connected_out);
85 
86  _memory_group.manage(&_gemm_output);
87  _gemm_state_f.configure(hidden_state, recurrent_weights, nullptr, &_gemm_output, 1.f, 0.f);
88 
89  _add_output.allocator()->init(TensorInfo(shape, 1, input->info()->data_type()));
90  _memory_group.manage(&_add_output);
91 
92  _add_kernel.configure(&_fully_connected_out, &_gemm_output, &_add_output, ConvertPolicy::SATURATE);
93 
94  _fully_connected_out.allocator()->allocate();
95  _gemm_output.allocator()->allocate();
96 
97  _activation_kernel.configure(&_add_output, hidden_state, info);
98  _add_output.allocator()->allocate();
99 
100  _copy_kernel.configure(hidden_state, output);
101 }

References TensorAllocator::allocate(), Tensor::allocator(), ARM_COMPUTE_ERROR_ON_NULLPTR, ARM_COMPUTE_ERROR_THROW_ON, arm_compute::test::validation::bias, arm_compute::misc::shape_calculator::compute_rnn_shape(), NECopyKernel::configure(), NEActivationLayerKernel::configure(), NEArithmeticAdditionKernel::configure(), NEGEMM::configure(), NEFullyConnectedLayer::configure(), ITensorInfo::data_layout(), ITensorInfo::data_type(), ITensorInfo::dimension(), arm_compute::get_data_layout_dimension_index(), arm_compute::HEIGHT, ITensor::info(), CLTensor::info(), arm_compute::test::validation::info, TensorAllocator::init(), MemoryGroupBase< TensorType >::manage(), arm_compute::SATURATE, arm_compute::test::validation::shape, NERNNLayer::validate(), and arm_compute::test::validation::weights.
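A minimal usage sketch of `configure()` and `run()`. This is illustrative only: the shapes (input_size = 32, num_units = 16, batch_size = 4) and the TANH activation are assumptions, and allocation follows the usual pattern for NE functions (init the tensor info, configure, then allocate backing memory before filling and running):

```cpp
#include "arm_compute/runtime/NEON/functions/NERNNLayer.h"
#include "arm_compute/runtime/Tensor.h"

using namespace arm_compute;

void rnn_example()
{
    // Shapes per the parameter docs: [input_size, batch_size], etc.
    Tensor input, weights, recurrent_weights, bias, hidden_state, output;
    input.allocator()->init(TensorInfo(TensorShape(32U, 4U), 1, DataType::F32));              // [input_size, batch_size]
    weights.allocator()->init(TensorInfo(TensorShape(32U, 16U), 1, DataType::F32));           // [input_size, num_units]
    recurrent_weights.allocator()->init(TensorInfo(TensorShape(16U, 16U), 1, DataType::F32)); // [num_units, num_units]
    bias.allocator()->init(TensorInfo(TensorShape(16U), 1, DataType::F32));                   // [num_units]
    hidden_state.allocator()->init(TensorInfo(TensorShape(16U, 4U), 1, DataType::F32));       // [num_units, batch_size]
    output.allocator()->init(TensorInfo(TensorShape(16U, 4U), 1, DataType::F32));             // [num_units, batch_size]

    NERNNLayer rnn;
    ActivationLayerInfo act(ActivationLayerInfo::ActivationFunction::TANH);
    rnn.configure(&input, &weights, &recurrent_weights, &bias, &hidden_state, &output, act);

    // Allocate backing memory, then fill the tensors and execute.
    for(Tensor *t : { &input, &weights, &recurrent_weights, &bias, &hidden_state, &output })
    {
        t->allocator()->allocate();
    }
    rnn.run(); // first call also runs prepare()
}
```

Because `hidden_state` is an in/out parameter, calling `run()` repeatedly steps the recurrence: each call consumes the previous hidden state and overwrites it with the new one.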

◆ operator=() [1/2]

NERNNLayer& operator= ( const NERNNLayer & )
delete

Prevent instances of this class from being copied (As this class contains pointers)

◆ operator=() [2/2]

NERNNLayer& operator= ( NERNNLayer && )
default

Default move assignment operator.

◆ prepare()

void prepare ( )
override virtual

Prepare the function for executing.

Any one-off pre-processing step required by the function is handled here.

Note
Prepare stage might not need all the function's buffers' backing memory to be available in order to execute

Reimplemented from IFunction.

Definition at line 120 of file NERNNLayer.cpp.

121 {
122  if(!_is_prepared)
123  {
124  _fully_connected_kernel.prepare();
125  _gemm_state_f.prepare();
126 
127  _is_prepared = true;
128  }
129 }

References NEGEMM::prepare(), and NEFullyConnectedLayer::prepare().

Referenced by NERNNLayer::run().

◆ run()

void run ( )
override virtual

Run the kernels contained in the function.

For NEON kernels:

  • Multi-threading is used for the kernels which are parallelisable.
  • By default std::thread::hardware_concurrency() threads are used.
Note
CPPScheduler::set_num_threads() can be used to manually set the number of threads

For OpenCL kernels:

  • All the kernels are enqueued on the queue associated with CLScheduler.
  • The queue is then flushed.
Note
The function will not block until the kernels are executed. It is the user's responsibility to wait.
Will call prepare() on the first run if it hasn't been done already

Implements IFunction.

Definition at line 103 of file NERNNLayer.cpp.

104 {
105  prepare();
106 
107  MemoryGroupResourceScope scope_mg(_memory_group);
108 
109  _fully_connected_kernel.run();
110 
111  _gemm_state_f.run();
112 
113  NEScheduler::get().schedule(&_add_kernel, Window::DimY);
114  NEScheduler::get().schedule(&_activation_kernel, Window::DimY);
115 
116  // copy hidden out to output
117  NEScheduler::get().schedule(&_copy_kernel, Window::DimY);
118 }

References Window::DimY, Scheduler::get(), NERNNLayer::prepare(), NEGEMM::run(), NEFullyConnectedLayer::run(), and IScheduler::schedule().

◆ validate()

Status validate ( const ITensorInfo * input,
const ITensorInfo * weights,
const ITensorInfo * recurrent_weights,
const ITensorInfo * bias,
const ITensorInfo * hidden_state,
const ITensorInfo * output,
const ActivationLayerInfo & info 
)
static

Initialize the function.

Parameters
[in]  input              Input is a 2-D tensor of shape [input_size, batch_size]. Data types supported: F16/F32
[in]  weights            Weights tensor of shape [input_size, num_units] that multiplies the input. Data types supported: Same as input
[in]  recurrent_weights  Weights tensor of shape [num_units, num_units] that multiplies the current 'state'. Data types supported: Same as input
[in]  bias               Bias vector of shape [num_units]. Data types supported: Same as input
[in]  output             Output tensor of shape [num_units, batch_size]. Data types supported: Same as input
[in]  hidden_state       Output tensor of shape [num_units, batch_size]. Data types supported: Same as input
[in]  info               Activation layer parameter.
Returns
a status

Definition at line 42 of file NERNNLayer.cpp.

44 {
45  ARM_COMPUTE_RETURN_ERROR_ON_NULLPTR(input, weights, recurrent_weights, bias, hidden_state, output);
46 
47  const int idx_width = get_data_layout_dimension_index(input->data_layout(), DataLayoutDimension::WIDTH);
48  const int idx_height = get_data_layout_dimension_index(input->data_layout(), DataLayoutDimension::HEIGHT);
49  ARM_COMPUTE_RETURN_ERROR_ON(input->dimension(idx_width) != weights->dimension(idx_width));
50  ARM_COMPUTE_RETURN_ERROR_ON(weights->dimension(idx_height) != recurrent_weights->dimension(idx_width));
51  ARM_COMPUTE_RETURN_ERROR_ON(recurrent_weights->dimension(idx_width) != recurrent_weights->dimension(idx_height));
52  ARM_COMPUTE_RETURN_ERROR_ON(bias->num_dimensions() != 1);
53  ARM_COMPUTE_RETURN_ERROR_ON(bias->dimension(idx_width) != weights->dimension(idx_height));
54  ARM_COMPUTE_RETURN_ERROR_ON(hidden_state->dimension(idx_width) != weights->dimension(idx_height));
55  ARM_COMPUTE_RETURN_ERROR_ON(hidden_state->dimension(idx_height) != input->dimension(idx_height));
56  ARM_COMPUTE_RETURN_ERROR_ON_MISMATCHING_DIMENSIONS(output->tensor_shape(), hidden_state->tensor_shape());
57 
58  auto shape_info = TensorInfo(misc::shape_calculator::compute_rnn_shape(recurrent_weights, hidden_state->dimension(idx_height)), 1, input->data_type());
59 
63 
64  return Status{};
65 }

References ARM_COMPUTE_RETURN_ERROR_ON, ARM_COMPUTE_RETURN_ERROR_ON_MISMATCHING_DIMENSIONS, ARM_COMPUTE_RETURN_ERROR_ON_NULLPTR, ARM_COMPUTE_RETURN_ON_ERROR, arm_compute::test::validation::bias, arm_compute::misc::shape_calculator::compute_rnn_shape(), ITensorInfo::data_layout(), ITensorInfo::data_type(), ITensorInfo::dimension(), arm_compute::get_data_layout_dimension_index(), arm_compute::HEIGHT, arm_compute::test::validation::info, arm_compute::SATURATE, ITensorInfo::tensor_shape(), NEActivationLayerKernel::validate(), NEArithmeticAdditionKernel::validate(), NEFullyConnectedLayer::validate(), arm_compute::test::validation::weights, and arm_compute::WIDTH.

Referenced by NERNNLayer::configure().
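The dimension checks in the listing above can be restated as a plain C++ predicate (illustrative and library-independent; a 2-D layout is assumed so that dimension 0 is width and dimension 1 is height, matching `idx_width`/`idx_height` for the default layout):

```cpp
#include <cstddef>

struct Shape2D { std::size_t w; std::size_t h; }; // w: dimension 0, h: dimension 1

// Mirrors the shape constraints enforced in NERNNLayer::validate() for 2-D tensors.
bool rnn_shapes_valid(Shape2D input, Shape2D weights, Shape2D recurrent_weights,
                      std::size_t bias_len, Shape2D hidden_state, Shape2D output)
{
    return input.w == weights.w                       // input_size matches the weights
        && weights.h == recurrent_weights.w           // num_units matches across weights
        && recurrent_weights.w == recurrent_weights.h // recurrent weights are square
        && bias_len == weights.h                      // bias covers num_units
        && hidden_state.w == weights.h                // hidden width == num_units
        && hidden_state.h == input.h                  // batch_size matches the input
        && output.w == hidden_state.w                 // output shape matches hidden_state
        && output.h == hidden_state.h;
}
```

With the shapes from the parameter docs, e.g. input [32, 4], weights [32, 16], recurrent_weights [16, 16], bias [16], hidden_state and output [16, 4], every check passes; changing any single dimension breaks at least one of them.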


The documentation for this class was generated from the following files:

NERNNLayer.h
NERNNLayer.cpp