44 Status
validate_arguments(
const ITensorInfo *
input,
const ITensorInfo *rois, ITensorInfo *output,
const ROIPoolingLayerInfo &pool_info)
54 if(output->total_size() != 0)
65 const UniformQuantizationInfo rois_qinfo = rois->quantization_info().uniform();
79 : _input(nullptr), _output(nullptr), _rois(nullptr), _pool_info(0, 0, 0.f)
102 _pool_info = pool_info;
104 INEKernel::configure(
window);
114 template <
typename input_data_type>
116 unsigned int roi_batch,
117 float region_start_x,
121 float region_start_y,
127 if((region_end_x <= region_start_x) || (region_end_y <= region_start_y))
129 return input_data_type(0);
136 for(
int iy = 0; iy < grid_size_y; ++iy)
138 for(
int ix = 0; ix < grid_size_x; ++ix)
141 float y = region_start_y + (iy + 0.5) * bin_size_y / float(grid_size_y);
142 float x = region_start_x + (ix + 0.5) * bin_size_x / float(grid_size_x);
147 const int y_high = y_low + 1;
148 const int x_high = x_low + 1;
150 const float ly = y - y_low;
151 const float lx = x - x_low;
152 const float hy = 1. - ly;
153 const float hx = 1. - lx;
155 const float w1 = hy * hx;
156 const float w2 = hy * lx;
157 const float w3 = ly * hx;
158 const float w4 = ly * lx;
161 const auto data1 = *reinterpret_cast<const input_data_type *>(
input->ptr_to_element(
Coordinates(x_low, y_low, pz, roi_batch)));
162 const auto data2 = *reinterpret_cast<const input_data_type *>(
input->ptr_to_element(
Coordinates(x_high, y_low, pz, roi_batch)));
163 const auto data3 = *reinterpret_cast<const input_data_type *>(
input->ptr_to_element(
Coordinates(x_low, y_high, pz, roi_batch)));
164 const auto data4 = *reinterpret_cast<const input_data_type *>(
input->ptr_to_element(
Coordinates(x_high, y_high, pz, roi_batch)));
165 avg += w1 * data1 + w2 * data2 + w3 * data3 + w4 * data4;
169 const auto data1 = *reinterpret_cast<const input_data_type *>(
input->ptr_to_element(
Coordinates(pz, x_low, y_low, roi_batch)));
170 const auto data2 = *reinterpret_cast<const input_data_type *>(
input->ptr_to_element(
Coordinates(pz, x_high, y_low, roi_batch)));
171 const auto data3 = *reinterpret_cast<const input_data_type *>(
input->ptr_to_element(
Coordinates(pz, x_low, y_high, roi_batch)));
172 const auto data4 = *reinterpret_cast<const input_data_type *>(
input->ptr_to_element(
Coordinates(pz, x_high, y_high, roi_batch)));
173 avg += w1 * data1 + w2 * data2 + w3 * data3 + w4 * data4;
178 avg /= grid_size_x * grid_size_y;
179 return input_data_type(avg);
184 template <
typename input_data_type>
186 unsigned int roi_batch,
187 float region_start_x,
191 float region_start_y,
198 if((region_end_x <= region_start_x) || (region_end_y <= region_start_y))
210 for(
int iy = 0; iy < grid_size_y; ++iy)
212 for(
int ix = 0; ix < grid_size_x; ++ix)
215 float y = region_start_y + (iy + 0.5) * bin_size_y / float(grid_size_y);
216 float x = region_start_x + (ix + 0.5) * bin_size_x / float(grid_size_x);
221 const int y_high = y_low + 1;
222 const int x_high = x_low + 1;
224 const float ly = y - y_low;
225 const float lx = x - x_low;
226 const float hy = 1. - ly;
227 const float hx = 1. - lx;
229 const float w1 = hy * hx;
230 const float w2 = hy * lx;
231 const float w3 = ly * hx;
232 const float w4 = ly * lx;
242 avg += w1 * data1 + w2 * data2 + w3 * data3 + w4 * data4;
250 avg += w1 * data1 + w2 * data2 + w3 * data3 + w4 * data4;
261 avg += w1 * data1 + w2 * data2 + w3 * data3 + w4 * data4;
269 avg += w1 * data1 + w2 * data2 + w3 * data3 + w4 * data4;
275 avg /= grid_size_x * grid_size_y;
277 input_data_type res = 0;
292 const float region_start = p * bin_size + roi_anchor;
305 NEROIAlignLayerKernel::internal_run<uint8_t, uint16_t>(
window,
info);
310 NEROIAlignLayerKernel::internal_run<int8_t, uint16_t>(
window,
info);
315 NEROIAlignLayerKernel::internal_run<float>(
window,
info);
318 #ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC 321 NEROIAlignLayerKernel::internal_run<float16_t>(
window,
info);
324 #endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC 338 template <
typename input_data_type,
typename roi_data_type>
357 const int input_chanels = _input->
info()->
dimension(idx_depth);
364 const auto *rois_ptr = reinterpret_cast<const roi_data_type *>(_rois->
buffer());
366 for(
int roi_indx = roi_list_start; roi_indx < roi_list_end; ++roi_indx)
368 const unsigned int roi_batch = rois_ptr[values_per_roi * roi_indx];
370 roi_data_type qx1 = rois_ptr[values_per_roi * roi_indx + 1];
371 roi_data_type qy1 = rois_ptr[values_per_roi * roi_indx + 2];
372 roi_data_type qx2 = rois_ptr[values_per_roi * roi_indx + 3];
373 roi_data_type qy2 = rois_ptr[values_per_roi * roi_indx + 4];
387 const float roi_dims_x = std::max((x2 - x1) * _pool_info.
spatial_scale(), 1.0f);
388 const float roi_dims_y = std::max((y2 - y1) * _pool_info.
spatial_scale(), 1.0f);
389 float bin_size_x = roi_dims_x / _pool_info.
pooled_width();
393 for(
int ch = 0; ch < input_chanels; ++ch)
396 for(
int py = 0; py < pooled_h; ++py)
398 for(
int px = 0; px < pooled_w; ++px)
406 input_data_type out_val(0);
409 out_val = roi_align_1x1_qasymm8<input_data_type>(
410 _input, roi_batch, region_start_x, bin_size_x,
411 roi_bin_grid_x, region_end_x, region_start_y, bin_size_y,
416 out_val = roi_align_1x1<input_data_type>(
417 _input, roi_batch, region_start_x, bin_size_x,
418 roi_bin_grid_x, region_end_x, region_start_y, bin_size_y,
419 roi_bin_grid_y, region_end_y, ch);
424 auto out_ptr = reinterpret_cast<input_data_type *>(_output->
ptr_to_element(Coordinates(px, py, ch, roi_indx)));
429 auto out_ptr = reinterpret_cast<input_data_type *>(_output->
ptr_to_element(Coordinates(ch, px, py, roi_indx)));
input_data_type roi_align_1x1(const ITensor *input, unsigned int roi_batch, float region_start_x, float bin_size_x, int grid_size_x, float region_end_x, float region_start_y, float bin_size_y, int grid_size_y, float region_end_y, int pz)
Average pooling over an aligned window.
const Window & window() const
The maximum window the kernel can be executed on.
uint8_t * ptr_to_element(const Coordinates &id) const
Return a pointer to the element at the passed coordinates.
#define ARM_COMPUTE_RETURN_ERROR_ON_DATA_LAYOUT_NOT_IN(t,...)
#define ARM_COMPUTE_RETURN_ERROR_ON_MISMATCHING_DATA_LAYOUT(...)
#define ARM_COMPUTE_RETURN_ERROR_ON_CPU_F16_UNSUPPORTED(tensor)
float dequantize_qasymm8(uint8_t value, const INFO_TYPE &qinfo)
Dequantize a value given an unsigned 8-bit asymmetric quantization scheme.
virtual size_t dimension(size_t index) const =0
Return the size of the requested dimension.
TensorShape compute_roi_align_shape(const ITensorInfo &input, const ITensorInfo &rois, ROIPoolingLayerInfo pool_info)
Calculate the output roi align shape of a tensor.
uint8_t quantize_qasymm8(float value, const INFO_TYPE &qinfo, RoundingPolicy rounding_policy=RoundingPolicy::TO_NEAREST_UP)
Quantize a value given an unsigned 8-bit asymmetric quantization scheme.
#define ARM_COMPUTE_ERROR(msg)
Print the given message then throw an std::runtime_error.
#define ARM_COMPUTE_RETURN_ON_ERROR(status)
Checks if a status contains an error and returns it.
virtual DataType data_type() const =0
Data type used for each element of the tensor.
1 channel, 1 F32 per channel
const DataLayout data_layout
Store the tensor's metadata.
#define ARM_COMPUTE_ERROR_THROW_ON(status)
Describe one of the image's dimensions with a start, end and step.
quantized, asymmetric fixed-point 16-bit number
unsigned int pooled_width() const
Get the pooled width of the layer.
float compute_region_coordinate(int p, float bin_size, float roi_anchor, float max_value)
#define ARM_COMPUTE_RETURN_ERROR_ON(cond)
If the condition is true, an error is returned.
Interface for CPU tensor.
#define ARM_COMPUTE_RETURN_ERROR_ON_MISMATCHING_DIMENSIONS(...)
Copyright (c) 2017-2021 Arm Limited.
1 channel, 1 F16 per channel
#define ARM_COMPUTE_RETURN_ERROR_ON_NULLPTR(...)
DataType clamp(const DataType &n, const DataType &lower=std::numeric_limits< RangeType >::lowest(), const DataType &upper=std::numeric_limits< RangeType >::max())
Performs clamping among a lower and upper value.
float dequantize_qasymm16(uint16_t value, const UniformQuantizationInfo &qinfo)
Dequantize a value given a 16-bit asymmetric quantization scheme.
Quantization information.
static constexpr size_t DimX
Alias for dimension 0 also known as X dimension.
#define ARM_COMPUTE_UNUSED(...)
To avoid unused variables warnings.
virtual ITensorInfo & set_data_layout(const DataLayout &data_layout)=0
Set the data layout of the tensor.
int8_t quantize_qasymm8_signed(float value, const INFO_TYPE &qinfo, RoundingPolicy rounding_policy=RoundingPolicy::TO_NEAREST_UP)
Quantize a value given a signed 8-bit asymmetric quantization scheme.
quantized, asymmetric fixed-point 8-bit number unsigned
virtual uint8_t * buffer() const =0
Interface to be implemented by the child class to return a pointer to CPU memory.
UniformQuantizationInfo uniform() const
Return per layer quantization info.
bool is_data_type_quantized_asymmetric_signed(DataType dt)
Check if a given data type is of asymmetric quantized signed type.
bool auto_init_if_empty(ITensorInfo &info, const TensorShape &shape, int num_channels, DataType data_type, QuantizationInfo quantization_info=QuantizationInfo())
Auto initialize the tensor info (shape, number of channels and data type) if the current assignment i...
virtual ITensorInfo * info() const =0
Interface to be implemented by the child class to return the tensor's metadata.
const size_t input_height
void set(size_t dimension, const Dimension &dim)
Set the values of a given dimension.
virtual QuantizationInfo quantization_info() const =0
Get the quantization settings (scale and offset) of the tensor.
#define ARM_COMPUTE_ERROR_ON_UNCONFIGURED_KERNEL(k)
unsigned int sampling_ratio() const
Get sampling ratio.
Num samples, channels, height, width.
bool is_data_type_quantized_asymmetric(DataType dt)
Check if a given data type is of asymmetric quantized type.
static constexpr size_t DimY
Alias for dimension 1 also known as Y dimension.
ScaleKernelInfo info(interpolation_policy, default_border_mode, PixelValue(), sampling_policy, false)
void run(const Window &window, const ThreadInfo &info) override
Execute the kernel on the passed window.
Information about executing thread and CPU.
input_data_type roi_align_1x1_qasymm8(const ITensor *input, unsigned int roi_batch, float region_start_x, float bin_size_x, int grid_size_x, float region_end_x, float region_start_y, float bin_size_y, int grid_size_y, float region_end_y, int pz, const QuantizationInfo &out_qinfo)
Average pooling over an aligned window.
unsigned int pooled_height() const
Get the pooled height of the layer.
ROI Pooling Layer Information class.
#define ARM_COMPUTE_RETURN_ERROR_ON_MISMATCHING_DATA_TYPES(...)
Num samples, height, width, channels.
#define ARM_COMPUTE_RETURN_ERROR_ON_DATA_TYPE_CHANNEL_NOT_IN(t, c,...)
Status validate_arguments(const ITensorInfo *input, const ITensorInfo *bias, const ITensorInfo *output, const GEMMLowpOutputStageInfo *output_stage)
float spatial_scale() const
Get the spatial scale.
float dequantize_qasymm8_signed(int8_t value, const INFO_TYPE &qinfo)
Dequantize a value given a signed 8-bit asymmetric quantization scheme.
NEROIAlignLayerKernel()
Constructor.
#define ARM_COMPUTE_ERROR_ON_NULLPTR(...)
quantized, asymmetric fixed-point 8-bit number signed
size_t get_data_layout_dimension_index(const DataLayout data_layout, const DataLayoutDimension data_layout_dimension)
Get the index of the given dimension.
constexpr int end() const
Return the end of the dimension.
DataType
Available data types.
DataLayout
[DataLayout enum definition]
void configure(const ITensor *input, const ITensor *rois, ITensor *output, const ROIPoolingLayerInfo &pool_info)
Set the input and output tensors.
constexpr int start() const
Return the start of the dimension.
Describe a multidimensional execution window.
#define ARM_COMPUTE_ERROR_ON_INVALID_SUBWINDOW(f, s)
virtual DataLayout data_layout() const =0
Get the data layout of the tensor.
static Status validate(const ITensorInfo *input, const ITensorInfo *rois, ITensorInfo *output, const ROIPoolingLayerInfo &pool_info)
Static function to check if given info will lead to a valid configuration of NEROIAlignLayerKernel.
constexpr const Dimension & x() const
Alias to access the first dimension of the window.