ComputeLibrary/v21.02/_shape_calculator_8h_source.xhtml

 /*
  * Copyright (c) 2017-2021 Arm Limited.
  *
  * SPDX-License-Identifier: MIT
  *
  * Permission is hereby granted, free of charge, to any person obtaining a copy
  * of this software and associated documentation files (the "Software"), to
  * deal in the Software without restriction, including without limitation the
  * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
  * sell copies of the Software, and to permit persons to whom the Software is
  * furnished to do so, subject to the following conditions:
  *
  * The above copyright notice and this permission notice shall be included in all
  * copies or substantial portions of the Software.
  *
  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  * SOFTWARE.
  */
 #ifndef ARM_COMPUTE_MISC_SHAPE_CALCULATOR_H
 #define ARM_COMPUTE_MISC_SHAPE_CALCULATOR_H

 #include "arm_compute/core/Helpers.h"
 #include "arm_compute/core/ITensorInfo.h"
 #include "arm_compute/core/KernelDescriptors.h"
 #include "arm_compute/core/Utils.h"

 #include "arm_compute/core/utils/helpers/tensor_transform.h"

 #include <cmath>

 namespace arm_compute
 {
 namespace misc
 {
 namespace shape_calculator
 {
 /** Compute the shape produced by a reduce-mean over a set of axes
  *
  * The axes are first passed through convert_negative_axis() together with the
  * number of dimensions of @p input.
  *
  * @param[in] input          Input tensor info
  * @param[in] reduction_axis Axes to reduce along
  * @param[in] keep_dims      If true every reduced axis is kept and set to 1, otherwise the reduced axes are removed
  *
  * @return the calculated shape
  */
 inline TensorShape calculate_reduce_mean_shape(ITensorInfo *input, const Coordinates &reduction_axis, bool keep_dims)
 {
     const int num_axes = reduction_axis.num_dimensions();
     const int rank     = input->num_dimensions();

     Coordinates axes = reduction_axis;
     convert_negative_axis(axes, rank);

     TensorShape reduced_shape = input->tensor_shape();

     if(keep_dims)
     {
         // Reduced axes stay in place with an extent of 1
         for(int k = 0; k < num_axes; ++k)
         {
             reduced_shape.set(axes[k], 1);
         }
         return reduced_shape;
     }

     // Dimensions are dropped in ascending axis order. Each removal shifts the
     // following axes down by one, hence the "- k" correction.
     std::sort(axes.begin(), axes.begin() + num_axes);
     for(int k = 0; k < num_axes; ++k)
     {
         reduced_shape.remove_dimension(axes[k] - k);
     }
     return reduced_shape;
 }
 /** Compute the tensor shape obtained when a vector is laid out with the given convolution dimensions
  *
  * Width and height are set to @p conv_w and @p conv_h, and the channel dimension is set to
  * input.x() / (conv_w * conv_h).
  *
  * @param[in] input       Input tensor shape
  * @param[in] conv_w      Convolution width
  * @param[in] conv_h      Convolution height
  * @param[in] data_layout Data layout used to locate the width, height and channel dimensions
  *
  * @return the calculated shape
  */
 inline TensorShape compute_vector_to_tensor_output_shape(const TensorShape &input, size_t conv_w, size_t conv_h, const DataLayout &data_layout)
 {
     const size_t width_dim   = get_data_layout_dimension_index(data_layout, DataLayoutDimension::WIDTH);
     const size_t height_dim  = get_data_layout_dimension_index(data_layout, DataLayoutDimension::HEIGHT);
     const size_t channel_dim = get_data_layout_dimension_index(data_layout, DataLayoutDimension::CHANNEL);

     // Whatever is left of the vector once the spatial extent is factored out
     const auto num_channels = input.x() / (conv_w * conv_h);

     TensorShape reshaped(input);
     reshaped.set(width_dim, conv_w);
     reshaped.set(height_dim, conv_h);
     reshaped.set(channel_dim, num_channels);
     return reshaped;
 }

 /** Compute the shape of a tensor after applying a permutation vector
  *
  * @param[in] input Input tensor info
  * @param[in] perm  Permutation vector applied to a copy of the input shape
  *
  * @return the calculated shape
  */
 inline TensorShape compute_permutation_output_shape(const ITensorInfo &input, const PermutationVector &perm)
 {
     // permute() works in place, so operate on a copy of the input shape
     TensorShape permuted{ input.tensor_shape() };
     permute(permuted, perm);
     return permuted;
 }

 /** Compute the output shape of the reorg layer for a given stride
  *
  * Width and height are divided by @p stride while the channel dimension is multiplied by stride * stride.
  *
  * @param[in] input  Input tensor info
  * @param[in] stride Stride. Must be positive and divide both the input width and height
  *
  * @return the calculated shape
  */
 inline TensorShape compute_reorg_output_shape(const ITensorInfo &input, int32_t stride)
 {
     const DataLayout layout = input.data_layout();
     const size_t     w_dim  = get_data_layout_dimension_index(layout, DataLayoutDimension::WIDTH);
     const size_t     h_dim  = get_data_layout_dimension_index(layout, DataLayoutDimension::HEIGHT);
     const size_t     c_dim  = get_data_layout_dimension_index(layout, DataLayoutDimension::CHANNEL);

     ARM_COMPUTE_ERROR_ON(stride <= 0);
     ARM_COMPUTE_ERROR_ON_MSG((input.tensor_shape()[w_dim] % stride != 0), "The width of the input tensor must be a multiple of stride");
     ARM_COMPUTE_ERROR_ON_MSG((input.tensor_shape()[h_dim] % stride != 0), "The height of the input tensor must be a multiple of stride");

     TensorShape reorg_shape{ input.tensor_shape() };

     // Spatial dimensions shrink by the stride, channels grow by its square
     reorg_shape.set(w_dim, reorg_shape[w_dim] / stride);
     reorg_shape.set(h_dim, reorg_shape[h_dim] / stride);
     reorg_shape.set(c_dim, reorg_shape[c_dim] * stride * stride);

     return reorg_shape;
 }

 /** Compute the shape of the reshaped weights
  *
  * Dimension 3 is divided by @p num_groups, the shape is collapsed with collapse(3), the first two
  * dimensions are swapped (adding one row when @p has_bias is set) and, for weights with fewer than
  * 5 dimensions, dimension 2 is set to @p num_groups.
  *
  * @param[in] weights    Weights tensor info
  * @param[in] has_bias   (Optional) Set to true if there is bias
  * @param[in] num_groups (Optional) Number of groups. Must be non-zero and divide weights.dimension(3)
  *
  * @return the calculated shape of the reshaped weights
  */
 inline TensorShape compute_weights_reshaped_shape(const ITensorInfo &weights, bool has_bias = false, unsigned int num_groups = 1)
 {
     // Number of groups greater than one are only supported for NCHW data layout, and the number of weights must be a multiple of it.
     ARM_COMPUTE_ERROR_ON(num_groups == 0);
     ARM_COMPUTE_ERROR_ON(weights.data_layout() == DataLayout::NHWC && num_groups > 1);
     ARM_COMPUTE_ERROR_ON((weights.dimension(3) % num_groups) != 0);

     TensorShape reshaped{ weights.tensor_shape() };
     reshaped.set(3, reshaped[3] / num_groups);
     reshaped.collapse(3);

     // Swap dimensions 0 and 1; the bias (if any) contributes one extra element to dimension 1
     const size_t collapsed_len = reshaped[0];
     const size_t bias_rows     = has_bias ? 1 : 0;
     reshaped.set(0, reshaped[1]);
     reshaped.set(1, collapsed_len + bias_rows);

     if(weights.num_dimensions() < 5)
     {
         reshaped.set(2, num_groups);
     }

     return reshaped;
 }

 /** Calculate the Left Hand Side matrix reshaped shape
  *
  * The input is split into blocks of m0 x k0 elements. The reshaped width is
  * m0 * k0 * ceil(width / k0) * v0 and the reshaped height is ceil(ceil(height / m0) / v0).
  * All ceil-divisions are done with integer arithmetic (DIV_CEIL) so the result stays exact for
  * dimensions that a float cannot represent (above 2^24).
  *
  * @param[in] a                       Input tensor info
  * @param[in] lhs_info                Left Hand Side matrix information. m0, k0 and v0 must be non-zero
  * @param[in] reinterpret_input_as_3d (Optional) Set to true if the input need to be interpreted as 3d.
  *                                    In that case the input height is dimension(1) * dimension(2) and
  *                                    dimension 2 is removed from the result when present
  *
  * @return the calculated shape
  */
 inline TensorShape compute_lhs_reshaped_shape(const ITensorInfo &a, const GEMMLHSMatrixInfo &lhs_info, bool reinterpret_input_as_3d = false)
 {
     ARM_COMPUTE_ERROR_ON(lhs_info.m0 == 0);
     ARM_COMPUTE_ERROR_ON(lhs_info.k0 == 0);
     ARM_COMPUTE_ERROR_ON(lhs_info.v0 == 0);

     // Input width/height
     const unsigned int input_width  = a.dimension(0);
     const unsigned int input_height = reinterpret_input_as_3d ? a.dimension(1) * a.dimension(2) : a.dimension(1);

     // Number of horizontal/vertical blocks in the input tensor.
     // Integer ceil-division avoids the rounding error of converting large dimensions to float.
     const unsigned int num_horiz_blocks = DIV_CEIL(input_width, lhs_info.k0);
     const unsigned int num_vert_blocks  = DIV_CEIL(input_height, lhs_info.m0);

     // Block size
     const unsigned int block_size = lhs_info.m0 * lhs_info.k0;

     // Output width/height
     const unsigned int output_width  = block_size * num_horiz_blocks * lhs_info.v0;
     const unsigned int output_height = DIV_CEIL(num_vert_blocks, lhs_info.v0);

     TensorShape lhs_shape{ a.tensor_shape() };
     lhs_shape.set(0, output_width);
     lhs_shape.set(1, output_height);

     if((reinterpret_input_as_3d) && (lhs_shape.num_dimensions() > 2))
     {
         // When the data format is NHWC and the shapes are Nx1x1
         // the tensor shape num_dimensions is automatically set to 1 instead of 3.
         // To avoid failures by removing a dimension that doesn't exist
         // check if the number of dimensions is greater than 2.
         lhs_shape.remove_dimension(2);
     }

     return lhs_shape;
 }

 /** Calculate the Right Hand Side matrix reshaped shape
  *
  * The input is split into blocks of n0 x k0 elements. The reshaped width is
  * n0 * k0 * ceil(height / k0) * h0 and the reshaped height is ceil(ceil(width / n0) / h0).
  * All ceil-divisions are done with integer arithmetic (DIV_CEIL) so the result stays exact for
  * dimensions that a float cannot represent (above 2^24).
  *
  * @param[in] a        Input tensor info
  * @param[in] rhs_info Right Hand Side matrix information. n0, k0 and h0 must be non-zero
  *
  * @return the calculated shape
  */
 inline TensorShape compute_rhs_reshaped_shape(const ITensorInfo &a, const GEMMRHSMatrixInfo &rhs_info)
 {
     ARM_COMPUTE_ERROR_ON(rhs_info.n0 == 0);
     ARM_COMPUTE_ERROR_ON(rhs_info.k0 == 0);
     ARM_COMPUTE_ERROR_ON(rhs_info.h0 == 0);

     // Input width/height
     const unsigned int input_width  = a.dimension(0);
     const unsigned int input_height = a.dimension(1);

     // Number of horizontal/vertical blocks in the input tensor.
     // Integer ceil-division avoids the rounding error of converting large dimensions to float.
     const unsigned int num_horiz_blocks = DIV_CEIL(input_width, rhs_info.n0);
     const unsigned int num_vert_blocks  = DIV_CEIL(input_height, rhs_info.k0);

     // Block size
     const unsigned int block_size = rhs_info.n0 * rhs_info.k0;

     // Output width/height
     const unsigned int output_width  = block_size * num_vert_blocks * rhs_info.h0;
     const unsigned int output_height = DIV_CEIL(num_horiz_blocks, rhs_info.h0);

     TensorShape rhs_shape{ a.tensor_shape() };
     rhs_shape.set(0, output_width);
     rhs_shape.set(1, output_height);

     return rhs_shape;
 }

 /** Calculate the interleaved shape of an input tensor
  *
  * With W = 4 * mult_interleave4x4_height the result is [ a_width * W, ceil(a_height / W) ], where
  * a_height is dimension(1), or dimension(1) * dimension(2) when the input is reinterpreted as 3d.
  * The ceil-division is done with integer arithmetic (DIV_CEIL) so the result stays exact for
  * heights that a float cannot represent (above 2^24).
  *
  * @param[in] a                         Input tensor info
  * @param[in] mult_interleave4x4_height (Optional) Interleave4x4 height. Must be at least 1
  * @param[in] reinterpret_input_as_3d   (Optional) Set to true if the input need to be interpreted as 3d.
  *                                      Dimension 2 is then removed from the result when present
  *
  * @return the calculated shape
  */
 inline TensorShape compute_interleaved_shape(const ITensorInfo &a, int mult_interleave4x4_height = 1, bool reinterpret_input_as_3d = false)
 {
     // The interleaved output matrix will have the following shape: [ a_width * W, ceil(a_height / W) ] where W = 4 * mult_interleave4x4_height
     ARM_COMPUTE_ERROR_ON(mult_interleave4x4_height < 1);
     const int   interleave_width = 4 * mult_interleave4x4_height;
     TensorShape shape_interleaved_a{ a.tensor_shape() };
     shape_interleaved_a.set(0, a.dimension(0) * interleave_width);
     if(reinterpret_input_as_3d)
     {
         const int M      = a.dimension(1) * a.dimension(2);
         const int height = DIV_CEIL(M, interleave_width);
         shape_interleaved_a.set(1, height);

         // When the data format is NHWC and the shapes are Nx1x1
         // the tensor shape num_dimensions is automatically set to 1 instead of 3.
         // To avoid failures by removing a dimension that doesn't exist
         // check if the number of dimensions is greater than 2.
         if(shape_interleaved_a.num_dimensions() > 2)
         {
             shape_interleaved_a.remove_dimension(2);
         }
     }
     else
     {
         // interleave_width is >= 1 here, so the conversion to size_t is value-preserving
         shape_interleaved_a.set(1, DIV_CEIL(a.dimension(1), static_cast<size_t>(interleave_width)));
     }

     return shape_interleaved_a;
 }

 /** Compute the shape of the reshaped weights used by depthwise convolution
  *
  * The result is the 2D shape [ height * width * c0, ceil(channels / c0) ].
  *
  * @param[in] input Input tensor info
  * @param[in] info  Depthwise convolution information to be used for reshaping; only c0 is read here.
  *
  * @return the calculated shape
  */
 inline TensorShape compute_reshaped_depthwise_weights_shape(const ITensorInfo &input, const DepthwiseConvolutionReshapeInfo &info)
 {
     const auto layout = input.data_layout();

     const int w_dim = get_data_layout_dimension_index(layout, DataLayoutDimension::WIDTH);
     const int h_dim = get_data_layout_dimension_index(layout, DataLayoutDimension::HEIGHT);
     const int c_dim = get_data_layout_dimension_index(layout, DataLayoutDimension::CHANNEL);

     const size_t channels = input.dimension(c_dim);
     const size_t rows     = input.dimension(h_dim);
     const size_t cols     = input.dimension(w_dim);

     // Start from an empty shape and fill in the two output dimensions
     TensorShape reshaped{};
     reshaped.set(0, rows * cols * info.c0);
     reshaped.set(1, DIV_CEIL(channels, info.c0));
     return reshaped;
 }

 /** Calculate the transposed 1xW shape
  *
  * The result is [ b_height * 16, ceil(b_width / 16) ]. The ceil-division is done with integer
  * arithmetic (DIV_CEIL) so the result stays exact for widths that a float cannot represent
  * (above 2^24).
  *
  * @param[in] b Input tensor info
  *
  * @return the calculated shape
  */
 inline TensorShape compute_transpose1xW_shape(const ITensorInfo &b)
 {
     // The transpose1xW output matrix will have the following shape: [ b_height * 16, ceil(b_width / 16) ]
     constexpr size_t transpose_width = 16;

     TensorShape shape_transposed1xW_b{ b.tensor_shape() };
     shape_transposed1xW_b.set(0, b.dimension(1) * transpose_width);
     shape_transposed1xW_b.set(1, DIV_CEIL(b.dimension(0), transpose_width));

     return shape_transposed1xW_b;
 }

 /** Calculate the transposed 1xW width element shape
  *
  * With W = (16 / element size of the tensor) * mult_transpose1xW_width the result is
  * [ b_height * W, ceil(b_width / W) ]. The ceil-division is done with integer arithmetic
  * (DIV_CEIL) so the result stays exact for widths that a float cannot represent (above 2^24).
  *
  * @param[in] b                       Input tensor info
  * @param[in] mult_transpose1xW_width (Optional) Transpose1xW width. Must be at least 1
  *
  * @return the calculated shape
  */
 inline TensorShape compute_transpose1xW_with_element_size_shape(const ITensorInfo &b, int mult_transpose1xW_width = 1)
 {
     // Note: mult_transpose1xW_width expresses the number of chunks with size 1x(W) we want to store on the same row
     //       The transpose1xW output matrix will have the following shape:
     //       [ b_height * W, ceil(b_width / W) ] where W = (16 / element size of the tensor) * mult_transpose1xW_width
     ARM_COMPUTE_ERROR_ON(mult_transpose1xW_width < 1);
     TensorShape  shape_transposed1xW_b{ b.tensor_shape() };
     const size_t transpose_width = (16 / b.element_size()) * mult_transpose1xW_width;
     shape_transposed1xW_b.set(0, b.dimension(1) * transpose_width);
     // Integer ceil-division: no float rounding for large widths
     shape_transposed1xW_b.set(1, DIV_CEIL(b.dimension(0), transpose_width));

     return shape_transposed1xW_b;
 }

 /** Compute the reductionA shape used in GEMMLowp
  *
  * The result is the shape of @p b with dimension 1 removed, when such a dimension exists.
  *
  * @param[in] b Input tensor info
  *
  * @return the calculated shape
  */
 inline TensorShape compute_reductionA_shape(const ITensorInfo &b)
 {
     TensorShape sum_col_shape{ b.tensor_shape() };

     // Nothing to drop for shapes with at most one dimension
     if(sum_col_shape.num_dimensions() <= 1)
     {
         return sum_col_shape;
     }

     sum_col_shape.remove_dimension(1);
     return sum_col_shape;
 }

 /** Compute the reductionB shape used in GEMMLowp
  *
  * Dimension X is overwritten with dimension 1 of @p a, then dimension 1 is removed when the
  * resulting shape still has more than one dimension.
  *
  * @param[in] a Input tensor info
  *
  * @return the calculated shape
  */
 inline TensorShape compute_reductionB_shape(const ITensorInfo &a)
 {
     TensorShape sum_row_shape{ a.tensor_shape() };
     sum_row_shape.set(Window::DimX, a.dimension(1));

     // The dimension count is checked after the set() above, as in the original sequence
     const bool has_second_dim = sum_row_shape.num_dimensions() > 1;
     if(has_second_dim)
     {
         sum_row_shape.remove_dimension(1);
     }

     return sum_row_shape;
 }

 /** Compute the Col2Im output shape
  *
  * Width and height are taken from @p convolved_dims and the channel dimension is set to
  * dimension 0 of the input multiplied by @p num_groups.
  *
  * @param[in] input           Input tensor info. Dimension 1 must equal the area of @p convolved_dims
  * @param[in] convolved_dims  Convolved dimensions
  * @param[in] batch_size_on_z True if batch size is on z axis
  * @param[in] num_groups      (Optional) Number of groups when performing a grouped convolution. Must be non-zero
  *
  * @return the calculated shape
  */
 inline TensorShape compute_col2im_shape(const ITensorInfo &input, const Size2D &convolved_dims, bool batch_size_on_z, unsigned int num_groups = 1)
 {
     ARM_COMPUTE_ERROR_ON(num_groups == 0);
     ARM_COMPUTE_ERROR_ON(input.tensor_shape()[1] != (convolved_dims.area()));
     ARM_COMPUTE_ERROR_ON((num_groups > 1) && input.tensor_shape()[2] != num_groups);

     const DataLayout layout = input.data_layout();
     const int        w_dim  = get_data_layout_dimension_index(layout, DataLayoutDimension::WIDTH);
     const int        h_dim  = get_data_layout_dimension_index(layout, DataLayoutDimension::HEIGHT);
     const int        c_dim  = get_data_layout_dimension_index(layout, DataLayoutDimension::CHANNEL);

     TensorShape result{ input.tensor_shape() };

     // If batches start on 3rd dimension shift dimensions right by 1 to retain upper tensor shape,
     // as the first three will be overridden by H,W,C data
     const bool shift_for_batches = batch_size_on_z && (num_groups == 1);
     if(shift_for_batches)
     {
         result.shift_right(1);
     }

     result.set(w_dim, convolved_dims.width);
     result.set(h_dim, convolved_dims.height);
     result.set(c_dim, input.tensor_shape()[0] * num_groups);

     return result;
 }

 /** Compute the shape of a tensor with its first two dimensions swapped
  *
  * @param[in] input Input tensor info
  *
  * @return the calculated shape
  */
 inline TensorShape compute_transposed_shape(const ITensorInfo &input)
 {
     // Read both extents from the input up front, then write them back crossed over
     const auto extent0 = input.dimension(0);
     const auto extent1 = input.dimension(1);

     TensorShape swapped{ input.tensor_shape() };
     swapped.set(0, extent1);
     swapped.set(1, extent0);

     return swapped;
 }

 /** Compute the output shape of a depthwise convolution
  *
  * Width and height come from scaled_dimensions(); the channel dimension is the input channel
  * count multiplied by @p depth_multiplier. Width/height indices are resolved separately for the
  * input and the weights, each according to its own data layout.
  *
  * @param[in] input            Input tensor info
  * @param[in] weights          Weights tensor info
  * @param[in] conv_info        Padding and stride information to use for the convolution.
  * @param[in] depth_multiplier Multiplier to apply to the input's depth in order to retrieve the output's depth.
  * @param[in] dilation         Dilation, in elements, across x and y. Defaults to (1, 1).
  *
  * @return the calculated shape
  */
 inline TensorShape compute_depthwise_convolution_shape(const ITensorInfo &input, const ITensorInfo &weights, PadStrideInfo conv_info, unsigned int depth_multiplier,
                                                        const Size2D &dilation = Size2D(1U, 1U))
 {
     const TensorShape &in_shape     = input.tensor_shape();
     const TensorShape &kernel_shape = weights.tensor_shape();

     const DataLayout in_layout = input.data_layout();
     const int        w_dim     = get_data_layout_dimension_index(in_layout, DataLayoutDimension::WIDTH);
     const int        h_dim     = get_data_layout_dimension_index(in_layout, DataLayoutDimension::HEIGHT);
     const int        c_dim     = get_data_layout_dimension_index(in_layout, DataLayoutDimension::CHANNEL);

     const DataLayout kernel_layout = weights.data_layout();
     const int        kernel_w_dim  = get_data_layout_dimension_index(kernel_layout, DataLayoutDimension::WIDTH);
     const int        kernel_h_dim  = get_data_layout_dimension_index(kernel_layout, DataLayoutDimension::HEIGHT);

     // first = output width, second = output height
     const std::pair<unsigned int, unsigned int> conv_dims = scaled_dimensions(in_shape[w_dim], in_shape[h_dim],
                                                                               kernel_shape[kernel_w_dim], kernel_shape[kernel_h_dim],
                                                                               conv_info, dilation);

     TensorShape result{ in_shape };
     result.set(w_dim, conv_dims.first);
     result.set(h_dim, conv_dims.second);
     result.set(c_dim, in_shape[c_dim] * depth_multiplier);

     return result;
 }

 /** Compute the upsampled shape used for deconvolution
  *
  * The upsampled width/height are (input - 1) * stride + 1, extended by the padding needed for a
  * stride-1 convolution with @p weights to produce @p out_dims. The padding is written to
  * @p padx and @p pady.
  *
  * @param[in]  input    Input tensor info
  * @param[in]  weights  Weights tensor info
  * @param[in]  sx       Stride on x axis
  * @param[in]  sy       Stride on y axis
  * @param[in]  out_dims Output shape dimensions (first = x, second = y); only read by this function
  * @param[out] padx     Padding on x axis
  * @param[out] pady     Padding on y axis
  *
  * @return the calculated shape
  */
 inline TensorShape compute_deconvolution_upsampled_shape(const ITensorInfo &input, const ITensorInfo &weights, unsigned int sx, unsigned int sy,
                                                          std::pair<unsigned int, unsigned int> &out_dims, uint32_t &padx, uint32_t &pady)
 {
     const DataLayout layout = input.data_layout();
     const size_t     w_dim  = get_data_layout_dimension_index(layout, DataLayoutDimension::WIDTH);
     const size_t     h_dim  = get_data_layout_dimension_index(layout, DataLayoutDimension::HEIGHT);

     // Upsampled dimensions before padding
     unsigned int upsampled_w = (input.dimension(w_dim) - 1) * sx + 1;
     unsigned int upsampled_h = (input.dimension(h_dim) - 1) * sy + 1;

     // Padding needed for the convolution with stride 1 in order to match the requested output shape
     padx = out_dims.first - (upsampled_w - weights.dimension(w_dim) + 1);
     pady = out_dims.second - (upsampled_h - weights.dimension(h_dim) + 1);

     upsampled_w = upsampled_w + padx;
     upsampled_h = upsampled_h + pady;

     TensorShape upsampled_shape(input.tensor_shape());
     upsampled_shape.set(w_dim, upsampled_w);
     upsampled_shape.set(h_dim, upsampled_h);

     return upsampled_shape;
 }

 /** Compute the output shape of the deconvolution layer
  *
  * Width and height are taken from @p out_dims. The channel dimension is read from the weights
  * shape at the index of the batches dimension of the input data layout.
  *
  * @param[in] out_dims Output x and y shape dimensions
  * @param[in] input    Input tensor info
  * @param[in] weights  Weights tensor info
  *
  * @return the calculated shape
  */
 inline TensorShape compute_deconvolution_output_shape(const std::pair<unsigned int, unsigned int> &out_dims, const ITensorInfo &input, const ITensorInfo &weights)
 {
     const TensorShape &in_shape     = input.tensor_shape();
     const TensorShape &kernel_shape = weights.tensor_shape();

     const DataLayout layout = input.data_layout();
     const int        w_dim  = get_data_layout_dimension_index(layout, DataLayoutDimension::WIDTH);
     const int        h_dim  = get_data_layout_dimension_index(layout, DataLayoutDimension::HEIGHT);
     const int        c_dim  = get_data_layout_dimension_index(layout, DataLayoutDimension::CHANNEL);
     const int        n_dim  = get_data_layout_dimension_index(layout, DataLayoutDimension::BATCHES);

     TensorShape result{ in_shape };
     result.set(w_dim, out_dims.first);
     result.set(h_dim, out_dims.second);
     result.set(c_dim, kernel_shape[n_dim]);
     return result;
 }

 /** Compute the im2col output shape of a tensor
  *
  * Dimension 0 becomes channels / num_groups * kernel area (plus one when @p has_bias is set) and
  * dimension 1 becomes the number of convolved output elements. Dimension 2 is removed when
  * @p batch_size_on_z is set and the shape has at least 3 dimensions, otherwise it is set to
  * @p num_groups.
  *
  * @param[in] input           Input tensor info
  * @param[in] kernel_dims     The kernel dimensions (width and height).
  * @param[in] conv_info       Contains padding and stride information
  * @param[in] has_bias        In case biases are provided expands the matrix with 1
  * @param[in] dilation        Dilation, in elements, across x and y
  * @param[in] batch_size_on_z True if batch size is on z axis
  * @param[in] num_groups      (Optional) Number of groups when performing a grouped convolution. Must be non-zero
  *
  * @return the calculated shape
  */
 inline TensorShape compute_im2col_conv_shape(const ITensorInfo *input, const Size2D &kernel_dims, const PadStrideInfo &conv_info, bool has_bias, const Size2D &dilation, bool batch_size_on_z,
                                              unsigned int num_groups = 1)
 {
     // The output shape will be the 3D shape [ out_channels * kernel_area, num_elems_per_out_channel, batches ]                           if batch_size_on_z == true
     //                       or the 4D shape [ out_channels * kernel_area / num_groups, num_elems_per_out_channel, num_groups, batches ]  if batch_size_on_z == false

     ARM_COMPUTE_ERROR_ON(num_groups == 0);
     ARM_COMPUTE_ERROR_ON(num_groups > 1 && input->data_layout() != DataLayout::NCHW);
     ARM_COMPUTE_ERROR_ON(num_groups > 1 && batch_size_on_z);

     TensorShape im2col_shape{ input->tensor_shape() };

     const DataLayout layout = input->data_layout();
     const int        w_dim  = get_data_layout_dimension_index(layout, DataLayoutDimension::WIDTH);
     const int        h_dim  = get_data_layout_dimension_index(layout, DataLayoutDimension::HEIGHT);
     const int        c_dim  = get_data_layout_dimension_index(layout, DataLayoutDimension::CHANNEL);

     // Both values below are read from the still unmodified copy of the input shape
     const std::pair<unsigned int, unsigned int> conv_dims = scaled_dimensions(im2col_shape[w_dim], im2col_shape[h_dim], kernel_dims.width, kernel_dims.height, conv_info, dilation);
     const auto patch_length = (im2col_shape[c_dim] / num_groups * kernel_dims.area() + (has_bias ? 1 : 0)); // NOLINT

     im2col_shape.set(0, patch_length);
     im2col_shape.set(1, (conv_dims.first * conv_dims.second));

     if(!batch_size_on_z || im2col_shape.num_dimensions() < 3)
     {
         im2col_shape.set(2, num_groups);
     }
     else
     {
         im2col_shape.remove_dimension(2);
     }

     return im2col_shape;
 }

 /** Compute the flattened shape of a tensor
  *
  * Used for FlattenLayer and FullyConnectedLayer: the result is the input shape after collapse(3),
  * i.e. [ width * height * channels, num_batches, ... ].
  *
  * @param[in] input Input tensor info
  *
  * @return the calculated shape
  */
 inline TensorShape compute_flatten_shape(const ITensorInfo *input)
 {
     TensorShape flattened{ input->tensor_shape() };
     flattened.collapse(3);
     return flattened;
 }

 /** Compute the 2D shape used by softmax
  *
  * The output shape will be a 2D version of the input. For instance:
  * - [x,y,z] and axis 1 will return [x, y*z]
  * - [x,y,z,w] and axis 2 will return [x*y, w*z]
  * - [x,y,z,w] and axis 3 will return [x*y*z, w]
  *
  * @param[in] input Input tensor info
  * @param[in] axis  (Optional) Softmax axis
  *
  * @return the calculated shape
  */
 inline TensorShape compute_softmax_shape(const ITensorInfo *input, size_t axis = 1)
 {
     TensorShape flat = input->tensor_shape();

     const bool axis_in_range = axis < input->num_dimensions();
     if(!axis_in_range)
     {
         // Axis beyond the input rank: collapse everything
         flat.collapse(flat.num_dimensions());
     }
     else
     {
         // Collapse from axis onward (this changes the shape)
         flat.collapse_from(axis);

         // Collapse the rest (collapse is inclusive)
         flat.collapse(flat.num_dimensions() - 1);
     }

     if(axis == 0)
     {
         // If axis is zero the first dim should be one. Since
         // collapse is an inclusive operation we need to shift
         flat.shift_right(1);
     }

     return flat;
 }

 /** Compute the winograd filter transform shape
  *
  * The width dimension is removed from a copy of the input shape, then X is set to
  * input.dimension(3), Y to the input channel count and Z to the area of the input tile
  * (output tile size + kernel size - 1 along each axis).
  *
  * @param[in] input         Input tensor info
  * @param[in] winograd_info Winograd information
  *
  * @return the calculated shape
  */
 inline TensorShape compute_winograd_filter_transform_shape(const ITensorInfo &input, const WinogradInfo &winograd_info)
 {
     const Size2D &kernel      = winograd_info.kernel_size;
     const Size2D &output_tile = winograd_info.output_tile_size;
     const Size2D  input_tile  = Size2D(output_tile.width + kernel.width - 1, output_tile.height + kernel.height - 1);

     TensorShape transformed{ input.tensor_shape() };
     transformed.remove_dimension(get_data_layout_dimension_index(input.data_layout(), DataLayoutDimension::WIDTH));
     transformed.set(Window::DimX, input.dimension(3));
     transformed.set(Window::DimY, input.dimension(get_data_layout_dimension_index(input.data_layout(), DataLayoutDimension::CHANNEL)));
     transformed.set(Window::DimZ, input_tile.area());

     return transformed;
 }

 /** Compute the winograd input transform shape
  *
  * The first three dimensions of the result are [ channels, number of tiles, input tile area ],
  * where the input tile is output tile size + kernel size - 1 along each axis and the number of
  * tiles comes from compute_winograd_convolution_tiles().
  *
  * @param[in] input         Input tensor info
  * @param[in] winograd_info Winograd information
  *
  * @return the calculated shape
  */
 inline TensorShape compute_winograd_input_transform_shape(const ITensorInfo &input, const WinogradInfo &winograd_info)
 {
     const PadStrideInfo &conv_info   = winograd_info.convolution_info;
     const Size2D        &kernel      = winograd_info.kernel_size;
     const Size2D        &output_tile = winograd_info.output_tile_size;
     const Size2D         input_tile  = Size2D(output_tile.width + kernel.width - 1, output_tile.height + kernel.height - 1);

     const DataLayout layout = input.data_layout();
     const size_t     w_dim  = get_data_layout_dimension_index(layout, DataLayoutDimension::WIDTH);
     const size_t     h_dim  = get_data_layout_dimension_index(layout, DataLayoutDimension::HEIGHT);
     const size_t     c_dim  = get_data_layout_dimension_index(layout, DataLayoutDimension::CHANNEL);

     const TensorShape &in_shape = input.tensor_shape();

     // Number of output tiles along the x and y direction of size "output_tile"
     const Size2D tiles = compute_winograd_convolution_tiles(Size2D(in_shape[w_dim], in_shape[h_dim]),
                                                             kernel,
                                                             output_tile,
                                                             conv_info);

     const unsigned int out_dim0 = in_shape[c_dim];
     const unsigned int out_dim1 = tiles.area();
     const unsigned int out_dim2 = input_tile.area();

     TensorShape transformed{ in_shape };
     transformed.set(0, out_dim0);
     transformed.set(1, out_dim1);
     transformed.set(2, out_dim2);

     return transformed;
 }

 /** Compute the winograd output transform shape
  *
  * Width and height come from scaled_dimensions() applied to the input dimensions and kernel size
  * stored in @p winograd_info; the channel dimension is dimension 0 of @p input. Dimension indices
  * follow the output data layout stored in @p winograd_info.
  *
  * @param[in] input         Input tensor info
  * @param[in] winograd_info Winograd information
  *
  * @return the calculated shape
  */
 inline TensorShape compute_winograd_output_transform_shape(const ITensorInfo &input, const WinogradInfo &winograd_info)
 {
     const PadStrideInfo &conv_info  = winograd_info.convolution_info;
     const Size2D        &kernel     = winograd_info.kernel_size;
     const Size2D        &in_dims    = winograd_info.input_dimensions;
     const DataLayout     out_layout = winograd_info.output_data_layout;

     // first = output width, second = output height
     const std::pair<unsigned int, unsigned int> conv_dims = scaled_dimensions(in_dims.width, in_dims.height,
                                                                               kernel.width, kernel.height, conv_info);

     const unsigned int width    = conv_dims.first;
     const unsigned int height   = conv_dims.second;
     const unsigned int channels = input.dimension(0);

     TensorShape transformed{ input.tensor_shape() };
     transformed.set(get_data_layout_dimension_index(out_layout, DataLayoutDimension::WIDTH), width);
     transformed.set(get_data_layout_dimension_index(out_layout, DataLayoutDimension::HEIGHT), height);
     transformed.set(get_data_layout_dimension_index(out_layout, DataLayoutDimension::CHANNEL), channels);

     return transformed;
 }

 /** Compute the output shape of a deep convolution
  *
  * Width and height come from scaled_dimensions(); the channel dimension is set to dimension 3 of
  * the weights shape. The weights width/height are looked up with the indices of the input data layout.
  *
  * @param[in] input     Input tensor info
  * @param[in] weights   Weights tensor info
  * @param[in] conv_info Contains padding and stride information
  *
  * @return the calculated shape
  */
 inline TensorShape compute_deep_convolution_shape(const ITensorInfo &input, const ITensorInfo &weights, PadStrideInfo conv_info)
 {
     const TensorShape &in_shape     = input.tensor_shape();
     const TensorShape &kernel_shape = weights.tensor_shape();

     const size_t w_dim = get_data_layout_dimension_index(input.data_layout(), DataLayoutDimension::WIDTH);
     const size_t h_dim = get_data_layout_dimension_index(input.data_layout(), DataLayoutDimension::HEIGHT);
     const size_t c_dim = get_data_layout_dimension_index(input.data_layout(), DataLayoutDimension::CHANNEL);

     const unsigned int in_w         = in_shape[w_dim];
     const unsigned int in_h         = in_shape[h_dim];
     const unsigned int kernel_w     = kernel_shape[w_dim];
     const unsigned int kernel_h     = kernel_shape[h_dim];
     const unsigned int out_channels = kernel_shape[3];

     // first = output width, second = output height
     const std::pair<unsigned int, unsigned int> conv_dims = scaled_dimensions(in_w, in_h, kernel_w, kernel_h, conv_info);

     TensorShape result{ in_shape };
     result.set(w_dim, conv_dims.first);
     result.set(h_dim, conv_dims.second);
     result.set(c_dim, out_channels);

     return result;
 }

 /** Calculate the min/max output shape of a tensor
  *
  * The X dimension is set to 2 and dimension 1 is then removed twice, so the two dimensions
  * that followed X in the input are dropped.
  *
  * @param[in] input Input tensor info
  *
  * @return the calculated shape
  */
 inline TensorShape compute_min_max_shape(const ITensorInfo *input)
 {
     TensorShape min_max_shape{ input->tensor_shape() };

     // X holds two values
     min_max_shape.set(Window::DimX, 2);

     // Drop the dimension at index 1 twice; the second pass removes what was originally index 2
     for(int pass = 0; pass < 2; ++pass)
     {
         min_max_shape.remove_dimension(1);
     }

     return min_max_shape;
 }

 /** Calculate the output shape of a pooling operation
  *
  * Only the width and height dimensions (located through the input data layout) are changed.
  *
  * @param[in] input     Input tensor info
  * @param[in] pool_info Pooling layer info
  *
  * @return the calculated shape
  */
 inline TensorShape compute_pool_shape(const ITensorInfo &input, PoolingLayerInfo pool_info)
 {
     TensorShape output_shape{ input.tensor_shape() };

     const auto         layout = input.data_layout();
     const unsigned int w_idx  = get_data_layout_dimension_index(layout, DataLayoutDimension::WIDTH);
     const unsigned int h_idx  = get_data_layout_dimension_index(layout, DataLayoutDimension::HEIGHT);

     // Start from the configured window; global pooling replaces it with the full input plane
     unsigned int window_w = pool_info.pool_size.width;
     unsigned int window_h = pool_info.pool_size.height;
     if(pool_info.is_global_pooling)
     {
         window_w = output_shape[w_idx];
         window_h = output_shape[h_idx];
     }

     // first = pooled width, second = pooled height
     const auto pooled = scaled_dimensions(output_shape[w_idx],
                                           output_shape[h_idx],
                                           window_w,
                                           window_h,
                                           pool_info.pad_stride_info);

     output_shape.set(w_idx, pooled.first);
     output_shape.set(h_idx, pooled.second);

     return output_shape;
 }

 /** Calculate the output shape of an unpooling operation
  *
  * Each spatial extent is computed as (in - 1) * stride - pad_before - pad_after + pool_size.
  *
  * @param[in] input     Input tensor info; width and height must both be greater than 1 (asserted)
  * @param[in] pool_info Pooling layer info
  *
  * @return the calculated shape
  */
 inline TensorShape compute_unpool_shape(const ITensorInfo &input, PoolingLayerInfo pool_info)
 {
     const auto         layout      = input.data_layout();
     const unsigned int idx_width   = get_data_layout_dimension_index(layout, DataLayoutDimension::WIDTH);
     const unsigned int idx_height  = get_data_layout_dimension_index(layout, DataLayoutDimension::HEIGHT);
     const TensorShape  input_shape = input.tensor_shape();
     ARM_COMPUTE_ERROR_ON(input_shape[idx_height] <= 1 || input_shape[idx_width] <= 1);

     const PadStrideInfo &ps_info = pool_info.pad_stride_info;

     // first = stride along x, second = stride along y
     const auto         strides = ps_info.stride();
     const unsigned int step_x  = strides.first;
     const unsigned int step_y  = strides.second;

     // Paddings are held as int before entering the size computation
     const int left   = ps_info.pad_left();
     const int top    = ps_info.pad_top();
     const int right  = ps_info.pad_right();
     const int bottom = ps_info.pad_bottom();

     const unsigned int unpooled_w = (input_shape[idx_width] - 1) * step_x - left - right + pool_info.pool_size.width;
     const unsigned int unpooled_h = (input_shape[idx_height] - 1) * step_y - top - bottom + pool_info.pool_size.height;

     TensorShape unpooled = input_shape;
     unpooled.set(idx_width, unpooled_w);
     unpooled.set(idx_height, unpooled_h);
     return unpooled;
 }

 /** Calculate the output shape of a ROI align operation
  *
  * Width and height become the pooled width/height from @p pool_info; dimension 3 becomes
  * dimension 1 of @p rois. The remaining dimensions are copied from @p input.
  *
  * @param[in] input     Input tensor info
  * @param[in] rois      Rois tensor info
  * @param[in] pool_info Pooling layer info
  *
  * @return the calculated shape
  */
 inline TensorShape compute_roi_align_shape(const ITensorInfo &input, const ITensorInfo &rois, ROIPoolingLayerInfo pool_info)
 {
     const auto         layout = input.data_layout();
     const unsigned int w_idx  = get_data_layout_dimension_index(layout, DataLayoutDimension::WIDTH);
     const unsigned int h_idx  = get_data_layout_dimension_index(layout, DataLayoutDimension::HEIGHT);

     TensorShape aligned{ input.tensor_shape() };

     // Spatial extents come from the pooling configuration
     aligned.set(w_idx, pool_info.pooled_width());
     aligned.set(h_idx, pool_info.pooled_height());

     // Dimension 3 of the output mirrors dimension 1 of the rois tensor
     aligned.set(3, rois.dimension(1));

     return aligned;
 }

 /** Calculate the RNN shape of a tensor
  *
  * Copies the input shape and overwrites dimension 1 with @p batch_size.
  *
  * @param[in] input      Input tensor info
  * @param[in] batch_size Batch size
  *
  * @return the calculated shape
  */
 inline TensorShape compute_rnn_shape(const ITensorInfo *input, const unsigned int batch_size)
 {
     TensorShape rnn_shape{ input->tensor_shape() };

     // Dimension 1 carries the batch
     rnn_shape.set(1, batch_size);
     return rnn_shape;
 }

 /** Calculate the matrix multiplication output shape of two tensors
  *
  * Dimensions 0..4 of the result are overwritten; the result starts as a copy of the shape of @p input0.
  *
  * @param[in] input0                    First input tensor info (at most 4 dimensions, asserted)
  * @param[in] input1                    Second input tensor info
  * @param[in] is_interleaved_transposed True if the input is interleaved transposed; N and M are then read from @p reshape_info
  * @param[in] reshape_info              GEMM reshape info
  *
  * @return the calculated shape
  */
 inline TensorShape compute_mm_shape(const ITensorInfo &input0, const ITensorInfo &input1, bool is_interleaved_transposed, const GEMMReshapeInfo &reshape_info)
 {
     ARM_COMPUTE_ERROR_ON_MSG(input0.num_dimensions() > 4, "The number of dimensions for the matrix A must be <= 4");
     ARM_COMPUTE_ERROR_ON_MSG(is_interleaved_transposed && reshape_info.reinterpret_input_as_3d(), "The first input tensor cannot be reinterpreted as 3D if is_interleaved_transposed is true");

     const bool input_is_3d  = reshape_info.reinterpret_input_as_3d();
     const bool output_is_3d = reshape_info.depth_output_gemm3d() != 0;

     // Depth by which the rows are divided; stays 1 when the output is not reinterpreted as 3D
     int out_depth = 1;
     if(output_is_3d)
     {
         out_depth = reshape_info.depth_output_gemm3d();
     }

     // Rows of input0: dimensions 1 and 2 are collapsed when the input is reinterpreted as 3D
     int rows = input0.dimension(1);
     if(input_is_3d)
     {
         rows = input0.dimension(1) * input0.dimension(2);
     }

     // Columns come from input1 unless the matrices were reshaped, in which case the reshape info is authoritative
     int cols = input1.dimension(0);
     if(is_interleaved_transposed)
     {
         cols = reshape_info.n();
         rows = reshape_info.m();
     }

     // If the output of GEMM has to be reinterpreted as 3D, the rows are split across out_depth slices
     const int rows_per_slice = rows / out_depth;

     // Remaining (batch) dimensions of input0, shifted down by one when the input is 3D
     const int batch_lo = input_is_3d ? input0.tensor_shape()[3] : input0.tensor_shape()[2];
     int       batch_hi = 1;
     if(!input_is_3d)
     {
         batch_hi = input0.tensor_shape()[3];
     }

     TensorShape result{ input0.tensor_shape() };
     result.set(0, cols);
     result.set(1, rows_per_slice);
     if(output_is_3d)
     {
         // The slice depth is inserted at dimension 2 and the batch dimensions move up by one
         result.set(2, out_depth);
         result.set(3, batch_lo);
         result.set(4, batch_hi);
     }
     else
     {
         result.set(2, batch_lo);
         result.set(3, batch_hi);
         result.set(4, 1);
     }

     return result;
 }

 /** Calculate the matrix multiplication output shape of two tensors
  *
  * N and M are always read from @p gemm_info; @p input1 is not used.
  *
  * @param[in] input0    First input tensor info (at most 4 dimensions, asserted)
  * @param[in] input1    Second input tensor info (unused)
  * @param[in] gemm_info GEMM reshape info
  *
  * @return the calculated shape
  */
 inline TensorShape compute_mm_shape(const ITensorInfo &input0, const ITensorInfo &input1, const GEMMReshapeInfo &gemm_info)
 {
     ARM_COMPUTE_UNUSED(input1);
     ARM_COMPUTE_ERROR_ON_MSG(input0.num_dimensions() > 4, "The number of dimensions for the matrix A must be <= 4");

     const bool input_is_3d  = gemm_info.reinterpret_input_as_3d();
     const bool output_is_3d = gemm_info.depth_output_gemm3d() != 0;

     TensorShape result{ input0.tensor_shape() };

     // Dimension 0 is N in every case
     result.set(0, gemm_info.n());

     // Plain 2D GEMM: only N and M are written
     if(!(input_is_3d || output_is_3d))
     {
         result.set(1, gemm_info.m());
         return result;
     }

     // If the output of GEMM has to be reinterpreted as 3D, the number of input0 rows (M) is obtained collapsing
     // the second and third dimension of the output tensor
     const int out_depth  = output_is_3d ? gemm_info.depth_output_gemm3d() : 1;
     const int batch_size = input_is_3d ? input0.tensor_shape()[3] : input0.tensor_shape()[2];

     result.set(1, gemm_info.m() / out_depth);
     if(output_is_3d)
     {
         result.set(2, out_depth);
         result.set(3, batch_size);
     }
     else
     {
         result.set(2, batch_size);
         result.set(3, 1);
     }

     return result;
 }

 /** Calculate the matrix multiplication output shape of two tensors
  *
  * N and M are always read from @p gemm_info; @p input1 is not used.
  *
  * @param[in] input0    First input tensor info (at most 4 dimensions, asserted)
  * @param[in] input1    Second input tensor info (unused)
  * @param[in] gemm_info GEMM kernel info used to retrieve the original dimensions of the input matrices
  *
  * @return the calculated shape
  */
 inline TensorShape compute_mm_shape(const ITensorInfo &input0, const ITensorInfo &input1, const GEMMKernelInfo &gemm_info)
 {
     ARM_COMPUTE_UNUSED(input1);
     ARM_COMPUTE_ERROR_ON_MSG(input0.num_dimensions() > 4, "The number of dimensions for the matrix A must be <= 4");

     const bool input_is_3d  = gemm_info.reinterpret_input_as_3d;
     const bool output_is_3d = gemm_info.depth_output_gemm3d != 0;

     TensorShape result{ input0.tensor_shape() };

     // Dimension 0 is N in every case
     result.set(0, gemm_info.n);

     // Plain 2D GEMM: only N and M are written
     if(!(input_is_3d || output_is_3d))
     {
         result.set(1, gemm_info.m);
         return result;
     }

     // If the output of GEMM has to be reinterpreted as 3D, the number of input0 rows (M) is obtained collapsing
     // the second and third dimension of the output tensor
     const unsigned int out_depth  = output_is_3d ? gemm_info.depth_output_gemm3d : 1;
     const unsigned int batch_size = input_is_3d ? input0.tensor_shape()[3] : input0.tensor_shape()[2];

     result.set(1, gemm_info.m / out_depth);
     if(output_is_3d)
     {
         result.set(2, out_depth);
         result.set(3, batch_size);
     }
     else
     {
         result.set(2, batch_size);
         result.set(3, 1);
     }

     return result;
 }

 /** Calculate the output shape of the output stage
  *
  * When @p gemm_3d_depth is 1 (or 0) the input shape is returned unchanged. Otherwise the Y dimension
  * of the input is divided by @p gemm_3d_depth and the depth is stored in dimension 2.
  *
  * @param[in] input           Input tensor info (must be NHWC when @p gemm_3d_depth is greater than 1, asserted)
  * @param[in] gemm_3d_depth   (Optional)  GEMM 3d depth
  * @param[in] batch_size_on_z (Optional) True if batch size is on z axis
  *
  * @return the calculated shape
  */
 inline TensorShape compute_output_stage_shape(const ITensorInfo &input, unsigned int gemm_3d_depth = 1, bool batch_size_on_z = false)
 {
     ARM_COMPUTE_ERROR_ON(input.data_layout() != DataLayout::NHWC && gemm_3d_depth > 1);

     TensorShape staged = input.tensor_shape();

     // Nothing to reinterpret: hand back the input shape
     if(gemm_3d_depth <= 1)
     {
         return staged;
     }

     // Shift every dimension up by one when the batch lives on z
     if(batch_size_on_z)
     {
         staged.shift_right(1);
     }

     // X and Y are always read from the untouched input shape, not from the shifted copy
     staged.set(0, input.tensor_shape().x());
     staged.set(1, input.tensor_shape().y() / gemm_3d_depth);
     staged.set(2, gemm_3d_depth);

     return staged;
 }

 /** Calculate the strided slice output shape of a tensor
  *
  * Thin wrapper that forwards the shape of @p input, together with all slicing parameters, to
  * helpers::tensor_transform::compute_strided_slice_output_shape().
  *
  * @param[in] input            Input tensor info
  * @param[in] starts           The starts of the dimensions of the input tensor to be sliced
  * @param[in] ends             The ends of the dimensions of the input tensor to be sliced
  * @param[in] strides          The strides of the dimensions of the input tensor to be sliced
  * @param[in] begin_mask       If the ith bit of begin_mask is set, starts[i] is ignored and the fullest possible range in that dimension is used instead.
  * @param[in] end_mask         If the ith bit of end_mask is set, ends[i] is ignored and the fullest possible range in that dimension is used instead.
  * @param[in] shrink_axis_mask If the ith bit of shrink_axis_mask is set, it implies that the ith specification shrinks the dimensionality by 1
  *
  * @return the calculated shape
  */
 inline TensorShape compute_strided_slice_shape(const ITensorInfo &input,
                                                const Coordinates &starts, const Coordinates &ends, const Coordinates &strides,
                                                int32_t begin_mask, int32_t end_mask, int32_t shrink_axis_mask)
 {
     using namespace arm_compute::helpers::tensor_transform;

     const TensorShape &source_shape = input.tensor_shape();
     return compute_strided_slice_output_shape(source_shape,
                                               starts, ends, strides,
                                               begin_mask, end_mask, shrink_axis_mask);
 }

 /** Calculate the slice output shape of a tensor
  *
  * Implemented as a strided slice with default-constructed strides, a zero begin mask, a zero
  * shrink-axis mask and an end mask built by construct_slice_end_mask() from @p ends.
  *
  * @param[in] input_shape Input tensor shape
  * @param[in] starts      The starts of the dimensions of the input tensor to be sliced
  * @param[in] ends        The ends of the dimensions of the input tensor to be sliced
  *
  * @return the calculated shape
  */
 inline TensorShape compute_slice_shape(const TensorShape &input_shape, const Coordinates &starts, const Coordinates &ends)
 {
     using namespace arm_compute::helpers::tensor_transform;

     const BiStrides default_strides = BiStrides();
     const auto      slice_end_mask  = construct_slice_end_mask(ends);

     return compute_strided_slice_output_shape(input_shape,
                                               starts, ends, default_strides,
                                               0, slice_end_mask, 0);
 }

 /** Calculate the batch to space output shape of a tensor
  *
  * Width and height grow by their block factor while the batch dimension is divided by
  * block_x * block_y.
  *
  * @param[in] input   Input tensor info
  * @param[in] block_x Block shape x value (must be positive, asserted)
  * @param[in] block_y Block shape y value (must be positive, asserted)
  *
  * @return the calculated shape
  */
 inline TensorShape compute_batch_to_space_shape(const ITensorInfo *input, const int block_x, const int block_y)
 {
     ARM_COMPUTE_ERROR_ON(block_x <= 0 || block_y <= 0);

     const TensorShape &in_shape = input->tensor_shape();
     const auto         layout   = input->data_layout();

     const int w_idx = get_data_layout_dimension_index(layout, DataLayoutDimension::WIDTH);
     const int h_idx = get_data_layout_dimension_index(layout, DataLayoutDimension::HEIGHT);
     const int n_idx = get_data_layout_dimension_index(layout, DataLayoutDimension::BATCHES);

     TensorShape result{ in_shape };
     result.set(w_idx, in_shape[w_idx] * block_x);
     result.set(h_idx, in_shape[h_idx] * block_y);
     // Batches are redistributed over the enlarged spatial plane
     result.set(n_idx, in_shape[n_idx] / (block_x * block_y));

     return result;
 }

 /** Calculate the depth to space output shape of a tensor
  *
  * Width and height are multiplied by @p block and the channel dimension is divided by block * block.
  *
  * @param[in] input_shape Input tensor shape
  * @param[in] data_layout Operation data layout
  * @param[in] block       Block shape value (must be at least 2, asserted)
  *
  * @return the calculated shape
  */
 inline TensorShape compute_depth_to_space_shape(const TensorShape &input_shape, DataLayout data_layout, int block)
 {
     ARM_COMPUTE_ERROR_ON(block < 2);

     const int w_idx = get_data_layout_dimension_index(data_layout, DataLayoutDimension::WIDTH);
     const int h_idx = get_data_layout_dimension_index(data_layout, DataLayoutDimension::HEIGHT);
     const int c_idx = get_data_layout_dimension_index(data_layout, DataLayoutDimension::CHANNEL);

     TensorShape result{ input_shape };

     // Spatial plane grows ...
     result.set(w_idx, input_shape[w_idx] * block);
     result.set(h_idx, input_shape[h_idx] * block);
     // ... at the expense of the channels
     result.set(c_idx, input_shape[c_idx] / (block * block));

     return result;
 }

 /** Calculate the split output shape of a tensor
  *
  * An "empty" shape (dimension 0 set to 0) is returned when the request cannot be satisfied:
  * the axis is out of range, @p num_splits is zero, or the size of the axis is not a multiple
  * of @p num_splits.
  *
  * @param[in] input      Input tensor info
  * @param[in] axis       Axis on which to split the input
  * @param[in] num_splits Number of splits
  *
  * @return the calculated shape, or the empty shape described above on invalid arguments
  */
 inline TensorShape compute_split_shape(const ITensorInfo *input, unsigned int axis, unsigned int num_splits)
 {
     TensorShape empty_shape;
     empty_shape.set(0, 0);

     TensorShape out_shape{ input->tensor_shape() };

     // Return empty shape if axis is invalid. The second test keeps the element access below inside
     // the fixed-size storage of the shape even when the tensor already uses every available dimension.
     if(axis > input->tensor_shape().num_dimensions() || axis >= TensorShape::num_max_dimensions)
     {
         return empty_shape;
     }

     // Return empty shape if there is nothing to split into (also avoids a modulo/division by zero below)
     if(num_splits == 0)
     {
         return empty_shape;
     }

     const size_t axis_size = out_shape[axis];

     // Return empty shape if num_split is not valid
     if(axis_size % num_splits)
     {
         return empty_shape;
     }

     out_shape[axis] = axis_size / num_splits;
     return out_shape;
 }

 /** Calculate the space to batch output shape of a tensor
  *
  * The padded width and height are divided by their block factor and the batch dimension is
  * multiplied by block_x * block_y. The padded extents must be multiples of the blocks (asserted).
  *
  * @param[in] input         Input tensor info
  * @param[in] block_x       Block shape x value
  * @param[in] block_y       Block shape y value
  * @param[in] padding_left  Left padding values
  * @param[in] padding_right Right padding values
  *
  * @return the calculated shape
  */
 inline TensorShape compute_space_to_batch_shape(const ITensorInfo *input, const int block_x, const int block_y, const Size2D &padding_left, const Size2D &padding_right)
 {
     const auto layout     = input->data_layout();
     const int  idx_width  = get_data_layout_dimension_index(layout, DataLayoutDimension::WIDTH);
     const int  idx_height = get_data_layout_dimension_index(layout, DataLayoutDimension::HEIGHT);
     const int  idx_batch  = get_data_layout_dimension_index(layout, DataLayoutDimension::BATCHES);

     ARM_COMPUTE_ERROR_ON((input->tensor_shape()[idx_width] + padding_left.x() + padding_right.x()) % block_x != 0);
     ARM_COMPUTE_ERROR_ON((input->tensor_shape()[idx_height] + padding_left.y() + padding_right.y()) % block_y != 0);

     const TensorShape &in_shape = input->tensor_shape();

     // Spatial extents including the padding on both sides
     const auto padded_w = in_shape[idx_width] + padding_left.x() + padding_right.x();
     const auto padded_h = in_shape[idx_height] + padding_left.y() + padding_right.y();

     TensorShape result{ in_shape };
     result.set(idx_width, padded_w / block_x);
     result.set(idx_height, padded_h / block_y);
     result.set(idx_batch, in_shape[idx_batch] * block_x * block_y);

     return result;
 }

 /** Calculate the space to depth output shape of a tensor
  *
  * Space-to-depth moves block_shape x block_shape spatial blocks into the channel dimension, so
  * width and height shrink by @p block_shape while the number of channels grows by
  * block_shape * block_shape. It is the inverse of the depth-to-space shape computation.
  *
  * @param[in] input       Input tensor info
  * @param[in] block_shape Block shape value
  *
  * @return the calculated shape
  */
 inline TensorShape compute_space_to_depth_shape(const ITensorInfo *input, int32_t block_shape)
 {
     TensorShape output_shape{ input->tensor_shape() };

     const DataLayout data_layout = input->data_layout();
     const int        idx_width   = get_data_layout_dimension_index(data_layout, DataLayoutDimension::WIDTH);
     const int        idx_height  = get_data_layout_dimension_index(data_layout, DataLayoutDimension::HEIGHT);
     const int        idx_depth   = get_data_layout_dimension_index(data_layout, DataLayoutDimension::CHANNEL);

     // Spatial extents are divided by the block size ...
     output_shape.set(idx_width, input->tensor_shape()[idx_width] / block_shape);
     output_shape.set(idx_height, input->tensor_shape()[idx_height] / block_shape);
     // ... and every block is unrolled along the channels
     output_shape.set(idx_depth, input->tensor_shape()[idx_depth] * (block_shape * block_shape));

     return output_shape;
 }

 /** Calculate the prior box output shape of a tensor
  *
  * The result has two dimensions: dimension 0 is width * height * num_priors * 4 and dimension 1 is 2,
  * where num_priors = aspect_ratios * min_sizes + max_sizes (element counts taken from @p info).
  *
  * @param[in] input Input tensor info
  * @param[in] info  PriorBoxLayer info
  *
  * @return the calculated shape
  */
 inline TensorShape compute_prior_box_shape(const ITensorInfo &input, const PriorBoxLayerInfo &info)
 {
     const auto   layout = input.data_layout();
     const size_t w_idx  = get_data_layout_dimension_index(layout, DataLayoutDimension::WIDTH);
     const size_t h_idx  = get_data_layout_dimension_index(layout, DataLayoutDimension::HEIGHT);

     // Number of priors generated per spatial location (held as int)
     const int priors_per_cell = info.aspect_ratios().size() * info.min_sizes().size() + info.max_sizes().size();

     // Number of spatial locations in the input plane
     const size_t cells = input.dimension(w_idx) * input.dimension(h_idx);

     TensorShape result{};
     result.set(0, cells * priors_per_cell * 4);
     result.set(1, 2);

     return result;
 }

 /** Calculate the padded shape of a tensor
  *
  * For every entry of @p padding the matching dimension becomes before + size + after. A dimension
  * beyond the current rank of the shape being built is treated as having size 1.
  *
  * @param[in] input_shape Input tensor shape
  * @param[in] padding     Paddings list (one before/after pair per dimension, starting at dimension 0)
  *
  * @return the calculated shape
  */
 inline TensorShape compute_padded_shape(const TensorShape &input_shape, const PaddingList &padding)
 {
     TensorShape padded_shape = input_shape;

     const size_t num_entries = padding.size();
     for(size_t dim = 0; dim < num_entries; ++dim)
     {
         // Size of this dimension before padding; 1 when the shape does not reach this dimension yet
         uint32_t extent = 1;
         if(padded_shape.num_dimensions() > dim)
         {
             extent = input_shape[dim];
         }

         const auto &before_after = padding[dim];
         padded_shape.set(dim, before_after.first + extent + before_after.second);
     }

     return padded_shape;
 }

 /** Calculate the tiled shape of a tensor
  *
  * Dimension i of the result is the input dimension i multiplied by multiples[i]; dimensions
  * without an entry in @p multiples are copied unchanged.
  *
  * @param[in] input_shape Input tensor shape
  * @param[in] multiples   Number of repetitions for each dimension, starting at dimension 0
  *
  * @return the calculated shape
  */
 inline TensorShape compute_tiled_shape(const TensorShape &input_shape, const Multiples &multiples)
 {
     TensorShape result = input_shape;

     size_t dim = 0;
     while(dim < multiples.size())
     {
         const auto repeated = input_shape[dim] * multiples[dim];
         result.set(dim, repeated);
         ++dim;
     }

     return result;
 }

 /** Calculate the reduced shape of a tensor given an axis
  *
  * @param[in] input     Input tensor shape
  * @param[in] axis      Axis on which to perform reduction
  * @param[in] keep_dims (Optional) Whether to keep the dimension after reduction operation. Defaults to true.
  *                      When true the axis is kept with size 1, otherwise it is removed from the shape.
  *
  * @return the calculated shape
  */
 inline TensorShape compute_reduced_shape(const TensorShape &input, unsigned int axis, bool keep_dims = true)
 {
     TensorShape reduced{ input };

     if(keep_dims)
     {
         // The reduced axis stays in place with a single element
         reduced.set(axis, 1);
     }
     else
     {
         // The reduced axis disappears from the shape
         reduced.remove_dimension(axis);
     }

     return reduced;
 }

 /** Calculate the upsampled shape of a tensor
  *
  * Width is multiplied by info.x() and height by info.y(); other dimensions are unchanged.
  *
  * @param[in] input Input tensor info
  * @param[in] info  Contains stride information (x and y)
  *
  * @return the calculated shape
  */
 inline TensorShape compute_upsample_shape(const ITensorInfo &input, const Size2D &info)
 {
     const auto layout = input.data_layout();
     const int  w_idx  = get_data_layout_dimension_index(layout, DataLayoutDimension::WIDTH);
     const int  h_idx  = get_data_layout_dimension_index(layout, DataLayoutDimension::HEIGHT);

     // Scaled spatial extents (held as unsigned int)
     const unsigned int scaled_w = input.dimension(w_idx) * info.x();
     const unsigned int scaled_h = input.dimension(h_idx) * info.y();

     TensorShape upsampled(input.tensor_shape());
     upsampled.set(w_idx, scaled_w);
     upsampled.set(h_idx, scaled_h);

     return upsampled;
 }

 /** Get the tensor shape of a tensor-like object
  *
  * Generic overload: the shape is read through data->info()->tensor_shape().
  *
  * @param[in] data Input data; must expose an info() accessor whose result provides tensor_shape()
  *
  * @return the extracted tensor shape
  */
 template <typename T>
 inline TensorShape extract_shape(T *data)
 {
     auto &&metadata = data->info();
     return metadata->tensor_shape();
 }

 /** Get the tensor shape stored in a tensor info
  *
  * @param[in] data Tensor info to read the shape from
  *
  * @return the extracted tensor shape
  */
 inline TensorShape extract_shape(ITensorInfo *data)
 {
     const TensorShape &shape = data->tensor_shape();
     return shape;
 }

 /** Get the tensor shape stored in a constant tensor info
  *
  * @param[in] data Tensor info to read the shape from
  *
  * @return the extracted tensor shape
  */
 inline TensorShape extract_shape(const ITensorInfo *data)
 {
     const TensorShape &shape = data->tensor_shape();
     return shape;
 }

 /** Get a copy of the pointed-to constant tensor shape
  *
  * @param[in] data Tensor shape to copy
  *
  * @return a copy of the tensor shape
  */
 inline TensorShape extract_shape(const TensorShape *data)
 {
     const TensorShape &shape = *data;
     return shape;
 }

 /** Get a copy of the pointed-to tensor shape
  *
  * @param[in] data Tensor shape to copy
  *
  * @return a copy of the tensor shape
  */
 inline TensorShape extract_shape(TensorShape *data)
 {
     const TensorShape &shape = *data;
     return shape;
 }

 /** Calculate the unstack shape of a tensor
  *
  * The result is the input shape with dimension @p axis removed.
  *
  * @param[in] input_shape Input tensor shape
  * @param[in] axis        Axis on which to perform the unstack operation (asserted not to exceed the number of dimensions)
  *
  * @return the calculated shape
  */
 inline TensorShape calculate_unstack_shape(TensorShape input_shape, unsigned int axis)
 {
     ARM_COMPUTE_ERROR_ON(axis > input_shape.num_dimensions());

     TensorShape unstacked = input_shape;
     unstacked.remove_dimension(axis);
     return unstacked;
 }

 /** Calculate the concatenate output shape of the concatenate operation along a single axis
  *
  * The result equals the shape of the first input, except along @p axis where it is the sum of
  * the sizes of all inputs. When assertions are enabled the inputs are additionally checked to be
  * non-empty, non-null and to agree on every dimension other than @p axis.
  *
  * @param[in] input Vector containing the shapes of the inputs (must not be empty)
  * @param[in] axis  Axis along which to concatenate the input tensors
  *
  * @return the calculated shape
  */
 template <typename T>
 inline TensorShape calculate_concatenate_shape(const std::vector<T *> &input, size_t axis)
 {
     // Validate before the first element is dereferenced
     ARM_COMPUTE_ERROR_ON(input.empty());
     ARM_COMPUTE_ERROR_ON(input[0] == nullptr);

     TensorShape out_shape = extract_shape(input[0]);

 #if defined(ARM_COMPUTE_ASSERTS_ENABLED)
     // All dimensions must match except the axis one
     for(const auto &tensor : input)
     {
         ARM_COMPUTE_ERROR_ON(tensor == nullptr);

         // Extract the shape once per tensor rather than once per tensor and dimension
         const TensorShape shape = extract_shape(tensor);
         for(unsigned int i = 0; i < MAX_DIMS; ++i)
         {
             if(i == axis)
             {
                 continue;
             }

             ARM_COMPUTE_ERROR_ON(out_shape[i] != shape[i]);
         }
     }
 #endif // defined(ARM_COMPUTE_ASSERTS_ENABLED)

     // Calculate output shape: accumulate the size of every input along the concatenation axis
     size_t new_size = 0;
     for(const auto &tensor : input)
     {
         const TensorShape shape = extract_shape(tensor);
         new_size += shape[axis];
     }

     out_shape.set(axis, new_size);

     return out_shape;
 }
 /** Calculate the stack output shape of a tensor
  *
  * A new dimension of size @p num_tensors is inserted at @p axis; input dimensions located at or
  * after @p axis move up by one position.
  *
  * @param[in] a           Input tensor info (at most 4 dimensions, asserted)
  * @param[in] axis        Axis on which to perform the stack operation (asserted not to exceed the number of dimensions)
  * @param[in] num_tensors Number of tensors to stack
  *
  * @return the calculated shape
  */
 inline TensorShape compute_stack_shape(const ITensorInfo &a, unsigned int axis, unsigned int num_tensors)
 {
     ARM_COMPUTE_ERROR_ON(axis > a.num_dimensions());
     ARM_COMPUTE_ERROR_ON(a.num_dimensions() > 4);

     TensorShape stacked{ a.tensor_shape() };
     stacked.set(axis, num_tensors);

     for(unsigned int src = 0; src < a.num_dimensions(); ++src)
     {
         // Dimensions in front of the stacking axis keep their slot, the others are pushed up by one
         const unsigned int dst = (src < axis) ? src : src + 1;
         stacked.set(dst, a.tensor_shape()[src]);
     }

     return stacked;
 }

 /** Calculate the gather output shape of a tensor
  *
  * The result is the input shape with the size of @p actual_axis replaced by the first
  * dimension of @p indices_shape.
  *
  * @param[in] input_shape   Input tensor shape (at most 4 dimensions, asserted)
  * @param[in] indices_shape Indices tensor shape (at most 1 dimension, asserted)
  * @param[in] actual_axis   Axis to gather along (must be an existing dimension of the input, asserted)
  *
  * @return the calculated shape
  */
 inline TensorShape compute_gather_shape(const TensorShape &input_shape, const TensorShape &indices_shape, uint32_t actual_axis)
 {
     ARM_COMPUTE_ERROR_ON(indices_shape.num_dimensions() > 1);
     ARM_COMPUTE_ERROR_ON(input_shape.num_dimensions() > 4);
     ARM_COMPUTE_ERROR_ON(actual_axis >= input_shape.num_dimensions());

     const auto num_indices = indices_shape[0];

     TensorShape gathered = input_shape;
     // Written through operator[] (not set()), exactly one element is replaced
     gathered[actual_axis] = num_indices;

     return gathered;
 }
 } // namespace shape_calculator
 } // namespace misc
 } // namespace arm_compute
 #endif /* ARM_COMPUTE_MISC_SHAPE_CALCULATOR_H */
M
unsigned int M
Definition: NEGEMMAssemblyDispatch.cpp:48

arm_compute::ITensorInfo::num_dimensions
virtual size_t num_dimensions() const =0
The number of dimensions of the tensor (rank)

arm_compute::test::validation::shape
shape
Definition: DFT.cpp:115

arm_compute::test::validation::idx_width
const int idx_width
Definition: Scale.cpp:265

arm_compute::TensorShape::shift_right
void shift_right(size_t step)
Shifts right the tensor shape increasing its dimensions.
Definition: TensorShape.h:144

arm_compute::misc::shape_calculator::compute_slice_shape
TensorShape compute_slice_shape(const TensorShape &input_shape, const Coordinates &starts, const Coordinates &ends)
Calculate the slice output shape of a tensor.
Definition: ShapeCalculator.h:1048

arm_compute::TensorShape
Shape of a tensor.
Definition: TensorShape.h:39

arm_compute::misc::shape_calculator::compute_permutation_output_shape
TensorShape compute_permutation_output_shape(const ITensorInfo &input, const PermutationVector &perm)
Calculate the permuted shape of an input given a permutation vector.
Definition: ShapeCalculator.h:108

arm_compute::misc::shape_calculator::compute_depth_to_space_shape
TensorShape compute_depth_to_space_shape(const TensorShape &input_shape, DataLayout data_layout, int block)
Calculate the depth to space output shape of a tensor.
Definition: ShapeCalculator.h:1090

arm_compute::TensorShape::remove_dimension
void remove_dimension(size_t n)
Accessor to remove the dimension n from the tensor shape.
Definition: TensorShape.h:111

arm_compute::misc::shape_calculator::compute_winograd_input_transform_shape
TensorShape compute_winograd_input_transform_shape(const ITensorInfo &input, const WinogradInfo &winograd_info)
Calculate the winograd input transform shape.
Definition: ShapeCalculator.h:667

arm_compute::WinogradInfo::output_data_layout
DataLayout output_data_layout
Data layout to use for the output tensor once the convolution has been applied (NCHW or NHWC) ...
Definition: Types.h:2201

arm_compute::misc::shape_calculator::calculate_unstack_shape
TensorShape calculate_unstack_shape(TensorShape input_shape, unsigned int axis)
Calculate the unstack shape of a tensor.
Definition: ShapeCalculator.h:1332

arm_compute::misc::shape_calculator::compute_transpose1xW_with_element_size_shape
TensorShape compute_transpose1xW_with_element_size_shape(const ITensorInfo &b, int mult_transpose1xW_width=1)
Calculate the transposed 1xW width element shape.
Definition: ShapeCalculator.h:337

arm_compute::GEMMKernelInfo
Descriptor used by the GEMM kernels.
Definition: KernelDescriptors.h:56

arm_compute::misc::shape_calculator::compute_stack_shape
TensorShape compute_stack_shape(const ITensorInfo &a, unsigned int axis, unsigned int num_tensors)
Calculate the stack output shape of a tensor.
Definition: ShapeCalculator.h:1389

arm_compute::misc::shape_calculator::compute_depthwise_convolution_shape
TensorShape compute_depthwise_convolution_shape(const ITensorInfo &input, const ITensorInfo &weights, PadStrideInfo conv_info, unsigned int depth_multiplier, const Size2D &dilation=Size2D(1U, 1U))
Calculate the depthwise convolution output shape of a tensor.
Definition: ShapeCalculator.h:446

arm_compute::ITensorInfo::dimension
virtual size_t dimension(size_t index) const =0
Return the size of the requested dimension.

arm_compute::PaddingList
std::vector< PaddingInfo > PaddingList
List of padding information.
Definition: Types.h:481

arm_compute::misc::shape_calculator::compute_roi_align_shape
TensorShape compute_roi_align_shape(const ITensorInfo &input, const ITensorInfo &rois, ROIPoolingLayerInfo pool_info)
Calculate the output roi align shape of a tensor.
Definition: ShapeCalculator.h:851

arm_compute::test::validation::b
SimpleTensor< float > b
Definition: DFT.cpp:157

arm_compute::misc::shape_calculator::compute_deep_convolution_shape
TensorShape compute_deep_convolution_shape(const ITensorInfo &input, const ITensorInfo &weights, PadStrideInfo conv_info)
Calculate the deep convolution shape output shape of a tensor.
Definition: ShapeCalculator.h:738

arm_compute::GEMMLHSMatrixInfo::v0
unsigned int v0
Number of vertical blocks of size (m0xk0) stored on the same output row.
Definition: Types.h:1977

arm_compute::GEMMKernelInfo::depth_output_gemm3d
unsigned int depth_output_gemm3d
Depth of the output tensor in case is reinterpreted as 3D.
Definition: KernelDescriptors.h:84

arm_compute::WinogradInfo
Winograd information.
Definition: Types.h:2182

arm_compute::GEMMReshapeInfo
GEMM reshape information class.
Definition: Types.h:1831

arm_compute::WinogradInfo::convolution_info
PadStrideInfo convolution_info
Convolution info (Pads, strides,...)
Definition: Types.h:2200

arm_compute::test::validation::conv_info
conv_info
Definition: Winograd.cpp:599

arm_compute::PriorBoxLayerInfo::aspect_ratios
std::vector< float > aspect_ratios() const
Get aspect ratios.
Definition: Types.h:944

arm_compute::misc::shape_calculator::compute_mm_shape
TensorShape compute_mm_shape(const ITensorInfo &input0, const ITensorInfo &input1, bool is_interleaved_transposed, const GEMMReshapeInfo &reshape_info)
Calculate the matrix multiplication output shape of two tensors.
Definition: ShapeCalculator.h:889

arm_compute::misc::shape_calculator::compute_reductionA_shape
TensorShape compute_reductionA_shape(const ITensorInfo &b)
Calculate the reductionA shape used in GEMMLowp.
Definition: ShapeCalculator.h:357

arm_compute::misc::shape_calculator::compute_softmax_shape
TensorShape compute_softmax_shape(const ITensorInfo *input, size_t axis=1)
Calculate the softmax output shape of a tensor.
Definition: ShapeCalculator.h:605

arm_compute::DataLayoutDimension::HEIGHT
height

arm_compute::BiStrides
Coordinates BiStrides
Bidirectional strides.
Definition: Types.h:51

input_height
const size_t input_height
Definition: NEDepthwiseConvolutionLayerNativeKernel.cpp:68

arm_compute::misc::shape_calculator::compute_space_to_batch_shape
TensorShape compute_space_to_batch_shape(const ITensorInfo *input, const int block_x, const int block_y, const Size2D &padding_left, const Size2D &padding_right)
Calculate the space to batch output shape of a tensor.
Definition: ShapeCalculator.h:1149

arm_compute::GEMMRHSMatrixInfo::h0
unsigned int h0
Number of horizontal blocks of size (k0xn0) stored on the same output row.
Definition: Types.h:1992

arm_compute::test::validation::winograd_info
winograd_info
Definition: Winograd.cpp:330

ARM_COMPUTE_ERROR_ON
#define ARM_COMPUTE_ERROR_ON(cond)
If the condition is true then an error message is printed and an exception thrown.
Definition: Error.h:466

arm_compute::misc::shape_calculator::compute_rnn_shape
TensorShape compute_rnn_shape(const ITensorInfo *input, const unsigned int batch_size)
Calculate the RNN shape of a tensor.
Definition: ShapeCalculator.h:872

arm_compute::test::validation::data_layout
const DataLayout data_layout
Definition: Im2Col.cpp:151

arm_compute::GEMMLHSMatrixInfo
GEMM LHS (Left Hand Side) matrix information.
Definition: Types.h:1968

arm_compute::ITensorInfo
Store the tensor's metadata.
Definition: ITensorInfo.h:40

arm_compute::helpers::tensor_transform
Definition: tensor_transform.h:33

arm_compute::compute_winograd_convolution_tiles
Size2D compute_winograd_convolution_tiles(const Size2D &in_dims, const Size2D &kernel_size, const Size2D &output_tile_size, const PadStrideInfo &conv_info)
Calculate the number of output tiles required by Winograd Convolution layer.
Definition: Helpers.h:211

arm_compute::misc::shape_calculator::compute_reorg_output_shape
TensorShape compute_reorg_output_shape(const ITensorInfo &input, int32_t stride)
Calculate the output shape of the reorg layer given a stride.
Definition: ShapeCalculator.h:122

arm_compute::Size2D::x
size_t x() const
Semantic accessor for width as x.
Definition: Size2D.h:74

arm_compute::ROIPoolingLayerInfo::pooled_width
unsigned int pooled_width() const
Get the pooled width of the layer.
Definition: Types.h:1324

arm_compute::PadStrideInfo::pad_top
unsigned int pad_top() const
Get the top padding.
Definition: Types.h:806

arm_compute::DepthwiseConvolutionReshapeInfo
Definition: Types.h:1936

arm_compute::misc::shape_calculator::compute_reshaped_depthwise_weights_shape
TensorShape compute_reshaped_depthwise_weights_shape(const ITensorInfo &input, const DepthwiseConvolutionReshapeInfo &info)
Calculate the reshaped shape of the weights to use in depthwise convolution.
Definition: ShapeCalculator.h:297

arm_compute::misc::shape_calculator::compute_interleaved_shape
TensorShape compute_interleaved_shape(const ITensorInfo &a, int mult_interleave4x4_height=1, bool reinterpret_input_as_3d=false)
Calculate the interleaved shape of an input tensor.
Definition: ShapeCalculator.h:260

arm_compute::misc::shape_calculator::compute_output_stage_shape
TensorShape compute_output_stage_shape(const ITensorInfo &input, unsigned int gemm_3d_depth=1, bool batch_size_on_z=false)
Calculate the output stage shape of a tensor.
Definition: ShapeCalculator.h:1001

weights_height
const size_t weights_height
Definition: NEDepthwiseConvolutionLayerNativeKernel.cpp:61

arm_compute
Copyright (c) 2017-2021 Arm Limited.
Definition: 00_introduction.dox:24

arm_compute::Size2D::height
size_t height
Height of the image region or rectangle.
Definition: Size2D.h:90

arm_compute::misc::shape_calculator::compute_min_max_shape
TensorShape compute_min_max_shape(const ITensorInfo *input)
Calculate the min/max output shape of a tensor.
Definition: ShapeCalculator.h:770

arm_compute::helpers::tensor_transform::construct_slice_end_mask
int32_t construct_slice_end_mask(Coordinates ends)
Constructs end mask in case we want to perform a slice operation using the strided slice interface...
Definition: tensor_transform.cpp:172

arm_compute::misc::shape_calculator::compute_strided_slice_shape
TensorShape compute_strided_slice_shape(const ITensorInfo &input, const Coordinates &starts, const Coordinates &ends, const Coordinates &strides, int32_t begin_mask, int32_t end_mask, int32_t shrink_axis_mask)
Calculate the strided slice output shape of a tensor.
Definition: ShapeCalculator.h:1032

arm_compute::DIV_CEIL
constexpr auto DIV_CEIL(S val, T m) -> decltype((val+m - 1)/m)
Calculate the rounded up quotient of val / m.
Definition: Utils.h:58

arm_compute::scaled_dimensions
std::pair< unsigned int, unsigned int > scaled_dimensions(int width, int height, int kernel_width, int kernel_height, const PadStrideInfo &pad_stride_info, const Size2D &dilation=Size2D(1U, 1U))
Returns expected width and height of output scaled tensor depending on dimensions rounding mode...
Definition: Utils.cpp:419

arm_compute::MAX_DIMS
constexpr size_t MAX_DIMS
Constant value used to indicate maximum dimensions of a Window, TensorShape and Coordinates.
Definition: Dimensions.h:38

arm_compute::misc::shape_calculator::compute_transposed_shape
TensorShape compute_transposed_shape(const ITensorInfo &input)
Calculate the transposed shape of a tensor.
Definition: ShapeCalculator.h:426

arm_compute::test::validation::input
auto input
Definition: LSTMLayerQuantized.cpp:486

arm_compute::permute
void permute(Dimensions< T > &dimensions, const PermutationVector &perm)
Permutes given Dimensions according to a permutation vector.
Definition: Helpers.h:125

arm_compute::misc::shape_calculator::compute_deconvolution_output_shape
TensorShape compute_deconvolution_output_shape(const std::pair< unsigned int, unsigned int > &out_dims, const ITensorInfo &input, const ITensorInfo &weights)
Calculate the output shape of the deconvolution layer.
Definition: ShapeCalculator.h:519

arm_compute::misc::shape_calculator::compute_pool_shape
TensorShape compute_pool_shape(const ITensorInfo &input, PoolingLayerInfo pool_info)
Calculate the output pool shape of a tensor.
Definition: ShapeCalculator.h:787

arm_compute::Dimensions::x
T x() const
Alias to access the size of the first dimension.
Definition: Dimensions.h:87

arm_compute::GEMMReshapeInfo::n
int n() const
Number of matrix B columns.
Definition: Types.h:1869

Utils.h

arm_compute::misc::shape_calculator::compute_flatten_shape
TensorShape compute_flatten_shape(const ITensorInfo *input)
Calculate the flattened output shape of a tensor.
Definition: ShapeCalculator.h:587

arm_compute::GEMMRHSMatrixInfo::k0
unsigned int k0
Number of partial accumulations performed by the matrix multiplication.
Definition: Types.h:1991

arm_compute::misc::shape_calculator::compute_prior_box_shape
TensorShape compute_prior_box_shape(const ITensorInfo &input, const PriorBoxLayerInfo &info)
Calculate the prior box output shape of a tensor.
Definition: ShapeCalculator.h:1198

arm_compute::misc::shape_calculator::compute_vector_to_tensor_output_shape
TensorShape compute_vector_to_tensor_output_shape(const TensorShape &input, size_t conv_w, size_t conv_h, const DataLayout &data_layout)
Calculate the output tensor shape of a vector input given the convolution dimensions.
Definition: ShapeCalculator.h:87

arm_compute::GEMMKernelInfo::m
unsigned int m
Number of LHS rows.
Definition: KernelDescriptors.h:81

arm_compute::GEMMKernelInfo::n
unsigned int n
Number of RHS columns.
Definition: KernelDescriptors.h:82

arm_compute::test::validation::input_shape
TensorShape input_shape
Validate test suite is to test ARM_COMPUTE_RETURN_ON_* macros we use to check the validity of given a...
Definition: LSTMLayerQuantized.cpp:466

arm_compute::Window::DimX
static constexpr size_t DimX
Alias for dimension 0 also known as X dimension.
Definition: Window.h:43

ARM_COMPUTE_UNUSED
#define ARM_COMPUTE_UNUSED(...)
To avoid unused variables warnings.
Definition: Error.h:152

arm_compute::Dimensions::collapse_from
void collapse_from(size_t start)
Collapse dimensions starting from a given point.
Definition: Dimensions.h:183

arm_compute::test::validation::output_shape
TensorShape output_shape
Definition: LSTMLayerQuantized.cpp:469

arm_compute::misc::shape_calculator::compute_lhs_reshaped_shape
TensorShape compute_lhs_reshaped_shape(const ITensorInfo &a, const GEMMLHSMatrixInfo &lhs_info, bool reinterpret_input_as_3d=false)
Calculate the Left Hand Side matrix reshaped shape.
Definition: ShapeCalculator.h:180

arm_compute::misc::shape_calculator::calculate_reduce_mean_shape
TensorShape calculate_reduce_mean_shape(ITensorInfo *input, const Coordinates &reduction_axis, bool keep_dims)
Calculate the output tensor shape for the reduce mean operation.
Definition: ShapeCalculator.h:50

arm_compute::GEMMRHSMatrixInfo
GEMM RHS (Right Hand Side) matrix information.
Definition: Types.h:1983

arm_compute::ITensorInfo::tensor_shape
virtual const TensorShape & tensor_shape() const =0
Size for each dimension of the tensor.

arm_compute::misc::shape_calculator::compute_unpool_shape
TensorShape compute_unpool_shape(const ITensorInfo &input, PoolingLayerInfo pool_info)
Calculate the output unpool shape of a tensor.
Definition: ShapeCalculator.h:819

arm_compute::WinogradInfo::output_tile_size
Size2D output_tile_size
Width and height of the output tile.
Definition: Types.h:2197

arm_compute::test::validation::idx_height
const int idx_height
Definition: Scale.cpp:266

arm_compute::GEMMRHSMatrixInfo::n0
unsigned int n0
Number of columns processed by the matrix multiplication.
Definition: Types.h:1990

ARM_COMPUTE_ERROR_ON_MSG
#define ARM_COMPUTE_ERROR_ON_MSG(cond, msg)
Definition: Error.h:456

arm_compute::test::validation::num_groups
const unsigned int num_groups
Definition: Im2Col.cpp:153

arm_compute::misc::shape_calculator::compute_tiled_shape
TensorShape compute_tiled_shape(const TensorShape &input_shape, const Multiples &multiples)
Calculate the tiled shape of a tensor.
Definition: ShapeCalculator.h:1238

arm_compute::Coordinates
Coordinates of an item.
Definition: Coordinates.h:37

arm_compute::PadStrideInfo::stride
std::pair< unsigned int, unsigned int > stride() const
Get the stride.
Definition: Types.h:770

arm_compute::misc::shape_calculator::compute_reduced_shape
TensorShape compute_reduced_shape(const TensorShape &input, unsigned int axis, bool keep_dims=true)
Calculate the reduced shape of a tensor given an axis.
Definition: ShapeCalculator.h:1256

arm_compute::PoolingLayerInfo
Pooling Layer Information struct.
Definition: Types.h:1214

arm_compute::misc::shape_calculator::compute_rhs_reshaped_shape
TensorShape compute_rhs_reshaped_shape(const ITensorInfo &a, const GEMMRHSMatrixInfo &rhs_info)
Calculate the Right Hand Side matrix reshaped shape.
Definition: ShapeCalculator.h:224

arm_compute::GEMMKernelInfo::reinterpret_input_as_3d
bool reinterpret_input_as_3d
Flag used to reinterpret the input as 3D.
Definition: KernelDescriptors.h:85

arm_compute::PriorBoxLayerInfo
PriorBox layer info.
Definition: Types.h:839

arm_compute::misc::shape_calculator::compute_deconvolution_upsampled_shape
TensorShape compute_deconvolution_upsampled_shape(const ITensorInfo &input, const ITensorInfo &weights, unsigned int sx, unsigned int sy, std::pair< unsigned int, unsigned int > &out_dims, uint32_t &padx, uint32_t &pady)
Calculate the upsampled output shape used for deconvolution.
Definition: ShapeCalculator.h:487

ITensorInfo.h

arm_compute::PadStrideInfo::pad_right
unsigned int pad_right() const
Get the right padding.
Definition: Types.h:801

arm_compute::PadStrideInfo
Padding and stride information class.
Definition: Types.h:722

arm_compute::ITensorInfo::element_size
virtual size_t element_size() const =0
Element size in bytes calculated as data_size() * num_channels()

arm_compute::Dimensions::begin
std::array< T, num_max_dimensions >::iterator begin()
Returns a read/write iterator that points to the first element in the dimension array.
Definition: Dimensions.h:215

arm_compute::test::validation::has_bias
const bool has_bias
Definition: Im2Col.cpp:152

arm_compute::misc::shape_calculator::compute_winograd_filter_transform_shape
TensorShape compute_winograd_filter_transform_shape(const ITensorInfo &input, const WinogradInfo &winograd_info)
Calculate the winograd filter transform shape.
Definition: ShapeCalculator.h:644

arm_compute::DataLayoutDimension::CHANNEL
channel

arm_compute::DepthwiseConvolutionReshapeInfo::c0
unsigned int c0
Number of channels processed by the depth-wise convolution.
Definition: Types.h:1938

arm_compute::misc::shape_calculator::compute_padded_shape
TensorShape compute_padded_shape(const TensorShape &input_shape, const PaddingList &padding)
Calculate the padded shape of a tensor.
Definition: ShapeCalculator.h:1219

arm_compute::DataLayoutDimension::BATCHES
batches

arm_compute::DataLayout::NCHW
Num samples, channels, height, width.

arm_compute::Size2D::y
size_t y() const
Semantic accessor for height as y.
Definition: Size2D.h:83

arm_compute::Strides
Strides of an item in bytes.
Definition: Strides.h:37

arm_compute::misc::shape_calculator::compute_reductionB_shape
TensorShape compute_reductionB_shape(const ITensorInfo &a)
Calculate the reductionB shape used in GEMMLowp.
Definition: ShapeCalculator.h:374

arm_compute::Window::DimY
static constexpr size_t DimY
Alias for dimension 1 also known as Y dimension.
Definition: Window.h:45

arm_compute::misc::shape_calculator::extract_shape
TensorShape extract_shape(T *data)
Get the tensor shape.
Definition: ShapeCalculator.h:1301

arm_compute::test::validation::info
ScaleKernelInfo info(interpolation_policy, default_border_mode, PixelValue(), sampling_policy, false)

arm_compute::PoolingLayerInfo::pad_stride_info
PadStrideInfo pad_stride_info
Definition: Types.h:1302

arm_compute::misc::shape_calculator::compute_upsample_shape
TensorShape compute_upsample_shape(const ITensorInfo &input, const Size2D &info)
Calculate the upsampled shape of a tensor.
Definition: ShapeCalculator.h:1279

arm_compute::misc::shape_calculator::compute_winograd_output_transform_shape
TensorShape compute_winograd_output_transform_shape(const ITensorInfo &input, const WinogradInfo &winograd_info)
Calculate the winograd output transform shape.
Definition: ShapeCalculator.h:703

arm_compute::Size2D::width
size_t width
Width of the image region or rectangle.
Definition: Size2D.h:89

arm_compute::Window::DimZ
static constexpr size_t DimZ
Alias for dimension 2 also known as Z dimension.
Definition: Window.h:47

arm_compute::ROIPoolingLayerInfo::pooled_height
unsigned int pooled_height() const
Get the pooled height of the layer.
Definition: Types.h:1329

arm_compute::misc::shape_calculator::compute_weights_reshaped_shape
TensorShape compute_weights_reshaped_shape(const ITensorInfo &weights, bool has_bias=false, unsigned int num_groups=1)
Calculate the reshaped shape of the weights.
Definition: ShapeCalculator.h:149

arm_compute::GEMMReshapeInfo::m
int m() const
Number of matrix A rows.
Definition: Types.h:1861

arm_compute::ROIPoolingLayerInfo
ROI Pooling Layer Information class.
Definition: Types.h:1309

arm_compute::Size2D
Class for specifying the size of an image or rectangle.
Definition: Size2D.h:34

arm_compute::Dimensions::num_dimensions
unsigned int num_dimensions() const
Returns the effective dimensionality of the tensor.
Definition: Dimensions.h:143

arm_compute::PriorBoxLayerInfo::max_sizes
std::vector< float > max_sizes() const
Get max sizes.
Definition: Types.h:939

arm_compute::DataLayout::NHWC
Num samples, height, width, channels.

arm_compute::misc::shape_calculator::compute_batch_to_space_shape
TensorShape compute_batch_to_space_shape(const ITensorInfo *input, const int block_x, const int block_y)
Calculate the batch to space output shape of a tensor.
Definition: ShapeCalculator.h:1065

arm_compute::misc::shape_calculator::compute_transpose1xW_shape
TensorShape compute_transpose1xW_shape(const ITensorInfo &b)
Calculate the transposed 1xW shape.
Definition: ShapeCalculator.h:320

arm_compute::GEMMReshapeInfo::depth_output_gemm3d
int depth_output_gemm3d() const
Depth (third dimension) of the output tensor to be used with the GEMM3D kernel.
Definition: Types.h:1904

arm_compute::WinogradInfo::kernel_size
Size2D kernel_size
Width and height of the kernel.
Definition: Types.h:2198

arm_compute::DataLayoutDimension::WIDTH
width

Helpers.h

arm_compute::GEMMLHSMatrixInfo::k0
unsigned int k0
Number of partial accumulations performed by the matrix multiplication.
Definition: Types.h:1976

tensor_transform.h

arm_compute::GEMMLHSMatrixInfo::m0
unsigned int m0
Number of rows processed by the matrix multiplication.
Definition: Types.h:1975

arm_compute::PoolingLayerInfo::pool_size
Size2D pool_size
Definition: Types.h:1300

arm_compute::Dimensions::y
T y() const
Alias to access the size of the second dimension.
Definition: Dimensions.h:92

arm_compute::convert_negative_axis
Coordinates & convert_negative_axis(Coordinates &coords, int max_value)
Convert negative coordinates to positive in the range [0, num_dims_input].
Definition: Helpers.h:241

arm_compute::PoolingLayerInfo::is_global_pooling
bool is_global_pooling
Definition: Types.h:1304

arm_compute::misc::shape_calculator::compute_col2im_shape
TensorShape compute_col2im_shape(const ITensorInfo &input, const Size2D &convolved_dims, bool batch_size_on_z, unsigned int num_groups=1)
Calculate the Col2Im shape.
Definition: ShapeCalculator.h:395

arm_compute::get_data_layout_dimension_index
size_t get_data_layout_dimension_index(const DataLayout data_layout, const DataLayoutDimension data_layout_dimension)
Get the index of the given dimension.
Definition: Helpers.inl:193

arm_compute::PadStrideInfo::pad_bottom
unsigned int pad_bottom() const
Get the bottom padding.
Definition: Types.h:811

arm_compute::WinogradInfo::input_dimensions
Size2D input_dimensions
Width and height of the input tensor before the convolution is applied.
Definition: Types.h:2199

arm_compute::misc::shape_calculator::calculate_concatenate_shape
TensorShape calculate_concatenate_shape(const std::vector< T *> &input, size_t axis)
Calculate the output shape of the concatenate operation along a single axis...
Definition: ShapeCalculator.h:1347

arm_compute::GEMMReshapeInfo::reinterpret_input_as_3d
bool reinterpret_input_as_3d() const
Flag which specifies if the input tensor has to be reinterpreted as 3D.
Definition: Types.h:1912

arm_compute::misc::shape_calculator::compute_split_shape
TensorShape compute_split_shape(const ITensorInfo *input, unsigned int axis, unsigned int num_splits)
Calculate the split output shape of a tensor.
Definition: ShapeCalculator.h:1114

weights_width
const size_t weights_width
Definition: NEDepthwiseConvolutionLayerNativeKernel.cpp:60

arm_compute::PadStrideInfo::pad_left
unsigned int pad_left() const
Get the left padding.
Definition: Types.h:796

KernelDescriptors.h

arm_compute::DataLayout
DataLayout
[DataLayout enum definition]
Definition: Types.h:120

arm_compute::Multiples
std::vector< uint32_t > Multiples
Information to produce a tiled version of a Tensor.
Definition: Types.h:484

input_width
const size_t input_width
Definition: NEDepthwiseConvolutionLayerNativeKernel.cpp:69

arm_compute::misc::shape_calculator::compute_im2col_conv_shape
TensorShape compute_im2col_conv_shape(const ITensorInfo *input, const Size2D &kernel_dims, const PadStrideInfo &conv_info, bool has_bias, const Size2D &dilation, bool batch_size_on_z, unsigned int num_groups=1)
Calculate the im2col output shape of a tensor.
Definition: ShapeCalculator.h:549

arm_compute::TensorShape::collapse
void collapse(size_t n, size_t first=0)
Collapse the first n dimensions.
Definition: TensorShape.h:133

arm_compute::TensorShape::set
TensorShape & set(size_t dimension, size_t value, bool apply_dim_correction=true, bool increase_dim_unit=true)
Accessor to set the value of one of the dimensions.
Definition: TensorShape.h:79

arm_compute::Size2D::area
size_t area() const
The area of the image or rectangle calculated as (width * height)
Definition: Size2D.h:53

arm_compute::ITensorInfo::data_layout
virtual DataLayout data_layout() const =0
Get the data layout of the tensor.

arm_compute::misc::shape_calculator::compute_space_to_depth_shape
TensorShape compute_space_to_depth_shape(const ITensorInfo *input, int32_t block_shape)
Calculate the space to depth output shape of a tensor.
Definition: ShapeCalculator.h:1175

arm_compute::PriorBoxLayerInfo::min_sizes
std::vector< float > min_sizes() const
Get min sizes.
Definition: Types.h:904

arm_compute::helpers::tensor_transform::compute_strided_slice_output_shape
TensorShape compute_strided_slice_output_shape(TensorShape input_shape, Coordinates starts, Coordinates ends, Coordinates strides, int32_t begin_mask=0, int32_t end_mask=0, int32_t shrink_axis_mask=0, bool return_unshrinked=false)
Computes output shape of strided slice.
Definition: tensor_transform.cpp:139

arm_compute::misc::shape_calculator::compute_gather_shape
TensorShape compute_gather_shape(const TensorShape &input_shape, const TensorShape &indices_shape, uint32_t actual_axis)
Definition: ShapeCalculator.h:1411