Basic function to execute one dimensional FFT. More...

#include <NEFFT1D.h>

Collaboration diagram for NEFFT1D:

Public Member Functions
	NEFFT1D (std::shared_ptr< IMemoryManager > memory_manager=nullptr)
	Default Constructor. More...

	NEFFT1D (const NEFFT1D &)=delete
	Prevent instances of this class from being copied (As this class contains pointers) More...

NEFFT1D &	operator= (const NEFFT1D &)=delete
	Prevent instances of this class from being copied (As this class contains pointers) More...

	NEFFT1D (NEFFT1D &&)=delete
	Prevent instances of this class from being moved (As this class contains non movable objects) More...

NEFFT1D &	operator= (NEFFT1D &&)=delete
	Prevent instances of this class from being moved (As this class contains non movable objects) More...

	~NEFFT1D ()
	Default destructor. More...

void	configure (const ITensor *input, ITensor *output, const FFT1DInfo &config)
	Initialise the function's source and destinations. More...

void	run () override
	Run the kernels contained in the function. More...

Public Member Functions inherited from IFunction
virtual	~IFunction ()=default
	Destructor. More...

virtual void	prepare ()
	Prepare the function for executing. More...

Static Public Member Functions
static Status	validate (const ITensorInfo *input, const ITensorInfo *output, const FFT1DInfo &config)
	Static function to check if given info will lead to a valid configuration of NEFFT1D. More...

Detailed Description

Basic function to execute one dimensional FFT.

This function calls the following kernels:

NEFFTDigitReverseKernel Performs digit reverse
NEFFTRadixStageKernel A list of FFT kernels depending on the radix decomposition
NEFFTScaleKernel Performs output scaling in case of an inverse FFT

Definition at line 48 of file NEFFT1D.h.

Constructor & Destructor Documentation

◆ NEFFT1D() [1/3]

NEFFT1D ( std::shared_ptr< IMemoryManager > memory_manager = nullptr )

Default Constructor.

Definition at line 40 of file NEFFT1D.cpp.

     : _memory_group(std::move(memory_manager)),
       _digit_reverse_kernel(),
       _fft_kernels(),
       _scale_kernel(),
       _digit_reversed_input(),
       _digit_reverse_indices(),
       _num_ffts(0),
       _axis(0),
       _run_scale(false)
 {
 }

◆ NEFFT1D() [2/3]

NEFFT1D ( const NEFFT1D & )

delete

Prevent instances of this class from being copied (As this class contains pointers)

◆ NEFFT1D() [3/3]

NEFFT1D ( NEFFT1D && )

delete

Prevent instances of this class from being moved (As this class contains non movable objects)

◆ ~NEFFT1D()

~NEFFT1D ( )

default

Default destructor.

Member Function Documentation

◆ configure()

void configure	(	const ITensor *	input,
		ITensor *	output,
		const FFT1DInfo &	config
	)

Initialise the function's source and destinations.

Valid data layouts:

All

Valid data type configurations:

src	dst
F32	F32

Parameters

[in]	input	Source tensor. Data types supported: F32. Number of channels supported: 1 (real tensor) or 2 (complex tensor).
[out]	output	Destination tensor. Data types and data layouts supported: Same as `input`. Number of channels supported: 1 (real tensor) or 2 (complex tensor). If `input` is real, `output` must be complex.
[in]	config	FFT related configuration

Definition at line 53 of file NEFFT1D.cpp.

 {
     ARM_COMPUTE_ERROR_ON_NULLPTR(input, output);
     ARM_COMPUTE_ERROR_THROW_ON(NEFFT1D::validate(input->info(), output->info(), config));
     ARM_COMPUTE_LOG_PARAMS(input, output, config);
  
     // Decompose size to radix factors
     const auto         supported_radix   = NEFFTRadixStageKernel::supported_radix();
     const unsigned int N                 = input->info()->tensor_shape()[config.axis];
     const auto         decomposed_vector = arm_compute::helpers::fft::decompose_stages(N, supported_radix);
     ARM_COMPUTE_ERROR_ON(decomposed_vector.empty());
  
     // Flags
     _run_scale = config.direction == FFTDirection::Inverse;
  
     const bool is_c2r = input->info()->num_channels() == 2 && output->info()->num_channels() == 1;
  
     // Configure digit reverse
     FFTDigitReverseKernelInfo digit_reverse_config;
     digit_reverse_config.axis      = config.axis;
     digit_reverse_config.conjugate = config.direction == FFTDirection::Inverse;
     TensorInfo digit_reverse_indices_info(TensorShape(input->info()->tensor_shape()[config.axis]), 1, DataType::U32);
     _digit_reverse_indices.allocator()->init(digit_reverse_indices_info);
     _memory_group.manage(&_digit_reversed_input);
     _digit_reverse_kernel = std::make_unique<NEFFTDigitReverseKernel>();
     _digit_reverse_kernel->configure(input, &_digit_reversed_input, &_digit_reverse_indices, digit_reverse_config);
  
     // Create and configure FFT kernels
     unsigned int Nx = 1;
     _num_ffts       = decomposed_vector.size();
     _fft_kernels.resize(_num_ffts);
     _axis = config.axis;
  
     for (unsigned int i = 0; i < _num_ffts; ++i)
     {
         const unsigned int radix_for_stage = decomposed_vector.at(i);
  
         FFTRadixStageKernelInfo fft_kernel_info;
         fft_kernel_info.axis           = config.axis;
         fft_kernel_info.radix          = radix_for_stage;
         fft_kernel_info.Nx             = Nx;
         fft_kernel_info.is_first_stage = (i == 0);
         _fft_kernels[i]                = std::make_unique<NEFFTRadixStageKernel>();
         _fft_kernels[i]->configure(&_digit_reversed_input, ((i == (_num_ffts - 1)) && !is_c2r) ? output : nullptr,
                                    fft_kernel_info);
  
         Nx *= radix_for_stage;
     }
  
     // Configure scale kernel
     if (_run_scale)
     {
         FFTScaleKernelInfo scale_config;
         scale_config.scale     = static_cast<float>(N);
         scale_config.conjugate = config.direction == FFTDirection::Inverse;
         _scale_kernel          = std::make_unique<NEFFTScaleKernel>();
         is_c2r ? _scale_kernel->configure(&_digit_reversed_input, output, scale_config)
                         : _scale_kernel->configure(output, nullptr, scale_config);
     }
  
     // Allocate tensors
     _digit_reversed_input.allocator()->allocate();
     _digit_reverse_indices.allocator()->allocate();
  
     // Init digit reverse indices
     const auto digit_reverse_cpu = arm_compute::helpers::fft::digit_reverse_indices(N, decomposed_vector);
     std::copy_n(digit_reverse_cpu.data(), N, reinterpret_cast<unsigned int *>(_digit_reverse_indices.buffer()));
 }

References TensorAllocator::allocate(), Tensor::allocator(), ARM_COMPUTE_ERROR_ON, ARM_COMPUTE_ERROR_ON_NULLPTR, ARM_COMPUTE_ERROR_THROW_ON, ARM_COMPUTE_LOG_PARAMS, FFTDigitReverseKernelInfo::axis, FFT1DInfo::axis, FFTRadixStageKernelInfo::axis, Tensor::buffer(), FFTScaleKernelInfo::conjugate, FFTDigitReverseKernelInfo::conjugate, arm_compute::helpers::fft::decompose_stages(), arm_compute::helpers::fft::digit_reverse_indices(), FFT1DInfo::direction, ITensor::info(), TensorAllocator::init(), arm_compute::test::validation::input, arm_compute::Inverse, FFTRadixStageKernelInfo::is_first_stage, MemoryGroup::manage(), N, ITensorInfo::num_channels(), FFTRadixStageKernelInfo::Nx, FFTRadixStageKernelInfo::radix, FFTScaleKernelInfo::scale, NEFFTRadixStageKernel::supported_radix(), arm_compute::U32, and NEFFT1D::validate().

Referenced by NEFFT2D::configure().

◆ operator=() [1/2]

NEFFT1D& operator= ( const NEFFT1D & )

delete

Prevent instances of this class from being copied (As this class contains pointers)

◆ operator=() [2/2]

NEFFT1D& operator= ( NEFFT1D && )

delete

Prevent instances of this class from being moved (As this class contains non movable objects)

◆ run()

void run ( )

overridevirtual

Run the kernels contained in the function.

For CPU kernels:

Multi-threading is used for the kernels which are parallelisable.
By default std::thread::hardware_concurrency() threads are used.

Note: CPPScheduler::set_num_threads() can be used to manually set the number of threads

For OpenCL kernels:

All the kernels are enqueued on the queue associated with CLScheduler.
The queue is then flushed.

Note: The function will not block until the kernels are executed. It is the user's responsibility to wait. prepare() will be called on the first run if it hasn't been called already.

Implements IFunction.

Definition at line 148 of file NEFFT1D.cpp.

 {
     MemoryGroupResourceScope scope_mg(_memory_group);
  
     NEScheduler::get().schedule(_digit_reverse_kernel.get(), (_axis == 0 ? Window::DimY : Window::DimZ));
  
     for (unsigned int i = 0; i < _num_ffts; ++i)
     {
         NEScheduler::get().schedule(_fft_kernels[i].get(), (_axis == 0 ? Window::DimY : Window::DimX));
     }
  
     // Run output scaling
     if (_run_scale)
     {
         NEScheduler::get().schedule(_scale_kernel.get(), Window::DimY);
     }
 }

References Window::DimX, Window::DimY, Window::DimZ, Scheduler::get(), and IScheduler::schedule().

Referenced by NEFFT2D::run().

◆ validate()

Status validate	(	const ITensorInfo *	input,
		const ITensorInfo *	output,
		const FFT1DInfo &	config
	)

static

Static function to check if given info will lead to a valid configuration of NEFFT1D.

Parameters

[in]	input	Source tensor info. Data types supported: F32.
[in]	output	Destination tensor info. Data types and data layouts supported: Same as `input`.
[in]	config	FFT related configuration

Returns: a status

Definition at line 122 of file NEFFT1D.cpp.

 {
     ARM_COMPUTE_RETURN_ERROR_ON_NULLPTR(input, output);
     ARM_COMPUTE_RETURN_ERROR_ON(input->data_type() != DataType::F32);
     ARM_COMPUTE_RETURN_ERROR_ON(input->num_channels() > 2);
     ARM_COMPUTE_RETURN_ERROR_ON(std::set<unsigned int>({0, 1}).count(config.axis) == 0);
  
     // Check if FFT is decomposable
     const auto         supported_radix   = NEFFTRadixStageKernel::supported_radix();
     const unsigned int N                 = input->tensor_shape()[config.axis];
     const auto         decomposed_vector = arm_compute::helpers::fft::decompose_stages(N, supported_radix);
     ARM_COMPUTE_RETURN_ERROR_ON(decomposed_vector.empty());
  
     // Checks performed when output is configured
     if ((output != nullptr) && (output->total_size() != 0))
     {
         // All combinations are supported except real input with real output (i.e., both input channels set to 1)
         ARM_COMPUTE_RETURN_ERROR_ON(output->num_channels() == 1 && input->num_channels() == 1);
         ARM_COMPUTE_RETURN_ERROR_ON(output->num_channels() > 2);
         ARM_COMPUTE_RETURN_ERROR_ON_MISMATCHING_SHAPES(input, output);
         ARM_COMPUTE_RETURN_ERROR_ON_MISMATCHING_DATA_TYPES(input, output);
     }
  
     return Status{};
 }

References ARM_COMPUTE_RETURN_ERROR_ON, ARM_COMPUTE_RETURN_ERROR_ON_MISMATCHING_DATA_TYPES, ARM_COMPUTE_RETURN_ERROR_ON_MISMATCHING_SHAPES, ARM_COMPUTE_RETURN_ERROR_ON_NULLPTR, FFT1DInfo::axis, arm_compute::helpers::fft::decompose_stages(), arm_compute::F32, arm_compute::test::validation::input, N, ITensorInfo::num_channels(), NEFFTRadixStageKernel::supported_radix(), and ITensorInfo::total_size().

Referenced by NEFFT1D::configure(), and NEFFT2D::validate().

The documentation for this class was generated from the following files:

arm_compute/runtime/NEON/functions/NEFFT1D.h
src/runtime/NEON/functions/NEFFT1D.cpp

Public Member Functions

Static Public Member Functions

Detailed Description

Constructor & Destructor Documentation

◆ NEFFT1D() [1/3]

◆ NEFFT1D() [2/3]

◆ NEFFT1D() [3/3]

◆ ~NEFFT1D()

Member Function Documentation

◆ configure()

◆ operator=() [1/2]

◆ operator=() [2/2]

◆ run()

◆ validate()