Ne10/doc/NE10__fft_8c_source.html

 /*
  *  Copyright 2014-16 ARM Limited and Contributors.
  *  All rights reserved.
  *
  *  Redistribution and use in source and binary forms, with or without
  *  modification, are permitted provided that the following conditions are met:
  *    * Redistributions of source code must retain the above copyright
  *      notice, this list of conditions and the following disclaimer.
  *    * Redistributions in binary form must reproduce the above copyright
  *      notice, this list of conditions and the following disclaimer in the
  *      documentation and/or other materials provided with the distribution.
  *    * Neither the name of ARM Limited nor the
  *      names of its contributors may be used to endorse or promote products
  *      derived from this software without specific prior written permission.
  *
  *  THIS SOFTWARE IS PROVIDED BY ARM LIMITED AND CONTRIBUTORS "AS IS" AND
  *  ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
  *  WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
  *  DISCLAIMED. IN NO EVENT SHALL ARM LIMITED AND CONTRIBUTORS BE LIABLE FOR ANY
  *  DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
  *  (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
  *  LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
  *  ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  *  (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
  *  SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  */

 /* license of Kiss FFT */
 /*
 Copyright (c) 2003-2010, Mark Borgerding

 All rights reserved.

 Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met:

     * Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer.
     * Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or other materials provided with the distribution.
     * Neither the author nor the names of any contributors may be used to endorse or promote products derived from this software without specific prior written permission.

 THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */

 /*
  * NE10 Library : dsp/NE10_fft.c
  */

 #include "NE10_types.h"
 #include "NE10_macros.h"
 #include "NE10_fft.h"

 /*
  * Decomposes an FFT of length n into a sequence of butterfly stages and writes the
  * result to the factor buffer 'facbuf'.
  *
  * Factor buffer layout:
  *     index 0: stage count
  *     index 1: stride for the first stage
  *     index 2 to (2*stage_count + 1): one pair per stage, holding the factor that was
  *                                     split off and the size left after dividing by it
  *     index (2*stage_count + 2): a flag specifying which algorithm to use
  *
  * e.g. 1024 samples might result in the following five stage radix-4 factors buffer:
  *          [5, 256, 4, 256, 4, 64, 4, 16, 4, 4, 4, 1]
  *          i.e. 1024 = 4x256, each of which is 4x64, each of which is 4x16, each of which
  *               is 4x4, each of which is 4x1. There are 5 stages, and the stride for the
  *               first stage is 256 (1024 / 4, for radix-4).
  *
  * Only the leading 42 int32 values are used to store factors.
  * The rest can be used as algorithm flags or status flags.
  * Even the leading bits of the stage number can be reused.
  *
  * Parameters:
  *     n                  size to factor; must be positive
  *     facbuf             output buffer; must not be NULL
  *     ne10_factor_flags  bit mask tested against NE10_FACTOR_EIGHT_FIRST_STAGE and
  *                        NE10_FACTOR_EIGHT to allow radix-8 factors
  *
  * Returns NE10_OK on success. Returns NE10_ERR when facbuf is NULL, when n <= 0, or
  * when more than 21 stages were produced.
  */
 ne10_int32_t ne10_factor (ne10_int32_t n,
         ne10_int32_t * facbuf,
         ne10_int32_t ne10_factor_flags)
 {
     // The algorithm flag is "returned" through the buffer so that the signature of
     // ne10_factor does not have to change; the buffer must be big enough for that.
     assert (NE10_MAXFACTORS >= 32);

     if (facbuf == NULL)
     {
         return NE10_ERR;
     }
     if (n <= 0)
     {
         return NE10_ERR;
     }

     const ne10_int32_t total_size = n;
     ne10_int32_t radix;
     ne10_int32_t stages = 0;

     // Stays NE10_FFT_ALG_DEFAULT unless a factor other than 2, 4 or 8 is needed.
     ne10_int32_t algorithm = NE10_FFT_ALG_DEFAULT;

     // Next free (factor, remaining size) pair; the first pair lives at index 2.
     ne10_int32_t *slot = facbuf + 2;

     // Split off factors in the priority order 8 (only when enabled by the flags),
     // 4, 2, 5, 3. When none of them divides n, n itself becomes the last factor.
     do
     {
         // With NE10_FACTOR_EIGHT_FIRST_STAGE the sizes 8, 24 and 40 are special-cased
         // so that a remaining size of 8 is emitted as one radix-8 stage: 24 and 40
         // first give up their factor 3 or 5, leaving exactly 8 for the next pass.
         const ne10_int32_t eight_first =
             (ne10_factor_flags & NE10_FACTOR_EIGHT_FIRST_STAGE) != 0;

         if (eight_first && (n == 8))
         {
             radix = 8;
         }
         else if (eight_first && (n == 24))
         {
             radix = 3;
             algorithm = NE10_FFT_ALG_ANY;
         }
         else if (eight_first && (n == 40))
         {
             radix = 5;
             algorithm = NE10_FFT_ALG_ANY;
         }
         else if ((ne10_factor_flags & NE10_FACTOR_EIGHT) && ((n % 8) == 0))
         {
             radix = 8;
         }
         else if ((n % 4) == 0)
         {
             radix = 4;
         }
         else if ((n % 2) == 0)
         {
             radix = 2;
         }
         else if ((n % 5) == 0)
         {
             radix = 5;
             algorithm = NE10_FFT_ALG_ANY;
         }
         else if ((n % 3) == 0)
         {
             radix = 3;
             algorithm = NE10_FFT_ALG_ANY;
         }
         else
         {
             // Nothing divides n any more: use what is left as the final factor.
             radix = n;
             algorithm = NE10_FFT_ALG_ANY;
         }

         n /= radix;
         slot[0] = radix;
         slot[1] = n;
         slot += 2;
         stages++;
     }
     while (n > 1);

     facbuf[0] = stages;
     // The stride is derived from the factor that was split off last.
     facbuf[1] = total_size / radix;

     if (stages > 21)
     {
         // Since nfft is ne10_int32_t, the stage count can never be greater than 21,
         // because 3^21 > 2^32
         return NE10_ERR;
     }

     // The algorithm flag goes directly behind the last (factor, size) pair.
     *slot = algorithm;
     return NE10_OK;
 }

 // Fills a twiddle matrix laid out as [radix-1][mstride].
 // The k == 0 line is not stored because its phase is 0, i.e. the
 // twiddle would always be (1.0, 0.0).
 // Entry (k, j) holds cos/sin of the phase -2 * pi * fstride * k * j / nfft.
 void ne10_fft_generate_twiddles_line_float32 (ne10_fft_cpx_float32_t * twiddles,
         const ne10_int32_t mstride,
         const ne10_int32_t fstride,
         const ne10_int32_t radix,
         const ne10_int32_t nfft)
 {
     const ne10_float64_t pi = NE10_PI;
     ne10_int32_t line, col;

     // Every entry is written exactly once and depends only on (line, col),
     // so the matrix is filled line by line.
     for (line = 1; line < radix; line++) // line 0 would be all (1.0, 0.0)
     {
         for (col = 0; col < mstride; col++)
         {
             // The product is evaluated in double precision and then narrowed
             // to ne10_float32_t before cos/sin are taken.
             const ne10_float32_t phase = -2 * pi * fstride * line * col / nfft;
             ne10_fft_cpx_float32_t *tw = &twiddles[mstride * (line - 1) + col];

             tw->r = (ne10_float32_t) cos (phase);
             tw->i = (ne10_float32_t) sin (phase);
         } // mstride
     } // radix
 }

 // Fills a transposed twiddle matrix laid out as [mstride][radix-1].
 // The k == 0 entry of every row is not stored because its phase is 0, i.e.
 // the twiddle would always be (1.0, 0.0).
 // Transposed twiddle tables are used in RFFT to avoid memory access by a large
 // stride.
 void ne10_fft_generate_twiddles_line_transposed_float32 (
     ne10_fft_cpx_float32_t* twiddles,
     const ne10_int32_t mstride,
     const ne10_int32_t fstride,
     const ne10_int32_t radix,
     const ne10_int32_t nfft)
 {
     const ne10_float64_t pi = NE10_PI;
     ne10_int32_t row, k;

     // Walking rows first and k second visits the index (radix - 1) * row + k - 1
     // in increasing order, so one running output pointer is enough.
     ne10_fft_cpx_float32_t *out = twiddles;

     for (row = 0; row < mstride; row++)
     {
         for (k = 1; k < radix; k++) // phase = 0 when k = 0
         {
             // Evaluated in double precision, then narrowed to ne10_float32_t
             // before cos/sin are taken.
             const ne10_float32_t phase = -2 * pi * fstride * k * row / nfft;

             out->r = (ne10_float32_t) cos (phase);
             out->i = (ne10_float32_t) sin (phase);
             out++;
         } // radix
     } // mstride
 }

 // Fills a fixed point twiddle matrix. The entry for (k, j) is stored at
 // twiddles[mstride * (k - 1) + j], i.e. the layout is [radix-1][mstride].
 // The k == 0 line is not stored because its phase is 0, i.e. the twiddle
 // would always be (1.0, 0.0).
 // Each component is cos/sin of the phase scaled by NE10_F2I32_MAX and rounded
 // with floor (0.5 + x).
 static void ne10_fft_generate_twiddles_line_int32 (ne10_fft_cpx_int32_t * twiddles,
         const ne10_int32_t mstride,
         const ne10_int32_t fstride,
         const ne10_int32_t radix,
         const ne10_int32_t nfft)
 {
     const ne10_float64_t pi = NE10_PI;
     ne10_int32_t line, col;

     // Every entry is written exactly once and depends only on (line, col),
     // so the matrix is filled line by line.
     for (line = 1; line < radix; line++) // line 0 would be all (1.0, 0.0)
     {
         for (col = 0; col < mstride; col++)
         {
             // Evaluated in double precision, then narrowed to ne10_float32_t
             // before cos/sin are taken.
             const ne10_float32_t phase = -2 * pi * fstride * line * col / nfft;
             ne10_fft_cpx_int32_t *entry = &twiddles[mstride * (line - 1) + col];

             entry->r = (ne10_int32_t) floor (0.5f + NE10_F2I32_MAX * cos(phase));
             entry->i = (ne10_int32_t) floor (0.5f + NE10_F2I32_MAX * sin(phase));
         } // mstride
     } // radix
 }

 // Generates the fixed point twiddle tables for every stage described by
 // 'factors' (as produced by ne10_factor) and stores them back to back in
 // 'twiddles'. The stages are visited from the last (factor, size) pair in the
 // buffer down to the first one.
 // Returns a pointer just past the last twiddle that was accounted for.
 ne10_fft_cpx_int32_t* ne10_fft_generate_twiddles_int32 (ne10_fft_cpx_int32_t * twiddles,
         const ne10_int32_t * factors,
         const ne10_int32_t nfft )
 {
     const ne10_int32_t num_stages = factors[0];
     ne10_int32_t stride = factors[1];
     ne10_int32_t stage;

     // First stage: a table is only generated when its radix is odd
     // (i.e. it is not 4 or 2).
     const ne10_int32_t first_radix = factors[2 * num_stages];
     if ((first_radix % 2) != 0)
     {
         // One slot is skipped in front of the generated line.
         // NOTE(review): the float32 variant writes (1.0, 0.0) into that slot,
         // this one leaves it untouched - confirm that no reader depends on it.
         ne10_fft_generate_twiddles_line_int32 (twiddles + 1, 1, stride, first_radix, nfft);
         twiddles += first_radix; // skipped slot + (first_radix - 1) generated entries
     }

     // Remaining stages.
     for (stage = num_stages - 1; stage > 0; stage--)
     {
         const ne10_int32_t radix = factors[2 * stage];
         const ne10_int32_t section = factors[2 * stage + 1];

         stride /= radix;
         ne10_fft_generate_twiddles_line_int32 (twiddles, section, stride, radix, nfft);
         twiddles += section * (radix - 1);
     } // stage

     return twiddles;
 }

 // Signature shared by the float32 twiddle line generators in this file
 // (ne10_fft_generate_twiddles_line_float32 and its transposed variant).
 // Arguments, in order: output twiddles, mstride, fstride, radix, nfft.
 typedef void (*line_generator_float32)(ne10_fft_cpx_float32_t*,
       const ne10_int32_t,
       const ne10_int32_t,
       const ne10_int32_t,
       const ne10_int32_t);

 // Generates the float32 twiddle tables for every stage described by 'factors'
 // (as produced by ne10_factor) and stores them back to back in 'twiddles'.
 // 'generator' decides the layout of each per-stage table. The stages are
 // visited from the last (factor, size) pair in the buffer down to the first.
 // Returns a pointer just past the last twiddle that was written.
 ne10_fft_cpx_float32_t* ne10_fft_generate_twiddles_impl_float32 (
       line_generator_float32 generator,
       ne10_fft_cpx_float32_t * twiddles,
       const ne10_int32_t * factors,
       const ne10_int32_t nfft)
 {
     const ne10_int32_t num_stages = factors[0];
     ne10_int32_t stride = factors[1];
     ne10_int32_t stage;

     // First stage: a table is only generated when its radix is odd
     // (i.e. it is not 4 or 2).
     const ne10_int32_t first_radix = factors[2 * num_stages];
     if ((first_radix % 2) != 0)
     {
         // The table starts with the trivial twiddle (1.0, 0.0), followed by
         // the (first_radix - 1) generated entries.
         twiddles->r = 1.0;
         twiddles->i = 0.0;
         generator (twiddles + 1, 1, stride, first_radix, nfft);
         twiddles += first_radix;
     }

     // Remaining stages.
     for (stage = num_stages - 1; stage > 0; stage--)
     {
         const ne10_int32_t radix = factors[2 * stage];
         const ne10_int32_t section = factors[2 * stage + 1];

         stride /= radix;
         generator (twiddles, section, stride, radix, nfft);
         twiddles += section * (radix - 1);
     } // stage

     return twiddles;
 }

 // Generates all per-stage float32 twiddle tables using the [radix-1][mstride]
 // line layout. Returns the pointer returned by the shared implementation,
 // i.e. the position just past the generated tables.
 ne10_fft_cpx_float32_t* ne10_fft_generate_twiddles_float32 (ne10_fft_cpx_float32_t * twiddles,
         const ne10_int32_t * factors,
         const ne10_int32_t nfft )
 {
     return ne10_fft_generate_twiddles_impl_float32 (
                ne10_fft_generate_twiddles_line_float32,
                twiddles, factors, nfft);
 }

 // Generates all per-stage float32 twiddle tables using the transposed
 // [mstride][radix-1] line layout. Returns the pointer returned by the shared
 // implementation, i.e. the position just past the generated tables.
 ne10_fft_cpx_float32_t* ne10_fft_generate_twiddles_transposed_float32 (
       ne10_fft_cpx_float32_t * twiddles,
       const ne10_int32_t * factors,
       const ne10_int32_t nfft)
 {
     return ne10_fft_generate_twiddles_impl_float32 (
                ne10_fft_generate_twiddles_line_transposed_float32,
                twiddles, factors, nfft);
 }

 /*
  * Allocates and initialises the configuration used by the NEON float32 complex FFT
  * of size nfft.
  *
  * One allocation holds, in this order: the state structure, the factor buffer
  * (NE10_MAXFACTORS * 2 entries), the twiddle table (nfft entries) and the scratch
  * buffer (nfft entries), plus NE10_FFT_BYTE_ALIGNMENT spare bytes for alignment.
  *
  * Sizes below 15 are handed to ne10_fft_alloc_c2c_float32_c.
  *
  * Returns the configuration, or NULL when
  *   - the allocation fails,
  *   - ne10_factor reports an error,
  *   - the generic algorithm (NE10_FFT_ALG_ANY) is required but nfft is not a
  *     multiple of NE10_FFT_PARA_LEVEL, or
  *   - there is no room left in the factor buffer to add the extra radix-4 stage.
  */
 ne10_fft_cfg_float32_t ne10_fft_alloc_c2c_float32_neon (ne10_int32_t nfft)
 {
     // For input shorter than 15, fall back to c version.
     // We would not get much improvement from NEON for these cases.
     if (nfft < 15)
     {
         return ne10_fft_alloc_c2c_float32_c (nfft);
     }

     ne10_fft_cfg_float32_t st = NULL;
     ne10_uint32_t memneeded = sizeof (ne10_fft_state_float32_t)
                               + sizeof (ne10_int32_t) * (NE10_MAXFACTORS * 2) /* factors */
                               + sizeof (ne10_fft_cpx_float32_t) * nfft       /* twiddles */
                               + sizeof (ne10_fft_cpx_float32_t) * nfft         /* buffer */
                               + NE10_FFT_BYTE_ALIGNMENT;             /* 64-bit alignment */

     st = (ne10_fft_cfg_float32_t) NE10_MALLOC (memneeded);

     // Bad allocation. This has to be tested before any member of st is
     // written, otherwise a failed allocation dereferences NULL.
     if (st == NULL)
     {
         return NULL;
     }

     // Only backward FFT is scaled by default.
     st->is_forward_scaled = 0;
     st->is_backward_scaled = 1;

     // Carve the factor buffer, twiddle table and scratch buffer out of the
     // memory that follows the state structure.
     uintptr_t address = (uintptr_t) st + sizeof (ne10_fft_state_float32_t);
     NE10_BYTE_ALIGNMENT (address, NE10_FFT_BYTE_ALIGNMENT);
     st->factors = (ne10_int32_t*) address;
     st->twiddles = (ne10_fft_cpx_float32_t*) (st->factors + (NE10_MAXFACTORS * 2));
     st->buffer = st->twiddles + nfft;

     // st->last_twiddles is default NULL.
     // Calling fft_c or fft_neon is decided by this pointers.
     st->last_twiddles = NULL;

     st->nfft = nfft;
     if (nfft % NE10_FFT_PARA_LEVEL == 0)
     {
         // Size of FFT satisfies requirement of NEON optimization.
         // Factor the reduced size first; the last stage is handled separately.
         st->nfft /= NE10_FFT_PARA_LEVEL;
         st->last_twiddles = st->twiddles + nfft / NE10_FFT_PARA_LEVEL;
     }

     ne10_int32_t result = ne10_factor (st->nfft, st->factors, NE10_FACTOR_EIGHT_FIRST_STAGE);

     // Cannot factor
     if (result == NE10_ERR)
     {
         NE10_FREE (st);
         return NULL;
     }

     // The algorithm flag sits directly behind the last (factor, size) pair.
     ne10_int32_t stage_count    = st->factors[0];
     ne10_int32_t algorithm_flag = st->factors[2 * (stage_count + 1)];

     if (algorithm_flag == NE10_FFT_ALG_ANY)
     {
         // The generic path is only available for sizes that are a multiple
         // of NE10_FFT_PARA_LEVEL.
         if (nfft % NE10_FFT_PARA_LEVEL)
         {
             NE10_FREE (st);
             return NULL;
         }

         ne10_fft_generate_twiddles_float32 (st->twiddles, st->factors, st->nfft);

         // Generate super twiddles for the last stage.
         ne10_fft_generate_twiddles_line_float32 (st->last_twiddles,
                 st->nfft,
                 1,
                 NE10_FFT_PARA_LEVEL,
                 nfft);
         // Restore the full size in the configuration.
         st->nfft *= NE10_FFT_PARA_LEVEL;
     }
     else
     {
         if (nfft % NE10_FFT_PARA_LEVEL == 0)
         {
             st->nfft = nfft;
             st->last_twiddles = NULL;

             // Adjust the factoring for a size "nfft / 4" FFT to work for size "nfft"
             if (stage_count > NE10_MAXFACTORS - 4)
             {
                 NE10_FREE (st);
                 return NULL;
             }
             st->factors[0]++;          // Bump the stage count
             st->factors[1] *= 4;       // Quadruple the first stage stride
             // Shift all (factor, size) pairs and the trailing algorithm flag up by
             // one pair to make room for the new stage at the front.
             memmove(&st->factors[4], &st->factors[2], ((2 * (stage_count + 1)) - 1) * sizeof(st->factors[0]));
             st->factors[2] = 4;        // Add a new radix-4 stage
             st->factors[3] = nfft / 4;
         }

         ne10_fft_generate_twiddles_float32 (st->twiddles, st->factors, st->nfft);
     }

     return st;
 }

 /*
  * Allocates and initialises the configuration used by the NEON int32 complex FFT
  * of size nfft.
  *
  * One allocation holds, in this order: the state structure, the factor buffer
  * (NE10_MAXFACTORS * 2 entries), the twiddle table (nfft entries) and the scratch
  * buffer (nfft entries), plus NE10_FFT_BYTE_ALIGNMENT spare bytes for alignment.
  *
  * Sizes below 15 are handed to ne10_fft_alloc_c2c_int32_c.
  *
  * Returns the configuration, or NULL when the allocation fails, when ne10_factor
  * reports an error, when the generic algorithm (NE10_FFT_ALG_ANY) is required but
  * nfft is not a multiple of NE10_FFT_PARA_LEVEL, or when the factor buffer has no
  * room left for the extra radix-4 stage.
  */
 ne10_fft_cfg_int32_t ne10_fft_alloc_c2c_int32_neon (ne10_int32_t nfft)
 {
     // Short inputs gain little from NEON: use the c version for them.
     if (nfft < 15)
     {
         return ne10_fft_alloc_c2c_int32_c (nfft);
     }

     // Non-zero when the size satisfies the requirement of the NEON optimization.
     const ne10_int32_t is_para_multiple = ((nfft % NE10_FFT_PARA_LEVEL) == 0);

     const ne10_uint32_t total_bytes = sizeof (ne10_fft_state_int32_t)
                                       + sizeof (ne10_int32_t) * (NE10_MAXFACTORS * 2) /* factors */
                                       + sizeof (ne10_fft_cpx_int32_t) * nfft         /* twiddles */
                                       + sizeof (ne10_fft_cpx_int32_t) * nfft           /* buffer */
                                       + NE10_FFT_BYTE_ALIGNMENT;             /* 64-bit alignment */

     ne10_fft_cfg_int32_t cfg = (ne10_fft_cfg_int32_t) NE10_MALLOC (total_bytes);
     if (cfg == NULL)
     {
         // Bad allocation.
         return NULL;
     }

     // Carve the factor buffer, twiddle table and scratch buffer out of the
     // memory that follows the state structure.
     uintptr_t cursor = (uintptr_t) cfg + sizeof (ne10_fft_state_int32_t);
     NE10_BYTE_ALIGNMENT (cursor, NE10_FFT_BYTE_ALIGNMENT);
     cfg->factors = (ne10_int32_t*) cursor;
     cfg->twiddles = (ne10_fft_cpx_int32_t*) (cfg->factors + (NE10_MAXFACTORS * 2));
     cfg->buffer = cfg->twiddles + nfft;

     // last_twiddles decides whether fft_c or fft_neon is called; it stays NULL
     // unless the reduced size is used.
     if (is_para_multiple)
     {
         cfg->nfft = nfft / NE10_FFT_PARA_LEVEL;
         cfg->last_twiddles = cfg->twiddles + nfft / NE10_FFT_PARA_LEVEL;
     }
     else
     {
         cfg->nfft = nfft;
         cfg->last_twiddles = NULL;
     }

     if (ne10_factor (cfg->nfft, cfg->factors, NE10_FACTOR_EIGHT_FIRST_STAGE) == NE10_ERR)
     {
         // Cannot factor
         NE10_FREE (cfg);
         return NULL;
     }

     // The algorithm flag sits directly behind the last (factor, size) pair.
     const ne10_int32_t stage_count    = cfg->factors[0];
     const ne10_int32_t algorithm_flag = cfg->factors[2 * (stage_count + 1)];

     if (algorithm_flag == NE10_FFT_ALG_ANY)
     {
         // Disable radix 8 for INT32 generic FFTs (it isn't supported)
         const ne10_int32_t status = ne10_factor (cfg->nfft, cfg->factors, NE10_FACTOR_DEFAULT);
         if ((status == NE10_ERR) || !is_para_multiple)
         {
             NE10_FREE (cfg);
             return NULL;
         }

         ne10_fft_generate_twiddles_int32 (cfg->twiddles, cfg->factors, cfg->nfft);

         // Generate super twiddles for the last stage.
         ne10_fft_generate_twiddles_line_int32 (cfg->last_twiddles,
                 cfg->nfft,
                 1,
                 NE10_FFT_PARA_LEVEL,
                 nfft);

         // Restore the full size in the configuration.
         cfg->nfft *= NE10_FFT_PARA_LEVEL;
         return cfg;
     }

     if (is_para_multiple)
     {
         // Adjust the factoring for a size "nfft / 4" FFT to work for size "nfft"
         if (stage_count > NE10_MAXFACTORS - 4)
         {
             NE10_FREE (cfg);
             return NULL;
         }

         cfg->nfft = nfft;
         cfg->last_twiddles = NULL;

         // All (factor, size) pairs plus the trailing algorithm flag move up by
         // one pair to make room for the new stage at the front.
         const ne10_int32_t moved_entries = (2 * (stage_count + 1)) - 1;

         cfg->factors[0] += 1;      // Bump the stage count
         cfg->factors[1] *= 4;      // Quadruple the first stage stride
         memmove (cfg->factors + 4, cfg->factors + 2, moved_entries * sizeof (cfg->factors[0]));
         cfg->factors[2] = 4;       // Add a new radix-4 stage
         cfg->factors[3] = nfft / 4;
     }

     ne10_fft_generate_twiddles_int32 (cfg->twiddles, cfg->factors, cfg->nfft);
     return cfg;
 }

 // Releases a float32 complex FFT configuration.
 // The allocation routine in this file obtains the block with NE10_MALLOC and
 // releases it with NE10_FREE on its error paths; the same macro is used here so
 // that allocation and release stay paired if the macros are ever redefined.
 void ne10_fft_destroy_c2c_float32 (ne10_fft_cfg_float32_t cfg)
 {
     NE10_FREE (cfg);
 }

 // Releases an int32 complex FFT configuration.
 // The allocation routine in this file obtains the block with NE10_MALLOC and
 // releases it with NE10_FREE on its error paths; the same macro is used here so
 // that allocation and release stay paired if the macros are ever redefined.
 void ne10_fft_destroy_c2c_int32 (ne10_fft_cfg_int32_t cfg)
 {
     NE10_FREE (cfg);
 }

 // Releases an int16 complex FFT configuration.
 // NE10_FREE is used for consistency with the allocation code in this file.
 // NOTE(review): the int16 allocation routine is not part of this file and is
 // presumed to use NE10_MALLOC as well - confirm.
 void ne10_fft_destroy_c2c_int16 (ne10_fft_cfg_int16_t cfg)
 {
     NE10_FREE (cfg);
 }
  // C2C_FFT_IFFT

 // Releases a float32 real-to-complex FFT configuration.
 // NE10_FREE is used for consistency with the allocation code in this file.
 // NOTE(review): the r2c allocation routine is not part of this file and is
 // presumed to use NE10_MALLOC as well - confirm.
 void ne10_fft_destroy_r2c_float32 (ne10_fft_r2c_cfg_float32_t cfg)
 {
     NE10_FREE (cfg);
 }

 // Releases an int32 real-to-complex FFT configuration.
 // NE10_FREE is used for consistency with the allocation code in this file.
 // NOTE(review): the r2c allocation routine is not part of this file and is
 // presumed to use NE10_MALLOC as well - confirm.
 void ne10_fft_destroy_r2c_int32 (ne10_fft_r2c_cfg_int32_t cfg)
 {
     NE10_FREE (cfg);
 }

 // Releases an int16 real-to-complex FFT configuration.
 // NE10_FREE is used for consistency with the allocation code in this file.
 // NOTE(review): the r2c allocation routine is not part of this file and is
 // presumed to use NE10_MALLOC as well - confirm.
 void ne10_fft_destroy_r2c_int16 (ne10_fft_r2c_cfg_int16_t cfg)
 {
     NE10_FREE (cfg);
 }
  // R2C_FFT_IFFT
NE10_FFT_ALG_DEFAULT
#define NE10_FFT_ALG_DEFAULT
Definition: NE10_fft.h:57

ne10_fft_state_float32_t::is_backward_scaled
ne10_int32_t is_backward_scaled
Flag to control scaling behaviour in backward floating point complex FFT.
Definition: NE10_types.h:261

NE10_FFT_PARA_LEVEL
#define NE10_FFT_PARA_LEVEL
Definition: NE10_fft.h:79

ne10_fft_state_int32_t::twiddles
ne10_fft_cpx_int32_t * twiddles
Definition: NE10_types.h:335

ne10_fft_destroy_r2c_int16
void ne10_fft_destroy_r2c_int16(ne10_fft_r2c_cfg_int16_t)
Destroys the configuration structure allocated by ne10_fft_alloc_r2c_int16 (frees memory...
Definition: NE10_fft.c:613

NE10_MAXFACTORS
#define NE10_MAXFACTORS
Structure for the floating point FFT function.
Definition: NE10_types.h:229

NE10_macros.h

ne10_int32_t
int32_t ne10_int32_t
Definition: NE10_types.h:76

ne10_fft_generate_twiddles_line_transposed_float32
void ne10_fft_generate_twiddles_line_transposed_float32(ne10_fft_cpx_float32_t *twiddles, const ne10_int32_t mstride, const ne10_int32_t fstride, const ne10_int32_t radix, const ne10_int32_t nfft)
Definition: NE10_fft.c:197

ne10_fft_destroy_r2c_int32
void ne10_fft_destroy_r2c_int32(ne10_fft_r2c_cfg_int32_t)
Destroys the configuration structure allocated by ne10_fft_alloc_r2c_int32 (frees memory...
Definition: NE10_fft.c:603

ne10_fft_r2c_state_float32_t
Definition: NE10_types.h:269

ne10_factor
ne10_int32_t ne10_factor(ne10_int32_t n, ne10_int32_t *facbuf, ne10_int32_t ne10_factor_flags)
Definition: NE10_fft.c:71

ne10_fft_state_int32_t
Definition: NE10_types.h:331

ne10_float32_t
float ne10_float32_t
Definition: NE10_types.h:80

ne10_fft_alloc_c2c_float32_neon
ne10_fft_cfg_float32_t ne10_fft_alloc_c2c_float32_neon(ne10_int32_t nfft)
Specific implementation of ne10_fft_alloc_c2c_float32 for ne10_fft_c2c_1d_float32_neon.
Definition: NE10_fft.c:348

ne10_fft_state_float32_t::nfft
ne10_int32_t nfft
Definition: NE10_types.h:241

ne10_fft_generate_twiddles_impl_float32
ne10_fft_cpx_float32_t * ne10_fft_generate_twiddles_impl_float32(line_generator_float32 generator, ne10_fft_cpx_float32_t *twiddles, const ne10_int32_t *factors, const ne10_int32_t nfft)
Definition: NE10_fft.c:284

ne10_fft_state_float32_t
Structure for the floating point FFT state.
Definition: NE10_types.h:239

ne10_fft_destroy_r2c_float32
void ne10_fft_destroy_r2c_float32(ne10_fft_r2c_cfg_float32_t)
Destroys the configuration structure allocated by ne10_fft_alloc_r2c_float32 (frees memory...
Definition: NE10_fft.c:593

NE10_FFT_BYTE_ALIGNMENT
#define NE10_FFT_BYTE_ALIGNMENT
Definition: NE10_fft.h:45

NE10_fft.h

ne10_fft_generate_twiddles_int32
ne10_fft_cpx_int32_t * ne10_fft_generate_twiddles_int32(ne10_fft_cpx_int32_t *twiddles, const ne10_int32_t *factors, const ne10_int32_t nfft)
Definition: NE10_fft.c:246

ne10_fft_cpx_float32_t
Definition: NE10_types.h:230

ne10_fft_state_float32_t::factors
ne10_int32_t * factors
Definition: NE10_types.h:242

ne10_fft_state_int32_t::nfft
ne10_int32_t nfft
Definition: NE10_types.h:333

ne10_fft_cfg_float32_t
ne10_fft_state_float32_t * ne10_fft_cfg_float32_t
Configuration structure for floating point FFT.
Definition: NE10_types.h:267

ne10_uint32_t
uint32_t ne10_uint32_t
Definition: NE10_types.h:77

NE10_PI
#define NE10_PI
NE10 defines a number of macros for use in its function signatures.
Definition: NE10_macros.h:47

ne10_fft_alloc_c2c_int32_neon
ne10_fft_cfg_int32_t ne10_fft_alloc_c2c_int32_neon(ne10_int32_t nfft)
Specific implementation of ne10_fft_alloc_c2c_int32 for ne10_fft_c2c_1d_int32_neon.
Definition: NE10_fft.c:451

ne10_fft_generate_twiddles_transposed_float32
ne10_fft_cpx_float32_t * ne10_fft_generate_twiddles_transposed_float32(ne10_fft_cpx_float32_t *twiddles, const ne10_int32_t *factors, const ne10_int32_t nfft)
Definition: NE10_fft.c:330

ne10_fft_state_float32_t::twiddles
ne10_fft_cpx_float32_t * twiddles
Definition: NE10_types.h:243

ne10_fft_alloc_c2c_float32_c
ne10_fft_cfg_float32_t ne10_fft_alloc_c2c_float32_c(ne10_int32_t nfft)
Specific implementation of ne10_fft_alloc_c2c_float32 for ne10_fft_c2c_1d_float32_c.
Definition: NE10_fft_float32.c:828

NE10_FREE
#define NE10_FREE(p)
Definition: NE10_macros.h:54

ne10_fft_state_float32_t::last_twiddles
ne10_fft_cpx_float32_t * last_twiddles
Definition: NE10_types.h:245

ne10_fft_cpx_int32_t
Structure for the 32-bit fixed point FFT function.
Definition: NE10_types.h:325

ne10_fft_cpx_int32_t::i
ne10_int32_t i
Definition: NE10_types.h:328

ne10_fft_generate_twiddles_line_float32
void ne10_fft_generate_twiddles_line_float32(ne10_fft_cpx_float32_t *twiddles, const ne10_int32_t mstride, const ne10_int32_t fstride, const ne10_int32_t radix, const ne10_int32_t nfft)
Definition: NE10_fft.c:171

ne10_fft_state_int32_t::factors
ne10_int32_t * factors
Definition: NE10_types.h:334

ne10_fft_destroy_c2c_int32
void ne10_fft_destroy_c2c_int32(ne10_fft_cfg_int32_t)
Destroys the configuration structure allocated by variants of ne10_fft_alloc_c2c_int32 (frees memory...
Definition: NE10_fft.c:566

ne10_fft_destroy_c2c_float32
void ne10_fft_destroy_c2c_float32(ne10_fft_cfg_float32_t)
Destroys the configuration structure allocated by variants of ne10_fft_alloc_c2c_float32 (frees memor...
Definition: NE10_fft.c:556

NE10_FACTOR_EIGHT_FIRST_STAGE
#define NE10_FACTOR_EIGHT_FIRST_STAGE
Definition: NE10_fft.h:72

ne10_fft_r2c_state_int32_t
Definition: NE10_types.h:342

ne10_fft_generate_twiddles_float32
ne10_fft_cpx_float32_t * ne10_fft_generate_twiddles_float32(ne10_fft_cpx_float32_t *twiddles, const ne10_int32_t *factors, const ne10_int32_t nfft)
Definition: NE10_fft.c:320

NE10_FFT_ALG_ANY
#define NE10_FFT_ALG_ANY
Definition: NE10_fft.h:58

ne10_fft_state_int16_t
Definition: NE10_types.h:300

NE10_F2I32_MAX
#define NE10_F2I32_MAX
Definition: NE10_macros.h:81

ne10_fft_r2c_state_int16_t
Definition: NE10_types.h:310

ne10_fft_state_int32_t::buffer
ne10_fft_cpx_int32_t * buffer
Definition: NE10_types.h:336

NE10_MALLOC
#define NE10_MALLOC
Definition: NE10_macros.h:53

NE10_BYTE_ALIGNMENT
#define NE10_BYTE_ALIGNMENT(address, alignment)
Definition: NE10_macros.h:63

NE10_ERR
#define NE10_ERR
Definition: NE10_types.h:66

ne10_fft_cpx_int32_t::r
ne10_int32_t r
Definition: NE10_types.h:327

ne10_float64_t
double ne10_float64_t
Definition: NE10_types.h:81

NE10_OK
#define NE10_OK
Definition: NE10_types.h:65

ne10_fft_cpx_float32_t::i
ne10_float32_t i
Definition: NE10_types.h:233

ne10_fft_alloc_c2c_int32_c
ne10_fft_cfg_int32_t ne10_fft_alloc_c2c_int32_c(ne10_int32_t nfft)
Specific implementation of ne10_fft_alloc_c2c_int32 for ne10_fft_c2c_1d_int32_c.
Definition: NE10_fft_int32.c:1054

ne10_fft_state_float32_t::buffer
ne10_fft_cpx_float32_t * buffer
Definition: NE10_types.h:244

ne10_fft_destroy_c2c_int16
void ne10_fft_destroy_c2c_int16(ne10_fft_cfg_int16_t)
Destroys the configuration structure allocated by ne10_fft_alloc_c2c_int16 (frees memory...
Definition: NE10_fft.c:576

NE10_FACTOR_EIGHT
#define NE10_FACTOR_EIGHT
Definition: NE10_fft.h:73

NE10_types.h

ne10_fft_state_float32_t::is_forward_scaled
ne10_int32_t is_forward_scaled
Flag to control scaling behaviour in forward floating point complex FFT.
Definition: NE10_types.h:253

ne10_fft_state_int32_t::last_twiddles
ne10_fft_cpx_int32_t * last_twiddles
Definition: NE10_types.h:337

ne10_fft_cpx_float32_t::r
ne10_float32_t r
Definition: NE10_types.h:232

line_generator_float32
void(* line_generator_float32)(ne10_fft_cpx_float32_t *, const ne10_int32_t, const ne10_int32_t, const ne10_int32_t, const ne10_int32_t)
Definition: NE10_fft.c:278

NE10_FACTOR_DEFAULT
#define NE10_FACTOR_DEFAULT
Definition: NE10_fft.h:71

ne10_fft_cfg_int32_t
ne10_fft_state_int32_t * ne10_fft_cfg_int32_t
Definition: NE10_types.h:340