build-rockchip.git

/* ---------------------------------------------------------------------- 
 * Project:      CMSIS DSP Library 
 * Title:        arm_rfft_f32.c 
 * Description:  RFFT & RIFFT Floating point process function 
 * 
 * $Date:        27. January 2017 
 * $Revision:    V.1.5.1 
 * 
 * Target Processor: Cortex-M cores 
 * -------------------------------------------------------------------- */ 
/* 
 * Copyright (C) 2010-2017 ARM Limited or its affiliates. All rights reserved. 
 * 
 * SPDX-License-Identifier: Apache-2.0 
 * 
 * Licensed under the Apache License, Version 2.0 (the License); you may 
 * not use this file except in compliance with the License. 
 * You may obtain a copy of the License at 
 * 
 * www.apache.org/licenses/LICENSE-2.0 
 * 
 * Unless required by applicable law or agreed to in writing, software 
 * distributed under the License is distributed on an AS IS BASIS, WITHOUT 
 * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 
 * See the License for the specific language governing permissions and 
 * limitations under the License. 
 */ 
 
#include "arm_math.h" 
 
void stage_rfft_f32( 
  arm_rfft_fast_instance_f32 * S, 
  float32_t * p, float32_t * pOut) 
{ 
   uint32_t  k;                                   /* Loop Counter                     */ 
   float32_t twR, twI;                           /* RFFT Twiddle coefficients        */ 
   float32_t * pCoeff = S->pTwiddleRFFT;  /* Points to RFFT Twiddle factors   */ 
   float32_t *pA = p;                           /* increasing pointer               */ 
   float32_t *pB = p;                           /* decreasing pointer               */ 
   float32_t xAR, xAI, xBR, xBI;                /* temporary variables              */ 
   float32_t t1a, t1b;                         /* temporary variables              */ 
   float32_t p0, p1, p2, p3;                   /* temporary variables              */ 
 
 
   k = (S->Sint).fftLen - 1; 
 
   /* Pack first and last sample of the frequency domain together */ 
 
   xBR = pB[0]; 
   xBI = pB[1]; 
   xAR = pA[0]; 
   xAI = pA[1]; 
 
   twR = *pCoeff++ ; 
   twI = *pCoeff++ ; 
 
   // U1 = XA(1) + XB(1); % It is real 
   t1a = xBR + xAR  ; 
 
   // U2 = XB(1) - XA(1); % It is imaginary 
   t1b = xBI + xAI  ; 
 
   // real(tw * (xB - xA)) = twR * (xBR - xAR) - twI * (xBI - xAI); 
   // imag(tw * (xB - xA)) = twI * (xBR - xAR) + twR * (xBI - xAI); 
   *pOut++ = 0.5f * ( t1a + t1b ); 
   *pOut++ = 0.5f * ( t1a - t1b ); 
 
   // XA(1) = 1/2*( U1 - imag(U2) +  i*( U1 +imag(U2) )); 
   pB  = p + 2*k; 
   pA += 2; 
 
   do 
   { 
      /* 
         function X = my_split_rfft(X, ifftFlag) 
         % X is a series of real numbers 
         L  = length(X); 
         XC = X(1:2:end) +i*X(2:2:end); 
         XA = fft(XC); 
         XB = conj(XA([1 end:-1:2])); 
         TW = i*exp(-2*pi*i*[0:L/2-1]/L).'; 
         for l = 2:L/2 
            XA(l) = 1/2 * (XA(l) + XB(l) + TW(l) * (XB(l) - XA(l))); 
         end 
         XA(1) = 1/2* (XA(1) + XB(1) + TW(1) * (XB(1) - XA(1))) + i*( 1/2*( XA(1) + XB(1) + i*( XA(1) - XB(1)))); 
         X = XA; 
      */ 
 
      xBI = pB[1]; 
      xBR = pB[0]; 
      xAR = pA[0]; 
      xAI = pA[1]; 
 
      twR = *pCoeff++; 
      twI = *pCoeff++; 
 
      t1a = xBR - xAR ; 
      t1b = xBI + xAI ; 
 
      // real(tw * (xB - xA)) = twR * (xBR - xAR) - twI * (xBI - xAI); 
      // imag(tw * (xB - xA)) = twI * (xBR - xAR) + twR * (xBI - xAI); 
      p0 = twR * t1a; 
      p1 = twI * t1a; 
      p2 = twR * t1b; 
      p3 = twI * t1b; 
 
      *pOut++ = 0.5f * (xAR + xBR + p0 + p3 ); //xAR 
      *pOut++ = 0.5f * (xAI - xBI + p1 - p2 ); //xAI 
 
      pA += 2; 
      pB -= 2; 
      k--; 
   } while (k > 0U); 
} 
 
/* Prepares data for inverse cfft */ 
void merge_rfft_f32( 
arm_rfft_fast_instance_f32 * S, 
float32_t * p, float32_t * pOut) 
{ 
   uint32_t  k;                                /* Loop Counter                     */ 
   float32_t twR, twI;                        /* RFFT Twiddle coefficients        */ 
   float32_t *pCoeff = S->pTwiddleRFFT;        /* Points to RFFT Twiddle factors   */ 
   float32_t *pA = p;                        /* increasing pointer               */ 
   float32_t *pB = p;                        /* decreasing pointer               */ 
   float32_t xAR, xAI, xBR, xBI;            /* temporary variables              */ 
   float32_t t1a, t1b, r, s, t, u;            /* temporary variables              */ 
 
   k = (S->Sint).fftLen - 1; 
 
   xAR = pA[0]; 
   xAI = pA[1]; 
 
   pCoeff += 2 ; 
 
   *pOut++ = 0.5f * ( xAR + xAI ); 
   *pOut++ = 0.5f * ( xAR - xAI ); 
 
   pB  =  p + 2*k ; 
   pA +=  2       ; 
 
   while (k > 0U) 
   { 
      /* G is half of the frequency complex spectrum */ 
      //for k = 2:N 
      //    Xk(k) = 1/2 * (G(k) + conj(G(N-k+2)) + Tw(k)*( G(k) - conj(G(N-k+2)))); 
      xBI =   pB[1]    ; 
      xBR =   pB[0]    ; 
      xAR =  pA[0]; 
      xAI =  pA[1]; 
 
      twR = *pCoeff++; 
      twI = *pCoeff++; 
 
      t1a = xAR - xBR ; 
      t1b = xAI + xBI ; 
 
      r = twR * t1a; 
      s = twI * t1b; 
      t = twI * t1a; 
      u = twR * t1b; 
 
      // real(tw * (xA - xB)) = twR * (xAR - xBR) - twI * (xAI - xBI); 
      // imag(tw * (xA - xB)) = twI * (xAR - xBR) + twR * (xAI - xBI); 
      *pOut++ = 0.5f * (xAR + xBR - r - s ); //xAR 
      *pOut++ = 0.5f * (xAI - xBI + t - u ); //xAI 
 
      pA += 2; 
      pB -= 2; 
      k--; 
   } 
 
} 
 
/** 
* @ingroup groupTransforms 
*/ 
 
/** 
 * @defgroup RealFFT Real FFT Functions 
 * 
 * \par 
 * The CMSIS DSP library includes specialized algorithms for computing the 
 * FFT of real data sequences.  The FFT is defined over complex data but 
 * in many applications the input is real.  Real FFT algorithms take advantage 
 * of the symmetry properties of the FFT and have a speed advantage over complex 
 * algorithms of the same length. 
 * \par 
 * The Fast RFFT algorith relays on the mixed radix CFFT that save processor usage. 
 * \par 
 * The real length N forward FFT of a sequence is computed using the steps shown below. 
 * \par 
 * \image html RFFT.gif "Real Fast Fourier Transform" 
 * \par 
 * The real sequence is initially treated as if it were complex to perform a CFFT. 
 * Later, a processing stage reshapes the data to obtain half of the frequency spectrum 
 * in complex format. Except the first complex number that contains the two real numbers 
 * X[0] and X[N/2] all the data is complex. In other words, the first complex sample 
 * contains two real values packed. 
 * \par 
 * The input for the inverse RFFT should keep the same format as the output of the 
 * forward RFFT. A first processing stage pre-process the data to later perform an 
 * inverse CFFT. 
 * \par 
 * \image html RIFFT.gif "Real Inverse Fast Fourier Transform" 
 * \par 
 * The algorithms for floating-point, Q15, and Q31 data are slightly different 
 * and we describe each algorithm in turn. 
 * \par Floating-point 
 * The main functions are arm_rfft_fast_f32() and arm_rfft_fast_init_f32(). 
 * The older functions arm_rfft_f32() and arm_rfft_init_f32() have been 
 * deprecated but are still documented. 
 * \par 
 * The FFT of a real N-point sequence has even symmetry in the frequency 
 * domain. The second half of the data equals the conjugate of the first 
 * half flipped in frequency. Looking at the data, we see that we can 
 * uniquely represent the FFT using only N/2 complex numbers. These are 
 * packed into the output array in alternating real and imaginary 
 * components: 
 * \par 
 * X = { real[0], imag[0], real[1], imag[1], real[2], imag[2] ... 
 * real[(N/2)-1], imag[(N/2)-1 } 
 * \par 
 * It happens that the first complex number (real[0], imag[0]) is actually 
 * all real. real[0] represents the DC offset, and imag[0] should be 0. 
 * (real[1], imag[1]) is the fundamental frequency, (real[2], imag[2]) is 
 * the first harmonic and so on. 
 * \par 
 * The real FFT functions pack the frequency domain data in this fashion. 
 * The forward transform outputs the data in this form and the inverse 
 * transform expects input data in this form. The function always performs 
 * the needed bitreversal so that the input and output data is always in 
 * normal order. The functions support lengths of [32, 64, 128, ..., 4096] 
 * samples. 
 * \par Q15 and Q31 
 * The real algorithms are defined in a similar manner and utilize N/2 complex 
 * transforms behind the scenes. 
 * \par 
 * The complex transforms used internally include scaling to prevent fixed-point 
 * overflows.  The overall scaling equals 1/(fftLen/2). 
 * \par 
 * A separate instance structure must be defined for each transform used but 
 * twiddle factor and bit reversal tables can be reused. 
 * \par 
 * There is also an associated initialization function for each data type. 
 * The initialization function performs the following operations: 
 * - Sets the values of the internal structure fields. 
 * - Initializes twiddle factor table and bit reversal table pointers. 
 * - Initializes the internal complex FFT data structure. 
 * \par 
 * Use of the initialization function is optional. 
 * However, if the initialization function is used, then the instance structure 
 * cannot be placed into a const data section. To place an instance structure 
 * into a const data section, the instance structure should be manually 
 * initialized as follows: 
 * <pre> 
 *arm_rfft_instance_q31 S = {fftLenReal, fftLenBy2, ifftFlagR, bitReverseFlagR, twidCoefRModifier, pTwiddleAReal, pTwiddleBReal, pCfft}; 
 *arm_rfft_instance_q15 S = {fftLenReal, fftLenBy2, ifftFlagR, bitReverseFlagR, twidCoefRModifier, pTwiddleAReal, pTwiddleBReal, pCfft}; 
 * </pre> 
 * where <code>fftLenReal</code> is the length of the real transform; 
 * <code>fftLenBy2</code> length of  the internal complex transform. 
 * <code>ifftFlagR</code> Selects forward (=0) or inverse (=1) transform. 
 * <code>bitReverseFlagR</code> Selects bit reversed output (=0) or normal order 
 * output (=1). 
 * <code>twidCoefRModifier</code> stride modifier for the twiddle factor table. 
 * The value is based on the FFT length; 
 * <code>pTwiddleAReal</code>points to the A array of twiddle coefficients; 
 * <code>pTwiddleBReal</code>points to the B array of twiddle coefficients; 
 * <code>pCfft</code> points to the CFFT Instance structure. The CFFT structure 
 * must also be initialized.  Refer to arm_cfft_radix4_f32() for details regarding 
 * static initialization of the complex FFT instance structure. 
 */ 
 
/** 
* @addtogroup RealFFT 
* @{ 
*/ 
 
/** 
* @brief Processing function for the floating-point real FFT. 
* @param[in]  *S              points to an arm_rfft_fast_instance_f32 structure. 
* @param[in]  *p              points to the input buffer. 
* @param[in]  *pOut           points to the output buffer. 
* @param[in]  ifftFlag        RFFT if flag is 0, RIFFT if flag is 1 
* @return none. 
*/ 
 
void arm_rfft_fast_f32( 
arm_rfft_fast_instance_f32 * S, 
float32_t * p, float32_t * pOut, 
uint8_t ifftFlag) 
{ 
   arm_cfft_instance_f32 * Sint = &(S->Sint); 
   Sint->fftLen = S->fftLenRFFT / 2; 
 
   /* Calculation of Real FFT */ 
   if (ifftFlag) 
   { 
      /*  Real FFT compression */ 
      merge_rfft_f32(S, p, pOut); 
 
      /* Complex radix-4 IFFT process */ 
      arm_cfft_f32( Sint, pOut, ifftFlag, 1); 
   } 
   else 
   { 
      /* Calculation of RFFT of input */ 
      arm_cfft_f32( Sint, p, ifftFlag, 1); 
 
      /*  Real FFT extraction */ 
      stage_rfft_f32(S, p, pOut); 
   } 
} 
 
/** 
* @} end of RealFFT group 
*/