/* ----------------------------------------------------------------------
 * Project:      CMSIS DSP Library
 * Title:        arm_cfft_radix4_f32.c
 * Description:  Radix-4 Decimation in Frequency CFFT & CIFFT Floating point processing function
 *
 * $Date:        27. 
January 2017 * $Revision:    V.1.5.1 * * Target Processor: Cortex-M cores * -------------------------------------------------------------------- *//* * Copyright (C) 2010-2017 ARM Limited or its affiliates. All rights reserved. * * SPDX-License-Identifier: Apache-2.0 * * Licensed under the Apache License, Version 2.0 (the License); you may * not use this file except in compliance with the License. * You may obtain a copy of the License at * * www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an AS IS BASIS, WITHOUT * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */#include "arm_math.h"extern void arm_bitreversal_f32(float32_t * pSrc,uint16_t fftSize,uint16_t bitRevFactor,uint16_t * pBitRevTab);void arm_radix4_butterfly_f32(float32_t * pSrc,uint16_t fftLen,float32_t * pCoef,uint16_t twidCoefModifier);void arm_radix4_butterfly_inverse_f32(float32_t * pSrc,uint16_t fftLen,float32_t * pCoef,uint16_t twidCoefModifier,float32_t onebyfftLen);/*** @ingroup groupTransforms*//*** @addtogroup ComplexFFT* @{*//*** @details* @brief Processing function for the floating-point Radix-4 CFFT/CIFFT.* @deprecated Do not use this function.  It has been superseded by \ref arm_cfft_f32 and will be removed* in the future.* @param[in]      *S    points to an instance of the floating-point Radix-4 CFFT/CIFFT structure.* @param[in, out] *pSrc points to the complex data buffer of size <code>2*fftLen</code>. 
Processing occurs in-place.* @return none.*/void arm_cfft_radix4_f32(  const arm_cfft_radix4_instance_f32 * S,  float32_t * pSrc){   if (S->ifftFlag == 1U)   {      /*  Complex IFFT radix-4  */      arm_radix4_butterfly_inverse_f32(pSrc, S->fftLen, S->pTwiddle, S->twidCoefModifier, S->onebyfftLen);   }   else   {      /*  Complex FFT radix-4  */      arm_radix4_butterfly_f32(pSrc, S->fftLen, S->pTwiddle, S->twidCoefModifier);   }   if (S->bitReverseFlag == 1U)   {      /*  Bit Reversal */      arm_bitreversal_f32(pSrc, S->fftLen, S->bitRevFactor, S->pBitRevTable);   }}/*** @} end of ComplexFFT group*//* ---------------------------------------------------------------------- * Internal helper function used by the FFTs * ---------------------------------------------------------------------- *//** @brief  Core function for the floating-point CFFT butterfly process.* @param[in, out] *pSrc            points to the in-place buffer of floating-point data type.* @param[in]      fftLen           length of the FFT.* @param[in]      *pCoef           points to the twiddle coefficient buffer.* @param[in]      twidCoefModifier twiddle coefficient modifier that supports different size FFTs with the same twiddle factor table.* @return none.*/void arm_radix4_butterfly_f32(float32_t * pSrc,uint16_t fftLen,float32_t * pCoef,uint16_t twidCoefModifier){   float32_t co1, co2, co3, si1, si2, si3;   uint32_t ia1, ia2, ia3;   uint32_t i0, i1, i2, i3;   uint32_t n1, n2, j, k;#if defined (ARM_MATH_DSP)   /* Run the below code for Cortex-M4 and Cortex-M3 */   float32_t xaIn, yaIn, xbIn, ybIn, xcIn, ycIn, xdIn, ydIn;   float32_t Xaplusc, Xbplusd, Yaplusc, Ybplusd, Xaminusc, Xbminusd, Yaminusc,   Ybminusd;   float32_t Xb12C_out, Yb12C_out, Xc12C_out, Yc12C_out, Xd12C_out, Yd12C_out;   float32_t Xb12_out, Yb12_out, Xc12_out, Yc12_out, Xd12_out, Yd12_out;   float32_t *ptr1;   float32_t p0,p1,p2,p3,p4,p5;   float32_t a0,a1,a2,a3,a4,a5,a6,a7;   /*  Initializations for the first stage */   n2 = 
fftLen;   n1 = n2;   /* n2 = fftLen/4 */   n2 >>= 2U;   i0 = 0U;   ia1 = 0U;   j = n2;   /*  Calculation of first stage */   do   {      /*  index calculation for the input as, */      /*  pSrc[i0 + 0], pSrc[i0 + fftLen/4], pSrc[i0 + fftLen/2], pSrc[i0 + 3fftLen/4] */      i1 = i0 + n2;      i2 = i1 + n2;      i3 = i2 + n2;      xaIn = pSrc[(2U * i0)];      yaIn = pSrc[(2U * i0) + 1U];      xbIn = pSrc[(2U * i1)];      ybIn = pSrc[(2U * i1) + 1U];      xcIn = pSrc[(2U * i2)];      ycIn = pSrc[(2U * i2) + 1U];      xdIn = pSrc[(2U * i3)];      ydIn = pSrc[(2U * i3) + 1U];      /* xa + xc */      Xaplusc = xaIn + xcIn;      /* xb + xd */      Xbplusd = xbIn + xdIn;      /* ya + yc */      Yaplusc = yaIn + ycIn;      /* yb + yd */      Ybplusd = ybIn + ydIn;      /*  index calculation for the coefficients */      ia2 = ia1 + ia1;      co2 = pCoef[ia2 * 2U];      si2 = pCoef[(ia2 * 2U) + 1U];      /* xa - xc */      Xaminusc = xaIn - xcIn;      /* xb - xd */      Xbminusd = xbIn - xdIn;      /* ya - yc */      Yaminusc = yaIn - ycIn;      /* yb - yd */      Ybminusd = ybIn - ydIn;      /* xa' = xa + xb + xc + xd */      pSrc[(2U * i0)] = Xaplusc + Xbplusd;      /* ya' = ya + yb + yc + yd */      pSrc[(2U * i0) + 1U] = Yaplusc + Ybplusd;      /* (xa - xc) + (yb - yd) */      Xb12C_out = (Xaminusc + Ybminusd);      /* (ya - yc) + (xb - xd) */      Yb12C_out = (Yaminusc - Xbminusd);      /* (xa + xc) - (xb + xd) */      Xc12C_out = (Xaplusc - Xbplusd);      /* (ya + yc) - (yb + yd) */      Yc12C_out = (Yaplusc - Ybplusd);      /* (xa - xc) - (yb - yd) */      Xd12C_out = (Xaminusc - Ybminusd);      /* (ya - yc) + (xb - xd) */      Yd12C_out = (Xbminusd + Yaminusc);      co1 = pCoef[ia1 * 2U];      si1 = pCoef[(ia1 * 2U) + 1U];      /*  index calculation for the coefficients */      ia3 = ia2 + ia1;      co3 = pCoef[ia3 * 2U];      si3 = pCoef[(ia3 * 2U) + 1U];      Xb12_out = Xb12C_out * co1;      Yb12_out = Yb12C_out * co1;      Xc12_out = Xc12C_out * co2;      Yc12_out 
= Yc12C_out * co2;      Xd12_out = Xd12C_out * co3;      Yd12_out = Yd12C_out * co3;      /* xb' = (xa+yb-xc-yd)co1 - (ya-xb-yc+xd)(si1) */      //Xb12_out -= Yb12C_out * si1;      p0 = Yb12C_out * si1;      /* yb' = (ya-xb-yc+xd)co1 + (xa+yb-xc-yd)(si1) */      //Yb12_out += Xb12C_out * si1;      p1 = Xb12C_out * si1;      /* xc' = (xa-xb+xc-xd)co2 - (ya-yb+yc-yd)(si2) */      //Xc12_out -= Yc12C_out * si2;      p2 = Yc12C_out * si2;      /* yc' = (ya-yb+yc-yd)co2 + (xa-xb+xc-xd)(si2) */      //Yc12_out += Xc12C_out * si2;      p3 = Xc12C_out * si2;      /* xd' = (xa-yb-xc+yd)co3 - (ya+xb-yc-xd)(si3) */      //Xd12_out -= Yd12C_out * si3;      p4 = Yd12C_out * si3;      /* yd' = (ya+xb-yc-xd)co3 + (xa-yb-xc+yd)(si3) */      //Yd12_out += Xd12C_out * si3;      p5 = Xd12C_out * si3;      Xb12_out += p0;      Yb12_out -= p1;      Xc12_out += p2;      Yc12_out -= p3;      Xd12_out += p4;      Yd12_out -= p5;      /* xc' = (xa-xb+xc-xd)co2 + (ya-yb+yc-yd)(si2) */      pSrc[2U * i1] = Xc12_out;      /* yc' = (ya-yb+yc-yd)co2 - (xa-xb+xc-xd)(si2) */      pSrc[(2U * i1) + 1U] = Yc12_out;      /* xb' = (xa+yb-xc-yd)co1 + (ya-xb-yc+xd)(si1) */      pSrc[2U * i2] = Xb12_out;      /* yb' = (ya-xb-yc+xd)co1 - (xa+yb-xc-yd)(si1) */      pSrc[(2U * i2) + 1U] = Yb12_out;      /* xd' = (xa-yb-xc+yd)co3 + (ya+xb-yc-xd)(si3) */      pSrc[2U * i3] = Xd12_out;      /* yd' = (ya+xb-yc-xd)co3 - (xa-yb-xc+yd)(si3) */      pSrc[(2U * i3) + 1U] = Yd12_out;      /*  Twiddle coefficients index modifier */      ia1 += twidCoefModifier;      /*  Updating input index */      i0++;   }   while (--j);   twidCoefModifier <<= 2U;   /*  Calculation of second stage to excluding last stage */   for (k = fftLen >> 2U; k > 4U; k >>= 2U)   {      /*  Initializations for the first stage */      n1 = n2;      n2 >>= 2U;      ia1 = 0U;      /*  Calculation of first stage */      j = 0;      do      {         /*  index calculation for the coefficients */         ia2 = ia1 + ia1;         ia3 = ia2 + ia1;      
   co1 = pCoef[ia1 * 2U];         si1 = pCoef[(ia1 * 2U) + 1U];         co2 = pCoef[ia2 * 2U];         si2 = pCoef[(ia2 * 2U) + 1U];         co3 = pCoef[ia3 * 2U];         si3 = pCoef[(ia3 * 2U) + 1U];         /*  Twiddle coefficients index modifier */         ia1 += twidCoefModifier;         i0 = j;         do         {            /*  index calculation for the input as, */            /*  pSrc[i0 + 0], pSrc[i0 + fftLen/4], pSrc[i0 + fftLen/2], pSrc[i0 + 3fftLen/4] */            i1 = i0 + n2;            i2 = i1 + n2;            i3 = i2 + n2;            xaIn = pSrc[(2U * i0)];            yaIn = pSrc[(2U * i0) + 1U];            xbIn = pSrc[(2U * i1)];            ybIn = pSrc[(2U * i1) + 1U];            xcIn = pSrc[(2U * i2)];            ycIn = pSrc[(2U * i2) + 1U];            xdIn = pSrc[(2U * i3)];            ydIn = pSrc[(2U * i3) + 1U];            /* xa - xc */            Xaminusc = xaIn - xcIn;            /* (xb - xd) */            Xbminusd = xbIn - xdIn;            /* ya - yc */            Yaminusc = yaIn - ycIn;            /* (yb - yd) */            Ybminusd = ybIn - ydIn;            /* xa + xc */            Xaplusc = xaIn + xcIn;            /* xb + xd */            Xbplusd = xbIn + xdIn;            /* ya + yc */            Yaplusc = yaIn + ycIn;            /* yb + yd */            Ybplusd = ybIn + ydIn;            /* (xa - xc) + (yb - yd) */            Xb12C_out = (Xaminusc + Ybminusd);            /* (ya - yc) -  (xb - xd) */            Yb12C_out = (Yaminusc - Xbminusd);            /* xa + xc -(xb + xd) */            Xc12C_out = (Xaplusc - Xbplusd);            /* (ya + yc) - (yb + yd) */            Yc12C_out = (Yaplusc - Ybplusd);            /* (xa - xc) - (yb - yd) */            Xd12C_out = (Xaminusc - Ybminusd);            /* (ya - yc) +  (xb - xd) */            Yd12C_out = (Xbminusd + Yaminusc);            pSrc[(2U * i0)] = Xaplusc + Xbplusd;            pSrc[(2U * i0) + 1U] = Yaplusc + Ybplusd;            Xb12_out = Xb12C_out * co1;            Yb12_out = 
Yb12C_out * co1;            Xc12_out = Xc12C_out * co2;            Yc12_out = Yc12C_out * co2;            Xd12_out = Xd12C_out * co3;            Yd12_out = Yd12C_out * co3;            /* xb' = (xa+yb-xc-yd)co1 - (ya-xb-yc+xd)(si1) */            //Xb12_out -= Yb12C_out * si1;            p0 = Yb12C_out * si1;            /* yb' = (ya-xb-yc+xd)co1 + (xa+yb-xc-yd)(si1) */            //Yb12_out += Xb12C_out * si1;            p1 = Xb12C_out * si1;            /* xc' = (xa-xb+xc-xd)co2 - (ya-yb+yc-yd)(si2) */            //Xc12_out -= Yc12C_out * si2;            p2 = Yc12C_out * si2;            /* yc' = (ya-yb+yc-yd)co2 + (xa-xb+xc-xd)(si2) */            //Yc12_out += Xc12C_out * si2;            p3 = Xc12C_out * si2;            /* xd' = (xa-yb-xc+yd)co3 - (ya+xb-yc-xd)(si3) */            //Xd12_out -= Yd12C_out * si3;            p4 = Yd12C_out * si3;            /* yd' = (ya+xb-yc-xd)co3 + (xa-yb-xc+yd)(si3) */            //Yd12_out += Xd12C_out * si3;            p5 = Xd12C_out * si3;            Xb12_out += p0;            Yb12_out -= p1;            Xc12_out += p2;            Yc12_out -= p3;            Xd12_out += p4;            Yd12_out -= p5;            /* xc' = (xa-xb+xc-xd)co2 + (ya-yb+yc-yd)(si2) */            pSrc[2U * i1] = Xc12_out;            /* yc' = (ya-yb+yc-yd)co2 - (xa-xb+xc-xd)(si2) */            pSrc[(2U * i1) + 1U] = Yc12_out;            /* xb' = (xa+yb-xc-yd)co1 + (ya-xb-yc+xd)(si1) */            pSrc[2U * i2] = Xb12_out;            /* yb' = (ya-xb-yc+xd)co1 - (xa+yb-xc-yd)(si1) */            pSrc[(2U * i2) + 1U] = Yb12_out;            /* xd' = (xa-yb-xc+yd)co3 + (ya+xb-yc-xd)(si3) */            pSrc[2U * i3] = Xd12_out;            /* yd' = (ya+xb-yc-xd)co3 - (xa-yb-xc+yd)(si3) */            pSrc[(2U * i3) + 1U] = Yd12_out;            i0 += n1;         } while (i0 < fftLen);         j++;      } while (j <= (n2 - 1U));      twidCoefModifier <<= 2U;   }   j = fftLen >> 2;   ptr1 = &pSrc[0];   /*  Calculations of last stage */   do   {      xaIn = ptr1[0];      
yaIn = ptr1[1];      xbIn = ptr1[2];      ybIn = ptr1[3];      xcIn = ptr1[4];      ycIn = ptr1[5];      xdIn = ptr1[6];      ydIn = ptr1[7];      /* xa + xc */      Xaplusc = xaIn + xcIn;      /* xa - xc */      Xaminusc = xaIn - xcIn;      /* ya + yc */      Yaplusc = yaIn + ycIn;      /* ya - yc */      Yaminusc = yaIn - ycIn;      /* xb + xd */      Xbplusd = xbIn + xdIn;      /* yb + yd */      Ybplusd = ybIn + ydIn;      /* (xb-xd) */      Xbminusd = xbIn - xdIn;      /* (yb-yd) */      Ybminusd = ybIn - ydIn;      /* xa' = xa + xb + xc + xd */      a0 = (Xaplusc + Xbplusd);      /* ya' = ya + yb + yc + yd */      a1 = (Yaplusc + Ybplusd);      /* xc' = (xa-xb+xc-xd) */      a2 = (Xaplusc - Xbplusd);      /* yc' = (ya-yb+yc-yd) */      a3 = (Yaplusc - Ybplusd);      /* xb' = (xa+yb-xc-yd) */      a4 = (Xaminusc + Ybminusd);      /* yb' = (ya-xb-yc+xd) */      a5 = (Yaminusc - Xbminusd);      /* xd' = (xa-yb-xc+yd)) */      a6 = (Xaminusc - Ybminusd);      /* yd' = (ya+xb-yc-xd) */      a7 = (Xbminusd + Yaminusc);      ptr1[0] = a0;      ptr1[1] = a1;      ptr1[2] = a2;      ptr1[3] = a3;      ptr1[4] = a4;      ptr1[5] = a5;      ptr1[6] = a6;      ptr1[7] = a7;      /* increment pointer by 8 */      ptr1 += 8U;   } while (--j);#else   float32_t t1, t2, r1, r2, s1, s2;   /* Run the below code for Cortex-M0 */   /*  Initializations for the fft calculation */   n2 = fftLen;   n1 = n2;   for (k = fftLen; k > 1U; k >>= 2U)   {      /*  Initializations for the fft calculation */      n1 = n2;      n2 >>= 2U;      ia1 = 0U;      /*  FFT Calculation */      j = 0;      do      {         /*  index calculation for the coefficients */         ia2 = ia1 + ia1;         ia3 = ia2 + ia1;         co1 = pCoef[ia1 * 2U];         si1 = pCoef[(ia1 * 2U) + 1U];         co2 = pCoef[ia2 * 2U];         si2 = pCoef[(ia2 * 2U) + 1U];         co3 = pCoef[ia3 * 2U];         si3 = pCoef[(ia3 * 2U) + 1U];         /*  Twiddle coefficients index modifier */         ia1 = ia1 + 
twidCoefModifier;         i0 = j;         do         {            /*  index calculation for the input as, */            /*  pSrc[i0 + 0], pSrc[i0 + fftLen/4], pSrc[i0 + fftLen/2], pSrc[i0 + 3fftLen/4] */            i1 = i0 + n2;            i2 = i1 + n2;            i3 = i2 + n2;            /* xa + xc */            r1 = pSrc[(2U * i0)] + pSrc[(2U * i2)];            /* xa - xc */            r2 = pSrc[(2U * i0)] - pSrc[(2U * i2)];            /* ya + yc */            s1 = pSrc[(2U * i0) + 1U] + pSrc[(2U * i2) + 1U];            /* ya - yc */            s2 = pSrc[(2U * i0) + 1U] - pSrc[(2U * i2) + 1U];            /* xb + xd */            t1 = pSrc[2U * i1] + pSrc[2U * i3];            /* xa' = xa + xb + xc + xd */            pSrc[2U * i0] = r1 + t1;            /* xa + xc -(xb + xd) */            r1 = r1 - t1;            /* yb + yd */            t2 = pSrc[(2U * i1) + 1U] + pSrc[(2U * i3) + 1U];            /* ya' = ya + yb + yc + yd */            pSrc[(2U * i0) + 1U] = s1 + t2;            /* (ya + yc) - (yb + yd) */            s1 = s1 - t2;            /* (yb - yd) */            t1 = pSrc[(2U * i1) + 1U] - pSrc[(2U * i3) + 1U];            /* (xb - xd) */            t2 = pSrc[2U * i1] - pSrc[2U * i3];            /* xc' = (xa-xb+xc-xd)co2 + (ya-yb+yc-yd)(si2) */            pSrc[2U * i1] = (r1 * co2) + (s1 * si2);            /* yc' = (ya-yb+yc-yd)co2 - (xa-xb+xc-xd)(si2) */            pSrc[(2U * i1) + 1U] = (s1 * co2) - (r1 * si2);            /* (xa - xc) + (yb - yd) */            r1 = r2 + t1;            /* (xa - xc) - (yb - yd) */            r2 = r2 - t1;            /* (ya - yc) -  (xb - xd) */            s1 = s2 - t2;            /* (ya - yc) +  (xb - xd) */            s2 = s2 + t2;            /* xb' = (xa+yb-xc-yd)co1 + (ya-xb-yc+xd)(si1) */            pSrc[2U * i2] = (r1 * co1) + (s1 * si1);            /* yb' = (ya-xb-yc+xd)co1 - (xa+yb-xc-yd)(si1) */            pSrc[(2U * i2) + 1U] = (s1 * co1) - (r1 * si1);            /* xd' = (xa-yb-xc+yd)co3 + (ya+xb-yc-xd)(si3) */       
     pSrc[2U * i3] = (r2 * co3) + (s2 * si3);            /* yd' = (ya+xb-yc-xd)co3 - (xa-yb-xc+yd)(si3) */            pSrc[(2U * i3) + 1U] = (s2 * co3) - (r2 * si3);            i0 += n1;         } while ( i0 < fftLen);         j++;      } while (j <= (n2 - 1U));      twidCoefModifier <<= 2U;   }#endif /* #if defined (ARM_MATH_DSP) */}/** @brief  Core function for the floating-point CIFFT butterfly process.* @param[in, out] *pSrc            points to the in-place buffer of floating-point data type.* @param[in]      fftLen           length of the FFT.* @param[in]      *pCoef           points to twiddle coefficient buffer.* @param[in]      twidCoefModifier twiddle coefficient modifier that supports different size FFTs with the same twiddle factor table.* @param[in]      onebyfftLen      value of 1/fftLen.* @return none.*/void arm_radix4_butterfly_inverse_f32(float32_t * pSrc,uint16_t fftLen,float32_t * pCoef,uint16_t twidCoefModifier,float32_t onebyfftLen){   float32_t co1, co2, co3, si1, si2, si3;   uint32_t ia1, ia2, ia3;   uint32_t i0, i1, i2, i3;   uint32_t n1, n2, j, k;#if defined (ARM_MATH_DSP)   float32_t xaIn, yaIn, xbIn, ybIn, xcIn, ycIn, xdIn, ydIn;   float32_t Xaplusc, Xbplusd, Yaplusc, Ybplusd, Xaminusc, Xbminusd, Yaminusc,   Ybminusd;   float32_t Xb12C_out, Yb12C_out, Xc12C_out, Yc12C_out, Xd12C_out, Yd12C_out;   float32_t Xb12_out, Yb12_out, Xc12_out, Yc12_out, Xd12_out, Yd12_out;   float32_t *ptr1;   float32_t p0,p1,p2,p3,p4,p5,p6,p7;   float32_t a0,a1,a2,a3,a4,a5,a6,a7;   /*  Initializations for the first stage */   n2 = fftLen;   n1 = n2;   /* n2 = fftLen/4 */   n2 >>= 2U;   i0 = 0U;   ia1 = 0U;   j = n2;   /*  Calculation of first stage */   do   {      /*  index calculation for the input as, */      /*  pSrc[i0 + 0], pSrc[i0 + fftLen/4], pSrc[i0 + fftLen/2], pSrc[i0 + 3fftLen/4] */      i1 = i0 + n2;      i2 = i1 + n2;      i3 = i2 + n2;      /*  Butterfly implementation */      xaIn = pSrc[(2U * i0)];      yaIn = pSrc[(2U * i0) + 1U];      xcIn = 
pSrc[(2U * i2)];      ycIn = pSrc[(2U * i2) + 1U];      xbIn = pSrc[(2U * i1)];      ybIn = pSrc[(2U * i1) + 1U];      xdIn = pSrc[(2U * i3)];      ydIn = pSrc[(2U * i3) + 1U];      /* xa + xc */      Xaplusc = xaIn + xcIn;      /* xb + xd */      Xbplusd = xbIn + xdIn;      /* ya + yc */      Yaplusc = yaIn + ycIn;      /* yb + yd */      Ybplusd = ybIn + ydIn;      /*  index calculation for the coefficients */      ia2 = ia1 + ia1;      co2 = pCoef[ia2 * 2U];      si2 = pCoef[(ia2 * 2U) + 1U];      /* xa - xc */      Xaminusc = xaIn - xcIn;      /* xb - xd */      Xbminusd = xbIn - xdIn;      /* ya - yc */      Yaminusc = yaIn - ycIn;      /* yb - yd */      Ybminusd = ybIn - ydIn;      /* xa' = xa + xb + xc + xd */      pSrc[(2U * i0)] = Xaplusc + Xbplusd;      /* ya' = ya + yb + yc + yd */      pSrc[(2U * i0) + 1U] = Yaplusc + Ybplusd;      /* (xa - xc) - (yb - yd) */      Xb12C_out = (Xaminusc - Ybminusd);      /* (ya - yc) + (xb - xd) */      Yb12C_out = (Yaminusc + Xbminusd);      /* (xa + xc) - (xb + xd) */      Xc12C_out = (Xaplusc - Xbplusd);      /* (ya + yc) - (yb + yd) */      Yc12C_out = (Yaplusc - Ybplusd);      /* (xa - xc) + (yb - yd) */      Xd12C_out = (Xaminusc + Ybminusd);      /* (ya - yc) - (xb - xd) */      Yd12C_out = (Yaminusc - Xbminusd);      co1 = pCoef[ia1 * 2U];      si1 = pCoef[(ia1 * 2U) + 1U];      /*  index calculation for the coefficients */      ia3 = ia2 + ia1;      co3 = pCoef[ia3 * 2U];      si3 = pCoef[(ia3 * 2U) + 1U];      Xb12_out = Xb12C_out * co1;      Yb12_out = Yb12C_out * co1;      Xc12_out = Xc12C_out * co2;      Yc12_out = Yc12C_out * co2;      Xd12_out = Xd12C_out * co3;      Yd12_out = Yd12C_out * co3;      /* xb' = (xa+yb-xc-yd)co1 - (ya-xb-yc+xd)(si1) */      //Xb12_out -= Yb12C_out * si1;      p0 = Yb12C_out * si1;      /* yb' = (ya-xb-yc+xd)co1 + (xa+yb-xc-yd)(si1) */      //Yb12_out += Xb12C_out * si1;      p1 = Xb12C_out * si1;      /* xc' = (xa-xb+xc-xd)co2 - (ya-yb+yc-yd)(si2) */      //Xc12_out -= 
Yc12C_out * si2;      p2 = Yc12C_out * si2;      /* yc' = (ya-yb+yc-yd)co2 + (xa-xb+xc-xd)(si2) */      //Yc12_out += Xc12C_out * si2;      p3 = Xc12C_out * si2;      /* xd' = (xa-yb-xc+yd)co3 - (ya+xb-yc-xd)(si3) */      //Xd12_out -= Yd12C_out * si3;      p4 = Yd12C_out * si3;      /* yd' = (ya+xb-yc-xd)co3 + (xa-yb-xc+yd)(si3) */      //Yd12_out += Xd12C_out * si3;      p5 = Xd12C_out * si3;      Xb12_out -= p0;      Yb12_out += p1;      Xc12_out -= p2;      Yc12_out += p3;      Xd12_out -= p4;      Yd12_out += p5;      /* xc' = (xa-xb+xc-xd)co2 - (ya-yb+yc-yd)(si2) */      pSrc[2U * i1] = Xc12_out;      /* yc' = (ya-yb+yc-yd)co2 + (xa-xb+xc-xd)(si2) */      pSrc[(2U * i1) + 1U] = Yc12_out;      /* xb' = (xa+yb-xc-yd)co1 - (ya-xb-yc+xd)(si1) */      pSrc[2U * i2] = Xb12_out;      /* yb' = (ya-xb-yc+xd)co1 + (xa+yb-xc-yd)(si1) */      pSrc[(2U * i2) + 1U] = Yb12_out;      /* xd' = (xa-yb-xc+yd)co3 - (ya+xb-yc-xd)(si3) */      pSrc[2U * i3] = Xd12_out;      /* yd' = (ya+xb-yc-xd)co3 + (xa-yb-xc+yd)(si3) */      pSrc[(2U * i3) + 1U] = Yd12_out;      /*  Twiddle coefficients index modifier */      ia1 = ia1 + twidCoefModifier;      /*  Updating input index */      i0 = i0 + 1U;   } while (--j);   twidCoefModifier <<= 2U;   /*  Calculation of second stage to excluding last stage */   for (k = fftLen >> 2U; k > 4U; k >>= 2U)   {      /*  Initializations for the first stage */      n1 = n2;      n2 >>= 2U;      ia1 = 0U;      /*  Calculation of first stage */      j = 0;      do      {         /*  index calculation for the coefficients */         ia2 = ia1 + ia1;         ia3 = ia2 + ia1;         co1 = pCoef[ia1 * 2U];         si1 = pCoef[(ia1 * 2U) + 1U];         co2 = pCoef[ia2 * 2U];         si2 = pCoef[(ia2 * 2U) + 1U];         co3 = pCoef[ia3 * 2U];         si3 = pCoef[(ia3 * 2U) + 1U];         /*  Twiddle coefficients index modifier */         ia1 = ia1 + twidCoefModifier;         i0 = j;         do         {            /*  index calculation for the input as, */   
         /*  pSrc[i0 + 0], pSrc[i0 + fftLen/4], pSrc[i0 + fftLen/2], pSrc[i0 + 3fftLen/4] */            i1 = i0 + n2;            i2 = i1 + n2;            i3 = i2 + n2;            xaIn = pSrc[(2U * i0)];            yaIn = pSrc[(2U * i0) + 1U];            xbIn = pSrc[(2U * i1)];            ybIn = pSrc[(2U * i1) + 1U];            xcIn = pSrc[(2U * i2)];            ycIn = pSrc[(2U * i2) + 1U];            xdIn = pSrc[(2U * i3)];            ydIn = pSrc[(2U * i3) + 1U];            /* xa - xc */            Xaminusc = xaIn - xcIn;            /* (xb - xd) */            Xbminusd = xbIn - xdIn;            /* ya - yc */            Yaminusc = yaIn - ycIn;            /* (yb - yd) */            Ybminusd = ybIn - ydIn;            /* xa + xc */            Xaplusc = xaIn + xcIn;            /* xb + xd */            Xbplusd = xbIn + xdIn;            /* ya + yc */            Yaplusc = yaIn + ycIn;            /* yb + yd */            Ybplusd = ybIn + ydIn;            /* (xa - xc) - (yb - yd) */            Xb12C_out = (Xaminusc - Ybminusd);            /* (ya - yc) +  (xb - xd) */            Yb12C_out = (Yaminusc + Xbminusd);            /* xa + xc -(xb + xd) */            Xc12C_out = (Xaplusc - Xbplusd);            /* (ya + yc) - (yb + yd) */            Yc12C_out = (Yaplusc - Ybplusd);            /* (xa - xc) + (yb - yd) */            Xd12C_out = (Xaminusc + Ybminusd);            /* (ya - yc) -  (xb - xd) */            Yd12C_out = (Yaminusc - Xbminusd);            pSrc[(2U * i0)] = Xaplusc + Xbplusd;            pSrc[(2U * i0) + 1U] = Yaplusc + Ybplusd;            Xb12_out = Xb12C_out * co1;            Yb12_out = Yb12C_out * co1;            Xc12_out = Xc12C_out * co2;            Yc12_out = Yc12C_out * co2;            Xd12_out = Xd12C_out * co3;            Yd12_out = Yd12C_out * co3;            /* xb' = (xa+yb-xc-yd)co1 - (ya-xb-yc+xd)(si1) */            //Xb12_out -= Yb12C_out * si1;            p0 = Yb12C_out * si1;            /* yb' = (ya-xb-yc+xd)co1 + (xa+yb-xc-yd)(si1) */            
//Yb12_out += Xb12C_out * si1;            p1 = Xb12C_out * si1;            /* xc' = (xa-xb+xc-xd)co2 - (ya-yb+yc-yd)(si2) */            //Xc12_out -= Yc12C_out * si2;            p2 = Yc12C_out * si2;            /* yc' = (ya-yb+yc-yd)co2 + (xa-xb+xc-xd)(si2) */            //Yc12_out += Xc12C_out * si2;            p3 = Xc12C_out * si2;            /* xd' = (xa-yb-xc+yd)co3 - (ya+xb-yc-xd)(si3) */            //Xd12_out -= Yd12C_out * si3;            p4 = Yd12C_out * si3;            /* yd' = (ya+xb-yc-xd)co3 + (xa-yb-xc+yd)(si3) */            //Yd12_out += Xd12C_out * si3;            p5 = Xd12C_out * si3;            Xb12_out -= p0;            Yb12_out += p1;            Xc12_out -= p2;            Yc12_out += p3;            Xd12_out -= p4;            Yd12_out += p5;            /* xc' = (xa-xb+xc-xd)co2 - (ya-yb+yc-yd)(si2) */            pSrc[2U * i1] = Xc12_out;            /* yc' = (ya-yb+yc-yd)co2 + (xa-xb+xc-xd)(si2) */            pSrc[(2U * i1) + 1U] = Yc12_out;            /* xb' = (xa+yb-xc-yd)co1 - (ya-xb-yc+xd)(si1) */            pSrc[2U * i2] = Xb12_out;            /* yb' = (ya-xb-yc+xd)co1 + (xa+yb-xc-yd)(si1) */            pSrc[(2U * i2) + 1U] = Yb12_out;            /* xd' = (xa-yb-xc+yd)co3 - (ya+xb-yc-xd)(si3) */            pSrc[2U * i3] = Xd12_out;            /* yd' = (ya+xb-yc-xd)co3 + (xa-yb-xc+yd)(si3) */            pSrc[(2U * i3) + 1U] = Yd12_out;            i0 += n1;         } while (i0 < fftLen);         j++;      } while (j <= (n2 - 1U));      twidCoefModifier <<= 2U;   }   /*  Initializations of last stage */   j = fftLen >> 2;   ptr1 = &pSrc[0];   /*  Calculations of last stage */   do   {      xaIn = ptr1[0];      yaIn = ptr1[1];      xbIn = ptr1[2];      ybIn = ptr1[3];      xcIn = ptr1[4];      ycIn = ptr1[5];      xdIn = ptr1[6];      ydIn = ptr1[7];      /*  Butterfly implementation */      /* xa + xc */      Xaplusc = xaIn + xcIn;      /* xa - xc */      Xaminusc = xaIn - xcIn;      /* ya + yc */      Yaplusc = yaIn + ycIn;      /* ya - yc */    
  Yaminusc = yaIn - ycIn;      /* xb + xd */      Xbplusd = xbIn + xdIn;      /* yb + yd */      Ybplusd = ybIn + ydIn;      /* (xb-xd) */      Xbminusd = xbIn - xdIn;      /* (yb-yd) */      Ybminusd = ybIn - ydIn;      /* xa' = (xa+xb+xc+xd) * onebyfftLen */      a0 = (Xaplusc + Xbplusd);      /* ya' = (ya+yb+yc+yd) * onebyfftLen */      a1 = (Yaplusc + Ybplusd);      /* xc' = (xa-xb+xc-xd) * onebyfftLen */      a2 = (Xaplusc - Xbplusd);      /* yc' = (ya-yb+yc-yd) * onebyfftLen  */      a3 = (Yaplusc - Ybplusd);      /* xb' = (xa-yb-xc+yd) * onebyfftLen */      a4 = (Xaminusc - Ybminusd);      /* yb' = (ya+xb-yc-xd) * onebyfftLen */      a5 = (Yaminusc + Xbminusd);      /* xd' = (xa-yb-xc+yd) * onebyfftLen */      a6 = (Xaminusc + Ybminusd);      /* yd' = (ya-xb-yc+xd) * onebyfftLen */      a7 = (Yaminusc - Xbminusd);      p0 = a0 * onebyfftLen;      p1 = a1 * onebyfftLen;      p2 = a2 * onebyfftLen;      p3 = a3 * onebyfftLen;      p4 = a4 * onebyfftLen;      p5 = a5 * onebyfftLen;      p6 = a6 * onebyfftLen;      p7 = a7 * onebyfftLen;      /* xa' = (xa+xb+xc+xd) * onebyfftLen */      ptr1[0] = p0;      /* ya' = (ya+yb+yc+yd) * onebyfftLen */      ptr1[1] = p1;      /* xc' = (xa-xb+xc-xd) * onebyfftLen */      ptr1[2] = p2;      /* yc' = (ya-yb+yc-yd) * onebyfftLen  */      ptr1[3] = p3;      /* xb' = (xa-yb-xc+yd) * onebyfftLen */      ptr1[4] = p4;      /* yb' = (ya+xb-yc-xd) * onebyfftLen */      ptr1[5] = p5;      /* xd' = (xa-yb-xc+yd) * onebyfftLen */      ptr1[6] = p6;      /* yd' = (ya-xb-yc+xd) * onebyfftLen */      ptr1[7] = p7;      /* increment source pointer by 8 for next calculations */      ptr1 = ptr1 + 8U;   } while (--j);#else   float32_t t1, t2, r1, r2, s1, s2;   /* Run the below code for Cortex-M0 */   /*  Initializations for the first stage */   n2 = fftLen;   n1 = n2;   /*  Calculation of first stage */   for (k = fftLen; k > 4U; k >>= 2U)   {      /*  Initializations for the first stage */      n1 = n2;      n2 >>= 2U;      ia1 = 0U;     
 /*  Calculation of first stage */      j = 0;      do      {         /*  index calculation for the coefficients */         ia2 = ia1 + ia1;         ia3 = ia2 + ia1;         co1 = pCoef[ia1 * 2U];         si1 = pCoef[(ia1 * 2U) + 1U];         co2 = pCoef[ia2 * 2U];         si2 = pCoef[(ia2 * 2U) + 1U];         co3 = pCoef[ia3 * 2U];         si3 = pCoef[(ia3 * 2U) + 1U];         /*  Twiddle coefficients index modifier */         ia1 = ia1 + twidCoefModifier;         i0 = j;         do         {            /*  index calculation for the input as, */            /*  pSrc[i0 + 0], pSrc[i0 + fftLen/4], pSrc[i0 + fftLen/2], pSrc[i0 + 3fftLen/4] */            i1 = i0 + n2;            i2 = i1 + n2;            i3 = i2 + n2;            /* xa + xc */            r1 = pSrc[(2U * i0)] + pSrc[(2U * i2)];            /* xa - xc */            r2 = pSrc[(2U * i0)] - pSrc[(2U * i2)];            /* ya + yc */            s1 = pSrc[(2U * i0) + 1U] + pSrc[(2U * i2) + 1U];            /* ya - yc */            s2 = pSrc[(2U * i0) + 1U] - pSrc[(2U * i2) + 1U];            /* xb + xd */            t1 = pSrc[2U * i1] + pSrc[2U * i3];            /* xa' = xa + xb + xc + xd */            pSrc[2U * i0] = r1 + t1;            /* xa + xc -(xb + xd) */            r1 = r1 - t1;            /* yb + yd */            t2 = pSrc[(2U * i1) + 1U] + pSrc[(2U * i3) + 1U];            /* ya' = ya + yb + yc + yd */            pSrc[(2U * i0) + 1U] = s1 + t2;            /* (ya + yc) - (yb + yd) */            s1 = s1 - t2;            /* (yb - yd) */            t1 = pSrc[(2U * i1) + 1U] - pSrc[(2U * i3) + 1U];            /* (xb - xd) */            t2 = pSrc[2U * i1] - pSrc[2U * i3];            /* xc' = (xa-xb+xc-xd)co2 - (ya-yb+yc-yd)(si2) */            pSrc[2U * i1] = (r1 * co2) - (s1 * si2);            /* yc' = (ya-yb+yc-yd)co2 + (xa-xb+xc-xd)(si2) */            pSrc[(2U * i1) + 1U] = (s1 * co2) + (r1 * si2);            /* (xa - xc) - (yb - yd) */            r1 = r2 - t1;            /* (xa - xc) + (yb - yd) */            
r2 = r2 + t1;            /* (ya - yc) +  (xb - xd) */            s1 = s2 + t2;            /* (ya - yc) -  (xb - xd) */            s2 = s2 - t2;            /* xb' = (xa+yb-xc-yd)co1 - (ya-xb-yc+xd)(si1) */            pSrc[2U * i2] = (r1 * co1) - (s1 * si1);            /* yb' = (ya-xb-yc+xd)co1 + (xa+yb-xc-yd)(si1) */            pSrc[(2U * i2) + 1U] = (s1 * co1) + (r1 * si1);            /* xd' = (xa-yb-xc+yd)co3 - (ya+xb-yc-xd)(si3) */            pSrc[2U * i3] = (r2 * co3) - (s2 * si3);            /* yd' = (ya+xb-yc-xd)co3 + (xa-yb-xc+yd)(si3) */            pSrc[(2U * i3) + 1U] = (s2 * co3) + (r2 * si3);            i0 += n1;         } while ( i0 < fftLen);         j++;      } while (j <= (n2 - 1U));      twidCoefModifier <<= 2U;   }   /*  Initializations of last stage */   n1 = n2;   n2 >>= 2U;   /*  Calculations of last stage */   for (i0 = 0U; i0 <= (fftLen - n1); i0 += n1)   {      /*  index calculation for the input as, */      /*  pSrc[i0 + 0], pSrc[i0 + fftLen/4], pSrc[i0 + fftLen/2], pSrc[i0 + 3fftLen/4] */      i1 = i0 + n2;      i2 = i1 + n2;      i3 = i2 + n2;      /*  Butterfly implementation */      /* xa + xc */      r1 = pSrc[2U * i0] + pSrc[2U * i2];      /* xa - xc */      r2 = pSrc[2U * i0] - pSrc[2U * i2];      /* ya + yc */      s1 = pSrc[(2U * i0) + 1U] + pSrc[(2U * i2) + 1U];      /* ya - yc */      s2 = pSrc[(2U * i0) + 1U] - pSrc[(2U * i2) + 1U];      /* xc + xd */      t1 = pSrc[2U * i1] + pSrc[2U * i3];      /* xa' = xa + xb + xc + xd */      pSrc[2U * i0] = (r1 + t1) * onebyfftLen;      /* (xa + xb) - (xc + xd) */      r1 = r1 - t1;      /* yb + yd */      t2 = pSrc[(2U * i1) + 1U] + pSrc[(2U * i3) + 1U];      /* ya' = ya + yb + yc + yd */      pSrc[(2U * i0) + 1U] = (s1 + t2) * onebyfftLen;      /* (ya + yc) - (yb + yd) */      s1 = s1 - t2;      /* (yb-yd) */      t1 = pSrc[(2U * i1) + 1U] - pSrc[(2U * i3) + 1U];      /* (xb-xd) */      t2 = pSrc[2U * i1] - pSrc[2U * i3];      /* xc' = (xa-xb+xc-xd)co2 - (ya-yb+yc-yd)(si2) */      pSrc[2U 
* i1] = r1 * onebyfftLen;      /* yc' = (ya-yb+yc-yd)co2 + (xa-xb+xc-xd)(si2) */      pSrc[(2U * i1) + 1U] = s1 * onebyfftLen;      /* (xa - xc) - (yb-yd) */      r1 = r2 - t1;      /* (xa - xc) + (yb-yd) */      r2 = r2 + t1;      /* (ya - yc) + (xb-xd) */      s1 = s2 + t2;      /* (ya - yc) - (xb-xd) */      s2 = s2 - t2;      /* xb' = (xa+yb-xc-yd)co1 - (ya-xb-yc+xd)(si1) */      pSrc[2U * i2] = r1 * onebyfftLen;      /* yb' = (ya-xb-yc+xd)co1 + (xa+yb-xc-yd)(si1) */      pSrc[(2U * i2) + 1U] = s1 * onebyfftLen;      /* xd' = (xa-yb-xc+yd)co3 - (ya+xb-yc-xd)(si3) */      pSrc[2U * i3] = r2 * onebyfftLen;      /* yd' = (ya+xb-yc-xd)co3 + (xa-yb-xc+yd)(si3) */      pSrc[(2U * i3) + 1U] = s2 * onebyfftLen;   }#endif /* #if defined (ARM_MATH_DSP) */}
 |