12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209 |
- /* ----------------------------------------------------------------------
- * Project: CMSIS DSP Library
- * Title: arm_cfft_radix4_f32.c
- * Description: Radix-4 Decimation in Frequency CFFT & CIFFT Floating point processing function
- *
- * $Date: 27. January 2017
- * $Revision: V.1.5.1
- *
- * Target Processor: Cortex-M cores
- * -------------------------------------------------------------------- */
- /*
- * Copyright (C) 2010-2017 ARM Limited or its affiliates. All rights reserved.
- *
- * SPDX-License-Identifier: Apache-2.0
- *
- * Licensed under the Apache License, Version 2.0 (the License); you may
- * not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- * www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an AS IS BASIS, WITHOUT
- * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
- #include "arm_math.h"
- /* Reordering routine called by arm_cfft_radix4_f32; declared extern, its definition is not part of this file as shown. */
- extern void arm_bitreversal_f32(float32_t * pSrc, uint16_t fftSize, uint16_t bitRevFactor, uint16_t * pBitRevTab);
- /* Forward radix-4 butterfly core, defined further down in this file. */
- void arm_radix4_butterfly_f32(float32_t * pSrc, uint16_t fftLen, float32_t * pCoef, uint16_t twidCoefModifier);
- /* Inverse radix-4 butterfly core (also scales by onebyfftLen), defined further down in this file. */
- void arm_radix4_butterfly_inverse_f32(float32_t * pSrc, uint16_t fftLen, float32_t * pCoef, uint16_t twidCoefModifier, float32_t onebyfftLen);
- /**
- * @ingroup groupTransforms
- */
- /**
- * @addtogroup ComplexFFT
- * @{
- */
- /**
- * @brief Processing function for the floating-point Radix-4 CFFT/CIFFT.
- * @details Runs the inverse butterfly routine when the instance's ifftFlag equals 1 and the
- * forward butterfly routine otherwise, in place on pSrc. Afterwards the buffer is passed to
- * arm_bitreversal_f32 when the instance's bitReverseFlag equals 1.
- * @deprecated Do not use this function. It has been superseded by \ref arm_cfft_f32 and will be removed
- * in the future.
- * @param[in] *S points to an instance of the floating-point Radix-4 CFFT/CIFFT structure.
- * @param[in, out] *pSrc points to the complex data buffer of size <code>2*fftLen</code>. Processing occurs in-place.
- * @return none.
- */
- void arm_cfft_radix4_f32(
-   const arm_cfft_radix4_instance_f32 * S,
-   float32_t * pSrc)
- {
-   if (S->ifftFlag != 1U)
-   {
-     /* Forward transform: complex FFT radix-4 */
-     arm_radix4_butterfly_f32(pSrc, S->fftLen, S->pTwiddle, S->twidCoefModifier);
-   }
-   else
-   {
-     /* Inverse transform: complex IFFT radix-4, scaled by 1/fftLen */
-     arm_radix4_butterfly_inverse_f32(pSrc, S->fftLen, S->pTwiddle, S->twidCoefModifier, S->onebyfftLen);
-   }
-   /* Nothing more to do unless bit reversal was requested */
-   if (S->bitReverseFlag != 1U)
-   {
-     return;
-   }
-   arm_bitreversal_f32(pSrc, S->fftLen, S->bitRevFactor, S->pBitRevTable);
- }
- /**
- * @} end of ComplexFFT group
- */
- /* ----------------------------------------------------------------------
- * Internal helper functions used by the FFTs
- * ---------------------------------------------------------------------- */
- /*
- * @brief Core function for the floating-point CFFT butterfly process.
- * @details Runs every radix-4 decimation-in-frequency stage of the forward transform in place.
- * pSrc is indexed as (x, y) pairs: element 2*i holds the x part and element 2*i+1 the y part
- * of point i. pCoef is indexed the same way as (co, si) pairs. Each butterfly reads four
- * points a, b, c, d that are n2 points apart and writes its results back to the same four
- * positions, with the c result stored at position i1 and the b result at position i2.
- * The output is not reordered here; arm_cfft_radix4_f32 calls arm_bitreversal_f32 afterwards
- * when its bitReverseFlag is set.
- * NOTE(review): the loops appear to assume that fftLen is a power of 4. The ARM_MATH_DSP path
- * always runs a first stage followed by a separate last stage, so it looks like it needs
- * fftLen >= 16 - confirm against the instance init code.
- * @param[in, out] *pSrc points to the in-place buffer of floating-point data type.
- * @param[in] fftLen length of the FFT.
- * @param[in] *pCoef points to the twiddle coefficient buffer.
- * @param[in] twidCoefModifier twiddle coefficient modifier that supports different size FFTs with the same twiddle factor table.
- * It is the twiddle index step of the first stage and is multiplied by 4 after each stage.
- * @return none.
- */
- void arm_radix4_butterfly_f32(
- float32_t * pSrc,
- uint16_t fftLen,
- float32_t * pCoef,
- uint16_t twidCoefModifier)
- {
- float32_t co1, co2, co3, si1, si2, si3;
- uint32_t ia1, ia2, ia3;
- uint32_t i0, i1, i2, i3;
- uint32_t n1, n2, j, k;
- #if defined (ARM_MATH_DSP)
- /* Path used when ARM_MATH_DSP is defined (originally noted as Cortex-M4 and Cortex-M3):
- * the first stage, the middle stages and the twiddle-free last stage are written out separately. */
- float32_t xaIn, yaIn, xbIn, ybIn, xcIn, ycIn, xdIn, ydIn;
- float32_t Xaplusc, Xbplusd, Yaplusc, Ybplusd, Xaminusc, Xbminusd, Yaminusc,
- Ybminusd;
- float32_t Xb12C_out, Yb12C_out, Xc12C_out, Yc12C_out, Xd12C_out, Yd12C_out;
- float32_t Xb12_out, Yb12_out, Xc12_out, Yc12_out, Xd12_out, Yd12_out;
- float32_t *ptr1;
- float32_t p0,p1,p2,p3,p4,p5;
- float32_t a0,a1,a2,a3,a4,a5,a6,a7;
- /* Initializations for the first stage */
- n2 = fftLen;
- n1 = n2;
- /* n2 = fftLen/4 */
- n2 >>= 2U;
- i0 = 0U;
- ia1 = 0U;
- j = n2;
- /* Calculation of first stage: fftLen/4 butterflies, each with its own twiddle index ia1 */
- do
- {
- /* index calculation for the input as, */
- /* pSrc[i0 + 0], pSrc[i0 + fftLen/4], pSrc[i0 + fftLen/2], pSrc[i0 + 3fftLen/4] */
- i1 = i0 + n2;
- i2 = i1 + n2;
- i3 = i2 + n2;
- xaIn = pSrc[(2U * i0)];
- yaIn = pSrc[(2U * i0) + 1U];
- xbIn = pSrc[(2U * i1)];
- ybIn = pSrc[(2U * i1) + 1U];
- xcIn = pSrc[(2U * i2)];
- ycIn = pSrc[(2U * i2) + 1U];
- xdIn = pSrc[(2U * i3)];
- ydIn = pSrc[(2U * i3) + 1U];
- /* xa + xc */
- Xaplusc = xaIn + xcIn;
- /* xb + xd */
- Xbplusd = xbIn + xdIn;
- /* ya + yc */
- Yaplusc = yaIn + ycIn;
- /* yb + yd */
- Ybplusd = ybIn + ydIn;
- /* index calculation for the coefficients: ia2 = 2 * ia1 selects the twiddle of the c output */
- ia2 = ia1 + ia1;
- co2 = pCoef[ia2 * 2U];
- si2 = pCoef[(ia2 * 2U) + 1U];
- /* xa - xc */
- Xaminusc = xaIn - xcIn;
- /* xb - xd */
- Xbminusd = xbIn - xdIn;
- /* ya - yc */
- Yaminusc = yaIn - ycIn;
- /* yb - yd */
- Ybminusd = ybIn - ydIn;
- /* xa' = xa + xb + xc + xd */
- pSrc[(2U * i0)] = Xaplusc + Xbplusd;
- /* ya' = ya + yb + yc + yd */
- pSrc[(2U * i0) + 1U] = Yaplusc + Ybplusd;
- /* (xa - xc) + (yb - yd) */
- Xb12C_out = (Xaminusc + Ybminusd);
- /* (ya - yc) - (xb - xd) */
- Yb12C_out = (Yaminusc - Xbminusd);
- /* (xa + xc) - (xb + xd) */
- Xc12C_out = (Xaplusc - Xbplusd);
- /* (ya + yc) - (yb + yd) */
- Yc12C_out = (Yaplusc - Ybplusd);
- /* (xa - xc) - (yb - yd) */
- Xd12C_out = (Xaminusc - Ybminusd);
- /* (ya - yc) + (xb - xd) */
- Yd12C_out = (Xbminusd + Yaminusc);
- co1 = pCoef[ia1 * 2U];
- si1 = pCoef[(ia1 * 2U) + 1U];
- /* index calculation for the coefficients: ia3 = 3 * ia1 selects the twiddle of the d output */
- ia3 = ia2 + ia1;
- co3 = pCoef[ia3 * 2U];
- si3 = pCoef[(ia3 * 2U) + 1U];
- Xb12_out = Xb12C_out * co1;
- Yb12_out = Yb12C_out * co1;
- Xc12_out = Xc12C_out * co2;
- Yc12_out = Yc12C_out * co2;
- Xd12_out = Xd12C_out * co3;
- Yd12_out = Yd12C_out * co3;
- /* p0 = (ya-xb-yc+xd) * si1 */
- /* added below, giving xb' = (xa+yb-xc-yd)co1 + (ya-xb-yc+xd)(si1) */
- p0 = Yb12C_out * si1;
- /* p1 = (xa+yb-xc-yd) * si1 */
- /* subtracted below, giving yb' = (ya-xb-yc+xd)co1 - (xa+yb-xc-yd)(si1) */
- p1 = Xb12C_out * si1;
- /* p2 = (ya-yb+yc-yd) * si2 */
- /* added below, giving xc' = (xa-xb+xc-xd)co2 + (ya-yb+yc-yd)(si2) */
- p2 = Yc12C_out * si2;
- /* p3 = (xa-xb+xc-xd) * si2 */
- /* subtracted below, giving yc' = (ya-yb+yc-yd)co2 - (xa-xb+xc-xd)(si2) */
- p3 = Xc12C_out * si2;
- /* p4 = (ya+xb-yc-xd) * si3 */
- /* added below, giving xd' = (xa-yb-xc+yd)co3 + (ya+xb-yc-xd)(si3) */
- p4 = Yd12C_out * si3;
- /* p5 = (xa-yb-xc+yd) * si3 */
- /* subtracted below, giving yd' = (ya+xb-yc-xd)co3 - (xa-yb-xc+yd)(si3) */
- p5 = Xd12C_out * si3;
- Xb12_out += p0;
- Yb12_out -= p1;
- Xc12_out += p2;
- Yc12_out -= p3;
- Xd12_out += p4;
- Yd12_out -= p5;
- /* xc' = (xa-xb+xc-xd)co2 + (ya-yb+yc-yd)(si2), stored at position i1 */
- pSrc[2U * i1] = Xc12_out;
- /* yc' = (ya-yb+yc-yd)co2 - (xa-xb+xc-xd)(si2) */
- pSrc[(2U * i1) + 1U] = Yc12_out;
- /* xb' = (xa+yb-xc-yd)co1 + (ya-xb-yc+xd)(si1), stored at position i2 */
- pSrc[2U * i2] = Xb12_out;
- /* yb' = (ya-xb-yc+xd)co1 - (xa+yb-xc-yd)(si1) */
- pSrc[(2U * i2) + 1U] = Yb12_out;
- /* xd' = (xa-yb-xc+yd)co3 + (ya+xb-yc-xd)(si3) */
- pSrc[2U * i3] = Xd12_out;
- /* yd' = (ya+xb-yc-xd)co3 - (xa-yb-xc+yd)(si3) */
- pSrc[(2U * i3) + 1U] = Yd12_out;
- /* Twiddle coefficients index modifier */
- ia1 += twidCoefModifier;
- /* Updating input index */
- i0++;
- }
- while (--j);
- twidCoefModifier <<= 2U;
- /* Middle stages: from the second stage up to, but excluding, the last stage */
- for (k = fftLen >> 2U; k > 4U; k >>= 2U)
- {
- /* Initializations for this stage: n1 is the span of one butterfly group, n2 a quarter of it */
- n1 = n2;
- n2 >>= 2U;
- ia1 = 0U;
- /* Outer loop over the n2 butterfly positions inside a group; each position has its own twiddles */
- j = 0;
- do
- {
- /* index calculation for the coefficients */
- ia2 = ia1 + ia1;
- ia3 = ia2 + ia1;
- co1 = pCoef[ia1 * 2U];
- si1 = pCoef[(ia1 * 2U) + 1U];
- co2 = pCoef[ia2 * 2U];
- si2 = pCoef[(ia2 * 2U) + 1U];
- co3 = pCoef[ia3 * 2U];
- si3 = pCoef[(ia3 * 2U) + 1U];
- /* Twiddle coefficients index modifier */
- ia1 += twidCoefModifier;
- i0 = j;
- do
- {
- /* index calculation for the input as, */
- /* pSrc[i0], pSrc[i0 + n2], pSrc[i0 + 2 n2], pSrc[i0 + 3 n2] */
- i1 = i0 + n2;
- i2 = i1 + n2;
- i3 = i2 + n2;
- xaIn = pSrc[(2U * i0)];
- yaIn = pSrc[(2U * i0) + 1U];
- xbIn = pSrc[(2U * i1)];
- ybIn = pSrc[(2U * i1) + 1U];
- xcIn = pSrc[(2U * i2)];
- ycIn = pSrc[(2U * i2) + 1U];
- xdIn = pSrc[(2U * i3)];
- ydIn = pSrc[(2U * i3) + 1U];
- /* xa - xc */
- Xaminusc = xaIn - xcIn;
- /* (xb - xd) */
- Xbminusd = xbIn - xdIn;
- /* ya - yc */
- Yaminusc = yaIn - ycIn;
- /* (yb - yd) */
- Ybminusd = ybIn - ydIn;
- /* xa + xc */
- Xaplusc = xaIn + xcIn;
- /* xb + xd */
- Xbplusd = xbIn + xdIn;
- /* ya + yc */
- Yaplusc = yaIn + ycIn;
- /* yb + yd */
- Ybplusd = ybIn + ydIn;
- /* (xa - xc) + (yb - yd) */
- Xb12C_out = (Xaminusc + Ybminusd);
- /* (ya - yc) - (xb - xd) */
- Yb12C_out = (Yaminusc - Xbminusd);
- /* xa + xc -(xb + xd) */
- Xc12C_out = (Xaplusc - Xbplusd);
- /* (ya + yc) - (yb + yd) */
- Yc12C_out = (Yaplusc - Ybplusd);
- /* (xa - xc) - (yb - yd) */
- Xd12C_out = (Xaminusc - Ybminusd);
- /* (ya - yc) + (xb - xd) */
- Yd12C_out = (Xbminusd + Yaminusc);
- pSrc[(2U * i0)] = Xaplusc + Xbplusd;
- pSrc[(2U * i0) + 1U] = Yaplusc + Ybplusd;
- Xb12_out = Xb12C_out * co1;
- Yb12_out = Yb12C_out * co1;
- Xc12_out = Xc12C_out * co2;
- Yc12_out = Yc12C_out * co2;
- Xd12_out = Xd12C_out * co3;
- Yd12_out = Yd12C_out * co3;
- /* p0 = (ya-xb-yc+xd) * si1 */
- /* added below, giving xb' = (xa+yb-xc-yd)co1 + (ya-xb-yc+xd)(si1) */
- p0 = Yb12C_out * si1;
- /* p1 = (xa+yb-xc-yd) * si1 */
- /* subtracted below, giving yb' = (ya-xb-yc+xd)co1 - (xa+yb-xc-yd)(si1) */
- p1 = Xb12C_out * si1;
- /* p2 = (ya-yb+yc-yd) * si2 */
- /* added below, giving xc' = (xa-xb+xc-xd)co2 + (ya-yb+yc-yd)(si2) */
- p2 = Yc12C_out * si2;
- /* p3 = (xa-xb+xc-xd) * si2 */
- /* subtracted below, giving yc' = (ya-yb+yc-yd)co2 - (xa-xb+xc-xd)(si2) */
- p3 = Xc12C_out * si2;
- /* p4 = (ya+xb-yc-xd) * si3 */
- /* added below, giving xd' = (xa-yb-xc+yd)co3 + (ya+xb-yc-xd)(si3) */
- p4 = Yd12C_out * si3;
- /* p5 = (xa-yb-xc+yd) * si3 */
- /* subtracted below, giving yd' = (ya+xb-yc-xd)co3 - (xa-yb-xc+yd)(si3) */
- p5 = Xd12C_out * si3;
- Xb12_out += p0;
- Yb12_out -= p1;
- Xc12_out += p2;
- Yc12_out -= p3;
- Xd12_out += p4;
- Yd12_out -= p5;
- /* xc' = (xa-xb+xc-xd)co2 + (ya-yb+yc-yd)(si2), stored at position i1 */
- pSrc[2U * i1] = Xc12_out;
- /* yc' = (ya-yb+yc-yd)co2 - (xa-xb+xc-xd)(si2) */
- pSrc[(2U * i1) + 1U] = Yc12_out;
- /* xb' = (xa+yb-xc-yd)co1 + (ya-xb-yc+xd)(si1), stored at position i2 */
- pSrc[2U * i2] = Xb12_out;
- /* yb' = (ya-xb-yc+xd)co1 - (xa+yb-xc-yd)(si1) */
- pSrc[(2U * i2) + 1U] = Yb12_out;
- /* xd' = (xa-yb-xc+yd)co3 + (ya+xb-yc-xd)(si3) */
- pSrc[2U * i3] = Xd12_out;
- /* yd' = (ya+xb-yc-xd)co3 - (xa-yb-xc+yd)(si3) */
- pSrc[(2U * i3) + 1U] = Yd12_out;
- i0 += n1;
- } while (i0 < fftLen);
- j++;
- } while (j <= (n2 - 1U));
- twidCoefModifier <<= 2U;
- }
- j = fftLen >> 2;
- ptr1 = &pSrc[0];
- /* Calculations of last stage: fftLen/4 butterflies on four adjacent points (8 floats) each, with no twiddle multiplication */
- do
- {
- xaIn = ptr1[0];
- yaIn = ptr1[1];
- xbIn = ptr1[2];
- ybIn = ptr1[3];
- xcIn = ptr1[4];
- ycIn = ptr1[5];
- xdIn = ptr1[6];
- ydIn = ptr1[7];
- /* xa + xc */
- Xaplusc = xaIn + xcIn;
- /* xa - xc */
- Xaminusc = xaIn - xcIn;
- /* ya + yc */
- Yaplusc = yaIn + ycIn;
- /* ya - yc */
- Yaminusc = yaIn - ycIn;
- /* xb + xd */
- Xbplusd = xbIn + xdIn;
- /* yb + yd */
- Ybplusd = ybIn + ydIn;
- /* (xb-xd) */
- Xbminusd = xbIn - xdIn;
- /* (yb-yd) */
- Ybminusd = ybIn - ydIn;
- /* xa' = xa + xb + xc + xd */
- a0 = (Xaplusc + Xbplusd);
- /* ya' = ya + yb + yc + yd */
- a1 = (Yaplusc + Ybplusd);
- /* xc' = (xa-xb+xc-xd) */
- a2 = (Xaplusc - Xbplusd);
- /* yc' = (ya-yb+yc-yd) */
- a3 = (Yaplusc - Ybplusd);
- /* xb' = (xa+yb-xc-yd) */
- a4 = (Xaminusc + Ybminusd);
- /* yb' = (ya-xb-yc+xd) */
- a5 = (Yaminusc - Xbminusd);
- /* xd' = (xa-yb-xc+yd) */
- a6 = (Xaminusc - Ybminusd);
- /* yd' = (ya+xb-yc-xd) */
- a7 = (Xbminusd + Yaminusc);
- ptr1[0] = a0;
- ptr1[1] = a1;
- ptr1[2] = a2;
- ptr1[3] = a3;
- ptr1[4] = a4;
- ptr1[5] = a5;
- ptr1[6] = a6;
- ptr1[7] = a7;
- /* increment pointer by 8 */
- ptr1 += 8U;
- } while (--j);
- #else
- float32_t t1, t2, r1, r2, s1, s2;
- /* Path used when ARM_MATH_DSP is not defined (originally noted as Cortex-M0): one loop handles every stage, including the last */
- /* Initializations for the fft calculation */
- n2 = fftLen;
- n1 = n2;
- for (k = fftLen; k > 1U; k >>= 2U)
- {
- /* Initializations for this stage: n1 is the span of one butterfly group, n2 a quarter of it */
- n1 = n2;
- n2 >>= 2U;
- ia1 = 0U;
- /* FFT Calculation */
- j = 0;
- do
- {
- /* index calculation for the coefficients */
- ia2 = ia1 + ia1;
- ia3 = ia2 + ia1;
- co1 = pCoef[ia1 * 2U];
- si1 = pCoef[(ia1 * 2U) + 1U];
- co2 = pCoef[ia2 * 2U];
- si2 = pCoef[(ia2 * 2U) + 1U];
- co3 = pCoef[ia3 * 2U];
- si3 = pCoef[(ia3 * 2U) + 1U];
- /* Twiddle coefficients index modifier */
- ia1 = ia1 + twidCoefModifier;
- i0 = j;
- do
- {
- /* index calculation for the input as, */
- /* pSrc[i0], pSrc[i0 + n2], pSrc[i0 + 2 n2], pSrc[i0 + 3 n2] */
- i1 = i0 + n2;
- i2 = i1 + n2;
- i3 = i2 + n2;
- /* xa + xc */
- r1 = pSrc[(2U * i0)] + pSrc[(2U * i2)];
- /* xa - xc */
- r2 = pSrc[(2U * i0)] - pSrc[(2U * i2)];
- /* ya + yc */
- s1 = pSrc[(2U * i0) + 1U] + pSrc[(2U * i2) + 1U];
- /* ya - yc */
- s2 = pSrc[(2U * i0) + 1U] - pSrc[(2U * i2) + 1U];
- /* xb + xd */
- t1 = pSrc[2U * i1] + pSrc[2U * i3];
- /* xa' = xa + xb + xc + xd (position i0 is not read again in this butterfly) */
- pSrc[2U * i0] = r1 + t1;
- /* xa + xc -(xb + xd) */
- r1 = r1 - t1;
- /* yb + yd */
- t2 = pSrc[(2U * i1) + 1U] + pSrc[(2U * i3) + 1U];
- /* ya' = ya + yb + yc + yd */
- pSrc[(2U * i0) + 1U] = s1 + t2;
- /* (ya + yc) - (yb + yd) */
- s1 = s1 - t2;
- /* (yb - yd) */
- t1 = pSrc[(2U * i1) + 1U] - pSrc[(2U * i3) + 1U];
- /* (xb - xd) */
- t2 = pSrc[2U * i1] - pSrc[2U * i3];
- /* xc' = (xa-xb+xc-xd)co2 + (ya-yb+yc-yd)(si2), stored at position i1 */
- pSrc[2U * i1] = (r1 * co2) + (s1 * si2);
- /* yc' = (ya-yb+yc-yd)co2 - (xa-xb+xc-xd)(si2) */
- pSrc[(2U * i1) + 1U] = (s1 * co2) - (r1 * si2);
- /* (xa - xc) + (yb - yd) */
- r1 = r2 + t1;
- /* (xa - xc) - (yb - yd) */
- r2 = r2 - t1;
- /* (ya - yc) - (xb - xd) */
- s1 = s2 - t2;
- /* (ya - yc) + (xb - xd) */
- s2 = s2 + t2;
- /* xb' = (xa+yb-xc-yd)co1 + (ya-xb-yc+xd)(si1), stored at position i2 */
- pSrc[2U * i2] = (r1 * co1) + (s1 * si1);
- /* yb' = (ya-xb-yc+xd)co1 - (xa+yb-xc-yd)(si1) */
- pSrc[(2U * i2) + 1U] = (s1 * co1) - (r1 * si1);
- /* xd' = (xa-yb-xc+yd)co3 + (ya+xb-yc-xd)(si3) */
- pSrc[2U * i3] = (r2 * co3) + (s2 * si3);
- /* yd' = (ya+xb-yc-xd)co3 - (xa-yb-xc+yd)(si3) */
- pSrc[(2U * i3) + 1U] = (s2 * co3) - (r2 * si3);
- i0 += n1;
- } while ( i0 < fftLen);
- j++;
- } while (j <= (n2 - 1U));
- twidCoefModifier <<= 2U;
- }
- #endif /* #if defined (ARM_MATH_DSP) */
- }
- /*
- * @brief Core function for the floating-point CIFFT butterfly process.
- * @details Runs every radix-4 stage of the inverse transform in place. The structure matches
- * arm_radix4_butterfly_f32, with the signs of the (yb - yd) and (xb - xd) terms and of the si
- * products reversed. The last stage uses no twiddle multiplication and is the only stage that
- * multiplies its outputs by onebyfftLen. pSrc is indexed as (x, y) pairs (element 2*i and
- * element 2*i+1 of point i) and pCoef as (co, si) pairs. Each butterfly writes the c result at
- * position i1 and the b result at position i2. The output is not reordered here.
- * NOTE(review): the loops appear to assume that fftLen is a power of 4; both build paths run
- * a separate last stage on groups of four adjacent points - confirm the supported lengths
- * against the instance init code.
- * @param[in, out] *pSrc points to the in-place buffer of floating-point data type.
- * @param[in] fftLen length of the FFT.
- * @param[in] *pCoef points to twiddle coefficient buffer.
- * @param[in] twidCoefModifier twiddle coefficient modifier that supports different size FFTs with the same twiddle factor table.
- * It is the twiddle index step of the first stage and is multiplied by 4 after each twiddled stage.
- * @param[in] onebyfftLen value of 1/fftLen.
- * @return none.
- */
- void arm_radix4_butterfly_inverse_f32(
- float32_t * pSrc,
- uint16_t fftLen,
- float32_t * pCoef,
- uint16_t twidCoefModifier,
- float32_t onebyfftLen)
- {
- float32_t co1, co2, co3, si1, si2, si3;
- uint32_t ia1, ia2, ia3;
- uint32_t i0, i1, i2, i3;
- uint32_t n1, n2, j, k;
- #if defined (ARM_MATH_DSP)
- float32_t xaIn, yaIn, xbIn, ybIn, xcIn, ycIn, xdIn, ydIn;
- float32_t Xaplusc, Xbplusd, Yaplusc, Ybplusd, Xaminusc, Xbminusd, Yaminusc,
- Ybminusd;
- float32_t Xb12C_out, Yb12C_out, Xc12C_out, Yc12C_out, Xd12C_out, Yd12C_out;
- float32_t Xb12_out, Yb12_out, Xc12_out, Yc12_out, Xd12_out, Yd12_out;
- float32_t *ptr1;
- float32_t p0,p1,p2,p3,p4,p5,p6,p7;
- float32_t a0,a1,a2,a3,a4,a5,a6,a7;
- /* Initializations for the first stage */
- n2 = fftLen;
- n1 = n2;
- /* n2 = fftLen/4 */
- n2 >>= 2U;
- i0 = 0U;
- ia1 = 0U;
- j = n2;
- /* Calculation of first stage: fftLen/4 butterflies, each with its own twiddle index ia1 */
- do
- {
- /* index calculation for the input as, */
- /* pSrc[i0 + 0], pSrc[i0 + fftLen/4], pSrc[i0 + fftLen/2], pSrc[i0 + 3fftLen/4] */
- i1 = i0 + n2;
- i2 = i1 + n2;
- i3 = i2 + n2;
- /* Butterfly implementation */
- xaIn = pSrc[(2U * i0)];
- yaIn = pSrc[(2U * i0) + 1U];
- xcIn = pSrc[(2U * i2)];
- ycIn = pSrc[(2U * i2) + 1U];
- xbIn = pSrc[(2U * i1)];
- ybIn = pSrc[(2U * i1) + 1U];
- xdIn = pSrc[(2U * i3)];
- ydIn = pSrc[(2U * i3) + 1U];
- /* xa + xc */
- Xaplusc = xaIn + xcIn;
- /* xb + xd */
- Xbplusd = xbIn + xdIn;
- /* ya + yc */
- Yaplusc = yaIn + ycIn;
- /* yb + yd */
- Ybplusd = ybIn + ydIn;
- /* index calculation for the coefficients: ia2 = 2 * ia1 selects the twiddle of the c output */
- ia2 = ia1 + ia1;
- co2 = pCoef[ia2 * 2U];
- si2 = pCoef[(ia2 * 2U) + 1U];
- /* xa - xc */
- Xaminusc = xaIn - xcIn;
- /* xb - xd */
- Xbminusd = xbIn - xdIn;
- /* ya - yc */
- Yaminusc = yaIn - ycIn;
- /* yb - yd */
- Ybminusd = ybIn - ydIn;
- /* xa' = xa + xb + xc + xd */
- pSrc[(2U * i0)] = Xaplusc + Xbplusd;
- /* ya' = ya + yb + yc + yd */
- pSrc[(2U * i0) + 1U] = Yaplusc + Ybplusd;
- /* (xa - xc) - (yb - yd) */
- Xb12C_out = (Xaminusc - Ybminusd);
- /* (ya - yc) + (xb - xd) */
- Yb12C_out = (Yaminusc + Xbminusd);
- /* (xa + xc) - (xb + xd) */
- Xc12C_out = (Xaplusc - Xbplusd);
- /* (ya + yc) - (yb + yd) */
- Yc12C_out = (Yaplusc - Ybplusd);
- /* (xa - xc) + (yb - yd) */
- Xd12C_out = (Xaminusc + Ybminusd);
- /* (ya - yc) - (xb - xd) */
- Yd12C_out = (Yaminusc - Xbminusd);
- co1 = pCoef[ia1 * 2U];
- si1 = pCoef[(ia1 * 2U) + 1U];
- /* index calculation for the coefficients: ia3 = 3 * ia1 selects the twiddle of the d output */
- ia3 = ia2 + ia1;
- co3 = pCoef[ia3 * 2U];
- si3 = pCoef[(ia3 * 2U) + 1U];
- Xb12_out = Xb12C_out * co1;
- Yb12_out = Yb12C_out * co1;
- Xc12_out = Xc12C_out * co2;
- Yc12_out = Yc12C_out * co2;
- Xd12_out = Xd12C_out * co3;
- Yd12_out = Yd12C_out * co3;
- /* p0 = (ya+xb-yc-xd) * si1 */
- /* subtracted below, giving xb' = (xa-yb-xc+yd)co1 - (ya+xb-yc-xd)(si1) */
- p0 = Yb12C_out * si1;
- /* p1 = (xa-yb-xc+yd) * si1 */
- /* added below, giving yb' = (ya+xb-yc-xd)co1 + (xa-yb-xc+yd)(si1) */
- p1 = Xb12C_out * si1;
- /* p2 = (ya-yb+yc-yd) * si2 */
- /* subtracted below, giving xc' = (xa-xb+xc-xd)co2 - (ya-yb+yc-yd)(si2) */
- p2 = Yc12C_out * si2;
- /* p3 = (xa-xb+xc-xd) * si2 */
- /* added below, giving yc' = (ya-yb+yc-yd)co2 + (xa-xb+xc-xd)(si2) */
- p3 = Xc12C_out * si2;
- /* p4 = (ya-xb-yc+xd) * si3 */
- /* subtracted below, giving xd' = (xa+yb-xc-yd)co3 - (ya-xb-yc+xd)(si3) */
- p4 = Yd12C_out * si3;
- /* p5 = (xa+yb-xc-yd) * si3 */
- /* added below, giving yd' = (ya-xb-yc+xd)co3 + (xa+yb-xc-yd)(si3) */
- p5 = Xd12C_out * si3;
- Xb12_out -= p0;
- Yb12_out += p1;
- Xc12_out -= p2;
- Yc12_out += p3;
- Xd12_out -= p4;
- Yd12_out += p5;
- /* xc' = (xa-xb+xc-xd)co2 - (ya-yb+yc-yd)(si2), stored at position i1 */
- pSrc[2U * i1] = Xc12_out;
- /* yc' = (ya-yb+yc-yd)co2 + (xa-xb+xc-xd)(si2) */
- pSrc[(2U * i1) + 1U] = Yc12_out;
- /* xb' = (xa-yb-xc+yd)co1 - (ya+xb-yc-xd)(si1), stored at position i2 */
- pSrc[2U * i2] = Xb12_out;
- /* yb' = (ya+xb-yc-xd)co1 + (xa-yb-xc+yd)(si1) */
- pSrc[(2U * i2) + 1U] = Yb12_out;
- /* xd' = (xa+yb-xc-yd)co3 - (ya-xb-yc+xd)(si3) */
- pSrc[2U * i3] = Xd12_out;
- /* yd' = (ya-xb-yc+xd)co3 + (xa+yb-xc-yd)(si3) */
- pSrc[(2U * i3) + 1U] = Yd12_out;
- /* Twiddle coefficients index modifier */
- ia1 = ia1 + twidCoefModifier;
- /* Updating input index */
- i0 = i0 + 1U;
- } while (--j);
- twidCoefModifier <<= 2U;
- /* Middle stages: from the second stage up to, but excluding, the last stage */
- for (k = fftLen >> 2U; k > 4U; k >>= 2U)
- {
- /* Initializations for this stage: n1 is the span of one butterfly group, n2 a quarter of it */
- n1 = n2;
- n2 >>= 2U;
- ia1 = 0U;
- /* Outer loop over the n2 butterfly positions inside a group; each position has its own twiddles */
- j = 0;
- do
- {
- /* index calculation for the coefficients */
- ia2 = ia1 + ia1;
- ia3 = ia2 + ia1;
- co1 = pCoef[ia1 * 2U];
- si1 = pCoef[(ia1 * 2U) + 1U];
- co2 = pCoef[ia2 * 2U];
- si2 = pCoef[(ia2 * 2U) + 1U];
- co3 = pCoef[ia3 * 2U];
- si3 = pCoef[(ia3 * 2U) + 1U];
- /* Twiddle coefficients index modifier */
- ia1 = ia1 + twidCoefModifier;
- i0 = j;
- do
- {
- /* index calculation for the input as, */
- /* pSrc[i0], pSrc[i0 + n2], pSrc[i0 + 2 n2], pSrc[i0 + 3 n2] */
- i1 = i0 + n2;
- i2 = i1 + n2;
- i3 = i2 + n2;
- xaIn = pSrc[(2U * i0)];
- yaIn = pSrc[(2U * i0) + 1U];
- xbIn = pSrc[(2U * i1)];
- ybIn = pSrc[(2U * i1) + 1U];
- xcIn = pSrc[(2U * i2)];
- ycIn = pSrc[(2U * i2) + 1U];
- xdIn = pSrc[(2U * i3)];
- ydIn = pSrc[(2U * i3) + 1U];
- /* xa - xc */
- Xaminusc = xaIn - xcIn;
- /* (xb - xd) */
- Xbminusd = xbIn - xdIn;
- /* ya - yc */
- Yaminusc = yaIn - ycIn;
- /* (yb - yd) */
- Ybminusd = ybIn - ydIn;
- /* xa + xc */
- Xaplusc = xaIn + xcIn;
- /* xb + xd */
- Xbplusd = xbIn + xdIn;
- /* ya + yc */
- Yaplusc = yaIn + ycIn;
- /* yb + yd */
- Ybplusd = ybIn + ydIn;
- /* (xa - xc) - (yb - yd) */
- Xb12C_out = (Xaminusc - Ybminusd);
- /* (ya - yc) + (xb - xd) */
- Yb12C_out = (Yaminusc + Xbminusd);
- /* xa + xc -(xb + xd) */
- Xc12C_out = (Xaplusc - Xbplusd);
- /* (ya + yc) - (yb + yd) */
- Yc12C_out = (Yaplusc - Ybplusd);
- /* (xa - xc) + (yb - yd) */
- Xd12C_out = (Xaminusc + Ybminusd);
- /* (ya - yc) - (xb - xd) */
- Yd12C_out = (Yaminusc - Xbminusd);
- pSrc[(2U * i0)] = Xaplusc + Xbplusd;
- pSrc[(2U * i0) + 1U] = Yaplusc + Ybplusd;
- Xb12_out = Xb12C_out * co1;
- Yb12_out = Yb12C_out * co1;
- Xc12_out = Xc12C_out * co2;
- Yc12_out = Yc12C_out * co2;
- Xd12_out = Xd12C_out * co3;
- Yd12_out = Yd12C_out * co3;
- /* p0 = (ya+xb-yc-xd) * si1 */
- /* subtracted below, giving xb' = (xa-yb-xc+yd)co1 - (ya+xb-yc-xd)(si1) */
- p0 = Yb12C_out * si1;
- /* p1 = (xa-yb-xc+yd) * si1 */
- /* added below, giving yb' = (ya+xb-yc-xd)co1 + (xa-yb-xc+yd)(si1) */
- p1 = Xb12C_out * si1;
- /* p2 = (ya-yb+yc-yd) * si2 */
- /* subtracted below, giving xc' = (xa-xb+xc-xd)co2 - (ya-yb+yc-yd)(si2) */
- p2 = Yc12C_out * si2;
- /* p3 = (xa-xb+xc-xd) * si2 */
- /* added below, giving yc' = (ya-yb+yc-yd)co2 + (xa-xb+xc-xd)(si2) */
- p3 = Xc12C_out * si2;
- /* p4 = (ya-xb-yc+xd) * si3 */
- /* subtracted below, giving xd' = (xa+yb-xc-yd)co3 - (ya-xb-yc+xd)(si3) */
- p4 = Yd12C_out * si3;
- /* p5 = (xa+yb-xc-yd) * si3 */
- /* added below, giving yd' = (ya-xb-yc+xd)co3 + (xa+yb-xc-yd)(si3) */
- p5 = Xd12C_out * si3;
- Xb12_out -= p0;
- Yb12_out += p1;
- Xc12_out -= p2;
- Yc12_out += p3;
- Xd12_out -= p4;
- Yd12_out += p5;
- /* xc' = (xa-xb+xc-xd)co2 - (ya-yb+yc-yd)(si2), stored at position i1 */
- pSrc[2U * i1] = Xc12_out;
- /* yc' = (ya-yb+yc-yd)co2 + (xa-xb+xc-xd)(si2) */
- pSrc[(2U * i1) + 1U] = Yc12_out;
- /* xb' = (xa-yb-xc+yd)co1 - (ya+xb-yc-xd)(si1), stored at position i2 */
- pSrc[2U * i2] = Xb12_out;
- /* yb' = (ya+xb-yc-xd)co1 + (xa-yb-xc+yd)(si1) */
- pSrc[(2U * i2) + 1U] = Yb12_out;
- /* xd' = (xa+yb-xc-yd)co3 - (ya-xb-yc+xd)(si3) */
- pSrc[2U * i3] = Xd12_out;
- /* yd' = (ya-xb-yc+xd)co3 + (xa+yb-xc-yd)(si3) */
- pSrc[(2U * i3) + 1U] = Yd12_out;
- i0 += n1;
- } while (i0 < fftLen);
- j++;
- } while (j <= (n2 - 1U));
- twidCoefModifier <<= 2U;
- }
- /* Initializations of last stage */
- j = fftLen >> 2;
- ptr1 = &pSrc[0];
- /* Calculations of last stage: fftLen/4 butterflies on four adjacent points (8 floats) each, no twiddles, outputs scaled by onebyfftLen */
- do
- {
- xaIn = ptr1[0];
- yaIn = ptr1[1];
- xbIn = ptr1[2];
- ybIn = ptr1[3];
- xcIn = ptr1[4];
- ycIn = ptr1[5];
- xdIn = ptr1[6];
- ydIn = ptr1[7];
- /* Butterfly implementation */
- /* xa + xc */
- Xaplusc = xaIn + xcIn;
- /* xa - xc */
- Xaminusc = xaIn - xcIn;
- /* ya + yc */
- Yaplusc = yaIn + ycIn;
- /* ya - yc */
- Yaminusc = yaIn - ycIn;
- /* xb + xd */
- Xbplusd = xbIn + xdIn;
- /* yb + yd */
- Ybplusd = ybIn + ydIn;
- /* (xb-xd) */
- Xbminusd = xbIn - xdIn;
- /* (yb-yd) */
- Ybminusd = ybIn - ydIn;
- /* unscaled xa' = (xa+xb+xc+xd) */
- a0 = (Xaplusc + Xbplusd);
- /* unscaled ya' = (ya+yb+yc+yd) */
- a1 = (Yaplusc + Ybplusd);
- /* unscaled xc' = (xa-xb+xc-xd) */
- a2 = (Xaplusc - Xbplusd);
- /* unscaled yc' = (ya-yb+yc-yd) */
- a3 = (Yaplusc - Ybplusd);
- /* unscaled xb' = (xa-yb-xc+yd) */
- a4 = (Xaminusc - Ybminusd);
- /* unscaled yb' = (ya+xb-yc-xd) */
- a5 = (Yaminusc + Xbminusd);
- /* unscaled xd' = (xa+yb-xc-yd) */
- a6 = (Xaminusc + Ybminusd);
- /* unscaled yd' = (ya-xb-yc+xd) */
- a7 = (Yaminusc - Xbminusd);
- p0 = a0 * onebyfftLen;
- p1 = a1 * onebyfftLen;
- p2 = a2 * onebyfftLen;
- p3 = a3 * onebyfftLen;
- p4 = a4 * onebyfftLen;
- p5 = a5 * onebyfftLen;
- p6 = a6 * onebyfftLen;
- p7 = a7 * onebyfftLen;
- /* xa' = (xa+xb+xc+xd) * onebyfftLen */
- ptr1[0] = p0;
- /* ya' = (ya+yb+yc+yd) * onebyfftLen */
- ptr1[1] = p1;
- /* xc' = (xa-xb+xc-xd) * onebyfftLen */
- ptr1[2] = p2;
- /* yc' = (ya-yb+yc-yd) * onebyfftLen */
- ptr1[3] = p3;
- /* xb' = (xa-yb-xc+yd) * onebyfftLen */
- ptr1[4] = p4;
- /* yb' = (ya+xb-yc-xd) * onebyfftLen */
- ptr1[5] = p5;
- /* xd' = (xa+yb-xc-yd) * onebyfftLen */
- ptr1[6] = p6;
- /* yd' = (ya-xb-yc+xd) * onebyfftLen */
- ptr1[7] = p7;
- /* increment source pointer by 8 for next calculations */
- ptr1 = ptr1 + 8U;
- } while (--j);
- #else
- float32_t t1, t2, r1, r2, s1, s2;
- /* Path used when ARM_MATH_DSP is not defined (originally noted as Cortex-M0) */
- /* Initializations for the first stage */
- n2 = fftLen;
- n1 = n2;
- /* All stages except the last one; the last stage is handled separately after this loop */
- for (k = fftLen; k > 4U; k >>= 2U)
- {
- /* Initializations for this stage: n1 is the span of one butterfly group, n2 a quarter of it */
- n1 = n2;
- n2 >>= 2U;
- ia1 = 0U;
- /* Outer loop over the n2 butterfly positions inside a group; each position has its own twiddles */
- j = 0;
- do
- {
- /* index calculation for the coefficients */
- ia2 = ia1 + ia1;
- ia3 = ia2 + ia1;
- co1 = pCoef[ia1 * 2U];
- si1 = pCoef[(ia1 * 2U) + 1U];
- co2 = pCoef[ia2 * 2U];
- si2 = pCoef[(ia2 * 2U) + 1U];
- co3 = pCoef[ia3 * 2U];
- si3 = pCoef[(ia3 * 2U) + 1U];
- /* Twiddle coefficients index modifier */
- ia1 = ia1 + twidCoefModifier;
- i0 = j;
- do
- {
- /* index calculation for the input as, */
- /* pSrc[i0], pSrc[i0 + n2], pSrc[i0 + 2 n2], pSrc[i0 + 3 n2] */
- i1 = i0 + n2;
- i2 = i1 + n2;
- i3 = i2 + n2;
- /* xa + xc */
- r1 = pSrc[(2U * i0)] + pSrc[(2U * i2)];
- /* xa - xc */
- r2 = pSrc[(2U * i0)] - pSrc[(2U * i2)];
- /* ya + yc */
- s1 = pSrc[(2U * i0) + 1U] + pSrc[(2U * i2) + 1U];
- /* ya - yc */
- s2 = pSrc[(2U * i0) + 1U] - pSrc[(2U * i2) + 1U];
- /* xb + xd */
- t1 = pSrc[2U * i1] + pSrc[2U * i3];
- /* xa' = xa + xb + xc + xd (position i0 is not read again in this butterfly) */
- pSrc[2U * i0] = r1 + t1;
- /* xa + xc -(xb + xd) */
- r1 = r1 - t1;
- /* yb + yd */
- t2 = pSrc[(2U * i1) + 1U] + pSrc[(2U * i3) + 1U];
- /* ya' = ya + yb + yc + yd */
- pSrc[(2U * i0) + 1U] = s1 + t2;
- /* (ya + yc) - (yb + yd) */
- s1 = s1 - t2;
- /* (yb - yd) */
- t1 = pSrc[(2U * i1) + 1U] - pSrc[(2U * i3) + 1U];
- /* (xb - xd) */
- t2 = pSrc[2U * i1] - pSrc[2U * i3];
- /* xc' = (xa-xb+xc-xd)co2 - (ya-yb+yc-yd)(si2), stored at position i1 */
- pSrc[2U * i1] = (r1 * co2) - (s1 * si2);
- /* yc' = (ya-yb+yc-yd)co2 + (xa-xb+xc-xd)(si2) */
- pSrc[(2U * i1) + 1U] = (s1 * co2) + (r1 * si2);
- /* (xa - xc) - (yb - yd) */
- r1 = r2 - t1;
- /* (xa - xc) + (yb - yd) */
- r2 = r2 + t1;
- /* (ya - yc) + (xb - xd) */
- s1 = s2 + t2;
- /* (ya - yc) - (xb - xd) */
- s2 = s2 - t2;
- /* xb' = (xa-yb-xc+yd)co1 - (ya+xb-yc-xd)(si1), stored at position i2 */
- pSrc[2U * i2] = (r1 * co1) - (s1 * si1);
- /* yb' = (ya+xb-yc-xd)co1 + (xa-yb-xc+yd)(si1) */
- pSrc[(2U * i2) + 1U] = (s1 * co1) + (r1 * si1);
- /* xd' = (xa+yb-xc-yd)co3 - (ya-xb-yc+xd)(si3) */
- pSrc[2U * i3] = (r2 * co3) - (s2 * si3);
- /* yd' = (ya-xb-yc+xd)co3 + (xa+yb-xc-yd)(si3) */
- pSrc[(2U * i3) + 1U] = (s2 * co3) + (r2 * si3);
- i0 += n1;
- } while ( i0 < fftLen);
- j++;
- } while (j <= (n2 - 1U));
- twidCoefModifier <<= 2U;
- }
- /* Initializations of last stage */
- n1 = n2;
- n2 >>= 2U;
- /* Calculations of last stage: one butterfly per group of n1 points, no twiddles, outputs scaled by onebyfftLen */
- for (i0 = 0U; i0 <= (fftLen - n1); i0 += n1)
- {
- /* index calculation for the input as, */
- /* pSrc[i0], pSrc[i0 + n2], pSrc[i0 + 2 n2], pSrc[i0 + 3 n2] */
- i1 = i0 + n2;
- i2 = i1 + n2;
- i3 = i2 + n2;
- /* Butterfly implementation */
- /* xa + xc */
- r1 = pSrc[2U * i0] + pSrc[2U * i2];
- /* xa - xc */
- r2 = pSrc[2U * i0] - pSrc[2U * i2];
- /* ya + yc */
- s1 = pSrc[(2U * i0) + 1U] + pSrc[(2U * i2) + 1U];
- /* ya - yc */
- s2 = pSrc[(2U * i0) + 1U] - pSrc[(2U * i2) + 1U];
- /* xb + xd */
- t1 = pSrc[2U * i1] + pSrc[2U * i3];
- /* xa' = (xa + xb + xc + xd) * onebyfftLen */
- pSrc[2U * i0] = (r1 + t1) * onebyfftLen;
- /* (xa + xc) - (xb + xd) */
- r1 = r1 - t1;
- /* yb + yd */
- t2 = pSrc[(2U * i1) + 1U] + pSrc[(2U * i3) + 1U];
- /* ya' = (ya + yb + yc + yd) * onebyfftLen */
- pSrc[(2U * i0) + 1U] = (s1 + t2) * onebyfftLen;
- /* (ya + yc) - (yb + yd) */
- s1 = s1 - t2;
- /* (yb-yd) */
- t1 = pSrc[(2U * i1) + 1U] - pSrc[(2U * i3) + 1U];
- /* (xb-xd) */
- t2 = pSrc[2U * i1] - pSrc[2U * i3];
- /* xc' = (xa-xb+xc-xd) * onebyfftLen, stored at position i1 */
- pSrc[2U * i1] = r1 * onebyfftLen;
- /* yc' = (ya-yb+yc-yd) * onebyfftLen */
- pSrc[(2U * i1) + 1U] = s1 * onebyfftLen;
- /* (xa - xc) - (yb-yd) */
- r1 = r2 - t1;
- /* (xa - xc) + (yb-yd) */
- r2 = r2 + t1;
- /* (ya - yc) + (xb-xd) */
- s1 = s2 + t2;
- /* (ya - yc) - (xb-xd) */
- s2 = s2 - t2;
- /* xb' = (xa-yb-xc+yd) * onebyfftLen, stored at position i2 */
- pSrc[2U * i2] = r1 * onebyfftLen;
- /* yb' = (ya+xb-yc-xd) * onebyfftLen */
- pSrc[(2U * i2) + 1U] = s1 * onebyfftLen;
- /* xd' = (xa+yb-xc-yd) * onebyfftLen */
- pSrc[2U * i3] = r2 * onebyfftLen;
- /* yd' = (ya-xb-yc+xd) * onebyfftLen */
- pSrc[(2U * i3) + 1U] = s2 * onebyfftLen;
- }
- #endif /* #if defined (ARM_MATH_DSP) */
- }
|