123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337 |
-
- #include "coder.h"
- #include "assembly.h"
- static const int nmdctTab[NUM_IMDCT_SIZES] PROGMEM = {128, 1024};
- static const int postSkip[NUM_IMDCT_SIZES] PROGMEM = {15, 1};
- static void PreMultiply(int tabidx, int *zbuf1)
- {
- int i, nmdct, ar1, ai1, ar2, ai2, z1, z2;
- int t, cms2, cps2a, sin2a, cps2b, sin2b;
- int *zbuf2;
- const int *csptr;
- nmdct = nmdctTab[tabidx];
- zbuf2 = zbuf1 + nmdct - 1;
- csptr = cos4sin4tab + cos4sin4tabOffset[tabidx];
-
- for (i = nmdct >> 2; i != 0; i--) {
-
- cps2a = *csptr++;
- sin2a = *csptr++;
- cps2b = *csptr++;
- sin2b = *csptr++;
- ar1 = *(zbuf1 + 0);
- ai2 = *(zbuf1 + 1);
- ai1 = *(zbuf2 + 0);
- ar2 = *(zbuf2 - 1);
-
- t = MULSHIFT32(sin2a, ar1 + ai1);
- z2 = MULSHIFT32(cps2a, ai1) - t;
- cms2 = cps2a - 2*sin2a;
- z1 = MULSHIFT32(cms2, ar1) + t;
- *zbuf1++ = z1;
- *zbuf1++ = z2;
- t = MULSHIFT32(sin2b, ar2 + ai2);
- z2 = MULSHIFT32(cps2b, ai2) - t;
- cms2 = cps2b - 2*sin2b;
- z1 = MULSHIFT32(cms2, ar2) + t;
- *zbuf2-- = z2;
- *zbuf2-- = z1;
- }
- }
- static void PostMultiply(int tabidx, int *fft1)
- {
- int i, nmdct, ar1, ai1, ar2, ai2, skipFactor;
- int t, cms2, cps2, sin2;
- int *fft2;
- const int *csptr;
- nmdct = nmdctTab[tabidx];
- csptr = cos1sin1tab;
- skipFactor = postSkip[tabidx];
- fft2 = fft1 + nmdct - 1;
-
- cps2 = *csptr++;
- sin2 = *csptr;
- csptr += skipFactor;
- cms2 = cps2 - 2*sin2;
- for (i = nmdct >> 2; i != 0; i--) {
- ar1 = *(fft1 + 0);
- ai1 = *(fft1 + 1);
- ar2 = *(fft2 - 1);
- ai2 = *(fft2 + 0);
-
- t = MULSHIFT32(sin2, ar1 + ai1);
- *fft2-- = t - MULSHIFT32(cps2, ai1);
- *fft1++ = t + MULSHIFT32(cms2, ar1);
- cps2 = *csptr++;
- sin2 = *csptr;
- csptr += skipFactor;
- ai2 = -ai2;
- t = MULSHIFT32(sin2, ar2 + ai2);
- *fft2-- = t - MULSHIFT32(cps2, ai2);
- cms2 = cps2 - 2*sin2;
- *fft1++ = t + MULSHIFT32(cms2, ar2);
- }
- }
- static void PreMultiplyRescale(int tabidx, int *zbuf1, int es)
- {
- int i, nmdct, ar1, ai1, ar2, ai2, z1, z2;
- int t, cms2, cps2a, sin2a, cps2b, sin2b;
- int *zbuf2;
- const int *csptr;
- nmdct = nmdctTab[tabidx];
- zbuf2 = zbuf1 + nmdct - 1;
- csptr = cos4sin4tab + cos4sin4tabOffset[tabidx];
-
- for (i = nmdct >> 2; i != 0; i--) {
-
- cps2a = *csptr++;
- sin2a = *csptr++;
- cps2b = *csptr++;
- sin2b = *csptr++;
- ar1 = *(zbuf1 + 0) >> es;
- ai1 = *(zbuf2 + 0) >> es;
- ai2 = *(zbuf1 + 1) >> es;
- t = MULSHIFT32(sin2a, ar1 + ai1);
- z2 = MULSHIFT32(cps2a, ai1) - t;
- cms2 = cps2a - 2*sin2a;
- z1 = MULSHIFT32(cms2, ar1) + t;
- *zbuf1++ = z1;
- *zbuf1++ = z2;
- ar2 = *(zbuf2 - 1) >> es;
- t = MULSHIFT32(sin2b, ar2 + ai2);
- z2 = MULSHIFT32(cps2b, ai2) - t;
- cms2 = cps2b - 2*sin2b;
- z1 = MULSHIFT32(cms2, ar2) + t;
- *zbuf2-- = z2;
- *zbuf2-- = z1;
- }
- }
- static void PostMultiplyRescale(int tabidx, int *fft1, int es)
- {
- int i, nmdct, ar1, ai1, ar2, ai2, skipFactor, z;
- int t, cs2, sin2;
- int *fft2;
- const int *csptr;
- nmdct = nmdctTab[tabidx];
- csptr = cos1sin1tab;
- skipFactor = postSkip[tabidx];
- fft2 = fft1 + nmdct - 1;
-
- cs2 = *csptr++;
- sin2 = *csptr;
- csptr += skipFactor;
- for (i = nmdct >> 2; i != 0; i--) {
- ar1 = *(fft1 + 0);
- ai1 = *(fft1 + 1);
- ai2 = *(fft2 + 0);
- t = MULSHIFT32(sin2, ar1 + ai1);
- z = t - MULSHIFT32(cs2, ai1);
- CLIP_2N_SHIFT(z, es);
- *fft2-- = z;
- cs2 -= 2*sin2;
- z = t + MULSHIFT32(cs2, ar1);
- CLIP_2N_SHIFT(z, es);
- *fft1++ = z;
- cs2 = *csptr++;
- sin2 = *csptr;
- csptr += skipFactor;
- ar2 = *fft2;
- ai2 = -ai2;
- t = MULSHIFT32(sin2, ar2 + ai2);
- z = t - MULSHIFT32(cs2, ai2);
- CLIP_2N_SHIFT(z, es);
- *fft2-- = z;
- cs2 -= 2*sin2;
- z = t + MULSHIFT32(cs2, ar2);
- CLIP_2N_SHIFT(z, es);
- *fft1++ = z;
- cs2 += 2*sin2;
- }
- }
- void DCT4(int tabidx, int *coef, int gb)
- {
- int es;
-
- if (gb < GBITS_IN_DCT4) {
- es = GBITS_IN_DCT4 - gb;
- PreMultiplyRescale(tabidx, coef, es);
- R4FFT(tabidx, coef);
- PostMultiplyRescale(tabidx, coef, es);
- } else {
- PreMultiply(tabidx, coef);
- R4FFT(tabidx, coef);
- PostMultiply(tabidx, coef);
- }
- }
|