123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295 |
-
- #include "coder.h"
- #include "assembly.h"
- #define DEF_NFRACBITS (DQ_FRACBITS_OUT - 2 - 2 - 15) /* right shift applied by ClipToShort() to each output sample; DQ_FRACBITS_OUT is defined outside this file. NOTE(review): meaning of the individual -2, -2, -15 terms is not visible here - confirm against the headers */
- #define CSHIFT 12 /* the 64-bit accumulators are shifted right by (32 - CSHIFT) before the result is narrowed to int and clipped */
/*
 * ClipToShort - drop fractional bits and saturate to the 16-bit signed range.
 *
 * x         value to convert
 * fracBits  number of low-order bits to discard (right shift count)
 *
 * Returns x >> fracBits when that fits in a short, otherwise 32767 for
 * positive overflow or -32768 for negative overflow.  No rounding is done
 * here; the shift simply discards the low bits.
 *
 * Relies on >> of a negative int being an arithmetic shift.
 */
static __inline short ClipToShort(int x, int fracBits)
{
	const int scaled = x >> fracBits;

	if (scaled > 32767)
		return (short)32767;
	if (scaled < -32768)
		return (short)-32768;

	return (short)scaled;
}
/*
 * Multiply-accumulate steps for the mono path.
 *
 * These are statement macros, not expressions: they expand to a brace block
 * and are invoked without a trailing semicolon.  They read and modify the
 * caller's locals coef, vb1, vLo, vHi, c1, c2, sum1L (and sum2L for MC2M).
 * Each one advances coef past the coefficients it consumes.
 * MADD64 comes from an included header; presumably it returns
 * acc + (64-bit) a * b - confirm there.
 *
 * MC0M(x): two coefficients; sum1L += vb1[x]*c1 - vb1[23-x]*c2
 */
#define MC0M(x)	{ \
	c1 = *coef++; \
	c2 = *coef++; \
	vLo = vb1[(x)]; \
	vHi = vb1[23 - (x)]; \
	sum1L = MADD64(sum1L, vLo,  c1); \
	sum1L = MADD64(sum1L, vHi, -c2); \
}

/* MC1M(x): one coefficient; sum1L += vb1[x]*c1 */
#define MC1M(x)	{ \
	c1 = *coef++; \
	vLo = vb1[(x)]; \
	sum1L = MADD64(sum1L, vLo, c1); \
}

/*
 * MC2M(x): two coefficients feeding two accumulators;
 *   sum1L += vb1[x]*c1 - vb1[23-x]*c2
 *   sum2L += vb1[x]*c2 + vb1[23-x]*c1
 */
#define MC2M(x)	{ \
	c1 = *coef++; \
	c2 = *coef++; \
	vLo = vb1[(x)]; \
	vHi = vb1[23 - (x)]; \
	sum1L = MADD64(sum1L, vLo,  c1); \
	sum2L = MADD64(sum2L, vLo,  c2); \
	sum1L = MADD64(sum1L, vHi, -c2); \
	sum2L = MADD64(sum2L, vHi,  c1); \
}
- void PolyphaseMono(short *pcm, int *vbuf, const int *coefBase)
- {
- int i;
- const int *coef;
- int *vb1;
- int vLo, vHi, c1, c2;
- Word64 sum1L, sum2L, rndVal;
- rndVal = (Word64)( 1 << (DEF_NFRACBITS - 1 + (32 - CSHIFT)) );
-
- coef = coefBase;
- vb1 = vbuf;
- sum1L = rndVal;
- MC0M(0)
- MC0M(1)
- MC0M(2)
- MC0M(3)
- MC0M(4)
- MC0M(5)
- MC0M(6)
- MC0M(7)
- *(pcm + 0) = ClipToShort((int)SAR64(sum1L, (32-CSHIFT)), DEF_NFRACBITS);
-
- coef = coefBase + 256;
- vb1 = vbuf + 64*16;
- sum1L = rndVal;
- MC1M(0)
- MC1M(1)
- MC1M(2)
- MC1M(3)
- MC1M(4)
- MC1M(5)
- MC1M(6)
- MC1M(7)
- *(pcm + 16) = ClipToShort((int)SAR64(sum1L, (32-CSHIFT)), DEF_NFRACBITS);
-
- coef = coefBase + 16;
- vb1 = vbuf + 64;
- pcm++;
-
- for (i = 15; i > 0; i--) {
- sum1L = sum2L = rndVal;
- MC2M(0)
- MC2M(1)
- MC2M(2)
- MC2M(3)
- MC2M(4)
- MC2M(5)
- MC2M(6)
- MC2M(7)
- vb1 += 64;
- *(pcm) = ClipToShort((int)SAR64(sum1L, (32-CSHIFT)), DEF_NFRACBITS);
- *(pcm + 2*i) = ClipToShort((int)SAR64(sum2L, (32-CSHIFT)), DEF_NFRACBITS);
- pcm++;
- }
- }
/*
 * Multiply-accumulate steps for the stereo path.
 *
 * Same shape as the mono macros, but every step is applied twice with the
 * same coefficients: once to vb1[...] for the sum*L accumulators and once
 * to vb1[32 + ...] for the sum*R accumulators.
 *
 * These are statement macros (brace block, invoked without a trailing
 * semicolon) that read and modify the caller's locals coef, vb1, vLo, vHi,
 * c1, c2, sum1L, sum1R (and sum2L, sum2R for MC2S).  Each one advances coef
 * past the coefficients it consumes.  MADD64 comes from an included header;
 * presumably it returns acc + (64-bit) a * b - confirm there.
 *
 * MC0S(x): two coefficients;
 *   sum1L += vb1[x]*c1    - vb1[23-x]*c2
 *   sum1R += vb1[32+x]*c1 - vb1[32+23-x]*c2
 */
#define MC0S(x)	{ \
	c1 = *coef++; \
	c2 = *coef++; \
	vLo = vb1[(x)]; \
	vHi = vb1[23 - (x)]; \
	sum1L = MADD64(sum1L, vLo,  c1); \
	sum1L = MADD64(sum1L, vHi, -c2); \
	vLo = vb1[32 + (x)]; \
	vHi = vb1[32 + (23 - (x))]; \
	sum1R = MADD64(sum1R, vLo,  c1); \
	sum1R = MADD64(sum1R, vHi, -c2); \
}

/* MC1S(x): one coefficient; sum1L += vb1[x]*c1, sum1R += vb1[32+x]*c1 */
#define MC1S(x)	{ \
	c1 = *coef++; \
	vLo = vb1[(x)]; \
	sum1L = MADD64(sum1L, vLo, c1); \
	vLo = vb1[32 + (x)]; \
	sum1R = MADD64(sum1R, vLo, c1); \
}

/*
 * MC2S(x): two coefficients feeding two accumulators per channel;
 *   sum1L += vb1[x]*c1 - vb1[23-x]*c2,   sum2L += vb1[x]*c2 + vb1[23-x]*c1
 *   and the same for sum1R/sum2R using vb1[32 + ...].
 */
#define MC2S(x)	{ \
	c1 = *coef++; \
	c2 = *coef++; \
	vLo = vb1[(x)]; \
	vHi = vb1[23 - (x)]; \
	sum1L = MADD64(sum1L, vLo,  c1); \
	sum2L = MADD64(sum2L, vLo,  c2); \
	sum1L = MADD64(sum1L, vHi, -c2); \
	sum2L = MADD64(sum2L, vHi,  c1); \
	vLo = vb1[32 + (x)]; \
	vHi = vb1[32 + (23 - (x))]; \
	sum1R = MADD64(sum1R, vLo,  c1); \
	sum2R = MADD64(sum2R, vLo,  c2); \
	sum1R = MADD64(sum1R, vHi, -c2); \
	sum2R = MADD64(sum2R, vHi,  c1); \
}
- void PolyphaseStereo(short *pcm, int *vbuf, const int *coefBase)
- {
- int i;
- const int *coef;
- int *vb1;
- int vLo, vHi, c1, c2;
- Word64 sum1L, sum2L, sum1R, sum2R, rndVal;
- rndVal = (Word64)( 1 << (DEF_NFRACBITS - 1 + (32 - CSHIFT)) );
-
- coef = coefBase;
- vb1 = vbuf;
- sum1L = sum1R = rndVal;
- MC0S(0)
- MC0S(1)
- MC0S(2)
- MC0S(3)
- MC0S(4)
- MC0S(5)
- MC0S(6)
- MC0S(7)
- *(pcm + 0) = ClipToShort((int)SAR64(sum1L, (32-CSHIFT)), DEF_NFRACBITS);
- *(pcm + 1) = ClipToShort((int)SAR64(sum1R, (32-CSHIFT)), DEF_NFRACBITS);
-
- coef = coefBase + 256;
- vb1 = vbuf + 64*16;
- sum1L = sum1R = rndVal;
- MC1S(0)
- MC1S(1)
- MC1S(2)
- MC1S(3)
- MC1S(4)
- MC1S(5)
- MC1S(6)
- MC1S(7)
- *(pcm + 2*16 + 0) = ClipToShort((int)SAR64(sum1L, (32-CSHIFT)), DEF_NFRACBITS);
- *(pcm + 2*16 + 1) = ClipToShort((int)SAR64(sum1R, (32-CSHIFT)), DEF_NFRACBITS);
-
- coef = coefBase + 16;
- vb1 = vbuf + 64;
- pcm += 2;
-
- for (i = 15; i > 0; i--) {
- sum1L = sum2L = rndVal;
- sum1R = sum2R = rndVal;
- MC2S(0)
- MC2S(1)
- MC2S(2)
- MC2S(3)
- MC2S(4)
- MC2S(5)
- MC2S(6)
- MC2S(7)
- vb1 += 64;
- *(pcm + 0) = ClipToShort((int)SAR64(sum1L, (32-CSHIFT)), DEF_NFRACBITS);
- *(pcm + 1) = ClipToShort((int)SAR64(sum1R, (32-CSHIFT)), DEF_NFRACBITS);
- *(pcm + 2*2*i + 0) = ClipToShort((int)SAR64(sum2L, (32-CSHIFT)), DEF_NFRACBITS);
- *(pcm + 2*2*i + 1) = ClipToShort((int)SAR64(sum2R, (32-CSHIFT)), DEF_NFRACBITS);
- pcm += 2;
- }
- }
|