123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616 |
-
- #include "sbr.h"
- #include "assembly.h"
- #define FBITS_LPCOEFS 29
- #define MAG_16 (16 * (1 << (32 - (2*(32-FBITS_LPCOEFS)))))
- #define RELAX_COEF 0x7ffff79c
- static const int newBWTab[4][4] PROGMEM = {
- {0x00000000, 0x4ccccccd, 0x73333333, 0x7d70a3d7},
- {0x4ccccccd, 0x60000000, 0x73333333, 0x7d70a3d7},
- {0x00000000, 0x60000000, 0x73333333, 0x7d70a3d7},
- {0x00000000, 0x60000000, 0x73333333, 0x7d70a3d7},
- };
- #if (defined (XXXX__arm) && defined (__ARMCC_VERSION)) || (defined (_WIN32) && defined (_WIN32_WCE) && defined (ARM)) || (defined(__GNUC__) && defined(XXXX__arm__))
- #ifdef __cplusplus
- extern "C"
- #endif
- void CVKernel1(int *XBuf, int *accBuf);
- #else
- void CVKernel1(int *XBuf, int *accBuf)
- {
- U64 p01re, p01im, p12re, p12im, p11re, p22re;
- int n, x0re, x0im, x1re, x1im;
- x0re = XBuf[0];
- x0im = XBuf[1];
- XBuf += (2*64);
- x1re = XBuf[0];
- x1im = XBuf[1];
- XBuf += (2*64);
- p01re.w64 = p01im.w64 = 0;
- p12re.w64 = p12im.w64 = 0;
- p11re.w64 = 0;
- p22re.w64 = 0;
- p12re.w64 = MADD64(p12re.w64, x1re, x0re);
- p12re.w64 = MADD64(p12re.w64, x1im, x0im);
- p12im.w64 = MADD64(p12im.w64, x0re, x1im);
- p12im.w64 = MADD64(p12im.w64, -x0im, x1re);
- p22re.w64 = MADD64(p22re.w64, x0re, x0re);
- p22re.w64 = MADD64(p22re.w64, x0im, x0im);
- for (n = (NUM_TIME_SLOTS*SAMPLES_PER_SLOT + 6); n != 0; n--) {
-
- x0re = x1re;
- x0im = x1im;
- x1re = XBuf[0];
- x1im = XBuf[1];
- p01re.w64 = MADD64(p01re.w64, x1re, x0re);
- p01re.w64 = MADD64(p01re.w64, x1im, x0im);
- p01im.w64 = MADD64(p01im.w64, x0re, x1im);
- p01im.w64 = MADD64(p01im.w64, -x0im, x1re);
- p11re.w64 = MADD64(p11re.w64, x0re, x0re);
- p11re.w64 = MADD64(p11re.w64, x0im, x0im);
- XBuf += (2*64);
- }
-
- p12re.w64 += p01re.w64;
- p12re.w64 = MADD64(p12re.w64, x1re, -x0re);
- p12re.w64 = MADD64(p12re.w64, x1im, -x0im);
- p12im.w64 += p01im.w64;
- p12im.w64 = MADD64(p12im.w64, x0re, -x1im);
- p12im.w64 = MADD64(p12im.w64, x0im, x1re);
- p22re.w64 += p11re.w64;
- p22re.w64 = MADD64(p22re.w64, x0re, -x0re);
- p22re.w64 = MADD64(p22re.w64, x0im, -x0im);
- accBuf[0] = p01re.r.lo32; accBuf[1] = p01re.r.hi32;
- accBuf[2] = p01im.r.lo32; accBuf[3] = p01im.r.hi32;
- accBuf[4] = p11re.r.lo32; accBuf[5] = p11re.r.hi32;
- accBuf[6] = p12re.r.lo32; accBuf[7] = p12re.r.hi32;
- accBuf[8] = p12im.r.lo32; accBuf[9] = p12im.r.hi32;
- accBuf[10] = p22re.r.lo32; accBuf[11] = p22re.r.hi32;
- }
- #endif
- static int CalcCovariance1(int *XBuf, int *p01reN, int *p01imN, int *p12reN, int *p12imN, int *p11reN, int *p22reN)
- {
- int accBuf[2*6];
- int n, z, s, loShift, hiShift, gbMask;
- U64 p01re, p01im, p12re, p12im, p11re, p22re;
- CVKernel1(XBuf, accBuf);
- p01re.r.lo32 = accBuf[0]; p01re.r.hi32 = accBuf[1];
- p01im.r.lo32 = accBuf[2]; p01im.r.hi32 = accBuf[3];
- p11re.r.lo32 = accBuf[4]; p11re.r.hi32 = accBuf[5];
- p12re.r.lo32 = accBuf[6]; p12re.r.hi32 = accBuf[7];
- p12im.r.lo32 = accBuf[8]; p12im.r.hi32 = accBuf[9];
- p22re.r.lo32 = accBuf[10]; p22re.r.hi32 = accBuf[11];
-
- gbMask = ((p01re.r.hi32) ^ (p01re.r.hi32 >> 31)) | ((p01im.r.hi32) ^ (p01im.r.hi32 >> 31));
- gbMask |= ((p12re.r.hi32) ^ (p12re.r.hi32 >> 31)) | ((p12im.r.hi32) ^ (p12im.r.hi32 >> 31));
- gbMask |= ((p11re.r.hi32) ^ (p11re.r.hi32 >> 31)) | ((p22re.r.hi32) ^ (p22re.r.hi32 >> 31));
- if (gbMask == 0) {
- s = p01re.r.hi32 >> 31; gbMask = (p01re.r.lo32 ^ s) - s;
- s = p01im.r.hi32 >> 31; gbMask |= (p01im.r.lo32 ^ s) - s;
- s = p12re.r.hi32 >> 31; gbMask |= (p12re.r.lo32 ^ s) - s;
- s = p12im.r.hi32 >> 31; gbMask |= (p12im.r.lo32 ^ s) - s;
- s = p11re.r.hi32 >> 31; gbMask |= (p11re.r.lo32 ^ s) - s;
- s = p22re.r.hi32 >> 31; gbMask |= (p22re.r.lo32 ^ s) - s;
- z = 32 + CLZ(gbMask);
- } else {
- gbMask = FASTABS(p01re.r.hi32) | FASTABS(p01im.r.hi32);
- gbMask |= FASTABS(p12re.r.hi32) | FASTABS(p12im.r.hi32);
- gbMask |= FASTABS(p11re.r.hi32) | FASTABS(p22re.r.hi32);
- z = CLZ(gbMask);
- }
- n = 64 - z;
- if (n <= 30) {
- loShift = (30 - n);
- *p01reN = p01re.r.lo32 << loShift; *p01imN = p01im.r.lo32 << loShift;
- *p12reN = p12re.r.lo32 << loShift; *p12imN = p12im.r.lo32 << loShift;
- *p11reN = p11re.r.lo32 << loShift; *p22reN = p22re.r.lo32 << loShift;
- return -(loShift + 2*FBITS_OUT_QMFA);
- } else if (n < 32 + 30) {
- loShift = (n - 30);
- hiShift = 32 - loShift;
- *p01reN = (p01re.r.hi32 << hiShift) | (p01re.r.lo32 >> loShift);
- *p01imN = (p01im.r.hi32 << hiShift) | (p01im.r.lo32 >> loShift);
- *p12reN = (p12re.r.hi32 << hiShift) | (p12re.r.lo32 >> loShift);
- *p12imN = (p12im.r.hi32 << hiShift) | (p12im.r.lo32 >> loShift);
- *p11reN = (p11re.r.hi32 << hiShift) | (p11re.r.lo32 >> loShift);
- *p22reN = (p22re.r.hi32 << hiShift) | (p22re.r.lo32 >> loShift);
- return (loShift - 2*FBITS_OUT_QMFA);
- } else {
- hiShift = n - (32 + 30);
- *p01reN = p01re.r.hi32 >> hiShift; *p01imN = p01im.r.hi32 >> hiShift;
- *p12reN = p12re.r.hi32 >> hiShift; *p12imN = p12im.r.hi32 >> hiShift;
- *p11reN = p11re.r.hi32 >> hiShift; *p22reN = p22re.r.hi32 >> hiShift;
- return (32 - 2*FBITS_OUT_QMFA - hiShift);
- }
- return 0;
- }
- #if (defined (XXXX__arm) && defined (__ARMCC_VERSION)) || (defined (_WIN32) && defined (_WIN32_WCE) && defined (ARM)) || (defined(__GNUC__) && defined(XXXX__arm__))
- #ifdef __cplusplus
- extern "C"
- #endif
- void CVKernel2(int *XBuf, int *accBuf);
- #else
- void CVKernel2(int *XBuf, int *accBuf)
- {
- U64 p02re, p02im;
- int n, x0re, x0im, x1re, x1im, x2re, x2im;
- p02re.w64 = p02im.w64 = 0;
- x0re = XBuf[0];
- x0im = XBuf[1];
- XBuf += (2*64);
- x1re = XBuf[0];
- x1im = XBuf[1];
- XBuf += (2*64);
- for (n = (NUM_TIME_SLOTS*SAMPLES_PER_SLOT + 6); n != 0; n--) {
-
- x2re = XBuf[0];
- x2im = XBuf[1];
- p02re.w64 = MADD64(p02re.w64, x2re, x0re);
- p02re.w64 = MADD64(p02re.w64, x2im, x0im);
- p02im.w64 = MADD64(p02im.w64, x0re, x2im);
- p02im.w64 = MADD64(p02im.w64, -x0im, x2re);
- x0re = x1re;
- x0im = x1im;
- x1re = x2re;
- x1im = x2im;
- XBuf += (2*64);
- }
- accBuf[0] = p02re.r.lo32;
- accBuf[1] = p02re.r.hi32;
- accBuf[2] = p02im.r.lo32;
- accBuf[3] = p02im.r.hi32;
- }
- #endif
- static int CalcCovariance2(int *XBuf, int *p02reN, int *p02imN)
- {
- U64 p02re, p02im;
- int n, z, s, loShift, hiShift, gbMask;
- int accBuf[2*2];
- CVKernel2(XBuf, accBuf);
- p02re.r.lo32 = accBuf[0];
- p02re.r.hi32 = accBuf[1];
- p02im.r.lo32 = accBuf[2];
- p02im.r.hi32 = accBuf[3];
-
- gbMask = ((p02re.r.hi32) ^ (p02re.r.hi32 >> 31)) | ((p02im.r.hi32) ^ (p02im.r.hi32 >> 31));
- if (gbMask == 0) {
- s = p02re.r.hi32 >> 31; gbMask = (p02re.r.lo32 ^ s) - s;
- s = p02im.r.hi32 >> 31; gbMask |= (p02im.r.lo32 ^ s) - s;
- z = 32 + CLZ(gbMask);
- } else {
- gbMask = FASTABS(p02re.r.hi32) | FASTABS(p02im.r.hi32);
- z = CLZ(gbMask);
- }
- n = 64 - z;
- if (n <= 30) {
- loShift = (30 - n);
- *p02reN = p02re.r.lo32 << loShift;
- *p02imN = p02im.r.lo32 << loShift;
- return -(loShift + 2*FBITS_OUT_QMFA);
- } else if (n < 32 + 30) {
- loShift = (n - 30);
- hiShift = 32 - loShift;
- *p02reN = (p02re.r.hi32 << hiShift) | (p02re.r.lo32 >> loShift);
- *p02imN = (p02im.r.hi32 << hiShift) | (p02im.r.lo32 >> loShift);
- return (loShift - 2*FBITS_OUT_QMFA);
- } else {
- hiShift = n - (32 + 30);
- *p02reN = p02re.r.hi32 >> hiShift;
- *p02imN = p02im.r.hi32 >> hiShift;
- return (32 - 2*FBITS_OUT_QMFA - hiShift);
- }
- return 0;
- }
- static void CalcLPCoefs(int *XBuf, int *a0re, int *a0im, int *a1re, int *a1im, int gb)
- {
- int zFlag, n1, n2, nd, d, dInv, tre, tim;
- int p01re, p01im, p02re, p02im, p12re, p12im, p11re, p22re;
-
- if (gb < 3) {
- nd = 3 - gb;
- for (n1 = (NUM_TIME_SLOTS*SAMPLES_PER_SLOT + 6 + 2); n1 != 0; n1--) {
- XBuf[0] >>= nd; XBuf[1] >>= nd;
- XBuf += (2*64);
- }
- XBuf -= (2*64*(NUM_TIME_SLOTS*SAMPLES_PER_SLOT + 6 + 2));
- }
-
-
- n1 = CalcCovariance1(XBuf, &p01re, &p01im, &p12re, &p12im, &p11re, &p22re);
- n2 = CalcCovariance2(XBuf, &p02re, &p02im);
-
- if (n1 < n2) {
- nd = MIN(n2 - n1, 31);
- p01re >>= nd; p01im >>= nd;
- p12re >>= nd; p12im >>= nd;
- p11re >>= nd; p22re >>= nd;
- n1 = n2;
- } else if (n1 > n2) {
- nd = MIN(n1 - n2, 31);
- p02re >>= nd; p02im >>= nd;
- }
-
- d = MULSHIFT32(p12re, p12re) + MULSHIFT32(p12im, p12im);
- d = MULSHIFT32(d, RELAX_COEF) << 1;
- d = MULSHIFT32(p11re, p22re) - d;
- ASSERT(d >= 0);
- zFlag = 0;
- *a0re = *a0im = 0;
- *a1re = *a1im = 0;
- if (d > 0) {
-
- nd = CLZ(d) - 1;
- d <<= nd;
- dInv = InvRNormalized(d);
-
- tre = MULSHIFT32(p01re, p12re) - MULSHIFT32(p01im, p12im) - MULSHIFT32(p02re, p11re);
- tre = MULSHIFT32(tre, dInv);
- tim = MULSHIFT32(p01re, p12im) + MULSHIFT32(p01im, p12re) - MULSHIFT32(p02im, p11re);
- tim = MULSHIFT32(tim, dInv);
-
- if (nd > 28 || (FASTABS(tre) >> (28 - nd)) >= 4 || (FASTABS(tim) >> (28 - nd)) >= 4) {
- zFlag = 1;
- } else {
- *a1re = tre << (FBITS_LPCOEFS - 28 + nd);
- *a1im = tim << (FBITS_LPCOEFS - 28 + nd);
- }
- }
- if (p11re) {
-
- nd = CLZ(p11re) - 1;
- p11re <<= nd;
- dInv = InvRNormalized(p11re);
-
- tre = (p01re >> 3) + MULSHIFT32(p12re, *a1re) + MULSHIFT32(p12im, *a1im);
- tre = -MULSHIFT32(tre, dInv);
- tim = (p01im >> 3) - MULSHIFT32(p12im, *a1re) + MULSHIFT32(p12re, *a1im);
- tim = -MULSHIFT32(tim, dInv);
- if (nd > 25 || (FASTABS(tre) >> (25 - nd)) >= 4 || (FASTABS(tim) >> (25 - nd)) >= 4) {
- zFlag = 1;
- } else {
- *a0re = tre << (FBITS_LPCOEFS - 25 + nd);
- *a0im = tim << (FBITS_LPCOEFS - 25 + nd);
- }
- }
-
- if (zFlag || MULSHIFT32(*a0re, *a0re) + MULSHIFT32(*a0im, *a0im) >= MAG_16 || MULSHIFT32(*a1re, *a1re) + MULSHIFT32(*a1im, *a1im) >= MAG_16) {
- *a0re = *a0im = 0;
- *a1re = *a1im = 0;
- }
-
- if (gb < 3) {
- nd = 3 - gb;
- for (n1 = (NUM_TIME_SLOTS*SAMPLES_PER_SLOT + 6 + 2); n1 != 0; n1--) {
- XBuf[0] <<= nd; XBuf[1] <<= nd;
- XBuf += (2*64);
- }
- }
- }
- void GenerateHighFreq(PSInfoSBR *psi, SBRGrid *sbrGrid, SBRFreq *sbrFreq, SBRChan *sbrChan, int ch)
- {
- int band, newBW, c, t, gb, gbMask, gbIdx;
- int currPatch, p, x, k, g, i, iStart, iEnd, bw, bwsq;
- int a0re, a0im, a1re, a1im;
- int x1re, x1im, x2re, x2im;
- int ACCre, ACCim;
- int *XBufLo, *XBufHi;
- (void) ch;
-
- for (band = 0; band < sbrFreq->numNoiseFloorBands; band++) {
- c = sbrChan->chirpFact[band];
- newBW = newBWTab[sbrChan->invfMode[0][band]][sbrChan->invfMode[1][band]];
-
- if (newBW < c)
- t = MULSHIFT32(newBW, 0x60000000) + MULSHIFT32(0x20000000, c);
- else
- t = MULSHIFT32(newBW, 0x74000000) + MULSHIFT32(0x0c000000, c);
- t <<= 1;
- if (t < 0x02000000)
- t = 0;
- if (t > 0x7f800000)
- t = 0x7f800000;
-
- sbrChan->chirpFact[band] = t;
- sbrChan->invfMode[0][band] = sbrChan->invfMode[1][band];
- }
- iStart = sbrGrid->envTimeBorder[0] + HF_ADJ;
- iEnd = sbrGrid->envTimeBorder[sbrGrid->numEnv] + HF_ADJ;
-
- k = sbrFreq->kStart;
- g = 0;
- bw = sbrChan->chirpFact[g];
- bwsq = MULSHIFT32(bw, bw) << 1;
-
- gbMask = (sbrChan->gbMask[0] | sbrChan->gbMask[1]);
- gb = CLZ(gbMask) - 1;
- for (currPatch = 0; currPatch < sbrFreq->numPatches; currPatch++) {
- for (x = 0; x < sbrFreq->patchNumSubbands[currPatch]; x++) {
-
- if (k >= sbrFreq->freqNoise[g+1]) {
- g++;
- bw = sbrChan->chirpFact[g];
- bwsq = MULSHIFT32(bw, bw) << 1;
- }
-
- p = sbrFreq->patchStartSubband[currPatch] + x;
- XBufHi = psi->XBuf[iStart][k];
- if (bw) {
- CalcLPCoefs(psi->XBuf[0][p], &a0re, &a0im, &a1re, &a1im, gb);
- a0re = MULSHIFT32(bw, a0re);
- a0im = MULSHIFT32(bw, a0im);
- a1re = MULSHIFT32(bwsq, a1re);
- a1im = MULSHIFT32(bwsq, a1im);
- XBufLo = psi->XBuf[iStart-2][p];
- x2re = XBufLo[0];
- x2im = XBufLo[1];
- XBufLo += (64*2);
- x1re = XBufLo[0];
- x1im = XBufLo[1];
- XBufLo += (64*2);
- for (i = iStart; i < iEnd; i++) {
-
- ACCre = MULSHIFT32(x2re, a1re) - MULSHIFT32(x2im, a1im);
- ACCim = MULSHIFT32(x2re, a1im) + MULSHIFT32(x2im, a1re);
- x2re = x1re;
- x2im = x1im;
-
- ACCre += MULSHIFT32(x1re, a0re) - MULSHIFT32(x1im, a0im);
- ACCim += MULSHIFT32(x1re, a0im) + MULSHIFT32(x1im, a0re);
- x1re = XBufLo[0];
- x1im = XBufLo[1];
- XBufLo += (64*2);
-
- CLIP_2N_SHIFT30(ACCre, 4);
- ACCre += x1re;
- CLIP_2N_SHIFT30(ACCim, 4);
- ACCim += x1im;
- XBufHi[0] = ACCre;
- XBufHi[1] = ACCim;
- XBufHi += (64*2);
-
- gbMask = FASTABS(ACCre);
- gbMask |= FASTABS(ACCim);
- gbIdx = (i >> 5) & 0x01;
- sbrChan->gbMask[gbIdx] |= gbMask;
- }
- } else {
- XBufLo = (int *)psi->XBuf[iStart][p];
- for (i = iStart; i < iEnd; i++) {
- XBufHi[0] = XBufLo[0];
- XBufHi[1] = XBufLo[1];
- XBufLo += (64*2);
- XBufHi += (64*2);
- }
- }
- k++;
- }
- }
- }
|