Home | History | Annotate | Download | only in srce
      1 /******************************************************************************
      2  *
      3  *  Copyright 1999-2012 Broadcom Corporation
      4  *
      5  *  Licensed under the Apache License, Version 2.0 (the "License");
      6  *  you may not use this file except in compliance with the License.
      7  *  You may obtain a copy of the License at:
      8  *
      9  *  http://www.apache.org/licenses/LICENSE-2.0
     10  *
     11  *  Unless required by applicable law or agreed to in writing, software
     12  *  distributed under the License is distributed on an "AS IS" BASIS,
     13  *  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
     14  *  See the License for the specific language governing permissions and
     15  *  limitations under the License.
     16  *
     17  ******************************************************************************/
     18 
     19 /******************************************************************************
     20  *
     21  *  source file for fast dct operations
     22  *
     23  ******************************************************************************/
     24 
     25 #include "sbc_dct.h"
     26 #include "sbc_enc_func_declare.h"
     27 #include "sbc_encoder.h"
     28 
     29 /*******************************************************************************
     30  *
     31  * Function         SBC_FastIDCT8
     32  *
     33  * Description      implementation of fast DCT algorithm by Feig and Winograd
     34  *
     35  *
     36  * Returns          y = dct(pInVect)
     37  *
     38  *
     39  ******************************************************************************/
     40 
     41 #if (SBC_IS_64_MULT_IN_IDCT == FALSE)
     42 #define SBC_COS_PI_SUR_4                              \
     43   (0x00005a82) /* ((0x8000) * 0.7071)     = cos(pi/4) \
     44                   */
     45 #define SBC_COS_PI_SUR_8 \
     46   (0x00007641) /* ((0x8000) * 0.9239)     = (cos(pi/8)) */
     47 #define SBC_COS_3PI_SUR_8 \
     48   (0x000030fb) /* ((0x8000) * 0.3827)     = (cos(3*pi/8)) */
     49 #define SBC_COS_PI_SUR_16 \
     50   (0x00007d8a) /* ((0x8000) * 0.9808))     = (cos(pi/16)) */
     51 #define SBC_COS_3PI_SUR_16 \
     52   (0x00006a6d) /* ((0x8000) * 0.8315))     = (cos(3*pi/16)) */
     53 #define SBC_COS_5PI_SUR_16 \
     54   (0x0000471c) /* ((0x8000) * 0.5556))     = (cos(5*pi/16)) */
     55 #define SBC_COS_7PI_SUR_16 \
     56   (0x000018f8) /* ((0x8000) * 0.1951))     = (cos(7*pi/16)) */
     57 #define SBC_IDCT_MULT(a, b, c) SBC_MULT_32_16_SIMPLIFIED(a, b, c)
     58 #else
     59 #define SBC_COS_PI_SUR_4 \
     60   (0x5A827999) /* ((0x80000000) * 0.707106781)      = (cos(pi/4)   ) */
     61 #define SBC_COS_PI_SUR_8 \
     62   (0x7641AF3C) /* ((0x80000000) * 0.923879533)      = (cos(pi/8)   ) */
     63 #define SBC_COS_3PI_SUR_8 \
     64   (0x30FBC54D) /* ((0x80000000) * 0.382683432)      = (cos(3*pi/8) ) */
     65 #define SBC_COS_PI_SUR_16 \
     66   (0x7D8A5F3F) /* ((0x80000000) * 0.98078528 ))     = (cos(pi/16)  ) */
     67 #define SBC_COS_3PI_SUR_16 \
     68   (0x6A6D98A4) /* ((0x80000000) * 0.831469612))     = (cos(3*pi/16)) */
     69 #define SBC_COS_5PI_SUR_16 \
     70   (0x471CECE6) /* ((0x80000000) * 0.555570233))     = (cos(5*pi/16)) */
     71 #define SBC_COS_7PI_SUR_16 \
     72   (0x18F8B83C) /* ((0x80000000) * 0.195090322))     = (cos(7*pi/16)) */
     73 #define SBC_IDCT_MULT(a, b, c) SBC_MULT_32_32(a, b, c)
     74 #endif /* SBC_IS_64_MULT_IN_IDCT */
     75 
     76 #if (SBC_FAST_DCT == FALSE)
     77 extern const int16_t gas16AnalDCTcoeff8[];
     78 extern const int16_t gas16AnalDCTcoeff4[];
     79 #endif
     80 
     81 void SBC_FastIDCT8(int32_t* pInVect, int32_t* pOutVect) {
     82 #if (SBC_FAST_DCT == TRUE)
     83 #if (SBC_ARM_ASM_OPT == TRUE)
     84 #else
     85 #if (SBC_IPAQ_OPT == TRUE)
     86 #if (SBC_IS_64_MULT_IN_IDCT == TRUE)
     87   int64_t s64Temp;
     88 #endif
     89 #else
     90 #if (SBC_IS_64_MULT_IN_IDCT == TRUE)
     91   int32_t s32HiTemp;
     92 #else
     93   int32_t s32In2Temp;
     94   register int32_t s32In1Temp;
     95 #endif
     96 #endif
     97 #endif
     98 
     99   register int32_t x0, x1, x2, x3, x4, x5, x6, x7, temp;
    100   int32_t res_even[4], res_odd[4];
    101   /*x0= (pInVect[4])/2 ;*/
    102   SBC_IDCT_MULT(SBC_COS_PI_SUR_4, pInVect[4], x0);
    103   /*printf("x0 0x%x = %d = %d * %d\n", x0, x0, SBC_COS_PI_SUR_4, pInVect[4]);*/
    104 
    105   x1 = (pInVect[3] + pInVect[5]) >> 1;
    106   x2 = (pInVect[2] + pInVect[6]) >> 1;
    107   x3 = (pInVect[1] + pInVect[7]) >> 1;
    108   x4 = (pInVect[0] + pInVect[8]) >> 1;
    109   x5 = (pInVect[9] - pInVect[15]) >> 1;
    110   x6 = (pInVect[10] - pInVect[14]) >> 1;
    111   x7 = (pInVect[11] - pInVect[13]) >> 1;
    112 
    113   /* 2-point IDCT of x0 and x4 as in (11) */
    114   temp = x0;
    115   SBC_IDCT_MULT(SBC_COS_PI_SUR_4, (x0 + x4),
    116                 x0); /*x0 = ( x0 + x4 ) * cos(1*pi/4) ; */
    117   SBC_IDCT_MULT(SBC_COS_PI_SUR_4, (temp - x4),
    118                 x4); /*x4 = ( temp - x4 ) * cos(1*pi/4) ; */
    119 
    120   /* rearrangement of x2 and x6 as in (15) */
    121   x2 -= x6;
    122   x6 <<= 1;
    123 
    124   /* 2-point IDCT of x2 and x6 and post-multiplication as in (15) */
    125   SBC_IDCT_MULT(SBC_COS_PI_SUR_4, x6, x6); /*x6 = x6 * cos(1*pi/4) ; */
    126   temp = x2;
    127   SBC_IDCT_MULT(SBC_COS_PI_SUR_8, (x2 + x6),
    128                 x2); /*x2 = ( x2 + x6 ) * cos(1*pi/8) ; */
    129   SBC_IDCT_MULT(SBC_COS_3PI_SUR_8, (temp - x6),
    130                 x6); /*x6 = ( temp - x6 ) * cos(3*pi/8) ;*/
    131 
    132   /* 4-point IDCT of x0,x2,x4 and x6 as in (11) */
    133   res_even[0] = x0 + x2;
    134   res_even[1] = x4 + x6;
    135   res_even[2] = x4 - x6;
    136   res_even[3] = x0 - x2;
    137 
    138   /* rearrangement of x1,x3,x5,x7 as in (15) */
    139   x7 <<= 1;
    140   x5 = (x5 << 1) - x7;
    141   x3 = (x3 << 1) - x5;
    142   x1 -= x3 >> 1;
    143 
    144   /* two-dimensional IDCT of x1 and x5 */
    145   SBC_IDCT_MULT(SBC_COS_PI_SUR_4, x5, x5); /*x5 = x5 * cos(1*pi/4) ; */
    146   temp = x1;
    147   x1 = x1 + x5;
    148   x5 = temp - x5;
    149 
    150   /* rearrangement of x3 and x7 as in (15) */
    151   x3 -= x7;
    152   x7 <<= 1;
    153   SBC_IDCT_MULT(SBC_COS_PI_SUR_4, x7, x7); /*x7 = x7 * cos(1*pi/4) ; */
    154 
    155   /* 2-point IDCT of x3 and x7 and post-multiplication as in (15) */
    156   temp = x3;
    157   SBC_IDCT_MULT(SBC_COS_PI_SUR_8, (x3 + x7),
    158                 x3); /*x3 = ( x3 + x7 ) * cos(1*pi/8)  ; */
    159   SBC_IDCT_MULT(SBC_COS_3PI_SUR_8, (temp - x7),
    160                 x7); /*x7 = ( temp - x7 ) * cos(3*pi/8) ;*/
    161 
    162   /* 4-point IDCT of x1,x3,x5 and x7 and post multiplication by diagonal matrix
    163    * as in (14) */
    164   SBC_IDCT_MULT((SBC_COS_PI_SUR_16), (x1 + x3),
    165                 res_odd[0]); /*res_odd[ 0 ] = ( x1 + x3 ) * cos(1*pi/16) ; */
    166   SBC_IDCT_MULT((SBC_COS_3PI_SUR_16), (x5 + x7),
    167                 res_odd[1]); /*res_odd[ 1 ] = ( x5 + x7 ) * cos(3*pi/16) ; */
    168   SBC_IDCT_MULT((SBC_COS_5PI_SUR_16), (x5 - x7),
    169                 res_odd[2]); /*res_odd[ 2 ] = ( x5 - x7 ) * cos(5*pi/16) ; */
    170   SBC_IDCT_MULT((SBC_COS_7PI_SUR_16), (x1 - x3),
    171                 res_odd[3]); /*res_odd[ 3 ] = ( x1 - x3 ) * cos(7*pi/16) ; */
    172 
    173   /* additions and subtractions as in (9) */
    174   pOutVect[0] = (res_even[0] + res_odd[0]);
    175   pOutVect[1] = (res_even[1] + res_odd[1]);
    176   pOutVect[2] = (res_even[2] + res_odd[2]);
    177   pOutVect[3] = (res_even[3] + res_odd[3]);
    178   pOutVect[7] = (res_even[0] - res_odd[0]);
    179   pOutVect[6] = (res_even[1] - res_odd[1]);
    180   pOutVect[5] = (res_even[2] - res_odd[2]);
    181   pOutVect[4] = (res_even[3] - res_odd[3]);
    182 #else
    183   uint8_t Index, k;
    184   int32_t temp;
    185   /*Calculate 4 subband samples by matrixing*/
    186   for (Index = 0; Index < 8; Index++) {
    187     temp = 0;
    188     for (k = 0; k < 16; k++) {
    189       /*temp += (int32_t)(((int64_t)M[(Index*strEncParams->numOfSubBands*2)+k] *
    190        * Y[k]) >> 16 );*/
    191       temp += (gas16AnalDCTcoeff8[(Index * 8 * 2) + k] * (pInVect[k] >> 16));
    192       temp +=
    193           ((gas16AnalDCTcoeff8[(Index * 8 * 2) + k] * (pInVect[k] & 0xFFFF)) >>
    194            16);
    195     }
    196     pOutVect[Index] = temp;
    197   }
    198 #endif
    199   /*    printf("pOutVect: 0x%x;0x%x;0x%x;0x%x;0x%x;0x%x;0x%x;0x%x\n",\
    200           pOutVect[0],pOutVect[1],pOutVect[2],pOutVect[3],pOutVect[4],pOutVect[5],pOutVect[6],pOutVect[7]);*/
    201 }
    202 
    203 /*******************************************************************************
    204  *
    205  * Function         SBC_FastIDCT4
    206  *
    207  * Description      implementation of fast DCT algorithm by Feig and Winograd
    208  *
    209  *
    210  * Returns          y = dct(x0)
    211  *
    212  *
    213  ******************************************************************************/
    214 void SBC_FastIDCT4(int32_t* pInVect, int32_t* pOutVect) {
    215 #if (SBC_FAST_DCT == TRUE)
    216 #if (SBC_ARM_ASM_OPT == TRUE)
    217 #else
    218 #if (SBC_IPAQ_OPT == TRUE)
    219 #if (SBC_IS_64_MULT_IN_IDCT == TRUE)
    220   int64_t s64Temp;
    221 #endif
    222 #else
    223 #if (SBC_IS_64_MULT_IN_IDCT == TRUE)
    224   int32_t s32HiTemp;
    225 #else
    226   uint16_t s32In2Temp;
    227   int32_t s32In1Temp;
    228 #endif
    229 #endif
    230 #endif
    231   int32_t temp, x2;
    232   int32_t tmp[8];
    233 
    234   x2 = pInVect[2] >> 1;
    235   temp = (pInVect[0] + pInVect[4]);
    236   SBC_IDCT_MULT((SBC_COS_PI_SUR_4 >> 1), temp, tmp[0]);
    237   tmp[1] = x2 - tmp[0];
    238   tmp[0] += x2;
    239   temp = (pInVect[1] + pInVect[3]);
    240   SBC_IDCT_MULT((SBC_COS_3PI_SUR_8 >> 1), temp, tmp[3]);
    241   SBC_IDCT_MULT((SBC_COS_PI_SUR_8 >> 1), temp, tmp[2]);
    242   temp = (pInVect[5] - pInVect[7]);
    243   SBC_IDCT_MULT((SBC_COS_3PI_SUR_8 >> 1), temp, tmp[5]);
    244   SBC_IDCT_MULT((SBC_COS_PI_SUR_8 >> 1), temp, tmp[4]);
    245   tmp[6] = tmp[2] + tmp[5];
    246   tmp[7] = tmp[3] - tmp[4];
    247   pOutVect[0] = (tmp[0] + tmp[6]);
    248   pOutVect[1] = (tmp[1] + tmp[7]);
    249   pOutVect[2] = (tmp[1] - tmp[7]);
    250   pOutVect[3] = (tmp[0] - tmp[6]);
    251 #else
    252   uint8_t Index, k;
    253   int32_t temp;
    254   /*Calculate 4 subband samples by matrixing*/
    255   for (Index = 0; Index < 4; Index++) {
    256     temp = 0;
    257     for (k = 0; k < 8; k++) {
    258       /*temp += (int32_t)(((int64_t)M[(Index*strEncParams->numOfSubBands*2)+k] *
    259        * Y[k]) >> 16 ); */
    260       temp += (gas16AnalDCTcoeff4[(Index * 4 * 2) + k] * (pInVect[k] >> 16));
    261       temp +=
    262           ((gas16AnalDCTcoeff4[(Index * 4 * 2) + k] * (pInVect[k] & 0xFFFF)) >>
    263            16);
    264     }
    265     pOutVect[Index] = temp;
    266   }
    267 #endif
    268 }
    269