1 /****************************************************************************** 2 * 3 * Copyright (C) 1999-2012 Broadcom Corporation 4 * 5 * Licensed under the Apache License, Version 2.0 (the "License"); 6 * you may not use this file except in compliance with the License. 7 * You may obtain a copy of the License at: 8 * 9 * http://www.apache.org/licenses/LICENSE-2.0 10 * 11 * Unless required by applicable law or agreed to in writing, software 12 * distributed under the License is distributed on an "AS IS" BASIS, 13 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 14 * See the License for the specific language governing permissions and 15 * limitations under the License. 16 * 17 ******************************************************************************/ 18 19 /****************************************************************************** 20 * 21 * source file for fast dct operations 22 * 23 ******************************************************************************/ 24 25 #include "sbc_encoder.h" 26 #include "sbc_enc_func_declare.h" 27 #include "sbc_dct.h" 28 29 30 31 /******************************************************************************* 32 ** 33 ** Function SBC_FastIDCT8 34 ** 35 ** Description implementation of fast DCT algorithm by Feig and Winograd 36 ** 37 ** 38 ** Returns y = dct(pInVect) 39 ** 40 ** 41 *******************************************************************************/ 42 43 #if (SBC_IS_64_MULT_IN_IDCT == FALSE) 44 #define SBC_COS_PI_SUR_4 (0x00005a82) /* ((0x8000) * 0.7071) = cos(pi/4) */ 45 #define SBC_COS_PI_SUR_8 (0x00007641) /* ((0x8000) * 0.9239) = (cos(pi/8)) */ 46 #define SBC_COS_3PI_SUR_8 (0x000030fb) /* ((0x8000) * 0.3827) = (cos(3*pi/8)) */ 47 #define SBC_COS_PI_SUR_16 (0x00007d8a) /* ((0x8000) * 0.9808)) = (cos(pi/16)) */ 48 #define SBC_COS_3PI_SUR_16 (0x00006a6d) /* ((0x8000) * 0.8315)) = (cos(3*pi/16)) */ 49 #define SBC_COS_5PI_SUR_16 (0x0000471c) /* ((0x8000) * 0.5556)) = (cos(5*pi/16)) */ 50 #define SBC_COS_7PI_SUR_16 (0x000018f8) /* ((0x8000) * 0.1951)) = (cos(7*pi/16)) */ 51 #define SBC_IDCT_MULT(a,b,c) SBC_MULT_32_16_SIMPLIFIED(a,b,c) 52 #else 53 #define SBC_COS_PI_SUR_4 (0x5A827999) /* ((0x80000000) * 0.707106781) = (cos(pi/4) ) */ 54 #define SBC_COS_PI_SUR_8 (0x7641AF3C) /* ((0x80000000) * 0.923879533) = (cos(pi/8) ) */ 55 #define SBC_COS_3PI_SUR_8 (0x30FBC54D) /* ((0x80000000) * 0.382683432) = (cos(3*pi/8) ) */ 56 #define SBC_COS_PI_SUR_16 (0x7D8A5F3F) /* ((0x80000000) * 0.98078528 )) = (cos(pi/16) ) */ 57 #define SBC_COS_3PI_SUR_16 (0x6A6D98A4) /* ((0x80000000) * 0.831469612)) = (cos(3*pi/16)) */ 58 #define SBC_COS_5PI_SUR_16 (0x471CECE6) /* ((0x80000000) * 0.555570233)) = (cos(5*pi/16)) */ 59 #define SBC_COS_7PI_SUR_16 (0x18F8B83C) /* ((0x80000000) * 0.195090322)) = (cos(7*pi/16)) */ 60 #define SBC_IDCT_MULT(a,b,c) SBC_MULT_32_32(a,b,c) 61 #endif /* SBC_IS_64_MULT_IN_IDCT */ 62 63 #if (SBC_FAST_DCT == FALSE) 64 extern const SINT16 gas16AnalDCTcoeff8[]; 65 extern const SINT16 gas16AnalDCTcoeff4[]; 66 #endif 67 68 void SBC_FastIDCT8(SINT32 *pInVect, SINT32 *pOutVect) 69 { 70 #if (SBC_FAST_DCT == TRUE) 71 #if (SBC_ARM_ASM_OPT==TRUE) 72 #else 73 #if (SBC_IPAQ_OPT==TRUE) 74 #if (SBC_IS_64_MULT_IN_IDCT == TRUE) 75 SINT64 s64Temp; 76 #endif 77 #else 78 #if (SBC_IS_64_MULT_IN_IDCT == TRUE) 79 SINT32 s32HiTemp; 80 #else 81 SINT32 s32In2Temp; 82 register SINT32 s32In1Temp; 83 #endif 84 #endif 85 #endif 86 87 register SINT32 x0, x1, x2, x3, x4, x5, x6, x7,temp; 88 SINT32 res_even[4], res_odd[4]; 89 /*x0= (pInVect[4])/2 ;*/ 90 SBC_IDCT_MULT(SBC_COS_PI_SUR_4,pInVect[4], x0); 91 /*printf("x0 0x%x = %d = %d * %d\n", x0, x0, SBC_COS_PI_SUR_4, pInVect[4]);*/ 92 93 x1 = (pInVect[3] + pInVect[5]) >>1; 94 x2 = (pInVect[2] + pInVect[6]) >>1; 95 x3 = (pInVect[1] + pInVect[7]) >>1; 96 x4 = (pInVect[0] + pInVect[8]) >>1; 97 x5 = (pInVect[9] - pInVect[15]) >>1; 98 x6 = (pInVect[10] - pInVect[14])>>1; 99 x7 = (pInVect[11] - pInVect[13])>>1; 100 101 /* 2-point IDCT of x0 and x4 as in (11) */ 102 temp = x0 ; 103 SBC_IDCT_MULT(SBC_COS_PI_SUR_4, ( x0 + x4 ), x0); /*x0 = ( x0 + x4 ) * cos(1*pi/4) ; */ 104 SBC_IDCT_MULT(SBC_COS_PI_SUR_4, ( temp - x4 ), x4); /*x4 = ( temp - x4 ) * cos(1*pi/4) ; */ 105 106 /* rearrangement of x2 and x6 as in (15) */ 107 x2 -=x6; 108 x6 <<= 1 ; 109 110 /* 2-point IDCT of x2 and x6 and post-multiplication as in (15) */ 111 SBC_IDCT_MULT(SBC_COS_PI_SUR_4,x6, x6); /*x6 = x6 * cos(1*pi/4) ; */ 112 temp = x2 ; 113 SBC_IDCT_MULT(SBC_COS_PI_SUR_8,( x2 + x6 ), x2); /*x2 = ( x2 + x6 ) * cos(1*pi/8) ; */ 114 SBC_IDCT_MULT(SBC_COS_3PI_SUR_8,( temp - x6 ), x6); /*x6 = ( temp - x6 ) * cos(3*pi/8) ;*/ 115 116 /* 4-point IDCT of x0,x2,x4 and x6 as in (11) */ 117 res_even[ 0 ] = x0 + x2 ; 118 res_even[ 1 ] = x4 + x6 ; 119 res_even[ 2 ] = x4 - x6 ; 120 res_even[ 3 ] = x0 - x2 ; 121 122 123 /* rearrangement of x1,x3,x5,x7 as in (15) */ 124 x7 <<= 1 ; 125 x5 = ( x5 <<1 ) - x7 ; 126 x3 = ( x3 <<1 ) - x5 ; 127 x1 -= x3 >>1 ; 128 129 /* two-dimensional IDCT of x1 and x5 */ 130 SBC_IDCT_MULT(SBC_COS_PI_SUR_4, x5, x5); /*x5 = x5 * cos(1*pi/4) ; */ 131 temp = x1 ; 132 x1 = x1 + x5 ; 133 x5 = temp - x5 ; 134 135 /* rearrangement of x3 and x7 as in (15) */ 136 x3 -= x7; 137 x7 <<= 1 ; 138 SBC_IDCT_MULT(SBC_COS_PI_SUR_4, x7, x7); /*x7 = x7 * cos(1*pi/4) ; */ 139 140 /* 2-point IDCT of x3 and x7 and post-multiplication as in (15) */ 141 temp = x3 ; 142 SBC_IDCT_MULT( SBC_COS_PI_SUR_8,( x3 + x7 ), x3); /*x3 = ( x3 + x7 ) * cos(1*pi/8) ; */ 143 SBC_IDCT_MULT( SBC_COS_3PI_SUR_8,( temp - x7 ), x7); /*x7 = ( temp - x7 ) * cos(3*pi/8) ;*/ 144 145 /* 4-point IDCT of x1,x3,x5 and x7 and post multiplication by diagonal matrix as in (14) */ 146 SBC_IDCT_MULT((SBC_COS_PI_SUR_16), ( x1 + x3 ) , res_odd[0]); /*res_odd[ 0 ] = ( x1 + x3 ) * cos(1*pi/16) ; */ 147 SBC_IDCT_MULT((SBC_COS_3PI_SUR_16), ( x5 + x7 ) , res_odd[1]); /*res_odd[ 1 ] = ( x5 + x7 ) * cos(3*pi/16) ; */ 148 SBC_IDCT_MULT((SBC_COS_5PI_SUR_16), ( x5 - x7 ) , res_odd[2]); /*res_odd[ 2 ] = ( x5 - x7 ) * cos(5*pi/16) ; */ 149 SBC_IDCT_MULT((SBC_COS_7PI_SUR_16), ( x1 - x3 ) , res_odd[3]); /*res_odd[ 3 ] = ( x1 - x3 ) * cos(7*pi/16) ; */ 150 151 /* additions and subtractions as in (9) */ 152 pOutVect[0] = (res_even[ 0 ] + res_odd[ 0 ]) ; 153 pOutVect[1] = (res_even[ 1 ] + res_odd[ 1 ]) ; 154 pOutVect[2] = (res_even[ 2 ] + res_odd[ 2 ]) ; 155 pOutVect[3] = (res_even[ 3 ] + res_odd[ 3 ]) ; 156 pOutVect[7] = (res_even[ 0 ] - res_odd[ 0 ]) ; 157 pOutVect[6] = (res_even[ 1 ] - res_odd[ 1 ]) ; 158 pOutVect[5] = (res_even[ 2 ] - res_odd[ 2 ]) ; 159 pOutVect[4] = (res_even[ 3 ] - res_odd[ 3 ]) ; 160 #else 161 UINT8 Index, k; 162 SINT32 temp; 163 /*Calculate 4 subband samples by matrixing*/ 164 for(Index=0; Index<8; Index++) 165 { 166 temp = 0; 167 for(k=0; k<16; k++) 168 { 169 /*temp += (SINT32)(((SINT64)M[(Index*strEncParams->numOfSubBands*2)+k] * Y[k]) >> 16 );*/ 170 temp += (gas16AnalDCTcoeff8[(Index*8*2)+k] * (pInVect[k] >> 16)); 171 temp += ((gas16AnalDCTcoeff8[(Index*8*2)+k] * (pInVect[k] & 0xFFFF)) >> 16); 172 } 173 pOutVect[Index] = temp; 174 } 175 #endif 176 /* printf("pOutVect: 0x%x;0x%x;0x%x;0x%x;0x%x;0x%x;0x%x;0x%x\n",\ 177 pOutVect[0],pOutVect[1],pOutVect[2],pOutVect[3],pOutVect[4],pOutVect[5],pOutVect[6],pOutVect[7]);*/ 178 } 179 180 /******************************************************************************* 181 ** 182 ** Function SBC_FastIDCT4 183 ** 184 ** Description implementation of fast DCT algorithm by Feig and Winograd 185 ** 186 ** 187 ** Returns y = dct(x0) 188 ** 189 ** 190 *******************************************************************************/ 191 void SBC_FastIDCT4(SINT32 *pInVect, SINT32 *pOutVect) 192 { 193 #if (SBC_FAST_DCT == TRUE) 194 #if (SBC_ARM_ASM_OPT==TRUE) 195 #else 196 #if (SBC_IPAQ_OPT==TRUE) 197 #if (SBC_IS_64_MULT_IN_IDCT == TRUE) 198 SINT64 s64Temp; 199 #endif 200 #else 201 #if (SBC_IS_64_MULT_IN_IDCT == TRUE) 202 SINT32 s32HiTemp; 203 #else 204 UINT16 s32In2Temp; 205 SINT32 s32In1Temp; 206 #endif 207 #endif 208 #endif 209 SINT32 temp,x2; 210 SINT32 tmp[8]; 211 212 x2=pInVect[2]>>1; 213 temp=(pInVect[0]+pInVect[4]); 214 SBC_IDCT_MULT((SBC_COS_PI_SUR_4>>1), temp , tmp[0]); 215 tmp[1]=x2-tmp[0]; 216 tmp[0]+=x2; 217 temp=(pInVect[1]+pInVect[3]); 218 SBC_IDCT_MULT((SBC_COS_3PI_SUR_8>>1), temp , tmp[3]); 219 SBC_IDCT_MULT((SBC_COS_PI_SUR_8>>1), temp , tmp[2]); 220 temp=(pInVect[5]-pInVect[7]); 221 SBC_IDCT_MULT((SBC_COS_3PI_SUR_8>>1), temp , tmp[5]); 222 SBC_IDCT_MULT((SBC_COS_PI_SUR_8>>1), temp , tmp[4]); 223 tmp[6]=tmp[2]+tmp[5]; 224 tmp[7]=tmp[3]-tmp[4]; 225 pOutVect[0] = (tmp[0]+tmp[6]); 226 pOutVect[1] = (tmp[1]+tmp[7]); 227 pOutVect[2] = (tmp[1]-tmp[7]); 228 pOutVect[3] = (tmp[0]-tmp[6]); 229 #else 230 UINT8 Index, k; 231 SINT32 temp; 232 /*Calculate 4 subband samples by matrixing*/ 233 for(Index=0; Index<4; Index++) 234 { 235 temp = 0; 236 for(k=0; k<8; k++) 237 { 238 /*temp += (SINT32)(((SINT64)M[(Index*strEncParams->numOfSubBands*2)+k] * Y[k]) >> 16 ); */ 239 temp += (gas16AnalDCTcoeff4[(Index*4*2)+k] * (pInVect[k] >> 16)); 240 temp += ((gas16AnalDCTcoeff4[(Index*4*2)+k] * (pInVect[k] & 0xFFFF)) >> 16); 241 } 242 pOutVect[Index] = temp; 243 } 244 #endif 245 } 246