1*df25739fSMilanka Ringwald /******************************************************************************
2*df25739fSMilanka Ringwald *
3*df25739fSMilanka Ringwald * Copyright (C) 1999-2012 Broadcom Corporation
4*df25739fSMilanka Ringwald *
5*df25739fSMilanka Ringwald * Licensed under the Apache License, Version 2.0 (the "License");
6*df25739fSMilanka Ringwald * you may not use this file except in compliance with the License.
7*df25739fSMilanka Ringwald * You may obtain a copy of the License at:
8*df25739fSMilanka Ringwald *
9*df25739fSMilanka Ringwald * http://www.apache.org/licenses/LICENSE-2.0
10*df25739fSMilanka Ringwald *
11*df25739fSMilanka Ringwald * Unless required by applicable law or agreed to in writing, software
12*df25739fSMilanka Ringwald * distributed under the License is distributed on an "AS IS" BASIS,
13*df25739fSMilanka Ringwald * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14*df25739fSMilanka Ringwald * See the License for the specific language governing permissions and
15*df25739fSMilanka Ringwald * limitations under the License.
16*df25739fSMilanka Ringwald *
17*df25739fSMilanka Ringwald ******************************************************************************/
18*df25739fSMilanka Ringwald
19*df25739fSMilanka Ringwald /******************************************************************************
20*df25739fSMilanka Ringwald *
21*df25739fSMilanka Ringwald * source file for fast dct operations
22*df25739fSMilanka Ringwald *
23*df25739fSMilanka Ringwald ******************************************************************************/
24*df25739fSMilanka Ringwald
25*df25739fSMilanka Ringwald #include "sbc_encoder.h"
26*df25739fSMilanka Ringwald #include "sbc_enc_func_declare.h"
27*df25739fSMilanka Ringwald #include "sbc_dct.h"
28*df25739fSMilanka Ringwald
29*df25739fSMilanka Ringwald
30*df25739fSMilanka Ringwald
31*df25739fSMilanka Ringwald /*******************************************************************************
32*df25739fSMilanka Ringwald **
33*df25739fSMilanka Ringwald ** Function SBC_FastIDCT8
34*df25739fSMilanka Ringwald **
35*df25739fSMilanka Ringwald ** Description implementation of fast DCT algorithm by Feig and Winograd
36*df25739fSMilanka Ringwald **
37*df25739fSMilanka Ringwald **
38*df25739fSMilanka Ringwald ** Returns y = dct(pInVect)
39*df25739fSMilanka Ringwald **
40*df25739fSMilanka Ringwald **
41*df25739fSMilanka Ringwald *******************************************************************************/
42*df25739fSMilanka Ringwald
43*df25739fSMilanka Ringwald #if (SBC_IS_64_MULT_IN_IDCT == FALSE)
44*df25739fSMilanka Ringwald #define SBC_COS_PI_SUR_4 (0x00005a82) /* ((0x8000) * 0.7071) = cos(pi/4) */
45*df25739fSMilanka Ringwald #define SBC_COS_PI_SUR_8 (0x00007641) /* ((0x8000) * 0.9239) = (cos(pi/8)) */
46*df25739fSMilanka Ringwald #define SBC_COS_3PI_SUR_8 (0x000030fb) /* ((0x8000) * 0.3827) = (cos(3*pi/8)) */
47*df25739fSMilanka Ringwald #define SBC_COS_PI_SUR_16 (0x00007d8a) /* ((0x8000) * 0.9808)) = (cos(pi/16)) */
48*df25739fSMilanka Ringwald #define SBC_COS_3PI_SUR_16 (0x00006a6d) /* ((0x8000) * 0.8315)) = (cos(3*pi/16)) */
49*df25739fSMilanka Ringwald #define SBC_COS_5PI_SUR_16 (0x0000471c) /* ((0x8000) * 0.5556)) = (cos(5*pi/16)) */
50*df25739fSMilanka Ringwald #define SBC_COS_7PI_SUR_16 (0x000018f8) /* ((0x8000) * 0.1951)) = (cos(7*pi/16)) */
51*df25739fSMilanka Ringwald #define SBC_IDCT_MULT(a,b,c) SBC_MULT_32_16_SIMPLIFIED(a,b,c)
52*df25739fSMilanka Ringwald #else
53*df25739fSMilanka Ringwald #define SBC_COS_PI_SUR_4 (0x5A827999) /* ((0x80000000) * 0.707106781) = (cos(pi/4) ) */
54*df25739fSMilanka Ringwald #define SBC_COS_PI_SUR_8 (0x7641AF3C) /* ((0x80000000) * 0.923879533) = (cos(pi/8) ) */
55*df25739fSMilanka Ringwald #define SBC_COS_3PI_SUR_8 (0x30FBC54D) /* ((0x80000000) * 0.382683432) = (cos(3*pi/8) ) */
56*df25739fSMilanka Ringwald #define SBC_COS_PI_SUR_16 (0x7D8A5F3F) /* ((0x80000000) * 0.98078528 )) = (cos(pi/16) ) */
57*df25739fSMilanka Ringwald #define SBC_COS_3PI_SUR_16 (0x6A6D98A4) /* ((0x80000000) * 0.831469612)) = (cos(3*pi/16)) */
58*df25739fSMilanka Ringwald #define SBC_COS_5PI_SUR_16 (0x471CECE6) /* ((0x80000000) * 0.555570233)) = (cos(5*pi/16)) */
59*df25739fSMilanka Ringwald #define SBC_COS_7PI_SUR_16 (0x18F8B83C) /* ((0x80000000) * 0.195090322)) = (cos(7*pi/16)) */
60*df25739fSMilanka Ringwald #define SBC_IDCT_MULT(a,b,c) SBC_MULT_32_32(a,b,c)
61*df25739fSMilanka Ringwald #endif /* SBC_IS_64_MULT_IN_IDCT */
62*df25739fSMilanka Ringwald
63*df25739fSMilanka Ringwald #if (SBC_FAST_DCT == FALSE)
64*df25739fSMilanka Ringwald extern const SINT16 gas16AnalDCTcoeff8[];
65*df25739fSMilanka Ringwald extern const SINT16 gas16AnalDCTcoeff4[];
66*df25739fSMilanka Ringwald #endif
67*df25739fSMilanka Ringwald
SBC_FastIDCT8(SINT32 * pInVect,SINT32 * pOutVect)68*df25739fSMilanka Ringwald void SBC_FastIDCT8(SINT32 *pInVect, SINT32 *pOutVect)
69*df25739fSMilanka Ringwald {
70*df25739fSMilanka Ringwald #if (SBC_FAST_DCT == TRUE)
71*df25739fSMilanka Ringwald #if (SBC_ARM_ASM_OPT==TRUE)
72*df25739fSMilanka Ringwald #else
73*df25739fSMilanka Ringwald #if (SBC_IPAQ_OPT==TRUE)
74*df25739fSMilanka Ringwald #if (SBC_IS_64_MULT_IN_IDCT == TRUE)
75*df25739fSMilanka Ringwald SINT64 s64Temp;
76*df25739fSMilanka Ringwald #endif
77*df25739fSMilanka Ringwald #else
78*df25739fSMilanka Ringwald #if (SBC_IS_64_MULT_IN_IDCT == TRUE)
79*df25739fSMilanka Ringwald SINT32 s32HiTemp;
80*df25739fSMilanka Ringwald #else
81*df25739fSMilanka Ringwald SINT32 s32In2Temp;
82*df25739fSMilanka Ringwald register SINT32 s32In1Temp;
83*df25739fSMilanka Ringwald #endif
84*df25739fSMilanka Ringwald #endif
85*df25739fSMilanka Ringwald #endif
86*df25739fSMilanka Ringwald
87*df25739fSMilanka Ringwald register SINT32 x0, x1, x2, x3, x4, x5, x6, x7,temp;
88*df25739fSMilanka Ringwald SINT32 res_even[4], res_odd[4];
89*df25739fSMilanka Ringwald SBC_IDCT_MULT(SBC_COS_PI_SUR_4,pInVect[4], x0);
90*df25739fSMilanka Ringwald
91*df25739fSMilanka Ringwald x1 = (pInVect[3] + pInVect[5]) >>1;
92*df25739fSMilanka Ringwald x2 = (pInVect[2] + pInVect[6]) >>1;
93*df25739fSMilanka Ringwald x3 = (pInVect[1] + pInVect[7]) >>1;
94*df25739fSMilanka Ringwald x4 = (pInVect[0] + pInVect[8]) >>1;
95*df25739fSMilanka Ringwald x5 = (pInVect[9] - pInVect[15]) >>1;
96*df25739fSMilanka Ringwald x6 = (pInVect[10] - pInVect[14])>>1;
97*df25739fSMilanka Ringwald x7 = (pInVect[11] - pInVect[13])>>1;
98*df25739fSMilanka Ringwald
99*df25739fSMilanka Ringwald /* 2-point IDCT of x0 and x4 as in (11) */
100*df25739fSMilanka Ringwald temp = x0 ;
101*df25739fSMilanka Ringwald SBC_IDCT_MULT(SBC_COS_PI_SUR_4, ( x0 + x4 ), x0); /*x0 = ( x0 + x4 ) * cos(1*pi/4) ; */
102*df25739fSMilanka Ringwald SBC_IDCT_MULT(SBC_COS_PI_SUR_4, ( temp - x4 ), x4); /*x4 = ( temp - x4 ) * cos(1*pi/4) ; */
103*df25739fSMilanka Ringwald
104*df25739fSMilanka Ringwald /* rearrangement of x2 and x6 as in (15) */
105*df25739fSMilanka Ringwald x2 -=x6;
106*df25739fSMilanka Ringwald x6 <<= 1 ;
107*df25739fSMilanka Ringwald
108*df25739fSMilanka Ringwald /* 2-point IDCT of x2 and x6 and post-multiplication as in (15) */
109*df25739fSMilanka Ringwald SBC_IDCT_MULT(SBC_COS_PI_SUR_4,x6, x6); /*x6 = x6 * cos(1*pi/4) ; */
110*df25739fSMilanka Ringwald temp = x2 ;
111*df25739fSMilanka Ringwald SBC_IDCT_MULT(SBC_COS_PI_SUR_8,( x2 + x6 ), x2); /*x2 = ( x2 + x6 ) * cos(1*pi/8) ; */
112*df25739fSMilanka Ringwald SBC_IDCT_MULT(SBC_COS_3PI_SUR_8,( temp - x6 ), x6); /*x6 = ( temp - x6 ) * cos(3*pi/8) ;*/
113*df25739fSMilanka Ringwald
114*df25739fSMilanka Ringwald /* 4-point IDCT of x0,x2,x4 and x6 as in (11) */
115*df25739fSMilanka Ringwald res_even[ 0 ] = x0 + x2 ;
116*df25739fSMilanka Ringwald res_even[ 1 ] = x4 + x6 ;
117*df25739fSMilanka Ringwald res_even[ 2 ] = x4 - x6 ;
118*df25739fSMilanka Ringwald res_even[ 3 ] = x0 - x2 ;
119*df25739fSMilanka Ringwald
120*df25739fSMilanka Ringwald
121*df25739fSMilanka Ringwald /* rearrangement of x1,x3,x5,x7 as in (15) */
122*df25739fSMilanka Ringwald x7 <<= 1 ;
123*df25739fSMilanka Ringwald x5 = ( x5 <<1 ) - x7 ;
124*df25739fSMilanka Ringwald x3 = ( x3 <<1 ) - x5 ;
125*df25739fSMilanka Ringwald x1 -= x3 >>1 ;
126*df25739fSMilanka Ringwald
127*df25739fSMilanka Ringwald /* two-dimensional IDCT of x1 and x5 */
128*df25739fSMilanka Ringwald SBC_IDCT_MULT(SBC_COS_PI_SUR_4, x5, x5); /*x5 = x5 * cos(1*pi/4) ; */
129*df25739fSMilanka Ringwald temp = x1 ;
130*df25739fSMilanka Ringwald x1 = x1 + x5 ;
131*df25739fSMilanka Ringwald x5 = temp - x5 ;
132*df25739fSMilanka Ringwald
133*df25739fSMilanka Ringwald /* rearrangement of x3 and x7 as in (15) */
134*df25739fSMilanka Ringwald x3 -= x7;
135*df25739fSMilanka Ringwald x7 <<= 1 ;
136*df25739fSMilanka Ringwald SBC_IDCT_MULT(SBC_COS_PI_SUR_4, x7, x7); /*x7 = x7 * cos(1*pi/4) ; */
137*df25739fSMilanka Ringwald
138*df25739fSMilanka Ringwald /* 2-point IDCT of x3 and x7 and post-multiplication as in (15) */
139*df25739fSMilanka Ringwald temp = x3 ;
140*df25739fSMilanka Ringwald SBC_IDCT_MULT( SBC_COS_PI_SUR_8,( x3 + x7 ), x3); /*x3 = ( x3 + x7 ) * cos(1*pi/8) ; */
141*df25739fSMilanka Ringwald SBC_IDCT_MULT( SBC_COS_3PI_SUR_8,( temp - x7 ), x7); /*x7 = ( temp - x7 ) * cos(3*pi/8) ;*/
142*df25739fSMilanka Ringwald
143*df25739fSMilanka Ringwald /* 4-point IDCT of x1,x3,x5 and x7 and post multiplication by diagonal matrix as in (14) */
144*df25739fSMilanka Ringwald SBC_IDCT_MULT((SBC_COS_PI_SUR_16), ( x1 + x3 ) , res_odd[0]); /*res_odd[ 0 ] = ( x1 + x3 ) * cos(1*pi/16) ; */
145*df25739fSMilanka Ringwald SBC_IDCT_MULT((SBC_COS_3PI_SUR_16), ( x5 + x7 ) , res_odd[1]); /*res_odd[ 1 ] = ( x5 + x7 ) * cos(3*pi/16) ; */
146*df25739fSMilanka Ringwald SBC_IDCT_MULT((SBC_COS_5PI_SUR_16), ( x5 - x7 ) , res_odd[2]); /*res_odd[ 2 ] = ( x5 - x7 ) * cos(5*pi/16) ; */
147*df25739fSMilanka Ringwald SBC_IDCT_MULT((SBC_COS_7PI_SUR_16), ( x1 - x3 ) , res_odd[3]); /*res_odd[ 3 ] = ( x1 - x3 ) * cos(7*pi/16) ; */
148*df25739fSMilanka Ringwald
149*df25739fSMilanka Ringwald /* additions and subtractions as in (9) */
150*df25739fSMilanka Ringwald pOutVect[0] = (res_even[ 0 ] + res_odd[ 0 ]) ;
151*df25739fSMilanka Ringwald pOutVect[1] = (res_even[ 1 ] + res_odd[ 1 ]) ;
152*df25739fSMilanka Ringwald pOutVect[2] = (res_even[ 2 ] + res_odd[ 2 ]) ;
153*df25739fSMilanka Ringwald pOutVect[3] = (res_even[ 3 ] + res_odd[ 3 ]) ;
154*df25739fSMilanka Ringwald pOutVect[7] = (res_even[ 0 ] - res_odd[ 0 ]) ;
155*df25739fSMilanka Ringwald pOutVect[6] = (res_even[ 1 ] - res_odd[ 1 ]) ;
156*df25739fSMilanka Ringwald pOutVect[5] = (res_even[ 2 ] - res_odd[ 2 ]) ;
157*df25739fSMilanka Ringwald pOutVect[4] = (res_even[ 3 ] - res_odd[ 3 ]) ;
158*df25739fSMilanka Ringwald #else
159*df25739fSMilanka Ringwald UINT8 Index, k;
160*df25739fSMilanka Ringwald SINT32 temp;
161*df25739fSMilanka Ringwald /*Calculate 4 subband samples by matrixing*/
162*df25739fSMilanka Ringwald for(Index=0; Index<8; Index++)
163*df25739fSMilanka Ringwald {
164*df25739fSMilanka Ringwald temp = 0;
165*df25739fSMilanka Ringwald for(k=0; k<16; k++)
166*df25739fSMilanka Ringwald {
167*df25739fSMilanka Ringwald /*temp += (SINT32)(((SINT64)M[(Index*strEncParams->numOfSubBands*2)+k] * Y[k]) >> 16 );*/
168*df25739fSMilanka Ringwald temp += (gas16AnalDCTcoeff8[(Index*8*2)+k] * (pInVect[k] >> 16));
169*df25739fSMilanka Ringwald temp += ((gas16AnalDCTcoeff8[(Index*8*2)+k] * (pInVect[k] & 0xFFFF)) >> 16);
170*df25739fSMilanka Ringwald }
171*df25739fSMilanka Ringwald pOutVect[Index] = temp;
172*df25739fSMilanka Ringwald }
173*df25739fSMilanka Ringwald #endif
174*df25739fSMilanka Ringwald }
175*df25739fSMilanka Ringwald
176*df25739fSMilanka Ringwald /*******************************************************************************
177*df25739fSMilanka Ringwald **
178*df25739fSMilanka Ringwald ** Function SBC_FastIDCT4
179*df25739fSMilanka Ringwald **
180*df25739fSMilanka Ringwald ** Description implementation of fast DCT algorithm by Feig and Winograd
181*df25739fSMilanka Ringwald **
182*df25739fSMilanka Ringwald **
183*df25739fSMilanka Ringwald ** Returns y = dct(x0)
184*df25739fSMilanka Ringwald **
185*df25739fSMilanka Ringwald **
186*df25739fSMilanka Ringwald *******************************************************************************/
SBC_FastIDCT4(SINT32 * pInVect,SINT32 * pOutVect)187*df25739fSMilanka Ringwald void SBC_FastIDCT4(SINT32 *pInVect, SINT32 *pOutVect)
188*df25739fSMilanka Ringwald {
189*df25739fSMilanka Ringwald #if (SBC_FAST_DCT == TRUE)
190*df25739fSMilanka Ringwald #if (SBC_ARM_ASM_OPT==TRUE)
191*df25739fSMilanka Ringwald #else
192*df25739fSMilanka Ringwald #if (SBC_IPAQ_OPT==TRUE)
193*df25739fSMilanka Ringwald #if (SBC_IS_64_MULT_IN_IDCT == TRUE)
194*df25739fSMilanka Ringwald SINT64 s64Temp;
195*df25739fSMilanka Ringwald #endif
196*df25739fSMilanka Ringwald #else
197*df25739fSMilanka Ringwald #if (SBC_IS_64_MULT_IN_IDCT == TRUE)
198*df25739fSMilanka Ringwald SINT32 s32HiTemp;
199*df25739fSMilanka Ringwald #else
200*df25739fSMilanka Ringwald UINT16 s32In2Temp;
201*df25739fSMilanka Ringwald SINT32 s32In1Temp;
202*df25739fSMilanka Ringwald #endif
203*df25739fSMilanka Ringwald #endif
204*df25739fSMilanka Ringwald #endif
205*df25739fSMilanka Ringwald SINT32 temp,x2;
206*df25739fSMilanka Ringwald SINT32 tmp[8];
207*df25739fSMilanka Ringwald
208*df25739fSMilanka Ringwald x2=pInVect[2]>>1;
209*df25739fSMilanka Ringwald temp=(pInVect[0]+pInVect[4]);
210*df25739fSMilanka Ringwald SBC_IDCT_MULT((SBC_COS_PI_SUR_4>>1), temp , tmp[0]);
211*df25739fSMilanka Ringwald tmp[1]=x2-tmp[0];
212*df25739fSMilanka Ringwald tmp[0]+=x2;
213*df25739fSMilanka Ringwald temp=(pInVect[1]+pInVect[3]);
214*df25739fSMilanka Ringwald SBC_IDCT_MULT((SBC_COS_3PI_SUR_8>>1), temp , tmp[3]);
215*df25739fSMilanka Ringwald SBC_IDCT_MULT((SBC_COS_PI_SUR_8>>1), temp , tmp[2]);
216*df25739fSMilanka Ringwald temp=(pInVect[5]-pInVect[7]);
217*df25739fSMilanka Ringwald SBC_IDCT_MULT((SBC_COS_3PI_SUR_8>>1), temp , tmp[5]);
218*df25739fSMilanka Ringwald SBC_IDCT_MULT((SBC_COS_PI_SUR_8>>1), temp , tmp[4]);
219*df25739fSMilanka Ringwald tmp[6]=tmp[2]+tmp[5];
220*df25739fSMilanka Ringwald tmp[7]=tmp[3]-tmp[4];
221*df25739fSMilanka Ringwald pOutVect[0] = (tmp[0]+tmp[6]);
222*df25739fSMilanka Ringwald pOutVect[1] = (tmp[1]+tmp[7]);
223*df25739fSMilanka Ringwald pOutVect[2] = (tmp[1]-tmp[7]);
224*df25739fSMilanka Ringwald pOutVect[3] = (tmp[0]-tmp[6]);
225*df25739fSMilanka Ringwald #else
226*df25739fSMilanka Ringwald UINT8 Index, k;
227*df25739fSMilanka Ringwald SINT32 temp;
228*df25739fSMilanka Ringwald /*Calculate 4 subband samples by matrixing*/
229*df25739fSMilanka Ringwald for(Index=0; Index<4; Index++)
230*df25739fSMilanka Ringwald {
231*df25739fSMilanka Ringwald temp = 0;
232*df25739fSMilanka Ringwald for(k=0; k<8; k++)
233*df25739fSMilanka Ringwald {
234*df25739fSMilanka Ringwald /*temp += (SINT32)(((SINT64)M[(Index*strEncParams->numOfSubBands*2)+k] * Y[k]) >> 16 ); */
235*df25739fSMilanka Ringwald temp += (gas16AnalDCTcoeff4[(Index*4*2)+k] * (pInVect[k] >> 16));
236*df25739fSMilanka Ringwald temp += ((gas16AnalDCTcoeff4[(Index*4*2)+k] * (pInVect[k] & 0xFFFF)) >> 16);
237*df25739fSMilanka Ringwald }
238*df25739fSMilanka Ringwald pOutVect[Index] = temp;
239*df25739fSMilanka Ringwald }
240*df25739fSMilanka Ringwald #endif
241*df25739fSMilanka Ringwald }
242