1*c83a76b0SSuyog Pawar /******************************************************************************
2*c83a76b0SSuyog Pawar *
3*c83a76b0SSuyog Pawar * Copyright (C) 2012 Ittiam Systems Pvt Ltd, Bangalore
4*c83a76b0SSuyog Pawar *
5*c83a76b0SSuyog Pawar * Licensed under the Apache License, Version 2.0 (the "License");
6*c83a76b0SSuyog Pawar * you may not use this file except in compliance with the License.
7*c83a76b0SSuyog Pawar * You may obtain a copy of the License at:
8*c83a76b0SSuyog Pawar *
9*c83a76b0SSuyog Pawar * http://www.apache.org/licenses/LICENSE-2.0
10*c83a76b0SSuyog Pawar *
11*c83a76b0SSuyog Pawar * Unless required by applicable law or agreed to in writing, software
12*c83a76b0SSuyog Pawar * distributed under the License is distributed on an "AS IS" BASIS,
13*c83a76b0SSuyog Pawar * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14*c83a76b0SSuyog Pawar * See the License for the specific language governing permissions and
15*c83a76b0SSuyog Pawar * limitations under the License.
16*c83a76b0SSuyog Pawar *
17*c83a76b0SSuyog Pawar ******************************************************************************/
18*c83a76b0SSuyog Pawar /**
19*c83a76b0SSuyog Pawar *******************************************************************************
20*c83a76b0SSuyog Pawar * @file
21*c83a76b0SSuyog Pawar * ihevc_chroma_itrans_recon.c
22*c83a76b0SSuyog Pawar *
23*c83a76b0SSuyog Pawar * @brief
24*c83a76b0SSuyog Pawar * Contains function definitions for inverse transform and reconstruction
25*c83a76b0SSuyog Pawar * of chroma interleaved data.
26*c83a76b0SSuyog Pawar *
27*c83a76b0SSuyog Pawar * @author
28*c83a76b0SSuyog Pawar * 100470
29*c83a76b0SSuyog Pawar *
30*c83a76b0SSuyog Pawar * @par List of Functions:
31*c83a76b0SSuyog Pawar * - ihevc_chroma_itrans_recon_4x4()
32*c83a76b0SSuyog Pawar *
33*c83a76b0SSuyog Pawar * @remarks
34*c83a76b0SSuyog Pawar * None
35*c83a76b0SSuyog Pawar *
36*c83a76b0SSuyog Pawar *******************************************************************************
37*c83a76b0SSuyog Pawar */
38*c83a76b0SSuyog Pawar
39*c83a76b0SSuyog Pawar #include <stdio.h>
40*c83a76b0SSuyog Pawar #include <string.h>
41*c83a76b0SSuyog Pawar #include "ihevc_typedefs.h"
42*c83a76b0SSuyog Pawar #include "ihevc_macros.h"
43*c83a76b0SSuyog Pawar #include "ihevc_platform_macros.h"
44*c83a76b0SSuyog Pawar #include "ihevc_defs.h"
45*c83a76b0SSuyog Pawar #include "ihevc_trans_tables.h"
46*c83a76b0SSuyog Pawar #include "ihevc_chroma_itrans_recon.h"
47*c83a76b0SSuyog Pawar #include "ihevc_func_selector.h"
48*c83a76b0SSuyog Pawar #include "ihevc_trans_macros.h"
49*c83a76b0SSuyog Pawar
50*c83a76b0SSuyog Pawar /* All the functions work one component(U or V) of interleaved data depending upon pointers passed to it */
51*c83a76b0SSuyog Pawar /* Data visualization */
52*c83a76b0SSuyog Pawar /* U V U V U V U V */
53*c83a76b0SSuyog Pawar /* U V U V U V U V */
54*c83a76b0SSuyog Pawar /* U V U V U V U V */
55*c83a76b0SSuyog Pawar /* U V U V U V U V */
56*c83a76b0SSuyog Pawar /* If the pointer points to first byte of above stream (U) , functions will operate on U component */
57*c83a76b0SSuyog Pawar /* If the pointer points to second byte of above stream (V) , functions will operate on V component */
58*c83a76b0SSuyog Pawar
59*c83a76b0SSuyog Pawar /**
60*c83a76b0SSuyog Pawar *******************************************************************************
61*c83a76b0SSuyog Pawar *
62*c83a76b0SSuyog Pawar * @brief
63*c83a76b0SSuyog Pawar * This function performs Inverse transform and reconstruction for 4x4
64*c83a76b0SSuyog Pawar * input block
65*c83a76b0SSuyog Pawar *
66*c83a76b0SSuyog Pawar * @par Description:
67*c83a76b0SSuyog Pawar * Performs inverse transform and adds the prediction data and clips output
68*c83a76b0SSuyog Pawar * to 8 bit
69*c83a76b0SSuyog Pawar *
70*c83a76b0SSuyog Pawar * @param[in] pi2_src
71*c83a76b0SSuyog Pawar * Input 4x4 coefficients
72*c83a76b0SSuyog Pawar *
73*c83a76b0SSuyog Pawar * @param[in] pi2_tmp
74*c83a76b0SSuyog Pawar * Temporary 4x4 buffer for storing inverse transform
75*c83a76b0SSuyog Pawar * 1st stage output
76*c83a76b0SSuyog Pawar *
77*c83a76b0SSuyog Pawar * @param[in] pu1_pred
78*c83a76b0SSuyog Pawar * Prediction 4x4 block
79*c83a76b0SSuyog Pawar *
80*c83a76b0SSuyog Pawar * @param[out] pu1_dst
81*c83a76b0SSuyog Pawar * Output 4x4 block
82*c83a76b0SSuyog Pawar *
83*c83a76b0SSuyog Pawar * @param[in] src_strd
84*c83a76b0SSuyog Pawar * Input stride
85*c83a76b0SSuyog Pawar *
86*c83a76b0SSuyog Pawar * @param[in] pred_strd
87*c83a76b0SSuyog Pawar * Prediction stride
88*c83a76b0SSuyog Pawar *
89*c83a76b0SSuyog Pawar * @param[in] dst_strd
90*c83a76b0SSuyog Pawar * Output Stride
91*c83a76b0SSuyog Pawar *
92*c83a76b0SSuyog Pawar * @param[in] shift
93*c83a76b0SSuyog Pawar * Output shift
94*c83a76b0SSuyog Pawar *
95*c83a76b0SSuyog Pawar * @param[in] zero_cols
96*c83a76b0SSuyog Pawar * Zero columns in pi2_src
97*c83a76b0SSuyog Pawar *
98*c83a76b0SSuyog Pawar * @returns Void
99*c83a76b0SSuyog Pawar *
100*c83a76b0SSuyog Pawar * @remarks
101*c83a76b0SSuyog Pawar * None
102*c83a76b0SSuyog Pawar *
103*c83a76b0SSuyog Pawar *******************************************************************************
104*c83a76b0SSuyog Pawar */
105*c83a76b0SSuyog Pawar
106*c83a76b0SSuyog Pawar
ihevc_chroma_itrans_recon_4x4(WORD16 * pi2_src,WORD16 * pi2_tmp,UWORD8 * pu1_pred,UWORD8 * pu1_dst,WORD32 src_strd,WORD32 pred_strd,WORD32 dst_strd,WORD32 zero_cols,WORD32 zero_rows)107*c83a76b0SSuyog Pawar void ihevc_chroma_itrans_recon_4x4(WORD16 *pi2_src,
108*c83a76b0SSuyog Pawar WORD16 *pi2_tmp,
109*c83a76b0SSuyog Pawar UWORD8 *pu1_pred,
110*c83a76b0SSuyog Pawar UWORD8 *pu1_dst,
111*c83a76b0SSuyog Pawar WORD32 src_strd,
112*c83a76b0SSuyog Pawar WORD32 pred_strd,
113*c83a76b0SSuyog Pawar WORD32 dst_strd,
114*c83a76b0SSuyog Pawar WORD32 zero_cols,
115*c83a76b0SSuyog Pawar WORD32 zero_rows)
116*c83a76b0SSuyog Pawar {
117*c83a76b0SSuyog Pawar WORD32 j;
118*c83a76b0SSuyog Pawar WORD32 e[2], o[2];
119*c83a76b0SSuyog Pawar WORD32 add;
120*c83a76b0SSuyog Pawar WORD32 shift;
121*c83a76b0SSuyog Pawar WORD16 *pi2_tmp_orig;
122*c83a76b0SSuyog Pawar WORD32 trans_size;
123*c83a76b0SSuyog Pawar UNUSED(zero_rows);
124*c83a76b0SSuyog Pawar trans_size = TRANS_SIZE_4;
125*c83a76b0SSuyog Pawar
126*c83a76b0SSuyog Pawar pi2_tmp_orig = pi2_tmp;
127*c83a76b0SSuyog Pawar
128*c83a76b0SSuyog Pawar /* Inverse Transform 1st stage */
129*c83a76b0SSuyog Pawar shift = IT_SHIFT_STAGE_1;
130*c83a76b0SSuyog Pawar add = 1 << (shift - 1);
131*c83a76b0SSuyog Pawar
132*c83a76b0SSuyog Pawar for(j = 0; j < trans_size; j++)
133*c83a76b0SSuyog Pawar {
134*c83a76b0SSuyog Pawar /* Checking for Zero Cols */
135*c83a76b0SSuyog Pawar if((zero_cols & 1) == 1)
136*c83a76b0SSuyog Pawar {
137*c83a76b0SSuyog Pawar memset(pi2_tmp, 0, trans_size * sizeof(WORD16));
138*c83a76b0SSuyog Pawar }
139*c83a76b0SSuyog Pawar else
140*c83a76b0SSuyog Pawar {
141*c83a76b0SSuyog Pawar
142*c83a76b0SSuyog Pawar /* Utilizing symmetry properties to the maximum to minimize the number of multiplications */
143*c83a76b0SSuyog Pawar o[0] = g_ai2_ihevc_trans_4[1][0] * pi2_src[src_strd]
144*c83a76b0SSuyog Pawar + g_ai2_ihevc_trans_4[3][0] * pi2_src[3 * src_strd];
145*c83a76b0SSuyog Pawar o[1] = g_ai2_ihevc_trans_4[1][1] * pi2_src[src_strd]
146*c83a76b0SSuyog Pawar + g_ai2_ihevc_trans_4[3][1] * pi2_src[3 * src_strd];
147*c83a76b0SSuyog Pawar e[0] = g_ai2_ihevc_trans_4[0][0] * pi2_src[0]
148*c83a76b0SSuyog Pawar + g_ai2_ihevc_trans_4[2][0] * pi2_src[2 * src_strd];
149*c83a76b0SSuyog Pawar e[1] = g_ai2_ihevc_trans_4[0][1] * pi2_src[0]
150*c83a76b0SSuyog Pawar + g_ai2_ihevc_trans_4[2][1] * pi2_src[2 * src_strd];
151*c83a76b0SSuyog Pawar
152*c83a76b0SSuyog Pawar pi2_tmp[0] =
153*c83a76b0SSuyog Pawar CLIP_S16(((e[0] + o[0] + add) >> shift));
154*c83a76b0SSuyog Pawar pi2_tmp[1] =
155*c83a76b0SSuyog Pawar CLIP_S16(((e[1] + o[1] + add) >> shift));
156*c83a76b0SSuyog Pawar pi2_tmp[2] =
157*c83a76b0SSuyog Pawar CLIP_S16(((e[1] - o[1] + add) >> shift));
158*c83a76b0SSuyog Pawar pi2_tmp[3] =
159*c83a76b0SSuyog Pawar CLIP_S16(((e[0] - o[0] + add) >> shift));
160*c83a76b0SSuyog Pawar
161*c83a76b0SSuyog Pawar }
162*c83a76b0SSuyog Pawar pi2_src++;
163*c83a76b0SSuyog Pawar pi2_tmp += trans_size;
164*c83a76b0SSuyog Pawar zero_cols = zero_cols >> 1;
165*c83a76b0SSuyog Pawar }
166*c83a76b0SSuyog Pawar
167*c83a76b0SSuyog Pawar pi2_tmp = pi2_tmp_orig;
168*c83a76b0SSuyog Pawar
169*c83a76b0SSuyog Pawar /* Inverse Transform 2nd stage */
170*c83a76b0SSuyog Pawar shift = IT_SHIFT_STAGE_2;
171*c83a76b0SSuyog Pawar add = 1 << (shift - 1);
172*c83a76b0SSuyog Pawar
173*c83a76b0SSuyog Pawar for(j = 0; j < trans_size; j++)
174*c83a76b0SSuyog Pawar {
175*c83a76b0SSuyog Pawar WORD32 itrans_out;
176*c83a76b0SSuyog Pawar /* Utilizing symmetry properties to the maximum to minimize the number of multiplications */
177*c83a76b0SSuyog Pawar o[0] = g_ai2_ihevc_trans_4[1][0] * pi2_tmp[trans_size]
178*c83a76b0SSuyog Pawar + g_ai2_ihevc_trans_4[3][0] * pi2_tmp[3 * trans_size];
179*c83a76b0SSuyog Pawar o[1] = g_ai2_ihevc_trans_4[1][1] * pi2_tmp[trans_size]
180*c83a76b0SSuyog Pawar + g_ai2_ihevc_trans_4[3][1] * pi2_tmp[3 * trans_size];
181*c83a76b0SSuyog Pawar e[0] = g_ai2_ihevc_trans_4[0][0] * pi2_tmp[0]
182*c83a76b0SSuyog Pawar + g_ai2_ihevc_trans_4[2][0] * pi2_tmp[2 * trans_size];
183*c83a76b0SSuyog Pawar e[1] = g_ai2_ihevc_trans_4[0][1] * pi2_tmp[0]
184*c83a76b0SSuyog Pawar + g_ai2_ihevc_trans_4[2][1] * pi2_tmp[2 * trans_size];
185*c83a76b0SSuyog Pawar
186*c83a76b0SSuyog Pawar itrans_out =
187*c83a76b0SSuyog Pawar CLIP_S16(((e[0] + o[0] + add) >> shift));
188*c83a76b0SSuyog Pawar pu1_dst[0 * 2] = CLIP_U8((itrans_out + pu1_pred[0 * 2]));
189*c83a76b0SSuyog Pawar itrans_out =
190*c83a76b0SSuyog Pawar CLIP_S16(((e[1] + o[1] + add) >> shift));
191*c83a76b0SSuyog Pawar pu1_dst[1 * 2] = CLIP_U8((itrans_out + pu1_pred[1 * 2]));
192*c83a76b0SSuyog Pawar itrans_out =
193*c83a76b0SSuyog Pawar CLIP_S16(((e[1] - o[1] + add) >> shift));
194*c83a76b0SSuyog Pawar pu1_dst[2 * 2] = CLIP_U8((itrans_out + pu1_pred[2 * 2]));
195*c83a76b0SSuyog Pawar itrans_out =
196*c83a76b0SSuyog Pawar CLIP_S16(((e[0] - o[0] + add) >> shift));
197*c83a76b0SSuyog Pawar pu1_dst[3 * 2] = CLIP_U8((itrans_out + pu1_pred[3 * 2]));
198*c83a76b0SSuyog Pawar
199*c83a76b0SSuyog Pawar pi2_tmp++;
200*c83a76b0SSuyog Pawar pu1_pred += pred_strd;
201*c83a76b0SSuyog Pawar pu1_dst += dst_strd;
202*c83a76b0SSuyog Pawar
203*c83a76b0SSuyog Pawar }
204*c83a76b0SSuyog Pawar }
205*c83a76b0SSuyog Pawar
206