xref: /aosp_15_r20/external/libhevc/common/ihevc_chroma_itrans_recon.c (revision c83a76b084498d55f252f48b2e3786804cdf24b7)
1*c83a76b0SSuyog Pawar /******************************************************************************
2*c83a76b0SSuyog Pawar *
3*c83a76b0SSuyog Pawar * Copyright (C) 2012 Ittiam Systems Pvt Ltd, Bangalore
4*c83a76b0SSuyog Pawar *
5*c83a76b0SSuyog Pawar * Licensed under the Apache License, Version 2.0 (the "License");
6*c83a76b0SSuyog Pawar * you may not use this file except in compliance with the License.
7*c83a76b0SSuyog Pawar * You may obtain a copy of the License at:
8*c83a76b0SSuyog Pawar *
9*c83a76b0SSuyog Pawar * http://www.apache.org/licenses/LICENSE-2.0
10*c83a76b0SSuyog Pawar *
11*c83a76b0SSuyog Pawar * Unless required by applicable law or agreed to in writing, software
12*c83a76b0SSuyog Pawar * distributed under the License is distributed on an "AS IS" BASIS,
13*c83a76b0SSuyog Pawar * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14*c83a76b0SSuyog Pawar * See the License for the specific language governing permissions and
15*c83a76b0SSuyog Pawar * limitations under the License.
16*c83a76b0SSuyog Pawar *
17*c83a76b0SSuyog Pawar ******************************************************************************/
18*c83a76b0SSuyog Pawar /**
19*c83a76b0SSuyog Pawar  *******************************************************************************
20*c83a76b0SSuyog Pawar  * @file
21*c83a76b0SSuyog Pawar  *  ihevc_chroma_itrans_recon.c
22*c83a76b0SSuyog Pawar  *
23*c83a76b0SSuyog Pawar  * @brief
24*c83a76b0SSuyog Pawar  *  Contains function definitions for inverse transform  and reconstruction
25*c83a76b0SSuyog Pawar  * of chroma interleaved data.
26*c83a76b0SSuyog Pawar  *
27*c83a76b0SSuyog Pawar  * @author
28*c83a76b0SSuyog Pawar  *  100470
29*c83a76b0SSuyog Pawar  *
30*c83a76b0SSuyog Pawar  * @par List of Functions:
31*c83a76b0SSuyog Pawar  *  - ihevc_chroma_itrans_recon_4x4()
32*c83a76b0SSuyog Pawar  *
33*c83a76b0SSuyog Pawar  * @remarks
34*c83a76b0SSuyog Pawar  *  None
35*c83a76b0SSuyog Pawar  *
36*c83a76b0SSuyog Pawar  *******************************************************************************
37*c83a76b0SSuyog Pawar  */
38*c83a76b0SSuyog Pawar 
39*c83a76b0SSuyog Pawar #include <stdio.h>
40*c83a76b0SSuyog Pawar #include <string.h>
41*c83a76b0SSuyog Pawar #include "ihevc_typedefs.h"
42*c83a76b0SSuyog Pawar #include "ihevc_macros.h"
43*c83a76b0SSuyog Pawar #include "ihevc_platform_macros.h"
44*c83a76b0SSuyog Pawar #include "ihevc_defs.h"
45*c83a76b0SSuyog Pawar #include "ihevc_trans_tables.h"
46*c83a76b0SSuyog Pawar #include "ihevc_chroma_itrans_recon.h"
47*c83a76b0SSuyog Pawar #include "ihevc_func_selector.h"
48*c83a76b0SSuyog Pawar #include "ihevc_trans_macros.h"
49*c83a76b0SSuyog Pawar 
50*c83a76b0SSuyog Pawar /* All the functions work one component(U or V) of interleaved data depending upon pointers passed to it */
51*c83a76b0SSuyog Pawar /* Data visualization */
52*c83a76b0SSuyog Pawar /* U V U V U V U V */
53*c83a76b0SSuyog Pawar /* U V U V U V U V */
54*c83a76b0SSuyog Pawar /* U V U V U V U V */
55*c83a76b0SSuyog Pawar /* U V U V U V U V */
56*c83a76b0SSuyog Pawar /* If the pointer points to first byte of above stream (U) , functions will operate on U component */
57*c83a76b0SSuyog Pawar /* If the pointer points to second byte of above stream (V) , functions will operate on V component */
58*c83a76b0SSuyog Pawar 
59*c83a76b0SSuyog Pawar /**
60*c83a76b0SSuyog Pawar  *******************************************************************************
61*c83a76b0SSuyog Pawar  *
62*c83a76b0SSuyog Pawar  * @brief
63*c83a76b0SSuyog Pawar  *  This function performs Inverse transform  and reconstruction for 4x4
64*c83a76b0SSuyog Pawar  * input block
65*c83a76b0SSuyog Pawar  *
66*c83a76b0SSuyog Pawar  * @par Description:
67*c83a76b0SSuyog Pawar  *  Performs inverse transform and adds the prediction  data and clips output
68*c83a76b0SSuyog Pawar  * to 8 bit
69*c83a76b0SSuyog Pawar  *
70*c83a76b0SSuyog Pawar  * @param[in] pi2_src
71*c83a76b0SSuyog Pawar  *  Input 4x4 coefficients
72*c83a76b0SSuyog Pawar  *
73*c83a76b0SSuyog Pawar  * @param[in] pi2_tmp
74*c83a76b0SSuyog Pawar  *  Temporary 4x4 buffer for storing inverse transform
75*c83a76b0SSuyog Pawar  *  1st stage output
76*c83a76b0SSuyog Pawar  *
77*c83a76b0SSuyog Pawar  * @param[in] pu1_pred
78*c83a76b0SSuyog Pawar  *  Prediction 4x4 block
79*c83a76b0SSuyog Pawar  *
80*c83a76b0SSuyog Pawar  * @param[out] pu1_dst
81*c83a76b0SSuyog Pawar  *  Output 4x4 block
82*c83a76b0SSuyog Pawar  *
83*c83a76b0SSuyog Pawar  * @param[in] src_strd
84*c83a76b0SSuyog Pawar  *  Input stride
85*c83a76b0SSuyog Pawar  *
86*c83a76b0SSuyog Pawar  * @param[in] pred_strd
87*c83a76b0SSuyog Pawar  *  Prediction stride
88*c83a76b0SSuyog Pawar  *
89*c83a76b0SSuyog Pawar  * @param[in] dst_strd
90*c83a76b0SSuyog Pawar  *  Output Stride
91*c83a76b0SSuyog Pawar  *
92*c83a76b0SSuyog Pawar  * @param[in] shift
93*c83a76b0SSuyog Pawar  *  Output shift
94*c83a76b0SSuyog Pawar  *
95*c83a76b0SSuyog Pawar  * @param[in] zero_cols
96*c83a76b0SSuyog Pawar  *  Zero columns in pi2_src
97*c83a76b0SSuyog Pawar  *
98*c83a76b0SSuyog Pawar  * @returns  Void
99*c83a76b0SSuyog Pawar  *
100*c83a76b0SSuyog Pawar  * @remarks
101*c83a76b0SSuyog Pawar  *  None
102*c83a76b0SSuyog Pawar  *
103*c83a76b0SSuyog Pawar  *******************************************************************************
104*c83a76b0SSuyog Pawar  */
105*c83a76b0SSuyog Pawar 
106*c83a76b0SSuyog Pawar 
ihevc_chroma_itrans_recon_4x4(WORD16 * pi2_src,WORD16 * pi2_tmp,UWORD8 * pu1_pred,UWORD8 * pu1_dst,WORD32 src_strd,WORD32 pred_strd,WORD32 dst_strd,WORD32 zero_cols,WORD32 zero_rows)107*c83a76b0SSuyog Pawar void ihevc_chroma_itrans_recon_4x4(WORD16 *pi2_src,
108*c83a76b0SSuyog Pawar                                    WORD16 *pi2_tmp,
109*c83a76b0SSuyog Pawar                                    UWORD8 *pu1_pred,
110*c83a76b0SSuyog Pawar                                    UWORD8 *pu1_dst,
111*c83a76b0SSuyog Pawar                                    WORD32 src_strd,
112*c83a76b0SSuyog Pawar                                    WORD32 pred_strd,
113*c83a76b0SSuyog Pawar                                    WORD32 dst_strd,
114*c83a76b0SSuyog Pawar                                    WORD32 zero_cols,
115*c83a76b0SSuyog Pawar                                    WORD32 zero_rows)
116*c83a76b0SSuyog Pawar {
117*c83a76b0SSuyog Pawar     WORD32 j;
118*c83a76b0SSuyog Pawar     WORD32 e[2], o[2];
119*c83a76b0SSuyog Pawar     WORD32 add;
120*c83a76b0SSuyog Pawar     WORD32 shift;
121*c83a76b0SSuyog Pawar     WORD16 *pi2_tmp_orig;
122*c83a76b0SSuyog Pawar     WORD32 trans_size;
123*c83a76b0SSuyog Pawar     UNUSED(zero_rows);
124*c83a76b0SSuyog Pawar     trans_size = TRANS_SIZE_4;
125*c83a76b0SSuyog Pawar 
126*c83a76b0SSuyog Pawar     pi2_tmp_orig = pi2_tmp;
127*c83a76b0SSuyog Pawar 
128*c83a76b0SSuyog Pawar     /* Inverse Transform 1st stage */
129*c83a76b0SSuyog Pawar     shift = IT_SHIFT_STAGE_1;
130*c83a76b0SSuyog Pawar     add = 1 << (shift - 1);
131*c83a76b0SSuyog Pawar 
132*c83a76b0SSuyog Pawar     for(j = 0; j < trans_size; j++)
133*c83a76b0SSuyog Pawar     {
134*c83a76b0SSuyog Pawar         /* Checking for Zero Cols */
135*c83a76b0SSuyog Pawar         if((zero_cols & 1) == 1)
136*c83a76b0SSuyog Pawar         {
137*c83a76b0SSuyog Pawar             memset(pi2_tmp, 0, trans_size * sizeof(WORD16));
138*c83a76b0SSuyog Pawar         }
139*c83a76b0SSuyog Pawar         else
140*c83a76b0SSuyog Pawar         {
141*c83a76b0SSuyog Pawar 
142*c83a76b0SSuyog Pawar             /* Utilizing symmetry properties to the maximum to minimize the number of multiplications */
143*c83a76b0SSuyog Pawar             o[0] = g_ai2_ihevc_trans_4[1][0] * pi2_src[src_strd]
144*c83a76b0SSuyog Pawar                             + g_ai2_ihevc_trans_4[3][0] * pi2_src[3 * src_strd];
145*c83a76b0SSuyog Pawar             o[1] = g_ai2_ihevc_trans_4[1][1] * pi2_src[src_strd]
146*c83a76b0SSuyog Pawar                             + g_ai2_ihevc_trans_4[3][1] * pi2_src[3 * src_strd];
147*c83a76b0SSuyog Pawar             e[0] = g_ai2_ihevc_trans_4[0][0] * pi2_src[0]
148*c83a76b0SSuyog Pawar                             + g_ai2_ihevc_trans_4[2][0] * pi2_src[2 * src_strd];
149*c83a76b0SSuyog Pawar             e[1] = g_ai2_ihevc_trans_4[0][1] * pi2_src[0]
150*c83a76b0SSuyog Pawar                             + g_ai2_ihevc_trans_4[2][1] * pi2_src[2 * src_strd];
151*c83a76b0SSuyog Pawar 
152*c83a76b0SSuyog Pawar             pi2_tmp[0] =
153*c83a76b0SSuyog Pawar                             CLIP_S16(((e[0] + o[0] + add) >> shift));
154*c83a76b0SSuyog Pawar             pi2_tmp[1] =
155*c83a76b0SSuyog Pawar                             CLIP_S16(((e[1] + o[1] + add) >> shift));
156*c83a76b0SSuyog Pawar             pi2_tmp[2] =
157*c83a76b0SSuyog Pawar                             CLIP_S16(((e[1] - o[1] + add) >> shift));
158*c83a76b0SSuyog Pawar             pi2_tmp[3] =
159*c83a76b0SSuyog Pawar                             CLIP_S16(((e[0] - o[0] + add) >> shift));
160*c83a76b0SSuyog Pawar 
161*c83a76b0SSuyog Pawar         }
162*c83a76b0SSuyog Pawar         pi2_src++;
163*c83a76b0SSuyog Pawar         pi2_tmp += trans_size;
164*c83a76b0SSuyog Pawar         zero_cols = zero_cols >> 1;
165*c83a76b0SSuyog Pawar     }
166*c83a76b0SSuyog Pawar 
167*c83a76b0SSuyog Pawar     pi2_tmp = pi2_tmp_orig;
168*c83a76b0SSuyog Pawar 
169*c83a76b0SSuyog Pawar     /* Inverse Transform 2nd stage */
170*c83a76b0SSuyog Pawar     shift = IT_SHIFT_STAGE_2;
171*c83a76b0SSuyog Pawar     add = 1 << (shift - 1);
172*c83a76b0SSuyog Pawar 
173*c83a76b0SSuyog Pawar     for(j = 0; j < trans_size; j++)
174*c83a76b0SSuyog Pawar     {
175*c83a76b0SSuyog Pawar         WORD32 itrans_out;
176*c83a76b0SSuyog Pawar         /* Utilizing symmetry properties to the maximum to minimize the number of multiplications */
177*c83a76b0SSuyog Pawar         o[0] = g_ai2_ihevc_trans_4[1][0] * pi2_tmp[trans_size]
178*c83a76b0SSuyog Pawar                         + g_ai2_ihevc_trans_4[3][0] * pi2_tmp[3 * trans_size];
179*c83a76b0SSuyog Pawar         o[1] = g_ai2_ihevc_trans_4[1][1] * pi2_tmp[trans_size]
180*c83a76b0SSuyog Pawar                         + g_ai2_ihevc_trans_4[3][1] * pi2_tmp[3 * trans_size];
181*c83a76b0SSuyog Pawar         e[0] = g_ai2_ihevc_trans_4[0][0] * pi2_tmp[0]
182*c83a76b0SSuyog Pawar                         + g_ai2_ihevc_trans_4[2][0] * pi2_tmp[2 * trans_size];
183*c83a76b0SSuyog Pawar         e[1] = g_ai2_ihevc_trans_4[0][1] * pi2_tmp[0]
184*c83a76b0SSuyog Pawar                         + g_ai2_ihevc_trans_4[2][1] * pi2_tmp[2 * trans_size];
185*c83a76b0SSuyog Pawar 
186*c83a76b0SSuyog Pawar         itrans_out =
187*c83a76b0SSuyog Pawar                         CLIP_S16(((e[0] + o[0] + add) >> shift));
188*c83a76b0SSuyog Pawar         pu1_dst[0 * 2] = CLIP_U8((itrans_out + pu1_pred[0 * 2]));
189*c83a76b0SSuyog Pawar         itrans_out =
190*c83a76b0SSuyog Pawar                         CLIP_S16(((e[1] + o[1] + add) >> shift));
191*c83a76b0SSuyog Pawar         pu1_dst[1 * 2] = CLIP_U8((itrans_out + pu1_pred[1 * 2]));
192*c83a76b0SSuyog Pawar         itrans_out =
193*c83a76b0SSuyog Pawar                         CLIP_S16(((e[1] - o[1] + add) >> shift));
194*c83a76b0SSuyog Pawar         pu1_dst[2 * 2] = CLIP_U8((itrans_out + pu1_pred[2 * 2]));
195*c83a76b0SSuyog Pawar         itrans_out =
196*c83a76b0SSuyog Pawar                         CLIP_S16(((e[0] - o[0] + add) >> shift));
197*c83a76b0SSuyog Pawar         pu1_dst[3 * 2] = CLIP_U8((itrans_out + pu1_pred[3 * 2]));
198*c83a76b0SSuyog Pawar 
199*c83a76b0SSuyog Pawar         pi2_tmp++;
200*c83a76b0SSuyog Pawar         pu1_pred += pred_strd;
201*c83a76b0SSuyog Pawar         pu1_dst += dst_strd;
202*c83a76b0SSuyog Pawar 
203*c83a76b0SSuyog Pawar     }
204*c83a76b0SSuyog Pawar }
205*c83a76b0SSuyog Pawar 
206