1*c83a76b0SSuyog Pawar /******************************************************************************
2*c83a76b0SSuyog Pawar *
3*c83a76b0SSuyog Pawar * Copyright (C) 2018 The Android Open Source Project
4*c83a76b0SSuyog Pawar *
5*c83a76b0SSuyog Pawar * Licensed under the Apache License, Version 2.0 (the "License");
6*c83a76b0SSuyog Pawar * you may not use this file except in compliance with the License.
7*c83a76b0SSuyog Pawar * You may obtain a copy of the License at:
8*c83a76b0SSuyog Pawar *
9*c83a76b0SSuyog Pawar * http://www.apache.org/licenses/LICENSE-2.0
10*c83a76b0SSuyog Pawar *
11*c83a76b0SSuyog Pawar * Unless required by applicable law or agreed to in writing, software
12*c83a76b0SSuyog Pawar * distributed under the License is distributed on an "AS IS" BASIS,
13*c83a76b0SSuyog Pawar * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14*c83a76b0SSuyog Pawar * See the License for the specific language governing permissions and
15*c83a76b0SSuyog Pawar * limitations under the License.
16*c83a76b0SSuyog Pawar *
17*c83a76b0SSuyog Pawar *****************************************************************************
18*c83a76b0SSuyog Pawar * Originally developed and contributed by Ittiam Systems Pvt. Ltd, Bangalore
19*c83a76b0SSuyog Pawar */
20*c83a76b0SSuyog Pawar /**
21*c83a76b0SSuyog Pawar ******************************************************************************
22*c83a76b0SSuyog Pawar * @file ihevce_bs_compute_ctb.c
23*c83a76b0SSuyog Pawar *
24*c83a76b0SSuyog Pawar * @brief
25*c83a76b0SSuyog Pawar * This file contains functions needed for boundary strength calculation
26*c83a76b0SSuyog Pawar *
27*c83a76b0SSuyog Pawar * @author
28*c83a76b0SSuyog Pawar * ittiam
29*c83a76b0SSuyog Pawar *
30*c83a76b0SSuyog Pawar * @List of Functions
31*c83a76b0SSuyog Pawar * ihevce_bs_init_ctb()
32*c83a76b0SSuyog Pawar * ihevce_bs_compute_ctb()
33*c83a76b0SSuyog Pawar * ihevce_bs_clear_invalid()
34*c83a76b0SSuyog Pawar *
35*c83a76b0SSuyog Pawar ******************************************************************************
36*c83a76b0SSuyog Pawar */
37*c83a76b0SSuyog Pawar
38*c83a76b0SSuyog Pawar /*****************************************************************************/
39*c83a76b0SSuyog Pawar /* File Includes */
40*c83a76b0SSuyog Pawar /*****************************************************************************/
41*c83a76b0SSuyog Pawar /* System include files */
42*c83a76b0SSuyog Pawar #include <stdio.h>
43*c83a76b0SSuyog Pawar #include <string.h>
44*c83a76b0SSuyog Pawar #include <stdlib.h>
45*c83a76b0SSuyog Pawar #include <assert.h>
46*c83a76b0SSuyog Pawar #include <stdarg.h>
47*c83a76b0SSuyog Pawar #include <math.h>
48*c83a76b0SSuyog Pawar
49*c83a76b0SSuyog Pawar /* User include files */
50*c83a76b0SSuyog Pawar #include "ihevc_typedefs.h"
51*c83a76b0SSuyog Pawar #include "itt_video_api.h"
52*c83a76b0SSuyog Pawar #include "ihevce_api.h"
53*c83a76b0SSuyog Pawar
54*c83a76b0SSuyog Pawar #include "rc_cntrl_param.h"
55*c83a76b0SSuyog Pawar #include "rc_frame_info_collector.h"
56*c83a76b0SSuyog Pawar #include "rc_look_ahead_params.h"
57*c83a76b0SSuyog Pawar
58*c83a76b0SSuyog Pawar #include "ihevc_defs.h"
59*c83a76b0SSuyog Pawar #include "ihevc_structs.h"
60*c83a76b0SSuyog Pawar #include "ihevc_platform_macros.h"
61*c83a76b0SSuyog Pawar #include "ihevc_deblk.h"
62*c83a76b0SSuyog Pawar #include "ihevc_itrans_recon.h"
63*c83a76b0SSuyog Pawar #include "ihevc_chroma_itrans_recon.h"
64*c83a76b0SSuyog Pawar #include "ihevc_chroma_intra_pred.h"
65*c83a76b0SSuyog Pawar #include "ihevc_intra_pred.h"
66*c83a76b0SSuyog Pawar #include "ihevc_inter_pred.h"
67*c83a76b0SSuyog Pawar #include "ihevc_mem_fns.h"
68*c83a76b0SSuyog Pawar #include "ihevc_padding.h"
69*c83a76b0SSuyog Pawar #include "ihevc_weighted_pred.h"
70*c83a76b0SSuyog Pawar #include "ihevc_sao.h"
71*c83a76b0SSuyog Pawar #include "ihevc_resi_trans.h"
72*c83a76b0SSuyog Pawar #include "ihevc_quant_iquant_ssd.h"
73*c83a76b0SSuyog Pawar #include "ihevc_cabac_tables.h"
74*c83a76b0SSuyog Pawar
75*c83a76b0SSuyog Pawar #include "ihevce_defs.h"
76*c83a76b0SSuyog Pawar #include "ihevce_lap_enc_structs.h"
77*c83a76b0SSuyog Pawar #include "ihevce_multi_thrd_structs.h"
78*c83a76b0SSuyog Pawar #include "ihevce_me_common_defs.h"
79*c83a76b0SSuyog Pawar #include "ihevce_had_satd.h"
80*c83a76b0SSuyog Pawar #include "ihevce_error_codes.h"
81*c83a76b0SSuyog Pawar #include "ihevce_bitstream.h"
82*c83a76b0SSuyog Pawar #include "ihevce_cabac.h"
83*c83a76b0SSuyog Pawar #include "ihevce_rdoq_macros.h"
84*c83a76b0SSuyog Pawar #include "ihevce_function_selector.h"
85*c83a76b0SSuyog Pawar #include "ihevce_enc_structs.h"
86*c83a76b0SSuyog Pawar #include "ihevce_entropy_structs.h"
87*c83a76b0SSuyog Pawar #include "ihevce_cmn_utils_instr_set_router.h"
88*c83a76b0SSuyog Pawar #include "ihevce_enc_loop_structs.h"
89*c83a76b0SSuyog Pawar #include "ihevce_bs_compute_ctb.h"
90*c83a76b0SSuyog Pawar #include "ihevce_global_tables.h"
91*c83a76b0SSuyog Pawar
92*c83a76b0SSuyog Pawar /*****************************************************************************/
93*c83a76b0SSuyog Pawar /* Global Tables */
94*c83a76b0SSuyog Pawar /*****************************************************************************/
95*c83a76b0SSuyog Pawar // clang-format off
96*c83a76b0SSuyog Pawar UWORD16 gau2_bs_table[2][8] =
97*c83a76b0SSuyog Pawar {
98*c83a76b0SSuyog Pawar { BS_INTRA_4, BS_INTRA_8, BS_INVALID, BS_INTRA_16, BS_INVALID, BS_INVALID, BS_INVALID, BS_INTRA_32 },
99*c83a76b0SSuyog Pawar { BS_CBF_4, BS_CBF_8, BS_INVALID, BS_CBF_16, BS_INVALID, BS_INVALID, BS_INVALID, BS_CBF_32 }
100*c83a76b0SSuyog Pawar };
101*c83a76b0SSuyog Pawar // clang-format on
102*c83a76b0SSuyog Pawar
103*c83a76b0SSuyog Pawar /*****************************************************************************/
104*c83a76b0SSuyog Pawar /* Function Definitions */
105*c83a76b0SSuyog Pawar /*****************************************************************************/
106*c83a76b0SSuyog Pawar
107*c83a76b0SSuyog Pawar /**
108*c83a76b0SSuyog Pawar *******************************************************************************
109*c83a76b0SSuyog Pawar *
110*c83a76b0SSuyog Pawar * @brief Initialize the Boundary Strength at a CTB level
111*c83a76b0SSuyog Pawar *
112*c83a76b0SSuyog Pawar * @par Description
113*c83a76b0SSuyog Pawar * Initialize the Boundary Strength at a CTB level to zeros*
114*c83a76b0SSuyog Pawar *
115*c83a76b0SSuyog Pawar * @param[out] ps_deblk_prms
116*c83a76b0SSuyog Pawar * Pointer to structure s_deblk_prms, which contains
117*c83a76b0SSuyog Pawar * s_deblk_prms.au4_horz_bs : max of 8 such conti. bs to be comp. for 64x64 ctb
118*c83a76b0SSuyog Pawar * s_deblk_prms.au4_vert_bs : max of 8 such conti. bs to be comp. for 64x64 ctb
119*c83a76b0SSuyog Pawar *
120*c83a76b0SSuyog Pawar * @param[in] ctb_size
121*c83a76b0SSuyog Pawar * Size in pels (can be 16, 32 or 64)
122*c83a76b0SSuyog Pawar *
123*c83a76b0SSuyog Pawar * @returns none
124*c83a76b0SSuyog Pawar *
125*c83a76b0SSuyog Pawar * @remarks
126*c83a76b0SSuyog Pawar *
127*c83a76b0SSuyog Pawar *******************************************************************************
128*c83a76b0SSuyog Pawar */
ihevce_bs_init_ctb(deblk_bs_ctb_ctxt_t * ps_deblk_prms,frm_ctb_ctxt_t * ps_frm_ctb_prms,WORD32 ctb_ctr,WORD32 vert_ctr)129*c83a76b0SSuyog Pawar void ihevce_bs_init_ctb(
130*c83a76b0SSuyog Pawar deblk_bs_ctb_ctxt_t *ps_deblk_prms,
131*c83a76b0SSuyog Pawar frm_ctb_ctxt_t *ps_frm_ctb_prms,
132*c83a76b0SSuyog Pawar WORD32 ctb_ctr,
133*c83a76b0SSuyog Pawar WORD32 vert_ctr)
134*c83a76b0SSuyog Pawar {
135*c83a76b0SSuyog Pawar WORD32 ctb_size = ps_frm_ctb_prms->i4_ctb_size;
136*c83a76b0SSuyog Pawar
137*c83a76b0SSuyog Pawar /* Pointer to the array to store the packed BS values in horizontal dir. */
138*c83a76b0SSuyog Pawar UWORD32 *pu4_horz_bs = &ps_deblk_prms->au4_horz_bs[0];
139*c83a76b0SSuyog Pawar /* Pointer to the array to store the packed BS values in vertical dir. */
140*c83a76b0SSuyog Pawar UWORD32 *pu4_vert_bs = &ps_deblk_prms->au4_vert_bs[0];
141*c83a76b0SSuyog Pawar
142*c83a76b0SSuyog Pawar WORD32 i4_top_ctb_tile_id, i4_left_ctb_tile_id;
143*c83a76b0SSuyog Pawar WORD32 *pi4_tile_id_map_temp;
144*c83a76b0SSuyog Pawar
145*c83a76b0SSuyog Pawar pi4_tile_id_map_temp = ps_frm_ctb_prms->pi4_tile_id_map +
146*c83a76b0SSuyog Pawar vert_ctr * ps_frm_ctb_prms->i4_tile_id_ctb_map_stride + ctb_ctr;
147*c83a76b0SSuyog Pawar
148*c83a76b0SSuyog Pawar i4_left_ctb_tile_id = *(pi4_tile_id_map_temp - 1);
149*c83a76b0SSuyog Pawar i4_top_ctb_tile_id = *(pi4_tile_id_map_temp - ps_frm_ctb_prms->i4_tile_id_ctb_map_stride);
150*c83a76b0SSuyog Pawar
151*c83a76b0SSuyog Pawar ps_deblk_prms->u1_not_first_ctb_row_of_frame = (i4_top_ctb_tile_id != -1);
152*c83a76b0SSuyog Pawar ps_deblk_prms->u1_not_first_ctb_col_of_frame = (i4_left_ctb_tile_id != -1);
153*c83a76b0SSuyog Pawar
154*c83a76b0SSuyog Pawar /* BS should be set to NULL in the following cases
155*c83a76b0SSuyog Pawar Frame boundaries
156*c83a76b0SSuyog Pawar Edges if deblocking is disabled by disable_deblocking_filter_flag
157*c83a76b0SSuyog Pawar Slice boundaries if deblocking across slices is disabled
158*c83a76b0SSuyog Pawar Tile boundaries if deblocking across slices is disabled
159*c83a76b0SSuyog Pawar These are not considered now, except the frame boundary
160*c83a76b0SSuyog Pawar */
161*c83a76b0SSuyog Pawar
162*c83a76b0SSuyog Pawar /* Initializing the bs array to 0. array size = (ctb_size/8 + 1)*4 bytes */
163*c83a76b0SSuyog Pawar memset(pu4_horz_bs, 0, ((ctb_size >> 3) + 1) * sizeof(UWORD32));
164*c83a76b0SSuyog Pawar memset(pu4_vert_bs, 0, ((ctb_size >> 3) + 1) * sizeof(UWORD32));
165*c83a76b0SSuyog Pawar }
166*c83a76b0SSuyog Pawar
/**
*******************************************************************************
*
* @brief Calculate the Boundary Strength at CU level
*
* @par Description
*  Calculate the Boundary Strength at CU level
*
* @param[in] ps_cu_final
*  Pointer to the final CU structure, of which we use the following values
*   u2_num_tus_in_cu  : Total TUs in this CU
*   ps_enc_tu         : Pointer to first TU of this CU. Each TU needs to be
*                       populated in TU order.
*   b1_pred_mode_flag : The prediction mode flag for the CU
*   b4_cu_size        : CU size in terms of min CU (8x8) units
*   b3_cu_pos_x       : X position of CU in current CTB, in (8x8) units
*   b3_cu_pos_y       : Y position of CU in current CTB, in (8x8) units
*   b3_part_mode      : Partition information for CU. For inter 0 : @sa PART_SIZE_E
*   ps_pu             : Pointer to first PU of this CU
*
* @param[in] ps_top_nbr_4x4
*  Pointer to top 4x4 CU nbr structure
*
* @param[in] ps_left_nbr_4x4
*  Pointer to left 4x4 CU nbr structure
*
* @param[in] ps_curr_nbr_4x4
*  Pointer to current 4x4 ctb structure
*
* @param[in] nbr_4x4_left_strd
*  Left nbr buffer stride in terms of 4x4 units
*
* @param[in] num_4x4_in_ctb
*  Current buffer stride in terms of 4x4 units
*
* @param[out] ps_deblk_prms
*  Pointer to structure s_deblk_prms, which contains
*   s_deblk_prms.au4_horz_bs : max of 8 such contiguous BS to be computed for a 64x64 ctb
*   s_deblk_prms.au4_vert_bs : max of 8 such contiguous BS to be computed for a 64x64 ctb
*
* @returns none
*
* @remarks
*  1 : All 4 edges are set for a TU or PU block, which is inefficient because
*      it a) may set the BS twice and b) sets the frame/slice boundaries
*  2 : BS is always updated using bit-wise OR, which may also set BS to 3
*      (deblocking should treat it as 2)
*
*******************************************************************************
*/
ihevce_bs_compute_cu(cu_enc_loop_out_t * ps_cu_final,nbr_4x4_t * ps_top_nbr_4x4,nbr_4x4_t * ps_left_nbr_4x4,nbr_4x4_t * ps_curr_nbr_4x4,WORD32 nbr_4x4_left_strd,WORD32 num_4x4_in_ctb,deblk_bs_ctb_ctxt_t * ps_deblk_prms)217*c83a76b0SSuyog Pawar void ihevce_bs_compute_cu(
218*c83a76b0SSuyog Pawar cu_enc_loop_out_t *ps_cu_final,
219*c83a76b0SSuyog Pawar nbr_4x4_t *ps_top_nbr_4x4,
220*c83a76b0SSuyog Pawar nbr_4x4_t *ps_left_nbr_4x4,
221*c83a76b0SSuyog Pawar nbr_4x4_t *ps_curr_nbr_4x4,
222*c83a76b0SSuyog Pawar WORD32 nbr_4x4_left_strd,
223*c83a76b0SSuyog Pawar WORD32 num_4x4_in_ctb,
224*c83a76b0SSuyog Pawar deblk_bs_ctb_ctxt_t *ps_deblk_prms)
225*c83a76b0SSuyog Pawar {
226*c83a76b0SSuyog Pawar WORD32 i;
227*c83a76b0SSuyog Pawar WORD32 j;
228*c83a76b0SSuyog Pawar /* copy required arguments from pointer to CU structure */
229*c83a76b0SSuyog Pawar /* Total TUs in this CU */
230*c83a76b0SSuyog Pawar UWORD16 u2_num_tus_in_cu = ps_cu_final->u2_num_tus_in_cu;
231*c83a76b0SSuyog Pawar /* Pointer to first tu of this cu */
232*c83a76b0SSuyog Pawar tu_enc_loop_out_t *ps_enc_tu = ps_cu_final->ps_enc_tu;
233*c83a76b0SSuyog Pawar /* The prediction mode flag for the CU */
234*c83a76b0SSuyog Pawar UWORD32 u4_pred_mode_flag = ps_cu_final->b1_pred_mode_flag;
235*c83a76b0SSuyog Pawar /* X Position of CU in current ctb in (8x8) units */
236*c83a76b0SSuyog Pawar WORD32 cu_pos_x = ps_cu_final->b3_cu_pos_x;
237*c83a76b0SSuyog Pawar /* Y Position of CU in current ctb in (8x8) units */
238*c83a76b0SSuyog Pawar WORD32 cu_pos_y = ps_cu_final->b3_cu_pos_y;
239*c83a76b0SSuyog Pawar
240*c83a76b0SSuyog Pawar /* Indicates partition information for CU */
241*c83a76b0SSuyog Pawar UWORD32 u4_part_mode = ps_cu_final->b3_part_mode;
242*c83a76b0SSuyog Pawar
243*c83a76b0SSuyog Pawar /* Pointer to first pu of this cu */
244*c83a76b0SSuyog Pawar pu_t *ps_pu = ps_cu_final->ps_pu;
245*c83a76b0SSuyog Pawar
246*c83a76b0SSuyog Pawar /* Number of pus in current cu */
247*c83a76b0SSuyog Pawar WORD32 num_pus_in_cu;
248*c83a76b0SSuyog Pawar /* Pointer to the array to store the packed BS values in horizontal dir. */
249*c83a76b0SSuyog Pawar UWORD32 *pu4_horz_bs = &ps_deblk_prms->au4_horz_bs[0];
250*c83a76b0SSuyog Pawar /* Pointer to the array to store the packed BS values in vertical dir. */
251*c83a76b0SSuyog Pawar UWORD32 *pu4_vert_bs = &ps_deblk_prms->au4_vert_bs[0];
252*c83a76b0SSuyog Pawar
253*c83a76b0SSuyog Pawar (void)ps_curr_nbr_4x4;
254*c83a76b0SSuyog Pawar (void)num_4x4_in_ctb;
255*c83a76b0SSuyog Pawar
256*c83a76b0SSuyog Pawar /* CTB boundary case setting the BS for intra and cbf non zero case for CU top edge */
257*c83a76b0SSuyog Pawar if((ps_deblk_prms->u1_not_first_ctb_row_of_frame) && (0 == ps_cu_final->b3_cu_pos_y))
258*c83a76b0SSuyog Pawar {
259*c83a76b0SSuyog Pawar nbr_4x4_t *ps_nbr_4x4;
260*c83a76b0SSuyog Pawar UWORD32 u4_temp_bs = *pu4_horz_bs;
261*c83a76b0SSuyog Pawar WORD32 horz_bit_offset;
262*c83a76b0SSuyog Pawar WORD32 ctr;
263*c83a76b0SSuyog Pawar
264*c83a76b0SSuyog Pawar /* every 4x4 takes 2 bits in the register this is taken care in the loop */
265*c83a76b0SSuyog Pawar /* deriving 4x4 position */
266*c83a76b0SSuyog Pawar horz_bit_offset = (ps_cu_final->b3_cu_pos_x << 3) >> 2;
267*c83a76b0SSuyog Pawar
268*c83a76b0SSuyog Pawar /* scanning through each 4x4 csb along horizontal direction */
269*c83a76b0SSuyog Pawar for(ctr = 0; ctr < ((ps_cu_final->b4_cu_size << 3) >> 2); ctr++)
270*c83a76b0SSuyog Pawar {
271*c83a76b0SSuyog Pawar ps_nbr_4x4 = ps_top_nbr_4x4 + ctr;
272*c83a76b0SSuyog Pawar if(ps_nbr_4x4->b1_intra_flag)
273*c83a76b0SSuyog Pawar {
274*c83a76b0SSuyog Pawar /* To store in BigEnd. format. BS[0]|BS[1]| .. |BS[15] */
275*c83a76b0SSuyog Pawar u4_temp_bs = (u4_temp_bs | (2U << (30 - 2 * (ctr + horz_bit_offset))));
276*c83a76b0SSuyog Pawar }
277*c83a76b0SSuyog Pawar else if(ps_nbr_4x4->b1_y_cbf)
278*c83a76b0SSuyog Pawar {
279*c83a76b0SSuyog Pawar /* To store in BigEnd. format. BS[0]|BS[1]| .. |BS[15] */
280*c83a76b0SSuyog Pawar u4_temp_bs = (u4_temp_bs | (1 << (30 - 2 * (ctr + horz_bit_offset))));
281*c83a76b0SSuyog Pawar }
282*c83a76b0SSuyog Pawar }
283*c83a76b0SSuyog Pawar
284*c83a76b0SSuyog Pawar /* storing the BS computed for first row based on top ctb CUs */
285*c83a76b0SSuyog Pawar *(pu4_horz_bs) = u4_temp_bs;
286*c83a76b0SSuyog Pawar }
287*c83a76b0SSuyog Pawar
288*c83a76b0SSuyog Pawar /* CTB boundary case setting the BS for intra and cbf non zero case for CU left edge */
289*c83a76b0SSuyog Pawar if((ps_deblk_prms->u1_not_first_ctb_col_of_frame) && (0 == ps_cu_final->b3_cu_pos_x))
290*c83a76b0SSuyog Pawar {
291*c83a76b0SSuyog Pawar nbr_4x4_t *ps_nbr_4x4;
292*c83a76b0SSuyog Pawar UWORD32 u4_temp_bs = *pu4_vert_bs;
293*c83a76b0SSuyog Pawar WORD32 vert_bit_offset;
294*c83a76b0SSuyog Pawar WORD32 ctr;
295*c83a76b0SSuyog Pawar
296*c83a76b0SSuyog Pawar /* every 4x4 takes 2 bits in the register this is taken care in the loop */
297*c83a76b0SSuyog Pawar /* deriving 4x4 position */
298*c83a76b0SSuyog Pawar vert_bit_offset = (ps_cu_final->b3_cu_pos_y << 3) >> 2;
299*c83a76b0SSuyog Pawar
300*c83a76b0SSuyog Pawar /* scanning through each 4x4 csb along vertical direction */
301*c83a76b0SSuyog Pawar for(ctr = 0; ctr < ((ps_cu_final->b4_cu_size << 3) >> 2); ctr++)
302*c83a76b0SSuyog Pawar {
303*c83a76b0SSuyog Pawar ps_nbr_4x4 = ps_left_nbr_4x4 + ctr * nbr_4x4_left_strd;
304*c83a76b0SSuyog Pawar if(ps_nbr_4x4->b1_intra_flag)
305*c83a76b0SSuyog Pawar {
306*c83a76b0SSuyog Pawar /* To store in BigEnd. format. BS[0]|BS[1]| .. |BS[15] */
307*c83a76b0SSuyog Pawar u4_temp_bs = (u4_temp_bs | (2U << (30 - 2 * (ctr + vert_bit_offset))));
308*c83a76b0SSuyog Pawar }
309*c83a76b0SSuyog Pawar else if(ps_nbr_4x4->b1_y_cbf)
310*c83a76b0SSuyog Pawar {
311*c83a76b0SSuyog Pawar /* To store in BigEnd. format. BS[0]|BS[1]| .. |BS[15] */
312*c83a76b0SSuyog Pawar u4_temp_bs = (u4_temp_bs | (1 << (30 - 2 * (ctr + vert_bit_offset))));
313*c83a76b0SSuyog Pawar }
314*c83a76b0SSuyog Pawar }
315*c83a76b0SSuyog Pawar
316*c83a76b0SSuyog Pawar /* storing the BS computed for first col based on left ctb Cus */
317*c83a76b0SSuyog Pawar *(pu4_vert_bs) = u4_temp_bs;
318*c83a76b0SSuyog Pawar }
319*c83a76b0SSuyog Pawar
320*c83a76b0SSuyog Pawar /* Passes through each TU inside the CU */
321*c83a76b0SSuyog Pawar for(i = 0; i < u2_num_tus_in_cu; i++)
322*c83a76b0SSuyog Pawar {
323*c83a76b0SSuyog Pawar UWORD32 u4_tu_pos_x, u4_tu_pos_y;
324*c83a76b0SSuyog Pawar UWORD32 u4_tu_size;
325*c83a76b0SSuyog Pawar UWORD32 *pu4_tu_top_edge;
326*c83a76b0SSuyog Pawar UWORD32 *pu4_tu_bottom_edge;
327*c83a76b0SSuyog Pawar UWORD32 *pu4_tu_left_edge;
328*c83a76b0SSuyog Pawar UWORD32 *pu4_tu_right_edge;
329*c83a76b0SSuyog Pawar UWORD32 u4_bs_value;
330*c83a76b0SSuyog Pawar WORD32 set_bs_flag = 0;
331*c83a76b0SSuyog Pawar WORD32 tbl_idx = 1;
332*c83a76b0SSuyog Pawar
333*c83a76b0SSuyog Pawar /* TU_size calculation */
334*c83a76b0SSuyog Pawar u4_tu_size = 1 << ((ps_enc_tu->s_tu.b3_size) + 2);
335*c83a76b0SSuyog Pawar
336*c83a76b0SSuyog Pawar /* TU X position in terms of min TU (4x4) units wrt ctb */
337*c83a76b0SSuyog Pawar u4_tu_pos_x = ps_enc_tu->s_tu.b4_pos_x;
338*c83a76b0SSuyog Pawar /* TU Y position in terms of min TU (4x4) units wrt ctb */
339*c83a76b0SSuyog Pawar u4_tu_pos_y = ps_enc_tu->s_tu.b4_pos_y;
340*c83a76b0SSuyog Pawar
341*c83a76b0SSuyog Pawar /* pointers to the edges of current TU */
342*c83a76b0SSuyog Pawar pu4_tu_top_edge = pu4_horz_bs + (u4_tu_pos_y >> 1);
343*c83a76b0SSuyog Pawar pu4_tu_bottom_edge = pu4_horz_bs + ((u4_tu_pos_y + 1) >> 1) + (u4_tu_size >> 3);
344*c83a76b0SSuyog Pawar pu4_tu_left_edge = pu4_vert_bs + (u4_tu_pos_x >> 1);
345*c83a76b0SSuyog Pawar pu4_tu_right_edge = pu4_vert_bs + ((u4_tu_pos_x + 1) >> 1) + (u4_tu_size >> 3);
346*c83a76b0SSuyog Pawar
347*c83a76b0SSuyog Pawar /* chooose the table index based on pred_mode */
348*c83a76b0SSuyog Pawar if(PRED_MODE_INTRA == u4_pred_mode_flag)
349*c83a76b0SSuyog Pawar {
350*c83a76b0SSuyog Pawar tbl_idx = 0;
351*c83a76b0SSuyog Pawar }
352*c83a76b0SSuyog Pawar
353*c83a76b0SSuyog Pawar /* get the BS value from table if required */
354*c83a76b0SSuyog Pawar if((ps_enc_tu->s_tu.b1_y_cbf) || (PRED_MODE_INTRA == u4_pred_mode_flag))
355*c83a76b0SSuyog Pawar {
356*c83a76b0SSuyog Pawar set_bs_flag = 1;
357*c83a76b0SSuyog Pawar u4_bs_value = gau2_bs_table[tbl_idx][(u4_tu_size >> 2) - 1];
358*c83a76b0SSuyog Pawar }
359*c83a76b0SSuyog Pawar
360*c83a76b0SSuyog Pawar if(1 == set_bs_flag)
361*c83a76b0SSuyog Pawar {
362*c83a76b0SSuyog Pawar /* Store the BS value */
363*c83a76b0SSuyog Pawar if(4 == u4_tu_size)
364*c83a76b0SSuyog Pawar {
365*c83a76b0SSuyog Pawar if(0 == (u4_tu_pos_y & 1))
366*c83a76b0SSuyog Pawar {
367*c83a76b0SSuyog Pawar /* Only top TU edge came on a 8 pixel bounadey */
368*c83a76b0SSuyog Pawar SET_VALUE_BIG((pu4_tu_top_edge), u4_bs_value, u4_tu_pos_x, u4_tu_size);
369*c83a76b0SSuyog Pawar }
370*c83a76b0SSuyog Pawar else
371*c83a76b0SSuyog Pawar {
372*c83a76b0SSuyog Pawar /* Only bottom TU edge came on a 8 pixel bounadey */
373*c83a76b0SSuyog Pawar SET_VALUE_BIG((pu4_tu_bottom_edge), u4_bs_value, u4_tu_pos_x, u4_tu_size);
374*c83a76b0SSuyog Pawar }
375*c83a76b0SSuyog Pawar if(0 == (u4_tu_pos_x & 1))
376*c83a76b0SSuyog Pawar {
377*c83a76b0SSuyog Pawar /* Only left TU edge came on a 8 pixel bounadey */
378*c83a76b0SSuyog Pawar SET_VALUE_BIG((pu4_tu_left_edge), u4_bs_value, u4_tu_pos_y, u4_tu_size);
379*c83a76b0SSuyog Pawar }
380*c83a76b0SSuyog Pawar else
381*c83a76b0SSuyog Pawar {
382*c83a76b0SSuyog Pawar /* Only right TU edge came on a 8 pixel bounadey */
383*c83a76b0SSuyog Pawar SET_VALUE_BIG((pu4_tu_right_edge), u4_bs_value, u4_tu_pos_y, u4_tu_size);
384*c83a76b0SSuyog Pawar }
385*c83a76b0SSuyog Pawar }
386*c83a76b0SSuyog Pawar /* set all edges for other TU sizes */
387*c83a76b0SSuyog Pawar else
388*c83a76b0SSuyog Pawar {
389*c83a76b0SSuyog Pawar /* setting top TU edge */
390*c83a76b0SSuyog Pawar SET_VALUE_BIG((pu4_tu_top_edge), u4_bs_value, u4_tu_pos_x, u4_tu_size);
391*c83a76b0SSuyog Pawar /* setting bottom TU edge */
392*c83a76b0SSuyog Pawar SET_VALUE_BIG((pu4_tu_bottom_edge), u4_bs_value, u4_tu_pos_x, u4_tu_size);
393*c83a76b0SSuyog Pawar /* setting left TU edge */
394*c83a76b0SSuyog Pawar SET_VALUE_BIG((pu4_tu_left_edge), u4_bs_value, u4_tu_pos_y, u4_tu_size);
395*c83a76b0SSuyog Pawar /* setting right TU edge */
396*c83a76b0SSuyog Pawar SET_VALUE_BIG((pu4_tu_right_edge), u4_bs_value, u4_tu_pos_y, u4_tu_size);
397*c83a76b0SSuyog Pawar }
398*c83a76b0SSuyog Pawar }
399*c83a76b0SSuyog Pawar
400*c83a76b0SSuyog Pawar /* point to next TU inside CU in TU order */
401*c83a76b0SSuyog Pawar ps_enc_tu++;
402*c83a76b0SSuyog Pawar }
403*c83a76b0SSuyog Pawar
404*c83a76b0SSuyog Pawar if(PRED_MODE_INTRA == u4_pred_mode_flag)
405*c83a76b0SSuyog Pawar {
406*c83a76b0SSuyog Pawar /* no mv based BS computation in INTRA case */
407*c83a76b0SSuyog Pawar return;
408*c83a76b0SSuyog Pawar }
409*c83a76b0SSuyog Pawar /* BS update due to PU mv.s */
410*c83a76b0SSuyog Pawar if(u4_part_mode == SIZE_2Nx2N) /* symmetric motion partition, 2Nx2N */
411*c83a76b0SSuyog Pawar {
412*c83a76b0SSuyog Pawar num_pus_in_cu = 1;
413*c83a76b0SSuyog Pawar }
414*c83a76b0SSuyog Pawar else if(u4_part_mode == SIZE_NxN) /* symmetric motion partition, NxN */
415*c83a76b0SSuyog Pawar {
416*c83a76b0SSuyog Pawar num_pus_in_cu = 4;
417*c83a76b0SSuyog Pawar }
418*c83a76b0SSuyog Pawar else /* other sym. or asym. partiotions */
419*c83a76b0SSuyog Pawar {
420*c83a76b0SSuyog Pawar num_pus_in_cu = 2;
421*c83a76b0SSuyog Pawar }
422*c83a76b0SSuyog Pawar
423*c83a76b0SSuyog Pawar /* Go through each PU inside CU in PU order and set the top & bottom */
424*c83a76b0SSuyog Pawar /* PU edge BS accordingly */
425*c83a76b0SSuyog Pawar for(i = 0; i < num_pus_in_cu; i++)
426*c83a76b0SSuyog Pawar {
427*c83a76b0SSuyog Pawar WORD32 k;
428*c83a76b0SSuyog Pawar /* X Position of PU in terms of min PU (4x4) units in current ctb */
429*c83a76b0SSuyog Pawar WORD32 pu_pos_x = ps_pu->b4_pos_x;
430*c83a76b0SSuyog Pawar /* Y Position of PU in terms of min PU (4x4) units in current ctb */
431*c83a76b0SSuyog Pawar WORD32 pu_pos_y = ps_pu->b4_pos_y;
432*c83a76b0SSuyog Pawar /* PU width in 4 pixel unit */
433*c83a76b0SSuyog Pawar WORD32 pu_wd = (ps_pu->b4_wd) + 1;
434*c83a76b0SSuyog Pawar /* PU height in 4 pixel unit */
435*c83a76b0SSuyog Pawar WORD32 pu_ht = (ps_pu->b4_ht) + 1;
436*c83a76b0SSuyog Pawar /* Pred L0 flag */
437*c83a76b0SSuyog Pawar WORD32 cur_pred_l0_flag;
438*c83a76b0SSuyog Pawar /* pointer to current PU */
439*c83a76b0SSuyog Pawar nbr_4x4_t *ps_curr_nbr_4x4_pu;
440*c83a76b0SSuyog Pawar
441*c83a76b0SSuyog Pawar /* go through each 4x4 block along the PU edges and do BS calculation */
442*c83a76b0SSuyog Pawar /* can optimize further with proper checks according to PU size */
443*c83a76b0SSuyog Pawar /* but in that case also @CTB boundary, we should go by 4x4 nbr.s only*/
444*c83a76b0SSuyog Pawar
445*c83a76b0SSuyog Pawar /* load cur. PU parameters */
446*c83a76b0SSuyog Pawar WORD8 i1_cur_l0_ref_pic_buf_id, i1_cur_l1_ref_pic_buf_id;
447*c83a76b0SSuyog Pawar WORD32 cur_mv_no;
448*c83a76b0SSuyog Pawar WORD16 i2_mv_x0, i2_mv_y0, i2_mv_x1, i2_mv_y1;
449*c83a76b0SSuyog Pawar
450*c83a76b0SSuyog Pawar ps_curr_nbr_4x4_pu = ps_curr_nbr_4x4 + (pu_pos_x - (cu_pos_x << 1)) +
451*c83a76b0SSuyog Pawar (pu_pos_y - (cu_pos_y << 1)) * num_4x4_in_ctb;
452*c83a76b0SSuyog Pawar
453*c83a76b0SSuyog Pawar cur_pred_l0_flag = ps_curr_nbr_4x4_pu->b1_pred_l0_flag;
454*c83a76b0SSuyog Pawar
455*c83a76b0SSuyog Pawar /* L0 & L1 unique ref. pic. id for cur. PU, (stored in upper 4 bits) */
456*c83a76b0SSuyog Pawar i1_cur_l0_ref_pic_buf_id = (ps_curr_nbr_4x4_pu->mv.i1_l0_ref_pic_buf_id);
457*c83a76b0SSuyog Pawar i1_cur_l1_ref_pic_buf_id = (ps_curr_nbr_4x4_pu->mv.i1_l1_ref_pic_buf_id);
458*c83a76b0SSuyog Pawar
459*c83a76b0SSuyog Pawar /* Number of motion vectors used for cur. PU */
460*c83a76b0SSuyog Pawar cur_mv_no = cur_pred_l0_flag + ps_curr_nbr_4x4_pu->b1_pred_l1_flag;
461*c83a76b0SSuyog Pawar
462*c83a76b0SSuyog Pawar /* x and y mv for L0 and L1, for cur. PU */
463*c83a76b0SSuyog Pawar i2_mv_x0 = ps_curr_nbr_4x4_pu->mv.s_l0_mv.i2_mvx;
464*c83a76b0SSuyog Pawar i2_mv_y0 = ps_curr_nbr_4x4_pu->mv.s_l0_mv.i2_mvy;
465*c83a76b0SSuyog Pawar i2_mv_x1 = ps_curr_nbr_4x4_pu->mv.s_l1_mv.i2_mvx;
466*c83a76b0SSuyog Pawar i2_mv_y1 = ps_curr_nbr_4x4_pu->mv.s_l1_mv.i2_mvy;
467*c83a76b0SSuyog Pawar
468*c83a76b0SSuyog Pawar /* two cases for updating TOP and LEFT edges respectively */
469*c83a76b0SSuyog Pawar /* k = 0 : TOP edge update, k = 1 : LEFT edge update */
470*c83a76b0SSuyog Pawar for(k = 0; k < 2; k++)
471*c83a76b0SSuyog Pawar {
472*c83a76b0SSuyog Pawar WORD32 pu_pos_pointer_calc, pu_pos_bit_calc;
473*c83a76b0SSuyog Pawar UWORD32 *pu4_pu_cur_edge;
474*c83a76b0SSuyog Pawar WORD32 pu_dim, nbr_inc;
475*c83a76b0SSuyog Pawar nbr_4x4_t *ps_nbr_4x4;
476*c83a76b0SSuyog Pawar
477*c83a76b0SSuyog Pawar /* TOP edge case */
478*c83a76b0SSuyog Pawar if(0 == k)
479*c83a76b0SSuyog Pawar {
480*c83a76b0SSuyog Pawar pu_pos_pointer_calc = pu_pos_y;
481*c83a76b0SSuyog Pawar pu_pos_bit_calc = pu_pos_x;
482*c83a76b0SSuyog Pawar pu4_pu_cur_edge = pu4_horz_bs + (pu_pos_y >> 1);
483*c83a76b0SSuyog Pawar pu_dim = pu_wd;
484*c83a76b0SSuyog Pawar
485*c83a76b0SSuyog Pawar /* top neighbours are accessed linearly */
486*c83a76b0SSuyog Pawar nbr_inc = 1;
487*c83a76b0SSuyog Pawar
488*c83a76b0SSuyog Pawar /* If the current 4x4 csb is in the first row of CTB */
489*c83a76b0SSuyog Pawar if(0 == pu_pos_pointer_calc)
490*c83a76b0SSuyog Pawar { /* then need to check if top CTB is physically available */
491*c83a76b0SSuyog Pawar /* (slice bound. are considered as availabale) */
492*c83a76b0SSuyog Pawar if(ps_deblk_prms->u1_not_first_ctb_row_of_frame)
493*c83a76b0SSuyog Pawar {
494*c83a76b0SSuyog Pawar ps_nbr_4x4 = ps_top_nbr_4x4 + (nbr_inc * (pu_pos_x - (cu_pos_x << 1)));
495*c83a76b0SSuyog Pawar }
496*c83a76b0SSuyog Pawar else
497*c83a76b0SSuyog Pawar {
498*c83a76b0SSuyog Pawar /* This is done for avoiding uninitialized memory access at pic. boundaries*/
499*c83a76b0SSuyog Pawar ps_nbr_4x4 = ps_curr_nbr_4x4_pu;
500*c83a76b0SSuyog Pawar }
501*c83a76b0SSuyog Pawar }
502*c83a76b0SSuyog Pawar /* within ctb, so top neighbour is available */
503*c83a76b0SSuyog Pawar else
504*c83a76b0SSuyog Pawar {
505*c83a76b0SSuyog Pawar ps_nbr_4x4 = ps_curr_nbr_4x4_pu - num_4x4_in_ctb;
506*c83a76b0SSuyog Pawar }
507*c83a76b0SSuyog Pawar }
508*c83a76b0SSuyog Pawar /* LEFT edge case */
509*c83a76b0SSuyog Pawar else
510*c83a76b0SSuyog Pawar {
511*c83a76b0SSuyog Pawar pu_pos_pointer_calc = pu_pos_x;
512*c83a76b0SSuyog Pawar pu_pos_bit_calc = pu_pos_y;
513*c83a76b0SSuyog Pawar pu4_pu_cur_edge = pu4_vert_bs + (pu_pos_x >> 1);
514*c83a76b0SSuyog Pawar pu_dim = pu_ht;
515*c83a76b0SSuyog Pawar
516*c83a76b0SSuyog Pawar /* left neighbours are accessed using stride */
517*c83a76b0SSuyog Pawar nbr_inc = nbr_4x4_left_strd;
518*c83a76b0SSuyog Pawar
519*c83a76b0SSuyog Pawar /* If the current 4x4 csb is in the first col of CTB */
520*c83a76b0SSuyog Pawar if(0 == pu_pos_pointer_calc)
521*c83a76b0SSuyog Pawar { /* then need to check if left CTB is available */
522*c83a76b0SSuyog Pawar if(ps_deblk_prms->u1_not_first_ctb_col_of_frame)
523*c83a76b0SSuyog Pawar {
524*c83a76b0SSuyog Pawar ps_nbr_4x4 = ps_left_nbr_4x4 + (nbr_inc * (pu_pos_y - (cu_pos_y << 1)));
525*c83a76b0SSuyog Pawar }
526*c83a76b0SSuyog Pawar else
527*c83a76b0SSuyog Pawar {
528*c83a76b0SSuyog Pawar /* This is done for avoiding uninitialized memory access at pic. boundaries*/
529*c83a76b0SSuyog Pawar ps_nbr_4x4 = ps_curr_nbr_4x4_pu;
530*c83a76b0SSuyog Pawar nbr_inc = num_4x4_in_ctb;
531*c83a76b0SSuyog Pawar }
532*c83a76b0SSuyog Pawar }
533*c83a76b0SSuyog Pawar /* within ctb, so left neighbour is available */
534*c83a76b0SSuyog Pawar else
535*c83a76b0SSuyog Pawar {
536*c83a76b0SSuyog Pawar ps_nbr_4x4 = ps_curr_nbr_4x4_pu - 1;
537*c83a76b0SSuyog Pawar nbr_inc = num_4x4_in_ctb;
538*c83a76b0SSuyog Pawar }
539*c83a76b0SSuyog Pawar }
540*c83a76b0SSuyog Pawar
541*c83a76b0SSuyog Pawar /* Only if the current edge falls on 8 pixel grid and ... */
542*c83a76b0SSuyog Pawar if(0 == (pu_pos_pointer_calc & 1))
543*c83a76b0SSuyog Pawar {
544*c83a76b0SSuyog Pawar /* go through the edge in 4x4 unit. Can be optimized */
545*c83a76b0SSuyog Pawar /* In that case special case for CTB boundary */
546*c83a76b0SSuyog Pawar for(j = 0; j < pu_dim; j++)
547*c83a76b0SSuyog Pawar {
548*c83a76b0SSuyog Pawar //nbr_4x4_t *ps_temp_nbr_4x4;
549*c83a76b0SSuyog Pawar
550*c83a76b0SSuyog Pawar /* ... and if the BS not set yet */
551*c83a76b0SSuyog Pawar if(0 == EXTRACT_VALUE_BIG(pu4_pu_cur_edge, (pu_pos_bit_calc + j)))
552*c83a76b0SSuyog Pawar {
553*c83a76b0SSuyog Pawar WORD8 i1_nbr_l0_ref_pic_buf_id, i1_nbr_l1_ref_pic_buf_id;
554*c83a76b0SSuyog Pawar WORD32 nbr_mv_no;
555*c83a76b0SSuyog Pawar WORD32 bs_flag = 0;
556*c83a76b0SSuyog Pawar WORD32 nbr_pred_l0_flag = ps_nbr_4x4->b1_pred_l0_flag;
557*c83a76b0SSuyog Pawar
558*c83a76b0SSuyog Pawar /* L0 & L1 unique ref. pic. id for nbr. csb, in upper 4 bits */
559*c83a76b0SSuyog Pawar i1_nbr_l0_ref_pic_buf_id = (ps_nbr_4x4->mv.i1_l0_ref_pic_buf_id);
560*c83a76b0SSuyog Pawar i1_nbr_l1_ref_pic_buf_id = (ps_nbr_4x4->mv.i1_l1_ref_pic_buf_id);
561*c83a76b0SSuyog Pawar
562*c83a76b0SSuyog Pawar /* Number of motion vectors used */
563*c83a76b0SSuyog Pawar nbr_mv_no = nbr_pred_l0_flag + ps_nbr_4x4->b1_pred_l1_flag;
564*c83a76b0SSuyog Pawar
565*c83a76b0SSuyog Pawar /* If diff. no. of motion vectors used */
566*c83a76b0SSuyog Pawar if(cur_mv_no != nbr_mv_no)
567*c83a76b0SSuyog Pawar {
568*c83a76b0SSuyog Pawar bs_flag = 1;
569*c83a76b0SSuyog Pawar }
570*c83a76b0SSuyog Pawar /* If One motion vector is used */
571*c83a76b0SSuyog Pawar else if(1 == cur_mv_no)
572*c83a76b0SSuyog Pawar {
573*c83a76b0SSuyog Pawar WORD16 i2_mv_x, i2_mv_y;
574*c83a76b0SSuyog Pawar
575*c83a76b0SSuyog Pawar if(cur_pred_l0_flag)
576*c83a76b0SSuyog Pawar { /* L0 used for cur. */
577*c83a76b0SSuyog Pawar if(nbr_pred_l0_flag)
578*c83a76b0SSuyog Pawar { /* L0 used for nbr. */
579*c83a76b0SSuyog Pawar if(i1_cur_l0_ref_pic_buf_id != i1_nbr_l0_ref_pic_buf_id)
580*c83a76b0SSuyog Pawar {
581*c83a76b0SSuyog Pawar /* reference pictures used are different */
582*c83a76b0SSuyog Pawar bs_flag = 1;
583*c83a76b0SSuyog Pawar }
584*c83a76b0SSuyog Pawar }
585*c83a76b0SSuyog Pawar else
586*c83a76b0SSuyog Pawar { /* L1 used for nbr. */
587*c83a76b0SSuyog Pawar if(i1_cur_l0_ref_pic_buf_id != i1_nbr_l1_ref_pic_buf_id)
588*c83a76b0SSuyog Pawar {
589*c83a76b0SSuyog Pawar /* reference pictures used are different */
590*c83a76b0SSuyog Pawar bs_flag = 1;
591*c83a76b0SSuyog Pawar }
592*c83a76b0SSuyog Pawar }
593*c83a76b0SSuyog Pawar if(!bs_flag)
594*c83a76b0SSuyog Pawar {
595*c83a76b0SSuyog Pawar i2_mv_x = i2_mv_x0;
596*c83a76b0SSuyog Pawar i2_mv_y = i2_mv_y0;
597*c83a76b0SSuyog Pawar }
598*c83a76b0SSuyog Pawar }
599*c83a76b0SSuyog Pawar else
600*c83a76b0SSuyog Pawar { /* L1 used for cur. */
601*c83a76b0SSuyog Pawar if(nbr_pred_l0_flag)
602*c83a76b0SSuyog Pawar { /* L0 used for nbr. */
603*c83a76b0SSuyog Pawar if(i1_cur_l1_ref_pic_buf_id != i1_nbr_l0_ref_pic_buf_id)
604*c83a76b0SSuyog Pawar {
605*c83a76b0SSuyog Pawar /* reference pictures used are different */
606*c83a76b0SSuyog Pawar bs_flag = 1;
607*c83a76b0SSuyog Pawar }
608*c83a76b0SSuyog Pawar }
609*c83a76b0SSuyog Pawar else
610*c83a76b0SSuyog Pawar { /* L1 used for nbr. */
611*c83a76b0SSuyog Pawar if(i1_cur_l1_ref_pic_buf_id != i1_nbr_l1_ref_pic_buf_id)
612*c83a76b0SSuyog Pawar {
613*c83a76b0SSuyog Pawar /* reference pictures used are different */
614*c83a76b0SSuyog Pawar bs_flag = 1;
615*c83a76b0SSuyog Pawar }
616*c83a76b0SSuyog Pawar }
617*c83a76b0SSuyog Pawar if(!bs_flag)
618*c83a76b0SSuyog Pawar {
619*c83a76b0SSuyog Pawar i2_mv_x = i2_mv_x1;
620*c83a76b0SSuyog Pawar i2_mv_y = i2_mv_y1;
621*c83a76b0SSuyog Pawar }
622*c83a76b0SSuyog Pawar }
623*c83a76b0SSuyog Pawar
624*c83a76b0SSuyog Pawar if(!bs_flag)
625*c83a76b0SSuyog Pawar {
626*c83a76b0SSuyog Pawar WORD16 i2_nbr_mv_x, i2_nbr_mv_y;
627*c83a76b0SSuyog Pawar
628*c83a76b0SSuyog Pawar if(nbr_pred_l0_flag)
629*c83a76b0SSuyog Pawar {
630*c83a76b0SSuyog Pawar i2_nbr_mv_x = ps_nbr_4x4->mv.s_l0_mv.i2_mvx;
631*c83a76b0SSuyog Pawar i2_nbr_mv_y = ps_nbr_4x4->mv.s_l0_mv.i2_mvy;
632*c83a76b0SSuyog Pawar }
633*c83a76b0SSuyog Pawar else
634*c83a76b0SSuyog Pawar {
635*c83a76b0SSuyog Pawar i2_nbr_mv_x = ps_nbr_4x4->mv.s_l1_mv.i2_mvx;
636*c83a76b0SSuyog Pawar i2_nbr_mv_y = ps_nbr_4x4->mv.s_l1_mv.i2_mvy;
637*c83a76b0SSuyog Pawar }
638*c83a76b0SSuyog Pawar // clang-format off
639*c83a76b0SSuyog Pawar bs_flag =
640*c83a76b0SSuyog Pawar (abs(i2_mv_x - i2_nbr_mv_x) < 4) &&
641*c83a76b0SSuyog Pawar (abs(i2_mv_y - i2_nbr_mv_y) < 4)
642*c83a76b0SSuyog Pawar ? 0
643*c83a76b0SSuyog Pawar : 1;
644*c83a76b0SSuyog Pawar // clang-format on
645*c83a76b0SSuyog Pawar }
646*c83a76b0SSuyog Pawar }
647*c83a76b0SSuyog Pawar /* If two motion vectors are used */
648*c83a76b0SSuyog Pawar else if(2 == cur_mv_no)
649*c83a76b0SSuyog Pawar {
650*c83a76b0SSuyog Pawar /* check whether same reference pictures used */
651*c83a76b0SSuyog Pawar if((i1_cur_l0_ref_pic_buf_id == i1_nbr_l0_ref_pic_buf_id &&
652*c83a76b0SSuyog Pawar i1_cur_l1_ref_pic_buf_id == i1_nbr_l1_ref_pic_buf_id) ||
653*c83a76b0SSuyog Pawar (i1_cur_l0_ref_pic_buf_id == i1_nbr_l1_ref_pic_buf_id &&
654*c83a76b0SSuyog Pawar i1_cur_l1_ref_pic_buf_id == i1_nbr_l0_ref_pic_buf_id))
655*c83a76b0SSuyog Pawar {
656*c83a76b0SSuyog Pawar WORD16 i2_nbr_mv_x0, i2_nbr_mv_y0, i2_nbr_mv_x1, i2_nbr_mv_y1;
657*c83a76b0SSuyog Pawar
658*c83a76b0SSuyog Pawar /* x and y mv for L0 and L1, for nbr. csb*/
659*c83a76b0SSuyog Pawar i2_nbr_mv_x0 = ps_nbr_4x4->mv.s_l0_mv.i2_mvx;
660*c83a76b0SSuyog Pawar i2_nbr_mv_y0 = ps_nbr_4x4->mv.s_l0_mv.i2_mvy;
661*c83a76b0SSuyog Pawar i2_nbr_mv_x1 = ps_nbr_4x4->mv.s_l1_mv.i2_mvx;
662*c83a76b0SSuyog Pawar i2_nbr_mv_y1 = ps_nbr_4x4->mv.s_l1_mv.i2_mvy;
663*c83a76b0SSuyog Pawar
664*c83a76b0SSuyog Pawar /* Different L0 and L1 */
665*c83a76b0SSuyog Pawar if(i1_cur_l0_ref_pic_buf_id != i1_cur_l1_ref_pic_buf_id)
666*c83a76b0SSuyog Pawar {
667*c83a76b0SSuyog Pawar if(i1_cur_l0_ref_pic_buf_id == i1_nbr_l0_ref_pic_buf_id)
668*c83a76b0SSuyog Pawar {
669*c83a76b0SSuyog Pawar // clang-format off
670*c83a76b0SSuyog Pawar bs_flag =
671*c83a76b0SSuyog Pawar (abs(i2_mv_x0 - i2_nbr_mv_x0) < 4) &&
672*c83a76b0SSuyog Pawar (abs(i2_mv_y0 - i2_nbr_mv_y0) < 4) &&
673*c83a76b0SSuyog Pawar (abs(i2_mv_x1 - i2_nbr_mv_x1) < 4) &&
674*c83a76b0SSuyog Pawar (abs(i2_mv_y1 - i2_nbr_mv_y1) < 4)
675*c83a76b0SSuyog Pawar ? 0
676*c83a76b0SSuyog Pawar : 1;
677*c83a76b0SSuyog Pawar // clang-format on
678*c83a76b0SSuyog Pawar }
679*c83a76b0SSuyog Pawar else
680*c83a76b0SSuyog Pawar {
681*c83a76b0SSuyog Pawar // clang-format off
682*c83a76b0SSuyog Pawar bs_flag =
683*c83a76b0SSuyog Pawar (abs(i2_mv_x0 - i2_nbr_mv_x1) < 4) &&
684*c83a76b0SSuyog Pawar (abs(i2_mv_y0 - i2_nbr_mv_y1) < 4) &&
685*c83a76b0SSuyog Pawar (abs(i2_mv_x1 - i2_nbr_mv_x0) < 4) &&
686*c83a76b0SSuyog Pawar (abs(i2_mv_y1 - i2_nbr_mv_y0) < 4)
687*c83a76b0SSuyog Pawar ? 0
688*c83a76b0SSuyog Pawar : 1;
689*c83a76b0SSuyog Pawar // clang-format on
690*c83a76b0SSuyog Pawar }
691*c83a76b0SSuyog Pawar }
692*c83a76b0SSuyog Pawar else /* Same L0 and L1 */
693*c83a76b0SSuyog Pawar {
694*c83a76b0SSuyog Pawar // clang-format off
695*c83a76b0SSuyog Pawar bs_flag =
696*c83a76b0SSuyog Pawar ((abs(i2_mv_x0 - i2_nbr_mv_x0) >= 4) ||
697*c83a76b0SSuyog Pawar (abs(i2_mv_y0 - i2_nbr_mv_y0) >= 4) ||
698*c83a76b0SSuyog Pawar (abs(i2_mv_x1 - i2_nbr_mv_x1) >= 4) ||
699*c83a76b0SSuyog Pawar (abs(i2_mv_y1 - i2_nbr_mv_y1) >= 4)) &&
700*c83a76b0SSuyog Pawar ((abs(i2_mv_x0 - i2_nbr_mv_x1) >= 4) ||
701*c83a76b0SSuyog Pawar (abs(i2_mv_y0 - i2_nbr_mv_y1) >= 4) ||
702*c83a76b0SSuyog Pawar (abs(i2_mv_x1 - i2_nbr_mv_x0) >= 4) ||
703*c83a76b0SSuyog Pawar (abs(i2_mv_y1 - i2_nbr_mv_y0) >= 4))
704*c83a76b0SSuyog Pawar ? 1
705*c83a76b0SSuyog Pawar : 0;
706*c83a76b0SSuyog Pawar // clang-format on
707*c83a76b0SSuyog Pawar }
708*c83a76b0SSuyog Pawar }
709*c83a76b0SSuyog Pawar else /* If the reference pictures used are different */
710*c83a76b0SSuyog Pawar {
711*c83a76b0SSuyog Pawar bs_flag = 1;
712*c83a76b0SSuyog Pawar }
713*c83a76b0SSuyog Pawar }
714*c83a76b0SSuyog Pawar
715*c83a76b0SSuyog Pawar if(bs_flag)
716*c83a76b0SSuyog Pawar { /*Storing if BS set due to PU mvs */
717*c83a76b0SSuyog Pawar /*Storing in BigEnd. format. BS[0]|BS[1]| .. |BS[15] & edge_size is 4*/
718*c83a76b0SSuyog Pawar SET_VALUE_BIG((pu4_pu_cur_edge), BS_CBF_4, (pu_pos_bit_calc + j), 4);
719*c83a76b0SSuyog Pawar }
720*c83a76b0SSuyog Pawar }
721*c83a76b0SSuyog Pawar
722*c83a76b0SSuyog Pawar /* increment the neighbour */
723*c83a76b0SSuyog Pawar ps_nbr_4x4 += nbr_inc;
724*c83a76b0SSuyog Pawar }
725*c83a76b0SSuyog Pawar }
726*c83a76b0SSuyog Pawar }
727*c83a76b0SSuyog Pawar /* point to the next PU */
728*c83a76b0SSuyog Pawar ps_pu++;
729*c83a76b0SSuyog Pawar }
730*c83a76b0SSuyog Pawar }
731*c83a76b0SSuyog Pawar
732*c83a76b0SSuyog Pawar /**
733*c83a76b0SSuyog Pawar *******************************************************************************
734*c83a76b0SSuyog Pawar *
735*c83a76b0SSuyog Pawar * @brief Clear the invalid Boundary Strength which may be set by
736*c83a76b0SSuyog Pawar * ihevce_bs_compute_cu
737*c83a76b0SSuyog Pawar *
738*c83a76b0SSuyog Pawar * @par Description
739*c83a76b0SSuyog Pawar * Clear the invalid Boundary Strength which may be set by ihevce_bs_compute_cu
740*c83a76b0SSuyog Pawar * (as it does all 4 edges in a shot for some cases)
741*c83a76b0SSuyog Pawar *
742*c83a76b0SSuyog Pawar * @param[out] ps_deblk_prms
743*c83a76b0SSuyog Pawar * Pointer to structure s_deblk_prms, which contains
744*c83a76b0SSuyog Pawar * s_deblk_prms.au4_horz_bs : max of 8 such conti. bs to be comp. for 64x64 ctb
745*c83a76b0SSuyog Pawar * s_deblk_prms.au4_vert_bs : max of 8 such conti. bs to be comp. for 64x64 ctb
746*c83a76b0SSuyog Pawar *
747*c83a76b0SSuyog Pawar * @param[in] last_ctb_row_flag
748*c83a76b0SSuyog Pawar * Flag for checking whether the current CTB is in last ctb_row
749*c83a76b0SSuyog Pawar *
750*c83a76b0SSuyog Pawar * @param[in] last_ctb_in_row_flag
751*c83a76b0SSuyog Pawar * Flag for checking whether the current CTB is the last in current row
752*c83a76b0SSuyog Pawar *
753*c83a76b0SSuyog Pawar * @param[in] last_hz_ctb_wd
754*c83a76b0SSuyog Pawar * Valid Width (pixels) in the last CTB in every row (padding cases)
755*c83a76b0SSuyog Pawar *
756*c83a76b0SSuyog Pawar * @param[in] last_vt_ctb_ht
757*c83a76b0SSuyog Pawar * Valid Height (pixels) in the last CTB row (padding cases)
758*c83a76b0SSuyog Pawar *
759*c83a76b0SSuyog Pawar * @returns none
760*c83a76b0SSuyog Pawar *
761*c83a76b0SSuyog Pawar * @remarks
762*c83a76b0SSuyog Pawar *
763*c83a76b0SSuyog Pawar *******************************************************************************
764*c83a76b0SSuyog Pawar */
ihevce_bs_clear_invalid(deblk_bs_ctb_ctxt_t * ps_deblk_prms,WORD32 last_ctb_row_flag,WORD32 last_ctb_in_row_flag,WORD32 last_hz_ctb_wd,WORD32 last_vt_ctb_ht)765*c83a76b0SSuyog Pawar void ihevce_bs_clear_invalid(
766*c83a76b0SSuyog Pawar deblk_bs_ctb_ctxt_t *ps_deblk_prms,
767*c83a76b0SSuyog Pawar WORD32 last_ctb_row_flag,
768*c83a76b0SSuyog Pawar WORD32 last_ctb_in_row_flag,
769*c83a76b0SSuyog Pawar WORD32 last_hz_ctb_wd,
770*c83a76b0SSuyog Pawar WORD32 last_vt_ctb_ht)
771*c83a76b0SSuyog Pawar {
772*c83a76b0SSuyog Pawar /* Rightmost CTB. Right padding may be there */
773*c83a76b0SSuyog Pawar /* clear the last vert BS which might have set by ihevce_bs_compute_cu */
774*c83a76b0SSuyog Pawar if(1 == last_ctb_in_row_flag)
775*c83a76b0SSuyog Pawar {
776*c83a76b0SSuyog Pawar ps_deblk_prms->au4_vert_bs[last_hz_ctb_wd >> 3] = 0;
777*c83a76b0SSuyog Pawar }
778*c83a76b0SSuyog Pawar
779*c83a76b0SSuyog Pawar /* Bottommost CTB. Bottom padding may be there */
780*c83a76b0SSuyog Pawar /* clear the last horz BS which might have set by ihevce_bs_compute_cu */
781*c83a76b0SSuyog Pawar if(1 == last_ctb_row_flag)
782*c83a76b0SSuyog Pawar {
783*c83a76b0SSuyog Pawar ps_deblk_prms->au4_horz_bs[last_vt_ctb_ht >> 3] = 0;
784*c83a76b0SSuyog Pawar }
785*c83a76b0SSuyog Pawar }
786