1*c83a76b0SSuyog Pawar /******************************************************************************
2*c83a76b0SSuyog Pawar *
3*c83a76b0SSuyog Pawar * Copyright (C) 2012 Ittiam Systems Pvt Ltd, Bangalore
4*c83a76b0SSuyog Pawar *
5*c83a76b0SSuyog Pawar * Licensed under the Apache License, Version 2.0 (the "License");
6*c83a76b0SSuyog Pawar * you may not use this file except in compliance with the License.
7*c83a76b0SSuyog Pawar * You may obtain a copy of the License at:
8*c83a76b0SSuyog Pawar *
9*c83a76b0SSuyog Pawar * http://www.apache.org/licenses/LICENSE-2.0
10*c83a76b0SSuyog Pawar *
11*c83a76b0SSuyog Pawar * Unless required by applicable law or agreed to in writing, software
12*c83a76b0SSuyog Pawar * distributed under the License is distributed on an "AS IS" BASIS,
13*c83a76b0SSuyog Pawar * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14*c83a76b0SSuyog Pawar * See the License for the specific language governing permissions and
15*c83a76b0SSuyog Pawar * limitations under the License.
16*c83a76b0SSuyog Pawar *
17*c83a76b0SSuyog Pawar ******************************************************************************/
18*c83a76b0SSuyog Pawar /**
19*c83a76b0SSuyog Pawar *******************************************************************************
20*c83a76b0SSuyog Pawar * @file
21*c83a76b0SSuyog Pawar * ihevcd_mv_merge.c
22*c83a76b0SSuyog Pawar *
23*c83a76b0SSuyog Pawar * @brief
24*c83a76b0SSuyog Pawar * Contains functions for motion vector merge candidates derivation
25*c83a76b0SSuyog Pawar *
26*c83a76b0SSuyog Pawar * @author
27*c83a76b0SSuyog Pawar * Ittiam
28*c83a76b0SSuyog Pawar *
29*c83a76b0SSuyog Pawar * @par List of Functions:
30*c83a76b0SSuyog Pawar * - ihevcd_compare_pu_t()
31*c83a76b0SSuyog Pawar * - ihevcd_collocated_mvp(), ihevcd_mv_merge()
32*c83a76b0SSuyog Pawar *
33*c83a76b0SSuyog Pawar * @remarks
34*c83a76b0SSuyog Pawar * None
35*c83a76b0SSuyog Pawar *
36*c83a76b0SSuyog Pawar *******************************************************************************
37*c83a76b0SSuyog Pawar */
38*c83a76b0SSuyog Pawar /*****************************************************************************/
39*c83a76b0SSuyog Pawar /* File Includes */
40*c83a76b0SSuyog Pawar /*****************************************************************************/
41*c83a76b0SSuyog Pawar #include <stdio.h>
42*c83a76b0SSuyog Pawar #include <stddef.h>
43*c83a76b0SSuyog Pawar #include <stdlib.h>
44*c83a76b0SSuyog Pawar #include <string.h>
45*c83a76b0SSuyog Pawar
46*c83a76b0SSuyog Pawar #include "ihevc_typedefs.h"
47*c83a76b0SSuyog Pawar #include "iv.h"
48*c83a76b0SSuyog Pawar #include "ivd.h"
49*c83a76b0SSuyog Pawar #include "ihevcd_cxa.h"
50*c83a76b0SSuyog Pawar #include "ithread.h"
51*c83a76b0SSuyog Pawar
52*c83a76b0SSuyog Pawar #include "ihevc_defs.h"
53*c83a76b0SSuyog Pawar #include "ihevc_debug.h"
54*c83a76b0SSuyog Pawar #include "ihevc_structs.h"
55*c83a76b0SSuyog Pawar #include "ihevc_macros.h"
56*c83a76b0SSuyog Pawar #include "ihevc_platform_macros.h"
57*c83a76b0SSuyog Pawar #include "ihevc_cabac_tables.h"
58*c83a76b0SSuyog Pawar #include "ihevc_disp_mgr.h"
59*c83a76b0SSuyog Pawar #include "ihevc_buf_mgr.h"
60*c83a76b0SSuyog Pawar #include "ihevc_dpb_mgr.h"
61*c83a76b0SSuyog Pawar
62*c83a76b0SSuyog Pawar #include "ihevcd_defs.h"
63*c83a76b0SSuyog Pawar #include "ihevcd_function_selector.h"
64*c83a76b0SSuyog Pawar #include "ihevcd_structs.h"
65*c83a76b0SSuyog Pawar #include "ihevcd_error.h"
66*c83a76b0SSuyog Pawar #include "ihevcd_nal.h"
67*c83a76b0SSuyog Pawar #include "ihevcd_bitstream.h"
68*c83a76b0SSuyog Pawar #include "ihevcd_fmt_conv.h"
69*c83a76b0SSuyog Pawar #include "ihevcd_job_queue.h"
70*c83a76b0SSuyog Pawar #include "ihevcd_debug.h"
71*c83a76b0SSuyog Pawar #include "ihevcd_mv_merge.h"
72*c83a76b0SSuyog Pawar /**
73*c83a76b0SSuyog Pawar *******************************************************************************
74*c83a76b0SSuyog Pawar *
75*c83a76b0SSuyog Pawar * @brief Compare Motion vectors function
76*c83a76b0SSuyog Pawar *
77*c83a76b0SSuyog Pawar *
78*c83a76b0SSuyog Pawar * @par Description:
79*c83a76b0SSuyog Pawar * Checks if MVs and Reference idx are excatly matching.
80*c83a76b0SSuyog Pawar *
81*c83a76b0SSuyog Pawar * @param[inout] ps_1
82*c83a76b0SSuyog Pawar * motion vector 1 to be compared
83*c83a76b0SSuyog Pawar *
84*c83a76b0SSuyog Pawar * @param[in] ps_2
85*c83a76b0SSuyog Pawar * motion vector 2 to be compared
86*c83a76b0SSuyog Pawar *
87*c83a76b0SSuyog Pawar * @returns
88*c83a76b0SSuyog Pawar * 0 : if not matching 1 : if matching
89*c83a76b0SSuyog Pawar *
90*c83a76b0SSuyog Pawar * @remarks
91*c83a76b0SSuyog Pawar *
92*c83a76b0SSuyog Pawar *******************************************************************************
93*c83a76b0SSuyog Pawar */
ihevcd_compare_pu_t(pu_t * ps_pu_1,pu_t * ps_pu_2)94*c83a76b0SSuyog Pawar WORD32 ihevcd_compare_pu_t(pu_t *ps_pu_1, pu_t *ps_pu_2)
95*c83a76b0SSuyog Pawar {
96*c83a76b0SSuyog Pawar WORD32 l0_match = 0, l1_match = 0;
97*c83a76b0SSuyog Pawar pu_mv_t *ps_mv_1, *ps_mv_2;
98*c83a76b0SSuyog Pawar WORD32 pred_mode_1, pred_mode_2;
99*c83a76b0SSuyog Pawar
100*c83a76b0SSuyog Pawar ps_mv_1 = &ps_pu_1->mv;
101*c83a76b0SSuyog Pawar ps_mv_2 = &ps_pu_2->mv;
102*c83a76b0SSuyog Pawar
103*c83a76b0SSuyog Pawar pred_mode_1 = ps_pu_1->b2_pred_mode;
104*c83a76b0SSuyog Pawar pred_mode_2 = ps_pu_2->b2_pred_mode;
105*c83a76b0SSuyog Pawar
106*c83a76b0SSuyog Pawar if(pred_mode_1 == pred_mode_2)
107*c83a76b0SSuyog Pawar {
108*c83a76b0SSuyog Pawar if(pred_mode_1 != PRED_L1)
109*c83a76b0SSuyog Pawar {
110*c83a76b0SSuyog Pawar if(ps_mv_1->i1_l0_ref_idx == ps_mv_2->i1_l0_ref_idx)
111*c83a76b0SSuyog Pawar {
112*c83a76b0SSuyog Pawar if(0 == memcmp(&ps_mv_1->s_l0_mv, &ps_mv_2->s_l0_mv, sizeof(mv_t)))
113*c83a76b0SSuyog Pawar {
114*c83a76b0SSuyog Pawar l0_match = 1;
115*c83a76b0SSuyog Pawar }
116*c83a76b0SSuyog Pawar }
117*c83a76b0SSuyog Pawar }
118*c83a76b0SSuyog Pawar if(pred_mode_1 != PRED_L0)
119*c83a76b0SSuyog Pawar {
120*c83a76b0SSuyog Pawar if(ps_mv_1->i1_l1_ref_idx == ps_mv_2->i1_l1_ref_idx)
121*c83a76b0SSuyog Pawar {
122*c83a76b0SSuyog Pawar if(0 == memcmp(&ps_mv_1->s_l1_mv, &ps_mv_2->s_l1_mv, sizeof(mv_t)))
123*c83a76b0SSuyog Pawar {
124*c83a76b0SSuyog Pawar l1_match = 1;
125*c83a76b0SSuyog Pawar }
126*c83a76b0SSuyog Pawar }
127*c83a76b0SSuyog Pawar }
128*c83a76b0SSuyog Pawar if(pred_mode_1 == PRED_BI)
129*c83a76b0SSuyog Pawar return (l1_match && l0_match);
130*c83a76b0SSuyog Pawar else if(pred_mode_1 == PRED_L0)
131*c83a76b0SSuyog Pawar return l0_match;
132*c83a76b0SSuyog Pawar else
133*c83a76b0SSuyog Pawar return l1_match;
134*c83a76b0SSuyog Pawar }
135*c83a76b0SSuyog Pawar
136*c83a76b0SSuyog Pawar return 0;
137*c83a76b0SSuyog Pawar }
138*c83a76b0SSuyog Pawar
/**
*******************************************************************************
*
* @brief
*  Derives the collocated (temporal) motion vector candidates for a PU
*
* @par Description:
*  Looks up the PU that covers (x_col, y_col) in the MV buffer of the
*  collocated picture, selects which of its L0/L1 motion data to use and
*  produces one candidate per reference list of the current slice. A
*  candidate is scaled with ihevcd_scale_collocated_mv() when the POC
*  distances of the current and the collocated PU differ and neither
*  reference is long term.
*
*  The candidate is reported unavailable (flags and MVs set to zero) when
*  temporal MVP is disabled for the slice, when no collocated MV buffer is
*  present, when the collocated position is in a different CTB row or
*  outside the picture, or when the collocated PU is intra coded.
*
* @param[in] ps_mv_ctxt
*  MV prediction context; SPS, slice header and current CTB position are read
*
* @param[in] ps_pu
*  Current PU; b4_pos_y and, if use_pu_ref_idx is set, its reference indices
*  are read
*
* @param[out] ps_mv_col
*  Array of two MVs, [0] for L0 and [1] for L1. Entry [1] is left untouched
*  for non-B slices when a collocated PU was found.
*
* @param[out] pu4_avail_col_flag
*  Array of two availability flags, [0] for L0 and [1] for L1
*
* @param[in] use_pu_ref_idx
*  Non-zero : target reference indices are taken from ps_pu
*  Zero     : reference index 0 is used for both lists
*
* @param[in] x_col
*  Horizontal collocated position in luma samples relative to the current
*  CTB origin
*
* @param[in] y_col
*  Vertical collocated position in luma samples relative to the current
*  CTB origin
*
* @returns
*  None
*
* @remarks
*  The slice level temporal MVP flag is evaluated before the collocated MV
*  buffer is selected, so the buffer is never dereferenced when temporal MVP
*  is disabled.
*
*******************************************************************************
*/
void ihevcd_collocated_mvp(mv_ctxt_t *ps_mv_ctxt,
                           pu_t *ps_pu,
                           mv_t *ps_mv_col,
                           WORD32 *pu4_avail_col_flag,
                           WORD32 use_pu_ref_idx,
                           WORD32 x_col,
                           WORD32 y_col)
{
    sps_t *ps_sps = ps_mv_ctxt->ps_sps;
    slice_header_t *ps_slice_hdr = ps_mv_ctxt->ps_slice_hdr;
    ref_list_t *ps_ref_list[2];
    mv_buf_t *ps_mv_buf_col = NULL;
    pu_t *ps_col_pu = NULL;
    mv_t as_mv_col[2];
    WORD32 au4_list_col[2];
    WORD32 au4_ref_idx_col[2];
    WORD32 ai4_cur_ref_idx[2];
    WORD32 log2_ctb_size = ps_sps->i1_log2_ctb_size;
    WORD32 ctb_size = (1 << log2_ctb_size);
    WORD32 num_minpu_in_ctb_row = ctb_size / MIN_PU_SIZE;
    WORD32 part_pos_y = ps_pu->b4_pos_y << 2;
    WORD32 col_ctb_x = 0, col_ctb_y = 0;
    WORD32 col_poc, cur_poc;
    WORD32 slice_idx;
    WORD32 num_lists;
    WORD32 lx;

    /* Initializing reference list; P slices use list 0 for both entries */
    ps_ref_list[0] = ps_slice_hdr->as_ref_pic_list0;
    ps_ref_list[1] = ps_slice_hdr->as_ref_pic_list1;
    if(PSLICE == ps_slice_hdr->i1_slice_type)
        ps_ref_list[1] = ps_slice_hdr->as_ref_pic_list0;

    /* Pick the collocated picture's MV buffer only when temporal MVP is */
    /* enabled; otherwise the buffer stays NULL and is never accessed    */
    if(0 != ps_slice_hdr->i1_slice_temporal_mvp_enable_flag)
    {
        WORD32 col_pic_list = 0; /* L0 */

        if((ps_slice_hdr->i1_slice_type == BSLICE) && (ps_slice_hdr->i1_collocated_from_l0_flag == 0))
            col_pic_list = 1; /* L1 */

        ps_mv_buf_col = (mv_buf_t *)ps_ref_list[col_pic_list][ps_slice_hdr->i1_collocated_ref_idx].pv_mv_buf;
    }

    /* The collocated position must be in the same CTB row as the current */
    /* PU and must lie inside the picture                                 */
    if((NULL != ps_mv_buf_col)
                    && ((part_pos_y >> log2_ctb_size) == (y_col >> log2_ctb_size))
                    && ((x_col + (ps_mv_ctxt->i4_ctb_x << log2_ctb_size)) < ps_sps->i2_pic_width_in_luma_samples)
                    && ((y_col + (ps_mv_ctxt->i4_ctb_y << log2_ctb_size)) < ps_sps->i2_pic_height_in_luma_samples))
    {
        /* Clear the low 4 bits: motion data is looked up on a 16x16 grid */
        WORD32 xp_col = ((x_col >> 4) << 4);
        WORD32 yp_col = ((y_col >> 4) << 4);
        WORD32 col_ctb_idx;
        WORD32 pu_cnt;
        UWORD8 *pu1_pic_pu_map_ctb;

        col_ctb_x = ps_mv_ctxt->i4_ctb_x + (xp_col >> log2_ctb_size);
        col_ctb_y = ps_mv_ctxt->i4_ctb_y + (yp_col >> log2_ctb_size);
        col_ctb_idx = col_ctb_x + (col_ctb_y) * (ps_sps->i2_pic_wd_in_ctb);

        pu_cnt = ps_mv_buf_col->pu4_pic_pu_idx[col_ctb_idx];
        pu1_pic_pu_map_ctb = ps_mv_buf_col->pu1_pic_pu_map
                        + col_ctb_idx * (num_minpu_in_ctb_row * num_minpu_in_ctb_row);

        /* Position falls in the CTB to the right (already reflected in */
        /* col_ctb_x), so the offset inside that CTB wraps to zero      */
        if(xp_col == ctb_size)
            xp_col = 0;

        pu_cnt += pu1_pic_pu_map_ctb[(yp_col >> 2) * num_minpu_in_ctb_row + (xp_col >> 2)];
        ps_col_pu = &ps_mv_buf_col->ps_pic_pu[pu_cnt];
    }

    /* No usable collocated PU: report both candidates as unavailable */
    if((NULL == ps_col_pu) || (ps_col_pu->b1_intra_flag == 1))
    {
        pu4_avail_col_flag[0] = 0;
        pu4_avail_col_flag[1] = 0;
        ps_mv_col[0].i2_mvx = 0;
        ps_mv_col[0].i2_mvy = 0;
        ps_mv_col[1].i2_mvx = 0;
        ps_mv_col[1].i2_mvy = 0;
        return;
    }

    /* Decide which list of the collocated PU feeds each output candidate */
    if(ps_col_pu->b2_pred_mode == PRED_L1)
    {
        /* Collocated PU has no L0 data */
        au4_list_col[0] = 1; /* L1 */
        au4_list_col[1] = 1; /* L1 */
    }
    else if(ps_col_pu->b2_pred_mode == PRED_L0)
    {
        /* Collocated PU has no L1 data */
        au4_list_col[0] = 0; /* L0 */
        au4_list_col[1] = 0; /* L0 */
    }
    else if(1 == ps_slice_hdr->i1_low_delay_flag)
    {
        /* Bi-predicted, low delay: each list uses its own data */
        au4_list_col[0] = 0; /* L0 */
        au4_list_col[1] = 1; /* L1 */
    }
    else
    {
        /* Bi-predicted, not low delay: both candidates use the list */
        /* numbered by collocated_from_l0_flag                       */
        au4_list_col[0] = ps_slice_hdr->i1_collocated_from_l0_flag;
        au4_list_col[1] = ps_slice_hdr->i1_collocated_from_l0_flag;
    }

    for(lx = 0; lx < 2; lx++)
    {
        if(au4_list_col[lx] == 0)
        {
            as_mv_col[lx] = ps_col_pu->mv.s_l0_mv;
            au4_ref_idx_col[lx] = ps_col_pu->mv.i1_l0_ref_idx;
        }
        else
        {
            as_mv_col[lx] = ps_col_pu->mv.s_l1_mv;
            au4_ref_idx_col[lx] = ps_col_pu->mv.i1_l1_ref_idx;
        }
    }

    /* Reference indices of the current PU the candidates are derived for */
    if(use_pu_ref_idx)
    {
        ai4_cur_ref_idx[0] = ps_pu->mv.i1_l0_ref_idx;
        ai4_cur_ref_idx[1] = ps_pu->mv.i1_l1_ref_idx;
    }
    else
    {
        ai4_cur_ref_idx[0] = 0;
        ai4_cur_ref_idx[1] = 0;
    }

    col_poc = ps_mv_buf_col->i4_abs_poc;
    cur_poc = ps_slice_hdr->i4_abs_pic_order_cnt;

    /* Slice that the collocated CTB belonged to; masked so it always */
    /* indexes inside the per-slice POC tables                        */
    slice_idx = *(ps_mv_buf_col->pu1_pic_slice_map + col_ctb_x + col_ctb_y * ps_sps->i2_pic_wd_in_ctb);
    slice_idx &= (MAX_SLICE_HDR_CNT - 1);

    /* The L1 candidate is derived for B slices only */
    num_lists = (BSLICE == ps_slice_hdr->i1_slice_type) ? 2 : 1;

    for(lx = 0; lx < num_lists; lx++)
    {
        WORD32 col_ref_poc, col_ref_poc_lt;
        WORD32 cur_ref_poc, cur_ref_poc_lt;
        pic_buf_t *ps_pic_buf;

        /* POC and long term status of the picture the collocated MV refers to */
        if(au4_list_col[lx] == 0)
        {
            col_ref_poc =
                            ps_mv_buf_col->ai4_l0_collocated_poc[slice_idx][au4_ref_idx_col[lx]];
            col_ref_poc_lt =
                            (ps_mv_buf_col->ai1_l0_collocated_poc_lt[slice_idx][au4_ref_idx_col[lx]] == LONG_TERM_REF);
        }
        else
        {
            col_ref_poc =
                            ps_mv_buf_col->ai4_l1_collocated_poc[slice_idx][au4_ref_idx_col[lx]];
            col_ref_poc_lt =
                            (ps_mv_buf_col->ai1_l1_collocated_poc_lt[slice_idx][au4_ref_idx_col[lx]] == LONG_TERM_REF);
        }

        /* POC and long term status of the current PU's reference picture */
        ps_pic_buf = (pic_buf_t *)((ps_ref_list[lx][ai4_cur_ref_idx[lx]].pv_pic_buf));
        cur_ref_poc = ps_pic_buf->i4_abs_poc;
        cur_ref_poc_lt = (ps_pic_buf->u1_used_as_ref == LONG_TERM_REF);

        /* Long term / short term mismatch makes the candidate unavailable */
        if(cur_ref_poc_lt != col_ref_poc_lt)
        {
            pu4_avail_col_flag[lx] = 0;
            ps_mv_col[lx].i2_mvx = 0;
            ps_mv_col[lx].i2_mvy = 0;
            continue;
        }

        pu4_avail_col_flag[lx] = 1;
        ps_mv_col[lx] = as_mv_col[lx];

        /* Scale only for short term references with differing POC      */
        /* distances; skipped when the collocated POC distance is zero  */
        if((!cur_ref_poc_lt)
                        && ((col_poc - col_ref_poc) != (cur_poc - cur_ref_poc))
                        && (col_ref_poc != col_poc))
        {
            ihevcd_scale_collocated_mv(&ps_mv_col[lx], cur_ref_poc,
                                       col_ref_poc, col_poc, cur_poc);
        }
    }

    if(num_lists < 2)
    {
        pu4_avail_col_flag[1] = 0;
    }
}
408*c83a76b0SSuyog Pawar
409*c83a76b0SSuyog Pawar
410*c83a76b0SSuyog Pawar /**
411*c83a76b0SSuyog Pawar *******************************************************************************
412*c83a76b0SSuyog Pawar *
413*c83a76b0SSuyog Pawar * @brief
414*c83a76b0SSuyog Pawar * This function performs Motion Vector Merge candidates derivation
415*c83a76b0SSuyog Pawar *
416*c83a76b0SSuyog Pawar * @par Description:
417*c83a76b0SSuyog Pawar * MV merge list is computed using neighbor mvs and colocated mv
418*c83a76b0SSuyog Pawar *
419*c83a76b0SSuyog Pawar * @param[in] ps_ctxt
420*c83a76b0SSuyog Pawar * pointer to mv predictor context
421*c83a76b0SSuyog Pawar *
422*c83a76b0SSuyog Pawar * @param[in] ps_top_nbr_4x4
423*c83a76b0SSuyog Pawar * pointer to top 4x4 nbr structure
424*c83a76b0SSuyog Pawar *
425*c83a76b0SSuyog Pawar * @param[in] ps_left_nbr_4x4
426*c83a76b0SSuyog Pawar * pointer to left 4x4 nbr structure
427*c83a76b0SSuyog Pawar *
428*c83a76b0SSuyog Pawar * @param[in] ps_top_left_nbr_4x4
429*c83a76b0SSuyog Pawar * pointer to top left 4x4 nbr structure
430*c83a76b0SSuyog Pawar *
431*c83a76b0SSuyog Pawar * @param[in] left_nbr_4x4_strd
432*c83a76b0SSuyog Pawar * left nbr buffer stride in terms of 4x4 units
433*c83a76b0SSuyog Pawar *
434*c83a76b0SSuyog Pawar * @param[in] ps_avail_flags
435*c83a76b0SSuyog Pawar * Neighbor availability flags container
436*c83a76b0SSuyog Pawar *
437*c83a76b0SSuyog Pawar * @param[in] ps_col_mv
438*c83a76b0SSuyog Pawar * Colocated MV pointer
439*c83a76b0SSuyog Pawar *
440*c83a76b0SSuyog Pawar * @param[in] ps_pu
441*c83a76b0SSuyog Pawar * Current Partition PU structure pointer
442*c83a76b0SSuyog Pawar *
443*c83a76b0SSuyog Pawar * @param[in] part_mode
444*c83a76b0SSuyog Pawar * Partition mode @sa PART_SIZE_E
445*c83a76b0SSuyog Pawar *
446*c83a76b0SSuyog Pawar * @param[in] part_idx
447*c83a76b0SSuyog Pawar * Partition idx of current partition inside CU
448*c83a76b0SSuyog Pawar *
449*c83a76b0SSuyog Pawar * @param[in] single_mcl_flag
450*c83a76b0SSuyog Pawar * Single MCL flag based on 8x8 CU and Parallel merge value
451*c83a76b0SSuyog Pawar *
452*c83a76b0SSuyog Pawar * @param[out] ps_merge_cand_list
453*c83a76b0SSuyog Pawar * pointer to store MV merge candidates list
454*c83a76b0SSuyog Pawar *
455*c83a76b0SSuyog Pawar * @returns
456*c83a76b0SSuyog Pawar * None
457*c83a76b0SSuyog Pawar * @remarks
458*c83a76b0SSuyog Pawar *
459*c83a76b0SSuyog Pawar *
460*c83a76b0SSuyog Pawar *******************************************************************************
461*c83a76b0SSuyog Pawar */
ihevcd_mv_merge(mv_ctxt_t * ps_mv_ctxt,UWORD32 * pu4_top_pu_idx,UWORD32 * pu4_left_pu_idx,WORD32 left_nbr_4x4_strd,pu_t * ps_pu,WORD32 part_mode,WORD32 part_idx,WORD32 part_wd,WORD32 part_ht,WORD32 part_pos_x,WORD32 part_pos_y,WORD32 single_mcl_flag,WORD32 lb_avail,WORD32 l_avail,WORD32 tr_avail,WORD32 t_avail,WORD32 tl_avail)462*c83a76b0SSuyog Pawar void ihevcd_mv_merge(mv_ctxt_t *ps_mv_ctxt,
463*c83a76b0SSuyog Pawar UWORD32 *pu4_top_pu_idx,
464*c83a76b0SSuyog Pawar UWORD32 *pu4_left_pu_idx,
465*c83a76b0SSuyog Pawar WORD32 left_nbr_4x4_strd,
466*c83a76b0SSuyog Pawar pu_t *ps_pu,
467*c83a76b0SSuyog Pawar WORD32 part_mode,
468*c83a76b0SSuyog Pawar WORD32 part_idx,
469*c83a76b0SSuyog Pawar WORD32 part_wd,
470*c83a76b0SSuyog Pawar WORD32 part_ht,
471*c83a76b0SSuyog Pawar WORD32 part_pos_x,
472*c83a76b0SSuyog Pawar WORD32 part_pos_y,
473*c83a76b0SSuyog Pawar WORD32 single_mcl_flag,
474*c83a76b0SSuyog Pawar WORD32 lb_avail,
475*c83a76b0SSuyog Pawar WORD32 l_avail,
476*c83a76b0SSuyog Pawar WORD32 tr_avail,
477*c83a76b0SSuyog Pawar WORD32 t_avail,
478*c83a76b0SSuyog Pawar WORD32 tl_avail)
479*c83a76b0SSuyog Pawar {
480*c83a76b0SSuyog Pawar /******************************************************/
481*c83a76b0SSuyog Pawar /* Spatial Merge Candidates */
482*c83a76b0SSuyog Pawar /******************************************************/
483*c83a76b0SSuyog Pawar slice_header_t *ps_slice_hdr;
484*c83a76b0SSuyog Pawar pu_t as_pu_merge_list[MAX_NUM_MERGE_CAND];
485*c83a76b0SSuyog Pawar pps_t *ps_pps;
486*c83a76b0SSuyog Pawar ref_list_t *ps_ref_list[2];
487*c83a76b0SSuyog Pawar WORD32 sum_avail_a0_a1_b0_b1 = 0; /*Sum of availability of A0, A1, B0, B1*/
488*c83a76b0SSuyog Pawar WORD32 nbr_x, nbr_y;
489*c83a76b0SSuyog Pawar WORD32 nbr_avail[MAX_NUM_MV_NBR];
490*c83a76b0SSuyog Pawar WORD32 merge_shift;
491*c83a76b0SSuyog Pawar WORD32 nbr_pu_idx;
492*c83a76b0SSuyog Pawar pu_t *ps_nbr_pu[MAX_NUM_MV_NBR];
493*c83a76b0SSuyog Pawar WORD32 max_num_merge_cand;
494*c83a76b0SSuyog Pawar WORD32 candidate_cnt;
495*c83a76b0SSuyog Pawar WORD32 pos_x_merge_shift, pos_y_merge_shift;
496*c83a76b0SSuyog Pawar
497*c83a76b0SSuyog Pawar ps_slice_hdr = ps_mv_ctxt->ps_slice_hdr;
498*c83a76b0SSuyog Pawar ps_pps = ps_mv_ctxt->ps_pps;
499*c83a76b0SSuyog Pawar /* Initializing reference list */
500*c83a76b0SSuyog Pawar ps_ref_list[0] = ps_slice_hdr->as_ref_pic_list0;
501*c83a76b0SSuyog Pawar ps_ref_list[1] = ps_slice_hdr->as_ref_pic_list1;
502*c83a76b0SSuyog Pawar if(PSLICE == ps_slice_hdr->i1_slice_type)
503*c83a76b0SSuyog Pawar ps_ref_list[1] = ps_slice_hdr->as_ref_pic_list0;
504*c83a76b0SSuyog Pawar
505*c83a76b0SSuyog Pawar candidate_cnt = 0;
506*c83a76b0SSuyog Pawar /*******************************************/
507*c83a76b0SSuyog Pawar /* Neighbor location: Graphical indication */
508*c83a76b0SSuyog Pawar /* */
509*c83a76b0SSuyog Pawar /* B2 _____________B1 B0 */
510*c83a76b0SSuyog Pawar /* | | */
511*c83a76b0SSuyog Pawar /* | | */
512*c83a76b0SSuyog Pawar /* | | */
513*c83a76b0SSuyog Pawar /* | PU ht| */
514*c83a76b0SSuyog Pawar /* | | */
515*c83a76b0SSuyog Pawar /* | | */
516*c83a76b0SSuyog Pawar /* A1|______wd_______| */
517*c83a76b0SSuyog Pawar /* A0 */
518*c83a76b0SSuyog Pawar /* */
519*c83a76b0SSuyog Pawar /*******************************************/
520*c83a76b0SSuyog Pawar
521*c83a76b0SSuyog Pawar merge_shift = ps_pps->i1_log2_parallel_merge_level;
522*c83a76b0SSuyog Pawar
523*c83a76b0SSuyog Pawar /* Availability check */
524*c83a76b0SSuyog Pawar /* A1 */
525*c83a76b0SSuyog Pawar nbr_x = part_pos_x - 1;
526*c83a76b0SSuyog Pawar nbr_y = part_pos_y + part_ht - 1; /* A1 */
527*c83a76b0SSuyog Pawar
528*c83a76b0SSuyog Pawar nbr_pu_idx = *(pu4_left_pu_idx + ((nbr_y - part_pos_y) >> 2) * left_nbr_4x4_strd);
529*c83a76b0SSuyog Pawar ps_nbr_pu[NBR_A1] = ps_mv_ctxt->ps_pic_pu + nbr_pu_idx;
530*c83a76b0SSuyog Pawar
531*c83a76b0SSuyog Pawar nbr_avail[NBR_A1] = l_avail
532*c83a76b0SSuyog Pawar && (!ps_nbr_pu[NBR_A1]->b1_intra_flag); /* A1 */
533*c83a76b0SSuyog Pawar
534*c83a76b0SSuyog Pawar pos_x_merge_shift = (part_pos_x >> merge_shift);
535*c83a76b0SSuyog Pawar pos_y_merge_shift = (part_pos_y >> merge_shift);
536*c83a76b0SSuyog Pawar max_num_merge_cand = ps_pu->b3_merge_idx + 1;
537*c83a76b0SSuyog Pawar
538*c83a76b0SSuyog Pawar {
539*c83a76b0SSuyog Pawar if(nbr_avail[NBR_A1])
540*c83a76b0SSuyog Pawar {
541*c83a76b0SSuyog Pawar /* if at same merge level */
542*c83a76b0SSuyog Pawar if(pos_x_merge_shift == (nbr_x >> merge_shift) &&
543*c83a76b0SSuyog Pawar (pos_y_merge_shift == (nbr_y >> merge_shift)))
544*c83a76b0SSuyog Pawar {
545*c83a76b0SSuyog Pawar nbr_avail[NBR_A1] = 0;
546*c83a76b0SSuyog Pawar }
547*c83a76b0SSuyog Pawar
548*c83a76b0SSuyog Pawar /* SPEC JCTVC-K1003_v9 version has a different way using not available */
549*c83a76b0SSuyog Pawar /* candidates compared to software. for non square part and second part case */
550*c83a76b0SSuyog Pawar /* ideally nothing from the 1st partition should be used as per spec but */
551*c83a76b0SSuyog Pawar /* HM 8.2 dev version does not adhere to this. currently code follows HM */
552*c83a76b0SSuyog Pawar
553*c83a76b0SSuyog Pawar /* if single MCL is 0 , second part of 2 part in CU */
554*c83a76b0SSuyog Pawar else if((single_mcl_flag == 0) && (part_idx == 1) &&
555*c83a76b0SSuyog Pawar ((part_mode == PART_Nx2N) || (part_mode == PART_nLx2N) ||
556*c83a76b0SSuyog Pawar (part_mode == PART_nRx2N)))
557*c83a76b0SSuyog Pawar {
558*c83a76b0SSuyog Pawar nbr_avail[NBR_A1] = 0;
559*c83a76b0SSuyog Pawar }
560*c83a76b0SSuyog Pawar sum_avail_a0_a1_b0_b1 += nbr_avail[NBR_A1];
561*c83a76b0SSuyog Pawar if(nbr_avail[NBR_A1])
562*c83a76b0SSuyog Pawar {
563*c83a76b0SSuyog Pawar as_pu_merge_list[candidate_cnt] = *ps_nbr_pu[NBR_A1];
564*c83a76b0SSuyog Pawar candidate_cnt++;
565*c83a76b0SSuyog Pawar if(candidate_cnt == max_num_merge_cand)
566*c83a76b0SSuyog Pawar {
567*c83a76b0SSuyog Pawar ps_pu[0].mv = as_pu_merge_list[candidate_cnt - 1].mv;
568*c83a76b0SSuyog Pawar ps_pu[0].b2_pred_mode = as_pu_merge_list[candidate_cnt - 1].b2_pred_mode;
569*c83a76b0SSuyog Pawar return;
570*c83a76b0SSuyog Pawar }
571*c83a76b0SSuyog Pawar }
572*c83a76b0SSuyog Pawar }
573*c83a76b0SSuyog Pawar }
574*c83a76b0SSuyog Pawar
575*c83a76b0SSuyog Pawar /* B1 */
576*c83a76b0SSuyog Pawar nbr_x = part_pos_x + part_wd - 1;
577*c83a76b0SSuyog Pawar nbr_y = part_pos_y - 1;
578*c83a76b0SSuyog Pawar
579*c83a76b0SSuyog Pawar nbr_pu_idx = *(pu4_top_pu_idx + ((nbr_x - part_pos_x) >> 2));
580*c83a76b0SSuyog Pawar ps_nbr_pu[NBR_B1] = ps_mv_ctxt->ps_pic_pu + nbr_pu_idx;
581*c83a76b0SSuyog Pawar
582*c83a76b0SSuyog Pawar nbr_avail[NBR_B1] = t_avail
583*c83a76b0SSuyog Pawar && (!ps_nbr_pu[NBR_B1]->b1_intra_flag); /* B1 */
584*c83a76b0SSuyog Pawar
585*c83a76b0SSuyog Pawar {
586*c83a76b0SSuyog Pawar WORD32 avail_flag;
587*c83a76b0SSuyog Pawar avail_flag = nbr_avail[NBR_B1];
588*c83a76b0SSuyog Pawar
589*c83a76b0SSuyog Pawar if(nbr_avail[NBR_B1])
590*c83a76b0SSuyog Pawar {
591*c83a76b0SSuyog Pawar /* if at same merge level */
592*c83a76b0SSuyog Pawar if(pos_x_merge_shift == (nbr_x >> merge_shift) &&
593*c83a76b0SSuyog Pawar (pos_y_merge_shift == (nbr_y >> merge_shift)))
594*c83a76b0SSuyog Pawar {
595*c83a76b0SSuyog Pawar nbr_avail[NBR_B1] = 0;
596*c83a76b0SSuyog Pawar avail_flag = 0;
597*c83a76b0SSuyog Pawar }
598*c83a76b0SSuyog Pawar
599*c83a76b0SSuyog Pawar /* if single MCL is 0 , second part of 2 part in CU */
600*c83a76b0SSuyog Pawar else if((single_mcl_flag == 0) && (part_idx == 1) &&
601*c83a76b0SSuyog Pawar ((part_mode == PART_2NxN) || (part_mode == PART_2NxnU) ||
602*c83a76b0SSuyog Pawar (part_mode == PART_2NxnD)))
603*c83a76b0SSuyog Pawar {
604*c83a76b0SSuyog Pawar nbr_avail[NBR_B1] = 0;
605*c83a76b0SSuyog Pawar avail_flag = 0;
606*c83a76b0SSuyog Pawar }
607*c83a76b0SSuyog Pawar
608*c83a76b0SSuyog Pawar else if(nbr_avail[NBR_A1])
609*c83a76b0SSuyog Pawar {
610*c83a76b0SSuyog Pawar avail_flag = !ihevcd_compare_pu_t(ps_nbr_pu[NBR_A1], ps_nbr_pu[NBR_B1]);
611*c83a76b0SSuyog Pawar }
612*c83a76b0SSuyog Pawar
613*c83a76b0SSuyog Pawar sum_avail_a0_a1_b0_b1 += avail_flag;
614*c83a76b0SSuyog Pawar if(avail_flag)
615*c83a76b0SSuyog Pawar {
616*c83a76b0SSuyog Pawar as_pu_merge_list[candidate_cnt] = *ps_nbr_pu[NBR_B1];
617*c83a76b0SSuyog Pawar candidate_cnt++;
618*c83a76b0SSuyog Pawar if(candidate_cnt == max_num_merge_cand)
619*c83a76b0SSuyog Pawar {
620*c83a76b0SSuyog Pawar ps_pu[0].mv = as_pu_merge_list[candidate_cnt - 1].mv;
621*c83a76b0SSuyog Pawar ps_pu[0].b2_pred_mode = as_pu_merge_list[candidate_cnt - 1].b2_pred_mode;
622*c83a76b0SSuyog Pawar return;
623*c83a76b0SSuyog Pawar }
624*c83a76b0SSuyog Pawar }
625*c83a76b0SSuyog Pawar }
626*c83a76b0SSuyog Pawar }
627*c83a76b0SSuyog Pawar /* B0 */
628*c83a76b0SSuyog Pawar nbr_x = part_pos_x + part_wd;
629*c83a76b0SSuyog Pawar nbr_y = part_pos_y - 1;
630*c83a76b0SSuyog Pawar
631*c83a76b0SSuyog Pawar nbr_pu_idx = *(pu4_top_pu_idx + ((nbr_x - part_pos_x) >> 2));
632*c83a76b0SSuyog Pawar ps_nbr_pu[NBR_B0] = ps_mv_ctxt->ps_pic_pu + nbr_pu_idx;
633*c83a76b0SSuyog Pawar
634*c83a76b0SSuyog Pawar nbr_avail[NBR_B0] = tr_avail
635*c83a76b0SSuyog Pawar && (!ps_nbr_pu[NBR_B0]->b1_intra_flag); /* B0 */
636*c83a76b0SSuyog Pawar
637*c83a76b0SSuyog Pawar {
638*c83a76b0SSuyog Pawar WORD32 avail_flag;
639*c83a76b0SSuyog Pawar avail_flag = nbr_avail[NBR_B0];
640*c83a76b0SSuyog Pawar
641*c83a76b0SSuyog Pawar /* if at same merge level */
642*c83a76b0SSuyog Pawar if(nbr_avail[NBR_B0])
643*c83a76b0SSuyog Pawar {
644*c83a76b0SSuyog Pawar if(pos_x_merge_shift == (nbr_x >> merge_shift) &&
645*c83a76b0SSuyog Pawar (pos_y_merge_shift == (nbr_y >> merge_shift)))
646*c83a76b0SSuyog Pawar {
647*c83a76b0SSuyog Pawar nbr_avail[NBR_B0] = 0;
648*c83a76b0SSuyog Pawar avail_flag = 0;
649*c83a76b0SSuyog Pawar }
650*c83a76b0SSuyog Pawar else if(nbr_avail[NBR_B1])
651*c83a76b0SSuyog Pawar {
652*c83a76b0SSuyog Pawar avail_flag = !ihevcd_compare_pu_t(ps_nbr_pu[NBR_B1], ps_nbr_pu[NBR_B0]);
653*c83a76b0SSuyog Pawar }
654*c83a76b0SSuyog Pawar
655*c83a76b0SSuyog Pawar sum_avail_a0_a1_b0_b1 += avail_flag;
656*c83a76b0SSuyog Pawar if(avail_flag)
657*c83a76b0SSuyog Pawar {
658*c83a76b0SSuyog Pawar as_pu_merge_list[candidate_cnt] = *ps_nbr_pu[NBR_B0];
659*c83a76b0SSuyog Pawar candidate_cnt++;
660*c83a76b0SSuyog Pawar if(candidate_cnt == max_num_merge_cand)
661*c83a76b0SSuyog Pawar {
662*c83a76b0SSuyog Pawar ps_pu[0].mv = as_pu_merge_list[candidate_cnt - 1].mv;
663*c83a76b0SSuyog Pawar ps_pu[0].b2_pred_mode = as_pu_merge_list[candidate_cnt - 1].b2_pred_mode;
664*c83a76b0SSuyog Pawar return;
665*c83a76b0SSuyog Pawar }
666*c83a76b0SSuyog Pawar }
667*c83a76b0SSuyog Pawar }
668*c83a76b0SSuyog Pawar }
669*c83a76b0SSuyog Pawar /* A0 */
670*c83a76b0SSuyog Pawar nbr_x = part_pos_x - 1;
671*c83a76b0SSuyog Pawar nbr_y = part_pos_y + part_ht; /* A0 */
672*c83a76b0SSuyog Pawar
673*c83a76b0SSuyog Pawar nbr_pu_idx = *(pu4_left_pu_idx + ((nbr_y - part_pos_y) >> 2) * left_nbr_4x4_strd);
674*c83a76b0SSuyog Pawar ps_nbr_pu[NBR_A0] = ps_mv_ctxt->ps_pic_pu + nbr_pu_idx;
675*c83a76b0SSuyog Pawar
676*c83a76b0SSuyog Pawar nbr_avail[NBR_A0] = lb_avail
677*c83a76b0SSuyog Pawar && (!ps_nbr_pu[NBR_A0]->b1_intra_flag); /* A0 */
678*c83a76b0SSuyog Pawar {
679*c83a76b0SSuyog Pawar WORD32 avail_flag;
680*c83a76b0SSuyog Pawar avail_flag = nbr_avail[NBR_A0];
681*c83a76b0SSuyog Pawar
682*c83a76b0SSuyog Pawar if(nbr_avail[NBR_A0])
683*c83a76b0SSuyog Pawar {
684*c83a76b0SSuyog Pawar /* if at same merge level */
685*c83a76b0SSuyog Pawar if(pos_x_merge_shift == (nbr_x >> merge_shift) &&
686*c83a76b0SSuyog Pawar (pos_y_merge_shift == (nbr_y >> merge_shift)))
687*c83a76b0SSuyog Pawar {
688*c83a76b0SSuyog Pawar nbr_avail[NBR_A0] = 0;
689*c83a76b0SSuyog Pawar avail_flag = 0;
690*c83a76b0SSuyog Pawar }
691*c83a76b0SSuyog Pawar else if(nbr_avail[NBR_A1])
692*c83a76b0SSuyog Pawar {
693*c83a76b0SSuyog Pawar avail_flag = !ihevcd_compare_pu_t(ps_nbr_pu[NBR_A1], ps_nbr_pu[NBR_A0]);
694*c83a76b0SSuyog Pawar }
695*c83a76b0SSuyog Pawar
696*c83a76b0SSuyog Pawar sum_avail_a0_a1_b0_b1 += avail_flag;
697*c83a76b0SSuyog Pawar if(avail_flag)
698*c83a76b0SSuyog Pawar {
699*c83a76b0SSuyog Pawar as_pu_merge_list[candidate_cnt] = *ps_nbr_pu[NBR_A0];
700*c83a76b0SSuyog Pawar candidate_cnt++;
701*c83a76b0SSuyog Pawar if(candidate_cnt == max_num_merge_cand)
702*c83a76b0SSuyog Pawar {
703*c83a76b0SSuyog Pawar ps_pu[0].mv = as_pu_merge_list[candidate_cnt - 1].mv;
704*c83a76b0SSuyog Pawar ps_pu[0].b2_pred_mode = as_pu_merge_list[candidate_cnt - 1].b2_pred_mode;
705*c83a76b0SSuyog Pawar return;
706*c83a76b0SSuyog Pawar }
707*c83a76b0SSuyog Pawar }
708*c83a76b0SSuyog Pawar }
709*c83a76b0SSuyog Pawar }
710*c83a76b0SSuyog Pawar /* B2 */
711*c83a76b0SSuyog Pawar
712*c83a76b0SSuyog Pawar nbr_x = part_pos_x - 1;
713*c83a76b0SSuyog Pawar nbr_y = part_pos_y - 1; /* B2 */
714*c83a76b0SSuyog Pawar
715*c83a76b0SSuyog Pawar nbr_pu_idx = *(pu4_top_pu_idx + ((nbr_x - part_pos_x) >> 2));
716*c83a76b0SSuyog Pawar ps_nbr_pu[NBR_B2] = ps_mv_ctxt->ps_pic_pu + nbr_pu_idx;
717*c83a76b0SSuyog Pawar
718*c83a76b0SSuyog Pawar nbr_avail[NBR_B2] = tl_avail
719*c83a76b0SSuyog Pawar && (!ps_nbr_pu[NBR_B2]->b1_intra_flag); /* B2 */
720*c83a76b0SSuyog Pawar
721*c83a76b0SSuyog Pawar {
722*c83a76b0SSuyog Pawar WORD32 avail_flag;
723*c83a76b0SSuyog Pawar avail_flag = nbr_avail[NBR_B2];
724*c83a76b0SSuyog Pawar
725*c83a76b0SSuyog Pawar if(nbr_avail[NBR_B2])
726*c83a76b0SSuyog Pawar {
727*c83a76b0SSuyog Pawar /* if at same merge level */
728*c83a76b0SSuyog Pawar if(pos_x_merge_shift == (nbr_x >> merge_shift) &&
729*c83a76b0SSuyog Pawar (pos_y_merge_shift == (nbr_y >> merge_shift)))
730*c83a76b0SSuyog Pawar {
731*c83a76b0SSuyog Pawar nbr_avail[NBR_B2] = 0;
732*c83a76b0SSuyog Pawar avail_flag = 0;
733*c83a76b0SSuyog Pawar }
734*c83a76b0SSuyog Pawar else if(4 == sum_avail_a0_a1_b0_b1)
735*c83a76b0SSuyog Pawar {
736*c83a76b0SSuyog Pawar avail_flag = 0;
737*c83a76b0SSuyog Pawar }
738*c83a76b0SSuyog Pawar
739*c83a76b0SSuyog Pawar else
740*c83a76b0SSuyog Pawar {
741*c83a76b0SSuyog Pawar if(nbr_avail[NBR_A1])
742*c83a76b0SSuyog Pawar {
743*c83a76b0SSuyog Pawar avail_flag = !ihevcd_compare_pu_t(ps_nbr_pu[NBR_A1], ps_nbr_pu[NBR_B2]);
744*c83a76b0SSuyog Pawar }
745*c83a76b0SSuyog Pawar
746*c83a76b0SSuyog Pawar if(avail_flag && nbr_avail[NBR_B1])
747*c83a76b0SSuyog Pawar {
748*c83a76b0SSuyog Pawar avail_flag = !ihevcd_compare_pu_t(ps_nbr_pu[NBR_B1], ps_nbr_pu[NBR_B2]);
749*c83a76b0SSuyog Pawar }
750*c83a76b0SSuyog Pawar }
751*c83a76b0SSuyog Pawar
752*c83a76b0SSuyog Pawar if(avail_flag)
753*c83a76b0SSuyog Pawar {
754*c83a76b0SSuyog Pawar as_pu_merge_list[candidate_cnt] = *ps_nbr_pu[NBR_B2];
755*c83a76b0SSuyog Pawar candidate_cnt++;
756*c83a76b0SSuyog Pawar if(candidate_cnt == max_num_merge_cand)
757*c83a76b0SSuyog Pawar {
758*c83a76b0SSuyog Pawar ps_pu[0].mv = as_pu_merge_list[candidate_cnt - 1].mv;
759*c83a76b0SSuyog Pawar ps_pu[0].b2_pred_mode = as_pu_merge_list[candidate_cnt - 1].b2_pred_mode;
760*c83a76b0SSuyog Pawar return;
761*c83a76b0SSuyog Pawar }
762*c83a76b0SSuyog Pawar }
763*c83a76b0SSuyog Pawar }
764*c83a76b0SSuyog Pawar }
765*c83a76b0SSuyog Pawar
766*c83a76b0SSuyog Pawar /***********************************************************/
767*c83a76b0SSuyog Pawar /* Collocated MV prediction */
768*c83a76b0SSuyog Pawar /***********************************************************/
769*c83a76b0SSuyog Pawar {
770*c83a76b0SSuyog Pawar mv_t as_mv_col[2];
771*c83a76b0SSuyog Pawar WORD32 avail_col_flag[2] = { 0 }, x_col, y_col;
772*c83a76b0SSuyog Pawar WORD32 avail_col_l0, avail_col_l1;
773*c83a76b0SSuyog Pawar // ihevcd_collocated_mvp(ps_mv_ctxt,ps_pu,part_pos_x,part_pos_y,part_wd,part_ht,as_mv_col,avail_col_flag,0);
774*c83a76b0SSuyog Pawar
775*c83a76b0SSuyog Pawar /* Checking Collocated MV availability at Bottom right of PU*/
776*c83a76b0SSuyog Pawar x_col = part_pos_x + part_wd;
777*c83a76b0SSuyog Pawar y_col = part_pos_y + part_ht;
778*c83a76b0SSuyog Pawar ihevcd_collocated_mvp(ps_mv_ctxt, ps_pu, as_mv_col, avail_col_flag, 0, x_col, y_col);
779*c83a76b0SSuyog Pawar
780*c83a76b0SSuyog Pawar avail_col_l0 = avail_col_flag[0];
781*c83a76b0SSuyog Pawar avail_col_l1 = avail_col_flag[1];
782*c83a76b0SSuyog Pawar
783*c83a76b0SSuyog Pawar if(avail_col_l0 || avail_col_l1)
784*c83a76b0SSuyog Pawar {
785*c83a76b0SSuyog Pawar as_pu_merge_list[candidate_cnt].mv.s_l0_mv = as_mv_col[0];
786*c83a76b0SSuyog Pawar as_pu_merge_list[candidate_cnt].mv.s_l1_mv = as_mv_col[1];
787*c83a76b0SSuyog Pawar }
788*c83a76b0SSuyog Pawar
789*c83a76b0SSuyog Pawar if(avail_col_l0 == 0 || avail_col_l1 == 0)
790*c83a76b0SSuyog Pawar {
791*c83a76b0SSuyog Pawar /* Checking Collocated MV availability at Center of PU */
792*c83a76b0SSuyog Pawar x_col = part_pos_x + (part_wd >> 1);
793*c83a76b0SSuyog Pawar y_col = part_pos_y + (part_ht >> 1);
794*c83a76b0SSuyog Pawar ihevcd_collocated_mvp(ps_mv_ctxt, ps_pu, as_mv_col, avail_col_flag, 0, x_col, y_col);
795*c83a76b0SSuyog Pawar
796*c83a76b0SSuyog Pawar if(avail_col_l0 == 0)
797*c83a76b0SSuyog Pawar {
798*c83a76b0SSuyog Pawar as_pu_merge_list[candidate_cnt].mv.s_l0_mv = as_mv_col[0];
799*c83a76b0SSuyog Pawar }
800*c83a76b0SSuyog Pawar if(avail_col_l1 == 0)
801*c83a76b0SSuyog Pawar {
802*c83a76b0SSuyog Pawar as_pu_merge_list[candidate_cnt].mv.s_l1_mv = as_mv_col[1];
803*c83a76b0SSuyog Pawar }
804*c83a76b0SSuyog Pawar
805*c83a76b0SSuyog Pawar avail_col_l0 |= avail_col_flag[0];
806*c83a76b0SSuyog Pawar avail_col_l1 |= avail_col_flag[1];
807*c83a76b0SSuyog Pawar }
808*c83a76b0SSuyog Pawar
809*c83a76b0SSuyog Pawar as_pu_merge_list[candidate_cnt].mv.i1_l0_ref_idx = 0;
810*c83a76b0SSuyog Pawar as_pu_merge_list[candidate_cnt].mv.i1_l1_ref_idx = 0;
811*c83a76b0SSuyog Pawar as_pu_merge_list[candidate_cnt].b2_pred_mode = avail_col_l0 ? (avail_col_l1 ? PRED_BI : PRED_L0) : PRED_L1;
812*c83a76b0SSuyog Pawar
813*c83a76b0SSuyog Pawar candidate_cnt += (avail_col_l0 || avail_col_l1);
814*c83a76b0SSuyog Pawar
815*c83a76b0SSuyog Pawar if(candidate_cnt == max_num_merge_cand)
816*c83a76b0SSuyog Pawar {
817*c83a76b0SSuyog Pawar ps_pu[0].mv = as_pu_merge_list[candidate_cnt - 1].mv;
818*c83a76b0SSuyog Pawar ps_pu[0].b2_pred_mode = as_pu_merge_list[candidate_cnt - 1].b2_pred_mode;
819*c83a76b0SSuyog Pawar return;
820*c83a76b0SSuyog Pawar }
821*c83a76b0SSuyog Pawar
822*c83a76b0SSuyog Pawar }
823*c83a76b0SSuyog Pawar {
824*c83a76b0SSuyog Pawar WORD32 slice_type;
825*c83a76b0SSuyog Pawar
826*c83a76b0SSuyog Pawar slice_type = ps_slice_hdr->i1_slice_type;
827*c83a76b0SSuyog Pawar /* Colocated mv has to be added to list, if available */
828*c83a76b0SSuyog Pawar
829*c83a76b0SSuyog Pawar /******************************************************/
830*c83a76b0SSuyog Pawar /* Bi pred merge candidates */
831*c83a76b0SSuyog Pawar /******************************************************/
832*c83a76b0SSuyog Pawar if(slice_type == BSLICE)
833*c83a76b0SSuyog Pawar {
834*c83a76b0SSuyog Pawar if((candidate_cnt > 1) && (candidate_cnt < MAX_NUM_MERGE_CAND))
835*c83a76b0SSuyog Pawar {
836*c83a76b0SSuyog Pawar WORD32 priority_list0[12] =
837*c83a76b0SSuyog Pawar { 0, 1, 0, 2, 1, 2, 0, 3, 1, 3, 2, 3 };
838*c83a76b0SSuyog Pawar WORD32 priority_list1[12] =
839*c83a76b0SSuyog Pawar { 1, 0, 2, 0, 2, 1, 3, 0, 3, 1, 3, 2 };
840*c83a76b0SSuyog Pawar WORD32 l0_cand, l1_cand;
841*c83a76b0SSuyog Pawar WORD32 bi_pred_idx = 0;
842*c83a76b0SSuyog Pawar WORD32 total_bi_pred_cand =
843*c83a76b0SSuyog Pawar candidate_cnt * (candidate_cnt - 1);
844*c83a76b0SSuyog Pawar
845*c83a76b0SSuyog Pawar while(bi_pred_idx < total_bi_pred_cand)
846*c83a76b0SSuyog Pawar {
847*c83a76b0SSuyog Pawar l0_cand = priority_list0[bi_pred_idx];
848*c83a76b0SSuyog Pawar l1_cand = priority_list1[bi_pred_idx];
849*c83a76b0SSuyog Pawar
850*c83a76b0SSuyog Pawar if((as_pu_merge_list[l0_cand].b2_pred_mode != PRED_L1)
851*c83a76b0SSuyog Pawar && (as_pu_merge_list[l1_cand].b2_pred_mode
852*c83a76b0SSuyog Pawar != PRED_L0))
853*c83a76b0SSuyog Pawar {
854*c83a76b0SSuyog Pawar WORD8 i1_l0_ref_idx, i1_l1_ref_idx;
855*c83a76b0SSuyog Pawar mv_t s_l0_mv, s_l1_mv;
856*c83a76b0SSuyog Pawar pic_buf_t *ps_pic_buf_l0, *ps_pic_buf_l1;
857*c83a76b0SSuyog Pawar
858*c83a76b0SSuyog Pawar i1_l0_ref_idx = as_pu_merge_list[l0_cand].mv.i1_l0_ref_idx;
859*c83a76b0SSuyog Pawar i1_l1_ref_idx = as_pu_merge_list[l1_cand].mv.i1_l1_ref_idx;
860*c83a76b0SSuyog Pawar ps_pic_buf_l0 = (pic_buf_t *)((ps_ref_list[0][i1_l0_ref_idx].pv_pic_buf));
861*c83a76b0SSuyog Pawar ps_pic_buf_l1 = (pic_buf_t *)((ps_ref_list[1][i1_l1_ref_idx].pv_pic_buf));
862*c83a76b0SSuyog Pawar s_l0_mv = as_pu_merge_list[l0_cand].mv.s_l0_mv;
863*c83a76b0SSuyog Pawar s_l1_mv = as_pu_merge_list[l1_cand].mv.s_l1_mv;
864*c83a76b0SSuyog Pawar
865*c83a76b0SSuyog Pawar if((ps_pic_buf_l0->i4_abs_poc != ps_pic_buf_l1->i4_abs_poc)
866*c83a76b0SSuyog Pawar || (s_l0_mv.i2_mvx != s_l1_mv.i2_mvx)
867*c83a76b0SSuyog Pawar || (s_l0_mv.i2_mvy != s_l1_mv.i2_mvy))
868*c83a76b0SSuyog Pawar {
869*c83a76b0SSuyog Pawar candidate_cnt++;
870*c83a76b0SSuyog Pawar if(candidate_cnt == max_num_merge_cand)
871*c83a76b0SSuyog Pawar {
872*c83a76b0SSuyog Pawar ps_pu[0].mv.s_l0_mv = s_l0_mv;
873*c83a76b0SSuyog Pawar ps_pu[0].mv.s_l1_mv = s_l1_mv;
874*c83a76b0SSuyog Pawar ps_pu[0].mv.i1_l0_ref_idx = i1_l0_ref_idx;
875*c83a76b0SSuyog Pawar ps_pu[0].mv.i1_l1_ref_idx = i1_l1_ref_idx;
876*c83a76b0SSuyog Pawar ps_pu[0].b2_pred_mode = PRED_BI;
877*c83a76b0SSuyog Pawar return;
878*c83a76b0SSuyog Pawar }
879*c83a76b0SSuyog Pawar }
880*c83a76b0SSuyog Pawar }
881*c83a76b0SSuyog Pawar
882*c83a76b0SSuyog Pawar bi_pred_idx++;
883*c83a76b0SSuyog Pawar
884*c83a76b0SSuyog Pawar if((bi_pred_idx == total_bi_pred_cand)
885*c83a76b0SSuyog Pawar || (candidate_cnt == MAX_NUM_MERGE_CAND))
886*c83a76b0SSuyog Pawar {
887*c83a76b0SSuyog Pawar break;
888*c83a76b0SSuyog Pawar }
889*c83a76b0SSuyog Pawar }
890*c83a76b0SSuyog Pawar }
891*c83a76b0SSuyog Pawar }
892*c83a76b0SSuyog Pawar
893*c83a76b0SSuyog Pawar /******************************************************/
894*c83a76b0SSuyog Pawar /* Zero merge candidates */
895*c83a76b0SSuyog Pawar /******************************************************/
896*c83a76b0SSuyog Pawar // if(candidate_cnt < max_num_merge_cand)
897*c83a76b0SSuyog Pawar {
898*c83a76b0SSuyog Pawar WORD32 num_ref_idx;
899*c83a76b0SSuyog Pawar WORD32 zero_idx;
900*c83a76b0SSuyog Pawar
901*c83a76b0SSuyog Pawar zero_idx = max_num_merge_cand - candidate_cnt - 1;
902*c83a76b0SSuyog Pawar
903*c83a76b0SSuyog Pawar if(slice_type == PSLICE)
904*c83a76b0SSuyog Pawar num_ref_idx = ps_slice_hdr->i1_num_ref_idx_l0_active;
905*c83a76b0SSuyog Pawar else
906*c83a76b0SSuyog Pawar /* Slice type B */
907*c83a76b0SSuyog Pawar num_ref_idx = MIN(ps_slice_hdr->i1_num_ref_idx_l0_active, ps_slice_hdr->i1_num_ref_idx_l1_active);
908*c83a76b0SSuyog Pawar
909*c83a76b0SSuyog Pawar if(zero_idx >= num_ref_idx)
910*c83a76b0SSuyog Pawar zero_idx = 0;
911*c83a76b0SSuyog Pawar
912*c83a76b0SSuyog Pawar ps_pu[0].mv.i1_l0_ref_idx = zero_idx;
913*c83a76b0SSuyog Pawar if(slice_type == PSLICE)
914*c83a76b0SSuyog Pawar {
915*c83a76b0SSuyog Pawar ps_pu[0].mv.i1_l1_ref_idx = 0;
916*c83a76b0SSuyog Pawar ps_pu[0].b2_pred_mode = PRED_L0;
917*c83a76b0SSuyog Pawar }
918*c83a76b0SSuyog Pawar else /* Slice type B */
919*c83a76b0SSuyog Pawar {
920*c83a76b0SSuyog Pawar ps_pu[0].mv.i1_l1_ref_idx = zero_idx;
921*c83a76b0SSuyog Pawar ps_pu[0].b2_pred_mode = PRED_BI;
922*c83a76b0SSuyog Pawar }
923*c83a76b0SSuyog Pawar
924*c83a76b0SSuyog Pawar ps_pu[0].mv.s_l0_mv.i2_mvx = 0;
925*c83a76b0SSuyog Pawar ps_pu[0].mv.s_l0_mv.i2_mvy = 0;
926*c83a76b0SSuyog Pawar ps_pu[0].mv.s_l1_mv.i2_mvx = 0;
927*c83a76b0SSuyog Pawar ps_pu[0].mv.s_l1_mv.i2_mvy = 0;
928*c83a76b0SSuyog Pawar
929*c83a76b0SSuyog Pawar candidate_cnt++;
930*c83a76b0SSuyog Pawar }
931*c83a76b0SSuyog Pawar }
932*c83a76b0SSuyog Pawar
933*c83a76b0SSuyog Pawar return;
934*c83a76b0SSuyog Pawar }
935*c83a76b0SSuyog Pawar
936*c83a76b0SSuyog Pawar
937