/****************************************************************************** * * Copyright (C) 2018 The Android Open Source Project * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at: * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. * ***************************************************************************** * Originally developed and contributed by Ittiam Systems Pvt. Ltd, Bangalore */ /** ******************************************************************************* * @file * ihevce_mv_pred_merge.c * * @brief * Contains functions for motion vector merge candidates derivation * * @author * Ittiam * * @par List of Functions: * - ihevce_compare_pu_mv_t() * - ihevce_mv_pred_merge() * * @remarks * None * ******************************************************************************* */ /*****************************************************************************/ /* File Includes */ /*****************************************************************************/ /* System include files */ #include <stdio.h> #include <string.h> #include <stdlib.h> #include <assert.h> #include <stdarg.h> #include <math.h> /* User include files */ #include "ihevc_typedefs.h" #include "itt_video_api.h" #include "ihevce_api.h" #include "rc_cntrl_param.h" #include "rc_frame_info_collector.h" #include "rc_look_ahead_params.h" #include "ihevc_defs.h" #include "ihevc_macros.h" #include "ihevc_debug.h" #include "ihevc_structs.h" #include "ihevc_platform_macros.h" #include "ihevc_deblk.h" #include "ihevc_itrans_recon.h" #include 
"ihevc_chroma_itrans_recon.h" #include "ihevc_chroma_intra_pred.h" #include "ihevc_intra_pred.h" #include "ihevc_inter_pred.h" #include "ihevc_mem_fns.h" #include "ihevc_padding.h" #include "ihevc_weighted_pred.h" #include "ihevc_sao.h" #include "ihevc_resi_trans.h" #include "ihevc_quant_iquant_ssd.h" #include "ihevc_cabac_tables.h" #include "ihevc_common_tables.h" #include "ihevce_defs.h" #include "ihevce_hle_interface.h" #include "ihevce_lap_enc_structs.h" #include "ihevce_multi_thrd_structs.h" #include "ihevce_me_common_defs.h" #include "ihevce_had_satd.h" #include "ihevce_error_codes.h" #include "ihevce_bitstream.h" #include "ihevce_cabac.h" #include "ihevce_rdoq_macros.h" #include "ihevce_function_selector.h" #include "ihevce_enc_structs.h" #include "ihevce_entropy_structs.h" #include "ihevce_cmn_utils_instr_set_router.h" #include "ihevce_enc_loop_structs.h" #include "hme_datatype.h" #include "hme_interface.h" #include "hme_common_defs.h" #include "hme_defs.h" #include "ihevce_mv_pred.h" #include "ihevce_mv_pred_merge.h" #include "ihevce_common_utils.h" /*****************************************************************************/ /* Function Definitions */ /*****************************************************************************/ /** ******************************************************************************* * * @brief Function scaling temporal motion vector * * * @par Description: * Scales mv based on difference between current POC and current * reference POC and neighbour reference poc * * @param[inout] mv * motion vector to be scaled * * @param[in] cur_ref_poc * Current PU refernce pic poc * * @param[in] nbr_ref_poc * Neighbor PU reference pic poc * * @param[in] cur_poc * Picture order count of current pic * * @returns * None * * @remarks * ******************************************************************************* */ void ihevce_scale_collocated_mv( mv_t *ps_mv, WORD32 cur_ref_poc, WORD32 col_ref_poc, WORD32 col_poc, WORD32 cur_poc) { WORD32 
td, tb, tx; WORD32 dist_scale_factor; WORD32 mvx, mvy; td = CLIP_S8(col_poc - col_ref_poc); tb = CLIP_S8(cur_poc - cur_ref_poc); tx = (16384 + (abs(td) >> 1)) / td; dist_scale_factor = (tb * tx + 32) >> 6; dist_scale_factor = CLIP3(dist_scale_factor, -4096, 4095); mvx = ps_mv->i2_mvx; mvy = ps_mv->i2_mvy; mvx = SIGN(dist_scale_factor * mvx) * ((abs(dist_scale_factor * mvx) + 127) >> 8); mvy = SIGN(dist_scale_factor * mvy) * ((abs(dist_scale_factor * mvy) + 127) >> 8); ps_mv->i2_mvx = CLIP_S16(mvx); ps_mv->i2_mvy = CLIP_S16(mvy); } /* End of ihevce_scale_collocated_mv */ void ihevce_collocated_mvp( mv_pred_ctxt_t *ps_mv_ctxt, pu_t *ps_pu, mv_t *ps_mv_col, WORD32 *pu4_avail_col_flag, WORD32 use_pu_ref_idx, WORD32 x_col, WORD32 y_col) { sps_t *ps_sps = ps_mv_ctxt->ps_sps; slice_header_t *ps_slice_hdr = ps_mv_ctxt->ps_slice_hdr; recon_pic_buf_t *ps_col_ref_buf; WORD32 xp_col, yp_col; //In pixel unit WORD32 col_ctb_x, col_ctb_y; //In CTB unit mv_t as_mv_col[2]; WORD32 log2_ctb_size; WORD32 ctb_size; WORD32 avail_col; WORD32 col_ctb_idx, pu_cnt; WORD32 au4_list_col[2]; WORD32 num_minpu_in_ctb; UWORD8 *pu1_pic_pu_map_ctb; pu_col_mv_t *ps_col_mv; WORD32 part_pos_y; part_pos_y = ps_pu->b4_pos_y << 2; log2_ctb_size = ps_sps->i1_log2_ctb_size; ctb_size = (1 << log2_ctb_size); avail_col = 1; /* Initializing reference list */ if((ps_slice_hdr->i1_slice_type == BSLICE) && (ps_slice_hdr->i1_collocated_from_l0_flag == 0)) { /* L1 */ ps_col_ref_buf = ps_mv_ctxt->ps_ref_list[1][ps_slice_hdr->i1_collocated_ref_idx]; } else { /* L0 */ ps_col_ref_buf = ps_mv_ctxt->ps_ref_list[0][ps_slice_hdr->i1_collocated_ref_idx]; } num_minpu_in_ctb = (ctb_size / MIN_PU_SIZE) * (ctb_size / MIN_PU_SIZE); if(((part_pos_y >> log2_ctb_size) == (y_col >> log2_ctb_size)) && (((x_col + (ps_mv_ctxt->i4_ctb_x << log2_ctb_size)) < ps_sps->i2_pic_width_in_luma_samples) || ps_mv_ctxt->ai4_tile_xtra_ctb[2]) && ((((y_col + (ps_mv_ctxt->i4_ctb_y << log2_ctb_size)) < ps_sps->i2_pic_height_in_luma_samples) || 
ps_mv_ctxt->ai4_tile_xtra_ctb[3]))) { xp_col = ((x_col >> 4) << 4); yp_col = ((y_col >> 4) << 4); col_ctb_x = ps_mv_ctxt->i4_ctb_x + (xp_col >> log2_ctb_size); col_ctb_y = ps_mv_ctxt->i4_ctb_y + (yp_col >> log2_ctb_size); /* pu1_frm_pu_map has (i2_pic_wd_in_ctb + 1) CTBs for stride */ col_ctb_idx = col_ctb_x + (col_ctb_y) * (ps_sps->i2_pic_wd_in_ctb + 1); if(xp_col == ctb_size) xp_col = 0; pu1_pic_pu_map_ctb = ps_col_ref_buf->pu1_frm_pu_map + col_ctb_idx * num_minpu_in_ctb; pu_cnt = pu1_pic_pu_map_ctb[(yp_col >> 2) * (ctb_size / MIN_PU_SIZE) + (xp_col >> 2)]; /* ps_frm_col_mv has (i2_pic_wd_in_ctb + 1) CTBs for stride */ ps_col_mv = ps_col_ref_buf->ps_frm_col_mv + (col_ctb_y * (ps_sps->i2_pic_wd_in_ctb + 1) + col_ctb_x) * num_minpu_in_ctb + pu_cnt; } else avail_col = 0; if((avail_col == 0) || (ps_col_mv->b1_intra_flag == 1) || (ps_slice_hdr->i1_slice_temporal_mvp_enable_flag == 0)) { pu4_avail_col_flag[0] = 0; pu4_avail_col_flag[1] = 0; ps_mv_col[0].i2_mvx = 0; ps_mv_col[0].i2_mvy = 0; ps_mv_col[1].i2_mvx = 0; ps_mv_col[1].i2_mvy = 0; } else { WORD32 au4_ref_idx_col[2]; WORD32 pred_flag_l0, pred_flag_l1; pred_flag_l0 = (ps_col_mv->b2_pred_mode != PRED_L1); pred_flag_l1 = (ps_col_mv->b2_pred_mode != PRED_L0); if(pred_flag_l0 == 0) { as_mv_col[0] = ps_col_mv->s_l1_mv; au4_ref_idx_col[0] = ps_col_mv->i1_l1_ref_idx; au4_list_col[0] = 1; /* L1 */ as_mv_col[1] = ps_col_mv->s_l1_mv; au4_ref_idx_col[1] = ps_col_mv->i1_l1_ref_idx; au4_list_col[1] = 1; /* L1 */ } else { if(pred_flag_l1 == 0) { as_mv_col[0] = ps_col_mv->s_l0_mv; au4_ref_idx_col[0] = ps_col_mv->i1_l0_ref_idx; au4_list_col[0] = 0; /* L1 */ as_mv_col[1] = ps_col_mv->s_l0_mv; au4_ref_idx_col[1] = ps_col_mv->i1_l0_ref_idx; au4_list_col[1] = 0; /* L1 */ } else { if(1 == ps_slice_hdr->i1_low_delay_flag) { as_mv_col[0] = ps_col_mv->s_l0_mv; au4_ref_idx_col[0] = ps_col_mv->i1_l0_ref_idx; au4_list_col[0] = 0; /* L0 */ as_mv_col[1] = ps_col_mv->s_l1_mv; au4_ref_idx_col[1] = ps_col_mv->i1_l1_ref_idx; au4_list_col[1] = 1; 
/* L1 */ } else { if(0 == ps_slice_hdr->i1_collocated_from_l0_flag) { as_mv_col[0] = ps_col_mv->s_l0_mv; au4_ref_idx_col[0] = ps_col_mv->i1_l0_ref_idx; as_mv_col[1] = ps_col_mv->s_l0_mv; au4_ref_idx_col[1] = ps_col_mv->i1_l0_ref_idx; } else { as_mv_col[0] = ps_col_mv->s_l1_mv; au4_ref_idx_col[0] = ps_col_mv->i1_l1_ref_idx; as_mv_col[1] = ps_col_mv->s_l1_mv; au4_ref_idx_col[1] = ps_col_mv->i1_l1_ref_idx; } au4_list_col[0] = ps_slice_hdr->i1_collocated_from_l0_flag; /* L"collocated_from_l0_flag" */ au4_list_col[1] = ps_slice_hdr->i1_collocated_from_l0_flag; /* L"collocated_from_l0_flag" */ } } } avail_col = 1; { WORD32 cur_poc, col_poc, col_ref_poc_l0, cur_ref_poc; WORD32 col_ref_poc_l0_lt, cur_ref_poc_lt; WORD32 ref_idx_l0, ref_idx_l1; if(use_pu_ref_idx) { ref_idx_l0 = ps_pu->mv.i1_l0_ref_idx; ref_idx_l1 = ps_pu->mv.i1_l1_ref_idx; } else { ref_idx_l0 = 0; ref_idx_l1 = 0; } col_poc = ps_col_ref_buf->i4_poc; cur_poc = ps_slice_hdr->i4_abs_pic_order_cnt; if(-1 != ref_idx_l0) { if(au4_list_col[0] == 0) { col_ref_poc_l0 = ps_col_ref_buf->ai4_col_l0_poc[au4_ref_idx_col[0]]; col_ref_poc_l0_lt = 0; /* Encoder has only short term references */ } else { col_ref_poc_l0 = ps_col_ref_buf->ai4_col_l1_poc[au4_ref_idx_col[0]]; col_ref_poc_l0_lt = 0; } /* L0 collocated mv */ cur_ref_poc = ps_mv_ctxt->ps_ref_list[0][ref_idx_l0]->i4_poc; cur_ref_poc_lt = 0; { pu4_avail_col_flag[0] = 1; /*if(cur_ref_poc_lt || ((col_poc - col_ref_poc_l0) == (cur_poc - cur_ref_poc)))*/ if((col_poc - col_ref_poc_l0) == (cur_poc - cur_ref_poc)) { ps_mv_col[0] = as_mv_col[0]; } else { ps_mv_col[0] = as_mv_col[0]; if(col_ref_poc_l0 != col_poc) { ihevce_scale_collocated_mv( (mv_t *)(&ps_mv_col[0]), cur_ref_poc, col_ref_poc_l0, col_poc, cur_poc); } } } } else { pu4_avail_col_flag[0] = 0; ps_mv_col[0].i2_mvx = 0; ps_mv_col[0].i2_mvy = 0; } if((BSLICE == ps_slice_hdr->i1_slice_type) && (-1 != ref_idx_l1)) { WORD32 col_ref_poc_l1_lt, col_ref_poc_l1; if(au4_list_col[1] == 0) { col_ref_poc_l1 = 
ps_col_ref_buf->ai4_col_l0_poc[au4_ref_idx_col[0]]; col_ref_poc_l1_lt = 0; } else { col_ref_poc_l1 = ps_col_ref_buf->ai4_col_l1_poc[au4_ref_idx_col[0]]; col_ref_poc_l1_lt = 0; } /* L1 collocated mv */ cur_ref_poc = ps_mv_ctxt->ps_ref_list[1][ref_idx_l1]->i4_poc; cur_ref_poc_lt = 0; { pu4_avail_col_flag[1] = 1; /*if(cur_ref_poc_lt || ((col_poc - col_ref_poc_l1) == (cur_poc - cur_ref_poc)))*/ if((col_poc - col_ref_poc_l1) == (cur_poc - cur_ref_poc)) { ps_mv_col[1] = as_mv_col[1]; } else { ps_mv_col[1] = as_mv_col[1]; if(col_ref_poc_l1 != col_poc) { ihevce_scale_collocated_mv( (mv_t *)&ps_mv_col[1], cur_ref_poc, col_ref_poc_l1, col_poc, cur_poc); } } } } /* End of if BSLICE */ else { pu4_avail_col_flag[1] = 0; } } } /* End of collocated MV calculation */ } /* End of ihevce_collocated_mvp */ /** ******************************************************************************* * * @brief Compare Motion vectors function * * * @par Description: * Checks if MVs and Reference idx are excatly matching. 
* * @param[inout] ps_1 * motion vector 1 to be compared * * @param[in] ps_2 * motion vector 2 to be compared * * @returns * 0 : if not matching 1 : if matching * * @remarks * ******************************************************************************* */ /** ******************************************************************************* * * @brief * This function performs Motion Vector Merge candidates derivation * * @par Description: * MV merge list is computed using neighbor mvs and colocated mv * * @param[in] ps_ctxt * pointer to mv predictor context * * @param[in] ps_top_nbr_4x4 * pointer to top 4x4 nbr structure * * @param[in] ps_left_nbr_4x4 * pointer to left 4x4 nbr structure * * @param[in] ps_top_left_nbr_4x4 * pointer to top left 4x4 nbr structure * * @param[in] left_nbr_4x4_strd * left nbr buffer stride in terms of 4x4 units * * @param[in] ps_avail_flags * Neighbor availability flags container * * @param[in] ps_col_mv * Colocated MV pointer * * @param[in] ps_pu * Current Partition PU strucrture pointer * * @param[in] part_mode * Partition mode @sa PART_SIZE_E * * @param[in] part_idx * Partition idx of current partition inside CU * * @param[in] single_mcl_flag * Single MCL flag based on 8x8 CU and Parallel merge value * * @param[out] ps_merge_cand_list * pointer to store MV merge candidates list * * @returns * Number of merge candidates * @remarks * * ******************************************************************************* */ WORD32 ihevce_mv_pred_merge( mv_pred_ctxt_t *ps_ctxt, nbr_4x4_t *ps_top_nbr_4x4, nbr_4x4_t *ps_left_nbr_4x4, nbr_4x4_t *ps_top_left_nbr_4x4, WORD32 left_nbr_4x4_strd, nbr_avail_flags_t *ps_avail_flags, pu_mv_t *ps_col_mv, pu_t *ps_pu, PART_SIZE_E part_mode, WORD32 part_idx, WORD32 single_mcl_flag, merge_cand_list_t *ps_merge_cand_list, UWORD8 *pu1_is_top_used) { /******************************************************/ /* Spatial Merge Candidates */ /******************************************************/ WORD32 part_pos_x; 
WORD32 part_pos_y; WORD32 part_wd; WORD32 part_ht; WORD32 slice_type; WORD32 num_ref_idx_l0_active; WORD32 num_ref_idx_l1_active; WORD32 num_merge_cand; WORD32 log2_parallel_merge_level_minus2; WORD32 n; WORD8 i1_spatial_avail_flag_n[MAX_NUM_MV_NBR]; /*[A0/A1/B0/B1/B2]*/ WORD32 nbr_x[MAX_NUM_MV_NBR], nbr_y[MAX_NUM_MV_NBR]; UWORD8 u1_nbr_avail[MAX_NUM_MV_NBR]; WORD32 merge_shift; nbr_4x4_t *ps_nbr_mv[MAX_NUM_MV_NBR]; /*******************************************/ /* Neighbor location: Graphical indication */ /* */ /* B2 _____________B1 B0 */ /* | | */ /* | | */ /* | | */ /* | PU ht| */ /* | | */ /* | | */ /* A1|______wd_______| */ /* A0 */ /* */ /*******************************************/ part_pos_x = ps_pu->b4_pos_x << 2; part_pos_y = ps_pu->b4_pos_y << 2; part_ht = (ps_pu->b4_ht + 1) << 2; part_wd = (ps_pu->b4_wd + 1) << 2; slice_type = ps_ctxt->ps_slice_hdr->i1_slice_type; num_ref_idx_l0_active = ps_ctxt->ps_slice_hdr->i1_num_ref_idx_l0_active; num_ref_idx_l1_active = ps_ctxt->ps_slice_hdr->i1_num_ref_idx_l1_active; log2_parallel_merge_level_minus2 = ps_ctxt->i4_log2_parallel_merge_level_minus2; /* Assigning co-ordinates to neighbors */ nbr_x[NBR_A0] = part_pos_x - 1; nbr_y[NBR_A0] = part_pos_y + part_ht; /* A0 */ nbr_x[NBR_A1] = part_pos_x - 1; nbr_y[NBR_A1] = part_pos_y + part_ht - 1; /* A1 */ nbr_x[NBR_B0] = part_pos_x + part_wd; nbr_y[NBR_B0] = part_pos_y - 1; /* B0 */ nbr_x[NBR_B1] = part_pos_x + part_wd - 1; nbr_y[NBR_B1] = part_pos_y - 1; /* B1 */ nbr_x[NBR_B2] = part_pos_x - 1; nbr_y[NBR_B2] = part_pos_y - 1; /* B2 */ /* Assigning mv's */ ps_nbr_mv[NBR_A0] = ps_left_nbr_4x4 + ((nbr_y[NBR_A0] - part_pos_y) >> 2) * left_nbr_4x4_strd; ps_nbr_mv[NBR_A1] = ps_left_nbr_4x4 + ((nbr_y[NBR_A1] - part_pos_y) >> 2) * left_nbr_4x4_strd; ps_nbr_mv[NBR_B0] = ps_top_nbr_4x4 + ((nbr_x[NBR_B0] - part_pos_x) >> 2); ps_nbr_mv[NBR_B1] = ps_top_nbr_4x4 + ((nbr_x[NBR_B1] - part_pos_x) >> 2); if(part_pos_y == 0) /* AT vertical CTB boundary */ ps_nbr_mv[NBR_B2] = ps_top_nbr_4x4 
+ ((nbr_x[NBR_B2] - part_pos_x) >> 2); else ps_nbr_mv[NBR_B2] = ps_top_left_nbr_4x4; /* Assigning nbr availability */ u1_nbr_avail[NBR_A0] = ps_avail_flags->u1_bot_lt_avail && (!ps_nbr_mv[NBR_A0]->b1_intra_flag); /* A0 */ u1_nbr_avail[NBR_A1] = ps_avail_flags->u1_left_avail && (!ps_nbr_mv[NBR_A1]->b1_intra_flag); /* A1 */ u1_nbr_avail[NBR_B0] = ps_avail_flags->u1_top_rt_avail && (!ps_nbr_mv[NBR_B0]->b1_intra_flag); /* B0 */ u1_nbr_avail[NBR_B1] = ps_avail_flags->u1_top_avail && (!ps_nbr_mv[NBR_B1]->b1_intra_flag); /* B1 */ u1_nbr_avail[NBR_B2] = ps_avail_flags->u1_top_lt_avail && (!ps_nbr_mv[NBR_B2]->b1_intra_flag); /* B2 */ merge_shift = log2_parallel_merge_level_minus2 + 2; /* Availability check */ /* A1 */ { WORD32 avail_flag; avail_flag = 1; n = NBR_A1; /* if at same merge level */ if((part_pos_x >> merge_shift) == (nbr_x[n] >> merge_shift) && ((part_pos_y >> merge_shift) == (nbr_y[n] >> merge_shift))) { u1_nbr_avail[n] = 0; } /* SPEC JCTVC-K1003_v9 version has a different way using not available */ /* candidates compared to software. for non square part and seconf part case */ /* ideally nothing from the 1st partition should be used as per spec but */ /* HM 8.2 dev verison does not adhere to this. 
currenlty code fllows HM */ /* if single MCL is 0 , second part of 2 part in CU */ if((single_mcl_flag == 0) && (part_idx == 1) && ((part_mode == PART_Nx2N) || (part_mode == PART_nLx2N) || (part_mode == PART_nRx2N))) { u1_nbr_avail[n] = 0; } if(u1_nbr_avail[n] == 0) { avail_flag = 0; } i1_spatial_avail_flag_n[n] = avail_flag; } /* B1 */ { WORD32 avail_flag; avail_flag = 1; n = NBR_B1; /* if at same merge level */ if((part_pos_x >> merge_shift) == (nbr_x[n] >> merge_shift) && ((part_pos_y >> merge_shift) == (nbr_y[n] >> merge_shift))) { u1_nbr_avail[n] = 0; } /* if single MCL is 0 , second part of 2 part in CU */ if((single_mcl_flag == 0) && (part_idx == 1) && ((part_mode == PART_2NxN) || (part_mode == PART_2NxnU) || (part_mode == PART_2NxnD))) { u1_nbr_avail[n] = 0; } if(u1_nbr_avail[n] == 0) { avail_flag = 0; } if((avail_flag == 1) && (u1_nbr_avail[NBR_A1] == 1)) { /* TODO: Assumption: mvs and ref indicies in both l0 and l1*/ /* should match for non availability */ WORD32 i4_pred_1, i4_pred_2; i4_pred_1 = (ps_nbr_mv[NBR_A1]->b1_pred_l0_flag | (ps_nbr_mv[NBR_A1]->b1_pred_l1_flag << 1)) - 1; i4_pred_2 = (ps_nbr_mv[n]->b1_pred_l0_flag | (ps_nbr_mv[n]->b1_pred_l1_flag << 1)) - 1; if(ihevce_compare_pu_mv_t( &ps_nbr_mv[NBR_A1]->mv, &ps_nbr_mv[n]->mv, i4_pred_1, i4_pred_2)) { avail_flag = 0; } } i1_spatial_avail_flag_n[n] = avail_flag; } /* B0 */ { WORD32 avail_flag; avail_flag = 1; n = NBR_B0; /* if at same merge level */ if((part_pos_x >> merge_shift) == (nbr_x[n] >> merge_shift) && ((part_pos_y >> merge_shift) == (nbr_y[n] >> merge_shift))) { u1_nbr_avail[n] = 0; } if(u1_nbr_avail[n] == 0) { avail_flag = 0; } if((avail_flag == 1) && (u1_nbr_avail[NBR_B1] == 1)) { WORD32 i4_pred_1, i4_pred_2; i4_pred_1 = (ps_nbr_mv[NBR_B1]->b1_pred_l0_flag | (ps_nbr_mv[NBR_B1]->b1_pred_l1_flag << 1)) - 1; i4_pred_2 = (ps_nbr_mv[n]->b1_pred_l0_flag | (ps_nbr_mv[n]->b1_pred_l1_flag << 1)) - 1; if(ihevce_compare_pu_mv_t( &ps_nbr_mv[NBR_B1]->mv, &ps_nbr_mv[n]->mv, i4_pred_1, i4_pred_2)) { 
avail_flag = 0; } } i1_spatial_avail_flag_n[n] = avail_flag; } /* A0 */ { WORD32 avail_flag; avail_flag = 1; n = NBR_A0; /* if at same merge level */ if((part_pos_x >> merge_shift) == (nbr_x[n] >> merge_shift) && ((part_pos_y >> merge_shift) == (nbr_y[n] >> merge_shift))) { u1_nbr_avail[n] = 0; } if(u1_nbr_avail[n] == 0) { avail_flag = 0; } if((avail_flag == 1) && (u1_nbr_avail[NBR_A1] == 1)) { WORD32 i4_pred_1, i4_pred_2; i4_pred_1 = (ps_nbr_mv[NBR_A1]->b1_pred_l0_flag | (ps_nbr_mv[NBR_A1]->b1_pred_l1_flag << 1)) - 1; i4_pred_2 = (ps_nbr_mv[n]->b1_pred_l0_flag | (ps_nbr_mv[n]->b1_pred_l1_flag << 1)) - 1; if(ihevce_compare_pu_mv_t( &ps_nbr_mv[NBR_A1]->mv, &ps_nbr_mv[n]->mv, i4_pred_1, i4_pred_2)) { avail_flag = 0; } } i1_spatial_avail_flag_n[n] = avail_flag; } /* B2 */ { WORD32 avail_flag; avail_flag = 1; n = NBR_B2; /* if at same merge level */ if((part_pos_x >> merge_shift) == (nbr_x[n] >> merge_shift) && ((part_pos_y >> merge_shift) == (nbr_y[n] >> merge_shift))) { u1_nbr_avail[n] = 0; } if(u1_nbr_avail[n] == 0) { avail_flag = 0; } if((i1_spatial_avail_flag_n[NBR_A0] + i1_spatial_avail_flag_n[NBR_A1] + i1_spatial_avail_flag_n[NBR_B0] + i1_spatial_avail_flag_n[NBR_B1]) == 4) { avail_flag = 0; } if(avail_flag == 1) { if(u1_nbr_avail[NBR_A1] == 1) { WORD32 i4_pred_1, i4_pred_2; i4_pred_1 = (ps_nbr_mv[NBR_A1]->b1_pred_l0_flag | (ps_nbr_mv[NBR_A1]->b1_pred_l1_flag << 1)) - 1; i4_pred_2 = (ps_nbr_mv[n]->b1_pred_l0_flag | (ps_nbr_mv[n]->b1_pred_l1_flag << 1)) - 1; if(ihevce_compare_pu_mv_t( &ps_nbr_mv[NBR_A1]->mv, &ps_nbr_mv[n]->mv, i4_pred_1, i4_pred_2)) { avail_flag = 0; } } if(u1_nbr_avail[NBR_B1] == 1) { WORD32 i4_pred_1, i4_pred_2; i4_pred_1 = (ps_nbr_mv[NBR_B1]->b1_pred_l0_flag | (ps_nbr_mv[NBR_B1]->b1_pred_l1_flag << 1)) - 1; i4_pred_2 = (ps_nbr_mv[n]->b1_pred_l0_flag | (ps_nbr_mv[n]->b1_pred_l1_flag << 1)) - 1; if(ihevce_compare_pu_mv_t( &ps_nbr_mv[NBR_B1]->mv, &ps_nbr_mv[n]->mv, i4_pred_1, i4_pred_2)) { avail_flag = 0; } } } i1_spatial_avail_flag_n[n] = 
avail_flag; } /******************************************************/ /* Merge Candidates List */ /******************************************************/ /* Preparing MV merge candidate list */ { WORD32 merge_list_priority[MAX_NUM_MERGE_CAND] = { NBR_A1, NBR_B1, NBR_B0, NBR_A0, NBR_B2 }; num_merge_cand = 0; for(n = 0; n < MAX_NUM_MERGE_CAND; n++) { WORD32 merge_idx; merge_idx = merge_list_priority[n]; if(i1_spatial_avail_flag_n[merge_idx] == 1) { ps_merge_cand_list[num_merge_cand].mv = ps_nbr_mv[merge_idx]->mv; ps_merge_cand_list[num_merge_cand].u1_pred_flag_l0 = (UWORD8)ps_nbr_mv[merge_idx]->b1_pred_l0_flag; ps_merge_cand_list[num_merge_cand].u1_pred_flag_l1 = (UWORD8)ps_nbr_mv[merge_idx]->b1_pred_l1_flag; switch(merge_list_priority[n]) { case NBR_A1: case NBR_A0: { pu1_is_top_used[num_merge_cand] = 0; break; } default: { pu1_is_top_used[num_merge_cand] = 1; break; } } num_merge_cand++; } } /******************************************************/ /* Temporal Merge Candidates */ /******************************************************/ if(num_merge_cand < MAX_NUM_MERGE_CAND) { mv_t as_mv_col[2]; WORD32 avail_col_flag[2] = { 0 }, x_col, y_col; WORD32 avail_col_l0, avail_col_l1; /* Checking Collocated MV availability at Bottom right of PU*/ x_col = part_pos_x + part_wd; y_col = part_pos_y + part_ht; ihevce_collocated_mvp(ps_ctxt, ps_pu, as_mv_col, avail_col_flag, 0, x_col, y_col); avail_col_l0 = avail_col_flag[0]; avail_col_l1 = avail_col_flag[1]; if(avail_col_l0 || avail_col_l1) { ps_merge_cand_list[num_merge_cand].mv.s_l0_mv = as_mv_col[0]; ps_merge_cand_list[num_merge_cand].mv.s_l1_mv = as_mv_col[1]; } if(avail_col_l0 == 0 || avail_col_l1 == 0) { /* Checking Collocated MV availability at Center of PU */ x_col = part_pos_x + (part_wd >> 1); y_col = part_pos_y + (part_ht >> 1); ihevce_collocated_mvp(ps_ctxt, ps_pu, as_mv_col, avail_col_flag, 0, x_col, y_col); if(avail_col_l0 == 0) { ps_merge_cand_list[num_merge_cand].mv.s_l0_mv = as_mv_col[0]; } if(avail_col_l1 == 
0) { ps_merge_cand_list[num_merge_cand].mv.s_l1_mv = as_mv_col[1]; } avail_col_l0 |= avail_col_flag[0]; avail_col_l1 |= avail_col_flag[1]; } ps_merge_cand_list[num_merge_cand].mv.i1_l0_ref_idx = 0; ps_merge_cand_list[num_merge_cand].mv.i1_l1_ref_idx = 0; ps_merge_cand_list[num_merge_cand].u1_pred_flag_l0 = avail_col_l0 ? 1 : 0; ps_merge_cand_list[num_merge_cand].u1_pred_flag_l1 = avail_col_l1 ? 1 : 0; if(avail_col_l0 || avail_col_l1) { pu1_is_top_used[num_merge_cand] = 0; num_merge_cand++; } } /******************************************************/ /* Bi pred merge candidates */ /******************************************************/ if(slice_type == BSLICE) { if((num_merge_cand > 1) && (num_merge_cand < MAX_NUM_MERGE_CAND)) { WORD32 priority_list0[12] = { 0, 1, 0, 2, 1, 2, 0, 3, 1, 3, 2, 3 }; WORD32 priority_list1[12] = { 1, 0, 2, 0, 2, 1, 3, 0, 3, 1, 3, 2 }; WORD32 l0_cand, l1_cand; WORD32 bi_pred_idx = 0; WORD32 total_bi_pred_cand = num_merge_cand * (num_merge_cand - 1); while(bi_pred_idx < total_bi_pred_cand) { l0_cand = priority_list0[bi_pred_idx]; l1_cand = priority_list1[bi_pred_idx]; if((ps_merge_cand_list[l0_cand].u1_pred_flag_l0 == 1) && (ps_merge_cand_list[l1_cand].u1_pred_flag_l1 == 1)) { WORD8 i1_l0_ref_idx, i1_l1_ref_idx; WORD32 l0_poc, l1_poc; mv_t s_l0_mv, s_l1_mv; i1_l0_ref_idx = ps_merge_cand_list[l0_cand].mv.i1_l0_ref_idx; i1_l1_ref_idx = ps_merge_cand_list[l1_cand].mv.i1_l1_ref_idx; l0_poc = ps_ctxt->ps_ref_list[0][i1_l0_ref_idx]->i4_poc; l1_poc = ps_ctxt->ps_ref_list[1][i1_l1_ref_idx]->i4_poc; s_l0_mv = ps_merge_cand_list[l0_cand].mv.s_l0_mv; s_l1_mv = ps_merge_cand_list[l1_cand].mv.s_l1_mv; if((l0_poc != l1_poc) || (s_l0_mv.i2_mvx != s_l1_mv.i2_mvx) || (s_l0_mv.i2_mvy != s_l1_mv.i2_mvy)) { ps_merge_cand_list[num_merge_cand].mv.s_l0_mv = s_l0_mv; ps_merge_cand_list[num_merge_cand].mv.s_l1_mv = s_l1_mv; ps_merge_cand_list[num_merge_cand].mv.i1_l0_ref_idx = i1_l0_ref_idx; ps_merge_cand_list[num_merge_cand].mv.i1_l1_ref_idx = i1_l1_ref_idx; 
ps_merge_cand_list[num_merge_cand].u1_pred_flag_l0 = 1; ps_merge_cand_list[num_merge_cand].u1_pred_flag_l1 = 1; if(pu1_is_top_used[l0_cand] || pu1_is_top_used[l1_cand]) { pu1_is_top_used[num_merge_cand] = 1; } else { pu1_is_top_used[num_merge_cand] = 0; } num_merge_cand++; } } bi_pred_idx++; if((bi_pred_idx == total_bi_pred_cand) || (num_merge_cand == MAX_NUM_MERGE_CAND)) { break; } } } } /* End of Bipred merge candidates */ /******************************************************/ /* Zero merge candidates */ /******************************************************/ if(num_merge_cand < MAX_NUM_MERGE_CAND) { WORD32 num_ref_idx; WORD32 zero_idx; zero_idx = 0; if(slice_type == PSLICE) num_ref_idx = num_ref_idx_l0_active; else /* Slice type B */ num_ref_idx = MIN(num_ref_idx_l0_active, num_ref_idx_l1_active); while(num_merge_cand < MAX_NUM_MERGE_CAND) { if(slice_type == PSLICE) { ps_merge_cand_list[num_merge_cand].mv.i1_l0_ref_idx = zero_idx; ps_merge_cand_list[num_merge_cand].mv.i1_l1_ref_idx = -1; ps_merge_cand_list[num_merge_cand].u1_pred_flag_l0 = 1; ps_merge_cand_list[num_merge_cand].u1_pred_flag_l1 = 0; } else /* Slice type B */ { ps_merge_cand_list[num_merge_cand].mv.i1_l0_ref_idx = zero_idx; ps_merge_cand_list[num_merge_cand].mv.i1_l1_ref_idx = zero_idx; ps_merge_cand_list[num_merge_cand].u1_pred_flag_l0 = 1; ps_merge_cand_list[num_merge_cand].u1_pred_flag_l1 = 1; } ps_merge_cand_list[num_merge_cand].mv.s_l0_mv.i2_mvx = 0; ps_merge_cand_list[num_merge_cand].mv.s_l0_mv.i2_mvy = 0; ps_merge_cand_list[num_merge_cand].mv.s_l1_mv.i2_mvx = 0; ps_merge_cand_list[num_merge_cand].mv.s_l1_mv.i2_mvy = 0; pu1_is_top_used[num_merge_cand] = 0; num_merge_cand++; zero_idx++; /* if all the reference pics have been added as candidates */ /* the the loop shoudl break since it would add same cand again */ if(zero_idx == num_ref_idx) { break; } } } /* End of zero merge candidates */ } /* End of merge candidate list population */ return (num_merge_cand); }