diff options
Diffstat (limited to 'encoder/ih264e_mc.c')
-rwxr-xr-x | encoder/ih264e_mc.c | 320 |
1 files changed, 320 insertions, 0 deletions
diff --git a/encoder/ih264e_mc.c b/encoder/ih264e_mc.c new file mode 100755 index 0000000..2dd0974 --- /dev/null +++ b/encoder/ih264e_mc.c @@ -0,0 +1,320 @@ +/****************************************************************************** + * + * Copyright (C) 2015 The Android Open Source Project + * + * Licensed under the Apache License, Version 2.0 (the "License"); + * you may not use this file except in compliance with the License. + * You may obtain a copy of the License at: + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + * + ***************************************************************************** + * Originally developed and contributed by Ittiam Systems Pvt. Ltd, Bangalore +*/ + +/** +******************************************************************************* +* @file +* ih264e_mc.c +* +* @brief +* Contains definition of functions for motion compensation +* +* @author +* ittiam +* +* @par List of Functions: +* - ih264e_motion_comp_luma() +* - ih264e_motion_comp_chroma() +* +* @remarks +* None +* +******************************************************************************* +*/ + +/*****************************************************************************/ +/* File Includes */ +/*****************************************************************************/ + +/* System include files */ +#include <stdio.h> + +/* User include files */ +#include "ih264_typedefs.h" +#include "ih264_defs.h" +#include "iv2.h" +#include "ive2.h" +#include "ime_distortion_metrics.h" +#include "ime_structs.h" +#include "ih264_structs.h" +#include "ih264_inter_pred_filters.h" +#include "ih264_mem_fns.h" +#include "ih264_padding.h" +#include "ih264_intra_pred_filters.h" +#include "ih264_deblk_edge_filters.h" +#include "ih264_trans_quant_itrans_iquant.h" +#include "ih264_inter_pred_filters.h" +#include "ih264_mem_fns.h" +#include "ih264_padding.h" +#include "ih264_intra_pred_filters.h" +#include "ih264_deblk_edge_filters.h" +#include "ih264e_defs.h" +#include "ih264e_error.h" +#include "ih264e_bitstream.h" +#include "irc_cntrl_param.h" +#include "irc_frame_info_collector.h" +#include "ih264e_rate_control.h" +#include "ih264e_structs.h" +#include "ih264e_mc.h" +#include "ih264e_half_pel.h" + + +/*****************************************************************************/ +/* Function Definitions */ +/*****************************************************************************/ + +/** +****************************************************************************** +* +* @brief +* performs motion compensation for a luma mb for the given mv. +* +* @par Description +* This routine performs motion compensation of an inter mb. When the inter +* mb mode is P16x16, there is no need to copy 16x16 unit from reference buffer +* to pred buffer. In this case the function returns pointer and stride of the +* ref. buffer and this info is used in place of pred buffer else where. +* In other cases, the pred buffer is populated via copy / filtering + copy +* (q pel cases) and returned. +* +* @param[in] ps_proc +* pointer to current proc ctxt +* +* @param[out] pu1_pseudo_pred +* pseudo prediction buffer +* +* @param[out] u4_pseudo_pred_strd +* pseudo pred buffer stride +* +* @return none +* +* @remarks Assumes half pel buffers for the entire frame are populated. +* +****************************************************************************** +*/ +void ih264e_motion_comp_luma(process_ctxt_t *ps_proc, + UWORD8 **pu1_pseudo_pred, + WORD32 *pi4_pseudo_pred_strd) +{ + /* codec context */ + codec_t *ps_codec = ps_proc->ps_codec; + + /* me ctxt */ + me_ctxt_t *ps_me_ctxt = &ps_proc->s_me_ctxt; + + /* Pointer to the structure having motion vectors, size and position of curr partitions */ + enc_pu_t *ps_curr_pu; + + /* pointers to full pel, half pel x, half pel y, half pel xy reference buffer */ + UWORD8 *pu1_ref[4]; + + /* pred buffer ptr */ + UWORD8 *pu1_pred; + + /* strides of full pel, half pel x, half pel y, half pel xy reference buffer */ + WORD32 i4_ref_strd[4]; + + /* pred buffer stride */ + WORD32 i4_pred_strd = ps_proc->i4_pred_strd; + + /* full pel motion vectors */ + WORD32 u4_mv_x_full, u4_mv_y_full; + + /* half pel motion vectors */ + WORD32 u4_mv_x_hpel, u4_mv_y_hpel; + + /* quarter pel motion vectors */ + WORD32 u4_mv_x_qpel, u4_mv_y_qpel; + + /* width & height of the partition */ + UWORD32 wd, ht; + + /* partition idx */ + UWORD32 u4_num_prtn; + + /* half / qpel coefficient */ + UWORD32 u4_subpel_factor; + + /* temp var */ + UWORD32 u4_lkup_idx1; + + /* Init */ + i4_ref_strd[0] = ps_proc->i4_rec_strd; + + i4_ref_strd[1] = i4_ref_strd[2] = i4_ref_strd[3] = ps_me_ctxt->u4_hp_buf_strd; + + for (u4_num_prtn = 0; u4_num_prtn < ps_proc->u4_num_sub_partitions; u4_num_prtn++) + { + /* update ptr to curr partition */ + ps_curr_pu = ps_proc->ps_pu + u4_num_prtn; + + + /* get full pel mv's (full pel units) */ + u4_mv_x_full = ps_curr_pu->s_l0_mv.i2_mvx >> 2; + u4_mv_y_full = ps_curr_pu->s_l0_mv.i2_mvy >> 2; + + /* get half pel mv's */ + u4_mv_x_hpel = (ps_curr_pu->s_l0_mv.i2_mvx & 0x2) >> 1; + u4_mv_y_hpel = (ps_curr_pu->s_l0_mv.i2_mvy & 0x2) >> 1; + + /* get quarter pel mv's */ + u4_mv_x_qpel = (ps_curr_pu->s_l0_mv.i2_mvx & 0x1); + u4_mv_y_qpel = (ps_curr_pu->s_l0_mv.i2_mvy & 0x1); + + /* width and height of partition */ + wd = (ps_curr_pu->b4_wd + 1) << 2; + ht = (ps_curr_pu->b4_ht + 1) << 2; + + /* decision ? qpel/hpel, fpel */ + u4_subpel_factor = (u4_mv_y_hpel << 3) + (u4_mv_x_hpel << 2) + (u4_mv_y_qpel << 1) + (u4_mv_x_qpel); + + /* update ref buffer ptrs */ + pu1_ref[0] = ps_proc->pu1_ref_buf_luma + (u4_mv_y_full * i4_ref_strd[0]) + u4_mv_x_full; + + pu1_ref[1] = ps_proc->pu1_best_subpel_buf; + i4_ref_strd[1] = ps_proc->u4_bst_spel_buf_strd; + + + /* update pred buff ptr */ + pu1_pred = ps_proc->pu1_pred_mb + 4 * ps_curr_pu->b4_pos_y * i4_pred_strd + 4 * ps_curr_pu->b4_pos_x; + + /*u4_lkup_idx1 will be non zero for half pel*/ + u4_lkup_idx1 = (u4_subpel_factor >> 2 ) != 0 ; + + { + /********************************************************************/ + /* if the block is P16x16 MB and mv are not quarter pel motion */ + /* vectors, there is no need to copy 16x16 unit from reference frame*/ + /* to pred buffer. We might as well send the reference frame buffer */ + /* pointer as pred buffer (ofc with updated stride) to fwd transform*/ + /* and inverse transform unit. */ + /********************************************************************/ + if (ps_proc->u4_num_sub_partitions == 1) + { + *pu1_pseudo_pred = pu1_ref[u4_lkup_idx1]; + *pi4_pseudo_pred_strd = i4_ref_strd[u4_lkup_idx1]; + + } + /* + * Copying half pel or full pel to prediction buffer + * Currently ps_proc->u4_num_sub_partitions will always be 1 as we only support 16x16 in P mbs + */ + else + { + ps_codec->pf_inter_pred_luma_copy(pu1_ref[u4_lkup_idx1], pu1_pred, i4_ref_strd[u4_lkup_idx1], i4_pred_strd, ht, wd, NULL, 0); + } + + } + } +} + +/** +****************************************************************************** +* +* @brief +* performs motion compensation for chroma mb +* +* @par Description +* Copies a MB of data from the reference buffer (Full pel, half pel or q pel) +* according to the motion vectors given +* +* @param[in] ps_proc +* pointer to current proc ctxt +* +* @return none +* +* @remarks Assumes half pel and quarter pel buffers for the entire frame are +* populated. +****************************************************************************** +*/ +void ih264e_motion_comp_chroma(process_ctxt_t *ps_proc) +{ + /* codec context */ + codec_t *ps_codec = ps_proc->ps_codec; + + /* Pointer to the structure having motion vectors, size and position of curr partitions */ + enc_pu_t *ps_curr_pu; + + /* pointers to full pel, half pel x, half pel y, half pel xy reference buffer */ + UWORD8 *pu1_ref; + + /* pred buffer ptr */ + UWORD8 *pu1_pred; + + /* strides of full pel reference buffer */ + WORD32 i4_ref_strd = ps_proc->i4_rec_strd; + + /* pred buffer stride */ + WORD32 i4_pred_strd = ps_proc->i4_pred_strd; + + /* full pel motion vectors */ + WORD32 u4_mv_x_full, u4_mv_y_full; + + /* half pel motion vectors */ + WORD32 u4_mv_x_hpel, u4_mv_y_hpel; + + /* quarter pel motion vectors */ + WORD32 u4_mv_x_qpel, u4_mv_y_qpel; + + /* width & height of the partition */ + UWORD32 wd, ht; + + /* partition idx */ + UWORD32 u4_num_prtn; + + WORD32 u4_mv_x; + WORD32 u4_mv_y; + UWORD8 u1_dx, u1_dy; + + for (u4_num_prtn = 0; u4_num_prtn < ps_proc->u4_num_sub_partitions; u4_num_prtn++) + { + ps_curr_pu =ps_proc->ps_pu + u4_num_prtn; + + u4_mv_x = ps_curr_pu->s_l0_mv.i2_mvx >> 3; + u4_mv_y = ps_curr_pu->s_l0_mv.i2_mvy >> 3; + + /* corresponds to full pel motion vector in luma, but in chroma corresponds to pel formed with dx, dy =4*/ + u4_mv_x_full = (ps_curr_pu->s_l0_mv.i2_mvx & 0x4) >> 2; + u4_mv_y_full = (ps_curr_pu->s_l0_mv.i2_mvy & 0x4) >> 2; + + /* get half pel mv's */ + u4_mv_x_hpel = (ps_curr_pu->s_l0_mv.i2_mvx & 0x2) >> 1; + u4_mv_y_hpel = (ps_curr_pu->s_l0_mv.i2_mvy & 0x2) >> 1; + + /* get quarter pel mv's */ + u4_mv_x_qpel = (ps_curr_pu->s_l0_mv.i2_mvx & 0x1); + u4_mv_y_qpel = (ps_curr_pu->s_l0_mv.i2_mvy & 0x1); + + /* width and height of sub macro block */ + wd = (ps_curr_pu->b4_wd + 1) << 1; + ht = (ps_curr_pu->b4_ht + 1) << 1; + + /* move the pointers so that they point to the motion compensated locations */ + pu1_ref = ps_proc->pu1_ref_buf_chroma + (u4_mv_y * i4_ref_strd) + (u4_mv_x << 1); + + pu1_pred = ps_proc->pu1_pred_mb + 4 * ps_curr_pu->b4_pos_y * i4_pred_strd + 2 * ps_curr_pu->b4_pos_x; + + u1_dx = (u4_mv_x_full << 2) + (u4_mv_x_hpel << 1) + (u4_mv_x_qpel); + u1_dy = (u4_mv_y_full << 2) + (u4_mv_y_hpel << 1) + (u4_mv_y_qpel); + + ps_codec->pf_inter_pred_chroma(pu1_ref, pu1_pred, i4_ref_strd, i4_pred_strd, + u1_dx, u1_dy, ht, wd); + } +} |