blob: 2dd0974d9feeeeb1a13e21653bc3d5fe91deb445 [file] [log] [blame]
/******************************************************************************
*
* Copyright (C) 2015 The Android Open Source Project
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at:
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*
*****************************************************************************
* Originally developed and contributed by Ittiam Systems Pvt. Ltd, Bangalore
*/
/**
*******************************************************************************
* @file
* ih264e_mc.c
*
* @brief
* Contains definition of functions for motion compensation
*
* @author
* ittiam
*
* @par List of Functions:
* - ih264e_motion_comp_luma()
* - ih264e_motion_comp_chroma()
*
* @remarks
* None
*
*******************************************************************************
*/
/*****************************************************************************/
/* File Includes */
/*****************************************************************************/
/* System include files */
#include <stdio.h>
/* User include files */
#include "ih264_typedefs.h"
#include "ih264_defs.h"
#include "iv2.h"
#include "ive2.h"
#include "ime_distortion_metrics.h"
#include "ime_structs.h"
#include "ih264_structs.h"
#include "ih264_inter_pred_filters.h"
#include "ih264_mem_fns.h"
#include "ih264_padding.h"
#include "ih264_intra_pred_filters.h"
#include "ih264_deblk_edge_filters.h"
#include "ih264_trans_quant_itrans_iquant.h"
#include "ih264_inter_pred_filters.h"
#include "ih264_mem_fns.h"
#include "ih264_padding.h"
#include "ih264_intra_pred_filters.h"
#include "ih264_deblk_edge_filters.h"
#include "ih264e_defs.h"
#include "ih264e_error.h"
#include "ih264e_bitstream.h"
#include "irc_cntrl_param.h"
#include "irc_frame_info_collector.h"
#include "ih264e_rate_control.h"
#include "ih264e_structs.h"
#include "ih264e_mc.h"
#include "ih264e_half_pel.h"
/*****************************************************************************/
/* Function Definitions */
/*****************************************************************************/
/**
******************************************************************************
*
* @brief
* performs motion compensation for a luma mb for the given mv.
*
* @par Description
* This routine performs motion compensation of an inter mb. When the inter
* mb mode is P16x16, there is no need to copy 16x16 unit from reference buffer
* to pred buffer. In this case the function returns pointer and stride of the
* ref. buffer and this info is used in place of pred buffer else where.
* In other cases, the pred buffer is populated via copy / filtering + copy
* (q pel cases) and returned.
*
* @param[in] ps_proc
* pointer to current proc ctxt
*
* @param[out] pu1_pseudo_pred
* pseudo prediction buffer
*
* @param[out] u4_pseudo_pred_strd
* pseudo pred buffer stride
*
* @return none
*
* @remarks Assumes half pel buffers for the entire frame are populated.
*
******************************************************************************
*/
void ih264e_motion_comp_luma(process_ctxt_t *ps_proc,
UWORD8 **pu1_pseudo_pred,
WORD32 *pi4_pseudo_pred_strd)
{
/* codec context */
codec_t *ps_codec = ps_proc->ps_codec;
/* me ctxt */
me_ctxt_t *ps_me_ctxt = &ps_proc->s_me_ctxt;
/* Pointer to the structure having motion vectors, size and position of curr partitions */
enc_pu_t *ps_curr_pu;
/* pointers to full pel, half pel x, half pel y, half pel xy reference buffer */
UWORD8 *pu1_ref[4];
/* pred buffer ptr */
UWORD8 *pu1_pred;
/* strides of full pel, half pel x, half pel y, half pel xy reference buffer */
WORD32 i4_ref_strd[4];
/* pred buffer stride */
WORD32 i4_pred_strd = ps_proc->i4_pred_strd;
/* full pel motion vectors */
WORD32 u4_mv_x_full, u4_mv_y_full;
/* half pel motion vectors */
WORD32 u4_mv_x_hpel, u4_mv_y_hpel;
/* quarter pel motion vectors */
WORD32 u4_mv_x_qpel, u4_mv_y_qpel;
/* width & height of the partition */
UWORD32 wd, ht;
/* partition idx */
UWORD32 u4_num_prtn;
/* half / qpel coefficient */
UWORD32 u4_subpel_factor;
/* temp var */
UWORD32 u4_lkup_idx1;
/* Init */
i4_ref_strd[0] = ps_proc->i4_rec_strd;
i4_ref_strd[1] = i4_ref_strd[2] = i4_ref_strd[3] = ps_me_ctxt->u4_hp_buf_strd;
for (u4_num_prtn = 0; u4_num_prtn < ps_proc->u4_num_sub_partitions; u4_num_prtn++)
{
/* update ptr to curr partition */
ps_curr_pu = ps_proc->ps_pu + u4_num_prtn;
/* get full pel mv's (full pel units) */
u4_mv_x_full = ps_curr_pu->s_l0_mv.i2_mvx >> 2;
u4_mv_y_full = ps_curr_pu->s_l0_mv.i2_mvy >> 2;
/* get half pel mv's */
u4_mv_x_hpel = (ps_curr_pu->s_l0_mv.i2_mvx & 0x2) >> 1;
u4_mv_y_hpel = (ps_curr_pu->s_l0_mv.i2_mvy & 0x2) >> 1;
/* get quarter pel mv's */
u4_mv_x_qpel = (ps_curr_pu->s_l0_mv.i2_mvx & 0x1);
u4_mv_y_qpel = (ps_curr_pu->s_l0_mv.i2_mvy & 0x1);
/* width and height of partition */
wd = (ps_curr_pu->b4_wd + 1) << 2;
ht = (ps_curr_pu->b4_ht + 1) << 2;
/* decision ? qpel/hpel, fpel */
u4_subpel_factor = (u4_mv_y_hpel << 3) + (u4_mv_x_hpel << 2) + (u4_mv_y_qpel << 1) + (u4_mv_x_qpel);
/* update ref buffer ptrs */
pu1_ref[0] = ps_proc->pu1_ref_buf_luma + (u4_mv_y_full * i4_ref_strd[0]) + u4_mv_x_full;
pu1_ref[1] = ps_proc->pu1_best_subpel_buf;
i4_ref_strd[1] = ps_proc->u4_bst_spel_buf_strd;
/* update pred buff ptr */
pu1_pred = ps_proc->pu1_pred_mb + 4 * ps_curr_pu->b4_pos_y * i4_pred_strd + 4 * ps_curr_pu->b4_pos_x;
/*u4_lkup_idx1 will be non zero for half pel*/
u4_lkup_idx1 = (u4_subpel_factor >> 2 ) != 0 ;
{
/********************************************************************/
/* if the block is P16x16 MB and mv are not quarter pel motion */
/* vectors, there is no need to copy 16x16 unit from reference frame*/
/* to pred buffer. We might as well send the reference frame buffer */
/* pointer as pred buffer (ofc with updated stride) to fwd transform*/
/* and inverse transform unit. */
/********************************************************************/
if (ps_proc->u4_num_sub_partitions == 1)
{
*pu1_pseudo_pred = pu1_ref[u4_lkup_idx1];
*pi4_pseudo_pred_strd = i4_ref_strd[u4_lkup_idx1];
}
/*
* Copying half pel or full pel to prediction buffer
* Currently ps_proc->u4_num_sub_partitions will always be 1 as we only support 16x16 in P mbs
*/
else
{
ps_codec->pf_inter_pred_luma_copy(pu1_ref[u4_lkup_idx1], pu1_pred, i4_ref_strd[u4_lkup_idx1], i4_pred_strd, ht, wd, NULL, 0);
}
}
}
}
/**
******************************************************************************
*
* @brief
* performs motion compensation for chroma mb
*
* @par Description
* Copies a MB of data from the reference buffer (Full pel, half pel or q pel)
* according to the motion vectors given
*
* @param[in] ps_proc
* pointer to current proc ctxt
*
* @return none
*
* @remarks Assumes half pel and quarter pel buffers for the entire frame are
* populated.
******************************************************************************
*/
void ih264e_motion_comp_chroma(process_ctxt_t *ps_proc)
{
/* codec context */
codec_t *ps_codec = ps_proc->ps_codec;
/* Pointer to the structure having motion vectors, size and position of curr partitions */
enc_pu_t *ps_curr_pu;
/* pointers to full pel, half pel x, half pel y, half pel xy reference buffer */
UWORD8 *pu1_ref;
/* pred buffer ptr */
UWORD8 *pu1_pred;
/* strides of full pel reference buffer */
WORD32 i4_ref_strd = ps_proc->i4_rec_strd;
/* pred buffer stride */
WORD32 i4_pred_strd = ps_proc->i4_pred_strd;
/* full pel motion vectors */
WORD32 u4_mv_x_full, u4_mv_y_full;
/* half pel motion vectors */
WORD32 u4_mv_x_hpel, u4_mv_y_hpel;
/* quarter pel motion vectors */
WORD32 u4_mv_x_qpel, u4_mv_y_qpel;
/* width & height of the partition */
UWORD32 wd, ht;
/* partition idx */
UWORD32 u4_num_prtn;
WORD32 u4_mv_x;
WORD32 u4_mv_y;
UWORD8 u1_dx, u1_dy;
for (u4_num_prtn = 0; u4_num_prtn < ps_proc->u4_num_sub_partitions; u4_num_prtn++)
{
ps_curr_pu =ps_proc->ps_pu + u4_num_prtn;
u4_mv_x = ps_curr_pu->s_l0_mv.i2_mvx >> 3;
u4_mv_y = ps_curr_pu->s_l0_mv.i2_mvy >> 3;
/* corresponds to full pel motion vector in luma, but in chroma corresponds to pel formed with dx, dy =4*/
u4_mv_x_full = (ps_curr_pu->s_l0_mv.i2_mvx & 0x4) >> 2;
u4_mv_y_full = (ps_curr_pu->s_l0_mv.i2_mvy & 0x4) >> 2;
/* get half pel mv's */
u4_mv_x_hpel = (ps_curr_pu->s_l0_mv.i2_mvx & 0x2) >> 1;
u4_mv_y_hpel = (ps_curr_pu->s_l0_mv.i2_mvy & 0x2) >> 1;
/* get quarter pel mv's */
u4_mv_x_qpel = (ps_curr_pu->s_l0_mv.i2_mvx & 0x1);
u4_mv_y_qpel = (ps_curr_pu->s_l0_mv.i2_mvy & 0x1);
/* width and height of sub macro block */
wd = (ps_curr_pu->b4_wd + 1) << 1;
ht = (ps_curr_pu->b4_ht + 1) << 1;
/* move the pointers so that they point to the motion compensated locations */
pu1_ref = ps_proc->pu1_ref_buf_chroma + (u4_mv_y * i4_ref_strd) + (u4_mv_x << 1);
pu1_pred = ps_proc->pu1_pred_mb + 4 * ps_curr_pu->b4_pos_y * i4_pred_strd + 2 * ps_curr_pu->b4_pos_x;
u1_dx = (u4_mv_x_full << 2) + (u4_mv_x_hpel << 1) + (u4_mv_x_qpel);
u1_dy = (u4_mv_y_full << 2) + (u4_mv_y_hpel << 1) + (u4_mv_y_qpel);
ps_codec->pf_inter_pred_chroma(pu1_ref, pu1_pred, i4_ref_strd, i4_pred_strd,
u1_dx, u1_dy, ht, wd);
}
}