blob: 211d796e075d88ccd48f5b578629342ce073c86a [file] [log] [blame]
/******************************************************************************
*
* Copyright (C) 2015 The Android Open Source Project
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at:
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*
*****************************************************************************
* Originally developed and contributed by Ittiam Systems Pvt. Ltd, Bangalore
*/
/*!
**************************************************************************
* \file ih264d_process_intra_mb.c
*
* \brief
* Contains routines that decode a I slice type
*
* Detailed_description
*
* \date
* 07/07/2003
*
* \author NS
**************************************************************************
*/
#include <string.h>
#include "ih264d_bitstrm.h"
#include "ih264d_defs.h"
#include "ih264d_debug.h"
#include "ih264d_tables.h"
#include "ih264d_structs.h"
#include "ih264d_defs.h"
#include "ih264d_parse_cavlc.h"
#include "ih264d_mb_utils.h"
#include "ih264d_parse_slice.h"
#include "ih264d_process_intra_mb.h"
#include "ih264d_error_handler.h"
#include "ih264d_quant_scaling.h"
#include "ih264d_tables.h"
/*!
**************************************************************************
* \if Function name : ih264d_itrans_recon_luma_dc \endif
*
* \brief
* This function does InvTransform, scaling and reconstruction of Luma DC.
*
* \return
* 0 on Success and Error code otherwise
**************************************************************************
*/
void ih264d_itrans_recon_luma_dc(dec_struct_t *ps_dec,
WORD16* pi2_src,
WORD16* pi2_coeff_block,
const UWORD16 *pu2_weigh_mat)
{
WORD32 i;
WORD16 pi2_out[16];
WORD32 pi4_tmp[16];
WORD16 *pi2_out_ptr = &pi2_out[0];
PROFILE_DISABLE_IQ_IT_RECON_RETURN()
ps_dec->pf_ihadamard_scaling_4x4(pi2_src, pi2_out,
ps_dec->pu2_quant_scale_y, pu2_weigh_mat,
ps_dec->u1_qp_y_div6, pi4_tmp);
for(i = 0; i < 4; i++)
{
pi2_coeff_block[0] = pi2_out_ptr[0];
pi2_coeff_block[4 * 16] = pi2_out_ptr[4];
pi2_coeff_block[8 * 16] = pi2_out_ptr[8];
pi2_coeff_block[12 * 16] = pi2_out_ptr[12];
pi2_out_ptr++; /* Point to next column */
pi2_coeff_block += 16;
}
}
/*!
**************************************************************************
* \if Function name : ih264d_read_intra_pred_modes \endif
*
* \brief
* Reads the intra pred mode related values of I4x4 MB from bitstream.
*
* This function will read the prev intra pred mode flags and
* stores it in pu1_prev_intra4x4_pred_mode_flag. If the u4_flag
* indicates that most probable mode is not intra pred mode, then
* the rem_intra4x4_pred_mode is read and stored in
* pu1_rem_intra4x4_pred_mode array.
*
*
* \return
* 0 on success and Error code otherwise
*
**************************************************************************
*/
WORD32 ih264d_read_intra_pred_modes(dec_struct_t * ps_dec,
UWORD8 * pu1_prev_intra4x4_pred_mode_flag,
UWORD8 * pu1_rem_intra4x4_pred_mode,
UWORD32 u4_trans_form8x8)
{
WORD32 i4x4_luma_blk_idx = 0, i8x8_luma_blk_idx = 0;
dec_bit_stream_t * ps_bitstrm = ps_dec->ps_bitstrm;
if(!u4_trans_form8x8)
{
for(i4x4_luma_blk_idx = 0; i4x4_luma_blk_idx < 16; ++i4x4_luma_blk_idx)
{
UWORD32 u4_temp;
SWITCHOFFTRACE;
GETBIT(u4_temp, ps_bitstrm->u4_ofst, ps_bitstrm->pu4_buffer);
*pu1_prev_intra4x4_pred_mode_flag = (UWORD8)u4_temp;
if(!(*pu1_prev_intra4x4_pred_mode_flag))
{
GETBITS(u4_temp, ps_bitstrm->u4_ofst, ps_bitstrm->pu4_buffer, 3);
*(pu1_rem_intra4x4_pred_mode) = (UWORD8)u4_temp;
}
pu1_prev_intra4x4_pred_mode_flag++;
pu1_rem_intra4x4_pred_mode++;
}
}
else
{
/**********************************************************************/
/* prev_intra4x4_pred_modes to be interpreted as */
/* prev_intra8x8_pred_modes in case of transform 8x8 */
/**********************************************************************/
for(i8x8_luma_blk_idx = 0; i8x8_luma_blk_idx < 4; i8x8_luma_blk_idx++)
{
UWORD32 u4_temp;
GETBIT(u4_temp, ps_bitstrm->u4_ofst, ps_bitstrm->pu4_buffer);
*pu1_prev_intra4x4_pred_mode_flag = (UWORD8)u4_temp;
if(!(*pu1_prev_intra4x4_pred_mode_flag))
{
GETBITS(u4_temp, ps_bitstrm->u4_ofst, ps_bitstrm->pu4_buffer, 3);
(*pu1_rem_intra4x4_pred_mode) = (UWORD8)u4_temp;
}
pu1_prev_intra4x4_pred_mode_flag++;
pu1_rem_intra4x4_pred_mode++;
}
}
return (0);
}
WORD32 ih264d_unpack_coeff4x4_4x4blk(dec_struct_t * ps_dec,
WORD16 *pi2_out_coeff_data,
UWORD8 *pu1_inv_scan)
{
tu_sblk4x4_coeff_data_t *ps_tu_4x4 = (tu_sblk4x4_coeff_data_t *)ps_dec->pv_proc_tu_coeff_data;
UWORD16 u2_sig_coeff_map = ps_tu_4x4->u2_sig_coeff_map;
WORD32 idx = 0;
WORD16 *pi2_coeff_data = &ps_tu_4x4->ai2_level[0];
WORD32 dc_only_flag = 0;
WORD32 num_coeff = 0;
PROFILE_DISABLE_UNPACK_LUMA()
while(u2_sig_coeff_map)
{
idx = CLZ(u2_sig_coeff_map);
idx = 31 - idx;
RESET_BIT(u2_sig_coeff_map,idx);
idx = pu1_inv_scan[idx];
pi2_out_coeff_data[idx] = *pi2_coeff_data++;
num_coeff++;
}
if((num_coeff == 1) && (idx == 0))
{
dc_only_flag = 1;
}
{
WORD32 offset;
offset = (UWORD8 *)pi2_coeff_data - (UWORD8 *)ps_tu_4x4;
offset = ALIGN4(offset);
ps_dec->pv_proc_tu_coeff_data = (void *)((UWORD8 *)ps_dec->pv_proc_tu_coeff_data + offset);
}
return dc_only_flag;
}
UWORD32 ih264d_unpack_coeff4x4_8x8blk(dec_struct_t * ps_dec,
dec_mb_info_t * ps_cur_mb_info,
UWORD16 ui2_luma_csbp,
WORD16 *pi2_out_coeff_data)
{
UWORD8 *pu1_inv_scan;
UWORD8 u1_mb_field_decoding_flag = ps_cur_mb_info->u1_mb_field_decodingflag;
UWORD8 u1_field_coding_flag = ps_cur_mb_info->ps_curmb->u1_mb_fld;
UWORD32 u4_luma_dc_only_csbp = 0;
WORD32 dc_only_flag = 0;
PROFILE_DISABLE_UNPACK_LUMA()
if(u1_field_coding_flag || u1_mb_field_decoding_flag)
{
pu1_inv_scan = (UWORD8 *)gau1_ih264d_inv_scan_fld;
}
else
{
pu1_inv_scan = (UWORD8 *)gau1_ih264d_inv_scan;
}
// sub 0
if(ui2_luma_csbp & 0x1)
{
memset(pi2_out_coeff_data,0,16*sizeof(WORD16));
dc_only_flag = ih264d_unpack_coeff4x4_4x4blk(ps_dec,
pi2_out_coeff_data,
pu1_inv_scan);
INSERT_BIT(u4_luma_dc_only_csbp, 0, dc_only_flag);
}
pi2_out_coeff_data += 16;
// sub 1
if(ui2_luma_csbp & 0x2)
{
memset(pi2_out_coeff_data,0,16*sizeof(WORD16));
dc_only_flag = ih264d_unpack_coeff4x4_4x4blk(ps_dec,
pi2_out_coeff_data,
pu1_inv_scan);
INSERT_BIT(u4_luma_dc_only_csbp, 1, dc_only_flag);
}
pi2_out_coeff_data += 16 + 32;
// sub 2
if(ui2_luma_csbp & 0x10)
{
memset(pi2_out_coeff_data,0,16*sizeof(WORD16));
dc_only_flag = ih264d_unpack_coeff4x4_4x4blk(ps_dec,
pi2_out_coeff_data,
pu1_inv_scan);
INSERT_BIT(u4_luma_dc_only_csbp, 4, dc_only_flag);
}
pi2_out_coeff_data += 16;
// sub 3
if(ui2_luma_csbp & 0x20)
{
memset(pi2_out_coeff_data,0,16*sizeof(WORD16));
dc_only_flag = ih264d_unpack_coeff4x4_4x4blk(ps_dec,
pi2_out_coeff_data,
pu1_inv_scan);
INSERT_BIT(u4_luma_dc_only_csbp, 5, dc_only_flag);
}
return u4_luma_dc_only_csbp;
}
WORD32 ih264d_unpack_coeff8x8_8x8blk_cavlc(dec_struct_t * ps_dec,
dec_mb_info_t * ps_cur_mb_info,
UWORD16 ui2_luma_csbp,
WORD16 *pi2_out_coeff_data)
{
UWORD8 *pu1_inv_scan;
UWORD8 u1_mb_field_decoding_flag = ps_cur_mb_info->u1_mb_field_decodingflag;
UWORD8 u1_field_coding_flag = ps_cur_mb_info->ps_curmb->u1_mb_fld;
WORD32 dc_only_flag = 0;
PROFILE_DISABLE_UNPACK_LUMA()
if(ui2_luma_csbp & 0x33)
{
memset(pi2_out_coeff_data,0,64*sizeof(WORD16));
}
if(!u1_mb_field_decoding_flag)
{
pu1_inv_scan =
(UWORD8*)gau1_ih264d_inv_scan_prog8x8_cavlc[0];
}
else
{
pu1_inv_scan =
(UWORD8*)gau1_ih264d_inv_scan_int8x8_cavlc[0];
}
// sub 0
if(ui2_luma_csbp & 0x1)
{
dc_only_flag = ih264d_unpack_coeff4x4_4x4blk(ps_dec,
pi2_out_coeff_data,
pu1_inv_scan);
}
if(!u1_mb_field_decoding_flag)
{
pu1_inv_scan =
(UWORD8*)gau1_ih264d_inv_scan_prog8x8_cavlc[1];
}
else
{
pu1_inv_scan =
(UWORD8*)gau1_ih264d_inv_scan_int8x8_cavlc[1];
}
// sub 1
if(ui2_luma_csbp & 0x2)
{
dc_only_flag = 0;
ih264d_unpack_coeff4x4_4x4blk(ps_dec,
pi2_out_coeff_data,
pu1_inv_scan);
}
if(!u1_mb_field_decoding_flag)
{
pu1_inv_scan =
(UWORD8*)gau1_ih264d_inv_scan_prog8x8_cavlc[2];
}
else
{
pu1_inv_scan =
(UWORD8*)gau1_ih264d_inv_scan_int8x8_cavlc[2];
}
// sub 2
if(ui2_luma_csbp & 0x10)
{
dc_only_flag = 0;
ih264d_unpack_coeff4x4_4x4blk(ps_dec,
pi2_out_coeff_data,
pu1_inv_scan);
}
if(!u1_mb_field_decoding_flag)
{
pu1_inv_scan =
(UWORD8*)gau1_ih264d_inv_scan_prog8x8_cavlc[3];
}
else
{
pu1_inv_scan =
(UWORD8*)gau1_ih264d_inv_scan_int8x8_cavlc[3];
}
// sub 3
if(ui2_luma_csbp & 0x20)
{
dc_only_flag = 0;
ih264d_unpack_coeff4x4_4x4blk(ps_dec,
pi2_out_coeff_data,
pu1_inv_scan);
}
return dc_only_flag;
}
void ih264d_unpack_coeff4x4_8x8blk_chroma(dec_struct_t * ps_dec,
dec_mb_info_t * ps_cur_mb_info,
UWORD16 ui2_chroma_csbp,
WORD16 *pi2_out_coeff_data)
{
UWORD8 *pu1_inv_scan;
UWORD8 u1_mb_field_decoding_flag = ps_cur_mb_info->u1_mb_field_decodingflag;
UWORD8 u1_field_coding_flag = ps_cur_mb_info->ps_curmb->u1_mb_fld;
PROFILE_DISABLE_UNPACK_CHROMA()
if(u1_field_coding_flag || u1_mb_field_decoding_flag)
{
pu1_inv_scan = (UWORD8 *)gau1_ih264d_inv_scan_fld;
}
else
{
pu1_inv_scan = (UWORD8 *)gau1_ih264d_inv_scan;
}
if(ui2_chroma_csbp & 0x1)
{
memset(pi2_out_coeff_data,0,16*sizeof(WORD16));
ih264d_unpack_coeff4x4_4x4blk(ps_dec,
pi2_out_coeff_data,
pu1_inv_scan);
}
pi2_out_coeff_data += 16;
if(ui2_chroma_csbp & 0x2)
{
memset(pi2_out_coeff_data,0,16*sizeof(WORD16));
ih264d_unpack_coeff4x4_4x4blk(ps_dec,
pi2_out_coeff_data,
pu1_inv_scan);
}
pi2_out_coeff_data += 16;
if(ui2_chroma_csbp & 0x4)
{
memset(pi2_out_coeff_data,0,16*sizeof(WORD16));
ih264d_unpack_coeff4x4_4x4blk(ps_dec,
pi2_out_coeff_data,
pu1_inv_scan);
}
pi2_out_coeff_data += 16;
if(ui2_chroma_csbp & 0x8)
{
memset(pi2_out_coeff_data,0,16*sizeof(WORD16));
ih264d_unpack_coeff4x4_4x4blk(ps_dec,
pi2_out_coeff_data,
pu1_inv_scan);
}
}
UWORD32 ih264d_unpack_luma_coeff4x4_mb(dec_struct_t * ps_dec,
dec_mb_info_t * ps_cur_mb_info,
UWORD8 intra_flag)
{
UWORD8 u1_mb_type = ps_cur_mb_info->u1_mb_type;
UWORD16 ui2_luma_csbp = ps_cur_mb_info->u2_luma_csbp;
UWORD8 *pu1_inv_scan = ps_dec->pu1_inv_scan;
WORD16 *pi2_coeff_data = ps_dec->pi2_coeff_data;
PROFILE_DISABLE_UNPACK_LUMA()
if(!ps_cur_mb_info->u1_tran_form8x8)
{
UWORD32 u4_luma_dc_only_csbp = 0;
UWORD32 u4_temp = 0;
WORD16* pi2_dc_val = NULL;
/*
* Reserve the pointer to dc vals. The dc vals will be copied
* after unpacking of ac vals since memset to 0 inside.
*/
if(intra_flag && (u1_mb_type != I_4x4_MB))
{
if(CHECKBIT(ps_cur_mb_info->u1_yuv_dc_block_flag,0))
{
pi2_dc_val = (WORD16 *)ps_dec->pv_proc_tu_coeff_data;
ps_dec->pv_proc_tu_coeff_data = (void *)(pi2_dc_val + 16);
}
}
if(ui2_luma_csbp)
{
pi2_coeff_data = ps_dec->pi2_coeff_data;
u4_temp = ih264d_unpack_coeff4x4_8x8blk(ps_dec,
ps_cur_mb_info,
ui2_luma_csbp,
pi2_coeff_data);
u4_luma_dc_only_csbp = u4_temp;
pi2_coeff_data += 32;
ui2_luma_csbp = ui2_luma_csbp >> 2;
u4_temp = ih264d_unpack_coeff4x4_8x8blk(ps_dec,
ps_cur_mb_info,
ui2_luma_csbp,
pi2_coeff_data);
u4_luma_dc_only_csbp |= (u4_temp << 2);
pi2_coeff_data += 32 + 64;
ui2_luma_csbp = ui2_luma_csbp >> 6;
u4_temp = ih264d_unpack_coeff4x4_8x8blk(ps_dec,
ps_cur_mb_info,
ui2_luma_csbp,
pi2_coeff_data);
u4_luma_dc_only_csbp |= (u4_temp << 8);
pi2_coeff_data += 32;
ui2_luma_csbp = ui2_luma_csbp >> 2;
u4_temp = ih264d_unpack_coeff4x4_8x8blk(ps_dec,
ps_cur_mb_info,
ui2_luma_csbp,
pi2_coeff_data);
u4_luma_dc_only_csbp |= (u4_temp << 10);
}
if(pi2_dc_val != NULL)
{
WORD32 i;
pi2_coeff_data = ps_dec->pi2_coeff_data;
for(i = 0; i < 4; i++)
{
pi2_coeff_data[0] = pi2_dc_val[0];
pi2_coeff_data[4 * 16] = pi2_dc_val[4];
pi2_coeff_data[8 * 16] = pi2_dc_val[8];
pi2_coeff_data[12 * 16] = pi2_dc_val[12];
pi2_dc_val++; /* Point to next column */
pi2_coeff_data += 16;
}
u4_luma_dc_only_csbp = ps_cur_mb_info->u2_luma_csbp ^ 0xFFFF;
}
return u4_luma_dc_only_csbp;
}
else
{
UWORD32 u4_luma_dc_only_cbp = 0;
WORD32 dc_only_flag;
if(ui2_luma_csbp)
{
pi2_coeff_data = ps_dec->pi2_coeff_data;
dc_only_flag = ih264d_unpack_coeff8x8_8x8blk_cavlc(ps_dec,
ps_cur_mb_info,
ui2_luma_csbp,
pi2_coeff_data);
INSERT_BIT(u4_luma_dc_only_cbp, 0, dc_only_flag);
pi2_coeff_data += 64;
ui2_luma_csbp = ui2_luma_csbp >> 2;
dc_only_flag = ih264d_unpack_coeff8x8_8x8blk_cavlc(ps_dec,
ps_cur_mb_info,
ui2_luma_csbp,
pi2_coeff_data);
INSERT_BIT(u4_luma_dc_only_cbp, 1, dc_only_flag);
pi2_coeff_data += 64;
ui2_luma_csbp = ui2_luma_csbp >> 6;
dc_only_flag = ih264d_unpack_coeff8x8_8x8blk_cavlc(ps_dec,
ps_cur_mb_info,
ui2_luma_csbp,
pi2_coeff_data);
INSERT_BIT(u4_luma_dc_only_cbp, 2, dc_only_flag);
pi2_coeff_data += 64;
ui2_luma_csbp = ui2_luma_csbp >> 2;
dc_only_flag = ih264d_unpack_coeff8x8_8x8blk_cavlc(ps_dec,
ps_cur_mb_info,
ui2_luma_csbp,
pi2_coeff_data);
INSERT_BIT(u4_luma_dc_only_cbp, 3, dc_only_flag);
}
return u4_luma_dc_only_cbp;
}
}
void ih264d_unpack_chroma_coeff4x4_mb(dec_struct_t * ps_dec,
dec_mb_info_t * ps_cur_mb_info)
{
UWORD8 u1_mb_type = ps_cur_mb_info->u1_mb_type;
UWORD16 ui2_chroma_csbp = ps_cur_mb_info->u2_chroma_csbp;
UWORD8 *pu1_inv_scan = ps_dec->pu1_inv_scan;
WORD16 *pi2_coeff_data = ps_dec->pi2_coeff_data;
WORD32 i;
WORD16 *pi2_dc_val_u = NULL;
WORD16 *pi2_dc_val_v = NULL;
PROFILE_DISABLE_UNPACK_CHROMA()
if((ps_cur_mb_info->u1_cbp >> 4) == CBPC_ALLZERO)
return;
/*
* Reserve the pointers to dc vals. The dc vals will be copied
* after unpacking of ac vals since memset to 0 inside.
*/
if(CHECKBIT(ps_cur_mb_info->u1_yuv_dc_block_flag,1))
{
pi2_dc_val_u = (WORD16 *)ps_dec->pv_proc_tu_coeff_data;
ps_dec->pv_proc_tu_coeff_data = (void *)(pi2_dc_val_u + 4);
}
if(CHECKBIT(ps_cur_mb_info->u1_yuv_dc_block_flag,2))
{
pi2_dc_val_v = (WORD16 *)ps_dec->pv_proc_tu_coeff_data;
ps_dec->pv_proc_tu_coeff_data = (void *)(pi2_dc_val_v + 4);
}
if((ps_cur_mb_info->u1_cbp >> 4) == CBPC_NONZERO)
{
pi2_coeff_data = ps_dec->pi2_coeff_data;
ih264d_unpack_coeff4x4_8x8blk_chroma(ps_dec,
ps_cur_mb_info,
ui2_chroma_csbp,
pi2_coeff_data);
pi2_coeff_data += 64;
ui2_chroma_csbp = ui2_chroma_csbp >> 4;
ih264d_unpack_coeff4x4_8x8blk_chroma(ps_dec,
ps_cur_mb_info,
ui2_chroma_csbp,
pi2_coeff_data);
}
pi2_coeff_data = ps_dec->pi2_coeff_data;
if(pi2_dc_val_u != NULL)
{
pi2_coeff_data[0] = *pi2_dc_val_u++;
pi2_coeff_data[1 * 16] = *pi2_dc_val_u++;
pi2_coeff_data[2 * 16] = *pi2_dc_val_u++;
pi2_coeff_data[3 * 16] = *pi2_dc_val_u++;
}
else
{
pi2_coeff_data[0] = 0;
pi2_coeff_data[1 * 16] = 0;
pi2_coeff_data[2 * 16] = 0;
pi2_coeff_data[3 * 16] = 0;
}
pi2_coeff_data += 64;
if(pi2_dc_val_v != NULL)
{
pi2_coeff_data[0] = *pi2_dc_val_v++;
pi2_coeff_data[1 * 16] = *pi2_dc_val_v++;
pi2_coeff_data[2 * 16] = *pi2_dc_val_v++;
pi2_coeff_data[3 * 16] = *pi2_dc_val_v++;
}
else
{
pi2_coeff_data[0] = 0;
pi2_coeff_data[1 * 16] = 0;
pi2_coeff_data[2 * 16] = 0;
pi2_coeff_data[3 * 16] = 0;
}
}
UWORD32 ih264d_unpack_luma_coeff8x8_mb(dec_struct_t * ps_dec,
dec_mb_info_t * ps_cur_mb_info)
{
WORD32 blk_8x8_cnt;
WORD16 *pi2_out_coeff_data = ps_dec->pi2_coeff_data;
UWORD8 u1_field_coding_flag = ps_cur_mb_info->ps_curmb->u1_mb_fld;
UWORD8 *pu1_inv_scan;
UWORD32 u4_luma_dc_only_cbp = 0;
PROFILE_DISABLE_UNPACK_LUMA()
if(!u1_field_coding_flag)
{
/*******************************************************************/
/* initializing inverse scan matrices */
/*******************************************************************/
pu1_inv_scan = (UWORD8 *)gau1_ih264d_inv_scan_prog8x8_cabac;
}
else
{
/*******************************************************************/
/* initializing inverse scan matrices */
/*******************************************************************/
pu1_inv_scan = (UWORD8 *)gau1_ih264d_inv_scan_int8x8_cabac;
}
for(blk_8x8_cnt = 0; blk_8x8_cnt < 4; blk_8x8_cnt++)
{
if(CHECKBIT(ps_cur_mb_info->u1_cbp, blk_8x8_cnt))
{
tu_blk8x8_coeff_data_t *ps_tu_8x8 = (tu_blk8x8_coeff_data_t *)ps_dec->pv_proc_tu_coeff_data;
UWORD32 u4_sig_coeff_map;
WORD32 idx = 0;
WORD16 *pi2_coeff_data = &ps_tu_8x8->ai2_level[0];
WORD32 num_coeff = 0;
/* memset 64 coefficient to zero */
memset(pi2_out_coeff_data,0,64*sizeof(WORD16));
u4_sig_coeff_map = ps_tu_8x8->au4_sig_coeff_map[1];
while(u4_sig_coeff_map)
{
idx = CLZ(u4_sig_coeff_map);
idx = 31 - idx;
RESET_BIT(u4_sig_coeff_map,idx);
idx = pu1_inv_scan[idx + 32];
pi2_out_coeff_data[idx] = *pi2_coeff_data++;
num_coeff++;
}
u4_sig_coeff_map = ps_tu_8x8->au4_sig_coeff_map[0];
while(u4_sig_coeff_map)
{
idx = CLZ(u4_sig_coeff_map);
idx = 31 - idx;
RESET_BIT(u4_sig_coeff_map,idx);
idx = pu1_inv_scan[idx];
pi2_out_coeff_data[idx] = *pi2_coeff_data++;
num_coeff++;
}
if((num_coeff == 1) && (idx == 0))
{
SET_BIT(u4_luma_dc_only_cbp,blk_8x8_cnt);
}
{
WORD32 offset;
offset = (UWORD8 *)pi2_coeff_data - (UWORD8 *)ps_tu_8x8;
offset = ALIGN4(offset);
ps_dec->pv_proc_tu_coeff_data = (void *)((UWORD8 *)ps_dec->pv_proc_tu_coeff_data + offset);
}
}
pi2_out_coeff_data += 64;
}
return u4_luma_dc_only_cbp;
}
/*!
**************************************************************************
* \if Function name : ih264d_process_intra_mb \endif
*
* \brief
* This function decodes an I MB. Intraprediction is carried out followed
* by InvTramsform. Both IntraPrediction and Reconstrucion are carried out
* row buffer itself.
*
*
* \return
* 0 on Success and Error code otherwise
**************************************************************************
*/
WORD32 ih264d_process_intra_mb(dec_struct_t * ps_dec,
dec_mb_info_t * ps_cur_mb_info,
UWORD8 u1_mb_num)
{
UWORD8 u1_mb_type = ps_cur_mb_info->u1_mb_type;
UWORD8 uc_temp = ps_cur_mb_info->u1_mb_ngbr_availablity;
UWORD8 u1_top_available = BOOLEAN(uc_temp & TOP_MB_AVAILABLE_MASK);
UWORD8 u1_left_available = BOOLEAN(uc_temp & LEFT_MB_AVAILABLE_MASK);
UWORD8 u1_use_top_right_mb = BOOLEAN(uc_temp & TOP_RIGHT_MB_AVAILABLE_MASK);
UWORD8 u1_use_top_left_mb = BOOLEAN(uc_temp & TOP_LEFT_MB_AVAILABLE_MASK);
UWORD8 uc_useTopMB = u1_top_available;
UWORD16 u2_use_left_mb = u1_left_available;
UWORD16 u2_use_left_mb_pack;
UWORD8 *pu1_luma_pred_buffer;
/* CHANGED CODE */
UWORD8 *pu1_luma_rec_buffer;
UWORD8 *puc_top;
mb_neigbour_params_t *ps_left_mb;
mb_neigbour_params_t *ps_top_mb;
mb_neigbour_params_t *ps_top_right_mb;
mb_neigbour_params_t *ps_curmb;
UWORD16 u2_mbx = ps_cur_mb_info->u2_mbx;
UWORD32 ui_pred_width, ui_rec_width;
WORD16 *pi2_y_coeff;
UWORD8 u1_mbaff, u1_topmb, u1_mb_field_decoding_flag;
UWORD32 u4_num_pmbair;
UWORD16 ui2_luma_csbp = ps_cur_mb_info->u2_luma_csbp;
UWORD8 *pu1_yleft, *pu1_ytop_left;
/* Chroma variables*/
UWORD8 *pu1_top_u;
UWORD8 *pu1_uleft;
UWORD8 *pu1_u_top_left;
/* CHANGED CODE */
UWORD8 *pu1_mb_cb_rei1_buffer, *pu1_mb_cr_rei1_buffer;
UWORD32 u4_recwidth_cr;
/* CHANGED CODE */
tfr_ctxt_t *ps_frame_buf = ps_dec->ps_frame_buf_ip_recon;
UWORD32 u4_luma_dc_only_csbp = 0;
UWORD32 u4_luma_dc_only_cbp = 0;
UWORD8 *pu1_prev_intra4x4_pred_mode_data = (UWORD8 *)ps_dec->pv_proc_tu_coeff_data; //Pointer to keep track of intra4x4_pred_mode data in pv_proc_tu_coeff_data buffer
u1_mbaff = ps_dec->ps_cur_slice->u1_mbaff_frame_flag;
u1_topmb = ps_cur_mb_info->u1_topmb;
u4_num_pmbair = (u1_mb_num >> u1_mbaff);
/*--------------------------------------------------------------------*/
/* Find the current MB's mb params */
/*--------------------------------------------------------------------*/
u1_mb_field_decoding_flag = ps_cur_mb_info->u1_mb_field_decodingflag;
ps_curmb = ps_cur_mb_info->ps_curmb;
ps_top_mb = ps_cur_mb_info->ps_top_mb;
ps_left_mb = ps_cur_mb_info->ps_left_mb;
ps_top_right_mb = ps_cur_mb_info->ps_top_right_mb;
/*--------------------------------------------------------------------*/
/* Check whether neighbouring MB is Inter MB and */
/* constrained intra pred is 1. */
/*--------------------------------------------------------------------*/
u2_use_left_mb_pack = (u2_use_left_mb << 8) + u2_use_left_mb;
if(ps_dec->ps_cur_pps->u1_constrained_intra_pred_flag)
{
UWORD8 u1_left = (UWORD8)u2_use_left_mb;
uc_useTopMB = uc_useTopMB
&& ((ps_top_mb->u1_mb_type != P_MB)
&& (ps_top_mb->u1_mb_type != B_MB));
u2_use_left_mb = u2_use_left_mb
&& ((ps_left_mb->u1_mb_type != P_MB)
&& (ps_left_mb->u1_mb_type != B_MB));
u2_use_left_mb_pack = (u2_use_left_mb << 8) + u2_use_left_mb;
if(u1_mbaff)
{
if(u1_mb_field_decoding_flag ^ ps_left_mb->u1_mb_fld)
{
u1_left = u1_left
&& (((ps_left_mb + 1)->u1_mb_type != P_MB)
&& ((ps_left_mb + 1)->u1_mb_type
!= B_MB));
u2_use_left_mb = u2_use_left_mb && u1_left;
if(u1_mb_field_decoding_flag)
u2_use_left_mb_pack = (u1_left << 8)
+ (u2_use_left_mb_pack & 0xff);
else
u2_use_left_mb_pack = (u2_use_left_mb << 8)
+ (u2_use_left_mb);
}
}
u1_use_top_right_mb =
u1_use_top_right_mb
&& ((ps_top_right_mb->u1_mb_type != P_MB)
&& (ps_top_right_mb->u1_mb_type
!= B_MB));
u1_use_top_left_mb =
u1_use_top_left_mb
&& ((ps_cur_mb_info->u1_topleft_mbtype != P_MB)
&& (ps_cur_mb_info->u1_topleft_mbtype
!= B_MB));
}
/*********************Common pointer calculations *************************/
/* CHANGED CODE */
pu1_luma_pred_buffer = ps_dec->pu1_y;
pu1_luma_rec_buffer = ps_frame_buf->pu1_dest_y + (u4_num_pmbair << 4);
pu1_mb_cb_rei1_buffer = ps_frame_buf->pu1_dest_u
+ (u4_num_pmbair << 3) * YUV420SP_FACTOR;
pu1_mb_cr_rei1_buffer = ps_frame_buf->pu1_dest_v + (u4_num_pmbair << 3);
ui_pred_width = MB_SIZE;
ui_rec_width = ps_dec->u2_frm_wd_y << u1_mb_field_decoding_flag;
u4_recwidth_cr = ps_dec->u2_frm_wd_uv << u1_mb_field_decoding_flag;
/************* Current and top luma pointer *****************/
if(u1_mbaff)
{
if(u1_topmb == 0)
{
pu1_luma_rec_buffer += (
u1_mb_field_decoding_flag ?
(ui_rec_width >> 1) :
(ui_rec_width << 4));
pu1_mb_cb_rei1_buffer += (
u1_mb_field_decoding_flag ?
(u4_recwidth_cr >> 1) :
(u4_recwidth_cr << 3));
pu1_mb_cr_rei1_buffer += (
u1_mb_field_decoding_flag ?
(u4_recwidth_cr >> 1) :
(u4_recwidth_cr << 3));
}
}
/* CHANGED CODE */
if(ps_dec->u4_use_intrapred_line_copy == 1)
{
puc_top = ps_dec->pu1_prev_y_intra_pred_line + (ps_cur_mb_info->u2_mbx << 4);
pu1_top_u = ps_dec->pu1_prev_u_intra_pred_line
+ (ps_cur_mb_info->u2_mbx << 3) * YUV420SP_FACTOR;
}
else
{
puc_top = pu1_luma_rec_buffer - ui_rec_width;
pu1_top_u = pu1_mb_cb_rei1_buffer - u4_recwidth_cr;
}
/* CHANGED CODE */
/************* Left pointer *****************/
pu1_yleft = pu1_luma_rec_buffer - 1;
pu1_uleft = pu1_mb_cb_rei1_buffer - 1 * YUV420SP_FACTOR;
/**************Top Left pointer calculation**********/
pu1_ytop_left = puc_top - 1;
pu1_u_top_left = pu1_top_u - 1 * YUV420SP_FACTOR;
/* CHANGED CODE */
PROFILE_DISABLE_INTRA_PRED()
{
pu1_prev_intra4x4_pred_mode_data = (UWORD8 *)ps_dec->pv_proc_tu_coeff_data;
if(u1_mb_type == I_4x4_MB && ps_cur_mb_info->u1_tran_form8x8 == 0)
{
ps_dec->pv_proc_tu_coeff_data = (void *)((UWORD8 *)ps_dec->pv_proc_tu_coeff_data + 32);
}
else if (u1_mb_type == I_4x4_MB && ps_cur_mb_info->u1_tran_form8x8 == 1)
{
ps_dec->pv_proc_tu_coeff_data = (void *)((UWORD8 *)ps_dec->pv_proc_tu_coeff_data + 8);
}
}
if(!ps_cur_mb_info->u1_tran_form8x8)
{
u4_luma_dc_only_csbp = ih264d_unpack_luma_coeff4x4_mb(ps_dec,
ps_cur_mb_info,
1);
}
else
{
if(!ps_dec->ps_cur_pps->u1_entropy_coding_mode)
{
u4_luma_dc_only_cbp = ih264d_unpack_luma_coeff4x4_mb(ps_dec,
ps_cur_mb_info,
1);
}
else
{
u4_luma_dc_only_cbp = ih264d_unpack_luma_coeff8x8_mb(ps_dec,
ps_cur_mb_info);
}
}
pi2_y_coeff = ps_dec->pi2_coeff_data;
if(u1_mb_type != I_4x4_MB)
{
UWORD8 u1_intrapred_mode = MB_TYPE_TO_INTRA_16x16_MODE(u1_mb_type);
/*--------------------------------------------------------------------*/
/* 16x16 IntraPrediction */
/*--------------------------------------------------------------------*/
{
UWORD8 u1_packed_modes = (u1_top_available << 1)
+ u1_left_available;
UWORD8 u1_err_code =
(u1_intrapred_mode & 1) ?
u1_intrapred_mode :
(u1_intrapred_mode ^ 2);
if((u1_err_code & u1_packed_modes) ^ u1_err_code)
{
u1_intrapred_mode = 0;
ps_dec->i4_error_code = ERROR_INTRAPRED;
}
}
{
/* Align the size to multiple of 8, so that SIMD functions
can read 64 bits at a time. Only 33 bytes are actaully used */
UWORD8 au1_ngbr_pels[40];
/* Get neighbour pixels */
/* left pels */
if(u2_use_left_mb)
{
WORD32 i;
for(i = 0; i < 16; i++)
au1_ngbr_pels[16 - 1 - i] = pu1_yleft[i * ui_rec_width];
}
else
{
memset(au1_ngbr_pels, 0, 16);
}
/* top left pels */
au1_ngbr_pels[16] = *pu1_ytop_left;
/* top pels */
if(uc_useTopMB)
{
memcpy(au1_ngbr_pels + 16 + 1, puc_top, 16);
}
else
{
memset(au1_ngbr_pels + 16 + 1, 0, 16);
}
PROFILE_DISABLE_INTRA_PRED()
ps_dec->apf_intra_pred_luma_16x16[u1_intrapred_mode](
au1_ngbr_pels, pu1_luma_rec_buffer, 1, ui_rec_width,
((uc_useTopMB << 2) | u2_use_left_mb));
}
{
UWORD32 i;
WORD16 ai2_tmp[16];
for(i = 0; i < 16; i++)
{
WORD16 *pi2_level = pi2_y_coeff + (i << 4);
UWORD8 *pu1_pred_sblk = pu1_luma_rec_buffer
+ ((i & 0x3) * BLK_SIZE)
+ (i >> 2) * (ui_rec_width << 2);
PROFILE_DISABLE_IQ_IT_RECON()
{
if(CHECKBIT(ps_cur_mb_info->u2_luma_csbp, i))
{
ps_dec->pf_iquant_itrans_recon_luma_4x4(
pi2_level,
pu1_pred_sblk,
pu1_pred_sblk,
ui_rec_width,
ui_rec_width,
gau2_ih264_iquant_scale_4x4[ps_cur_mb_info->u1_qp_rem6],
(UWORD16 *)ps_dec->s_high_profile.i2_scalinglist4x4[0],
ps_cur_mb_info->u1_qp_div6, ai2_tmp, 1,
pi2_level);
}
else if((CHECKBIT(u4_luma_dc_only_csbp, i)) && pi2_level[0] != 0)
{
ps_dec->pf_iquant_itrans_recon_luma_4x4_dc(
pi2_level,
pu1_pred_sblk,
pu1_pred_sblk,
ui_rec_width,
ui_rec_width,
gau2_ih264_iquant_scale_4x4[ps_cur_mb_info->u1_qp_rem6],
(UWORD16 *)ps_dec->s_high_profile.i2_scalinglist4x4[0],
ps_cur_mb_info->u1_qp_div6, ai2_tmp, 1,
pi2_level);
}
}
}
}
}
else if(!ps_cur_mb_info->u1_tran_form8x8)
{
UWORD8 u1_is_left_sub_block, u1_is_top_sub_block = uc_useTopMB;
UWORD8 u1_sub_blk_x, u1_sub_blk_y, u1_sub_mb_num;
WORD8 i1_top_pred_mode;
WORD8 i1_left_pred_mode;
UWORD8 *pu1_top, *pu1_left, *pu1_top_left, *pu1_top_right;
WORD8 *pi1_cur_pred_mode, *pi1_left_pred_mode, *pc_topPredMode;
UWORD16 ui2_left_pred_buf_width = 0xffff;
WORD8 i1_intra_pred;
UWORD8 *pu1_prev_intra4x4_pred_mode_flag = pu1_prev_intra4x4_pred_mode_data;
UWORD8 *pu1_rem_intra4x4_pred_mode = pu1_prev_intra4x4_pred_mode_data + 16;
WORD16 *pi2_y_coeff1;
UWORD8 u1_cur_sub_block;
UWORD16 ui2_top_rt_mask;
/*--------------------------------------------------------------------*/
/* 4x4 IntraPrediction */
/*--------------------------------------------------------------------*/
/* Calculation of Top Right subblock mask */
/* */
/* (a) Set it to default mask */
/* [It has 0 for sublocks which will never have top-right sub block] */
/* */
/* (b) If top MB is not available */
/* Clear the bits of the first row sub blocks */
/* */
/* (c) Set/Clear bit for top-right sublock of MB */
/* [5 sub-block in decoding order] based on TOP RIGHT MB availablity */
/*--------------------------------------------------------------------*/
pu1_top = puc_top;
ui2_top_rt_mask = (u1_use_top_right_mb << 3) | (0x5750);
if(uc_useTopMB)
ui2_top_rt_mask |= 0x7;
/*Top Related initialisations*/
pi1_cur_pred_mode = ps_cur_mb_info->ps_curmb->pi1_intrapredmodes;
pc_topPredMode = ps_cur_mb_info->ps_top_mb->pi1_intrapredmodes;
/*--------------------------------------
if(u1_mbaff)
{
pi1_cur_pred_mode += (u2_mbx << 2);
pc_topPredMode = pi1_cur_pred_mode + ps_cur_mb_info->i1_offset;
pi1_cur_pred_mode += (u1_topmb) ? 0: 4;
}*/
if(u1_top_available)
{
if(ps_top_mb->u1_mb_type == I_4x4_MB)
*(WORD32*)pi1_cur_pred_mode = *(WORD32*)pc_topPredMode;
else
*(WORD32*)pi1_cur_pred_mode =
(uc_useTopMB) ? DC_DC_DC_DC : NOT_VALID;
}
else
*(WORD32*)pi1_cur_pred_mode = NOT_VALID;
/* CHANGED CODE */
/* CHANGED CODE */
/*Left Related initialisations*/
pi1_left_pred_mode = ps_dec->pi1_left_pred_mode;
if(!u1_mbaff)
{
if(u1_left_available)
{
if(ps_left_mb->u1_mb_type != I_4x4_MB)
*(WORD32*)pi1_left_pred_mode =
(u2_use_left_mb_pack) ?
DC_DC_DC_DC :
NOT_VALID;
}
else
{
*(WORD32*)pi1_left_pred_mode = NOT_VALID;
}
}
else
{
UWORD8 u1_curMbfld = ps_cur_mb_info->u1_mb_field_decodingflag;
UWORD8 u1_leftMbfld = ps_left_mb->u1_mb_fld;
if(u1_curMbfld ^ u1_leftMbfld)
{
if(u1_topmb
| ((u1_topmb == 0)
&& ((ps_curmb - 1)->u1_mb_type
!= I_4x4_MB)))
{
if(u1_left_available)
{
if(ps_left_mb->u1_mb_type != I_4x4_MB)
{
if(CHECKBIT(u2_use_left_mb_pack,0) == 0)
*(WORD32*)pi1_left_pred_mode = NOT_VALID;
else
*(WORD32*)pi1_left_pred_mode = DC_DC_DC_DC;
}
}
else
*(WORD32*)pi1_left_pred_mode = NOT_VALID;
if(u1_curMbfld)
{
if(u1_left_available)
{
if((ps_left_mb + 1)->u1_mb_type != I_4x4_MB)
{
if(u2_use_left_mb_pack >> 8)
*(WORD32*)(pi1_left_pred_mode + 4) =
DC_DC_DC_DC;
else
*(WORD32*)(pi1_left_pred_mode + 4) =
NOT_VALID;
}
}
else
*(WORD32*)(pi1_left_pred_mode + 4) = NOT_VALID;
pi1_left_pred_mode[1] = pi1_left_pred_mode[2];
pi1_left_pred_mode[2] = pi1_left_pred_mode[4];
pi1_left_pred_mode[3] = pi1_left_pred_mode[6];
*(WORD32*)(pi1_left_pred_mode + 4) =
*(WORD32*)pi1_left_pred_mode;
}
else
{
pi1_left_pred_mode[7] = pi1_left_pred_mode[3];
pi1_left_pred_mode[6] = pi1_left_pred_mode[3];
pi1_left_pred_mode[5] = pi1_left_pred_mode[2];
pi1_left_pred_mode[4] = pi1_left_pred_mode[2];
pi1_left_pred_mode[3] = pi1_left_pred_mode[1];
pi1_left_pred_mode[2] = pi1_left_pred_mode[1];
pi1_left_pred_mode[1] = pi1_left_pred_mode[0];
}
}
pi1_left_pred_mode += (u1_topmb) ? 0 : 4;
}
else
{
pi1_left_pred_mode += (u1_topmb) ? 0 : 4;
if(u1_left_available)
{
if(ps_left_mb->u1_mb_type != I_4x4_MB)
*(WORD32*)pi1_left_pred_mode =
(u2_use_left_mb_pack) ?
DC_DC_DC_DC :
NOT_VALID;
}
else
*(WORD32*)pi1_left_pred_mode = NOT_VALID;
}
}
/* One time pointer initialisations*/
pi2_y_coeff1 = pi2_y_coeff;
pu1_top_left = pu1_ytop_left;
/* Scan the sub-blocks in Raster Scan Order */
for(u1_sub_mb_num = 0; u1_sub_mb_num < 16; u1_sub_mb_num++)
{
/* Align the size to multiple of 8, so that SIMD functions
can read 64 bits at a time. Only 13 bytes are actaully used */
UWORD8 au1_ngbr_pels[16];
u1_sub_blk_x = u1_sub_mb_num & 0x3;
u1_sub_blk_y = u1_sub_mb_num >> 2;
i1_top_pred_mode = pi1_cur_pred_mode[u1_sub_blk_x];
i1_left_pred_mode = pi1_left_pred_mode[u1_sub_blk_y];
u1_use_top_right_mb = (!!CHECKBIT(ui2_top_rt_mask, u1_sub_mb_num));
/*********** left subblock availability**********/
if(u1_sub_blk_x)
u1_is_left_sub_block = 1;
else
u1_is_left_sub_block =
(u1_sub_blk_y < 2) ?
(CHECKBIT(u2_use_left_mb_pack,
0)) :
(u2_use_left_mb_pack >> 8);
/* CHANGED CODE */
if(u1_sub_blk_y)
u1_is_top_sub_block = 1;
/* CHANGED CODE */
/***************** Top *********************/
if(ps_dec->u4_use_intrapred_line_copy == 1)
{
if(u1_sub_blk_y)
pu1_top = pu1_luma_rec_buffer - ui_rec_width;
else
pu1_top = puc_top + (u1_sub_blk_x << 2);
}
else
{
pu1_top = pu1_luma_rec_buffer - ui_rec_width;
}
/***************** Top Right *********************/
pu1_top_right = pu1_top + 4;
/***************** Top Left *********************/
pu1_top_left = pu1_top - 1;
/***************** Left *********************/
pu1_left = pu1_luma_rec_buffer - 1;
/* CHANGED CODE */
/*---------------------------------------------------------------*/
/* Calculation of Intra prediction mode */
/*---------------------------------------------------------------*/
i1_intra_pred = ((i1_left_pred_mode < 0) | (i1_top_pred_mode < 0)) ?
DC : MIN(i1_left_pred_mode, i1_top_pred_mode);
{
UWORD8 u1_packed_modes = (u1_is_top_sub_block << 1)
+ u1_is_left_sub_block;
UWORD8 *pu1_intra_err_codes =
(UWORD8 *)gau1_ih264d_intra_pred_err_code;
UWORD8 uc_b2b0 = ((u1_sub_mb_num & 4) >> 1) | (u1_sub_mb_num & 1);
UWORD8 uc_b3b1 = ((u1_sub_mb_num & 8) >> 2)
| ((u1_sub_mb_num & 2) >> 1);
u1_cur_sub_block = (uc_b3b1 << 2) + uc_b2b0;
PROFILE_DISABLE_INTRA_PRED()
if(!pu1_prev_intra4x4_pred_mode_flag[u1_cur_sub_block])
{
i1_intra_pred =
pu1_rem_intra4x4_pred_mode[u1_cur_sub_block]
+ (pu1_rem_intra4x4_pred_mode[u1_cur_sub_block]
>= i1_intra_pred);
}
i1_intra_pred = CLIP3(0, 8, i1_intra_pred);
{
UWORD8 u1_err_code = pu1_intra_err_codes[i1_intra_pred];
if((u1_err_code & u1_packed_modes) ^ u1_err_code)
{
i1_intra_pred = 0;
ps_dec->i4_error_code = ERROR_INTRAPRED;
}
}
}
{
/* Get neighbour pixels */
/* left pels */
if(u1_is_left_sub_block)
{
WORD32 i;
for(i = 0; i < 4; i++)
au1_ngbr_pels[4 - 1 - i] = pu1_left[i * ui_rec_width];
}
else
{
memset(au1_ngbr_pels, 0, 4);
}
/* top left pels */
au1_ngbr_pels[4] = *pu1_top_left;
/* top pels */
if(u1_is_top_sub_block)
{
memcpy(au1_ngbr_pels + 4 + 1, pu1_top, 4);
}
else
{
memset(au1_ngbr_pels + 4 + 1, 0, 4);
}
/* top right pels */
if(u1_use_top_right_mb)
{
memcpy(au1_ngbr_pels + 4 * 2 + 1, pu1_top_right, 4);
}
else if(u1_is_top_sub_block)
{
memset(au1_ngbr_pels + 4 * 2 + 1, au1_ngbr_pels[4 * 2], 4);
}
}
PROFILE_DISABLE_INTRA_PRED()
ps_dec->apf_intra_pred_luma_4x4[i1_intra_pred](
au1_ngbr_pels, pu1_luma_rec_buffer, 1,
ui_rec_width,
((u1_is_top_sub_block << 2) | u1_is_left_sub_block));
/* CHANGED CODE */
if(CHECKBIT(ui2_luma_csbp, u1_sub_mb_num))
{
WORD16 ai2_tmp[16];
PROFILE_DISABLE_IQ_IT_RECON()
{
if(CHECKBIT(u4_luma_dc_only_csbp, u1_sub_mb_num))
{
ps_dec->pf_iquant_itrans_recon_luma_4x4_dc(
pi2_y_coeff1,
pu1_luma_rec_buffer,
pu1_luma_rec_buffer,
ui_rec_width,
ui_rec_width,
gau2_ih264_iquant_scale_4x4[ps_cur_mb_info->u1_qp_rem6],
(UWORD16 *)ps_dec->s_high_profile.i2_scalinglist4x4[0],
ps_cur_mb_info->u1_qp_div6, ai2_tmp, 0,
NULL);
}
else
{
ps_dec->pf_iquant_itrans_recon_luma_4x4(
pi2_y_coeff1,
pu1_luma_rec_buffer,
pu1_luma_rec_buffer,
ui_rec_width,
ui_rec_width,
gau2_ih264_iquant_scale_4x4[ps_cur_mb_info->u1_qp_rem6],
(UWORD16 *)ps_dec->s_high_profile.i2_scalinglist4x4[0],
ps_cur_mb_info->u1_qp_div6, ai2_tmp, 0,
NULL);
}
}
}
/*---------------------------------------------------------------*/
/* Update sub block number */
/*---------------------------------------------------------------*/
pi2_y_coeff1 += 16;
pu1_luma_rec_buffer +=
(u1_sub_blk_x == 3) ? (ui_rec_width << 2) - 12 : 4;
pu1_luma_pred_buffer +=
(u1_sub_blk_x == 3) ? (ui_pred_width << 2) - 12 : 4;
/* CHANGED CODE */
pi1_cur_pred_mode[u1_sub_blk_x] = i1_intra_pred;
pi1_left_pred_mode[u1_sub_blk_y] = i1_intra_pred;
}
}
else if((u1_mb_type == I_4x4_MB) && (ps_cur_mb_info->u1_tran_form8x8 == 1))
{
UWORD8 u1_is_left_sub_block, u1_is_top_sub_block = uc_useTopMB;
UWORD8 u1_sub_blk_x, u1_sub_blk_y, u1_sub_mb_num;
WORD8 i1_top_pred_mode;
WORD8 i1_left_pred_mode;
UWORD8 *pu1_top, *pu1_left, *pu1_top_left;
WORD8 *pi1_cur_pred_mode, *pi1_left_pred_mode, *pc_topPredMode;
UWORD16 ui2_left_pred_buf_width = 0xffff;
WORD8 i1_intra_pred;
UWORD8 *pu1_prev_intra4x4_pred_mode_flag = pu1_prev_intra4x4_pred_mode_data;
UWORD8 *pu1_rem_intra4x4_pred_mode = pu1_prev_intra4x4_pred_mode_data + 4;
WORD16 *pi2_y_coeff1;
UWORD16 ui2_top_rt_mask;
UWORD32 u4_4x4_left_offset = 0;
/*--------------------------------------------------------------------*/
/* 8x8 IntraPrediction */
/*--------------------------------------------------------------------*/
/* Calculation of Top Right subblock mask */
/* */
/* (a) Set it to default mask */
/* [It has 0 for sublocks which will never have top-right sub block] */
/* */
/* (b) If top MB is not available */
/* Clear the bits of the first row sub blocks */
/* */
/* (c) Set/Clear bit for top-right sublock of MB */
/* [5 sub-block in decoding order] based on TOP RIGHT MB availablity */
/* */
/* ui2_top_rt_mask: marks availibility of top right(neighbour) */
/* in the 8x8 Block ordering */
/* */
/* tr0 tr1 */
/* 0 1 tr3 */
/* 2 3 */
/* */
/* Top rights for 0 is in top MB */
/* top right of 1 will be in top right MB */
/* top right of 3 in right MB and hence not available */
/* This corresponds to ui2_top_rt_mask having default value 0x4 */
/*--------------------------------------------------------------------*/
ui2_top_rt_mask = (u1_use_top_right_mb << 1) | (0x4);
if(uc_useTopMB)
{
ui2_top_rt_mask |= 0x1;
}
/* Top Related initialisations */
pi1_cur_pred_mode = ps_cur_mb_info->ps_curmb->pi1_intrapredmodes;
pc_topPredMode = ps_cur_mb_info->ps_top_mb->pi1_intrapredmodes;
/*
if(u1_mbaff)
{
pi1_cur_pred_mode += (u2_mbx << 2);
pc_topPredMode = pi1_cur_pred_mode + ps_cur_mb_info->i1_offset;
pi1_cur_pred_mode += (u1_topmb) ? 0: 4;
}
*/
if(u1_top_available)
{
if(ps_top_mb->u1_mb_type == I_4x4_MB)
{
*(WORD32*)pi1_cur_pred_mode = *(WORD32*)pc_topPredMode;
}
else
{
*(WORD32*)pi1_cur_pred_mode =
(uc_useTopMB) ? DC_DC_DC_DC : NOT_VALID;
}
}
else
{
*(WORD32*)pi1_cur_pred_mode = NOT_VALID;
}
pu1_top = puc_top - 8;
/*Left Related initialisations*/
pi1_left_pred_mode = ps_dec->pi1_left_pred_mode;
if(!u1_mbaff)
{
if(u1_left_available)
{
if(ps_left_mb->u1_mb_type != I_4x4_MB)
{
*(WORD32*)pi1_left_pred_mode =
(u2_use_left_mb_pack) ?
DC_DC_DC_DC :
NOT_VALID;
}
}
else
{
*(WORD32*)pi1_left_pred_mode = NOT_VALID;
}
}
else
{
UWORD8 u1_curMbfld = ps_cur_mb_info->u1_mb_field_decodingflag;
UWORD8 u1_leftMbfld = ps_left_mb->u1_mb_fld;
if((!u1_curMbfld) && (u1_leftMbfld))
{
u4_4x4_left_offset = 1;
}
if(u1_curMbfld ^ u1_leftMbfld)
{
if(u1_topmb
| ((u1_topmb == 0)
&& ((ps_curmb - 1)->u1_mb_type
!= I_4x4_MB)))
{
if(u1_left_available)
{
if(ps_left_mb->u1_mb_type != I_4x4_MB)
{
if(CHECKBIT(u2_use_left_mb_pack,0) == 0)
{
*(WORD32*)pi1_left_pred_mode = NOT_VALID;
}
else
{
*(WORD32*)pi1_left_pred_mode = DC_DC_DC_DC;
}
}
}
else
{
*(WORD32*)pi1_left_pred_mode = NOT_VALID;
}
if(u1_curMbfld)
{
if(u1_left_available)
{
if((ps_left_mb + 1)->u1_mb_type != I_4x4_MB)
{
if(u2_use_left_mb_pack >> 8)
{
*(WORD32*)(pi1_left_pred_mode + 4) =
DC_DC_DC_DC;
}
else
{
*(WORD32*)(pi1_left_pred_mode + 4) =
NOT_VALID;
}
}
}
else
{
*(WORD32*)(pi1_left_pred_mode + 4) = NOT_VALID;
}
pi1_left_pred_mode[1] = pi1_left_pred_mode[2];
pi1_left_pred_mode[2] = pi1_left_pred_mode[4];
pi1_left_pred_mode[3] = pi1_left_pred_mode[6];
*(WORD32*)(pi1_left_pred_mode + 4) =
*(WORD32*)pi1_left_pred_mode;
}
else
{
pi1_left_pred_mode[7] = pi1_left_pred_mode[3];
pi1_left_pred_mode[6] = pi1_left_pred_mode[3];
pi1_left_pred_mode[5] = pi1_left_pred_mode[2];
pi1_left_pred_mode[4] = pi1_left_pred_mode[2];
pi1_left_pred_mode[3] = pi1_left_pred_mode[1];
pi1_left_pred_mode[2] = pi1_left_pred_mode[1];
pi1_left_pred_mode[1] = pi1_left_pred_mode[0];
}
}
pi1_left_pred_mode += (u1_topmb) ? 0 : 4;
}
else
{
pi1_left_pred_mode += (u1_topmb) ? 0 : 4;
if(u1_left_available)
{
if(ps_left_mb->u1_mb_type != I_4x4_MB)
{
*(WORD32*)pi1_left_pred_mode =
(u2_use_left_mb_pack) ?
DC_DC_DC_DC :
NOT_VALID;
}
}
else
{
*(WORD32*)pi1_left_pred_mode = NOT_VALID;
}
}
}
/* One time pointer initialisations*/
pi2_y_coeff1 = pi2_y_coeff;
if(u1_use_top_left_mb)
{
pu1_top_left = pu1_ytop_left;
}
else
{
pu1_top_left = NULL;
}
/* Scan the sub-blocks in Raster Scan Order */
for(u1_sub_mb_num = 0; u1_sub_mb_num < 4; u1_sub_mb_num++)
{
u1_sub_blk_x = (u1_sub_mb_num & 0x1);
u1_sub_blk_y = (u1_sub_mb_num >> 1);
i1_top_pred_mode = pi1_cur_pred_mode[u1_sub_blk_x << 1];
i1_left_pred_mode = pi1_left_pred_mode[u1_sub_blk_y << 1];
if(2 == u1_sub_mb_num)
{
i1_left_pred_mode = pi1_left_pred_mode[(u1_sub_blk_y << 1)
+ u4_4x4_left_offset];
}
u1_use_top_right_mb = (!!CHECKBIT(ui2_top_rt_mask, u1_sub_mb_num));
/*********** left subblock availability**********/
if(u1_sub_blk_x)
{
u1_is_left_sub_block = 1;
}
else
{
u1_is_left_sub_block =
(u1_sub_blk_y < 1) ?
(CHECKBIT(u2_use_left_mb_pack,
0)) :
(u2_use_left_mb_pack >> 8);
}
/***************** Top *********************/
if(u1_sub_blk_y)
{
u1_is_top_sub_block = 1;
// sushant
pu1_top = /*pu1_luma_pred_buffer*/pu1_luma_rec_buffer - ui_rec_width;
}
else
{
pu1_top += 8;
}
/***************** Left *********************/
if((u1_sub_blk_x) | (u4_num_pmbair != 0))
{
// sushant
pu1_left = /*pu1_luma_pred_buffer*/pu1_luma_rec_buffer - 1;
ui2_left_pred_buf_width = ui_rec_width;
}
else
{
pu1_left = pu1_yleft;
pu1_yleft += (ui_rec_width << 3);
ui2_left_pred_buf_width = ui_rec_width;
}
/***************** Top Left *********************/
if(u1_sub_mb_num)
{
pu1_top_left = (u1_sub_blk_x) ?
pu1_top - 1 : pu1_left - ui_rec_width;
if((u1_sub_blk_x && (!u1_is_top_sub_block))
|| ((!u1_sub_blk_x) && (!u1_is_left_sub_block)))
{
pu1_top_left = NULL;
}
}
/*---------------------------------------------------------------*/
/* Calculation of Intra prediction mode */
/*---------------------------------------------------------------*/
i1_intra_pred = ((i1_left_pred_mode < 0) | (i1_top_pred_mode < 0)) ?
DC : MIN(i1_left_pred_mode, i1_top_pred_mode);
{
UWORD8 u1_packed_modes = (u1_is_top_sub_block << 1)
+ u1_is_left_sub_block;
UWORD8 *pu1_intra_err_codes =
(UWORD8 *)gau1_ih264d_intra_pred_err_code;
/********************************************************************/
/* Same intra4x4_pred_mode array is filled with intra4x4_pred_mode */
/* for a MB with 8x8 intrapredicition */
/********************************************************************/
PROFILE_DISABLE_INTRA_PRED()
if(!pu1_prev_intra4x4_pred_mode_flag[u1_sub_mb_num])
{
i1_intra_pred = pu1_rem_intra4x4_pred_mode[u1_sub_mb_num]
+ (pu1_rem_intra4x4_pred_mode[u1_sub_mb_num]
>= i1_intra_pred);
}
i1_intra_pred = CLIP3(0, 8, i1_intra_pred);
{
UWORD8 u1_err_code = pu1_intra_err_codes[i1_intra_pred];
if((u1_err_code & u1_packed_modes) ^ u1_err_code)
{
i1_intra_pred = 0;
ps_dec->i4_error_code = ERROR_INTRAPRED;
}
}
}
{
/* Align the size to multiple of 8, so that SIMD functions
can read 64 bits at a time. Only 25 bytes are actaully used */
UWORD8 au1_ngbr_pels[32];
WORD32 ngbr_avail;
ngbr_avail = u1_is_left_sub_block << 0;
ngbr_avail |= u1_is_top_sub_block << 2;
if(pu1_top_left)
ngbr_avail |= 1 << 1;
ngbr_avail |= u1_use_top_right_mb << 3;
PROFILE_DISABLE_INTRA_PRED()
{
ps_dec->pf_intra_pred_ref_filtering(pu1_left, pu1_top_left,
pu1_top, au1_ngbr_pels,
ui2_left_pred_buf_width,
ngbr_avail);
ps_dec->apf_intra_pred_luma_8x8[i1_intra_pred](
au1_ngbr_pels, pu1_luma_rec_buffer, 1,
ui_rec_width,
((u1_is_top_sub_block << 2) | u1_is_left_sub_block));
}
}
/* Inverse Transform and Reconstruction */
if(CHECKBIT(ps_cur_mb_info->u1_cbp, u1_sub_mb_num))
{
WORD16 *pi2_scale_matrix_ptr;
WORD16 ai2_tmp[64];
pi2_scale_matrix_ptr =
ps_dec->s_high_profile.i2_scalinglist8x8[0];
PROFILE_DISABLE_IQ_IT_RECON()
{
if(CHECKBIT(u4_luma_dc_only_cbp, u1_sub_mb_num))
{
ps_dec->pf_iquant_itrans_recon_luma_8x8_dc(
pi2_y_coeff1,
pu1_luma_rec_buffer,
pu1_luma_rec_buffer,
ui_rec_width,
ui_rec_width,
gau1_ih264d_dequant8x8_cavlc[ps_cur_mb_info->u1_qp_rem6],
(UWORD16 *)pi2_scale_matrix_ptr,
ps_cur_mb_info->u1_qp_div6, ai2_tmp, 0,
NULL);
}
else
{
ps_dec->pf_iquant_itrans_recon_luma_8x8(
pi2_y_coeff1,
pu1_luma_rec_buffer,
pu1_luma_rec_buffer,
ui_rec_width,
ui_rec_width,
gau1_ih264d_dequant8x8_cavlc[ps_cur_mb_info->u1_qp_rem6],
(UWORD16 *)pi2_scale_matrix_ptr,
ps_cur_mb_info->u1_qp_div6, ai2_tmp, 0,
NULL);
}
}
}
/*---------------------------------------------------------------*/
/* Update sub block number */
/*---------------------------------------------------------------*/
pi2_y_coeff1 += 64;
pu1_luma_rec_buffer +=
(u1_sub_blk_x == 1) ?
(ui_rec_width << 3) - (8 * 1) : 8;
/*---------------------------------------------------------------*/
/* Pred mode filled in terms of 4x4 block so replicated in 2 */
/* locations. */
/*---------------------------------------------------------------*/
pi1_cur_pred_mode[u1_sub_blk_x << 1] = i1_intra_pred;
pi1_cur_pred_mode[(u1_sub_blk_x << 1) + 1] = i1_intra_pred;
pi1_left_pred_mode[u1_sub_blk_y << 1] = i1_intra_pred;
pi1_left_pred_mode[(u1_sub_blk_y << 1) + 1] = i1_intra_pred;
}
}
/* Decode Chroma Block */
ih264d_unpack_chroma_coeff4x4_mb(ps_dec,
ps_cur_mb_info);
/*--------------------------------------------------------------------*/
/* Chroma Blocks decoding */
/*--------------------------------------------------------------------*/
{
UWORD8 u1_intra_chrom_pred_mode;
UWORD8 u1_chroma_cbp = (UWORD8)(ps_cur_mb_info->u1_cbp >> 4);
/*--------------------------------------------------------------------*/
/* Perform Chroma intra prediction */
/*--------------------------------------------------------------------*/
u1_intra_chrom_pred_mode = CHROMA_TO_LUMA_INTRA_MODE(
ps_cur_mb_info->u1_chroma_pred_mode);
{
UWORD8 u1_packed_modes = (u1_top_available << 1)
+ u1_left_available;
UWORD8 u1_err_code =
(u1_intra_chrom_pred_mode & 1) ?
u1_intra_chrom_pred_mode :
(u1_intra_chrom_pred_mode ^ 2);
if((u1_err_code & u1_packed_modes) ^ u1_err_code)
{
u1_intra_chrom_pred_mode = 0;
ps_dec->i4_error_code = ERROR_INTRAPRED;
}
}
/* CHANGED CODE */
if(u1_chroma_cbp != CBPC_ALLZERO)
{
UWORD16 u2_chroma_csbp =
(u1_chroma_cbp == CBPC_ACZERO) ?
0 : ps_cur_mb_info->u2_chroma_csbp;
UWORD32 u4_scale_u;
UWORD32 u4_scale_v;
{
UWORD16 au2_ngbr_pels[33];
UWORD8 *pu1_ngbr_pels = (UWORD8 *)au2_ngbr_pels;
UWORD16 *pu2_left_uv;
UWORD16 *pu2_topleft_uv;
WORD32 use_left1 = (u2_use_left_mb_pack & 0x0ff);
WORD32 use_left2 = (u2_use_left_mb_pack & 0xff00) >> 8;
pu2_left_uv = (UWORD16 *)pu1_uleft;
pu2_topleft_uv = (UWORD16 *)pu1_u_top_left;
/* Get neighbour pixels */
/* left pels */
if(u2_use_left_mb_pack)
{
WORD32 i;
if(use_left1)
{
for(i = 0; i < 4; i++)
au2_ngbr_pels[8 - 1 - i] = pu2_left_uv[i
* u4_recwidth_cr / YUV420SP_FACTOR];
}
else
{
memset(au2_ngbr_pels + 4, 0, 4 * sizeof(UWORD16));
}
if(use_left2)
{
for(i = 4; i < 8; i++)
au2_ngbr_pels[8 - 1 - i] = pu2_left_uv[i
* u4_recwidth_cr / YUV420SP_FACTOR];
}
else
{
memset(au2_ngbr_pels, 0, 4 * sizeof(UWORD16));
}
}
else
{
memset(au2_ngbr_pels, 0, 8 * sizeof(UWORD16));
}
/* top left pels */
au2_ngbr_pels[8] = *pu2_topleft_uv;
/* top pels */
if(uc_useTopMB)
{
memcpy(au2_ngbr_pels + 8 + 1, pu1_top_u,
8 * sizeof(UWORD16));
}
else
{
memset(au2_ngbr_pels + 8 + 1, 0, 8 * sizeof(UWORD16));
}
PROFILE_DISABLE_INTRA_PRED()
ps_dec->apf_intra_pred_chroma[u1_intra_chrom_pred_mode](
pu1_ngbr_pels,
pu1_mb_cb_rei1_buffer,
1,
u4_recwidth_cr,
((uc_useTopMB << 2) | (use_left2 << 4)
| use_left1));
}
u4_scale_u = ps_cur_mb_info->u1_qpc_div6;
u4_scale_v = ps_cur_mb_info->u1_qpcr_div6;
pi2_y_coeff = ps_dec->pi2_coeff_data;
{
UWORD32 i;
WORD16 ai2_tmp[16];
for(i = 0; i < 4; i++)
{
WORD16 *pi2_level = pi2_y_coeff + (i << 4);
UWORD8 *pu1_pred_sblk = pu1_mb_cb_rei1_buffer
+ ((i & 0x1) * BLK_SIZE * YUV420SP_FACTOR)
+ (i >> 1) * (u4_recwidth_cr << 2);
PROFILE_DISABLE_IQ_IT_RECON()
{
if(CHECKBIT(u2_chroma_csbp, i))
{
ps_dec->pf_iquant_itrans_recon_chroma_4x4(
pi2_level,
pu1_pred_sblk,
pu1_pred_sblk,
u4_recwidth_cr,
u4_recwidth_cr,
gau2_ih264_iquant_scale_4x4[ps_cur_mb_info->u1_qpc_rem6],
(UWORD16 *)ps_dec->s_high_profile.i2_scalinglist4x4[1],
u4_scale_u, ai2_tmp, pi2_level);
}
else if(pi2_level[0] != 0)
{
ps_dec->pf_iquant_itrans_recon_chroma_4x4_dc(
pi2_level,
pu1_pred_sblk,
pu1_pred_sblk,
u4_recwidth_cr,
u4_recwidth_cr,
gau2_ih264_iquant_scale_4x4[ps_cur_mb_info->u1_qpc_rem6],
(UWORD16 *)ps_dec->s_high_profile.i2_scalinglist4x4[1],
u4_scale_u, ai2_tmp, pi2_level);
}
}
}
}
pi2_y_coeff += MB_CHROM_SIZE;
u2_chroma_csbp = u2_chroma_csbp >> 4;
{
UWORD32 i;
WORD16 ai2_tmp[16];
for(i = 0; i < 4; i++)
{
WORD16 *pi2_level = pi2_y_coeff + (i << 4);
UWORD8 *pu1_pred_sblk = pu1_mb_cb_rei1_buffer + 1
+ ((i & 0x1) * BLK_SIZE * YUV420SP_FACTOR)
+ (i >> 1) * (u4_recwidth_cr << 2);
PROFILE_DISABLE_IQ_IT_RECON()
{
if(CHECKBIT(u2_chroma_csbp, i))
{
ps_dec->pf_iquant_itrans_recon_chroma_4x4(
pi2_level,
pu1_pred_sblk,
pu1_pred_sblk,
u4_recwidth_cr,
u4_recwidth_cr,
gau2_ih264_iquant_scale_4x4[ps_cur_mb_info->u1_qpcr_rem6],
(UWORD16 *)ps_dec->s_high_profile.i2_scalinglist4x4[2],
u4_scale_v, ai2_tmp, pi2_level);
}
else if(pi2_level[0] != 0)
{
ps_dec->pf_iquant_itrans_recon_chroma_4x4_dc(
pi2_level,
pu1_pred_sblk,
pu1_pred_sblk,
u4_recwidth_cr,
u4_recwidth_cr,
gau2_ih264_iquant_scale_4x4[ps_cur_mb_info->u1_qpcr_rem6],
(UWORD16 *)ps_dec->s_high_profile.i2_scalinglist4x4[2],
u4_scale_v, ai2_tmp, pi2_level);
}
}
}
}
}
else
{
/* If no inverse transform is needed, pass recon buffer pointer */
/* to Intraprediction module instead of pred buffer pointer */
{
UWORD16 au2_ngbr_pels[33];
UWORD8 *pu1_ngbr_pels = (UWORD8 *)au2_ngbr_pels;
UWORD16 *pu2_left_uv;
UWORD16 *pu2_topleft_uv;
WORD32 use_left1 = (u2_use_left_mb_pack & 0x0ff);
WORD32 use_left2 = (u2_use_left_mb_pack & 0xff00) >> 8;
pu2_topleft_uv = (UWORD16 *)pu1_u_top_left;
pu2_left_uv = (UWORD16 *)pu1_uleft;
/* Get neighbour pixels */
/* left pels */
if(u2_use_left_mb_pack)
{
WORD32 i;
if(use_left1)
{
for(i = 0; i < 4; i++)
au2_ngbr_pels[8 - 1 - i] = pu2_left_uv[i
* u4_recwidth_cr / YUV420SP_FACTOR];
}
else
{
memset(au2_ngbr_pels + 4, 0, 4 * sizeof(UWORD16));
}
if(use_left2)
{
for(i = 4; i < 8; i++)
au2_ngbr_pels[8 - 1 - i] = pu2_left_uv[i
* u4_recwidth_cr / YUV420SP_FACTOR];
}
else
{
memset(au2_ngbr_pels, 0, 4 * sizeof(UWORD16));
}
}
else
{
memset(au2_ngbr_pels, 0, 8 * sizeof(UWORD16));
}
/* top left pels */
au2_ngbr_pels[8] = *pu2_topleft_uv;
/* top pels */
if(uc_useTopMB)
{
memcpy(au2_ngbr_pels + 8 + 1, pu1_top_u,
8 * sizeof(UWORD16));
}
else
{
memset(au2_ngbr_pels + 8 + 1, 0, 8 * sizeof(UWORD16));
}
PROFILE_DISABLE_INTRA_PRED()
ps_dec->apf_intra_pred_chroma[u1_intra_chrom_pred_mode](
pu1_ngbr_pels,
pu1_mb_cb_rei1_buffer,
1,
u4_recwidth_cr,
((uc_useTopMB << 2) | (use_left2 << 4)
| use_left1));
}
}
}
return OK;
}