blob: 6e2a39c1cdd94ccc828aaac9a02af9fad1590b98 [file] [log] [blame]
/******************************************************************************
*
* Copyright (C) 2012 Ittiam Systems Pvt Ltd, Bangalore
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at:
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*
******************************************************************************/
/**
*******************************************************************************
* @file
* ihevcd_parse_residual.c
*
* @brief
* Contains functions for parsing residual data at TU level
*
* @author
* Harish
*
* @par List of Functions:
*
* @remarks
* None
*
*******************************************************************************
*/
/*****************************************************************************/
/* File Includes */
/*****************************************************************************/
#include <stdio.h>
#include <stddef.h>
#include <stdlib.h>
#include <string.h>
#include <assert.h>
#include "ihevc_typedefs.h"
#include "iv.h"
#include "ivd.h"
#include "ihevcd_cxa.h"
#include "ihevc_defs.h"
#include "ihevc_debug.h"
#include "ihevc_structs.h"
#include "ihevc_macros.h"
#include "ihevc_platform_macros.h"
#include "ihevc_common_tables.h"
#include "ihevc_error.h"
#include "ihevc_cabac_tables.h"
#include "ihevcd_trace.h"
#include "ihevcd_defs.h"
#include "ihevcd_function_selector.h"
#include "ihevcd_structs.h"
#include "ihevcd_error.h"
#include "ihevcd_nal.h"
#include "ihevcd_bitstream.h"
#include "ihevcd_utils.h"
#include "ihevcd_parse_residual.h"
#include "ihevcd_cabac.h"
/**
*****************************************************************************
* @brief returns context increment for sig coeff based on scan type, csbf
* neighbour flags (bottom and right) and current coeff position in 4x4 block
* See section 9.3.3.1.4 for details on this context increment
*
* Indexed as [scan idx][neighbour csbf][coeff idx]
*
* input : scan idx (0: upright diagonal, 1: horizontal, 2: vertical)
* neighbour csbf flags(bit0:right csbf, bit1:bottom csbf)
* coeff idx within the 4x4 sub-block in SCAN order (0-15); the parser
* indexes this table with its scan-position loop counter, so each row
* below holds the (xP, yP) formula values permuted into that scan order
*
* output : context increment for sig coeff flag
*
*****************************************************************************
*/
const UWORD8 gau1_ihevcd_sigcoeff_ctxtinc[3][4][16] =
{
/* scan idx 0: upright diagonal scan */
{
/* nbr csbf = 0: sigCtx = (xP+yP == 0) ? 2 : (xP+yP < 3) ? 1: 0 */
{ 2, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/* nbr csbf = 1: sigCtx = (yP == 0) ? 2 : (yP == 1) ? 1: 0 */
{ 2, 1, 2, 0, 1, 2, 0, 0, 1, 2, 0, 0, 1, 0, 0, 0 },
/* nbr csbf = 2: sigCtx = (xP == 0) ? 2 : (xP == 1) ? 1: 0 */
{ 2, 2, 1, 2, 1, 0, 2, 1, 0, 0, 1, 0, 0, 0, 0, 0 },
/* nbr csbf = 3: sigCtx = 2 */
{ 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2 },
},
/* scan idx 1: horizontal scan (scan order coincides with raster order) */
{
/* nbr csbf = 0: sigCtx = (xP+yP == 0) ? 2 : (xP+yP < 3) ? 1: 0 */
{ 2, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0 },
/* nbr csbf = 1: sigCtx = (yP == 0) ? 2 : (yP == 1) ? 1: 0 */
{ 2, 2, 2, 2, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0 },
/* nbr csbf = 2: sigCtx = (xP == 0) ? 2 : (xP == 1) ? 1: 0 */
{ 2, 1, 0, 0, 2, 1, 0, 0, 2, 1, 0, 0, 2, 1, 0, 0 },
/* nbr csbf = 3: sigCtx = 2 */
{ 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2 },
},
/* scan idx 2: vertical scan (column by column, so the xP and yP rows */
/* appear exchanged relative to the horizontal scan above) */
{
/* nbr csbf = 0: sigCtx = (xP+yP == 0) ? 2 : (xP+yP < 3) ? 1: 0 */
{ 2, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0 },
/* nbr csbf = 1: sigCtx = (yP == 0) ? 2 : (yP == 1) ? 1: 0 */
{ 2, 1, 0, 0, 2, 1, 0, 0, 2, 1, 0, 0, 2, 1, 0, 0 },
/* nbr csbf = 2: sigCtx = (xP == 0) ? 2 : (xP == 1) ? 1: 0 */
{ 2, 2, 2, 2, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0 },
/* nbr csbf = 3: sigCtx = 2 */
{ 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2 },
},
};
/**
*****************************************************************************
* @brief returns context increment for sig coeff for 4x4 transform size as
* per Table 9-39 in section 9.3.3.1.4
*
* Indexed as [scan idx][coeff idx]
*
* input : scan idx (0: upright diagonal, 1: horizontal, 2: vertical)
* coeff idx in SCAN order (0-15); the parser indexes this table with its
* scan-position loop counter. The four-per-line layout below is only for
* readability and is a raster picture for the horizontal scan alone
*
* output : context increment for sig coeff flag
*
*****************************************************************************
*/
const UWORD8 gau1_ihevcd_sigcoeff_ctxtinc_tr4[3][16] =
{
/* Upright diagonal scan */
{
0, 2, 1, 6,
3, 4, 7, 6,
4, 5, 7, 8,
5, 8, 8, 8,
},
/* Horizontal scan */
{
0, 1, 4, 5,
2, 3, 4, 5,
6, 6, 8, 8,
7, 7, 8, 8,
},
/* Vertical scan */
{
0, 2, 6, 7,
1, 3, 6, 7,
4, 4, 8, 8,
5, 5, 8, 8,
},
};
/**
*******************************************************************************
*
* @brief
*  Parses Residual coding
*
* @par Description:
*  Parses Residual coding as per Section:7.3.13 for one transform block and
*  appends the decoded data at ps_codec->s_parse.pv_tu_coeff_data, advancing
*  that pointer past everything written. The data written is:
*    - one WORD8  : number of coded 4x4 sub-blocks in this TU
*    - one WORD8  : (scan_idx << 1) | transform_skip_flag
*    - for each coded sub-block (in decoding order, last sub-block first):
*      a tu_sblk_coeff_data_t whose u2_sig_coeff_map holds one bit per scan
*      position, whose u2_subblk_pos holds (ys << 8) | xs, and whose ai2_level
*      array is truncated to the number of non-zero levels in that sub-block
*
* @param[in] ps_codec
*  Pointer to codec context. The PPS, current CU info, bitstream and CABAC
*  state are read from (and the latter two updated in) ps_codec->s_parse
*
* @param[in] x0
*  Unused
*
* @param[in] y0
*  Unused
*
* @param[in] log2_trafo_size
*  Log2 of the transform size. 2 denotes a 4x4 transform (single sub-block)
*  NOTE(review): scan table selection assumes the range 2..5 - confirm callers
*
* @param[in] c_idx
*  Colour component index. Zero selects luma contexts, non-zero chroma
*
* @param[in] intra_pred_mode
*  Intra prediction mode of the block. Only consulted for intra CUs, where
*  modes 6..14 select the vertical scan and 22..30 the horizontal scan for
*  4x4 blocks and for 8x8 luma blocks
*
* @returns  error code from IHEVCD_ERROR_T. No path in this function changes
*  it from IHEVCD_SUCCESS
*
* @remarks
*  No bound check is done here on the space left in pv_tu_coeff_data
*
*******************************************************************************
*/
WORD32 ihevcd_parse_residual_coding(codec_t *ps_codec,
                                    WORD32 x0, WORD32 y0,
                                    WORD32 log2_trafo_size,
                                    WORD32 c_idx,
                                    WORD32 intra_pred_mode)
{
    IHEVCD_ERROR_T ret = (IHEVCD_ERROR_T)IHEVCD_SUCCESS;
    WORD32 transform_skip_flag;
    WORD32 value;
    pps_t *ps_pps;
    WORD32 last_scan_pos, last_sub_blk;
    bitstrm_t *ps_bitstrm = &ps_codec->s_parse.s_bitstrm;
    WORD32 last_significant_coeff_x_prefix, last_significant_coeff_y_prefix;
    WORD32 last_significant_coeff_x, last_significant_coeff_y;
    const UWORD8 *pu1_scan_blk = NULL, *pu1_scan_coeff;
    WORD32 scan_idx;
    WORD32 i;
    WORD32 sign_data_hiding_flag;
    cab_ctxt_t *ps_cabac = &ps_codec->s_parse.s_cabac;
    WORD32 gt1_ctxt = 1;
    WORD32 c_max;
    /* One bit per sub-block column, one entry per sub-block row. */
    /* The 9th entry is a zero row read as "bottom" of the last row */
    UWORD16 au2_csbf[9];
    tu_sblk_coeff_data_t *ps_tu_sblk_coeff_data;
    WORD8 *pi1_num_coded_subblks;
    WORD32 num_subblks;
    WORD32 sig_coeff_base_ctxt, abs_gt1_base_ctxt;

    UNUSED(x0);
    UNUSED(y0);

    ps_pps = ps_codec->s_parse.ps_pps;
    sign_data_hiding_flag = ps_pps->i1_sign_data_hiding_flag;

    /* transform_skip_flag is present only for 4x4 blocks when enabled in */
    /* PPS and the CU is not transquant bypassed. Otherwise it is zero    */
    transform_skip_flag = 0;
    if(ps_pps->i1_transform_skip_enabled_flag &&
       !ps_codec->s_parse.s_cu.i4_cu_transquant_bypass &&
       (log2_trafo_size == 2))
    {
        WORD32 ctxt_idx;

        if(!c_idx)
        {
            ctxt_idx = IHEVC_CAB_TFM_SKIP0;
        }
        else
        {
            ctxt_idx = IHEVC_CAB_TFM_SKIP12;
        }

        TRACE_CABAC_CTXT("transform_skip_flag", ps_cabac->u4_range, ctxt_idx);
        value = ihevcd_cabac_decode_bin(ps_cabac,
                                        ps_bitstrm,
                                        ctxt_idx);
        AEV_TRACE("transform_skip_flag", value, ps_cabac->u4_range);
        transform_skip_flag = value;
    }

    /* Decode last_coeff_x_prefix and last_coeff_y_prefix as truncated unary */
    /* codes, followed by their bypass coded suffixes (if any)               */
    {
        WORD32 ctxt_idx_x, ctxt_idx_y, ctx_shift;
        WORD32 ctx_offset;

        c_max = (log2_trafo_size << 1) - 1;

        if(!c_idx)
        {
            ctx_offset = (3 * (log2_trafo_size - 2)) + ((log2_trafo_size - 1) >> 2);
            ctxt_idx_x = IHEVC_CAB_COEFFX_PREFIX + ctx_offset;
            ctxt_idx_y = IHEVC_CAB_COEFFY_PREFIX + ctx_offset;
            ctx_shift = (log2_trafo_size + 1) >> 2;
        }
        else
        {
            ctxt_idx_x = IHEVC_CAB_COEFFX_PREFIX + 15;
            ctxt_idx_y = IHEVC_CAB_COEFFY_PREFIX + 15;
            ctx_shift = log2_trafo_size - 2;
        }

        TRACE_CABAC_CTXT("last_coeff_x_prefix", ps_cabac->u4_range, ctxt_idx_x);
        last_significant_coeff_x_prefix = ihevcd_cabac_decode_bins_tunary(ps_cabac,
                                                                          ps_bitstrm,
                                                                          c_max,
                                                                          ctxt_idx_x,
                                                                          ctx_shift,
                                                                          c_max);
        AEV_TRACE("last_coeff_x_prefix", last_significant_coeff_x_prefix, ps_cabac->u4_range);

        TRACE_CABAC_CTXT("last_coeff_y_prefix", ps_cabac->u4_range, ctxt_idx_y);
        last_significant_coeff_y_prefix = ihevcd_cabac_decode_bins_tunary(ps_cabac,
                                                                          ps_bitstrm,
                                                                          c_max,
                                                                          ctxt_idx_y,
                                                                          ctx_shift,
                                                                          c_max);
        AEV_TRACE("last_coeff_y_prefix", last_significant_coeff_y_prefix, ps_cabac->u4_range);

        /* Prefixes up to 3 give the position directly. Larger prefixes */
        /* carry a suffix of ((prefix - 2) >> 1) bypass bins            */
        last_significant_coeff_x = last_significant_coeff_x_prefix;
        if(last_significant_coeff_x_prefix > 3)
        {
            WORD32 suf_length = ((last_significant_coeff_x_prefix - 2) >> 1);

            value = ihevcd_cabac_decode_bypass_bins(ps_cabac,
                                                    ps_bitstrm,
                                                    suf_length);
            AEV_TRACE("last_coeff_x_suffix", value, ps_cabac->u4_range);

            last_significant_coeff_x =
                            (1 << ((last_significant_coeff_x_prefix >> 1) - 1)) *
                            (2 + (last_significant_coeff_x_prefix & 1)) + value;
        }

        last_significant_coeff_y = last_significant_coeff_y_prefix;
        if(last_significant_coeff_y_prefix > 3)
        {
            WORD32 suf_length = ((last_significant_coeff_y_prefix - 2) >> 1);

            value = ihevcd_cabac_decode_bypass_bins(ps_cabac,
                                                    ps_bitstrm,
                                                    suf_length);
            AEV_TRACE("last_coeff_y_suffix", value, ps_cabac->u4_range);

            last_significant_coeff_y =
                            (1 << ((last_significant_coeff_y_prefix >> 1) - 1)) *
                            (2 + (last_significant_coeff_y_prefix & 1)) + value;
        }
    }

    /* Choose a scan matrix based on intra flag, intra pred mode, transform size
       and luma/chroma */
    scan_idx = SCAN_DIAG_UPRIGHT;
    if(PRED_MODE_INTRA == ps_codec->s_parse.s_cu.i4_pred_mode)
    {
        if((2 == log2_trafo_size) || ((3 == log2_trafo_size) && (0 == c_idx)))
        {
            if((6 <= intra_pred_mode) &&
               (14 >= intra_pred_mode))
            {
                scan_idx = SCAN_VERT;
            }
            else if((22 <= intra_pred_mode) &&
                    (30 >= intra_pred_mode))
            {
                scan_idx = SCAN_HORZ;
            }
        }
    }

    /* In case the scan is vertical, then swap X and Y positions */
    if(SCAN_VERT == scan_idx)
    {
        SWAP(last_significant_coeff_x, last_significant_coeff_y);
    }

    /* Write the two byte TU header into the coefficient buffer */
    {
        WORD8 *pi1_scan_idx;
        WORD8 *pi1_buf = (WORD8 *)ps_codec->s_parse.pv_tu_coeff_data;

        /* First WORD8 gives number of coded subblocks */
        pi1_num_coded_subblks = pi1_buf++;

        /* Set number of coded subblocks in the current TU to zero */
        /* This will be updated later */
        *pi1_num_coded_subblks = 0;

        /* Second WORD8 gives (scan idx << 1) | trans_skip */
        pi1_scan_idx = pi1_buf++;
        *pi1_scan_idx = (scan_idx << 1) | transform_skip_flag;

        /* Store the incremented pointer in pv_tu_coeff_data */
        ps_codec->s_parse.pv_tu_coeff_data = pi1_buf;
    }

    /**
     * Given last_significant_coeff_y and last_significant_coeff_x find last sub block
     * This is done by ignoring lower two bits of last_significant_coeff_y and last_significant_coeff_x
     * and using scan matrix for lookup
     */

    /* If transform is 4x4, last_sub_blk is zero */
    last_sub_blk = 0;

    /* If transform is larger than 4x4, then based on scan_idx and transform size, choose a scan table */
    if(log2_trafo_size > 2)
    {
        WORD32 scan_pos;
        WORD32 scan_mat_size;

        pu1_scan_blk = (UWORD8 *)gapv_ihevc_scan[scan_idx * 3 + (log2_trafo_size - 2 - 1)];

        /* Divide the current transform to 4x4 subblocks and count number of 4x4 in the first row */
        /* This will be size of scan matrix to be used for subblock scanning */
        scan_mat_size = 1 << (log2_trafo_size - 2);
        scan_pos = ((last_significant_coeff_y >> 2) * scan_mat_size) +
                        (last_significant_coeff_x >> 2);

        last_sub_blk = pu1_scan_blk[scan_pos];
    }

    /* Scan position of the last significant coeff inside its sub-block */
    pu1_scan_coeff = &gau1_ihevc_scan4x4[scan_idx][0];
    {
        WORD32 scan_pos;

        scan_pos = ((last_significant_coeff_y & 3) << 2) +
                        (last_significant_coeff_x & 3);

        last_scan_pos = pu1_scan_coeff[scan_pos];
    }

    /* From here on the sub-block table is used in the other direction */
    /* (scan index to sub-block position), hence the inverse scan      */
    if(log2_trafo_size > 2)
        pu1_scan_blk = (UWORD8 *)gapv_ihevc_invscan[scan_idx * 3 + (log2_trafo_size - 2 - 1)];

    /* Set CSBF array to zero. This includes the 9th entry, which avoids */
    /* a check for y pos when the bottom neighbour row is read           */
    memset(au2_csbf, 0, sizeof(au2_csbf));

    /*************************************************************************/
    /* derive base context index for sig coeff as per section 9.3.3.1.4      */
    /* TODO; convert to look up based on luma/chroma, scan type and tfr size */
    /*************************************************************************/
    if(!c_idx)
    {
        sig_coeff_base_ctxt = IHEVC_CAB_COEFF_FLAG;
        abs_gt1_base_ctxt = IHEVC_CAB_COEFABS_GRTR1_FLAG;

        if(3 == log2_trafo_size)
        {
            /* 8x8 transform size */
            sig_coeff_base_ctxt += (scan_idx == SCAN_DIAG_UPRIGHT) ? 9 : 15;
        }
        else if(3 < log2_trafo_size)
        {
            /* larger transform sizes */
            sig_coeff_base_ctxt += 21;
        }
    }
    else
    {
        /* chroma context initializations */
        sig_coeff_base_ctxt = IHEVC_CAB_COEFF_FLAG + 27;
        abs_gt1_base_ctxt = IHEVC_CAB_COEFABS_GRTR1_FLAG + 16;

        if(3 == log2_trafo_size)
        {
            /* 8x8 transform size */
            sig_coeff_base_ctxt += 9;
        }
        else if(3 < log2_trafo_size)
        {
            /* larger transform sizes */
            sig_coeff_base_ctxt += 12;
        }
    }

    num_subblks = 0;

    /* Parse each 4x4 subblocks, from the last coded one back to the first */
    for(i = last_sub_blk; i >= 0; i--)
    {
        WORD32 sub_blk_pos;
        WORD32 infer_sig_coeff_flag;
        WORD32 cur_csbf;
        WORD32 n;
        WORD32 num_coeff;
        WORD32 sign_hidden;
        /* Sig coeff map in scan order, bit n set if coeff at scan pos n is non-zero */
        UWORD32 u4_sig_coeff_map;
        WORD32 coeff_abs_level_greater2_flag;
        UWORD32 u4_coeff_abs_level_greater1_map;
        UWORD32 u4_coeff_abs_level_greater2_map;
        UWORD32 u4_coeff_sign_map;
        WORD32 first_sig_scan_pos, last_sig_scan_pos, num_greater1_flag, first_greater1_scan_pos;
        WORD32 num_sig_coeff, sum_abs_level;
        WORD32 nbr_csbf;
        WORD32 ctxt_set;
        WORD32 rice_param;
        WORD32 xs, ys;

        sub_blk_pos = 0;
        if(i && (log2_trafo_size > 2))
            sub_blk_pos = pu1_scan_blk[i];

        /* Get xs and ys from scan position */
        /* This is needed for context modelling of significant coeff flag */
        xs = sub_blk_pos & ((1 << (log2_trafo_size - 2)) - 1);
        ys = sub_blk_pos >> (log2_trafo_size - 2);

        /* Check if neighbor subblocks are coded */
        {
            nbr_csbf = 0;

            /* Get Bottom sub blocks CSBF */
            nbr_csbf |= (au2_csbf[ys + 1] >> xs) & 1;
            nbr_csbf <<= 1;

            /* Get Right sub blocks CSBF */
            /* Even if xs is equal to (1 << (log2_trafo_size - 2 )) - 1,
               since au2_csbf is set to zero at the beginning, csbf for
               neighbor will be read as 0 */
            nbr_csbf |= (au2_csbf[ys] >> (xs + 1)) & 1;
        }

        cur_csbf = 0;

        /* DC coeff is inferred, only if coded_sub_block is explicitly parsed as 1 */
        /* i.e. it is not inferred for first and last subblock */
        infer_sig_coeff_flag = 0;
        if((i < last_sub_blk) && (i > 0))
        {
            WORD32 ctxt_idx = IHEVC_CAB_CODED_SUBLK_IDX;

            /* ctxt based on right / bottom avail csbf, section 9.3.3.1.3 */
            ctxt_idx += (nbr_csbf) ? 1 : 0;

            /* Ctxt based on luma or chroma */
            ctxt_idx += c_idx ? 2 : 0;

            TRACE_CABAC_CTXT("coded_sub_block_flag", ps_cabac->u4_range, ctxt_idx);
            IHEVCD_CABAC_DECODE_BIN(cur_csbf, ps_cabac, ps_bitstrm, ctxt_idx);
            AEV_TRACE("coded_sub_block_flag", cur_csbf, ps_cabac->u4_range);

            infer_sig_coeff_flag = 1;
        }
        else /* if((i == last_sub_blk) || (sub_blk_pos == 0)) */
        {
            /* CSBF is set to 1 for first and last subblock */
            /* Note for these subblocks sig_coeff_map is not inferred but instead parsed */
            cur_csbf = 1;
        }

        /* Set current sub blocks CSBF */
        {
            UWORD32 u4_mask = 1 << xs;

            if(cur_csbf)
                au2_csbf[ys] |= u4_mask;
            else
                au2_csbf[ys] &= ~u4_mask;
        }

        /* If current subblock is not coded, proceed to the next subblock */
        if(0 == cur_csbf)
            continue;

        n = 15;
        u4_sig_coeff_map = 0;
        num_coeff = 0;
        if(i == last_sub_blk)
        {
            /* The last significant coeff is known to be non-zero, so */
            /* parsing of sig coeff flags starts one position below it */
            n = (last_scan_pos - 1);
            u4_sig_coeff_map = 1 << last_scan_pos;
            num_coeff = 1;
        }

        for(; n >= 0; n--)
        {
            WORD32 significant_coeff_flag;

            if((n > 0 || !infer_sig_coeff_flag))
            {
                WORD32 sig_ctxinc;
                WORD32 ctxt_idx;

                /* derive the context inc as per section 9.3.3.1.4 */
                sig_ctxinc = 0;
                if(2 == log2_trafo_size)
                {
                    /* 4x4 transform size increment uses lookup */
                    sig_ctxinc = gau1_ihevcd_sigcoeff_ctxtinc_tr4[scan_idx][n];
                }
                else if(n || i)
                {
                    /* ctxt for AC coeff depends on curpos and neigbour csbf */
                    sig_ctxinc = gau1_ihevcd_sigcoeff_ctxtinc[scan_idx][nbr_csbf][n];

                    /* based on luma subblock pos */
                    sig_ctxinc += (i && (!c_idx)) ? 3 : 0;
                }
                else
                {
                    /* DC coeff has fixed context for luma and chroma */
                    /* Overwriting the base is harmless: n == 0 and i == 0 */
                    /* here, so this is the last sig coeff flag of the TU */
                    sig_coeff_base_ctxt = (0 == c_idx) ? IHEVC_CAB_COEFF_FLAG :
                                    (IHEVC_CAB_COEFF_FLAG + 27);
                }

                ctxt_idx = sig_ctxinc + sig_coeff_base_ctxt;

                TRACE_CABAC_CTXT("significant_coeff_flag", ps_cabac->u4_range, ctxt_idx);
                IHEVCD_CABAC_DECODE_BIN(significant_coeff_flag, ps_cabac,
                                        ps_bitstrm,
                                        ctxt_idx);
                AEV_TRACE("significant_coeff_flag", significant_coeff_flag, ps_cabac->u4_range);

                /* If at least one non-zero coeff is signalled then do not infer sig coeff map */
                /* for (0,0) coeff in the current sub block */
                if(significant_coeff_flag)
                    infer_sig_coeff_flag = 0;

                u4_sig_coeff_map |= significant_coeff_flag << n;
                num_coeff += significant_coeff_flag;
            }
        }

        /*********************************************************************/
        /* If infer_sig_coeff_flag is 1 then treat the 0th coeff as non zero */
        /* If infer_sig_coeff_flag is zero, then last significant_coeff_flag */
        /* is parsed in the above loop                                       */
        /*********************************************************************/
        if(infer_sig_coeff_flag)
        {
            u4_sig_coeff_map |= 1;
            num_coeff++;
        }

        /*********************************************************************/
        /* First subblock does not get an explicit csbf. It is assumed to    */
        /* be 1. For this subblock there is chance of getting all            */
        /* sig_coeff_flags to be zero. In such a case proceed to the next    */
        /* subblock(which is end of parsing for the current transform block) */
        /*********************************************************************/
        if(0 == num_coeff)
            continue;

        /* Increment number of coded subblocks for the current TU */
        num_subblks++;

        /* Set sig coeff map and subblock position */
        ps_tu_sblk_coeff_data = (tu_sblk_coeff_data_t *)ps_codec->s_parse.pv_tu_coeff_data;
        ps_tu_sblk_coeff_data->u2_sig_coeff_map = u4_sig_coeff_map;
        ps_tu_sblk_coeff_data->u2_subblk_pos = (ys << 8) | xs;

        num_greater1_flag = 0;
        /* Stays -1 when no greater1 flag is set in this sub-block */
        first_greater1_scan_pos = -1;
        u4_coeff_abs_level_greater1_map = 0;

        /* context set based on luma subblock pos */
        ctxt_set = (i && (!c_idx)) ? 2 : 0;

        /* See section 9.3.3.1.5 */
        /* gt1_ctxt carries over from the previously parsed sub-block */
        ctxt_set += (0 == gt1_ctxt) ? 1 : 0;

        gt1_ctxt = 1;

        /* Parse coeff_abs_level_greater1_flag for the first 8 non-zero coeffs */
        /* Instead of initializing n to 15, set it to 31-CLZ(sig coeff map) */
        {
            UWORD32 u4_sig_coeff_map_shift;
            UWORD32 clz;

            clz = CLZ(u4_sig_coeff_map);
            n = 31 - clz;
            /* MSB of the shifted map always corresponds to scan position n */
            u4_sig_coeff_map_shift = u4_sig_coeff_map << clz;

            /* For loop for n changed to do while to break early if sig_coeff_map_shift becomes zero */
            do
            {
                WORD32 ctxt_idx;

                if((u4_sig_coeff_map_shift >> 31) & 1)
                {
                    /* abs_level_greater1_flag is sent for only first 8 non-zero levels in a subblock */
                    if(num_greater1_flag < 8)
                    {
                        WORD32 coeff_abs_level_greater1_flag;

                        ctxt_idx = (ctxt_set * 4) + abs_gt1_base_ctxt + gt1_ctxt;

                        TRACE_CABAC_CTXT("coeff_abs_level_greater1_flag", ps_cabac->u4_range, ctxt_idx);
                        IHEVCD_CABAC_DECODE_BIN(coeff_abs_level_greater1_flag, ps_cabac, ps_bitstrm, ctxt_idx);
                        AEV_TRACE("coeff_abs_level_greater1_flag", coeff_abs_level_greater1_flag, ps_cabac->u4_range);

                        u4_coeff_abs_level_greater1_map |= coeff_abs_level_greater1_flag << n;
                        num_greater1_flag++;

                        /* first_greater1_scan_pos is obtained using CLZ on u4_coeff_abs_level_greater1_map */
                        /* outside the loop instead of tracking it inside the loop */
                        if(coeff_abs_level_greater1_flag)
                        {
                            gt1_ctxt = 0;
                        }
                        else if(gt1_ctxt && (gt1_ctxt < 3))
                        {
                            gt1_ctxt++;
                        }
                    }
                    else
                        break;

                    /* Last and first significant scan positions are not tracked here. */
                    /* They are computed outside the loop using CLZ and CTZ on sig_coeff_map */
                }

                u4_sig_coeff_map_shift <<= 1;
                n--;

                /* If there are zero coeffs, then shift by as many zero coeffs and decrement n */
                clz = CLZ(u4_sig_coeff_map_shift);
                u4_sig_coeff_map_shift <<= clz;
                n -= clz;
            }while(u4_sig_coeff_map_shift);
        }

        /* At this level u4_sig_coeff_map is non-zero i.e. has atleast one non-zero coeff */
        last_sig_scan_pos = (31 - CLZ(u4_sig_coeff_map));
        first_sig_scan_pos = CTZ(u4_sig_coeff_map);

        sign_hidden = (((last_sig_scan_pos - first_sig_scan_pos) > 3) && !ps_codec->s_parse.s_cu.i4_cu_transquant_bypass);

        u4_coeff_abs_level_greater2_map = 0;
        if(u4_coeff_abs_level_greater1_map)
        {
            /* Check if the first level > 1 is greater than 2 */
            WORD32 ctxt_idx;

            first_greater1_scan_pos = (31 - CLZ(u4_coeff_abs_level_greater1_map));

            ctxt_idx = IHEVC_CAB_COEFABS_GRTR2_FLAG;
            ctxt_idx += (!c_idx) ? ctxt_set : (ctxt_set + 4);

            TRACE_CABAC_CTXT("coeff_abs_level_greater2_flag", ps_cabac->u4_range, ctxt_idx);
            IHEVCD_CABAC_DECODE_BIN(coeff_abs_level_greater2_flag, ps_cabac, ps_bitstrm, ctxt_idx);
            AEV_TRACE("coeff_abs_level_greater2_flag", coeff_abs_level_greater2_flag, ps_cabac->u4_range);

            u4_coeff_abs_level_greater2_map = coeff_abs_level_greater2_flag << first_greater1_scan_pos;
        }

        u4_coeff_sign_map = 0;

        /* Parse sign flags. They are left aligned in u4_coeff_sign_map so that */
        /* the MSB always holds the sign of the next level to be decoded.       */
        /* The shift is done on an unsigned value since up to 31 bit positions  */
        /* are shifted and the result may occupy the MSB                        */
        if(!sign_data_hiding_flag || !sign_hidden)
        {
            IHEVCD_CABAC_DECODE_BYPASS_BINS(value, ps_cabac, ps_bitstrm, num_coeff);
            AEV_TRACE("sign_flags", value, ps_cabac->u4_range);
            u4_coeff_sign_map = (UWORD32)value << (32 - num_coeff);
        }
        else
        {
            /* Sign of the first (lowest scan pos) coeff is hidden, so one bin */
            /* less is sent. sign_hidden implies num_coeff is at least 2       */
            IHEVCD_CABAC_DECODE_BYPASS_BINS(value, ps_cabac, ps_bitstrm, (num_coeff - 1));
            AEV_TRACE("sign_flags", value, ps_cabac->u4_range);
            u4_coeff_sign_map = (UWORD32)value << (32 - (num_coeff - 1));
        }

        num_sig_coeff = 0;
        sum_abs_level = 0;
        rice_param = 0;

        /* Parse remaining absolute levels and form the signed levels */
        {
            UWORD32 clz;
            UWORD32 u4_sig_coeff_map_shift;

            clz = CLZ(u4_sig_coeff_map);
            n = 31 - clz;
            u4_sig_coeff_map_shift = u4_sig_coeff_map << clz;

            /* For loop for n changed to do while to break early if sig_coeff_map_shift becomes zero */
            do
            {
                if((u4_sig_coeff_map_shift >> 31) & 1)
                {
                    WORD32 base_lvl;
                    WORD32 coeff_abs_level_remaining;
                    WORD32 level;

                    base_lvl = 1;

                    /* Update base_lvl if it is greater than 1 */
                    if((u4_coeff_abs_level_greater1_map >> n) & 1)
                        base_lvl++;

                    /* Update base_lvl if it is greater than 2 */
                    if((u4_coeff_abs_level_greater2_map >> n) & 1)
                        base_lvl++;

                    /* If level is greater than 3/2/1 based on the greater1 and greater2 maps,
                     * decode remaining level (level - base_lvl) will be signalled as bypass bins
                     */
                    coeff_abs_level_remaining = 0;
                    if(base_lvl == ((num_sig_coeff < 8) ? ((n == first_greater1_scan_pos) ? 3 : 2) : 1))
                    {
                        UWORD32 u4_prefix;
                        WORD32 bin;

                        /* Count the unary prefix, capped at (19 - rice_param) bins */
                        u4_prefix = 0;
                        do
                        {
                            IHEVCD_CABAC_DECODE_BYPASS_BIN(bin, ps_cabac, ps_bitstrm);
                            u4_prefix++;

                            if((WORD32)u4_prefix == 19 - rice_param)
                            {
                                bin = 1;
                                break;
                            }
                        }while(bin);

                        u4_prefix = u4_prefix - 1;

                        if(u4_prefix < 3)
                        {
                            UWORD32 u4_suffix;

                            coeff_abs_level_remaining = (u4_prefix << rice_param);
                            if(rice_param)
                            {
                                IHEVCD_CABAC_DECODE_BYPASS_BINS(u4_suffix, ps_cabac, ps_bitstrm, rice_param);
                                coeff_abs_level_remaining |= u4_suffix;
                            }
                        }
                        else
                        {
                            UWORD32 u4_suffix;
                            UWORD32 u4_numbins;

                            u4_numbins = (u4_prefix - 3 + rice_param);
                            coeff_abs_level_remaining = (((1 << (u4_prefix - 3)) + 3 - 1) << rice_param);
                            if(u4_numbins)
                            {
                                IHEVCD_CABAC_DECODE_BYPASS_BINS(u4_suffix, ps_cabac, ps_bitstrm, u4_numbins);
                                coeff_abs_level_remaining += u4_suffix;
                            }
                        }

                        AEV_TRACE("coeff_abs_level_remaining", coeff_abs_level_remaining, ps_cabac->u4_range);

                        base_lvl += coeff_abs_level_remaining;
                    }

                    /* update the rice param based on coeff level */
                    if((base_lvl > (3 << rice_param)) && (rice_param < 4))
                    {
                        rice_param++;
                    }

                    /* Compute absolute level */
                    level = base_lvl;

                    /* Update level with the sign */
                    if((u4_coeff_sign_map >> 31) & 1)
                        level = -level;

                    u4_coeff_sign_map <<= 1;

                    /* Update sign in case sign is hidden */
                    if(sign_data_hiding_flag && sign_hidden)
                    {
                        sum_abs_level += base_lvl;

                        /* Parity of the sum of absolute levels gives the hidden sign */
                        if(n == first_sig_scan_pos && ((sum_abs_level % 2) == 1))
                            level = -level;
                    }

                    /* Store the resulting level in non-zero level array */
                    ps_tu_sblk_coeff_data->ai2_level[num_sig_coeff++] = level;
                }

                u4_sig_coeff_map_shift <<= 1;
                n--;

                /* If there are zero coeffs, then shift by as many zero coeffs and decrement n */
                clz = CLZ(u4_sig_coeff_map_shift);
                u4_sig_coeff_map_shift <<= clz;
                n -= clz;
            }while(u4_sig_coeff_map_shift);
        }

        /* Increment the pv_tu_sblk_coeff_data */
        /* Only the num_coeff levels actually written are kept; the unused */
        /* tail of ai2_level is reclaimed for the next sub-block           */
        {
            UWORD8 *pu1_buf = (UWORD8 *)ps_codec->s_parse.pv_tu_coeff_data;

            pu1_buf += sizeof(tu_sblk_coeff_data_t) - SUBBLK_COEFF_CNT * sizeof(WORD16);
            pu1_buf += num_coeff * sizeof(WORD16);
            ps_codec->s_parse.pv_tu_coeff_data = pu1_buf;
        }
    }

    /* Set number of coded sub blocks in the current TU */
    *pi1_num_coded_subblks = num_subblks;

    return ret;
}