/* blob: 717bb53022ddeee6ccb8c0abe44e5c48b719c778 [file] [log] [blame] */
/******************************************************************************
*
* Copyright (C) 2012 Ittiam Systems Pvt Ltd, Bangalore
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at:
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*
******************************************************************************/
/**
*******************************************************************************
* @file
* ihevc_inter_pred_filters.c
*
* @brief
* Contains function definitions for inter prediction interpolation filters
*
*
* @author
* Srinivas T
*
* @par List of Functions:
* - ihevc_inter_pred_luma_copy()
* - ihevc_inter_pred_luma_horz()
* - ihevc_inter_pred_luma_vert()
* - ihevc_inter_pred_luma_copy_w16out()
* - ihevc_inter_pred_luma_horz_w16out()
* - ihevc_inter_pred_luma_vert_w16out()
* - ihevc_inter_pred_luma_vert_w16inp()
* - ihevc_inter_pred_luma_vert_w16inp_w16out()
* - ihevc_inter_pred_chroma_copy()
* - ihevc_inter_pred_chroma_horz()
* - ihevc_inter_pred_chroma_vert()
* - ihevc_inter_pred_chroma_copy_w16out()
* - ihevc_inter_pred_chroma_horz_w16out()
* - ihevc_inter_pred_chroma_vert_w16out()
* - ihevc_inter_pred_chroma_vert_w16inp()
* - ihevc_inter_pred_chroma_vert_w16inp_w16out()
*
* @remarks
* None
*
*******************************************************************************
*/
/*****************************************************************************/
/* File Includes */
/*****************************************************************************/
#include "ihevc_typedefs.h"
#include "ihevc_defs.h"
#include "ihevc_macros.h"
#include "ihevc_platform_macros.h"
#include "ihevc_func_selector.h"
#include "ihevc_inter_pred.h"
/*****************************************************************************/
/* Function Definitions */
/*****************************************************************************/
/**
*******************************************************************************
*
* @brief
* Interprediction luma function for copy
*
* @par Description:
* Copies the array of width 'wd' and height 'ht' from the location pointed
* by 'src' to the location pointed by 'dst'
*
* @param[in] pu1_src
* UWORD8 pointer to the source
*
* @param[out] pu1_dst
* UWORD8 pointer to the destination
*
* @param[in] src_strd
* integer source stride
*
* @param[in] dst_strd
* integer destination stride
*
* @param[in] pi1_coeff
* WORD8 pointer to the filter coefficients
*
* @param[in] ht
* integer height of the array
*
* @param[in] wd
* integer width of the array
*
* @returns
*
* @remarks
* None
*
*******************************************************************************
*/
void ihevc_inter_pred_luma_copy(UWORD8 *pu1_src,
                                UWORD8 *pu1_dst,
                                WORD32 src_strd,
                                WORD32 dst_strd,
                                WORD8 *pi1_coeff,
                                WORD32 ht,
                                WORD32 wd)
{
    WORD32 y;

    /* Plain copy: no filter is applied, so pi1_coeff is ignored. */
    UNUSED(pi1_coeff);

    for(y = 0; y < ht; y++)
    {
        WORD32 x = 0;

        /* Copy one row of wd samples, in increasing index order. */
        while(x < wd)
        {
            pu1_dst[x] = pu1_src[x];
            x++;
        }

        /* Advance each pointer by its own stride to reach the next row. */
        pu1_src += src_strd;
        pu1_dst += dst_strd;
    }
}
/**
*******************************************************************************
*
* @brief
* Interprediction luma filter for horizontal input
*
* @par Description:
* Applies a horizontal filter with coefficients pointed to by 'pi1_coeff'
* to the elements pointed by 'pu1_src' and writes to the location pointed
* by 'pu1_dst' The output is downshifted by 6 and clipped to 8 bits
*
* @param[in] pu1_src
* UWORD8 pointer to the source
*
* @param[out] pu1_dst
* UWORD8 pointer to the destination
*
* @param[in] src_strd
* integer source stride
*
* @param[in] dst_strd
* integer destination stride
*
* @param[in] pi1_coeff
* WORD8 pointer to the filter coefficients
*
* @param[in] ht
* integer height of the array
*
* @param[in] wd
* integer width of the array
*
* @returns
*
* @remarks
* None
*
*******************************************************************************
*/
void ihevc_inter_pred_luma_horz(UWORD8 *pu1_src,
                                UWORD8 *pu1_dst,
                                WORD32 src_strd,
                                WORD32 dst_strd,
                                WORD8 *pi1_coeff,
                                WORD32 ht,
                                WORD32 wd)
{
    WORD32 y, x, tap;
    WORD16 i2_sum;

    for(y = 0; y < ht; y++)
    {
        for(x = 0; x < wd; x++)
        {
            /* Tap 0 reads 3 samples before x, so every row is read from */
            /* index -3 up to (wd - 1) + (NTAPS_LUMA - 4).               */
            WORD32 first = x - 3;

            i2_sum = 0;
            for(tap = 0; tap < NTAPS_LUMA; tap++)
            {
                i2_sum += pi1_coeff[tap] * pu1_src[first + tap];
            }

            /* Add OFFSET_14_MINUS_BIT_DEPTH, shift right by            */
            /* SHIFT_14_MINUS_BIT_DEPTH, then clip with CLIP_U8.        */
            i2_sum = (i2_sum + OFFSET_14_MINUS_BIT_DEPTH) >> SHIFT_14_MINUS_BIT_DEPTH;
            i2_sum = CLIP_U8(i2_sum);

            pu1_dst[x] = (UWORD8)i2_sum;
        }

        /* Next row */
        pu1_src += src_strd;
        pu1_dst += dst_strd;
    }
}
/**
*******************************************************************************
*
* @brief
* Interprediction luma filter for vertical input
*
* @par Description:
* Applies a vertical filter with coefficients pointed to by 'pi1_coeff' to
* the elements pointed by 'pu1_src' and writes to the location pointed by
* 'pu1_dst'. The output is downshifted by 6 and clipped to 8 bits.
*
* @param[in] pu1_src
* UWORD8 pointer to the source
*
* @param[out] pu1_dst
* UWORD8 pointer to the destination
*
* @param[in] src_strd
* integer source stride
*
* @param[in] dst_strd
* integer destination stride
*
* @param[in] pi1_coeff
* WORD8 pointer to the filter coefficients
*
* @param[in] ht
* integer height of the array
*
* @param[in] wd
* integer width of the array
*
* @returns
*
* @remarks
* None
*
*******************************************************************************
*/
void ihevc_inter_pred_luma_vert(UWORD8 *pu1_src,
                                UWORD8 *pu1_dst,
                                WORD32 src_strd,
                                WORD32 dst_strd,
                                WORD8 *pi1_coeff,
                                WORD32 ht,
                                WORD32 wd)
{
    WORD32 y, x, tap;
    WORD16 i2_sum;

    for(y = 0; y < ht; y++)
    {
        for(x = 0; x < wd; x++)
        {
            i2_sum = 0;
            for(tap = 0; tap < NTAPS_LUMA; tap++)
            {
                /* Taps walk down the column in steps of src_strd, */
                /* starting 3 strides before the current row.      */
                WORD32 row_ofs = (tap - 3) * src_strd;

                i2_sum += pi1_coeff[tap] * pu1_src[x + row_ofs];
            }

            /* Add OFFSET_14_MINUS_BIT_DEPTH, shift right by            */
            /* SHIFT_14_MINUS_BIT_DEPTH, then clip with CLIP_U8.        */
            i2_sum = (i2_sum + OFFSET_14_MINUS_BIT_DEPTH) >> SHIFT_14_MINUS_BIT_DEPTH;
            i2_sum = CLIP_U8(i2_sum);

            pu1_dst[x] = (UWORD8)i2_sum;
        }

        /* Next row */
        pu1_src += src_strd;
        pu1_dst += dst_strd;
    }
}
/**
*******************************************************************************
*
* @brief
* Interprediction luma filter for copy 16bit output
*
* @par Description:
* Copies the array of width 'wd' and height 'ht' from the location pointed
* by 'src' to the location pointed by 'dst' The output is upshifted by 6
* bits and is used as input for vertical filtering or weighted prediction
*
* @param[in] pu1_src
* UWORD8 pointer to the source
*
* @param[out] pi2_dst
* WORD16 pointer to the destination
*
* @param[in] src_strd
* integer source stride
*
* @param[in] dst_strd
* integer destination stride
*
* @param[in] pi1_coeff
* WORD8 pointer to the filter coefficients
*
* @param[in] ht
* integer height of the array
*
* @param[in] wd
* integer width of the array
*
* @returns
*
* @remarks
* None
*
*******************************************************************************
*/
void ihevc_inter_pred_luma_copy_w16out(UWORD8 *pu1_src,
                                       WORD16 *pi2_dst,
                                       WORD32 src_strd,
                                       WORD32 dst_strd,
                                       WORD8 *pi1_coeff,
                                       WORD32 ht,
                                       WORD32 wd)
{
    WORD32 y;

    /* No filter is applied, so pi1_coeff is ignored. */
    UNUSED(pi1_coeff);

    for(y = 0; y < ht; y++)
    {
        WORD32 x;

        /* Widen each 8-bit sample to 16 bits, scaled up by */
        /* SHIFT_14_MINUS_BIT_DEPTH bits.                   */
        for(x = 0; x < wd; x++)
        {
            pi2_dst[x] = (pu1_src[x] << SHIFT_14_MINUS_BIT_DEPTH);
        }

        /* dst_strd is applied to a WORD16 pointer, i.e. it counts */
        /* 16-bit elements, not bytes.                             */
        pu1_src += src_strd;
        pi2_dst += dst_strd;
    }
}
/**
*******************************************************************************
*
* @brief
* Interprediction luma filter for horizontal 16bit output
*
* @par Description:
* Applies a horizontal filter with coefficients pointed to by 'pi1_coeff'
* to the elements pointed by 'pu1_src' and writes to the location pointed
* by 'pi2_dst'. No downshifting or clipping is done and the output is used
* as an input for vertical filtering or weighted prediction.
*
* @param[in] pu1_src
* UWORD8 pointer to the source
*
* @param[out] pi2_dst
* WORD16 pointer to the destination
*
* @param[in] src_strd
* integer source stride
*
* @param[in] dst_strd
* integer destination stride
*
* @param[in] pi1_coeff
* WORD8 pointer to the filter coefficients
*
* @param[in] ht
* integer height of the array
*
* @param[in] wd
* integer width of the array
*
* @returns
*
* @remarks
* None
*
*******************************************************************************
*/
void ihevc_inter_pred_luma_horz_w16out(UWORD8 *pu1_src,
                                       WORD16 *pi2_dst,
                                       WORD32 src_strd,
                                       WORD32 dst_strd,
                                       WORD8 *pi1_coeff,
                                       WORD32 ht,
                                       WORD32 wd)
{
    WORD32 y, x, tap;
    WORD16 i2_sum;

    for(y = 0; y < ht; y++)
    {
        for(x = 0; x < wd; x++)
        {
            /* Tap 0 reads 3 samples before x, so every row is read from */
            /* index -3 up to (wd - 1) + (NTAPS_LUMA - 4).               */
            WORD32 first = x - 3;

            i2_sum = 0;
            for(tap = 0; tap < NTAPS_LUMA; tap++)
            {
                i2_sum += pi1_coeff[tap] * pu1_src[first + tap];
            }

            /* The raw filter sum is stored: no offset, shift or clip. */
            pi2_dst[x] = i2_sum;
        }

        /* Next row */
        pu1_src += src_strd;
        pi2_dst += dst_strd;
    }
}
/**
*******************************************************************************
*
* @brief
* Interprediction luma filter for vertical 16bit output
*
* @par Description:
* Applies a vertical filter with coefficients pointed to by 'pi1_coeff' to
* the elements pointed by 'pu1_src' and writes to the location pointed by
* 'pi2_dst'. No downshifting or clipping is done and the output is used as
* an input for weighted prediction.
*
* @param[in] pu1_src
* UWORD8 pointer to the source
*
* @param[out] pi2_dst
* WORD16 pointer to the destination
*
* @param[in] src_strd
* integer source stride
*
* @param[in] dst_strd
* integer destination stride
*
* @param[in] pi1_coeff
* WORD8 pointer to the filter coefficients
*
* @param[in] ht
* integer height of the array
*
* @param[in] wd
* integer width of the array
*
* @returns
*
* @remarks
* None
*
*******************************************************************************
*/
void ihevc_inter_pred_luma_vert_w16out(UWORD8 *pu1_src,
                                       WORD16 *pi2_dst,
                                       WORD32 src_strd,
                                       WORD32 dst_strd,
                                       WORD8 *pi1_coeff,
                                       WORD32 ht,
                                       WORD32 wd)
{
    WORD32 y, x, tap;
    WORD16 i2_sum;

    for(y = 0; y < ht; y++)
    {
        for(x = 0; x < wd; x++)
        {
            i2_sum = 0;
            for(tap = 0; tap < NTAPS_LUMA; tap++)
            {
                /* Taps walk down the column in steps of src_strd, */
                /* starting 3 strides before the current row.      */
                WORD32 row_ofs = (tap - 3) * src_strd;

                i2_sum += pi1_coeff[tap] * pu1_src[x + row_ofs];
            }

            /* The raw filter sum is stored: no offset, shift or clip. */
            pi2_dst[x] = i2_sum;
        }

        /* Next row */
        pu1_src += src_strd;
        pi2_dst += dst_strd;
    }
}
/**
*******************************************************************************
*
* @brief
*
* Luma vertical filter for 16bit input.
*
* @par Description:
* Applies a vertical filter with coefficients pointed to by 'pi1_coeff' to
* the elements pointed by 'pi2_src' and writes to the location pointed by
* 'pu1_dst'. Input is 16 bits. The filter output is downshifted by 12 and
* clipped to lie between 0 and 255.
*
* @param[in] pi2_src
* WORD16 pointer to the source
*
* @param[out] pu1_dst
* UWORD8 pointer to the destination
*
* @param[in] src_strd
* integer source stride
*
* @param[in] dst_strd
* integer destination stride
*
* @param[in] pi1_coeff
* WORD8 pointer to the filter coefficients
*
* @param[in] ht
* integer height of the array
*
* @param[in] wd
* integer width of the array
*
* @returns
*
* @remarks
* None
*
*******************************************************************************
*/
void ihevc_inter_pred_luma_vert_w16inp(WORD16 *pi2_src,
                                       UWORD8 *pu1_dst,
                                       WORD32 src_strd,
                                       WORD32 dst_strd,
                                       WORD8 *pi1_coeff,
                                       WORD32 ht,
                                       WORD32 wd)
{
    WORD32 y, x, tap;
    WORD32 i4_sum;

    for(y = 0; y < ht; y++)
    {
        for(x = 0; x < wd; x++)
        {
            i4_sum = 0;
            for(tap = 0; tap < NTAPS_LUMA; tap++)
            {
                /* Taps walk down the column in steps of src_strd, */
                /* starting 3 strides before the current row.      */
                WORD32 row_ofs = (tap - 3) * src_strd;

                i4_sum += pi1_coeff[tap] * pi2_src[x + row_ofs];
            }

            /* Two-stage scaling: a plain right shift first, then      */
            /* OFFSET_14_MINUS_BIT_DEPTH is added before the second    */
            /* right shift. The result is clipped with CLIP_U8.        */
            i4_sum >>= SHIFT_14_MINUS_BIT_DEPTH;
            i4_sum = (i4_sum + OFFSET_14_MINUS_BIT_DEPTH) >> SHIFT_14_MINUS_BIT_DEPTH;
            i4_sum = CLIP_U8(i4_sum);

            pu1_dst[x] = i4_sum;
        }

        /* src_strd is applied to a WORD16 pointer, i.e. it counts */
        /* 16-bit elements, not bytes.                             */
        pi2_src += src_strd;
        pu1_dst += dst_strd;
    }
}
/**
*******************************************************************************
*
* @brief
* Luma prediction filter for vertical 16bit input & output
*
* @par Description:
* Applies a vertical filter with coefficients pointed to by 'pi1_coeff' to
* the elements pointed by 'pi2_src' and writes to the location pointed by
* 'pi2_dst'. Input is 16 bits. The filter output is downshifted by 6 and
* 8192 is subtracted to store it as a 16 bit number. The output is used as
* an input to weighted prediction.
*
* @param[in] pi2_src
* WORD16 pointer to the source
*
* @param[out] pi2_dst
* WORD16 pointer to the destination
*
* @param[in] src_strd
* integer source stride
*
* @param[in] dst_strd
* integer destination stride
*
* @param[in] pi1_coeff
* WORD8 pointer to the filter coefficients
*
* @param[in] ht
* integer height of the array
*
* @param[in] wd
* integer width of the array
*
* @returns
*
* @remarks
* None
*
*******************************************************************************
*/
void ihevc_inter_pred_luma_vert_w16inp_w16out(WORD16 *pi2_src,
                                              WORD16 *pi2_dst,
                                              WORD32 src_strd,
                                              WORD32 dst_strd,
                                              WORD8 *pi1_coeff,
                                              WORD32 ht,
                                              WORD32 wd)
{
    WORD32 y, x, tap;
    WORD32 i4_sum;

    for(y = 0; y < ht; y++)
    {
        for(x = 0; x < wd; x++)
        {
            i4_sum = 0;
            for(tap = 0; tap < NTAPS_LUMA; tap++)
            {
                /* Taps walk down the column in steps of src_strd, */
                /* starting 3 strides before the current row.      */
                WORD32 row_ofs = (tap - 3) * src_strd;

                i4_sum += pi1_coeff[tap] * pi2_src[x + row_ofs];
            }

            /* Shift right by SHIFT_14_MINUS_BIT_DEPTH, then subtract */
            /* OFFSET14 before narrowing to the 16-bit destination.   */
            i4_sum >>= SHIFT_14_MINUS_BIT_DEPTH;
            i4_sum -= OFFSET14;

            pi2_dst[x] = i4_sum;
        }

        /* Both strides are applied to WORD16 pointers, i.e. they */
        /* count 16-bit elements, not bytes.                      */
        pi2_src += src_strd;
        pi2_dst += dst_strd;
    }
}
/**
*******************************************************************************
*
* @brief
* Chroma interprediction filter for copy
*
* @par Description:
* Copies the array of width 'wd' and height 'ht' from the location pointed
* by 'src' to the location pointed by 'dst'
*
* @param[in] pu1_src
* UWORD8 pointer to the source
*
* @param[out] pu1_dst
* UWORD8 pointer to the destination
*
* @param[in] src_strd
* integer source stride
*
* @param[in] dst_strd
* integer destination stride
*
* @param[in] pi1_coeff
* WORD8 pointer to the filter coefficients
*
* @param[in] ht
* integer height of the array
*
* @param[in] wd
* integer width of the array
*
* @returns
*
* @remarks
* None
*
*******************************************************************************
*/
void ihevc_inter_pred_chroma_copy(UWORD8 *pu1_src,
                                  UWORD8 *pu1_dst,
                                  WORD32 src_strd,
                                  WORD32 dst_strd,
                                  WORD8 *pi1_coeff,
                                  WORD32 ht,
                                  WORD32 wd)
{
    WORD32 y;

    /* Plain copy: no filter is applied, so pi1_coeff is ignored. */
    UNUSED(pi1_coeff);

    for(y = 0; y < ht; y++)
    {
        WORD32 x = 0;

        /* Each row carries 2 * wd samples, copied in increasing order. */
        while(x < 2 * wd)
        {
            pu1_dst[x] = pu1_src[x];
            x++;
        }

        /* Advance each pointer by its own stride to reach the next row. */
        pu1_src += src_strd;
        pu1_dst += dst_strd;
    }
}
/**
*******************************************************************************
*
* @brief
* Chroma interprediction filter for horizontal input
*
* @par Description:
* Applies a horizontal filter with coefficients pointed to by 'pi1_coeff'
* to the elements pointed by 'pu1_src' and writes to the location pointed
* by 'pu1_dst' The output is downshifted by 6 and clipped to 8 bits
*
* @param[in] pu1_src
* UWORD8 pointer to the source
*
* @param[out] pu1_dst
* UWORD8 pointer to the destination
*
* @param[in] src_strd
* integer source stride
*
* @param[in] dst_strd
* integer destination stride
*
* @param[in] pi1_coeff
* WORD8 pointer to the filter coefficients
*
* @param[in] ht
* integer height of the array
*
* @param[in] wd
* integer width of the array
*
* @returns
*
* @remarks
* None
*
*******************************************************************************
*/
void ihevc_inter_pred_chroma_horz(UWORD8 *pu1_src,
                                  UWORD8 *pu1_dst,
                                  WORD32 src_strd,
                                  WORD32 dst_strd,
                                  WORD8 *pi1_coeff,
                                  WORD32 ht,
                                  WORD32 wd)
{
    WORD32 y, pos, tap;
    WORD16 i2_even, i2_odd;

    for(y = 0; y < ht; y++)
    {
        /* Each row carries 2 * wd samples, handled as wd pairs. */
        for(pos = 0; pos < 2 * wd; pos += 2)
        {
            i2_even = 0;
            i2_odd = 0;

            /* Taps are spaced 2 samples apart, so the even-indexed and  */
            /* odd-indexed samples of a row are filtered independently.  */
            /* Tap 0 reads 2 samples before the pair.                    */
            for(tap = 0; tap < NTAPS_CHROMA; tap++)
            {
                WORD32 ofs = pos + (tap - 1) * 2;

                i2_even += pi1_coeff[tap] * pu1_src[ofs];
                i2_odd += pi1_coeff[tap] * pu1_src[ofs + 1];
            }

            /* Add OFFSET_14_MINUS_BIT_DEPTH, shift right by            */
            /* SHIFT_14_MINUS_BIT_DEPTH, then clip with CLIP_U8.        */
            i2_even = (i2_even + OFFSET_14_MINUS_BIT_DEPTH) >> SHIFT_14_MINUS_BIT_DEPTH;
            i2_even = CLIP_U8(i2_even);

            i2_odd = (i2_odd + OFFSET_14_MINUS_BIT_DEPTH) >> SHIFT_14_MINUS_BIT_DEPTH;
            i2_odd = CLIP_U8(i2_odd);

            /* Both results are written only after both sums are done. */
            pu1_dst[pos] = (UWORD8)i2_even;
            pu1_dst[pos + 1] = (UWORD8)i2_odd;
        }

        /* Next row */
        pu1_src += src_strd;
        pu1_dst += dst_strd;
    }
}
/**
*******************************************************************************
*
* @brief
* Chroma interprediction filter for vertical input
*
* @par Description:
* Applies a vertical filter with coefficients pointed to by 'pi1_coeff' to
* the elements pointed by 'pu1_src' and writes to the location pointed by
* 'pu1_dst'. The output is downshifted by 6 and clipped to 8 bits.
*
*
* @param[in] pu1_src
* UWORD8 pointer to the source
*
* @param[out] pu1_dst
* UWORD8 pointer to the destination
*
* @param[in] src_strd
* integer source stride
*
* @param[in] dst_strd
* integer destination stride
*
* @param[in] pi1_coeff
* WORD8 pointer to the filter coefficients
*
* @param[in] ht
* integer height of the array
*
* @param[in] wd
* integer width of the array
*
* @returns
*
* @remarks
* None
*
*******************************************************************************
*/
void ihevc_inter_pred_chroma_vert(UWORD8 *pu1_src,
                                  UWORD8 *pu1_dst,
                                  WORD32 src_strd,
                                  WORD32 dst_strd,
                                  WORD8 *pi1_coeff,
                                  WORD32 ht,
                                  WORD32 wd)
{
    WORD32 y, x, tap;
    WORD16 i2_sum;

    for(y = 0; y < ht; y++)
    {
        /* Each row carries 2 * wd samples; every one is filtered alike. */
        for(x = 0; x < 2 * wd; x++)
        {
            i2_sum = 0;
            for(tap = 0; tap < NTAPS_CHROMA; tap++)
            {
                /* Taps walk down the column in steps of src_strd, */
                /* starting 1 stride before the current row.       */
                WORD32 row_ofs = (tap - 1) * src_strd;

                i2_sum += pi1_coeff[tap] * pu1_src[x + row_ofs];
            }

            /* Add OFFSET_14_MINUS_BIT_DEPTH, shift right by            */
            /* SHIFT_14_MINUS_BIT_DEPTH, then clip with CLIP_U8.        */
            i2_sum = (i2_sum + OFFSET_14_MINUS_BIT_DEPTH) >> SHIFT_14_MINUS_BIT_DEPTH;
            i2_sum = CLIP_U8(i2_sum);

            pu1_dst[x] = (UWORD8)i2_sum;
        }

        /* Next row */
        pu1_src += src_strd;
        pu1_dst += dst_strd;
    }
}
/**
*******************************************************************************
*
* @brief
* chroma interprediction filter for copying 16bit output
*
* @par Description:
* Copies the array of width 'wd' and height 'ht' from the location pointed
* by 'src' to the location pointed by 'dst' The output is upshifted by 6
* bits and is used as input for vertical filtering or weighted prediction
*
* @param[in] pu1_src
* UWORD8 pointer to the source
*
* @param[out] pi2_dst
* WORD16 pointer to the destination
*
* @param[in] src_strd
* integer source stride
*
* @param[in] dst_strd
* integer destination stride
*
* @param[in] pi1_coeff
* WORD8 pointer to the filter coefficients
*
* @param[in] ht
* integer height of the array
*
* @param[in] wd
* integer width of the array
*
* @returns
*
* @remarks
* None
*
*******************************************************************************
*/
void ihevc_inter_pred_chroma_copy_w16out(UWORD8 *pu1_src,
                                         WORD16 *pi2_dst,
                                         WORD32 src_strd,
                                         WORD32 dst_strd,
                                         WORD8 *pi1_coeff,
                                         WORD32 ht,
                                         WORD32 wd)
{
    WORD32 y;

    /* No filter is applied, so pi1_coeff is ignored. */
    UNUSED(pi1_coeff);

    for(y = 0; y < ht; y++)
    {
        WORD32 x;

        /* Each row carries 2 * wd samples. Every 8-bit sample is     */
        /* widened to 16 bits, scaled up by SHIFT_14_MINUS_BIT_DEPTH. */
        for(x = 0; x < 2 * wd; x++)
        {
            pi2_dst[x] = (pu1_src[x] << SHIFT_14_MINUS_BIT_DEPTH);
        }

        /* dst_strd is applied to a WORD16 pointer, i.e. it counts */
        /* 16-bit elements, not bytes.                             */
        pu1_src += src_strd;
        pi2_dst += dst_strd;
    }
}
/**
*******************************************************************************
*
* @brief
* chroma interprediction filter to store horizontal 16bit output
*
* @par Description:
* Applies a horizontal filter with coefficients pointed to by 'pi1_coeff'
* to the elements pointed by 'pu1_src' and writes to the location pointed
* by 'pi2_dst'. No downshifting or clipping is done and the output is used
* as an input for vertical filtering or weighted prediction.
*
* @param[in] pu1_src
* UWORD8 pointer to the source
*
* @param[out] pi2_dst
* WORD16 pointer to the destination
*
* @param[in] src_strd
* integer source stride
*
* @param[in] dst_strd
* integer destination stride
*
* @param[in] pi1_coeff
* WORD8 pointer to the filter coefficients
*
* @param[in] ht
* integer height of the array
*
* @param[in] wd
* integer width of the array
*
* @returns
*
* @remarks
* None
*
*******************************************************************************
*/
void ihevc_inter_pred_chroma_horz_w16out(UWORD8 *pu1_src,
                                         WORD16 *pi2_dst,
                                         WORD32 src_strd,
                                         WORD32 dst_strd,
                                         WORD8 *pi1_coeff,
                                         WORD32 ht,
                                         WORD32 wd)
{
    WORD32 y, pos, tap;
    WORD16 i2_even, i2_odd;

    for(y = 0; y < ht; y++)
    {
        /* Each row carries 2 * wd samples, handled as wd pairs. */
        for(pos = 0; pos < 2 * wd; pos += 2)
        {
            i2_even = 0;
            i2_odd = 0;

            /* Taps are spaced 2 samples apart, so the even-indexed and  */
            /* odd-indexed samples of a row are filtered independently.  */
            /* Tap 0 reads 2 samples before the pair.                    */
            for(tap = 0; tap < NTAPS_CHROMA; tap++)
            {
                WORD32 ofs = pos + (tap - 1) * 2;

                i2_even += pi1_coeff[tap] * pu1_src[ofs];
                i2_odd += pi1_coeff[tap] * pu1_src[ofs + 1];
            }

            /* The raw filter sums are stored: no offset, shift or clip. */
            pi2_dst[pos] = i2_even;
            pi2_dst[pos + 1] = i2_odd;
        }

        /* Next row */
        pu1_src += src_strd;
        pi2_dst += dst_strd;
    }
}
/**
*******************************************************************************
*
* @brief
* Interprediction chroma filter to store vertical 16bit output
*
* @par Description:
* Applies a vertical filter with coefficients pointed to by 'pi1_coeff' to
* the elements pointed by 'pu1_src' and writes to the location pointed by
* 'pi2_dst'. No downshifting or clipping is done and the output is used as
* an input for weighted prediction.
*
* @param[in] pu1_src
* UWORD8 pointer to the source
*
* @param[out] pi2_dst
* WORD16 pointer to the destination
*
* @param[in] src_strd
* integer source stride
*
* @param[in] dst_strd
* integer destination stride
*
* @param[in] pi1_coeff
* WORD8 pointer to the filter coefficients
*
* @param[in] ht
* integer height of the array
*
* @param[in] wd
* integer width of the array
*
* @returns
*
* @remarks
* None
*
*******************************************************************************
*/
void ihevc_inter_pred_chroma_vert_w16out(UWORD8 *pu1_src,
                                         WORD16 *pi2_dst,
                                         WORD32 src_strd,
                                         WORD32 dst_strd,
                                         WORD8 *pi1_coeff,
                                         WORD32 ht,
                                         WORD32 wd)
{
    WORD32 y, x, tap;
    WORD16 i2_sum;

    for(y = 0; y < ht; y++)
    {
        /* Each row carries 2 * wd samples; every one is filtered alike. */
        for(x = 0; x < 2 * wd; x++)
        {
            i2_sum = 0;
            for(tap = 0; tap < NTAPS_CHROMA; tap++)
            {
                /* Taps walk down the column in steps of src_strd, */
                /* starting 1 stride before the current row.       */
                WORD32 row_ofs = (tap - 1) * src_strd;

                i2_sum += pi1_coeff[tap] * pu1_src[x + row_ofs];
            }

            /* The raw filter sum is stored: no offset, shift or clip. */
            pi2_dst[x] = i2_sum;
        }

        /* Next row */
        pu1_src += src_strd;
        pi2_dst += dst_strd;
    }
}
/**
*******************************************************************************
*
* @brief
* chroma interprediction filter for vertical 16bit input
*
* @par Description:
* Applies a vertical filter with coefficients pointed to by 'pi1_coeff' to
* the elements pointed by 'pi2_src' and writes to the location pointed by
* 'pu1_dst'. Input is 16 bits. The filter output is downshifted by 12 and
* clipped to lie between 0 and 255.
*
* @param[in] pi2_src
* WORD16 pointer to the source
*
* @param[out] pu1_dst
* UWORD8 pointer to the destination
*
* @param[in] src_strd
* integer source stride
*
* @param[in] dst_strd
* integer destination stride
*
* @param[in] pi1_coeff
* WORD8 pointer to the filter coefficients
*
* @param[in] ht
* integer height of the array
*
* @param[in] wd
* integer width of the array
*
* @returns
*
* @remarks
* None
*
*******************************************************************************
*/
void ihevc_inter_pred_chroma_vert_w16inp(WORD16 *pi2_src,
                                         UWORD8 *pu1_dst,
                                         WORD32 src_strd,
                                         WORD32 dst_strd,
                                         WORD8 *pi1_coeff,
                                         WORD32 ht,
                                         WORD32 wd)
{
    WORD32 y, x, tap;
    WORD32 i4_sum;

    for(y = 0; y < ht; y++)
    {
        /* Each row carries 2 * wd samples; every one is filtered alike. */
        for(x = 0; x < 2 * wd; x++)
        {
            i4_sum = 0;
            for(tap = 0; tap < NTAPS_CHROMA; tap++)
            {
                /* Taps walk down the column in steps of src_strd, */
                /* starting 1 stride before the current row.       */
                WORD32 row_ofs = (tap - 1) * src_strd;

                i4_sum += pi1_coeff[tap] * pi2_src[x + row_ofs];
            }

            /* Two-stage scaling: a plain right shift first, then      */
            /* OFFSET_14_MINUS_BIT_DEPTH is added before the second    */
            /* right shift. The result is clipped with CLIP_U8.        */
            i4_sum >>= SHIFT_14_MINUS_BIT_DEPTH;
            i4_sum = (i4_sum + OFFSET_14_MINUS_BIT_DEPTH) >> SHIFT_14_MINUS_BIT_DEPTH;
            i4_sum = CLIP_U8(i4_sum);

            pu1_dst[x] = i4_sum;
        }

        /* src_strd is applied to a WORD16 pointer, i.e. it counts */
        /* 16-bit elements, not bytes.                             */
        pi2_src += src_strd;
        pu1_dst += dst_strd;
    }
}
/**
*******************************************************************************
*
* @brief
*
* Chroma interprediction filter for 16bit vertical input and output.
*
* @par Description:
* Applies a vertical filter with coefficients pointed to by 'pi1_coeff' to
* the elements pointed by 'pi2_src' and writes to the location pointed by
* 'pi2_dst'. Input is 16 bits. The filter output is downshifted by 6 and
* stored as a 16 bit number. The output is used as an input to weighted
* prediction.
* NOTE(review): unlike ihevc_inter_pred_luma_vert_w16inp_w16out(), this
* function does not subtract OFFSET14 from the result - confirm intended.
*
* @param[in] pi2_src
* WORD16 pointer to the source
*
* @param[out] pi2_dst
* WORD16 pointer to the destination
*
* @param[in] src_strd
* integer source stride
*
* @param[in] dst_strd
* integer destination stride
*
* @param[in] pi1_coeff
* WORD8 pointer to the filter coefficients
*
* @param[in] ht
* integer height of the array
*
* @param[in] wd
* integer width of the array
*
* @returns
*
* @remarks
* None
*
*******************************************************************************
*/
void ihevc_inter_pred_chroma_vert_w16inp_w16out(WORD16 *pi2_src,
                                                WORD16 *pi2_dst,
                                                WORD32 src_strd,
                                                WORD32 dst_strd,
                                                WORD8 *pi1_coeff,
                                                WORD32 ht,
                                                WORD32 wd)
{
    WORD32 y, x, tap;
    WORD32 i4_sum;

    for(y = 0; y < ht; y++)
    {
        /* Each row carries 2 * wd samples; every one is filtered alike. */
        for(x = 0; x < 2 * wd; x++)
        {
            i4_sum = 0;
            for(tap = 0; tap < NTAPS_CHROMA; tap++)
            {
                /* Taps walk down the column in steps of src_strd, */
                /* starting 1 stride before the current row.       */
                WORD32 row_ofs = (tap - 1) * src_strd;

                i4_sum += pi1_coeff[tap] * pi2_src[x + row_ofs];
            }

            /* Only a right shift by SHIFT_14_MINUS_BIT_DEPTH is applied */
            /* here; no offset is added or subtracted before the store.  */
            i4_sum >>= SHIFT_14_MINUS_BIT_DEPTH;

            pi2_dst[x] = i4_sum;
        }

        /* Both strides are applied to WORD16 pointers, i.e. they */
        /* count 16-bit elements, not bytes.                      */
        pi2_src += src_strd;
        pi2_dst += dst_strd;
    }
}