blob: 2c5d9a4f6a575a121c1ade6a5be572f1827c491d [file] [log] [blame]
/*
* Copyright (c) 2017 The WebM project authors. All Rights Reserved.
*
* Use of this source code is governed by a BSD-style license
* that can be found in the LICENSE file in the root of the source
* tree. An additional intellectual property rights grant can be found
* in the file PATENTS. All contributing project authors may
* be found in the AUTHORS file in the root of the source tree.
*/
#ifndef VPX_DSP_PPC_BITDEPTH_CONVERSION_VSX_H_
#define VPX_DSP_PPC_BITDEPTH_CONVERSION_VSX_H_
#include "./vpx_config.h"
#include "vpx/vpx_integer.h"
#include "vpx_dsp/vpx_dsp_common.h"
#include "vpx_dsp/ppc/types_vsx.h"
// Load 8 16 bit values. If the source is 32 bits then pack down with
// saturation.
static INLINE int16x8_t load_tran_low(int32_t c, const tran_low_t *s) {
#if CONFIG_VP9_HIGHBITDEPTH
int32x4_t u = vec_vsx_ld(c, s);
int32x4_t v = vec_vsx_ld(c, s + 4);
return vec_packs(u, v);
#else
return vec_vsx_ld(c, s);
#endif
}
// Store 8 16 bit values. If the destination is 32 bits then sign extend the
// values by multiplying by 1.
static INLINE void store_tran_low(int16x8_t v, int32_t c, tran_low_t *s) {
#if CONFIG_VP9_HIGHBITDEPTH
const int16x8_t one = vec_splat_s16(1);
const int32x4_t even = vec_mule(v, one);
const int32x4_t odd = vec_mulo(v, one);
const int32x4_t high = vec_mergeh(even, odd);
const int32x4_t low = vec_mergel(even, odd);
vec_vsx_st(high, c, s);
vec_vsx_st(low, c, s + 4);
#else
vec_vsx_st(v, c, s);
#endif
}
#endif // VPX_DSP_PPC_BITDEPTH_CONVERSION_VSX_H_