| /* |
| * Copyright (c) 2011 The LibYuv project authors. All Rights Reserved. |
| * |
| * Use of this source code is governed by a BSD-style license |
| * that can be found in the LICENSE file in the root of the source |
| * tree. An additional intellectual property rights grant can be found |
| * in the file PATENTS. All contributing project authors may |
| * be found in the AUTHORS file in the root of the source tree. |
| */ |
| |
| #ifndef SOURCE_ROW_H_ |
| #define SOURCE_ROW_H_ |
| |
| #include "libyuv/basic_types.h" |
| |
| #ifdef __cplusplus |
| namespace libyuv { |
| extern "C" { |
| #endif |
| |
| // TODO(fbarchard): Remove kMaxStride |
| #define kMaxStride (2560 * 4) |
| #define IS_ALIGNED(p, a) (!((uintptr_t)(p) & ((a) - 1))) |
| |
| #if defined(COVERAGE_ENABLED) || defined(TARGET_IPHONE_SIMULATOR) |
| #define YUV_DISABLE_ASM |
| #endif |
| // True if compiling for SSSE3 as a requirement. |
| #if defined(__SSSE3__) || (defined(_M_IX86_FP) && (_M_IX86_FP >= 3)) |
| #define LIBYUV_SSSE3_ONLY |
| #endif |
| |
| // The following are available on all x86 platforms |
| #if !defined(YUV_DISABLE_ASM) && \ |
| (defined(_M_IX86) || defined(__x86_64__) || defined(__i386__)) |
| #define HAS_ABGRTOARGBROW_SSSE3 |
| #define HAS_ABGRTOUVROW_SSSE3 |
| #define HAS_ABGRTOYROW_SSSE3 |
| #define HAS_ARGB1555TOARGBROW_SSE2 |
| #define HAS_ARGB4444TOARGBROW_SSE2 |
| #define HAS_ARGBATTENUATE_SSSE3 |
| #define HAS_ARGBBLENDROW_SSSE3 |
| #define HAS_ARGBBLENDROW1_SSSE3 |
| #define HAS_ARGBTOARGB1555ROW_SSE2 |
| #define HAS_ARGBTOARGB4444ROW_SSE2 |
| #define HAS_ARGBTORAWROW_SSSE3 |
| #define HAS_ARGBTORGB24ROW_SSSE3 |
| #define HAS_ARGBTORGB565ROW_SSE2 |
| #define HAS_ARGBTOUVROW_SSSE3 |
| #define HAS_ARGBTOYROW_SSSE3 |
| #define HAS_ARGBUNATTENUATE_SSE2 |
| #define HAS_BGRATOARGBROW_SSSE3 |
| #define HAS_BGRATOUVROW_SSSE3 |
| #define HAS_BGRATOYROW_SSSE3 |
| #define HAS_COPYROW_SSE2 |
| #define HAS_COPYROW_X86 |
| #define HAS_I400TOARGBROW_SSE2 |
| #define HAS_I420TOABGRROW_SSSE3 |
| #define HAS_I420TOARGBROW_SSSE3 |
| #define HAS_I420TOBGRAROW_SSSE3 |
| #define HAS_I444TOARGBROW_SSSE3 |
| #define HAS_MIRRORROW_SSSE3 |
| #define HAS_MIRRORROWUV_SSSE3 |
| #define HAS_ADDROW_SSE2 |
| #define HAS_RAWTOARGBROW_SSSE3 |
| #define HAS_RGB24TOARGBROW_SSSE3 |
| #define HAS_RGB565TOARGBROW_SSE2 |
| #define HAS_SPLITUV_SSE2 |
| #define HAS_UYVYTOUVROW_SSE2 |
| #define HAS_UYVYTOYROW_SSE2 |
| #define HAS_YTOARGBROW_SSE2 |
| #define HAS_YUY2TOUVROW_SSE2 |
| #define HAS_YUY2TOYROW_SSE2 |
| #define HAS_ARGBGRAYROW_SSSE3 |
| #endif |
| |
| // The following are available only useful when SSSE3 is unavailable. |
| #if !defined(YUV_DISABLE_ASM) && \ |
| (defined(_M_IX86) || defined(__x86_64__) || defined(__i386__)) && \ |
| !defined(LIBYUV_SSSE3_ONLY) |
| #define HAS_MIRRORROW_SSE2 |
| #define HAS_ARGBATTENUATE_SSE2 |
| #define HAS_ARGBBLENDROW_SSE2 |
| #define HAS_ARGBBLENDROW1_SSE2 |
| #endif |
| |
| // The following are available on Neon platforms |
| #if !defined(YUV_DISABLE_ASM) && defined(__ARM_NEON__) |
| #define HAS_MIRRORROW_NEON |
| #define HAS_MIRRORROWUV_NEON |
| #define HAS_SPLITUV_NEON |
| #define HAS_COPYROW_NEON |
| #define HAS_I420TOARGBROW_NEON |
| #define HAS_I420TOBGRAROW_NEON |
| #define HAS_I420TOABGRROW_NEON |
| #endif |
| |
| #if defined(_MSC_VER) |
| #define SIMD_ALIGNED(var) __declspec(align(16)) var |
| typedef __declspec(align(16)) int8 vec8[16]; |
| typedef __declspec(align(16)) uint8 uvec8[16]; |
| typedef __declspec(align(16)) int16 vec16[8]; |
| typedef __declspec(align(16)) uint16 uvec16[8]; |
| typedef __declspec(align(16)) uint32 uvec32[4]; |
| #else // __GNUC__ |
| #define SIMD_ALIGNED(var) var __attribute__((aligned(16))) |
| typedef int8 __attribute__((vector_size(16))) vec8; |
| typedef uint8 __attribute__((vector_size(16))) uvec8; |
| typedef int16 __attribute__((vector_size(16))) vec16; |
| typedef uint16 __attribute__((vector_size(16))) uvec16; |
| typedef uint32 __attribute__((vector_size(16))) uvec32; |
| #endif |
| |
| #if defined(__APPLE__) || defined(__x86_64__) |
| #define OMITFP |
| #else |
| #define OMITFP __attribute__((optimize("omit-frame-pointer"))) |
| #endif |
| |
| void I420ToARGBRow_NEON(const uint8* y_buf, |
| const uint8* u_buf, |
| const uint8* v_buf, |
| uint8* rgb_buf, |
| int width); |
| void I420ToBGRARow_NEON(const uint8* y_buf, |
| const uint8* u_buf, |
| const uint8* v_buf, |
| uint8* rgb_buf, |
| int width); |
| void I420ToABGRRow_NEON(const uint8* y_buf, |
| const uint8* u_buf, |
| const uint8* v_buf, |
| uint8* rgb_buf, |
| int width); |
| |
| void ARGBToYRow_SSSE3(const uint8* src_argb, uint8* dst_y, int pix); |
| void BGRAToYRow_SSSE3(const uint8* src_argb, uint8* dst_y, int pix); |
| void ABGRToYRow_SSSE3(const uint8* src_argb, uint8* dst_y, int pix); |
| void ARGBToYRow_Unaligned_SSSE3(const uint8* src_argb, uint8* dst_y, int pix); |
| void BGRAToYRow_Unaligned_SSSE3(const uint8* src_argb, uint8* dst_y, int pix); |
| void ABGRToYRow_Unaligned_SSSE3(const uint8* src_argb, uint8* dst_y, int pix); |
| |
| void ARGBToUVRow_SSSE3(const uint8* src_argb0, int src_stride_argb, |
| uint8* dst_u, uint8* dst_v, int width); |
| void BGRAToUVRow_SSSE3(const uint8* src_argb0, int src_stride_argb, |
| uint8* dst_u, uint8* dst_v, int width); |
| void ABGRToUVRow_SSSE3(const uint8* src_argb0, int src_stride_argb, |
| uint8* dst_u, uint8* dst_v, int width); |
| void ARGBToUVRow_Unaligned_SSSE3(const uint8* src_argb0, int src_stride_argb, |
| uint8* dst_u, uint8* dst_v, int width); |
| void BGRAToUVRow_Unaligned_SSSE3(const uint8* src_argb0, int src_stride_argb, |
| uint8* dst_u, uint8* dst_v, int width); |
| void ABGRToUVRow_Unaligned_SSSE3(const uint8* src_argb0, int src_stride_argb, |
| uint8* dst_u, uint8* dst_v, int width); |
| |
| void MirrorRow_SSSE3(const uint8* src, uint8* dst, int width); |
| void MirrorRow_SSE2(const uint8* src, uint8* dst, int width); |
| void MirrorRow_NEON(const uint8* src, uint8* dst, int width); |
| void MirrorRow_C(const uint8* src, uint8* dst, int width); |
| |
| void MirrorRowUV_SSSE3(const uint8* src, uint8* dst_u, uint8* dst_v, int width); |
| void MirrorRowUV_NEON(const uint8* src, uint8* dst_u, uint8* dst_v, int width); |
| void MirrorRowUV_C(const uint8* src, uint8* dst_u, uint8* dst_v, int width); |
| |
| void AddRow_SSE2(const uint8* src, uint16* dst, int width); |
| void SubRow_SSE2(const uint8* src, uint16* dst, int width); |
| void AddRow_C(const uint8* src, uint16* dst, int width); |
| void SubRow_C(const uint8* src, uint16* dst, int width); |
| |
| void SplitUV_SSE2(const uint8* src_uv, uint8* dst_u, uint8* dst_v, int pix); |
| void SplitUV_NEON(const uint8* src_uv, uint8* dst_u, uint8* dst_v, int pix); |
| void SplitUV_C(const uint8* src_uv, uint8* dst_u, uint8* dst_v, int pix); |
| |
| void CopyRow_SSE2(const uint8* src, uint8* dst, int count); |
| void CopyRow_X86(const uint8* src, uint8* dst, int count); |
| void CopyRow_NEON(const uint8* src, uint8* dst, int count); |
| void CopyRow_C(const uint8* src, uint8* dst, int count); |
| |
| void ARGBToYRow_C(const uint8* src_argb, uint8* dst_y, int pix); |
| void BGRAToYRow_C(const uint8* src_argb, uint8* dst_y, int pix); |
| void ABGRToYRow_C(const uint8* src_argb, uint8* dst_y, int pix); |
| |
| void ARGBToUVRow_C(const uint8* src_argb0, int src_stride_argb, |
| uint8* dst_u, uint8* dst_v, int width); |
| void BGRAToUVRow_C(const uint8* src_argb0, int src_stride_argb, |
| uint8* dst_u, uint8* dst_v, int width); |
| void ABGRToUVRow_C(const uint8* src_argb0, int src_stride_argb, |
| uint8* dst_u, uint8* dst_v, int width); |
| |
| void ABGRToARGBRow_SSSE3(const uint8* src_abgr, uint8* dst_argb, int pix); |
| void BGRAToARGBRow_SSSE3(const uint8* src_bgra, uint8* dst_argb, int pix); |
| void RGB24ToARGBRow_SSSE3(const uint8* src_rgb24, uint8* dst_argb, int pix); |
| void RAWToARGBRow_SSSE3(const uint8* src_rgb24, uint8* dst_argb, int pix); |
| void ARGB1555ToARGBRow_SSE2(const uint8* src_argb, uint8* dst_argb, int pix); |
| void RGB565ToARGBRow_SSE2(const uint8* src_argb, uint8* dst_argb, int pix); |
| void ARGB4444ToARGBRow_SSE2(const uint8* src_argb, uint8* dst_argb, int pix); |
| |
| void ABGRToARGBRow_C(const uint8* src_abgr, uint8* dst_argb, int pix); |
| void BGRAToARGBRow_C(const uint8* src_bgra, uint8* dst_argb, int pix); |
| void RGB24ToARGBRow_C(const uint8* src_rgb24, uint8* dst_argb, int pix); |
| void RAWToARGBRow_C(const uint8* src_rgb24, uint8* dst_argb, int pix); |
| void RGB565ToARGBRow_C(const uint8* src_rgb, uint8* dst_argb, int pix); |
| void ARGB1555ToARGBRow_C(const uint8* src_argb, uint8* dst_argb, int pix); |
| void ARGB4444ToARGBRow_C(const uint8* src_argb, uint8* dst_argb, int pix); |
| |
| void ARGBToRGB24Row_SSSE3(const uint8* src_argb, uint8* dst_rgb, int pix); |
| void ARGBToRAWRow_SSSE3(const uint8* src_argb, uint8* dst_rgb, int pix); |
| void ARGBToRGB565Row_SSE2(const uint8* src_argb, uint8* dst_rgb, int pix); |
| void ARGBToARGB1555Row_SSE2(const uint8* src_argb, uint8* dst_rgb, int pix); |
| void ARGBToARGB4444Row_SSE2(const uint8* src_argb, uint8* dst_rgb, int pix); |
| |
| void ARGBToRGB24Row_C(const uint8* src_argb, uint8* dst_rgb, int pix); |
| void ARGBToRAWRow_C(const uint8* src_argb, uint8* dst_rgb, int pix); |
| void ARGBToRGB565Row_C(const uint8* src_argb, uint8* dst_rgb, int pix); |
| void ARGBToARGB1555Row_C(const uint8* src_argb, uint8* dst_rgb, int pix); |
| void ARGBToARGB4444Row_C(const uint8* src_argb, uint8* dst_rgb, int pix); |
| |
| void I400ToARGBRow_SSE2(const uint8* src_y, uint8* dst_argb, int pix); |
| void I400ToARGBRow_C(const uint8* src_y, uint8* dst_argb, int pix); |
| |
| void I420ToARGBRow_C(const uint8* y_buf, |
| const uint8* u_buf, |
| const uint8* v_buf, |
| uint8* rgb_buf, |
| int width); |
| |
| void I420ToBGRARow_C(const uint8* y_buf, |
| const uint8* u_buf, |
| const uint8* v_buf, |
| uint8* rgb_buf, |
| int width); |
| |
| void I420ToABGRRow_C(const uint8* y_buf, |
| const uint8* u_buf, |
| const uint8* v_buf, |
| uint8* rgb_buf, |
| int width); |
| |
| void I444ToARGBRow_C(const uint8* y_buf, |
| const uint8* u_buf, |
| const uint8* v_buf, |
| uint8* rgb_buf, |
| int width); |
| |
| void YToARGBRow_C(const uint8* y_buf, |
| uint8* rgb_buf, |
| int width); |
| |
| void I420ToARGBRow_SSSE3(const uint8* y_buf, |
| const uint8* u_buf, |
| const uint8* v_buf, |
| uint8* rgb_buf, |
| int width); |
| |
| void I420ToBGRARow_SSSE3(const uint8* y_buf, |
| const uint8* u_buf, |
| const uint8* v_buf, |
| uint8* rgb_buf, |
| int width); |
| |
| void I420ToABGRRow_SSSE3(const uint8* y_buf, |
| const uint8* u_buf, |
| const uint8* v_buf, |
| uint8* rgb_buf, |
| int width); |
| |
| void I420ToARGBRow_Unaligned_SSSE3(const uint8* y_buf, |
| const uint8* u_buf, |
| const uint8* v_buf, |
| uint8* rgb_buf, |
| int width); |
| |
| void I420ToBGRARow_Unaligned_SSSE3(const uint8* y_buf, |
| const uint8* u_buf, |
| const uint8* v_buf, |
| uint8* rgb_buf, |
| int width); |
| |
| void I420ToABGRRow_Unaligned_SSSE3(const uint8* y_buf, |
| const uint8* u_buf, |
| const uint8* v_buf, |
| uint8* rgb_buf, |
| int width); |
| |
| void I444ToARGBRow_SSSE3(const uint8* y_buf, |
| const uint8* u_buf, |
| const uint8* v_buf, |
| uint8* rgb_buf, |
| int width); |
| |
| void YToARGBRow_SSE2(const uint8* y_buf, |
| uint8* rgb_buf, |
| int width); |
| |
| // ARGB preattenuated alpha blend. |
| void ARGBBlendRow_Aligned_SSSE3(const uint8* src_argb0, const uint8* src_argb1, |
| uint8* dst_argb, int width); |
| void ARGBBlendRow_Aligned_SSE2(const uint8* src_argb0, const uint8* src_argb1, |
| uint8* dst_argb, int width); |
| void ARGBBlendRow1_SSSE3(const uint8* src_argb0, const uint8* src_argb1, |
| uint8* dst_argb, int width); |
| void ARGBBlendRow1_SSE2(const uint8* src_argb0, const uint8* src_argb1, |
| uint8* dst_argb, int width); |
| void ARGBBlendRow_Any_SSSE3(const uint8* src_argb0, const uint8* src_argb1, |
| uint8* dst_argb, int width); |
| void ARGBBlendRow_Any_SSE2(const uint8* src_argb0, const uint8* src_argb1, |
| uint8* dst_argb, int width); |
| void ARGBBlendRow_C(const uint8* src_argb0, const uint8* src_argb1, |
| uint8* dst_argb, int width); |
| |
| // 'Any' functions handle any size and alignment. |
| void I420ToARGBRow_Any_SSSE3(const uint8* y_buf, |
| const uint8* u_buf, |
| const uint8* v_buf, |
| uint8* rgb_buf, |
| int width); |
| |
| void I420ToBGRARow_Any_SSSE3(const uint8* y_buf, |
| const uint8* u_buf, |
| const uint8* v_buf, |
| uint8* rgb_buf, |
| int width); |
| |
| void I420ToABGRRow_Any_SSSE3(const uint8* y_buf, |
| const uint8* u_buf, |
| const uint8* v_buf, |
| uint8* rgb_buf, |
| int width); |
| |
| void ARGBToRGB24Row_Any_SSSE3(const uint8* src_argb, uint8* dst_rgb, int pix); |
| void ARGBToRAWRow_Any_SSSE3(const uint8* src_argb, uint8* dst_rgb, int pix); |
| void ARGBToRGB565Row_Any_SSE2(const uint8* src_argb, uint8* dst_rgb, int pix); |
| void ARGBToARGB1555Row_Any_SSE2(const uint8* src_argb, uint8* dst_rgb, int pix); |
| void ARGBToARGB4444Row_Any_SSE2(const uint8* src_argb, uint8* dst_rgb, int pix); |
| |
| void ARGBToYRow_Any_SSSE3(const uint8* src_argb, uint8* dst_y, int pix); |
| void BGRAToYRow_Any_SSSE3(const uint8* src_argb, uint8* dst_y, int pix); |
| void ABGRToYRow_Any_SSSE3(const uint8* src_argb, uint8* dst_y, int pix); |
| void ARGBToUVRow_Any_SSSE3(const uint8* src_argb0, int src_stride_argb, |
| uint8* dst_u, uint8* dst_v, int width); |
| void BGRAToUVRow_Any_SSSE3(const uint8* src_argb0, int src_stride_argb, |
| uint8* dst_u, uint8* dst_v, int width); |
| void ABGRToUVRow_Any_SSSE3(const uint8* src_argb0, int src_stride_argb, |
| uint8* dst_u, uint8* dst_v, int width); |
| |
| void I420ToARGBRow_Any_NEON(const uint8* y_buf, |
| const uint8* u_buf, |
| const uint8* v_buf, |
| uint8* rgb_buf, |
| int width); |
| |
| void I420ToBGRARow_Any_NEON(const uint8* y_buf, |
| const uint8* u_buf, |
| const uint8* v_buf, |
| uint8* rgb_buf, |
| int width); |
| |
| void I420ToABGRRow_Any_NEON(const uint8* y_buf, |
| const uint8* u_buf, |
| const uint8* v_buf, |
| uint8* rgb_buf, |
| int width); |
| |
| void YUY2ToYRow_SSE2(const uint8* src_yuy2, uint8* dst_y, int pix); |
| void YUY2ToUVRow_SSE2(const uint8* src_yuy2, int stride_yuy2, |
| uint8* dst_u, uint8* dst_y, int pix); |
| void YUY2ToYRow_Unaligned_SSE2(const uint8* src_yuy2, |
| uint8* dst_y, int pix); |
| void YUY2ToUVRow_Unaligned_SSE2(const uint8* src_yuy2, int stride_yuy2, |
| uint8* dst_u, uint8* dst_y, int pix); |
| |
| void UYVYToYRow_SSE2(const uint8* src_uyvy, uint8* dst_y, int pix); |
| void UYVYToUVRow_SSE2(const uint8* src_uyvy, int stride_uyvy, |
| uint8* dst_u, uint8* dst_y, int pix); |
| void UYVYToYRow_Unaligned_SSE2(const uint8* src_uyvy, |
| uint8* dst_y, int pix); |
| void UYVYToUVRow_Unaligned_SSE2(const uint8* src_uyvy, int stride_uyvy, |
| uint8* dst_u, uint8* dst_y, int pix); |
| |
| void YUY2ToUVRow_C(const uint8* src_yuy2, int src_stride_yuy2, |
| uint8* dst_u, uint8* dst_v, int pix); |
| void YUY2ToYRow_C(const uint8* src_yuy2, uint8* dst_y, int pix); |
| void UYVYToUVRow_C(const uint8* src_uyvy, int src_stride_uyvy, |
| uint8* dst_u, uint8* dst_v, int pix); |
| void UYVYToYRow_C(const uint8* src_uyvy, uint8* dst_y, int pix); |
| |
| void YUY2ToUVRow_Any_SSE2(const uint8* src_yuy2, int src_stride_yuy2, |
| uint8* dst_u, uint8* dst_v, int pix); |
| void YUY2ToYRow_Any_SSE2(const uint8* src_yuy2, uint8* dst_y, int pix); |
| void UYVYToUVRow_Any_SSE2(const uint8* src_uyvy, int src_stride_uyvy, |
| uint8* dst_u, uint8* dst_v, int pix); |
| void UYVYToYRow_Any_SSE2(const uint8* src_uyvy, uint8* dst_y, int pix); |
| |
| void ARGBAttenuateRow_C(const uint8* src_argb, uint8* dst_argb, int width); |
| void ARGBAttenuateRow_SSE2(const uint8* src_argb, uint8* dst_argb, int width); |
| void ARGBAttenuateRow_SSSE3(const uint8* src_argb, uint8* dst_argb, int width); |
| |
| // Inverse table for unattenuate, shared by C and SSE2. |
| extern uint32 fixed_invtbl8[256]; |
| void ARGBUnattenuateRow_C(const uint8* src_argb, uint8* dst_argb, int width); |
| void ARGBUnattenuateRow_SSE2(const uint8* src_argb, uint8* dst_argb, int width); |
| |
| void ARGBGrayRow_C(uint8* dst_argb, int width); |
| void ARGBGrayRow_SSSE3(uint8* dst_argb, int width); |
| |
| #ifdef __cplusplus |
| } // extern "C" |
| } // namespace libyuv |
| #endif |
| |
| #endif // SOURCE_ROW_H_ |