| /* |
| * Copyright (c) 2011 The LibYuv project authors. All Rights Reserved. |
| * |
| * Use of this source code is governed by a BSD-style license |
| * that can be found in the LICENSE file in the root of the source |
| * tree. An additional intellectual property rights grant can be found |
| * in the file PATENTS. All contributing project authors may |
| * be found in the AUTHORS file in the root of the source tree. |
| */ |
| |
| #include "row.h" |
| |
| #include "libyuv/basic_types.h" |
| #include <string.h> // For memcpy |
| |
| #ifdef __cplusplus |
| namespace libyuv { |
| extern "C" { |
| #endif |
| |
| void ABGRToARGBRow_C(const uint8* src_abgr, uint8* dst_argb, int width) { |
| for (int x = 0; x < width; ++x) { |
| // To support in-place conversion. |
| uint8 r = src_abgr[0]; |
| uint8 g = src_abgr[1]; |
| uint8 b = src_abgr[2]; |
| uint8 a = src_abgr[3]; |
| dst_argb[0] = b; |
| dst_argb[1] = g; |
| dst_argb[2] = r; |
| dst_argb[3] = a; |
| dst_argb += 4; |
| src_abgr += 4; |
| } |
| } |
| |
| void BGRAToARGBRow_C(const uint8* src_bgra, uint8* dst_argb, int width) { |
| for (int x = 0; x < width; ++x) { |
| // To support in-place conversion. |
| uint8 a = src_bgra[0]; |
| uint8 r = src_bgra[1]; |
| uint8 g = src_bgra[2]; |
| uint8 b = src_bgra[3]; |
| dst_argb[0] = b; |
| dst_argb[1] = g; |
| dst_argb[2] = r; |
| dst_argb[3] = a; |
| dst_argb += 4; |
| src_bgra += 4; |
| } |
| } |
| |
| void RGB24ToARGBRow_C(const uint8* src_rgb24, uint8* dst_argb, int width) { |
| for (int x = 0; x < width; ++x) { |
| uint8 b = src_rgb24[0]; |
| uint8 g = src_rgb24[1]; |
| uint8 r = src_rgb24[2]; |
| dst_argb[0] = b; |
| dst_argb[1] = g; |
| dst_argb[2] = r; |
| dst_argb[3] = 255u; |
| dst_argb += 4; |
| src_rgb24 += 3; |
| } |
| } |
| |
| void RAWToARGBRow_C(const uint8* src_raw, uint8* dst_argb, int width) { |
| for (int x = 0; x < width; ++x) { |
| uint8 r = src_raw[0]; |
| uint8 g = src_raw[1]; |
| uint8 b = src_raw[2]; |
| dst_argb[0] = b; |
| dst_argb[1] = g; |
| dst_argb[2] = r; |
| dst_argb[3] = 255u; |
| dst_argb += 4; |
| src_raw += 3; |
| } |
| } |
| |
| void RGB565ToARGBRow_C(const uint8* src_rgb, uint8* dst_argb, int width) { |
| for (int x = 0; x < width; ++x) { |
| uint8 b = src_rgb[0] & 0x1f; |
| uint8 g = (src_rgb[0] >> 5) | ((src_rgb[1] & 0x07) << 3); |
| uint8 r = src_rgb[1] >> 3; |
| dst_argb[0] = (b << 3) | (b >> 2); |
| dst_argb[1] = (g << 2) | (g >> 4); |
| dst_argb[2] = (r << 3) | (r >> 2); |
| dst_argb[3] = 255u; |
| dst_argb += 4; |
| src_rgb += 2; |
| } |
| } |
| |
| void ARGB1555ToARGBRow_C(const uint8* src_rgb, uint8* dst_argb, int width) { |
| for (int x = 0; x < width; ++x) { |
| uint8 b = src_rgb[0] & 0x1f; |
| uint8 g = (src_rgb[0] >> 5) | ((src_rgb[1] & 0x03) << 3); |
| uint8 r = (src_rgb[1] & 0x7c) >> 2; |
| uint8 a = src_rgb[1] >> 7; |
| dst_argb[0] = (b << 3) | (b >> 2); |
| dst_argb[1] = (g << 3) | (g >> 2); |
| dst_argb[2] = (r << 3) | (r >> 2); |
| dst_argb[3] = -a; |
| dst_argb += 4; |
| src_rgb += 2; |
| } |
| } |
| |
| void ARGB4444ToARGBRow_C(const uint8* src_rgb, uint8* dst_argb, int width) { |
| for (int x = 0; x < width; ++x) { |
| uint8 a = src_rgb[1] >> 4; |
| uint8 r = src_rgb[1] & 0x0f; |
| uint8 g = src_rgb[0] >> 4; |
| uint8 b = src_rgb[0] & 0x0f; |
| dst_argb[0] = (b << 4) | b; |
| dst_argb[1] = (g << 4) | g; |
| dst_argb[2] = (r << 4) | r; |
| dst_argb[3] = (a << 4) | a; |
| dst_argb += 4; |
| src_rgb += 2; |
| } |
| } |
| |
| void ARGBToRGB24Row_C(const uint8* src_argb, uint8* dst_rgb, int width) { |
| for (int x = 0; x < width; ++x) { |
| uint8 b = src_argb[0]; |
| uint8 g = src_argb[1]; |
| uint8 r = src_argb[2]; |
| dst_rgb[0] = b; |
| dst_rgb[1] = g; |
| dst_rgb[2] = r; |
| dst_rgb += 3; |
| src_argb += 4; |
| } |
| } |
| |
| void ARGBToRAWRow_C(const uint8* src_argb, uint8* dst_rgb, int width) { |
| for (int x = 0; x < width; ++x) { |
| uint8 b = src_argb[0]; |
| uint8 g = src_argb[1]; |
| uint8 r = src_argb[2]; |
| dst_rgb[0] = r; |
| dst_rgb[1] = g; |
| dst_rgb[2] = b; |
| dst_rgb += 3; |
| src_argb += 4; |
| } |
| } |
| |
| // TODO(fbarchard): support big endian CPU |
| void ARGBToRGB565Row_C(const uint8* src_argb, uint8* dst_rgb, int width) { |
| for (int x = 0; x < width; ++x) { |
| uint8 b = src_argb[0] >> 3; |
| uint8 g = src_argb[1] >> 2; |
| uint8 r = src_argb[2] >> 3; |
| *reinterpret_cast<uint16*>(dst_rgb) = (r << 11) | (g << 5) | b; |
| dst_rgb += 2; |
| src_argb += 4; |
| } |
| } |
| |
| void ARGBToARGB1555Row_C(const uint8* src_argb, uint8* dst_rgb, int width) { |
| for (int x = 0; x < width; ++x) { |
| uint8 b = src_argb[0] >> 3; |
| uint8 g = src_argb[1] >> 3; |
| uint8 r = src_argb[2] >> 3; |
| uint8 a = src_argb[2] >> 7; |
| *reinterpret_cast<uint16*>(dst_rgb) = (a << 15) | (r << 10) | (g << 5) | b; |
| dst_rgb += 2; |
| src_argb += 4; |
| } |
| } |
| |
| void ARGBToARGB4444Row_C(const uint8* src_argb, uint8* dst_rgb, int width) { |
| for (int x = 0; x < width; ++x) { |
| uint8 b = src_argb[0] >> 4; |
| uint8 g = src_argb[1] >> 4; |
| uint8 r = src_argb[2] >> 4; |
| uint8 a = src_argb[2] >> 4; |
| *reinterpret_cast<uint16*>(dst_rgb) = (a << 12) | (r << 8) | (g << 4) | b; |
| dst_rgb += 2; |
| src_argb += 4; |
| } |
| } |
| |
| static __inline int RGBToY(uint8 r, uint8 g, uint8 b) { |
| return (( 66 * r + 129 * g + 25 * b + 128) >> 8) + 16; |
| } |
| |
| static __inline int RGBToU(uint8 r, uint8 g, uint8 b) { |
| return ((-38 * r - 74 * g + 112 * b + 128) >> 8) + 128; |
| } |
| static __inline int RGBToV(uint8 r, uint8 g, uint8 b) { |
| return ((112 * r - 94 * g - 18 * b + 128) >> 8) + 128; |
| } |
| |
| #define MAKEROWY(NAME,R,G,B) \ |
| void NAME ## ToYRow_C(const uint8* src_argb0, uint8* dst_y, int width) { \ |
| for (int x = 0; x < width; ++x) { \ |
| dst_y[0] = RGBToY(src_argb0[R], src_argb0[G], src_argb0[B]); \ |
| src_argb0 += 4; \ |
| dst_y += 1; \ |
| } \ |
| } \ |
| void NAME ## ToUVRow_C(const uint8* src_rgb0, int src_stride_rgb, \ |
| uint8* dst_u, uint8* dst_v, int width) { \ |
| const uint8* src_rgb1 = src_rgb0 + src_stride_rgb; \ |
| for (int x = 0; x < width - 1; x += 2) { \ |
| uint8 ab = (src_rgb0[B] + src_rgb0[B + 4] + \ |
| src_rgb1[B] + src_rgb1[B + 4]) >> 2; \ |
| uint8 ag = (src_rgb0[G] + src_rgb0[G + 4] + \ |
| src_rgb1[G] + src_rgb1[G + 4]) >> 2; \ |
| uint8 ar = (src_rgb0[R] + src_rgb0[R + 4] + \ |
| src_rgb1[R] + src_rgb1[R + 4]) >> 2; \ |
| dst_u[0] = RGBToU(ar, ag, ab); \ |
| dst_v[0] = RGBToV(ar, ag, ab); \ |
| src_rgb0 += 8; \ |
| src_rgb1 += 8; \ |
| dst_u += 1; \ |
| dst_v += 1; \ |
| } \ |
| if (width & 1) { \ |
| uint8 ab = (src_rgb0[B] + src_rgb1[B]) >> 1; \ |
| uint8 ag = (src_rgb0[G] + src_rgb1[G]) >> 1; \ |
| uint8 ar = (src_rgb0[R] + src_rgb1[R]) >> 1; \ |
| dst_u[0] = RGBToU(ar, ag, ab); \ |
| dst_v[0] = RGBToV(ar, ag, ab); \ |
| } \ |
| } |
| |
| MAKEROWY(ARGB,2,1,0) |
| MAKEROWY(BGRA,1,2,3) |
| MAKEROWY(ABGR,0,1,2) |
| |
| void I400ToARGBRow_C(const uint8* src_y, uint8* dst_argb, int width) { |
| // Copy a Y to RGB. |
| for (int x = 0; x < width; ++x) { |
| uint8 y = src_y[0]; |
| dst_argb[2] = dst_argb[1] = dst_argb[0] = y; |
| dst_argb[3] = 255u; |
| dst_argb += 4; |
| ++src_y; |
| } |
| } |
| |
| // C reference code that mimics the YUV assembly. |
| |
| #define YG 74 /* static_cast<int8>(1.164 * 64 + 0.5) */ |
| |
| #define UB 127 /* min(63,static_cast<int8>(2.018 * 64)) */ |
| #define UG -25 /* static_cast<int8>(-0.391 * 64 - 0.5) */ |
| #define UR 0 |
| |
| #define VB 0 |
| #define VG -52 /* static_cast<int8>(-0.813 * 64 - 0.5) */ |
| #define VR 102 /* static_cast<int8>(1.596 * 64 + 0.5) */ |
| |
| // Bias |
| #define BB UB * 128 + VB * 128 |
| #define BG UG * 128 + VG * 128 |
| #define BR UR * 128 + VR * 128 |
| |
| static __inline uint32 Clip(int32 val) { |
| if (val < 0) { |
| return (uint32) 0; |
| } else if (val > 255){ |
| return (uint32) 255; |
| } |
| return (uint32) val; |
| } |
| |
| static __inline void YuvPixel(uint8 y, uint8 u, uint8 v, uint8* rgb_buf, |
| int ashift, int rshift, int gshift, int bshift) { |
| int32 y1 = (static_cast<int32>(y) - 16) * YG; |
| uint32 b = Clip(static_cast<int32>((u * UB + v * VB) - (BB) + y1) >> 6); |
| uint32 g = Clip(static_cast<int32>((u * UG + v * VG) - (BG) + y1) >> 6); |
| uint32 r = Clip(static_cast<int32>((u * UR + v * VR) - (BR) + y1) >> 6); |
| *reinterpret_cast<uint32*>(rgb_buf) = (b << bshift) | |
| (g << gshift) | |
| (r << rshift) | |
| (255u << ashift); |
| } |
| |
| void I420ToARGBRow_C(const uint8* y_buf, |
| const uint8* u_buf, |
| const uint8* v_buf, |
| uint8* rgb_buf, |
| int width) { |
| for (int x = 0; x < width - 1; x += 2) { |
| YuvPixel(y_buf[0], u_buf[0], v_buf[0], rgb_buf + 0, 24, 16, 8, 0); |
| YuvPixel(y_buf[1], u_buf[0], v_buf[0], rgb_buf + 4, 24, 16, 8, 0); |
| y_buf += 2; |
| u_buf += 1; |
| v_buf += 1; |
| rgb_buf += 8; // Advance 2 pixels. |
| } |
| if (width & 1) { |
| YuvPixel(y_buf[0], u_buf[0], v_buf[0], rgb_buf + 0, 24, 16, 8, 0); |
| } |
| } |
| |
| void I420ToBGRARow_C(const uint8* y_buf, |
| const uint8* u_buf, |
| const uint8* v_buf, |
| uint8* rgb_buf, |
| int width) { |
| for (int x = 0; x < width - 1; x += 2) { |
| YuvPixel(y_buf[0], u_buf[0], v_buf[0], rgb_buf + 0, 0, 8, 16, 24); |
| YuvPixel(y_buf[1], u_buf[0], v_buf[0], rgb_buf + 4, 0, 8, 16, 24); |
| y_buf += 2; |
| u_buf += 1; |
| v_buf += 1; |
| rgb_buf += 8; // Advance 2 pixels. |
| } |
| if (width & 1) { |
| YuvPixel(y_buf[0], u_buf[0], v_buf[0], rgb_buf, 0, 8, 16, 24); |
| } |
| } |
| |
| void I420ToABGRRow_C(const uint8* y_buf, |
| const uint8* u_buf, |
| const uint8* v_buf, |
| uint8* rgb_buf, |
| int width) { |
| for (int x = 0; x < width - 1; x += 2) { |
| YuvPixel(y_buf[0], u_buf[0], v_buf[0], rgb_buf + 0, 24, 0, 8, 16); |
| YuvPixel(y_buf[1], u_buf[0], v_buf[0], rgb_buf + 4, 24, 0, 8, 16); |
| y_buf += 2; |
| u_buf += 1; |
| v_buf += 1; |
| rgb_buf += 8; // Advance 2 pixels. |
| } |
| if (width & 1) { |
| YuvPixel(y_buf[0], u_buf[0], v_buf[0], rgb_buf + 0, 24, 0, 8, 16); |
| } |
| } |
| |
| void I444ToARGBRow_C(const uint8* y_buf, |
| const uint8* u_buf, |
| const uint8* v_buf, |
| uint8* rgb_buf, |
| int width) { |
| for (int x = 0; x < width; ++x) { |
| YuvPixel(y_buf[0], u_buf[0], v_buf[0], rgb_buf, 24, 16, 8, 0); |
| y_buf += 1; |
| u_buf += 1; |
| v_buf += 1; |
| rgb_buf += 4; // Advance 1 pixel. |
| } |
| } |
| |
| void YToARGBRow_C(const uint8* y_buf, uint8* rgb_buf, int width) { |
| for (int x = 0; x < width; ++x) { |
| YuvPixel(y_buf[0], 128, 128, rgb_buf, 24, 16, 8, 0); |
| y_buf += 1; |
| rgb_buf += 4; // Advance 1 pixel. |
| } |
| } |
| |
| void MirrorRow_C(const uint8* src, uint8* dst, int width) { |
| src += width - 1; |
| for (int x = 0; x < width - 1; x += 2) { |
| dst[x] = src[0]; |
| dst[x + 1] = src[-1]; |
| src -= 2; |
| } |
| if (width & 1) { |
| dst[width - 1] = src[0]; |
| } |
| } |
| |
| void MirrorRowUV_C(const uint8* src_uv, uint8* dst_u, uint8* dst_v, int width) { |
| src_uv += (width - 1) << 1; |
| for (int x = 0; x < width - 1; x += 2) { |
| dst_u[x] = src_uv[0]; |
| dst_u[x + 1] = src_uv[-2]; |
| dst_v[x] = src_uv[1]; |
| dst_v[x + 1] = src_uv[-2 + 1]; |
| src_uv -= 4; |
| } |
| if (width & 1) { |
| dst_u[width - 1] = src_uv[0]; |
| dst_v[width - 1] = src_uv[1]; |
| } |
| } |
| |
| void SplitUV_C(const uint8* src_uv, uint8* dst_u, uint8* dst_v, int width) { |
| for (int x = 0; x < width - 1; x += 2) { |
| dst_u[x] = src_uv[0]; |
| dst_u[x + 1] = src_uv[2]; |
| dst_v[x] = src_uv[1]; |
| dst_v[x + 1] = src_uv[3]; |
| src_uv += 4; |
| } |
| if (width & 1) { |
| dst_u[width - 1] = src_uv[0]; |
| dst_v[width - 1] = src_uv[1]; |
| } |
| } |
| |
| void CopyRow_C(const uint8* src, uint8* dst, int count) { |
| memcpy(dst, src, count); |
| } |
| |
| // Filter 2 rows of YUY2 UV's (422) into U and V (420) |
| void YUY2ToUVRow_C(const uint8* src_yuy2, int src_stride_yuy2, |
| uint8* dst_u, uint8* dst_v, int width) { |
| // Output a row of UV values, filtering 2 rows of YUY2 |
| for (int x = 0; x < width; x += 2) { |
| dst_u[0] = (src_yuy2[1] + src_yuy2[src_stride_yuy2 + 1] + 1) >> 1; |
| dst_v[0] = (src_yuy2[3] + src_yuy2[src_stride_yuy2 + 3] + 1) >> 1; |
| src_yuy2 += 4; |
| dst_u += 1; |
| dst_v += 1; |
| } |
| } |
| |
| void YUY2ToYRow_C(const uint8* src_yuy2, uint8* dst_y, int width) { |
| // Copy a row of yuy2 Y values |
| for (int x = 0; x < width - 1; x += 2) { |
| dst_y[x] = src_yuy2[0]; |
| dst_y[x + 1] = src_yuy2[2]; |
| src_yuy2 += 4; |
| } |
| if (width & 1) { |
| dst_y[width - 1] = src_yuy2[0]; |
| } |
| } |
| |
| void UYVYToUVRow_C(const uint8* src_uyvy, int src_stride_uyvy, |
| uint8* dst_u, uint8* dst_v, int width) { |
| // Copy a row of uyvy UV values |
| for (int x = 0; x < width; x += 2) { |
| dst_u[0] = (src_uyvy[0] + src_uyvy[src_stride_uyvy + 0] + 1) >> 1; |
| dst_v[0] = (src_uyvy[2] + src_uyvy[src_stride_uyvy + 2] + 1) >> 1; |
| src_uyvy += 4; |
| dst_u += 1; |
| dst_v += 1; |
| } |
| } |
| |
| void UYVYToYRow_C(const uint8* src_yuy2, uint8* dst_y, int width) { |
| // Copy a row of uyvy Y values |
| for (int x = 0; x < width - 1; x += 2) { |
| dst_y[x] = src_yuy2[1]; |
| dst_y[x + 1] = src_yuy2[3]; |
| src_yuy2 += 4; |
| } |
| if (width & 1) { |
| dst_y[width - 1] = src_yuy2[1]; |
| } |
| } |
| |
| #define BLENDER(f, b, a) (f * a + b * (a ^ 0xff) + 0x80) >> 8 |
| void ARGBBlendRow_C(const uint8* src_argb, uint8* dst_argb, int width) { |
| for (int x = 0; x < width - 1; x += 2) { |
| uint32 a = src_argb[3]; |
| if (a) { |
| if (a < 255) { |
| const uint32 fb = src_argb[0]; |
| const uint32 fg = src_argb[1]; |
| const uint32 fr = src_argb[2]; |
| const uint32 bb = dst_argb[0]; |
| const uint32 bg = dst_argb[1]; |
| const uint32 br = dst_argb[2]; |
| dst_argb[0] = BLENDER(fb, bb, a); |
| dst_argb[1] = BLENDER(fg, bg, a); |
| dst_argb[2] = BLENDER(fr, br, a); |
| dst_argb[3] = 255u; |
| } else { |
| *(uint32*)dst_argb = *(uint32*)src_argb; |
| } |
| } |
| a = src_argb[4 + 3]; |
| if (a) { |
| if (a < 255) { |
| const uint32 fb = src_argb[4 + 0]; |
| const uint32 fg = src_argb[4 + 1]; |
| const uint32 fr = src_argb[4 + 2]; |
| const uint32 bb = dst_argb[4 + 0]; |
| const uint32 bg = dst_argb[4 + 1]; |
| const uint32 br = dst_argb[4 + 2]; |
| dst_argb[4 + 0] = BLENDER(fb, bb, a); |
| dst_argb[4 + 1] = BLENDER(fg, bg, a); |
| dst_argb[4 + 2] = BLENDER(fr, br, a); |
| dst_argb[4 + 3] = 255u; |
| } else { |
| *(uint32*)(dst_argb + 4) = *(uint32*)(src_argb + 4); |
| } |
| } |
| src_argb += 8; |
| dst_argb += 8; |
| } |
| |
| if (width & 1) { |
| const uint32 a = src_argb[3]; |
| if (a) { |
| if (a < 255) { |
| const uint32 fb = src_argb[0]; |
| const uint32 fg = src_argb[1]; |
| const uint32 fr = src_argb[2]; |
| const uint32 bb = dst_argb[0]; |
| const uint32 bg = dst_argb[1]; |
| const uint32 br = dst_argb[2]; |
| dst_argb[0] = BLENDER(fb, bb, a); |
| dst_argb[1] = BLENDER(fg, bg, a); |
| dst_argb[2] = BLENDER(fr, br, a); |
| dst_argb[3] = 255u; |
| } else { |
| *(uint32*)dst_argb = *(uint32*)src_argb; |
| } |
| } |
| } |
| } |
| |
| #if 0 |
| void ARGBBlendRow_C(const uint8* src_argb, uint8* dst_argb, int width) { |
| for (int x = 0; x < width - 1; x += 2) { |
| uint32 f = *(uint32*)src_argb; |
| uint32 a = f >> 24; |
| if (a) { |
| const uint32 b = *(uint32*)dst_argb; |
| if (a < 255) { |
| const uint32 src_rb = f & 0x00ff00ff; |
| const uint32 dst_rb = b & 0x00ff00ff; |
| const uint32 out_rb = (src_rb * a + dst_rb * (a ^ 0xff) + 0x00800080) & |
| 0xff00ff00; |
| |
| const uint32 src_g = f & 0x0000ff00; |
| const uint32 dst_g = b & 0x0000ff00; |
| const uint32 out_g = ((src_g * a + dst_g * (a ^ 0xff) + 0x00008000) & |
| 0x00ff0000); |
| |
| f = ((out_rb | out_g) >> 8) | 0xff000000; |
| } |
| *(uint32*)dst_argb = f; |
| } |
| |
| f = *(uint32*)(src_argb + 4); |
| a = f >> 24; |
| if (a) { |
| const uint32 b = *(uint32*)(dst_argb + 4); |
| if (a < 255) { |
| const uint32 src_rb = f & 0x00ff00ff; |
| const uint32 dst_rb = b & 0x00ff00ff; |
| const uint32 out_rb = (src_rb * a + dst_rb * (a ^ 0xff) + 0x00800080) & |
| 0xff00ff00; |
| |
| const uint32 src_g = f & 0x0000ff00; |
| const uint32 dst_g = b & 0x0000ff00; |
| const uint32 out_g = ((src_g * a + dst_g * (a ^ 0xff) + 0x00008000) & |
| 0x00ff0000); |
| |
| f = ((out_rb | out_g) >> 8) | 0xff000000; |
| } |
| *(uint32*)(dst_argb + 4) = f; |
| } |
| src_argb += 8; |
| dst_argb += 8; |
| } |
| |
| if (width & 1) { |
| uint32 f = *(uint32*)src_argb; |
| uint32 a = f >> 24; |
| if (a) { |
| const uint32 b = *(uint32*)dst_argb; |
| if (a < 255) { |
| const uint32 src_rb = f & 0x00ff00ff; |
| const uint32 dst_rb = b & 0x00ff00ff; |
| const uint32 out_rb = (src_rb * a + dst_rb * (a ^ 0xff) + 0x00800080) & |
| 0xff00ff00; |
| |
| const uint32 src_g = f & 0x0000ff00; |
| const uint32 dst_g = b & 0x0000ff00; |
| const uint32 out_g = ((src_g * a + dst_g * (a ^ 0xff) + 0x00008000) & |
| 0x00ff0000); |
| |
| f = ((out_rb | out_g) >> 8) | 0xff000000; |
| } |
| *(uint32*)dst_argb = f; |
| } |
| } |
| } |
| #endif |
| |
| // Wrappers to handle odd sizes/alignments |
| #define MAKEYUVANY(NAMEANY, NAME, COPYROW) \ |
| void NAMEANY(const uint8* y_buf, \ |
| const uint8* u_buf, \ |
| const uint8* v_buf, \ |
| uint8* rgb_buf, \ |
| int width) { \ |
| SIMD_ALIGNED(uint8 row[kMaxStride]); \ |
| NAME(y_buf, u_buf, v_buf, row, width); \ |
| COPYROW(row, rgb_buf, width << 2); \ |
| } |
| |
| #if defined(HAS_I420TOARGBROW_SSSE3) |
| MAKEYUVANY(I420ToARGBRow_Any_SSSE3, I420ToARGBRow_SSSE3, CopyRow_X86) |
| MAKEYUVANY(I420ToBGRARow_Any_SSSE3, I420ToBGRARow_SSSE3, CopyRow_X86) |
| MAKEYUVANY(I420ToABGRRow_Any_SSSE3, I420ToABGRRow_SSSE3, CopyRow_X86) |
| #endif |
| #if defined(HAS_I420TOARGBROW_NEON) |
| MAKEYUVANY(I420ToARGBRow_Any_NEON, I420ToARGBRow_NEON, CopyRow_C) |
| MAKEYUVANY(I420ToBGRARow_Any_NEON, I420ToBGRARow_NEON, CopyRow_C) |
| MAKEYUVANY(I420ToABGRRow_Any_NEON, I420ToABGRRow_NEON, CopyRow_C) |
| #endif |
| |
| #define MAKEYUVANYRGB(NAMEANY, ARGBTORGB, BPP) \ |
| void NAMEANY(const uint8* argb_buf, \ |
| uint8* rgb_buf, \ |
| int width) { \ |
| SIMD_ALIGNED(uint8 row[kMaxStride]); \ |
| ARGBTORGB(argb_buf, row, width); \ |
| memcpy(rgb_buf, row, width * BPP); \ |
| } |
| |
| #if defined(HAS_ARGBTORGB24ROW_SSSE3) |
| MAKEYUVANYRGB(ARGBToRGB24Row_Any_SSSE3, ARGBToRGB24Row_SSSE3, 3) |
| MAKEYUVANYRGB(ARGBToRAWRow_Any_SSSE3, ARGBToRAWRow_SSSE3, 3) |
| MAKEYUVANYRGB(ARGBToRGB565Row_Any_SSE2, ARGBToRGB565Row_SSE2, 2) |
| MAKEYUVANYRGB(ARGBToARGB1555Row_Any_SSE2, ARGBToARGB1555Row_SSE2, 2) |
| MAKEYUVANYRGB(ARGBToARGB4444Row_Any_SSE2, ARGBToARGB4444Row_SSE2, 2) |
| #endif |
| |
| #ifdef HAS_ARGBTOYROW_SSSE3 |
| |
| #define MAKEYANY(NAMEANY, ARGBTOY_SSE, BPP) \ |
| void NAMEANY(const uint8* src_argb, uint8* dst_y, int width) { \ |
| ARGBTOY_SSE(src_argb, dst_y, width - 16); \ |
| ARGBTOY_SSE(src_argb + (width - 16) * BPP, dst_y + (width - 16), 16); \ |
| } |
| |
| MAKEYANY(ARGBToYRow_Any_SSSE3, ARGBToYRow_Unaligned_SSSE3, 4) |
| MAKEYANY(BGRAToYRow_Any_SSSE3, BGRAToYRow_Unaligned_SSSE3, 4) |
| MAKEYANY(ABGRToYRow_Any_SSSE3, ABGRToYRow_Unaligned_SSSE3, 4) |
| MAKEYANY(YUY2ToYRow_Any_SSE2, YUY2ToYRow_Unaligned_SSE2, 2) |
| MAKEYANY(UYVYToYRow_Any_SSE2, UYVYToYRow_Unaligned_SSE2, 2) |
| |
| #define MAKEUVANY(NAMEANY, ARGBTOUV_SSE, ARGBTOUV_C, BPP) \ |
| void NAMEANY(const uint8* src_argb0, int src_stride_argb, \ |
| uint8* dst_u, uint8* dst_v, int width) { \ |
| ARGBTOUV_SSE(src_argb0, src_stride_argb, dst_u, dst_v, width & ~15); \ |
| ARGBTOUV_C(src_argb0 + (width & ~15) * BPP, src_stride_argb, \ |
| dst_u + (width & ~15) / 2, dst_v + (width & ~15) / 2, \ |
| width & 15); \ |
| } |
| |
| MAKEUVANY(ARGBToUVRow_Any_SSSE3, ARGBToUVRow_Unaligned_SSSE3, ARGBToUVRow_C, 4) |
| MAKEUVANY(BGRAToUVRow_Any_SSSE3, BGRAToUVRow_Unaligned_SSSE3, BGRAToUVRow_C, 4) |
| MAKEUVANY(ABGRToUVRow_Any_SSSE3, ABGRToUVRow_Unaligned_SSSE3, ABGRToUVRow_C, 4) |
| MAKEUVANY(YUY2ToUVRow_Any_SSE2, YUY2ToUVRow_Unaligned_SSE2, YUY2ToUVRow_C, 2) |
| MAKEUVANY(UYVYToUVRow_Any_SSE2, UYVYToUVRow_Unaligned_SSE2, UYVYToUVRow_C, 2) |
| #endif |
| |
| #ifdef __cplusplus |
| } // extern "C" |
| } // namespace libyuv |
| #endif |