17#ifndef FREERDP_LIB_PRIM_INTERNAL_H
18#define FREERDP_LIB_PRIM_INTERNAL_H
20#include <winpr/platform.h>
21#include <freerdp/config.h>
23#include <freerdp/primitives.h>
24#include <freerdp/api.h>
26#include <freerdp/log.h>
28#include "../core/simd.h"
/* Tag string for this module, built by FREERDP_TAG from "primitives".
 * NOTE(review): presumably consumed by the logging macros from
 * <freerdp/log.h> - confirm against the users of PRIM_TAG. */
30#define PRIM_TAG FREERDP_TAG("primitives")
/* PRIM_ALIGN_128 requests 16-byte (128-bit) alignment. Two spellings are
 * provided: the __attribute__((aligned)) form below and a __declspec(align)
 * form after it. NOTE(review): the preprocessor conditional that selects
 * between them is not visible in this view. */
33#define PRIM_ALIGN_128 __attribute__((aligned(16)))
36#define PRIM_ALIGN_128 __declspec(align(16))
/* HAVE_OPTIMIZED_PRIMITIVES is defined to 1 when any of the SSE/AVX intrinsics,
 * NEON intrinsics or OpenCL build options is defined. */
40#if defined(SSE_AVX_INTRINSICS_ENABLED) || defined(NEON_INTRINSICS_ENABLED) || defined(WITH_OPENCL)
41#define HAVE_OPTIMIZED_PRIMITIVES 1
/* HAVE_CPU_OPTIMIZED_PRIMITIVES is the narrower variant: it is defined to 1
 * only for the SSE/AVX or NEON intrinsics options; WITH_OPENCL alone does not
 * enable it. */
44#if defined(SSE_AVX_INTRINSICS_ENABLED) || defined(NEON_INTRINSICS_ENABLED)
45#define HAVE_CPU_OPTIMIZED_PRIMITIVES 1
/* Pixel writer selected by getPixelWriteFunction() for PIXEL_FORMAT_BGRA32 /
 * PIXEL_FORMAT_BGRX32 when useAlpha is set. Takes the destination pointer,
 * the per-pixel size, the format and the colour components, and returns a
 * BYTE*. NOTE(review): the rest of the parameter list and the statements that
 * store the pixel are not visible in this view. */
48static INLINE BYTE* writePixelBGRA(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G,
/* formatSize is explicitly marked as unused by this writer. */
51 WINPR_UNUSED(formatSize);
/* Pixel writer selected by getPixelWriteFunction() for PIXEL_FORMAT_BGRA32 /
 * PIXEL_FORMAT_BGRX32 when useAlpha is not set. Same parameter shape as the
 * other writePixel* helpers; returns a BYTE*. NOTE(review): the rest of the
 * parameter list and the statements that store the pixel are not visible in
 * this view. */
61static INLINE BYTE* writePixelBGRX(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G,
/* formatSize is explicitly marked as unused by this writer. */
64 WINPR_UNUSED(formatSize);
/* Pixel writer selected by getPixelWriteFunction() for PIXEL_FORMAT_RGBA32 /
 * PIXEL_FORMAT_RGBX32 when useAlpha is set. Same parameter shape as the other
 * writePixel* helpers; returns a BYTE*. NOTE(review): the rest of the
 * parameter list and the statements that store the pixel are not visible in
 * this view. */
76static INLINE BYTE* writePixelRGBA(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G,
/* formatSize is explicitly marked as unused by this writer. */
79 WINPR_UNUSED(formatSize);
/* Pixel writer selected by getPixelWriteFunction() for PIXEL_FORMAT_RGBA32 /
 * PIXEL_FORMAT_RGBX32 when useAlpha is not set. Same parameter shape as the
 * other writePixel* helpers; returns a BYTE*. NOTE(review): the rest of the
 * parameter list and the statements that store the pixel are not visible in
 * this view. */
89static INLINE BYTE* writePixelRGBX(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G,
/* formatSize is explicitly marked as unused by this writer. */
92 WINPR_UNUSED(formatSize);
/* Pixel writer selected by getPixelWriteFunction() for PIXEL_FORMAT_ABGR32 /
 * PIXEL_FORMAT_XBGR32 when useAlpha is set. Same parameter shape as the other
 * writePixel* helpers; returns a BYTE*. NOTE(review): the rest of the
 * parameter list and the statements that store the pixel are not visible in
 * this view. */
104static INLINE BYTE* writePixelABGR(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G,
/* Neither formatSize nor format is used here; both are explicitly marked
 * as unused. */
107 WINPR_UNUSED(formatSize);
108 WINPR_UNUSED(format);
/* Pixel writer selected by getPixelWriteFunction() for PIXEL_FORMAT_ABGR32 /
 * PIXEL_FORMAT_XBGR32 when useAlpha is not set. Same parameter shape as the
 * other writePixel* helpers; returns a BYTE*. NOTE(review): the rest of the
 * parameter list and the statements that store the pixel are not visible in
 * this view. */
117static INLINE BYTE* writePixelXBGR(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G,
/* Neither formatSize nor format is used here; both are explicitly marked
 * as unused. */
120 WINPR_UNUSED(formatSize);
121 WINPR_UNUSED(format);
/* Pixel writer selected by getPixelWriteFunction() for PIXEL_FORMAT_ARGB32 /
 * PIXEL_FORMAT_XRGB32 when useAlpha is set. Same parameter shape as the other
 * writePixel* helpers; returns a BYTE*. NOTE(review): the rest of the
 * parameter list and the statements that store the pixel are not visible in
 * this view. */
131static INLINE BYTE* writePixelARGB(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G,
/* Neither formatSize nor format is used here; both are explicitly marked
 * as unused. */
134 WINPR_UNUSED(formatSize);
135 WINPR_UNUSED(format);
/* Pixel writer selected by getPixelWriteFunction() for PIXEL_FORMAT_ARGB32 /
 * PIXEL_FORMAT_XRGB32 when useAlpha is not set. Same parameter shape as the
 * other writePixel* helpers; returns a BYTE*. NOTE(review): the rest of the
 * parameter list and the statements that store the pixel are not visible in
 * this view. */
144static INLINE BYTE* writePixelXRGB(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G,
/* Neither formatSize nor format is used here; both are explicitly marked
 * as unused. */
147 WINPR_UNUSED(formatSize);
148 WINPR_UNUSED(format);
/* Format-agnostic pixel writer that keeps the alpha component.
 *
 * dst        - destination for the pixel
 * formatSize - amount by which dst is advanced for the return value
 * format     - pixel format passed to the colour helpers
 * R, G, B, A - colour components to encode
 *
 * Returns dst + formatSize.
 * NOTE(review): the enclosing braces are missing from this view. */
158static INLINE BYTE* writePixelGenericAlpha(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R,
159 BYTE G, BYTE B, BYTE A)
/* Pack the four components into a colour value for the requested format. */
161 UINT32 color = FreeRDPGetColor(format, R, G, B, A);
/* Store the packed colour at dst (alpha-preserving variant). */
162 FreeRDPWriteColor(dst, format, color);
163 return dst + formatSize;
/* Format-agnostic pixel writer that stores the colour through
 * FreeRDPWriteColorIgnoreAlpha instead of FreeRDPWriteColor. Otherwise it
 * follows the same steps as writePixelGenericAlpha: pack with FreeRDPGetColor,
 * write at dst, return dst + formatSize.
 * NOTE(review): the tail of the parameter list (the body uses B and A) and the
 * enclosing braces are not visible in this view. */
166static INLINE BYTE* writePixelGeneric(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G,
/* A is still passed to FreeRDPGetColor; only the write step ignores alpha. */
169 UINT32 color = FreeRDPGetColor(format, R, G, B, A);
170 FreeRDPWriteColorIgnoreAlpha(dst, format, color);
171 return dst + formatSize;
/* Function-pointer type shared by the writePixel* helpers and returned by
 * getPixelWriteFunction(). Argument order, as spelled out by
 * writePixelGenericAlpha: dst, formatSize, format, R, G, B, A; the result is
 * a BYTE*. */
174typedef BYTE* (*fkt_writePixel)(BYTE*, DWORD, UINT32, BYTE, BYTE, BYTE, BYTE);
/* Picks the pixel writer for a destination format.
 *
 * format   - destination pixel format (PIXEL_FORMAT_* value)
 * useAlpha - selects the alpha-carrying writer (A variants) when TRUE,
 *            otherwise the X variant of the same channel order
 *
 * Returns a fkt_writePixel function pointer.
 * NOTE(review): the switch statement, braces and default label are missing
 * from this view; the final return is presumably the default branch used for
 * every format not listed in a case - confirm. */
176static INLINE fkt_writePixel getPixelWriteFunction(DWORD format, BOOL useAlpha)
/* Both the alpha and the non-alpha format of a channel order share one case
 * group; useAlpha alone decides which writer is returned. */
180 case PIXEL_FORMAT_ARGB32:
181 case PIXEL_FORMAT_XRGB32:
182 return useAlpha ? writePixelARGB : writePixelXRGB;
184 case PIXEL_FORMAT_ABGR32:
185 case PIXEL_FORMAT_XBGR32:
186 return useAlpha ? writePixelABGR : writePixelXBGR;
188 case PIXEL_FORMAT_RGBA32:
189 case PIXEL_FORMAT_RGBX32:
190 return useAlpha ? writePixelRGBA : writePixelRGBX;
192 case PIXEL_FORMAT_BGRA32:
193 case PIXEL_FORMAT_BGRX32:
194 return useAlpha ? writePixelBGRA : writePixelBGRX;
/* Generic writers that go through FreeRDPGetColor / FreeRDPWriteColor*. */
197 return useAlpha ? writePixelGenericAlpha : writePixelGeneric;
/* Maps a 64-bit signed value to a BYTE.
 * NOTE(review): the body is not visible in this view; presumably it clamps X
 * to the BYTE range - confirm. */
201static INLINE BYTE CLIP(INT64 X)
/* Derives a BYTE from `in`, taking the previous value `original` into account.
 * NOTE(review): only two statements of the body are visible. They compute
 * `diff` as the difference between `out` and `original`, once in each
 * direction, which looks like an absolute-difference computation. How `out`
 * is obtained, what `diff` is compared against and what is returned cannot be
 * determined from this view. */
212static INLINE BYTE CONDITIONAL_CLIP(INT32 in, BYTE original)
217 diff = out - original;
219 diff = original - out;
/* Pre-processing applied to the Y component before it enters the
 * YUV2R / YUV2G / YUV2B formulas.
 * NOTE(review): the body is not visible in this view. */
230static INLINE INT32 C(INT32 Y)
/* Pre-processing applied to the U component before it enters the
 * YUV2R / YUV2G / YUV2B formulas.
 * NOTE(review): the body is not visible in this view. */
235static INLINE INT32 D(INT32 U)
/* Pre-processing applied to the V component before it enters the
 * YUV2R / YUV2G / YUV2B formulas.
 * NOTE(review): the body is not visible in this view. */
240static INLINE INT32 E(INT32 V)
/* Red component of a YUV -> RGB conversion, in integer arithmetic.
 * NOTE(review): the return statement is not visible in this view; presumably
 * r8 is clamped to a BYTE before being returned - confirm. */
245static INLINE BYTE YUV2R(INT32 Y, INT32 U, INT32 V)
/* Weighted sum of the pre-processed components; the U weight is 0 for red. */
247 const INT32 r = (256 * C(Y) + 0 * D(U) + 403 * E(V));
/* Shift right by 8, i.e. scale the weighted sum down by 256. */
248 const INT32 r8 = r >> 8;
/* Green component of a YUV -> RGB conversion, in integer arithmetic.
 * NOTE(review): the return statement is not visible in this view; presumably
 * g8 is clamped to a BYTE before being returned - confirm. */
252static INLINE BYTE YUV2G(INT32 Y, INT32 U, INT32 V)
/* Weighted sum of the pre-processed components; both chroma terms are
 * subtracted for green. */
254 const INT32 g = (256 * C(Y) - 48 * D(U) - 120 * E(V));
/* Shift right by 8, i.e. scale the weighted sum down by 256. */
255 const INT32 g8 = g >> 8;
/* Blue component of a YUV -> RGB conversion, in integer arithmetic.
 * NOTE(review): the return statement is not visible in this view; presumably
 * b8 is clamped to a BYTE before being returned - confirm. */
259static INLINE BYTE YUV2B(INT32 Y, INT32 U, INT32 V)
/* Weighted sum of the pre-processed components; the V weight is 0 for blue. */
261 const INT32 b = (256 * C(Y) + 475 * D(U) + 0 * E(V));
/* Shift right by 8, i.e. scale the weighted sum down by 256. */
262 const INT32 b8 = b >> 8;
/* Luma (Y) of an RGB triple: (54*R + 183*G + 18*B) >> 8.
 * The weights sum to 255.
 * NOTE(review): the weights look like BT.709 luma coefficients scaled by 256 -
 * confirm against the codec specification. */
271static INLINE BYTE RGB2Y(INT32 R, INT32 G, INT32 B)
273 const INT32 val = ((54 * R + 183 * G + 18 * B) >> 8);
/* Narrow to BYTE through the asserting cast macro rather than a plain cast. */
274 return WINPR_ASSERTING_INT_CAST(BYTE, val);
277static INLINE BYTE RGB2U(INT32 R, INT32 G, INT32 B)
279 const INT32 val = (((-29 * R - 99 * G + 128 * B) >> 8) + 128);
280 return WINPR_ASSERTING_INT_CAST(BYTE, val);
/* V chroma of an RGB triple: ((128*R - 116*G - 12*B) >> 8) + 128.
 * The +128 is added after the shift, offsetting the signed result. */
283static INLINE BYTE RGB2V(INT32 R, INT32 G, INT32 B)
/* The weighted sum can be negative before the shift.
 * NOTE(review): right-shifting a negative signed value is
 * implementation-defined in C - confirm the targets shift arithmetically. */
285 const INT32 val = (((128 * R - 116 * G - 12 * B) >> 8) + 128);
/* Narrow to BYTE through the asserting cast macro rather than a plain cast. */
286 return WINPR_ASSERTING_INT_CAST(BYTE, val);
/* Converts one Y/U/V sample to RGB and writes it to dst in DstFormat.
 *
 * dst       - destination for the pixel
 * DstFormat - destination pixel format
 * y, u, v   - input sample
 *
 * Returns whatever the pixel writer `fkt` returns.
 * NOTE(review): the tail of the parameter list is not visible in this view;
 * `fkt` is presumably a fkt_writePixel parameter declared there - confirm. */
289static inline BYTE* writeYUVPixel(BYTE* dst, UINT32 DstFormat, INT32 y, INT32 u, INT32 v,
293 const BYTE r = YUV2R(y, u, v);
294 const BYTE g = YUV2G(y, u, v);
295 const BYTE b = YUV2B(y, u, v);
/* The per-pixel size is looked up from the format on every call. */
296 const DWORD formatSize = FreeRDPGetBytesPerPixel(DstFormat);
/* The last argument (the A slot of the writer signature) is always 0. */
297 return fkt(dst, formatSize, DstFormat, r, g, b, 0);
/* Library-local (FREERDP_LOCAL) prototype of the generic
 * RGB -> AVC444 YUV conversion routine for BGRX input that handles two rows
 * per call.
 *
 * offset            - size_t offset (NOTE(review): units and base not visible
 *                     here - confirm at the definition)
 * srcEven, srcOdd   - read-only source rows (even / odd)
 * b1Even, b1Odd,
 * b2 .. b7          - writable output buffers
 * width             - UINT32 width (presumably in pixels - confirm)
 *
 * Every pointer is WINPR_RESTRICT-qualified.
 * NOTE(review): presumably the buffers must therefore not alias each other -
 * confirm against the definition of WINPR_RESTRICT. */
300FREERDP_LOCAL
void general_RGBToAVC444YUV_BGRX_DOUBLE_ROW(
301 size_t offset,
const BYTE* WINPR_RESTRICT srcEven,
const BYTE* WINPR_RESTRICT srcOdd,
302 BYTE* WINPR_RESTRICT b1Even, BYTE* WINPR_RESTRICT b1Odd, BYTE* WINPR_RESTRICT b2,
303 BYTE* WINPR_RESTRICT b3, BYTE* WINPR_RESTRICT b4, BYTE* WINPR_RESTRICT b5,
304 BYTE* WINPR_RESTRICT b6, BYTE* WINPR_RESTRICT b7, UINT32 width);
/* Library-local (FREERDP_LOCAL) prototype of the generic
 * RGB -> AVC444 YUV (v2) conversion routine for BGRX input that handles two
 * rows per call.
 *
 * offset                     - size_t offset (NOTE(review): units and base
 *                              not visible here - confirm at the definition)
 * pSrcEven, pSrcOdd          - read-only source rows (even / odd)
 * yLumaDstEven, yLumaDstOdd,
 * uLumaDst, vLumaDst         - writable luma-frame outputs
 * yEvenChromaDst1/2,
 * yOddChromaDst1/2,
 * uChromaDst1/2,
 * vChromaDst1/2              - writable chroma-frame outputs
 * width                      - UINT32 width (presumably in pixels - confirm)
 *
 * Every pointer is WINPR_RESTRICT-qualified.
 * NOTE(review): presumably the buffers must therefore not alias each other -
 * confirm against the definition of WINPR_RESTRICT. */
306FREERDP_LOCAL
void general_RGBToAVC444YUVv2_BGRX_DOUBLE_ROW(
307 size_t offset,
const BYTE* WINPR_RESTRICT pSrcEven,
const BYTE* WINPR_RESTRICT pSrcOdd,
308 BYTE* WINPR_RESTRICT yLumaDstEven, BYTE* WINPR_RESTRICT yLumaDstOdd,
309 BYTE* WINPR_RESTRICT uLumaDst, BYTE* WINPR_RESTRICT vLumaDst,
310 BYTE* WINPR_RESTRICT yEvenChromaDst1, BYTE* WINPR_RESTRICT yEvenChromaDst2,
311 BYTE* WINPR_RESTRICT yOddChromaDst1, BYTE* WINPR_RESTRICT yOddChromaDst2,
312 BYTE* WINPR_RESTRICT uChromaDst1, BYTE* WINPR_RESTRICT uChromaDst2,
313 BYTE* WINPR_RESTRICT vChromaDst1, BYTE* WINPR_RESTRICT vChromaDst2, UINT32 width);
/* Library-local initialisers, one per primitive category (copy, set, add,
 * and/or, shift, sign, alpha composition, colors, YCoCg, YUV). Each takes the
 * primitives_t table and returns nothing.
 * NOTE(review): presumably each one installs the generic (non-optimised)
 * function pointers of its category into `prims` - confirm against the
 * corresponding prim_*.c definitions. */
316FREERDP_LOCAL
void primitives_init_copy(
primitives_t* WINPR_RESTRICT prims);
317FREERDP_LOCAL
void primitives_init_set(
primitives_t* WINPR_RESTRICT prims);
318FREERDP_LOCAL
void primitives_init_add(
primitives_t* WINPR_RESTRICT prims);
319FREERDP_LOCAL
void primitives_init_andor(
primitives_t* WINPR_RESTRICT prims);
320FREERDP_LOCAL
void primitives_init_shift(
primitives_t* WINPR_RESTRICT prims);
321FREERDP_LOCAL
void primitives_init_sign(
primitives_t* WINPR_RESTRICT prims);
322FREERDP_LOCAL
void primitives_init_alphaComp(
primitives_t* WINPR_RESTRICT prims);
323FREERDP_LOCAL
void primitives_init_colors(
primitives_t* WINPR_RESTRICT prims);
324FREERDP_LOCAL
void primitives_init_YCoCg(
primitives_t* WINPR_RESTRICT prims);
325FREERDP_LOCAL
void primitives_init_YUV(
primitives_t* WINPR_RESTRICT prims);
/* "_opt" counterparts of the per-category initialisers, with the same
 * signature: they take the primitives_t table and return nothing.
 * NOTE(review): presumably these replace entries in `prims` with optimised
 * implementations where the build and CPU support them - confirm against the
 * definitions; any preprocessor guard around these prototypes is not visible
 * in this view. */
327FREERDP_LOCAL
void primitives_init_copy_opt(
primitives_t* WINPR_RESTRICT prims);
328FREERDP_LOCAL
void primitives_init_set_opt(
primitives_t* WINPR_RESTRICT prims);
329FREERDP_LOCAL
void primitives_init_add_opt(
primitives_t* WINPR_RESTRICT prims);
330FREERDP_LOCAL
void primitives_init_andor_opt(
primitives_t* WINPR_RESTRICT prims);
331FREERDP_LOCAL
void primitives_init_shift_opt(
primitives_t* WINPR_RESTRICT prims);
332FREERDP_LOCAL
void primitives_init_sign_opt(
primitives_t* WINPR_RESTRICT prims);
333FREERDP_LOCAL
void primitives_init_alphaComp_opt(
primitives_t* WINPR_RESTRICT prims);
334FREERDP_LOCAL
void primitives_init_colors_opt(
primitives_t* WINPR_RESTRICT prims);
335FREERDP_LOCAL
void primitives_init_YCoCg_opt(
primitives_t* WINPR_RESTRICT prims);
336FREERDP_LOCAL
void primitives_init_YUV_opt(
primitives_t* WINPR_RESTRICT prims);
/* OpenCL initialiser, declared only when WITH_OPENCL is defined. Unlike the
 * other primitives_init_* prototypes here it returns a BOOL.
 * NOTE(review): presumably the BOOL reports whether OpenCL setup succeeded -
 * confirm at the definition. The matching #endif lies beyond the visible part
 * of the file. */
338#if defined(WITH_OPENCL)
339FREERDP_LOCAL BOOL primitives_init_opencl(
primitives_t* WINPR_RESTRICT prims);