17#ifndef FREERDP_LIB_PRIM_INTERNAL_H
18#define FREERDP_LIB_PRIM_INTERNAL_H
20#include <winpr/platform.h>
21#include <freerdp/config.h>
23#include <freerdp/primitives.h>
24#include <freerdp/api.h>
26#include "../core/simd.h"
28#define PRIM_ALIGN_128 DECLSPEC_ALIGN(16)
30#if defined(SSE_AVX_INTRINSICS_ENABLED) || defined(NEON_INTRINSICS_ENABLED) || defined(WITH_OPENCL)
31#define HAVE_OPTIMIZED_PRIMITIVES 1
34#if defined(SSE_AVX_INTRINSICS_ENABLED) || defined(NEON_INTRINSICS_ENABLED)
35#define HAVE_CPU_OPTIMIZED_PRIMITIVES 1
39static inline BYTE* writePixelBGRA(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G,
42 WINPR_UNUSED(formatSize);
53static inline BYTE* writePixelBGRX(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G,
56 WINPR_UNUSED(formatSize);
69static inline BYTE* writePixelRGBA(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G,
72 WINPR_UNUSED(formatSize);
83static inline BYTE* writePixelRGBX(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G,
86 WINPR_UNUSED(formatSize);
99static inline BYTE* writePixelABGR(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G,
102 WINPR_UNUSED(formatSize);
103 WINPR_UNUSED(format);
113static inline BYTE* writePixelXBGR(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G,
116 WINPR_UNUSED(formatSize);
117 WINPR_UNUSED(format);
128static inline BYTE* writePixelARGB(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G,
131 WINPR_UNUSED(formatSize);
132 WINPR_UNUSED(format);
142static inline BYTE* writePixelXRGB(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G,
145 WINPR_UNUSED(formatSize);
146 WINPR_UNUSED(format);
157static inline BYTE* writePixelGenericAlpha(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R,
158 BYTE G, BYTE B, BYTE A)
160 UINT32 color = FreeRDPGetColor(format, R, G, B, A);
161 FreeRDPWriteColor(dst, format, color);
162 return dst + formatSize;
166static inline BYTE* writePixelGeneric(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G,
169 UINT32 color = FreeRDPGetColor(format, R, G, B, A);
170 FreeRDPWriteColorIgnoreAlpha(dst, format, color);
171 return dst + formatSize;
174typedef BYTE* (*fkt_writePixel)(BYTE*, DWORD, UINT32, BYTE, BYTE, BYTE, BYTE);
177static inline fkt_writePixel getPixelWriteFunction(DWORD format, BOOL useAlpha)
181 case PIXEL_FORMAT_ARGB32:
182 case PIXEL_FORMAT_XRGB32:
183 return useAlpha ? writePixelARGB : writePixelXRGB;
185 case PIXEL_FORMAT_ABGR32:
186 case PIXEL_FORMAT_XBGR32:
187 return useAlpha ? writePixelABGR : writePixelXBGR;
189 case PIXEL_FORMAT_RGBA32:
190 case PIXEL_FORMAT_RGBX32:
191 return useAlpha ? writePixelRGBA : writePixelRGBX;
193 case PIXEL_FORMAT_BGRA32:
194 case PIXEL_FORMAT_BGRX32:
195 return useAlpha ? writePixelBGRA : writePixelBGRX;
198 return useAlpha ? writePixelGenericAlpha : writePixelGeneric;
203static inline BYTE CLIP(INT64 X)
215static inline BYTE CONDITIONAL_CLIP(INT32 in, BYTE original)
220 diff = out - original;
222 diff = original - out;
233static inline INT32 C(INT32 Y)
238static inline INT32 D(INT32 U)
243static inline INT32 E(INT32 V)
249static inline BYTE YUV2R(INT32 Y, INT32 U, INT32 V)
251 const INT32 r = (256 * C(Y) + 0 * D(U) + 403 * E(V));
252 const INT32 r8 = r >> 8;
257static inline BYTE YUV2G(INT32 Y, INT32 U, INT32 V)
259 const INT32 g = (256 * C(Y) - 48 * D(U) - 120 * E(V));
260 const INT32 g8 = g >> 8;
265static inline BYTE YUV2B(INT32 Y, INT32 U, INT32 V)
267 const INT32 b = (256 * C(Y) + 475 * D(U) + 0 * E(V));
268 const INT32 b8 = b >> 8;
278static inline BYTE RGB2Y(INT32 R, INT32 G, INT32 B)
280 const INT32 val = ((54 * R + 183 * G + 18 * B) >> 8);
281 return WINPR_ASSERTING_INT_CAST(BYTE, val);
285static inline BYTE RGB2U(INT32 R, INT32 G, INT32 B)
287 const INT32 val = (((-29 * R - 99 * G + 128 * B) >> 8) + 128);
288 return WINPR_ASSERTING_INT_CAST(BYTE, val);
292static inline BYTE RGB2V(INT32 R, INT32 G, INT32 B)
294 const INT32 val = (((128 * R - 116 * G - 12 * B) >> 8) + 128);
295 return WINPR_ASSERTING_INT_CAST(BYTE, val);
298static inline BYTE* writeYUVPixel(BYTE* dst, UINT32 DstFormat, INT32 y, INT32 u, INT32 v,
302 const BYTE r = YUV2R(y, u, v);
303 const BYTE g = YUV2G(y, u, v);
304 const BYTE b = YUV2B(y, u, v);
305 const DWORD formatSize = FreeRDPGetBytesPerPixel(DstFormat);
306 return fkt(dst, formatSize, DstFormat, r, g, b, 0);
309FREERDP_LOCAL
void general_RGBToAVC444YUV_BGRX_DOUBLE_ROW(
310 size_t offset,
const BYTE* WINPR_RESTRICT srcEven,
const BYTE* WINPR_RESTRICT srcOdd,
311 BYTE* WINPR_RESTRICT b1Even, BYTE* WINPR_RESTRICT b1Odd, BYTE* WINPR_RESTRICT b2,
312 BYTE* WINPR_RESTRICT b3, BYTE* WINPR_RESTRICT b4, BYTE* WINPR_RESTRICT b5,
313 BYTE* WINPR_RESTRICT b6, BYTE* WINPR_RESTRICT b7, UINT32 width);
315FREERDP_LOCAL
void general_RGBToAVC444YUVv2_BGRX_DOUBLE_ROW(
316 size_t offset,
const BYTE* WINPR_RESTRICT pSrcEven,
const BYTE* WINPR_RESTRICT pSrcOdd,
317 BYTE* WINPR_RESTRICT yLumaDstEven, BYTE* WINPR_RESTRICT yLumaDstOdd,
318 BYTE* WINPR_RESTRICT uLumaDst, BYTE* WINPR_RESTRICT vLumaDst,
319 BYTE* WINPR_RESTRICT yEvenChromaDst1, BYTE* WINPR_RESTRICT yEvenChromaDst2,
320 BYTE* WINPR_RESTRICT yOddChromaDst1, BYTE* WINPR_RESTRICT yOddChromaDst2,
321 BYTE* WINPR_RESTRICT uChromaDst1, BYTE* WINPR_RESTRICT uChromaDst2,
322 BYTE* WINPR_RESTRICT vChromaDst1, BYTE* WINPR_RESTRICT vChromaDst2, UINT32 width);
325FREERDP_LOCAL
void primitives_init_copy(
primitives_t* WINPR_RESTRICT prims);
326FREERDP_LOCAL
void primitives_init_set(
primitives_t* WINPR_RESTRICT prims);
327FREERDP_LOCAL
void primitives_init_add(
primitives_t* WINPR_RESTRICT prims);
328FREERDP_LOCAL
void primitives_init_andor(
primitives_t* WINPR_RESTRICT prims);
329FREERDP_LOCAL
void primitives_init_shift(
primitives_t* WINPR_RESTRICT prims);
330FREERDP_LOCAL
void primitives_init_sign(
primitives_t* WINPR_RESTRICT prims);
331FREERDP_LOCAL
void primitives_init_alphaComp(
primitives_t* WINPR_RESTRICT prims);
332FREERDP_LOCAL
void primitives_init_colors(
primitives_t* WINPR_RESTRICT prims);
333FREERDP_LOCAL
void primitives_init_YCoCg(
primitives_t* WINPR_RESTRICT prims);
334FREERDP_LOCAL
void primitives_init_YUV(
primitives_t* WINPR_RESTRICT prims);
336FREERDP_LOCAL
void primitives_init_copy_opt(
primitives_t* WINPR_RESTRICT prims);
337FREERDP_LOCAL
void primitives_init_set_opt(
primitives_t* WINPR_RESTRICT prims);
338FREERDP_LOCAL
void primitives_init_add_opt(
primitives_t* WINPR_RESTRICT prims);
339FREERDP_LOCAL
void primitives_init_andor_opt(
primitives_t* WINPR_RESTRICT prims);
340FREERDP_LOCAL
void primitives_init_shift_opt(
primitives_t* WINPR_RESTRICT prims);
341FREERDP_LOCAL
void primitives_init_sign_opt(
primitives_t* WINPR_RESTRICT prims);
342FREERDP_LOCAL
void primitives_init_alphaComp_opt(
primitives_t* WINPR_RESTRICT prims);
343FREERDP_LOCAL
void primitives_init_colors_opt(
primitives_t* WINPR_RESTRICT prims);
344FREERDP_LOCAL
void primitives_init_YCoCg_opt(
primitives_t* WINPR_RESTRICT prims);
345FREERDP_LOCAL
void primitives_init_YUV_opt(
primitives_t* WINPR_RESTRICT prims);
347#if defined(WITH_OPENCL)
349FREERDP_LOCAL BOOL primitives_init_opencl(
primitives_t* WINPR_RESTRICT prims);