diff options
Diffstat (limited to 'libfreerdp/primitives/prim_internal.h')
-rw-r--r-- | libfreerdp/primitives/prim_internal.h | 297 |
1 files changed, 297 insertions, 0 deletions
diff --git a/libfreerdp/primitives/prim_internal.h b/libfreerdp/primitives/prim_internal.h new file mode 100644 index 0000000..cf5c124 --- /dev/null +++ b/libfreerdp/primitives/prim_internal.h @@ -0,0 +1,297 @@ +/* prim_internal.h + * vi:ts=4 sw=4 + * + * (c) Copyright 2012 Hewlett-Packard Development Company, L.P. + * Licensed under the Apache License, Version 2.0 (the "License"); you may + * not use this file except in compliance with the License. You may obtain + * a copy of the License at http://www.apache.org/licenses/LICENSE-2.0. + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express + * or implied. See the License for the specific language governing + * permissions and limitations under the License. Algorithms used by + * this code may be covered by patents by HP, Microsoft, or other parties. + * + */ + +#ifndef FREERDP_LIB_PRIM_INTERNAL_H +#define FREERDP_LIB_PRIM_INTERNAL_H + +#include <freerdp/config.h> + +#include <freerdp/primitives.h> +#include <freerdp/api.h> + +#ifdef __GNUC__ +#define PRIM_ALIGN_128 __attribute__((aligned(16))) +#else +#ifdef _WIN32 +#define PRIM_ALIGN_128 __declspec(align(16)) +#endif +#endif + +#if defined(WITH_SSE2) || defined(WITH_NEON) || defined(WITH_OPENCL) +#define HAVE_OPTIMIZED_PRIMITIVES 1 +#endif + +#if defined(WITH_SSE2) || defined(WITH_NEON) +#define HAVE_CPU_OPTIMIZED_PRIMITIVES 1 +#endif + +#if defined(WITH_SSE2) +/* Use lddqu for unaligned; load for 16-byte aligned. */ +#define LOAD_SI128(_ptr_) \ + (((const ULONG_PTR)(_ptr_)&0x0f) ? _mm_lddqu_si128((const __m128i*)(_ptr_)) \ + : _mm_load_si128((const __m128i*)(_ptr_))) +#endif + +static INLINE BYTE* writePixelBGRA(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G, + BYTE B, BYTE A) +{ + WINPR_UNUSED(formatSize); + WINPR_UNUSED(format); + + *dst++ = B; + *dst++ = G; + *dst++ = R; + *dst++ = A; + return dst; +} + +static INLINE BYTE* writePixelBGRX(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G, + BYTE B, BYTE A) +{ + WINPR_UNUSED(formatSize); + WINPR_UNUSED(format); + WINPR_UNUSED(A); + + *dst++ = B; + *dst++ = G; + *dst++ = R; + dst++; /* Do not touch alpha */ + + return dst; +} + +static INLINE BYTE* writePixelRGBA(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G, + BYTE B, BYTE A) +{ + WINPR_UNUSED(formatSize); + WINPR_UNUSED(format); + + *dst++ = R; + *dst++ = G; + *dst++ = B; + *dst++ = A; + return dst; +} + +static INLINE BYTE* writePixelRGBX(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G, + BYTE B, BYTE A) +{ + WINPR_UNUSED(formatSize); + WINPR_UNUSED(format); + WINPR_UNUSED(A); + + *dst++ = R; + *dst++ = G; + *dst++ = B; + dst++; /* Do not touch alpha */ + + return dst; +} + +static INLINE BYTE* writePixelABGR(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G, + BYTE B, BYTE A) +{ + WINPR_UNUSED(formatSize); + WINPR_UNUSED(format); + + *dst++ = A; + *dst++ = B; + *dst++ = G; + *dst++ = R; + return dst; +} + +static INLINE BYTE* writePixelXBGR(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G, + BYTE B, BYTE A) +{ + WINPR_UNUSED(formatSize); + WINPR_UNUSED(format); + WINPR_UNUSED(A); + + dst++; /* Do not touch alpha */ + *dst++ = B; + *dst++ = G; + *dst++ = R; + return dst; +} + +static INLINE BYTE* writePixelARGB(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G, + BYTE B, BYTE A) +{ + WINPR_UNUSED(formatSize); + WINPR_UNUSED(format); + + *dst++ = A; + *dst++ = R; + *dst++ = G; + *dst++ = B; + return dst; +} + +static INLINE BYTE* writePixelXRGB(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G, + BYTE B, BYTE A) +{ + WINPR_UNUSED(formatSize); + WINPR_UNUSED(format); + WINPR_UNUSED(A); + + dst++; /* Do not touch alpha */ + *dst++ = R; + *dst++ = G; + *dst++ = B; + return dst; +} + +static INLINE BYTE* writePixelGenericAlpha(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, + BYTE G, BYTE B, BYTE A) +{ + UINT32 color = FreeRDPGetColor(format, R, G, B, A); + FreeRDPWriteColor(dst, format, color); + return dst + formatSize; +} + +static INLINE BYTE* writePixelGeneric(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G, + BYTE B, BYTE A) +{ + UINT32 color = FreeRDPGetColor(format, R, G, B, A); + FreeRDPWriteColorIgnoreAlpha(dst, format, color); + return dst + formatSize; +} + +typedef BYTE* (*fkt_writePixel)(BYTE*, DWORD, UINT32, BYTE, BYTE, BYTE, BYTE); + +static INLINE fkt_writePixel getPixelWriteFunction(DWORD format, BOOL useAlpha) +{ + switch (format) + { + case PIXEL_FORMAT_ARGB32: + case PIXEL_FORMAT_XRGB32: + return useAlpha ? writePixelARGB : writePixelXRGB; + + case PIXEL_FORMAT_ABGR32: + case PIXEL_FORMAT_XBGR32: + return useAlpha ? writePixelABGR : writePixelXBGR; + + case PIXEL_FORMAT_RGBA32: + case PIXEL_FORMAT_RGBX32: + return useAlpha ? writePixelRGBA : writePixelRGBX; + + case PIXEL_FORMAT_BGRA32: + case PIXEL_FORMAT_BGRX32: + return useAlpha ? writePixelBGRA : writePixelBGRX; + + default: + return useAlpha ? writePixelGenericAlpha : writePixelGeneric; + } +} + +static INLINE BYTE CLIP(INT64 X) +{ + if (X > 255L) + return 255L; + + if (X < 0L) + return 0L; + + return (BYTE)X; +} + +static INLINE BYTE CONDITIONAL_CLIP(INT32 in, BYTE original) +{ + BYTE out = CLIP(in); + BYTE diff; + if (out > original) + diff = out - original; + else + diff = original - out; + if (diff < 30) + return original; + return out; +} + +/** + * | R | ( | 256 0 403 | | Y | ) + * | G | = ( | 256 -48 -120 | | U - 128 | ) >> 8 + * | B | ( | 256 475 0 | | V - 128 | ) + */ +static INLINE INT32 C(INT32 Y) +{ + return (Y)-0L; +} + +static INLINE INT32 D(INT32 U) +{ + return (U)-128L; +} + +static INLINE INT32 E(INT32 V) +{ + return (V)-128L; +} + +static INLINE BYTE YUV2R(INT32 Y, INT32 U, INT32 V) +{ + const INT32 r = (256L * C(Y) + 0L * D(U) + 403L * E(V)); + const INT32 r8 = r >> 8L; + return CLIP(r8); +} + +static INLINE BYTE YUV2G(INT32 Y, INT32 U, INT32 V) +{ + const INT32 g = (256L * C(Y) - 48L * D(U) - 120L * E(V)); + const INT32 g8 = g >> 8L; + return CLIP(g8); +} + +static INLINE BYTE YUV2B(INT32 Y, INT32 U, INT32 V) +{ + const INT32 b = (256L * C(Y) + 475L * D(U) + 0L * E(V)); + const INT32 b8 = b >> 8L; + return CLIP(b8); +} + +/* Function prototypes for all the init/deinit routines. */ +FREERDP_LOCAL void primitives_init_copy(primitives_t* prims); +FREERDP_LOCAL void primitives_init_set(primitives_t* prims); +FREERDP_LOCAL void primitives_init_add(primitives_t* prims); +FREERDP_LOCAL void primitives_init_andor(primitives_t* prims); +FREERDP_LOCAL void primitives_init_shift(primitives_t* prims); +FREERDP_LOCAL void primitives_init_sign(primitives_t* prims); +FREERDP_LOCAL void primitives_init_alphaComp(primitives_t* prims); +FREERDP_LOCAL void primitives_init_colors(primitives_t* prims); +FREERDP_LOCAL void primitives_init_YCoCg(primitives_t* prims); +FREERDP_LOCAL void primitives_init_YUV(primitives_t* prims); + +#if defined(WITH_SSE2) || defined(WITH_NEON) +FREERDP_LOCAL void primitives_init_copy_opt(primitives_t* prims); +FREERDP_LOCAL void primitives_init_set_opt(primitives_t* prims); +FREERDP_LOCAL void primitives_init_add_opt(primitives_t* prims); +FREERDP_LOCAL void primitives_init_andor_opt(primitives_t* prims); +FREERDP_LOCAL void primitives_init_shift_opt(primitives_t* prims); +FREERDP_LOCAL void primitives_init_sign_opt(primitives_t* prims); +FREERDP_LOCAL void primitives_init_alphaComp_opt(primitives_t* prims); +FREERDP_LOCAL void primitives_init_colors_opt(primitives_t* prims); +FREERDP_LOCAL void primitives_init_YCoCg_opt(primitives_t* prims); +FREERDP_LOCAL void primitives_init_YUV_opt(primitives_t* prims); +#endif + +#if defined(WITH_OPENCL) +FREERDP_LOCAL BOOL primitives_init_opencl(primitives_t* prims); +#endif + +FREERDP_LOCAL primitives_t* primitives_get_by_type(DWORD type); + +#endif /* FREERDP_LIB_PRIM_INTERNAL_H */ |