/* prim_internal.h * vi:ts=4 sw=4 * * (c) Copyright 2012 Hewlett-Packard Development Company, L.P. * Licensed under the Apache License, Version 2.0 (the "License"); you may * not use this file except in compliance with the License. You may obtain * a copy of the License at http://www.apache.org/licenses/LICENSE-2.0. * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express * or implied. See the License for the specific language governing * permissions and limitations under the License. Algorithms used by * this code may be covered by patents by HP, Microsoft, or other parties. * */ #ifndef FREERDP_LIB_PRIM_INTERNAL_H #define FREERDP_LIB_PRIM_INTERNAL_H #ifdef HAVE_CONFIG_H #include "config.h" #endif #include #include #ifdef __GNUC__ #define PRIM_ALIGN_128 __attribute__((aligned(16))) #else #ifdef _WIN32 #define PRIM_ALIGN_128 __declspec(align(16)) #endif #endif #if defined(WITH_SSE2) || defined(WITH_NEON) #define HAVE_OPTIMIZED_PRIMITIVES 1 #endif #if defined(WITH_SSE2) /* Use lddqu for unaligned; load for 16-byte aligned. */ #define LOAD_SI128(_ptr_) \ (((ULONG_PTR) (_ptr_) & 0x0f) \ ? _mm_lddqu_si128((__m128i *) (_ptr_)) \ : _mm_load_si128((__m128i *) (_ptr_))) #endif static INLINE BYTE* writePixelBGRX(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G, BYTE B, BYTE A) { *dst++ = B; *dst++ = G; *dst++ = R; *dst++ = A; return dst; } static INLINE BYTE* writePixelRGBX(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G, BYTE B, BYTE A) { *dst++ = R; *dst++ = G; *dst++ = B; *dst++ = A; return dst; } static INLINE BYTE* writePixelXBGR(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G, BYTE B, BYTE A) { *dst++ = A; *dst++ = B; *dst++ = G; *dst++ = R; return dst; } static INLINE BYTE* writePixelXRGB(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G, BYTE B, BYTE A) { *dst++ = A; *dst++ = R; *dst++ = G; *dst++ = B; return dst; } static INLINE BYTE* writePixelGeneric(BYTE* dst, DWORD formatSize, UINT32 format, BYTE R, BYTE G, BYTE B, BYTE A) { UINT32 color = FreeRDPGetColor(format, R, G, B, A); WriteColor(dst, format, color); return dst + formatSize; } typedef BYTE* (*fkt_writePixel)(BYTE*, DWORD, UINT32, BYTE, BYTE, BYTE, BYTE); static INLINE fkt_writePixel getPixelWriteFunction(DWORD format) { switch (format) { case PIXEL_FORMAT_ARGB32: case PIXEL_FORMAT_XRGB32: return writePixelXRGB; case PIXEL_FORMAT_ABGR32: case PIXEL_FORMAT_XBGR32: return writePixelXBGR; case PIXEL_FORMAT_RGBA32: case PIXEL_FORMAT_RGBX32: return writePixelRGBX; case PIXEL_FORMAT_BGRA32: case PIXEL_FORMAT_BGRX32: return writePixelBGRX; default: return writePixelGeneric; } } static INLINE BYTE CLIP(INT32 X) { if (X > 255L) return 255L; if (X < 0L) return 0L; return X; } /** * | R | ( | 256 0 403 | | Y | ) * | G | = ( | 256 -48 -120 | | U - 128 | ) >> 8 * | B | ( | 256 475 0 | | V - 128 | ) */ static INLINE INT32 C(INT32 Y) { return (Y) - 0L; } static INLINE INT32 D(INT32 U) { return (U) - 128L; } static INLINE INT32 E(INT32 V) { return (V) - 128L; } static INLINE BYTE YUV2R(INT32 Y, INT32 U, INT32 V) { const INT32 r = (256L * C(Y) + 0L * D(U) + 403L * E(V)); const INT32 r8 = r >> 8L; return CLIP(r8); } static INLINE BYTE YUV2G(INT32 Y, INT32 U, INT32 V) { const INT32 g = (256L * C(Y) - 48L * D(U) - 120L * E(V)); const INT32 g8 = g >> 8L; return CLIP(g8); } static INLINE BYTE YUV2B(INT32 Y, INT32 U, INT32 V) { const INT32 b = (256L * C(Y) + 475L * D(U) + 0L * E(V)); const INT32 b8 = b >> 8L; return CLIP(b8); } /* Function prototypes for all the init/deinit routines. */ FREERDP_LOCAL void primitives_init_copy(primitives_t* prims); FREERDP_LOCAL void primitives_init_set(primitives_t* prims); FREERDP_LOCAL void primitives_init_add(primitives_t* prims); FREERDP_LOCAL void primitives_init_andor(primitives_t* prims); FREERDP_LOCAL void primitives_init_shift(primitives_t* prims); FREERDP_LOCAL void primitives_init_sign(primitives_t* prims); FREERDP_LOCAL void primitives_init_alphaComp(primitives_t* prims); FREERDP_LOCAL void primitives_init_colors(primitives_t* prims); FREERDP_LOCAL void primitives_init_YCoCg(primitives_t* prims); FREERDP_LOCAL void primitives_init_YUV(primitives_t* prims); #if defined(WITH_SSE2) || defined(WITH_NEON) FREERDP_LOCAL void primitives_init_copy_opt(primitives_t* prims); FREERDP_LOCAL void primitives_init_set_opt(primitives_t* prims); FREERDP_LOCAL void primitives_init_add_opt(primitives_t* prims); FREERDP_LOCAL void primitives_init_andor_opt(primitives_t* prims); FREERDP_LOCAL void primitives_init_shift_opt(primitives_t* prims); FREERDP_LOCAL void primitives_init_sign_opt(primitives_t* prims); FREERDP_LOCAL void primitives_init_alphaComp_opt(primitives_t* prims); FREERDP_LOCAL void primitives_init_colors_opt(primitives_t* prims); FREERDP_LOCAL void primitives_init_YCoCg_opt(primitives_t* prims); FREERDP_LOCAL void primitives_init_YUV_opt(primitives_t* prims); #endif #endif /* FREERDP_LIB_PRIM_INTERNAL_H */