diff options
author | José Fonseca <jfonseca@vmware.com> | 2010-07-16 13:16:57 +0100 |
---|---|---|
committer | José Fonseca <jfonseca@vmware.com> | 2010-07-16 17:24:21 +0100 |
commit | b7fff13d58b57870807bae2f43fa2854b551b267 (patch) | |
tree | 4182cbdad20ca02c23adcd7d2de1598bed7d3b0a | |
parent | 0a36a064a12de5caa0a6c1b245c9cc25bb00e5e0 (diff) |
llvmpipe: Describe _mm_shuffle_epi8() with gcc extended inline assembly when -mssse3 is not supported/enabled.
-rw-r--r-- | src/gallium/drivers/llvmpipe/lp_tile_soa.py | 33 |
1 file changed, 30 insertions, 3 deletions
```diff
diff --git a/src/gallium/drivers/llvmpipe/lp_tile_soa.py b/src/gallium/drivers/llvmpipe/lp_tile_soa.py
index dc947c439163..c71ec8066c72 100644
--- a/src/gallium/drivers/llvmpipe/lp_tile_soa.py
+++ b/src/gallium/drivers/llvmpipe/lp_tile_soa.py
@@ -291,10 +291,37 @@ def generate_format_write(format, src_channel, src_native_type, src_suffix):
 
 def generate_ssse3():
     print '''
-#ifdef PIPE_ARCH_SSSE3
+#if defined(PIPE_ARCH_SSE)
+
+
+#if defined(PIPE_ARCH_SSSE3)
 
 #include <tmmintrin.h>
 
+#else
+
+#include <emmintrin.h>
+
+/**
+ * Describe _mm_shuffle_epi8() with gcc extended inline assembly, for cases
+ * where -mssse3 is not supported/enabled.
+ *
+ * MSVC will never get in here as its intrinsics support do not rely on
+ * compiler command line options.
+ */
+static __inline __m128i __attribute__((__gnu_inline__, __always_inline__, __artificial__))
+_mm_shuffle_epi8(__m128i a, __m128i mask)
+{
+   __m128i result;
+   __asm__("pshufb %1, %0"
+           : "=x" (result)
+           : "xm" (mask), "0" (a));
+   return result;
+}
+
+#endif
+
+
 static void
 lp_tile_b8g8r8a8_unorm_swizzle_4ub_ssse3(uint8_t *dst,
                                          const uint8_t *src, unsigned src_stride,
@@ -478,7 +505,7 @@ def generate_swizzle(formats, dst_channel, dst_native_type, dst_suffix):
             print ' case %s:' % format.name
             func_name = 'lp_tile_%s_swizzle_%s' % (format.short_name(), dst_suffix)
             if format.name == 'PIPE_FORMAT_B8G8R8A8_UNORM':
-                print '#ifdef PIPE_ARCH_SSSE3'
+                print '#ifdef PIPE_ARCH_SSE'
                 print ' func = util_cpu_caps.has_ssse3 ? %s_ssse3 : %s;' % (func_name, func_name)
                 print '#else'
                 print ' func = %s;' % (func_name,)
@@ -516,7 +543,7 @@ def generate_unswizzle(formats, src_channel, src_native_type, src_suffix):
             print ' case %s:' % format.name
             func_name = 'lp_tile_%s_unswizzle_%s' % (format.short_name(), src_suffix)
             if format.name == 'PIPE_FORMAT_B8G8R8A8_UNORM':
-                print '#ifdef PIPE_ARCH_SSSE3'
+                print '#ifdef PIPE_ARCH_SSE'
                 print ' func = util_cpu_caps.has_ssse3 ? %s_ssse3 : %s;' % (func_name, func_name)
                 print '#else'
                 print ' func = %s;' % (func_name,)
```