SSE4A
[Native]


Native SSE4A Operations

SSP_FORCEINLINE __m128i ssp_extract_si64_SSE4A (__m128i a, __m128i b)
SSP_FORCEINLINE __m128i ssp_extracti_si64_SSE4A (__m128i a, int len, int ndx)
SSP_FORCEINLINE __m128i ssp_insert_si64_SSE4A (__m128i a, __m128i b)
SSP_FORCEINLINE __m128i ssp_inserti_si64_SSE4A (__m128i a, __m128i b, int len, int ndx)
SSP_FORCEINLINE void ssp_stream_sd_SSE4A (double *dst, __m128d src)
SSP_FORCEINLINE void ssp_stream_ss_SSE4A (float *dst, __m128 src)
SSP_FORCEINLINE unsigned short ssp_lzcnt16_SSE4A (unsigned short val)
SSP_FORCEINLINE unsigned int ssp_lzcnt_SSE4A (unsigned int val)
SSP_FORCEINLINE unsigned short ssp_popcnt16_SSE4A (unsigned short val)
SSP_FORCEINLINE unsigned int ssp_popcnt_SSE4A (unsigned int val)

Function Documentation

SSP_FORCEINLINE __m128i ssp_extract_si64_SSE4A ( __m128i  a,
__m128i  b 
)

Native implementation of _mm_extract_si64 [SSE4a]. (Searches MSDN)

Definition at line 17 of file SSEPlus_native_SSE4a.h.

00018 {
00019     return _mm_extract_si64( a, b );
00020 }

SSP_FORCEINLINE __m128i ssp_extracti_si64_SSE4A ( __m128i  a,
int  len,
int  ndx 
)

Native implementation of _mm_extracti_si64 [SSE4a]. (Searches MSDN)

Definition at line 22 of file SSEPlus_native_SSE4a.h.

00023 {
00024     return _mm_extracti_si64( a, len, ndx );
00025 }

SSP_FORCEINLINE __m128i ssp_insert_si64_SSE4A ( __m128i  a,
__m128i  b 
)

Native implementation of _mm_insert_si64 [SSE4a]. (Searches MSDN)

Definition at line 27 of file SSEPlus_native_SSE4a.h.

00028 {
00029     return _mm_insert_si64( a, b );
00030 }

SSP_FORCEINLINE __m128i ssp_inserti_si64_SSE4A ( __m128i  a,
__m128i  b,
int  len,
int  ndx 
)

Native implementation of _mm_inserti_si64 [SSE4a]. (Searches MSDN)

Definition at line 32 of file SSEPlus_native_SSE4a.h.

00033 {
00034     return _mm_inserti_si64( a, b, len, ndx );
00035 }

SSP_FORCEINLINE unsigned short ssp_lzcnt16_SSE4A ( unsigned short  val  ) 

Native implementation of __lzcnt16 [SSE4a]. (Searches MSDN)
NOTE: Support for the LZCNT instruction is indicated by ECX bit 5 (LZCNT) as returned by CPUID function 8000_0001h. If the LZCNT instruction is not available, the encoding is treated as the BSR instruction. Software MUST check the CPUID bit once per program or library initialization before using the LZCNT instruction, or inconsistent behavior may result.

Definition at line 50 of file SSEPlus_native_SSE4a.h.

00051 {
00052     return __lzcnt16( val );
00053 }

SSP_FORCEINLINE unsigned int ssp_lzcnt_SSE4A ( unsigned int  val  ) 

Native implementation of __lzcnt [SSE4a]. (Searches MSDN)
NOTE: Support for the LZCNT instruction is indicated by ECX bit 5 (LZCNT) as returned by CPUID function 8000_0001h. If the LZCNT instruction is not available, the encoding is treated as the BSR instruction. Software MUST check the CPUID bit once per program or library initialization before using the LZCNT instruction, or inconsistent behavior may result.

Definition at line 57 of file SSEPlus_native_SSE4a.h.

00058 {
00059     return __lzcnt( val );
00060 }

SSP_FORCEINLINE unsigned short ssp_popcnt16_SSE4A ( unsigned short  val  ) 

Native implementation of __popcnt16 [SSE4a]. (Searches MSDN)

Definition at line 70 of file SSEPlus_native_SSE4a.h.

00070           {Native,__popcnt16} */ 
00071 SSP_FORCEINLINE unsigned short ssp_popcnt16_SSE4A( unsigned short val )
00072 {
00073     return __popcnt16( val );
00074 }

SSP_FORCEINLINE unsigned int ssp_popcnt_SSE4A ( unsigned int  val  ) 

Native implementation of __popcnt [SSE4a]. (Searches MSDN)

Definition at line 75 of file SSEPlus_native_SSE4a.h.

00075           {Native,__popcnt} */ 
00076 SSP_FORCEINLINE unsigned int ssp_popcnt_SSE4A( unsigned int val )
00077 {
00078     return __popcnt( val );
00079 }

SSP_FORCEINLINE void ssp_stream_sd_SSE4A ( double *  dst,
__m128d  src 
)

Native implementation of _mm_stream_sd [SSE4a]. (Searches MSDN)

Definition at line 37 of file SSEPlus_native_SSE4a.h.

00038 {
00039     _mm_stream_sd( dst, src );
00040 }

SSP_FORCEINLINE void ssp_stream_ss_SSE4A ( float *  dst,
__m128  src 
)

Native implementation of _mm_stream_ss [SSE4a]. (Searches MSDN)

Definition at line 42 of file SSEPlus_native_SSE4a.h.

00043 {
00044     _mm_stream_ss( dst, src );
00045 }


Generated on Wed May 21 13:44:12 2008 for "SSEPlus" by  doxygen 1.5.4