33 lines
1.0 KiB
C
33 lines
1.0 KiB
C
|
#if defined(DETECT_FEATURES) && defined(__INTEL_COMPILER)
|
||
|
/*
|
||
|
* Unlike GCC and CLANG, Intel Compiler exposes all supported intrinsics,
|
||
|
* whether or not the build options for those features are specified.
|
||
|
* Therefore, we must test #definitions of CPU features when option native/host
|
||
|
* is enabled via `--cpu-baseline` or through env vr `CFLAGS` otherwise
|
||
|
* the test will be broken and leads to enable all possible features.
|
||
|
*/
|
||
|
#if !defined(__SSE4_2__) && !defined(__POPCNT__)
|
||
|
#error "HOST/ARCH doesn't support POPCNT"
|
||
|
#endif
|
||
|
#endif
|
||
|
|
||
|
#ifdef _MSC_VER
|
||
|
#include <nmmintrin.h>
|
||
|
#else
|
||
|
#include <popcntintrin.h>
|
||
|
#endif
|
||
|
|
||
|
int main(int argc, char **argv)
|
||
|
{
|
||
|
// To make sure popcnt instructions are generated
|
||
|
// and been tested against the assembler
|
||
|
unsigned long long a = *((unsigned long long*)argv[argc-1]);
|
||
|
unsigned int b = *((unsigned int*)argv[argc-2]);
|
||
|
|
||
|
#if defined(_M_X64) || defined(__x86_64__)
|
||
|
a = _mm_popcnt_u64(a);
|
||
|
#endif
|
||
|
b = _mm_popcnt_u32(b);
|
||
|
return (int)a + b;
|
||
|
}
|