File size: 972 Bytes
dc2106c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
#if defined(DETECT_FEATURES) && defined(__INTEL_COMPILER)
    /*

     * Unlike GCC and CLANG, Intel Compiler exposes all supported intrinsics,

     * whether or not the build options for those features are specified.

     * Therefore, we must test #definitions of CPU features when option native/host

     * is enabled via `--cpu-baseline` or through env var `CFLAGS` otherwise

     * the test will be broken and leads to enable all possible features.

     */
    #if !defined(__AVX512VBMI__) || !defined(__AVX512IFMA__)
        #error "HOST/ARCH doesn't support CannonLake AVX512 features"
    #endif
#endif

#include <immintrin.h>

int main(int argc, char **argv)
{
    __m512i a = _mm512_loadu_si512((const __m512i*)argv[argc-1]);
    /* IFMA */
    a = _mm512_madd52hi_epu64(a, a, _mm512_setzero_si512());
    /* VMBI */
    a = _mm512_permutex2var_epi8(a, _mm512_setzero_si512(), a);
    return _mm_cvtsi128_si32(_mm512_castsi512_si128(a));
}