26 lines
		
	
	
		
			959 B
		
	
	
	
		
			C
		
	
	
	
	
	
		
		
			
		
	
	
			26 lines
		
	
	
		
			959 B
		
	
	
	
		
			C
		
	
	
	
	
	
| 
								 | 
							
								#if defined(__INTEL_COMPILER) && defined(DETECT_FEATURES)
								    /*
								     * The Intel Compiler, unlike GCC and Clang, exposes every intrinsic it
								     * supports regardless of whether the matching feature build options
								     * were passed. When native/host targeting is requested through
								     * `--cpu-baseline` or the `CFLAGS` environment variable, the CPU feature
								     * macros therefore have to be checked explicitly; without this check the
								     * test would always succeed and every possible feature would be enabled.
								     */
								    #if !(defined(__AVX512ER__) && defined(__AVX512PF__))
								        #error "HOST/ARCH doesn't support Knights Landing AVX512 features"
								    #endif
								#endif
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								#include <immintrin.h>
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								/*
								 * Probe program: exercises one AVX512ER intrinsic and one AVX512PF
								 * intrinsic so that the translation unit only builds when both
								 * extensions are available to the compiler.
								 *
								 * argc/argv: the vector input is loaded from the last argv entry rather
								 *            than from a constant (presumably so the compiler cannot
								 *            fold the intrinsics away -- confirm against the build
								 *            system that consumes this file).
								 * Returns base[0], which keeps `base` observably used.
								 */
								int main(int argc, char **argv)
								{
								    /*
								     * `{0}` instead of `{}`: an empty initializer list is only valid from
								     * C23 on (or as a compiler extension), and a rejected initializer would
								     * make this probe fail for a reason unrelated to AVX512 support.
								     */
								    int base[128] = {0};
								    /* Unaligned 512-bit load of eight doubles from the last argument. */
								    __m512d ad = _mm512_loadu_pd((const __m512d*)argv[argc-1]);
								    /* ER */
								    __m512i a = _mm512_castpd_si512(_mm512_exp2a23_pd(ad));
								    /* PF */
								    /* a == a compares equal in every lane, so the mask selects all of them. */
								    _mm512_mask_prefetch_i64scatter_pd(base, _mm512_cmpeq_epi64_mask(a, a), a, 1, _MM_HINT_T1);
								    return base[0];
								}
							 |