1/* { dg-do run } */ 2/* { dg-options "-O2 -mavx512f -std=c99" } */ 3/* { dg-require-effective-target avx512f } */ 4/* { dg-require-effective-target c99_runtime } */ 5 6#define AVX512F 7 8#include "avx512f-helper.h" 9 10#include <math.h> 11#define SIZE (AVX512F_LEN / 32) 12#include "avx512f-mask-type.h" 13 14#if AVX512F_LEN == 512 15#undef CMP 16#define CMP(imm, rel) \ 17 dst_ref = 0; \ 18 for (i = 0; i < 16; i++) \ 19 { \ 20 dst_ref = (((int) rel) << i) | dst_ref; \ 21 } \ 22 source1.x = _mm512_loadu_ps(s1); \ 23 source2.x = _mm512_loadu_ps(s2); \ 24 dst1 = _mm512_cmp_ps_mask(source1.x, source2.x, imm);\ 25 dst2 = _mm512_mask_cmp_ps_mask(mask, source1.x, source2.x, imm);\ 26 if (dst_ref != dst1) abort(); \ 27 if ((dst_ref & mask) != dst2) abort(); 28#endif 29 30#if AVX512F_LEN == 256 31#undef CMP 32#define CMP(imm, rel) \ 33 dst_ref = 0; \ 34 for (i = 0; i < 8; i++) \ 35 { \ 36 dst_ref = (((int) rel) << i) | dst_ref; \ 37 } \ 38 source1.x = _mm256_loadu_ps(s1); \ 39 source2.x = _mm256_loadu_ps(s2); \ 40 dst1 = _mm256_cmp_ps_mask(source1.x, source2.x, imm);\ 41 dst2 = _mm256_mask_cmp_ps_mask(mask, source1.x, source2.x, imm);\ 42 if (dst_ref != dst1) abort(); \ 43 if ((dst_ref & mask) != dst2) abort(); 44#endif 45 46#if AVX512F_LEN == 128 47#undef CMP 48#define CMP(imm, rel) \ 49 dst_ref = 0; \ 50 for (i = 0; i < 4; i++) \ 51 { \ 52 dst_ref = (((int) rel) << i) | dst_ref; \ 53 } \ 54 source1.x = _mm_loadu_ps(s1); \ 55 source2.x = _mm_loadu_ps(s2); \ 56 dst1 = _mm_cmp_ps_mask(source1.x, source2.x, imm);\ 57 dst2 = _mm_mask_cmp_ps_mask(mask, source1.x, source2.x, imm);\ 58 if (dst_ref != dst1) abort(); \ 59 if ((dst_ref & mask) != dst2) abort(); 60#endif 61 62void 63TEST () 64{ 65 UNION_TYPE (AVX512F_LEN,) source1, source2; 66 MASK_TYPE dst1, dst2, dst_ref; 67 MASK_TYPE mask = MASK_VALUE; 68 int i; 69 float s1[16] = {2134.3343, 6678.346, 453.345635, 54646.464, 70 231.23311, 5674.455, 111.111111, 23241.152, 71 123.14811, 1245.124, 244.151353, 53454.141, 72 926.16717, 3733.261, 643.161644, 23514.633}; 73 float s2[16] = {41124.234, 6678.346, 8653.65635, 856.43576, 74 231.23311, 4646.123, 111.111111, 124.12455, 75 123.14811, 1245.124, 244.151353, 53454.141, 76 2134.3343, 6678.346, 453.345635, 54646.464}; 77 78 CMP(_CMP_EQ_OQ, !isunordered(s1[i], s2[i]) && s1[i] == s2[i]); 79 CMP(_CMP_LT_OS, !isunordered(s1[i], s2[i]) && s1[i] < s2[i]); 80 CMP(_CMP_LE_OS, !isunordered(s1[i], s2[i]) && s1[i] <= s2[i]); 81 CMP(_CMP_UNORD_Q, isunordered(s1[i], s2[i])); 82 CMP(_CMP_NEQ_UQ, isunordered(s1[i], s2[i]) || s1[i] != s2[i]); 83 CMP(_CMP_NLT_US, isunordered(s1[i], s2[i]) || s1[i] >= s2[i]); 84 CMP(_CMP_NLE_US, isunordered(s1[i], s2[i]) || s1[i] > s2[i]); 85 CMP(_CMP_ORD_Q, !isunordered(s1[i], s2[i])); 86 87 CMP(_CMP_EQ_UQ, isunordered(s1[i], s2[i]) || s1[i] == s2[i]); 88 CMP(_CMP_NGE_US, isunordered(s1[i], s2[i]) || s1[i] < s2[i]); 89 CMP(_CMP_NGT_US, isunordered(s1[i], s2[i]) || s1[i] <= s2[i]); 90 91 CMP(_CMP_FALSE_OQ, 0); 92 CMP(_CMP_NEQ_OQ, !isunordered(s1[i], s2[i]) && s1[i] != s2[i]); 93 CMP(_CMP_GE_OS, !isunordered(s1[i], s2[i]) && s1[i] >= s2[i]); 94 CMP(_CMP_GT_OS, !isunordered(s1[i], s2[i]) && s1[i] > s2[i]); 95 CMP(_CMP_TRUE_UQ, 1); 96 97 CMP(_CMP_EQ_OS, !isunordered(s1[i], s2[i]) && s1[i] == s2[i]); 98 CMP(_CMP_LT_OQ, !isunordered(s1[i], s2[i]) && s1[i] < s2[i]); 99 CMP(_CMP_LE_OQ, !isunordered(s1[i], s2[i]) && s1[i] <= s2[i]); 100 CMP(_CMP_UNORD_S, isunordered(s1[i], s2[i])); 101 CMP(_CMP_NEQ_US, isunordered(s1[i], s2[i]) || s1[i] != s2[i]); 102 CMP(_CMP_NLT_UQ, isunordered(s1[i], s2[i]) || s1[i] >= s2[i]); 103 CMP(_CMP_NLE_UQ, isunordered(s1[i], s2[i]) || s1[i] > s2[i]); 104 CMP(_CMP_ORD_S, !isunordered(s1[i], s2[i])); 105 CMP(_CMP_EQ_US, isunordered(s1[i], s2[i]) || s1[i] == s2[i]); 106 CMP(_CMP_NGE_UQ, isunordered(s1[i], s2[i]) || s1[i] < s2[i]); 107 CMP(_CMP_NGT_UQ, isunordered(s1[i], s2[i]) || s1[i] <= s2[i]); 108 CMP(_CMP_FALSE_OS, 0); 109 CMP(_CMP_NEQ_OS, !isunordered(s1[i], s2[i]) && s1[i] != s2[i]); 110 CMP(_CMP_GE_OQ, !isunordered(s1[i], s2[i]) && s1[i] >= s2[i]); 111 CMP(_CMP_GT_OQ, !isunordered(s1[i], s2[i]) && s1[i] > s2[i]); 112 CMP(_CMP_TRUE_US, 1) 113} 114