1/* { dg-do run } */
2/* { dg-options "-O2 -mavx512f -std=c99" } */
3/* { dg-require-effective-target avx512f } */
4/* { dg-require-effective-target c99_runtime } */
5
6#define AVX512F
7
8#include "avx512f-helper.h"
9
10#include <math.h>
11#define SIZE (AVX512F_LEN / 32)
12#include "avx512f-mask-type.h"
13
#if AVX512F_LEN == 512
#undef CMP
/* CMP (imm, rel): check one comparison predicate on 512-bit vectors.

   imm  - predicate constant handed to the compare intrinsics.
   rel  - scalar C expression, written in terms of s1[i] and s2[i], that
	  yields the expected result for lane i.

   The macro uses these names from the invoking scope: i, s1, s2,
   source1, source2, mask, dst1, dst2 and dst_ref.  It first builds the
   reference mask dst_ref by evaluating rel for every lane (SIZE lanes,
   i.e. AVX512F_LEN / 32) and placing the result in bit i.  It then runs
   the unmasked and the masked compare intrinsic and calls abort () if
   the unmasked result differs from dst_ref or the masked result differs
   from dst_ref & mask.

   The expansion is a plain sequence of statements that already ends in
   a semicolon, so it must only be used where a statement list is
   allowed (not as the body of an unbraced if/else).  */
#define CMP(imm, rel)					\
    dst_ref = 0;					\
    for (i = 0; i < SIZE; i++)				\
    {							\
      dst_ref = (((int) (rel)) << i) | dst_ref;		\
    }							\
    source1.x = _mm512_loadu_ps(s1);			\
    source2.x = _mm512_loadu_ps(s2);			\
    dst1 = _mm512_cmp_ps_mask(source1.x, source2.x, imm);\
    dst2 = _mm512_mask_cmp_ps_mask(mask, source1.x, source2.x, imm);\
    if (dst_ref != dst1) abort();			\
    if ((dst_ref & mask) != dst2) abort();
#endif
29
#if AVX512F_LEN == 256
#undef CMP
/* CMP (imm, rel): check one comparison predicate on 256-bit vectors.

   imm  - predicate constant handed to the compare intrinsics.
   rel  - scalar C expression, written in terms of s1[i] and s2[i], that
	  yields the expected result for lane i.

   The macro uses these names from the invoking scope: i, s1, s2,
   source1, source2, mask, dst1, dst2 and dst_ref.  It first builds the
   reference mask dst_ref by evaluating rel for every lane (SIZE lanes,
   i.e. AVX512F_LEN / 32) and placing the result in bit i.  It then runs
   the unmasked and the masked compare intrinsic and calls abort () if
   the unmasked result differs from dst_ref or the masked result differs
   from dst_ref & mask.

   The expansion is a plain sequence of statements that already ends in
   a semicolon, so it must only be used where a statement list is
   allowed (not as the body of an unbraced if/else).  */
#define CMP(imm, rel)					\
    dst_ref = 0;					\
    for (i = 0; i < SIZE; i++)				\
    {							\
      dst_ref = (((int) (rel)) << i) | dst_ref;		\
    }							\
    source1.x = _mm256_loadu_ps(s1);			\
    source2.x = _mm256_loadu_ps(s2);			\
    dst1 = _mm256_cmp_ps_mask(source1.x, source2.x, imm);\
    dst2 = _mm256_mask_cmp_ps_mask(mask, source1.x, source2.x, imm);\
    if (dst_ref != dst1) abort();			\
    if ((dst_ref & mask) != dst2) abort();
#endif
45
#if AVX512F_LEN == 128
#undef CMP
/* CMP (imm, rel): check one comparison predicate on 128-bit vectors.

   imm  - predicate constant handed to the compare intrinsics.
   rel  - scalar C expression, written in terms of s1[i] and s2[i], that
	  yields the expected result for lane i.

   The macro uses these names from the invoking scope: i, s1, s2,
   source1, source2, mask, dst1, dst2 and dst_ref.  It first builds the
   reference mask dst_ref by evaluating rel for every lane (SIZE lanes,
   i.e. AVX512F_LEN / 32) and placing the result in bit i.  It then runs
   the unmasked and the masked compare intrinsic and calls abort () if
   the unmasked result differs from dst_ref or the masked result differs
   from dst_ref & mask.

   The expansion is a plain sequence of statements that already ends in
   a semicolon, so it must only be used where a statement list is
   allowed (not as the body of an unbraced if/else).  */
#define CMP(imm, rel)					\
    dst_ref = 0;					\
    for (i = 0; i < SIZE; i++)				\
    {							\
      dst_ref = (((int) (rel)) << i) | dst_ref;		\
    }							\
    source1.x = _mm_loadu_ps(s1);			\
    source2.x = _mm_loadu_ps(s2);			\
    dst1 = _mm_cmp_ps_mask(source1.x, source2.x, imm);\
    dst2 = _mm_mask_cmp_ps_mask(mask, source1.x, source2.x, imm);\
    if (dst_ref != dst1) abort();			\
    if ((dst_ref & mask) != dst2) abort();
#endif
61
62void
63TEST ()
64{
65    UNION_TYPE (AVX512F_LEN,) source1, source2;
66    MASK_TYPE dst1, dst2, dst_ref;
67    MASK_TYPE mask = MASK_VALUE;
68    int i;
69    float s1[16] = {2134.3343, 6678.346, 453.345635, 54646.464,
70		    231.23311, 5674.455, 111.111111, 23241.152,
71		    123.14811, 1245.124, 244.151353, 53454.141,
72		    926.16717, 3733.261, 643.161644, 23514.633};
73    float s2[16] = {41124.234, 6678.346, 8653.65635, 856.43576,
74		    231.23311, 4646.123, 111.111111, 124.12455,
75		    123.14811, 1245.124, 244.151353, 53454.141,
76		    2134.3343, 6678.346, 453.345635, 54646.464};
77
78    CMP(_CMP_EQ_OQ, !isunordered(s1[i], s2[i]) && s1[i] == s2[i]);
79    CMP(_CMP_LT_OS, !isunordered(s1[i], s2[i]) && s1[i] < s2[i]);
80    CMP(_CMP_LE_OS, !isunordered(s1[i], s2[i]) && s1[i] <= s2[i]);
81    CMP(_CMP_UNORD_Q, isunordered(s1[i], s2[i]));
82    CMP(_CMP_NEQ_UQ, isunordered(s1[i], s2[i]) || s1[i] != s2[i]);
83    CMP(_CMP_NLT_US, isunordered(s1[i], s2[i]) || s1[i] >= s2[i]);
84    CMP(_CMP_NLE_US, isunordered(s1[i], s2[i]) || s1[i] > s2[i]);
85    CMP(_CMP_ORD_Q, !isunordered(s1[i], s2[i]));
86
87    CMP(_CMP_EQ_UQ, isunordered(s1[i], s2[i]) || s1[i] == s2[i]);
88    CMP(_CMP_NGE_US, isunordered(s1[i], s2[i]) || s1[i] < s2[i]);
89    CMP(_CMP_NGT_US, isunordered(s1[i], s2[i]) || s1[i] <= s2[i]);
90
91    CMP(_CMP_FALSE_OQ, 0);
92    CMP(_CMP_NEQ_OQ, !isunordered(s1[i], s2[i]) && s1[i] != s2[i]);
93    CMP(_CMP_GE_OS, !isunordered(s1[i], s2[i]) && s1[i] >= s2[i]);
94    CMP(_CMP_GT_OS, !isunordered(s1[i], s2[i]) && s1[i] > s2[i]);
95    CMP(_CMP_TRUE_UQ, 1);
96
97    CMP(_CMP_EQ_OS, !isunordered(s1[i], s2[i]) && s1[i] == s2[i]);
98    CMP(_CMP_LT_OQ, !isunordered(s1[i], s2[i]) && s1[i] < s2[i]);
99    CMP(_CMP_LE_OQ, !isunordered(s1[i], s2[i]) && s1[i] <= s2[i]);
100    CMP(_CMP_UNORD_S, isunordered(s1[i], s2[i]));
101    CMP(_CMP_NEQ_US, isunordered(s1[i], s2[i]) || s1[i] != s2[i]);
102    CMP(_CMP_NLT_UQ, isunordered(s1[i], s2[i]) || s1[i] >= s2[i]);
103    CMP(_CMP_NLE_UQ, isunordered(s1[i], s2[i]) || s1[i] > s2[i]);
104    CMP(_CMP_ORD_S, !isunordered(s1[i], s2[i]));
105    CMP(_CMP_EQ_US, isunordered(s1[i], s2[i]) || s1[i] == s2[i]);
106    CMP(_CMP_NGE_UQ, isunordered(s1[i], s2[i]) || s1[i] < s2[i]);
107    CMP(_CMP_NGT_UQ, isunordered(s1[i], s2[i]) || s1[i] <= s2[i]);
108    CMP(_CMP_FALSE_OS, 0);
109    CMP(_CMP_NEQ_OS, !isunordered(s1[i], s2[i]) && s1[i] != s2[i]);
110    CMP(_CMP_GE_OQ, !isunordered(s1[i], s2[i]) && s1[i] >= s2[i]);
111    CMP(_CMP_GT_OQ, !isunordered(s1[i], s2[i]) && s1[i] > s2[i]);
112    CMP(_CMP_TRUE_US, 1)
113}
114