1/* Copyright (C) 2013-2015 Free Software Foundation, Inc.
2
3   This file is part of GCC.
4
5   GCC is free software; you can redistribute it and/or modify
6   it under the terms of the GNU General Public License as published by
7   the Free Software Foundation; either version 3, or (at your option)
8   any later version.
9
10   GCC is distributed in the hope that it will be useful,
11   but WITHOUT ANY WARRANTY; without even the implied warranty of
12   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
13   GNU General Public License for more details.
14
15   Under Section 7 of GPL version 3, you are granted additional
16   permissions described in the GCC Runtime Library Exception, version
17   3.1, as published by the Free Software Foundation.
18
19   You should have received a copy of the GNU General Public License and
20   a copy of the GCC Runtime Library Exception along with this program;
21   see the files COPYING3 and COPYING.RUNTIME respectively.  If not, see
22   <http://www.gnu.org/licenses/>.  */
23
24#ifndef _IMMINTRIN_H_INCLUDED
25#error "Never use <avx512pfintrin.h> directly; include <immintrin.h> instead."
26#endif
27
28#ifndef _AVX512PFINTRIN_H_INCLUDED
29#define _AVX512PFINTRIN_H_INCLUDED
30
31#ifndef __AVX512PF__
32#pragma GCC push_options
33#pragma GCC target("avx512pf")
34#define __DISABLE_AVX512PF__
35#endif /* __AVX512PF__ */
36
/* Integer types used for the mask operands of the intrinsics.  */
typedef unsigned char __mmask8;
typedef unsigned short __mmask16;

/* Internal 64-byte vector types; the intrinsics cast their index operands
   to these before handing them to the builtins.  */
typedef int __v16si __attribute__ ((__vector_size__ (64)));
typedef long long __v8di __attribute__ ((__vector_size__ (64)));

/* Public 64-byte integer vector type.  The Intel API is flexible enough
   that objects of this type must be allowed to alias other vector types
   and their scalar components, hence __may_alias__.  */
typedef long long __m512i
  __attribute__ ((__vector_size__ (64), __may_alias__));
47
48#ifdef __OPTIMIZE__
49extern __inline void
50__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
51_mm512_mask_prefetch_i32gather_pd (__m256i index, __mmask8 mask,
52				   void *addr, int scale, int hint)
53{
54  __builtin_ia32_gatherpfdpd (mask, (__v8si) index, (long long const *) addr,
55			      scale, hint);
56}
57
58extern __inline void
59__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
60_mm512_mask_prefetch_i32gather_ps (__m512i index, __mmask16 mask,
61				   void *addr, int scale, int hint)
62{
63  __builtin_ia32_gatherpfdps (mask, (__v16si) index, (int const *) addr,
64			      scale, hint);
65}
66
67extern __inline void
68__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
69_mm512_mask_prefetch_i64gather_pd (__m512i index, __mmask8 mask,
70				   void *addr, int scale, int hint)
71{
72  __builtin_ia32_gatherpfqpd (mask, (__v8di) index, (long long const *) addr,
73			      scale, hint);
74}
75
76extern __inline void
77__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
78_mm512_mask_prefetch_i64gather_ps (__m512i index, __mmask8 mask,
79				   void *addr, int scale, int hint)
80{
81  __builtin_ia32_gatherpfqps (mask, (__v8di) index, (int const *) addr,
82			      scale, hint);
83}
84
85extern __inline void
86__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
87_mm512_prefetch_i32scatter_pd (void *addr, __m256i index, int scale,
88			       int hint)
89{
90  __builtin_ia32_scatterpfdpd ((__mmask8) 0xFF, (__v8si) index,
91			       (long long const *)addr, scale, hint);
92}
93
94extern __inline void
95__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
96_mm512_prefetch_i32scatter_ps (void *addr, __m512i index, int scale,
97			       int hint)
98{
99  __builtin_ia32_scatterpfdps ((__mmask16) 0xFFFF, (__v16si) index, (int const *) addr,
100			       scale, hint);
101}
102
103extern __inline void
104__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
105_mm512_mask_prefetch_i32scatter_pd (void *addr, __mmask8 mask,
106				    __m256i index, int scale, int hint)
107{
108  __builtin_ia32_scatterpfdpd (mask, (__v8si) index, (long long const *) addr,
109			       scale, hint);
110}
111
112extern __inline void
113__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
114_mm512_mask_prefetch_i32scatter_ps (void *addr, __mmask16 mask,
115				    __m512i index, int scale, int hint)
116{
117  __builtin_ia32_scatterpfdps (mask, (__v16si) index, (int const *) addr,
118			       scale, hint);
119}
120
121extern __inline void
122__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
123_mm512_prefetch_i64scatter_pd (void *addr, __m512i index, int scale,
124			       int hint)
125{
126  __builtin_ia32_scatterpfqpd ((__mmask8) 0xFF, (__v8di) index, (long long const *) addr,
127			       scale, hint);
128}
129
130extern __inline void
131__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
132_mm512_prefetch_i64scatter_ps (void *addr, __m512i index, int scale,
133			       int hint)
134{
135  __builtin_ia32_scatterpfqps ((__mmask8) 0xFF, (__v8di) index, (int const *) addr,
136			       scale, hint);
137}
138
139extern __inline void
140__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
141_mm512_mask_prefetch_i64scatter_pd (void *addr, __mmask16 mask,
142				    __m512i index, int scale, int hint)
143{
144  __builtin_ia32_scatterpfqpd (mask, (__v8di) index, (long long const *) addr,
145			       scale, hint);
146}
147
148extern __inline void
149__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
150_mm512_mask_prefetch_i64scatter_ps (void *addr, __mmask16 mask,
151				    __m512i index, int scale, int hint)
152{
153  __builtin_ia32_scatterpfqps (mask, (__v8di) index, (int const *) addr,
154			       scale, hint);
155}
156
157#else
/* Macro form of _mm512_mask_prefetch_i32gather_pd.  Every argument is
   parenthesized before it is cast, so the cast applies to the whole
   argument expression (e.g. an ADDR of "p + n") rather than only to its
   first operand.  */
#define _mm512_mask_prefetch_i32gather_pd(INDEX, MASK, ADDR, SCALE, HINT)    \
  __builtin_ia32_gatherpfdpd ((__mmask8) (MASK), (__v8si)(__m256i) (INDEX),  \
			      (long long const *) (ADDR), (int) (SCALE),     \
			      (int) (HINT))
161
/* Macro form of _mm512_mask_prefetch_i32gather_ps.  Every argument is
   parenthesized before it is cast, so the cast applies to the whole
   argument expression (e.g. an ADDR of "p + n") rather than only to its
   first operand.  */
#define _mm512_mask_prefetch_i32gather_ps(INDEX, MASK, ADDR, SCALE, HINT)    \
  __builtin_ia32_gatherpfdps ((__mmask16) (MASK), (__v16si)(__m512i) (INDEX),\
			      (int const *) (ADDR), (int) (SCALE),	     \
			      (int) (HINT))
165
/* Macro form of _mm512_mask_prefetch_i64gather_pd.  Every argument is
   parenthesized before it is cast, so the cast applies to the whole
   argument expression (e.g. an ADDR of "p + n") rather than only to its
   first operand.  */
#define _mm512_mask_prefetch_i64gather_pd(INDEX, MASK, ADDR, SCALE, HINT)    \
  __builtin_ia32_gatherpfqpd ((__mmask8) (MASK), (__v8di)(__m512i) (INDEX),  \
			      (long long const *) (ADDR), (int) (SCALE),     \
			      (int) (HINT))
169
/* Macro form of _mm512_mask_prefetch_i64gather_ps.  Every argument is
   parenthesized before it is cast, so the cast applies to the whole
   argument expression (e.g. an ADDR of "p + n") rather than only to its
   first operand.  */
#define _mm512_mask_prefetch_i64gather_ps(INDEX, MASK, ADDR, SCALE, HINT)    \
  __builtin_ia32_gatherpfqps ((__mmask8) (MASK), (__v8di)(__m512i) (INDEX),  \
			      (int const *) (ADDR), (int) (SCALE),	     \
			      (int) (HINT))
173
/* Macro form of _mm512_prefetch_i32scatter_pd; the mask is the constant
   0xFF.  Every argument is parenthesized before it is cast, so the cast
   applies to the whole argument expression (e.g. an ADDR of "p + n")
   rather than only to its first operand.  */
#define _mm512_prefetch_i32scatter_pd(ADDR, INDEX, SCALE, HINT)              \
  __builtin_ia32_scatterpfdpd ((__mmask8) 0xFF, (__v8si)(__m256i) (INDEX),   \
			       (long long const *) (ADDR), (int) (SCALE),    \
			       (int) (HINT))
177
/* Macro form of _mm512_prefetch_i32scatter_ps; the mask is the constant
   0xFFFF.  Every argument is parenthesized before it is cast, so the cast
   applies to the whole argument expression (e.g. an ADDR of "p + n")
   rather than only to its first operand.  */
#define _mm512_prefetch_i32scatter_ps(ADDR, INDEX, SCALE, HINT)              \
  __builtin_ia32_scatterpfdps ((__mmask16) 0xFFFF,			     \
			       (__v16si)(__m512i) (INDEX),		     \
			       (int const *) (ADDR), (int) (SCALE),	     \
			       (int) (HINT))
181
/* Macro form of _mm512_mask_prefetch_i32scatter_pd.  Every argument is
   parenthesized before it is cast, so the cast applies to the whole
   argument expression (e.g. an ADDR of "p + n") rather than only to its
   first operand.  */
#define _mm512_mask_prefetch_i32scatter_pd(ADDR, MASK, INDEX, SCALE, HINT)   \
  __builtin_ia32_scatterpfdpd ((__mmask8) (MASK), (__v8si)(__m256i) (INDEX), \
			       (long long const *) (ADDR), (int) (SCALE),    \
			       (int) (HINT))
185
/* Macro form of _mm512_mask_prefetch_i32scatter_ps.  Every argument is
   parenthesized before it is cast, so the cast applies to the whole
   argument expression (e.g. an ADDR of "p + n") rather than only to its
   first operand.  */
#define _mm512_mask_prefetch_i32scatter_ps(ADDR, MASK, INDEX, SCALE, HINT)   \
  __builtin_ia32_scatterpfdps ((__mmask16) (MASK),			     \
			       (__v16si)(__m512i) (INDEX),		     \
			       (int const *) (ADDR), (int) (SCALE),	     \
			       (int) (HINT))
189
/* Macro form of _mm512_prefetch_i64scatter_pd; the mask is the constant
   0xFF.  Every argument is parenthesized before it is cast, so the cast
   applies to the whole argument expression (e.g. an ADDR of "p + n")
   rather than only to its first operand.  */
#define _mm512_prefetch_i64scatter_pd(ADDR, INDEX, SCALE, HINT)              \
  __builtin_ia32_scatterpfqpd ((__mmask8) 0xFF, (__v8di)(__m512i) (INDEX),   \
			       (long long const *) (ADDR), (int) (SCALE),    \
			       (int) (HINT))
193
/* Macro form of _mm512_prefetch_i64scatter_ps; the mask is the constant
   0xFF.  Every argument is parenthesized before it is cast, so the cast
   applies to the whole argument expression (e.g. an ADDR of "p + n")
   rather than only to its first operand.  */
#define _mm512_prefetch_i64scatter_ps(ADDR, INDEX, SCALE, HINT)              \
  __builtin_ia32_scatterpfqps ((__mmask8) 0xFF, (__v8di)(__m512i) (INDEX),   \
			       (int const *) (ADDR), (int) (SCALE),	     \
			       (int) (HINT))
197
/* Macro form of _mm512_mask_prefetch_i64scatter_pd.  Every argument is
   parenthesized before it is cast, so the cast applies to the whole
   argument expression (e.g. an ADDR of "p + n") rather than only to its
   first operand.  */
#define _mm512_mask_prefetch_i64scatter_pd(ADDR, MASK, INDEX, SCALE, HINT)   \
  __builtin_ia32_scatterpfqpd ((__mmask8) (MASK), (__v8di)(__m512i) (INDEX), \
			       (long long const *) (ADDR), (int) (SCALE),    \
			       (int) (HINT))
201
/* Macro form of _mm512_mask_prefetch_i64scatter_ps.  Every argument is
   parenthesized before it is cast, so the cast applies to the whole
   argument expression (e.g. an ADDR of "p + n") rather than only to its
   first operand.  */
#define _mm512_mask_prefetch_i64scatter_ps(ADDR, MASK, INDEX, SCALE, HINT)   \
  __builtin_ia32_scatterpfqps ((__mmask8) (MASK), (__v8di)(__m512i) (INDEX), \
			       (int const *) (ADDR), (int) (SCALE),	     \
			       (int) (HINT))
205#endif
206
207#ifdef __DISABLE_AVX512PF__
208#undef __DISABLE_AVX512PF__
209#pragma GCC pop_options
210#endif /* __DISABLE_AVX512PF__ */
211
212#endif /* _AVX512PFINTRIN_H_INCLUDED */
213