1/* Copyright (C) 2013-2015 Free Software Foundation, Inc.
2
3   This file is part of GCC.
4
5   GCC is free software; you can redistribute it and/or modify
6   it under the terms of the GNU General Public License as published by
7   the Free Software Foundation; either version 3, or (at your option)
8   any later version.
9
10   GCC is distributed in the hope that it will be useful,
11   but WITHOUT ANY WARRANTY; without even the implied warranty of
12   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
13   GNU General Public License for more details.
14
15   Under Section 7 of GPL version 3, you are granted additional
16   permissions described in the GCC Runtime Library Exception, version
17   3.1, as published by the Free Software Foundation.
18
19   You should have received a copy of the GNU General Public License and
20   a copy of the GCC Runtime Library Exception along with this program;
21   see the files COPYING3 and COPYING.RUNTIME respectively.  If not, see
22   <http://www.gnu.org/licenses/>.  */
23
/* Reject direct inclusion: compilation stops with an error unless
   _IMMINTRIN_H_INCLUDED is already defined (presumably by <immintrin.h>,
   which the message tells the user to include instead).  */
#ifndef _IMMINTRIN_H_INCLUDED
#error "Never use <avx512vbmivlintrin.h> directly; include <immintrin.h> instead."
#endif
27
28#ifndef _AVX512VBMIVLINTRIN_H_INCLUDED
29#define _AVX512VBMIVLINTRIN_H_INCLUDED
30
/* When AVX512VL or AVX512VBMI is not already enabled, save the current
   target options, switch both ISA extensions on for the definitions that
   follow, and define __DISABLE_AVX512VBMIVL__ as a marker so the saved
   options are restored at the end of this header.  */
#if !defined(__AVX512VL__) || !defined(__AVX512VBMI__)
#pragma GCC push_options
#pragma GCC target("avx512vbmi,avx512vl")
#define __DISABLE_AVX512VBMIVL__
#endif /* !__AVX512VL__ || !__AVX512VBMI__ */
36
37extern __inline __m256i
38__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
39_mm256_mask_multishift_epi64_epi8 (__m256i __W, __mmask32 __M, __m256i __X, __m256i __Y)
40{
41  return (__m256i) __builtin_ia32_vpmultishiftqb256_mask ((__v32qi) __X,
42							  (__v32qi) __Y,
43							  (__v32qi) __W,
44							  (__mmask32) __M);
45}
46
47extern __inline __m256i
48__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
49_mm256_maskz_multishift_epi64_epi8 (__mmask32 __M, __m256i __X, __m256i __Y)
50{
51  return (__m256i) __builtin_ia32_vpmultishiftqb256_mask ((__v32qi) __X,
52							  (__v32qi) __Y,
53							  (__v32qi)
54							  _mm256_setzero_si256 (),
55							  (__mmask32) __M);
56}
57
58extern __inline __m256i
59__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
60_mm256_multishift_epi64_epi8 (__m256i __X, __m256i __Y)
61{
62  return (__m256i) __builtin_ia32_vpmultishiftqb256_mask ((__v32qi) __X,
63							  (__v32qi) __Y,
64							  (__v32qi)
65							  _mm256_undefined_si256 (),
66							  (__mmask32) -1);
67}
68
69extern __inline __m128i
70__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
71_mm_mask_multishift_epi64_epi8 (__m128i __W, __mmask16 __M, __m128i __X, __m128i __Y)
72{
73  return (__m128i) __builtin_ia32_vpmultishiftqb128_mask ((__v16qi) __X,
74							  (__v16qi) __Y,
75							  (__v16qi) __W,
76							  (__mmask16) __M);
77}
78
79extern __inline __m128i
80__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
81_mm_maskz_multishift_epi64_epi8 (__mmask16 __M, __m128i __X, __m128i __Y)
82{
83  return (__m128i) __builtin_ia32_vpmultishiftqb128_mask ((__v16qi) __X,
84							  (__v16qi) __Y,
85							  (__v16qi)
86							  _mm_setzero_si128 (),
87							  (__mmask16) __M);
88}
89
90extern __inline __m128i
91__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
92_mm_multishift_epi64_epi8 (__m128i __X, __m128i __Y)
93{
94  return (__m128i) __builtin_ia32_vpmultishiftqb128_mask ((__v16qi) __X,
95							  (__v16qi) __Y,
96							  (__v16qi)
97							  _mm_undefined_si128 (),
98							  (__mmask16) -1);
99}
100
101extern __inline __m256i
102__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
103_mm256_permutexvar_epi8 (__m256i __A, __m256i __B)
104{
105  return (__m256i) __builtin_ia32_permvarqi256_mask ((__v32qi) __B,
106						     (__v32qi) __A,
107						     (__v32qi)
108						     _mm256_undefined_si256 (),
109						     (__mmask32) -1);
110}
111
112extern __inline __m256i
113__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
114_mm256_maskz_permutexvar_epi8 (__mmask32 __M, __m256i __A,
115				__m256i __B)
116{
117  return (__m256i) __builtin_ia32_permvarqi256_mask ((__v32qi) __B,
118						     (__v32qi) __A,
119						     (__v32qi)
120						     _mm256_setzero_si256 (),
121						     (__mmask32) __M);
122}
123
124extern __inline __m256i
125__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
126_mm256_mask_permutexvar_epi8 (__m256i __W, __mmask32 __M, __m256i __A,
127			       __m256i __B)
128{
129  return (__m256i) __builtin_ia32_permvarqi256_mask ((__v32qi) __B,
130						     (__v32qi) __A,
131						     (__v32qi) __W,
132						     (__mmask32) __M);
133}
134
135extern __inline __m128i
136__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
137_mm_permutexvar_epi8 (__m128i __A, __m128i __B)
138{
139  return (__m128i) __builtin_ia32_permvarqi128_mask ((__v16qi) __B,
140						     (__v16qi) __A,
141						     (__v16qi)
142						     _mm_undefined_si128 (),
143						     (__mmask16) -1);
144}
145
146extern __inline __m128i
147__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
148_mm_maskz_permutexvar_epi8 (__mmask16 __M, __m128i __A, __m128i __B)
149{
150  return (__m128i) __builtin_ia32_permvarqi128_mask ((__v16qi) __B,
151						     (__v16qi) __A,
152						     (__v16qi)
153						     _mm_setzero_si128 (),
154						     (__mmask16) __M);
155}
156
157extern __inline __m128i
158__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
159_mm_mask_permutexvar_epi8 (__m128i __W, __mmask16 __M, __m128i __A,
160			    __m128i __B)
161{
162  return (__m128i) __builtin_ia32_permvarqi128_mask ((__v16qi) __B,
163						     (__v16qi) __A,
164						     (__v16qi) __W,
165						     (__mmask16) __M);
166}
167
168extern __inline __m256i
169__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
170_mm256_permutex2var_epi8 (__m256i __A, __m256i __I, __m256i __B)
171{
172  return (__m256i) __builtin_ia32_vpermt2varqi256_mask ((__v32qi) __I
173							/* idx */ ,
174							(__v32qi) __A,
175							(__v32qi) __B,
176							(__mmask32) -
177							1);
178}
179
180extern __inline __m256i
181__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
182_mm256_mask_permutex2var_epi8 (__m256i __A, __mmask32 __U,
183				__m256i __I, __m256i __B)
184{
185  return (__m256i) __builtin_ia32_vpermt2varqi256_mask ((__v32qi) __I
186							/* idx */ ,
187							(__v32qi) __A,
188							(__v32qi) __B,
189							(__mmask32)
190							__U);
191}
192
193extern __inline __m256i
194__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
195_mm256_mask2_permutex2var_epi8 (__m256i __A, __m256i __I,
196				 __mmask32 __U, __m256i __B)
197{
198  return (__m256i) __builtin_ia32_vpermi2varqi256_mask ((__v32qi) __A,
199							(__v32qi) __I
200							/* idx */ ,
201							(__v32qi) __B,
202							(__mmask32)
203							__U);
204}
205
206extern __inline __m256i
207__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
208_mm256_maskz_permutex2var_epi8 (__mmask32 __U, __m256i __A,
209				 __m256i __I, __m256i __B)
210{
211  return (__m256i) __builtin_ia32_vpermt2varqi256_maskz ((__v32qi) __I
212							 /* idx */ ,
213							 (__v32qi) __A,
214							 (__v32qi) __B,
215							 (__mmask32)
216							 __U);
217}
218
219extern __inline __m128i
220__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
221_mm_permutex2var_epi8 (__m128i __A, __m128i __I, __m128i __B)
222{
223  return (__m128i) __builtin_ia32_vpermt2varqi128_mask ((__v16qi) __I
224							/* idx */ ,
225							(__v16qi) __A,
226							(__v16qi) __B,
227							(__mmask16) -
228							1);
229}
230
231extern __inline __m128i
232__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
233_mm_mask_permutex2var_epi8 (__m128i __A, __mmask16 __U, __m128i __I,
234			     __m128i __B)
235{
236  return (__m128i) __builtin_ia32_vpermt2varqi128_mask ((__v16qi) __I
237							/* idx */ ,
238							(__v16qi) __A,
239							(__v16qi) __B,
240							(__mmask16)
241							__U);
242}
243
244extern __inline __m128i
245__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
246_mm_mask2_permutex2var_epi8 (__m128i __A, __m128i __I, __mmask16 __U,
247			      __m128i __B)
248{
249  return (__m128i) __builtin_ia32_vpermi2varqi128_mask ((__v16qi) __A,
250							(__v16qi) __I
251							/* idx */ ,
252							(__v16qi) __B,
253							(__mmask16)
254							__U);
255}
256
257extern __inline __m128i
258__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
259_mm_maskz_permutex2var_epi8 (__mmask16 __U, __m128i __A, __m128i __I,
260			      __m128i __B)
261{
262  return (__m128i) __builtin_ia32_vpermt2varqi128_maskz ((__v16qi) __I
263							 /* idx */ ,
264							 (__v16qi) __A,
265							 (__v16qi) __B,
266							 (__mmask16)
267							 __U);
268}
269
/* If this header switched the target options on above (signalled by
   __DISABLE_AVX512VBMIVL__ being defined), drop the marker and restore
   the options that were saved with push_options.  */
#ifdef __DISABLE_AVX512VBMIVL__
#undef __DISABLE_AVX512VBMIVL__
#pragma GCC pop_options
#endif /* __DISABLE_AVX512VBMIVL__ */
274
275#endif /* _AVX512VBMIVLINTRIN_H_INCLUDED */
276