1327302Sdim/*===------------- avx512bitalgintrin.h - BITALG intrinsics ------------------===
2327302Sdim *
3327302Sdim *
4353358Sdim * Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
5353358Sdim * See https://llvm.org/LICENSE.txt for license information.
6353358Sdim * SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7327302Sdim *
8327302Sdim *===-----------------------------------------------------------------------===
9327302Sdim */
10327302Sdim#ifndef __IMMINTRIN_H
11327302Sdim#error "Never use <avx512bitalgintrin.h> directly; include <immintrin.h> instead."
12327302Sdim#endif
13327302Sdim
14327302Sdim#ifndef __AVX512BITALGINTRIN_H
15327302Sdim#define __AVX512BITALGINTRIN_H
16327302Sdim
/* Attribute set shared by every intrinsic defined in this header: force
 * inlining, omit debug info, enable the "avx512bitalg" target feature for
 * the function body, and declare a minimum vector width of 512 bits.
 * The macro is #undef'd again at the end of the header. */
#define __DEFAULT_FN_ATTRS \
  __attribute__((__always_inline__, __nodebug__, \
                 __target__("avx512bitalg"), __min_vector_width__(512)))
19327302Sdim
20327302Sdimstatic __inline__ __m512i __DEFAULT_FN_ATTRS
21327302Sdim_mm512_popcnt_epi16(__m512i __A)
22327302Sdim{
23327302Sdim  return (__m512i) __builtin_ia32_vpopcntw_512((__v32hi) __A);
24327302Sdim}
25327302Sdim
26327302Sdimstatic __inline__ __m512i __DEFAULT_FN_ATTRS
27327302Sdim_mm512_mask_popcnt_epi16(__m512i __A, __mmask32 __U, __m512i __B)
28327302Sdim{
29327302Sdim  return (__m512i) __builtin_ia32_selectw_512((__mmask32) __U,
30327302Sdim              (__v32hi) _mm512_popcnt_epi16(__B),
31327302Sdim              (__v32hi) __A);
32327302Sdim}
33327302Sdim
34327302Sdimstatic __inline__ __m512i __DEFAULT_FN_ATTRS
35327302Sdim_mm512_maskz_popcnt_epi16(__mmask32 __U, __m512i __B)
36327302Sdim{
37341825Sdim  return _mm512_mask_popcnt_epi16((__m512i) _mm512_setzero_si512(),
38327302Sdim              __U,
39327302Sdim              __B);
40327302Sdim}
41327302Sdim
42327302Sdimstatic __inline__ __m512i __DEFAULT_FN_ATTRS
43327302Sdim_mm512_popcnt_epi8(__m512i __A)
44327302Sdim{
45327302Sdim  return (__m512i) __builtin_ia32_vpopcntb_512((__v64qi) __A);
46327302Sdim}
47327302Sdim
48327302Sdimstatic __inline__ __m512i __DEFAULT_FN_ATTRS
49327302Sdim_mm512_mask_popcnt_epi8(__m512i __A, __mmask64 __U, __m512i __B)
50327302Sdim{
51327302Sdim  return (__m512i) __builtin_ia32_selectb_512((__mmask64) __U,
52327302Sdim              (__v64qi) _mm512_popcnt_epi8(__B),
53327302Sdim              (__v64qi) __A);
54327302Sdim}
55327302Sdim
56327302Sdimstatic __inline__ __m512i __DEFAULT_FN_ATTRS
57327302Sdim_mm512_maskz_popcnt_epi8(__mmask64 __U, __m512i __B)
58327302Sdim{
59341825Sdim  return _mm512_mask_popcnt_epi8((__m512i) _mm512_setzero_si512(),
60327302Sdim              __U,
61327302Sdim              __B);
62327302Sdim}
63327302Sdim
64327302Sdimstatic __inline__ __mmask64 __DEFAULT_FN_ATTRS
65327302Sdim_mm512_mask_bitshuffle_epi64_mask(__mmask64 __U, __m512i __A, __m512i __B)
66327302Sdim{
67327302Sdim  return (__mmask64) __builtin_ia32_vpshufbitqmb512_mask((__v64qi) __A,
68327302Sdim              (__v64qi) __B,
69327302Sdim              __U);
70327302Sdim}
71327302Sdim
72327302Sdimstatic __inline__ __mmask64 __DEFAULT_FN_ATTRS
73327302Sdim_mm512_bitshuffle_epi64_mask(__m512i __A, __m512i __B)
74327302Sdim{
75327302Sdim  return _mm512_mask_bitshuffle_epi64_mask((__mmask64) -1,
76327302Sdim              __A,
77327302Sdim              __B);
78327302Sdim}
79327302Sdim
80327302Sdim
81327302Sdim#undef __DEFAULT_FN_ATTRS
82327302Sdim
83327302Sdim#endif
84