1327302Sdim/*===------------- avx512bitalgintrin.h - BITALG intrinsics ------------------=== 2327302Sdim * 3327302Sdim * 4353358Sdim * Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 5353358Sdim * See https://llvm.org/LICENSE.txt for license information. 6353358Sdim * SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 7327302Sdim * 8327302Sdim *===-----------------------------------------------------------------------=== 9327302Sdim */ 10327302Sdim#ifndef __IMMINTRIN_H 11327302Sdim#error "Never use <avx512bitalgintrin.h> directly; include <immintrin.h> instead." 12327302Sdim#endif 13327302Sdim 14327302Sdim#ifndef __AVX512BITALGINTRIN_H 15327302Sdim#define __AVX512BITALGINTRIN_H 16327302Sdim 17327302Sdim/* Define the default attributes for the functions in this file. */ 18341825Sdim#define __DEFAULT_FN_ATTRS __attribute__((__always_inline__, __nodebug__, __target__("avx512bitalg"), __min_vector_width__(512))) 19327302Sdim 20327302Sdimstatic __inline__ __m512i __DEFAULT_FN_ATTRS 21327302Sdim_mm512_popcnt_epi16(__m512i __A) 22327302Sdim{ 23327302Sdim return (__m512i) __builtin_ia32_vpopcntw_512((__v32hi) __A); 24327302Sdim} 25327302Sdim 26327302Sdimstatic __inline__ __m512i __DEFAULT_FN_ATTRS 27327302Sdim_mm512_mask_popcnt_epi16(__m512i __A, __mmask32 __U, __m512i __B) 28327302Sdim{ 29327302Sdim return (__m512i) __builtin_ia32_selectw_512((__mmask32) __U, 30327302Sdim (__v32hi) _mm512_popcnt_epi16(__B), 31327302Sdim (__v32hi) __A); 32327302Sdim} 33327302Sdim 34327302Sdimstatic __inline__ __m512i __DEFAULT_FN_ATTRS 35327302Sdim_mm512_maskz_popcnt_epi16(__mmask32 __U, __m512i __B) 36327302Sdim{ 37341825Sdim return _mm512_mask_popcnt_epi16((__m512i) _mm512_setzero_si512(), 38327302Sdim __U, 39327302Sdim __B); 40327302Sdim} 41327302Sdim 42327302Sdimstatic __inline__ __m512i __DEFAULT_FN_ATTRS 43327302Sdim_mm512_popcnt_epi8(__m512i __A) 44327302Sdim{ 45327302Sdim return (__m512i) __builtin_ia32_vpopcntb_512((__v64qi) __A); 46327302Sdim} 47327302Sdim 48327302Sdimstatic __inline__ __m512i __DEFAULT_FN_ATTRS 49327302Sdim_mm512_mask_popcnt_epi8(__m512i __A, __mmask64 __U, __m512i __B) 50327302Sdim{ 51327302Sdim return (__m512i) __builtin_ia32_selectb_512((__mmask64) __U, 52327302Sdim (__v64qi) _mm512_popcnt_epi8(__B), 53327302Sdim (__v64qi) __A); 54327302Sdim} 55327302Sdim 56327302Sdimstatic __inline__ __m512i __DEFAULT_FN_ATTRS 57327302Sdim_mm512_maskz_popcnt_epi8(__mmask64 __U, __m512i __B) 58327302Sdim{ 59341825Sdim return _mm512_mask_popcnt_epi8((__m512i) _mm512_setzero_si512(), 60327302Sdim __U, 61327302Sdim __B); 62327302Sdim} 63327302Sdim 64327302Sdimstatic __inline__ __mmask64 __DEFAULT_FN_ATTRS 65327302Sdim_mm512_mask_bitshuffle_epi64_mask(__mmask64 __U, __m512i __A, __m512i __B) 66327302Sdim{ 67327302Sdim return (__mmask64) __builtin_ia32_vpshufbitqmb512_mask((__v64qi) __A, 68327302Sdim (__v64qi) __B, 69327302Sdim __U); 70327302Sdim} 71327302Sdim 72327302Sdimstatic __inline__ __mmask64 __DEFAULT_FN_ATTRS 73327302Sdim_mm512_bitshuffle_epi64_mask(__m512i __A, __m512i __B) 74327302Sdim{ 75327302Sdim return _mm512_mask_bitshuffle_epi64_mask((__mmask64) -1, 76327302Sdim __A, 77327302Sdim __B); 78327302Sdim} 79327302Sdim 80327302Sdim 81327302Sdim#undef __DEFAULT_FN_ATTRS 82327302Sdim 83327302Sdim#endif 84