/* Copyright (C) 2013-2015 Free Software Foundation, Inc.

   This file is part of GCC.

   GCC is free software; you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation; either version 3, or (at your option)
   any later version.

   GCC is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   Under Section 7 of GPL version 3, you are granted additional
   permissions described in the GCC Runtime Library Exception, version
   3.1, as published by the Free Software Foundation.

   You should have received a copy of the GNU General Public License and
   a copy of the GCC Runtime Library Exception along with this program;
   see the files COPYING3 and COPYING.RUNTIME respectively.  If not, see
   <http://www.gnu.org/licenses/>.  */

/* Thin wrappers that forward to the __builtin_ia32_gatherpf* and
   __builtin_ia32_scatterpf* builtins.  This header is only meant to be
   reached through <immintrin.h>; the check below enforces that.  */

#ifndef _IMMINTRIN_H_INCLUDED
#error "Never use <avx512pfintrin.h> directly; include <immintrin.h> instead."
#endif

#ifndef _AVX512PFINTRIN_H_INCLUDED
#define _AVX512PFINTRIN_H_INCLUDED

/* When the translation unit is not already built with AVX512PF enabled,
   switch the target on for the duration of this header and remember to
   restore the previous options at the end.  */
#ifndef __AVX512PF__
#pragma GCC push_options
#pragma GCC target("avx512pf")
#define __DISABLE_AVX512PF__
#endif /* __AVX512PF__ */

/* Internal data types for implementing the intrinsics.  */
typedef long long __v8di __attribute__ ((__vector_size__ (64)));
typedef int __v16si __attribute__ ((__vector_size__ (64)));

/* The Intel API is flexible enough that we must allow aliasing with other
   vector types, and their scalar components.  */
typedef long long __m512i __attribute__ ((__vector_size__ (64), __may_alias__));

typedef unsigned char  __mmask8;
typedef unsigned short __mmask16;

/* NOTE(review): __m256i and __v8si are used below but not declared in this
   header; presumably they come from a header that <immintrin.h> includes
   earlier -- confirm.  */

#ifdef __OPTIMIZE__

/* Inline-function flavour of the intrinsics, used when optimizing.
   NOTE(review): SCALE and HINT presumably have to fold to compile-time
   constants for the builtins, which would explain why the non-optimizing
   build falls back to macros -- confirm against the builtin definitions.  */

/* Wrapper around __builtin_ia32_gatherpfdpd.  INDEX is reinterpreted as
   __v8si and ADDR as long long const *; MASK, SCALE and HINT are passed
   through unchanged.  */
extern __inline void
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_mask_prefetch_i32gather_pd (__m256i index, __mmask8 mask,
                                   void *addr, int scale, int hint)
{
  __builtin_ia32_gatherpfdpd (mask, (__v8si) index,
                              (long long const *) addr, scale, hint);
}

/* Wrapper around __builtin_ia32_gatherpfdps.  INDEX is reinterpreted as
   __v16si and ADDR as int const *; MASK, SCALE and HINT are passed through
   unchanged.  */
extern __inline void
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_mask_prefetch_i32gather_ps (__m512i index, __mmask16 mask,
                                   void *addr, int scale, int hint)
{
  __builtin_ia32_gatherpfdps (mask, (__v16si) index,
                              (int const *) addr, scale, hint);
}

/* Wrapper around __builtin_ia32_gatherpfqpd.  INDEX is reinterpreted as
   __v8di and ADDR as long long const *; MASK, SCALE and HINT are passed
   through unchanged.  */
extern __inline void
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_mask_prefetch_i64gather_pd (__m512i index, __mmask8 mask,
                                   void *addr, int scale, int hint)
{
  __builtin_ia32_gatherpfqpd (mask, (__v8di) index,
                              (long long const *) addr, scale, hint);
}

/* Wrapper around __builtin_ia32_gatherpfqps.  INDEX is reinterpreted as
   __v8di and ADDR as int const *; MASK, SCALE and HINT are passed through
   unchanged.  */
extern __inline void
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_mask_prefetch_i64gather_ps (__m512i index, __mmask8 mask,
                                   void *addr, int scale, int hint)
{
  __builtin_ia32_gatherpfqps (mask, (__v8di) index,
                              (int const *) addr, scale, hint);
}

/* Unmasked wrapper around __builtin_ia32_scatterpfdpd: the mask operand is
   the all-ones 8-bit value 0xFF.  INDEX is reinterpreted as __v8si and ADDR
   as long long const *.  */
extern __inline void
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_prefetch_i32scatter_pd (void *addr, __m256i index, int scale,
                               int hint)
{
  __builtin_ia32_scatterpfdpd ((__mmask8) 0xFF, (__v8si) index,
                               (long long const *) addr, scale, hint);
}

/* Unmasked wrapper around __builtin_ia32_scatterpfdps: the mask operand is
   the all-ones 16-bit value 0xFFFF.  INDEX is reinterpreted as __v16si and
   ADDR as int const *.  */
extern __inline void
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_prefetch_i32scatter_ps (void *addr, __m512i index, int scale,
                               int hint)
{
  __builtin_ia32_scatterpfdps ((__mmask16) 0xFFFF, (__v16si) index,
                               (int const *) addr, scale, hint);
}

/* Masked wrapper around __builtin_ia32_scatterpfdpd.  INDEX is
   reinterpreted as __v8si and ADDR as long long const *; MASK, SCALE and
   HINT are passed through unchanged.  */
extern __inline void
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_mask_prefetch_i32scatter_pd (void *addr, __mmask8 mask,
                                    __m256i index, int scale, int hint)
{
  __builtin_ia32_scatterpfdpd (mask, (__v8si) index,
                               (long long const *) addr, scale, hint);
}

/* Masked wrapper around __builtin_ia32_scatterpfdps.  INDEX is
   reinterpreted as __v16si and ADDR as int const *; MASK, SCALE and HINT
   are passed through unchanged.  */
extern __inline void
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_mask_prefetch_i32scatter_ps (void *addr, __mmask16 mask,
                                    __m512i index, int scale, int hint)
{
  __builtin_ia32_scatterpfdps (mask, (__v16si) index,
                               (int const *) addr, scale, hint);
}

/* Unmasked wrapper around __builtin_ia32_scatterpfqpd: the mask operand is
   the all-ones 8-bit value 0xFF.  INDEX is reinterpreted as __v8di and ADDR
   as long long const *.  */
extern __inline void
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_prefetch_i64scatter_pd (void *addr, __m512i index, int scale,
                               int hint)
{
  __builtin_ia32_scatterpfqpd ((__mmask8) 0xFF, (__v8di) index,
                               (long long const *) addr, scale, hint);
}

/* Unmasked wrapper around __builtin_ia32_scatterpfqps: the mask operand is
   the all-ones 8-bit value 0xFF.  INDEX is reinterpreted as __v8di and ADDR
   as int const *.  */
extern __inline void
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_prefetch_i64scatter_ps (void *addr, __m512i index, int scale,
                               int hint)
{
  __builtin_ia32_scatterpfqps ((__mmask8) 0xFF, (__v8di) index,
                               (int const *) addr, scale, hint);
}

/* Masked wrapper around __builtin_ia32_scatterpfqpd.  INDEX is
   reinterpreted as __v8di and ADDR as long long const *.  MASK is declared
   __mmask8 so that this definition agrees with the macro form of the same
   intrinsic below (which casts MASK to __mmask8) and with the unmasked
   variant, which supplies an 8-bit all-ones mask.  */
extern __inline void
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_mask_prefetch_i64scatter_pd (void *addr, __mmask8 mask,
                                    __m512i index, int scale, int hint)
{
  __builtin_ia32_scatterpfqpd (mask, (__v8di) index,
                               (long long const *) addr, scale, hint);
}

/* Masked wrapper around __builtin_ia32_scatterpfqps.  INDEX is
   reinterpreted as __v8di and ADDR as int const *.  MASK is declared
   __mmask8 so that this definition agrees with the macro form of the same
   intrinsic below (which casts MASK to __mmask8) and with the unmasked
   variant, which supplies an 8-bit all-ones mask.  */
extern __inline void
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_mask_prefetch_i64scatter_ps (void *addr, __mmask8 mask,
                                    __m512i index, int scale, int hint)
{
  __builtin_ia32_scatterpfqps (mask, (__v8di) index,
                               (int const *) addr, scale, hint);
}

#else

/* Macro flavour of the same intrinsics, used when __OPTIMIZE__ is not
   defined.  Each macro applies the same casts as the inline function of
   the same name.  Every argument is parenthesized before it is cast so
   that an expression argument (for example `base + 1' or `a | b') is
   converted as a whole rather than having the cast bind to its first
   operand only.  */

#define _mm512_mask_prefetch_i32gather_pd(INDEX, MASK, ADDR, SCALE, HINT)    \
  __builtin_ia32_gatherpfdpd ((__mmask8) (MASK), (__v8si)(__m256i) (INDEX),  \
                              (long long const *) (ADDR), (int) (SCALE),     \
                              (int) (HINT))

#define _mm512_mask_prefetch_i32gather_ps(INDEX, MASK, ADDR, SCALE, HINT)    \
  __builtin_ia32_gatherpfdps ((__mmask16) (MASK),                            \
                              (__v16si)(__m512i) (INDEX),                    \
                              (int const *) (ADDR), (int) (SCALE),           \
                              (int) (HINT))

#define _mm512_mask_prefetch_i64gather_pd(INDEX, MASK, ADDR, SCALE, HINT)    \
  __builtin_ia32_gatherpfqpd ((__mmask8) (MASK), (__v8di)(__m512i) (INDEX),  \
                              (long long const *) (ADDR), (int) (SCALE),     \
                              (int) (HINT))

#define _mm512_mask_prefetch_i64gather_ps(INDEX, MASK, ADDR, SCALE, HINT)    \
  __builtin_ia32_gatherpfqps ((__mmask8) (MASK), (__v8di)(__m512i) (INDEX),  \
                              (int const *) (ADDR), (int) (SCALE),           \
                              (int) (HINT))

#define _mm512_prefetch_i32scatter_pd(ADDR, INDEX, SCALE, HINT)              \
  __builtin_ia32_scatterpfdpd ((__mmask8) 0xFF, (__v8si)(__m256i) (INDEX),   \
                               (long long const *) (ADDR), (int) (SCALE),    \
                               (int) (HINT))

#define _mm512_prefetch_i32scatter_ps(ADDR, INDEX, SCALE, HINT)              \
  __builtin_ia32_scatterpfdps ((__mmask16) 0xFFFF,                           \
                               (__v16si)(__m512i) (INDEX),                   \
                               (int const *) (ADDR), (int) (SCALE),          \
                               (int) (HINT))

#define _mm512_mask_prefetch_i32scatter_pd(ADDR, MASK, INDEX, SCALE, HINT)   \
  __builtin_ia32_scatterpfdpd ((__mmask8) (MASK), (__v8si)(__m256i) (INDEX), \
                               (long long const *) (ADDR), (int) (SCALE),    \
                               (int) (HINT))

#define _mm512_mask_prefetch_i32scatter_ps(ADDR, MASK, INDEX, SCALE, HINT)   \
  __builtin_ia32_scatterpfdps ((__mmask16) (MASK),                           \
                               (__v16si)(__m512i) (INDEX),                   \
                               (int const *) (ADDR), (int) (SCALE),          \
                               (int) (HINT))

#define _mm512_prefetch_i64scatter_pd(ADDR, INDEX, SCALE, HINT)              \
  __builtin_ia32_scatterpfqpd ((__mmask8) 0xFF, (__v8di)(__m512i) (INDEX),   \
                               (long long const *) (ADDR), (int) (SCALE),    \
                               (int) (HINT))

#define _mm512_prefetch_i64scatter_ps(ADDR, INDEX, SCALE, HINT)              \
  __builtin_ia32_scatterpfqps ((__mmask8) 0xFF, (__v8di)(__m512i) (INDEX),   \
                               (int const *) (ADDR), (int) (SCALE),          \
                               (int) (HINT))

#define _mm512_mask_prefetch_i64scatter_pd(ADDR, MASK, INDEX, SCALE, HINT)   \
  __builtin_ia32_scatterpfqpd ((__mmask8) (MASK), (__v8di)(__m512i) (INDEX), \
                               (long long const *) (ADDR), (int) (SCALE),    \
                               (int) (HINT))

#define _mm512_mask_prefetch_i64scatter_ps(ADDR, MASK, INDEX, SCALE, HINT)   \
  __builtin_ia32_scatterpfqps ((__mmask8) (MASK), (__v8di)(__m512i) (INDEX), \
                               (int const *) (ADDR), (int) (SCALE),          \
                               (int) (HINT))
#endif

/* Restore the target options that were in effect before this header, but
   only if they were changed above.  */
#ifdef __DISABLE_AVX512PF__
#undef __DISABLE_AVX512PF__
#pragma GCC pop_options
#endif /* __DISABLE_AVX512PF__ */

#endif /* _AVX512PFINTRIN_H_INCLUDED */