fmaintrin.h revision 1.1
1/* Copyright (C) 2011-2013 Free Software Foundation, Inc.
2
3   This file is part of GCC.
4
5   GCC is free software; you can redistribute it and/or modify
6   it under the terms of the GNU General Public License as published by
7   the Free Software Foundation; either version 3, or (at your option)
8   any later version.
9
10   GCC is distributed in the hope that it will be useful,
11   but WITHOUT ANY WARRANTY; without even the implied warranty of
12   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
13   GNU General Public License for more details.
14
15   Under Section 7 of GPL version 3, you are granted additional
16   permissions described in the GCC Runtime Library Exception, version
17   3.1, as published by the Free Software Foundation.
18
19   You should have received a copy of the GNU General Public License and
20   a copy of the GCC Runtime Library Exception along with this program;
21   see the files COPYING3 and COPYING.RUNTIME respectively.  If not, see
22   <http://www.gnu.org/licenses/>.  */
23
24#ifndef _IMMINTRIN_H_INCLUDED
25# error "Never use <fmaintrin.h> directly; include <immintrin.h> instead."
26#endif
27
28#ifndef _FMAINTRIN_H_INCLUDED
29#define _FMAINTRIN_H_INCLUDED
30
31#ifndef __FMA__
32# error "FMA instruction set not enabled"
33#else
34
35extern __inline __m128d
36__attribute__((__gnu_inline__, __always_inline__, __artificial__))
37_mm_fmadd_pd (__m128d __A, __m128d __B, __m128d __C)
38{
39  return (__m128d)__builtin_ia32_vfmaddpd ((__v2df)__A, (__v2df)__B,
40                                           (__v2df)__C);
41}
42
43extern __inline __m256d
44__attribute__((__gnu_inline__, __always_inline__, __artificial__))
45_mm256_fmadd_pd (__m256d __A, __m256d __B, __m256d __C)
46{
47  return (__m256d)__builtin_ia32_vfmaddpd256 ((__v4df)__A, (__v4df)__B,
48                                              (__v4df)__C);
49}
50
51extern __inline __m128
52__attribute__((__gnu_inline__, __always_inline__, __artificial__))
53_mm_fmadd_ps (__m128 __A, __m128 __B, __m128 __C)
54{
55  return (__m128)__builtin_ia32_vfmaddps ((__v4sf)__A, (__v4sf)__B,
56                                          (__v4sf)__C);
57}
58
59extern __inline __m256
60__attribute__((__gnu_inline__, __always_inline__, __artificial__))
61_mm256_fmadd_ps (__m256 __A, __m256 __B, __m256 __C)
62{
63  return (__m256)__builtin_ia32_vfmaddps256 ((__v8sf)__A, (__v8sf)__B,
64                                             (__v8sf)__C);
65}
66
67extern __inline __m128d
68__attribute__((__gnu_inline__, __always_inline__, __artificial__))
69_mm_fmadd_sd (__m128d __A, __m128d __B, __m128d __C)
70{
71  return (__m128d) __builtin_ia32_vfmaddsd3 ((__v2df)__A, (__v2df)__B,
72                                             (__v2df)__C);
73}
74
75extern __inline __m128
76__attribute__((__gnu_inline__, __always_inline__, __artificial__))
77_mm_fmadd_ss (__m128 __A, __m128 __B, __m128 __C)
78{
79  return (__m128) __builtin_ia32_vfmaddss3 ((__v4sf)__A, (__v4sf)__B,
80                                            (__v4sf)__C);
81}
82
83extern __inline __m128d
84__attribute__((__gnu_inline__, __always_inline__, __artificial__))
85_mm_fmsub_pd (__m128d __A, __m128d __B, __m128d __C)
86{
87  return (__m128d)__builtin_ia32_vfmaddpd ((__v2df)__A, (__v2df)__B,
88                                           -(__v2df)__C);
89}
90
91extern __inline __m256d
92__attribute__((__gnu_inline__, __always_inline__, __artificial__))
93_mm256_fmsub_pd (__m256d __A, __m256d __B, __m256d __C)
94{
95  return (__m256d)__builtin_ia32_vfmaddpd256 ((__v4df)__A, (__v4df)__B,
96                                              -(__v4df)__C);
97}
98
99extern __inline __m128
100__attribute__((__gnu_inline__, __always_inline__, __artificial__))
101_mm_fmsub_ps (__m128 __A, __m128 __B, __m128 __C)
102{
103  return (__m128)__builtin_ia32_vfmaddps ((__v4sf)__A, (__v4sf)__B,
104                                          -(__v4sf)__C);
105}
106
107extern __inline __m256
108__attribute__((__gnu_inline__, __always_inline__, __artificial__))
109_mm256_fmsub_ps (__m256 __A, __m256 __B, __m256 __C)
110{
111  return (__m256)__builtin_ia32_vfmaddps256 ((__v8sf)__A, (__v8sf)__B,
112                                             -(__v8sf)__C);
113}
114
115extern __inline __m128d
116__attribute__((__gnu_inline__, __always_inline__, __artificial__))
117_mm_fmsub_sd (__m128d __A, __m128d __B, __m128d __C)
118{
119  return (__m128d)__builtin_ia32_vfmaddsd3 ((__v2df)__A, (__v2df)__B,
120                                            -(__v2df)__C);
121}
122
123extern __inline __m128
124__attribute__((__gnu_inline__, __always_inline__, __artificial__))
125_mm_fmsub_ss (__m128 __A, __m128 __B, __m128 __C)
126{
127  return (__m128)__builtin_ia32_vfmaddss3 ((__v4sf)__A, (__v4sf)__B,
128                                           -(__v4sf)__C);
129}
130
131extern __inline __m128d
132__attribute__((__gnu_inline__, __always_inline__, __artificial__))
133_mm_fnmadd_pd (__m128d __A, __m128d __B, __m128d __C)
134{
135  return (__m128d)__builtin_ia32_vfmaddpd (-(__v2df)__A, (__v2df)__B,
136                                           (__v2df)__C);
137}
138
139extern __inline __m256d
140__attribute__((__gnu_inline__, __always_inline__, __artificial__))
141_mm256_fnmadd_pd (__m256d __A, __m256d __B, __m256d __C)
142{
143  return (__m256d)__builtin_ia32_vfmaddpd256 (-(__v4df)__A, (__v4df)__B,
144                                              (__v4df)__C);
145}
146
147extern __inline __m128
148__attribute__((__gnu_inline__, __always_inline__, __artificial__))
149_mm_fnmadd_ps (__m128 __A, __m128 __B, __m128 __C)
150{
151  return (__m128)__builtin_ia32_vfmaddps (-(__v4sf)__A, (__v4sf)__B,
152                                          (__v4sf)__C);
153}
154
155extern __inline __m256
156__attribute__((__gnu_inline__, __always_inline__, __artificial__))
157_mm256_fnmadd_ps (__m256 __A, __m256 __B, __m256 __C)
158{
159  return (__m256)__builtin_ia32_vfmaddps256 (-(__v8sf)__A, (__v8sf)__B,
160                                             (__v8sf)__C);
161}
162
163extern __inline __m128d
164__attribute__((__gnu_inline__, __always_inline__, __artificial__))
165_mm_fnmadd_sd (__m128d __A, __m128d __B, __m128d __C)
166{
167  return (__m128d)__builtin_ia32_vfmaddsd3 ((__v2df)__A, -(__v2df)__B,
168                                            (__v2df)__C);
169}
170
171extern __inline __m128
172__attribute__((__gnu_inline__, __always_inline__, __artificial__))
173_mm_fnmadd_ss (__m128 __A, __m128 __B, __m128 __C)
174{
175  return (__m128)__builtin_ia32_vfmaddss3 ((__v4sf)__A, -(__v4sf)__B,
176                                           (__v4sf)__C);
177}
178
179extern __inline __m128d
180__attribute__((__gnu_inline__, __always_inline__, __artificial__))
181_mm_fnmsub_pd (__m128d __A, __m128d __B, __m128d __C)
182{
183  return (__m128d)__builtin_ia32_vfmaddpd (-(__v2df)__A, (__v2df)__B,
184                                           -(__v2df)__C);
185}
186
187extern __inline __m256d
188__attribute__((__gnu_inline__, __always_inline__, __artificial__))
189_mm256_fnmsub_pd (__m256d __A, __m256d __B, __m256d __C)
190{
191  return (__m256d)__builtin_ia32_vfmaddpd256 (-(__v4df)__A, (__v4df)__B,
192                                              -(__v4df)__C);
193}
194
195extern __inline __m128
196__attribute__((__gnu_inline__, __always_inline__, __artificial__))
197_mm_fnmsub_ps (__m128 __A, __m128 __B, __m128 __C)
198{
199  return (__m128)__builtin_ia32_vfmaddps (-(__v4sf)__A, (__v4sf)__B,
200                                          -(__v4sf)__C);
201}
202
203extern __inline __m256
204__attribute__((__gnu_inline__, __always_inline__, __artificial__))
205_mm256_fnmsub_ps (__m256 __A, __m256 __B, __m256 __C)
206{
207  return (__m256)__builtin_ia32_vfmaddps256 (-(__v8sf)__A, (__v8sf)__B,
208                                             -(__v8sf)__C);
209}
210
211extern __inline __m128d
212__attribute__((__gnu_inline__, __always_inline__, __artificial__))
213_mm_fnmsub_sd (__m128d __A, __m128d __B, __m128d __C)
214{
215  return (__m128d)__builtin_ia32_vfmaddsd3 ((__v2df)__A, -(__v2df)__B,
216                                            -(__v2df)__C);
217}
218
219extern __inline __m128
220__attribute__((__gnu_inline__, __always_inline__, __artificial__))
221_mm_fnmsub_ss (__m128 __A, __m128 __B, __m128 __C)
222{
223  return (__m128)__builtin_ia32_vfmaddss3 ((__v4sf)__A, -(__v4sf)__B,
224                                           -(__v4sf)__C);
225}
226
227extern __inline __m128d
228__attribute__((__gnu_inline__, __always_inline__, __artificial__))
229_mm_fmaddsub_pd (__m128d __A, __m128d __B, __m128d __C)
230{
231  return (__m128d)__builtin_ia32_vfmaddsubpd ((__v2df)__A, (__v2df)__B,
232                                              (__v2df)__C);
233}
234
235extern __inline __m256d
236__attribute__((__gnu_inline__, __always_inline__, __artificial__))
237_mm256_fmaddsub_pd (__m256d __A, __m256d __B, __m256d __C)
238{
239  return (__m256d)__builtin_ia32_vfmaddsubpd256 ((__v4df)__A,
240                                                 (__v4df)__B,
241                                                 (__v4df)__C);
242}
243
244extern __inline __m128
245__attribute__((__gnu_inline__, __always_inline__, __artificial__))
246_mm_fmaddsub_ps (__m128 __A, __m128 __B, __m128 __C)
247{
248  return (__m128)__builtin_ia32_vfmaddsubps ((__v4sf)__A, (__v4sf)__B,
249                                             (__v4sf)__C);
250}
251
252extern __inline __m256
253__attribute__((__gnu_inline__, __always_inline__, __artificial__))
254_mm256_fmaddsub_ps (__m256 __A, __m256 __B, __m256 __C)
255{
256  return (__m256)__builtin_ia32_vfmaddsubps256 ((__v8sf)__A,
257                                                (__v8sf)__B,
258                                                (__v8sf)__C);
259}
260
261extern __inline __m128d
262__attribute__((__gnu_inline__, __always_inline__, __artificial__))
263_mm_fmsubadd_pd (__m128d __A, __m128d __B, __m128d __C)
264{
265  return (__m128d)__builtin_ia32_vfmaddsubpd ((__v2df)__A, (__v2df)__B,
266                                              -(__v2df)__C);
267}
268
269extern __inline __m256d
270__attribute__((__gnu_inline__, __always_inline__, __artificial__))
271_mm256_fmsubadd_pd (__m256d __A, __m256d __B, __m256d __C)
272{
273  return (__m256d)__builtin_ia32_vfmaddsubpd256 ((__v4df)__A,
274                                                 (__v4df)__B,
275                                                 -(__v4df)__C);
276}
277
278extern __inline __m128
279__attribute__((__gnu_inline__, __always_inline__, __artificial__))
280_mm_fmsubadd_ps (__m128 __A, __m128 __B, __m128 __C)
281{
282  return (__m128)__builtin_ia32_vfmaddsubps ((__v4sf)__A, (__v4sf)__B,
283                                             -(__v4sf)__C);
284}
285
286extern __inline __m256
287__attribute__((__gnu_inline__, __always_inline__, __artificial__))
288_mm256_fmsubadd_ps (__m256 __A, __m256 __B, __m256 __C)
289{
290  return (__m256)__builtin_ia32_vfmaddsubps256 ((__v8sf)__A,
291                                                (__v8sf)__B,
292                                                -(__v8sf)__C);
293}
294
295#endif
296
297#endif
298