1 /* Copyright (C) 2013-2017 Free Software Foundation, Inc.
3 This file is part of GCC.
5 GCC is free software; you can redistribute it and/or modify
6 it under the terms of the GNU General Public License as published by
7 the Free Software Foundation; either version 3, or (at your option)
10 GCC is distributed in the hope that it will be useful,
11 but WITHOUT ANY WARRANTY; without even the implied warranty of
12 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 GNU General Public License for more details.
15 Under Section 7 of GPL version 3, you are granted additional
16 permissions described in the GCC Runtime Library Exception, version
17 3.1, as published by the Free Software Foundation.
19 You should have received a copy of the GNU General Public License and
20 a copy of the GCC Runtime Library Exception along with this program;
21 see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
22 <http://www.gnu.org/licenses/>. */
/* Refuse direct inclusion: the #error below fires when
   _IMMINTRIN_H_INCLUDED has not been defined before this header is read.  */
24 #ifndef _IMMINTRIN_H_INCLUDED
25 #error "Never use <avx512pfintrin.h> directly; include <immintrin.h> instead."
/* Include guard for this header.  */
28 #ifndef _AVX512PFINTRIN_H_INCLUDED
29 #define _AVX512PFINTRIN_H_INCLUDED
/* Save the current target options, switch the target to avx512pf, and
   define __DISABLE_AVX512PF__ so that the end of the header knows the
   options have to be popped again.  */
32 #pragma GCC push_options
33 #pragma GCC target("avx512pf")
34 #define __DISABLE_AVX512PF__
35 #endif /* __AVX512PF__ */
37 /* Internal data types for implementing the intrinsics.  Both are
   64-byte vectors: __v8di has long long elements, __v16si has int
   elements.  The prefetch wrappers cast their index argument to one of
   these before calling a builtin.  */
38 typedef long long __v8di
__attribute__ ((__vector_size__ (64)));
39 typedef int __v16si
__attribute__ ((__vector_size__ (64)));
41 /* The Intel API is flexible enough that we must allow aliasing with other
   vector types, and their scalar components; hence __may_alias__ on the
   public 64-byte vector type.  */
43 typedef long long __m512i
__attribute__ ((__vector_size__ (64), __may_alias__
));
/* Mask operand types.  The unmasked wrappers in this header pass
   (__mmask8) 0xFF or (__mmask16) 0xFFFF as the mask.  */
45 typedef unsigned char __mmask8
;
46 typedef unsigned short __mmask16
;
/* _mm512_prefetch_i32gather_pd: takes __index (__m256i), __addr, __scale
   and __hint, and calls __builtin_ia32_gatherpfdpd with the constant mask
   (__mmask8) 0xFF and __index cast to __v8si.
   NOTE(review): the return type, the braces and the arguments after
   __addr are not visible in this listing.  */
50 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
51 _mm512_prefetch_i32gather_pd (__m256i __index
, void const *__addr
,
52 int __scale
, int __hint
)
54 __builtin_ia32_gatherpfdpd ((__mmask8
) 0xFF, (__v8si
) __index
, __addr
,
/* _mm512_prefetch_i32gather_ps: takes __index (__m512i), __addr, __scale
   and __hint, and calls __builtin_ia32_gatherpfdps with the constant mask
   (__mmask16) 0xFFFF and __index cast to __v16si.
   NOTE(review): the return type, the braces and the arguments after
   __addr are not visible in this listing.  */
59 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
60 _mm512_prefetch_i32gather_ps (__m512i __index
, void const *__addr
,
61 int __scale
, int __hint
)
63 __builtin_ia32_gatherpfdps ((__mmask16
) 0xFFFF, (__v16si
) __index
, __addr
,
/* _mm512_mask_prefetch_i32gather_pd: same builtin as the unmasked
   i32gather_pd form (__builtin_ia32_gatherpfdpd), but the caller's
   __mmask8 __mask is passed instead of a constant.  __index is cast to
   __v8si; __addr and __scale are forwarded as given.
   NOTE(review): the return type, the braces and the arguments after
   __scale are not visible in this listing.  */
68 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
69 _mm512_mask_prefetch_i32gather_pd (__m256i __index
, __mmask8 __mask
,
70 void const *__addr
, int __scale
, int __hint
)
72 __builtin_ia32_gatherpfdpd (__mask
, (__v8si
) __index
, __addr
, __scale
,
/* _mm512_mask_prefetch_i32gather_ps: calls __builtin_ia32_gatherpfdps
   with the caller's __mmask16 __mask, __index cast to __v16si, and
   __addr and __scale forwarded as given.
   NOTE(review): the return type, the braces and the arguments after
   __scale are not visible in this listing.  */
77 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
78 _mm512_mask_prefetch_i32gather_ps (__m512i __index
, __mmask16 __mask
,
79 void const *__addr
, int __scale
, int __hint
)
81 __builtin_ia32_gatherpfdps (__mask
, (__v16si
) __index
, __addr
, __scale
,
/* _mm512_prefetch_i64gather_pd: takes __index (__m512i), __addr, __scale
   and __hint, and calls __builtin_ia32_gatherpfqpd with the constant mask
   (__mmask8) 0xFF and __index cast to __v8di.
   NOTE(review): the return type, the braces and the arguments after
   __addr are not visible in this listing.  */
86 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
87 _mm512_prefetch_i64gather_pd (__m512i __index
, void const *__addr
,
88 int __scale
, int __hint
)
90 __builtin_ia32_gatherpfqpd ((__mmask8
) 0xFF, (__v8di
) __index
, __addr
,
/* _mm512_prefetch_i64gather_ps: takes __index (__m512i), __addr, __scale
   and __hint, and calls __builtin_ia32_gatherpfqps with the constant mask
   (__mmask8) 0xFF and __index cast to __v8di.
   NOTE(review): the return type, the braces and the arguments after
   __addr are not visible in this listing.  */
95 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
96 _mm512_prefetch_i64gather_ps (__m512i __index
, void const *__addr
,
97 int __scale
, int __hint
)
99 __builtin_ia32_gatherpfqps ((__mmask8
) 0xFF, (__v8di
) __index
, __addr
,
/* _mm512_mask_prefetch_i64gather_pd: calls __builtin_ia32_gatherpfqpd
   with the caller's __mmask8 __mask, __index cast to __v8di, and __addr
   and __scale forwarded as given.
   NOTE(review): the return type, the braces and the arguments after
   __scale are not visible in this listing.  */
104 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
105 _mm512_mask_prefetch_i64gather_pd (__m512i __index
, __mmask8 __mask
,
106 void const *__addr
, int __scale
, int __hint
)
108 __builtin_ia32_gatherpfqpd (__mask
, (__v8di
) __index
, __addr
, __scale
,
/* _mm512_mask_prefetch_i64gather_ps: calls __builtin_ia32_gatherpfqps
   with the caller's __mmask8 __mask, __index cast to __v8di, and __addr
   and __scale forwarded as given.
   NOTE(review): the return type, the braces and the arguments after
   __scale are not visible in this listing.  */
113 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
114 _mm512_mask_prefetch_i64gather_ps (__m512i __index
, __mmask8 __mask
,
115 void const *__addr
, int __scale
, int __hint
)
117 __builtin_ia32_gatherpfqps (__mask
, (__v8di
) __index
, __addr
, __scale
,
/* _mm512_prefetch_i32scatter_pd: takes __addr (non-const void pointer),
   __index (__m256i) and __scale, and calls __builtin_ia32_scatterpfdpd
   with the constant mask (__mmask8) 0xFF and __index cast to __v8si.
   NOTE(review): the return type, the end of the parameter list, the
   braces and the arguments after __addr are not visible in this
   listing.  */
122 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
123 _mm512_prefetch_i32scatter_pd (void *__addr
, __m256i __index
, int __scale
,
126 __builtin_ia32_scatterpfdpd ((__mmask8
) 0xFF, (__v8si
) __index
, __addr
,
/* _mm512_prefetch_i32scatter_ps: takes __addr (non-const void pointer),
   __index (__m512i) and __scale, and calls __builtin_ia32_scatterpfdps
   with the constant mask (__mmask16) 0xFFFF and __index cast to __v16si.
   NOTE(review): the return type, the end of the parameter list, the
   braces and the arguments after __addr are not visible in this
   listing.  */
131 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
132 _mm512_prefetch_i32scatter_ps (void *__addr
, __m512i __index
, int __scale
,
135 __builtin_ia32_scatterpfdps ((__mmask16
) 0xFFFF, (__v16si
) __index
, __addr
,
/* _mm512_mask_prefetch_i32scatter_pd: calls __builtin_ia32_scatterpfdpd
   with the caller's __mmask8 __mask, __index (__m256i) cast to __v8si,
   and __addr and __scale forwarded as given.  Note the parameter order:
   address first, then mask, then index.
   NOTE(review): the return type, the braces and the arguments after
   __scale are not visible in this listing.  */
140 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
141 _mm512_mask_prefetch_i32scatter_pd (void *__addr
, __mmask8 __mask
,
142 __m256i __index
, int __scale
, int __hint
)
144 __builtin_ia32_scatterpfdpd (__mask
, (__v8si
) __index
, __addr
, __scale
,
/* _mm512_mask_prefetch_i32scatter_ps: calls __builtin_ia32_scatterpfdps
   with the caller's __mmask16 __mask, __index (__m512i) cast to __v16si,
   and __addr and __scale forwarded as given.  Note the parameter order:
   address first, then mask, then index.
   NOTE(review): the return type, the braces and the arguments after
   __scale are not visible in this listing.  */
149 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
150 _mm512_mask_prefetch_i32scatter_ps (void *__addr
, __mmask16 __mask
,
151 __m512i __index
, int __scale
, int __hint
)
153 __builtin_ia32_scatterpfdps (__mask
, (__v16si
) __index
, __addr
, __scale
,
/* _mm512_prefetch_i64scatter_pd: takes __addr (non-const void pointer),
   __index (__m512i) and __scale, and calls __builtin_ia32_scatterpfqpd
   with the constant mask (__mmask8) 0xFF and __index cast to __v8di.
   NOTE(review): the return type, the end of the parameter list, the
   braces and the arguments after __addr are not visible in this
   listing.  */
158 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
159 _mm512_prefetch_i64scatter_pd (void *__addr
, __m512i __index
, int __scale
,
162 __builtin_ia32_scatterpfqpd ((__mmask8
) 0xFF, (__v8di
) __index
,__addr
,
/* _mm512_prefetch_i64scatter_ps: takes __addr (non-const void pointer),
   __index (__m512i) and __scale, and calls __builtin_ia32_scatterpfqps
   with the constant mask (__mmask8) 0xFF and __index cast to __v8di.
   NOTE(review): the return type, the end of the parameter list, the
   braces and the arguments after __addr are not visible in this
   listing.  */
167 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
168 _mm512_prefetch_i64scatter_ps (void *__addr
, __m512i __index
, int __scale
,
171 __builtin_ia32_scatterpfqps ((__mmask8
) 0xFF, (__v8di
) __index
, __addr
,
176 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
177 _mm512_mask_prefetch_i64scatter_pd (void *__addr
, __mmask16 __mask
,
178 __m512i __index
, int __scale
, int __hint
)
180 __builtin_ia32_scatterpfqpd (__mask
, (__v8di
) __index
, __addr
, __scale
,
185 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
186 _mm512_mask_prefetch_i64scatter_ps (void *__addr
, __mmask16 __mask
,
187 __m512i __index
, int __scale
, int __hint
)
189 __builtin_ia32_scatterpfqps (__mask
, (__v8di
) __index
, __addr
, __scale
,
/* Macro form of _mm512_prefetch_i32gather_pd: forwards to
   __builtin_ia32_gatherpfdpd with an all-ones 8-bit mask.  Every argument
   is parenthesized before it is cast, so an expression such as
   `base + 4' is converted as a whole instead of having the cast bind to
   its first operand only.  */
#define _mm512_prefetch_i32gather_pd(INDEX, ADDR, SCALE, HINT) \
  __builtin_ia32_gatherpfdpd ((__mmask8) 0xFF, (__v8si)(__m256i) (INDEX), \
                              (void const *) (ADDR), (int) (SCALE), \
                              (int) (HINT))
/* Macro form of _mm512_prefetch_i32gather_ps: forwards to
   __builtin_ia32_gatherpfdps with an all-ones 16-bit mask.  Every
   argument is parenthesized before it is cast, so compound expressions
   (for example `base + 4') are converted as a whole.  */
#define _mm512_prefetch_i32gather_ps(INDEX, ADDR, SCALE, HINT) \
  __builtin_ia32_gatherpfdps ((__mmask16) 0xFFFF, \
                              (__v16si)(__m512i) (INDEX), \
                              (void const *) (ADDR), (int) (SCALE), \
                              (int) (HINT))
/* Macro form of _mm512_mask_prefetch_i32gather_pd: forwards to
   __builtin_ia32_gatherpfdpd with MASK converted to __mmask8.  Every
   argument is parenthesized before it is cast, so compound expressions
   (for example `base + 4' or `m1 | m2') are converted as a whole.  */
#define _mm512_mask_prefetch_i32gather_pd(INDEX, MASK, ADDR, SCALE, HINT) \
  __builtin_ia32_gatherpfdpd ((__mmask8) (MASK), (__v8si)(__m256i) (INDEX), \
                              (void const *) (ADDR), (int) (SCALE), \
                              (int) (HINT))
/* Macro form of _mm512_mask_prefetch_i32gather_ps: forwards to
   __builtin_ia32_gatherpfdps with MASK converted to __mmask16.  Every
   argument is parenthesized before it is cast, so compound expressions
   (for example `base + 4' or `m1 | m2') are converted as a whole.  */
#define _mm512_mask_prefetch_i32gather_ps(INDEX, MASK, ADDR, SCALE, HINT) \
  __builtin_ia32_gatherpfdps ((__mmask16) (MASK), \
                              (__v16si)(__m512i) (INDEX), \
                              (void const *) (ADDR), (int) (SCALE), \
                              (int) (HINT))
/* Macro form of _mm512_prefetch_i64gather_pd: forwards to
   __builtin_ia32_gatherpfqpd with an all-ones 8-bit mask.  Every argument
   is parenthesized before it is cast, so compound expressions (for
   example `base + 4') are converted as a whole.  ADDR is converted to
   `void const *', like the i32 gather macros and the inline form of this
   intrinsic, so the conversion does not drop a const qualifier.  */
#define _mm512_prefetch_i64gather_pd(INDEX, ADDR, SCALE, HINT) \
  __builtin_ia32_gatherpfqpd ((__mmask8) 0xFF, (__v8di)(__m512i) (INDEX), \
                              (void const *) (ADDR), (int) (SCALE), \
                              (int) (HINT))
/* Macro form of _mm512_prefetch_i64gather_ps: forwards to
   __builtin_ia32_gatherpfqps with an all-ones 8-bit mask.  Every argument
   is parenthesized before it is cast, so compound expressions (for
   example `base + 4') are converted as a whole.  ADDR is converted to
   `void const *', like the i32 gather macros and the inline form of this
   intrinsic, so the conversion does not drop a const qualifier.  */
#define _mm512_prefetch_i64gather_ps(INDEX, ADDR, SCALE, HINT) \
  __builtin_ia32_gatherpfqps ((__mmask8) 0xFF, (__v8di)(__m512i) (INDEX), \
                              (void const *) (ADDR), (int) (SCALE), \
                              (int) (HINT))
/* Macro form of _mm512_mask_prefetch_i64gather_pd: forwards to
   __builtin_ia32_gatherpfqpd with MASK converted to __mmask8.  Every
   argument is parenthesized before it is cast, so compound expressions
   (for example `base + 4' or `m1 | m2') are converted as a whole.  ADDR
   is converted to `void const *', like the i32 gather macros and the
   inline form of this intrinsic, so no const qualifier is dropped.  */
#define _mm512_mask_prefetch_i64gather_pd(INDEX, MASK, ADDR, SCALE, HINT) \
  __builtin_ia32_gatherpfqpd ((__mmask8) (MASK), (__v8di)(__m512i) (INDEX), \
                              (void const *) (ADDR), (int) (SCALE), \
                              (int) (HINT))
/* Macro form of _mm512_mask_prefetch_i64gather_ps: forwards to
   __builtin_ia32_gatherpfqps with MASK converted to __mmask8.  Every
   argument is parenthesized before it is cast, so compound expressions
   (for example `base + 4' or `m1 | m2') are converted as a whole.  ADDR
   is converted to `void const *', like the i32 gather macros and the
   inline form of this intrinsic, so no const qualifier is dropped.  */
#define _mm512_mask_prefetch_i64gather_ps(INDEX, MASK, ADDR, SCALE, HINT) \
  __builtin_ia32_gatherpfqps ((__mmask8) (MASK), (__v8di)(__m512i) (INDEX), \
                              (void const *) (ADDR), (int) (SCALE), \
                              (int) (HINT))
/* Macro form of _mm512_prefetch_i32scatter_pd: forwards to
   __builtin_ia32_scatterpfdpd with an all-ones 8-bit mask.  Every
   argument is parenthesized before it is cast, so compound expressions
   (for example `base + 4') are converted as a whole.  */
#define _mm512_prefetch_i32scatter_pd(ADDR, INDEX, SCALE, HINT) \
  __builtin_ia32_scatterpfdpd ((__mmask8) 0xFF, (__v8si)(__m256i) (INDEX), \
                               (void *) (ADDR), (int) (SCALE), \
                               (int) (HINT))
/* Macro form of _mm512_prefetch_i32scatter_ps: forwards to
   __builtin_ia32_scatterpfdps with an all-ones 16-bit mask.  Every
   argument is parenthesized before it is cast, so compound expressions
   (for example `base + 4') are converted as a whole.  */
#define _mm512_prefetch_i32scatter_ps(ADDR, INDEX, SCALE, HINT) \
  __builtin_ia32_scatterpfdps ((__mmask16) 0xFFFF, \
                               (__v16si)(__m512i) (INDEX), \
                               (void *) (ADDR), (int) (SCALE), \
                               (int) (HINT))
/* Macro form of _mm512_mask_prefetch_i32scatter_pd: forwards to
   __builtin_ia32_scatterpfdpd with MASK converted to __mmask8.  Every
   argument is parenthesized before it is cast, so compound expressions
   (for example `base + 4' or `m1 | m2') are converted as a whole.  */
#define _mm512_mask_prefetch_i32scatter_pd(ADDR, MASK, INDEX, SCALE, HINT) \
  __builtin_ia32_scatterpfdpd ((__mmask8) (MASK), \
                               (__v8si)(__m256i) (INDEX), \
                               (void *) (ADDR), (int) (SCALE), \
                               (int) (HINT))
/* Macro form of _mm512_mask_prefetch_i32scatter_ps: forwards to
   __builtin_ia32_scatterpfdps with MASK converted to __mmask16.  Every
   argument is parenthesized before it is cast, so compound expressions
   (for example `base + 4' or `m1 | m2') are converted as a whole.  */
#define _mm512_mask_prefetch_i32scatter_ps(ADDR, MASK, INDEX, SCALE, HINT) \
  __builtin_ia32_scatterpfdps ((__mmask16) (MASK), \
                               (__v16si)(__m512i) (INDEX), \
                               (void *) (ADDR), (int) (SCALE), \
                               (int) (HINT))
/* Macro form of _mm512_prefetch_i64scatter_pd: forwards to
   __builtin_ia32_scatterpfqpd with an all-ones 8-bit mask.  Every
   argument is parenthesized before it is cast, so compound expressions
   (for example `base + 4') are converted as a whole.  */
#define _mm512_prefetch_i64scatter_pd(ADDR, INDEX, SCALE, HINT) \
  __builtin_ia32_scatterpfqpd ((__mmask8) 0xFF, (__v8di)(__m512i) (INDEX), \
                               (void *) (ADDR), (int) (SCALE), \
                               (int) (HINT))
/* Macro form of _mm512_prefetch_i64scatter_ps: forwards to
   __builtin_ia32_scatterpfqps with an all-ones 8-bit mask.  Every
   argument is parenthesized before it is cast, so compound expressions
   (for example `base + 4') are converted as a whole.  */
#define _mm512_prefetch_i64scatter_ps(ADDR, INDEX, SCALE, HINT) \
  __builtin_ia32_scatterpfqps ((__mmask8) 0xFF, (__v8di)(__m512i) (INDEX), \
                               (void *) (ADDR), (int) (SCALE), \
                               (int) (HINT))
/* Macro form of _mm512_mask_prefetch_i64scatter_pd: forwards to
   __builtin_ia32_scatterpfqpd with MASK converted to __mmask8.  Every
   argument is parenthesized before it is cast, so compound expressions
   (for example `base + 4' or `m1 | m2') are converted as a whole.  */
#define _mm512_mask_prefetch_i64scatter_pd(ADDR, MASK, INDEX, SCALE, HINT) \
  __builtin_ia32_scatterpfqpd ((__mmask8) (MASK), \
                               (__v8di)(__m512i) (INDEX), \
                               (void *) (ADDR), (int) (SCALE), \
                               (int) (HINT))
/* Macro form of _mm512_mask_prefetch_i64scatter_ps: forwards to
   __builtin_ia32_scatterpfqps with MASK converted to __mmask8.  Every
   argument is parenthesized before it is cast, so compound expressions
   (for example `base + 4' or `m1 | m2') are converted as a whole.  */
#define _mm512_mask_prefetch_i64scatter_ps(ADDR, MASK, INDEX, SCALE, HINT) \
  __builtin_ia32_scatterpfqps ((__mmask8) (MASK), \
                               (__v8di)(__m512i) (INDEX), \
                               (void *) (ADDR), (int) (SCALE), \
                               (int) (HINT))
/* If this header defined __DISABLE_AVX512PF__ (done next to its
   `#pragma GCC push_options'), remove the marker again and pop the saved
   target options.  */
259 #ifdef __DISABLE_AVX512PF__
260 #undef __DISABLE_AVX512PF__
261 #pragma GCC pop_options
262 #endif /* __DISABLE_AVX512PF__ */
/* Closes the include guard.  */
264 #endif /* _AVX512PFINTRIN_H_INCLUDED */