1 /* Copyright (C) 2014-2016 Free Software Foundation, Inc.
3 This file is part of GCC.
5 GCC is free software; you can redistribute it and/or modify
6 it under the terms of the GNU General Public License as published by
7 the Free Software Foundation; either version 3, or (at your option)
10 GCC is distributed in the hope that it will be useful,
11 but WITHOUT ANY WARRANTY; without even the implied warranty of
12 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 GNU General Public License for more details.
15 Under Section 7 of GPL version 3, you are granted additional
16 permissions described in the GCC Runtime Library Exception, version
17 3.1, as published by the Free Software Foundation.
19 You should have received a copy of the GNU General Public License and
20 a copy of the GCC Runtime Library Exception along with this program;
21 see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
22 <http://www.gnu.org/licenses/>. */
24 #ifndef _IMMINTRIN_H_INCLUDED
25 #error "Never use <avx512vlintrin.h> directly; include <immintrin.h> instead."
28 #ifndef _AVX512VLINTRIN_H_INCLUDED
29 #define _AVX512VLINTRIN_H_INCLUDED
31 /* Doesn't require avx512vl target and is used in avx512dqintrin.h. */
32 extern __inline __m128i
33 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
36 return __extension__ (__m128i
)(__v2di
){ 0LL, 0LL};
40 #pragma GCC push_options
41 #pragma GCC target("avx512vl")
42 #define __DISABLE_AVX512VL__
43 #endif /* __AVX512VL__ */
45 /* Internal data types for implementing the intrinsics. */
/* __mmask32 is an alias for unsigned int, declared here as one of the
   internal data types used to implement the intrinsics.
   NOTE(review): presumably a write-mask with one bit per vector element
   (up to 32 lanes) -- no intrinsic taking a __mmask32 is visible in this
   part of the file, so confirm against its users.  */
46 typedef unsigned int __mmask32
;
48 extern __inline __m256d
49 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
50 _mm256_mask_mov_pd (__m256d __W
, __mmask8 __U
, __m256d __A
)
52 return (__m256d
) __builtin_ia32_movapd256_mask ((__v4df
) __A
,
57 extern __inline __m256d
58 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
59 _mm256_maskz_mov_pd (__mmask8 __U
, __m256d __A
)
61 return (__m256d
) __builtin_ia32_movapd256_mask ((__v4df
) __A
,
67 extern __inline __m128d
68 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
69 _mm_mask_mov_pd (__m128d __W
, __mmask8 __U
, __m128d __A
)
71 return (__m128d
) __builtin_ia32_movapd128_mask ((__v2df
) __A
,
76 extern __inline __m128d
77 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
78 _mm_maskz_mov_pd (__mmask8 __U
, __m128d __A
)
80 return (__m128d
) __builtin_ia32_movapd128_mask ((__v2df
) __A
,
86 extern __inline __m256d
87 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
88 _mm256_mask_load_pd (__m256d __W
, __mmask8 __U
, void const *__P
)
90 return (__m256d
) __builtin_ia32_loadapd256_mask ((__v4df
*) __P
,
95 extern __inline __m256d
96 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
97 _mm256_maskz_load_pd (__mmask8 __U
, void const *__P
)
99 return (__m256d
) __builtin_ia32_loadapd256_mask ((__v4df
*) __P
,
101 _mm256_setzero_pd (),
105 extern __inline __m128d
106 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
107 _mm_mask_load_pd (__m128d __W
, __mmask8 __U
, void const *__P
)
109 return (__m128d
) __builtin_ia32_loadapd128_mask ((__v2df
*) __P
,
114 extern __inline __m128d
115 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
116 _mm_maskz_load_pd (__mmask8 __U
, void const *__P
)
118 return (__m128d
) __builtin_ia32_loadapd128_mask ((__v2df
*) __P
,
125 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
126 _mm256_mask_store_pd (void *__P
, __mmask8 __U
, __m256d __A
)
128 __builtin_ia32_storeapd256_mask ((__v4df
*) __P
,
134 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
135 _mm_mask_store_pd (void *__P
, __mmask8 __U
, __m128d __A
)
137 __builtin_ia32_storeapd128_mask ((__v2df
*) __P
,
142 extern __inline __m256
143 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
144 _mm256_mask_mov_ps (__m256 __W
, __mmask8 __U
, __m256 __A
)
146 return (__m256
) __builtin_ia32_movaps256_mask ((__v8sf
) __A
,
151 extern __inline __m256
152 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
153 _mm256_maskz_mov_ps (__mmask8 __U
, __m256 __A
)
155 return (__m256
) __builtin_ia32_movaps256_mask ((__v8sf
) __A
,
157 _mm256_setzero_ps (),
161 extern __inline __m128
162 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
163 _mm_mask_mov_ps (__m128 __W
, __mmask8 __U
, __m128 __A
)
165 return (__m128
) __builtin_ia32_movaps128_mask ((__v4sf
) __A
,
170 extern __inline __m128
171 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
172 _mm_maskz_mov_ps (__mmask8 __U
, __m128 __A
)
174 return (__m128
) __builtin_ia32_movaps128_mask ((__v4sf
) __A
,
180 extern __inline __m256
181 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
182 _mm256_mask_load_ps (__m256 __W
, __mmask8 __U
, void const *__P
)
184 return (__m256
) __builtin_ia32_loadaps256_mask ((__v8sf
*) __P
,
189 extern __inline __m256
190 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
191 _mm256_maskz_load_ps (__mmask8 __U
, void const *__P
)
193 return (__m256
) __builtin_ia32_loadaps256_mask ((__v8sf
*) __P
,
195 _mm256_setzero_ps (),
199 extern __inline __m128
200 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
201 _mm_mask_load_ps (__m128 __W
, __mmask8 __U
, void const *__P
)
203 return (__m128
) __builtin_ia32_loadaps128_mask ((__v4sf
*) __P
,
208 extern __inline __m128
209 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
210 _mm_maskz_load_ps (__mmask8 __U
, void const *__P
)
212 return (__m128
) __builtin_ia32_loadaps128_mask ((__v4sf
*) __P
,
219 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
220 _mm256_mask_store_ps (void *__P
, __mmask8 __U
, __m256 __A
)
222 __builtin_ia32_storeaps256_mask ((__v8sf
*) __P
,
228 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
229 _mm_mask_store_ps (void *__P
, __mmask8 __U
, __m128 __A
)
231 __builtin_ia32_storeaps128_mask ((__v4sf
*) __P
,
236 extern __inline __m256i
237 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
238 _mm256_mask_mov_epi64 (__m256i __W
, __mmask8 __U
, __m256i __A
)
240 return (__m256i
) __builtin_ia32_movdqa64_256_mask ((__v4di
) __A
,
245 extern __inline __m256i
246 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
247 _mm256_maskz_mov_epi64 (__mmask8 __U
, __m256i __A
)
249 return (__m256i
) __builtin_ia32_movdqa64_256_mask ((__v4di
) __A
,
251 _mm256_setzero_si256 (),
255 extern __inline __m128i
256 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
257 _mm_mask_mov_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
)
259 return (__m128i
) __builtin_ia32_movdqa64_128_mask ((__v2di
) __A
,
264 extern __inline __m128i
265 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
266 _mm_maskz_mov_epi64 (__mmask8 __U
, __m128i __A
)
268 return (__m128i
) __builtin_ia32_movdqa64_128_mask ((__v2di
) __A
,
274 extern __inline __m256i
275 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
276 _mm256_mask_load_epi64 (__m256i __W
, __mmask8 __U
, void const *__P
)
278 return (__m256i
) __builtin_ia32_movdqa64load256_mask ((__v4di
*) __P
,
284 extern __inline __m256i
285 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
286 _mm256_maskz_load_epi64 (__mmask8 __U
, void const *__P
)
288 return (__m256i
) __builtin_ia32_movdqa64load256_mask ((__v4di
*) __P
,
290 _mm256_setzero_si256 (),
295 extern __inline __m128i
296 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
297 _mm_mask_load_epi64 (__m128i __W
, __mmask8 __U
, void const *__P
)
299 return (__m128i
) __builtin_ia32_movdqa64load128_mask ((__v2di
*) __P
,
305 extern __inline __m128i
306 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
307 _mm_maskz_load_epi64 (__mmask8 __U
, void const *__P
)
309 return (__m128i
) __builtin_ia32_movdqa64load128_mask ((__v2di
*) __P
,
317 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
318 _mm256_mask_store_epi64 (void *__P
, __mmask8 __U
, __m256i __A
)
320 __builtin_ia32_movdqa64store256_mask ((__v4di
*) __P
,
326 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
327 _mm_mask_store_epi64 (void *__P
, __mmask8 __U
, __m128i __A
)
329 __builtin_ia32_movdqa64store128_mask ((__v2di
*) __P
,
334 extern __inline __m256i
335 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
336 _mm256_mask_mov_epi32 (__m256i __W
, __mmask8 __U
, __m256i __A
)
338 return (__m256i
) __builtin_ia32_movdqa32_256_mask ((__v8si
) __A
,
343 extern __inline __m256i
344 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
345 _mm256_maskz_mov_epi32 (__mmask8 __U
, __m256i __A
)
347 return (__m256i
) __builtin_ia32_movdqa32_256_mask ((__v8si
) __A
,
349 _mm256_setzero_si256 (),
353 extern __inline __m128i
354 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
355 _mm_mask_mov_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
)
357 return (__m128i
) __builtin_ia32_movdqa32_128_mask ((__v4si
) __A
,
362 extern __inline __m128i
363 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
364 _mm_maskz_mov_epi32 (__mmask8 __U
, __m128i __A
)
366 return (__m128i
) __builtin_ia32_movdqa32_128_mask ((__v4si
) __A
,
368 _mm_setzero_si128 (),
372 extern __inline __m256i
373 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
374 _mm256_mask_load_epi32 (__m256i __W
, __mmask8 __U
, void const *__P
)
376 return (__m256i
) __builtin_ia32_movdqa32load256_mask ((__v8si
*) __P
,
382 extern __inline __m256i
383 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
384 _mm256_maskz_load_epi32 (__mmask8 __U
, void const *__P
)
386 return (__m256i
) __builtin_ia32_movdqa32load256_mask ((__v8si
*) __P
,
388 _mm256_setzero_si256 (),
393 extern __inline __m128i
394 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
395 _mm_mask_load_epi32 (__m128i __W
, __mmask8 __U
, void const *__P
)
397 return (__m128i
) __builtin_ia32_movdqa32load128_mask ((__v4si
*) __P
,
403 extern __inline __m128i
404 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
405 _mm_maskz_load_epi32 (__mmask8 __U
, void const *__P
)
407 return (__m128i
) __builtin_ia32_movdqa32load128_mask ((__v4si
*) __P
,
409 _mm_setzero_si128 (),
415 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
416 _mm256_mask_store_epi32 (void *__P
, __mmask8 __U
, __m256i __A
)
418 __builtin_ia32_movdqa32store256_mask ((__v8si
*) __P
,
424 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
425 _mm_mask_store_epi32 (void *__P
, __mmask8 __U
, __m128i __A
)
427 __builtin_ia32_movdqa32store128_mask ((__v4si
*) __P
,
432 extern __inline __m128i
433 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
434 _mm_setzero_hi (void)
436 return __extension__ (__m128i
) (__v8hi
)
438 0, 0, 0, 0, 0, 0, 0, 0};
441 extern __inline __m128d
442 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
443 _mm_mask_add_pd (__m128d __W
, __mmask8 __U
, __m128d __A
, __m128d __B
)
445 return (__m128d
) __builtin_ia32_addpd128_mask ((__v2df
) __A
,
451 extern __inline __m128d
452 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
453 _mm_maskz_add_pd (__mmask8 __U
, __m128d __A
, __m128d __B
)
455 return (__m128d
) __builtin_ia32_addpd128_mask ((__v2df
) __A
,
462 extern __inline __m256d
463 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
464 _mm256_mask_add_pd (__m256d __W
, __mmask8 __U
, __m256d __A
,
467 return (__m256d
) __builtin_ia32_addpd256_mask ((__v4df
) __A
,
473 extern __inline __m256d
474 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
475 _mm256_maskz_add_pd (__mmask8 __U
, __m256d __A
, __m256d __B
)
477 return (__m256d
) __builtin_ia32_addpd256_mask ((__v4df
) __A
,
480 _mm256_setzero_pd (),
484 extern __inline __m128
485 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
486 _mm_mask_add_ps (__m128 __W
, __mmask16 __U
, __m128 __A
, __m128 __B
)
488 return (__m128
) __builtin_ia32_addps128_mask ((__v4sf
) __A
,
494 extern __inline __m128
495 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
496 _mm_maskz_add_ps (__mmask16 __U
, __m128 __A
, __m128 __B
)
498 return (__m128
) __builtin_ia32_addps128_mask ((__v4sf
) __A
,
505 extern __inline __m256
506 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
507 _mm256_mask_add_ps (__m256 __W
, __mmask16 __U
, __m256 __A
, __m256 __B
)
509 return (__m256
) __builtin_ia32_addps256_mask ((__v8sf
) __A
,
515 extern __inline __m256
516 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
517 _mm256_maskz_add_ps (__mmask16 __U
, __m256 __A
, __m256 __B
)
519 return (__m256
) __builtin_ia32_addps256_mask ((__v8sf
) __A
,
522 _mm256_setzero_ps (),
526 extern __inline __m128d
527 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
528 _mm_mask_sub_pd (__m128d __W
, __mmask8 __U
, __m128d __A
, __m128d __B
)
530 return (__m128d
) __builtin_ia32_subpd128_mask ((__v2df
) __A
,
536 extern __inline __m128d
537 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
538 _mm_maskz_sub_pd (__mmask8 __U
, __m128d __A
, __m128d __B
)
540 return (__m128d
) __builtin_ia32_subpd128_mask ((__v2df
) __A
,
547 extern __inline __m256d
548 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
549 _mm256_mask_sub_pd (__m256d __W
, __mmask8 __U
, __m256d __A
,
552 return (__m256d
) __builtin_ia32_subpd256_mask ((__v4df
) __A
,
558 extern __inline __m256d
559 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
560 _mm256_maskz_sub_pd (__mmask8 __U
, __m256d __A
, __m256d __B
)
562 return (__m256d
) __builtin_ia32_subpd256_mask ((__v4df
) __A
,
565 _mm256_setzero_pd (),
569 extern __inline __m128
570 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
571 _mm_mask_sub_ps (__m128 __W
, __mmask16 __U
, __m128 __A
, __m128 __B
)
573 return (__m128
) __builtin_ia32_subps128_mask ((__v4sf
) __A
,
579 extern __inline __m128
580 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
581 _mm_maskz_sub_ps (__mmask16 __U
, __m128 __A
, __m128 __B
)
583 return (__m128
) __builtin_ia32_subps128_mask ((__v4sf
) __A
,
590 extern __inline __m256
591 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
592 _mm256_mask_sub_ps (__m256 __W
, __mmask16 __U
, __m256 __A
, __m256 __B
)
594 return (__m256
) __builtin_ia32_subps256_mask ((__v8sf
) __A
,
600 extern __inline __m256
601 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
602 _mm256_maskz_sub_ps (__mmask16 __U
, __m256 __A
, __m256 __B
)
604 return (__m256
) __builtin_ia32_subps256_mask ((__v8sf
) __A
,
607 _mm256_setzero_ps (),
612 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
613 _mm256_store_epi64 (void *__P
, __m256i __A
)
615 *(__m256i
*) __P
= __A
;
619 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
620 _mm_store_epi64 (void *__P
, __m128i __A
)
622 *(__m128i
*) __P
= __A
;
625 extern __inline __m256d
626 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
627 _mm256_mask_loadu_pd (__m256d __W
, __mmask8 __U
, void const *__P
)
629 return (__m256d
) __builtin_ia32_loadupd256_mask ((const double *) __P
,
634 extern __inline __m256d
635 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
636 _mm256_maskz_loadu_pd (__mmask8 __U
, void const *__P
)
638 return (__m256d
) __builtin_ia32_loadupd256_mask ((const double *) __P
,
640 _mm256_setzero_pd (),
644 extern __inline __m128d
645 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
646 _mm_mask_loadu_pd (__m128d __W
, __mmask8 __U
, void const *__P
)
648 return (__m128d
) __builtin_ia32_loadupd128_mask ((const double *) __P
,
653 extern __inline __m128d
654 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
655 _mm_maskz_loadu_pd (__mmask8 __U
, void const *__P
)
657 return (__m128d
) __builtin_ia32_loadupd128_mask ((const double *) __P
,
664 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
665 _mm256_mask_storeu_pd (void *__P
, __mmask8 __U
, __m256d __A
)
667 __builtin_ia32_storeupd256_mask ((double *) __P
,
673 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
674 _mm_mask_storeu_pd (void *__P
, __mmask8 __U
, __m128d __A
)
676 __builtin_ia32_storeupd128_mask ((double *) __P
,
681 extern __inline __m256
682 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
683 _mm256_mask_loadu_ps (__m256 __W
, __mmask8 __U
, void const *__P
)
685 return (__m256
) __builtin_ia32_loadups256_mask ((const float *) __P
,
690 extern __inline __m256
691 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
692 _mm256_maskz_loadu_ps (__mmask8 __U
, void const *__P
)
694 return (__m256
) __builtin_ia32_loadups256_mask ((const float *) __P
,
696 _mm256_setzero_ps (),
700 extern __inline __m128
701 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
702 _mm_mask_loadu_ps (__m128 __W
, __mmask8 __U
, void const *__P
)
704 return (__m128
) __builtin_ia32_loadups128_mask ((const float *) __P
,
709 extern __inline __m128
710 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
711 _mm_maskz_loadu_ps (__mmask8 __U
, void const *__P
)
713 return (__m128
) __builtin_ia32_loadups128_mask ((const float *) __P
,
720 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
721 _mm256_mask_storeu_ps (void *__P
, __mmask8 __U
, __m256 __A
)
723 __builtin_ia32_storeups256_mask ((float *) __P
,
729 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
730 _mm_mask_storeu_ps (void *__P
, __mmask8 __U
, __m128 __A
)
732 __builtin_ia32_storeups128_mask ((float *) __P
,
737 extern __inline __m256i
738 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
739 _mm256_mask_loadu_epi64 (__m256i __W
, __mmask8 __U
, void const *__P
)
741 return (__m256i
) __builtin_ia32_loaddqudi256_mask ((const long long *) __P
,
746 extern __inline __m256i
747 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
748 _mm256_maskz_loadu_epi64 (__mmask8 __U
, void const *__P
)
750 return (__m256i
) __builtin_ia32_loaddqudi256_mask ((const long long *) __P
,
752 _mm256_setzero_si256 (),
756 extern __inline __m128i
757 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
758 _mm_mask_loadu_epi64 (__m128i __W
, __mmask8 __U
, void const *__P
)
760 return (__m128i
) __builtin_ia32_loaddqudi128_mask ((const long long *) __P
,
765 extern __inline __m128i
766 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
767 _mm_maskz_loadu_epi64 (__mmask8 __U
, void const *__P
)
769 return (__m128i
) __builtin_ia32_loaddqudi128_mask ((const long long *) __P
,
776 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
777 _mm256_mask_storeu_epi64 (void *__P
, __mmask8 __U
, __m256i __A
)
779 __builtin_ia32_storedqudi256_mask ((long long *) __P
,
785 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
786 _mm_mask_storeu_epi64 (void *__P
, __mmask8 __U
, __m128i __A
)
788 __builtin_ia32_storedqudi128_mask ((long long *) __P
,
793 extern __inline __m256i
794 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
795 _mm256_mask_loadu_epi32 (__m256i __W
, __mmask8 __U
, void const *__P
)
797 return (__m256i
) __builtin_ia32_loaddqusi256_mask ((const int *) __P
,
802 extern __inline __m256i
803 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
804 _mm256_maskz_loadu_epi32 (__mmask8 __U
, void const *__P
)
806 return (__m256i
) __builtin_ia32_loaddqusi256_mask ((const int *) __P
,
808 _mm256_setzero_si256 (),
812 extern __inline __m128i
813 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
814 _mm_mask_loadu_epi32 (__m128i __W
, __mmask8 __U
, void const *__P
)
816 return (__m128i
) __builtin_ia32_loaddqusi128_mask ((const int *) __P
,
821 extern __inline __m128i
822 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
823 _mm_maskz_loadu_epi32 (__mmask8 __U
, void const *__P
)
825 return (__m128i
) __builtin_ia32_loaddqusi128_mask ((const int *) __P
,
827 _mm_setzero_si128 (),
832 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
833 _mm256_mask_storeu_epi32 (void *__P
, __mmask8 __U
, __m256i __A
)
835 __builtin_ia32_storedqusi256_mask ((int *) __P
,
841 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
842 _mm_mask_storeu_epi32 (void *__P
, __mmask8 __U
, __m128i __A
)
844 __builtin_ia32_storedqusi128_mask ((int *) __P
,
849 extern __inline __m256i
850 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
851 _mm256_mask_abs_epi32 (__m256i __W
, __mmask8 __U
, __m256i __A
)
853 return (__m256i
) __builtin_ia32_pabsd256_mask ((__v8si
) __A
,
858 extern __inline __m256i
859 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
860 _mm256_maskz_abs_epi32 (__mmask8 __U
, __m256i __A
)
862 return (__m256i
) __builtin_ia32_pabsd256_mask ((__v8si
) __A
,
864 _mm256_setzero_si256 (),
868 extern __inline __m128i
869 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
870 _mm_mask_abs_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
)
872 return (__m128i
) __builtin_ia32_pabsd128_mask ((__v4si
) __A
,
877 extern __inline __m128i
878 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
879 _mm_maskz_abs_epi32 (__mmask8 __U
, __m128i __A
)
881 return (__m128i
) __builtin_ia32_pabsd128_mask ((__v4si
) __A
,
883 _mm_setzero_si128 (),
887 extern __inline __m256i
888 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
889 _mm256_abs_epi64 (__m256i __A
)
891 return (__m256i
) __builtin_ia32_pabsq256_mask ((__v4di
) __A
,
893 _mm256_setzero_si256 (),
897 extern __inline __m256i
898 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
899 _mm256_mask_abs_epi64 (__m256i __W
, __mmask8 __U
, __m256i __A
)
901 return (__m256i
) __builtin_ia32_pabsq256_mask ((__v4di
) __A
,
906 extern __inline __m256i
907 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
908 _mm256_maskz_abs_epi64 (__mmask8 __U
, __m256i __A
)
910 return (__m256i
) __builtin_ia32_pabsq256_mask ((__v4di
) __A
,
912 _mm256_setzero_si256 (),
916 extern __inline __m128i
917 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
918 _mm_abs_epi64 (__m128i __A
)
920 return (__m128i
) __builtin_ia32_pabsq128_mask ((__v2di
) __A
,
926 extern __inline __m128i
927 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
928 _mm_mask_abs_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
)
930 return (__m128i
) __builtin_ia32_pabsq128_mask ((__v2di
) __A
,
935 extern __inline __m128i
936 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
937 _mm_maskz_abs_epi64 (__mmask8 __U
, __m128i __A
)
939 return (__m128i
) __builtin_ia32_pabsq128_mask ((__v2di
) __A
,
945 extern __inline __m128i
946 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
947 _mm256_cvtpd_epu32 (__m256d __A
)
949 return (__m128i
) __builtin_ia32_cvtpd2udq256_mask ((__v4df
) __A
,
951 _mm_setzero_si128 (),
955 extern __inline __m128i
956 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
957 _mm256_mask_cvtpd_epu32 (__m128i __W
, __mmask8 __U
, __m256d __A
)
959 return (__m128i
) __builtin_ia32_cvtpd2udq256_mask ((__v4df
) __A
,
964 extern __inline __m128i
965 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
966 _mm256_maskz_cvtpd_epu32 (__mmask8 __U
, __m256d __A
)
968 return (__m128i
) __builtin_ia32_cvtpd2udq256_mask ((__v4df
) __A
,
970 _mm_setzero_si128 (),
974 extern __inline __m128i
975 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
976 _mm_cvtpd_epu32 (__m128d __A
)
978 return (__m128i
) __builtin_ia32_cvtpd2udq128_mask ((__v2df
) __A
,
980 _mm_setzero_si128 (),
984 extern __inline __m128i
985 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
986 _mm_mask_cvtpd_epu32 (__m128i __W
, __mmask8 __U
, __m128d __A
)
988 return (__m128i
) __builtin_ia32_cvtpd2udq128_mask ((__v2df
) __A
,
993 extern __inline __m128i
994 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
995 _mm_maskz_cvtpd_epu32 (__mmask8 __U
, __m128d __A
)
997 return (__m128i
) __builtin_ia32_cvtpd2udq128_mask ((__v2df
) __A
,
999 _mm_setzero_si128 (),
1003 extern __inline __m256i
1004 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1005 _mm256_mask_cvttps_epi32 (__m256i __W
, __mmask8 __U
, __m256 __A
)
1007 return (__m256i
) __builtin_ia32_cvttps2dq256_mask ((__v8sf
) __A
,
1012 extern __inline __m256i
1013 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1014 _mm256_maskz_cvttps_epi32 (__mmask8 __U
, __m256 __A
)
1016 return (__m256i
) __builtin_ia32_cvttps2dq256_mask ((__v8sf
) __A
,
1018 _mm256_setzero_si256 (),
1022 extern __inline __m128i
1023 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1024 _mm_mask_cvttps_epi32 (__m128i __W
, __mmask8 __U
, __m128 __A
)
1026 return (__m128i
) __builtin_ia32_cvttps2dq128_mask ((__v4sf
) __A
,
1031 extern __inline __m128i
1032 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1033 _mm_maskz_cvttps_epi32 (__mmask8 __U
, __m128 __A
)
1035 return (__m128i
) __builtin_ia32_cvttps2dq128_mask ((__v4sf
) __A
,
1037 _mm_setzero_si128 (),
1041 extern __inline __m256i
1042 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1043 _mm256_cvttps_epu32 (__m256 __A
)
1045 return (__m256i
) __builtin_ia32_cvttps2udq256_mask ((__v8sf
) __A
,
1047 _mm256_setzero_si256 (),
1051 extern __inline __m256i
1052 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1053 _mm256_mask_cvttps_epu32 (__m256i __W
, __mmask8 __U
, __m256 __A
)
1055 return (__m256i
) __builtin_ia32_cvttps2udq256_mask ((__v8sf
) __A
,
1060 extern __inline __m256i
1061 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1062 _mm256_maskz_cvttps_epu32 (__mmask8 __U
, __m256 __A
)
1064 return (__m256i
) __builtin_ia32_cvttps2udq256_mask ((__v8sf
) __A
,
1066 _mm256_setzero_si256 (),
1070 extern __inline __m128i
1071 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1072 _mm_cvttps_epu32 (__m128 __A
)
1074 return (__m128i
) __builtin_ia32_cvttps2udq128_mask ((__v4sf
) __A
,
1076 _mm_setzero_si128 (),
1080 extern __inline __m128i
1081 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1082 _mm_mask_cvttps_epu32 (__m128i __W
, __mmask8 __U
, __m128 __A
)
1084 return (__m128i
) __builtin_ia32_cvttps2udq128_mask ((__v4sf
) __A
,
1089 extern __inline __m128i
1090 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1091 _mm_maskz_cvttps_epu32 (__mmask8 __U
, __m128 __A
)
1093 return (__m128i
) __builtin_ia32_cvttps2udq128_mask ((__v4sf
) __A
,
1095 _mm_setzero_si128 (),
1099 extern __inline __m128i
1100 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1101 _mm256_mask_cvttpd_epi32 (__m128i __W
, __mmask8 __U
, __m256d __A
)
1103 return (__m128i
) __builtin_ia32_cvttpd2dq256_mask ((__v4df
) __A
,
1108 extern __inline __m128i
1109 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1110 _mm256_maskz_cvttpd_epi32 (__mmask8 __U
, __m256d __A
)
1112 return (__m128i
) __builtin_ia32_cvttpd2dq256_mask ((__v4df
) __A
,
1114 _mm_setzero_si128 (),
1118 extern __inline __m128i
1119 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1120 _mm_mask_cvttpd_epi32 (__m128i __W
, __mmask8 __U
, __m128d __A
)
1122 return (__m128i
) __builtin_ia32_cvttpd2dq128_mask ((__v2df
) __A
,
1127 extern __inline __m128i
1128 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1129 _mm_maskz_cvttpd_epi32 (__mmask8 __U
, __m128d __A
)
1131 return (__m128i
) __builtin_ia32_cvttpd2dq128_mask ((__v2df
) __A
,
1133 _mm_setzero_si128 (),
1137 extern __inline __m128i
1138 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1139 _mm256_cvttpd_epu32 (__m256d __A
)
1141 return (__m128i
) __builtin_ia32_cvttpd2udq256_mask ((__v4df
) __A
,
1143 _mm_setzero_si128 (),
1147 extern __inline __m128i
1148 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1149 _mm256_mask_cvttpd_epu32 (__m128i __W
, __mmask8 __U
, __m256d __A
)
1151 return (__m128i
) __builtin_ia32_cvttpd2udq256_mask ((__v4df
) __A
,
1156 extern __inline __m128i
1157 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1158 _mm256_maskz_cvttpd_epu32 (__mmask8 __U
, __m256d __A
)
1160 return (__m128i
) __builtin_ia32_cvttpd2udq256_mask ((__v4df
) __A
,
1162 _mm_setzero_si128 (),
1166 extern __inline __m128i
1167 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1168 _mm_cvttpd_epu32 (__m128d __A
)
1170 return (__m128i
) __builtin_ia32_cvttpd2udq128_mask ((__v2df
) __A
,
1172 _mm_setzero_si128 (),
1176 extern __inline __m128i
1177 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1178 _mm_mask_cvttpd_epu32 (__m128i __W
, __mmask8 __U
, __m128d __A
)
1180 return (__m128i
) __builtin_ia32_cvttpd2udq128_mask ((__v2df
) __A
,
1185 extern __inline __m128i
1186 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1187 _mm_maskz_cvttpd_epu32 (__mmask8 __U
, __m128d __A
)
1189 return (__m128i
) __builtin_ia32_cvttpd2udq128_mask ((__v2df
) __A
,
1191 _mm_setzero_si128 (),
1195 extern __inline __m128i
1196 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1197 _mm256_mask_cvtpd_epi32 (__m128i __W
, __mmask8 __U
, __m256d __A
)
1199 return (__m128i
) __builtin_ia32_cvtpd2dq256_mask ((__v4df
) __A
,
1204 extern __inline __m128i
1205 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1206 _mm256_maskz_cvtpd_epi32 (__mmask8 __U
, __m256d __A
)
1208 return (__m128i
) __builtin_ia32_cvtpd2dq256_mask ((__v4df
) __A
,
1210 _mm_setzero_si128 (),
1214 extern __inline __m128i
1215 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1216 _mm_mask_cvtpd_epi32 (__m128i __W
, __mmask8 __U
, __m128d __A
)
1218 return (__m128i
) __builtin_ia32_cvtpd2dq128_mask ((__v2df
) __A
,
1223 extern __inline __m128i
1224 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1225 _mm_maskz_cvtpd_epi32 (__mmask8 __U
, __m128d __A
)
1227 return (__m128i
) __builtin_ia32_cvtpd2dq128_mask ((__v2df
) __A
,
1229 _mm_setzero_si128 (),
1233 extern __inline __m256d
1234 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1235 _mm256_mask_cvtepi32_pd (__m256d __W
, __mmask8 __U
, __m128i __A
)
1237 return (__m256d
) __builtin_ia32_cvtdq2pd256_mask ((__v4si
) __A
,
1242 extern __inline __m256d
1243 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1244 _mm256_maskz_cvtepi32_pd (__mmask8 __U
, __m128i __A
)
1246 return (__m256d
) __builtin_ia32_cvtdq2pd256_mask ((__v4si
) __A
,
1248 _mm256_setzero_pd (),
1252 extern __inline __m128d
1253 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1254 _mm_mask_cvtepi32_pd (__m128d __W
, __mmask8 __U
, __m128i __A
)
1256 return (__m128d
) __builtin_ia32_cvtdq2pd128_mask ((__v4si
) __A
,
1261 extern __inline __m128d
1262 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1263 _mm_maskz_cvtepi32_pd (__mmask8 __U
, __m128i __A
)
1265 return (__m128d
) __builtin_ia32_cvtdq2pd128_mask ((__v4si
) __A
,
1271 extern __inline __m256d
1272 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1273 _mm256_cvtepu32_pd (__m128i __A
)
1275 return (__m256d
) __builtin_ia32_cvtudq2pd256_mask ((__v4si
) __A
,
1277 _mm256_setzero_pd (),
1281 extern __inline __m256d
1282 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1283 _mm256_mask_cvtepu32_pd (__m256d __W
, __mmask8 __U
, __m128i __A
)
1285 return (__m256d
) __builtin_ia32_cvtudq2pd256_mask ((__v4si
) __A
,
1290 extern __inline __m256d
1291 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1292 _mm256_maskz_cvtepu32_pd (__mmask8 __U
, __m128i __A
)
1294 return (__m256d
) __builtin_ia32_cvtudq2pd256_mask ((__v4si
) __A
,
1296 _mm256_setzero_pd (),
1300 extern __inline __m128d
1301 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1302 _mm_cvtepu32_pd (__m128i __A
)
1304 return (__m128d
) __builtin_ia32_cvtudq2pd128_mask ((__v4si
) __A
,
1310 extern __inline __m128d
1311 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1312 _mm_mask_cvtepu32_pd (__m128d __W
, __mmask8 __U
, __m128i __A
)
1314 return (__m128d
) __builtin_ia32_cvtudq2pd128_mask ((__v4si
) __A
,
1319 extern __inline __m128d
1320 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1321 _mm_maskz_cvtepu32_pd (__mmask8 __U
, __m128i __A
)
1323 return (__m128d
) __builtin_ia32_cvtudq2pd128_mask ((__v4si
) __A
,
1329 extern __inline __m256
1330 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1331 _mm256_mask_cvtepi32_ps (__m256 __W
, __mmask8 __U
, __m256i __A
)
1333 return (__m256
) __builtin_ia32_cvtdq2ps256_mask ((__v8si
) __A
,
1338 extern __inline __m256
1339 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1340 _mm256_maskz_cvtepi32_ps (__mmask16 __U
, __m256i __A
)
1342 return (__m256
) __builtin_ia32_cvtdq2ps256_mask ((__v8si
) __A
,
1344 _mm256_setzero_ps (),
1348 extern __inline __m128
1349 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1350 _mm_mask_cvtepi32_ps (__m128 __W
, __mmask8 __U
, __m128i __A
)
1352 return (__m128
) __builtin_ia32_cvtdq2ps128_mask ((__v4si
) __A
,
1357 extern __inline __m128
1358 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1359 _mm_maskz_cvtepi32_ps (__mmask16 __U
, __m128i __A
)
1361 return (__m128
) __builtin_ia32_cvtdq2ps128_mask ((__v4si
) __A
,
1367 extern __inline __m256
1368 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1369 _mm256_cvtepu32_ps (__m256i __A
)
1371 return (__m256
) __builtin_ia32_cvtudq2ps256_mask ((__v8si
) __A
,
1373 _mm256_setzero_ps (),
1377 extern __inline __m256
1378 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1379 _mm256_mask_cvtepu32_ps (__m256 __W
, __mmask8 __U
, __m256i __A
)
1381 return (__m256
) __builtin_ia32_cvtudq2ps256_mask ((__v8si
) __A
,
1386 extern __inline __m256
1387 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1388 _mm256_maskz_cvtepu32_ps (__mmask8 __U
, __m256i __A
)
1390 return (__m256
) __builtin_ia32_cvtudq2ps256_mask ((__v8si
) __A
,
1392 _mm256_setzero_ps (),
1396 extern __inline __m128
1397 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1398 _mm_cvtepu32_ps (__m128i __A
)
1400 return (__m128
) __builtin_ia32_cvtudq2ps128_mask ((__v4si
) __A
,
1406 extern __inline __m128
1407 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1408 _mm_mask_cvtepu32_ps (__m128 __W
, __mmask8 __U
, __m128i __A
)
1410 return (__m128
) __builtin_ia32_cvtudq2ps128_mask ((__v4si
) __A
,
1415 extern __inline __m128
1416 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1417 _mm_maskz_cvtepu32_ps (__mmask8 __U
, __m128i __A
)
1419 return (__m128
) __builtin_ia32_cvtudq2ps128_mask ((__v4si
) __A
,
1425 extern __inline __m256d
1426 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1427 _mm256_mask_cvtps_pd (__m256d __W
, __mmask8 __U
, __m128 __A
)
1429 return (__m256d
) __builtin_ia32_cvtps2pd256_mask ((__v4sf
) __A
,
1434 extern __inline __m256d
1435 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1436 _mm256_maskz_cvtps_pd (__mmask8 __U
, __m128 __A
)
1438 return (__m256d
) __builtin_ia32_cvtps2pd256_mask ((__v4sf
) __A
,
1440 _mm256_setzero_pd (),
1444 extern __inline __m128d
1445 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1446 _mm_mask_cvtps_pd (__m128d __W
, __mmask8 __U
, __m128 __A
)
1448 return (__m128d
) __builtin_ia32_cvtps2pd128_mask ((__v4sf
) __A
,
1453 extern __inline __m128d
1454 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1455 _mm_maskz_cvtps_pd (__mmask8 __U
, __m128 __A
)
1457 return (__m128d
) __builtin_ia32_cvtps2pd128_mask ((__v4sf
) __A
,
1463 extern __inline __m128i
1464 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1465 _mm_cvtepi32_epi8 (__m128i __A
)
1467 return (__m128i
) __builtin_ia32_pmovdb128_mask ((__v4si
) __A
,
1468 (__v16qi
)_mm_undefined_si128(),
1472 extern __inline
void
1473 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1474 _mm_mask_cvtepi32_storeu_epi8 (void * __P
, __mmask8 __M
, __m128i __A
)
1476 __builtin_ia32_pmovdb128mem_mask ((__v16qi
*) __P
, (__v4si
) __A
, __M
);
1479 extern __inline __m128i
1480 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1481 _mm_mask_cvtepi32_epi8 (__m128i __O
, __mmask8 __M
, __m128i __A
)
1483 return (__m128i
) __builtin_ia32_pmovdb128_mask ((__v4si
) __A
,
1484 (__v16qi
) __O
, __M
);
1487 extern __inline __m128i
1488 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1489 _mm_maskz_cvtepi32_epi8 (__mmask8 __M
, __m128i __A
)
1491 return (__m128i
) __builtin_ia32_pmovdb128_mask ((__v4si
) __A
,
1493 _mm_setzero_si128 (),
1497 extern __inline __m128i
1498 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1499 _mm256_cvtepi32_epi8 (__m256i __A
)
1501 return (__m128i
) __builtin_ia32_pmovdb256_mask ((__v8si
) __A
,
1502 (__v16qi
)_mm_undefined_si128(),
1506 extern __inline __m128i
1507 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1508 _mm256_mask_cvtepi32_epi8 (__m128i __O
, __mmask8 __M
, __m256i __A
)
1510 return (__m128i
) __builtin_ia32_pmovdb256_mask ((__v8si
) __A
,
1511 (__v16qi
) __O
, __M
);
1514 extern __inline
void
1515 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1516 _mm256_mask_cvtepi32_storeu_epi8 (void * __P
, __mmask8 __M
, __m256i __A
)
1518 __builtin_ia32_pmovdb256mem_mask ((__v16qi
*) __P
, (__v8si
) __A
, __M
);
1521 extern __inline __m128i
1522 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1523 _mm256_maskz_cvtepi32_epi8 (__mmask8 __M
, __m256i __A
)
1525 return (__m128i
) __builtin_ia32_pmovdb256_mask ((__v8si
) __A
,
1527 _mm_setzero_si128 (),
1531 extern __inline __m128i
1532 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1533 _mm_cvtsepi32_epi8 (__m128i __A
)
1535 return (__m128i
) __builtin_ia32_pmovsdb128_mask ((__v4si
) __A
,
1536 (__v16qi
)_mm_undefined_si128(),
1540 extern __inline
void
1541 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1542 _mm_mask_cvtsepi32_storeu_epi8 (void * __P
, __mmask8 __M
, __m128i __A
)
1544 __builtin_ia32_pmovsdb128mem_mask ((__v16qi
*) __P
, (__v4si
) __A
, __M
);
1547 extern __inline __m128i
1548 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1549 _mm_mask_cvtsepi32_epi8 (__m128i __O
, __mmask8 __M
, __m128i __A
)
1551 return (__m128i
) __builtin_ia32_pmovsdb128_mask ((__v4si
) __A
,
1552 (__v16qi
) __O
, __M
);
1555 extern __inline __m128i
1556 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1557 _mm_maskz_cvtsepi32_epi8 (__mmask8 __M
, __m128i __A
)
1559 return (__m128i
) __builtin_ia32_pmovsdb128_mask ((__v4si
) __A
,
1561 _mm_setzero_si128 (),
1565 extern __inline __m128i
1566 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1567 _mm256_cvtsepi32_epi8 (__m256i __A
)
1569 return (__m128i
) __builtin_ia32_pmovsdb256_mask ((__v8si
) __A
,
1570 (__v16qi
)_mm_undefined_si128(),
1574 extern __inline
void
1575 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1576 _mm256_mask_cvtsepi32_storeu_epi8 (void * __P
, __mmask8 __M
, __m256i __A
)
1578 __builtin_ia32_pmovsdb256mem_mask ((__v16qi
*) __P
, (__v8si
) __A
, __M
);
1581 extern __inline __m128i
1582 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1583 _mm256_mask_cvtsepi32_epi8 (__m128i __O
, __mmask8 __M
, __m256i __A
)
1585 return (__m128i
) __builtin_ia32_pmovsdb256_mask ((__v8si
) __A
,
1586 (__v16qi
) __O
, __M
);
1589 extern __inline __m128i
1590 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1591 _mm256_maskz_cvtsepi32_epi8 (__mmask8 __M
, __m256i __A
)
1593 return (__m128i
) __builtin_ia32_pmovsdb256_mask ((__v8si
) __A
,
1595 _mm_setzero_si128 (),
1599 extern __inline __m128i
1600 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1601 _mm_cvtusepi32_epi8 (__m128i __A
)
1603 return (__m128i
) __builtin_ia32_pmovusdb128_mask ((__v4si
) __A
,
1604 (__v16qi
)_mm_undefined_si128(),
1608 extern __inline
void
1609 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1610 _mm_mask_cvtusepi32_storeu_epi8 (void * __P
, __mmask8 __M
, __m128i __A
)
1612 __builtin_ia32_pmovusdb128mem_mask ((__v16qi
*) __P
, (__v4si
) __A
, __M
);
1615 extern __inline __m128i
1616 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1617 _mm_mask_cvtusepi32_epi8 (__m128i __O
, __mmask8 __M
, __m128i __A
)
1619 return (__m128i
) __builtin_ia32_pmovusdb128_mask ((__v4si
) __A
,
1624 extern __inline __m128i
1625 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1626 _mm_maskz_cvtusepi32_epi8 (__mmask8 __M
, __m128i __A
)
1628 return (__m128i
) __builtin_ia32_pmovusdb128_mask ((__v4si
) __A
,
1630 _mm_setzero_si128 (),
1634 extern __inline __m128i
1635 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1636 _mm256_cvtusepi32_epi8 (__m256i __A
)
1638 return (__m128i
) __builtin_ia32_pmovusdb256_mask ((__v8si
) __A
,
1639 (__v16qi
)_mm_undefined_si128(),
1643 extern __inline
void
1644 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1645 _mm256_mask_cvtusepi32_storeu_epi8 (void * __P
, __mmask8 __M
, __m256i __A
)
1647 __builtin_ia32_pmovusdb256mem_mask ((__v16qi
*) __P
, (__v8si
) __A
, __M
);
1650 extern __inline __m128i
1651 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1652 _mm256_mask_cvtusepi32_epi8 (__m128i __O
, __mmask8 __M
, __m256i __A
)
1654 return (__m128i
) __builtin_ia32_pmovusdb256_mask ((__v8si
) __A
,
1659 extern __inline __m128i
1660 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1661 _mm256_maskz_cvtusepi32_epi8 (__mmask8 __M
, __m256i __A
)
1663 return (__m128i
) __builtin_ia32_pmovusdb256_mask ((__v8si
) __A
,
1665 _mm_setzero_si128 (),
1669 extern __inline __m128i
1670 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1671 _mm_cvtepi32_epi16 (__m128i __A
)
1673 return (__m128i
) __builtin_ia32_pmovdw128_mask ((__v4si
) __A
,
1674 (__v8hi
) _mm_setzero_si128 (),
1678 extern __inline
void
1679 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1680 _mm_mask_cvtepi32_storeu_epi16 (void * __P
, __mmask8 __M
, __m128i __A
)
1682 __builtin_ia32_pmovdw128mem_mask ((__v8hi
*) __P
, (__v4si
) __A
, __M
);
1685 extern __inline __m128i
1686 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1687 _mm_mask_cvtepi32_epi16 (__m128i __O
, __mmask8 __M
, __m128i __A
)
1689 return (__m128i
) __builtin_ia32_pmovdw128_mask ((__v4si
) __A
,
1693 extern __inline __m128i
1694 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1695 _mm_maskz_cvtepi32_epi16 (__mmask8 __M
, __m128i __A
)
1697 return (__m128i
) __builtin_ia32_pmovdw128_mask ((__v4si
) __A
,
1699 _mm_setzero_si128 (),
1703 extern __inline __m128i
1704 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1705 _mm256_cvtepi32_epi16 (__m256i __A
)
1707 return (__m128i
) __builtin_ia32_pmovdw256_mask ((__v8si
) __A
,
1708 (__v8hi
)_mm_setzero_si128 (),
1712 extern __inline
void
1713 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1714 _mm256_mask_cvtepi32_storeu_epi16 (void * __P
, __mmask8 __M
, __m256i __A
)
1716 __builtin_ia32_pmovdw256mem_mask ((__v8hi
*) __P
, (__v8si
) __A
, __M
);
1719 extern __inline __m128i
1720 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1721 _mm256_mask_cvtepi32_epi16 (__m128i __O
, __mmask8 __M
, __m256i __A
)
1723 return (__m128i
) __builtin_ia32_pmovdw256_mask ((__v8si
) __A
,
1727 extern __inline __m128i
1728 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1729 _mm256_maskz_cvtepi32_epi16 (__mmask8 __M
, __m256i __A
)
1731 return (__m128i
) __builtin_ia32_pmovdw256_mask ((__v8si
) __A
,
1733 _mm_setzero_si128 (),
1737 extern __inline __m128i
1738 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1739 _mm_cvtsepi32_epi16 (__m128i __A
)
1741 return (__m128i
) __builtin_ia32_pmovsdw128_mask ((__v4si
) __A
,
1742 (__v8hi
)_mm_setzero_si128 (),
1746 extern __inline
void
1747 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1748 _mm_mask_cvtsepi32_storeu_epi16 (void * __P
, __mmask8 __M
, __m128i __A
)
1750 __builtin_ia32_pmovsdw128mem_mask ((__v8hi
*) __P
, (__v4si
) __A
, __M
);
1753 extern __inline __m128i
1754 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1755 _mm_mask_cvtsepi32_epi16 (__m128i __O
, __mmask8 __M
, __m128i __A
)
1757 return (__m128i
) __builtin_ia32_pmovsdw128_mask ((__v4si
) __A
,
1762 extern __inline __m128i
1763 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1764 _mm_maskz_cvtsepi32_epi16 (__mmask8 __M
, __m128i __A
)
1766 return (__m128i
) __builtin_ia32_pmovsdw128_mask ((__v4si
) __A
,
1768 _mm_setzero_si128 (),
1772 extern __inline __m128i
1773 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1774 _mm256_cvtsepi32_epi16 (__m256i __A
)
1776 return (__m128i
) __builtin_ia32_pmovsdw256_mask ((__v8si
) __A
,
1777 (__v8hi
)_mm_undefined_si128(),
1781 extern __inline
void
1782 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1783 _mm256_mask_cvtsepi32_storeu_epi16 (void * __P
, __mmask8 __M
, __m256i __A
)
1785 __builtin_ia32_pmovsdw256mem_mask ((__v8hi
*) __P
, (__v8si
) __A
, __M
);
1788 extern __inline __m128i
1789 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1790 _mm256_mask_cvtsepi32_epi16 (__m128i __O
, __mmask8 __M
, __m256i __A
)
1792 return (__m128i
) __builtin_ia32_pmovsdw256_mask ((__v8si
) __A
,
1796 extern __inline __m128i
1797 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1798 _mm256_maskz_cvtsepi32_epi16 (__mmask8 __M
, __m256i __A
)
1800 return (__m128i
) __builtin_ia32_pmovsdw256_mask ((__v8si
) __A
,
1802 _mm_setzero_si128 (),
1806 extern __inline __m128i
1807 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1808 _mm_cvtusepi32_epi16 (__m128i __A
)
1810 return (__m128i
) __builtin_ia32_pmovusdw128_mask ((__v4si
) __A
,
1811 (__v8hi
)_mm_undefined_si128(),
1815 extern __inline
void
1816 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1817 _mm_mask_cvtusepi32_storeu_epi16 (void * __P
, __mmask8 __M
, __m128i __A
)
1819 __builtin_ia32_pmovusdw128mem_mask ((__v8hi
*) __P
, (__v4si
) __A
, __M
);
1822 extern __inline __m128i
1823 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1824 _mm_mask_cvtusepi32_epi16 (__m128i __O
, __mmask8 __M
, __m128i __A
)
1826 return (__m128i
) __builtin_ia32_pmovusdw128_mask ((__v4si
) __A
,
1830 extern __inline __m128i
1831 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1832 _mm_maskz_cvtusepi32_epi16 (__mmask8 __M
, __m128i __A
)
1834 return (__m128i
) __builtin_ia32_pmovusdw128_mask ((__v4si
) __A
,
1836 _mm_setzero_si128 (),
1840 extern __inline __m128i
1841 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1842 _mm256_cvtusepi32_epi16 (__m256i __A
)
1844 return (__m128i
) __builtin_ia32_pmovusdw256_mask ((__v8si
) __A
,
1845 (__v8hi
)_mm_undefined_si128(),
1849 extern __inline
void
1850 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1851 _mm256_mask_cvtusepi32_storeu_epi16 (void * __P
, __mmask8 __M
, __m256i __A
)
1853 __builtin_ia32_pmovusdw256mem_mask ((__v8hi
*) __P
, (__v8si
) __A
, __M
);
1856 extern __inline __m128i
1857 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1858 _mm256_mask_cvtusepi32_epi16 (__m128i __O
, __mmask8 __M
, __m256i __A
)
1860 return (__m128i
) __builtin_ia32_pmovusdw256_mask ((__v8si
) __A
,
1864 extern __inline __m128i
1865 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1866 _mm256_maskz_cvtusepi32_epi16 (__mmask8 __M
, __m256i __A
)
1868 return (__m128i
) __builtin_ia32_pmovusdw256_mask ((__v8si
) __A
,
1870 _mm_setzero_si128 (),
1874 extern __inline __m128i
1875 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1876 _mm_cvtepi64_epi8 (__m128i __A
)
1878 return (__m128i
) __builtin_ia32_pmovqb128_mask ((__v2di
) __A
,
1879 (__v16qi
)_mm_undefined_si128(),
1883 extern __inline
void
1884 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1885 _mm_mask_cvtepi64_storeu_epi8 (void * __P
, __mmask8 __M
, __m128i __A
)
1887 __builtin_ia32_pmovqb128mem_mask ((__v16qi
*) __P
, (__v2di
) __A
, __M
);
1890 extern __inline __m128i
1891 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1892 _mm_mask_cvtepi64_epi8 (__m128i __O
, __mmask8 __M
, __m128i __A
)
1894 return (__m128i
) __builtin_ia32_pmovqb128_mask ((__v2di
) __A
,
1895 (__v16qi
) __O
, __M
);
1898 extern __inline __m128i
1899 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1900 _mm_maskz_cvtepi64_epi8 (__mmask8 __M
, __m128i __A
)
1902 return (__m128i
) __builtin_ia32_pmovqb128_mask ((__v2di
) __A
,
1904 _mm_setzero_si128 (),
1908 extern __inline __m128i
1909 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1910 _mm256_cvtepi64_epi8 (__m256i __A
)
1912 return (__m128i
) __builtin_ia32_pmovqb256_mask ((__v4di
) __A
,
1913 (__v16qi
)_mm_undefined_si128(),
1917 extern __inline
void
1918 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1919 _mm256_mask_cvtepi64_storeu_epi8 (void * __P
, __mmask8 __M
, __m256i __A
)
1921 __builtin_ia32_pmovqb256mem_mask ((__v16qi
*) __P
, (__v4di
) __A
, __M
);
1924 extern __inline __m128i
1925 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1926 _mm256_mask_cvtepi64_epi8 (__m128i __O
, __mmask8 __M
, __m256i __A
)
1928 return (__m128i
) __builtin_ia32_pmovqb256_mask ((__v4di
) __A
,
1929 (__v16qi
) __O
, __M
);
1932 extern __inline __m128i
1933 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1934 _mm256_maskz_cvtepi64_epi8 (__mmask8 __M
, __m256i __A
)
1936 return (__m128i
) __builtin_ia32_pmovqb256_mask ((__v4di
) __A
,
1938 _mm_setzero_si128 (),
1942 extern __inline __m128i
1943 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1944 _mm_cvtsepi64_epi8 (__m128i __A
)
1946 return (__m128i
) __builtin_ia32_pmovsqb128_mask ((__v2di
) __A
,
1947 (__v16qi
)_mm_undefined_si128(),
1951 extern __inline
void
1952 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1953 _mm_mask_cvtsepi64_storeu_epi8 (void * __P
, __mmask8 __M
, __m128i __A
)
1955 __builtin_ia32_pmovsqb128mem_mask ((__v16qi
*) __P
, (__v2di
) __A
, __M
);
1958 extern __inline __m128i
1959 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1960 _mm_mask_cvtsepi64_epi8 (__m128i __O
, __mmask8 __M
, __m128i __A
)
1962 return (__m128i
) __builtin_ia32_pmovsqb128_mask ((__v2di
) __A
,
1963 (__v16qi
) __O
, __M
);
1966 extern __inline __m128i
1967 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1968 _mm_maskz_cvtsepi64_epi8 (__mmask8 __M
, __m128i __A
)
1970 return (__m128i
) __builtin_ia32_pmovsqb128_mask ((__v2di
) __A
,
1972 _mm_setzero_si128 (),
1976 extern __inline __m128i
1977 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1978 _mm256_cvtsepi64_epi8 (__m256i __A
)
1980 return (__m128i
) __builtin_ia32_pmovsqb256_mask ((__v4di
) __A
,
1981 (__v16qi
)_mm_undefined_si128(),
1985 extern __inline
void
1986 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1987 _mm256_mask_cvtsepi64_storeu_epi8 (void * __P
, __mmask8 __M
, __m256i __A
)
1989 __builtin_ia32_pmovsqb256mem_mask ((__v16qi
*) __P
, (__v4di
) __A
, __M
);
1992 extern __inline __m128i
1993 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
1994 _mm256_mask_cvtsepi64_epi8 (__m128i __O
, __mmask8 __M
, __m256i __A
)
1996 return (__m128i
) __builtin_ia32_pmovsqb256_mask ((__v4di
) __A
,
1997 (__v16qi
) __O
, __M
);
2000 extern __inline __m128i
2001 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2002 _mm256_maskz_cvtsepi64_epi8 (__mmask8 __M
, __m256i __A
)
2004 return (__m128i
) __builtin_ia32_pmovsqb256_mask ((__v4di
) __A
,
2006 _mm_setzero_si128 (),
2010 extern __inline __m128i
2011 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2012 _mm_cvtusepi64_epi8 (__m128i __A
)
2014 return (__m128i
) __builtin_ia32_pmovusqb128_mask ((__v2di
) __A
,
2015 (__v16qi
)_mm_undefined_si128(),
2019 extern __inline
void
2020 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2021 _mm_mask_cvtusepi64_storeu_epi8 (void * __P
, __mmask8 __M
, __m128i __A
)
2023 __builtin_ia32_pmovusqb128mem_mask ((__v16qi
*) __P
, (__v2di
) __A
, __M
);
2026 extern __inline __m128i
2027 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2028 _mm_mask_cvtusepi64_epi8 (__m128i __O
, __mmask8 __M
, __m128i __A
)
2030 return (__m128i
) __builtin_ia32_pmovusqb128_mask ((__v2di
) __A
,
2035 extern __inline __m128i
2036 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2037 _mm_maskz_cvtusepi64_epi8 (__mmask8 __M
, __m128i __A
)
2039 return (__m128i
) __builtin_ia32_pmovusqb128_mask ((__v2di
) __A
,
2041 _mm_setzero_si128 (),
2045 extern __inline __m128i
2046 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2047 _mm256_cvtusepi64_epi8 (__m256i __A
)
2049 return (__m128i
) __builtin_ia32_pmovusqb256_mask ((__v4di
) __A
,
2050 (__v16qi
)_mm_undefined_si128(),
2054 extern __inline
void
2055 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2056 _mm256_mask_cvtusepi64_storeu_epi8 (void * __P
, __mmask8 __M
, __m256i __A
)
2058 __builtin_ia32_pmovusqb256mem_mask ((__v16qi
*) __P
, (__v4di
) __A
, __M
);
2061 extern __inline __m128i
2062 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2063 _mm256_mask_cvtusepi64_epi8 (__m128i __O
, __mmask8 __M
, __m256i __A
)
2065 return (__m128i
) __builtin_ia32_pmovusqb256_mask ((__v4di
) __A
,
2070 extern __inline __m128i
2071 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2072 _mm256_maskz_cvtusepi64_epi8 (__mmask8 __M
, __m256i __A
)
2074 return (__m128i
) __builtin_ia32_pmovusqb256_mask ((__v4di
) __A
,
2076 _mm_setzero_si128 (),
2080 extern __inline __m128i
2081 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2082 _mm_cvtepi64_epi16 (__m128i __A
)
2084 return (__m128i
) __builtin_ia32_pmovqw128_mask ((__v2di
) __A
,
2085 (__v8hi
)_mm_undefined_si128(),
2089 extern __inline
void
2090 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2091 _mm_mask_cvtepi64_storeu_epi16 (void * __P
, __mmask8 __M
, __m128i __A
)
2093 __builtin_ia32_pmovqw128mem_mask ((__v8hi
*) __P
, (__v2di
) __A
, __M
);
2096 extern __inline __m128i
2097 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2098 _mm_mask_cvtepi64_epi16 (__m128i __O
, __mmask8 __M
, __m128i __A
)
2100 return (__m128i
) __builtin_ia32_pmovqw128_mask ((__v2di
) __A
,
2105 extern __inline __m128i
2106 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2107 _mm_maskz_cvtepi64_epi16 (__mmask8 __M
, __m128i __A
)
2109 return (__m128i
) __builtin_ia32_pmovqw128_mask ((__v2di
) __A
,
2111 _mm_setzero_si128 (),
2115 extern __inline __m128i
2116 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2117 _mm256_cvtepi64_epi16 (__m256i __A
)
2119 return (__m128i
) __builtin_ia32_pmovqw256_mask ((__v4di
) __A
,
2120 (__v8hi
)_mm_undefined_si128(),
2124 extern __inline
void
2125 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2126 _mm256_mask_cvtepi64_storeu_epi16 (void * __P
, __mmask8 __M
, __m256i __A
)
2128 __builtin_ia32_pmovqw256mem_mask ((__v8hi
*) __P
, (__v4di
) __A
, __M
);
2131 extern __inline __m128i
2132 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2133 _mm256_mask_cvtepi64_epi16 (__m128i __O
, __mmask8 __M
, __m256i __A
)
2135 return (__m128i
) __builtin_ia32_pmovqw256_mask ((__v4di
) __A
,
2139 extern __inline __m128i
2140 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2141 _mm256_maskz_cvtepi64_epi16 (__mmask8 __M
, __m256i __A
)
2143 return (__m128i
) __builtin_ia32_pmovqw256_mask ((__v4di
) __A
,
2145 _mm_setzero_si128 (),
2149 extern __inline __m128i
2150 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2151 _mm_cvtsepi64_epi16 (__m128i __A
)
2153 return (__m128i
) __builtin_ia32_pmovsqw128_mask ((__v2di
) __A
,
2154 (__v8hi
)_mm_undefined_si128(),
2158 extern __inline
void
2159 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2160 _mm_mask_cvtsepi64_storeu_epi16 (void * __P
, __mmask8 __M
, __m128i __A
)
2162 __builtin_ia32_pmovsqw128mem_mask ((__v8hi
*) __P
, (__v2di
) __A
, __M
);
2165 extern __inline __m128i
2166 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2167 _mm_mask_cvtsepi64_epi16 (__m128i __O
, __mmask8 __M
, __m128i __A
)
2169 return (__m128i
) __builtin_ia32_pmovsqw128_mask ((__v2di
) __A
,
2173 extern __inline __m128i
2174 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2175 _mm_maskz_cvtsepi64_epi16 (__mmask8 __M
, __m128i __A
)
2177 return (__m128i
) __builtin_ia32_pmovsqw128_mask ((__v2di
) __A
,
2179 _mm_setzero_si128 (),
2183 extern __inline __m128i
2184 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2185 _mm256_cvtsepi64_epi16 (__m256i __A
)
2187 return (__m128i
) __builtin_ia32_pmovsqw256_mask ((__v4di
) __A
,
2188 (__v8hi
)_mm_undefined_si128(),
2192 extern __inline
void
2193 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2194 _mm256_mask_cvtsepi64_storeu_epi16 (void * __P
, __mmask8 __M
, __m256i __A
)
2196 __builtin_ia32_pmovsqw256mem_mask ((__v8hi
*) __P
, (__v4di
) __A
, __M
);
2199 extern __inline __m128i
2200 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2201 _mm256_mask_cvtsepi64_epi16 (__m128i __O
, __mmask8 __M
, __m256i __A
)
2203 return (__m128i
) __builtin_ia32_pmovsqw256_mask ((__v4di
) __A
,
2207 extern __inline __m128i
2208 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2209 _mm256_maskz_cvtsepi64_epi16 (__mmask8 __M
, __m256i __A
)
2211 return (__m128i
) __builtin_ia32_pmovsqw256_mask ((__v4di
) __A
,
2213 _mm_setzero_si128 (),
2217 extern __inline __m128i
2218 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2219 _mm_cvtusepi64_epi16 (__m128i __A
)
2221 return (__m128i
) __builtin_ia32_pmovusqw128_mask ((__v2di
) __A
,
2222 (__v8hi
)_mm_undefined_si128(),
2226 extern __inline
void
2227 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2228 _mm_mask_cvtusepi64_storeu_epi16 (void * __P
, __mmask8 __M
, __m128i __A
)
2230 __builtin_ia32_pmovusqw128mem_mask ((__v8hi
*) __P
, (__v2di
) __A
, __M
);
2233 extern __inline __m128i
2234 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2235 _mm_mask_cvtusepi64_epi16 (__m128i __O
, __mmask8 __M
, __m128i __A
)
2237 return (__m128i
) __builtin_ia32_pmovusqw128_mask ((__v2di
) __A
,
2241 extern __inline __m128i
2242 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2243 _mm_maskz_cvtusepi64_epi16 (__mmask8 __M
, __m128i __A
)
2245 return (__m128i
) __builtin_ia32_pmovusqw128_mask ((__v2di
) __A
,
2247 _mm_setzero_si128 (),
2251 extern __inline __m128i
2252 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2253 _mm256_cvtusepi64_epi16 (__m256i __A
)
2255 return (__m128i
) __builtin_ia32_pmovusqw256_mask ((__v4di
) __A
,
2256 (__v8hi
)_mm_undefined_si128(),
2260 extern __inline
void
2261 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2262 _mm256_mask_cvtusepi64_storeu_epi16 (void * __P
, __mmask8 __M
, __m256i __A
)
2264 __builtin_ia32_pmovusqw256mem_mask ((__v8hi
*) __P
, (__v4di
) __A
, __M
);
2267 extern __inline __m128i
2268 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2269 _mm256_mask_cvtusepi64_epi16 (__m128i __O
, __mmask8 __M
, __m256i __A
)
2271 return (__m128i
) __builtin_ia32_pmovusqw256_mask ((__v4di
) __A
,
2275 extern __inline __m128i
2276 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2277 _mm256_maskz_cvtusepi64_epi16 (__mmask8 __M
, __m256i __A
)
2279 return (__m128i
) __builtin_ia32_pmovusqw256_mask ((__v4di
) __A
,
2281 _mm_setzero_si128 (),
2285 extern __inline __m128i
2286 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2287 _mm_cvtepi64_epi32 (__m128i __A
)
2289 return (__m128i
) __builtin_ia32_pmovqd128_mask ((__v2di
) __A
,
2290 (__v4si
)_mm_undefined_si128(),
2294 extern __inline
void
2295 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2296 _mm_mask_cvtepi64_storeu_epi32 (void * __P
, __mmask8 __M
, __m128i __A
)
2298 __builtin_ia32_pmovqd128mem_mask ((__v4si
*) __P
, (__v2di
) __A
, __M
);
2301 extern __inline __m128i
2302 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2303 _mm_mask_cvtepi64_epi32 (__m128i __O
, __mmask8 __M
, __m128i __A
)
2305 return (__m128i
) __builtin_ia32_pmovqd128_mask ((__v2di
) __A
,
2309 extern __inline __m128i
2310 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2311 _mm_maskz_cvtepi64_epi32 (__mmask8 __M
, __m128i __A
)
2313 return (__m128i
) __builtin_ia32_pmovqd128_mask ((__v2di
) __A
,
2315 _mm_setzero_si128 (),
2319 extern __inline __m128i
2320 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2321 _mm256_cvtepi64_epi32 (__m256i __A
)
2323 return (__m128i
) __builtin_ia32_pmovqd256_mask ((__v4di
) __A
,
2324 (__v4si
)_mm_undefined_si128(),
2328 extern __inline
void
2329 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2330 _mm256_mask_cvtepi64_storeu_epi32 (void * __P
, __mmask8 __M
, __m256i __A
)
2332 __builtin_ia32_pmovqd256mem_mask ((__v4si
*) __P
, (__v4di
) __A
, __M
);
2335 extern __inline __m128i
2336 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2337 _mm256_mask_cvtepi64_epi32 (__m128i __O
, __mmask8 __M
, __m256i __A
)
2339 return (__m128i
) __builtin_ia32_pmovqd256_mask ((__v4di
) __A
,
/* _maskz_ form: passes __A (as __v4di) and _mm_setzero_si128 () to
   __builtin_ia32_pmovqd256_mask.  NOTE(review): truncated extract --
   presumably __M is the last argument; braces not shown.  */
2343 extern __inline __m128i
2344 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2345 _mm256_maskz_cvtepi64_epi32 (__mmask8 __M
, __m256i __A
)
2347 return (__m128i
) __builtin_ia32_pmovqd256_mask ((__v4di
) __A
,
2349 _mm_setzero_si128 (),
/* Unmasked form: passes __A (as __v2di) and an undefined __v4si vector to
   __builtin_ia32_pmovsqd128_mask.  NOTE(review): truncated extract -- the
   final argument and the braces are not shown.  */
2353 extern __inline __m128i
2354 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2355 _mm_cvtsepi64_epi32 (__m128i __A
)
2357 return (__m128i
) __builtin_ia32_pmovsqd128_mask ((__v2di
) __A
,
2358 (__v4si
)_mm_undefined_si128(),
/* Masked store form: hands __P (as __v4si *), __A (as __v2di) and __M to
   __builtin_ia32_pmovsqd128mem_mask; returns nothing.
   NOTE(review): the function braces are missing from this extract.  */
2362 extern __inline
void
2363 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2364 _mm_mask_cvtsepi64_storeu_epi32 (void * __P
, __mmask8 __M
, __m128i __A
)
2366 __builtin_ia32_pmovsqd128mem_mask ((__v4si
*) __P
, (__v2di
) __A
, __M
);
/* _mask_ form (extra parameters __O, __M): passes __A (as __v2di) to
   __builtin_ia32_pmovsqd128_mask.  NOTE(review): truncated extract --
   presumably __O and __M follow; braces not shown.  */
2369 extern __inline __m128i
2370 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2371 _mm_mask_cvtsepi64_epi32 (__m128i __O
, __mmask8 __M
, __m128i __A
)
2373 return (__m128i
) __builtin_ia32_pmovsqd128_mask ((__v2di
) __A
,
/* _maskz_ form: passes __A (as __v2di) and _mm_setzero_si128 () to
   __builtin_ia32_pmovsqd128_mask.  NOTE(review): truncated extract --
   presumably __M is the last argument; braces not shown.  */
2377 extern __inline __m128i
2378 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2379 _mm_maskz_cvtsepi64_epi32 (__mmask8 __M
, __m128i __A
)
2381 return (__m128i
) __builtin_ia32_pmovsqd128_mask ((__v2di
) __A
,
2383 _mm_setzero_si128 (),
/* Unmasked form: passes __A (as __v4di) and an undefined __v4si vector to
   __builtin_ia32_pmovsqd256_mask; the result type is __m128i.
   NOTE(review): truncated extract -- final argument and braces not shown.  */
2387 extern __inline __m128i
2388 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2389 _mm256_cvtsepi64_epi32 (__m256i __A
)
2391 return (__m128i
) __builtin_ia32_pmovsqd256_mask ((__v4di
) __A
,
2392 (__v4si
)_mm_undefined_si128(),
/* Masked store form: hands __P (as __v4si *), __A (as __v4di) and __M to
   __builtin_ia32_pmovsqd256mem_mask; returns nothing.
   NOTE(review): the function braces are missing from this extract.  */
2396 extern __inline
void
2397 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2398 _mm256_mask_cvtsepi64_storeu_epi32 (void * __P
, __mmask8 __M
, __m256i __A
)
2400 __builtin_ia32_pmovsqd256mem_mask ((__v4si
*) __P
, (__v4di
) __A
, __M
);
/* _mask_ form (extra parameters __O, __M): passes __A (as __v4di) to
   __builtin_ia32_pmovsqd256_mask.  NOTE(review): truncated extract --
   presumably __O and __M follow; braces not shown.  */
2403 extern __inline __m128i
2404 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2405 _mm256_mask_cvtsepi64_epi32 (__m128i __O
, __mmask8 __M
, __m256i __A
)
2407 return (__m128i
) __builtin_ia32_pmovsqd256_mask ((__v4di
) __A
,
/* _maskz_ form: passes __A (as __v4di) and _mm_setzero_si128 () to
   __builtin_ia32_pmovsqd256_mask.  NOTE(review): truncated extract --
   presumably __M is the last argument; braces not shown.  */
2412 extern __inline __m128i
2413 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2414 _mm256_maskz_cvtsepi64_epi32 (__mmask8 __M
, __m256i __A
)
2416 return (__m128i
) __builtin_ia32_pmovsqd256_mask ((__v4di
) __A
,
2418 _mm_setzero_si128 (),
/* Unmasked form: passes __A (as __v2di) and an undefined __v4si vector to
   __builtin_ia32_pmovusqd128_mask.  NOTE(review): truncated extract -- the
   final argument and the braces are not shown.  */
2422 extern __inline __m128i
2423 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2424 _mm_cvtusepi64_epi32 (__m128i __A
)
2426 return (__m128i
) __builtin_ia32_pmovusqd128_mask ((__v2di
) __A
,
2427 (__v4si
)_mm_undefined_si128(),
/* Masked store form: hands __P (as __v4si *), __A (as __v2di) and __M to
   __builtin_ia32_pmovusqd128mem_mask; returns nothing.
   NOTE(review): the function braces are missing from this extract.  */
2431 extern __inline
void
2432 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2433 _mm_mask_cvtusepi64_storeu_epi32 (void * __P
, __mmask8 __M
, __m128i __A
)
2435 __builtin_ia32_pmovusqd128mem_mask ((__v4si
*) __P
, (__v2di
) __A
, __M
);
/* _mask_ form (extra parameters __O, __M): passes __A (as __v2di) to
   __builtin_ia32_pmovusqd128_mask.  NOTE(review): truncated extract --
   presumably __O and __M follow; braces not shown.  */
2438 extern __inline __m128i
2439 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2440 _mm_mask_cvtusepi64_epi32 (__m128i __O
, __mmask8 __M
, __m128i __A
)
2442 return (__m128i
) __builtin_ia32_pmovusqd128_mask ((__v2di
) __A
,
/* _maskz_ form: passes __A (as __v2di) and _mm_setzero_si128 () to
   __builtin_ia32_pmovusqd128_mask.  NOTE(review): truncated extract --
   presumably __M is the last argument; braces not shown.  */
2446 extern __inline __m128i
2447 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2448 _mm_maskz_cvtusepi64_epi32 (__mmask8 __M
, __m128i __A
)
2450 return (__m128i
) __builtin_ia32_pmovusqd128_mask ((__v2di
) __A
,
2452 _mm_setzero_si128 (),
/* Unmasked form: passes __A (as __v4di) and an undefined __v4si vector to
   __builtin_ia32_pmovusqd256_mask; the result type is __m128i.
   NOTE(review): truncated extract -- final argument and braces not shown.  */
2456 extern __inline __m128i
2457 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2458 _mm256_cvtusepi64_epi32 (__m256i __A
)
2460 return (__m128i
) __builtin_ia32_pmovusqd256_mask ((__v4di
) __A
,
2461 (__v4si
)_mm_undefined_si128(),
/* Masked store form: hands __P (as __v4si *), __A (as __v4di) and __M to
   __builtin_ia32_pmovusqd256mem_mask; returns nothing.
   NOTE(review): the function braces are missing from this extract.  */
2465 extern __inline
void
2466 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2467 _mm256_mask_cvtusepi64_storeu_epi32 (void * __P
, __mmask8 __M
, __m256i __A
)
2469 __builtin_ia32_pmovusqd256mem_mask ((__v4si
*) __P
, (__v4di
) __A
, __M
);
/* _mask_ form (extra parameters __O, __M): passes __A (as __v4di) to
   __builtin_ia32_pmovusqd256_mask.  NOTE(review): truncated extract --
   presumably __O and __M follow; braces not shown.  */
2472 extern __inline __m128i
2473 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2474 _mm256_mask_cvtusepi64_epi32 (__m128i __O
, __mmask8 __M
, __m256i __A
)
2476 return (__m128i
) __builtin_ia32_pmovusqd256_mask ((__v4di
) __A
,
/* _maskz_ form: passes __A (as __v4di) and _mm_setzero_si128 () to
   __builtin_ia32_pmovusqd256_mask.  NOTE(review): truncated extract --
   presumably __M is the last argument; braces not shown.  */
2480 extern __inline __m128i
2481 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2482 _mm256_maskz_cvtusepi64_epi32 (__mmask8 __M
, __m256i __A
)
2484 return (__m128i
) __builtin_ia32_pmovusqd256_mask ((__v4di
) __A
,
2486 _mm_setzero_si128 (),
/* _mask_ form (extra parameters __O, __M): passes the 128-bit __A (as
   __v4sf) to __builtin_ia32_broadcastss256_mask and returns __m256.
   NOTE(review): truncated extract -- presumably __O and __M follow.  */
2490 extern __inline __m256
2491 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2492 _mm256_mask_broadcastss_ps (__m256 __O
, __mmask8 __M
, __m128 __A
)
2494 return (__m256
) __builtin_ia32_broadcastss256_mask ((__v4sf
) __A
,
/* _maskz_ form: passes __A (as __v4sf) and _mm256_setzero_ps () to
   __builtin_ia32_broadcastss256_mask.  NOTE(review): truncated extract --
   presumably __M is the last argument; braces not shown.  */
2499 extern __inline __m256
2500 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2501 _mm256_maskz_broadcastss_ps (__mmask8 __M
, __m128 __A
)
2503 return (__m256
) __builtin_ia32_broadcastss256_mask ((__v4sf
) __A
,
2505 _mm256_setzero_ps (),
/* _mask_ form (extra parameters __O, __M): passes __A (as __v4sf) to
   __builtin_ia32_broadcastss128_mask.  NOTE(review): truncated extract --
   presumably __O and __M follow; braces not shown.  */
2509 extern __inline __m128
2510 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2511 _mm_mask_broadcastss_ps (__m128 __O
, __mmask8 __M
, __m128 __A
)
2513 return (__m128
) __builtin_ia32_broadcastss128_mask ((__v4sf
) __A
,
/* _maskz_ form: passes __A (as __v4sf) to
   __builtin_ia32_broadcastss128_mask.  NOTE(review): truncated extract --
   everything after the first operand, and the braces, are not shown.  */
2518 extern __inline __m128
2519 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2520 _mm_maskz_broadcastss_ps (__mmask8 __M
, __m128 __A
)
2522 return (__m128
) __builtin_ia32_broadcastss128_mask ((__v4sf
) __A
,
/* _mask_ form (extra parameters __O, __M): passes the 128-bit __A (as
   __v2df) to __builtin_ia32_broadcastsd256_mask and returns __m256d.
   NOTE(review): truncated extract -- presumably __O and __M follow.  */
2528 extern __inline __m256d
2529 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2530 _mm256_mask_broadcastsd_pd (__m256d __O
, __mmask8 __M
, __m128d __A
)
2532 return (__m256d
) __builtin_ia32_broadcastsd256_mask ((__v2df
) __A
,
/* _maskz_ form: passes __A (as __v2df) and _mm256_setzero_pd () to
   __builtin_ia32_broadcastsd256_mask.  NOTE(review): truncated extract --
   presumably __M is the last argument; braces not shown.  */
2537 extern __inline __m256d
2538 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2539 _mm256_maskz_broadcastsd_pd (__mmask8 __M
, __m128d __A
)
2541 return (__m256d
) __builtin_ia32_broadcastsd256_mask ((__v2df
) __A
,
2543 _mm256_setzero_pd (),
/* _mask_ form (extra parameters __O, __M): passes the 128-bit __A (as
   __v4si) to __builtin_ia32_pbroadcastd256_mask and returns __m256i.
   NOTE(review): truncated extract -- presumably __O and __M follow.  */
2547 extern __inline __m256i
2548 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2549 _mm256_mask_broadcastd_epi32 (__m256i __O
, __mmask8 __M
, __m128i __A
)
2551 return (__m256i
) __builtin_ia32_pbroadcastd256_mask ((__v4si
) __A
,
/* _maskz_ form: passes __A (as __v4si) and _mm256_setzero_si256 () to
   __builtin_ia32_pbroadcastd256_mask.  NOTE(review): truncated extract --
   presumably __M is the last argument; braces not shown.  */
2556 extern __inline __m256i
2557 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2558 _mm256_maskz_broadcastd_epi32 (__mmask8 __M
, __m128i __A
)
2560 return (__m256i
) __builtin_ia32_pbroadcastd256_mask ((__v4si
) __A
,
2562 _mm256_setzero_si256 (),
/* _mask_ form: passes the scalar int __A and __O (as __v8si) to
   __builtin_ia32_pbroadcastd256_gpr_mask.  NOTE(review): truncated
   extract -- presumably __M is the last argument; braces not shown.  */
2566 extern __inline __m256i
2567 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2568 _mm256_mask_set1_epi32 (__m256i __O
, __mmask8 __M
, int __A
)
2570 return (__m256i
) __builtin_ia32_pbroadcastd256_gpr_mask (__A
, (__v8si
) __O
,
/* _maskz_ form: passes the scalar int __A and _mm256_setzero_si256 () to
   __builtin_ia32_pbroadcastd256_gpr_mask.  NOTE(review): truncated
   extract -- presumably __M is the last argument; braces not shown.  */
2574 extern __inline __m256i
2575 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2576 _mm256_maskz_set1_epi32 (__mmask8 __M
, int __A
)
2578 return (__m256i
) __builtin_ia32_pbroadcastd256_gpr_mask (__A
,
2580 _mm256_setzero_si256 (),
/* _mask_ form (extra parameters __O, __M): passes __A (as __v4si) to
   __builtin_ia32_pbroadcastd128_mask.  NOTE(review): truncated extract --
   presumably __O and __M follow; braces not shown.  */
2584 extern __inline __m128i
2585 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2586 _mm_mask_broadcastd_epi32 (__m128i __O
, __mmask8 __M
, __m128i __A
)
2588 return (__m128i
) __builtin_ia32_pbroadcastd128_mask ((__v4si
) __A
,
/* _maskz_ form: passes __A (as __v4si) and _mm_setzero_si128 () to
   __builtin_ia32_pbroadcastd128_mask.  NOTE(review): truncated extract --
   presumably __M is the last argument; braces not shown.  */
2593 extern __inline __m128i
2594 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2595 _mm_maskz_broadcastd_epi32 (__mmask8 __M
, __m128i __A
)
2597 return (__m128i
) __builtin_ia32_pbroadcastd128_mask ((__v4si
) __A
,
2599 _mm_setzero_si128 (),
/* _mask_ form: passes the scalar int __A and __O (as __v4si) to
   __builtin_ia32_pbroadcastd128_gpr_mask.  NOTE(review): truncated
   extract -- presumably __M is the last argument; braces not shown.  */
2603 extern __inline __m128i
2604 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2605 _mm_mask_set1_epi32 (__m128i __O
, __mmask8 __M
, int __A
)
2607 return (__m128i
) __builtin_ia32_pbroadcastd128_gpr_mask (__A
, (__v4si
) __O
,
/* _maskz_ form: passes the scalar int __A and _mm_setzero_si128 () to
   __builtin_ia32_pbroadcastd128_gpr_mask.  NOTE(review): truncated
   extract -- presumably __M is the last argument; braces not shown.  */
2611 extern __inline __m128i
2612 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2613 _mm_maskz_set1_epi32 (__mmask8 __M
, int __A
)
2615 return (__m128i
) __builtin_ia32_pbroadcastd128_gpr_mask (__A
,
2617 _mm_setzero_si128 (),
/* _mask_ form (extra parameters __O, __M): passes the 128-bit __A (as
   __v2di) to __builtin_ia32_pbroadcastq256_mask and returns __m256i.
   NOTE(review): truncated extract -- presumably __O and __M follow.  */
2621 extern __inline __m256i
2622 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2623 _mm256_mask_broadcastq_epi64 (__m256i __O
, __mmask8 __M
, __m128i __A
)
2625 return (__m256i
) __builtin_ia32_pbroadcastq256_mask ((__v2di
) __A
,
/* _maskz_ form: passes __A (as __v2di) and _mm256_setzero_si256 () to
   __builtin_ia32_pbroadcastq256_mask.  NOTE(review): truncated extract --
   presumably __M is the last argument; braces not shown.  */
2630 extern __inline __m256i
2631 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2632 _mm256_maskz_broadcastq_epi64 (__mmask8 __M
, __m128i __A
)
2634 return (__m256i
) __builtin_ia32_pbroadcastq256_mask ((__v2di
) __A
,
2636 _mm256_setzero_si256 (),
/* _mask_ form: passes the scalar long long __A and __O (as __v4di) to
   __builtin_ia32_pbroadcastq256_gpr_mask.  NOTE(review): truncated
   extract -- presumably __M is the last argument; braces not shown.  */
2640 extern __inline __m256i
2641 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2642 _mm256_mask_set1_epi64 (__m256i __O
, __mmask8 __M
, long long __A
)
2644 return (__m256i
) __builtin_ia32_pbroadcastq256_gpr_mask (__A
, (__v4di
) __O
,
/* _maskz_ form: passes the scalar long long __A and
   _mm256_setzero_si256 () to __builtin_ia32_pbroadcastq256_gpr_mask.
   NOTE(review): truncated extract -- presumably __M is the last argument.  */
2648 extern __inline __m256i
2649 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2650 _mm256_maskz_set1_epi64 (__mmask8 __M
, long long __A
)
2652 return (__m256i
) __builtin_ia32_pbroadcastq256_gpr_mask (__A
,
2654 _mm256_setzero_si256 (),
/* _mask_ form (extra parameters __O, __M): passes __A (as __v2di) to
   __builtin_ia32_pbroadcastq128_mask.  NOTE(review): truncated extract --
   presumably __O and __M follow; braces not shown.  */
2658 extern __inline __m128i
2659 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2660 _mm_mask_broadcastq_epi64 (__m128i __O
, __mmask8 __M
, __m128i __A
)
2662 return (__m128i
) __builtin_ia32_pbroadcastq128_mask ((__v2di
) __A
,
/* _maskz_ form: passes __A (as __v2di) and _mm_setzero_si128 () to
   __builtin_ia32_pbroadcastq128_mask.  NOTE(review): truncated extract --
   presumably __M is the last argument; braces not shown.  */
2667 extern __inline __m128i
2668 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2669 _mm_maskz_broadcastq_epi64 (__mmask8 __M
, __m128i __A
)
2671 return (__m128i
) __builtin_ia32_pbroadcastq128_mask ((__v2di
) __A
,
2673 _mm_setzero_si128 (),
/* _mask_ form: passes the scalar long long __A and __O (as __v2di) to
   __builtin_ia32_pbroadcastq128_gpr_mask.  NOTE(review): truncated
   extract -- presumably __M is the last argument; braces not shown.  */
2677 extern __inline __m128i
2678 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2679 _mm_mask_set1_epi64 (__m128i __O
, __mmask8 __M
, long long __A
)
2681 return (__m128i
) __builtin_ia32_pbroadcastq128_gpr_mask (__A
, (__v2di
) __O
,
/* _maskz_ form: passes the scalar long long __A and _mm_setzero_si128 ()
   to __builtin_ia32_pbroadcastq128_gpr_mask.  NOTE(review): truncated
   extract -- presumably __M is the last argument; braces not shown.  */
2685 extern __inline __m128i
2686 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2687 _mm_maskz_set1_epi64 (__mmask8 __M
, long long __A
)
2689 return (__m128i
) __builtin_ia32_pbroadcastq128_gpr_mask (__A
,
2691 _mm_setzero_si128 (),
/* Unmasked form: passes __A (as __v4sf) to
   __builtin_ia32_broadcastf32x4_256_mask; the second operand is
   _mm256_undefined_pd () cast to __v8sf (a _pd helper used for a float
   vector).  NOTE(review): truncated extract -- final argument not shown.  */
2695 extern __inline __m256
2696 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2697 _mm256_broadcast_f32x4 (__m128 __A
)
2699 return (__m256
) __builtin_ia32_broadcastf32x4_256_mask ((__v4sf
) __A
,
2700 (__v8sf
)_mm256_undefined_pd (),
/* _mask_ form (extra parameters __O, __M): passes __A (as __v4sf) to
   __builtin_ia32_broadcastf32x4_256_mask.  NOTE(review): truncated
   extract -- presumably __O and __M follow; braces not shown.  */
2704 extern __inline __m256
2705 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2706 _mm256_mask_broadcast_f32x4 (__m256 __O
, __mmask8 __M
, __m128 __A
)
2708 return (__m256
) __builtin_ia32_broadcastf32x4_256_mask ((__v4sf
) __A
,
/* _maskz_ form: passes __A (as __v4sf) and _mm256_setzero_ps () to
   __builtin_ia32_broadcastf32x4_256_mask.  NOTE(review): truncated
   extract -- presumably __M is the last argument; braces not shown.  */
2713 extern __inline __m256
2714 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2715 _mm256_maskz_broadcast_f32x4 (__mmask8 __M
, __m128 __A
)
2717 return (__m256
) __builtin_ia32_broadcastf32x4_256_mask ((__v4sf
) __A
,
2719 _mm256_setzero_ps (),
/* Unmasked form: calls __builtin_ia32_broadcasti32x4_256_mask with a
   __v4si-cast first operand and an undefined __v8si vector.
   NOTE(review): truncated extract -- the operand of the (__v4si) cast
   (presumably __A), the final argument and the braces are not shown.  */
2723 extern __inline __m256i
2724 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2725 _mm256_broadcast_i32x4 (__m128i __A
)
2727 return (__m256i
) __builtin_ia32_broadcasti32x4_256_mask ((__v4si
)
2729 (__v8si
)_mm256_undefined_si256 (),
/* _mask_ form (parameters __O, __M, __A): calls
   __builtin_ia32_broadcasti32x4_256_mask with a __v4si-cast first operand.
   NOTE(review): truncated extract -- the cast's operand and every later
   argument are not shown; presumably __A, then __O and __M.  */
2733 extern __inline __m256i
2734 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2735 _mm256_mask_broadcast_i32x4 (__m256i __O
, __mmask8 __M
, __m128i __A
)
2737 return (__m256i
) __builtin_ia32_broadcasti32x4_256_mask ((__v4si
)
/* _maskz_ form: calls __builtin_ia32_broadcasti32x4_256_mask with a
   __v4si-cast first operand and _mm256_setzero_si256 ().
   NOTE(review): truncated extract -- the cast's operand (presumably __A)
   and the final argument (presumably __M) are not shown.  */
2743 extern __inline __m256i
2744 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2745 _mm256_maskz_broadcast_i32x4 (__mmask8 __M
, __m128i __A
)
2747 return (__m256i
) __builtin_ia32_broadcasti32x4_256_mask ((__v4si
)
2750 _mm256_setzero_si256 (),
/* _mask_ form (extra parameters __W, __U): passes __A (as __v16qi) to
   __builtin_ia32_pmovsxbd256_mask and returns __m256i.
   NOTE(review): truncated extract -- presumably __W and __U follow.  */
2754 extern __inline __m256i
2755 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2756 _mm256_mask_cvtepi8_epi32 (__m256i __W
, __mmask8 __U
, __m128i __A
)
2758 return (__m256i
) __builtin_ia32_pmovsxbd256_mask ((__v16qi
) __A
,
/* _maskz_ form: passes __A (as __v16qi) and _mm256_setzero_si256 () to
   __builtin_ia32_pmovsxbd256_mask.  NOTE(review): truncated extract --
   presumably __U is the last argument; braces not shown.  */
2763 extern __inline __m256i
2764 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2765 _mm256_maskz_cvtepi8_epi32 (__mmask8 __U
, __m128i __A
)
2767 return (__m256i
) __builtin_ia32_pmovsxbd256_mask ((__v16qi
) __A
,
2769 _mm256_setzero_si256 (),
/* _mask_ form (extra parameters __W, __U): passes __A (as __v16qi) to
   __builtin_ia32_pmovsxbd128_mask.  NOTE(review): truncated extract --
   presumably __W and __U follow; braces not shown.  */
2773 extern __inline __m128i
2774 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2775 _mm_mask_cvtepi8_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
)
2777 return (__m128i
) __builtin_ia32_pmovsxbd128_mask ((__v16qi
) __A
,
/* _maskz_ form: passes __A (as __v16qi) and _mm_setzero_si128 () to
   __builtin_ia32_pmovsxbd128_mask.  NOTE(review): truncated extract --
   presumably __U is the last argument; braces not shown.  */
2782 extern __inline __m128i
2783 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2784 _mm_maskz_cvtepi8_epi32 (__mmask8 __U
, __m128i __A
)
2786 return (__m128i
) __builtin_ia32_pmovsxbd128_mask ((__v16qi
) __A
,
2788 _mm_setzero_si128 (),
/* _mask_ form (extra parameters __W, __U): passes __A (as __v16qi) to
   __builtin_ia32_pmovsxbq256_mask and returns __m256i.
   NOTE(review): truncated extract -- presumably __W and __U follow.  */
2792 extern __inline __m256i
2793 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2794 _mm256_mask_cvtepi8_epi64 (__m256i __W
, __mmask8 __U
, __m128i __A
)
2796 return (__m256i
) __builtin_ia32_pmovsxbq256_mask ((__v16qi
) __A
,
/* _maskz_ form: passes __A (as __v16qi) and _mm256_setzero_si256 () to
   __builtin_ia32_pmovsxbq256_mask.  NOTE(review): truncated extract --
   presumably __U is the last argument; braces not shown.  */
2801 extern __inline __m256i
2802 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2803 _mm256_maskz_cvtepi8_epi64 (__mmask8 __U
, __m128i __A
)
2805 return (__m256i
) __builtin_ia32_pmovsxbq256_mask ((__v16qi
) __A
,
2807 _mm256_setzero_si256 (),
/* _mask_ form (extra parameters __W, __U): passes __A (as __v16qi) to
   __builtin_ia32_pmovsxbq128_mask.  NOTE(review): truncated extract --
   presumably __W and __U follow; braces not shown.  */
2811 extern __inline __m128i
2812 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2813 _mm_mask_cvtepi8_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
)
2815 return (__m128i
) __builtin_ia32_pmovsxbq128_mask ((__v16qi
) __A
,
/* _maskz_ form: passes __A (as __v16qi) and _mm_setzero_si128 () to
   __builtin_ia32_pmovsxbq128_mask.  NOTE(review): truncated extract --
   presumably __U is the last argument; braces not shown.  */
2820 extern __inline __m128i
2821 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2822 _mm_maskz_cvtepi8_epi64 (__mmask8 __U
, __m128i __A
)
2824 return (__m128i
) __builtin_ia32_pmovsxbq128_mask ((__v16qi
) __A
,
2826 _mm_setzero_si128 (),
/* _mask_ form (extra parameters __W, __U): passes __A (as __v8hi) to
   __builtin_ia32_pmovsxwd256_mask and returns __m256i.
   NOTE(review): truncated extract -- presumably __W and __U follow.  */
2830 extern __inline __m256i
2831 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2832 _mm256_mask_cvtepi16_epi32 (__m256i __W
, __mmask8 __U
, __m128i __A
)
2834 return (__m256i
) __builtin_ia32_pmovsxwd256_mask ((__v8hi
) __A
,
/* _maskz_ form: passes __A (as __v8hi) and _mm256_setzero_si256 () to
   __builtin_ia32_pmovsxwd256_mask.  NOTE(review): truncated extract --
   presumably __U is the last argument; braces not shown.  */
2839 extern __inline __m256i
2840 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2841 _mm256_maskz_cvtepi16_epi32 (__mmask8 __U
, __m128i __A
)
2843 return (__m256i
) __builtin_ia32_pmovsxwd256_mask ((__v8hi
) __A
,
2845 _mm256_setzero_si256 (),
/* _mask_ form (extra parameters __W, __U): passes __A (as __v8hi) to
   __builtin_ia32_pmovsxwd128_mask.  NOTE(review): truncated extract --
   presumably __W and __U follow; braces not shown.  */
2849 extern __inline __m128i
2850 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2851 _mm_mask_cvtepi16_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
)
2853 return (__m128i
) __builtin_ia32_pmovsxwd128_mask ((__v8hi
) __A
,
/* _maskz_ form: passes __A (as __v8hi) and _mm_setzero_si128 () to
   __builtin_ia32_pmovsxwd128_mask.  NOTE(review): truncated extract --
   presumably __U is the last argument; braces not shown.  */
2858 extern __inline __m128i
2859 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2860 _mm_maskz_cvtepi16_epi32 (__mmask8 __U
, __m128i __A
)
2862 return (__m128i
) __builtin_ia32_pmovsxwd128_mask ((__v8hi
) __A
,
2864 _mm_setzero_si128 (),
/* _mask_ form (extra parameters __W, __U): passes __A (as __v8hi) to
   __builtin_ia32_pmovsxwq256_mask and returns __m256i.
   NOTE(review): truncated extract -- presumably __W and __U follow.  */
2868 extern __inline __m256i
2869 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2870 _mm256_mask_cvtepi16_epi64 (__m256i __W
, __mmask8 __U
, __m128i __A
)
2872 return (__m256i
) __builtin_ia32_pmovsxwq256_mask ((__v8hi
) __A
,
/* _maskz_ form: passes __A (as __v8hi) and _mm256_setzero_si256 () to
   __builtin_ia32_pmovsxwq256_mask.  NOTE(review): truncated extract --
   presumably __U is the last argument; braces not shown.  */
2877 extern __inline __m256i
2878 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2879 _mm256_maskz_cvtepi16_epi64 (__mmask8 __U
, __m128i __A
)
2881 return (__m256i
) __builtin_ia32_pmovsxwq256_mask ((__v8hi
) __A
,
2883 _mm256_setzero_si256 (),
/* _mask_ form (extra parameters __W, __U): passes __A (as __v8hi) to
   __builtin_ia32_pmovsxwq128_mask.  NOTE(review): truncated extract --
   presumably __W and __U follow; braces not shown.  */
2887 extern __inline __m128i
2888 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2889 _mm_mask_cvtepi16_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
)
2891 return (__m128i
) __builtin_ia32_pmovsxwq128_mask ((__v8hi
) __A
,
/* _maskz_ form: passes __A (as __v8hi) and _mm_setzero_si128 () to
   __builtin_ia32_pmovsxwq128_mask.  NOTE(review): truncated extract --
   presumably __U is the last argument; braces not shown.  */
2896 extern __inline __m128i
2897 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2898 _mm_maskz_cvtepi16_epi64 (__mmask8 __U
, __m128i __A
)
2900 return (__m128i
) __builtin_ia32_pmovsxwq128_mask ((__v8hi
) __A
,
2902 _mm_setzero_si128 (),
/* _mask_ form (extra parameters __W, __U): passes __X (as __v4si) to
   __builtin_ia32_pmovsxdq256_mask and returns __m256i.
   NOTE(review): truncated extract -- presumably __W and __U follow.  */
2906 extern __inline __m256i
2907 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2908 _mm256_mask_cvtepi32_epi64 (__m256i __W
, __mmask8 __U
, __m128i __X
)
2910 return (__m256i
) __builtin_ia32_pmovsxdq256_mask ((__v4si
) __X
,
/* _maskz_ form: passes __X (as __v4si) and _mm256_setzero_si256 () to
   __builtin_ia32_pmovsxdq256_mask.  NOTE(review): truncated extract --
   presumably __U is the last argument; braces not shown.  */
2915 extern __inline __m256i
2916 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2917 _mm256_maskz_cvtepi32_epi64 (__mmask8 __U
, __m128i __X
)
2919 return (__m256i
) __builtin_ia32_pmovsxdq256_mask ((__v4si
) __X
,
2921 _mm256_setzero_si256 (),
/* _mask_ form (extra parameters __W, __U): passes __X (as __v4si) to
   __builtin_ia32_pmovsxdq128_mask.  NOTE(review): truncated extract --
   presumably __W and __U follow; braces not shown.  */
2925 extern __inline __m128i
2926 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2927 _mm_mask_cvtepi32_epi64 (__m128i __W
, __mmask8 __U
, __m128i __X
)
2929 return (__m128i
) __builtin_ia32_pmovsxdq128_mask ((__v4si
) __X
,
/* _maskz_ form: passes __X (as __v4si) and _mm_setzero_si128 () to
   __builtin_ia32_pmovsxdq128_mask.  NOTE(review): truncated extract --
   presumably __U is the last argument; braces not shown.  */
2934 extern __inline __m128i
2935 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2936 _mm_maskz_cvtepi32_epi64 (__mmask8 __U
, __m128i __X
)
2938 return (__m128i
) __builtin_ia32_pmovsxdq128_mask ((__v4si
) __X
,
2940 _mm_setzero_si128 (),
/* _mask_ form (extra parameters __W, __U): passes __A (as __v16qi) to
   __builtin_ia32_pmovzxbd256_mask and returns __m256i.
   NOTE(review): truncated extract -- presumably __W and __U follow.  */
2944 extern __inline __m256i
2945 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2946 _mm256_mask_cvtepu8_epi32 (__m256i __W
, __mmask8 __U
, __m128i __A
)
2948 return (__m256i
) __builtin_ia32_pmovzxbd256_mask ((__v16qi
) __A
,
/* _maskz_ form: passes __A (as __v16qi) and _mm256_setzero_si256 () to
   __builtin_ia32_pmovzxbd256_mask.  NOTE(review): truncated extract --
   presumably __U is the last argument; braces not shown.  */
2953 extern __inline __m256i
2954 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2955 _mm256_maskz_cvtepu8_epi32 (__mmask8 __U
, __m128i __A
)
2957 return (__m256i
) __builtin_ia32_pmovzxbd256_mask ((__v16qi
) __A
,
2959 _mm256_setzero_si256 (),
/* _mask_ form (extra parameters __W, __U): passes __A (as __v16qi) to
   __builtin_ia32_pmovzxbd128_mask.  NOTE(review): truncated extract --
   presumably __W and __U follow; braces not shown.  */
2963 extern __inline __m128i
2964 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2965 _mm_mask_cvtepu8_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
)
2967 return (__m128i
) __builtin_ia32_pmovzxbd128_mask ((__v16qi
) __A
,
/* _maskz_ form: passes __A (as __v16qi) and _mm_setzero_si128 () to
   __builtin_ia32_pmovzxbd128_mask.  NOTE(review): truncated extract --
   presumably __U is the last argument; braces not shown.  */
2972 extern __inline __m128i
2973 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2974 _mm_maskz_cvtepu8_epi32 (__mmask8 __U
, __m128i __A
)
2976 return (__m128i
) __builtin_ia32_pmovzxbd128_mask ((__v16qi
) __A
,
2978 _mm_setzero_si128 (),
/* _mask_ form (extra parameters __W, __U): passes __A (as __v16qi) to
   __builtin_ia32_pmovzxbq256_mask and returns __m256i.
   NOTE(review): truncated extract -- presumably __W and __U follow.  */
2982 extern __inline __m256i
2983 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2984 _mm256_mask_cvtepu8_epi64 (__m256i __W
, __mmask8 __U
, __m128i __A
)
2986 return (__m256i
) __builtin_ia32_pmovzxbq256_mask ((__v16qi
) __A
,
/* _maskz_ form: passes __A (as __v16qi) and _mm256_setzero_si256 () to
   __builtin_ia32_pmovzxbq256_mask.  NOTE(review): truncated extract --
   presumably __U is the last argument; braces not shown.  */
2991 extern __inline __m256i
2992 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
2993 _mm256_maskz_cvtepu8_epi64 (__mmask8 __U
, __m128i __A
)
2995 return (__m256i
) __builtin_ia32_pmovzxbq256_mask ((__v16qi
) __A
,
2997 _mm256_setzero_si256 (),
/* _mask_ form (extra parameters __W, __U): passes __A (as __v16qi) to
   __builtin_ia32_pmovzxbq128_mask.  NOTE(review): truncated extract --
   presumably __W and __U follow; braces not shown.  */
3001 extern __inline __m128i
3002 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3003 _mm_mask_cvtepu8_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
)
3005 return (__m128i
) __builtin_ia32_pmovzxbq128_mask ((__v16qi
) __A
,
/* _maskz_ form: passes __A (as __v16qi) and _mm_setzero_si128 () to
   __builtin_ia32_pmovzxbq128_mask.  NOTE(review): truncated extract --
   presumably __U is the last argument; braces not shown.  */
3010 extern __inline __m128i
3011 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3012 _mm_maskz_cvtepu8_epi64 (__mmask8 __U
, __m128i __A
)
3014 return (__m128i
) __builtin_ia32_pmovzxbq128_mask ((__v16qi
) __A
,
3016 _mm_setzero_si128 (),
/* _mask_ form (extra parameters __W, __U): passes __A (as __v8hi) to
   __builtin_ia32_pmovzxwd256_mask and returns __m256i.
   NOTE(review): truncated extract -- presumably __W and __U follow.  */
3020 extern __inline __m256i
3021 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3022 _mm256_mask_cvtepu16_epi32 (__m256i __W
, __mmask8 __U
, __m128i __A
)
3024 return (__m256i
) __builtin_ia32_pmovzxwd256_mask ((__v8hi
) __A
,
/* _maskz_ form: passes __A (as __v8hi) and _mm256_setzero_si256 () to
   __builtin_ia32_pmovzxwd256_mask.  NOTE(review): truncated extract --
   presumably __U is the last argument; braces not shown.  */
3029 extern __inline __m256i
3030 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3031 _mm256_maskz_cvtepu16_epi32 (__mmask8 __U
, __m128i __A
)
3033 return (__m256i
) __builtin_ia32_pmovzxwd256_mask ((__v8hi
) __A
,
3035 _mm256_setzero_si256 (),
/* _mask_ form (extra parameters __W, __U): passes __A (as __v8hi) to
   __builtin_ia32_pmovzxwd128_mask.  NOTE(review): truncated extract --
   presumably __W and __U follow; braces not shown.  */
3039 extern __inline __m128i
3040 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3041 _mm_mask_cvtepu16_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
)
3043 return (__m128i
) __builtin_ia32_pmovzxwd128_mask ((__v8hi
) __A
,
/* _maskz_ form: passes __A (as __v8hi) and _mm_setzero_si128 () to
   __builtin_ia32_pmovzxwd128_mask.  NOTE(review): truncated extract --
   presumably __U is the last argument; braces not shown.  */
3048 extern __inline __m128i
3049 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3050 _mm_maskz_cvtepu16_epi32 (__mmask8 __U
, __m128i __A
)
3052 return (__m128i
) __builtin_ia32_pmovzxwd128_mask ((__v8hi
) __A
,
3054 _mm_setzero_si128 (),
/* _mask_ form (extra parameters __W, __U): passes __A (as __v8hi) to
   __builtin_ia32_pmovzxwq256_mask and returns __m256i.
   NOTE(review): truncated extract -- presumably __W and __U follow.  */
3058 extern __inline __m256i
3059 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3060 _mm256_mask_cvtepu16_epi64 (__m256i __W
, __mmask8 __U
, __m128i __A
)
3062 return (__m256i
) __builtin_ia32_pmovzxwq256_mask ((__v8hi
) __A
,
/* _maskz_ form: passes __A (as __v8hi) and _mm256_setzero_si256 () to
   __builtin_ia32_pmovzxwq256_mask.  NOTE(review): truncated extract --
   presumably __U is the last argument; braces not shown.  */
3067 extern __inline __m256i
3068 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3069 _mm256_maskz_cvtepu16_epi64 (__mmask8 __U
, __m128i __A
)
3071 return (__m256i
) __builtin_ia32_pmovzxwq256_mask ((__v8hi
) __A
,
3073 _mm256_setzero_si256 (),
/* _mask_ form (extra parameters __W, __U): passes __A (as __v8hi) to
   __builtin_ia32_pmovzxwq128_mask.  NOTE(review): truncated extract --
   presumably __W and __U follow; braces not shown.  */
3077 extern __inline __m128i
3078 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3079 _mm_mask_cvtepu16_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
)
3081 return (__m128i
) __builtin_ia32_pmovzxwq128_mask ((__v8hi
) __A
,
/* _maskz_ form: passes __A (as __v8hi) and _mm_setzero_si128 () to
   __builtin_ia32_pmovzxwq128_mask.  NOTE(review): truncated extract --
   presumably __U is the last argument; braces not shown.  */
3086 extern __inline __m128i
3087 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3088 _mm_maskz_cvtepu16_epi64 (__mmask8 __U
, __m128i __A
)
3090 return (__m128i
) __builtin_ia32_pmovzxwq128_mask ((__v8hi
) __A
,
3092 _mm_setzero_si128 (),
/* _mask_ form (extra parameters __W, __U): passes __X (as __v4si) to
   __builtin_ia32_pmovzxdq256_mask and returns __m256i.
   NOTE(review): truncated extract -- presumably __W and __U follow.  */
3096 extern __inline __m256i
3097 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3098 _mm256_mask_cvtepu32_epi64 (__m256i __W
, __mmask8 __U
, __m128i __X
)
3100 return (__m256i
) __builtin_ia32_pmovzxdq256_mask ((__v4si
) __X
,
/* _maskz_ form: passes __X (as __v4si) and _mm256_setzero_si256 () to
   __builtin_ia32_pmovzxdq256_mask.  NOTE(review): truncated extract --
   presumably __U is the last argument; braces not shown.  */
3105 extern __inline __m256i
3106 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3107 _mm256_maskz_cvtepu32_epi64 (__mmask8 __U
, __m128i __X
)
3109 return (__m256i
) __builtin_ia32_pmovzxdq256_mask ((__v4si
) __X
,
3111 _mm256_setzero_si256 (),
/* _mask_ form (extra parameters __W, __U): passes __X (as __v4si) to
   __builtin_ia32_pmovzxdq128_mask.  NOTE(review): truncated extract --
   presumably __W and __U follow; braces not shown.  */
3115 extern __inline __m128i
3116 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3117 _mm_mask_cvtepu32_epi64 (__m128i __W
, __mmask8 __U
, __m128i __X
)
3119 return (__m128i
) __builtin_ia32_pmovzxdq128_mask ((__v4si
) __X
,
/* _maskz_ form: passes __X (as __v4si) and _mm_setzero_si128 () to
   __builtin_ia32_pmovzxdq128_mask.  NOTE(review): truncated extract --
   presumably __U is the last argument; braces not shown.  */
3124 extern __inline __m128i
3125 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3126 _mm_maskz_cvtepu32_epi64 (__mmask8 __U
, __m128i __X
)
3128 return (__m128i
) __builtin_ia32_pmovzxdq128_mask ((__v4si
) __X
,
3130 _mm_setzero_si128 (),
/* Unmasked form: passes __A (as __v4df) and _mm256_setzero_pd () to
   __builtin_ia32_rcp14pd256_mask.  NOTE(review): truncated extract -- the
   final argument and the braces are not shown.  */
3134 extern __inline __m256d
3135 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3136 _mm256_rcp14_pd (__m256d __A
)
3138 return (__m256d
) __builtin_ia32_rcp14pd256_mask ((__v4df
) __A
,
3140 _mm256_setzero_pd (),
/* _mask_ form (extra parameters __W, __U): passes __A (as __v4df) to
   __builtin_ia32_rcp14pd256_mask.  NOTE(review): truncated extract --
   presumably __W and __U follow; braces not shown.  */
3144 extern __inline __m256d
3145 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3146 _mm256_mask_rcp14_pd (__m256d __W
, __mmask8 __U
, __m256d __A
)
3148 return (__m256d
) __builtin_ia32_rcp14pd256_mask ((__v4df
) __A
,
/* _maskz_ form: passes __A (as __v4df) and _mm256_setzero_pd () to
   __builtin_ia32_rcp14pd256_mask.  NOTE(review): truncated extract --
   presumably __U is the last argument; braces not shown.  */
3153 extern __inline __m256d
3154 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3155 _mm256_maskz_rcp14_pd (__mmask8 __U
, __m256d __A
)
3157 return (__m256d
) __builtin_ia32_rcp14pd256_mask ((__v4df
) __A
,
3159 _mm256_setzero_pd (),
/* Unmasked form: passes __A (as __v2df) to __builtin_ia32_rcp14pd128_mask.
   NOTE(review): truncated extract -- everything after the first operand,
   and the braces, are not shown.  */
3163 extern __inline __m128d
3164 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3165 _mm_rcp14_pd (__m128d __A
)
3167 return (__m128d
) __builtin_ia32_rcp14pd128_mask ((__v2df
) __A
,
/* _mask_ form (extra parameters __W, __U): passes __A (as __v2df) to
   __builtin_ia32_rcp14pd128_mask.  NOTE(review): truncated extract --
   presumably __W and __U follow; braces not shown.  */
3173 extern __inline __m128d
3174 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3175 _mm_mask_rcp14_pd (__m128d __W
, __mmask8 __U
, __m128d __A
)
3177 return (__m128d
) __builtin_ia32_rcp14pd128_mask ((__v2df
) __A
,
/* _maskz_ form: passes __A (as __v2df) to __builtin_ia32_rcp14pd128_mask.
   NOTE(review): truncated extract -- everything after the first operand,
   and the braces, are not shown.  */
3182 extern __inline __m128d
3183 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3184 _mm_maskz_rcp14_pd (__mmask8 __U
, __m128d __A
)
3186 return (__m128d
) __builtin_ia32_rcp14pd128_mask ((__v2df
) __A
,
/* Unmasked form: passes __A (as __v8sf) and _mm256_setzero_ps () to
   __builtin_ia32_rcp14ps256_mask.  NOTE(review): truncated extract -- the
   final argument and the braces are not shown.  */
3192 extern __inline __m256
3193 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3194 _mm256_rcp14_ps (__m256 __A
)
3196 return (__m256
) __builtin_ia32_rcp14ps256_mask ((__v8sf
) __A
,
3198 _mm256_setzero_ps (),
/* _mask_ form (extra parameters __W, __U): passes __A (as __v8sf) to
   __builtin_ia32_rcp14ps256_mask.  NOTE(review): truncated extract --
   presumably __W and __U follow; braces not shown.  */
3202 extern __inline __m256
3203 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3204 _mm256_mask_rcp14_ps (__m256 __W
, __mmask8 __U
, __m256 __A
)
3206 return (__m256
) __builtin_ia32_rcp14ps256_mask ((__v8sf
) __A
,
/* _maskz_ form: passes __A (as __v8sf) and _mm256_setzero_ps () to
   __builtin_ia32_rcp14ps256_mask.  NOTE(review): truncated extract --
   presumably __U is the last argument; braces not shown.  */
3211 extern __inline __m256
3212 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3213 _mm256_maskz_rcp14_ps (__mmask8 __U
, __m256 __A
)
3215 return (__m256
) __builtin_ia32_rcp14ps256_mask ((__v8sf
) __A
,
3217 _mm256_setzero_ps (),
/* Unmasked form: passes __A (as __v4sf) to __builtin_ia32_rcp14ps128_mask.
   NOTE(review): truncated extract -- everything after the first operand,
   and the braces, are not shown.  */
3221 extern __inline __m128
3222 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3223 _mm_rcp14_ps (__m128 __A
)
3225 return (__m128
) __builtin_ia32_rcp14ps128_mask ((__v4sf
) __A
,
/* _mask_ form (extra parameters __W, __U): passes __A (as __v4sf) to
   __builtin_ia32_rcp14ps128_mask.  NOTE(review): truncated extract --
   presumably __W and __U follow; braces not shown.  */
3231 extern __inline __m128
3232 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3233 _mm_mask_rcp14_ps (__m128 __W
, __mmask8 __U
, __m128 __A
)
3235 return (__m128
) __builtin_ia32_rcp14ps128_mask ((__v4sf
) __A
,
/* _maskz_ form: passes __A (as __v4sf) to __builtin_ia32_rcp14ps128_mask.
   NOTE(review): truncated extract -- everything after the first operand,
   and the braces, are not shown.  */
3240 extern __inline __m128
3241 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3242 _mm_maskz_rcp14_ps (__mmask8 __U
, __m128 __A
)
3244 return (__m128
) __builtin_ia32_rcp14ps128_mask ((__v4sf
) __A
,
/* Unmasked form: passes __A (as __v4df) and _mm256_setzero_pd () to
   __builtin_ia32_rsqrt14pd256_mask.  NOTE(review): truncated extract --
   the final argument and the braces are not shown.  */
3250 extern __inline __m256d
3251 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3252 _mm256_rsqrt14_pd (__m256d __A
)
3254 return (__m256d
) __builtin_ia32_rsqrt14pd256_mask ((__v4df
) __A
,
3256 _mm256_setzero_pd (),
/* _mask_ form (extra parameters __W, __U): passes __A (as __v4df) to
   __builtin_ia32_rsqrt14pd256_mask.  NOTE(review): truncated extract --
   presumably __W and __U follow; braces not shown.  */
3260 extern __inline __m256d
3261 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3262 _mm256_mask_rsqrt14_pd (__m256d __W
, __mmask8 __U
, __m256d __A
)
3264 return (__m256d
) __builtin_ia32_rsqrt14pd256_mask ((__v4df
) __A
,
/* _maskz_ form: passes __A (as __v4df) and _mm256_setzero_pd () to
   __builtin_ia32_rsqrt14pd256_mask.  NOTE(review): truncated extract --
   presumably __U is the last argument; braces not shown.  */
3269 extern __inline __m256d
3270 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3271 _mm256_maskz_rsqrt14_pd (__mmask8 __U
, __m256d __A
)
3273 return (__m256d
) __builtin_ia32_rsqrt14pd256_mask ((__v4df
) __A
,
3275 _mm256_setzero_pd (),
/* Unmasked form: passes __A (as __v2df) to
   __builtin_ia32_rsqrt14pd128_mask.  NOTE(review): truncated extract --
   everything after the first operand, and the braces, are not shown.  */
3279 extern __inline __m128d
3280 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3281 _mm_rsqrt14_pd (__m128d __A
)
3283 return (__m128d
) __builtin_ia32_rsqrt14pd128_mask ((__v2df
) __A
,
/* _mask_ form (extra parameters __W, __U): passes __A (as __v2df) to
   __builtin_ia32_rsqrt14pd128_mask.  NOTE(review): truncated extract --
   presumably __W and __U follow; braces not shown.  */
3289 extern __inline __m128d
3290 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3291 _mm_mask_rsqrt14_pd (__m128d __W
, __mmask8 __U
, __m128d __A
)
3293 return (__m128d
) __builtin_ia32_rsqrt14pd128_mask ((__v2df
) __A
,
/* _maskz_ form: passes __A (as __v2df) to
   __builtin_ia32_rsqrt14pd128_mask.  NOTE(review): truncated extract --
   everything after the first operand, and the braces, are not shown.  */
3298 extern __inline __m128d
3299 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3300 _mm_maskz_rsqrt14_pd (__mmask8 __U
, __m128d __A
)
3302 return (__m128d
) __builtin_ia32_rsqrt14pd128_mask ((__v2df
) __A
,
/* Unmasked form: passes __A (as __v8sf) and _mm256_setzero_ps () to
   __builtin_ia32_rsqrt14ps256_mask.  NOTE(review): truncated extract --
   the final argument and the braces are not shown.  */
3308 extern __inline __m256
3309 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3310 _mm256_rsqrt14_ps (__m256 __A
)
3312 return (__m256
) __builtin_ia32_rsqrt14ps256_mask ((__v8sf
) __A
,
3314 _mm256_setzero_ps (),
/* _mask_ form (extra parameters __W, __U): passes __A (as __v8sf) to
   __builtin_ia32_rsqrt14ps256_mask.  NOTE(review): truncated extract --
   presumably __W and __U follow; braces not shown.  */
3318 extern __inline __m256
3319 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3320 _mm256_mask_rsqrt14_ps (__m256 __W
, __mmask8 __U
, __m256 __A
)
3322 return (__m256
) __builtin_ia32_rsqrt14ps256_mask ((__v8sf
) __A
,
/* _maskz_ form: passes __A (as __v8sf) and _mm256_setzero_ps () to
   __builtin_ia32_rsqrt14ps256_mask.  NOTE(review): truncated extract --
   presumably __U is the last argument; braces not shown.  */
3327 extern __inline __m256
3328 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3329 _mm256_maskz_rsqrt14_ps (__mmask8 __U
, __m256 __A
)
3331 return (__m256
) __builtin_ia32_rsqrt14ps256_mask ((__v8sf
) __A
,
3333 _mm256_setzero_ps (),
/* Unmasked form: passes __A (as __v4sf) to
   __builtin_ia32_rsqrt14ps128_mask.  NOTE(review): truncated extract --
   everything after the first operand, and the braces, are not shown.  */
3337 extern __inline __m128
3338 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3339 _mm_rsqrt14_ps (__m128 __A
)
3341 return (__m128
) __builtin_ia32_rsqrt14ps128_mask ((__v4sf
) __A
,
/* _mask_ form (extra parameters __W, __U): passes __A (as __v4sf) to
   __builtin_ia32_rsqrt14ps128_mask.  NOTE(review): truncated extract --
   presumably __W and __U follow; braces not shown.  */
3347 extern __inline __m128
3348 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3349 _mm_mask_rsqrt14_ps (__m128 __W
, __mmask8 __U
, __m128 __A
)
3351 return (__m128
) __builtin_ia32_rsqrt14ps128_mask ((__v4sf
) __A
,
/* _maskz_ form: passes __A (as __v4sf) to
   __builtin_ia32_rsqrt14ps128_mask.  NOTE(review): truncated extract --
   everything after the first operand, and the braces, are not shown.  */
3356 extern __inline __m128
3357 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3358 _mm_maskz_rsqrt14_ps (__mmask8 __U
, __m128 __A
)
3360 return (__m128
) __builtin_ia32_rsqrt14ps128_mask ((__v4sf
) __A
,
/* _mask_ form (extra parameters __W, __U): passes __A (as __v4df) to
   __builtin_ia32_sqrtpd256_mask.  NOTE(review): truncated extract --
   presumably __W and __U follow; braces not shown.  */
3366 extern __inline __m256d
3367 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3368 _mm256_mask_sqrt_pd (__m256d __W
, __mmask8 __U
, __m256d __A
)
3370 return (__m256d
) __builtin_ia32_sqrtpd256_mask ((__v4df
) __A
,
/* _maskz_ form: passes __A (as __v4df) and _mm256_setzero_pd () to
   __builtin_ia32_sqrtpd256_mask.  NOTE(review): truncated extract --
   presumably __U is the last argument; braces not shown.  */
3375 extern __inline __m256d
3376 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3377 _mm256_maskz_sqrt_pd (__mmask8 __U
, __m256d __A
)
3379 return (__m256d
) __builtin_ia32_sqrtpd256_mask ((__v4df
) __A
,
3381 _mm256_setzero_pd (),
/* _mask_ form (extra parameters __W, __U): passes __A (as __v2df) to
   __builtin_ia32_sqrtpd128_mask.  NOTE(review): truncated extract --
   presumably __W and __U follow; braces not shown.  */
3385 extern __inline __m128d
3386 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3387 _mm_mask_sqrt_pd (__m128d __W
, __mmask8 __U
, __m128d __A
)
3389 return (__m128d
) __builtin_ia32_sqrtpd128_mask ((__v2df
) __A
,
/* _maskz_ form: passes __A (as __v2df) to __builtin_ia32_sqrtpd128_mask.
   NOTE(review): truncated extract -- everything after the first operand,
   and the braces, are not shown.  */
3394 extern __inline __m128d
3395 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3396 _mm_maskz_sqrt_pd (__mmask8 __U
, __m128d __A
)
3398 return (__m128d
) __builtin_ia32_sqrtpd128_mask ((__v2df
) __A
,
/* _mask_ form (extra parameters __W, __U): passes __A (as __v8sf) to
   __builtin_ia32_sqrtps256_mask.  NOTE(review): truncated extract --
   presumably __W and __U follow; braces not shown.  */
3404 extern __inline __m256
3405 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3406 _mm256_mask_sqrt_ps (__m256 __W
, __mmask8 __U
, __m256 __A
)
3408 return (__m256
) __builtin_ia32_sqrtps256_mask ((__v8sf
) __A
,
/* _maskz_ form: passes __A (as __v8sf) and _mm256_setzero_ps () to
   __builtin_ia32_sqrtps256_mask.  NOTE(review): truncated extract --
   presumably __U is the last argument; braces not shown.  */
3413 extern __inline __m256
3414 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3415 _mm256_maskz_sqrt_ps (__mmask8 __U
, __m256 __A
)
3417 return (__m256
) __builtin_ia32_sqrtps256_mask ((__v8sf
) __A
,
3419 _mm256_setzero_ps (),
/* _mask_ form (extra parameters __W, __U): passes __A (as __v4sf) to
   __builtin_ia32_sqrtps128_mask.  NOTE(review): truncated extract --
   presumably __W and __U follow; braces not shown.  */
3423 extern __inline __m128
3424 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3425 _mm_mask_sqrt_ps (__m128 __W
, __mmask8 __U
, __m128 __A
)
3427 return (__m128
) __builtin_ia32_sqrtps128_mask ((__v4sf
) __A
,
/* _maskz_ form: passes __A (as __v4sf) to __builtin_ia32_sqrtps128_mask.
   NOTE(review): truncated extract -- everything after the first operand,
   and the braces, are not shown.  */
3432 extern __inline __m128
3433 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3434 _mm_maskz_sqrt_ps (__mmask8 __U
, __m128 __A
)
3436 return (__m128
) __builtin_ia32_sqrtps128_mask ((__v4sf
) __A
,
/* _mask_ form: passes __A (as __v8si) as first operand of
   __builtin_ia32_paddd256_mask.  NOTE(review): truncated extract -- the
   parameter list is cut after __A (presumably a second source follows),
   as are the remaining call arguments and the braces.  */
3442 extern __inline __m256i
3443 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3444 _mm256_mask_add_epi32 (__m256i __W
, __mmask8 __U
, __m256i __A
,
3447 return (__m256i
) __builtin_ia32_paddd256_mask ((__v8si
) __A
,
/* _maskz_ form: passes __A (as __v8si) and _mm256_setzero_si256 () to
   __builtin_ia32_paddd256_mask.  NOTE(review): truncated extract -- the
   uses of __B and __U are not shown; presumably __B is the second operand
   and __U the last.  */
3453 extern __inline __m256i
3454 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3455 _mm256_maskz_add_epi32 (__mmask8 __U
, __m256i __A
, __m256i __B
)
3457 return (__m256i
) __builtin_ia32_paddd256_mask ((__v8si
) __A
,
3460 _mm256_setzero_si256 (),
/* _mask_ form: passes __A (as __v4di) as first operand of
   __builtin_ia32_paddq256_mask.  NOTE(review): truncated extract -- the
   parameter list is cut after __A (presumably a second source follows),
   as are the remaining call arguments and the braces.  */
3464 extern __inline __m256i
3465 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3466 _mm256_mask_add_epi64 (__m256i __W
, __mmask8 __U
, __m256i __A
,
3469 return (__m256i
) __builtin_ia32_paddq256_mask ((__v4di
) __A
,
/* _maskz_ form: passes __A (as __v4di) and _mm256_setzero_si256 () to
   __builtin_ia32_paddq256_mask.  NOTE(review): truncated extract -- the
   uses of __B and __U are not shown; presumably __B is the second operand
   and __U the last.  */
3475 extern __inline __m256i
3476 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3477 _mm256_maskz_add_epi64 (__mmask8 __U
, __m256i __A
, __m256i __B
)
3479 return (__m256i
) __builtin_ia32_paddq256_mask ((__v4di
) __A
,
3482 _mm256_setzero_si256 (),
/* _mask_ form: passes __A (as __v8si) as first operand of
   __builtin_ia32_psubd256_mask.  NOTE(review): truncated extract -- the
   parameter list is cut after __A (presumably a second source follows),
   as are the remaining call arguments and the braces.  */
3486 extern __inline __m256i
3487 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3488 _mm256_mask_sub_epi32 (__m256i __W
, __mmask8 __U
, __m256i __A
,
3491 return (__m256i
) __builtin_ia32_psubd256_mask ((__v8si
) __A
,
/* _maskz_ form: passes __A (as __v8si) and _mm256_setzero_si256 () to
   __builtin_ia32_psubd256_mask.  NOTE(review): truncated extract -- the
   uses of __B and __U are not shown; presumably __B is the second operand
   and __U the last.  */
3497 extern __inline __m256i
3498 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3499 _mm256_maskz_sub_epi32 (__mmask8 __U
, __m256i __A
, __m256i __B
)
3501 return (__m256i
) __builtin_ia32_psubd256_mask ((__v8si
) __A
,
3504 _mm256_setzero_si256 (),
/* _mask_ form: passes __A (as __v4di) as first operand of
   __builtin_ia32_psubq256_mask.  NOTE(review): truncated extract -- the
   parameter list is cut after __A (presumably a second source follows),
   as are the remaining call arguments and the braces.  */
3508 extern __inline __m256i
3509 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3510 _mm256_mask_sub_epi64 (__m256i __W
, __mmask8 __U
, __m256i __A
,
3513 return (__m256i
) __builtin_ia32_psubq256_mask ((__v4di
) __A
,
/* _maskz_ form: passes __A (as __v4di) and _mm256_setzero_si256 () to
   __builtin_ia32_psubq256_mask.  NOTE(review): truncated extract -- the
   uses of __B and __U are not shown; presumably __B is the second operand
   and __U the last.  */
3519 extern __inline __m256i
3520 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3521 _mm256_maskz_sub_epi64 (__mmask8 __U
, __m256i __A
, __m256i __B
)
3523 return (__m256i
) __builtin_ia32_psubq256_mask ((__v4di
) __A
,
3526 _mm256_setzero_si256 (),
/* _mask_ form: passes __A (as __v4si) as first operand of
   __builtin_ia32_paddd128_mask.  NOTE(review): truncated extract -- the
   parameter list is cut after __A (presumably a second source follows),
   as are the remaining call arguments and the braces.  */
3530 extern __inline __m128i
3531 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3532 _mm_mask_add_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
,
3535 return (__m128i
) __builtin_ia32_paddd128_mask ((__v4si
) __A
,
/* _maskz_ form: passes __A (as __v4si) and _mm_setzero_si128 () to
   __builtin_ia32_paddd128_mask.  NOTE(review): truncated extract -- the
   uses of __B and __U are not shown; presumably __B is the second operand
   and __U the last.  */
3541 extern __inline __m128i
3542 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3543 _mm_maskz_add_epi32 (__mmask8 __U
, __m128i __A
, __m128i __B
)
3545 return (__m128i
) __builtin_ia32_paddd128_mask ((__v4si
) __A
,
3548 _mm_setzero_si128 (),
3552 extern __inline __m128i
3553 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3554 _mm_mask_add_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
,
3557 return (__m128i
) __builtin_ia32_paddq128_mask ((__v2di
) __A
,
3563 extern __inline __m128i
3564 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3565 _mm_maskz_add_epi64 (__mmask8 __U
, __m128i __A
, __m128i __B
)
3567 return (__m128i
) __builtin_ia32_paddq128_mask ((__v2di
) __A
,
3570 _mm_setzero_si128 (),
3574 extern __inline __m128i
3575 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3576 _mm_mask_sub_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
,
3579 return (__m128i
) __builtin_ia32_psubd128_mask ((__v4si
) __A
,
3585 extern __inline __m128i
3586 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3587 _mm_maskz_sub_epi32 (__mmask8 __U
, __m128i __A
, __m128i __B
)
3589 return (__m128i
) __builtin_ia32_psubd128_mask ((__v4si
) __A
,
3592 _mm_setzero_si128 (),
3596 extern __inline __m128i
3597 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3598 _mm_mask_sub_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
,
3601 return (__m128i
) __builtin_ia32_psubq128_mask ((__v2di
) __A
,
3607 extern __inline __m128i
3608 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3609 _mm_maskz_sub_epi64 (__mmask8 __U
, __m128i __A
, __m128i __B
)
3611 return (__m128i
) __builtin_ia32_psubq128_mask ((__v2di
) __A
,
3614 _mm_setzero_si128 (),
3618 extern __inline __m256
3619 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3620 _mm256_getexp_ps (__m256 __A
)
3622 return (__m256
) __builtin_ia32_getexpps256_mask ((__v8sf
) __A
,
3624 _mm256_setzero_ps (),
3628 extern __inline __m256
3629 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3630 _mm256_mask_getexp_ps (__m256 __W
, __mmask8 __U
, __m256 __A
)
3632 return (__m256
) __builtin_ia32_getexpps256_mask ((__v8sf
) __A
,
3637 extern __inline __m256
3638 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3639 _mm256_maskz_getexp_ps (__mmask8 __U
, __m256 __A
)
3641 return (__m256
) __builtin_ia32_getexpps256_mask ((__v8sf
) __A
,
3643 _mm256_setzero_ps (),
3647 extern __inline __m256d
3648 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3649 _mm256_getexp_pd (__m256d __A
)
3651 return (__m256d
) __builtin_ia32_getexppd256_mask ((__v4df
) __A
,
3653 _mm256_setzero_pd (),
3657 extern __inline __m256d
3658 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3659 _mm256_mask_getexp_pd (__m256d __W
, __mmask8 __U
, __m256d __A
)
3661 return (__m256d
) __builtin_ia32_getexppd256_mask ((__v4df
) __A
,
3666 extern __inline __m256d
3667 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3668 _mm256_maskz_getexp_pd (__mmask8 __U
, __m256d __A
)
3670 return (__m256d
) __builtin_ia32_getexppd256_mask ((__v4df
) __A
,
3672 _mm256_setzero_pd (),
3676 extern __inline __m128
3677 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3678 _mm_getexp_ps (__m128 __A
)
3680 return (__m128
) __builtin_ia32_getexpps128_mask ((__v4sf
) __A
,
3686 extern __inline __m128
3687 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3688 _mm_mask_getexp_ps (__m128 __W
, __mmask8 __U
, __m128 __A
)
3690 return (__m128
) __builtin_ia32_getexpps128_mask ((__v4sf
) __A
,
3695 extern __inline __m128
3696 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3697 _mm_maskz_getexp_ps (__mmask8 __U
, __m128 __A
)
3699 return (__m128
) __builtin_ia32_getexpps128_mask ((__v4sf
) __A
,
3705 extern __inline __m128d
3706 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3707 _mm_getexp_pd (__m128d __A
)
3709 return (__m128d
) __builtin_ia32_getexppd128_mask ((__v2df
) __A
,
3715 extern __inline __m128d
3716 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3717 _mm_mask_getexp_pd (__m128d __W
, __mmask8 __U
, __m128d __A
)
3719 return (__m128d
) __builtin_ia32_getexppd128_mask ((__v2df
) __A
,
3724 extern __inline __m128d
3725 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3726 _mm_maskz_getexp_pd (__mmask8 __U
, __m128d __A
)
3728 return (__m128d
) __builtin_ia32_getexppd128_mask ((__v2df
) __A
,
3734 extern __inline __m256i
3735 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3736 _mm256_mask_srl_epi32 (__m256i __W
, __mmask8 __U
, __m256i __A
,
3739 return (__m256i
) __builtin_ia32_psrld256_mask ((__v8si
) __A
,
3745 extern __inline __m256i
3746 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3747 _mm256_maskz_srl_epi32 (__mmask8 __U
, __m256i __A
, __m128i __B
)
3749 return (__m256i
) __builtin_ia32_psrld256_mask ((__v8si
) __A
,
3752 _mm256_setzero_si256 (),
3756 extern __inline __m128i
3757 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3758 _mm_mask_srl_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
,
3761 return (__m128i
) __builtin_ia32_psrld128_mask ((__v4si
) __A
,
3767 extern __inline __m128i
3768 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3769 _mm_maskz_srl_epi32 (__mmask8 __U
, __m128i __A
, __m128i __B
)
3771 return (__m128i
) __builtin_ia32_psrld128_mask ((__v4si
) __A
,
3774 _mm_setzero_si128 (),
3778 extern __inline __m256i
3779 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3780 _mm256_mask_srl_epi64 (__m256i __W
, __mmask8 __U
, __m256i __A
,
3783 return (__m256i
) __builtin_ia32_psrlq256_mask ((__v4di
) __A
,
3789 extern __inline __m256i
3790 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3791 _mm256_maskz_srl_epi64 (__mmask8 __U
, __m256i __A
, __m128i __B
)
3793 return (__m256i
) __builtin_ia32_psrlq256_mask ((__v4di
) __A
,
3796 _mm256_setzero_si256 (),
3800 extern __inline __m128i
3801 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3802 _mm_mask_srl_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
,
3805 return (__m128i
) __builtin_ia32_psrlq128_mask ((__v2di
) __A
,
3811 extern __inline __m128i
3812 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3813 _mm_maskz_srl_epi64 (__mmask8 __U
, __m128i __A
, __m128i __B
)
3815 return (__m128i
) __builtin_ia32_psrlq128_mask ((__v2di
) __A
,
3822 extern __inline __m256i
3823 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3824 _mm256_mask_and_epi32 (__m256i __W
, __mmask8 __U
, __m256i __A
,
3827 return (__m256i
) __builtin_ia32_pandd256_mask ((__v8si
) __A
,
3833 extern __inline __m256i
3834 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3835 _mm256_maskz_and_epi32 (__mmask8 __U
, __m256i __A
, __m256i __B
)
3837 return (__m256i
) __builtin_ia32_pandd256_mask ((__v8si
) __A
,
3840 _mm256_setzero_si256 (),
3844 extern __inline __m256d
3845 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3846 _mm256_scalef_pd (__m256d __A
, __m256d __B
)
3848 return (__m256d
) __builtin_ia32_scalefpd256_mask ((__v4df
) __A
,
3851 _mm256_setzero_pd (),
3855 extern __inline __m256d
3856 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3857 _mm256_mask_scalef_pd (__m256d __W
, __mmask8 __U
, __m256d __A
,
3860 return (__m256d
) __builtin_ia32_scalefpd256_mask ((__v4df
) __A
,
3866 extern __inline __m256d
3867 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3868 _mm256_maskz_scalef_pd (__mmask8 __U
, __m256d __A
, __m256d __B
)
3870 return (__m256d
) __builtin_ia32_scalefpd256_mask ((__v4df
) __A
,
3873 _mm256_setzero_pd (),
3877 extern __inline __m256
3878 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3879 _mm256_scalef_ps (__m256 __A
, __m256 __B
)
3881 return (__m256
) __builtin_ia32_scalefps256_mask ((__v8sf
) __A
,
3884 _mm256_setzero_ps (),
3888 extern __inline __m256
3889 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3890 _mm256_mask_scalef_ps (__m256 __W
, __mmask8 __U
, __m256 __A
,
3893 return (__m256
) __builtin_ia32_scalefps256_mask ((__v8sf
) __A
,
3899 extern __inline __m256
3900 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3901 _mm256_maskz_scalef_ps (__mmask8 __U
, __m256 __A
, __m256 __B
)
3903 return (__m256
) __builtin_ia32_scalefps256_mask ((__v8sf
) __A
,
3906 _mm256_setzero_ps (),
3910 extern __inline __m128d
3911 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3912 _mm_scalef_pd (__m128d __A
, __m128d __B
)
3914 return (__m128d
) __builtin_ia32_scalefpd128_mask ((__v2df
) __A
,
3921 extern __inline __m128d
3922 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3923 _mm_mask_scalef_pd (__m128d __W
, __mmask8 __U
, __m128d __A
,
3926 return (__m128d
) __builtin_ia32_scalefpd128_mask ((__v2df
) __A
,
3932 extern __inline __m128d
3933 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3934 _mm_maskz_scalef_pd (__mmask8 __U
, __m128d __A
, __m128d __B
)
3936 return (__m128d
) __builtin_ia32_scalefpd128_mask ((__v2df
) __A
,
3943 extern __inline __m128
3944 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3945 _mm_scalef_ps (__m128 __A
, __m128 __B
)
3947 return (__m128
) __builtin_ia32_scalefps128_mask ((__v4sf
) __A
,
3954 extern __inline __m128
3955 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3956 _mm_mask_scalef_ps (__m128 __W
, __mmask8 __U
, __m128 __A
, __m128 __B
)
3958 return (__m128
) __builtin_ia32_scalefps128_mask ((__v4sf
) __A
,
3964 extern __inline __m128
3965 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3966 _mm_maskz_scalef_ps (__mmask8 __U
, __m128 __A
, __m128 __B
)
3968 return (__m128
) __builtin_ia32_scalefps128_mask ((__v4sf
) __A
,
3975 extern __inline __m256d
3976 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3977 _mm256_mask_fmadd_pd (__m256d __A
, __mmask8 __U
, __m256d __B
,
3980 return (__m256d
) __builtin_ia32_vfmaddpd256_mask ((__v4df
) __A
,
3986 extern __inline __m256d
3987 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3988 _mm256_mask3_fmadd_pd (__m256d __A
, __m256d __B
, __m256d __C
,
3991 return (__m256d
) __builtin_ia32_vfmaddpd256_mask3 ((__v4df
) __A
,
3997 extern __inline __m256d
3998 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
3999 _mm256_maskz_fmadd_pd (__mmask8 __U
, __m256d __A
, __m256d __B
,
4002 return (__m256d
) __builtin_ia32_vfmaddpd256_maskz ((__v4df
) __A
,
4008 extern __inline __m128d
4009 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4010 _mm_mask_fmadd_pd (__m128d __A
, __mmask8 __U
, __m128d __B
, __m128d __C
)
4012 return (__m128d
) __builtin_ia32_vfmaddpd128_mask ((__v2df
) __A
,
4018 extern __inline __m128d
4019 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4020 _mm_mask3_fmadd_pd (__m128d __A
, __m128d __B
, __m128d __C
,
4023 return (__m128d
) __builtin_ia32_vfmaddpd128_mask3 ((__v2df
) __A
,
4029 extern __inline __m128d
4030 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4031 _mm_maskz_fmadd_pd (__mmask8 __U
, __m128d __A
, __m128d __B
,
4034 return (__m128d
) __builtin_ia32_vfmaddpd128_maskz ((__v2df
) __A
,
4040 extern __inline __m256
4041 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4042 _mm256_mask_fmadd_ps (__m256 __A
, __mmask8 __U
, __m256 __B
, __m256 __C
)
4044 return (__m256
) __builtin_ia32_vfmaddps256_mask ((__v8sf
) __A
,
4050 extern __inline __m256
4051 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4052 _mm256_mask3_fmadd_ps (__m256 __A
, __m256 __B
, __m256 __C
,
4055 return (__m256
) __builtin_ia32_vfmaddps256_mask3 ((__v8sf
) __A
,
4061 extern __inline __m256
4062 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4063 _mm256_maskz_fmadd_ps (__mmask8 __U
, __m256 __A
, __m256 __B
,
4066 return (__m256
) __builtin_ia32_vfmaddps256_maskz ((__v8sf
) __A
,
4072 extern __inline __m128
4073 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4074 _mm_mask_fmadd_ps (__m128 __A
, __mmask8 __U
, __m128 __B
, __m128 __C
)
4076 return (__m128
) __builtin_ia32_vfmaddps128_mask ((__v4sf
) __A
,
4082 extern __inline __m128
4083 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4084 _mm_mask3_fmadd_ps (__m128 __A
, __m128 __B
, __m128 __C
, __mmask8 __U
)
4086 return (__m128
) __builtin_ia32_vfmaddps128_mask3 ((__v4sf
) __A
,
4092 extern __inline __m128
4093 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4094 _mm_maskz_fmadd_ps (__mmask8 __U
, __m128 __A
, __m128 __B
, __m128 __C
)
4096 return (__m128
) __builtin_ia32_vfmaddps128_maskz ((__v4sf
) __A
,
4102 extern __inline __m256d
4103 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4104 _mm256_mask_fmsub_pd (__m256d __A
, __mmask8 __U
, __m256d __B
,
4107 return (__m256d
) __builtin_ia32_vfmaddpd256_mask ((__v4df
) __A
,
4113 extern __inline __m256d
4114 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4115 _mm256_mask3_fmsub_pd (__m256d __A
, __m256d __B
, __m256d __C
,
4118 return (__m256d
) __builtin_ia32_vfmsubpd256_mask3 ((__v4df
) __A
,
4124 extern __inline __m256d
4125 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4126 _mm256_maskz_fmsub_pd (__mmask8 __U
, __m256d __A
, __m256d __B
,
4129 return (__m256d
) __builtin_ia32_vfmaddpd256_maskz ((__v4df
) __A
,
4135 extern __inline __m128d
4136 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4137 _mm_mask_fmsub_pd (__m128d __A
, __mmask8 __U
, __m128d __B
, __m128d __C
)
4139 return (__m128d
) __builtin_ia32_vfmaddpd128_mask ((__v2df
) __A
,
4145 extern __inline __m128d
4146 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4147 _mm_mask3_fmsub_pd (__m128d __A
, __m128d __B
, __m128d __C
,
4150 return (__m128d
) __builtin_ia32_vfmsubpd128_mask3 ((__v2df
) __A
,
4156 extern __inline __m128d
4157 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4158 _mm_maskz_fmsub_pd (__mmask8 __U
, __m128d __A
, __m128d __B
,
4161 return (__m128d
) __builtin_ia32_vfmaddpd128_maskz ((__v2df
) __A
,
4167 extern __inline __m256
4168 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4169 _mm256_mask_fmsub_ps (__m256 __A
, __mmask8 __U
, __m256 __B
, __m256 __C
)
4171 return (__m256
) __builtin_ia32_vfmaddps256_mask ((__v8sf
) __A
,
4177 extern __inline __m256
4178 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4179 _mm256_mask3_fmsub_ps (__m256 __A
, __m256 __B
, __m256 __C
,
4182 return (__m256
) __builtin_ia32_vfmsubps256_mask3 ((__v8sf
) __A
,
4188 extern __inline __m256
4189 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4190 _mm256_maskz_fmsub_ps (__mmask8 __U
, __m256 __A
, __m256 __B
,
4193 return (__m256
) __builtin_ia32_vfmaddps256_maskz ((__v8sf
) __A
,
4199 extern __inline __m128
4200 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4201 _mm_mask_fmsub_ps (__m128 __A
, __mmask8 __U
, __m128 __B
, __m128 __C
)
4203 return (__m128
) __builtin_ia32_vfmaddps128_mask ((__v4sf
) __A
,
4209 extern __inline __m128
4210 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4211 _mm_mask3_fmsub_ps (__m128 __A
, __m128 __B
, __m128 __C
, __mmask8 __U
)
4213 return (__m128
) __builtin_ia32_vfmsubps128_mask3 ((__v4sf
) __A
,
4219 extern __inline __m128
4220 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4221 _mm_maskz_fmsub_ps (__mmask8 __U
, __m128 __A
, __m128 __B
, __m128 __C
)
4223 return (__m128
) __builtin_ia32_vfmaddps128_maskz ((__v4sf
) __A
,
4229 extern __inline __m256d
4230 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4231 _mm256_mask_fmaddsub_pd (__m256d __A
, __mmask8 __U
, __m256d __B
,
4234 return (__m256d
) __builtin_ia32_vfmaddsubpd256_mask ((__v4df
) __A
,
4240 extern __inline __m256d
4241 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4242 _mm256_mask3_fmaddsub_pd (__m256d __A
, __m256d __B
, __m256d __C
,
4245 return (__m256d
) __builtin_ia32_vfmaddsubpd256_mask3 ((__v4df
) __A
,
4252 extern __inline __m256d
4253 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4254 _mm256_maskz_fmaddsub_pd (__mmask8 __U
, __m256d __A
, __m256d __B
,
4257 return (__m256d
) __builtin_ia32_vfmaddsubpd256_maskz ((__v4df
) __A
,
4264 extern __inline __m128d
4265 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4266 _mm_mask_fmaddsub_pd (__m128d __A
, __mmask8 __U
, __m128d __B
,
4269 return (__m128d
) __builtin_ia32_vfmaddsubpd128_mask ((__v2df
) __A
,
4275 extern __inline __m128d
4276 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4277 _mm_mask3_fmaddsub_pd (__m128d __A
, __m128d __B
, __m128d __C
,
4280 return (__m128d
) __builtin_ia32_vfmaddsubpd128_mask3 ((__v2df
) __A
,
4287 extern __inline __m128d
4288 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4289 _mm_maskz_fmaddsub_pd (__mmask8 __U
, __m128d __A
, __m128d __B
,
4292 return (__m128d
) __builtin_ia32_vfmaddsubpd128_maskz ((__v2df
) __A
,
4299 extern __inline __m256
4300 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4301 _mm256_mask_fmaddsub_ps (__m256 __A
, __mmask8 __U
, __m256 __B
,
4304 return (__m256
) __builtin_ia32_vfmaddsubps256_mask ((__v8sf
) __A
,
4310 extern __inline __m256
4311 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4312 _mm256_mask3_fmaddsub_ps (__m256 __A
, __m256 __B
, __m256 __C
,
4315 return (__m256
) __builtin_ia32_vfmaddsubps256_mask3 ((__v8sf
) __A
,
4321 extern __inline __m256
4322 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4323 _mm256_maskz_fmaddsub_ps (__mmask8 __U
, __m256 __A
, __m256 __B
,
4326 return (__m256
) __builtin_ia32_vfmaddsubps256_maskz ((__v8sf
) __A
,
4332 extern __inline __m128
4333 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4334 _mm_mask_fmaddsub_ps (__m128 __A
, __mmask8 __U
, __m128 __B
, __m128 __C
)
4336 return (__m128
) __builtin_ia32_vfmaddsubps128_mask ((__v4sf
) __A
,
4342 extern __inline __m128
4343 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4344 _mm_mask3_fmaddsub_ps (__m128 __A
, __m128 __B
, __m128 __C
,
4347 return (__m128
) __builtin_ia32_vfmaddsubps128_mask3 ((__v4sf
) __A
,
4353 extern __inline __m128
4354 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4355 _mm_maskz_fmaddsub_ps (__mmask8 __U
, __m128 __A
, __m128 __B
,
4358 return (__m128
) __builtin_ia32_vfmaddsubps128_maskz ((__v4sf
) __A
,
4364 extern __inline __m256d
4365 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4366 _mm256_mask_fmsubadd_pd (__m256d __A
, __mmask8 __U
, __m256d __B
,
4369 return (__m256d
) __builtin_ia32_vfmaddsubpd256_mask ((__v4df
) __A
,
4375 extern __inline __m256d
4376 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4377 _mm256_mask3_fmsubadd_pd (__m256d __A
, __m256d __B
, __m256d __C
,
4380 return (__m256d
) __builtin_ia32_vfmsubaddpd256_mask3 ((__v4df
) __A
,
4387 extern __inline __m256d
4388 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4389 _mm256_maskz_fmsubadd_pd (__mmask8 __U
, __m256d __A
, __m256d __B
,
4392 return (__m256d
) __builtin_ia32_vfmaddsubpd256_maskz ((__v4df
) __A
,
4399 extern __inline __m128d
4400 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4401 _mm_mask_fmsubadd_pd (__m128d __A
, __mmask8 __U
, __m128d __B
,
4404 return (__m128d
) __builtin_ia32_vfmaddsubpd128_mask ((__v2df
) __A
,
4410 extern __inline __m128d
4411 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4412 _mm_mask3_fmsubadd_pd (__m128d __A
, __m128d __B
, __m128d __C
,
4415 return (__m128d
) __builtin_ia32_vfmsubaddpd128_mask3 ((__v2df
) __A
,
4422 extern __inline __m128d
4423 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4424 _mm_maskz_fmsubadd_pd (__mmask8 __U
, __m128d __A
, __m128d __B
,
4427 return (__m128d
) __builtin_ia32_vfmaddsubpd128_maskz ((__v2df
) __A
,
4434 extern __inline __m256
4435 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4436 _mm256_mask_fmsubadd_ps (__m256 __A
, __mmask8 __U
, __m256 __B
,
4439 return (__m256
) __builtin_ia32_vfmaddsubps256_mask ((__v8sf
) __A
,
4445 extern __inline __m256
4446 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4447 _mm256_mask3_fmsubadd_ps (__m256 __A
, __m256 __B
, __m256 __C
,
4450 return (__m256
) __builtin_ia32_vfmsubaddps256_mask3 ((__v8sf
) __A
,
4456 extern __inline __m256
4457 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4458 _mm256_maskz_fmsubadd_ps (__mmask8 __U
, __m256 __A
, __m256 __B
,
4461 return (__m256
) __builtin_ia32_vfmaddsubps256_maskz ((__v8sf
) __A
,
4467 extern __inline __m128
4468 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4469 _mm_mask_fmsubadd_ps (__m128 __A
, __mmask8 __U
, __m128 __B
, __m128 __C
)
4471 return (__m128
) __builtin_ia32_vfmaddsubps128_mask ((__v4sf
) __A
,
4477 extern __inline __m128
4478 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4479 _mm_mask3_fmsubadd_ps (__m128 __A
, __m128 __B
, __m128 __C
,
4482 return (__m128
) __builtin_ia32_vfmsubaddps128_mask3 ((__v4sf
) __A
,
4488 extern __inline __m128
4489 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4490 _mm_maskz_fmsubadd_ps (__mmask8 __U
, __m128 __A
, __m128 __B
,
4493 return (__m128
) __builtin_ia32_vfmaddsubps128_maskz ((__v4sf
) __A
,
4499 extern __inline __m256d
4500 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4501 _mm256_mask_fnmadd_pd (__m256d __A
, __mmask8 __U
, __m256d __B
,
4504 return (__m256d
) __builtin_ia32_vfnmaddpd256_mask ((__v4df
) __A
,
4510 extern __inline __m256d
4511 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4512 _mm256_mask3_fnmadd_pd (__m256d __A
, __m256d __B
, __m256d __C
,
4515 return (__m256d
) __builtin_ia32_vfmaddpd256_mask3 (-(__v4df
) __A
,
4521 extern __inline __m256d
4522 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4523 _mm256_maskz_fnmadd_pd (__mmask8 __U
, __m256d __A
, __m256d __B
,
4526 return (__m256d
) __builtin_ia32_vfmaddpd256_maskz (-(__v4df
) __A
,
4532 extern __inline __m128d
4533 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4534 _mm_mask_fnmadd_pd (__m128d __A
, __mmask8 __U
, __m128d __B
,
4537 return (__m128d
) __builtin_ia32_vfnmaddpd128_mask ((__v2df
) __A
,
4543 extern __inline __m128d
4544 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4545 _mm_mask3_fnmadd_pd (__m128d __A
, __m128d __B
, __m128d __C
,
4548 return (__m128d
) __builtin_ia32_vfmaddpd128_mask3 (-(__v2df
) __A
,
4554 extern __inline __m128d
4555 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4556 _mm_maskz_fnmadd_pd (__mmask8 __U
, __m128d __A
, __m128d __B
,
4559 return (__m128d
) __builtin_ia32_vfmaddpd128_maskz (-(__v2df
) __A
,
4565 extern __inline __m256
4566 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4567 _mm256_mask_fnmadd_ps (__m256 __A
, __mmask8 __U
, __m256 __B
,
4570 return (__m256
) __builtin_ia32_vfnmaddps256_mask ((__v8sf
) __A
,
4576 extern __inline __m256
4577 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4578 _mm256_mask3_fnmadd_ps (__m256 __A
, __m256 __B
, __m256 __C
,
4581 return (__m256
) __builtin_ia32_vfmaddps256_mask3 (-(__v8sf
) __A
,
4587 extern __inline __m256
4588 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4589 _mm256_maskz_fnmadd_ps (__mmask8 __U
, __m256 __A
, __m256 __B
,
4592 return (__m256
) __builtin_ia32_vfmaddps256_maskz (-(__v8sf
) __A
,
4598 extern __inline __m128
4599 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4600 _mm_mask_fnmadd_ps (__m128 __A
, __mmask8 __U
, __m128 __B
, __m128 __C
)
4602 return (__m128
) __builtin_ia32_vfnmaddps128_mask ((__v4sf
) __A
,
4608 extern __inline __m128
4609 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4610 _mm_mask3_fnmadd_ps (__m128 __A
, __m128 __B
, __m128 __C
, __mmask8 __U
)
4612 return (__m128
) __builtin_ia32_vfmaddps128_mask3 (-(__v4sf
) __A
,
4618 extern __inline __m128
4619 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4620 _mm_maskz_fnmadd_ps (__mmask8 __U
, __m128 __A
, __m128 __B
, __m128 __C
)
4622 return (__m128
) __builtin_ia32_vfmaddps128_maskz (-(__v4sf
) __A
,
4628 extern __inline __m256d
4629 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4630 _mm256_mask_fnmsub_pd (__m256d __A
, __mmask8 __U
, __m256d __B
,
4633 return (__m256d
) __builtin_ia32_vfnmsubpd256_mask ((__v4df
) __A
,
4639 extern __inline __m256d
4640 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4641 _mm256_mask3_fnmsub_pd (__m256d __A
, __m256d __B
, __m256d __C
,
4644 return (__m256d
) __builtin_ia32_vfnmsubpd256_mask3 ((__v4df
) __A
,
4650 extern __inline __m256d
4651 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4652 _mm256_maskz_fnmsub_pd (__mmask8 __U
, __m256d __A
, __m256d __B
,
4655 return (__m256d
) __builtin_ia32_vfmaddpd256_maskz (-(__v4df
) __A
,
4661 extern __inline __m128d
4662 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4663 _mm_mask_fnmsub_pd (__m128d __A
, __mmask8 __U
, __m128d __B
,
4666 return (__m128d
) __builtin_ia32_vfnmsubpd128_mask ((__v2df
) __A
,
4672 extern __inline __m128d
4673 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4674 _mm_mask3_fnmsub_pd (__m128d __A
, __m128d __B
, __m128d __C
,
4677 return (__m128d
) __builtin_ia32_vfnmsubpd128_mask3 ((__v2df
) __A
,
4683 extern __inline __m128d
4684 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4685 _mm_maskz_fnmsub_pd (__mmask8 __U
, __m128d __A
, __m128d __B
,
4688 return (__m128d
) __builtin_ia32_vfmaddpd128_maskz (-(__v2df
) __A
,
4694 extern __inline __m256
4695 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4696 _mm256_mask_fnmsub_ps (__m256 __A
, __mmask8 __U
, __m256 __B
,
4699 return (__m256
) __builtin_ia32_vfnmsubps256_mask ((__v8sf
) __A
,
4705 extern __inline __m256
4706 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4707 _mm256_mask3_fnmsub_ps (__m256 __A
, __m256 __B
, __m256 __C
,
4710 return (__m256
) __builtin_ia32_vfnmsubps256_mask3 ((__v8sf
) __A
,
4716 extern __inline __m256
4717 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4718 _mm256_maskz_fnmsub_ps (__mmask8 __U
, __m256 __A
, __m256 __B
,
4721 return (__m256
) __builtin_ia32_vfmaddps256_maskz (-(__v8sf
) __A
,
4727 extern __inline __m128
4728 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4729 _mm_mask_fnmsub_ps (__m128 __A
, __mmask8 __U
, __m128 __B
, __m128 __C
)
4731 return (__m128
) __builtin_ia32_vfnmsubps128_mask ((__v4sf
) __A
,
4737 extern __inline __m128
4738 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4739 _mm_mask3_fnmsub_ps (__m128 __A
, __m128 __B
, __m128 __C
, __mmask8 __U
)
4741 return (__m128
) __builtin_ia32_vfnmsubps128_mask3 ((__v4sf
) __A
,
4747 extern __inline __m128
4748 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4749 _mm_maskz_fnmsub_ps (__mmask8 __U
, __m128 __A
, __m128 __B
, __m128 __C
)
4751 return (__m128
) __builtin_ia32_vfmaddps128_maskz (-(__v4sf
) __A
,
4757 extern __inline __m128i
4758 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4759 _mm_mask_and_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
,
4762 return (__m128i
) __builtin_ia32_pandd128_mask ((__v4si
) __A
,
4768 extern __inline __m128i
4769 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4770 _mm_maskz_and_epi32 (__mmask8 __U
, __m128i __A
, __m128i __B
)
4772 return (__m128i
) __builtin_ia32_pandd128_mask ((__v4si
) __A
,
4775 _mm_setzero_si128 (),
4779 extern __inline __m256i
4780 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4781 _mm256_mask_andnot_epi32 (__m256i __W
, __mmask8 __U
, __m256i __A
,
4784 return (__m256i
) __builtin_ia32_pandnd256_mask ((__v8si
) __A
,
4790 extern __inline __m256i
4791 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4792 _mm256_maskz_andnot_epi32 (__mmask8 __U
, __m256i __A
, __m256i __B
)
4794 return (__m256i
) __builtin_ia32_pandnd256_mask ((__v8si
) __A
,
4797 _mm256_setzero_si256 (),
4801 extern __inline __m128i
4802 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4803 _mm_mask_andnot_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
,
4806 return (__m128i
) __builtin_ia32_pandnd128_mask ((__v4si
) __A
,
4812 extern __inline __m128i
4813 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4814 _mm_maskz_andnot_epi32 (__mmask8 __U
, __m128i __A
, __m128i __B
)
4816 return (__m128i
) __builtin_ia32_pandnd128_mask ((__v4si
) __A
,
4819 _mm_setzero_si128 (),
4823 extern __inline __m256i
4824 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4825 _mm256_mask_or_epi32 (__m256i __W
, __mmask8 __U
, __m256i __A
,
4828 return (__m256i
) __builtin_ia32_pord256_mask ((__v8si
) __A
,
4834 extern __inline __m256i
4835 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4836 _mm256_maskz_or_epi32 (__mmask8 __U
, __m256i __A
, __m256i __B
)
4838 return (__m256i
) __builtin_ia32_pord256_mask ((__v8si
) __A
,
4841 _mm256_setzero_si256 (),
4845 extern __inline __m128i
4846 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4847 _mm_mask_or_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
, __m128i __B
)
4849 return (__m128i
) __builtin_ia32_pord128_mask ((__v4si
) __A
,
4855 extern __inline __m128i
4856 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4857 _mm_maskz_or_epi32 (__mmask8 __U
, __m128i __A
, __m128i __B
)
4859 return (__m128i
) __builtin_ia32_pord128_mask ((__v4si
) __A
,
4862 _mm_setzero_si128 (),
4866 extern __inline __m256i
4867 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4868 _mm256_mask_xor_epi32 (__m256i __W
, __mmask8 __U
, __m256i __A
,
4871 return (__m256i
) __builtin_ia32_pxord256_mask ((__v8si
) __A
,
4877 extern __inline __m256i
4878 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4879 _mm256_maskz_xor_epi32 (__mmask8 __U
, __m256i __A
, __m256i __B
)
4881 return (__m256i
) __builtin_ia32_pxord256_mask ((__v8si
) __A
,
4884 _mm256_setzero_si256 (),
4888 extern __inline __m128i
4889 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4890 _mm_mask_xor_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
,
4893 return (__m128i
) __builtin_ia32_pxord128_mask ((__v4si
) __A
,
4899 extern __inline __m128i
4900 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4901 _mm_maskz_xor_epi32 (__mmask8 __U
, __m128i __A
, __m128i __B
)
4903 return (__m128i
) __builtin_ia32_pxord128_mask ((__v4si
) __A
,
4906 _mm_setzero_si128 (),
4910 extern __inline __m128
4911 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4912 _mm_mask_cvtpd_ps (__m128 __W
, __mmask8 __U
, __m128d __A
)
4914 return (__m128
) __builtin_ia32_cvtpd2ps_mask ((__v2df
) __A
,
4919 extern __inline __m128
4920 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4921 _mm_maskz_cvtpd_ps (__mmask8 __U
, __m128d __A
)
4923 return (__m128
) __builtin_ia32_cvtpd2ps_mask ((__v2df
) __A
,
4929 extern __inline __m128
4930 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4931 _mm256_mask_cvtpd_ps (__m128 __W
, __mmask8 __U
, __m256d __A
)
4933 return (__m128
) __builtin_ia32_cvtpd2ps256_mask ((__v4df
) __A
,
4938 extern __inline __m128
4939 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4940 _mm256_maskz_cvtpd_ps (__mmask8 __U
, __m256d __A
)
4942 return (__m128
) __builtin_ia32_cvtpd2ps256_mask ((__v4df
) __A
,
4948 extern __inline __m256i
4949 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4950 _mm256_mask_cvtps_epi32 (__m256i __W
, __mmask8 __U
, __m256 __A
)
4952 return (__m256i
) __builtin_ia32_cvtps2dq256_mask ((__v8sf
) __A
,
4957 extern __inline __m256i
4958 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4959 _mm256_maskz_cvtps_epi32 (__mmask8 __U
, __m256 __A
)
4961 return (__m256i
) __builtin_ia32_cvtps2dq256_mask ((__v8sf
) __A
,
4963 _mm256_setzero_si256 (),
4967 extern __inline __m128i
4968 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4969 _mm_mask_cvtps_epi32 (__m128i __W
, __mmask8 __U
, __m128 __A
)
4971 return (__m128i
) __builtin_ia32_cvtps2dq128_mask ((__v4sf
) __A
,
4976 extern __inline __m128i
4977 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4978 _mm_maskz_cvtps_epi32 (__mmask8 __U
, __m128 __A
)
4980 return (__m128i
) __builtin_ia32_cvtps2dq128_mask ((__v4sf
) __A
,
4982 _mm_setzero_si128 (),
4986 extern __inline __m256i
4987 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4988 _mm256_cvtps_epu32 (__m256 __A
)
4990 return (__m256i
) __builtin_ia32_cvtps2udq256_mask ((__v8sf
) __A
,
4992 _mm256_setzero_si256 (),
4996 extern __inline __m256i
4997 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
4998 _mm256_mask_cvtps_epu32 (__m256i __W
, __mmask8 __U
, __m256 __A
)
5000 return (__m256i
) __builtin_ia32_cvtps2udq256_mask ((__v8sf
) __A
,
5005 extern __inline __m256i
5006 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5007 _mm256_maskz_cvtps_epu32 (__mmask8 __U
, __m256 __A
)
5009 return (__m256i
) __builtin_ia32_cvtps2udq256_mask ((__v8sf
) __A
,
5011 _mm256_setzero_si256 (),
5015 extern __inline __m128i
5016 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5017 _mm_cvtps_epu32 (__m128 __A
)
5019 return (__m128i
) __builtin_ia32_cvtps2udq128_mask ((__v4sf
) __A
,
5021 _mm_setzero_si128 (),
5025 extern __inline __m128i
5026 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5027 _mm_mask_cvtps_epu32 (__m128i __W
, __mmask8 __U
, __m128 __A
)
5029 return (__m128i
) __builtin_ia32_cvtps2udq128_mask ((__v4sf
) __A
,
5034 extern __inline __m128i
5035 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5036 _mm_maskz_cvtps_epu32 (__mmask8 __U
, __m128 __A
)
5038 return (__m128i
) __builtin_ia32_cvtps2udq128_mask ((__v4sf
) __A
,
5040 _mm_setzero_si128 (),
5044 extern __inline __m256d
5045 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5046 _mm256_mask_movedup_pd (__m256d __W
, __mmask8 __U
, __m256d __A
)
5048 return (__m256d
) __builtin_ia32_movddup256_mask ((__v4df
) __A
,
5053 extern __inline __m256d
5054 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5055 _mm256_maskz_movedup_pd (__mmask8 __U
, __m256d __A
)
5057 return (__m256d
) __builtin_ia32_movddup256_mask ((__v4df
) __A
,
5059 _mm256_setzero_pd (),
5063 extern __inline __m128d
5064 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5065 _mm_mask_movedup_pd (__m128d __W
, __mmask8 __U
, __m128d __A
)
5067 return (__m128d
) __builtin_ia32_movddup128_mask ((__v2df
) __A
,
5072 extern __inline __m128d
5073 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5074 _mm_maskz_movedup_pd (__mmask8 __U
, __m128d __A
)
5076 return (__m128d
) __builtin_ia32_movddup128_mask ((__v2df
) __A
,
5082 extern __inline __m256
5083 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5084 _mm256_mask_movehdup_ps (__m256 __W
, __mmask8 __U
, __m256 __A
)
5086 return (__m256
) __builtin_ia32_movshdup256_mask ((__v8sf
) __A
,
5091 extern __inline __m256
5092 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5093 _mm256_maskz_movehdup_ps (__mmask8 __U
, __m256 __A
)
5095 return (__m256
) __builtin_ia32_movshdup256_mask ((__v8sf
) __A
,
5097 _mm256_setzero_ps (),
5101 extern __inline __m128
5102 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5103 _mm_mask_movehdup_ps (__m128 __W
, __mmask8 __U
, __m128 __A
)
5105 return (__m128
) __builtin_ia32_movshdup128_mask ((__v4sf
) __A
,
5110 extern __inline __m128
5111 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5112 _mm_maskz_movehdup_ps (__mmask8 __U
, __m128 __A
)
5114 return (__m128
) __builtin_ia32_movshdup128_mask ((__v4sf
) __A
,
5120 extern __inline __m256
5121 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5122 _mm256_mask_moveldup_ps (__m256 __W
, __mmask8 __U
, __m256 __A
)
5124 return (__m256
) __builtin_ia32_movsldup256_mask ((__v8sf
) __A
,
5129 extern __inline __m256
5130 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5131 _mm256_maskz_moveldup_ps (__mmask8 __U
, __m256 __A
)
5133 return (__m256
) __builtin_ia32_movsldup256_mask ((__v8sf
) __A
,
5135 _mm256_setzero_ps (),
5139 extern __inline __m128
5140 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5141 _mm_mask_moveldup_ps (__m128 __W
, __mmask8 __U
, __m128 __A
)
5143 return (__m128
) __builtin_ia32_movsldup128_mask ((__v4sf
) __A
,
5148 extern __inline __m128
5149 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5150 _mm_maskz_moveldup_ps (__mmask8 __U
, __m128 __A
)
5152 return (__m128
) __builtin_ia32_movsldup128_mask ((__v4sf
) __A
,
5158 extern __inline __m128i
5159 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5160 _mm_mask_unpackhi_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
,
5163 return (__m128i
) __builtin_ia32_punpckhdq128_mask ((__v4si
) __A
,
5169 extern __inline __m128i
5170 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5171 _mm_maskz_unpackhi_epi32 (__mmask8 __U
, __m128i __A
, __m128i __B
)
5173 return (__m128i
) __builtin_ia32_punpckhdq128_mask ((__v4si
) __A
,
5176 _mm_setzero_si128 (),
5180 extern __inline __m256i
5181 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5182 _mm256_mask_unpackhi_epi32 (__m256i __W
, __mmask8 __U
, __m256i __A
,
5185 return (__m256i
) __builtin_ia32_punpckhdq256_mask ((__v8si
) __A
,
5191 extern __inline __m256i
5192 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5193 _mm256_maskz_unpackhi_epi32 (__mmask8 __U
, __m256i __A
, __m256i __B
)
5195 return (__m256i
) __builtin_ia32_punpckhdq256_mask ((__v8si
) __A
,
5198 _mm256_setzero_si256 (),
5202 extern __inline __m128i
5203 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5204 _mm_mask_unpackhi_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
,
5207 return (__m128i
) __builtin_ia32_punpckhqdq128_mask ((__v2di
) __A
,
5213 extern __inline __m128i
5214 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5215 _mm_maskz_unpackhi_epi64 (__mmask8 __U
, __m128i __A
, __m128i __B
)
5217 return (__m128i
) __builtin_ia32_punpckhqdq128_mask ((__v2di
) __A
,
5224 extern __inline __m256i
5225 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5226 _mm256_mask_unpackhi_epi64 (__m256i __W
, __mmask8 __U
, __m256i __A
,
5229 return (__m256i
) __builtin_ia32_punpckhqdq256_mask ((__v4di
) __A
,
5235 extern __inline __m256i
5236 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5237 _mm256_maskz_unpackhi_epi64 (__mmask8 __U
, __m256i __A
, __m256i __B
)
5239 return (__m256i
) __builtin_ia32_punpckhqdq256_mask ((__v4di
) __A
,
5242 _mm256_setzero_si256 (),
5246 extern __inline __m128i
5247 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5248 _mm_mask_unpacklo_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
,
5251 return (__m128i
) __builtin_ia32_punpckldq128_mask ((__v4si
) __A
,
5257 extern __inline __m128i
5258 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5259 _mm_maskz_unpacklo_epi32 (__mmask8 __U
, __m128i __A
, __m128i __B
)
5261 return (__m128i
) __builtin_ia32_punpckldq128_mask ((__v4si
) __A
,
5264 _mm_setzero_si128 (),
5268 extern __inline __m256i
5269 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5270 _mm256_mask_unpacklo_epi32 (__m256i __W
, __mmask8 __U
, __m256i __A
,
5273 return (__m256i
) __builtin_ia32_punpckldq256_mask ((__v8si
) __A
,
5279 extern __inline __m256i
5280 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5281 _mm256_maskz_unpacklo_epi32 (__mmask8 __U
, __m256i __A
, __m256i __B
)
5283 return (__m256i
) __builtin_ia32_punpckldq256_mask ((__v8si
) __A
,
5286 _mm256_setzero_si256 (),
5290 extern __inline __m128i
5291 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5292 _mm_mask_unpacklo_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
,
5295 return (__m128i
) __builtin_ia32_punpcklqdq128_mask ((__v2di
) __A
,
5301 extern __inline __m128i
5302 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5303 _mm_maskz_unpacklo_epi64 (__mmask8 __U
, __m128i __A
, __m128i __B
)
5305 return (__m128i
) __builtin_ia32_punpcklqdq128_mask ((__v2di
) __A
,
5312 extern __inline __m256i
5313 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5314 _mm256_mask_unpacklo_epi64 (__m256i __W
, __mmask8 __U
, __m256i __A
,
5317 return (__m256i
) __builtin_ia32_punpcklqdq256_mask ((__v4di
) __A
,
5323 extern __inline __m256i
5324 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5325 _mm256_maskz_unpacklo_epi64 (__mmask8 __U
, __m256i __A
, __m256i __B
)
5327 return (__m256i
) __builtin_ia32_punpcklqdq256_mask ((__v4di
) __A
,
5330 _mm256_setzero_si256 (),
5334 extern __inline __mmask8
5335 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5336 _mm_cmpeq_epu32_mask (__m128i __A
, __m128i __B
)
5338 return (__mmask8
) __builtin_ia32_ucmpd128_mask ((__v4si
) __A
,
5343 extern __inline __mmask8
5344 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5345 _mm_cmpeq_epi32_mask (__m128i __A
, __m128i __B
)
5347 return (__mmask8
) __builtin_ia32_pcmpeqd128_mask ((__v4si
) __A
,
5352 extern __inline __mmask8
5353 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5354 _mm_mask_cmpeq_epu32_mask (__mmask8 __U
, __m128i __A
, __m128i __B
)
5356 return (__mmask8
) __builtin_ia32_ucmpd128_mask ((__v4si
) __A
,
5357 (__v4si
) __B
, 0, __U
);
5360 extern __inline __mmask8
5361 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5362 _mm_mask_cmpeq_epi32_mask (__mmask8 __U
, __m128i __A
, __m128i __B
)
5364 return (__mmask8
) __builtin_ia32_pcmpeqd128_mask ((__v4si
) __A
,
5368 extern __inline __mmask8
5369 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5370 _mm256_cmpeq_epu32_mask (__m256i __A
, __m256i __B
)
5372 return (__mmask8
) __builtin_ia32_ucmpd256_mask ((__v8si
) __A
,
5377 extern __inline __mmask8
5378 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5379 _mm256_cmpeq_epi32_mask (__m256i __A
, __m256i __B
)
5381 return (__mmask8
) __builtin_ia32_pcmpeqd256_mask ((__v8si
) __A
,
5386 extern __inline __mmask8
5387 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5388 _mm256_mask_cmpeq_epu32_mask (__mmask8 __U
, __m256i __A
, __m256i __B
)
5390 return (__mmask8
) __builtin_ia32_ucmpd256_mask ((__v8si
) __A
,
5391 (__v8si
) __B
, 0, __U
);
5394 extern __inline __mmask8
5395 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5396 _mm256_mask_cmpeq_epi32_mask (__mmask8 __U
, __m256i __A
, __m256i __B
)
5398 return (__mmask8
) __builtin_ia32_pcmpeqd256_mask ((__v8si
) __A
,
5402 extern __inline __mmask8
5403 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5404 _mm_cmpeq_epu64_mask (__m128i __A
, __m128i __B
)
5406 return (__mmask8
) __builtin_ia32_ucmpq128_mask ((__v2di
) __A
,
5411 extern __inline __mmask8
5412 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5413 _mm_cmpeq_epi64_mask (__m128i __A
, __m128i __B
)
5415 return (__mmask8
) __builtin_ia32_pcmpeqq128_mask ((__v2di
) __A
,
5420 extern __inline __mmask8
5421 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5422 _mm_mask_cmpeq_epu64_mask (__mmask8 __U
, __m128i __A
, __m128i __B
)
5424 return (__mmask8
) __builtin_ia32_ucmpq128_mask ((__v2di
) __A
,
5425 (__v2di
) __B
, 0, __U
);
5428 extern __inline __mmask8
5429 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5430 _mm_mask_cmpeq_epi64_mask (__mmask8 __U
, __m128i __A
, __m128i __B
)
5432 return (__mmask8
) __builtin_ia32_pcmpeqq128_mask ((__v2di
) __A
,
5436 extern __inline __mmask8
5437 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5438 _mm256_cmpeq_epu64_mask (__m256i __A
, __m256i __B
)
5440 return (__mmask8
) __builtin_ia32_ucmpq256_mask ((__v4di
) __A
,
5445 extern __inline __mmask8
5446 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5447 _mm256_cmpeq_epi64_mask (__m256i __A
, __m256i __B
)
5449 return (__mmask8
) __builtin_ia32_pcmpeqq256_mask ((__v4di
) __A
,
5454 extern __inline __mmask8
5455 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5456 _mm256_mask_cmpeq_epu64_mask (__mmask8 __U
, __m256i __A
, __m256i __B
)
5458 return (__mmask8
) __builtin_ia32_ucmpq256_mask ((__v4di
) __A
,
5459 (__v4di
) __B
, 0, __U
);
5462 extern __inline __mmask8
5463 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5464 _mm256_mask_cmpeq_epi64_mask (__mmask8 __U
, __m256i __A
, __m256i __B
)
5466 return (__mmask8
) __builtin_ia32_pcmpeqq256_mask ((__v4di
) __A
,
5470 extern __inline __mmask8
5471 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5472 _mm_cmpgt_epu32_mask (__m128i __A
, __m128i __B
)
5474 return (__mmask8
) __builtin_ia32_ucmpd128_mask ((__v4si
) __A
,
5479 extern __inline __mmask8
5480 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5481 _mm_cmpgt_epi32_mask (__m128i __A
, __m128i __B
)
5483 return (__mmask8
) __builtin_ia32_pcmpgtd128_mask ((__v4si
) __A
,
5488 extern __inline __mmask8
5489 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5490 _mm_mask_cmpgt_epu32_mask (__mmask8 __U
, __m128i __A
, __m128i __B
)
5492 return (__mmask8
) __builtin_ia32_ucmpd128_mask ((__v4si
) __A
,
5493 (__v4si
) __B
, 6, __U
);
5496 extern __inline __mmask8
5497 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5498 _mm_mask_cmpgt_epi32_mask (__mmask8 __U
, __m128i __A
, __m128i __B
)
5500 return (__mmask8
) __builtin_ia32_pcmpgtd128_mask ((__v4si
) __A
,
5504 extern __inline __mmask8
5505 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5506 _mm256_cmpgt_epu32_mask (__m256i __A
, __m256i __B
)
5508 return (__mmask8
) __builtin_ia32_ucmpd256_mask ((__v8si
) __A
,
5513 extern __inline __mmask8
5514 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5515 _mm256_cmpgt_epi32_mask (__m256i __A
, __m256i __B
)
5517 return (__mmask8
) __builtin_ia32_pcmpgtd256_mask ((__v8si
) __A
,
5522 extern __inline __mmask8
5523 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5524 _mm256_mask_cmpgt_epu32_mask (__mmask8 __U
, __m256i __A
, __m256i __B
)
5526 return (__mmask8
) __builtin_ia32_ucmpd256_mask ((__v8si
) __A
,
5527 (__v8si
) __B
, 6, __U
);
5530 extern __inline __mmask8
5531 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5532 _mm256_mask_cmpgt_epi32_mask (__mmask8 __U
, __m256i __A
, __m256i __B
)
5534 return (__mmask8
) __builtin_ia32_pcmpgtd256_mask ((__v8si
) __A
,
5538 extern __inline __mmask8
5539 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5540 _mm_cmpgt_epu64_mask (__m128i __A
, __m128i __B
)
5542 return (__mmask8
) __builtin_ia32_ucmpq128_mask ((__v2di
) __A
,
5547 extern __inline __mmask8
5548 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5549 _mm_cmpgt_epi64_mask (__m128i __A
, __m128i __B
)
5551 return (__mmask8
) __builtin_ia32_pcmpgtq128_mask ((__v2di
) __A
,
5556 extern __inline __mmask8
5557 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5558 _mm_mask_cmpgt_epu64_mask (__mmask8 __U
, __m128i __A
, __m128i __B
)
5560 return (__mmask8
) __builtin_ia32_ucmpq128_mask ((__v2di
) __A
,
5561 (__v2di
) __B
, 6, __U
);
5564 extern __inline __mmask8
5565 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5566 _mm_mask_cmpgt_epi64_mask (__mmask8 __U
, __m128i __A
, __m128i __B
)
5568 return (__mmask8
) __builtin_ia32_pcmpgtq128_mask ((__v2di
) __A
,
5572 extern __inline __mmask8
5573 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5574 _mm256_cmpgt_epu64_mask (__m256i __A
, __m256i __B
)
5576 return (__mmask8
) __builtin_ia32_ucmpq256_mask ((__v4di
) __A
,
5581 extern __inline __mmask8
5582 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5583 _mm256_cmpgt_epi64_mask (__m256i __A
, __m256i __B
)
5585 return (__mmask8
) __builtin_ia32_pcmpgtq256_mask ((__v4di
) __A
,
5590 extern __inline __mmask8
5591 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5592 _mm256_mask_cmpgt_epu64_mask (__mmask8 __U
, __m256i __A
, __m256i __B
)
5594 return (__mmask8
) __builtin_ia32_ucmpq256_mask ((__v4di
) __A
,
5595 (__v4di
) __B
, 6, __U
);
5598 extern __inline __mmask8
5599 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5600 _mm256_mask_cmpgt_epi64_mask (__mmask8 __U
, __m256i __A
, __m256i __B
)
5602 return (__mmask8
) __builtin_ia32_pcmpgtq256_mask ((__v4di
) __A
,
5606 extern __inline __mmask8
5607 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5608 _mm_test_epi32_mask (__m128i __A
, __m128i __B
)
5610 return (__mmask8
) __builtin_ia32_ptestmd128 ((__v4si
) __A
,
5615 extern __inline __mmask8
5616 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5617 _mm_mask_test_epi32_mask (__mmask8 __U
, __m128i __A
, __m128i __B
)
5619 return (__mmask8
) __builtin_ia32_ptestmd128 ((__v4si
) __A
,
5623 extern __inline __mmask8
5624 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5625 _mm256_test_epi32_mask (__m256i __A
, __m256i __B
)
5627 return (__mmask8
) __builtin_ia32_ptestmd256 ((__v8si
) __A
,
5632 extern __inline __mmask8
5633 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5634 _mm256_mask_test_epi32_mask (__mmask8 __U
, __m256i __A
, __m256i __B
)
5636 return (__mmask8
) __builtin_ia32_ptestmd256 ((__v8si
) __A
,
5640 extern __inline __mmask8
5641 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5642 _mm_test_epi64_mask (__m128i __A
, __m128i __B
)
5644 return (__mmask8
) __builtin_ia32_ptestmq128 ((__v2di
) __A
,
5649 extern __inline __mmask8
5650 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5651 _mm_mask_test_epi64_mask (__mmask8 __U
, __m128i __A
, __m128i __B
)
5653 return (__mmask8
) __builtin_ia32_ptestmq128 ((__v2di
) __A
,
5657 extern __inline __mmask8
5658 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5659 _mm256_test_epi64_mask (__m256i __A
, __m256i __B
)
5661 return (__mmask8
) __builtin_ia32_ptestmq256 ((__v4di
) __A
,
5666 extern __inline __mmask8
5667 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5668 _mm256_mask_test_epi64_mask (__mmask8 __U
, __m256i __A
, __m256i __B
)
5670 return (__mmask8
) __builtin_ia32_ptestmq256 ((__v4di
) __A
,
5674 extern __inline __mmask8
5675 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5676 _mm_testn_epi32_mask (__m128i __A
, __m128i __B
)
5678 return (__mmask8
) __builtin_ia32_ptestnmd128 ((__v4si
) __A
,
5683 extern __inline __mmask8
5684 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5685 _mm_mask_testn_epi32_mask (__mmask8 __U
, __m128i __A
, __m128i __B
)
5687 return (__mmask8
) __builtin_ia32_ptestnmd128 ((__v4si
) __A
,
5691 extern __inline __mmask8
5692 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5693 _mm256_testn_epi32_mask (__m256i __A
, __m256i __B
)
5695 return (__mmask8
) __builtin_ia32_ptestnmd256 ((__v8si
) __A
,
5700 extern __inline __mmask8
5701 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5702 _mm256_mask_testn_epi32_mask (__mmask8 __U
, __m256i __A
, __m256i __B
)
5704 return (__mmask8
) __builtin_ia32_ptestnmd256 ((__v8si
) __A
,
5708 extern __inline __mmask8
5709 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5710 _mm_testn_epi64_mask (__m128i __A
, __m128i __B
)
5712 return (__mmask8
) __builtin_ia32_ptestnmq128 ((__v2di
) __A
,
5717 extern __inline __mmask8
5718 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5719 _mm_mask_testn_epi64_mask (__mmask8 __U
, __m128i __A
, __m128i __B
)
5721 return (__mmask8
) __builtin_ia32_ptestnmq128 ((__v2di
) __A
,
5725 extern __inline __mmask8
5726 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5727 _mm256_testn_epi64_mask (__m256i __A
, __m256i __B
)
5729 return (__mmask8
) __builtin_ia32_ptestnmq256 ((__v4di
) __A
,
5734 extern __inline __mmask8
5735 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5736 _mm256_mask_testn_epi64_mask (__mmask8 __U
, __m256i __A
, __m256i __B
)
5738 return (__mmask8
) __builtin_ia32_ptestnmq256 ((__v4di
) __A
,
5742 extern __inline __m256d
5743 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5744 _mm256_mask_compress_pd (__m256d __W
, __mmask8 __U
, __m256d __A
)
5746 return (__m256d
) __builtin_ia32_compressdf256_mask ((__v4df
) __A
,
5751 extern __inline __m256d
5752 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5753 _mm256_maskz_compress_pd (__mmask8 __U
, __m256d __A
)
5755 return (__m256d
) __builtin_ia32_compressdf256_mask ((__v4df
) __A
,
5757 _mm256_setzero_pd (),
5761 extern __inline
void
5762 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5763 _mm256_mask_compressstoreu_pd (void *__P
, __mmask8 __U
, __m256d __A
)
5765 __builtin_ia32_compressstoredf256_mask ((__v4df
*) __P
,
5770 extern __inline __m128d
5771 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5772 _mm_mask_compress_pd (__m128d __W
, __mmask8 __U
, __m128d __A
)
5774 return (__m128d
) __builtin_ia32_compressdf128_mask ((__v2df
) __A
,
5779 extern __inline __m128d
5780 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5781 _mm_maskz_compress_pd (__mmask8 __U
, __m128d __A
)
5783 return (__m128d
) __builtin_ia32_compressdf128_mask ((__v2df
) __A
,
5789 extern __inline
void
5790 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5791 _mm_mask_compressstoreu_pd (void *__P
, __mmask8 __U
, __m128d __A
)
5793 __builtin_ia32_compressstoredf128_mask ((__v2df
*) __P
,
5798 extern __inline __m256
5799 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5800 _mm256_mask_compress_ps (__m256 __W
, __mmask8 __U
, __m256 __A
)
5802 return (__m256
) __builtin_ia32_compresssf256_mask ((__v8sf
) __A
,
5807 extern __inline __m256
5808 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5809 _mm256_maskz_compress_ps (__mmask8 __U
, __m256 __A
)
5811 return (__m256
) __builtin_ia32_compresssf256_mask ((__v8sf
) __A
,
5813 _mm256_setzero_ps (),
5817 extern __inline
void
5818 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5819 _mm256_mask_compressstoreu_ps (void *__P
, __mmask8 __U
, __m256 __A
)
5821 __builtin_ia32_compressstoresf256_mask ((__v8sf
*) __P
,
5826 extern __inline __m128
5827 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5828 _mm_mask_compress_ps (__m128 __W
, __mmask8 __U
, __m128 __A
)
5830 return (__m128
) __builtin_ia32_compresssf128_mask ((__v4sf
) __A
,
5835 extern __inline __m128
5836 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5837 _mm_maskz_compress_ps (__mmask8 __U
, __m128 __A
)
5839 return (__m128
) __builtin_ia32_compresssf128_mask ((__v4sf
) __A
,
5845 extern __inline
void
5846 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5847 _mm_mask_compressstoreu_ps (void *__P
, __mmask8 __U
, __m128 __A
)
5849 __builtin_ia32_compressstoresf128_mask ((__v4sf
*) __P
,
5854 extern __inline __m256i
5855 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5856 _mm256_mask_compress_epi64 (__m256i __W
, __mmask8 __U
, __m256i __A
)
5858 return (__m256i
) __builtin_ia32_compressdi256_mask ((__v4di
) __A
,
5863 extern __inline __m256i
5864 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5865 _mm256_maskz_compress_epi64 (__mmask8 __U
, __m256i __A
)
5867 return (__m256i
) __builtin_ia32_compressdi256_mask ((__v4di
) __A
,
5869 _mm256_setzero_si256 (),
5873 extern __inline
void
5874 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5875 _mm256_mask_compressstoreu_epi64 (void *__P
, __mmask8 __U
, __m256i __A
)
5877 __builtin_ia32_compressstoredi256_mask ((__v4di
*) __P
,
5882 extern __inline __m128i
5883 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5884 _mm_mask_compress_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
)
5886 return (__m128i
) __builtin_ia32_compressdi128_mask ((__v2di
) __A
,
5891 extern __inline __m128i
5892 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5893 _mm_maskz_compress_epi64 (__mmask8 __U
, __m128i __A
)
5895 return (__m128i
) __builtin_ia32_compressdi128_mask ((__v2di
) __A
,
5901 extern __inline
void
5902 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5903 _mm_mask_compressstoreu_epi64 (void *__P
, __mmask8 __U
, __m128i __A
)
5905 __builtin_ia32_compressstoredi128_mask ((__v2di
*) __P
,
5910 extern __inline __m256i
5911 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5912 _mm256_mask_compress_epi32 (__m256i __W
, __mmask8 __U
, __m256i __A
)
5914 return (__m256i
) __builtin_ia32_compresssi256_mask ((__v8si
) __A
,
5919 extern __inline __m256i
5920 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5921 _mm256_maskz_compress_epi32 (__mmask8 __U
, __m256i __A
)
5923 return (__m256i
) __builtin_ia32_compresssi256_mask ((__v8si
) __A
,
5925 _mm256_setzero_si256 (),
5929 extern __inline
void
5930 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5931 _mm256_mask_compressstoreu_epi32 (void *__P
, __mmask8 __U
, __m256i __A
)
5933 __builtin_ia32_compressstoresi256_mask ((__v8si
*) __P
,
5938 extern __inline __m128i
5939 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5940 _mm_mask_compress_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
)
5942 return (__m128i
) __builtin_ia32_compresssi128_mask ((__v4si
) __A
,
5947 extern __inline __m128i
5948 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5949 _mm_maskz_compress_epi32 (__mmask8 __U
, __m128i __A
)
5951 return (__m128i
) __builtin_ia32_compresssi128_mask ((__v4si
) __A
,
5953 _mm_setzero_si128 (),
5957 extern __inline
void
5958 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5959 _mm_mask_compressstoreu_epi32 (void *__P
, __mmask8 __U
, __m128i __A
)
5961 __builtin_ia32_compressstoresi128_mask ((__v4si
*) __P
,
5966 extern __inline __m256d
5967 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5968 _mm256_mask_expand_pd (__m256d __W
, __mmask8 __U
, __m256d __A
)
5970 return (__m256d
) __builtin_ia32_expanddf256_mask ((__v4df
) __A
,
5975 extern __inline __m256d
5976 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5977 _mm256_maskz_expand_pd (__mmask8 __U
, __m256d __A
)
5979 return (__m256d
) __builtin_ia32_expanddf256_maskz ((__v4df
) __A
,
5981 _mm256_setzero_pd (),
5985 extern __inline __m256d
5986 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5987 _mm256_mask_expandloadu_pd (__m256d __W
, __mmask8 __U
, void const *__P
)
5989 return (__m256d
) __builtin_ia32_expandloaddf256_mask ((__v4df
*) __P
,
5995 extern __inline __m256d
5996 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
5997 _mm256_maskz_expandloadu_pd (__mmask8 __U
, void const *__P
)
5999 return (__m256d
) __builtin_ia32_expandloaddf256_maskz ((__v4df
*) __P
,
6001 _mm256_setzero_pd (),
6006 extern __inline __m128d
6007 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6008 _mm_mask_expand_pd (__m128d __W
, __mmask8 __U
, __m128d __A
)
6010 return (__m128d
) __builtin_ia32_expanddf128_mask ((__v2df
) __A
,
6015 extern __inline __m128d
6016 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6017 _mm_maskz_expand_pd (__mmask8 __U
, __m128d __A
)
6019 return (__m128d
) __builtin_ia32_expanddf128_maskz ((__v2df
) __A
,
6025 extern __inline __m128d
6026 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6027 _mm_mask_expandloadu_pd (__m128d __W
, __mmask8 __U
, void const *__P
)
6029 return (__m128d
) __builtin_ia32_expandloaddf128_mask ((__v2df
*) __P
,
6035 extern __inline __m128d
6036 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6037 _mm_maskz_expandloadu_pd (__mmask8 __U
, void const *__P
)
6039 return (__m128d
) __builtin_ia32_expandloaddf128_maskz ((__v2df
*) __P
,
6046 extern __inline __m256
6047 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6048 _mm256_mask_expand_ps (__m256 __W
, __mmask8 __U
, __m256 __A
)
6050 return (__m256
) __builtin_ia32_expandsf256_mask ((__v8sf
) __A
,
6055 extern __inline __m256
6056 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6057 _mm256_maskz_expand_ps (__mmask8 __U
, __m256 __A
)
6059 return (__m256
) __builtin_ia32_expandsf256_maskz ((__v8sf
) __A
,
6061 _mm256_setzero_ps (),
6065 extern __inline __m256
6066 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6067 _mm256_mask_expandloadu_ps (__m256 __W
, __mmask8 __U
, void const *__P
)
6069 return (__m256
) __builtin_ia32_expandloadsf256_mask ((__v8sf
*) __P
,
6074 extern __inline __m256
6075 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6076 _mm256_maskz_expandloadu_ps (__mmask8 __U
, void const *__P
)
6078 return (__m256
) __builtin_ia32_expandloadsf256_maskz ((__v8sf
*) __P
,
6080 _mm256_setzero_ps (),
6085 extern __inline __m128
6086 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6087 _mm_mask_expand_ps (__m128 __W
, __mmask8 __U
, __m128 __A
)
6089 return (__m128
) __builtin_ia32_expandsf128_mask ((__v4sf
) __A
,
6094 extern __inline __m128
6095 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6096 _mm_maskz_expand_ps (__mmask8 __U
, __m128 __A
)
6098 return (__m128
) __builtin_ia32_expandsf128_maskz ((__v4sf
) __A
,
6104 extern __inline __m128
6105 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6106 _mm_mask_expandloadu_ps (__m128 __W
, __mmask8 __U
, void const *__P
)
6108 return (__m128
) __builtin_ia32_expandloadsf128_mask ((__v4sf
*) __P
,
6113 extern __inline __m128
6114 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6115 _mm_maskz_expandloadu_ps (__mmask8 __U
, void const *__P
)
6117 return (__m128
) __builtin_ia32_expandloadsf128_maskz ((__v4sf
*) __P
,
6124 extern __inline __m256i
6125 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6126 _mm256_mask_expand_epi64 (__m256i __W
, __mmask8 __U
, __m256i __A
)
6128 return (__m256i
) __builtin_ia32_expanddi256_mask ((__v4di
) __A
,
6133 extern __inline __m256i
6134 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6135 _mm256_maskz_expand_epi64 (__mmask8 __U
, __m256i __A
)
6137 return (__m256i
) __builtin_ia32_expanddi256_maskz ((__v4di
) __A
,
6139 _mm256_setzero_si256 (),
6143 extern __inline __m256i
6144 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6145 _mm256_mask_expandloadu_epi64 (__m256i __W
, __mmask8 __U
,
6148 return (__m256i
) __builtin_ia32_expandloaddi256_mask ((__v4di
*) __P
,
6154 extern __inline __m256i
6155 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6156 _mm256_maskz_expandloadu_epi64 (__mmask8 __U
, void const *__P
)
6158 return (__m256i
) __builtin_ia32_expandloaddi256_maskz ((__v4di
*) __P
,
6160 _mm256_setzero_si256 (),
6165 extern __inline __m128i
6166 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6167 _mm_mask_expand_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
)
6169 return (__m128i
) __builtin_ia32_expanddi128_mask ((__v2di
) __A
,
6174 extern __inline __m128i
6175 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6176 _mm_maskz_expand_epi64 (__mmask8 __U
, __m128i __A
)
6178 return (__m128i
) __builtin_ia32_expanddi128_maskz ((__v2di
) __A
,
6180 _mm_setzero_si128 (),
6184 extern __inline __m128i
6185 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6186 _mm_mask_expandloadu_epi64 (__m128i __W
, __mmask8 __U
, void const *__P
)
6188 return (__m128i
) __builtin_ia32_expandloaddi128_mask ((__v2di
*) __P
,
6194 extern __inline __m128i
6195 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6196 _mm_maskz_expandloadu_epi64 (__mmask8 __U
, void const *__P
)
6198 return (__m128i
) __builtin_ia32_expandloaddi128_maskz ((__v2di
*) __P
,
6200 _mm_setzero_si128 (),
6205 extern __inline __m256i
6206 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6207 _mm256_mask_expand_epi32 (__m256i __W
, __mmask8 __U
, __m256i __A
)
6209 return (__m256i
) __builtin_ia32_expandsi256_mask ((__v8si
) __A
,
6214 extern __inline __m256i
6215 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6216 _mm256_maskz_expand_epi32 (__mmask8 __U
, __m256i __A
)
6218 return (__m256i
) __builtin_ia32_expandsi256_maskz ((__v8si
) __A
,
6220 _mm256_setzero_si256 (),
6224 extern __inline __m256i
6225 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6226 _mm256_mask_expandloadu_epi32 (__m256i __W
, __mmask8 __U
,
6229 return (__m256i
) __builtin_ia32_expandloadsi256_mask ((__v8si
*) __P
,
6235 extern __inline __m256i
6236 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6237 _mm256_maskz_expandloadu_epi32 (__mmask8 __U
, void const *__P
)
6239 return (__m256i
) __builtin_ia32_expandloadsi256_maskz ((__v8si
*) __P
,
6241 _mm256_setzero_si256 (),
6246 extern __inline __m128i
6247 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6248 _mm_mask_expand_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
)
6250 return (__m128i
) __builtin_ia32_expandsi128_mask ((__v4si
) __A
,
6255 extern __inline __m128i
6256 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6257 _mm_maskz_expand_epi32 (__mmask8 __U
, __m128i __A
)
6259 return (__m128i
) __builtin_ia32_expandsi128_maskz ((__v4si
) __A
,
6261 _mm_setzero_si128 (),
6265 extern __inline __m128i
6266 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6267 _mm_mask_expandloadu_epi32 (__m128i __W
, __mmask8 __U
, void const *__P
)
6269 return (__m128i
) __builtin_ia32_expandloadsi128_mask ((__v4si
*) __P
,
6275 extern __inline __m128i
6276 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6277 _mm_maskz_expandloadu_epi32 (__mmask8 __U
, void const *__P
)
6279 return (__m128i
) __builtin_ia32_expandloadsi128_maskz ((__v4si
*) __P
,
6281 _mm_setzero_si128 (),
6286 extern __inline __m256d
6287 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6288 _mm256_permutex2var_pd (__m256d __A
, __m256i __I
, __m256d __B
)
6290 return (__m256d
) __builtin_ia32_vpermt2varpd256_mask ((__v4di
) __I
6297 extern __inline __m256d
6298 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6299 _mm256_mask_permutex2var_pd (__m256d __A
, __mmask8 __U
, __m256i __I
,
6302 return (__m256d
) __builtin_ia32_vpermt2varpd256_mask ((__v4di
) __I
6310 extern __inline __m256d
6311 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6312 _mm256_mask2_permutex2var_pd (__m256d __A
, __m256i __I
, __mmask8 __U
,
6315 return (__m256d
) __builtin_ia32_vpermi2varpd256_mask ((__v4df
) __A
,
6323 extern __inline __m256d
6324 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6325 _mm256_maskz_permutex2var_pd (__mmask8 __U
, __m256d __A
, __m256i __I
,
6328 return (__m256d
) __builtin_ia32_vpermt2varpd256_maskz ((__v4di
) __I
6336 extern __inline __m256
6337 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6338 _mm256_permutex2var_ps (__m256 __A
, __m256i __I
, __m256 __B
)
6340 return (__m256
) __builtin_ia32_vpermt2varps256_mask ((__v8si
) __I
6347 extern __inline __m256
6348 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6349 _mm256_mask_permutex2var_ps (__m256 __A
, __mmask8 __U
, __m256i __I
,
6352 return (__m256
) __builtin_ia32_vpermt2varps256_mask ((__v8si
) __I
6359 extern __inline __m256
6360 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6361 _mm256_mask2_permutex2var_ps (__m256 __A
, __m256i __I
, __mmask8 __U
,
6364 return (__m256
) __builtin_ia32_vpermi2varps256_mask ((__v8sf
) __A
,
6371 extern __inline __m256
6372 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6373 _mm256_maskz_permutex2var_ps (__mmask8 __U
, __m256 __A
, __m256i __I
,
6376 return (__m256
) __builtin_ia32_vpermt2varps256_maskz ((__v8si
) __I
6384 extern __inline __m128i
6385 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6386 _mm_permutex2var_epi64 (__m128i __A
, __m128i __I
, __m128i __B
)
6388 return (__m128i
) __builtin_ia32_vpermt2varq128_mask ((__v2di
) __I
6395 extern __inline __m128i
6396 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6397 _mm_mask_permutex2var_epi64 (__m128i __A
, __mmask8 __U
, __m128i __I
,
6400 return (__m128i
) __builtin_ia32_vpermt2varq128_mask ((__v2di
) __I
6407 extern __inline __m128i
6408 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6409 _mm_mask2_permutex2var_epi64 (__m128i __A
, __m128i __I
, __mmask8 __U
,
6412 return (__m128i
) __builtin_ia32_vpermi2varq128_mask ((__v2di
) __A
,
6419 extern __inline __m128i
6420 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6421 _mm_maskz_permutex2var_epi64 (__mmask8 __U
, __m128i __A
, __m128i __I
,
6424 return (__m128i
) __builtin_ia32_vpermt2varq128_maskz ((__v2di
) __I
6432 extern __inline __m128i
6433 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6434 _mm_permutex2var_epi32 (__m128i __A
, __m128i __I
, __m128i __B
)
6436 return (__m128i
) __builtin_ia32_vpermt2vard128_mask ((__v4si
) __I
6443 extern __inline __m128i
6444 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6445 _mm_mask_permutex2var_epi32 (__m128i __A
, __mmask8 __U
, __m128i __I
,
6448 return (__m128i
) __builtin_ia32_vpermt2vard128_mask ((__v4si
) __I
6455 extern __inline __m128i
6456 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6457 _mm_mask2_permutex2var_epi32 (__m128i __A
, __m128i __I
, __mmask8 __U
,
6460 return (__m128i
) __builtin_ia32_vpermi2vard128_mask ((__v4si
) __A
,
6467 extern __inline __m128i
6468 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6469 _mm_maskz_permutex2var_epi32 (__mmask8 __U
, __m128i __A
, __m128i __I
,
6472 return (__m128i
) __builtin_ia32_vpermt2vard128_maskz ((__v4si
) __I
6480 extern __inline __m256i
6481 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6482 _mm256_permutex2var_epi64 (__m256i __A
, __m256i __I
, __m256i __B
)
6484 return (__m256i
) __builtin_ia32_vpermt2varq256_mask ((__v4di
) __I
6491 extern __inline __m256i
6492 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6493 _mm256_mask_permutex2var_epi64 (__m256i __A
, __mmask8 __U
, __m256i __I
,
6496 return (__m256i
) __builtin_ia32_vpermt2varq256_mask ((__v4di
) __I
6503 extern __inline __m256i
6504 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6505 _mm256_mask2_permutex2var_epi64 (__m256i __A
, __m256i __I
,
6506 __mmask8 __U
, __m256i __B
)
6508 return (__m256i
) __builtin_ia32_vpermi2varq256_mask ((__v4di
) __A
,
6515 extern __inline __m256i
6516 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6517 _mm256_maskz_permutex2var_epi64 (__mmask8 __U
, __m256i __A
,
6518 __m256i __I
, __m256i __B
)
6520 return (__m256i
) __builtin_ia32_vpermt2varq256_maskz ((__v4di
) __I
6528 extern __inline __m256i
6529 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6530 _mm256_permutex2var_epi32 (__m256i __A
, __m256i __I
, __m256i __B
)
6532 return (__m256i
) __builtin_ia32_vpermt2vard256_mask ((__v8si
) __I
6539 extern __inline __m256i
6540 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6541 _mm256_mask_permutex2var_epi32 (__m256i __A
, __mmask8 __U
, __m256i __I
,
6544 return (__m256i
) __builtin_ia32_vpermt2vard256_mask ((__v8si
) __I
6551 extern __inline __m256i
6552 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6553 _mm256_mask2_permutex2var_epi32 (__m256i __A
, __m256i __I
,
6554 __mmask8 __U
, __m256i __B
)
6556 return (__m256i
) __builtin_ia32_vpermi2vard256_mask ((__v8si
) __A
,
6563 extern __inline __m256i
6564 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6565 _mm256_maskz_permutex2var_epi32 (__mmask8 __U
, __m256i __A
,
6566 __m256i __I
, __m256i __B
)
6568 return (__m256i
) __builtin_ia32_vpermt2vard256_maskz ((__v8si
) __I
6576 extern __inline __m128d
6577 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6578 _mm_permutex2var_pd (__m128d __A
, __m128i __I
, __m128d __B
)
6580 return (__m128d
) __builtin_ia32_vpermt2varpd128_mask ((__v2di
) __I
6587 extern __inline __m128d
6588 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6589 _mm_mask_permutex2var_pd (__m128d __A
, __mmask8 __U
, __m128i __I
,
6592 return (__m128d
) __builtin_ia32_vpermt2varpd128_mask ((__v2di
) __I
6600 extern __inline __m128d
6601 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6602 _mm_mask2_permutex2var_pd (__m128d __A
, __m128i __I
, __mmask8 __U
,
6605 return (__m128d
) __builtin_ia32_vpermi2varpd128_mask ((__v2df
) __A
,
6613 extern __inline __m128d
6614 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6615 _mm_maskz_permutex2var_pd (__mmask8 __U
, __m128d __A
, __m128i __I
,
6618 return (__m128d
) __builtin_ia32_vpermt2varpd128_maskz ((__v2di
) __I
6626 extern __inline __m128
6627 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6628 _mm_permutex2var_ps (__m128 __A
, __m128i __I
, __m128 __B
)
6630 return (__m128
) __builtin_ia32_vpermt2varps128_mask ((__v4si
) __I
6637 extern __inline __m128
6638 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6639 _mm_mask_permutex2var_ps (__m128 __A
, __mmask8 __U
, __m128i __I
,
6642 return (__m128
) __builtin_ia32_vpermt2varps128_mask ((__v4si
) __I
6649 extern __inline __m128
6650 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6651 _mm_mask2_permutex2var_ps (__m128 __A
, __m128i __I
, __mmask8 __U
,
6654 return (__m128
) __builtin_ia32_vpermi2varps128_mask ((__v4sf
) __A
,
6661 extern __inline __m128
6662 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6663 _mm_maskz_permutex2var_ps (__mmask8 __U
, __m128 __A
, __m128i __I
,
6666 return (__m128
) __builtin_ia32_vpermt2varps128_maskz ((__v4si
) __I
6674 extern __inline __m128i
6675 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6676 _mm_srav_epi64 (__m128i __X
, __m128i __Y
)
6678 return (__m128i
) __builtin_ia32_psravq128_mask ((__v2di
) __X
,
6685 extern __inline __m128i
6686 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6687 _mm_mask_srav_epi64 (__m128i __W
, __mmask8 __U
, __m128i __X
,
6690 return (__m128i
) __builtin_ia32_psravq128_mask ((__v2di
) __X
,
6696 extern __inline __m128i
6697 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6698 _mm_maskz_srav_epi64 (__mmask8 __U
, __m128i __X
, __m128i __Y
)
6700 return (__m128i
) __builtin_ia32_psravq128_mask ((__v2di
) __X
,
6707 extern __inline __m256i
6708 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6709 _mm256_mask_sllv_epi32 (__m256i __W
, __mmask8 __U
, __m256i __X
,
6712 return (__m256i
) __builtin_ia32_psllv8si_mask ((__v8si
) __X
,
6718 extern __inline __m256i
6719 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6720 _mm256_maskz_sllv_epi32 (__mmask8 __U
, __m256i __X
, __m256i __Y
)
6722 return (__m256i
) __builtin_ia32_psllv8si_mask ((__v8si
) __X
,
6725 _mm256_setzero_si256 (),
6729 extern __inline __m128i
6730 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6731 _mm_mask_sllv_epi32 (__m128i __W
, __mmask8 __U
, __m128i __X
,
6734 return (__m128i
) __builtin_ia32_psllv4si_mask ((__v4si
) __X
,
6740 extern __inline __m128i
6741 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6742 _mm_maskz_sllv_epi32 (__mmask8 __U
, __m128i __X
, __m128i __Y
)
6744 return (__m128i
) __builtin_ia32_psllv4si_mask ((__v4si
) __X
,
6747 _mm_setzero_si128 (),
6751 extern __inline __m256i
6752 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6753 _mm256_mask_sllv_epi64 (__m256i __W
, __mmask8 __U
, __m256i __X
,
6756 return (__m256i
) __builtin_ia32_psllv4di_mask ((__v4di
) __X
,
6762 extern __inline __m256i
6763 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6764 _mm256_maskz_sllv_epi64 (__mmask8 __U
, __m256i __X
, __m256i __Y
)
6766 return (__m256i
) __builtin_ia32_psllv4di_mask ((__v4di
) __X
,
6769 _mm256_setzero_si256 (),
6773 extern __inline __m128i
6774 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6775 _mm_mask_sllv_epi64 (__m128i __W
, __mmask8 __U
, __m128i __X
,
6778 return (__m128i
) __builtin_ia32_psllv2di_mask ((__v2di
) __X
,
6784 extern __inline __m128i
6785 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6786 _mm_maskz_sllv_epi64 (__mmask8 __U
, __m128i __X
, __m128i __Y
)
6788 return (__m128i
) __builtin_ia32_psllv2di_mask ((__v2di
) __X
,
6795 extern __inline __m256i
6796 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6797 _mm256_mask_srav_epi32 (__m256i __W
, __mmask8 __U
, __m256i __X
,
6800 return (__m256i
) __builtin_ia32_psrav8si_mask ((__v8si
) __X
,
6806 extern __inline __m256i
6807 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6808 _mm256_maskz_srav_epi32 (__mmask8 __U
, __m256i __X
, __m256i __Y
)
6810 return (__m256i
) __builtin_ia32_psrav8si_mask ((__v8si
) __X
,
6813 _mm256_setzero_si256 (),
6817 extern __inline __m128i
6818 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6819 _mm_mask_srav_epi32 (__m128i __W
, __mmask8 __U
, __m128i __X
,
6822 return (__m128i
) __builtin_ia32_psrav4si_mask ((__v4si
) __X
,
6828 extern __inline __m128i
6829 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6830 _mm_maskz_srav_epi32 (__mmask8 __U
, __m128i __X
, __m128i __Y
)
6832 return (__m128i
) __builtin_ia32_psrav4si_mask ((__v4si
) __X
,
6835 _mm_setzero_si128 (),
6839 extern __inline __m256i
6840 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6841 _mm256_mask_srlv_epi32 (__m256i __W
, __mmask8 __U
, __m256i __X
,
6844 return (__m256i
) __builtin_ia32_psrlv8si_mask ((__v8si
) __X
,
6850 extern __inline __m256i
6851 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6852 _mm256_maskz_srlv_epi32 (__mmask8 __U
, __m256i __X
, __m256i __Y
)
6854 return (__m256i
) __builtin_ia32_psrlv8si_mask ((__v8si
) __X
,
6857 _mm256_setzero_si256 (),
6861 extern __inline __m128i
6862 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6863 _mm_mask_srlv_epi32 (__m128i __W
, __mmask8 __U
, __m128i __X
,
6866 return (__m128i
) __builtin_ia32_psrlv4si_mask ((__v4si
) __X
,
6872 extern __inline __m128i
6873 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6874 _mm_maskz_srlv_epi32 (__mmask8 __U
, __m128i __X
, __m128i __Y
)
6876 return (__m128i
) __builtin_ia32_psrlv4si_mask ((__v4si
) __X
,
6879 _mm_setzero_si128 (),
6883 extern __inline __m256i
6884 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6885 _mm256_mask_srlv_epi64 (__m256i __W
, __mmask8 __U
, __m256i __X
,
6888 return (__m256i
) __builtin_ia32_psrlv4di_mask ((__v4di
) __X
,
6894 extern __inline __m256i
6895 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6896 _mm256_maskz_srlv_epi64 (__mmask8 __U
, __m256i __X
, __m256i __Y
)
6898 return (__m256i
) __builtin_ia32_psrlv4di_mask ((__v4di
) __X
,
6901 _mm256_setzero_si256 (),
6905 extern __inline __m128i
6906 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6907 _mm_mask_srlv_epi64 (__m128i __W
, __mmask8 __U
, __m128i __X
,
6910 return (__m128i
) __builtin_ia32_psrlv2di_mask ((__v2di
) __X
,
6916 extern __inline __m128i
6917 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6918 _mm_maskz_srlv_epi64 (__mmask8 __U
, __m128i __X
, __m128i __Y
)
6920 return (__m128i
) __builtin_ia32_psrlv2di_mask ((__v2di
) __X
,
6927 extern __inline __m256i
6928 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6929 _mm256_rolv_epi32 (__m256i __A
, __m256i __B
)
6931 return (__m256i
) __builtin_ia32_prolvd256_mask ((__v8si
) __A
,
6934 _mm256_setzero_si256 (),
6938 extern __inline __m256i
6939 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6940 _mm256_mask_rolv_epi32 (__m256i __W
, __mmask8 __U
, __m256i __A
,
6943 return (__m256i
) __builtin_ia32_prolvd256_mask ((__v8si
) __A
,
6949 extern __inline __m256i
6950 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6951 _mm256_maskz_rolv_epi32 (__mmask8 __U
, __m256i __A
, __m256i __B
)
6953 return (__m256i
) __builtin_ia32_prolvd256_mask ((__v8si
) __A
,
6956 _mm256_setzero_si256 (),
6960 extern __inline __m128i
6961 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6962 _mm_rolv_epi32 (__m128i __A
, __m128i __B
)
6964 return (__m128i
) __builtin_ia32_prolvd128_mask ((__v4si
) __A
,
6967 _mm_setzero_si128 (),
6971 extern __inline __m128i
6972 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6973 _mm_mask_rolv_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
,
6976 return (__m128i
) __builtin_ia32_prolvd128_mask ((__v4si
) __A
,
6982 extern __inline __m128i
6983 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6984 _mm_maskz_rolv_epi32 (__mmask8 __U
, __m128i __A
, __m128i __B
)
6986 return (__m128i
) __builtin_ia32_prolvd128_mask ((__v4si
) __A
,
6989 _mm_setzero_si128 (),
6993 extern __inline __m256i
6994 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
6995 _mm256_rorv_epi32 (__m256i __A
, __m256i __B
)
6997 return (__m256i
) __builtin_ia32_prorvd256_mask ((__v8si
) __A
,
7000 _mm256_setzero_si256 (),
7004 extern __inline __m256i
7005 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7006 _mm256_mask_rorv_epi32 (__m256i __W
, __mmask8 __U
, __m256i __A
,
7009 return (__m256i
) __builtin_ia32_prorvd256_mask ((__v8si
) __A
,
7015 extern __inline __m256i
7016 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7017 _mm256_maskz_rorv_epi32 (__mmask8 __U
, __m256i __A
, __m256i __B
)
7019 return (__m256i
) __builtin_ia32_prorvd256_mask ((__v8si
) __A
,
7022 _mm256_setzero_si256 (),
7026 extern __inline __m128i
7027 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7028 _mm_rorv_epi32 (__m128i __A
, __m128i __B
)
7030 return (__m128i
) __builtin_ia32_prorvd128_mask ((__v4si
) __A
,
7033 _mm_setzero_si128 (),
7037 extern __inline __m128i
7038 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7039 _mm_mask_rorv_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
,
7042 return (__m128i
) __builtin_ia32_prorvd128_mask ((__v4si
) __A
,
7048 extern __inline __m128i
7049 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7050 _mm_maskz_rorv_epi32 (__mmask8 __U
, __m128i __A
, __m128i __B
)
7052 return (__m128i
) __builtin_ia32_prorvd128_mask ((__v4si
) __A
,
7055 _mm_setzero_si128 (),
7059 extern __inline __m256i
7060 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7061 _mm256_rolv_epi64 (__m256i __A
, __m256i __B
)
7063 return (__m256i
) __builtin_ia32_prolvq256_mask ((__v4di
) __A
,
7066 _mm256_setzero_si256 (),
7070 extern __inline __m256i
7071 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7072 _mm256_mask_rolv_epi64 (__m256i __W
, __mmask8 __U
, __m256i __A
,
7075 return (__m256i
) __builtin_ia32_prolvq256_mask ((__v4di
) __A
,
7081 extern __inline __m256i
7082 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7083 _mm256_maskz_rolv_epi64 (__mmask8 __U
, __m256i __A
, __m256i __B
)
7085 return (__m256i
) __builtin_ia32_prolvq256_mask ((__v4di
) __A
,
7088 _mm256_setzero_si256 (),
7092 extern __inline __m128i
7093 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7094 _mm_rolv_epi64 (__m128i __A
, __m128i __B
)
7096 return (__m128i
) __builtin_ia32_prolvq128_mask ((__v2di
) __A
,
7103 extern __inline __m128i
7104 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7105 _mm_mask_rolv_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
,
7108 return (__m128i
) __builtin_ia32_prolvq128_mask ((__v2di
) __A
,
7114 extern __inline __m128i
7115 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7116 _mm_maskz_rolv_epi64 (__mmask8 __U
, __m128i __A
, __m128i __B
)
7118 return (__m128i
) __builtin_ia32_prolvq128_mask ((__v2di
) __A
,
7125 extern __inline __m256i
7126 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7127 _mm256_rorv_epi64 (__m256i __A
, __m256i __B
)
7129 return (__m256i
) __builtin_ia32_prorvq256_mask ((__v4di
) __A
,
7132 _mm256_setzero_si256 (),
7136 extern __inline __m256i
7137 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7138 _mm256_mask_rorv_epi64 (__m256i __W
, __mmask8 __U
, __m256i __A
,
7141 return (__m256i
) __builtin_ia32_prorvq256_mask ((__v4di
) __A
,
7147 extern __inline __m256i
7148 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7149 _mm256_maskz_rorv_epi64 (__mmask8 __U
, __m256i __A
, __m256i __B
)
7151 return (__m256i
) __builtin_ia32_prorvq256_mask ((__v4di
) __A
,
7154 _mm256_setzero_si256 (),
7158 extern __inline __m128i
7159 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7160 _mm_rorv_epi64 (__m128i __A
, __m128i __B
)
7162 return (__m128i
) __builtin_ia32_prorvq128_mask ((__v2di
) __A
,
7169 extern __inline __m128i
7170 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7171 _mm_mask_rorv_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
,
7174 return (__m128i
) __builtin_ia32_prorvq128_mask ((__v2di
) __A
,
7180 extern __inline __m128i
7181 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7182 _mm_maskz_rorv_epi64 (__mmask8 __U
, __m128i __A
, __m128i __B
)
7184 return (__m128i
) __builtin_ia32_prorvq128_mask ((__v2di
) __A
,
7191 extern __inline __m256i
7192 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7193 _mm256_srav_epi64 (__m256i __X
, __m256i __Y
)
7195 return (__m256i
) __builtin_ia32_psravq256_mask ((__v4di
) __X
,
7198 _mm256_setzero_si256 (),
7202 extern __inline __m256i
7203 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7204 _mm256_mask_srav_epi64 (__m256i __W
, __mmask8 __U
, __m256i __X
,
7207 return (__m256i
) __builtin_ia32_psravq256_mask ((__v4di
) __X
,
7213 extern __inline __m256i
7214 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7215 _mm256_maskz_srav_epi64 (__mmask8 __U
, __m256i __X
, __m256i __Y
)
7217 return (__m256i
) __builtin_ia32_psravq256_mask ((__v4di
) __X
,
7220 _mm256_setzero_si256 (),
7224 extern __inline __m256i
7225 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7226 _mm256_mask_and_epi64 (__m256i __W
, __mmask8 __U
, __m256i __A
,
7229 return (__m256i
) __builtin_ia32_pandq256_mask ((__v4di
) __A
,
7234 extern __inline __m256i
7235 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7236 _mm256_maskz_and_epi64 (__mmask8 __U
, __m256i __A
, __m256i __B
)
7238 return (__m256i
) __builtin_ia32_pandq256_mask ((__v4di
) __A
,
7241 _mm256_setzero_pd (),
7245 extern __inline __m128i
7246 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7247 _mm_mask_and_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
,
7250 return (__m128i
) __builtin_ia32_pandq128_mask ((__v2di
) __A
,
7255 extern __inline __m128i
7256 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7257 _mm_maskz_and_epi64 (__mmask8 __U
, __m128i __A
, __m128i __B
)
7259 return (__m128i
) __builtin_ia32_pandq128_mask ((__v2di
) __A
,
7266 extern __inline __m256i
7267 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7268 _mm256_mask_andnot_epi64 (__m256i __W
, __mmask8 __U
, __m256i __A
,
7271 return (__m256i
) __builtin_ia32_pandnq256_mask ((__v4di
) __A
,
7276 extern __inline __m256i
7277 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7278 _mm256_maskz_andnot_epi64 (__mmask8 __U
, __m256i __A
, __m256i __B
)
7280 return (__m256i
) __builtin_ia32_pandnq256_mask ((__v4di
) __A
,
7283 _mm256_setzero_pd (),
7287 extern __inline __m128i
7288 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7289 _mm_mask_andnot_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
,
7292 return (__m128i
) __builtin_ia32_pandnq128_mask ((__v2di
) __A
,
7297 extern __inline __m128i
7298 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7299 _mm_maskz_andnot_epi64 (__mmask8 __U
, __m128i __A
, __m128i __B
)
7301 return (__m128i
) __builtin_ia32_pandnq128_mask ((__v2di
) __A
,
7308 extern __inline __m256i
7309 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7310 _mm256_mask_or_epi64 (__m256i __W
, __mmask8 __U
, __m256i __A
,
7313 return (__m256i
) __builtin_ia32_porq256_mask ((__v4di
) __A
,
7319 extern __inline __m256i
7320 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7321 _mm256_maskz_or_epi64 (__mmask8 __U
, __m256i __A
, __m256i __B
)
7323 return (__m256i
) __builtin_ia32_porq256_mask ((__v4di
) __A
,
7326 _mm256_setzero_si256 (),
7330 extern __inline __m128i
7331 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7332 _mm_mask_or_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
, __m128i __B
)
7334 return (__m128i
) __builtin_ia32_porq128_mask ((__v2di
) __A
,
7340 extern __inline __m128i
7341 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7342 _mm_maskz_or_epi64 (__mmask8 __U
, __m128i __A
, __m128i __B
)
7344 return (__m128i
) __builtin_ia32_porq128_mask ((__v2di
) __A
,
7347 _mm_setzero_si128 (),
7351 extern __inline __m256i
7352 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7353 _mm256_mask_xor_epi64 (__m256i __W
, __mmask8 __U
, __m256i __A
,
7356 return (__m256i
) __builtin_ia32_pxorq256_mask ((__v4di
) __A
,
7362 extern __inline __m256i
7363 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7364 _mm256_maskz_xor_epi64 (__mmask8 __U
, __m256i __A
, __m256i __B
)
7366 return (__m256i
) __builtin_ia32_pxorq256_mask ((__v4di
) __A
,
7369 _mm256_setzero_si256 (),
7373 extern __inline __m128i
7374 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7375 _mm_mask_xor_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
,
7378 return (__m128i
) __builtin_ia32_pxorq128_mask ((__v2di
) __A
,
7384 extern __inline __m128i
7385 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7386 _mm_maskz_xor_epi64 (__mmask8 __U
, __m128i __A
, __m128i __B
)
7388 return (__m128i
) __builtin_ia32_pxorq128_mask ((__v2di
) __A
,
7391 _mm_setzero_si128 (),
7395 extern __inline __m256d
7396 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7397 _mm256_mask_max_pd (__m256d __W
, __mmask8 __U
, __m256d __A
,
7400 return (__m256d
) __builtin_ia32_maxpd256_mask ((__v4df
) __A
,
7406 extern __inline __m256d
7407 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7408 _mm256_maskz_max_pd (__mmask8 __U
, __m256d __A
, __m256d __B
)
7410 return (__m256d
) __builtin_ia32_maxpd256_mask ((__v4df
) __A
,
7413 _mm256_setzero_pd (),
7417 extern __inline __m256
7418 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7419 _mm256_mask_max_ps (__m256 __W
, __mmask8 __U
, __m256 __A
, __m256 __B
)
7421 return (__m256
) __builtin_ia32_maxps256_mask ((__v8sf
) __A
,
7427 extern __inline __m256
7428 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7429 _mm256_maskz_max_ps (__mmask8 __U
, __m256 __A
, __m256 __B
)
7431 return (__m256
) __builtin_ia32_maxps256_mask ((__v8sf
) __A
,
7434 _mm256_setzero_ps (),
7438 extern __inline __m128
7439 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7440 _mm_mask_div_ps (__m128 __W
, __mmask8 __U
, __m128 __A
, __m128 __B
)
7442 return (__m128
) __builtin_ia32_divps_mask ((__v4sf
) __A
,
7448 extern __inline __m128
7449 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7450 _mm_maskz_div_ps (__mmask8 __U
, __m128 __A
, __m128 __B
)
7452 return (__m128
) __builtin_ia32_divps_mask ((__v4sf
) __A
,
7459 extern __inline __m128d
7460 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7461 _mm_mask_div_pd (__m128d __W
, __mmask8 __U
, __m128d __A
, __m128d __B
)
7463 return (__m128d
) __builtin_ia32_divpd_mask ((__v2df
) __A
,
7469 extern __inline __m128d
7470 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7471 _mm_maskz_div_pd (__mmask8 __U
, __m128d __A
, __m128d __B
)
7473 return (__m128d
) __builtin_ia32_divpd_mask ((__v2df
) __A
,
7480 extern __inline __m256d
7481 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7482 _mm256_mask_min_pd (__m256d __W
, __mmask8 __U
, __m256d __A
,
7485 return (__m256d
) __builtin_ia32_minpd256_mask ((__v4df
) __A
,
7491 extern __inline __m256d
7492 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7493 _mm256_mask_div_pd (__m256d __W
, __mmask8 __U
, __m256d __A
,
7496 return (__m256d
) __builtin_ia32_divpd256_mask ((__v4df
) __A
,
7502 extern __inline __m256d
7503 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7504 _mm256_maskz_min_pd (__mmask8 __U
, __m256d __A
, __m256d __B
)
7506 return (__m256d
) __builtin_ia32_minpd256_mask ((__v4df
) __A
,
7509 _mm256_setzero_pd (),
7513 extern __inline __m256
7514 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7515 _mm256_mask_min_ps (__m256 __W
, __mmask8 __U
, __m256 __A
, __m256 __B
)
7517 return (__m256
) __builtin_ia32_minps256_mask ((__v8sf
) __A
,
7523 extern __inline __m256d
7524 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7525 _mm256_maskz_div_pd (__mmask8 __U
, __m256d __A
, __m256d __B
)
7527 return (__m256d
) __builtin_ia32_divpd256_mask ((__v4df
) __A
,
7530 _mm256_setzero_pd (),
7534 extern __inline __m256
7535 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7536 _mm256_mask_div_ps (__m256 __W
, __mmask8 __U
, __m256 __A
, __m256 __B
)
7538 return (__m256
) __builtin_ia32_divps256_mask ((__v8sf
) __A
,
7544 extern __inline __m256
7545 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7546 _mm256_maskz_min_ps (__mmask8 __U
, __m256 __A
, __m256 __B
)
7548 return (__m256
) __builtin_ia32_minps256_mask ((__v8sf
) __A
,
7551 _mm256_setzero_ps (),
7555 extern __inline __m256
7556 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7557 _mm256_maskz_div_ps (__mmask8 __U
, __m256 __A
, __m256 __B
)
7559 return (__m256
) __builtin_ia32_divps256_mask ((__v8sf
) __A
,
7562 _mm256_setzero_ps (),
7566 extern __inline __m128
7567 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7568 _mm_mask_min_ps (__m128 __W
, __mmask8 __U
, __m128 __A
, __m128 __B
)
7570 return (__m128
) __builtin_ia32_minps_mask ((__v4sf
) __A
,
7576 extern __inline __m128
7577 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7578 _mm_mask_mul_ps (__m128 __W
, __mmask8 __U
, __m128 __A
, __m128 __B
)
7580 return (__m128
) __builtin_ia32_mulps_mask ((__v4sf
) __A
,
7586 extern __inline __m128
7587 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7588 _mm_maskz_min_ps (__mmask8 __U
, __m128 __A
, __m128 __B
)
7590 return (__m128
) __builtin_ia32_minps_mask ((__v4sf
) __A
,
7597 extern __inline __m128
7598 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7599 _mm_maskz_mul_ps (__mmask8 __U
, __m128 __A
, __m128 __B
)
7601 return (__m128
) __builtin_ia32_mulps_mask ((__v4sf
) __A
,
7608 extern __inline __m128
7609 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7610 _mm_mask_max_ps (__m128 __W
, __mmask8 __U
, __m128 __A
, __m128 __B
)
7612 return (__m128
) __builtin_ia32_maxps_mask ((__v4sf
) __A
,
7618 extern __inline __m128
7619 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7620 _mm_maskz_max_ps (__mmask8 __U
, __m128 __A
, __m128 __B
)
7622 return (__m128
) __builtin_ia32_maxps_mask ((__v4sf
) __A
,
7629 extern __inline __m128d
7630 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7631 _mm_mask_min_pd (__m128d __W
, __mmask8 __U
, __m128d __A
, __m128d __B
)
7633 return (__m128d
) __builtin_ia32_minpd_mask ((__v2df
) __A
,
7639 extern __inline __m128d
7640 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7641 _mm_maskz_min_pd (__mmask8 __U
, __m128d __A
, __m128d __B
)
7643 return (__m128d
) __builtin_ia32_minpd_mask ((__v2df
) __A
,
7650 extern __inline __m128d
7651 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7652 _mm_mask_max_pd (__m128d __W
, __mmask8 __U
, __m128d __A
, __m128d __B
)
7654 return (__m128d
) __builtin_ia32_maxpd_mask ((__v2df
) __A
,
7660 extern __inline __m128d
7661 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7662 _mm_maskz_max_pd (__mmask8 __U
, __m128d __A
, __m128d __B
)
7664 return (__m128d
) __builtin_ia32_maxpd_mask ((__v2df
) __A
,
7671 extern __inline __m128d
7672 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7673 _mm_mask_mul_pd (__m128d __W
, __mmask8 __U
, __m128d __A
, __m128d __B
)
7675 return (__m128d
) __builtin_ia32_mulpd_mask ((__v2df
) __A
,
7681 extern __inline __m128d
7682 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7683 _mm_maskz_mul_pd (__mmask8 __U
, __m128d __A
, __m128d __B
)
7685 return (__m128d
) __builtin_ia32_mulpd_mask ((__v2df
) __A
,
7692 extern __inline __m256
7693 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7694 _mm256_mask_mul_ps (__m256 __W
, __mmask8 __U
, __m256 __A
, __m256 __B
)
7696 return (__m256
) __builtin_ia32_mulps256_mask ((__v8sf
) __A
,
7702 extern __inline __m256
7703 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7704 _mm256_maskz_mul_ps (__mmask8 __U
, __m256 __A
, __m256 __B
)
7706 return (__m256
) __builtin_ia32_mulps256_mask ((__v8sf
) __A
,
7709 _mm256_setzero_ps (),
7713 extern __inline __m256d
7714 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7715 _mm256_mask_mul_pd (__m256d __W
, __mmask8 __U
, __m256d __A
,
7718 return (__m256d
) __builtin_ia32_mulpd256_mask ((__v4df
) __A
,
7724 extern __inline __m256d
7725 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7726 _mm256_maskz_mul_pd (__mmask8 __U
, __m256d __A
, __m256d __B
)
7728 return (__m256d
) __builtin_ia32_mulpd256_mask ((__v4df
) __A
,
7731 _mm256_setzero_pd (),
7735 extern __inline __m256i
7736 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7737 _mm256_maskz_max_epi64 (__mmask8 __M
, __m256i __A
, __m256i __B
)
7739 return (__m256i
) __builtin_ia32_pmaxsq256_mask ((__v4di
) __A
,
7742 _mm256_setzero_si256 (),
7746 extern __inline __m256i
7747 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7748 _mm256_mask_max_epi64 (__m256i __W
, __mmask8 __M
, __m256i __A
,
7751 return (__m256i
) __builtin_ia32_pmaxsq256_mask ((__v4di
) __A
,
7756 extern __inline __m256i
7757 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7758 _mm256_min_epi64 (__m256i __A
, __m256i __B
)
7760 return (__m256i
) __builtin_ia32_pminsq256_mask ((__v4di
) __A
,
7763 _mm256_setzero_si256 (),
7767 extern __inline __m256i
7768 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7769 _mm256_mask_min_epi64 (__m256i __W
, __mmask8 __M
, __m256i __A
,
7772 return (__m256i
) __builtin_ia32_pminsq256_mask ((__v4di
) __A
,
7777 extern __inline __m256i
7778 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7779 _mm256_maskz_min_epi64 (__mmask8 __M
, __m256i __A
, __m256i __B
)
7781 return (__m256i
) __builtin_ia32_pminsq256_mask ((__v4di
) __A
,
7784 _mm256_setzero_si256 (),
7788 extern __inline __m256i
7789 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7790 _mm256_maskz_max_epu64 (__mmask8 __M
, __m256i __A
, __m256i __B
)
7792 return (__m256i
) __builtin_ia32_pmaxuq256_mask ((__v4di
) __A
,
7795 _mm256_setzero_si256 (),
7799 extern __inline __m256i
7800 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7801 _mm256_max_epi64 (__m256i __A
, __m256i __B
)
7803 return (__m256i
) __builtin_ia32_pmaxsq256_mask ((__v4di
) __A
,
7806 _mm256_setzero_si256 (),
7810 extern __inline __m256i
7811 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7812 _mm256_max_epu64 (__m256i __A
, __m256i __B
)
7814 return (__m256i
) __builtin_ia32_pmaxuq256_mask ((__v4di
) __A
,
7817 _mm256_setzero_si256 (),
7821 extern __inline __m256i
7822 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7823 _mm256_mask_max_epu64 (__m256i __W
, __mmask8 __M
, __m256i __A
,
7826 return (__m256i
) __builtin_ia32_pmaxuq256_mask ((__v4di
) __A
,
7831 extern __inline __m256i
7832 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7833 _mm256_min_epu64 (__m256i __A
, __m256i __B
)
7835 return (__m256i
) __builtin_ia32_pminuq256_mask ((__v4di
) __A
,
7838 _mm256_setzero_si256 (),
7842 extern __inline __m256i
7843 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7844 _mm256_mask_min_epu64 (__m256i __W
, __mmask8 __M
, __m256i __A
,
7847 return (__m256i
) __builtin_ia32_pminuq256_mask ((__v4di
) __A
,
7852 extern __inline __m256i
7853 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7854 _mm256_maskz_min_epu64 (__mmask8 __M
, __m256i __A
, __m256i __B
)
7856 return (__m256i
) __builtin_ia32_pminuq256_mask ((__v4di
) __A
,
7859 _mm256_setzero_si256 (),
7863 extern __inline __m256i
7864 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7865 _mm256_maskz_max_epi32 (__mmask8 __M
, __m256i __A
, __m256i __B
)
7867 return (__m256i
) __builtin_ia32_pmaxsd256_mask ((__v8si
) __A
,
7870 _mm256_setzero_si256 (),
7874 extern __inline __m256i
7875 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7876 _mm256_mask_max_epi32 (__m256i __W
, __mmask8 __M
, __m256i __A
,
7879 return (__m256i
) __builtin_ia32_pmaxsd256_mask ((__v8si
) __A
,
7884 extern __inline __m256i
7885 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7886 _mm256_maskz_min_epi32 (__mmask8 __M
, __m256i __A
, __m256i __B
)
7888 return (__m256i
) __builtin_ia32_pminsd256_mask ((__v8si
) __A
,
7891 _mm256_setzero_si256 (),
7895 extern __inline __m256i
7896 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7897 _mm256_mask_min_epi32 (__m256i __W
, __mmask8 __M
, __m256i __A
,
7900 return (__m256i
) __builtin_ia32_pminsd256_mask ((__v8si
) __A
,
7905 extern __inline __m256i
7906 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7907 _mm256_maskz_max_epu32 (__mmask8 __M
, __m256i __A
, __m256i __B
)
7909 return (__m256i
) __builtin_ia32_pmaxud256_mask ((__v8si
) __A
,
7912 _mm256_setzero_si256 (),
7916 extern __inline __m256i
7917 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7918 _mm256_mask_max_epu32 (__m256i __W
, __mmask8 __M
, __m256i __A
,
7921 return (__m256i
) __builtin_ia32_pmaxud256_mask ((__v8si
) __A
,
7926 extern __inline __m256i
7927 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7928 _mm256_maskz_min_epu32 (__mmask8 __M
, __m256i __A
, __m256i __B
)
7930 return (__m256i
) __builtin_ia32_pminud256_mask ((__v8si
) __A
,
7933 _mm256_setzero_si256 (),
7937 extern __inline __m256i
7938 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7939 _mm256_mask_min_epu32 (__m256i __W
, __mmask8 __M
, __m256i __A
,
7942 return (__m256i
) __builtin_ia32_pminud256_mask ((__v8si
) __A
,
7947 extern __inline __m128i
7948 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7949 _mm_maskz_max_epi64 (__mmask8 __M
, __m128i __A
, __m128i __B
)
7951 return (__m128i
) __builtin_ia32_pmaxsq128_mask ((__v2di
) __A
,
7954 _mm_setzero_si128 (),
7958 extern __inline __m128i
7959 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7960 _mm_mask_max_epi64 (__m128i __W
, __mmask8 __M
, __m128i __A
,
7963 return (__m128i
) __builtin_ia32_pmaxsq128_mask ((__v2di
) __A
,
7968 extern __inline __m128i
7969 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7970 _mm_min_epi64 (__m128i __A
, __m128i __B
)
7972 return (__m128i
) __builtin_ia32_pminsq128_mask ((__v2di
) __A
,
7979 extern __inline __m128i
7980 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7981 _mm_mask_min_epi64 (__m128i __W
, __mmask8 __M
, __m128i __A
,
7984 return (__m128i
) __builtin_ia32_pminsq128_mask ((__v2di
) __A
,
7989 extern __inline __m128i
7990 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
7991 _mm_maskz_min_epi64 (__mmask8 __M
, __m128i __A
, __m128i __B
)
7993 return (__m128i
) __builtin_ia32_pminsq128_mask ((__v2di
) __A
,
7996 _mm_setzero_si128 (),
8000 extern __inline __m128i
8001 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8002 _mm_maskz_max_epu64 (__mmask8 __M
, __m128i __A
, __m128i __B
)
8004 return (__m128i
) __builtin_ia32_pmaxuq128_mask ((__v2di
) __A
,
8007 _mm_setzero_si128 (),
8011 extern __inline __m128i
8012 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8013 _mm_max_epi64 (__m128i __A
, __m128i __B
)
8015 return (__m128i
) __builtin_ia32_pmaxsq128_mask ((__v2di
) __A
,
8022 extern __inline __m128i
8023 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8024 _mm_max_epu64 (__m128i __A
, __m128i __B
)
8026 return (__m128i
) __builtin_ia32_pmaxuq128_mask ((__v2di
) __A
,
8033 extern __inline __m128i
8034 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8035 _mm_mask_max_epu64 (__m128i __W
, __mmask8 __M
, __m128i __A
,
8038 return (__m128i
) __builtin_ia32_pmaxuq128_mask ((__v2di
) __A
,
8043 extern __inline __m128i
8044 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8045 _mm_min_epu64 (__m128i __A
, __m128i __B
)
8047 return (__m128i
) __builtin_ia32_pminuq128_mask ((__v2di
) __A
,
8054 extern __inline __m128i
8055 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8056 _mm_mask_min_epu64 (__m128i __W
, __mmask8 __M
, __m128i __A
,
8059 return (__m128i
) __builtin_ia32_pminuq128_mask ((__v2di
) __A
,
8064 extern __inline __m128i
8065 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8066 _mm_maskz_min_epu64 (__mmask8 __M
, __m128i __A
, __m128i __B
)
8068 return (__m128i
) __builtin_ia32_pminuq128_mask ((__v2di
) __A
,
8071 _mm_setzero_si128 (),
8075 extern __inline __m128i
8076 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8077 _mm_maskz_max_epi32 (__mmask8 __M
, __m128i __A
, __m128i __B
)
8079 return (__m128i
) __builtin_ia32_pmaxsd128_mask ((__v4si
) __A
,
8082 _mm_setzero_si128 (),
8086 extern __inline __m128i
8087 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8088 _mm_mask_max_epi32 (__m128i __W
, __mmask8 __M
, __m128i __A
,
8091 return (__m128i
) __builtin_ia32_pmaxsd128_mask ((__v4si
) __A
,
8096 extern __inline __m128i
8097 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8098 _mm_maskz_min_epi32 (__mmask8 __M
, __m128i __A
, __m128i __B
)
8100 return (__m128i
) __builtin_ia32_pminsd128_mask ((__v4si
) __A
,
8103 _mm_setzero_si128 (),
8107 extern __inline __m128i
8108 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8109 _mm_mask_min_epi32 (__m128i __W
, __mmask8 __M
, __m128i __A
,
8112 return (__m128i
) __builtin_ia32_pminsd128_mask ((__v4si
) __A
,
8117 extern __inline __m128i
8118 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8119 _mm_maskz_max_epu32 (__mmask8 __M
, __m128i __A
, __m128i __B
)
8121 return (__m128i
) __builtin_ia32_pmaxud128_mask ((__v4si
) __A
,
8124 _mm_setzero_si128 (),
8128 extern __inline __m128i
8129 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8130 _mm_mask_max_epu32 (__m128i __W
, __mmask8 __M
, __m128i __A
,
8133 return (__m128i
) __builtin_ia32_pmaxud128_mask ((__v4si
) __A
,
8138 extern __inline __m128i
8139 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8140 _mm_maskz_min_epu32 (__mmask8 __M
, __m128i __A
, __m128i __B
)
8142 return (__m128i
) __builtin_ia32_pminud128_mask ((__v4si
) __A
,
8145 _mm_setzero_si128 (),
8149 extern __inline __m128i
8150 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8151 _mm_mask_min_epu32 (__m128i __W
, __mmask8 __M
, __m128i __A
,
8154 return (__m128i
) __builtin_ia32_pminud128_mask ((__v4si
) __A
,
8159 #ifndef __AVX512CD__
8160 #pragma GCC push_options
8161 #pragma GCC target("avx512vl,avx512cd")
8162 #define __DISABLE_AVX512VLCD__
/* _mm_broadcastmb_epi64: always-inline wrapper around
   __builtin_ia32_broadcastmb128.

   __A is the __mmask8 value handed unchanged to the builtin.
   Returns the builtin's result cast to __m128i.

   NOTE(review): going by the intrinsic name, the mask is presumably
   replicated into each 64-bit element of the result; confirm against the
   builtin's definition.  */
8165 extern __inline __m128i
8166 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8167 _mm_broadcastmb_epi64 (__mmask8 __A
)
8169 return (__m128i
) __builtin_ia32_broadcastmb128 (__A
);
/* _mm256_broadcastmb_epi64: always-inline wrapper around
   __builtin_ia32_broadcastmb256.

   __A is the __mmask8 value handed unchanged to the builtin.
   Returns the builtin's result cast to __m256i.

   NOTE(review): going by the intrinsic name, the mask is presumably
   replicated into each 64-bit element of the result; confirm against the
   builtin's definition.  */
8172 extern __inline __m256i
8173 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8174 _mm256_broadcastmb_epi64 (__mmask8 __A
)
8176 return (__m256i
) __builtin_ia32_broadcastmb256 (__A
);
/* _mm_broadcastmw_epi32: always-inline wrapper around
   __builtin_ia32_broadcastmw128.

   __A is the __mmask16 value handed unchanged to the builtin.
   Returns the builtin's result cast to __m128i.

   NOTE(review): going by the intrinsic name, the mask is presumably
   replicated into each 32-bit element of the result; confirm against the
   builtin's definition.  */
8179 extern __inline __m128i
8180 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8181 _mm_broadcastmw_epi32 (__mmask16 __A
)
8183 return (__m128i
) __builtin_ia32_broadcastmw128 (__A
);
/* _mm256_broadcastmw_epi32: always-inline wrapper around
   __builtin_ia32_broadcastmw256.

   __A is the __mmask16 value handed unchanged to the builtin.
   Returns the builtin's result cast to __m256i.

   NOTE(review): going by the intrinsic name, the mask is presumably
   replicated into each 32-bit element of the result; confirm against the
   builtin's definition.  */
8186 extern __inline __m256i
8187 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8188 _mm256_broadcastmw_epi32 (__mmask16 __A
)
8190 return (__m256i
) __builtin_ia32_broadcastmw256 (__A
);
8193 extern __inline __m256i
8194 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8195 _mm256_lzcnt_epi32 (__m256i __A
)
8197 return (__m256i
) __builtin_ia32_vplzcntd_256_mask ((__v8si
) __A
,
8199 _mm256_setzero_si256 (),
8203 extern __inline __m256i
8204 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8205 _mm256_mask_lzcnt_epi32 (__m256i __W
, __mmask8 __U
, __m256i __A
)
8207 return (__m256i
) __builtin_ia32_vplzcntd_256_mask ((__v8si
) __A
,
8212 extern __inline __m256i
8213 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8214 _mm256_maskz_lzcnt_epi32 (__mmask8 __U
, __m256i __A
)
8216 return (__m256i
) __builtin_ia32_vplzcntd_256_mask ((__v8si
) __A
,
8218 _mm256_setzero_si256 (),
8222 extern __inline __m256i
8223 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8224 _mm256_lzcnt_epi64 (__m256i __A
)
8226 return (__m256i
) __builtin_ia32_vplzcntq_256_mask ((__v4di
) __A
,
8228 _mm256_setzero_si256 (),
8232 extern __inline __m256i
8233 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8234 _mm256_mask_lzcnt_epi64 (__m256i __W
, __mmask8 __U
, __m256i __A
)
8236 return (__m256i
) __builtin_ia32_vplzcntq_256_mask ((__v4di
) __A
,
8241 extern __inline __m256i
8242 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8243 _mm256_maskz_lzcnt_epi64 (__mmask8 __U
, __m256i __A
)
8245 return (__m256i
) __builtin_ia32_vplzcntq_256_mask ((__v4di
) __A
,
8247 _mm256_setzero_si256 (),
8251 extern __inline __m256i
8252 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8253 _mm256_conflict_epi64 (__m256i __A
)
8255 return (__m256i
) __builtin_ia32_vpconflictdi_256_mask ((__v4di
) __A
,
8257 _mm256_setzero_si256 (),
8261 extern __inline __m256i
8262 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8263 _mm256_mask_conflict_epi64 (__m256i __W
, __mmask8 __U
, __m256i __A
)
8265 return (__m256i
) __builtin_ia32_vpconflictdi_256_mask ((__v4di
) __A
,
8271 extern __inline __m256i
8272 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8273 _mm256_maskz_conflict_epi64 (__mmask8 __U
, __m256i __A
)
8275 return (__m256i
) __builtin_ia32_vpconflictdi_256_mask ((__v4di
) __A
,
8277 _mm256_setzero_si256 (),
8282 extern __inline __m256i
8283 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8284 _mm256_conflict_epi32 (__m256i __A
)
8286 return (__m256i
) __builtin_ia32_vpconflictsi_256_mask ((__v8si
) __A
,
8288 _mm256_setzero_si256 (),
8292 extern __inline __m256i
8293 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8294 _mm256_mask_conflict_epi32 (__m256i __W
, __mmask8 __U
, __m256i __A
)
8296 return (__m256i
) __builtin_ia32_vpconflictsi_256_mask ((__v8si
) __A
,
8302 extern __inline __m256i
8303 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8304 _mm256_maskz_conflict_epi32 (__mmask8 __U
, __m256i __A
)
8306 return (__m256i
) __builtin_ia32_vpconflictsi_256_mask ((__v8si
) __A
,
8308 _mm256_setzero_si256 (),
8313 extern __inline __m128i
8314 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8315 _mm_lzcnt_epi32 (__m128i __A
)
8317 return (__m128i
) __builtin_ia32_vplzcntd_128_mask ((__v4si
) __A
,
8319 _mm_setzero_si128 (),
8323 extern __inline __m128i
8324 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8325 _mm_mask_lzcnt_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
)
8327 return (__m128i
) __builtin_ia32_vplzcntd_128_mask ((__v4si
) __A
,
8332 extern __inline __m128i
8333 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8334 _mm_maskz_lzcnt_epi32 (__mmask8 __U
, __m128i __A
)
8336 return (__m128i
) __builtin_ia32_vplzcntd_128_mask ((__v4si
) __A
,
8338 _mm_setzero_si128 (),
8342 extern __inline __m128i
8343 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8344 _mm_lzcnt_epi64 (__m128i __A
)
8346 return (__m128i
) __builtin_ia32_vplzcntq_128_mask ((__v2di
) __A
,
8352 extern __inline __m128i
8353 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8354 _mm_mask_lzcnt_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
)
8356 return (__m128i
) __builtin_ia32_vplzcntq_128_mask ((__v2di
) __A
,
8361 extern __inline __m128i
8362 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8363 _mm_maskz_lzcnt_epi64 (__mmask8 __U
, __m128i __A
)
8365 return (__m128i
) __builtin_ia32_vplzcntq_128_mask ((__v2di
) __A
,
8371 extern __inline __m128i
8372 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8373 _mm_conflict_epi64 (__m128i __A
)
8375 return (__m128i
) __builtin_ia32_vpconflictdi_128_mask ((__v2di
) __A
,
8381 extern __inline __m128i
8382 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8383 _mm_mask_conflict_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
)
8385 return (__m128i
) __builtin_ia32_vpconflictdi_128_mask ((__v2di
) __A
,
8391 extern __inline __m128i
8392 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8393 _mm_maskz_conflict_epi64 (__mmask8 __U
, __m128i __A
)
8395 return (__m128i
) __builtin_ia32_vpconflictdi_128_mask ((__v2di
) __A
,
8402 extern __inline __m128i
8403 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8404 _mm_conflict_epi32 (__m128i __A
)
8406 return (__m128i
) __builtin_ia32_vpconflictsi_128_mask ((__v4si
) __A
,
8408 _mm_setzero_si128 (),
8412 extern __inline __m128i
8413 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8414 _mm_mask_conflict_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
)
8416 return (__m128i
) __builtin_ia32_vpconflictsi_128_mask ((__v4si
) __A
,
8422 extern __inline __m128i
8423 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8424 _mm_maskz_conflict_epi32 (__mmask8 __U
, __m128i __A
)
8426 return (__m128i
) __builtin_ia32_vpconflictsi_128_mask ((__v4si
) __A
,
8428 _mm_setzero_si128 (),
8433 #ifdef __DISABLE_AVX512VLCD__
8434 #pragma GCC pop_options
8437 extern __inline __m256d
8438 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8439 _mm256_mask_unpacklo_pd (__m256d __W
, __mmask8 __U
, __m256d __A
,
8442 return (__m256d
) __builtin_ia32_unpcklpd256_mask ((__v4df
) __A
,
8448 extern __inline __m256d
8449 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8450 _mm256_maskz_unpacklo_pd (__mmask8 __U
, __m256d __A
, __m256d __B
)
8452 return (__m256d
) __builtin_ia32_unpcklpd256_mask ((__v4df
) __A
,
8455 _mm256_setzero_pd (),
8459 extern __inline __m128d
8460 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8461 _mm_mask_unpacklo_pd (__m128d __W
, __mmask8 __U
, __m128d __A
,
8464 return (__m128d
) __builtin_ia32_unpcklpd128_mask ((__v2df
) __A
,
8470 extern __inline __m128d
8471 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8472 _mm_maskz_unpacklo_pd (__mmask8 __U
, __m128d __A
, __m128d __B
)
8474 return (__m128d
) __builtin_ia32_unpcklpd128_mask ((__v2df
) __A
,
8481 extern __inline __m256
8482 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8483 _mm256_mask_unpacklo_ps (__m256 __W
, __mmask8 __U
, __m256 __A
,
8486 return (__m256
) __builtin_ia32_unpcklps256_mask ((__v8sf
) __A
,
8492 extern __inline __m256d
8493 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8494 _mm256_mask_unpackhi_pd (__m256d __W
, __mmask8 __U
, __m256d __A
,
8497 return (__m256d
) __builtin_ia32_unpckhpd256_mask ((__v4df
) __A
,
8503 extern __inline __m256d
8504 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8505 _mm256_maskz_unpackhi_pd (__mmask8 __U
, __m256d __A
, __m256d __B
)
8507 return (__m256d
) __builtin_ia32_unpckhpd256_mask ((__v4df
) __A
,
8510 _mm256_setzero_pd (),
8514 extern __inline __m128d
8515 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8516 _mm_mask_unpackhi_pd (__m128d __W
, __mmask8 __U
, __m128d __A
,
8519 return (__m128d
) __builtin_ia32_unpckhpd128_mask ((__v2df
) __A
,
8525 extern __inline __m128d
8526 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8527 _mm_maskz_unpackhi_pd (__mmask8 __U
, __m128d __A
, __m128d __B
)
8529 return (__m128d
) __builtin_ia32_unpckhpd128_mask ((__v2df
) __A
,
8536 extern __inline __m256
8537 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8538 _mm256_mask_unpackhi_ps (__m256 __W
, __mmask8 __U
, __m256 __A
,
8541 return (__m256
) __builtin_ia32_unpckhps256_mask ((__v8sf
) __A
,
8547 extern __inline __m256
8548 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8549 _mm256_maskz_unpackhi_ps (__mmask8 __U
, __m256 __A
, __m256 __B
)
8551 return (__m256
) __builtin_ia32_unpckhps256_mask ((__v8sf
) __A
,
8554 _mm256_setzero_ps (),
8558 extern __inline __m128
8559 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8560 _mm_mask_unpackhi_ps (__m128 __W
, __mmask8 __U
, __m128 __A
, __m128 __B
)
8562 return (__m128
) __builtin_ia32_unpckhps128_mask ((__v4sf
) __A
,
8568 extern __inline __m128
8569 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8570 _mm_maskz_unpackhi_ps (__mmask8 __U
, __m128 __A
, __m128 __B
)
8572 return (__m128
) __builtin_ia32_unpckhps128_mask ((__v4sf
) __A
,
8579 extern __inline __m128
8580 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8581 _mm_mask_cvtph_ps (__m128 __W
, __mmask8 __U
, __m128i __A
)
8583 return (__m128
) __builtin_ia32_vcvtph2ps_mask ((__v8hi
) __A
,
8588 extern __inline __m128
8589 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8590 _mm_maskz_cvtph_ps (__mmask8 __U
, __m128i __A
)
8592 return (__m128
) __builtin_ia32_vcvtph2ps_mask ((__v8hi
) __A
,
8598 extern __inline __m256
8599 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8600 _mm256_maskz_unpacklo_ps (__mmask8 __U
, __m256 __A
, __m256 __B
)
8602 return (__m256
) __builtin_ia32_unpcklps256_mask ((__v8sf
) __A
,
8605 _mm256_setzero_ps (),
8609 extern __inline __m256
8610 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8611 _mm256_mask_cvtph_ps (__m256 __W
, __mmask8 __U
, __m128i __A
)
8613 return (__m256
) __builtin_ia32_vcvtph2ps256_mask ((__v8hi
) __A
,
8618 extern __inline __m256
8619 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8620 _mm256_maskz_cvtph_ps (__mmask8 __U
, __m128i __A
)
8622 return (__m256
) __builtin_ia32_vcvtph2ps256_mask ((__v8hi
) __A
,
8624 _mm256_setzero_ps (),
8628 extern __inline __m128
8629 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8630 _mm_mask_unpacklo_ps (__m128 __W
, __mmask8 __U
, __m128 __A
, __m128 __B
)
8632 return (__m128
) __builtin_ia32_unpcklps128_mask ((__v4sf
) __A
,
8638 extern __inline __m128
8639 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8640 _mm_maskz_unpacklo_ps (__mmask8 __U
, __m128 __A
, __m128 __B
)
8642 return (__m128
) __builtin_ia32_unpcklps128_mask ((__v4sf
) __A
,
8649 extern __inline __m256i
8650 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8651 _mm256_mask_sra_epi32 (__m256i __W
, __mmask8 __U
, __m256i __A
,
8654 return (__m256i
) __builtin_ia32_psrad256_mask ((__v8si
) __A
,
8660 extern __inline __m256i
8661 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8662 _mm256_maskz_sra_epi32 (__mmask8 __U
, __m256i __A
, __m128i __B
)
8664 return (__m256i
) __builtin_ia32_psrad256_mask ((__v8si
) __A
,
8667 _mm256_setzero_si256 (),
8671 extern __inline __m128i
8672 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8673 _mm_mask_sra_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
,
8676 return (__m128i
) __builtin_ia32_psrad128_mask ((__v4si
) __A
,
8682 extern __inline __m128i
8683 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8684 _mm_maskz_sra_epi32 (__mmask8 __U
, __m128i __A
, __m128i __B
)
8686 return (__m128i
) __builtin_ia32_psrad128_mask ((__v4si
) __A
,
8689 _mm_setzero_si128 (),
8693 extern __inline __m256i
8694 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8695 _mm256_sra_epi64 (__m256i __A
, __m128i __B
)
8697 return (__m256i
) __builtin_ia32_psraq256_mask ((__v4di
) __A
,
8700 _mm256_setzero_si256 (),
8704 extern __inline __m256i
8705 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8706 _mm256_mask_sra_epi64 (__m256i __W
, __mmask8 __U
, __m256i __A
,
8709 return (__m256i
) __builtin_ia32_psraq256_mask ((__v4di
) __A
,
8715 extern __inline __m256i
8716 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8717 _mm256_maskz_sra_epi64 (__mmask8 __U
, __m256i __A
, __m128i __B
)
8719 return (__m256i
) __builtin_ia32_psraq256_mask ((__v4di
) __A
,
8722 _mm256_setzero_si256 (),
8726 extern __inline __m128i
8727 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8728 _mm_sra_epi64 (__m128i __A
, __m128i __B
)
8730 return (__m128i
) __builtin_ia32_psraq128_mask ((__v2di
) __A
,
8737 extern __inline __m128i
8738 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8739 _mm_mask_sra_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
,
8742 return (__m128i
) __builtin_ia32_psraq128_mask ((__v2di
) __A
,
8748 extern __inline __m128i
8749 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8750 _mm_maskz_sra_epi64 (__mmask8 __U
, __m128i __A
, __m128i __B
)
8752 return (__m128i
) __builtin_ia32_psraq128_mask ((__v2di
) __A
,
8759 extern __inline __m128i
8760 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8761 _mm_mask_sll_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
,
8764 return (__m128i
) __builtin_ia32_pslld128_mask ((__v4si
) __A
,
8770 extern __inline __m128i
8771 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8772 _mm_maskz_sll_epi32 (__mmask8 __U
, __m128i __A
, __m128i __B
)
8774 return (__m128i
) __builtin_ia32_pslld128_mask ((__v4si
) __A
,
8777 _mm_setzero_si128 (),
8781 extern __inline __m128i
8782 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8783 _mm_mask_sll_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
,
8786 return (__m128i
) __builtin_ia32_psllq128_mask ((__v2di
) __A
,
8792 extern __inline __m128i
8793 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8794 _mm_maskz_sll_epi64 (__mmask8 __U
, __m128i __A
, __m128i __B
)
8796 return (__m128i
) __builtin_ia32_psllq128_mask ((__v2di
) __A
,
8803 extern __inline __m256i
8804 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8805 _mm256_mask_sll_epi32 (__m256i __W
, __mmask8 __U
, __m256i __A
,
8808 return (__m256i
) __builtin_ia32_pslld256_mask ((__v8si
) __A
,
8814 extern __inline __m256i
8815 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8816 _mm256_maskz_sll_epi32 (__mmask8 __U
, __m256i __A
, __m128i __B
)
8818 return (__m256i
) __builtin_ia32_pslld256_mask ((__v8si
) __A
,
8821 _mm256_setzero_si256 (),
8825 extern __inline __m256i
8826 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8827 _mm256_mask_sll_epi64 (__m256i __W
, __mmask8 __U
, __m256i __A
,
8830 return (__m256i
) __builtin_ia32_psllq256_mask ((__v4di
) __A
,
8836 extern __inline __m256i
8837 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8838 _mm256_maskz_sll_epi64 (__mmask8 __U
, __m256i __A
, __m128i __B
)
8840 return (__m256i
) __builtin_ia32_psllq256_mask ((__v4di
) __A
,
8843 _mm256_setzero_si256 (),
8847 extern __inline __m256
8848 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8849 _mm256_mask_permutexvar_ps (__m256 __W
, __mmask8 __U
, __m256i __X
,
8852 return (__m256
) __builtin_ia32_permvarsf256_mask ((__v8sf
) __Y
,
8858 extern __inline __m256
8859 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8860 _mm256_maskz_permutexvar_ps (__mmask8 __U
, __m256i __X
, __m256 __Y
)
8862 return (__m256
) __builtin_ia32_permvarsf256_mask ((__v8sf
) __Y
,
8865 _mm256_setzero_ps (),
8869 extern __inline __m256d
8870 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8871 _mm256_permutexvar_pd (__m256i __X
, __m256d __Y
)
8873 return (__m256d
) __builtin_ia32_permvardf256_mask ((__v4df
) __Y
,
8876 _mm256_setzero_pd (),
8880 extern __inline __m256d
8881 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8882 _mm256_mask_permutexvar_pd (__m256d __W
, __mmask8 __U
, __m256i __X
,
8885 return (__m256d
) __builtin_ia32_permvardf256_mask ((__v4df
) __Y
,
8891 extern __inline __m256d
8892 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8893 _mm256_maskz_permutexvar_pd (__mmask8 __U
, __m256i __X
, __m256d __Y
)
8895 return (__m256d
) __builtin_ia32_permvardf256_mask ((__v4df
) __Y
,
8898 _mm256_setzero_pd (),
8902 extern __inline __m256d
8903 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8904 _mm256_mask_permutevar_pd (__m256d __W
, __mmask8 __U
, __m256d __A
,
8907 return (__m256d
) __builtin_ia32_vpermilvarpd256_mask ((__v4df
) __A
,
8914 extern __inline __m256d
8915 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8916 _mm256_maskz_permutevar_pd (__mmask8 __U
, __m256d __A
, __m256i __C
)
8918 return (__m256d
) __builtin_ia32_vpermilvarpd256_mask ((__v4df
) __A
,
8921 _mm256_setzero_pd (),
8926 extern __inline __m256
8927 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8928 _mm256_mask_permutevar_ps (__m256 __W
, __mmask8 __U
, __m256 __A
,
8931 return (__m256
) __builtin_ia32_vpermilvarps256_mask ((__v8sf
) __A
,
8937 extern __inline __m256
8938 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8939 _mm256_maskz_permutevar_ps (__mmask8 __U
, __m256 __A
, __m256i __C
)
8941 return (__m256
) __builtin_ia32_vpermilvarps256_mask ((__v8sf
) __A
,
8944 _mm256_setzero_ps (),
8948 extern __inline __m128d
8949 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8950 _mm_mask_permutevar_pd (__m128d __W
, __mmask8 __U
, __m128d __A
,
8953 return (__m128d
) __builtin_ia32_vpermilvarpd_mask ((__v2df
) __A
,
8959 extern __inline __m128d
8960 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8961 _mm_maskz_permutevar_pd (__mmask8 __U
, __m128d __A
, __m128i __C
)
8963 return (__m128d
) __builtin_ia32_vpermilvarpd_mask ((__v2df
) __A
,
8970 extern __inline __m128
8971 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8972 _mm_mask_permutevar_ps (__m128 __W
, __mmask8 __U
, __m128 __A
,
8975 return (__m128
) __builtin_ia32_vpermilvarps_mask ((__v4sf
) __A
,
8981 extern __inline __m128
8982 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8983 _mm_maskz_permutevar_ps (__mmask8 __U
, __m128 __A
, __m128i __C
)
8985 return (__m128
) __builtin_ia32_vpermilvarps_mask ((__v4sf
) __A
,
8992 extern __inline __m256i
8993 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
8994 _mm256_maskz_mullo_epi32 (__mmask8 __M
, __m256i __A
, __m256i __B
)
8996 return (__m256i
) __builtin_ia32_pmulld256_mask ((__v8si
) __A
,
8999 _mm256_setzero_si256 (),
9003 extern __inline __m256i
9004 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9005 _mm256_maskz_permutexvar_epi64 (__mmask8 __M
, __m256i __X
, __m256i __Y
)
9007 return (__m256i
) __builtin_ia32_permvardi256_mask ((__v4di
) __Y
,
9010 _mm256_setzero_si256 (),
9014 extern __inline __m256i
9015 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9016 _mm256_mask_mullo_epi32 (__m256i __W
, __mmask8 __M
, __m256i __A
,
9019 return (__m256i
) __builtin_ia32_pmulld256_mask ((__v8si
) __A
,
9024 extern __inline __m128i
9025 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9026 _mm_maskz_mullo_epi32 (__mmask8 __M
, __m128i __A
, __m128i __B
)
9028 return (__m128i
) __builtin_ia32_pmulld128_mask ((__v4si
) __A
,
9031 _mm_setzero_si128 (),
9035 extern __inline __m128i
9036 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9037 _mm_mask_mullo_epi32 (__m128i __W
, __mmask16 __M
, __m128i __A
,
9040 return (__m128i
) __builtin_ia32_pmulld128_mask ((__v4si
) __A
,
9045 extern __inline __m256i
9046 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9047 _mm256_mask_mul_epi32 (__m256i __W
, __mmask8 __M
, __m256i __X
,
9050 return (__m256i
) __builtin_ia32_pmuldq256_mask ((__v8si
) __X
,
9055 extern __inline __m256i
9056 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9057 _mm256_maskz_mul_epi32 (__mmask8 __M
, __m256i __X
, __m256i __Y
)
9059 return (__m256i
) __builtin_ia32_pmuldq256_mask ((__v8si
) __X
,
9062 _mm256_setzero_si256 (),
9066 extern __inline __m128i
9067 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9068 _mm_mask_mul_epi32 (__m128i __W
, __mmask8 __M
, __m128i __X
,
9071 return (__m128i
) __builtin_ia32_pmuldq128_mask ((__v4si
) __X
,
9076 extern __inline __m128i
9077 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9078 _mm_maskz_mul_epi32 (__mmask8 __M
, __m128i __X
, __m128i __Y
)
9080 return (__m128i
) __builtin_ia32_pmuldq128_mask ((__v4si
) __X
,
9083 _mm_setzero_si128 (),
9087 extern __inline __m256i
9088 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9089 _mm256_mask_permutexvar_epi64 (__m256i __W
, __mmask8 __M
, __m256i __X
,
9092 return (__m256i
) __builtin_ia32_permvardi256_mask ((__v4di
) __Y
,
9098 extern __inline __m256i
9099 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9100 _mm256_mask_mul_epu32 (__m256i __W
, __mmask8 __M
, __m256i __X
,
9103 return (__m256i
) __builtin_ia32_pmuludq256_mask ((__v8si
) __X
,
9108 extern __inline __m256i
9109 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9110 _mm256_maskz_permutexvar_epi32 (__mmask8 __M
, __m256i __X
, __m256i __Y
)
9112 return (__m256i
) __builtin_ia32_permvarsi256_mask ((__v8si
) __Y
,
9115 _mm256_setzero_si256 (),
9119 extern __inline __m256i
9120 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9121 _mm256_maskz_mul_epu32 (__mmask8 __M
, __m256i __X
, __m256i __Y
)
9123 return (__m256i
) __builtin_ia32_pmuludq256_mask ((__v8si
) __X
,
9126 _mm256_setzero_si256 (),
9130 extern __inline __m128i
9131 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9132 _mm_mask_mul_epu32 (__m128i __W
, __mmask8 __M
, __m128i __X
,
9135 return (__m128i
) __builtin_ia32_pmuludq128_mask ((__v4si
) __X
,
9140 extern __inline __m128i
9141 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9142 _mm_maskz_mul_epu32 (__mmask8 __M
, __m128i __X
, __m128i __Y
)
9144 return (__m128i
) __builtin_ia32_pmuludq128_mask ((__v4si
) __X
,
9147 _mm_setzero_si128 (),
9151 extern __inline __m256i
9152 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9153 _mm256_mask_permutexvar_epi32 (__m256i __W
, __mmask8 __M
, __m256i __X
,
9156 return (__m256i
) __builtin_ia32_permvarsi256_mask ((__v8si
) __Y
,
9163 extern __inline __m256i
9164 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9165 _mm256_mask_permutex_epi64 (__m256i __W
, __mmask8 __M
,
9166 __m256i __X
, const int __I
)
9168 return (__m256i
) __builtin_ia32_permdi256_mask ((__v4di
) __X
,
9174 extern __inline __m256i
9175 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9176 _mm256_maskz_permutex_epi64 (__mmask8 __M
, __m256i __X
, const int __I
)
9178 return (__m256i
) __builtin_ia32_permdi256_mask ((__v4di
) __X
,
9181 _mm256_setzero_si256 (),
9185 extern __inline __m256d
9186 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9187 _mm256_mask_shuffle_pd (__m256d __W
, __mmask8 __U
, __m256d __A
,
9188 __m256d __B
, const int __imm
)
9190 return (__m256d
) __builtin_ia32_shufpd256_mask ((__v4df
) __A
,
9191 (__v4df
) __B
, __imm
,
9196 extern __inline __m256d
9197 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9198 _mm256_maskz_shuffle_pd (__mmask8 __U
, __m256d __A
, __m256d __B
,
9201 return (__m256d
) __builtin_ia32_shufpd256_mask ((__v4df
) __A
,
9202 (__v4df
) __B
, __imm
,
9204 _mm256_setzero_pd (),
9208 extern __inline __m128d
9209 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9210 _mm_mask_shuffle_pd (__m128d __W
, __mmask8 __U
, __m128d __A
,
9211 __m128d __B
, const int __imm
)
9213 return (__m128d
) __builtin_ia32_shufpd128_mask ((__v2df
) __A
,
9214 (__v2df
) __B
, __imm
,
9219 extern __inline __m128d
9220 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9221 _mm_maskz_shuffle_pd (__mmask8 __U
, __m128d __A
, __m128d __B
,
9224 return (__m128d
) __builtin_ia32_shufpd128_mask ((__v2df
) __A
,
9225 (__v2df
) __B
, __imm
,
9231 extern __inline __m256
9232 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9233 _mm256_mask_shuffle_ps (__m256 __W
, __mmask8 __U
, __m256 __A
,
9234 __m256 __B
, const int __imm
)
9236 return (__m256
) __builtin_ia32_shufps256_mask ((__v8sf
) __A
,
9237 (__v8sf
) __B
, __imm
,
9242 extern __inline __m256
9243 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9244 _mm256_maskz_shuffle_ps (__mmask8 __U
, __m256 __A
, __m256 __B
,
9247 return (__m256
) __builtin_ia32_shufps256_mask ((__v8sf
) __A
,
9248 (__v8sf
) __B
, __imm
,
9250 _mm256_setzero_ps (),
9254 extern __inline __m128
9255 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9256 _mm_mask_shuffle_ps (__m128 __W
, __mmask8 __U
, __m128 __A
, __m128 __B
,
9259 return (__m128
) __builtin_ia32_shufps128_mask ((__v4sf
) __A
,
9260 (__v4sf
) __B
, __imm
,
9265 extern __inline __m128
9266 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9267 _mm_maskz_shuffle_ps (__mmask8 __U
, __m128 __A
, __m128 __B
,
9270 return (__m128
) __builtin_ia32_shufps128_mask ((__v4sf
) __A
,
9271 (__v4sf
) __B
, __imm
,
9277 extern __inline __m256i
9278 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9279 _mm256_inserti32x4 (__m256i __A
, __m128i __B
, const int __imm
)
9281 return (__m256i
) __builtin_ia32_inserti32x4_256_mask ((__v8si
) __A
,
9285 _mm256_setzero_si256 (),
9289 extern __inline __m256i
9290 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9291 _mm256_mask_inserti32x4 (__m256i __W
, __mmask8 __U
, __m256i __A
,
9292 __m128i __B
, const int __imm
)
9294 return (__m256i
) __builtin_ia32_inserti32x4_256_mask ((__v8si
) __A
,
9302 extern __inline __m256i
9303 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9304 _mm256_maskz_inserti32x4 (__mmask8 __U
, __m256i __A
, __m128i __B
,
9307 return (__m256i
) __builtin_ia32_inserti32x4_256_mask ((__v8si
) __A
,
9311 _mm256_setzero_si256 (),
9316 extern __inline __m256
9317 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9318 _mm256_insertf32x4 (__m256 __A
, __m128 __B
, const int __imm
)
9320 return (__m256
) __builtin_ia32_insertf32x4_256_mask ((__v8sf
) __A
,
9324 _mm256_setzero_ps (),
9328 extern __inline __m256
9329 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9330 _mm256_mask_insertf32x4 (__m256 __W
, __mmask8 __U
, __m256 __A
,
9331 __m128 __B
, const int __imm
)
9333 return (__m256
) __builtin_ia32_insertf32x4_256_mask ((__v8sf
) __A
,
9340 extern __inline __m256
9341 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9342 _mm256_maskz_insertf32x4 (__mmask8 __U
, __m256 __A
, __m128 __B
,
9345 return (__m256
) __builtin_ia32_insertf32x4_256_mask ((__v8sf
) __A
,
9349 _mm256_setzero_ps (),
9353 extern __inline __m128i
9354 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9355 _mm256_extracti32x4_epi32 (__m256i __A
, const int __imm
)
9357 return (__m128i
) __builtin_ia32_extracti32x4_256_mask ((__v8si
) __A
,
9360 _mm_setzero_si128 (),
9364 extern __inline __m128i
9365 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9366 _mm256_mask_extracti32x4_epi32 (__m128i __W
, __mmask8 __U
, __m256i __A
,
9369 return (__m128i
) __builtin_ia32_extracti32x4_256_mask ((__v8si
) __A
,
9376 extern __inline __m128i
9377 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9378 _mm256_maskz_extracti32x4_epi32 (__mmask8 __U
, __m256i __A
,
9381 return (__m128i
) __builtin_ia32_extracti32x4_256_mask ((__v8si
) __A
,
9384 _mm_setzero_si128 (),
9389 extern __inline __m128
9390 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9391 _mm256_extractf32x4_ps (__m256 __A
, const int __imm
)
9393 return (__m128
) __builtin_ia32_extractf32x4_256_mask ((__v8sf
) __A
,
9400 extern __inline __m128
9401 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9402 _mm256_mask_extractf32x4_ps (__m128 __W
, __mmask8 __U
, __m256 __A
,
9405 return (__m128
) __builtin_ia32_extractf32x4_256_mask ((__v8sf
) __A
,
9412 extern __inline __m128
9413 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9414 _mm256_maskz_extractf32x4_ps (__mmask8 __U
, __m256 __A
,
9417 return (__m128
) __builtin_ia32_extractf32x4_256_mask ((__v8sf
) __A
,
9425 extern __inline __m256i
9426 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9427 _mm256_shuffle_i64x2 (__m256i __A
, __m256i __B
, const int __imm
)
9429 return (__m256i
) __builtin_ia32_shuf_i64x2_256_mask ((__v4di
) __A
,
9433 _mm256_setzero_si256 (),
9437 extern __inline __m256i
9438 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9439 _mm256_mask_shuffle_i64x2 (__m256i __W
, __mmask8 __U
, __m256i __A
,
9440 __m256i __B
, const int __imm
)
9442 return (__m256i
) __builtin_ia32_shuf_i64x2_256_mask ((__v4di
) __A
,
9449 extern __inline __m256i
9450 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9451 _mm256_maskz_shuffle_i64x2 (__mmask8 __U
, __m256i __A
, __m256i __B
,
9454 return (__m256i
) __builtin_ia32_shuf_i64x2_256_mask ((__v4di
) __A
,
9458 _mm256_setzero_si256 (),
9462 extern __inline __m256i
9463 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9464 _mm256_shuffle_i32x4 (__m256i __A
, __m256i __B
, const int __imm
)
9466 return (__m256i
) __builtin_ia32_shuf_i32x4_256_mask ((__v8si
) __A
,
9470 _mm256_setzero_si256 (),
9474 extern __inline __m256i
9475 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9476 _mm256_mask_shuffle_i32x4 (__m256i __W
, __mmask8 __U
, __m256i __A
,
9477 __m256i __B
, const int __imm
)
9479 return (__m256i
) __builtin_ia32_shuf_i32x4_256_mask ((__v8si
) __A
,
9486 extern __inline __m256i
9487 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9488 _mm256_maskz_shuffle_i32x4 (__mmask8 __U
, __m256i __A
, __m256i __B
,
9491 return (__m256i
) __builtin_ia32_shuf_i32x4_256_mask ((__v8si
) __A
,
9495 _mm256_setzero_si256 (),
9499 extern __inline __m256d
9500 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9501 _mm256_shuffle_f64x2 (__m256d __A
, __m256d __B
, const int __imm
)
9503 return (__m256d
) __builtin_ia32_shuf_f64x2_256_mask ((__v4df
) __A
,
9507 _mm256_setzero_pd (),
9511 extern __inline __m256d
9512 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9513 _mm256_mask_shuffle_f64x2 (__m256d __W
, __mmask8 __U
, __m256d __A
,
9514 __m256d __B
, const int __imm
)
9516 return (__m256d
) __builtin_ia32_shuf_f64x2_256_mask ((__v4df
) __A
,
9523 extern __inline __m256d
9524 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9525 _mm256_maskz_shuffle_f64x2 (__mmask8 __U
, __m256d __A
, __m256d __B
,
9528 return (__m256d
) __builtin_ia32_shuf_f64x2_256_mask ((__v4df
) __A
,
9532 _mm256_setzero_pd (),
9536 extern __inline __m256
9537 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9538 _mm256_shuffle_f32x4 (__m256 __A
, __m256 __B
, const int __imm
)
9540 return (__m256
) __builtin_ia32_shuf_f32x4_256_mask ((__v8sf
) __A
,
9544 _mm256_setzero_ps (),
9548 extern __inline __m256
9549 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9550 _mm256_mask_shuffle_f32x4 (__m256 __W
, __mmask8 __U
, __m256 __A
,
9551 __m256 __B
, const int __imm
)
9553 return (__m256
) __builtin_ia32_shuf_f32x4_256_mask ((__v8sf
) __A
,
9560 extern __inline __m256
9561 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9562 _mm256_maskz_shuffle_f32x4 (__mmask8 __U
, __m256 __A
, __m256 __B
,
9565 return (__m256
) __builtin_ia32_shuf_f32x4_256_mask ((__v8sf
) __A
,
9569 _mm256_setzero_ps (),
9573 extern __inline __m256d
9574 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9575 _mm256_fixupimm_pd (__m256d __A
, __m256d __B
, __m256i __C
,
9578 return (__m256d
) __builtin_ia32_fixupimmpd256_mask ((__v4df
) __A
,
9585 extern __inline __m256d
9586 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9587 _mm256_mask_fixupimm_pd (__m256d __A
, __mmask8 __U
, __m256d __B
,
9588 __m256i __C
, const int __imm
)
9590 return (__m256d
) __builtin_ia32_fixupimmpd256_mask ((__v4df
) __A
,
9597 extern __inline __m256d
9598 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9599 _mm256_maskz_fixupimm_pd (__mmask8 __U
, __m256d __A
, __m256d __B
,
9600 __m256i __C
, const int __imm
)
9602 return (__m256d
) __builtin_ia32_fixupimmpd256_maskz ((__v4df
) __A
,
9609 extern __inline __m256
9610 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9611 _mm256_fixupimm_ps (__m256 __A
, __m256 __B
, __m256i __C
,
9614 return (__m256
) __builtin_ia32_fixupimmps256_mask ((__v8sf
) __A
,
9621 extern __inline __m256
9622 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9623 _mm256_mask_fixupimm_ps (__m256 __A
, __mmask8 __U
, __m256 __B
,
9624 __m256i __C
, const int __imm
)
9626 return (__m256
) __builtin_ia32_fixupimmps256_mask ((__v8sf
) __A
,
9633 extern __inline __m256
9634 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9635 _mm256_maskz_fixupimm_ps (__mmask8 __U
, __m256 __A
, __m256 __B
,
9636 __m256i __C
, const int __imm
)
9638 return (__m256
) __builtin_ia32_fixupimmps256_maskz ((__v8sf
) __A
,
9645 extern __inline __m128d
9646 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9647 _mm_fixupimm_pd (__m128d __A
, __m128d __B
, __m128i __C
,
9650 return (__m128d
) __builtin_ia32_fixupimmpd128_mask ((__v2df
) __A
,
9657 extern __inline __m128d
9658 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9659 _mm_mask_fixupimm_pd (__m128d __A
, __mmask8 __U
, __m128d __B
,
9660 __m128i __C
, const int __imm
)
9662 return (__m128d
) __builtin_ia32_fixupimmpd128_mask ((__v2df
) __A
,
9669 extern __inline __m128d
9670 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9671 _mm_maskz_fixupimm_pd (__mmask8 __U
, __m128d __A
, __m128d __B
,
9672 __m128i __C
, const int __imm
)
9674 return (__m128d
) __builtin_ia32_fixupimmpd128_maskz ((__v2df
) __A
,
9681 extern __inline __m128
9682 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9683 _mm_fixupimm_ps (__m128 __A
, __m128 __B
, __m128i __C
, const int __imm
)
9685 return (__m128
) __builtin_ia32_fixupimmps128_mask ((__v4sf
) __A
,
9692 extern __inline __m128
9693 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9694 _mm_mask_fixupimm_ps (__m128 __A
, __mmask8 __U
, __m128 __B
,
9695 __m128i __C
, const int __imm
)
9697 return (__m128
) __builtin_ia32_fixupimmps128_mask ((__v4sf
) __A
,
9704 extern __inline __m128
9705 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9706 _mm_maskz_fixupimm_ps (__mmask8 __U
, __m128 __A
, __m128 __B
,
9707 __m128i __C
, const int __imm
)
9709 return (__m128
) __builtin_ia32_fixupimmps128_maskz ((__v4sf
) __A
,
9716 extern __inline __m256i
9717 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9718 _mm256_mask_srli_epi32 (__m256i __W
, __mmask8 __U
, __m256i __A
,
9721 return (__m256i
) __builtin_ia32_psrldi256_mask ((__v8si
) __A
, __imm
,
9726 extern __inline __m256i
9727 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9728 _mm256_maskz_srli_epi32 (__mmask8 __U
, __m256i __A
, const int __imm
)
9730 return (__m256i
) __builtin_ia32_psrldi256_mask ((__v8si
) __A
, __imm
,
9732 _mm256_setzero_si256 (),
9736 extern __inline __m128i
9737 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9738 _mm_mask_srli_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
,
9741 return (__m128i
) __builtin_ia32_psrldi128_mask ((__v4si
) __A
, __imm
,
9746 extern __inline __m128i
9747 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9748 _mm_maskz_srli_epi32 (__mmask8 __U
, __m128i __A
, const int __imm
)
9750 return (__m128i
) __builtin_ia32_psrldi128_mask ((__v4si
) __A
, __imm
,
9752 _mm_setzero_si128 (),
9756 extern __inline __m256i
9757 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9758 _mm256_mask_srli_epi64 (__m256i __W
, __mmask8 __U
, __m256i __A
,
9761 return (__m256i
) __builtin_ia32_psrlqi256_mask ((__v4di
) __A
, __imm
,
9766 extern __inline __m256i
9767 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9768 _mm256_maskz_srli_epi64 (__mmask8 __U
, __m256i __A
, const int __imm
)
9770 return (__m256i
) __builtin_ia32_psrlqi256_mask ((__v4di
) __A
, __imm
,
9772 _mm256_setzero_si256 (),
9776 extern __inline __m128i
9777 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9778 _mm_mask_srli_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
,
9781 return (__m128i
) __builtin_ia32_psrlqi128_mask ((__v2di
) __A
, __imm
,
9786 extern __inline __m128i
9787 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9788 _mm_maskz_srli_epi64 (__mmask8 __U
, __m128i __A
, const int __imm
)
9790 return (__m128i
) __builtin_ia32_psrlqi128_mask ((__v2di
) __A
, __imm
,
9792 _mm_setzero_si128 (),
9796 extern __inline __m256i
9797 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9798 _mm256_ternarylogic_epi64 (__m256i __A
, __m256i __B
, __m256i __C
,
9801 return (__m256i
) __builtin_ia32_pternlogq256_mask ((__v4di
) __A
,
9803 (__v4di
) __C
, __imm
,
9807 extern __inline __m256i
9808 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9809 _mm256_mask_ternarylogic_epi64 (__m256i __A
, __mmask8 __U
,
9810 __m256i __B
, __m256i __C
,
9813 return (__m256i
) __builtin_ia32_pternlogq256_mask ((__v4di
) __A
,
9815 (__v4di
) __C
, __imm
,
9819 extern __inline __m256i
9820 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9821 _mm256_maskz_ternarylogic_epi64 (__mmask8 __U
, __m256i __A
,
9822 __m256i __B
, __m256i __C
,
9825 return (__m256i
) __builtin_ia32_pternlogq256_maskz ((__v4di
) __A
,
9832 extern __inline __m256i
9833 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9834 _mm256_ternarylogic_epi32 (__m256i __A
, __m256i __B
, __m256i __C
,
9837 return (__m256i
) __builtin_ia32_pternlogd256_mask ((__v8si
) __A
,
9839 (__v8si
) __C
, __imm
,
9843 extern __inline __m256i
9844 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9845 _mm256_mask_ternarylogic_epi32 (__m256i __A
, __mmask8 __U
,
9846 __m256i __B
, __m256i __C
,
9849 return (__m256i
) __builtin_ia32_pternlogd256_mask ((__v8si
) __A
,
9851 (__v8si
) __C
, __imm
,
9855 extern __inline __m256i
9856 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9857 _mm256_maskz_ternarylogic_epi32 (__mmask8 __U
, __m256i __A
,
9858 __m256i __B
, __m256i __C
,
9861 return (__m256i
) __builtin_ia32_pternlogd256_maskz ((__v8si
) __A
,
9868 extern __inline __m128i
9869 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9870 _mm_ternarylogic_epi64 (__m128i __A
, __m128i __B
, __m128i __C
,
9873 return (__m128i
) __builtin_ia32_pternlogq128_mask ((__v2di
) __A
,
9875 (__v2di
) __C
, __imm
,
9879 extern __inline __m128i
9880 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9881 _mm_mask_ternarylogic_epi64 (__m128i __A
, __mmask8 __U
,
9882 __m128i __B
, __m128i __C
, const int __imm
)
9884 return (__m128i
) __builtin_ia32_pternlogq128_mask ((__v2di
) __A
,
9886 (__v2di
) __C
, __imm
,
9890 extern __inline __m128i
9891 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9892 _mm_maskz_ternarylogic_epi64 (__mmask8 __U
, __m128i __A
,
9893 __m128i __B
, __m128i __C
, const int __imm
)
9895 return (__m128i
) __builtin_ia32_pternlogq128_maskz ((__v2di
) __A
,
9902 extern __inline __m128i
9903 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9904 _mm_ternarylogic_epi32 (__m128i __A
, __m128i __B
, __m128i __C
,
9907 return (__m128i
) __builtin_ia32_pternlogd128_mask ((__v4si
) __A
,
9909 (__v4si
) __C
, __imm
,
9913 extern __inline __m128i
9914 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9915 _mm_mask_ternarylogic_epi32 (__m128i __A
, __mmask8 __U
,
9916 __m128i __B
, __m128i __C
, const int __imm
)
9918 return (__m128i
) __builtin_ia32_pternlogd128_mask ((__v4si
) __A
,
9920 (__v4si
) __C
, __imm
,
9924 extern __inline __m128i
9925 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9926 _mm_maskz_ternarylogic_epi32 (__mmask8 __U
, __m128i __A
,
9927 __m128i __B
, __m128i __C
, const int __imm
)
9929 return (__m128i
) __builtin_ia32_pternlogd128_maskz ((__v4si
) __A
,
9936 extern __inline __m256
9937 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9938 _mm256_roundscale_ps (__m256 __A
, const int __imm
)
9940 return (__m256
) __builtin_ia32_rndscaleps_256_mask ((__v8sf
) __A
,
9943 _mm256_setzero_ps (),
9947 extern __inline __m256
9948 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9949 _mm256_mask_roundscale_ps (__m256 __W
, __mmask8 __U
, __m256 __A
,
9952 return (__m256
) __builtin_ia32_rndscaleps_256_mask ((__v8sf
) __A
,
9958 extern __inline __m256
9959 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9960 _mm256_maskz_roundscale_ps (__mmask8 __U
, __m256 __A
, const int __imm
)
9962 return (__m256
) __builtin_ia32_rndscaleps_256_mask ((__v8sf
) __A
,
9965 _mm256_setzero_ps (),
9969 extern __inline __m256d
9970 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9971 _mm256_roundscale_pd (__m256d __A
, const int __imm
)
9973 return (__m256d
) __builtin_ia32_rndscalepd_256_mask ((__v4df
) __A
,
9976 _mm256_setzero_pd (),
9980 extern __inline __m256d
9981 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9982 _mm256_mask_roundscale_pd (__m256d __W
, __mmask8 __U
, __m256d __A
,
9985 return (__m256d
) __builtin_ia32_rndscalepd_256_mask ((__v4df
) __A
,
9991 extern __inline __m256d
9992 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
9993 _mm256_maskz_roundscale_pd (__mmask8 __U
, __m256d __A
, const int __imm
)
9995 return (__m256d
) __builtin_ia32_rndscalepd_256_mask ((__v4df
) __A
,
9998 _mm256_setzero_pd (),
10002 extern __inline __m128
10003 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10004 _mm_roundscale_ps (__m128 __A
, const int __imm
)
10006 return (__m128
) __builtin_ia32_rndscaleps_128_mask ((__v4sf
) __A
,
10013 extern __inline __m128
10014 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10015 _mm_mask_roundscale_ps (__m128 __W
, __mmask8 __U
, __m128 __A
,
10018 return (__m128
) __builtin_ia32_rndscaleps_128_mask ((__v4sf
) __A
,
10024 extern __inline __m128
10025 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10026 _mm_maskz_roundscale_ps (__mmask8 __U
, __m128 __A
, const int __imm
)
10028 return (__m128
) __builtin_ia32_rndscaleps_128_mask ((__v4sf
) __A
,
10035 extern __inline __m128d
10036 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10037 _mm_roundscale_pd (__m128d __A
, const int __imm
)
10039 return (__m128d
) __builtin_ia32_rndscalepd_128_mask ((__v2df
) __A
,
10046 extern __inline __m128d
10047 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10048 _mm_mask_roundscale_pd (__m128d __W
, __mmask8 __U
, __m128d __A
,
10051 return (__m128d
) __builtin_ia32_rndscalepd_128_mask ((__v2df
) __A
,
10057 extern __inline __m128d
10058 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10059 _mm_maskz_roundscale_pd (__mmask8 __U
, __m128d __A
, const int __imm
)
10061 return (__m128d
) __builtin_ia32_rndscalepd_128_mask ((__v2df
) __A
,
10068 extern __inline __m256
10069 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10070 _mm256_getmant_ps (__m256 __A
, _MM_MANTISSA_NORM_ENUM __B
,
10071 _MM_MANTISSA_SIGN_ENUM __C
)
10073 return (__m256
) __builtin_ia32_getmantps256_mask ((__v8sf
) __A
,
10076 _mm256_setzero_ps (),
10080 extern __inline __m256
10081 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10082 _mm256_mask_getmant_ps (__m256 __W
, __mmask8 __U
, __m256 __A
,
10083 _MM_MANTISSA_NORM_ENUM __B
,
10084 _MM_MANTISSA_SIGN_ENUM __C
)
10086 return (__m256
) __builtin_ia32_getmantps256_mask ((__v8sf
) __A
,
10092 extern __inline __m256
10093 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10094 _mm256_maskz_getmant_ps (__mmask8 __U
, __m256 __A
,
10095 _MM_MANTISSA_NORM_ENUM __B
,
10096 _MM_MANTISSA_SIGN_ENUM __C
)
10098 return (__m256
) __builtin_ia32_getmantps256_mask ((__v8sf
) __A
,
10101 _mm256_setzero_ps (),
10105 extern __inline __m128
10106 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10107 _mm_getmant_ps (__m128 __A
, _MM_MANTISSA_NORM_ENUM __B
,
10108 _MM_MANTISSA_SIGN_ENUM __C
)
10110 return (__m128
) __builtin_ia32_getmantps128_mask ((__v4sf
) __A
,
10117 extern __inline __m128
10118 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10119 _mm_mask_getmant_ps (__m128 __W
, __mmask8 __U
, __m128 __A
,
10120 _MM_MANTISSA_NORM_ENUM __B
,
10121 _MM_MANTISSA_SIGN_ENUM __C
)
10123 return (__m128
) __builtin_ia32_getmantps128_mask ((__v4sf
) __A
,
10129 extern __inline __m128
10130 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10131 _mm_maskz_getmant_ps (__mmask8 __U
, __m128 __A
,
10132 _MM_MANTISSA_NORM_ENUM __B
,
10133 _MM_MANTISSA_SIGN_ENUM __C
)
10135 return (__m128
) __builtin_ia32_getmantps128_mask ((__v4sf
) __A
,
10142 extern __inline __m256d
10143 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10144 _mm256_getmant_pd (__m256d __A
, _MM_MANTISSA_NORM_ENUM __B
,
10145 _MM_MANTISSA_SIGN_ENUM __C
)
10147 return (__m256d
) __builtin_ia32_getmantpd256_mask ((__v4df
) __A
,
10150 _mm256_setzero_pd (),
10154 extern __inline __m256d
10155 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10156 _mm256_mask_getmant_pd (__m256d __W
, __mmask8 __U
, __m256d __A
,
10157 _MM_MANTISSA_NORM_ENUM __B
,
10158 _MM_MANTISSA_SIGN_ENUM __C
)
10160 return (__m256d
) __builtin_ia32_getmantpd256_mask ((__v4df
) __A
,
10166 extern __inline __m256d
10167 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10168 _mm256_maskz_getmant_pd (__mmask8 __U
, __m256d __A
,
10169 _MM_MANTISSA_NORM_ENUM __B
,
10170 _MM_MANTISSA_SIGN_ENUM __C
)
10172 return (__m256d
) __builtin_ia32_getmantpd256_mask ((__v4df
) __A
,
10175 _mm256_setzero_pd (),
10179 extern __inline __m128d
10180 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10181 _mm_getmant_pd (__m128d __A
, _MM_MANTISSA_NORM_ENUM __B
,
10182 _MM_MANTISSA_SIGN_ENUM __C
)
10184 return (__m128d
) __builtin_ia32_getmantpd128_mask ((__v2df
) __A
,
10191 extern __inline __m128d
10192 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10193 _mm_mask_getmant_pd (__m128d __W
, __mmask8 __U
, __m128d __A
,
10194 _MM_MANTISSA_NORM_ENUM __B
,
10195 _MM_MANTISSA_SIGN_ENUM __C
)
10197 return (__m128d
) __builtin_ia32_getmantpd128_mask ((__v2df
) __A
,
10203 extern __inline __m128d
10204 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10205 _mm_maskz_getmant_pd (__mmask8 __U
, __m128d __A
,
10206 _MM_MANTISSA_NORM_ENUM __B
,
10207 _MM_MANTISSA_SIGN_ENUM __C
)
10209 return (__m128d
) __builtin_ia32_getmantpd128_mask ((__v2df
) __A
,
10216 extern __inline __m256
10217 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10218 _mm256_mmask_i32gather_ps (__m256 __v1_old
, __mmask8 __mask
,
10219 __m256i __index
, float const *__addr
,
10222 return (__m256
) __builtin_ia32_gather3siv8sf ((__v8sf
) __v1_old
,
10228 extern __inline __m128
10229 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10230 _mm_mmask_i32gather_ps (__m128 __v1_old
, __mmask8 __mask
,
10231 __m128i __index
, float const *__addr
,
10234 return (__m128
) __builtin_ia32_gather3siv4sf ((__v4sf
) __v1_old
,
10240 extern __inline __m256d
10241 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10242 _mm256_mmask_i32gather_pd (__m256d __v1_old
, __mmask8 __mask
,
10243 __m128i __index
, double const *__addr
,
10246 return (__m256d
) __builtin_ia32_gather3siv4df ((__v4df
) __v1_old
,
10252 extern __inline __m128d
10253 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10254 _mm_mmask_i32gather_pd (__m128d __v1_old
, __mmask8 __mask
,
10255 __m128i __index
, double const *__addr
,
10258 return (__m128d
) __builtin_ia32_gather3siv2df ((__v2df
) __v1_old
,
10264 extern __inline __m128
10265 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10266 _mm256_mmask_i64gather_ps (__m128 __v1_old
, __mmask8 __mask
,
10267 __m256i __index
, float const *__addr
,
10270 return (__m128
) __builtin_ia32_gather3div8sf ((__v4sf
) __v1_old
,
10276 extern __inline __m128
10277 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10278 _mm_mmask_i64gather_ps (__m128 __v1_old
, __mmask8 __mask
,
10279 __m128i __index
, float const *__addr
,
10282 return (__m128
) __builtin_ia32_gather3div4sf ((__v4sf
) __v1_old
,
10288 extern __inline __m256d
10289 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10290 _mm256_mmask_i64gather_pd (__m256d __v1_old
, __mmask8 __mask
,
10291 __m256i __index
, double const *__addr
,
10294 return (__m256d
) __builtin_ia32_gather3div4df ((__v4df
) __v1_old
,
10300 extern __inline __m128d
10301 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10302 _mm_mmask_i64gather_pd (__m128d __v1_old
, __mmask8 __mask
,
10303 __m128i __index
, double const *__addr
,
10306 return (__m128d
) __builtin_ia32_gather3div2df ((__v2df
) __v1_old
,
10312 extern __inline __m256i
10313 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10314 _mm256_mmask_i32gather_epi32 (__m256i __v1_old
, __mmask8 __mask
,
10315 __m256i __index
, int const *__addr
,
10318 return (__m256i
) __builtin_ia32_gather3siv8si ((__v8si
) __v1_old
,
10324 extern __inline __m128i
10325 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10326 _mm_mmask_i32gather_epi32 (__m128i __v1_old
, __mmask8 __mask
,
10327 __m128i __index
, int const *__addr
,
10330 return (__m128i
) __builtin_ia32_gather3siv4si ((__v4si
) __v1_old
,
10336 extern __inline __m256i
10337 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10338 _mm256_mmask_i32gather_epi64 (__m256i __v1_old
, __mmask8 __mask
,
10339 __m128i __index
, long long const *__addr
,
10342 return (__m256i
) __builtin_ia32_gather3siv4di ((__v4di
) __v1_old
,
10348 extern __inline __m128i
10349 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10350 _mm_mmask_i32gather_epi64 (__m128i __v1_old
, __mmask8 __mask
,
10351 __m128i __index
, long long const *__addr
,
10354 return (__m128i
) __builtin_ia32_gather3siv2di ((__v2di
) __v1_old
,
10360 extern __inline __m128i
10361 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10362 _mm256_mmask_i64gather_epi32 (__m128i __v1_old
, __mmask8 __mask
,
10363 __m256i __index
, int const *__addr
,
10366 return (__m128i
) __builtin_ia32_gather3div8si ((__v4si
) __v1_old
,
10372 extern __inline __m128i
10373 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10374 _mm_mmask_i64gather_epi32 (__m128i __v1_old
, __mmask8 __mask
,
10375 __m128i __index
, int const *__addr
,
10378 return (__m128i
) __builtin_ia32_gather3div4si ((__v4si
) __v1_old
,
10384 extern __inline __m256i
10385 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10386 _mm256_mmask_i64gather_epi64 (__m256i __v1_old
, __mmask8 __mask
,
10387 __m256i __index
, long long const *__addr
,
10390 return (__m256i
) __builtin_ia32_gather3div4di ((__v4di
) __v1_old
,
10396 extern __inline __m128i
10397 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10398 _mm_mmask_i64gather_epi64 (__m128i __v1_old
, __mmask8 __mask
,
10399 __m128i __index
, long long const *__addr
,
10402 return (__m128i
) __builtin_ia32_gather3div2di ((__v2di
) __v1_old
,
10408 extern __inline
void
10409 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10410 _mm256_i32scatter_ps (float *__addr
, __m256i __index
,
10411 __m256 __v1
, const int __scale
)
10413 __builtin_ia32_scattersiv8sf (__addr
, (__mmask8
) 0xFF,
10414 (__v8si
) __index
, (__v8sf
) __v1
,
10418 extern __inline
void
10419 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10420 _mm256_mask_i32scatter_ps (float *__addr
, __mmask8 __mask
,
10421 __m256i __index
, __m256 __v1
,
10424 __builtin_ia32_scattersiv8sf (__addr
, __mask
, (__v8si
) __index
,
10425 (__v8sf
) __v1
, __scale
);
10428 extern __inline
void
10429 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10430 _mm_i32scatter_ps (float *__addr
, __m128i __index
, __m128 __v1
,
10433 __builtin_ia32_scattersiv4sf (__addr
, (__mmask8
) 0xFF,
10434 (__v4si
) __index
, (__v4sf
) __v1
,
10438 extern __inline
void
10439 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10440 _mm_mask_i32scatter_ps (float *__addr
, __mmask8 __mask
,
10441 __m128i __index
, __m128 __v1
,
10444 __builtin_ia32_scattersiv4sf (__addr
, __mask
, (__v4si
) __index
,
10445 (__v4sf
) __v1
, __scale
);
10448 extern __inline
void
10449 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10450 _mm256_i32scatter_pd (double *__addr
, __m128i __index
,
10451 __m256d __v1
, const int __scale
)
10453 __builtin_ia32_scattersiv4df (__addr
, (__mmask8
) 0xFF,
10454 (__v4si
) __index
, (__v4df
) __v1
,
10458 extern __inline
void
10459 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10460 _mm256_mask_i32scatter_pd (double *__addr
, __mmask8 __mask
,
10461 __m128i __index
, __m256d __v1
,
10464 __builtin_ia32_scattersiv4df (__addr
, __mask
, (__v4si
) __index
,
10465 (__v4df
) __v1
, __scale
);
10468 extern __inline
void
10469 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10470 _mm_i32scatter_pd (double *__addr
, __m128i __index
,
10471 __m128d __v1
, const int __scale
)
10473 __builtin_ia32_scattersiv2df (__addr
, (__mmask8
) 0xFF,
10474 (__v4si
) __index
, (__v2df
) __v1
,
10478 extern __inline
void
10479 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10480 _mm_mask_i32scatter_pd (double *__addr
, __mmask8 __mask
,
10481 __m128i __index
, __m128d __v1
,
10484 __builtin_ia32_scattersiv2df (__addr
, __mask
, (__v4si
) __index
,
10485 (__v2df
) __v1
, __scale
);
10488 extern __inline
void
10489 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10490 _mm256_i64scatter_ps (float *__addr
, __m256i __index
,
10491 __m128 __v1
, const int __scale
)
10493 __builtin_ia32_scatterdiv8sf (__addr
, (__mmask8
) 0xFF,
10494 (__v4di
) __index
, (__v4sf
) __v1
,
10498 extern __inline
void
10499 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10500 _mm256_mask_i64scatter_ps (float *__addr
, __mmask8 __mask
,
10501 __m256i __index
, __m128 __v1
,
10504 __builtin_ia32_scatterdiv8sf (__addr
, __mask
, (__v4di
) __index
,
10505 (__v4sf
) __v1
, __scale
);
10508 extern __inline
void
10509 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10510 _mm_i64scatter_ps (float *__addr
, __m128i __index
, __m128 __v1
,
10513 __builtin_ia32_scatterdiv4sf (__addr
, (__mmask8
) 0xFF,
10514 (__v2di
) __index
, (__v4sf
) __v1
,
10518 extern __inline
void
10519 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10520 _mm_mask_i64scatter_ps (float *__addr
, __mmask8 __mask
,
10521 __m128i __index
, __m128 __v1
,
10524 __builtin_ia32_scatterdiv4sf (__addr
, __mask
, (__v2di
) __index
,
10525 (__v4sf
) __v1
, __scale
);
10528 extern __inline
void
10529 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10530 _mm256_i64scatter_pd (double *__addr
, __m256i __index
,
10531 __m256d __v1
, const int __scale
)
10533 __builtin_ia32_scatterdiv4df (__addr
, (__mmask8
) 0xFF,
10534 (__v4di
) __index
, (__v4df
) __v1
,
10538 extern __inline
void
10539 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10540 _mm256_mask_i64scatter_pd (double *__addr
, __mmask8 __mask
,
10541 __m256i __index
, __m256d __v1
,
10544 __builtin_ia32_scatterdiv4df (__addr
, __mask
, (__v4di
) __index
,
10545 (__v4df
) __v1
, __scale
);
10548 extern __inline
void
10549 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10550 _mm_i64scatter_pd (double *__addr
, __m128i __index
,
10551 __m128d __v1
, const int __scale
)
10553 __builtin_ia32_scatterdiv2df (__addr
, (__mmask8
) 0xFF,
10554 (__v2di
) __index
, (__v2df
) __v1
,
10558 extern __inline
void
10559 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10560 _mm_mask_i64scatter_pd (double *__addr
, __mmask8 __mask
,
10561 __m128i __index
, __m128d __v1
,
10564 __builtin_ia32_scatterdiv2df (__addr
, __mask
, (__v2di
) __index
,
10565 (__v2df
) __v1
, __scale
);
10568 extern __inline
void
10569 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10570 _mm256_i32scatter_epi32 (int *__addr
, __m256i __index
,
10571 __m256i __v1
, const int __scale
)
10573 __builtin_ia32_scattersiv8si (__addr
, (__mmask8
) 0xFF,
10574 (__v8si
) __index
, (__v8si
) __v1
,
10578 extern __inline
void
10579 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10580 _mm256_mask_i32scatter_epi32 (int *__addr
, __mmask8 __mask
,
10581 __m256i __index
, __m256i __v1
,
10584 __builtin_ia32_scattersiv8si (__addr
, __mask
, (__v8si
) __index
,
10585 (__v8si
) __v1
, __scale
);
10588 extern __inline
void
10589 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10590 _mm_i32scatter_epi32 (int *__addr
, __m128i __index
,
10591 __m128i __v1
, const int __scale
)
10593 __builtin_ia32_scattersiv4si (__addr
, (__mmask8
) 0xFF,
10594 (__v4si
) __index
, (__v4si
) __v1
,
10598 extern __inline
void
10599 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10600 _mm_mask_i32scatter_epi32 (int *__addr
, __mmask8 __mask
,
10601 __m128i __index
, __m128i __v1
,
10604 __builtin_ia32_scattersiv4si (__addr
, __mask
, (__v4si
) __index
,
10605 (__v4si
) __v1
, __scale
);
10608 extern __inline
void
10609 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10610 _mm256_i32scatter_epi64 (long long *__addr
, __m128i __index
,
10611 __m256i __v1
, const int __scale
)
10613 __builtin_ia32_scattersiv4di (__addr
, (__mmask8
) 0xFF,
10614 (__v4si
) __index
, (__v4di
) __v1
,
10618 extern __inline
void
10619 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10620 _mm256_mask_i32scatter_epi64 (long long *__addr
, __mmask8 __mask
,
10621 __m128i __index
, __m256i __v1
,
10624 __builtin_ia32_scattersiv4di (__addr
, __mask
, (__v4si
) __index
,
10625 (__v4di
) __v1
, __scale
);
10628 extern __inline
void
10629 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10630 _mm_i32scatter_epi64 (long long *__addr
, __m128i __index
,
10631 __m128i __v1
, const int __scale
)
10633 __builtin_ia32_scattersiv2di (__addr
, (__mmask8
) 0xFF,
10634 (__v4si
) __index
, (__v2di
) __v1
,
10638 extern __inline
void
10639 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10640 _mm_mask_i32scatter_epi64 (long long *__addr
, __mmask8 __mask
,
10641 __m128i __index
, __m128i __v1
,
10644 __builtin_ia32_scattersiv2di (__addr
, __mask
, (__v4si
) __index
,
10645 (__v2di
) __v1
, __scale
);
10648 extern __inline
void
10649 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10650 _mm256_i64scatter_epi32 (int *__addr
, __m256i __index
,
10651 __m128i __v1
, const int __scale
)
10653 __builtin_ia32_scatterdiv8si (__addr
, (__mmask8
) 0xFF,
10654 (__v4di
) __index
, (__v4si
) __v1
,
10658 extern __inline
void
10659 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10660 _mm256_mask_i64scatter_epi32 (int *__addr
, __mmask8 __mask
,
10661 __m256i __index
, __m128i __v1
,
10664 __builtin_ia32_scatterdiv8si (__addr
, __mask
, (__v4di
) __index
,
10665 (__v4si
) __v1
, __scale
);
10668 extern __inline
void
10669 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10670 _mm_i64scatter_epi32 (int *__addr
, __m128i __index
,
10671 __m128i __v1
, const int __scale
)
10673 __builtin_ia32_scatterdiv4si (__addr
, (__mmask8
) 0xFF,
10674 (__v2di
) __index
, (__v4si
) __v1
,
10678 extern __inline
void
10679 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10680 _mm_mask_i64scatter_epi32 (int *__addr
, __mmask8 __mask
,
10681 __m128i __index
, __m128i __v1
,
10684 __builtin_ia32_scatterdiv4si (__addr
, __mask
, (__v2di
) __index
,
10685 (__v4si
) __v1
, __scale
);
10688 extern __inline
void
10689 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10690 _mm256_i64scatter_epi64 (long long *__addr
, __m256i __index
,
10691 __m256i __v1
, const int __scale
)
10693 __builtin_ia32_scatterdiv4di (__addr
, (__mmask8
) 0xFF,
10694 (__v4di
) __index
, (__v4di
) __v1
,
10698 extern __inline
void
10699 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10700 _mm256_mask_i64scatter_epi64 (long long *__addr
, __mmask8 __mask
,
10701 __m256i __index
, __m256i __v1
,
10704 __builtin_ia32_scatterdiv4di (__addr
, __mask
, (__v4di
) __index
,
10705 (__v4di
) __v1
, __scale
);
10708 extern __inline
void
10709 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10710 _mm_i64scatter_epi64 (long long *__addr
, __m128i __index
,
10711 __m128i __v1
, const int __scale
)
10713 __builtin_ia32_scatterdiv2di (__addr
, (__mmask8
) 0xFF,
10714 (__v2di
) __index
, (__v2di
) __v1
,
10718 extern __inline
void
10719 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10720 _mm_mask_i64scatter_epi64 (long long *__addr
, __mmask8 __mask
,
10721 __m128i __index
, __m128i __v1
,
10724 __builtin_ia32_scatterdiv2di (__addr
, __mask
, (__v2di
) __index
,
10725 (__v2di
) __v1
, __scale
);
10728 extern __inline __m256i
10729 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10730 _mm256_mask_shuffle_epi32 (__m256i __W
, __mmask8 __U
, __m256i __A
,
10731 _MM_PERM_ENUM __mask
)
10733 return (__m256i
) __builtin_ia32_pshufd256_mask ((__v8si
) __A
, __mask
,
10738 extern __inline __m256i
10739 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10740 _mm256_maskz_shuffle_epi32 (__mmask8 __U
, __m256i __A
,
10741 _MM_PERM_ENUM __mask
)
10743 return (__m256i
) __builtin_ia32_pshufd256_mask ((__v8si
) __A
, __mask
,
10745 _mm256_setzero_si256 (),
10749 extern __inline __m128i
10750 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10751 _mm_mask_shuffle_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
,
10752 _MM_PERM_ENUM __mask
)
10754 return (__m128i
) __builtin_ia32_pshufd128_mask ((__v4si
) __A
, __mask
,
10759 extern __inline __m128i
10760 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10761 _mm_maskz_shuffle_epi32 (__mmask8 __U
, __m128i __A
,
10762 _MM_PERM_ENUM __mask
)
10764 return (__m128i
) __builtin_ia32_pshufd128_mask ((__v4si
) __A
, __mask
,
10766 _mm_setzero_si128 (),
10770 extern __inline __m256i
10771 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10772 _mm256_rol_epi32 (__m256i __A
, const int __B
)
10774 return (__m256i
) __builtin_ia32_prold256_mask ((__v8si
) __A
, __B
,
10776 _mm256_setzero_si256 (),
10780 extern __inline __m256i
10781 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10782 _mm256_mask_rol_epi32 (__m256i __W
, __mmask8 __U
, __m256i __A
,
10785 return (__m256i
) __builtin_ia32_prold256_mask ((__v8si
) __A
, __B
,
10790 extern __inline __m256i
10791 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10792 _mm256_maskz_rol_epi32 (__mmask8 __U
, __m256i __A
, const int __B
)
10794 return (__m256i
) __builtin_ia32_prold256_mask ((__v8si
) __A
, __B
,
10796 _mm256_setzero_si256 (),
10800 extern __inline __m128i
10801 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10802 _mm_rol_epi32 (__m128i __A
, const int __B
)
10804 return (__m128i
) __builtin_ia32_prold128_mask ((__v4si
) __A
, __B
,
10806 _mm_setzero_si128 (),
10810 extern __inline __m128i
10811 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10812 _mm_mask_rol_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
,
10815 return (__m128i
) __builtin_ia32_prold128_mask ((__v4si
) __A
, __B
,
10820 extern __inline __m128i
10821 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10822 _mm_maskz_rol_epi32 (__mmask8 __U
, __m128i __A
, const int __B
)
10824 return (__m128i
) __builtin_ia32_prold128_mask ((__v4si
) __A
, __B
,
10826 _mm_setzero_si128 (),
10830 extern __inline __m256i
10831 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10832 _mm256_ror_epi32 (__m256i __A
, const int __B
)
10834 return (__m256i
) __builtin_ia32_prord256_mask ((__v8si
) __A
, __B
,
10836 _mm256_setzero_si256 (),
10840 extern __inline __m256i
10841 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10842 _mm256_mask_ror_epi32 (__m256i __W
, __mmask8 __U
, __m256i __A
,
10845 return (__m256i
) __builtin_ia32_prord256_mask ((__v8si
) __A
, __B
,
10850 extern __inline __m256i
10851 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10852 _mm256_maskz_ror_epi32 (__mmask8 __U
, __m256i __A
, const int __B
)
10854 return (__m256i
) __builtin_ia32_prord256_mask ((__v8si
) __A
, __B
,
10856 _mm256_setzero_si256 (),
10860 extern __inline __m128i
10861 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10862 _mm_ror_epi32 (__m128i __A
, const int __B
)
10864 return (__m128i
) __builtin_ia32_prord128_mask ((__v4si
) __A
, __B
,
10866 _mm_setzero_si128 (),
10870 extern __inline __m128i
10871 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10872 _mm_mask_ror_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
,
10875 return (__m128i
) __builtin_ia32_prord128_mask ((__v4si
) __A
, __B
,
10880 extern __inline __m128i
10881 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10882 _mm_maskz_ror_epi32 (__mmask8 __U
, __m128i __A
, const int __B
)
10884 return (__m128i
) __builtin_ia32_prord128_mask ((__v4si
) __A
, __B
,
10886 _mm_setzero_si128 (),
10890 extern __inline __m256i
10891 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10892 _mm256_rol_epi64 (__m256i __A
, const int __B
)
10894 return (__m256i
) __builtin_ia32_prolq256_mask ((__v4di
) __A
, __B
,
10896 _mm256_setzero_si256 (),
10900 extern __inline __m256i
10901 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10902 _mm256_mask_rol_epi64 (__m256i __W
, __mmask8 __U
, __m256i __A
,
10905 return (__m256i
) __builtin_ia32_prolq256_mask ((__v4di
) __A
, __B
,
10910 extern __inline __m256i
10911 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10912 _mm256_maskz_rol_epi64 (__mmask8 __U
, __m256i __A
, const int __B
)
10914 return (__m256i
) __builtin_ia32_prolq256_mask ((__v4di
) __A
, __B
,
10916 _mm256_setzero_si256 (),
10920 extern __inline __m128i
10921 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10922 _mm_rol_epi64 (__m128i __A
, const int __B
)
10924 return (__m128i
) __builtin_ia32_prolq128_mask ((__v2di
) __A
, __B
,
10930 extern __inline __m128i
10931 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10932 _mm_mask_rol_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
,
10935 return (__m128i
) __builtin_ia32_prolq128_mask ((__v2di
) __A
, __B
,
10940 extern __inline __m128i
10941 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10942 _mm_maskz_rol_epi64 (__mmask8 __U
, __m128i __A
, const int __B
)
10944 return (__m128i
) __builtin_ia32_prolq128_mask ((__v2di
) __A
, __B
,
10950 extern __inline __m256i
10951 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10952 _mm256_ror_epi64 (__m256i __A
, const int __B
)
10954 return (__m256i
) __builtin_ia32_prorq256_mask ((__v4di
) __A
, __B
,
10956 _mm256_setzero_si256 (),
10960 extern __inline __m256i
10961 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10962 _mm256_mask_ror_epi64 (__m256i __W
, __mmask8 __U
, __m256i __A
,
10965 return (__m256i
) __builtin_ia32_prorq256_mask ((__v4di
) __A
, __B
,
10970 extern __inline __m256i
10971 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10972 _mm256_maskz_ror_epi64 (__mmask8 __U
, __m256i __A
, const int __B
)
10974 return (__m256i
) __builtin_ia32_prorq256_mask ((__v4di
) __A
, __B
,
10976 _mm256_setzero_si256 (),
10980 extern __inline __m128i
10981 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10982 _mm_ror_epi64 (__m128i __A
, const int __B
)
10984 return (__m128i
) __builtin_ia32_prorq128_mask ((__v2di
) __A
, __B
,
10990 extern __inline __m128i
10991 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
10992 _mm_mask_ror_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
,
10995 return (__m128i
) __builtin_ia32_prorq128_mask ((__v2di
) __A
, __B
,
11000 extern __inline __m128i
11001 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11002 _mm_maskz_ror_epi64 (__mmask8 __U
, __m128i __A
, const int __B
)
11004 return (__m128i
) __builtin_ia32_prorq128_mask ((__v2di
) __A
, __B
,
11010 extern __inline __m128i
11011 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11012 _mm_alignr_epi32 (__m128i __A
, __m128i __B
, const int __imm
)
11014 return (__m128i
) __builtin_ia32_alignd128_mask ((__v4si
) __A
,
11015 (__v4si
) __B
, __imm
,
11017 _mm_setzero_si128 (),
11021 extern __inline __m128i
11022 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11023 _mm_mask_alignr_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
,
11024 __m128i __B
, const int __imm
)
11026 return (__m128i
) __builtin_ia32_alignd128_mask ((__v4si
) __A
,
11027 (__v4si
) __B
, __imm
,
11032 extern __inline __m128i
11033 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11034 _mm_maskz_alignr_epi32 (__mmask8 __U
, __m128i __A
, __m128i __B
,
11037 return (__m128i
) __builtin_ia32_alignd128_mask ((__v4si
) __A
,
11038 (__v4si
) __B
, __imm
,
11040 _mm_setzero_si128 (),
11044 extern __inline __m128i
11045 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11046 _mm_alignr_epi64 (__m128i __A
, __m128i __B
, const int __imm
)
11048 return (__m128i
) __builtin_ia32_alignq128_mask ((__v2di
) __A
,
11049 (__v2di
) __B
, __imm
,
11055 extern __inline __m128i
11056 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11057 _mm_mask_alignr_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
,
11058 __m128i __B
, const int __imm
)
11060 return (__m128i
) __builtin_ia32_alignq128_mask ((__v2di
) __A
,
11061 (__v2di
) __B
, __imm
,
11066 extern __inline __m128i
11067 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11068 _mm_maskz_alignr_epi64 (__mmask8 __U
, __m128i __A
, __m128i __B
,
11071 return (__m128i
) __builtin_ia32_alignq128_mask ((__v2di
) __A
,
11072 (__v2di
) __B
, __imm
,
11078 extern __inline __m256i
11079 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11080 _mm256_alignr_epi32 (__m256i __A
, __m256i __B
, const int __imm
)
11082 return (__m256i
) __builtin_ia32_alignd256_mask ((__v8si
) __A
,
11083 (__v8si
) __B
, __imm
,
11085 _mm256_setzero_si256 (),
11089 extern __inline __m256i
11090 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11091 _mm256_mask_alignr_epi32 (__m256i __W
, __mmask8 __U
, __m256i __A
,
11092 __m256i __B
, const int __imm
)
11094 return (__m256i
) __builtin_ia32_alignd256_mask ((__v8si
) __A
,
11095 (__v8si
) __B
, __imm
,
11100 extern __inline __m256i
11101 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11102 _mm256_maskz_alignr_epi32 (__mmask8 __U
, __m256i __A
, __m256i __B
,
11105 return (__m256i
) __builtin_ia32_alignd256_mask ((__v8si
) __A
,
11106 (__v8si
) __B
, __imm
,
11108 _mm256_setzero_si256 (),
11112 extern __inline __m256i
11113 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11114 _mm256_alignr_epi64 (__m256i __A
, __m256i __B
, const int __imm
)
11116 return (__m256i
) __builtin_ia32_alignq256_mask ((__v4di
) __A
,
11117 (__v4di
) __B
, __imm
,
11119 _mm256_setzero_si256 (),
11123 extern __inline __m256i
11124 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11125 _mm256_mask_alignr_epi64 (__m256i __W
, __mmask8 __U
, __m256i __A
,
11126 __m256i __B
, const int __imm
)
11128 return (__m256i
) __builtin_ia32_alignq256_mask ((__v4di
) __A
,
11129 (__v4di
) __B
, __imm
,
11134 extern __inline __m256i
11135 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11136 _mm256_maskz_alignr_epi64 (__mmask8 __U
, __m256i __A
, __m256i __B
,
11139 return (__m256i
) __builtin_ia32_alignq256_mask ((__v4di
) __A
,
11140 (__v4di
) __B
, __imm
,
11142 _mm256_setzero_si256 (),
11146 extern __inline __m128i
11147 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11148 _mm_mask_cvtps_ph (__m128i __W
, __mmask8 __U
, __m128 __A
,
11151 return (__m128i
) __builtin_ia32_vcvtps2ph_mask ((__v4sf
) __A
, __I
,
11156 extern __inline __m128i
11157 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11158 _mm_maskz_cvtps_ph (__mmask8 __U
, __m128 __A
, const int __I
)
11160 return (__m128i
) __builtin_ia32_vcvtps2ph_mask ((__v4sf
) __A
, __I
,
11166 extern __inline __m128i
11167 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11168 _mm256_mask_cvtps_ph (__m128i __W
, __mmask8 __U
, __m256 __A
,
11171 return (__m128i
) __builtin_ia32_vcvtps2ph256_mask ((__v8sf
) __A
, __I
,
11176 extern __inline __m128i
11177 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11178 _mm256_maskz_cvtps_ph (__mmask8 __U
, __m256 __A
, const int __I
)
11180 return (__m128i
) __builtin_ia32_vcvtps2ph256_mask ((__v8sf
) __A
, __I
,
11186 extern __inline __m256i
11187 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11188 _mm256_mask_srai_epi32 (__m256i __W
, __mmask8 __U
, __m256i __A
,
11191 return (__m256i
) __builtin_ia32_psradi256_mask ((__v8si
) __A
, __imm
,
11196 extern __inline __m256i
11197 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11198 _mm256_maskz_srai_epi32 (__mmask8 __U
, __m256i __A
, const int __imm
)
11200 return (__m256i
) __builtin_ia32_psradi256_mask ((__v8si
) __A
, __imm
,
11202 _mm256_setzero_si256 (),
11206 extern __inline __m128i
11207 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11208 _mm_mask_srai_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
,
11211 return (__m128i
) __builtin_ia32_psradi128_mask ((__v4si
) __A
, __imm
,
11216 extern __inline __m128i
11217 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11218 _mm_maskz_srai_epi32 (__mmask8 __U
, __m128i __A
, const int __imm
)
11220 return (__m128i
) __builtin_ia32_psradi128_mask ((__v4si
) __A
, __imm
,
11222 _mm_setzero_si128 (),
11226 extern __inline __m256i
11227 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11228 _mm256_srai_epi64 (__m256i __A
, const int __imm
)
11230 return (__m256i
) __builtin_ia32_psraqi256_mask ((__v4di
) __A
, __imm
,
11232 _mm256_setzero_si256 (),
11236 extern __inline __m256i
11237 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11238 _mm256_mask_srai_epi64 (__m256i __W
, __mmask8 __U
, __m256i __A
,
11241 return (__m256i
) __builtin_ia32_psraqi256_mask ((__v4di
) __A
, __imm
,
11246 extern __inline __m256i
11247 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11248 _mm256_maskz_srai_epi64 (__mmask8 __U
, __m256i __A
, const int __imm
)
11250 return (__m256i
) __builtin_ia32_psraqi256_mask ((__v4di
) __A
, __imm
,
11252 _mm256_setzero_si256 (),
11256 extern __inline __m128i
11257 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11258 _mm_srai_epi64 (__m128i __A
, const int __imm
)
11260 return (__m128i
) __builtin_ia32_psraqi128_mask ((__v2di
) __A
, __imm
,
11266 extern __inline __m128i
11267 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11268 _mm_mask_srai_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
,
11271 return (__m128i
) __builtin_ia32_psraqi128_mask ((__v2di
) __A
, __imm
,
11276 extern __inline __m128i
11277 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11278 _mm_maskz_srai_epi64 (__mmask8 __U
, __m128i __A
, const int __imm
)
11280 return (__m128i
) __builtin_ia32_psraqi128_mask ((__v2di
) __A
, __imm
,
11282 _mm_setzero_si128 (),
11286 extern __inline __m128i
11287 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11288 _mm_mask_slli_epi32 (__m128i __W
, __mmask8 __U
, __m128i __A
, int __B
)
11290 return (__m128i
) __builtin_ia32_pslldi128_mask ((__v4si
) __A
, __B
,
11295 extern __inline __m128i
11296 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11297 _mm_maskz_slli_epi32 (__mmask8 __U
, __m128i __A
, int __B
)
11299 return (__m128i
) __builtin_ia32_pslldi128_mask ((__v4si
) __A
, __B
,
11301 _mm_setzero_si128 (),
11305 extern __inline __m128i
11306 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11307 _mm_mask_slli_epi64 (__m128i __W
, __mmask8 __U
, __m128i __A
, int __B
)
11309 return (__m128i
) __builtin_ia32_psllqi128_mask ((__v2di
) __A
, __B
,
11314 extern __inline __m128i
11315 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11316 _mm_maskz_slli_epi64 (__mmask8 __U
, __m128i __A
, int __B
)
11318 return (__m128i
) __builtin_ia32_psllqi128_mask ((__v2di
) __A
, __B
,
11324 extern __inline __m256i
11325 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11326 _mm256_mask_slli_epi32 (__m256i __W
, __mmask8 __U
, __m256i __A
,
11329 return (__m256i
) __builtin_ia32_pslldi256_mask ((__v8si
) __A
, __B
,
11334 extern __inline __m256i
11335 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11336 _mm256_maskz_slli_epi32 (__mmask8 __U
, __m256i __A
, int __B
)
11338 return (__m256i
) __builtin_ia32_pslldi256_mask ((__v8si
) __A
, __B
,
11340 _mm256_setzero_si256 (),
11344 extern __inline __m256i
11345 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11346 _mm256_mask_slli_epi64 (__m256i __W
, __mmask8 __U
, __m256i __A
,
11349 return (__m256i
) __builtin_ia32_psllqi256_mask ((__v4di
) __A
, __B
,
11354 extern __inline __m256i
11355 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11356 _mm256_maskz_slli_epi64 (__mmask8 __U
, __m256i __A
, int __B
)
11358 return (__m256i
) __builtin_ia32_psllqi256_mask ((__v4di
) __A
, __B
,
11360 _mm256_setzero_si256 (),
11364 extern __inline __m256d
11365 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11366 _mm256_mask_permutex_pd (__m256d __W
, __mmask8 __U
, __m256d __X
,
11369 return (__m256d
) __builtin_ia32_permdf256_mask ((__v4df
) __X
, __imm
,
11374 extern __inline __m256d
11375 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11376 _mm256_maskz_permutex_pd (__mmask8 __U
, __m256d __X
, const int __imm
)
11378 return (__m256d
) __builtin_ia32_permdf256_mask ((__v4df
) __X
, __imm
,
11380 _mm256_setzero_pd (),
11384 extern __inline __m256d
11385 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11386 _mm256_mask_permute_pd (__m256d __W
, __mmask8 __U
, __m256d __X
,
11389 return (__m256d
) __builtin_ia32_vpermilpd256_mask ((__v4df
) __X
, __C
,
11394 extern __inline __m256d
11395 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11396 _mm256_maskz_permute_pd (__mmask8 __U
, __m256d __X
, const int __C
)
11398 return (__m256d
) __builtin_ia32_vpermilpd256_mask ((__v4df
) __X
, __C
,
11400 _mm256_setzero_pd (),
11404 extern __inline __m128d
11405 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11406 _mm_mask_permute_pd (__m128d __W
, __mmask8 __U
, __m128d __X
,
11409 return (__m128d
) __builtin_ia32_vpermilpd_mask ((__v2df
) __X
, __C
,
11414 extern __inline __m128d
11415 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11416 _mm_maskz_permute_pd (__mmask8 __U
, __m128d __X
, const int __C
)
11418 return (__m128d
) __builtin_ia32_vpermilpd_mask ((__v2df
) __X
, __C
,
11424 extern __inline __m256
11425 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11426 _mm256_mask_permute_ps (__m256 __W
, __mmask8 __U
, __m256 __X
,
11429 return (__m256
) __builtin_ia32_vpermilps256_mask ((__v8sf
) __X
, __C
,
11434 extern __inline __m256
11435 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11436 _mm256_maskz_permute_ps (__mmask8 __U
, __m256 __X
, const int __C
)
11438 return (__m256
) __builtin_ia32_vpermilps256_mask ((__v8sf
) __X
, __C
,
11440 _mm256_setzero_ps (),
11444 extern __inline __m128
11445 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11446 _mm_mask_permute_ps (__m128 __W
, __mmask8 __U
, __m128 __X
,
11449 return (__m128
) __builtin_ia32_vpermilps_mask ((__v4sf
) __X
, __C
,
11454 extern __inline __m128
11455 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11456 _mm_maskz_permute_ps (__mmask8 __U
, __m128 __X
, const int __C
)
11458 return (__m128
) __builtin_ia32_vpermilps_mask ((__v4sf
) __X
, __C
,
11464 extern __inline __m256d
11465 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11466 _mm256_mask_blend_pd (__mmask8 __U
, __m256d __A
, __m256d __W
)
11468 return (__m256d
) __builtin_ia32_blendmpd_256_mask ((__v4df
) __A
,
11473 extern __inline __m256
11474 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11475 _mm256_mask_blend_ps (__mmask8 __U
, __m256 __A
, __m256 __W
)
11477 return (__m256
) __builtin_ia32_blendmps_256_mask ((__v8sf
) __A
,
11482 extern __inline __m256i
11483 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11484 _mm256_mask_blend_epi64 (__mmask8 __U
, __m256i __A
, __m256i __W
)
11486 return (__m256i
) __builtin_ia32_blendmq_256_mask ((__v4di
) __A
,
11491 extern __inline __m256i
11492 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11493 _mm256_mask_blend_epi32 (__mmask8 __U
, __m256i __A
, __m256i __W
)
11495 return (__m256i
) __builtin_ia32_blendmd_256_mask ((__v8si
) __A
,
11500 extern __inline __m128d
11501 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11502 _mm_mask_blend_pd (__mmask8 __U
, __m128d __A
, __m128d __W
)
11504 return (__m128d
) __builtin_ia32_blendmpd_128_mask ((__v2df
) __A
,
11509 extern __inline __m128
11510 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11511 _mm_mask_blend_ps (__mmask8 __U
, __m128 __A
, __m128 __W
)
11513 return (__m128
) __builtin_ia32_blendmps_128_mask ((__v4sf
) __A
,
11518 extern __inline __m128i
11519 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11520 _mm_mask_blend_epi64 (__mmask8 __U
, __m128i __A
, __m128i __W
)
11522 return (__m128i
) __builtin_ia32_blendmq_128_mask ((__v2di
) __A
,
11527 extern __inline __m128i
11528 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11529 _mm_mask_blend_epi32 (__mmask8 __U
, __m128i __A
, __m128i __W
)
11531 return (__m128i
) __builtin_ia32_blendmd_128_mask ((__v4si
) __A
,
11536 extern __inline __mmask8
11537 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11538 _mm256_cmp_epi64_mask (__m256i __X
, __m256i __Y
, const int __P
)
11540 return (__mmask8
) __builtin_ia32_cmpq256_mask ((__v4di
) __X
,
11545 extern __inline __mmask8
11546 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11547 _mm256_cmp_epi32_mask (__m256i __X
, __m256i __Y
, const int __P
)
11549 return (__mmask8
) __builtin_ia32_cmpd256_mask ((__v8si
) __X
,
11554 extern __inline __mmask8
11555 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11556 _mm256_cmp_epu64_mask (__m256i __X
, __m256i __Y
, const int __P
)
11558 return (__mmask8
) __builtin_ia32_ucmpq256_mask ((__v4di
) __X
,
11563 extern __inline __mmask8
11564 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11565 _mm256_cmp_epu32_mask (__m256i __X
, __m256i __Y
, const int __P
)
11567 return (__mmask8
) __builtin_ia32_ucmpd256_mask ((__v8si
) __X
,
11572 extern __inline __mmask8
11573 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11574 _mm256_cmp_pd_mask (__m256d __X
, __m256d __Y
, const int __P
)
11576 return (__mmask8
) __builtin_ia32_cmppd256_mask ((__v4df
) __X
,
11581 extern __inline __mmask8
11582 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11583 _mm256_cmp_ps_mask (__m256 __X
, __m256 __Y
, const int __P
)
11585 return (__mmask8
) __builtin_ia32_cmpps256_mask ((__v8sf
) __X
,
11590 extern __inline __mmask8
11591 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11592 _mm256_mask_cmp_epi64_mask (__mmask8 __U
, __m256i __X
, __m256i __Y
,
11595 return (__mmask8
) __builtin_ia32_cmpq256_mask ((__v4di
) __X
,
11600 extern __inline __mmask8
11601 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11602 _mm256_mask_cmp_epi32_mask (__mmask8 __U
, __m256i __X
, __m256i __Y
,
11605 return (__mmask8
) __builtin_ia32_cmpd256_mask ((__v8si
) __X
,
11610 extern __inline __mmask8
11611 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11612 _mm256_mask_cmp_epu64_mask (__mmask8 __U
, __m256i __X
, __m256i __Y
,
11615 return (__mmask8
) __builtin_ia32_ucmpq256_mask ((__v4di
) __X
,
11620 extern __inline __mmask8
11621 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11622 _mm256_mask_cmp_epu32_mask (__mmask8 __U
, __m256i __X
, __m256i __Y
,
11625 return (__mmask8
) __builtin_ia32_ucmpd256_mask ((__v8si
) __X
,
11630 extern __inline __mmask8
11631 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11632 _mm256_mask_cmp_pd_mask (__mmask8 __U
, __m256d __X
, __m256d __Y
,
11635 return (__mmask8
) __builtin_ia32_cmppd256_mask ((__v4df
) __X
,
11640 extern __inline __mmask8
11641 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11642 _mm256_mask_cmp_ps_mask (__mmask8 __U
, __m256 __X
, __m256 __Y
,
11645 return (__mmask8
) __builtin_ia32_cmpps256_mask ((__v8sf
) __X
,
11650 extern __inline __mmask8
11651 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11652 _mm_cmp_epi64_mask (__m128i __X
, __m128i __Y
, const int __P
)
11654 return (__mmask8
) __builtin_ia32_cmpq128_mask ((__v2di
) __X
,
11659 extern __inline __mmask8
11660 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11661 _mm_cmp_epi32_mask (__m128i __X
, __m128i __Y
, const int __P
)
11663 return (__mmask8
) __builtin_ia32_cmpd128_mask ((__v4si
) __X
,
11668 extern __inline __mmask8
11669 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11670 _mm_cmp_epu64_mask (__m128i __X
, __m128i __Y
, const int __P
)
11672 return (__mmask8
) __builtin_ia32_ucmpq128_mask ((__v2di
) __X
,
11677 extern __inline __mmask8
11678 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11679 _mm_cmp_epu32_mask (__m128i __X
, __m128i __Y
, const int __P
)
11681 return (__mmask8
) __builtin_ia32_ucmpd128_mask ((__v4si
) __X
,
11686 extern __inline __mmask8
11687 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11688 _mm_cmp_pd_mask (__m128d __X
, __m128d __Y
, const int __P
)
11690 return (__mmask8
) __builtin_ia32_cmppd128_mask ((__v2df
) __X
,
11695 extern __inline __mmask8
11696 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11697 _mm_cmp_ps_mask (__m128 __X
, __m128 __Y
, const int __P
)
11699 return (__mmask8
) __builtin_ia32_cmpps128_mask ((__v4sf
) __X
,
11704 extern __inline __mmask8
11705 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11706 _mm_mask_cmp_epi64_mask (__mmask8 __U
, __m128i __X
, __m128i __Y
,
11709 return (__mmask8
) __builtin_ia32_cmpq128_mask ((__v2di
) __X
,
11714 extern __inline __mmask8
11715 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11716 _mm_mask_cmp_epi32_mask (__mmask8 __U
, __m128i __X
, __m128i __Y
,
11719 return (__mmask8
) __builtin_ia32_cmpd128_mask ((__v4si
) __X
,
11724 extern __inline __mmask8
11725 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11726 _mm_mask_cmp_epu64_mask (__mmask8 __U
, __m128i __X
, __m128i __Y
,
11729 return (__mmask8
) __builtin_ia32_ucmpq128_mask ((__v2di
) __X
,
11734 extern __inline __mmask8
11735 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11736 _mm_mask_cmp_epu32_mask (__mmask8 __U
, __m128i __X
, __m128i __Y
,
11739 return (__mmask8
) __builtin_ia32_ucmpd128_mask ((__v4si
) __X
,
11744 extern __inline __mmask8
11745 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11746 _mm_mask_cmp_pd_mask (__mmask8 __U
, __m128d __X
, __m128d __Y
,
11749 return (__mmask8
) __builtin_ia32_cmppd128_mask ((__v2df
) __X
,
11754 extern __inline __mmask8
11755 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11756 _mm_mask_cmp_ps_mask (__mmask8 __U
, __m128 __X
, __m128 __Y
,
11759 return (__mmask8
) __builtin_ia32_cmpps128_mask ((__v4sf
) __X
,
11764 extern __inline __m256d
11765 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11766 _mm256_permutex_pd (__m256d __X
, const int __M
)
11768 return (__m256d
) __builtin_ia32_permdf256_mask ((__v4df
) __X
, __M
,
11770 _mm256_undefined_pd (),
11774 extern __inline __mmask8
11775 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11776 _mm256_mask_cmpneq_epu32_mask (__mmask8 __M
, __m256i __X
, __m256i __Y
)
11778 return (__mmask8
) __builtin_ia32_ucmpd256_mask ((__v8si
) __X
,
11783 extern __inline __mmask8
11784 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11785 _mm256_cmpneq_epu32_mask (__m256i __X
, __m256i __Y
)
11787 return (__mmask8
) __builtin_ia32_ucmpd256_mask ((__v8si
) __X
,
11792 extern __inline __mmask8
11793 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11794 _mm256_mask_cmplt_epu32_mask (__mmask8 __M
, __m256i __X
, __m256i __Y
)
11796 return (__mmask8
) __builtin_ia32_ucmpd256_mask ((__v8si
) __X
,
11801 extern __inline __mmask8
11802 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11803 _mm256_cmplt_epu32_mask (__m256i __X
, __m256i __Y
)
11805 return (__mmask8
) __builtin_ia32_ucmpd256_mask ((__v8si
) __X
,
11810 extern __inline __mmask8
11811 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11812 _mm256_mask_cmpge_epu32_mask (__mmask8 __M
, __m256i __X
, __m256i __Y
)
11814 return (__mmask8
) __builtin_ia32_ucmpd256_mask ((__v8si
) __X
,
11819 extern __inline __mmask8
11820 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11821 _mm256_cmpge_epu32_mask (__m256i __X
, __m256i __Y
)
11823 return (__mmask8
) __builtin_ia32_ucmpd256_mask ((__v8si
) __X
,
11828 extern __inline __mmask8
11829 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11830 _mm256_mask_cmple_epu32_mask (__mmask8 __M
, __m256i __X
, __m256i __Y
)
11832 return (__mmask8
) __builtin_ia32_ucmpd256_mask ((__v8si
) __X
,
11837 extern __inline __mmask8
11838 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11839 _mm256_cmple_epu32_mask (__m256i __X
, __m256i __Y
)
11841 return (__mmask8
) __builtin_ia32_ucmpd256_mask ((__v8si
) __X
,
11846 extern __inline __mmask8
11847 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11848 _mm256_mask_cmpneq_epu64_mask (__mmask8 __M
, __m256i __X
, __m256i __Y
)
11850 return (__mmask8
) __builtin_ia32_ucmpq256_mask ((__v4di
) __X
,
11855 extern __inline __mmask8
11856 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11857 _mm256_cmpneq_epu64_mask (__m256i __X
, __m256i __Y
)
11859 return (__mmask8
) __builtin_ia32_ucmpq256_mask ((__v4di
) __X
,
11864 extern __inline __mmask8
11865 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11866 _mm256_mask_cmplt_epu64_mask (__mmask8 __M
, __m256i __X
, __m256i __Y
)
11868 return (__mmask8
) __builtin_ia32_ucmpq256_mask ((__v4di
) __X
,
11873 extern __inline __mmask8
11874 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11875 _mm256_cmplt_epu64_mask (__m256i __X
, __m256i __Y
)
11877 return (__mmask8
) __builtin_ia32_ucmpq256_mask ((__v4di
) __X
,
11882 extern __inline __mmask8
11883 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11884 _mm256_mask_cmpge_epu64_mask (__mmask8 __M
, __m256i __X
, __m256i __Y
)
11886 return (__mmask8
) __builtin_ia32_ucmpq256_mask ((__v4di
) __X
,
11891 extern __inline __mmask8
11892 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11893 _mm256_cmpge_epu64_mask (__m256i __X
, __m256i __Y
)
11895 return (__mmask8
) __builtin_ia32_ucmpq256_mask ((__v4di
) __X
,
11900 extern __inline __mmask8
11901 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11902 _mm256_mask_cmple_epu64_mask (__mmask8 __M
, __m256i __X
, __m256i __Y
)
11904 return (__mmask8
) __builtin_ia32_ucmpq256_mask ((__v4di
) __X
,
11909 extern __inline __mmask8
11910 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11911 _mm256_cmple_epu64_mask (__m256i __X
, __m256i __Y
)
11913 return (__mmask8
) __builtin_ia32_ucmpq256_mask ((__v4di
) __X
,
11918 extern __inline __mmask8
11919 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11920 _mm256_mask_cmpneq_epi32_mask (__mmask8 __M
, __m256i __X
, __m256i __Y
)
11922 return (__mmask8
) __builtin_ia32_cmpd256_mask ((__v8si
) __X
,
11927 extern __inline __mmask8
11928 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11929 _mm256_cmpneq_epi32_mask (__m256i __X
, __m256i __Y
)
11931 return (__mmask8
) __builtin_ia32_cmpd256_mask ((__v8si
) __X
,
11936 extern __inline __mmask8
11937 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11938 _mm256_mask_cmplt_epi32_mask (__mmask8 __M
, __m256i __X
, __m256i __Y
)
11940 return (__mmask8
) __builtin_ia32_cmpd256_mask ((__v8si
) __X
,
11945 extern __inline __mmask8
11946 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11947 _mm256_cmplt_epi32_mask (__m256i __X
, __m256i __Y
)
11949 return (__mmask8
) __builtin_ia32_cmpd256_mask ((__v8si
) __X
,
11954 extern __inline __mmask8
11955 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11956 _mm256_mask_cmpge_epi32_mask (__mmask8 __M
, __m256i __X
, __m256i __Y
)
11958 return (__mmask8
) __builtin_ia32_cmpd256_mask ((__v8si
) __X
,
11963 extern __inline __mmask8
11964 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11965 _mm256_cmpge_epi32_mask (__m256i __X
, __m256i __Y
)
11967 return (__mmask8
) __builtin_ia32_cmpd256_mask ((__v8si
) __X
,
11972 extern __inline __mmask8
11973 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11974 _mm256_mask_cmple_epi32_mask (__mmask8 __M
, __m256i __X
, __m256i __Y
)
11976 return (__mmask8
) __builtin_ia32_cmpd256_mask ((__v8si
) __X
,
11981 extern __inline __mmask8
11982 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11983 _mm256_cmple_epi32_mask (__m256i __X
, __m256i __Y
)
11985 return (__mmask8
) __builtin_ia32_cmpd256_mask ((__v8si
) __X
,
11990 extern __inline __mmask8
11991 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
11992 _mm256_mask_cmpneq_epi64_mask (__mmask8 __M
, __m256i __X
, __m256i __Y
)
11994 return (__mmask8
) __builtin_ia32_cmpq256_mask ((__v4di
) __X
,
11999 extern __inline __mmask8
12000 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12001 _mm256_cmpneq_epi64_mask (__m256i __X
, __m256i __Y
)
12003 return (__mmask8
) __builtin_ia32_cmpq256_mask ((__v4di
) __X
,
12008 extern __inline __mmask8
12009 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12010 _mm256_mask_cmplt_epi64_mask (__mmask8 __M
, __m256i __X
, __m256i __Y
)
12012 return (__mmask8
) __builtin_ia32_cmpq256_mask ((__v4di
) __X
,
12017 extern __inline __mmask8
12018 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12019 _mm256_cmplt_epi64_mask (__m256i __X
, __m256i __Y
)
12021 return (__mmask8
) __builtin_ia32_cmpq256_mask ((__v4di
) __X
,
12026 extern __inline __mmask8
12027 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12028 _mm256_mask_cmpge_epi64_mask (__mmask8 __M
, __m256i __X
, __m256i __Y
)
12030 return (__mmask8
) __builtin_ia32_cmpq256_mask ((__v4di
) __X
,
12035 extern __inline __mmask8
12036 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12037 _mm256_cmpge_epi64_mask (__m256i __X
, __m256i __Y
)
12039 return (__mmask8
) __builtin_ia32_cmpq256_mask ((__v4di
) __X
,
12044 extern __inline __mmask8
12045 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12046 _mm256_mask_cmple_epi64_mask (__mmask8 __M
, __m256i __X
, __m256i __Y
)
12048 return (__mmask8
) __builtin_ia32_cmpq256_mask ((__v4di
) __X
,
12053 extern __inline __mmask8
12054 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12055 _mm256_cmple_epi64_mask (__m256i __X
, __m256i __Y
)
12057 return (__mmask8
) __builtin_ia32_cmpq256_mask ((__v4di
) __X
,
12062 extern __inline __mmask8
12063 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12064 _mm_mask_cmpneq_epu32_mask (__mmask8 __M
, __m128i __X
, __m128i __Y
)
12066 return (__mmask8
) __builtin_ia32_ucmpd128_mask ((__v4si
) __X
,
12071 extern __inline __mmask8
12072 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12073 _mm_cmpneq_epu32_mask (__m128i __X
, __m128i __Y
)
12075 return (__mmask8
) __builtin_ia32_ucmpd128_mask ((__v4si
) __X
,
12080 extern __inline __mmask8
12081 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12082 _mm_mask_cmplt_epu32_mask (__mmask8 __M
, __m128i __X
, __m128i __Y
)
12084 return (__mmask8
) __builtin_ia32_ucmpd128_mask ((__v4si
) __X
,
12089 extern __inline __mmask8
12090 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12091 _mm_cmplt_epu32_mask (__m128i __X
, __m128i __Y
)
12093 return (__mmask8
) __builtin_ia32_ucmpd128_mask ((__v4si
) __X
,
12098 extern __inline __mmask8
12099 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12100 _mm_mask_cmpge_epu32_mask (__mmask8 __M
, __m128i __X
, __m128i __Y
)
12102 return (__mmask8
) __builtin_ia32_ucmpd128_mask ((__v4si
) __X
,
12107 extern __inline __mmask8
12108 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12109 _mm_cmpge_epu32_mask (__m128i __X
, __m128i __Y
)
12111 return (__mmask8
) __builtin_ia32_ucmpd128_mask ((__v4si
) __X
,
12116 extern __inline __mmask8
12117 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12118 _mm_mask_cmple_epu32_mask (__mmask8 __M
, __m128i __X
, __m128i __Y
)
12120 return (__mmask8
) __builtin_ia32_ucmpd128_mask ((__v4si
) __X
,
12125 extern __inline __mmask8
12126 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12127 _mm_cmple_epu32_mask (__m128i __X
, __m128i __Y
)
12129 return (__mmask8
) __builtin_ia32_ucmpd128_mask ((__v4si
) __X
,
12134 extern __inline __mmask8
12135 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12136 _mm_mask_cmpneq_epu64_mask (__mmask8 __M
, __m128i __X
, __m128i __Y
)
12138 return (__mmask8
) __builtin_ia32_ucmpq128_mask ((__v2di
) __X
,
12143 extern __inline __mmask8
12144 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12145 _mm_cmpneq_epu64_mask (__m128i __X
, __m128i __Y
)
12147 return (__mmask8
) __builtin_ia32_ucmpq128_mask ((__v2di
) __X
,
12152 extern __inline __mmask8
12153 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12154 _mm_mask_cmplt_epu64_mask (__mmask8 __M
, __m128i __X
, __m128i __Y
)
12156 return (__mmask8
) __builtin_ia32_ucmpq128_mask ((__v2di
) __X
,
12161 extern __inline __mmask8
12162 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12163 _mm_cmplt_epu64_mask (__m128i __X
, __m128i __Y
)
12165 return (__mmask8
) __builtin_ia32_ucmpq128_mask ((__v2di
) __X
,
12170 extern __inline __mmask8
12171 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12172 _mm_mask_cmpge_epu64_mask (__mmask8 __M
, __m128i __X
, __m128i __Y
)
12174 return (__mmask8
) __builtin_ia32_ucmpq128_mask ((__v2di
) __X
,
12179 extern __inline __mmask8
12180 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12181 _mm_cmpge_epu64_mask (__m128i __X
, __m128i __Y
)
12183 return (__mmask8
) __builtin_ia32_ucmpq128_mask ((__v2di
) __X
,
12188 extern __inline __mmask8
12189 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12190 _mm_mask_cmple_epu64_mask (__mmask8 __M
, __m128i __X
, __m128i __Y
)
12192 return (__mmask8
) __builtin_ia32_ucmpq128_mask ((__v2di
) __X
,
12197 extern __inline __mmask8
12198 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12199 _mm_cmple_epu64_mask (__m128i __X
, __m128i __Y
)
12201 return (__mmask8
) __builtin_ia32_ucmpq128_mask ((__v2di
) __X
,
12206 extern __inline __mmask8
12207 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12208 _mm_mask_cmpneq_epi32_mask (__mmask8 __M
, __m128i __X
, __m128i __Y
)
12210 return (__mmask8
) __builtin_ia32_cmpd128_mask ((__v4si
) __X
,
12215 extern __inline __mmask8
12216 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12217 _mm_cmpneq_epi32_mask (__m128i __X
, __m128i __Y
)
12219 return (__mmask8
) __builtin_ia32_cmpd128_mask ((__v4si
) __X
,
12224 extern __inline __mmask8
12225 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12226 _mm_mask_cmplt_epi32_mask (__mmask8 __M
, __m128i __X
, __m128i __Y
)
12228 return (__mmask8
) __builtin_ia32_cmpd128_mask ((__v4si
) __X
,
12233 extern __inline __mmask8
12234 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12235 _mm_cmplt_epi32_mask (__m128i __X
, __m128i __Y
)
12237 return (__mmask8
) __builtin_ia32_cmpd128_mask ((__v4si
) __X
,
12242 extern __inline __mmask8
12243 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12244 _mm_mask_cmpge_epi32_mask (__mmask8 __M
, __m128i __X
, __m128i __Y
)
12246 return (__mmask8
) __builtin_ia32_cmpd128_mask ((__v4si
) __X
,
12251 extern __inline __mmask8
12252 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12253 _mm_cmpge_epi32_mask (__m128i __X
, __m128i __Y
)
12255 return (__mmask8
) __builtin_ia32_cmpd128_mask ((__v4si
) __X
,
12260 extern __inline __mmask8
12261 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12262 _mm_mask_cmple_epi32_mask (__mmask8 __M
, __m128i __X
, __m128i __Y
)
12264 return (__mmask8
) __builtin_ia32_cmpd128_mask ((__v4si
) __X
,
12269 extern __inline __mmask8
12270 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12271 _mm_cmple_epi32_mask (__m128i __X
, __m128i __Y
)
12273 return (__mmask8
) __builtin_ia32_cmpd128_mask ((__v4si
) __X
,
12278 extern __inline __mmask8
12279 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12280 _mm_mask_cmpneq_epi64_mask (__mmask8 __M
, __m128i __X
, __m128i __Y
)
12282 return (__mmask8
) __builtin_ia32_cmpq128_mask ((__v2di
) __X
,
12287 extern __inline __mmask8
12288 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12289 _mm_cmpneq_epi64_mask (__m128i __X
, __m128i __Y
)
12291 return (__mmask8
) __builtin_ia32_cmpq128_mask ((__v2di
) __X
,
12296 extern __inline __mmask8
12297 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12298 _mm_mask_cmplt_epi64_mask (__mmask8 __M
, __m128i __X
, __m128i __Y
)
12300 return (__mmask8
) __builtin_ia32_cmpq128_mask ((__v2di
) __X
,
12305 extern __inline __mmask8
12306 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12307 _mm_cmplt_epi64_mask (__m128i __X
, __m128i __Y
)
12309 return (__mmask8
) __builtin_ia32_cmpq128_mask ((__v2di
) __X
,
12314 extern __inline __mmask8
12315 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12316 _mm_mask_cmpge_epi64_mask (__mmask8 __M
, __m128i __X
, __m128i __Y
)
12318 return (__mmask8
) __builtin_ia32_cmpq128_mask ((__v2di
) __X
,
12323 extern __inline __mmask8
12324 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12325 _mm_cmpge_epi64_mask (__m128i __X
, __m128i __Y
)
12327 return (__mmask8
) __builtin_ia32_cmpq128_mask ((__v2di
) __X
,
12332 extern __inline __mmask8
12333 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12334 _mm_mask_cmple_epi64_mask (__mmask8 __M
, __m128i __X
, __m128i __Y
)
12336 return (__mmask8
) __builtin_ia32_cmpq128_mask ((__v2di
) __X
,
12341 extern __inline __mmask8
12342 __attribute__ ((__gnu_inline__
, __always_inline__
, __artificial__
))
12343 _mm_cmple_epi64_mask (__m128i __X
, __m128i __Y
)
12345 return (__mmask8
) __builtin_ia32_cmpq128_mask ((__v2di
) __X
,
12351 #define _mm256_permutex_pd(X, M) \
12352 ((__m256d) __builtin_ia32_permdf256_mask ((__v4df)(__m256d)(X), (int)(M), \
12353 (__v4df)(__m256d)_mm256_undefined_pd(),\
12356 #define _mm256_maskz_permutex_epi64(M, X, I) \
12357 ((__m256i) __builtin_ia32_permdi256_mask ((__v4di)(__m256i)(X), \
12359 (__v4di)(__m256i) \
12360 (_mm256_setzero_si256()),\
12363 #define _mm256_mask_permutex_epi64(W, M, X, I) \
12364 ((__m256i) __builtin_ia32_permdi256_mask ((__v4di)(__m256i)(X), \
12366 (__v4di)(__m256i)(W), \
12369 #define _mm256_insertf32x4(X, Y, C) \
12370 ((__m256) __builtin_ia32_insertf32x4_256_mask ((__v8sf)(__m256) (X), \
12371 (__v4sf)(__m128) (Y), (int) (C), \
12372 (__v8sf)(__m256)_mm256_setzero_ps(), \
12375 #define _mm256_mask_insertf32x4(W, U, X, Y, C) \
12376 ((__m256) __builtin_ia32_insertf32x4_256_mask ((__v8sf)(__m256) (X), \
12377 (__v4sf)(__m128) (Y), (int) (C), \
12378 (__v8sf)(__m256)(W), \
12381 #define _mm256_maskz_insertf32x4(U, X, Y, C) \
12382 ((__m256) __builtin_ia32_insertf32x4_256_mask ((__v8sf)(__m256) (X), \
12383 (__v4sf)(__m128) (Y), (int) (C), \
12384 (__v8sf)(__m256)_mm256_setzero_ps(), \
12387 #define _mm256_inserti32x4(X, Y, C) \
12388 ((__m256i) __builtin_ia32_inserti32x4_256_mask ((__v8si)(__m256i) (X),\
12389 (__v4si)(__m128i) (Y), (int) (C), \
12390 (__v8si)(__m256i)_mm256_setzero_si256(), \
12393 #define _mm256_mask_inserti32x4(W, U, X, Y, C) \
12394 ((__m256i) __builtin_ia32_inserti32x4_256_mask ((__v8si)(__m256i) (X),\
12395 (__v4si)(__m128i) (Y), (int) (C), \
12396 (__v8si)(__m256i)(W), \
12399 #define _mm256_maskz_inserti32x4(U, X, Y, C) \
12400 ((__m256i) __builtin_ia32_inserti32x4_256_mask ((__v8si)(__m256i) (X),\
12401 (__v4si)(__m128i) (Y), (int) (C), \
12402 (__v8si)(__m256i)_mm256_setzero_si256(), \
12405 #define _mm256_extractf32x4_ps(X, C) \
12406 ((__m128) __builtin_ia32_extractf32x4_256_mask ((__v8sf)(__m256) (X), \
12408 (__v4sf)(__m128)_mm_setzero_ps(), \
12411 #define _mm256_mask_extractf32x4_ps(W, U, X, C) \
12412 ((__m128) __builtin_ia32_extractf32x4_256_mask ((__v8sf)(__m256) (X), \
12414 (__v4sf)(__m128)(W), \
12417 #define _mm256_maskz_extractf32x4_ps(U, X, C) \
12418 ((__m128) __builtin_ia32_extractf32x4_256_mask ((__v8sf)(__m256) (X), \
12420 (__v4sf)(__m128)_mm_setzero_ps(), \
/* Unmasked form.  Expands to a call of
   __builtin_ia32_extracti32x4_256_mask with, in order: X cast to
   __v8si, C cast to int, _mm_setzero_si128 () cast to __v4si, and the
   constant (__mmask8)-1.  The call result is cast to __m128i.
   NOTE(review): C is presumably required to be a compile-time constant,
   which would explain the macro form -- confirm against the builtin.  */
#define _mm256_extracti32x4_epi32(X, C)                                 \
  ((__m128i) __builtin_ia32_extracti32x4_256_mask (                     \
     (__v8si)(__m256i) (X),                                             \
     (int) (C),                                                         \
     (__v4si)(__m128i)_mm_setzero_si128 (),                             \
     (__mmask8)-1))
/* Masked form taking caller-supplied W and U.  Expands to a call of
   __builtin_ia32_extracti32x4_256_mask with, in order: X cast to
   __v8si, C cast to int, W cast to __v4si, and U cast to __mmask8.
   The call result is cast to __m128i.
   NOTE(review): W is presumably the value kept in lanes whose bit in U
   is clear -- confirm against the builtin's documentation.  */
#define _mm256_mask_extracti32x4_epi32(W, U, X, C)                      \
  ((__m128i) __builtin_ia32_extracti32x4_256_mask (                     \
     (__v8si)(__m256i) (X),                                             \
     (int) (C),                                                         \
     (__v4si)(__m128i)(W),                                              \
     (__mmask8)(U)))
/* Masked form with a zero third operand.  Expands to a call of
   __builtin_ia32_extracti32x4_256_mask with, in order: X cast to
   __v8si, C cast to int, _mm_setzero_si128 () cast to __v4si, and U
   cast to __mmask8.  The call result is cast to __m128i.
   NOTE(review): lanes whose bit in U is clear are presumably zeroed --
   confirm against the builtin's documentation.  */
#define _mm256_maskz_extracti32x4_epi32(U, X, C)                        \
  ((__m128i) __builtin_ia32_extracti32x4_256_mask (                     \
     (__v8si)(__m256i) (X),                                             \
     (int) (C),                                                         \
     (__v4si)(__m128i)_mm_setzero_si128 (),                             \
     (__mmask8)(U)))
12435 #define _mm256_shuffle_i64x2(X, Y, C) \
12436 ((__m256i) __builtin_ia32_shuf_i64x2_256_mask ((__v4di)(__m256i)(X), \
12437 (__v4di)(__m256i)(Y), (int)(C), \
12438 (__v4di)(__m256i)_mm256_setzero_si256 (), \
12441 #define _mm256_mask_shuffle_i64x2(W, U, X, Y, C) \
12442 ((__m256i) __builtin_ia32_shuf_i64x2_256_mask ((__v4di)(__m256i)(X), \
12443 (__v4di)(__m256i)(Y), (int)(C), \
12444 (__v4di)(__m256i)(W),\
12447 #define _mm256_maskz_shuffle_i64x2(U, X, Y, C) \
12448 ((__m256i) __builtin_ia32_shuf_i64x2_256_mask ((__v4di)(__m256i)(X), \
12449 (__v4di)(__m256i)(Y), (int)(C), \
12450 (__v4di)(__m256i)_mm256_setzero_si256 (), \
12453 #define _mm256_shuffle_i32x4(X, Y, C) \
12454 ((__m256i) __builtin_ia32_shuf_i32x4_256_mask ((__v8si)(__m256i)(X), \
12455 (__v8si)(__m256i)(Y), (int)(C), \
12456 (__v8si)(__m256i)_mm256_setzero_si256(), \
12459 #define _mm256_mask_shuffle_i32x4(W, U, X, Y, C) \
12460 ((__m256i) __builtin_ia32_shuf_i32x4_256_mask ((__v8si)(__m256i)(X), \
12461 (__v8si)(__m256i)(Y), (int)(C), \
12462 (__v8si)(__m256i)(W), \
12465 #define _mm256_maskz_shuffle_i32x4(U, X, Y, C) \
12466 ((__m256i) __builtin_ia32_shuf_i32x4_256_mask ((__v8si)(__m256i)(X), \
12467 (__v8si)(__m256i)(Y), (int)(C), \
12468 (__v8si)(__m256i)_mm256_setzero_si256(), \
12471 #define _mm256_shuffle_f64x2(X, Y, C) \
12472 ((__m256d) __builtin_ia32_shuf_f64x2_256_mask ((__v4df)(__m256d)(X), \
12473 (__v4df)(__m256d)(Y), (int)(C), \
12474 (__v4df)(__m256d)_mm256_setzero_pd(), \
12477 #define _mm256_mask_shuffle_f64x2(W, U, X, Y, C) \
12478 ((__m256d) __builtin_ia32_shuf_f64x2_256_mask ((__v4df)(__m256d)(X), \
12479 (__v4df)(__m256d)(Y), (int)(C), \
12480 (__v4df)(__m256d)(W), \
12483 #define _mm256_maskz_shuffle_f64x2(U, X, Y, C) \
12484 ((__m256d) __builtin_ia32_shuf_f64x2_256_mask ((__v4df)(__m256d)(X), \
12485 (__v4df)(__m256d)(Y), (int)(C), \
12486 (__v4df)(__m256d)_mm256_setzero_pd(), \
12489 #define _mm256_shuffle_f32x4(X, Y, C) \
12490 ((__m256) __builtin_ia32_shuf_f32x4_256_mask ((__v8sf)(__m256)(X), \
12491 (__v8sf)(__m256)(Y), (int)(C), \
12492 (__v8sf)(__m256)_mm256_setzero_ps(), \
12495 #define _mm256_mask_shuffle_f32x4(W, U, X, Y, C) \
12496 ((__m256) __builtin_ia32_shuf_f32x4_256_mask ((__v8sf)(__m256)(X), \
12497 (__v8sf)(__m256)(Y), (int)(C), \
12498 (__v8sf)(__m256)(W), \
12501 #define _mm256_maskz_shuffle_f32x4(U, X, Y, C) \
12502 ((__m256) __builtin_ia32_shuf_f32x4_256_mask ((__v8sf)(__m256)(X), \
12503 (__v8sf)(__m256)(Y), (int)(C), \
12504 (__v8sf)(__m256)_mm256_setzero_ps(), \
12507 #define _mm256_mask_shuffle_pd(W, U, A, B, C) \
12508 ((__m256d)__builtin_ia32_shufpd256_mask ((__v4df)(__m256d)(A), \
12509 (__v4df)(__m256d)(B), (int)(C), \
12510 (__v4df)(__m256d)(W), \
12513 #define _mm256_maskz_shuffle_pd(U, A, B, C) \
12514 ((__m256d)__builtin_ia32_shufpd256_mask ((__v4df)(__m256d)(A), \
12515 (__v4df)(__m256d)(B), (int)(C), \
12516 (__v4df)(__m256d)_mm256_setzero_pd(),\
12519 #define _mm_mask_shuffle_pd(W, U, A, B, C) \
12520 ((__m128d)__builtin_ia32_shufpd128_mask ((__v2df)(__m128d)(A), \
12521 (__v2df)(__m128d)(B), (int)(C), \
12522 (__v2df)(__m128d)(W), \
12525 #define _mm_maskz_shuffle_pd(U, A, B, C) \
12526 ((__m128d)__builtin_ia32_shufpd128_mask ((__v2df)(__m128d)(A), \
12527 (__v2df)(__m128d)(B), (int)(C), \
12528 (__v2df)(__m128d)_mm_setzero_pd(), \
12531 #define _mm256_mask_shuffle_ps(W, U, A, B, C) \
12532 ((__m256) __builtin_ia32_shufps256_mask ((__v8sf)(__m256)(A), \
12533 (__v8sf)(__m256)(B), (int)(C), \
12534 (__v8sf)(__m256)(W), \
12537 #define _mm256_maskz_shuffle_ps(U, A, B, C) \
12538 ((__m256) __builtin_ia32_shufps256_mask ((__v8sf)(__m256)(A), \
12539 (__v8sf)(__m256)(B), (int)(C), \
12540 (__v8sf)(__m256)_mm256_setzero_ps(), \
12543 #define _mm_mask_shuffle_ps(W, U, A, B, C) \
12544 ((__m128) __builtin_ia32_shufps128_mask ((__v4sf)(__m128)(A), \
12545 (__v4sf)(__m128)(B), (int)(C), \
12546 (__v4sf)(__m128)(W), \
12549 #define _mm_maskz_shuffle_ps(U, A, B, C) \
12550 ((__m128) __builtin_ia32_shufps128_mask ((__v4sf)(__m128)(A), \
12551 (__v4sf)(__m128)(B), (int)(C), \
12552 (__v4sf)(__m128)_mm_setzero_ps(), \
12555 #define _mm256_fixupimm_pd(X, Y, Z, C) \
12556 ((__m256d)__builtin_ia32_fixupimmpd256_mask ((__v4df)(__m256d)(X), \
12557 (__v4df)(__m256d)(Y), \
12558 (__v4di)(__m256i)(Z), (int)(C), \
12561 #define _mm256_mask_fixupimm_pd(X, U, Y, Z, C) \
12562 ((__m256d)__builtin_ia32_fixupimmpd256_mask ((__v4df)(__m256d)(X), \
12563 (__v4df)(__m256d)(Y), \
12564 (__v4di)(__m256i)(Z), (int)(C), \
12567 #define _mm256_maskz_fixupimm_pd(U, X, Y, Z, C) \
12568 ((__m256d)__builtin_ia32_fixupimmpd256_maskz ((__v4df)(__m256d)(X), \
12569 (__v4df)(__m256d)(Y), \
12570 (__v4di)(__m256i)(Z), (int)(C),\
12573 #define _mm256_fixupimm_ps(X, Y, Z, C) \
12574 ((__m256)__builtin_ia32_fixupimmps256_mask ((__v8sf)(__m256)(X), \
12575 (__v8sf)(__m256)(Y), \
12576 (__v8si)(__m256i)(Z), (int)(C), \
12580 #define _mm256_mask_fixupimm_ps(X, U, Y, Z, C) \
12581 ((__m256)__builtin_ia32_fixupimmps256_mask ((__v8sf)(__m256)(X), \
12582 (__v8sf)(__m256)(Y), \
12583 (__v8si)(__m256i)(Z), (int)(C), \
12586 #define _mm256_maskz_fixupimm_ps(U, X, Y, Z, C) \
12587 ((__m256)__builtin_ia32_fixupimmps256_maskz ((__v8sf)(__m256)(X), \
12588 (__v8sf)(__m256)(Y), \
12589 (__v8si)(__m256i)(Z), (int)(C),\
12592 #define _mm_fixupimm_pd(X, Y, Z, C) \
12593 ((__m128d)__builtin_ia32_fixupimmpd128_mask ((__v2df)(__m128d)(X), \
12594 (__v2df)(__m128d)(Y), \
12595 (__v2di)(__m128i)(Z), (int)(C), \
12599 #define _mm_mask_fixupimm_pd(X, U, Y, Z, C) \
12600 ((__m128d)__builtin_ia32_fixupimmpd128_mask ((__v2df)(__m128d)(X), \
12601 (__v2df)(__m128d)(Y), \
12602 (__v2di)(__m128i)(Z), (int)(C), \
12605 #define _mm_maskz_fixupimm_pd(U, X, Y, Z, C) \
12606 ((__m128d)__builtin_ia32_fixupimmpd128_maskz ((__v2df)(__m128d)(X), \
12607 (__v2df)(__m128d)(Y), \
12608 (__v2di)(__m128i)(Z), (int)(C),\
12611 #define _mm_fixupimm_ps(X, Y, Z, C) \
12612 ((__m128)__builtin_ia32_fixupimmps128_mask ((__v4sf)(__m128)(X), \
12613 (__v4sf)(__m128)(Y), \
12614 (__v4si)(__m128i)(Z), (int)(C), \
12617 #define _mm_mask_fixupimm_ps(X, U, Y, Z, C) \
12618 ((__m128)__builtin_ia32_fixupimmps128_mask ((__v4sf)(__m128)(X), \
12619 (__v4sf)(__m128)(Y), \
12620 (__v4si)(__m128i)(Z), (int)(C),\
12623 #define _mm_maskz_fixupimm_ps(U, X, Y, Z, C) \
12624 ((__m128)__builtin_ia32_fixupimmps128_maskz ((__v4sf)(__m128)(X), \
12625 (__v4sf)(__m128)(Y), \
12626 (__v4si)(__m128i)(Z), (int)(C),\
/* Macro forms of the masked srli intrinsics (shift count given as an
   immediate).  Operand order handed to each builtin: source A, count B
   cast to int, third operand (W for the mask forms, a zero vector for
   the maskz forms), then U cast to __mmask8.  */

/* 32-bit elements: __builtin_ia32_psrldi256_mask / psrldi128_mask.  */
#define _mm256_mask_srli_epi32(W, U, A, B) \
  ((__m256i) __builtin_ia32_psrldi256_mask ( \
     (__v8si)(__m256i)(A), (int)(B), \
     (__v8si)(__m256i)(W), (__mmask8)(U)))

#define _mm256_maskz_srli_epi32(U, A, B) \
  ((__m256i) __builtin_ia32_psrldi256_mask ( \
     (__v8si)(__m256i)(A), (int)(B), \
     (__v8si)_mm256_setzero_si256(), (__mmask8)(U)))

#define _mm_mask_srli_epi32(W, U, A, B) \
  ((__m128i) __builtin_ia32_psrldi128_mask ( \
     (__v4si)(__m128i)(A), (int)(B), \
     (__v4si)(__m128i)(W), (__mmask8)(U)))

#define _mm_maskz_srli_epi32(U, A, B) \
  ((__m128i) __builtin_ia32_psrldi128_mask ( \
     (__v4si)(__m128i)(A), (int)(B), \
     (__v4si)_mm_setzero_si128(), (__mmask8)(U)))

/* 64-bit elements: __builtin_ia32_psrlqi256_mask / psrlqi128_mask.  */
#define _mm256_mask_srli_epi64(W, U, A, B) \
  ((__m256i) __builtin_ia32_psrlqi256_mask ( \
     (__v4di)(__m256i)(A), (int)(B), \
     (__v4di)(__m256i)(W), (__mmask8)(U)))

#define _mm256_maskz_srli_epi64(U, A, B) \
  ((__m256i) __builtin_ia32_psrlqi256_mask ( \
     (__v4di)(__m256i)(A), (int)(B), \
     (__v4di)_mm256_setzero_si256 (), (__mmask8)(U)))

#define _mm_mask_srli_epi64(W, U, A, B) \
  ((__m128i) __builtin_ia32_psrlqi128_mask ( \
     (__v2di)(__m128i)(A), (int)(B), \
     (__v2di)(__m128i)(W), (__mmask8)(U)))

#define _mm_maskz_srli_epi64(U, A, B) \
  ((__m128i) __builtin_ia32_psrlqi128_mask ( \
     (__v2di)(__m128i)(A), (int)(B), \
     (__v2di)_mm_setzero_si128(), (__mmask8)(U)))
12661 #define _mm256_mask_slli_epi32(W, U, X, C) \
12662 ((__m256i)__builtin_ia32_pslldi256_mask ((__v8si)(__m256i)(X), (int)(C),\
12663 (__v8si)(__m256i)(W),\
12666 #define _mm256_maskz_slli_epi32(U, X, C) \
12667 ((__m256i)__builtin_ia32_pslldi256_mask ((__v8si)(__m256i)(X), (int)(C),\
12668 (__v8si)(__m256i)_mm256_setzero_si256(),\
12671 #define _mm256_mask_slli_epi64(W, U, X, C) \
12672 ((__m256i)__builtin_ia32_psllqi256_mask ((__v4di)(__m256i)(X), (int)(C),\
12673 (__v4di)(__m256i)(W),\
12676 #define _mm256_maskz_slli_epi64(U, X, C) \
12677 ((__m256i)__builtin_ia32_psllqi256_mask ((__v4di)(__m256i)(X), (int)(C),\
12678 (__v4di)(__m256i)_mm256_setzero_si256 (),\
12681 #define _mm_mask_slli_epi32(W, U, X, C) \
12682 ((__m128i)__builtin_ia32_pslldi128_mask ((__v4si)(__m128i)(X), (int)(C),\
12683 (__v4si)(__m128i)(W),\
12686 #define _mm_maskz_slli_epi32(U, X, C) \
12687 ((__m128i)__builtin_ia32_pslldi128_mask ((__v4si)(__m128i)(X), (int)(C),\
12688 (__v4si)(__m128i)_mm_setzero_si128 (),\
12691 #define _mm_mask_slli_epi64(W, U, X, C) \
12692 ((__m128i)__builtin_ia32_psllqi128_mask ((__v2di)(__m128i)(X), (int)(C),\
12693 (__v2di)(__m128i)(W),\
12696 #define _mm_maskz_slli_epi64(U, X, C) \
12697 ((__m128i)__builtin_ia32_psllqi128_mask ((__v2di)(__m128i)(X), (int)(C),\
12698 (__v2di)(__m128i)_mm_setzero_di(),\
/* Macro forms of the 256-bit ternarylogic intrinsics.  A, B and C are
   the three vector operands and I is the immediate.  The plain and mask
   forms call the *_mask builtin (with mask -1 and U respectively); the
   maskz forms call the separate *_maskz builtin with U.  */

/* 64-bit elements.  */
#define _mm256_ternarylogic_epi64(A, B, C, I) \
  ((__m256i) __builtin_ia32_pternlogq256_mask ( \
     (__v4di)(__m256i)(A), (__v4di)(__m256i)(B), \
     (__v4di)(__m256i)(C), (int)(I), (__mmask8)-1))

#define _mm256_mask_ternarylogic_epi64(A, U, B, C, I) \
  ((__m256i) __builtin_ia32_pternlogq256_mask ( \
     (__v4di)(__m256i)(A), (__v4di)(__m256i)(B), \
     (__v4di)(__m256i)(C), (int)(I), (__mmask8)(U)))

#define _mm256_maskz_ternarylogic_epi64(U, A, B, C, I) \
  ((__m256i) __builtin_ia32_pternlogq256_maskz ( \
     (__v4di)(__m256i)(A), (__v4di)(__m256i)(B), \
     (__v4di)(__m256i)(C), (int)(I), (__mmask8)(U)))

/* 32-bit elements.  */
#define _mm256_ternarylogic_epi32(A, B, C, I) \
  ((__m256i) __builtin_ia32_pternlogd256_mask ( \
     (__v8si)(__m256i)(A), (__v8si)(__m256i)(B), \
     (__v8si)(__m256i)(C), (int)(I), (__mmask8)-1))

#define _mm256_mask_ternarylogic_epi32(A, U, B, C, I) \
  ((__m256i) __builtin_ia32_pternlogd256_mask ( \
     (__v8si)(__m256i)(A), (__v8si)(__m256i)(B), \
     (__v8si)(__m256i)(C), (int)(I), (__mmask8)(U)))

#define _mm256_maskz_ternarylogic_epi32(U, A, B, C, I) \
  ((__m256i) __builtin_ia32_pternlogd256_maskz ( \
     (__v8si)(__m256i)(A), (__v8si)(__m256i)(B), \
     (__v8si)(__m256i)(C), (int)(I), (__mmask8)(U)))
/* Macro forms of the 128-bit ternarylogic intrinsics.  A, B and C are
   the three vector operands and I is the immediate.  The plain and mask
   forms call the *_mask builtin (with mask -1 and U respectively); the
   maskz forms call the separate *_maskz builtin with U.  */

/* 64-bit elements.  */
#define _mm_ternarylogic_epi64(A, B, C, I) \
  ((__m128i) __builtin_ia32_pternlogq128_mask ( \
     (__v2di)(__m128i)(A), (__v2di)(__m128i)(B), \
     (__v2di)(__m128i)(C), (int)(I), (__mmask8)-1))

#define _mm_mask_ternarylogic_epi64(A, U, B, C, I) \
  ((__m128i) __builtin_ia32_pternlogq128_mask ( \
     (__v2di)(__m128i)(A), (__v2di)(__m128i)(B), \
     (__v2di)(__m128i)(C), (int)(I), (__mmask8)(U)))

#define _mm_maskz_ternarylogic_epi64(U, A, B, C, I) \
  ((__m128i) __builtin_ia32_pternlogq128_maskz ( \
     (__v2di)(__m128i)(A), (__v2di)(__m128i)(B), \
     (__v2di)(__m128i)(C), (int)(I), (__mmask8)(U)))

/* 32-bit elements.  */
#define _mm_ternarylogic_epi32(A, B, C, I) \
  ((__m128i) __builtin_ia32_pternlogd128_mask ( \
     (__v4si)(__m128i)(A), (__v4si)(__m128i)(B), \
     (__v4si)(__m128i)(C), (int)(I), (__mmask8)-1))

#define _mm_mask_ternarylogic_epi32(A, U, B, C, I) \
  ((__m128i) __builtin_ia32_pternlogd128_mask ( \
     (__v4si)(__m128i)(A), (__v4si)(__m128i)(B), \
     (__v4si)(__m128i)(C), (int)(I), (__mmask8)(U)))

#define _mm_maskz_ternarylogic_epi32(U, A, B, C, I) \
  ((__m128i) __builtin_ia32_pternlogd128_maskz ( \
     (__v4si)(__m128i)(A), (__v4si)(__m128i)(B), \
     (__v4si)(__m128i)(C), (int)(I), (__mmask8)(U)))
/* Macro forms of the 256-bit roundscale intrinsics.  A is the source
   vector and B the immediate.  The last two builtin operands are a zero
   vector with mask -1 (plain), W with U (mask), or a zero vector with
   U (maskz).  */

/* Single precision: __builtin_ia32_rndscaleps_256_mask.  */
#define _mm256_roundscale_ps(A, B) \
  ((__m256) __builtin_ia32_rndscaleps_256_mask ( \
     (__v8sf)(__m256)(A), (int)(B), \
     (__v8sf)(__m256)_mm256_setzero_ps(), (__mmask8)-1))

#define _mm256_mask_roundscale_ps(W, U, A, B) \
  ((__m256) __builtin_ia32_rndscaleps_256_mask ( \
     (__v8sf)(__m256)(A), (int)(B), \
     (__v8sf)(__m256)(W), (__mmask8)(U)))

#define _mm256_maskz_roundscale_ps(U, A, B) \
  ((__m256) __builtin_ia32_rndscaleps_256_mask ( \
     (__v8sf)(__m256)(A), (int)(B), \
     (__v8sf)(__m256)_mm256_setzero_ps(), (__mmask8)(U)))

/* Double precision: __builtin_ia32_rndscalepd_256_mask.  */
#define _mm256_roundscale_pd(A, B) \
  ((__m256d) __builtin_ia32_rndscalepd_256_mask ( \
     (__v4df)(__m256d)(A), (int)(B), \
     (__v4df)(__m256d)_mm256_setzero_pd(), (__mmask8)-1))

#define _mm256_mask_roundscale_pd(W, U, A, B) \
  ((__m256d) __builtin_ia32_rndscalepd_256_mask ( \
     (__v4df)(__m256d)(A), (int)(B), \
     (__v4df)(__m256d)(W), (__mmask8)(U)))

#define _mm256_maskz_roundscale_pd(U, A, B) \
  ((__m256d) __builtin_ia32_rndscalepd_256_mask ( \
     (__v4df)(__m256d)(A), (int)(B), \
     (__v4df)(__m256d)_mm256_setzero_pd(), (__mmask8)(U)))
/* Macro forms of the 128-bit roundscale intrinsics.  A is the source
   vector and B the immediate.  The last two builtin operands are a zero
   vector with mask -1 (plain), W with U (mask), or a zero vector with
   U (maskz).  */

/* Single precision: __builtin_ia32_rndscaleps_128_mask.  */
#define _mm_roundscale_ps(A, B) \
  ((__m128) __builtin_ia32_rndscaleps_128_mask ( \
     (__v4sf)(__m128)(A), (int)(B), \
     (__v4sf)(__m128)_mm_setzero_ps(), (__mmask8)-1))

#define _mm_mask_roundscale_ps(W, U, A, B) \
  ((__m128) __builtin_ia32_rndscaleps_128_mask ( \
     (__v4sf)(__m128)(A), (int)(B), \
     (__v4sf)(__m128)(W), (__mmask8)(U)))

#define _mm_maskz_roundscale_ps(U, A, B) \
  ((__m128) __builtin_ia32_rndscaleps_128_mask ( \
     (__v4sf)(__m128)(A), (int)(B), \
     (__v4sf)(__m128)_mm_setzero_ps(), (__mmask8)(U)))

/* Double precision: __builtin_ia32_rndscalepd_128_mask.  */
#define _mm_roundscale_pd(A, B) \
  ((__m128d) __builtin_ia32_rndscalepd_128_mask ( \
     (__v2df)(__m128d)(A), (int)(B), \
     (__v2df)(__m128d)_mm_setzero_pd(), (__mmask8)-1))

#define _mm_mask_roundscale_pd(W, U, A, B) \
  ((__m128d) __builtin_ia32_rndscalepd_128_mask ( \
     (__v2df)(__m128d)(A), (int)(B), \
     (__v2df)(__m128d)(W), (__mmask8)(U)))

#define _mm_maskz_roundscale_pd(U, A, B) \
  ((__m128d) __builtin_ia32_rndscalepd_128_mask ( \
     (__v2df)(__m128d)(A), (int)(B), \
     (__v2df)(__m128d)_mm_setzero_pd(), (__mmask8)(U)))
12797 #define _mm256_getmant_ps(X, B, C) \
12798 ((__m256) __builtin_ia32_getmantps256_mask ((__v8sf)(__m256) (X), \
12799 (int)(((C)<<2) | (B)), \
12800 (__v8sf)(__m256)_mm256_setzero_ps(), \
12803 #define _mm256_mask_getmant_ps(W, U, X, B, C) \
12804 ((__m256) __builtin_ia32_getmantps256_mask ((__v8sf)(__m256) (X), \
12805 (int)(((C)<<2) | (B)), \
12806 (__v8sf)(__m256)(W), \
12809 #define _mm256_maskz_getmant_ps(U, X, B, C) \
12810 ((__m256) __builtin_ia32_getmantps256_mask ((__v8sf)(__m256) (X), \
12811 (int)(((C)<<2) | (B)), \
12812 (__v8sf)(__m256)_mm256_setzero_ps(), \
12815 #define _mm_getmant_ps(X, B, C) \
12816 ((__m128) __builtin_ia32_getmantps128_mask ((__v4sf)(__m128) (X), \
12817 (int)(((C)<<2) | (B)), \
12818 (__v4sf)(__m128)_mm_setzero_ps(), \
12821 #define _mm_mask_getmant_ps(W, U, X, B, C) \
12822 ((__m128) __builtin_ia32_getmantps128_mask ((__v4sf)(__m128) (X), \
12823 (int)(((C)<<2) | (B)), \
12824 (__v4sf)(__m128)(W), \
12827 #define _mm_maskz_getmant_ps(U, X, B, C) \
12828 ((__m128) __builtin_ia32_getmantps128_mask ((__v4sf)(__m128) (X), \
12829 (int)(((C)<<2) | (B)), \
12830 (__v4sf)(__m128)_mm_setzero_ps(), \
12833 #define _mm256_getmant_pd(X, B, C) \
12834 ((__m256d) __builtin_ia32_getmantpd256_mask ((__v4df)(__m256d) (X), \
12835 (int)(((C)<<2) | (B)), \
12836 (__v4df)(__m256d)_mm256_setzero_pd(), \
12839 #define _mm256_mask_getmant_pd(W, U, X, B, C) \
12840 ((__m256d) __builtin_ia32_getmantpd256_mask ((__v4df)(__m256d) (X), \
12841 (int)(((C)<<2) | (B)), \
12842 (__v4df)(__m256d)(W), \
12845 #define _mm256_maskz_getmant_pd(U, X, B, C) \
12846 ((__m256d) __builtin_ia32_getmantpd256_mask ((__v4df)(__m256d) (X), \
12847 (int)(((C)<<2) | (B)), \
12848 (__v4df)(__m256d)_mm256_setzero_pd(), \
12851 #define _mm_getmant_pd(X, B, C) \
12852 ((__m128d) __builtin_ia32_getmantpd128_mask ((__v2df)(__m128d) (X), \
12853 (int)(((C)<<2) | (B)), \
12854 (__v2df)(__m128d)_mm_setzero_pd(), \
12857 #define _mm_mask_getmant_pd(W, U, X, B, C) \
12858 ((__m128d) __builtin_ia32_getmantpd128_mask ((__v2df)(__m128d) (X), \
12859 (int)(((C)<<2) | (B)), \
12860 (__v2df)(__m128d)(W), \
12863 #define _mm_maskz_getmant_pd(U, X, B, C) \
12864 ((__m128d) __builtin_ia32_getmantpd128_mask ((__v2df)(__m128d) (X), \
12865 (int)(((C)<<2) | (B)), \
12866 (__v2df)(__m128d)_mm_setzero_pd(), \
/* Macro forms of the masked floating-point gather intrinsics.

   Parameters (same for every macro in this group):
     V1OLD  vector passed as the builtin's first operand
     MASK   value cast to __mmask8
     INDEX  index vector
     ADDR   base address, cast to a const element pointer
     SCALE  value cast to int

   Every macro argument is parenthesized before a cast is applied, so an
   expression argument such as `p + 4' or `a | b' is cast as a whole
   rather than having the cast bind to its first operand only.  The
   expansion itself is wrapped in parentheses so it can be used safely
   inside a larger expression.  */

/* 32-bit indices.  */
#define _mm256_mmask_i32gather_ps(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m256) __builtin_ia32_gather3siv8sf ((__v8sf)(__m256)(V1OLD), \
                                          (float const *)(ADDR), \
                                          (__v8si)(__m256i)(INDEX), \
                                          (__mmask8)(MASK), (int)(SCALE)))

#define _mm_mmask_i32gather_ps(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m128) __builtin_ia32_gather3siv4sf ((__v4sf)(__m128)(V1OLD), \
                                          (float const *)(ADDR), \
                                          (__v4si)(__m128i)(INDEX), \
                                          (__mmask8)(MASK), (int)(SCALE)))

#define _mm256_mmask_i32gather_pd(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m256d) __builtin_ia32_gather3siv4df ((__v4df)(__m256d)(V1OLD), \
                                           (double const *)(ADDR), \
                                           (__v4si)(__m128i)(INDEX), \
                                           (__mmask8)(MASK), (int)(SCALE)))

#define _mm_mmask_i32gather_pd(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m128d) __builtin_ia32_gather3siv2df ((__v2df)(__m128d)(V1OLD), \
                                           (double const *)(ADDR), \
                                           (__v4si)(__m128i)(INDEX), \
                                           (__mmask8)(MASK), (int)(SCALE)))

/* 64-bit indices.  Note the 256-bit-index float form works on a
   128-bit (__m128) data vector.  */
#define _mm256_mmask_i64gather_ps(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m128) __builtin_ia32_gather3div8sf ((__v4sf)(__m128)(V1OLD), \
                                          (float const *)(ADDR), \
                                          (__v4di)(__m256i)(INDEX), \
                                          (__mmask8)(MASK), (int)(SCALE)))

#define _mm_mmask_i64gather_ps(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m128) __builtin_ia32_gather3div4sf ((__v4sf)(__m128)(V1OLD), \
                                          (float const *)(ADDR), \
                                          (__v2di)(__m128i)(INDEX), \
                                          (__mmask8)(MASK), (int)(SCALE)))

#define _mm256_mmask_i64gather_pd(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m256d) __builtin_ia32_gather3div4df ((__v4df)(__m256d)(V1OLD), \
                                           (double const *)(ADDR), \
                                           (__v4di)(__m256i)(INDEX), \
                                           (__mmask8)(MASK), (int)(SCALE)))

#define _mm_mmask_i64gather_pd(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m128d) __builtin_ia32_gather3div2df ((__v2df)(__m128d)(V1OLD), \
                                           (double const *)(ADDR), \
                                           (__v2di)(__m128i)(INDEX), \
                                           (__mmask8)(MASK), (int)(SCALE)))
/* Macro forms of the masked integer gather intrinsics.

   Parameters (same for every macro in this group):
     V1OLD  vector passed as the builtin's first operand
     MASK   value cast to __mmask8
     INDEX  index vector
     ADDR   base address, cast to a const element pointer
     SCALE  value cast to int

   Every macro argument is parenthesized before a cast is applied, so an
   expression argument such as `p + 4' or `a | b' is cast as a whole
   rather than having the cast bind to its first operand only.  The
   expansion itself is wrapped in parentheses so it can be used safely
   inside a larger expression.  */

/* 32-bit indices.  */
#define _mm256_mmask_i32gather_epi32(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m256i) __builtin_ia32_gather3siv8si ((__v8si)(__m256i)(V1OLD), \
                                           (int const *)(ADDR), \
                                           (__v8si)(__m256i)(INDEX), \
                                           (__mmask8)(MASK), (int)(SCALE)))

#define _mm_mmask_i32gather_epi32(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m128i) __builtin_ia32_gather3siv4si ((__v4si)(__m128i)(V1OLD), \
                                           (int const *)(ADDR), \
                                           (__v4si)(__m128i)(INDEX), \
                                           (__mmask8)(MASK), (int)(SCALE)))

#define _mm256_mmask_i32gather_epi64(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m256i) __builtin_ia32_gather3siv4di ((__v4di)(__m256i)(V1OLD), \
                                           (long long const *)(ADDR), \
                                           (__v4si)(__m128i)(INDEX), \
                                           (__mmask8)(MASK), (int)(SCALE)))

#define _mm_mmask_i32gather_epi64(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m128i) __builtin_ia32_gather3siv2di ((__v2di)(__m128i)(V1OLD), \
                                           (long long const *)(ADDR), \
                                           (__v4si)(__m128i)(INDEX), \
                                           (__mmask8)(MASK), (int)(SCALE)))

/* 64-bit indices.  Note the 256-bit-index epi32 form works on a
   128-bit (__m128i) data vector.  */
#define _mm256_mmask_i64gather_epi32(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m128i) __builtin_ia32_gather3div8si ((__v4si)(__m128i)(V1OLD), \
                                           (int const *)(ADDR), \
                                           (__v4di)(__m256i)(INDEX), \
                                           (__mmask8)(MASK), (int)(SCALE)))

#define _mm_mmask_i64gather_epi32(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m128i) __builtin_ia32_gather3div4si ((__v4si)(__m128i)(V1OLD), \
                                           (int const *)(ADDR), \
                                           (__v2di)(__m128i)(INDEX), \
                                           (__mmask8)(MASK), (int)(SCALE)))

#define _mm256_mmask_i64gather_epi64(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m256i) __builtin_ia32_gather3div4di ((__v4di)(__m256i)(V1OLD), \
                                           (long long const *)(ADDR), \
                                           (__v4di)(__m256i)(INDEX), \
                                           (__mmask8)(MASK), (int)(SCALE)))

#define _mm_mmask_i64gather_epi64(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m128i) __builtin_ia32_gather3div2di ((__v2di)(__m128i)(V1OLD), \
                                           (long long const *)(ADDR), \
                                           (__v2di)(__m128i)(INDEX), \
                                           (__mmask8)(MASK), (int)(SCALE)))
/* Macro forms of the floating-point scatter intrinsics.

   Parameters:
     ADDR   base address, cast to an element pointer
     MASK   (mask forms only) value cast to __mmask8; the unmasked forms
            pass the constant (__mmask8)0xFF instead
     INDEX  index vector
     V1     data vector
     SCALE  value cast to int

   Every macro argument is parenthesized before a cast is applied, so an
   expression argument such as `p + 4' or `a | b' is cast as a whole
   rather than having the cast bind to its first operand only.  */

/* 32-bit indices, single precision.  */
#define _mm256_i32scatter_ps(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv8sf ((float *)(ADDR), (__mmask8)0xFF, \
                                (__v8si)(__m256i)(INDEX), \
                                (__v8sf)(__m256)(V1), (int)(SCALE))

#define _mm256_mask_i32scatter_ps(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv8sf ((float *)(ADDR), (__mmask8)(MASK), \
                                (__v8si)(__m256i)(INDEX), \
                                (__v8sf)(__m256)(V1), (int)(SCALE))

#define _mm_i32scatter_ps(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv4sf ((float *)(ADDR), (__mmask8)0xFF, \
                                (__v4si)(__m128i)(INDEX), \
                                (__v4sf)(__m128)(V1), (int)(SCALE))

#define _mm_mask_i32scatter_ps(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv4sf ((float *)(ADDR), (__mmask8)(MASK), \
                                (__v4si)(__m128i)(INDEX), \
                                (__v4sf)(__m128)(V1), (int)(SCALE))

/* 32-bit indices, double precision.  */
#define _mm256_i32scatter_pd(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv4df ((double *)(ADDR), (__mmask8)0xFF, \
                                (__v4si)(__m128i)(INDEX), \
                                (__v4df)(__m256d)(V1), (int)(SCALE))

#define _mm256_mask_i32scatter_pd(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv4df ((double *)(ADDR), (__mmask8)(MASK), \
                                (__v4si)(__m128i)(INDEX), \
                                (__v4df)(__m256d)(V1), (int)(SCALE))

#define _mm_i32scatter_pd(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv2df ((double *)(ADDR), (__mmask8)0xFF, \
                                (__v4si)(__m128i)(INDEX), \
                                (__v2df)(__m128d)(V1), (int)(SCALE))

#define _mm_mask_i32scatter_pd(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv2df ((double *)(ADDR), (__mmask8)(MASK), \
                                (__v4si)(__m128i)(INDEX), \
                                (__v2df)(__m128d)(V1), (int)(SCALE))

/* 64-bit indices, single precision.  */
#define _mm256_i64scatter_ps(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv8sf ((float *)(ADDR), (__mmask8)0xFF, \
                                (__v4di)(__m256i)(INDEX), \
                                (__v4sf)(__m128)(V1), (int)(SCALE))

#define _mm256_mask_i64scatter_ps(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv8sf ((float *)(ADDR), (__mmask8)(MASK), \
                                (__v4di)(__m256i)(INDEX), \
                                (__v4sf)(__m128)(V1), (int)(SCALE))

#define _mm_i64scatter_ps(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv4sf ((float *)(ADDR), (__mmask8)0xFF, \
                                (__v2di)(__m128i)(INDEX), \
                                (__v4sf)(__m128)(V1), (int)(SCALE))

#define _mm_mask_i64scatter_ps(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv4sf ((float *)(ADDR), (__mmask8)(MASK), \
                                (__v2di)(__m128i)(INDEX), \
                                (__v4sf)(__m128)(V1), (int)(SCALE))

/* 64-bit indices, double precision.  */
#define _mm256_i64scatter_pd(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv4df ((double *)(ADDR), (__mmask8)0xFF, \
                                (__v4di)(__m256i)(INDEX), \
                                (__v4df)(__m256d)(V1), (int)(SCALE))

#define _mm256_mask_i64scatter_pd(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv4df ((double *)(ADDR), (__mmask8)(MASK), \
                                (__v4di)(__m256i)(INDEX), \
                                (__v4df)(__m256d)(V1), (int)(SCALE))

#define _mm_i64scatter_pd(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv2df ((double *)(ADDR), (__mmask8)0xFF, \
                                (__v2di)(__m128i)(INDEX), \
                                (__v2df)(__m128d)(V1), (int)(SCALE))

#define _mm_mask_i64scatter_pd(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv2df ((double *)(ADDR), (__mmask8)(MASK), \
                                (__v2di)(__m128i)(INDEX), \
                                (__v2df)(__m128d)(V1), (int)(SCALE))
/* Macro forms of the integer scatter intrinsics.

   Parameters:
     ADDR   base address, cast to an element pointer
     MASK   (mask forms only) value cast to __mmask8; the unmasked forms
            pass the constant (__mmask8)0xFF instead
     INDEX  index vector
     V1     data vector
     SCALE  value cast to int

   Every macro argument is parenthesized before a cast is applied, so an
   expression argument such as `p + 4' or `a | b' is cast as a whole
   rather than having the cast bind to its first operand only.  */

/* 32-bit indices, 32-bit elements.  */
#define _mm256_i32scatter_epi32(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv8si ((int *)(ADDR), (__mmask8)0xFF, \
                                (__v8si)(__m256i)(INDEX), \
                                (__v8si)(__m256i)(V1), (int)(SCALE))

#define _mm256_mask_i32scatter_epi32(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv8si ((int *)(ADDR), (__mmask8)(MASK), \
                                (__v8si)(__m256i)(INDEX), \
                                (__v8si)(__m256i)(V1), (int)(SCALE))

#define _mm_i32scatter_epi32(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv4si ((int *)(ADDR), (__mmask8)0xFF, \
                                (__v4si)(__m128i)(INDEX), \
                                (__v4si)(__m128i)(V1), (int)(SCALE))

#define _mm_mask_i32scatter_epi32(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv4si ((int *)(ADDR), (__mmask8)(MASK), \
                                (__v4si)(__m128i)(INDEX), \
                                (__v4si)(__m128i)(V1), (int)(SCALE))

/* 32-bit indices, 64-bit elements.  */
#define _mm256_i32scatter_epi64(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv4di ((long long *)(ADDR), (__mmask8)0xFF, \
                                (__v4si)(__m128i)(INDEX), \
                                (__v4di)(__m256i)(V1), (int)(SCALE))

#define _mm256_mask_i32scatter_epi64(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv4di ((long long *)(ADDR), (__mmask8)(MASK), \
                                (__v4si)(__m128i)(INDEX), \
                                (__v4di)(__m256i)(V1), (int)(SCALE))

#define _mm_i32scatter_epi64(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv2di ((long long *)(ADDR), (__mmask8)0xFF, \
                                (__v4si)(__m128i)(INDEX), \
                                (__v2di)(__m128i)(V1), (int)(SCALE))

#define _mm_mask_i32scatter_epi64(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv2di ((long long *)(ADDR), (__mmask8)(MASK), \
                                (__v4si)(__m128i)(INDEX), \
                                (__v2di)(__m128i)(V1), (int)(SCALE))

/* 64-bit indices, 32-bit elements.  */
#define _mm256_i64scatter_epi32(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv8si ((int *)(ADDR), (__mmask8)0xFF, \
                                (__v4di)(__m256i)(INDEX), \
                                (__v4si)(__m128i)(V1), (int)(SCALE))

#define _mm256_mask_i64scatter_epi32(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv8si ((int *)(ADDR), (__mmask8)(MASK), \
                                (__v4di)(__m256i)(INDEX), \
                                (__v4si)(__m128i)(V1), (int)(SCALE))

#define _mm_i64scatter_epi32(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv4si ((int *)(ADDR), (__mmask8)0xFF, \
                                (__v2di)(__m128i)(INDEX), \
                                (__v4si)(__m128i)(V1), (int)(SCALE))

#define _mm_mask_i64scatter_epi32(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv4si ((int *)(ADDR), (__mmask8)(MASK), \
                                (__v2di)(__m128i)(INDEX), \
                                (__v4si)(__m128i)(V1), (int)(SCALE))

/* 64-bit indices, 64-bit elements.  */
#define _mm256_i64scatter_epi64(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv4di ((long long *)(ADDR), (__mmask8)0xFF, \
                                (__v4di)(__m256i)(INDEX), \
                                (__v4di)(__m256i)(V1), (int)(SCALE))

#define _mm256_mask_i64scatter_epi64(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv4di ((long long *)(ADDR), (__mmask8)(MASK), \
                                (__v4di)(__m256i)(INDEX), \
                                (__v4di)(__m256i)(V1), (int)(SCALE))

#define _mm_i64scatter_epi64(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv2di ((long long *)(ADDR), (__mmask8)0xFF, \
                                (__v2di)(__m128i)(INDEX), \
                                (__v2di)(__m128i)(V1), (int)(SCALE))

#define _mm_mask_i64scatter_epi64(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv2di ((long long *)(ADDR), (__mmask8)(MASK), \
                                (__v2di)(__m128i)(INDEX), \
                                (__v2di)(__m128i)(V1), (int)(SCALE))
13125 #define _mm256_mask_shuffle_epi32(W, U, X, C) \
13126 ((__m256i) __builtin_ia32_pshufd256_mask ((__v8si)(__m256i)(X), (int)(C), \
13127 (__v8si)(__m256i)(W), \
13130 #define _mm256_maskz_shuffle_epi32(U, X, C) \
13131 ((__m256i) __builtin_ia32_pshufd256_mask ((__v8si)(__m256i)(X), (int)(C), \
13132 (__v8si)(__m256i)_mm256_setzero_si256(), \
13135 #define _mm_mask_shuffle_epi32(W, U, X, C) \
13136 ((__m128i) __builtin_ia32_pshufd128_mask ((__v4si)(__m128i)(X), (int)(C), \
13137 (__v4si)(__m128i)(W), \
13140 #define _mm_maskz_shuffle_epi32(U, X, C) \
13141 ((__m128i) __builtin_ia32_pshufd128_mask ((__v4si)(__m128i)(X), (int)(C), \
13142 (__v4si)(__m128i)_mm_setzero_si128 (), \
13145 #define _mm256_rol_epi64(A, B) \
13146 ((__m256i)__builtin_ia32_prolq256_mask ((__v4di)(__m256i)(A), (int)(B), \
13147 (__v4di)(__m256i)_mm256_setzero_si256 (),\
13150 #define _mm256_mask_rol_epi64(W, U, A, B) \
13151 ((__m256i)__builtin_ia32_prolq256_mask ((__v4di)(__m256i)(A), (int)(B), \
13152 (__v4di)(__m256i)(W), \
13155 #define _mm256_maskz_rol_epi64(U, A, B) \
13156 ((__m256i)__builtin_ia32_prolq256_mask ((__v4di)(__m256i)(A), (int)(B), \
13157 (__v4di)(__m256i)_mm256_setzero_si256 (),\
13160 #define _mm_rol_epi64(A, B) \
13161 ((__m128i)__builtin_ia32_prolq128_mask ((__v2di)(__m128i)(A), (int)(B), \
13162 (__v2di)(__m128i)_mm_setzero_di(), \
13165 #define _mm_mask_rol_epi64(W, U, A, B) \
13166 ((__m128i)__builtin_ia32_prolq128_mask ((__v2di)(__m128i)(A), (int)(B), \
13167 (__v2di)(__m128i)(W), \
13170 #define _mm_maskz_rol_epi64(U, A, B) \
13171 ((__m128i)__builtin_ia32_prolq128_mask ((__v2di)(__m128i)(A), (int)(B), \
13172 (__v2di)(__m128i)_mm_setzero_di(), \
13175 #define _mm256_ror_epi64(A, B) \
13176 ((__m256i)__builtin_ia32_prorq256_mask ((__v4di)(__m256i)(A), (int)(B), \
13177 (__v4di)(__m256i)_mm256_setzero_si256 (),\
13180 #define _mm256_mask_ror_epi64(W, U, A, B) \
13181 ((__m256i)__builtin_ia32_prorq256_mask ((__v4di)(__m256i)(A), (int)(B), \
13182 (__v4di)(__m256i)(W), \
13185 #define _mm256_maskz_ror_epi64(U, A, B) \
13186 ((__m256i)__builtin_ia32_prorq256_mask ((__v4di)(__m256i)(A), (int)(B), \
13187 (__v4di)(__m256i)_mm256_setzero_si256 (),\
13190 #define _mm_ror_epi64(A, B) \
13191 ((__m128i)__builtin_ia32_prorq128_mask ((__v2di)(__m128i)(A), (int)(B), \
13192 (__v2di)(__m128i)_mm_setzero_di(), \
13195 #define _mm_mask_ror_epi64(W, U, A, B) \
13196 ((__m128i)__builtin_ia32_prorq128_mask ((__v2di)(__m128i)(A), (int)(B), \
13197 (__v2di)(__m128i)(W), \
13200 #define _mm_maskz_ror_epi64(U, A, B) \
13201 ((__m128i)__builtin_ia32_prorq128_mask ((__v2di)(__m128i)(A), (int)(B), \
13202 (__v2di)(__m128i)_mm_setzero_di(), \
13205 #define _mm256_rol_epi32(A, B) \
13206 ((__m256i)__builtin_ia32_prold256_mask ((__v8si)(__m256i)(A), (int)(B), \
13207 (__v8si)(__m256i)_mm256_setzero_si256(),\
13210 #define _mm256_mask_rol_epi32(W, U, A, B) \
13211 ((__m256i)__builtin_ia32_prold256_mask ((__v8si)(__m256i)(A), (int)(B), \
13212 (__v8si)(__m256i)(W), \
13215 #define _mm256_maskz_rol_epi32(U, A, B) \
13216 ((__m256i)__builtin_ia32_prold256_mask ((__v8si)(__m256i)(A), (int)(B), \
13217 (__v8si)(__m256i)_mm256_setzero_si256(),\
13220 #define _mm_rol_epi32(A, B) \
13221 ((__m128i)__builtin_ia32_prold128_mask ((__v4si)(__m128i)(A), (int)(B), \
13222 (__v4si)(__m128i)_mm_setzero_si128 (), \
13225 #define _mm_mask_rol_epi32(W, U, A, B) \
13226 ((__m128i)__builtin_ia32_prold128_mask ((__v4si)(__m128i)(A), (int)(B), \
13227 (__v4si)(__m128i)(W), \
13230 #define _mm_maskz_rol_epi32(U, A, B) \
13231 ((__m128i)__builtin_ia32_prold128_mask ((__v4si)(__m128i)(A), (int)(B), \
13232 (__v4si)(__m128i)_mm_setzero_si128 (), \
13235 #define _mm256_ror_epi32(A, B) \
13236 ((__m256i)__builtin_ia32_prord256_mask ((__v8si)(__m256i)(A), (int)(B), \
13237 (__v8si)(__m256i)_mm256_setzero_si256(),\
13240 #define _mm256_mask_ror_epi32(W, U, A, B) \
13241 ((__m256i)__builtin_ia32_prord256_mask ((__v8si)(__m256i)(A), (int)(B), \
13242 (__v8si)(__m256i)(W), \
13245 #define _mm256_maskz_ror_epi32(U, A, B) \
13246 ((__m256i)__builtin_ia32_prord256_mask ((__v8si)(__m256i)(A), (int)(B), \
13247 (__v8si)(__m256i)_mm256_setzero_si256(),\
13250 #define _mm_ror_epi32(A, B) \
13251 ((__m128i)__builtin_ia32_prord128_mask ((__v4si)(__m128i)(A), (int)(B), \
13252 (__v4si)(__m128i)_mm_setzero_si128 (), \
13255 #define _mm_mask_ror_epi32(W, U, A, B) \
13256 ((__m128i)__builtin_ia32_prord128_mask ((__v4si)(__m128i)(A), (int)(B), \
13257 (__v4si)(__m128i)(W), \
13260 #define _mm_maskz_ror_epi32(U, A, B) \
13261 ((__m128i)__builtin_ia32_prord128_mask ((__v4si)(__m128i)(A), (int)(B), \
13262 (__v4si)(__m128i)_mm_setzero_si128 (), \
/* Macro forms of the 256-bit alignr intrinsics on 32-bit elements.
   Both call __builtin_ia32_alignd256_mask with X, Y and the immediate
   C.  The plain form passes X again as the fourth operand with mask
   -1; the mask form passes W with mask U.  */
#define _mm256_alignr_epi32(X, Y, C) \
  ((__m256i)__builtin_ia32_alignd256_mask ( \
     (__v8si)(__m256i)(X), (__v8si)(__m256i)(Y), (int)(C), \
     (__v8si)(__m256i)(X), (__mmask8)-1))

#define _mm256_mask_alignr_epi32(W, U, X, Y, C) \
  ((__m256i)__builtin_ia32_alignd256_mask ( \
     (__v8si)(__m256i)(X), (__v8si)(__m256i)(Y), (int)(C), \
     (__v8si)(__m256i)(W), (__mmask8)(U)))
13273 #define _mm256_maskz_alignr_epi32(U, X, Y, C) \
13274 ((__m256i)__builtin_ia32_alignd256_mask ((__v8si)(__m256i)(X), \
13275 (__v8si)(__m256i)(Y), (int)(C), (__v8si)(__m256i)_mm256_setzero_si256 (),\
/* Macro forms of the 256-bit alignr intrinsics on 64-bit elements.
   Both call __builtin_ia32_alignq256_mask with X, Y and the immediate
   C.  The plain form passes X again as the fourth operand with mask
   -1; the mask form passes W with mask U.  */
#define _mm256_alignr_epi64(X, Y, C) \
  ((__m256i)__builtin_ia32_alignq256_mask ( \
     (__v4di)(__m256i)(X), (__v4di)(__m256i)(Y), (int)(C), \
     (__v4di)(__m256i)(X), (__mmask8)-1))

#define _mm256_mask_alignr_epi64(W, U, X, Y, C) \
  ((__m256i)__builtin_ia32_alignq256_mask ( \
     (__v4di)(__m256i)(X), (__v4di)(__m256i)(Y), (int)(C), \
     (__v4di)(__m256i)(W), (__mmask8)(U)))
13286 #define _mm256_maskz_alignr_epi64(U, X, Y, C) \
13287 ((__m256i)__builtin_ia32_alignq256_mask ((__v4di)(__m256i)(X), \
13288 (__v4di)(__m256i)(Y), (int)(C), (__v4di)(__m256i)_mm256_setzero_si256 (),\
/* Macro forms of the 128-bit alignr intrinsics on 32-bit elements.
   Both call __builtin_ia32_alignd128_mask with X, Y and the immediate
   C.  The plain form passes X again as the fourth operand with mask
   -1; the mask form passes W with mask U.  */
#define _mm_alignr_epi32(X, Y, C) \
  ((__m128i)__builtin_ia32_alignd128_mask ( \
     (__v4si)(__m128i)(X), (__v4si)(__m128i)(Y), (int)(C), \
     (__v4si)(__m128i)(X), (__mmask8)-1))

#define _mm_mask_alignr_epi32(W, U, X, Y, C) \
  ((__m128i)__builtin_ia32_alignd128_mask ( \
     (__v4si)(__m128i)(X), (__v4si)(__m128i)(Y), (int)(C), \
     (__v4si)(__m128i)(W), (__mmask8)(U)))
13299 #define _mm_maskz_alignr_epi32(U, X, Y, C) \
13300 ((__m128i)__builtin_ia32_alignd128_mask ((__v4si)(__m128i)(X), \
13301 (__v4si)(__m128i)(Y), (int)(C), (__v4si)(__m128i)_mm_setzero_si128(),\
/* Unmasked form: hands X and Y (viewed as __v2di) and the int C to
   __builtin_ia32_alignq128_mask, reusing X as the fourth operand and
   supplying the mask (__mmask8)-1, i.e. every mask bit set.  */
#define _mm_alignr_epi64(X, Y, C) \
  ((__m128i) __builtin_ia32_alignq128_mask ( \
      (__v2di)(__m128i)(X), \
      (__v2di)(__m128i)(Y), \
      (int)(C), \
      (__v2di)(__m128i)(X), \
      (__mmask8)-1))
/* Masked form of _mm_alignr_epi64: hands X and Y (viewed as __v2di) and
   the int C to __builtin_ia32_alignq128_mask together with the caller's
   W as the fourth operand and U as the __mmask8 mask.

   W and U have to be forwarded here.  Passing X and (__mmask8)-1 in
   their place would make this macro expand exactly like the unmasked
   _mm_alignr_epi64 and silently ignore the caller's W and U.  */
#define _mm_mask_alignr_epi64(W, U, X, Y, C) \
  ((__m128i) __builtin_ia32_alignq128_mask ( \
      (__v2di)(__m128i)(X), \
      (__v2di)(__m128i)(Y), \
      (int)(C), \
      (__v2di)(__m128i)(W), \
      (__mmask8)(U)))
/* Hands X and Y (viewed as __v2di) and the int C to
   __builtin_ia32_alignq128_mask, with an all-zero vector from
   _mm_setzero_si128 () as the fourth operand and U as the __mmask8
   mask.  */
#define _mm_maskz_alignr_epi64(U, X, Y, C) \
  ((__m128i) __builtin_ia32_alignq128_mask ( \
      (__v2di)(__m128i)(X), \
      (__v2di)(__m128i)(Y), \
      (int)(C), \
      (__v2di)(__m128i) _mm_setzero_si128 (), \
      (__mmask8)(U)))
/* Hands A (viewed as __v4sf), the int I, W (viewed as __v8hi) and the
   __mmask8 U to __builtin_ia32_vcvtps2ph_mask; the result is cast to
   __m128i.  A is parenthesized so that the casts apply to the whole
   argument expression rather than only to its first operand.  */
#define _mm_mask_cvtps_ph(W, U, A, I) \
  ((__m128i) __builtin_ia32_vcvtps2ph_mask ( \
      (__v4sf)(__m128)(A), \
      (int)(I), \
      (__v8hi)(__m128i)(W), \
      (__mmask8)(U)))
/* Hands A (viewed as __v4sf), the int I, the value of _mm_setzero_hi ()
   (viewed as __v8hi) and the __mmask8 U to __builtin_ia32_vcvtps2ph_mask;
   the result is cast to __m128i.  A is parenthesized so that the casts
   apply to the whole argument expression rather than only to its first
   operand.  */
#define _mm_maskz_cvtps_ph(U, A, I) \
  ((__m128i) __builtin_ia32_vcvtps2ph_mask ( \
      (__v4sf)(__m128)(A), \
      (int)(I), \
      (__v8hi)(__m128i) _mm_setzero_hi (), \
      (__mmask8)(U)))
/* Hands A (viewed as __v8sf), the int I, W (viewed as __v8hi) and the
   __mmask8 U to __builtin_ia32_vcvtps2ph256_mask; the result is cast to
   __m128i.  A is parenthesized so that the casts apply to the whole
   argument expression rather than only to its first operand.  */
#define _mm256_mask_cvtps_ph(W, U, A, I) \
  ((__m128i) __builtin_ia32_vcvtps2ph256_mask ( \
      (__v8sf)(__m256)(A), \
      (int)(I), \
      (__v8hi)(__m128i)(W), \
      (__mmask8)(U)))
/* Hands A (viewed as __v8sf), the int I, the value of _mm_setzero_hi ()
   (viewed as __v8hi) and the __mmask8 U to
   __builtin_ia32_vcvtps2ph256_mask; the result is cast to __m128i.  A is
   parenthesized so that the casts apply to the whole argument expression
   rather than only to its first operand.  */
#define _mm256_maskz_cvtps_ph(U, A, I) \
  ((__m128i) __builtin_ia32_vcvtps2ph256_mask ( \
      (__v8sf)(__m256)(A), \
      (int)(I), \
      (__v8hi)(__m128i) _mm_setzero_hi (), \
      (__mmask8)(U)))
/* Hands A (viewed as __v8si) and the int B to
   __builtin_ia32_psradi256_mask, with W as the third operand and U as
   the __mmask8 mask.  */
#define _mm256_mask_srai_epi32(W, U, A, B) \
  ((__m256i) __builtin_ia32_psradi256_mask ( \
      (__v8si)(__m256i)(A), \
      (int)(B), \
      (__v8si)(__m256i)(W), \
      (__mmask8)(U)))
/* Hands A (viewed as __v8si) and the int B to
   __builtin_ia32_psradi256_mask, with an all-zero vector from
   _mm256_setzero_si256 () as the third operand and U as the __mmask8
   mask.  */
#define _mm256_maskz_srai_epi32(U, A, B) \
  ((__m256i) __builtin_ia32_psradi256_mask ( \
      (__v8si)(__m256i)(A), \
      (int)(B), \
      (__v8si) _mm256_setzero_si256 (), \
      (__mmask8)(U)))
/* Hands A (viewed as __v4si) and the int B to
   __builtin_ia32_psradi128_mask, with W as the third operand and U as
   the __mmask8 mask.  */
#define _mm_mask_srai_epi32(W, U, A, B) \
  ((__m128i) __builtin_ia32_psradi128_mask ( \
      (__v4si)(__m128i)(A), \
      (int)(B), \
      (__v4si)(__m128i)(W), \
      (__mmask8)(U)))
/* Hands A (viewed as __v4si) and the int B to
   __builtin_ia32_psradi128_mask, with an all-zero vector from
   _mm_setzero_si128 () as the third operand and U as the __mmask8
   mask.  */
#define _mm_maskz_srai_epi32(U, A, B) \
  ((__m128i) __builtin_ia32_psradi128_mask ( \
      (__v4si)(__m128i)(A), \
      (int)(B), \
      (__v4si) _mm_setzero_si128 (), \
      (__mmask8)(U)))
/* Unmasked form: hands A (viewed as __v4di) and the int B to
   __builtin_ia32_psraqi256_mask, with an all-zero vector from
   _mm256_setzero_si256 () as the third operand and the mask
   (__mmask8)-1, i.e. every mask bit set.  */
#define _mm256_srai_epi64(A, B) \
  ((__m256i) __builtin_ia32_psraqi256_mask ( \
      (__v4di)(__m256i)(A), \
      (int)(B), \
      (__v4di) _mm256_setzero_si256 (), \
      (__mmask8)-1))
/* Hands A (viewed as __v4di) and the int B to
   __builtin_ia32_psraqi256_mask, with W as the third operand and U as
   the __mmask8 mask.  */
#define _mm256_mask_srai_epi64(W, U, A, B) \
  ((__m256i) __builtin_ia32_psraqi256_mask ( \
      (__v4di)(__m256i)(A), \
      (int)(B), \
      (__v4di)(__m256i)(W), \
      (__mmask8)(U)))
/* Hands A (viewed as __v4di) and the int B to
   __builtin_ia32_psraqi256_mask, with an all-zero vector from
   _mm256_setzero_si256 () as the third operand and U as the __mmask8
   mask.  */
#define _mm256_maskz_srai_epi64(U, A, B) \
  ((__m256i) __builtin_ia32_psraqi256_mask ( \
      (__v4di)(__m256i)(A), \
      (int)(B), \
      (__v4di) _mm256_setzero_si256 (), \
      (__mmask8)(U)))
/* Unmasked form: hands A (viewed as __v2di) and the int B to
   __builtin_ia32_psraqi128_mask, with an all-zero vector from
   _mm_setzero_si128 () as the third operand and the mask (__mmask8)-1,
   i.e. every mask bit set.  */
#define _mm_srai_epi64(A, B) \
  ((__m128i) __builtin_ia32_psraqi128_mask ( \
      (__v2di)(__m128i)(A), \
      (int)(B), \
      (__v2di) _mm_setzero_si128 (), \
      (__mmask8)-1))
/* Hands A (viewed as __v2di) and the int B to
   __builtin_ia32_psraqi128_mask, with W as the third operand and U as
   the __mmask8 mask.  */
#define _mm_mask_srai_epi64(W, U, A, B) \
  ((__m128i) __builtin_ia32_psraqi128_mask ( \
      (__v2di)(__m128i)(A), \
      (int)(B), \
      (__v2di)(__m128i)(W), \
      (__mmask8)(U)))
/* Hands A (viewed as __v2di) and the int B to
   __builtin_ia32_psraqi128_mask, with an all-zero vector from
   _mm_setzero_si128 () as the third operand and U as the __mmask8
   mask.  */
#define _mm_maskz_srai_epi64(U, A, B) \
  ((__m128i) __builtin_ia32_psraqi128_mask ( \
      (__v2di)(__m128i)(A), \
      (int)(B), \
      (__v2di) _mm_setzero_si128 (), \
      (__mmask8)(U)))
/* Hands A (viewed as __v4df) and the int B to
   __builtin_ia32_permdf256_mask, with W as the third operand and U as
   the __mmask8 mask.  */
#define _mm256_mask_permutex_pd(W, U, A, B) \
  ((__m256d) __builtin_ia32_permdf256_mask ( \
      (__v4df)(__m256d)(A), \
      (int)(B), \
      (__v4df)(__m256d)(W), \
      (__mmask8)(U)))
/* Hands A (viewed as __v4df) and the int B to
   __builtin_ia32_permdf256_mask, with an all-zero vector from
   _mm256_setzero_pd () as the third operand and U as the __mmask8
   mask.  */
#define _mm256_maskz_permutex_pd(U, A, B) \
  ((__m256d) __builtin_ia32_permdf256_mask ( \
      (__v4df)(__m256d)(A), \
      (int)(B), \
      (__v4df)(__m256d) _mm256_setzero_pd (), \
      (__mmask8)(U)))
/* Hands X (viewed as __v4df) and the int C to
   __builtin_ia32_vpermilpd256_mask, with W as the third operand and U
   as the __mmask8 mask.  */
#define _mm256_mask_permute_pd(W, U, X, C) \
  ((__m256d) __builtin_ia32_vpermilpd256_mask ( \
      (__v4df)(__m256d)(X), \
      (int)(C), \
      (__v4df)(__m256d)(W), \
      (__mmask8)(U)))
/* Hands X (viewed as __v4df) and the int C to
   __builtin_ia32_vpermilpd256_mask, with an all-zero vector from
   _mm256_setzero_pd () as the third operand and U as the __mmask8
   mask.  */
#define _mm256_maskz_permute_pd(U, X, C) \
  ((__m256d) __builtin_ia32_vpermilpd256_mask ( \
      (__v4df)(__m256d)(X), \
      (int)(C), \
      (__v4df)(__m256d) _mm256_setzero_pd (), \
      (__mmask8)(U)))
/* Hands X (viewed as __v8sf) and the int C to
   __builtin_ia32_vpermilps256_mask, with W as the third operand and U
   as the __mmask8 mask.  */
#define _mm256_mask_permute_ps(W, U, X, C) \
  ((__m256) __builtin_ia32_vpermilps256_mask ( \
      (__v8sf)(__m256)(X), \
      (int)(C), \
      (__v8sf)(__m256)(W), \
      (__mmask8)(U)))
/* Hands X (viewed as __v8sf) and the int C to
   __builtin_ia32_vpermilps256_mask, with an all-zero vector from
   _mm256_setzero_ps () as the third operand and U as the __mmask8
   mask.  */
#define _mm256_maskz_permute_ps(U, X, C) \
  ((__m256) __builtin_ia32_vpermilps256_mask ( \
      (__v8sf)(__m256)(X), \
      (int)(C), \
      (__v8sf)(__m256) _mm256_setzero_ps (), \
      (__mmask8)(U)))
/* Hands X (viewed as __v2df) and the int C to
   __builtin_ia32_vpermilpd_mask, with W as the third operand and U as
   the __mmask8 mask.  */
#define _mm_mask_permute_pd(W, U, X, C) \
  ((__m128d) __builtin_ia32_vpermilpd_mask ( \
      (__v2df)(__m128d)(X), \
      (int)(C), \
      (__v2df)(__m128d)(W), \
      (__mmask8)(U)))
/* Hands X (viewed as __v2df) and the int C to
   __builtin_ia32_vpermilpd_mask, with an all-zero vector from
   _mm_setzero_pd () as the third operand and U as the __mmask8 mask.  */
#define _mm_maskz_permute_pd(U, X, C) \
  ((__m128d) __builtin_ia32_vpermilpd_mask ( \
      (__v2df)(__m128d)(X), \
      (int)(C), \
      (__v2df)(__m128d) _mm_setzero_pd (), \
      (__mmask8)(U)))
/* Hands X (viewed as __v4sf) and the int C to
   __builtin_ia32_vpermilps_mask, with W as the third operand and U as
   the __mmask8 mask.  */
#define _mm_mask_permute_ps(W, U, X, C) \
  ((__m128) __builtin_ia32_vpermilps_mask ( \
      (__v4sf)(__m128)(X), \
      (int)(C), \
      (__v4sf)(__m128)(W), \
      (__mmask8)(U)))
/* Hands X (viewed as __v4sf) and the int C to
   __builtin_ia32_vpermilps_mask, with an all-zero vector from
   _mm_setzero_ps () as the third operand and U as the __mmask8 mask.  */
#define _mm_maskz_permute_ps(U, X, C) \
  ((__m128) __builtin_ia32_vpermilps_mask ( \
      (__v4sf)(__m128)(X), \
      (int)(C), \
      (__v4sf)(__m128) _mm_setzero_ps (), \
      (__mmask8)(U)))
/* Hands __A and __W (both viewed as __v4df) and the __mmask8 __U, in
   that order, to __builtin_ia32_blendmpd_256_mask; the result is cast
   to __m256d.  */
#define _mm256_mask_blend_pd(__U, __A, __W) \
  ((__m256d) __builtin_ia32_blendmpd_256_mask ( \
      (__v4df) (__A), \
      (__v4df) (__W), \
      (__mmask8) (__U)))
/* Hands __A and __W (both viewed as __v8sf) and the __mmask8 __U, in
   that order, to __builtin_ia32_blendmps_256_mask; the result is cast
   to __m256.  */
#define _mm256_mask_blend_ps(__U, __A, __W) \
  ((__m256) __builtin_ia32_blendmps_256_mask ( \
      (__v8sf) (__A), \
      (__v8sf) (__W), \
      (__mmask8) (__U)))
/* Hands __A and __W (both viewed as __v4di) and the __mmask8 __U, in
   that order, to __builtin_ia32_blendmq_256_mask; the result is cast
   to __m256i.  */
#define _mm256_mask_blend_epi64(__U, __A, __W) \
  ((__m256i) __builtin_ia32_blendmq_256_mask ( \
      (__v4di) (__A), \
      (__v4di) (__W), \
      (__mmask8) (__U)))
/* Hands __A and __W (both viewed as __v8si) and the __mmask8 __U, in
   that order, to __builtin_ia32_blendmd_256_mask; the result is cast
   to __m256i.  */
#define _mm256_mask_blend_epi32(__U, __A, __W) \
  ((__m256i) __builtin_ia32_blendmd_256_mask ( \
      (__v8si) (__A), \
      (__v8si) (__W), \
      (__mmask8) (__U)))
/* Hands __A and __W (both viewed as __v2df) and the __mmask8 __U, in
   that order, to __builtin_ia32_blendmpd_128_mask; the result is cast
   to __m128d.  */
#define _mm_mask_blend_pd(__U, __A, __W) \
  ((__m128d) __builtin_ia32_blendmpd_128_mask ( \
      (__v2df) (__A), \
      (__v2df) (__W), \
      (__mmask8) (__U)))
/* Hands __A and __W (both viewed as __v4sf) and the __mmask8 __U, in
   that order, to __builtin_ia32_blendmps_128_mask; the result is cast
   to __m128.  */
#define _mm_mask_blend_ps(__U, __A, __W) \
  ((__m128) __builtin_ia32_blendmps_128_mask ( \
      (__v4sf) (__A), \
      (__v4sf) (__W), \
      (__mmask8) (__U)))
/* Hands __A and __W (both viewed as __v2di) and the __mmask8 __U, in
   that order, to __builtin_ia32_blendmq_128_mask; the result is cast
   to __m128i.  */
#define _mm_mask_blend_epi64(__U, __A, __W) \
  ((__m128i) __builtin_ia32_blendmq_128_mask ( \
      (__v2di) (__A), \
      (__v2di) (__W), \
      (__mmask8) (__U)))
/* Hands __A and __W (both viewed as __v4si) and the __mmask8 __U, in
   that order, to __builtin_ia32_blendmd_128_mask; the result is cast
   to __m128i.  */
#define _mm_mask_blend_epi32(__U, __A, __W) \
  ((__m128i) __builtin_ia32_blendmd_128_mask ( \
      (__v4si) (__A), \
      (__v4si) (__W), \
      (__mmask8) (__U)))
/* Unmasked form: hands X and Y (viewed as __v8si) and the int P to
   __builtin_ia32_ucmpd256_mask with the mask (__mmask8)-1, i.e. every
   mask bit set; the result is cast to __mmask8.  */
#define _mm256_cmp_epu32_mask(X, Y, P) \
  ((__mmask8) __builtin_ia32_ucmpd256_mask ( \
      (__v8si)(__m256i)(X), \
      (__v8si)(__m256i)(Y), \
      (int)(P), \
      (__mmask8)-1))
/* Unmasked form: hands X and Y (viewed as __v4di) and the int P to
   __builtin_ia32_cmpq256_mask with the mask (__mmask8)-1, i.e. every
   mask bit set; the result is cast to __mmask8.  */
#define _mm256_cmp_epi64_mask(X, Y, P) \
  ((__mmask8) __builtin_ia32_cmpq256_mask ( \
      (__v4di)(__m256i)(X), \
      (__v4di)(__m256i)(Y), \
      (int)(P), \
      (__mmask8)-1))
/* Unmasked form: hands X and Y (viewed as __v8si) and the int P to
   __builtin_ia32_cmpd256_mask with the mask (__mmask8)-1, i.e. every
   mask bit set; the result is cast to __mmask8.  */
#define _mm256_cmp_epi32_mask(X, Y, P) \
  ((__mmask8) __builtin_ia32_cmpd256_mask ( \
      (__v8si)(__m256i)(X), \
      (__v8si)(__m256i)(Y), \
      (int)(P), \
      (__mmask8)-1))
/* Unmasked form: hands X and Y (viewed as __v4di) and the int P to
   __builtin_ia32_ucmpq256_mask with the mask (__mmask8)-1, i.e. every
   mask bit set; the result is cast to __mmask8.  */
#define _mm256_cmp_epu64_mask(X, Y, P) \
  ((__mmask8) __builtin_ia32_ucmpq256_mask ( \
      (__v4di)(__m256i)(X), \
      (__v4di)(__m256i)(Y), \
      (int)(P), \
      (__mmask8)-1))
/* Unmasked form: hands X and Y (viewed as __v4df) and the int P to
   __builtin_ia32_cmppd256_mask with the mask (__mmask8)-1, i.e. every
   mask bit set; the result is cast to __mmask8.  */
#define _mm256_cmp_pd_mask(X, Y, P) \
  ((__mmask8) __builtin_ia32_cmppd256_mask ( \
      (__v4df)(__m256d)(X), \
      (__v4df)(__m256d)(Y), \
      (int)(P), \
      (__mmask8)-1))
/* Unmasked form: hands X and Y (viewed as __v8sf) and the int P to
   __builtin_ia32_cmpps256_mask with the mask (__mmask8)-1, i.e. every
   mask bit set; the result is cast to __mmask8.  */
#define _mm256_cmp_ps_mask(X, Y, P) \
  ((__mmask8) __builtin_ia32_cmpps256_mask ( \
      (__v8sf)(__m256)(X), \
      (__v8sf)(__m256)(Y), \
      (int)(P), \
      (__mmask8)-1))
/* Masked form: hands X and Y (viewed as __v4di) and the int P to
   __builtin_ia32_cmpq256_mask with M as the __mmask8 mask; the result
   is cast to __mmask8.  */
#define _mm256_mask_cmp_epi64_mask(M, X, Y, P) \
  ((__mmask8) __builtin_ia32_cmpq256_mask ( \
      (__v4di)(__m256i)(X), \
      (__v4di)(__m256i)(Y), \
      (int)(P), \
      (__mmask8)(M)))
/* Masked form: hands X and Y (viewed as __v8si) and the int P to
   __builtin_ia32_cmpd256_mask with M as the __mmask8 mask; the result
   is cast to __mmask8.  */
#define _mm256_mask_cmp_epi32_mask(M, X, Y, P) \
  ((__mmask8) __builtin_ia32_cmpd256_mask ( \
      (__v8si)(__m256i)(X), \
      (__v8si)(__m256i)(Y), \
      (int)(P), \
      (__mmask8)(M)))
/* Masked form: hands X and Y (viewed as __v4di) and the int P to
   __builtin_ia32_ucmpq256_mask with M as the __mmask8 mask; the result
   is cast to __mmask8.  */
#define _mm256_mask_cmp_epu64_mask(M, X, Y, P) \
  ((__mmask8) __builtin_ia32_ucmpq256_mask ( \
      (__v4di)(__m256i)(X), \
      (__v4di)(__m256i)(Y), \
      (int)(P), \
      (__mmask8)(M)))
/* Masked form: hands X and Y (viewed as __v8si) and the int P to
   __builtin_ia32_ucmpd256_mask with M as the __mmask8 mask; the result
   is cast to __mmask8.  */
#define _mm256_mask_cmp_epu32_mask(M, X, Y, P) \
  ((__mmask8) __builtin_ia32_ucmpd256_mask ( \
      (__v8si)(__m256i)(X), \
      (__v8si)(__m256i)(Y), \
      (int)(P), \
      (__mmask8)(M)))
/* Masked form: hands X and Y (viewed as __v4df) and the int P to
   __builtin_ia32_cmppd256_mask with M as the __mmask8 mask; the result
   is cast to __mmask8.  */
#define _mm256_mask_cmp_pd_mask(M, X, Y, P) \
  ((__mmask8) __builtin_ia32_cmppd256_mask ( \
      (__v4df)(__m256d)(X), \
      (__v4df)(__m256d)(Y), \
      (int)(P), \
      (__mmask8)(M)))
/* Masked form: hands X and Y (viewed as __v8sf) and the int P to
   __builtin_ia32_cmpps256_mask with M as the __mmask8 mask; the result
   is cast to __mmask8.  */
#define _mm256_mask_cmp_ps_mask(M, X, Y, P) \
  ((__mmask8) __builtin_ia32_cmpps256_mask ( \
      (__v8sf)(__m256)(X), \
      (__v8sf)(__m256)(Y), \
      (int)(P), \
      (__mmask8)(M)))
/* Unmasked form: hands X and Y (viewed as __v2di) and the int P to
   __builtin_ia32_cmpq128_mask with the mask (__mmask8)-1, i.e. every
   mask bit set; the result is cast to __mmask8.  */
#define _mm_cmp_epi64_mask(X, Y, P) \
  ((__mmask8) __builtin_ia32_cmpq128_mask ( \
      (__v2di)(__m128i)(X), \
      (__v2di)(__m128i)(Y), \
      (int)(P), \
      (__mmask8)-1))
/* Unmasked form: hands X and Y (viewed as __v4si) and the int P to
   __builtin_ia32_cmpd128_mask with the mask (__mmask8)-1, i.e. every
   mask bit set; the result is cast to __mmask8.  */
#define _mm_cmp_epi32_mask(X, Y, P) \
  ((__mmask8) __builtin_ia32_cmpd128_mask ( \
      (__v4si)(__m128i)(X), \
      (__v4si)(__m128i)(Y), \
      (int)(P), \
      (__mmask8)-1))
/* Unmasked form: hands X and Y (viewed as __v2di) and the int P to
   __builtin_ia32_ucmpq128_mask with the mask (__mmask8)-1, i.e. every
   mask bit set; the result is cast to __mmask8.  */
#define _mm_cmp_epu64_mask(X, Y, P) \
  ((__mmask8) __builtin_ia32_ucmpq128_mask ( \
      (__v2di)(__m128i)(X), \
      (__v2di)(__m128i)(Y), \
      (int)(P), \
      (__mmask8)-1))
/* Unmasked form: hands X and Y (viewed as __v4si) and the int P to
   __builtin_ia32_ucmpd128_mask with the mask (__mmask8)-1, i.e. every
   mask bit set; the result is cast to __mmask8.  */
#define _mm_cmp_epu32_mask(X, Y, P) \
  ((__mmask8) __builtin_ia32_ucmpd128_mask ( \
      (__v4si)(__m128i)(X), \
      (__v4si)(__m128i)(Y), \
      (int)(P), \
      (__mmask8)-1))
/* Unmasked form: hands X and Y (viewed as __v2df) and the int P to
   __builtin_ia32_cmppd128_mask with the mask (__mmask8)-1, i.e. every
   mask bit set; the result is cast to __mmask8.  */
#define _mm_cmp_pd_mask(X, Y, P) \
  ((__mmask8) __builtin_ia32_cmppd128_mask ( \
      (__v2df)(__m128d)(X), \
      (__v2df)(__m128d)(Y), \
      (int)(P), \
      (__mmask8)-1))
/* Unmasked form: hands X and Y (viewed as __v4sf) and the int P to
   __builtin_ia32_cmpps128_mask with the mask (__mmask8)-1, i.e. every
   mask bit set; the result is cast to __mmask8.  */
#define _mm_cmp_ps_mask(X, Y, P) \
  ((__mmask8) __builtin_ia32_cmpps128_mask ( \
      (__v4sf)(__m128)(X), \
      (__v4sf)(__m128)(Y), \
      (int)(P), \
      (__mmask8)-1))
/* Masked form: hands X and Y (viewed as __v2di) and the int P to
   __builtin_ia32_cmpq128_mask with M as the __mmask8 mask; the result
   is cast to __mmask8.  */
#define _mm_mask_cmp_epi64_mask(M, X, Y, P) \
  ((__mmask8) __builtin_ia32_cmpq128_mask ( \
      (__v2di)(__m128i)(X), \
      (__v2di)(__m128i)(Y), \
      (int)(P), \
      (__mmask8)(M)))
/* Masked form: hands X and Y (viewed as __v4si) and the int P to
   __builtin_ia32_cmpd128_mask with M as the __mmask8 mask; the result
   is cast to __mmask8.  */
#define _mm_mask_cmp_epi32_mask(M, X, Y, P) \
  ((__mmask8) __builtin_ia32_cmpd128_mask ( \
      (__v4si)(__m128i)(X), \
      (__v4si)(__m128i)(Y), \
      (int)(P), \
      (__mmask8)(M)))
/* Masked form: hands X and Y (viewed as __v2di) and the int P to
   __builtin_ia32_ucmpq128_mask with M as the __mmask8 mask; the result
   is cast to __mmask8.  */
#define _mm_mask_cmp_epu64_mask(M, X, Y, P) \
  ((__mmask8) __builtin_ia32_ucmpq128_mask ( \
      (__v2di)(__m128i)(X), \
      (__v2di)(__m128i)(Y), \
      (int)(P), \
      (__mmask8)(M)))
/* Masked form: hands X and Y (viewed as __v4si) and the int P to
   __builtin_ia32_ucmpd128_mask with M as the __mmask8 mask; the result
   is cast to __mmask8.  */
#define _mm_mask_cmp_epu32_mask(M, X, Y, P) \
  ((__mmask8) __builtin_ia32_ucmpd128_mask ( \
      (__v4si)(__m128i)(X), \
      (__v4si)(__m128i)(Y), \
      (int)(P), \
      (__mmask8)(M)))
/* Masked form: hands X and Y (viewed as __v2df) and the int P to
   __builtin_ia32_cmppd128_mask with M as the __mmask8 mask; the result
   is cast to __mmask8.  */
#define _mm_mask_cmp_pd_mask(M, X, Y, P) \
  ((__mmask8) __builtin_ia32_cmppd128_mask ( \
      (__v2df)(__m128d)(X), \
      (__v2df)(__m128d)(Y), \
      (int)(P), \
      (__mmask8)(M)))
/* Masked form: hands X and Y (viewed as __v4sf) and the int P to
   __builtin_ia32_cmpps128_mask with M as the __mmask8 mask; the result
   is cast to __mmask8.  */
#define _mm_mask_cmp_ps_mask(M, X, Y, P) \
  ((__mmask8) __builtin_ia32_cmpps128_mask ( \
      (__v4sf)(__m128)(X), \
      (__v4sf)(__m128)(Y), \
      (int)(P), \
      (__mmask8)(M)))
/* Alias for _mm256_permutevar8x32_ps with the two operands swapped:
   B is passed first and A second.  */
#define _mm256_permutexvar_ps(A, B) \
  _mm256_permutevar8x32_ps ((B), (A))
13582 #ifdef __DISABLE_AVX512VL__
13583 #undef __DISABLE_AVX512VL__
13584 #pragma GCC pop_options
13585 #endif /* __DISABLE_AVX512VL__ */
13587 #endif /* _AVX512VLINTRIN_H_INCLUDED */