1 /* { dg-do compile } */
2 /* { dg-options "-O2 -ftree-vectorize -ffast-math" } */
4 #define TEST_LOOP(NAME, OUTTYPE, INTYPE, MASKTYPE) \
5 void __attribute__ ((noinline, noclone)) \
6 NAME##_2 (OUTTYPE *__restrict dest, INTYPE *__restrict src, \
7 MASKTYPE *__restrict cond, int n) \
9 for (int i = 0; i < n; ++i) \
11 dest[i] = src[i * 2] + src[i * 2 + 1]; \
14 #define TEST2(NAME, OUTTYPE, INTYPE) \
15 TEST_LOOP (NAME##_i8, OUTTYPE, INTYPE, signed char) \
16 TEST_LOOP (NAME##_i16, OUTTYPE, INTYPE, unsigned short) \
17 TEST_LOOP (NAME##_f32, OUTTYPE, INTYPE, float) \
18 TEST_LOOP (NAME##_f64, OUTTYPE, INTYPE, double)
20 #define TEST1(NAME, OUTTYPE) \
21 TEST2 (NAME##_i8, OUTTYPE, signed char) \
22 TEST2 (NAME##_i16, OUTTYPE, unsigned short) \
23 TEST2 (NAME##_i32, OUTTYPE, int) \
24 TEST2 (NAME##_i64, OUTTYPE, unsigned long)
27 TEST1 (NAME##_i8, signed char) \
28 TEST1 (NAME##_i16, unsigned short) \
29 TEST1 (NAME##_i32, int) \
30 TEST1 (NAME##_i64, unsigned long) \
31 TEST2 (NAME##_f16_f16, _Float16, _Float16) \
32 TEST2 (NAME##_f32_f32, float, float) \
33 TEST2 (NAME##_f64_f64, double, double)
43 /* { dg-final { scan-assembler-times {\tld2b\t.z[0-9]} 16 } } */
48 16 | 2 1 1 1 x2 (for half float)
51 /* { dg-final { scan-assembler-times {\tld2h\t.z[0-9]} 28 } } */
57 32 | 4 2 1 1 x2 (for float)
59 /* { dg-final { scan-assembler-times {\tld2w\t.z[0-9]} 50 } } */
66 64 | 8 4 2 1 x2 (for double). */
67 /* { dg-final { scan-assembler-times {\tld2d\t.z[0-9]} 98 } } */