1 /* { dg-do compile } */
2 /* { dg-options "-O2 -ftree-vectorize -ffast-math" } */
6 #define TEST_LOOP(NAME, OUTTYPE, INTYPE, MASKTYPE) \
7 void __attribute__ ((noinline, noclone)) \
8 NAME##_3 (OUTTYPE *__restrict dest, INTYPE *__restrict src, \
9 MASKTYPE *__restrict cond, INTYPE bias, int n) \
11 for (int i = 0; i < n; ++i) \
13 INTYPE value = src[i] + bias; \
16 dest[i * 3] = value; \
17 dest[i * 3 + 1] = value; \
18 dest[i * 3 + 2] = value; \
23 #define TEST2(NAME, OUTTYPE, INTYPE) \
24 TEST_LOOP (NAME##_i8, OUTTYPE, INTYPE, int8_t) \
25 TEST_LOOP (NAME##_i16, OUTTYPE, INTYPE, uint16_t) \
26 TEST_LOOP (NAME##_f32, OUTTYPE, INTYPE, float) \
27 TEST_LOOP (NAME##_f64, OUTTYPE, INTYPE, double)
29 #define TEST1(NAME, OUTTYPE) \
30 TEST2 (NAME##_i8, OUTTYPE, int8_t) \
31 TEST2 (NAME##_i16, OUTTYPE, uint16_t) \
32 TEST2 (NAME##_i32, OUTTYPE, int32_t) \
33 TEST2 (NAME##_i64, OUTTYPE, uint64_t)
36 TEST1 (NAME##_i8, int8_t) \
37 TEST1 (NAME##_i16, uint16_t) \
38 TEST1 (NAME##_i32, int32_t) \
39 TEST1 (NAME##_i64, uint64_t) \
40 TEST2 (NAME##_f16_f16, _Float16, _Float16) \
41 TEST2 (NAME##_f32_f32, float, float) \
42 TEST2 (NAME##_f64_f64, double, double)
52 /* { dg-final { scan-assembler-times {\tst3b\t.z[0-9]} 16 } } */
57 16 | 2 1 1 1 x2 (for _Float16)
60 /* { dg-final { scan-assembler-times {\tst3h\t.z[0-9]} 28 } } */
66 32 | 4 2 1 1 x2 (for float)
68 /* { dg-final { scan-assembler-times {\tst3w\t.z[0-9]} 50 } } */
75 64 | 8 4 2 1 x2 (for double). */
76 /* { dg-final { scan-assembler-times {\tst3d\t.z[0-9]} 98 } } */