1 /* Test vmov_n works correctly. */
3 /* { dg-options "-O3 --save-temps" } */
7 extern void abort (void);
/* Empty volatile asm statement with a "memory" clobber: it emits no
   instructions but tells the compiler that memory may have changed, so
   values cannot be cached or accesses reordered across it. */
9 #define INHIB_OPTIMIZATION asm volatile ("" : : : "memory")
/* CONCAT pastes its two arguments together verbatim. CONCAT1 forwards to
   CONCAT so that arguments which are themselves macros are expanded
   before they are pasted. */
11 #define CONCAT(a, b) a##b
12 #define CONCAT1(a, b) CONCAT (a, b)
/* REG_INFEX (reg_len) selects the macro REG_INFEX<reg_len>, which holds the
   part of an intrinsic name that depends on the register length; for 128
   that part is "q_". */
14 #define REG_INFEX128 q_
15 #define REG_INFEX(reg_len) REG_INFEX##reg_len
/* Name suffix of the "_n" intrinsics: the register infix followed by
   n_<data_type><data_len>, e.g. POSTFIX_N (128, 32, s) gives q_n_s32. */
16 #define POSTFIX_N(reg_len, data_len, data_type) \
17 CONCAT1 (REG_INFEX (reg_len), n_##data_type##data_len)
/* Name suffix of the "_lane" intrinsics: the register infix followed by
   lane_<data_type><data_len>, e.g. LANE_POSTFIX (128, 32, s) gives
   q_lane_s32. */
18 #define LANE_POSTFIX(reg_len, data_len, data_type) \
19 CONCAT1 (REG_INFEX (reg_len),lane_##data_type##data_len)
21 /* Test values consist of bytes with the following hex values.
23 TEST1 for int16_t will be 0xaaaa
24 TEST1 for int32_t will be 0xaaaaaaaa
/* TESTh_<bits> (x) builds the hex digits of test value x at the given
   width. TESTh_8 names the macro TEST<x>h; each wider form pastes two
   copies of the next narrower one side by side. */
34 #define TESTh_8(x) TEST##x##h
35 #define TESTh_16(x) CONCAT1 (TESTh_8 (x), TESTh_8 (x))
36 #define TESTh_32(x) CONCAT1 (TESTh_16 (x), TESTh_16 (x))
37 #define TESTh_64(x) CONCAT1 (TESTh_32 (x), TESTh_32 (x))
/* TEST_<bits> (x) turns the digits produced by TESTh_<bits> (x) into a
   hexadecimal constant by pasting a 0x prefix in front of them. */
39 #define TEST_8(x) CONCAT1 (0x, TESTh_8 (x))
40 #define TEST_16(x) CONCAT1 (0x, TESTh_16 (x))
41 #define TEST_32(x) CONCAT1 (0x, TESTh_32 (x))
42 #define TEST_64(x) CONCAT1 (0x, TESTh_64 (x))
/* TEST (test, data_len) dispatches to TEST_<data_len> (test), i.e. test
   value number `test` written at a width of data_len bits. */
44 #define TEST(test, data_len) \
45 CONCAT1 (TEST, _##data_len) (test)
/* Name of the lane-read intrinsic: "vget" followed by LANE_POSTFIX, e.g.
   vgetq_lane_s32 for (128, 32, s). */
47 #define GET_ELEMENT(reg_len, data_len, data_type) \
48 CONCAT1 (vget, LANE_POSTFIX (reg_len, data_len, data_type))
/* Name of the intrinsic under test: "vmov" followed by POSTFIX_N, e.g.
   vmovq_n_s32 for (128, 32, s). */
50 #define VMOV_INST(reg_len, data_len, data_type) \
51 CONCAT1 (vmov, POSTFIX_N (reg_len, data_len, data_type))
/* Name used to call the wrapper around the intrinsic: the VMOV_INST name
   with _obscure appended, e.g. vmovq_n_s32_obscure. RUN_TEST calls it with
   the address of the scalar operand. */
53 #define VMOV_OBSCURE_INST(reg_len, data_len, data_type) \
54 CONCAT1 (VMOV_INST (reg_len, data_len, data_type), _obscure)
/* One test step: store test value `test` in a, broadcast it into b through
   the _obscure wrapper (which receives &a), store the same test value in c,
   then walk lanes 0 .. n-1 of b and read each lane back into a with the
   lane-read intrinsic. */
56 #define RUN_TEST(reg_len, data_len, data_type, \
61 (a) = TEST (test, data_len); \
63 (b) = VMOV_OBSCURE_INST (reg_len, data_len, data_type) (&(a)); \
64 (c) = TEST (test, data_len); \
65 for (i = 0; i < n; i++) \
68 a = GET_ELEMENT (reg_len, data_len, data_type) (b, i); \
/* Type lookup table keyed by the pasted suffix <data_type><data_len>:
   TYPE_<suffix> is the scalar element type, TYPE_64_<suffix> and
   TYPE_128_<suffix> are the vector types for 64-bit and 128-bit
   registers. */
74 #define TYPE_f32 float32_t
75 #define TYPE_64_f32 float32x2_t
76 #define TYPE_128_f32 float32x4_t
78 #define TYPE_f64 float64_t
79 #define TYPE_64_f64 float64x1_t
80 #define TYPE_128_f64 float64x2_t
82 #define TYPE_s8 int8_t
83 #define TYPE_64_s8 int8x8_t
84 #define TYPE_128_s8 int8x16_t
86 #define TYPE_s16 int16_t
87 #define TYPE_64_s16 int16x4_t
88 #define TYPE_128_s16 int16x8_t
90 #define TYPE_s32 int32_t
91 #define TYPE_64_s32 int32x2_t
92 #define TYPE_128_s32 int32x4_t
94 #define TYPE_s64 int64_t
95 #define TYPE_64_s64 int64x1_t
96 #define TYPE_128_s64 int64x2_t
98 #define TYPE_u8 uint8_t
99 #define TYPE_64_u8 uint8x8_t
100 #define TYPE_128_u8 uint8x16_t
102 #define TYPE_u16 uint16_t
103 #define TYPE_64_u16 uint16x4_t
104 #define TYPE_128_u16 uint16x8_t
106 #define TYPE_u32 uint32_t
107 #define TYPE_64_u32 uint32x2_t
108 #define TYPE_128_u32 uint32x4_t
110 #define TYPE_u64 uint64_t
111 #define TYPE_64_u64 uint64x1_t
112 #define TYPE_128_u64 uint64x2_t
114 #define TYPE_p8 poly8_t
115 #define TYPE_64_p8 poly8x8_t
116 #define TYPE_128_p8 poly8x16_t
118 #define TYPE_p16 poly16_t
119 #define TYPE_64_p16 poly16x4_t
120 #define TYPE_128_p16 poly16x8_t
/* DIV (reg_len, data_len) pastes together the identifier
   DIV<reg_len>_<data_len>, e.g. DIV128_32. TESTFUNC passes the result to
   RUN_TEST; presumably it is the number of lanes -- confirm against the
   DIV<reg_len>_<data_len> definitions. */
132 #define DIV(reg_len, data_len) \
133 CONCAT1 (CONCAT1 (DIV, reg_len), \
134 CONCAT1 (_, data_len))
/* Vector type for the given register length and element. The pastes
   assemble a key beginning TYPE_<reg_len>_<data_type> for the TYPE_ table.
   Used as the return type of OBSCURE_FUNC and as the type of b in
   TESTFUNC. */
136 #define VECTOR_TYPE(reg_len, data_len, data_type) \
137 CONCAT1 (CONCAT1 (CONCAT1 (TYPE_,reg_len), \
138 CONCAT1 (_,data_type)), \
/* Scalar element type for (data_len, data_type). Used for the pointer
   parameter and the local of OBSCURE_FUNC, and for a and c in TESTFUNC. */
141 #define SIMPLE_TYPE(data_len, data_type) \
143 CONCAT1 (data_type, \
/* Name of the wrapper function that OBSCURE_FUNC defines; it starts with
   "vmov" followed by POSTFIX_N. Note the parameter order here is
   (reg_len, data_type, data_len), unlike most macros in this file. */
146 #define OBSCURE_FUNC_NAME(reg_len, data_type, data_len) \
147 CONCAT1 (CONCAT1 (vmov, \
148 POSTFIX_N (reg_len, data_len, data_type)), \
/* OBSCURE_FUNC (reg_len, data_len, data_type) emits the definition of the
   wrapper named by OBSCURE_FUNC_NAME. The wrapper is marked noinline, takes
   a pointer `ap` to the scalar type, declares a `register` local `a`, and
   returns VMOV_INST (...) (a). INHIB_OPTIMIZATION barriers sit between the
   declaration and the return. Presumably the indirection keeps the compiler
   from folding the broadcast at the call site -- confirm. */
151 #define OBSCURE_FUNC(reg_len, data_len, data_type) \
152 VECTOR_TYPE (reg_len, data_len, data_type) \
153 __attribute__ ((noinline)) \
154 OBSCURE_FUNC_NAME (reg_len, data_type, data_len) \
155 (SIMPLE_TYPE (data_len, data_type) *ap) \
157 SIMPLE_TYPE (data_len, data_type) register a; \
158 INHIB_OPTIMIZATION; \
160 INHIB_OPTIMIZATION; \
161 return VMOV_INST (reg_len, data_len, data_type) (a); \
/* Name of the test function that TESTFUNC defines: "test_vmov" followed by
   POSTFIX_N, e.g. test_vmovq_n_s32 for (128, s, 32). Note the parameter
   order here is (reg_len, data_type, data_len). */
164 #define TESTFUNC_NAME(reg_len, data_type, data_len) \
165 CONCAT1 (test_vmov, \
166 POSTFIX_N (reg_len, data_len, data_type))
/* TESTFUNC (reg_len, data_len, data_type) emits the test function named by
   TESTFUNC_NAME. It declares scalars a and c and vector b, then invokes
   RUN_TEST six times, once for each of test values 1 through 6, passing
   DIV (reg_len, data_len) as the fifth argument every time. */
168 #define TESTFUNC(reg_len, data_len, data_type) \
170 TESTFUNC_NAME (reg_len, data_type, data_len) () \
172 SIMPLE_TYPE (data_len, data_type) a; \
173 VECTOR_TYPE (reg_len, data_len, data_type) b; \
174 SIMPLE_TYPE (data_len, data_type) c; \
176 RUN_TEST (reg_len, data_len, data_type, 1, \
177 DIV (reg_len, data_len), a, b, c); \
178 RUN_TEST (reg_len, data_len, data_type, 2, \
179 DIV (reg_len, data_len), a, b, c); \
180 RUN_TEST (reg_len, data_len, data_type, 3, \
181 DIV (reg_len, data_len), a, b, c); \
182 RUN_TEST (reg_len, data_len, data_type, 4, \
183 DIV (reg_len, data_len), a, b, c); \
184 RUN_TEST (reg_len, data_len, data_type, 5, \
185 DIV (reg_len, data_len), a, b, c); \
186 RUN_TEST (reg_len, data_len, data_type, 6, \
187 DIV (reg_len, data_len), a, b, c); \
/* Wrapper instantiations for 64-bit registers, each followed by the
   assembler scan (or a pointer to it) that covers its element size. */
191 OBSCURE_FUNC (64, 32, f
)
193 /* "dup Vd.2s, Rn" is less preferable than "dup Vd.2s, Vn.s[lane]". */
194 /* { dg-final { scan-assembler-not "dup\\tv\[0-9\]+\.2s, w\[0-9\]+" } } */
195 /* { dg-final { scan-assembler-times "dup\\tv\[0-9\]+\.2s, v\[0-9\]+\.s\\\[\[0-9\]+\\\]" 3 } } */
197 OBSCURE_FUNC (64, 64, f
)
199 /* "fmov Dd, Rn" is generated instead of "dup Dd, Rn".
200 No assembly scan included. */
202 OBSCURE_FUNC (64, 8, p
)
204 /* Generates "dup Vd.8b, Rn". Scan found near s8 version. */
206 OBSCURE_FUNC (64, 16, p
)
208 /* Generates "dup Vd.4h, Rn". Scan found near s16 version. */
210 OBSCURE_FUNC (64, 8, s
)
212 /* { dg-final { scan-assembler-times "dup\\tv\[0-9\]+\.8b, w\[0-9\]+" 3 } } */
214 OBSCURE_FUNC (64, 16, s
)
216 /* { dg-final { scan-assembler-times "dup\\tv\[0-9\]+\.4h, w\[0-9\]+" 3 } } */
218 OBSCURE_FUNC (64, 32, s
)
220 /* "dup Vd.2s, Rn" is less preferable than "dup Vd.2s, Vn.s[lane]". */
221 /* { dg-final { scan-assembler-not "dup\\tv\[0-9\]+\.2s, w\[0-9\]+" } } */
222 /* { dg-final { scan-assembler-times "dup\\tv\[0-9\]+\.2s, v\[0-9\]+\.s\\\[\[0-9\]+\\\]" 3 } } */
224 OBSCURE_FUNC (64, 64, s
)
226 /* "fmov Dd, Rn" is generated instead of "dup Dd, Rn".
227 No assembly scan included. */
229 OBSCURE_FUNC (64, 8, u
)
231 /* Generates "dup Vd.8b, Rn". Scan found near s8 version. */
233 OBSCURE_FUNC (64, 16, u
)
235 /* Generates "dup Vd.4h, Rn". Scan found near s16 version. */
237 OBSCURE_FUNC (64, 32, u
)
239 /* Generates "dup Vd.2s, Rn". Scan found near s32 version. */
/* NOTE(review): the directives beside the s32 version use
   scan-assembler-not for "dup Vd.2s, Wn", which contradicts the comment
   above -- confirm which is intended. */
241 OBSCURE_FUNC (64, 64, u
)
243 /* "fmov Dd, Rn" is generated instead of "dup Dd, Rn".
244 No assembly scan included. */
/* Wrapper and test-function instantiations for 128-bit registers (the
   vmovq_n intrinsics), each followed by the assembler scan (or a pointer
   to it) that covers its element size. */
246 OBSCURE_FUNC (128, 32, f
)
247 TESTFUNC (128, 32, f
)
248 /* "dup Vd.4s, Rn" is less preferable than "dup Vd.4s, Vn.s[lane]". */
249 /* { dg-final { scan-assembler-not "dup\\tv\[0-9\]+\.4s, w\[0-9\]+" } } */
250 /* { dg-final { scan-assembler-times "dup\\tv\[0-9\]+\.4s, v\[0-9\]+\.s\\\[\[0-9\]+\\\]" 3 } } */
252 OBSCURE_FUNC (128, 64, f
)
253 TESTFUNC (128, 64, f
)
254 /* "dup Vd.2d, Rn" is less preferable than "dup Vd.2d, Vn.d[lane]". */
255 /* { dg-final { scan-assembler-not "dup\\tv\[0-9\]+\.2d, x\[0-9\]+" } } */
256 /* { dg-final { scan-assembler-times "dup\\tv\[0-9\]+\.2d, v\[0-9\]+\.d\\\[\[0-9\]+\\\]" 3 } } */
258 OBSCURE_FUNC (128, 8, p
)
260 /* Generates "dup Vd.16b, Rn". Scan found near s8 version. */
262 OBSCURE_FUNC (128, 16, p
)
263 TESTFUNC (128, 16, p
)
264 /* Generates "dup Vd.8h, Rn". Scan found near s16 version. */
266 OBSCURE_FUNC (128, 8, s
)
268 /* { dg-final { scan-assembler-times "dup\\tv\[0-9\]+\.16b, w\[0-9\]+" 3 } } */
270 OBSCURE_FUNC (128, 16, s
)
271 TESTFUNC (128, 16, s
)
272 /* { dg-final { scan-assembler-times "dup\\tv\[0-9\]+\.8h, w\[0-9\]+" 3 } } */
274 OBSCURE_FUNC (128, 32, s
)
275 TESTFUNC (128, 32, s
)
276 /* "dup Vd.4s, Rn" is less preferable than "dup Vd.4s, Vn.s[lane]". */
277 /* { dg-final { scan-assembler-not "dup\\tv\[0-9\]+\.4s, w\[0-9\]+" } } */
278 /* { dg-final { scan-assembler-times "dup\\tv\[0-9\]+\.4s, v\[0-9\]+\.s\\\[\[0-9\]+\\\]" 3 } } */
280 OBSCURE_FUNC (128, 64, s
)
281 TESTFUNC (128, 64, s
)
282 /* "dup Vd.2d, Rn" is less preferable than "dup Vd.2d, Vn.d[lane]". */
283 /* { dg-final { scan-assembler-not "dup\\tv\[0-9\]+\.2d, x\[0-9\]+" } } */
284 /* { dg-final { scan-assembler-times "dup\\tv\[0-9\]+\.2d, v\[0-9\]+\.d\\\[\[0-9\]+\\\]" 3 } } */
286 OBSCURE_FUNC (128, 8, u
)
288 /* Generates "dup Vd.16b, Rn". Scan found near s8 version. */
290 OBSCURE_FUNC (128, 16, u
)
291 TESTFUNC (128, 16, u
)
292 /* Generates "dup Vd.8h, Rn". Scan found near s16 version. */
294 OBSCURE_FUNC (128, 32, u
)
295 TESTFUNC (128, 32, u
)
296 /* Generates "dup Vd.4s, Rn". Scan found near s32 version. */
/* NOTE(review): the directives beside the s32 version use
   scan-assembler-not for "dup Vd.4s, Wn", which contradicts the comment
   above -- confirm which is intended. */
298 OBSCURE_FUNC (128, 64, u
)
299 TESTFUNC (128, 64, u
)
300 /* Generates "dup Vd.2d, Rn". Scan found near s64 version. */
/* NOTE(review): the directives beside the s64 version use
   scan-assembler-not for "dup Vd.2d, Xn", which contradicts the comment
   above -- confirm which is intended. */
/* Test driver: evaluates every test_vmov_n_<type> function and then every
   test_vmovq_n_<type> function, each as the condition of its own `if`.
   argc and argv are not referenced by the visible statements. */
303 main (int argc
, char **argv
)
305 if (test_vmov_n_f32 ())
307 if (test_vmov_n_f64 ())
309 if (test_vmov_n_p8 ())
311 if (test_vmov_n_p16 ())
313 if (test_vmov_n_s8 ())
315 if (test_vmov_n_s16 ())
317 if (test_vmov_n_s32 ())
319 if (test_vmov_n_s64 ())
321 if (test_vmov_n_u8 ())
323 if (test_vmov_n_u16 ())
325 if (test_vmov_n_u32 ())
327 if (test_vmov_n_u64 ())
330 if (test_vmovq_n_f32 ())
332 if (test_vmovq_n_f64 ())
334 if (test_vmovq_n_p8 ())
336 if (test_vmovq_n_p16 ())
338 if (test_vmovq_n_s8 ())
340 if (test_vmovq_n_s16 ())
342 if (test_vmovq_n_s32 ())
344 if (test_vmovq_n_s64 ())
346 if (test_vmovq_n_u8 ())
348 if (test_vmovq_n_u16 ())
350 if (test_vmovq_n_u32 ())
352 if (test_vmovq_n_u64 ())