2 * Generic vector operation expansion
4 * Copyright (c) 2018 Linaro
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2.1 of the License, or (at your option) any later version.
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
20 #ifndef TCG_TCG_OP_GVEC_H
21 #define TCG_TCG_OP_GVEC_H
24 * "Generic" vectors. All operands are given as offsets from ENV,
25 * and therefore cannot also be allocated via tcg_global_mem_new_*.
26 * OPRSZ is the byte size of the vector upon which the operation is performed.
27 * MAXSZ is the byte size of the full vector; bytes beyond OPSZ are cleared.
29 * All sizes must be 8 or any multiple of 16.
30 * When OPRSZ is 8, the alignment may be 8, otherwise must be 16.
31 * Operands may completely, but not partially, overlap.
34 /* Expand a call to a gvec-style helper, with pointers to two vector
35 operands, and a descriptor (see tcg-gvec-desc.h). */
36 typedef void gen_helper_gvec_2(TCGv_ptr
, TCGv_ptr
, TCGv_i32
);
37 void tcg_gen_gvec_2_ool(uint32_t dofs
, uint32_t aofs
,
38 uint32_t oprsz
, uint32_t maxsz
, int32_t data
,
39 gen_helper_gvec_2
*fn
);
41 /* Similarly, passing an extra data value. */
42 typedef void gen_helper_gvec_2i(TCGv_ptr
, TCGv_ptr
, TCGv_i64
, TCGv_i32
);
43 void tcg_gen_gvec_2i_ool(uint32_t dofs
, uint32_t aofs
, TCGv_i64 c
,
44 uint32_t oprsz
, uint32_t maxsz
, int32_t data
,
45 gen_helper_gvec_2i
*fn
);
47 /* Similarly, passing an extra pointer (e.g. env or float_status). */
48 typedef void gen_helper_gvec_2_ptr(TCGv_ptr
, TCGv_ptr
, TCGv_ptr
, TCGv_i32
);
49 void tcg_gen_gvec_2_ptr(uint32_t dofs
, uint32_t aofs
,
50 TCGv_ptr ptr
, uint32_t oprsz
, uint32_t maxsz
,
51 int32_t data
, gen_helper_gvec_2_ptr
*fn
);
53 /* Similarly, with three vector operands. */
54 typedef void gen_helper_gvec_3(TCGv_ptr
, TCGv_ptr
, TCGv_ptr
, TCGv_i32
);
55 void tcg_gen_gvec_3_ool(uint32_t dofs
, uint32_t aofs
, uint32_t bofs
,
56 uint32_t oprsz
, uint32_t maxsz
, int32_t data
,
57 gen_helper_gvec_3
*fn
);
59 /* Similarly, with four vector operands. */
60 typedef void gen_helper_gvec_4(TCGv_ptr
, TCGv_ptr
, TCGv_ptr
,
62 void tcg_gen_gvec_4_ool(uint32_t dofs
, uint32_t aofs
, uint32_t bofs
,
63 uint32_t cofs
, uint32_t oprsz
, uint32_t maxsz
,
64 int32_t data
, gen_helper_gvec_4
*fn
);
66 /* Similarly, with five vector operands. */
67 typedef void gen_helper_gvec_5(TCGv_ptr
, TCGv_ptr
, TCGv_ptr
, TCGv_ptr
,
69 void tcg_gen_gvec_5_ool(uint32_t dofs
, uint32_t aofs
, uint32_t bofs
,
70 uint32_t cofs
, uint32_t xofs
, uint32_t oprsz
,
71 uint32_t maxsz
, int32_t data
, gen_helper_gvec_5
*fn
);
73 typedef void gen_helper_gvec_3_ptr(TCGv_ptr
, TCGv_ptr
, TCGv_ptr
,
75 void tcg_gen_gvec_3_ptr(uint32_t dofs
, uint32_t aofs
, uint32_t bofs
,
76 TCGv_ptr ptr
, uint32_t oprsz
, uint32_t maxsz
,
77 int32_t data
, gen_helper_gvec_3_ptr
*fn
);
79 typedef void gen_helper_gvec_4_ptr(TCGv_ptr
, TCGv_ptr
, TCGv_ptr
,
80 TCGv_ptr
, TCGv_ptr
, TCGv_i32
);
81 void tcg_gen_gvec_4_ptr(uint32_t dofs
, uint32_t aofs
, uint32_t bofs
,
82 uint32_t cofs
, TCGv_ptr ptr
, uint32_t oprsz
,
83 uint32_t maxsz
, int32_t data
,
84 gen_helper_gvec_4_ptr
*fn
);
86 /* Expand a gvec operation. Either inline or out-of-line depending on
87 the actual vector size and the operations supported by the host. */
89 /* Expand inline as a 64-bit or 32-bit integer.
90 Only one of these will be non-NULL. */
91 void (*fni8
)(TCGv_i64
, TCGv_i64
);
92 void (*fni4
)(TCGv_i32
, TCGv_i32
);
93 /* Expand inline with a host vector type. */
94 void (*fniv
)(unsigned, TCGv_vec
, TCGv_vec
);
95 /* Expand out-of-line helper w/descriptor. */
96 gen_helper_gvec_2
*fno
;
97 /* The optional opcodes, if any, utilized by .fniv. */
98 const TCGOpcode
*opt_opc
;
99 /* The data argument to the out-of-line helper. */
101 /* The vector element size, if applicable. */
103 /* Prefer i64 to v64. */
108 /* Expand inline as a 64-bit or 32-bit integer.
109 Only one of these will be non-NULL. */
110 void (*fni8
)(TCGv_i64
, TCGv_i64
, int64_t);
111 void (*fni4
)(TCGv_i32
, TCGv_i32
, int32_t);
112 /* Expand inline with a host vector type. */
113 void (*fniv
)(unsigned, TCGv_vec
, TCGv_vec
, int64_t);
114 /* Expand out-of-line helper w/descriptor, data in descriptor. */
115 gen_helper_gvec_2
*fno
;
116 /* Expand out-of-line helper w/descriptor, data as argument. */
117 gen_helper_gvec_2i
*fnoi
;
118 /* The optional opcodes, if any, utilized by .fniv. */
119 const TCGOpcode
*opt_opc
;
120 /* The vector element size, if applicable. */
122 /* Prefer i64 to v64. */
124 /* Load dest as a 3rd source operand. */
129 /* Expand inline as a 64-bit or 32-bit integer.
130 Only one of these will be non-NULL. */
131 void (*fni8
)(TCGv_i64
, TCGv_i64
, TCGv_i64
);
132 void (*fni4
)(TCGv_i32
, TCGv_i32
, TCGv_i32
);
133 /* Expand inline with a host vector type. */
134 void (*fniv
)(unsigned, TCGv_vec
, TCGv_vec
, TCGv_vec
);
135 /* Expand out-of-line helper w/descriptor. */
136 gen_helper_gvec_2i
*fno
;
137 /* The optional opcodes, if any, utilized by .fniv. */
138 const TCGOpcode
*opt_opc
;
139 /* The data argument to the out-of-line helper. */
141 /* The vector element size, if applicable. */
143 /* Prefer i64 to v64. */
145 /* Load scalar as 1st source operand. */
150 /* Expand inline as a 64-bit or 32-bit integer.
151 Only one of these will be non-NULL. */
152 void (*fni8
)(TCGv_i64
, TCGv_i64
, TCGv_i64
);
153 void (*fni4
)(TCGv_i32
, TCGv_i32
, TCGv_i32
);
154 /* Expand inline with a host vector type. */
155 void (*fniv
)(unsigned, TCGv_vec
, TCGv_vec
, TCGv_vec
);
156 /* Expand out-of-line helper w/descriptor. */
157 gen_helper_gvec_3
*fno
;
158 /* The optional opcodes, if any, utilized by .fniv. */
159 const TCGOpcode
*opt_opc
;
160 /* The data argument to the out-of-line helper. */
162 /* The vector element size, if applicable. */
164 /* Prefer i64 to v64. */
166 /* Load dest as a 3rd source operand. */
172 * Expand inline as a 64-bit or 32-bit integer. Only one of these will be
175 void (*fni8
)(TCGv_i64
, TCGv_i64
, TCGv_i64
, int64_t);
176 void (*fni4
)(TCGv_i32
, TCGv_i32
, TCGv_i32
, int32_t);
177 /* Expand inline with a host vector type. */
178 void (*fniv
)(unsigned, TCGv_vec
, TCGv_vec
, TCGv_vec
, int64_t);
179 /* Expand out-of-line helper w/descriptor, data in descriptor. */
180 gen_helper_gvec_3
*fno
;
181 /* The optional opcodes, if any, utilized by .fniv. */
182 const TCGOpcode
*opt_opc
;
183 /* The vector element size, if applicable. */
185 /* Prefer i64 to v64. */
187 /* Load dest as a 3rd source operand. */
192 /* Expand inline as a 64-bit or 32-bit integer.
193 Only one of these will be non-NULL. */
194 void (*fni8
)(TCGv_i64
, TCGv_i64
, TCGv_i64
, TCGv_i64
);
195 void (*fni4
)(TCGv_i32
, TCGv_i32
, TCGv_i32
, TCGv_i32
);
196 /* Expand inline with a host vector type. */
197 void (*fniv
)(unsigned, TCGv_vec
, TCGv_vec
, TCGv_vec
, TCGv_vec
);
198 /* Expand out-of-line helper w/descriptor. */
199 gen_helper_gvec_4
*fno
;
200 /* The optional opcodes, if any, utilized by .fniv. */
201 const TCGOpcode
*opt_opc
;
202 /* The data argument to the out-of-line helper. */
204 /* The vector element size, if applicable. */
206 /* Prefer i64 to v64. */
208 /* Write aofs as a 2nd dest operand. */
212 void tcg_gen_gvec_2(uint32_t dofs
, uint32_t aofs
,
213 uint32_t oprsz
, uint32_t maxsz
, const GVecGen2
*);
214 void tcg_gen_gvec_2i(uint32_t dofs
, uint32_t aofs
, uint32_t oprsz
,
215 uint32_t maxsz
, int64_t c
, const GVecGen2i
*);
216 void tcg_gen_gvec_2s(uint32_t dofs
, uint32_t aofs
, uint32_t oprsz
,
217 uint32_t maxsz
, TCGv_i64 c
, const GVecGen2s
*);
218 void tcg_gen_gvec_3(uint32_t dofs
, uint32_t aofs
, uint32_t bofs
,
219 uint32_t oprsz
, uint32_t maxsz
, const GVecGen3
*);
220 void tcg_gen_gvec_3i(uint32_t dofs
, uint32_t aofs
, uint32_t bofs
,
221 uint32_t oprsz
, uint32_t maxsz
, int64_t c
,
223 void tcg_gen_gvec_4(uint32_t dofs
, uint32_t aofs
, uint32_t bofs
, uint32_t cofs
,
224 uint32_t oprsz
, uint32_t maxsz
, const GVecGen4
*);
226 /* Expand a specific vector operation. */
228 void tcg_gen_gvec_mov(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
229 uint32_t oprsz
, uint32_t maxsz
);
230 void tcg_gen_gvec_not(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
231 uint32_t oprsz
, uint32_t maxsz
);
232 void tcg_gen_gvec_neg(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
233 uint32_t oprsz
, uint32_t maxsz
);
234 void tcg_gen_gvec_abs(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
235 uint32_t oprsz
, uint32_t maxsz
);
237 void tcg_gen_gvec_add(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
238 uint32_t bofs
, uint32_t oprsz
, uint32_t maxsz
);
239 void tcg_gen_gvec_sub(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
240 uint32_t bofs
, uint32_t oprsz
, uint32_t maxsz
);
241 void tcg_gen_gvec_mul(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
242 uint32_t bofs
, uint32_t oprsz
, uint32_t maxsz
);
244 void tcg_gen_gvec_addi(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
245 int64_t c
, uint32_t oprsz
, uint32_t maxsz
);
246 void tcg_gen_gvec_muli(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
247 int64_t c
, uint32_t oprsz
, uint32_t maxsz
);
249 void tcg_gen_gvec_adds(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
250 TCGv_i64 c
, uint32_t oprsz
, uint32_t maxsz
);
251 void tcg_gen_gvec_subs(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
252 TCGv_i64 c
, uint32_t oprsz
, uint32_t maxsz
);
253 void tcg_gen_gvec_muls(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
254 TCGv_i64 c
, uint32_t oprsz
, uint32_t maxsz
);
256 /* Saturated arithmetic. */
257 void tcg_gen_gvec_ssadd(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
258 uint32_t bofs
, uint32_t oprsz
, uint32_t maxsz
);
259 void tcg_gen_gvec_sssub(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
260 uint32_t bofs
, uint32_t oprsz
, uint32_t maxsz
);
261 void tcg_gen_gvec_usadd(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
262 uint32_t bofs
, uint32_t oprsz
, uint32_t maxsz
);
263 void tcg_gen_gvec_ussub(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
264 uint32_t bofs
, uint32_t oprsz
, uint32_t maxsz
);
267 void tcg_gen_gvec_smin(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
268 uint32_t bofs
, uint32_t oprsz
, uint32_t maxsz
);
269 void tcg_gen_gvec_umin(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
270 uint32_t bofs
, uint32_t oprsz
, uint32_t maxsz
);
271 void tcg_gen_gvec_smax(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
272 uint32_t bofs
, uint32_t oprsz
, uint32_t maxsz
);
273 void tcg_gen_gvec_umax(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
274 uint32_t bofs
, uint32_t oprsz
, uint32_t maxsz
);
276 void tcg_gen_gvec_and(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
277 uint32_t bofs
, uint32_t oprsz
, uint32_t maxsz
);
278 void tcg_gen_gvec_or(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
279 uint32_t bofs
, uint32_t oprsz
, uint32_t maxsz
);
280 void tcg_gen_gvec_xor(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
281 uint32_t bofs
, uint32_t oprsz
, uint32_t maxsz
);
282 void tcg_gen_gvec_andc(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
283 uint32_t bofs
, uint32_t oprsz
, uint32_t maxsz
);
284 void tcg_gen_gvec_orc(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
285 uint32_t bofs
, uint32_t oprsz
, uint32_t maxsz
);
286 void tcg_gen_gvec_nand(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
287 uint32_t bofs
, uint32_t oprsz
, uint32_t maxsz
);
288 void tcg_gen_gvec_nor(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
289 uint32_t bofs
, uint32_t oprsz
, uint32_t maxsz
);
290 void tcg_gen_gvec_eqv(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
291 uint32_t bofs
, uint32_t oprsz
, uint32_t maxsz
);
293 void tcg_gen_gvec_andi(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
294 int64_t c
, uint32_t oprsz
, uint32_t maxsz
);
295 void tcg_gen_gvec_xori(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
296 int64_t c
, uint32_t oprsz
, uint32_t maxsz
);
297 void tcg_gen_gvec_ori(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
298 int64_t c
, uint32_t oprsz
, uint32_t maxsz
);
300 void tcg_gen_gvec_ands(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
301 TCGv_i64 c
, uint32_t oprsz
, uint32_t maxsz
);
302 void tcg_gen_gvec_xors(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
303 TCGv_i64 c
, uint32_t oprsz
, uint32_t maxsz
);
304 void tcg_gen_gvec_ors(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
305 TCGv_i64 c
, uint32_t oprsz
, uint32_t maxsz
);
307 void tcg_gen_gvec_dup_mem(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
308 uint32_t s
, uint32_t m
);
309 void tcg_gen_gvec_dup_i32(unsigned vece
, uint32_t dofs
, uint32_t s
,
310 uint32_t m
, TCGv_i32
);
311 void tcg_gen_gvec_dup_i64(unsigned vece
, uint32_t dofs
, uint32_t s
,
312 uint32_t m
, TCGv_i64
);
314 void tcg_gen_gvec_dup8i(uint32_t dofs
, uint32_t s
, uint32_t m
, uint8_t x
);
315 void tcg_gen_gvec_dup16i(uint32_t dofs
, uint32_t s
, uint32_t m
, uint16_t x
);
316 void tcg_gen_gvec_dup32i(uint32_t dofs
, uint32_t s
, uint32_t m
, uint32_t x
);
317 void tcg_gen_gvec_dup64i(uint32_t dofs
, uint32_t s
, uint32_t m
, uint64_t x
);
319 void tcg_gen_gvec_shli(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
320 int64_t shift
, uint32_t oprsz
, uint32_t maxsz
);
321 void tcg_gen_gvec_shri(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
322 int64_t shift
, uint32_t oprsz
, uint32_t maxsz
);
323 void tcg_gen_gvec_sari(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
324 int64_t shift
, uint32_t oprsz
, uint32_t maxsz
);
326 void tcg_gen_gvec_shls(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
327 TCGv_i32 shift
, uint32_t oprsz
, uint32_t maxsz
);
328 void tcg_gen_gvec_shrs(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
329 TCGv_i32 shift
, uint32_t oprsz
, uint32_t maxsz
);
330 void tcg_gen_gvec_sars(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
331 TCGv_i32 shift
, uint32_t oprsz
, uint32_t maxsz
);
334 * Perform vector shift by vector element, modulo the element size.
335 * E.g. D[i] = A[i] << (B[i] % (8 << vece)).
337 void tcg_gen_gvec_shlv(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
338 uint32_t bofs
, uint32_t oprsz
, uint32_t maxsz
);
339 void tcg_gen_gvec_shrv(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
340 uint32_t bofs
, uint32_t oprsz
, uint32_t maxsz
);
341 void tcg_gen_gvec_sarv(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
342 uint32_t bofs
, uint32_t oprsz
, uint32_t maxsz
);
344 void tcg_gen_gvec_cmp(TCGCond cond
, unsigned vece
, uint32_t dofs
,
345 uint32_t aofs
, uint32_t bofs
,
346 uint32_t oprsz
, uint32_t maxsz
);
349 * Perform vector bit select: d = (b & a) | (c & ~a).
351 void tcg_gen_gvec_bitsel(unsigned vece
, uint32_t dofs
, uint32_t aofs
,
352 uint32_t bofs
, uint32_t cofs
,
353 uint32_t oprsz
, uint32_t maxsz
);
356 * 64-bit vector operations. Use these when the register has been allocated
357 * with tcg_global_mem_new_i64, and so we cannot also address it via pointer.
361 void tcg_gen_vec_neg8_i64(TCGv_i64 d
, TCGv_i64 a
);
362 void tcg_gen_vec_neg16_i64(TCGv_i64 d
, TCGv_i64 a
);
363 void tcg_gen_vec_neg32_i64(TCGv_i64 d
, TCGv_i64 a
);
365 void tcg_gen_vec_add8_i64(TCGv_i64 d
, TCGv_i64 a
, TCGv_i64 b
);
366 void tcg_gen_vec_add16_i64(TCGv_i64 d
, TCGv_i64 a
, TCGv_i64 b
);
367 void tcg_gen_vec_add32_i64(TCGv_i64 d
, TCGv_i64 a
, TCGv_i64 b
);
369 void tcg_gen_vec_sub8_i64(TCGv_i64 d
, TCGv_i64 a
, TCGv_i64 b
);
370 void tcg_gen_vec_sub16_i64(TCGv_i64 d
, TCGv_i64 a
, TCGv_i64 b
);
371 void tcg_gen_vec_sub32_i64(TCGv_i64 d
, TCGv_i64 a
, TCGv_i64 b
);
373 void tcg_gen_vec_shl8i_i64(TCGv_i64 d
, TCGv_i64 a
, int64_t);
374 void tcg_gen_vec_shl16i_i64(TCGv_i64 d
, TCGv_i64 a
, int64_t);
375 void tcg_gen_vec_shr8i_i64(TCGv_i64 d
, TCGv_i64 a
, int64_t);
376 void tcg_gen_vec_shr16i_i64(TCGv_i64 d
, TCGv_i64 a
, int64_t);
377 void tcg_gen_vec_sar8i_i64(TCGv_i64 d
, TCGv_i64 a
, int64_t);
378 void tcg_gen_vec_sar16i_i64(TCGv_i64 d
, TCGv_i64 a
, int64_t);