scsi: move host_status handling into SCSI drivers
[qemu/ar7.git] / target / hexagon / imported / alu.idef
blob45cc529fbc988811b23a12456a2a6278a2290e96
1 /*
2  *  Copyright(c) 2019-2021 Qualcomm Innovation Center, Inc. All Rights Reserved.
3  *
4  *  This program is free software; you can redistribute it and/or modify
5  *  it under the terms of the GNU General Public License as published by
6  *  the Free Software Foundation; either version 2 of the License, or
7  *  (at your option) any later version.
8  *
9  *  This program is distributed in the hope that it will be useful,
10  *  but WITHOUT ANY WARRANTY; without even the implied warranty of
11  *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
12  *  GNU General Public License for more details.
13  *
14  *  You should have received a copy of the GNU General Public License
15  *  along with this program; if not, see <http://www.gnu.org/licenses/>.
16  */
19  * ALU Instructions
20  */
23 /**********************************************/
24 /* Add/Sub instructions                       */
25 /**********************************************/
27 Q6INSN(A2_add,"Rd32=add(Rs32,Rt32)",ATTRIBS(),
28 "Add 32-bit registers",
29 { RdV=RsV+RtV;})
31 Q6INSN(A2_sub,"Rd32=sub(Rt32,Rs32)",ATTRIBS(),
32 "Subtract 32-bit registers",
33 { RdV=RtV-RsV;})
35 #define COND_ALU(TAG,OPER,DESCR,SEMANTICS)\
36 Q6INSN(TAG##t,"if (Pu4) "OPER,ATTRIBS(A_ARCHV2),DESCR,{if(fLSBOLD(PuV)){SEMANTICS;} else {CANCEL;}})\
37 Q6INSN(TAG##f,"if (!Pu4) "OPER,ATTRIBS(A_ARCHV2),DESCR,{if(fLSBOLDNOT(PuV)){SEMANTICS;} else {CANCEL;}})\
38 Q6INSN(TAG##tnew,"if (Pu4.new) " OPER,ATTRIBS(A_ARCHV2),DESCR,{if(fLSBNEW(PuN)){SEMANTICS;} else {CANCEL;}})\
39 Q6INSN(TAG##fnew,"if (!Pu4.new) "OPER,ATTRIBS(A_ARCHV2),DESCR,{if(fLSBNEWNOT(PuN)){SEMANTICS;} else {CANCEL;}})
41 COND_ALU(A2_padd,"Rd32=add(Rs32,Rt32)","Conditionally Add 32-bit registers",RdV=RsV+RtV)
42 COND_ALU(A2_psub,"Rd32=sub(Rt32,Rs32)","Conditionally Subtract 32-bit registers",RdV=RtV-RsV)
43 COND_ALU(A2_paddi,"Rd32=add(Rs32,#s8)","Conditionally Add Register and immediate",fIMMEXT(siV); RdV=RsV+siV)
44 COND_ALU(A2_pxor,"Rd32=xor(Rs32,Rt32)","Conditionally XOR registers",RdV=RsV^RtV)
45 COND_ALU(A2_pand,"Rd32=and(Rs32,Rt32)","Conditionally AND registers",RdV=RsV&RtV)
46 COND_ALU(A2_por,"Rd32=or(Rs32,Rt32)","Conditionally OR registers",RdV=RsV|RtV)
48 COND_ALU(A4_psxtb,"Rd32=sxtb(Rs32)","Conditionally sign-extend byte", RdV=fSXTN(8,32,RsV))
49 COND_ALU(A4_pzxtb,"Rd32=zxtb(Rs32)","Conditionally zero-extend byte", RdV=fZXTN(8,32,RsV))
50 COND_ALU(A4_psxth,"Rd32=sxth(Rs32)","Conditionally sign-extend halfword", RdV=fSXTN(16,32,RsV))
51 COND_ALU(A4_pzxth,"Rd32=zxth(Rs32)","Conditionally zero-extend halfword", RdV=fZXTN(16,32,RsV))
52 COND_ALU(A4_paslh,"Rd32=aslh(Rs32)","Conditionally zero-extend halfword", RdV=RsV<<16)
53 COND_ALU(A4_pasrh,"Rd32=asrh(Rs32)","Conditionally zero-extend halfword", RdV=RsV>>16)
56 Q6INSN(A2_addsat,"Rd32=add(Rs32,Rt32):sat",ATTRIBS(),
57 "Add 32-bit registers with saturation",
58 { RdV=fSAT(fSE32_64(RsV)+fSE32_64(RtV)); })
60 Q6INSN(A2_subsat,"Rd32=sub(Rt32,Rs32):sat",ATTRIBS(),
61 "Subtract 32-bit registers with saturation",
62 { RdV=fSAT(fSE32_64(RtV) - fSE32_64(RsV)); })
65 Q6INSN(A2_addi,"Rd32=add(Rs32,#s16)",ATTRIBS(),
66 "Add a signed immediate to a register",
67 { fIMMEXT(siV); RdV=RsV+siV;})
70 Q6INSN(C4_addipc,"Rd32=add(pc,#u6)",ATTRIBS(),
71 "Add immediate to PC",
72 { RdV=fREAD_PC()+fIMMEXT(uiV);})
76 /**********************************************/
77 /* Single-precision HL forms                  */
78 /* These insns and the SP mpy are the ones    */
79 /* that can do .HL stuff                      */
80 /**********************************************/
81 #define STD_HL_INSN(TAG,OPER,AOPER,ATR,SEM)\
82 Q6INSN(A2_##TAG##_ll, OPER"(Rt.L32,Rs.L32)"AOPER,    ATR,"",{SEM(fGETHALF(0,RtV),fGETHALF(0,RsV));})\
83 Q6INSN(A2_##TAG##_lh, OPER"(Rt.L32,Rs.H32)"AOPER,    ATR,"",{SEM(fGETHALF(0,RtV),fGETHALF(1,RsV));})\
84 Q6INSN(A2_##TAG##_hl, OPER"(Rt.H32,Rs.L32)"AOPER,    ATR,"",{SEM(fGETHALF(1,RtV),fGETHALF(0,RsV));})\
85 Q6INSN(A2_##TAG##_hh, OPER"(Rt.H32,Rs.H32)"AOPER,    ATR,"",{SEM(fGETHALF(1,RtV),fGETHALF(1,RsV));})
87 #define SUBSTD_HL_INSN(TAG,OPER,AOPER,ATR,SEM)\
88 Q6INSN(A2_##TAG##_ll, OPER"(Rt.L32,Rs.L32)"AOPER,    ATR,"",{SEM(fGETHALF(0,RtV),fGETHALF(0,RsV));})\
89 Q6INSN(A2_##TAG##_hl, OPER"(Rt.L32,Rs.H32)"AOPER,    ATR,"",{SEM(fGETHALF(0,RtV),fGETHALF(1,RsV));})
92 #undef HLSEM
93 #define HLSEM(A,B) RdV=fSXTN(16,32,(A+B))
94 SUBSTD_HL_INSN(addh_l16,"Rd32=add","",ATTRIBS(),HLSEM)
96 #undef HLSEM
97 #define HLSEM(A,B) RdV=fSATH(A+B)
98 SUBSTD_HL_INSN(addh_l16_sat,"Rd32=add",":sat",ATTRIBS(),HLSEM)
100 #undef HLSEM
101 #define HLSEM(A,B) RdV=fSXTN(16,32,(A-B))
102 SUBSTD_HL_INSN(subh_l16,"Rd32=sub","",ATTRIBS(),HLSEM)
104 #undef HLSEM
105 #define HLSEM(A,B) RdV=fSATH(A-B)
106 SUBSTD_HL_INSN(subh_l16_sat,"Rd32=sub",":sat",ATTRIBS(),HLSEM)
108 #undef HLSEM
109 #define HLSEM(A,B) RdV=(A+B)<<16
110 STD_HL_INSN(addh_h16,"Rd32=add",":<<16",ATTRIBS(),HLSEM)
112 #undef HLSEM
113 #define HLSEM(A,B) RdV=(fSATH(A+B))<<16
114 STD_HL_INSN(addh_h16_sat,"Rd32=add",":sat:<<16",ATTRIBS(),HLSEM)
116 #undef HLSEM
117 #define HLSEM(A,B) RdV=(A-B)<<16
118 STD_HL_INSN(subh_h16,"Rd32=sub",":<<16",ATTRIBS(),HLSEM)
120 #undef HLSEM
121 #define HLSEM(A,B) RdV=(fSATH(A-B))<<16
122 STD_HL_INSN(subh_h16_sat,"Rd32=sub",":sat:<<16",ATTRIBS(),HLSEM)
127 Q6INSN(A2_aslh,"Rd32=aslh(Rs32)",ATTRIBS(),
128 "Arithmetic Shift Left by Halfword",{ RdV=RsV<<16; })
130 Q6INSN(A2_asrh,"Rd32=asrh(Rs32)",ATTRIBS(),
131 "Arithmetic Shift Right by Halfword",{ RdV=RsV>>16; })
134 /* 64-bit versions */
136 Q6INSN(A2_addp,"Rdd32=add(Rss32,Rtt32)",ATTRIBS(),
137 "Add",
138 { RddV=RssV+RttV;})
140 Q6INSN(A2_addpsat,"Rdd32=add(Rss32,Rtt32):sat",ATTRIBS(A_ARCHV3),
141 "Add",
142 { fADDSAT64(RddV,RssV,RttV);})
144 Q6INSN(A2_addspl,"Rdd32=add(Rss32,Rtt32):raw:lo",ATTRIBS(A_ARCHV3),
145 "Add",
146 { RddV=RttV+fSXTN(32,64,fGETWORD(0,RssV));})
148 Q6INSN(A2_addsph,"Rdd32=add(Rss32,Rtt32):raw:hi",ATTRIBS(A_ARCHV3),
149 "Add",
150 { RddV=RttV+fSXTN(32,64,fGETWORD(1,RssV));})
152 Q6INSN(A2_subp,"Rdd32=sub(Rtt32,Rss32)",ATTRIBS(),
153 "Sub",
154 { RddV=RttV-RssV;})
156 /* NEG and ABS */
158 Q6INSN(A2_negsat,"Rd32=neg(Rs32):sat",ATTRIBS(),
159 "Arithmetic negate register", { RdV = fSAT(-fCAST8s(RsV)); })
161 Q6INSN(A2_abs,"Rd32=abs(Rs32)",ATTRIBS(),
162 "Absolute Value register", { RdV = fABS(RsV); })
164 Q6INSN(A2_abssat,"Rd32=abs(Rs32):sat",ATTRIBS(),
165 "Arithmetic negate register", { RdV = fSAT(fABS(fCAST4_8s(RsV))); })
167 Q6INSN(A2_vconj,"Rdd32=vconj(Rss32):sat",ATTRIBS(A_ARCHV2),
168 "Vector Complex conjugate of Rss",
169 {  fSETHALF(1,RddV,fSATN(16,-fGETHALF(1,RssV)));
170    fSETHALF(0,RddV,fGETHALF(0,RssV));
171    fSETHALF(3,RddV,fSATN(16,-fGETHALF(3,RssV)));
172    fSETHALF(2,RddV,fGETHALF(2,RssV));
176 /* 64-bit versions */
178 Q6INSN(A2_negp,"Rdd32=neg(Rss32)",ATTRIBS(),
179 "Arithmetic negate register", { RddV = -RssV; })
181 Q6INSN(A2_absp,"Rdd32=abs(Rss32)",ATTRIBS(),
182 "Absolute Value register", { RddV = fABS(RssV); })
185 /* MIN and MAX  R */
187 Q6INSN(A2_max,"Rd32=max(Rs32,Rt32)",ATTRIBS(),
188 "Maximum of two registers",
189 { RdV = fMAX(RsV,RtV); })
191 Q6INSN(A2_maxu,"Rd32=maxu(Rs32,Rt32)",ATTRIBS(),
192 "Maximum of two registers (unsigned)",
193 { RdV = fMAX(fCAST4u(RsV),fCAST4u(RtV)); })
195 Q6INSN(A2_min,"Rd32=min(Rt32,Rs32)",ATTRIBS(),
196 "Minimum of two registers",
197 { RdV = fMIN(RtV,RsV); })
199 Q6INSN(A2_minu,"Rd32=minu(Rt32,Rs32)",ATTRIBS(),
200 "Minimum of two registers (unsigned)",
201 { RdV = fMIN(fCAST4u(RtV),fCAST4u(RsV)); })
203 /* MIN and MAX Pairs */
204 #if 1
205 Q6INSN(A2_maxp,"Rdd32=max(Rss32,Rtt32)",ATTRIBS(A_ARCHV3),
206 "Maximum of two register pairs",
207 { RddV = fMAX(RssV,RttV); })
209 Q6INSN(A2_maxup,"Rdd32=maxu(Rss32,Rtt32)",ATTRIBS(A_ARCHV3),
210 "Maximum of two register pairs (unsigned)",
211 { RddV = fMAX(fCAST8u(RssV),fCAST8u(RttV)); })
213 Q6INSN(A2_minp,"Rdd32=min(Rtt32,Rss32)",ATTRIBS(A_ARCHV3),
214 "Minimum of two register pairs",
215 { RddV = fMIN(RttV,RssV); })
217 Q6INSN(A2_minup,"Rdd32=minu(Rtt32,Rss32)",ATTRIBS(A_ARCHV3),
218 "Minimum of two register pairs (unsigned)",
219 { RddV = fMIN(fCAST8u(RttV),fCAST8u(RssV)); })
220 #endif
222 /**********************************************/
223 /* Register and Immediate Transfers           */
224 /**********************************************/
226 Q6INSN(A2_nop,"nop",ATTRIBS(A_IT_NOP),
227 "Nop (32-bit encoding)",
228  fHIDE( { }  ))
231 Q6INSN(A4_ext,"immext(#u26:6)",ATTRIBS(A_IT_EXTENDER),
232 "This instruction carries the 26 most-significant immediate bits for the next instruction",
233 { fHIDE(); })
236 Q6INSN(A2_tfr,"Rd32=Rs32",ATTRIBS(),
237 "tfr register",{ RdV=RsV;})
239 Q6INSN(A2_tfrsi,"Rd32=#s16",ATTRIBS(),
240 "transfer signed immediate to register",{ fIMMEXT(siV); RdV=siV;})
242 Q6INSN(A2_sxtb,"Rd32=sxtb(Rs32)",ATTRIBS(),
243 "Sign extend byte", {RdV = fSXTN(8,32,RsV);})
245 Q6INSN(A2_zxth,"Rd32=zxth(Rs32)",ATTRIBS(),
246 "Zero extend half", {RdV = fZXTN(16,32,RsV);})
248 Q6INSN(A2_sxth,"Rd32=sxth(Rs32)",ATTRIBS(),
249 "Sign extend half", {RdV = fSXTN(16,32,RsV);})
251 Q6INSN(A2_combinew,"Rdd32=combine(Rs32,Rt32)",ATTRIBS(),
252 "Combine two words into a register pair",
253 { fSETWORD(0,RddV,RtV);
254   fSETWORD(1,RddV,RsV);
257 Q6INSN(A4_combineri,"Rdd32=combine(Rs32,#s8)",ATTRIBS(),
258 "Combine a word and an immediate into a register pair",
259 { fIMMEXT(siV); fSETWORD(0,RddV,siV);
260   fSETWORD(1,RddV,RsV);
263 Q6INSN(A4_combineir,"Rdd32=combine(#s8,Rs32)",ATTRIBS(),
264 "Combine a word and an immediate into a register pair",
265 { fIMMEXT(siV); fSETWORD(0,RddV,RsV);
266   fSETWORD(1,RddV,siV);
271 Q6INSN(A2_combineii,"Rdd32=combine(#s8,#S8)",ATTRIBS(A_ARCHV2),
272 "Set two small immediates",
273 { fIMMEXT(siV); fSETWORD(0,RddV,SiV); fSETWORD(1,RddV,siV); })
275 Q6INSN(A4_combineii,"Rdd32=combine(#s8,#U6)",ATTRIBS(),"Set two small immediates",
276 { fIMMEXT(UiV); fSETWORD(0,RddV,UiV); fSETWORD(1,RddV,siV); })
279 Q6INSN(A2_combine_hh,"Rd32=combine(Rt.H32,Rs.H32)",ATTRIBS(),
280 "Combine two halfs into a register", {RdV = (fGETUHALF(1,RtV)<<16) | fGETUHALF(1,RsV);})
282 Q6INSN(A2_combine_hl,"Rd32=combine(Rt.H32,Rs.L32)",ATTRIBS(),
283 "Combine two halfs into a register", {RdV = (fGETUHALF(1,RtV)<<16) | fGETUHALF(0,RsV);})
285 Q6INSN(A2_combine_lh,"Rd32=combine(Rt.L32,Rs.H32)",ATTRIBS(),
286 "Combine two halfs into a register", {RdV = (fGETUHALF(0,RtV)<<16) | fGETUHALF(1,RsV);})
288 Q6INSN(A2_combine_ll,"Rd32=combine(Rt.L32,Rs.L32)",ATTRIBS(),
289 "Combine two halfs into a register", {RdV = (fGETUHALF(0,RtV)<<16) | fGETUHALF(0,RsV);})
291 Q6INSN(A2_tfril,"Rx.L32=#u16",ATTRIBS(),
292 "Set low 16-bits, leave upper 16 unchanged",{ fSETHALF(0,RxV,uiV);})
294 Q6INSN(A2_tfrih,"Rx.H32=#u16",ATTRIBS(),
295 "Set high 16-bits, leave low 16 unchanged",{ fSETHALF(1,RxV,uiV);})
297 Q6INSN(A2_tfrcrr,"Rd32=Cs32",ATTRIBS(),
298 "transfer control register to general register",{ RdV=CsV;})
300 Q6INSN(A2_tfrrcr,"Cd32=Rs32",ATTRIBS(),
301 "transfer general register to control register",{ CdV=RsV;})
303 Q6INSN(A4_tfrcpp,"Rdd32=Css32",ATTRIBS(),
304 "transfer control register to general register",{ RddV=CssV;})
306 Q6INSN(A4_tfrpcp,"Cdd32=Rss32",ATTRIBS(),
307 "transfer general register to control register",{ CddV=RssV;})
310 /**********************************************/
311 /* Logicals                                   */
312 /**********************************************/
314 Q6INSN(A2_and,"Rd32=and(Rs32,Rt32)",ATTRIBS(),
315 "logical AND",{ RdV=RsV&RtV;})
317 Q6INSN(A2_or,"Rd32=or(Rs32,Rt32)",ATTRIBS(),
318 "logical OR",{ RdV=RsV|RtV;})
320 Q6INSN(A2_xor,"Rd32=xor(Rs32,Rt32)",ATTRIBS(),
321 "logical XOR",{ RdV=RsV^RtV;})
323 Q6INSN(M2_xor_xacc,"Rx32^=xor(Rs32,Rt32)",ATTRIBS(A_ARCHV2),
324 "logical XOR with XOR accumulation",{ RxV^=RsV^RtV;})
326 Q6INSN(M4_xor_xacc,"Rxx32^=xor(Rss32,Rtt32)",,
327 "logical XOR with XOR accumulation",{ RxxV^=RssV^RttV;})
331 Q6INSN(A4_andn,"Rd32=and(Rt32,~Rs32)",,
332 "And-Not", { RdV = (RtV & ~RsV); })
334 Q6INSN(A4_orn,"Rd32=or(Rt32,~Rs32)",,
335 "Or-Not", { RdV = (RtV | ~RsV); })
338 Q6INSN(A4_andnp,"Rdd32=and(Rtt32,~Rss32)",,
339 "And-Not", { RddV = (RttV & ~RssV); })
341 Q6INSN(A4_ornp,"Rdd32=or(Rtt32,~Rss32)",,
342 "Or-Not", { RddV = (RttV | ~RssV); })
347 /********************/
348 /* Compound add-add */
349 /********************/
351 Q6INSN(S4_addaddi,"Rd32=add(Rs32,add(Ru32,#s6))",ATTRIBS(),
352         "3-input add",
353         { RdV = RsV + RuV + fIMMEXT(siV); })
356 Q6INSN(S4_subaddi,"Rd32=add(Rs32,sub(#s6,Ru32))",ATTRIBS(),
357         "3-input sub",
358         { RdV = RsV - RuV + fIMMEXT(siV); })
362 /****************************/
363 /* Compound logical-logical */
364 /****************************/
366 Q6INSN(M4_and_and,"Rx32&=and(Rs32,Rt32)",ATTRIBS(),
367 "Compound And-And", { RxV &= (RsV & RtV); })
369 Q6INSN(M4_and_andn,"Rx32&=and(Rs32,~Rt32)",ATTRIBS(),
370 "Compound And-Andn", { RxV &= (RsV & ~RtV); })
372 Q6INSN(M4_and_or,"Rx32&=or(Rs32,Rt32)",ATTRIBS(),
373 "Compound And-Or", { RxV &= (RsV | RtV); })
375 Q6INSN(M4_and_xor,"Rx32&=xor(Rs32,Rt32)",ATTRIBS(),
376 "Compound And-xor", { RxV &= (RsV ^ RtV); })
380 Q6INSN(M4_or_and,"Rx32|=and(Rs32,Rt32)",ATTRIBS(),
381 "Compound Or-And", { RxV |= (RsV & RtV); })
383 Q6INSN(M4_or_andn,"Rx32|=and(Rs32,~Rt32)",ATTRIBS(),
384 "Compound Or-AndN", { RxV |= (RsV & ~RtV); })
386 Q6INSN(M4_or_or,"Rx32|=or(Rs32,Rt32)",ATTRIBS(),
387 "Compound Or-Or", { RxV |= (RsV | RtV); })
389 Q6INSN(M4_or_xor,"Rx32|=xor(Rs32,Rt32)",ATTRIBS(),
390 "Compound Or-xor", { RxV |= (RsV ^ RtV); })
393 Q6INSN(S4_or_andix,"Rx32=or(Ru32,and(Rx32,#s10))",ATTRIBS(),
394 "Compound Or-And", { RxV = RuV | (RxV & fIMMEXT(siV)); })
396 Q6INSN(S4_or_andi,"Rx32|=and(Rs32,#s10)",ATTRIBS(),
397 "Compound Or-And", { RxV = RxV | (RsV & fIMMEXT(siV)); })
399 Q6INSN(S4_or_ori,"Rx32|=or(Rs32,#s10)",ATTRIBS(),
400 "Compound Or-And", { RxV = RxV | (RsV | fIMMEXT(siV)); })
405 Q6INSN(M4_xor_and,"Rx32^=and(Rs32,Rt32)",ATTRIBS(),
406 "Compound Xor-And", { RxV ^= (RsV & RtV); })
408 Q6INSN(M4_xor_or,"Rx32^=or(Rs32,Rt32)",ATTRIBS(),
409 "Compound Xor-Or", { RxV ^= (RsV | RtV); })
411 Q6INSN(M4_xor_andn,"Rx32^=and(Rs32,~Rt32)",ATTRIBS(),
412 "Compound Xor-And", { RxV ^= (RsV & ~RtV); })
419 Q6INSN(A2_subri,"Rd32=sub(#s10,Rs32)",ATTRIBS(A_ARCHV2),
420 "Subtract register from immediate",{ fIMMEXT(siV); RdV=siV-RsV;})
422 Q6INSN(A2_andir,"Rd32=and(Rs32,#s10)",ATTRIBS(A_ARCHV2),
423 "logical AND with immediate",{ fIMMEXT(siV); RdV=RsV&siV;})
425 Q6INSN(A2_orir,"Rd32=or(Rs32,#s10)",ATTRIBS(A_ARCHV2),
426 "logical OR with immediate",{ fIMMEXT(siV); RdV=RsV|siV;})
431 Q6INSN(A2_andp,"Rdd32=and(Rss32,Rtt32)",ATTRIBS(),
432 "logical AND pair",{ RddV=RssV&RttV;})
434 Q6INSN(A2_orp,"Rdd32=or(Rss32,Rtt32)",ATTRIBS(),
435 "logical OR pair",{ RddV=RssV|RttV;})
437 Q6INSN(A2_xorp,"Rdd32=xor(Rss32,Rtt32)",ATTRIBS(),
438 "logical eXclusive OR pair",{ RddV=RssV^RttV;})
440 Q6INSN(A2_notp,"Rdd32=not(Rss32)",ATTRIBS(),
441 "logical NOT pair",{ RddV=~RssV;})
443 Q6INSN(A2_sxtw,"Rdd32=sxtw(Rs32)",ATTRIBS(),
444 "Sign extend 32-bit word to 64-bit pair",
445 { RddV = fCAST4_8s(RsV); })
447 Q6INSN(A2_sat,"Rd32=sat(Rss32)",ATTRIBS(),
448 "Saturate to 32-bit Signed",
449 { RdV = fSAT(RssV); })
451 Q6INSN(A2_roundsat,"Rd32=round(Rss32):sat",ATTRIBS(),
452 "Round & Saturate to 32-bit Signed",
453 { fHIDE(size8s_t tmp;) fADDSAT64(tmp,RssV,0x080000000ULL); RdV = fGETWORD(1,tmp); })
455 Q6INSN(A2_sath,"Rd32=sath(Rs32)",ATTRIBS(),
456 "Saturate to 16-bit Signed",
457 { RdV = fSATH(RsV); })
459 Q6INSN(A2_satuh,"Rd32=satuh(Rs32)",ATTRIBS(),
460 "Saturate to 16-bit Unsigned",
461 { RdV = fSATUH(RsV); })
463 Q6INSN(A2_satub,"Rd32=satub(Rs32)",ATTRIBS(),
464 "Saturate to 8-bit Unsigned",
465 { RdV = fSATUB(RsV); })
467 Q6INSN(A2_satb,"Rd32=satb(Rs32)",ATTRIBS(A_ARCHV2),
468 "Saturate to 8-bit Signed",
469 { RdV = fSATB(RsV); })
471 /**********************************************/
472 /* Vector Add                                 */
473 /**********************************************/
475 Q6INSN(A2_vaddub,"Rdd32=vaddub(Rss32,Rtt32)",ATTRIBS(),
476 "Add vector of bytes",
478         fHIDE(int i;)
479         for (i = 0; i < 8; i++) {
480             fSETBYTE(i,RddV,(fGETUBYTE(i,RssV)+fGETUBYTE(i,RttV)));
481         }
484 Q6INSN(A2_vaddubs,"Rdd32=vaddub(Rss32,Rtt32):sat",ATTRIBS(),
485 "Add vector of bytes",
487         fHIDE(int i;)
488         for (i = 0; i < 8; i++) {
489             fSETBYTE(i,RddV,fSATUN(8,fGETUBYTE(i,RssV)+fGETUBYTE(i,RttV)));
490         }
493 Q6INSN(A2_vaddh,"Rdd32=vaddh(Rss32,Rtt32)",ATTRIBS(),
494 "Add vector of half integers",
496         fHIDE(int i;)
497         for (i=0;i<4;i++) {
498             fSETHALF(i,RddV,fGETHALF(i,RssV)+fGETHALF(i,RttV));
499         }
502 Q6INSN(A2_vaddhs,"Rdd32=vaddh(Rss32,Rtt32):sat",ATTRIBS(),
503 "Add vector of half integers with saturation",
505         fHIDE(int i;)
506         for (i=0;i<4;i++) {
507             fSETHALF(i,RddV,fSATN(16,fGETHALF(i,RssV)+fGETHALF(i,RttV)));
508         }
511 Q6INSN(A2_vadduhs,"Rdd32=vadduh(Rss32,Rtt32):sat",ATTRIBS(),
512 "Add vector of unsigned half integers with saturation",
514         fHIDE(int i;)
515         for (i=0;i<4;i++) {
516             fSETHALF(i,RddV,fSATUN(16,fGETUHALF(i,RssV)+fGETUHALF(i,RttV)));
517         }
520 Q6INSN(A5_vaddhubs,"Rd32=vaddhub(Rss32,Rtt32):sat",ATTRIBS(),
521 "Add vector of half integers with saturation and pack to unsigned bytes",
523         fHIDE(int i;)
524         for (i=0;i<4;i++) {
525             fSETBYTE(i,RdV,fSATUB(fGETHALF(i,RssV)+fGETHALF(i,RttV)));
526         }
529 Q6INSN(A2_vaddw,"Rdd32=vaddw(Rss32,Rtt32)",ATTRIBS(),
530 "Add vector of words",
532         fHIDE(int i;)
533         for (i=0;i<2;i++) {
534             fSETWORD(i,RddV,fGETWORD(i,RssV)+fGETWORD(i,RttV));
535         }
538 Q6INSN(A2_vaddws,"Rdd32=vaddw(Rss32,Rtt32):sat",ATTRIBS(),
539 "Add vector of words with saturation",
541         fHIDE(int i;)
542         for (i=0;i<2;i++) {
543             fSETWORD(i,RddV,fSATN(32,fGETWORD(i,RssV)+fGETWORD(i,RttV)));
544         }
549 Q6INSN(S4_vxaddsubw,"Rdd32=vxaddsubw(Rss32,Rtt32):sat",ATTRIBS(),
550 "Cross vector add-sub words with saturation",
552         fSETWORD(0,RddV,fSAT(fGETWORD(0,RssV)+fGETWORD(1,RttV)));
553         fSETWORD(1,RddV,fSAT(fGETWORD(1,RssV)-fGETWORD(0,RttV)));
555 Q6INSN(S4_vxsubaddw,"Rdd32=vxsubaddw(Rss32,Rtt32):sat",ATTRIBS(),
556 "Cross vector sub-add words with saturation",
558         fSETWORD(0,RddV,fSAT(fGETWORD(0,RssV)-fGETWORD(1,RttV)));
559         fSETWORD(1,RddV,fSAT(fGETWORD(1,RssV)+fGETWORD(0,RttV)));
564 Q6INSN(S4_vxaddsubh,"Rdd32=vxaddsubh(Rss32,Rtt32):sat",ATTRIBS(),
565 "Cross vector add-sub halfwords with saturation",
567         fSETHALF(0,RddV,fSATH(fGETHALF(0,RssV)+fGETHALF(1,RttV)));
568         fSETHALF(1,RddV,fSATH(fGETHALF(1,RssV)-fGETHALF(0,RttV)));
570         fSETHALF(2,RddV,fSATH(fGETHALF(2,RssV)+fGETHALF(3,RttV)));
571         fSETHALF(3,RddV,fSATH(fGETHALF(3,RssV)-fGETHALF(2,RttV)));
574 Q6INSN(S4_vxsubaddh,"Rdd32=vxsubaddh(Rss32,Rtt32):sat",ATTRIBS(),
575 "Cross vector sub-add halfwords with saturation",
577         fSETHALF(0,RddV,fSATH(fGETHALF(0,RssV)-fGETHALF(1,RttV)));
578         fSETHALF(1,RddV,fSATH(fGETHALF(1,RssV)+fGETHALF(0,RttV)));
580         fSETHALF(2,RddV,fSATH(fGETHALF(2,RssV)-fGETHALF(3,RttV)));
581         fSETHALF(3,RddV,fSATH(fGETHALF(3,RssV)+fGETHALF(2,RttV)));
587 Q6INSN(S4_vxaddsubhr,"Rdd32=vxaddsubh(Rss32,Rtt32):rnd:>>1:sat",ATTRIBS(),
588 "Cross vector add-sub halfwords with shift, round, and saturation",
590         fSETHALF(0,RddV,fSATH((fGETHALF(0,RssV)+fGETHALF(1,RttV)+1)>>1));
591         fSETHALF(1,RddV,fSATH((fGETHALF(1,RssV)-fGETHALF(0,RttV)+1)>>1));
593         fSETHALF(2,RddV,fSATH((fGETHALF(2,RssV)+fGETHALF(3,RttV)+1)>>1));
594         fSETHALF(3,RddV,fSATH((fGETHALF(3,RssV)-fGETHALF(2,RttV)+1)>>1));
597 Q6INSN(S4_vxsubaddhr,"Rdd32=vxsubaddh(Rss32,Rtt32):rnd:>>1:sat",ATTRIBS(),
598 "Cross vector sub-add halfwords with shift, round, and saturation",
600         fSETHALF(0,RddV,fSATH((fGETHALF(0,RssV)-fGETHALF(1,RttV)+1)>>1));
601         fSETHALF(1,RddV,fSATH((fGETHALF(1,RssV)+fGETHALF(0,RttV)+1)>>1));
603         fSETHALF(2,RddV,fSATH((fGETHALF(2,RssV)-fGETHALF(3,RttV)+1)>>1));
604         fSETHALF(3,RddV,fSATH((fGETHALF(3,RssV)+fGETHALF(2,RttV)+1)>>1));
611 /**********************************************/
612 /* 1/2 Vector operations                      */
613 /**********************************************/
616 Q6INSN(A2_svavgh,"Rd32=vavgh(Rs32,Rt32)",ATTRIBS(A_ARCHV2),
617 "Avg vector of half integers",
619         fHIDE(int i;)
620         for (i=0;i<2;i++) {
621             fSETHALF(i,RdV,((fGETHALF(i,RsV)+fGETHALF(i,RtV))>>1));
622         }
625 Q6INSN(A2_svavghs,"Rd32=vavgh(Rs32,Rt32):rnd",ATTRIBS(A_ARCHV2),
626 "Avg vector of half integers with rounding",
628         fHIDE(int i;)
629         for (i=0;i<2;i++) {
630             fSETHALF(i,RdV,((fGETHALF(i,RsV)+fGETHALF(i,RtV)+1)>>1));
631         }
636 Q6INSN(A2_svnavgh,"Rd32=vnavgh(Rt32,Rs32)",ATTRIBS(A_ARCHV2),
637 "Avg vector of half integers",
639         fHIDE(int i;)
640         for (i=0;i<2;i++) {
641             fSETHALF(i,RdV,((fGETHALF(i,RtV)-fGETHALF(i,RsV))>>1));
642         }
646 Q6INSN(A2_svaddh,"Rd32=vaddh(Rs32,Rt32)",ATTRIBS(),
647 "Add vector of half integers",
649         fHIDE(int i;)
650         for (i=0;i<2;i++) {
651             fSETHALF(i,RdV,fGETHALF(i,RsV)+fGETHALF(i,RtV));
652         }
655 Q6INSN(A2_svaddhs,"Rd32=vaddh(Rs32,Rt32):sat",ATTRIBS(),
656 "Add vector of half integers with saturation",
658         fHIDE(int i;)
659         for (i=0;i<2;i++) {
660             fSETHALF(i,RdV,fSATN(16,fGETHALF(i,RsV)+fGETHALF(i,RtV)));
661         }
664 Q6INSN(A2_svadduhs,"Rd32=vadduh(Rs32,Rt32):sat",ATTRIBS(),
665 "Add vector of unsigned half integers with saturation",
667         fHIDE(int i;)
668         for (i=0;i<2;i++) {
669             fSETHALF(i,RdV,fSATUN(16,fGETUHALF(i,RsV)+fGETUHALF(i,RtV)));
670         }
674 Q6INSN(A2_svsubh,"Rd32=vsubh(Rt32,Rs32)",ATTRIBS(),
675 "Sub vector of half integers",
677         fHIDE(int i;)
678         for (i=0;i<2;i++) {
679             fSETHALF(i,RdV,fGETHALF(i,RtV)-fGETHALF(i,RsV));
680         }
683 Q6INSN(A2_svsubhs,"Rd32=vsubh(Rt32,Rs32):sat",ATTRIBS(),
684 "Sub vector of half integers with saturation",
686         fHIDE(int i;)
687         for (i=0;i<2;i++) {
688             fSETHALF(i,RdV,fSATN(16,fGETHALF(i,RtV)-fGETHALF(i,RsV)));
689         }
692 Q6INSN(A2_svsubuhs,"Rd32=vsubuh(Rt32,Rs32):sat",ATTRIBS(),
693 "Sub vector of unsigned half integers with saturation",
695         fHIDE(int i;)
696         for (i=0;i<2;i++) {
697             fSETHALF(i,RdV,fSATUN(16,fGETUHALF(i,RtV)-fGETUHALF(i,RsV)));
698         }
704 /**********************************************/
705 /* Vector Reduce Add                          */
706 /**********************************************/
708 Q6INSN(A2_vraddub,"Rdd32=vraddub(Rss32,Rtt32)",ATTRIBS(),
709 "Sum: two vectors of unsigned bytes",
711         fHIDE(int i;)
712         RddV = 0;
713         for (i=0;i<4;i++) {
714             fSETWORD(0,RddV,(fGETWORD(0,RddV) + (fGETUBYTE(i,RssV)+fGETUBYTE(i,RttV))));
715         }
716         for (i=4;i<8;i++) {
717             fSETWORD(1,RddV,(fGETWORD(1,RddV) + (fGETUBYTE(i,RssV)+fGETUBYTE(i,RttV))));
718         }
721 Q6INSN(A2_vraddub_acc,"Rxx32+=vraddub(Rss32,Rtt32)",ATTRIBS(),
722 "Sum: two vectors of unsigned bytes",
724         fHIDE(int i;)
725         for (i = 0; i < 4; i++) {
726             fSETWORD(0,RxxV,(fGETWORD(0,RxxV) + (fGETUBYTE(i,RssV)+fGETUBYTE(i,RttV))));
727         }
728         for (i = 4; i < 8; i++) {
729             fSETWORD(1,RxxV,(fGETWORD(1,RxxV) + (fGETUBYTE(i,RssV)+fGETUBYTE(i,RttV))));
730         }
735 Q6INSN(M2_vraddh,"Rd32=vraddh(Rss32,Rtt32)",ATTRIBS(A_ARCHV3),
736 "Sum: two vectors of halves",
738         fHIDE(int i;)
739         RdV = 0;
740         for (i=0;i<4;i++) {
741             RdV += (fGETHALF(i,RssV)+fGETHALF(i,RttV));
742         }
745 Q6INSN(M2_vradduh,"Rd32=vradduh(Rss32,Rtt32)",ATTRIBS(A_ARCHV3),
746 "Sum: two vectors of unsigned halves",
748         fHIDE(int i;)
749         RdV = 0;
750         for (i=0;i<4;i++) {
751             RdV += (fGETUHALF(i,RssV)+fGETUHALF(i,RttV));
752         }
755 /**********************************************/
756 /* Vector Sub                                 */
757 /**********************************************/
759 Q6INSN(A2_vsubub,"Rdd32=vsubub(Rtt32,Rss32)",ATTRIBS(),
760 "Sub vector of bytes",
762         fHIDE(int i;)
763         for (i = 0; i < 8; i++) {
764             fSETBYTE(i,RddV,(fGETUBYTE(i,RttV)-fGETUBYTE(i,RssV)));
765         }
768 Q6INSN(A2_vsububs,"Rdd32=vsubub(Rtt32,Rss32):sat",ATTRIBS(),
769 "Sub vector of bytes",
771         fHIDE(int i;)
772         for (i = 0; i < 8; i++) {
773             fSETBYTE(i,RddV,fSATUN(8,fGETUBYTE(i,RttV)-fGETUBYTE(i,RssV)));
774         }
777 Q6INSN(A2_vsubh,"Rdd32=vsubh(Rtt32,Rss32)",ATTRIBS(),
778 "Sub vector of half integers",
780         fHIDE(int i;)
781         for (i=0;i<4;i++) {
782             fSETHALF(i,RddV,fGETHALF(i,RttV)-fGETHALF(i,RssV));
783         }
786 Q6INSN(A2_vsubhs,"Rdd32=vsubh(Rtt32,Rss32):sat",ATTRIBS(),
787 "Sub vector of half integers with saturation",
789         fHIDE(int i;)
790         for (i=0;i<4;i++) {
791             fSETHALF(i,RddV,fSATN(16,fGETHALF(i,RttV)-fGETHALF(i,RssV)));
792         }
795 Q6INSN(A2_vsubuhs,"Rdd32=vsubuh(Rtt32,Rss32):sat",ATTRIBS(),
796 "Sub vector of unsigned half integers with saturation",
798         fHIDE(int i;)
799         for (i=0;i<4;i++) {
800             fSETHALF(i,RddV,fSATUN(16,fGETUHALF(i,RttV)-fGETUHALF(i,RssV)));
801         }
804 Q6INSN(A2_vsubw,"Rdd32=vsubw(Rtt32,Rss32)",ATTRIBS(),
805 "Sub vector of words",
807         fHIDE(int i;)
808         for (i=0;i<2;i++) {
809             fSETWORD(i,RddV,fGETWORD(i,RttV)-fGETWORD(i,RssV));
810         }
813 Q6INSN(A2_vsubws,"Rdd32=vsubw(Rtt32,Rss32):sat",ATTRIBS(),
814 "Sub vector of words with saturation",
816         fHIDE(int i;)
817         for (i=0;i<2;i++) {
818             fSETWORD(i,RddV,fSATN(32,fGETWORD(i,RttV)-fGETWORD(i,RssV)));
819         }
825 /**********************************************/
826 /* Vector Abs                                 */
827 /**********************************************/
829 Q6INSN(A2_vabsh,"Rdd32=vabsh(Rss32)",ATTRIBS(),
830 "Negate vector of half integers",
832         fHIDE(int i;)
833         for (i=0;i<4;i++) {
834             fSETHALF(i,RddV,fABS(fGETHALF(i,RssV)));
835         }
838 Q6INSN(A2_vabshsat,"Rdd32=vabsh(Rss32):sat",ATTRIBS(),
839 "Negate vector of half integers",
841         fHIDE(int i;)
842         for (i=0;i<4;i++) {
843             fSETHALF(i,RddV,fSATH(fABS(fGETHALF(i,RssV))));
844         }
847 Q6INSN(A2_vabsw,"Rdd32=vabsw(Rss32)",ATTRIBS(),
848 "Absolute Value vector of words",
850         fHIDE(int i;)
851         for (i=0;i<2;i++) {
852             fSETWORD(i,RddV,fABS(fGETWORD(i,RssV)));
853         }
856 Q6INSN(A2_vabswsat,"Rdd32=vabsw(Rss32):sat",ATTRIBS(),
857 "Absolute Value vector of words",
859         fHIDE(int i;)
860         for (i=0;i<2;i++) {
861             fSETWORD(i,RddV,fSAT(fABS(fGETWORD(i,RssV))));
862         }
865 /**********************************************/
866 /* Vector SAD                                 */
867 /**********************************************/
870 Q6INSN(M2_vabsdiffw,"Rdd32=vabsdiffw(Rtt32,Rss32)",ATTRIBS(A_ARCHV2),
871 "Absolute Differences: vector of words",
873         fHIDE(int i;)
874         for (i=0;i<2;i++) {
875             fSETWORD(i,RddV,fABS(fGETWORD(i,RttV) - fGETWORD(i,RssV)));
876         }
879 Q6INSN(M2_vabsdiffh,"Rdd32=vabsdiffh(Rtt32,Rss32)",ATTRIBS(A_ARCHV2),
880 "Absolute Differences: vector of halfwords",
882         fHIDE(int i;)
883         for (i=0;i<4;i++) {
884             fSETHALF(i,RddV,fABS(fGETHALF(i,RttV) - fGETHALF(i,RssV)));
885         }
888 Q6INSN(M6_vabsdiffb,"Rdd32=vabsdiffb(Rtt32,Rss32)",ATTRIBS(),
889 "Absolute Differences: vector of halfwords",
891         fHIDE(int i;)
892         for (i=0;i<8;i++) {
893             fSETBYTE(i,RddV,fABS(fGETBYTE(i,RttV) - fGETBYTE(i,RssV)));
894         }
897 Q6INSN(M6_vabsdiffub,"Rdd32=vabsdiffub(Rtt32,Rss32)",ATTRIBS(),
898 "Absolute Differences: vector of halfwords",
900         fHIDE(int i;)
901         for (i=0;i<8;i++) {
902             fSETBYTE(i,RddV,fABS(fGETUBYTE(i,RttV) - fGETUBYTE(i,RssV)));
903         }
908 Q6INSN(A2_vrsadub,"Rdd32=vrsadub(Rss32,Rtt32)",ATTRIBS(),
909 "Sum of Absolute Differences: vector of unsigned bytes",
911         fHIDE(int i;)
912         RddV = 0;
913         for (i = 0; i < 4; i++) {
914             fSETWORD(0,RddV,(fGETWORD(0,RddV) + fABS((fGETUBYTE(i,RssV) - fGETUBYTE(i,RttV)))));
915         }
916         for (i = 4; i < 8; i++) {
917             fSETWORD(1,RddV,(fGETWORD(1,RddV) + fABS((fGETUBYTE(i,RssV) - fGETUBYTE(i,RttV)))));
918         }
921 Q6INSN(A2_vrsadub_acc,"Rxx32+=vrsadub(Rss32,Rtt32)",ATTRIBS(),
922 "Sum of Absolute Differences: vector of unsigned bytes",
924         fHIDE(int i;)
925         for (i = 0; i < 4; i++) {
926             fSETWORD(0,RxxV,(fGETWORD(0,RxxV) + fABS((fGETUBYTE(i,RssV) - fGETUBYTE(i,RttV)))));
927         }
928         for (i = 4; i < 8; i++) {
929             fSETWORD(1,RxxV,(fGETWORD(1,RxxV) + fABS((fGETUBYTE(i,RssV) - fGETUBYTE(i,RttV)))));
930         }
934 /**********************************************/
935 /* Vector Average                             */
936 /**********************************************/
938 Q6INSN(A2_vavgub,"Rdd32=vavgub(Rss32,Rtt32)",ATTRIBS(),
939 "Average vector of unsigned bytes",
941         fHIDE(int i;)
942         for (i = 0; i < 8; i++) {
943             fSETBYTE(i,RddV,((fGETUBYTE(i,RssV) + fGETUBYTE(i,RttV))>>1));
944         }
947 Q6INSN(A2_vavguh,"Rdd32=vavguh(Rss32,Rtt32)",ATTRIBS(),
948 "Average vector of unsigned halfwords",
950         fHIDE(int i;)
951         for (i=0;i<4;i++) {
952             fSETHALF(i,RddV,(fGETUHALF(i,RssV)+fGETUHALF(i,RttV))>>1);
953         }
956 Q6INSN(A2_vavgh,"Rdd32=vavgh(Rss32,Rtt32)",ATTRIBS(),
957 "Average vector of halfwords",
959         fHIDE(int i;)
960         for (i=0;i<4;i++) {
961             fSETHALF(i,RddV,(fGETHALF(i,RssV)+fGETHALF(i,RttV))>>1);
962         }
965 Q6INSN(A2_vnavgh,"Rdd32=vnavgh(Rtt32,Rss32)",ATTRIBS(),
966 "Negative Average vector of halfwords",
968         fHIDE(int i;)
969         for (i=0;i<4;i++) {
970             fSETHALF(i,RddV,(fGETHALF(i,RttV)-fGETHALF(i,RssV))>>1);
971         }
974 Q6INSN(A2_vavgw,"Rdd32=vavgw(Rss32,Rtt32)",ATTRIBS(),
975 "Average vector of words",
977         fHIDE(int i;)
978         for (i=0;i<2;i++) {
979             fSETWORD(i,RddV,(fSXTN(32,33,fGETWORD(i,RssV))+fSXTN(32,33,fGETWORD(i,RttV)))>>1);
980         }
983 Q6INSN(A2_vnavgw,"Rdd32=vnavgw(Rtt32,Rss32)",ATTRIBS(A_ARCHV2),
984 "Average vector of words",
986         fHIDE(int i;)
987         for (i=0;i<2;i++) {
988             fSETWORD(i,RddV,(fSXTN(32,33,fGETWORD(i,RttV))-fSXTN(32,33,fGETWORD(i,RssV)))>>1);
989         }
992 Q6INSN(A2_vavgwr,"Rdd32=vavgw(Rss32,Rtt32):rnd",ATTRIBS(),
993 "Average vector of words",
995         fHIDE(int i;)
996         for (i=0;i<2;i++) {
997             fSETWORD(i,RddV,(fSXTN(32,33,fGETWORD(i,RssV))+fSXTN(32,33,fGETWORD(i,RttV))+1)>>1);
998         }
1001 Q6INSN(A2_vnavgwr,"Rdd32=vnavgw(Rtt32,Rss32):rnd:sat",ATTRIBS(A_ARCHV2),
1002 "Average vector of words",
1004         fHIDE(int i;)
1005         for (i=0;i<2;i++) {
1006             fSETWORD(i,RddV,fSAT((fSXTN(32,33,fGETWORD(i,RttV))-fSXTN(32,33,fGETWORD(i,RssV))+1)>>1));
1007         }
1010 Q6INSN(A2_vavgwcr,"Rdd32=vavgw(Rss32,Rtt32):crnd",ATTRIBS(A_ARCHV2),
1011 "Average vector of words with convergent rounding",
1013         fHIDE(int i;)
1014         for (i=0;i<2;i++) {
1015             fSETWORD(i,RddV,(fCRND(fSXTN(32,33,fGETWORD(i,RssV))+fSXTN(32,33,fGETWORD(i,RttV)))>>1));
1016         }
1019 Q6INSN(A2_vnavgwcr,"Rdd32=vnavgw(Rtt32,Rss32):crnd:sat",ATTRIBS(A_ARCHV2),
1020 "Average negative vector of words with convergent rounding",
1022         fHIDE(int i;)
1023         for (i=0;i<2;i++) {
1024             fSETWORD(i,RddV,fSAT(fCRND(fSXTN(32,33,fGETWORD(i,RttV))-fSXTN(32,33,fGETWORD(i,RssV)))>>1));
1025         }
1028 Q6INSN(A2_vavghcr,"Rdd32=vavgh(Rss32,Rtt32):crnd",ATTRIBS(A_ARCHV2),
1029 "Average vector of halfwords with conv rounding",
1031         fHIDE(int i;)
1032         for (i=0;i<4;i++) {
1033             fSETHALF(i,RddV,fCRND(fGETHALF(i,RssV)+fGETHALF(i,RttV))>>1);
1034         }
1037 Q6INSN(A2_vnavghcr,"Rdd32=vnavgh(Rtt32,Rss32):crnd:sat",ATTRIBS(A_ARCHV2),
1038 "Average negative vector of halfwords with conv rounding",
1040         fHIDE(int i;)
1041         for (i=0;i<4;i++) {
1042             fSETHALF(i,RddV,fSATH(fCRND(fGETHALF(i,RttV)-fGETHALF(i,RssV))>>1));
1043         }
1047 Q6INSN(A2_vavguw,"Rdd32=vavguw(Rss32,Rtt32)",ATTRIBS(),
1048 "Average vector of unsigned words",
1050         fHIDE(int i;)
1051         for (i=0;i<2;i++) {
1052             fSETWORD(i,RddV,(fZXTN(32,33,fGETUWORD(i,RssV))+fZXTN(32,33,fGETUWORD(i,RttV)))>>1);
1053         }
1056 Q6INSN(A2_vavguwr,"Rdd32=vavguw(Rss32,Rtt32):rnd",ATTRIBS(),
1057 "Average vector of unsigned words",
1059         fHIDE(int i;)
1060         for (i=0;i<2;i++) {
1061             fSETWORD(i,RddV,(fZXTN(32,33,fGETUWORD(i,RssV))+fZXTN(32,33,fGETUWORD(i,RttV))+1)>>1);
1062         }
1065 Q6INSN(A2_vavgubr,"Rdd32=vavgub(Rss32,Rtt32):rnd",ATTRIBS(),
1066 "Average vector of unsigned bytes",
1068         fHIDE(int i;)
1069         for (i = 0; i < 8; i++) {
1070             fSETBYTE(i,RddV,((fGETUBYTE(i,RssV)+fGETUBYTE(i,RttV)+1)>>1));
1071         }
1074 Q6INSN(A2_vavguhr,"Rdd32=vavguh(Rss32,Rtt32):rnd",ATTRIBS(),
1075 "Average vector of unsigned halfwords with rounding",
1077         fHIDE(int i;)
1078         for (i=0;i<4;i++) {
1079             fSETHALF(i,RddV,(fGETUHALF(i,RssV)+fGETUHALF(i,RttV)+1)>>1);
1080         }
1083 Q6INSN(A2_vavghr,"Rdd32=vavgh(Rss32,Rtt32):rnd",ATTRIBS(),
1084 "Average vector of halfwords with rounding",
1086         fHIDE(int i;)
1087         for (i=0;i<4;i++) {
1088             fSETHALF(i,RddV,(fGETHALF(i,RssV)+fGETHALF(i,RttV)+1)>>1);
1089         }
1092 Q6INSN(A2_vnavghr,"Rdd32=vnavgh(Rtt32,Rss32):rnd:sat",ATTRIBS(A_ARCHV2),
1093 "Negative Average vector of halfwords with rounding",
1095         fHIDE(int i;)
1096         for (i=0;i<4;i++) {
1097             fSETHALF(i,RddV,fSATH((fGETHALF(i,RttV)-fGETHALF(i,RssV)+1)>>1));
1098         }
1102 /* Rounding Instruction */
1104 Q6INSN(A4_round_ri,"Rd32=round(Rs32,#u5)",ATTRIBS(),"Round", {RdV = fRNDN(RsV,uiV)>>uiV; })
1105 Q6INSN(A4_round_rr,"Rd32=round(Rs32,Rt32)",ATTRIBS(),"Round", {RdV = fRNDN(RsV,fZXTN(5,32,RtV))>>fZXTN(5,32,RtV); })
1106 Q6INSN(A4_round_ri_sat,"Rd32=round(Rs32,#u5):sat",ATTRIBS(),"Round", {RdV = (fSAT(fRNDN(RsV,uiV)))>>uiV; })
1107 Q6INSN(A4_round_rr_sat,"Rd32=round(Rs32,Rt32):sat",ATTRIBS(),"Round", {RdV = (fSAT(fRNDN(RsV,fZXTN(5,32,RtV))))>>fZXTN(5,32,RtV); })
1110 Q6INSN(A4_cround_ri,"Rd32=cround(Rs32,#u5)",ATTRIBS(),"Convergent Round", {RdV = fCRNDN(RsV,uiV); })
1111 Q6INSN(A4_cround_rr,"Rd32=cround(Rs32,Rt32)",ATTRIBS(),"Convergent Round", {RdV = fCRNDN(RsV,fZXTN(5,32,RtV)); })
1114 #define CROUND(DST,SRC,SHIFT) \
1115         fHIDE(size16s_t rndbit_128;)\
1116         fHIDE(size16s_t tmp128;)\
1117         fHIDE(size16s_t src_128;)\
1118         if (SHIFT == 0) { \
1119             DST = SRC;\
1120         } else if ((SRC & (size8s_t)((1LL << (SHIFT - 1)) - 1LL)) == 0) { \
1121             src_128 = fCAST8S_16S(SRC);\
1122             rndbit_128 = fCAST8S_16S(1LL);\
1123             rndbit_128 = fSHIFTL128(rndbit_128, SHIFT);\
1124             rndbit_128 = fAND128(rndbit_128, src_128);\
1125             rndbit_128 = fSHIFTR128(rndbit_128, 1);\
1126             tmp128 = fADD128(src_128, rndbit_128);\
1127             tmp128 = fSHIFTR128(tmp128, SHIFT);\
1128             DST =  fCAST16S_8S(tmp128);\
1129         } else {\
1130             size16s_t rndbit_128 =  fCAST8S_16S((1LL << (SHIFT - 1))); \
1131             size16s_t src_128 =  fCAST8S_16S(SRC); \
1132             size16s_t tmp128 = fADD128(src_128, rndbit_128);\
1133             tmp128 = fSHIFTR128(tmp128, SHIFT);\
1134             DST =  fCAST16S_8S(tmp128);\
1135         }
1137 Q6INSN(A7_croundd_ri,"Rdd32=cround(Rss32,#u6)",ATTRIBS(),"Convergent Round",
1139 CROUND(RddV,RssV,uiV);
1142 Q6INSN(A7_croundd_rr,"Rdd32=cround(Rss32,Rt32)",ATTRIBS(),"Convergent Round",
1144 CROUND(RddV,RssV,fZXTN(6,32,RtV));
1155 Q6INSN(A7_clip,"Rd32=clip(Rs32,#u5)",ATTRIBS(),"Clip to  #s5", {   fCLIP(RdV,RsV,uiV);})
1156 Q6INSN(A7_vclip,"Rdd32=vclip(Rss32,#u5)",ATTRIBS(),"Clip to  #s5",
1158 fHIDE(size4s_t tmp;)
1159 fCLIP(tmp, fGETWORD(0, RssV), uiV);
1160 fSETWORD(0, RddV, tmp);
1161 fCLIP(tmp,fGETWORD(1, RssV), uiV);
1162 fSETWORD(1, RddV, tmp);
1168 /**********************************************/
1169 /* V4: Cross Vector Min/Max                   */
1170 /**********************************************/
1173 #define VRMINORMAX(TAG,STR,OP,SHORTTYPE,SETTYPE,GETTYPE,NEL,SHIFT) \
1174 Q6INSN(A4_vr##TAG##SHORTTYPE,"Rxx32=vr"#TAG#SHORTTYPE"(Rss32,Ru32)",ATTRIBS(), \
1175 "Choose " STR " elements of a vector", \
1176 { \
1177         fHIDE(int i; size8s_t TAG; size4s_t addr;) \
1178         TAG = fGET##GETTYPE(0,RxxV); \
1179         addr = fGETWORD(1,RxxV); \
1180         for (i = 0; i < NEL; i++) { \
1181             if (TAG OP fGET##GETTYPE(i,RssV)) { \
1182                 TAG = fGET##GETTYPE(i,RssV); \
1183                 addr = RuV | i<<SHIFT; \
1184             } \
1185         } \
1186         fSETWORD(0,RxxV,TAG); \
1187         fSETWORD(1,RxxV,addr); \
1190 #define RMINMAX(SHORTTYPE,SETTYPE,GETTYPE,NEL,SHIFT) \
1191 VRMINORMAX(min,"minimum",>,SHORTTYPE,SETTYPE,GETTYPE,NEL,SHIFT) \
1192 VRMINORMAX(max,"maximum",<,SHORTTYPE,SETTYPE,GETTYPE,NEL,SHIFT)
1195 RMINMAX(h,HALF,HALF,4,1)
1196 RMINMAX(uh,HALF,UHALF,4,1)
1197 RMINMAX(w,WORD,WORD,2,2)
1198 RMINMAX(uw,WORD,UWORD,2,2)
1200 #undef RMINMAX
1201 #undef VRMINORMAX
1203 /**********************************************/
1204 /* Vector Min/Max                             */
1205 /**********************************************/
1207 #define VMINORMAX(TAG,STR,FUNC,SHORTTYPE,SETTYPE,GETTYPE,NEL) \
1208 Q6INSN(A2_v##TAG##SHORTTYPE,"Rdd32=v"#TAG#SHORTTYPE"(Rtt32,Rss32)",ATTRIBS(), \
1209 "Choose " STR " elements of two vectors", \
1210 { \
1211         fHIDE(int i;) \
1212         for (i = 0; i < NEL; i++) { \
1213             fSET##SETTYPE(i,RddV,FUNC(fGET##GETTYPE(i,RttV),fGET##GETTYPE(i,RssV))); \
1214         } \
1217 #define VMINORMAX3(TAG,STR,FUNC,SHORTTYPE,SETTYPE,GETTYPE,NEL) \
1218 Q6INSN(A6_v##TAG##SHORTTYPE##3,"Rxx32=v"#TAG#SHORTTYPE"3(Rtt32,Rss32)",ATTRIBS(), \
1219 "Choose " STR " elements of two vectors", \
1220 { \
1221         fHIDE(int i;) \
1222         for (i = 0; i < NEL; i++) { \
1223             fSET##SETTYPE(i,RxxV,FUNC(fGET##GETTYPE(i,RxxV),FUNC(fGET##GETTYPE(i,RttV),fGET##GETTYPE(i,RssV)))); \
1224         } \
1227 #define MINMAX(SHORTTYPE,SETTYPE,GETTYPE,NEL) \
1228 VMINORMAX(min,"minimum",fMIN,SHORTTYPE,SETTYPE,GETTYPE,NEL) \
1229 VMINORMAX(max,"maximum",fMAX,SHORTTYPE,SETTYPE,GETTYPE,NEL)
1231 MINMAX(b,BYTE,BYTE,8)
1232 MINMAX(ub,BYTE,UBYTE,8)
1233 MINMAX(h,HALF,HALF,4)
1234 MINMAX(uh,HALF,UHALF,4)
1235 MINMAX(w,WORD,WORD,2)
1236 MINMAX(uw,WORD,UWORD,2)
1238 #undef MINMAX
1239 #undef VMINORMAX
1240 #undef VMINORMAX3
1243 /**********************************************/
1244 /* Vector Min/Max                             */
1245 /**********************************************/
1248 Q6INSN(A4_modwrapu,"Rd32=modwrap(Rs32,Rt32)",ATTRIBS(),
1249 "Wrap to an unsigned modulo buffer",
1251         if (RsV < 0) {
1252             RdV = RsV + fCAST4u(RtV);
1253         } else if (fCAST4u(RsV) >= fCAST4u(RtV)) {
1254             RdV = RsV - fCAST4u(RtV);
1255         } else {
1256             RdV = RsV;
1257         }