gcc/config/powerpcspe/spu2vmx.h

   1 /* Cell SPU 2 VMX intrinsics header
   2    Copyright (C) 2007-2017 Free Software Foundation, Inc.
   3
   4    This file is free software; you can redistribute it and/or modify it under
   5    the terms of the GNU General Public License as published by the Free
   6    Software Foundation; either version 3 of the License, or (at your option)
   7    any later version.
   8
   9    This file is distributed in the hope that it will be useful, but WITHOUT
  10    ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  11    FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  12    for more details.
  13
  14    Under Section 7 of GPL version 3, you are granted additional
  15    permissions described in the GCC Runtime Library Exception, version
  16    3.1, as published by the Free Software Foundation.
  17
  18    You should have received a copy of the GNU General Public License and
  19    a copy of the GCC Runtime Library Exception along with this program;
  20    see the files COPYING3 and COPYING.RUNTIME respectively.  If not, see
  21    <http://www.gnu.org/licenses/>.  */
  22
  23 #ifndef _SPU2VMX_H_
  24 #define _SPU2VMX_H_     1
  25
  26 #ifdef __cplusplus
  27
  28 #ifndef __SPU__
  29
  30 #include <si2vmx.h>
  31
  32 /* spu_absd (absolute difference)
  33  * ========
  34  */
  35 static __inline vec_uchar16 spu_absd(vec_uchar16 a, vec_uchar16 b)
  36 {
  37   return ((vec_uchar16)(si_absdb((qword)(a), (qword)(b))));
  38
  39 }
  40
  41
  42 /* spu_add
  43  * =======
  44  */
  45 static __inline vec_uint4 spu_add(vec_uint4 a, vec_uint4 b)
  46 {
  47   return ((vec_uint4)(si_a((qword)(a), (qword)(b))));
  48 }
  49
  50 static __inline vec_int4 spu_add(vec_int4 a, vec_int4 b)
  51 {
  52   return ((vec_int4)(si_a((qword)(a), (qword)(b))));
  53 }
  54
  55 static __inline vec_ushort8 spu_add(vec_ushort8 a, vec_ushort8 b)
  56 {
  57   return ((vec_ushort8)(si_ah((qword)(a), (qword)(b))));
  58 }
  59
  60 static __inline vec_short8 spu_add(vec_short8 a, vec_short8 b)
  61 {
  62   return ((vec_short8)(si_ah((qword)(a), (qword)(b))));
  63 }
  64
  65 static __inline vec_uint4 spu_add(vec_uint4 a, unsigned int b)
  66 {
  67   return ((vec_uint4)(si_ai((qword)(a), (int)(b))));
  68 }
  69
  70 static __inline vec_int4 spu_add(vec_int4 a, int b)
  71 {
  72   return ((vec_int4)(si_ai((qword)(a), b)));
  73 }
  74
  75 static __inline vec_ushort8 spu_add(vec_ushort8 a, unsigned short b)
  76 {
  77   return ((vec_ushort8)(si_ahi((qword)(a), (short)(b))));
  78 }
  79
  80 static __inline vec_short8 spu_add(vec_short8 a, short b)
  81 {
  82   return ((vec_short8)(si_ahi((qword)(a), b)));
  83 }
  84
  85 static __inline vec_float4 spu_add(vec_float4 a, vec_float4 b)
  86 {
  87   return ((vec_float4)(si_fa((qword)(a), (qword)(b))));
  88 }
  89
  90 static __inline vec_double2 spu_add(vec_double2 a, vec_double2 b)
  91 {
  92   return ((vec_double2)(si_dfa((qword)(a), (qword)(b))));
  93 }
  94
  95
  96 /* spu_addx
  97  * ========
  98  */
  99 static __inline vec_uint4 spu_addx(vec_uint4 a, vec_uint4 b, vec_uint4 c)
 100 {
 101   return ((vec_uint4)(si_addx((qword)(a), (qword)(b), (qword)(c))));
 102 }
 103
 104 static __inline vec_int4 spu_addx(vec_int4 a, vec_int4 b, vec_int4 c)
 105 {
 106   return ((vec_int4)(si_addx((qword)(a), (qword)(b), (qword)(c))));
 107 }
 108
 109
 110 /* spu_and
 111  * =======
 112  */
 113 static __inline vec_uchar16 spu_and(vec_uchar16 a, vec_uchar16 b)
 114 {
 115   return ((vec_uchar16)(si_and((qword)(a), (qword)(b))));
 116 }
 117
 118 static __inline vec_char16 spu_and(vec_char16 a, vec_char16 b)
 119 {
 120   return ((vec_char16)(si_and((qword)(a), (qword)(b))));
 121 }
 122
 123 static __inline vec_ushort8 spu_and(vec_ushort8 a, vec_ushort8 b)
 124 {
 125   return ((vec_ushort8)(si_and((qword)(a), (qword)(b))));
 126 }
 127
 128 static __inline vec_short8 spu_and(vec_short8 a, vec_short8 b)
 129 {
 130   return ((vec_short8)(si_and((qword)(a), (qword)(b))));
 131 }
 132
 133 static __inline vec_uint4 spu_and(vec_uint4 a, vec_uint4 b)
 134 {
 135   return ((vec_uint4)(si_and((qword)(a), (qword)(b))));
 136 }
 137
 138 static __inline vec_int4 spu_and(vec_int4 a, vec_int4 b)
 139 {
 140   return ((vec_int4)(si_and((qword)(a), (qword)(b))));
 141 }
 142
 143 static __inline vec_float4 spu_and(vec_float4 a, vec_float4 b)
 144 {
 145   return ((vec_float4)(si_and((qword)(a), (qword)(b))));
 146 }
 147
 148 static __inline vec_ullong2 spu_and(vec_ullong2 a, vec_ullong2 b)
 149 {
 150   return ((vec_ullong2)(si_and((qword)(a), (qword)(b))));
 151 }
 152
 153 static __inline vec_llong2 spu_and(vec_llong2 a, vec_llong2 b)
 154 {
 155   return ((vec_llong2)(si_and((qword)(a), (qword)(b))));
 156 }
 157
 158 static __inline vec_double2 spu_and(vec_double2 a, vec_double2 b)
 159 {
 160   return ((vec_double2)(si_and((qword)(a), (qword)(b))));
 161 }
 162
 163 static __inline vec_uchar16 spu_and(vec_uchar16 a, unsigned char b)
 164 {
 165   return ((vec_uchar16)(si_andbi((qword)(a), (signed char)(b))));
 166 }
 167
 168
 169 static __inline vec_char16 spu_and(vec_char16 a, signed char b)
 170 {
 171   return ((vec_char16)(si_andbi((qword)(a), b)));
 172 }
 173
 174 static __inline vec_ushort8 spu_and(vec_ushort8 a, unsigned short b)
 175 {
 176   return ((vec_ushort8)(si_andhi((qword)(a), (signed short)(b))));
 177 }
 178
 179 static __inline vec_short8 spu_and(vec_short8 a, signed short b)
 180 {
 181   return ((vec_short8)(si_andhi((qword)(a), b)));
 182 }
 183
 184 static __inline vec_uint4 spu_and(vec_uint4 a, unsigned int b)
 185 {
 186   return ((vec_uint4)(si_andi((qword)(a), (signed int)(b))));
 187 }
 188
 189 static __inline vec_int4 spu_and(vec_int4 a, signed int b)
 190 {
 191   return ((vec_int4)(si_andi((qword)(a), b)));
 192 }
 193
 194
 195 /* spu_andc
 196  * ========
 197  */
 198 #define spu_andc(_a, _b)        vec_andc(_a, _b)
 199
 200
 201 /* spu_avg
 202  * =======
 203  */
 204 #define spu_avg(_a, _b)         vec_avg(_a, _b)
 205
 206
 207 /* spu_bisled
 208  * spu_bisled_d
 209  * spu_bisled_e
 210  * ============
 211  */
 212 #define spu_bisled(_func)       /* not mappable */
 213 #define spu_bisled_d(_func)     /* not mappable */
 214 #define spu_bisled_e(_func)     /* not mappable */
 215
 216 /* spu_cmpabseq
 217  * ============
 218  */
 219 static __inline vec_uint4 spu_cmpabseq(vec_float4 a, vec_float4 b)
 220 {
 221   return ((vec_uint4)(si_fcmeq((qword)(a), (qword)(b))));
 222
 223 }
 224
 225 static __inline vec_ullong2 spu_cmpabseq(vec_double2 a, vec_double2 b)
 226 {
 227   return ((vec_ullong2)(si_dfcmeq((qword)(a), (qword)(b))));
 228 }
 229
 230
 231 /* spu_cmpabsgt
 232  * ============
 233  */
 234 static __inline vec_uint4 spu_cmpabsgt(vec_float4 a, vec_float4 b)
 235 {
 236   return ((vec_uint4)(si_fcmgt((qword)(a), (qword)(b))));
 237 }
 238
 239 static __inline vec_ullong2 spu_cmpabsgt(vec_double2 a, vec_double2 b)
 240 {
 241   return ((vec_ullong2)(si_dfcmgt((qword)(a), (qword)(b))));
 242 }
 243
 244
 245 /* spu_cmpeq
 246  * ========
 247  */
 248 static __inline vec_uchar16 spu_cmpeq(vec_uchar16 a, vec_uchar16 b)
 249 {
 250   return ((vec_uchar16)(si_ceqb((qword)(a), (qword)(b))));
 251 }
 252
 253 static __inline vec_uchar16 spu_cmpeq(vec_char16 a, vec_char16 b)
 254 {
 255   return ((vec_uchar16)(si_ceqb((qword)(a), (qword)(b))));
 256 }
 257
 258 static __inline vec_ushort8 spu_cmpeq(vec_ushort8 a, vec_ushort8 b)
 259 {
 260   return ((vec_ushort8)(si_ceqh((qword)(a), (qword)(b))));
 261 }
 262
 263 static __inline vec_ushort8 spu_cmpeq(vec_short8 a, vec_short8 b)
 264 {
 265   return ((vec_ushort8)(si_ceqh((qword)(a), (qword)(b))));
 266 }
 267
 268 static __inline vec_uint4 spu_cmpeq(vec_uint4 a, vec_uint4 b)
 269 {
 270   return ((vec_uint4)(si_ceq((qword)(a), (qword)(b))));
 271 }
 272
 273 static __inline vec_uint4 spu_cmpeq(vec_int4 a, vec_int4 b)
 274 {
 275   return ((vec_uint4)(si_ceq((qword)(a), (qword)(b))));
 276 }
 277
 278 static __inline vec_uint4 spu_cmpeq(vec_float4 a, vec_float4 b)
 279 {
 280   return ((vec_uint4)(si_fceq((qword)(a), (qword)(b))));
 281 }
 282
 283 static __inline vec_uchar16 spu_cmpeq(vec_uchar16 a, unsigned char b)
 284 {
 285   return ((vec_uchar16)(si_ceqbi((qword)(a), (signed char)(b))));
 286 }
 287
 288 static __inline vec_uchar16 spu_cmpeq(vec_char16 a, signed char b)
 289 {
 290   return ((vec_uchar16)(si_ceqbi((qword)(a), b)));
 291 }
 292
 293 static __inline vec_ushort8 spu_cmpeq(vec_ushort8 a, unsigned short b)
 294 {
 295   return ((vec_ushort8)(si_ceqhi((qword)(a), (signed short)(b))));
 296 }
 297
 298 static __inline vec_ushort8 spu_cmpeq(vec_short8 a, signed short b)
 299 {
 300   return ((vec_ushort8)(si_ceqhi((qword)(a), b)));
 301 }
 302
 303 static __inline vec_uint4 spu_cmpeq(vec_uint4 a, unsigned int b)
 304 {
 305   return ((vec_uint4)(si_ceqi((qword)(a), (signed int)(b))));
 306 }
 307
 308 static __inline vec_uint4 spu_cmpeq(vec_int4 a, signed int b)
 309 {
 310   return ((vec_uint4)(si_ceqi((qword)(a), b)));
 311 }
 312
 313 static __inline vec_ullong2 spu_cmpeq(vec_double2 a, vec_double2 b)
 314 {
 315   return ((vec_ullong2)(si_dfceq((qword)(a), (qword)(b))));
 316 }
 317
 318
 319 /* spu_cmpgt
 320  * ========
 321  */
 322 static __inline vec_uchar16 spu_cmpgt(vec_uchar16 a, vec_uchar16 b)
 323 {
 324   return ((vec_uchar16)(si_clgtb((qword)(a), (qword)(b))));
 325 }
 326
 327 static __inline vec_uchar16 spu_cmpgt(vec_char16 a, vec_char16 b)
 328 {
 329   return ((vec_uchar16)(si_cgtb((qword)(a), (qword)(b))));
 330 }
 331
 332 static __inline vec_ushort8 spu_cmpgt(vec_ushort8 a, vec_ushort8 b)
 333 {
 334   return ((vec_ushort8)(si_clgth((qword)(a), (qword)(b))));
 335 }
 336
 337 static __inline vec_ushort8 spu_cmpgt(vec_short8 a, vec_short8 b)
 338 {
 339   return ((vec_ushort8)(si_cgth((qword)(a), (qword)(b))));
 340 }
 341
 342 static __inline vec_uint4 spu_cmpgt(vec_uint4 a, vec_uint4 b)
 343 {
 344   return ((vec_uint4)(si_clgt((qword)(a), (qword)(b))));
 345 }
 346
 347 static __inline vec_uint4 spu_cmpgt(vec_int4 a, vec_int4 b)
 348 {
 349   return ((vec_uint4)(si_cgt((qword)(a), (qword)(b))));
 350 }
 351
 352 static __inline vec_uint4 spu_cmpgt(vec_float4 a, vec_float4 b)
 353 {
 354   return ((vec_uint4)(si_fcgt((qword)(a), (qword)(b))));
 355 }
 356
 357 static __inline vec_uchar16 spu_cmpgt(vec_uchar16 a, unsigned char b)
 358 {
 359   return ((vec_uchar16)(si_clgtbi((qword)(a), b)));
 360 }
 361
 362 static __inline vec_uchar16 spu_cmpgt(vec_char16 a, signed char b)
 363 {
 364   return ((vec_uchar16)(si_cgtbi((qword)(a), b)));
 365 }
 366
 367 static __inline vec_ushort8 spu_cmpgt(vec_ushort8 a, unsigned short b)
 368 {
 369   return ((vec_ushort8)(si_clgthi((qword)(a), b)));
 370 }
 371
 372 static __inline vec_ushort8 spu_cmpgt(vec_short8 a, signed short b)
 373 {
 374   return ((vec_ushort8)(si_cgthi((qword)(a), b)));
 375 }
 376
 377 static __inline vec_uint4 spu_cmpgt(vec_uint4 a, unsigned int b)
 378 {
 379   return ((vec_uint4)(si_clgti((qword)(a), b)));
 380 }
 381
 382 static __inline vec_uint4 spu_cmpgt(vec_int4 a, signed int b)
 383 {
 384   return ((vec_uint4)(si_cgti((qword)(a), b)));
 385 }
 386
 387 static __inline vec_ullong2 spu_cmpgt(vec_double2 a, vec_double2 b)
 388 {
 389   return ((vec_ullong2)(si_dfcgt((qword)(a), (qword)(b))));
 390 }
 391
 392
 393 /* spu_cntb
 394  * ========
 395  */
 396 static __inline vec_uchar16 spu_cntb(vec_uchar16 a)
 397 {
 398   return ((vec_uchar16)(si_cntb((qword)(a))));
 399 }
 400
 401
 402 static __inline vec_uchar16 spu_cntb(vec_char16 a)
 403 {
 404   return ((vec_uchar16)(si_cntb((qword)(a))));
 405 }
 406
 407 /* spu_cntlz
 408  * =========
 409  */
 410 static __inline vec_uint4 spu_cntlz(vec_uint4 a)
 411 {
 412   return ((vec_uint4)(si_clz((qword)(a))));
 413 }
 414
 415 static __inline vec_uint4 spu_cntlz(vec_int4 a)
 416 {
 417   return ((vec_uint4)(si_clz((qword)(a))));
 418 }
 419
 420 static __inline vec_uint4 spu_cntlz(vec_float4 a)
 421 {
 422   return ((vec_uint4)(si_clz((qword)(a))));
 423 }
 424
 425 /* spu_testsv
 426  * ==========
 427  */
 428 static __inline vec_ullong2 spu_testsv(vec_double2 a, char b)
 429 {
 430   return ((vec_ullong2)(si_dftsv((qword)(a), b)));
 431 }
 432
 433 /* spu_convtf
 434  * ==========
 435  */
 436 #define spu_convtf(_a, _b)      (vec_ctf(_a, _b))
 437
 438 /* spu_convts
 439  * ==========
 440  */
 441 #define spu_convts(_a, _b)      (vec_cts(_a, _b))
 442
 443 /* spu_convtu
 444  * ==========
 445  */
 446 #define spu_convtu(_a, _b)      (vec_ctu(_a, _b))
 447
 448
 449 /* spu_dsync
 450  * ========
 451  */
 452 #define spu_dsync()
 453
 454 /* spu_eqv
 455  * =======
 456  */
 457 static __inline vec_uchar16 spu_eqv(vec_uchar16 a, vec_uchar16 b)
 458 {
 459   return ((vec_uchar16)(si_eqv((qword)(a), (qword)(b))));
 460 }
 461
 462 static __inline vec_char16 spu_eqv(vec_char16 a, vec_char16 b)
 463 {
 464   return ((vec_char16)(si_eqv((qword)(a), (qword)(b))));
 465 }
 466
 467 static __inline vec_ushort8 spu_eqv(vec_ushort8 a, vec_ushort8 b)
 468 {
 469   return ((vec_ushort8)(si_eqv((qword)(a), (qword)(b))));
 470 }
 471
 472 static __inline vec_short8 spu_eqv(vec_short8 a, vec_short8 b)
 473 {
 474   return ((vec_short8)(si_eqv((qword)(a), (qword)(b))));
 475 }
 476
 477 static __inline vec_uint4 spu_eqv(vec_uint4 a, vec_uint4 b)
 478 {
 479   return ((vec_uint4)(si_eqv((qword)(a), (qword)(b))));
 480 }
 481
 482 static __inline vec_int4 spu_eqv(vec_int4 a, vec_int4 b)
 483 {
 484   return ((vec_int4)(si_eqv((qword)(a), (qword)(b))));
 485 }
 486
 487 static __inline vec_float4 spu_eqv(vec_float4 a, vec_float4 b)
 488 {
 489   return ((vec_float4)(si_eqv((qword)(a), (qword)(b))));
 490 }
 491
 492 static __inline vec_ullong2 spu_eqv(vec_ullong2 a, vec_ullong2 b)
 493 {
 494   return ((vec_ullong2)(si_eqv((qword)(a), (qword)(b))));
 495 }
 496
 497 static __inline vec_llong2 spu_eqv(vec_llong2 a, vec_llong2 b)
 498 {
 499   return ((vec_llong2)(si_eqv((qword)(a), (qword)(b))));
 500 }
 501
 502 static __inline vec_double2 spu_eqv(vec_double2 a, vec_double2 b)
 503 {
 504   return ((vec_double2)(si_eqv((qword)(a), (qword)(b))));
 505 }
 506
 507 /* spu_extend
 508  * ========
 509  */
 510 static __inline vec_short8 spu_extend(vec_char16 a)
 511 {
 512   return ((vec_short8)(si_xsbh((qword)(a))));
 513 }
 514
 515
 516 static __inline vec_int4 spu_extend(vec_short8 a)
 517 {
 518   return ((vec_int4)(si_xshw((qword)(a))));
 519 }
 520
 521 static __inline vec_llong2 spu_extend(vec_int4 a)
 522 {
 523   return ((vec_llong2)(si_xswd((qword)(a))));
 524 }
 525
 526
 527 static __inline vec_double2 spu_extend(vec_float4 a)
 528 {
 529   return ((vec_double2)(si_fesd((qword)(a))));
 530 }
 531
 532
 533 /* spu_extract
 534  * ========
 535  */
 536 static __inline unsigned char spu_extract(vec_uchar16 a, int element)
 537 {
 538   union {
 539     vec_uchar16 v;
 540     unsigned char c[16];
 541   } in;
 542
 543   in.v = a;
 544   return (in.c[element & 15]);
 545 }
 546
 547 static __inline signed char spu_extract(vec_char16 a, int element)
 548 {
 549   union {
 550     vec_char16 v;
 551     signed char c[16];
 552   } in;
 553
 554   in.v = a;
 555   return (in.c[element & 15]);
 556 }
 557
 558 static __inline unsigned short spu_extract(vec_ushort8 a, int element)
 559 {
 560   union {
 561     vec_ushort8 v;
 562     unsigned short s[8];
 563   } in;
 564
 565   in.v = a;
 566   return (in.s[element & 7]);
 567 }
 568
 569 static __inline signed short spu_extract(vec_short8 a, int element)
 570 {
 571   union {
 572     vec_short8 v;
 573     signed short s[8];
 574   } in;
 575
 576   in.v = a;
 577   return (in.s[element & 7]);
 578 }
 579
 580 static __inline unsigned int spu_extract(vec_uint4 a, int element)
 581 {
 582   union {
 583     vec_uint4 v;
 584     unsigned int i[4];
 585   } in;
 586
 587   in.v = a;
 588   return (in.i[element & 3]);
 589 }
 590
 591 static __inline signed int spu_extract(vec_int4 a, int element)
 592 {
 593   union {
 594     vec_int4 v;
 595     signed int i[4];
 596   } in;
 597
 598   in.v = a;
 599   return (in.i[element & 3]);
 600 }
 601
 602 static __inline float spu_extract(vec_float4 a, int element)
 603 {
 604   union {
 605     vec_float4 v;
 606     float f[4];
 607   } in;
 608
 609   in.v = a;
 610   return (in.f[element & 3]);
 611 }
 612
 613 static __inline unsigned long long  spu_extract(vec_ullong2 a, int element)
 614 {
 615   union {
 616     vec_ullong2 v;
 617     unsigned long long l[2];
 618   } in;
 619
 620   in.v = a;
 621   return (in.l[element & 1]);
 622 }
 623
 624 static __inline signed long long  spu_extract(vec_llong2 a, int element)
 625 {
 626   union {
 627     vec_llong2 v;
 628     signed long long l[2];
 629   } in;
 630
 631   in.v = a;
 632   return (in.l[element & 1]);
 633 }
 634
 635 static __inline double spu_extract(vec_double2 a, int element)
 636 {
 637   union {
 638     vec_double2 v;
 639     double d[2];
 640   } in;
 641
 642   in.v = a;
 643   return (in.d[element & 1]);
 644 }
 645
 646 /* spu_gather
 647  * ========
 648  */
 649 static __inline vec_uint4 spu_gather(vec_uchar16 a)
 650 {
 651   return ((vec_uint4)(si_gbb((qword)(a))));
 652 }
 653
 654
 655 static __inline vec_uint4 spu_gather(vec_char16 a)
 656 {
 657   return ((vec_uint4)(si_gbb((qword)(a))));
 658 }
 659
 660 static __inline vec_uint4 spu_gather(vec_ushort8 a)
 661 {
 662   return ((vec_uint4)(si_gbh((qword)(a))));
 663 }
 664
 665 static __inline vec_uint4 spu_gather(vec_short8 a)
 666 {
 667   return ((vec_uint4)(si_gbh((qword)(a))));
 668 }
 669
 670
 671 static __inline vec_uint4 spu_gather(vec_uint4 a)
 672 {
 673   return ((vec_uint4)(si_gb((qword)(a))));
 674 }
 675
 676 static __inline vec_uint4 spu_gather(vec_int4 a)
 677 {
 678   return ((vec_uint4)(si_gb((qword)(a))));
 679 }
 680
 681 static __inline vec_uint4 spu_gather(vec_float4 a)
 682 {
 683   return ((vec_uint4)(si_gb((qword)(a))));
 684 }
 685
 686 /* spu_genb
 687  * ========
 688  */
 689 static __inline vec_uint4 spu_genb(vec_uint4 a, vec_uint4 b)
 690 {
 691   return ((vec_uint4)(si_bg((qword)(b), (qword)(a))));
 692 }
 693
 694 static __inline vec_int4 spu_genb(vec_int4 a, vec_int4 b)
 695 {
 696   return ((vec_int4)(si_bg((qword)(b), (qword)(a))));
 697 }
 698
 699 /* spu_genbx
 700  * =========
 701  */
 702 static __inline vec_uint4 spu_genbx(vec_uint4 a, vec_uint4 b, vec_uint4 c)
 703 {
 704   return ((vec_uint4)(si_bgx((qword)(b), (qword)(a), (qword)(c))));
 705 }
 706
 707 static __inline vec_int4 spu_genbx(vec_int4 a, vec_int4 b, vec_int4 c)
 708 {
 709   return ((vec_int4)(si_bgx((qword)(b), (qword)(a), (qword)(c))));
 710 }
 711
 712
 713 /* spu_genc
 714  * ========
 715  */
 716 static __inline vec_uint4 spu_genc(vec_uint4 a, vec_uint4 b)
 717 {
 718   return ((vec_uint4)(si_cg((qword)(a), (qword)(b))));
 719 }
 720
 721 static __inline vec_int4 spu_genc(vec_int4 a, vec_int4 b)
 722 {
 723   return ((vec_int4)(si_cg((qword)(a), (qword)(b))));
 724 }
 725
 726 /* spu_gencx
 727  * =========
 728  */
 729 static __inline vec_uint4 spu_gencx(vec_uint4 a, vec_uint4 b, vec_uint4 c)
 730 {
 731   return ((vec_uint4)(si_cgx((qword)(a), (qword)(b), (qword)(c))));
 732 }
 733
 734 static __inline vec_int4 spu_gencx(vec_int4 a, vec_int4 b, vec_int4 c)
 735 {
 736   return ((vec_int4)(si_cgx((qword)(a), (qword)(b), (qword)(c))));
 737 }
 738
 739
 740 /* spu_hcmpeq
 741  * ========
 742  */
 743 #define spu_hcmpeq(_a, _b)      if (_a == _b) { SPU_HALT_ACTION; };
 744
 745
 746 /* spu_hcmpgt
 747  * ========
 748  */
 749 #define spu_hcmpgt(_a, _b)      if (_a > _b) { SPU_HALT_ACTION; };
 750
 751
 752 /* spu_idisable
 753  * ============
 754  */
 755 #define spu_idisable()          SPU_UNSUPPORTED_ACTION
 756
 757
 758 /* spu_ienable
 759  * ===========
 760  */
 761 #define spu_ienable()           SPU_UNSUPPORTED_ACTION
 762
 763
 764 /* spu_insert
 765  * ========
 766  */
 767 static __inline vec_uchar16 spu_insert(unsigned char a, vec_uchar16 b, int element)
 768 {
 769   union {
 770     vec_uchar16 v;
 771     unsigned char c[16];
 772   } in;
 773
 774   in.v = b;
 775   in.c[element & 15] = a;
 776   return (in.v);
 777 }
 778
 779 static __inline vec_char16 spu_insert(signed char a, vec_char16 b, int element)
 780 {
 781   return ((vec_char16)spu_insert((unsigned char)(a), (vec_uchar16)(b), element));
 782 }
 783
 784 static __inline vec_ushort8 spu_insert(unsigned short a, vec_ushort8 b, int element)
 785 {
 786   union {
 787     vec_ushort8 v;
 788     unsigned short s[8];
 789   } in;
 790
 791   in.v = b;
 792   in.s[element & 7] = a;
 793   return (in.v);
 794 }
 795
 796 static __inline vec_short8 spu_insert(signed short a, vec_short8 b, int element)
 797 {
 798   return ((vec_short8)spu_insert((unsigned short)(a), (vec_ushort8)(b), element));
 799 }
 800
 801 static __inline vec_uint4 spu_insert(unsigned int a, vec_uint4 b, int element)
 802 {
 803   union {
 804     vec_uint4 v;
 805     unsigned int i[4];
 806   } in;
 807
 808   in.v = b;
 809   in.i[element & 3] = a;
 810   return (in.v);
 811 }
 812
 813 static __inline vec_int4 spu_insert(signed int a, vec_int4 b, int element)
 814 {
 815   return ((vec_int4)spu_insert((unsigned int)(a), (vec_uint4)(b), element));
 816 }
 817
 818 static __inline vec_float4 spu_insert(float a, vec_float4 b, int element)
 819 {
 820   union {
 821     vec_float4 v;
 822     float f[4];
 823   } in;
 824
 825   in.v = b;
 826   in.f[element & 3] = a;
 827   return (in.v);
 828 }
 829
 830 static __inline vec_ullong2 spu_insert(unsigned long long a, vec_ullong2 b, int element)
 831 {
 832   union {
 833     vec_ullong2 v;
 834     unsigned long long l[2];
 835   } in;
 836
 837   in.v = b;
 838   in.l[element & 1] = a;
 839   return (in.v);
 840 }
 841
 842 static __inline vec_llong2 spu_insert(signed long long a, vec_llong2 b, int element)
 843 {
 844   return ((vec_llong2)spu_insert((unsigned long long)(a), (vec_ullong2)(b), element));
 845 }
 846
 847 static __inline vec_double2 spu_insert(double a, vec_double2 b, int element)
 848 {
 849   union {
 850     vec_double2 v;
 851     double d[2];
 852   } in;
 853
 854   in.v = b;
 855   in.d[element & 1] = a;
 856   return (in.v);
 857 }
 858
 859
 860 /* spu_madd
 861  * ========
 862  */
 863 static __inline vec_int4 spu_madd(vec_short8 a, vec_short8 b, vec_int4 c)
 864 {
 865   return ((vec_int4)(si_mpya((qword)(a), (qword)(b), (qword)(c))));
 866 }
 867
 868 static __inline vec_float4 spu_madd(vec_float4 a, vec_float4 b, vec_float4 c)
 869 {
 870   return ((vec_float4)(si_fma((qword)(a), (qword)(b), (qword)(c))));
 871 }
 872
 873 static __inline vec_double2 spu_madd(vec_double2 a, vec_double2 b, vec_double2 c)
 874 {
 875   return ((vec_double2)(si_dfma((qword)(a), (qword)(b), (qword)(c))));
 876 }
 877
 878
 879 /* spu_maskb
 880  * ========
 881  */
 882 #define spu_maskb(_a)   (vec_uchar16)(si_fsmb(si_from_int((int)(_a))))
 883
 884 /* spu_maskh
 885  * ========
 886  */
 887 #define spu_maskh(_a)   (vec_ushort8)(si_fsmh(si_from_int((int)(_a))))
 888
 889
 890 /* spu_maskw
 891  * ========
 892  */
 893 #define spu_maskw(_a)   (vec_uint4)(si_fsm(si_from_int((int)(_a))))
 894
 895
 896 /* spu_mfcdma32
 897  * ========
 898  */
 899 #define spu_mfcdma32(_ls, _ea, _size, _tagid, _cmd)
 900
 901
 902 /* spu_mfcdma64
 903  * ========
 904  */
 905 #define spu_mfcdma64(_ls, _eahi, _ealow,  _size, _tagid, _cmd)
 906
 907 /* spu_mfcstat
 908  * ========
 909  */
 910 #define spu_mfcstat(_type)      0xFFFFFFFF
 911
 912
 913
 914 /* spu_mffpscr
 915  * ===========
 916  */
 917 #define spu_mffpscr()           (vec_uint4)(si_fscrrd())
 918
 919
 920 /* spu_mfspr
 921  * ========
 922  */
 923
 924 #define spu_mfspr(_reg)         si_to_uint(si_mfspr(_reg))
 925
 926
 927
 928 /* spu_mhhadd
 929  * ==========
 930  */
 931 static __inline vec_int4 spu_mhhadd(vec_short8 a, vec_short8 b, vec_int4 c)
 932 {
 933   return ((vec_int4)(si_mpyhha((qword)(a), (qword)(b), (qword)(c))));
 934 }
 935
 936
 937 static __inline vec_uint4 spu_mhhadd(vec_ushort8 a, vec_ushort8 b, vec_uint4 c)
 938 {
 939   return ((vec_uint4)(si_mpyhhau((qword)(a), (qword)(b), (qword)(c))));
 940 }
 941
 942
 943 /* spu_msub
 944  * ========
 945  */
 946 static __inline vec_float4 spu_msub(vec_float4 a, vec_float4 b, vec_float4 c)
 947 {
 948   return ((vec_float4)(si_fms((qword)(a), (qword)(b), (qword)(c))));
 949 }
 950
 951 static __inline vec_double2 spu_msub(vec_double2 a, vec_double2 b, vec_double2 c)
 952 {
 953   return ((vec_double2)(si_dfms((qword)(a), (qword)(b), (qword)(c))));
 954 }
 955
 956
 957 /* spu_mtfpscr
 958  * ===========
 959  */
 960 #define spu_mtfpscr(_a)
 961
 962
 963 /* spu_mtspr
 964  * ========
 965  */
 966 #define spu_mtspr(_reg, _a)
 967
 968
 969 /* spu_mul
 970  * ========
 971  */
 972 static __inline vec_float4 spu_mul(vec_float4 a, vec_float4 b)
 973 {
 974   return ((vec_float4)(si_fm((qword)(a), (qword)(b))));
 975 }
 976
 977 static __inline vec_double2 spu_mul(vec_double2 a, vec_double2 b)
 978 {
 979   return ((vec_double2)(si_dfm((qword)(a), (qword)(b))));
 980 }
 981
 982
 983 /* spu_mulh
 984  * ========
 985  */
 986 static __inline vec_int4 spu_mulh(vec_short8 a, vec_short8 b)
 987 {
 988   return ((vec_int4)(si_mpyh((qword)(a), (qword)(b))));
 989 }
 990
 991 /* spu_mule
 992  * =========
 993  */
 994 #define spu_mule(_a, _b)        vec_mule(_a, _b)
 995
 996
 997
 998 /* spu_mulo
 999  * ========
1000  */
1001 static __inline vec_int4 spu_mulo(vec_short8 a, vec_short8 b)
1002 {
1003   return ((vec_int4)(si_mpy((qword)(a), (qword)(b))));
1004 }
1005
1006
1007 static __inline vec_uint4 spu_mulo(vec_ushort8 a, vec_ushort8 b)
1008 {
1009   return ((vec_uint4)(si_mpyu((qword)(a), (qword)(b))));
1010 }
1011
1012
1013 static __inline vec_int4 spu_mulo(vec_short8 a, short b)
1014 {
1015   return ((vec_int4)(si_mpyi((qword)(a), b)));
1016 }
1017
1018 static __inline vec_uint4 spu_mulo(vec_ushort8 a, unsigned short b)
1019 {
1020   return ((vec_uint4)(si_mpyui((qword)(a), b)));
1021 }
1022
1023
1024 /* spu_mulsr
1025  * =========
1026  */
1027 static __inline vec_int4 spu_mulsr(vec_short8 a, vec_short8 b)
1028 {
1029   return ((vec_int4)(si_mpys((qword)(a), (qword)(b))));
1030 }
1031
1032
1033 /* spu_nand
1034  * ========
1035  */
1036 static __inline vec_uchar16 spu_nand(vec_uchar16 a, vec_uchar16 b)
1037 {
1038   return ((vec_uchar16)(si_nand((qword)(a), (qword)(b))));
1039 }
1040
1041 static __inline vec_char16 spu_nand(vec_char16 a, vec_char16 b)
1042 {
1043   return ((vec_char16)(si_nand((qword)(a), (qword)(b))));
1044 }
1045
1046 static __inline vec_ushort8 spu_nand(vec_ushort8 a, vec_ushort8 b)
1047 {
1048   return ((vec_ushort8)(si_nand((qword)(a), (qword)(b))));
1049 }
1050
1051 static __inline vec_short8 spu_nand(vec_short8 a, vec_short8 b)
1052 {
1053   return ((vec_short8)(si_nand((qword)(a), (qword)(b))));
1054 }
1055
1056 static __inline vec_uint4 spu_nand(vec_uint4 a, vec_uint4 b)
1057 {
1058   return ((vec_uint4)(si_nand((qword)(a), (qword)(b))));
1059 }
1060
1061 static __inline vec_int4 spu_nand(vec_int4 a, vec_int4 b)
1062 {
1063   return ((vec_int4)(si_nand((qword)(a), (qword)(b))));
1064 }
1065
1066 static __inline vec_float4 spu_nand(vec_float4 a, vec_float4 b)
1067 {
1068   return ((vec_float4)(si_nand((qword)(a), (qword)(b))));
1069 }
1070
1071 static __inline vec_ullong2 spu_nand(vec_ullong2 a, vec_ullong2 b)
1072 {
1073   return ((vec_ullong2)(si_nand((qword)(a), (qword)(b))));
1074 }
1075
1076 static __inline vec_llong2 spu_nand(vec_llong2 a, vec_llong2 b)
1077 {
1078   return ((vec_llong2)(si_nand((qword)(a), (qword)(b))));
1079 }
1080
1081 static __inline vec_double2 spu_nand(vec_double2 a, vec_double2 b)
1082 {
1083   return ((vec_double2)(si_nand((qword)(a), (qword)(b))));
1084 }
1085
1086
1087 /* spu_nmadd
1088  * =========
1089  */
1090 static __inline vec_double2 spu_nmadd(vec_double2 a, vec_double2 b, vec_double2 c)
1091 {
1092   return ((vec_double2)(si_dfnma((qword)(a), (qword)(b), (qword)(c))));
1093 }
1094
1095
1096 /* spu_nmsub
1097  * =========
1098  */
1099 static __inline vec_float4 spu_nmsub(vec_float4 a, vec_float4 b, vec_float4 c)
1100 {
1101   return ((vec_float4)(si_fnms((qword)(a), (qword)(b), (qword)(c))));
1102 }
1103
1104 static __inline vec_double2 spu_nmsub(vec_double2 a, vec_double2 b, vec_double2 c)
1105 {
1106   return ((vec_double2)(si_dfnms((qword)(a), (qword)(b), (qword)(c))));
1107 }
1108
1109
/* spu_nor
 * =======
 * Direct alias: both arguments are passed unchanged to vec_nor.
 */
#define spu_nor(a, b)           vec_nor (a, b)
1114
1115
1116 /* spu_or
1117  * ======
1118  */
1119 static __inline vec_uchar16 spu_or(vec_uchar16 a, vec_uchar16 b)
1120 {
1121   return ((vec_uchar16)(si_or((qword)(a), (qword)(b))));
1122 }
1123
1124 static __inline vec_char16 spu_or(vec_char16 a, vec_char16 b)
1125 {
1126   return ((vec_char16)(si_or((qword)(a), (qword)(b))));
1127 }
1128
1129 static __inline vec_ushort8 spu_or(vec_ushort8 a, vec_ushort8 b)
1130 {
1131   return ((vec_ushort8)(si_or((qword)(a), (qword)(b))));
1132 }
1133
1134 static __inline vec_short8 spu_or(vec_short8 a, vec_short8 b)
1135 {
1136   return ((vec_short8)(si_or((qword)(a), (qword)(b))));
1137 }
1138
1139 static __inline vec_uint4 spu_or(vec_uint4 a, vec_uint4 b)
1140 {
1141   return ((vec_uint4)(si_or((qword)(a), (qword)(b))));
1142 }
1143
1144 static __inline vec_int4 spu_or(vec_int4 a, vec_int4 b)
1145 {
1146   return ((vec_int4)(si_or((qword)(a), (qword)(b))));
1147 }
1148
1149 static __inline vec_float4 spu_or(vec_float4 a, vec_float4 b)
1150 {
1151   return ((vec_float4)(si_or((qword)(a), (qword)(b))));
1152 }
1153
1154 static __inline vec_ullong2 spu_or(vec_ullong2 a, vec_ullong2 b)
1155 {
1156   return ((vec_ullong2)(si_or((qword)(a), (qword)(b))));
1157 }
1158
1159 static __inline vec_llong2 spu_or(vec_llong2 a, vec_llong2 b)
1160 {
1161   return ((vec_llong2)(si_or((qword)(a), (qword)(b))));
1162 }
1163
1164 static __inline vec_double2 spu_or(vec_double2 a, vec_double2 b)
1165 {
1166   return ((vec_double2)(si_or((qword)(a), (qword)(b))));
1167 }
1168
1169
1170 static __inline vec_uchar16 spu_or(vec_uchar16 a, unsigned char b)
1171 {
1172   return ((vec_uchar16)(si_orbi((qword)(a), b)));
1173 }
1174
1175 static __inline vec_char16 spu_or(vec_char16 a, signed char b)
1176 {
1177   return ((vec_char16)(si_orbi((qword)(a), (unsigned char)(b))));
1178 }
1179
1180 static __inline vec_ushort8 spu_or(vec_ushort8 a, unsigned short b)
1181 {
1182   return ((vec_ushort8)(si_orhi((qword)(a), b)));
1183 }
1184
1185 static __inline vec_short8 spu_or(vec_short8 a, signed short b)
1186 {
1187   return ((vec_short8)(si_orhi((qword)(a), (unsigned short)(b))));
1188 }
1189
1190 static __inline vec_uint4 spu_or(vec_uint4 a, unsigned int b)
1191 {
1192   return ((vec_uint4)(si_ori((qword)(a), b)));
1193 }
1194
1195 static __inline vec_int4 spu_or(vec_int4 a, signed int b)
1196 {
1197   return ((vec_int4)(si_ori((qword)(a), (unsigned int)(b))));
1198 }
1199
1200
/* spu_orc
 * =======
 * Expands to vec_or of the first argument with vec_nor of the second
 * argument against itself.
 *
 * NOTE: the second argument appears twice in the expansion, so an
 * argument expression with side effects is evaluated twice.
 */
#define spu_orc(a, b)           vec_or (a, vec_nor (b, b))
1205
1206
1207 /* spu_orx
1208  * =======
1209  */
1210 static __inline vec_uint4 spu_orx(vec_uint4 a)
1211 {
1212   return ((vec_uint4)(si_orx((qword)(a))));
1213 }
1214
1215 static __inline vec_int4 spu_orx(vec_int4 a)
1216 {
1217   return ((vec_int4)(si_orx((qword)(a))));
1218 }
1219
1220
1221 /* spu_promote
1222  * ===========
1223  */
1224 static __inline vec_uchar16 spu_promote(unsigned char a, int element)
1225 {
1226   union {
1227     vec_uchar16 v;
1228     unsigned char c[16];
1229   } in;
1230
1231   in.c[element & 15] = a;
1232   return (in.v);
1233 }
1234
1235 static __inline vec_char16 spu_promote(signed char a, int element)
1236 {
1237   union {
1238     vec_char16 v;
1239     signed char c[16];
1240   } in;
1241
1242   in.c[element & 15] = a;
1243   return (in.v);
1244 }
1245
1246 static __inline vec_ushort8 spu_promote(unsigned short a, int element)
1247 {
1248   union {
1249     vec_ushort8 v;
1250     unsigned short s[8];
1251   } in;
1252
1253   in.s[element & 7] = a;
1254   return (in.v);
1255 }
1256
1257 static __inline vec_short8 spu_promote(signed short a, int element)
1258 {
1259   union {
1260     vec_short8 v;
1261     signed short s[8];
1262   } in;
1263
1264   in.s[element & 7] = a;
1265   return (in.v);
1266 }
1267
1268 static __inline vec_uint4 spu_promote(unsigned int a, int element)
1269 {
1270   union {
1271     vec_uint4 v;
1272     unsigned int i[4];
1273   } in;
1274
1275   in.i[element & 3] = a;
1276   return (in.v);
1277 }
1278
1279 static __inline vec_int4 spu_promote(signed int a, int element)
1280 {
1281   union {
1282     vec_int4 v;
1283     signed int i[4];
1284   } in;
1285
1286   in.i[element & 3] = a;
1287   return (in.v);
1288 }
1289
1290 static __inline vec_float4 spu_promote(float a, int element)
1291 {
1292   union {
1293     vec_float4 v;
1294     float f[4];
1295   } in;
1296
1297   in.f[element & 3] = a;
1298   return (in.v);
1299 }
1300
1301 static __inline vec_ullong2 spu_promote(unsigned long long a, int element)
1302 {
1303   union {
1304     vec_ullong2 v;
1305     unsigned long long l[2];
1306   } in;
1307
1308   in.l[element & 1] = a;
1309   return (in.v);
1310 }
1311
1312 static __inline vec_llong2 spu_promote(signed long long a, int element)
1313 {
1314   union {
1315     vec_llong2 v;
1316     signed long long l[2];
1317   } in;
1318
1319   in.l[element & 1] = a;
1320   return (in.v);
1321 }
1322
1323 static __inline vec_double2 spu_promote(double a, int element)
1324 {
1325   union {
1326     vec_double2 v;
1327     double d[2];
1328   } in;
1329
1330   in.d[element & 1] = a;
1331   return (in.v);
1332 }
1333
/* spu_re
 * ======
 * Forwarded unchanged to the VMX vec_re intrinsic.
 */
#define spu_re(_a)      vec_re(_a)
1338
1339
/* spu_readch
 * ==========
 * Not mappable to VMX: always expands to the constant 0.  The _channel
 * argument is dropped without being evaluated.
 */
#define spu_readch(_channel)    (0)
1344
1345
/* spu_readchcnt
 * =============
 * Not mappable to VMX: always expands to the constant 0.  The _channel
 * argument is dropped without being evaluated.
 */
#define spu_readchcnt(_channel) (0)
1350
1351
/* spu_readchqw
 * ============
 * Placeholder: a statement expression that yields an all-zero vec_uint4.
 * The _channel argument is dropped without being evaluated.
 */
#define spu_readchqw(_channel)                                  \
  __extension__ ({                                              \
    vec_uint4 result = { 0, 0, 0, 0 };                          \
    result;                                                     \
  })
1356
1357 /* spu_rl
1358  * ======
1359  */
1360 static __inline vec_ushort8 spu_rl(vec_ushort8 a, vec_short8 b)
1361 {
1362   return ((vec_ushort8)(si_roth((qword)(a), (qword)(b))));
1363 }
1364
1365 static __inline vec_short8 spu_rl(vec_short8 a, vec_short8 b)
1366 {
1367   return ((vec_short8)(si_roth((qword)(a), (qword)(b))));
1368 }
1369
1370 static __inline vec_uint4 spu_rl(vec_uint4 a, vec_int4 b)
1371 {
1372   return ((vec_uint4)(si_rot((qword)(a), (qword)(b))));
1373 }
1374
1375 static __inline vec_int4 spu_rl(vec_int4 a, vec_int4 b)
1376 {
1377   return ((vec_int4)(si_rot((qword)(a), (qword)(b))));
1378 }
1379
1380 static __inline vec_ushort8 spu_rl(vec_ushort8 a, int b)
1381 {
1382   return ((vec_ushort8)(si_rothi((qword)(a), b)));
1383 }
1384
1385 static __inline vec_short8 spu_rl(vec_short8 a, int b)
1386 {
1387   return ((vec_short8)(si_rothi((qword)(a), b)));
1388 }
1389
1390 static __inline vec_uint4 spu_rl(vec_uint4 a, int b)
1391 {
1392   return ((vec_uint4)(si_roti((qword)(a), b)));
1393 }
1394
1395 static __inline vec_int4 spu_rl(vec_int4 a, int b)
1396 {
1397   return ((vec_int4)(si_roti((qword)(a), b)));
1398 }
1399
1400
1401 /* spu_rlmask
1402  * ==========
1403  */
1404 static __inline vec_ushort8 spu_rlmask(vec_ushort8 a, vec_short8 b)
1405 {
1406   return ((vec_ushort8)(si_rothm((qword)(a), (qword)(b))));
1407 }
1408
1409 static __inline vec_short8 spu_rlmask(vec_short8 a, vec_short8 b)
1410 {
1411   return ((vec_short8)(si_rothm((qword)(a), (qword)(b))));
1412 }
1413
1414 static __inline vec_uint4 spu_rlmask(vec_uint4 a, vec_int4 b)
1415 {
1416   return ((vec_uint4)(si_rotm((qword)(a), (qword)(b))));
1417 }
1418
1419 static __inline vec_int4 spu_rlmask(vec_int4 a, vec_int4 b)
1420 {
1421   return ((vec_int4)(si_rotm((qword)(a), (qword)(b))));
1422 }
1423
1424 static __inline vec_ushort8 spu_rlmask(vec_ushort8 a, int b)
1425 {
1426   return ((vec_ushort8)(si_rothmi((qword)(a), b)));
1427 }
1428
1429 static __inline vec_short8 spu_rlmask(vec_short8 a, int b)
1430 {
1431   return ((vec_short8)(si_rothmi((qword)(a), b)));
1432 }
1433
1434
1435 static __inline vec_uint4 spu_rlmask(vec_uint4 a, int b)
1436 {
1437   return ((vec_uint4)(si_rotmi((qword)(a), b)));
1438 }
1439
1440 static __inline vec_int4 spu_rlmask(vec_int4 a, int b)
1441 {
1442   return ((vec_int4)(si_rotmi((qword)(a), b)));
1443 }
1444
1445 /* spu_rlmaska
1446  * ===========
1447  */
1448 static __inline vec_short8 spu_rlmaska(vec_short8 a, vec_short8 b)
1449 {
1450   return ((vec_short8)(si_rotmah((qword)(a), (qword)(b))));
1451 }
1452
1453 static __inline vec_ushort8 spu_rlmaska(vec_ushort8 a, vec_short8 b)
1454 {
1455   return ((vec_ushort8)(si_rotmah((qword)(a), (qword)(b))));
1456 }
1457
1458
1459 static __inline vec_int4 spu_rlmaska(vec_int4 a, vec_int4 b)
1460 {
1461   return ((vec_int4)(si_rotma((qword)(a), (qword)(b))));
1462 }
1463
1464 static __inline vec_uint4 spu_rlmaska(vec_uint4 a, vec_int4 b)
1465 {
1466   return ((vec_uint4)(si_rotma((qword)(a), (qword)(b))));
1467 }
1468
1469 static __inline vec_ushort8 spu_rlmaska(vec_ushort8 a, int b)
1470 {
1471   return ((vec_ushort8)(si_rotmahi((qword)(a), b)));
1472 }
1473
1474 static __inline vec_short8 spu_rlmaska(vec_short8 a, int b)
1475 {
1476   return ((vec_short8)(si_rotmahi((qword)(a), b)));
1477 }
1478
1479 static __inline vec_uint4 spu_rlmaska(vec_uint4 a, int b)
1480 {
1481   return ((vec_uint4)(si_rotmai((qword)(a), b)));
1482 }
1483
1484 static __inline vec_int4 spu_rlmaska(vec_int4 a, int b)
1485 {
1486   return ((vec_int4)(si_rotmai((qword)(a), b)));
1487 }
1488
1489
1490 /* spu_rlmaskqw
1491  * ============
1492  */
1493 static __inline vec_uchar16 spu_rlmaskqw(vec_uchar16 a, int count)
1494 {
1495   return ((vec_uchar16)(si_rotqmbi((qword)(a), si_from_int(count))));
1496 }
1497
1498 static __inline vec_char16 spu_rlmaskqw(vec_char16 a, int count)
1499 {
1500   return ((vec_char16)(si_rotqmbi((qword)(a), si_from_int(count))));
1501 }
1502
1503 static __inline vec_ushort8 spu_rlmaskqw(vec_ushort8 a, int count)
1504 {
1505   return ((vec_ushort8)(si_rotqmbi((qword)(a), si_from_int(count))));
1506 }
1507
1508 static __inline vec_short8 spu_rlmaskqw(vec_short8 a, int count)
1509 {
1510   return ((vec_short8)(si_rotqmbi((qword)(a), si_from_int(count))));
1511 }
1512
1513 static __inline vec_uint4 spu_rlmaskqw(vec_uint4 a, int count)
1514 {
1515   return ((vec_uint4)(si_rotqmbi((qword)(a), si_from_int(count))));
1516 }
1517
1518 static __inline vec_int4 spu_rlmaskqw(vec_int4 a, int count)
1519 {
1520   return ((vec_int4)(si_rotqmbi((qword)(a), si_from_int(count))));
1521 }
1522
1523 static __inline vec_float4 spu_rlmaskqw(vec_float4 a, int count)
1524 {
1525   return ((vec_float4)(si_rotqmbi((qword)(a), si_from_int(count))));
1526 }
1527
1528 static __inline vec_ullong2 spu_rlmaskqw(vec_ullong2 a, int count)
1529 {
1530   return ((vec_ullong2)(si_rotqmbi((qword)(a), si_from_int(count))));
1531 }
1532
1533 static __inline vec_llong2 spu_rlmaskqw(vec_llong2 a, int count)
1534 {
1535   return ((vec_llong2)(si_rotqmbi((qword)(a), si_from_int(count))));
1536 }
1537
1538 static __inline vec_double2 spu_rlmaskqw(vec_double2 a, int count)
1539 {
1540   return ((vec_double2)(si_rotqmbi((qword)(a), si_from_int(count))));
1541 }
1542
1543 /* spu_rlmaskqwbyte
1544  * ================
1545  */
1546 static __inline vec_uchar16 spu_rlmaskqwbyte(vec_uchar16 a, int count)
1547 {
1548   return ((vec_uchar16)(si_rotqmby((qword)(a), si_from_int(count))));
1549 }
1550
1551 static __inline vec_char16 spu_rlmaskqwbyte(vec_char16 a, int count)
1552 {
1553   return ((vec_char16)(si_rotqmby((qword)(a), si_from_int(count))));
1554 }
1555
1556 static __inline vec_ushort8 spu_rlmaskqwbyte(vec_ushort8 a, int count)
1557 {
1558   return ((vec_ushort8)(si_rotqmby((qword)(a), si_from_int(count))));
1559 }
1560
1561 static __inline vec_short8 spu_rlmaskqwbyte(vec_short8 a, int count)
1562 {
1563   return ((vec_short8)(si_rotqmby((qword)(a), si_from_int(count))));
1564 }
1565
1566 static __inline vec_uint4 spu_rlmaskqwbyte(vec_uint4 a, int count)
1567 {
1568   return ((vec_uint4)(si_rotqmby((qword)(a), si_from_int(count))));
1569 }
1570
1571 static __inline vec_int4 spu_rlmaskqwbyte(vec_int4 a, int count)
1572 {
1573   return ((vec_int4)(si_rotqmby((qword)(a), si_from_int(count))));
1574 }
1575
1576 static __inline vec_float4 spu_rlmaskqwbyte(vec_float4 a, int count)
1577 {
1578   return ((vec_float4)(si_rotqmby((qword)(a), si_from_int(count))));
1579 }
1580
1581 static __inline vec_ullong2 spu_rlmaskqwbyte(vec_ullong2 a, int count)
1582 {
1583   return ((vec_ullong2)(si_rotqmby((qword)(a), si_from_int(count))));
1584 }
1585
1586 static __inline vec_llong2 spu_rlmaskqwbyte(vec_llong2 a, int count)
1587 {
1588   return ((vec_llong2)(si_rotqmby((qword)(a), si_from_int(count))));
1589 }
1590
1591 static __inline vec_double2 spu_rlmaskqwbyte(vec_double2 a, int count)
1592 {
1593   return ((vec_double2)(si_rotqmby((qword)(a), si_from_int(count))));
1594 }
1595
1596 /* spu_rlmaskqwbytebc
1597  * ==================
1598  */
1599 static __inline vec_uchar16 spu_rlmaskqwbytebc(vec_uchar16 a, int count)
1600 {
1601   return ((vec_uchar16)(si_rotqmbybi((qword)(a), si_from_int(count))));
1602 }
1603
1604 static __inline vec_char16 spu_rlmaskqwbytebc(vec_char16 a, int count)
1605 {
1606   return ((vec_char16)(si_rotqmbybi((qword)(a), si_from_int(count))));
1607 }
1608
1609 static __inline vec_ushort8 spu_rlmaskqwbytebc(vec_ushort8 a, int count)
1610 {
1611   return ((vec_ushort8)(si_rotqmbybi((qword)(a), si_from_int(count))));
1612 }
1613
1614 static __inline vec_short8 spu_rlmaskqwbytebc(vec_short8 a, int count)
1615 {
1616   return ((vec_short8)(si_rotqmbybi((qword)(a), si_from_int(count))));
1617 }
1618
1619 static __inline vec_uint4 spu_rlmaskqwbytebc(vec_uint4 a, int count)
1620 {
1621   return ((vec_uint4)(si_rotqmbybi((qword)(a), si_from_int(count))));
1622 }
1623
1624 static __inline vec_int4 spu_rlmaskqwbytebc(vec_int4 a, int count)
1625 {
1626   return ((vec_int4)(si_rotqmbybi((qword)(a), si_from_int(count))));
1627 }
1628
1629 static __inline vec_float4 spu_rlmaskqwbytebc(vec_float4 a, int count)
1630 {
1631   return ((vec_float4)(si_rotqmbybi((qword)(a), si_from_int(count))));
1632 }
1633
1634 static __inline vec_ullong2 spu_rlmaskqwbytebc(vec_ullong2 a, int count)
1635 {
1636   return ((vec_ullong2)(si_rotqmbybi((qword)(a), si_from_int(count))));
1637 }
1638
1639 static __inline vec_llong2 spu_rlmaskqwbytebc(vec_llong2 a, int count)
1640 {
1641   return ((vec_llong2)(si_rotqmbybi((qword)(a), si_from_int(count))));
1642 }
1643
1644 static __inline vec_double2 spu_rlmaskqwbytebc(vec_double2 a, int count)
1645 {
1646   return ((vec_double2)(si_rotqmbybi((qword)(a), si_from_int(count))));
1647 }
1648
1649
1650 /* spu_rlqwbyte
1651  * ============
1652  */
1653 static __inline vec_uchar16 spu_rlqwbyte(vec_uchar16 a, int count)
1654 {
1655   return ((vec_uchar16)(si_rotqby((qword)(a), si_from_int(count))));
1656 }
1657
1658 static __inline vec_char16 spu_rlqwbyte(vec_char16 a, int count)
1659 {
1660   return ((vec_char16)(si_rotqby((qword)(a), si_from_int(count))));
1661 }
1662
1663 static __inline vec_ushort8 spu_rlqwbyte(vec_ushort8 a, int count)
1664 {
1665   return ((vec_ushort8)(si_rotqby((qword)(a), si_from_int(count))));
1666 }
1667
1668 static __inline vec_short8 spu_rlqwbyte(vec_short8 a, int count)
1669 {
1670   return ((vec_short8)(si_rotqby((qword)(a), si_from_int(count))));
1671 }
1672
1673 static __inline vec_uint4 spu_rlqwbyte(vec_uint4 a, int count)
1674 {
1675   return ((vec_uint4)(si_rotqby((qword)(a), si_from_int(count))));
1676 }
1677
1678 static __inline vec_int4 spu_rlqwbyte(vec_int4 a, int count)
1679 {
1680   return ((vec_int4)(si_rotqby((qword)(a), si_from_int(count))));
1681 }
1682
1683 static __inline vec_float4 spu_rlqwbyte(vec_float4 a, int count)
1684 {
1685   return ((vec_float4)(si_rotqby((qword)(a), si_from_int(count))));
1686 }
1687
1688 static __inline vec_ullong2 spu_rlqwbyte(vec_ullong2 a, int count)
1689 {
1690   return ((vec_ullong2)(si_rotqby((qword)(a), si_from_int(count))));
1691 }
1692
1693 static __inline vec_llong2 spu_rlqwbyte(vec_llong2 a, int count)
1694 {
1695   return ((vec_llong2)(si_rotqby((qword)(a), si_from_int(count))));
1696 }
1697
1698 static __inline vec_double2 spu_rlqwbyte(vec_double2 a, int count)
1699 {
1700   return ((vec_double2)(si_rotqby((qword)(a), si_from_int(count))));
1701 }
1702
1703
1704 /* spu_rlqwbytebc
1705  * ==============
1706  */
1707 static __inline vec_uchar16 spu_rlqwbytebc(vec_uchar16 a, int count)
1708 {
1709   return ((vec_uchar16)(si_rotqbybi((qword)(a), si_from_int(count))));
1710 }
1711
1712 static __inline vec_char16 spu_rlqwbytebc(vec_char16 a, int count)
1713 {
1714   return ((vec_char16)(si_rotqbybi((qword)(a), si_from_int(count))));
1715 }
1716
1717 static __inline vec_ushort8 spu_rlqwbytebc(vec_ushort8 a, int count)
1718 {
1719   return ((vec_ushort8)(si_rotqbybi((qword)(a), si_from_int(count))));
1720 }
1721
1722 static __inline vec_short8 spu_rlqwbytebc(vec_short8 a, int count)
1723 {
1724   return ((vec_short8)(si_rotqbybi((qword)(a), si_from_int(count))));
1725 }
1726
1727 static __inline vec_uint4 spu_rlqwbytebc(vec_uint4 a, int count)
1728 {
1729   return ((vec_uint4)(si_rotqbybi((qword)(a), si_from_int(count))));
1730 }
1731
1732 static __inline vec_int4 spu_rlqwbytebc(vec_int4 a, int count)
1733 {
1734   return ((vec_int4)(si_rotqbybi((qword)(a), si_from_int(count))));
1735 }
1736
1737 static __inline vec_float4 spu_rlqwbytebc(vec_float4 a, int count)
1738 {
1739   return ((vec_float4)(si_rotqbybi((qword)(a), si_from_int(count))));
1740 }
1741
1742 static __inline vec_ullong2 spu_rlqwbytebc(vec_ullong2 a, int count)
1743 {
1744   return ((vec_ullong2)(si_rotqbybi((qword)(a), si_from_int(count))));
1745 }
1746
1747 static __inline vec_llong2 spu_rlqwbytebc(vec_llong2 a, int count)
1748 {
1749   return ((vec_llong2)(si_rotqbybi((qword)(a), si_from_int(count))));
1750 }
1751
1752 static __inline vec_double2 spu_rlqwbytebc(vec_double2 a, int count)
1753 {
1754   return ((vec_double2)(si_rotqbybi((qword)(a), si_from_int(count))));
1755 }
1756
1757 /* spu_rlqw
1758  * ========
1759  */
1760 static __inline vec_uchar16 spu_rlqw(vec_uchar16 a, int count)
1761 {
1762   return ((vec_uchar16)(si_rotqbi((qword)(a), si_from_int(count))));
1763 }
1764
1765 static __inline vec_char16 spu_rlqw(vec_char16 a, int count)
1766 {
1767   return ((vec_char16)(si_rotqbi((qword)(a), si_from_int(count))));
1768 }
1769
1770 static __inline vec_ushort8 spu_rlqw(vec_ushort8 a, int count)
1771 {
1772   return ((vec_ushort8)(si_rotqbi((qword)(a), si_from_int(count))));
1773 }
1774
1775 static __inline vec_short8 spu_rlqw(vec_short8 a, int count)
1776 {
1777   return ((vec_short8)(si_rotqbi((qword)(a), si_from_int(count))));
1778 }
1779
1780 static __inline vec_uint4 spu_rlqw(vec_uint4 a, int count)
1781 {
1782   return ((vec_uint4)(si_rotqbi((qword)(a), si_from_int(count))));
1783 }
1784
1785 static __inline vec_int4 spu_rlqw(vec_int4 a, int count)
1786 {
1787   return ((vec_int4)(si_rotqbi((qword)(a), si_from_int(count))));
1788 }
1789
1790 static __inline vec_float4 spu_rlqw(vec_float4 a, int count)
1791 {
1792   return ((vec_float4)(si_rotqbi((qword)(a), si_from_int(count))));
1793 }
1794
1795 static __inline vec_ullong2 spu_rlqw(vec_ullong2 a, int count)
1796 {
1797   return ((vec_ullong2)(si_rotqbi((qword)(a), si_from_int(count))));
1798 }
1799
1800 static __inline vec_llong2 spu_rlqw(vec_llong2 a, int count)
1801 {
1802   return ((vec_llong2)(si_rotqbi((qword)(a), si_from_int(count))));
1803 }
1804
1805 static __inline vec_double2 spu_rlqw(vec_double2 a, int count)
1806 {
1807   return ((vec_double2)(si_rotqbi((qword)(a), si_from_int(count))));
1808 }
1809
1810 /* spu_roundtf
1811  * ===========
1812  */
1813 static __inline vec_float4 spu_roundtf(vec_double2 a)
1814 {
1815   return ((vec_float4)(si_frds((qword)(a))));
1816 }
1817
1818
/* spu_rsqrte
 * ==========
 * Forwarded unchanged to the VMX vec_rsqrte intrinsic.
 */
#define spu_rsqrte(_a)  vec_rsqrte(_a)
1823
1824
1825 /* spu_sel
1826  * =======
1827  */
1828 static __inline vec_uchar16 spu_sel(vec_uchar16 a, vec_uchar16 b, vec_uchar16 pattern)
1829 {
1830   return ((vec_uchar16)(si_selb((qword)(a), (qword)(b), (qword)(pattern))));
1831 }
1832
1833 static __inline vec_char16 spu_sel(vec_char16 a, vec_char16 b, vec_uchar16 pattern)
1834 {
1835   return ((vec_char16)(si_selb((qword)(a), (qword)(b), (qword)(pattern))));
1836 }
1837
1838 static __inline vec_ushort8 spu_sel(vec_ushort8 a, vec_ushort8 b, vec_ushort8 pattern)
1839 {
1840   return ((vec_ushort8)(si_selb((qword)(a), (qword)(b), (qword)(pattern))));
1841 }
1842
1843 static __inline vec_short8 spu_sel(vec_short8 a, vec_short8 b, vec_ushort8 pattern)
1844 {
1845   return ((vec_short8)(si_selb((qword)(a), (qword)(b), (qword)(pattern))));
1846 }
1847
1848 static __inline vec_uint4 spu_sel(vec_uint4 a, vec_uint4 b, vec_uint4 pattern)
1849 {
1850   return ((vec_uint4)(si_selb((qword)(a), (qword)(b), (qword)(pattern))));
1851 }
1852
1853 static __inline vec_int4 spu_sel(vec_int4 a, vec_int4 b, vec_uint4 pattern)
1854 {
1855   return ((vec_int4)(si_selb((qword)(a), (qword)(b), (qword)(pattern))));
1856 }
1857
1858 static __inline vec_float4 spu_sel(vec_float4 a, vec_float4 b, vec_uint4 pattern)
1859 {
1860   return ((vec_float4)(si_selb((qword)(a), (qword)(b), (qword)(pattern))));
1861 }
1862
1863 static __inline vec_ullong2 spu_sel(vec_ullong2 a, vec_ullong2 b, vec_ullong2 pattern)
1864 {
1865   return ((vec_ullong2)(si_selb((qword)(a), (qword)(b), (qword)(pattern))));
1866 }
1867
1868 static __inline vec_llong2 spu_sel(vec_llong2 a, vec_llong2 b, vec_ullong2 pattern)
1869 {
1870   return ((vec_llong2)(si_selb((qword)(a), (qword)(b), (qword)(pattern))));
1871 }
1872
1873 static __inline vec_double2 spu_sel(vec_double2 a, vec_double2 b, vec_ullong2 pattern)
1874 {
1875   return ((vec_double2)(si_selb((qword)(a), (qword)(b), (qword)(pattern))));
1876 }
1877
1878
1879
1880 /* spu_shuffle
1881  * ===========
1882  */
1883 static __inline vec_uchar16 spu_shuffle(vec_uchar16 a, vec_uchar16 b, vec_uchar16 pattern)
1884 {
1885   return ((vec_uchar16)(si_shufb((qword)(a), (qword)(b), (qword)(pattern))));
1886 }
1887
1888 static __inline vec_char16 spu_shuffle(vec_char16 a, vec_char16 b, vec_uchar16 pattern)
1889 {
1890   return ((vec_char16)(si_shufb((qword)(a), (qword)(b), (qword)(pattern))));
1891 }
1892
1893 static __inline vec_ushort8 spu_shuffle(vec_ushort8 a, vec_ushort8 b, vec_uchar16 pattern)
1894 {
1895   return ((vec_ushort8)(si_shufb((qword)(a), (qword)(b), (qword)(pattern))));
1896 }
1897
1898 static __inline vec_short8 spu_shuffle(vec_short8 a, vec_short8 b, vec_uchar16 pattern)
1899 {
1900   return ((vec_short8)(si_shufb((qword)(a), (qword)(b), (qword)(pattern))));
1901 }
1902
1903 static __inline vec_uint4 spu_shuffle(vec_uint4 a, vec_uint4 b, vec_uchar16 pattern)
1904 {
1905   return ((vec_uint4)(si_shufb((qword)(a), (qword)(b), (qword)(pattern))));
1906 }
1907
1908 static __inline vec_int4 spu_shuffle(vec_int4 a, vec_int4 b, vec_uchar16 pattern)
1909 {
1910   return ((vec_int4)(si_shufb((qword)(a), (qword)(b), (qword)(pattern))));
1911 }
1912
1913 static __inline vec_float4 spu_shuffle(vec_float4 a, vec_float4 b, vec_uchar16 pattern)
1914 {
1915   return ((vec_float4)(si_shufb((qword)(a), (qword)(b), (qword)(pattern))));
1916 }
1917
1918 static __inline vec_ullong2 spu_shuffle(vec_ullong2 a, vec_ullong2 b, vec_uchar16 pattern)
1919 {
1920   return ((vec_ullong2)(si_shufb((qword)(a), (qword)(b), (qword)(pattern))));
1921 }
1922
1923 static __inline vec_llong2 spu_shuffle(vec_llong2 a, vec_llong2 b, vec_uchar16 pattern)
1924 {
1925   return ((vec_llong2)(si_shufb((qword)(a), (qword)(b), (qword)(pattern))));
1926 }
1927
1928 static __inline vec_double2 spu_shuffle(vec_double2 a, vec_double2 b, vec_uchar16 pattern)
1929 {
1930   return ((vec_double2)(si_shufb((qword)(a), (qword)(b), (qword)(pattern))));
1931 }
1932
1933
1934 /* spu_sl
1935  * ======
1936  */
1937 static __inline vec_ushort8 spu_sl(vec_ushort8 a, vec_ushort8 b)
1938 {
1939   return ((vec_ushort8)(si_shlh((qword)(a), (qword)(b))));
1940 }
1941
1942 static __inline vec_short8 spu_sl(vec_short8 a, vec_ushort8 b)
1943 {
1944   return ((vec_short8)(si_shlh((qword)(a), (qword)(b))));
1945 }
1946
1947 static __inline vec_uint4 spu_sl(vec_uint4 a, vec_uint4 b)
1948 {
1949   return ((vec_uint4)(si_shl((qword)(a), (qword)(b))));
1950 }
1951
1952 static __inline vec_int4 spu_sl(vec_int4 a, vec_uint4 b)
1953 {
1954   return ((vec_int4)(si_shl((qword)(a), (qword)(b))));
1955 }
1956
1957 static __inline vec_ushort8 spu_sl(vec_ushort8 a, unsigned int b)
1958 {
1959   return ((vec_ushort8)(si_shlhi((qword)(a), b)));
1960 }
1961
1962 static __inline vec_short8 spu_sl(vec_short8 a, unsigned int b)
1963 {
1964   return ((vec_short8)(si_shlhi((qword)(a), b)));
1965 }
1966
1967 static __inline vec_uint4 spu_sl(vec_uint4 a, unsigned int b)
1968 {
1969   return ((vec_uint4)(si_shli((qword)(a), b)));
1970 }
1971
1972 static __inline vec_int4 spu_sl(vec_int4 a, unsigned int b)
1973 {
1974   return ((vec_int4)(si_shli((qword)(a), b)));
1975 }
1976
1977
1978 /* spu_slqw
1979  * ========
1980  */
1981 static __inline vec_uchar16 spu_slqw(vec_uchar16 a, unsigned int count)
1982 {
1983   return ((vec_uchar16)(si_shlqbi((qword)(a), si_from_uint(count))));
1984 }
1985
1986 static __inline vec_char16 spu_slqw(vec_char16 a, unsigned int count)
1987 {
1988   return ((vec_char16)(si_shlqbi((qword)(a), si_from_uint(count))));
1989 }
1990
1991 static __inline vec_ushort8 spu_slqw(vec_ushort8 a, unsigned int count)
1992 {
1993   return ((vec_ushort8)(si_shlqbi((qword)(a), si_from_uint(count))));
1994 }
1995
1996 static __inline vec_short8 spu_slqw(vec_short8 a, unsigned int count)
1997 {
1998   return ((vec_short8)(si_shlqbi((qword)(a), si_from_uint(count))));
1999 }
2000
2001 static __inline vec_uint4 spu_slqw(vec_uint4 a, unsigned int count)
2002 {
2003   return ((vec_uint4)(si_shlqbi((qword)(a), si_from_uint(count))));
2004 }
2005
2006 static __inline vec_int4 spu_slqw(vec_int4 a, unsigned int count)
2007 {
2008   return ((vec_int4)(si_shlqbi((qword)(a), si_from_uint(count))));
2009 }
2010
2011 static __inline vec_float4 spu_slqw(vec_float4 a, unsigned int count)
2012 {
2013   return ((vec_float4)(si_shlqbi((qword)(a), si_from_uint(count))));
2014 }
2015
2016 static __inline vec_ullong2 spu_slqw(vec_ullong2 a, unsigned int count)
2017 {
2018   return ((vec_ullong2)(si_shlqbi((qword)(a), si_from_uint(count))));
2019 }
2020
2021 static __inline vec_llong2 spu_slqw(vec_llong2 a, unsigned int count)
2022 {
2023   return ((vec_llong2)(si_shlqbi((qword)(a), si_from_uint(count))));
2024 }
2025
2026 static __inline vec_double2 spu_slqw(vec_double2 a, unsigned int count)
2027 {
2028   return ((vec_double2)(si_shlqbi((qword)(a), si_from_uint(count))));
2029 }
2030
2031 /* spu_slqwbyte
2032  * ============
2033  */
2034 static __inline vec_uchar16 spu_slqwbyte(vec_uchar16 a, unsigned int count)
2035 {
2036   return ((vec_uchar16)(si_shlqby((qword)(a), si_from_uint(count))));
2037 }
2038
2039 static __inline vec_char16 spu_slqwbyte(vec_char16 a, unsigned int count)
2040 {
2041   return ((vec_char16)(si_shlqby((qword)(a), si_from_uint(count))));
2042 }
2043
2044 static __inline vec_ushort8 spu_slqwbyte(vec_ushort8 a, unsigned int count)
2045 {
2046   return ((vec_ushort8)(si_shlqby((qword)(a), si_from_uint(count))));
2047 }
2048
2049 static __inline vec_short8 spu_slqwbyte(vec_short8 a, unsigned int count)
2050 {
2051   return ((vec_short8)(si_shlqby((qword)(a), si_from_uint(count))));
2052 }
2053
2054 static __inline vec_uint4 spu_slqwbyte(vec_uint4 a, unsigned int count)
2055 {
2056   return ((vec_uint4)(si_shlqby((qword)(a), si_from_uint(count))));
2057 }
2058
2059 static __inline vec_int4 spu_slqwbyte(vec_int4 a, unsigned int count)
2060 {
2061   return ((vec_int4)(si_shlqby((qword)(a), si_from_uint(count))));
2062 }
2063
2064 static __inline vec_float4 spu_slqwbyte(vec_float4 a, unsigned int count)
2065 {
2066   return ((vec_float4)(si_shlqby((qword)(a), si_from_uint(count))));
2067 }
2068
2069 static __inline vec_ullong2 spu_slqwbyte(vec_ullong2 a, unsigned int count)
2070 {
2071   return ((vec_ullong2)(si_shlqby((qword)(a), si_from_uint(count))));
2072 }
2073
2074 static __inline vec_llong2 spu_slqwbyte(vec_llong2 a, unsigned int count)
2075 {
2076   return ((vec_llong2)(si_shlqby((qword)(a), si_from_uint(count))));
2077 }
2078
2079 static __inline vec_double2 spu_slqwbyte(vec_double2 a, unsigned int count)
2080 {
2081   return ((vec_double2)(si_shlqby((qword)(a), si_from_uint(count))));
2082 }
2083
2084 /* spu_slqwbytebc
2085  * ==============
2086  */
2087 static __inline vec_uchar16 spu_slqwbytebc(vec_uchar16 a, unsigned int count)
2088 {
2089   return ((vec_uchar16)(si_shlqbybi((qword)(a), si_from_uint(count))));
2090 }
2091
2092 static __inline vec_char16 spu_slqwbytebc(vec_char16 a, unsigned int count)
2093 {
2094   return ((vec_char16)(si_shlqbybi((qword)(a), si_from_uint(count))));
2095 }
2096
2097 static __inline vec_ushort8 spu_slqwbytebc(vec_ushort8 a, unsigned int count)
2098 {
2099   return ((vec_ushort8)(si_shlqbybi((qword)(a), si_from_uint(count))));
2100 }
2101
2102 static __inline vec_short8 spu_slqwbytebc(vec_short8 a, unsigned int count)
2103 {
2104   return ((vec_short8)(si_shlqbybi((qword)(a), si_from_uint(count))));
2105 }
2106
2107 static __inline vec_uint4 spu_slqwbytebc(vec_uint4 a, unsigned int count)
2108 {
2109   return ((vec_uint4)(si_shlqbybi((qword)(a), si_from_uint(count))));
2110 }
2111
2112 static __inline vec_int4 spu_slqwbytebc(vec_int4 a, unsigned int count)
2113 {
2114   return ((vec_int4)(si_shlqbybi((qword)(a), si_from_uint(count))));
2115 }
2116
2117 static __inline vec_float4 spu_slqwbytebc(vec_float4 a, unsigned int count)
2118 {
2119   return ((vec_float4)(si_shlqbybi((qword)(a), si_from_uint(count))));
2120 }
2121
2122 static __inline vec_ullong2 spu_slqwbytebc(vec_ullong2 a, unsigned int count)
2123 {
2124   return ((vec_ullong2)(si_shlqbybi((qword)(a), si_from_uint(count))));
2125 }
2126
2127 static __inline vec_llong2 spu_slqwbytebc(vec_llong2 a, unsigned int count)
2128 {
2129   return ((vec_llong2)(si_shlqbybi((qword)(a), si_from_uint(count))));
2130 }
2131
2132 static __inline vec_double2 spu_slqwbytebc(vec_double2 a, unsigned int count)
2133 {
2134   return ((vec_double2)(si_shlqbybi((qword)(a), si_from_uint(count))));
2135 }
2136
2137 /* spu_splats
2138  * ==========
2139  */
2140 static __inline vec_uchar16 spu_splats(unsigned char a)
2141 {
2142   union {
2143     vec_uchar16 v;
2144     unsigned char c[16];
2145   } in;
2146
2147   in.c[0] = a;
2148   return (vec_splat(in.v, 0));
2149 }
2150
2151 static __inline vec_char16 spu_splats(signed char a)
2152 {
2153   return ((vec_char16)spu_splats((unsigned char)(a)));
2154 }
2155
2156 static __inline vec_ushort8 spu_splats(unsigned short a)
2157 {
2158   union {
2159     vec_ushort8 v;
2160     unsigned short s[8];
2161   } in;
2162
2163   in.s[0] = a;
2164   return (vec_splat(in.v, 0));
2165 }
2166
2167 static __inline vec_short8 spu_splats(signed short a)
2168 {
2169   return ((vec_short8)spu_splats((unsigned short)(a)));
2170 }
2171
2172 static __inline vec_uint4 spu_splats(unsigned int a)
2173 {
2174   union {
2175     vec_uint4 v;
2176     unsigned int i[4];
2177   } in;
2178
2179   in.i[0] = a;
2180   return (vec_splat(in.v, 0));
2181 }
2182
2183 static __inline vec_int4 spu_splats(signed int a)
2184 {
2185   return ((vec_int4)spu_splats((unsigned int)(a)));
2186 }
2187
2188 static __inline vec_float4 spu_splats(float a)
2189 {
2190   union {
2191     vec_float4 v;
2192     float f[4];
2193   } in;
2194
2195   in.f[0] = a;
2196   return (vec_splat(in.v, 0));
2197 }
2198
2199 static __inline vec_ullong2 spu_splats(unsigned long long a)
2200 {
2201   union {
2202     vec_ullong2 v;
2203     unsigned long long l[2];
2204   } in;
2205
2206   in.l[0] = a;
2207   in.l[1] = a;
2208   return (in.v);
2209 }
2210
2211 static __inline vec_llong2 spu_splats(signed long long a)
2212 {
2213   return ((vec_llong2)spu_splats((unsigned long long)(a)));
2214 }
2215
2216 static __inline vec_double2 spu_splats(double a)
2217 {
2218   union {
2219     vec_double2 v;
2220     double d[2];
2221   } in;
2222
2223   in.d[0] = a;
2224   in.d[1] = a;
2225   return (in.v);
2226 }
2227
2228
/* spu_stop
 * ========
 * Forwarded unchanged to si_stop.
 */
#define spu_stop(_type)         si_stop(_type)
2233
2234
2235 /* spu_sub
2236  * =======
2237  */
2238 static __inline vec_ushort8 spu_sub(vec_ushort8 a, vec_ushort8 b)
2239 {
2240   return ((vec_ushort8)(si_sfh((qword)(b), (qword)(a))));
2241 }
2242
2243 static __inline vec_short8 spu_sub(vec_short8 a, vec_short8 b)
2244 {
2245   return ((vec_short8)(si_sfh((qword)(b), (qword)(a))));
2246 }
2247
2248 static __inline vec_uint4 spu_sub(vec_uint4 a, vec_uint4 b)
2249 {
2250   return ((vec_uint4)(si_sf((qword)(b), (qword)(a))));
2251 }
2252
2253 static __inline vec_int4 spu_sub(vec_int4 a, vec_int4 b)
2254 {
2255   return ((vec_int4)(si_sf((qword)(b), (qword)(a))));
2256 }
2257
2258 static __inline vec_float4 spu_sub(vec_float4 a, vec_float4 b)
2259 {
2260   return ((vec_float4)(si_fs((qword)(a), (qword)(b))));
2261 }
2262
2263 static __inline vec_double2 spu_sub(vec_double2 a, vec_double2 b)
2264 {
2265   return ((vec_double2)(si_dfs((qword)(a), (qword)(b))));
2266 }
2267
2268 static __inline vec_uint4 spu_sub(unsigned int a, vec_uint4 b)
2269 {
2270   return ((vec_uint4)(si_sfi((qword)b, (int)a)));
2271 }
2272
2273 static __inline vec_int4 spu_sub(signed int a, vec_int4 b)
2274 {
2275   return ((vec_int4)(si_sfi((qword)b, (int)a)));
2276 }
2277
2278 static __inline vec_ushort8 spu_sub(unsigned short a, vec_ushort8 b)
2279 {
2280   return ((vec_ushort8)(si_sfhi((qword)b, (short)a)));
2281 }
2282
2283 static __inline vec_short8 spu_sub(signed short a, vec_short8 b)
2284 {
2285   return ((vec_short8)(si_sfhi((qword)b, (short)a)));
2286 }
2287
2288 /* spu_subx
2289  * ========
2290  */
2291 static __inline vec_uint4 spu_subx(vec_uint4 a, vec_uint4 b, vec_uint4 c)
2292 {
2293   return ((vec_uint4)(si_sfx((qword)(b), (qword)(a), (qword)(c))));
2294 }
2295
2296 static __inline vec_int4 spu_subx(vec_int4 a, vec_int4 b, vec_int4 c)
2297 {
2298   return ((vec_int4)(si_sfx((qword)(b), (qword)(a), (qword)(c))));
2299 }
2300
2301 /* spu_sumb
2302  * ========
2303  */
2304 static __inline vec_ushort8 spu_sumb(vec_uchar16 a, vec_uchar16 b)
2305 {
2306   return ((vec_ushort8)(si_sumb((qword)(a), (qword)(b))));
2307 }
2308
2309
/* spu_sync
 * spu_sync_c
 * ==========
 * Both macros expand to nothing.
 */
#define spu_sync()              /* do nothing */
#define spu_sync_c()            /* do nothing */
2317
2318
/* spu_writech
 * ===========
 * Not mappable to VMX: expands to nothing, so neither argument is
 * evaluated.
 */
#define spu_writech(_channel, _a)               /* not mappable */
2323
/* spu_writechqw
 * =============
 * Not mappable to VMX: expands to nothing, so neither argument is
 * evaluated.
 */
#define spu_writechqw(_channel, _a)             /* not mappable */
2328
2329
2330 /* spu_xor
2331  * =======
2332  */
2333 static __inline vec_uchar16 spu_xor(vec_uchar16 a, vec_uchar16 b)
2334 {
2335   return ((vec_uchar16)(si_xor((qword)(a), (qword)(b))));
2336 }
2337
2338 static __inline vec_char16 spu_xor(vec_char16 a, vec_char16 b)
2339 {
2340   return ((vec_char16)(si_xor((qword)(a), (qword)(b))));
2341 }
2342
2343 static __inline vec_ushort8 spu_xor(vec_ushort8 a, vec_ushort8 b)
2344 {
2345   return ((vec_ushort8)(si_xor((qword)(a), (qword)(b))));
2346 }
2347
2348 static __inline vec_short8 spu_xor(vec_short8 a, vec_short8 b)
2349 {
2350   return ((vec_short8)(si_xor((qword)(a), (qword)(b))));
2351 }
2352
2353 static __inline vec_uint4 spu_xor(vec_uint4 a, vec_uint4 b)
2354 {
2355   return ((vec_uint4)(si_xor((qword)(a), (qword)(b))));
2356 }
2357
2358 static __inline vec_int4 spu_xor(vec_int4 a, vec_int4 b)
2359 {
2360   return ((vec_int4)(si_xor((qword)(a), (qword)(b))));
2361 }
2362
2363 static __inline vec_float4 spu_xor(vec_float4 a, vec_float4 b)
2364 {
2365   return ((vec_float4)(si_xor((qword)(a), (qword)(b))));
2366 }
2367
2368 static __inline vec_ullong2 spu_xor(vec_ullong2 a, vec_ullong2 b)
2369 {
2370   return ((vec_ullong2)(si_xor((qword)(a), (qword)(b))));
2371 }
2372
2373 static __inline vec_llong2 spu_xor(vec_llong2 a, vec_llong2 b)
2374 {
2375   return ((vec_llong2)(si_xor((qword)(a), (qword)(b))));
2376 }
2377
2378 static __inline vec_double2 spu_xor(vec_double2 a, vec_double2 b)
2379 {
2380   return ((vec_double2)(si_xor((qword)(a), (qword)(b))));
2381 }
2382
2383 static __inline vec_uchar16 spu_xor(vec_uchar16 a, unsigned char b)
2384 {
2385   return ((vec_uchar16)(si_xorbi((qword)(a), b)));
2386 }
2387
2388 static __inline vec_char16 spu_xor(vec_char16 a, signed char b)
2389 {
2390   return ((vec_char16)(si_xorbi((qword)(a), (unsigned char)(b))));
2391 }
2392
2393 static __inline vec_ushort8 spu_xor(vec_ushort8 a, unsigned short b)
2394 {
2395   return ((vec_ushort8)(si_xorhi((qword)(a), b)));
2396 }
2397
2398 static __inline vec_short8 spu_xor(vec_short8 a, signed short b)
2399 {
2400   return ((vec_short8)(si_xorhi((qword)(a), (unsigned short)(b))));
2401 }
2402
2403 static __inline vec_uint4 spu_xor(vec_uint4 a, unsigned int b)
2404 {
2405   return ((vec_uint4)(si_xori((qword)(a), b)));
2406 }
2407
2408 static __inline vec_int4 spu_xor(vec_int4 a, signed int b)
2409 {
2410   return ((vec_int4)(si_xori((qword)(a), (unsigned int)(b))));
2411 }
2412
2413 #endif /* !__SPU__ */
2414 #endif /* __cplusplus */
2415 #endif /* !_SPU2VMX_H_ */