2 /* { dg-require-effective-target sse4 } */
3 /* { dg-options "-O2 -msse4.1" } */
5 #include "sse4_1-check.h"
/* compute_mpsadbw: scalar helper that accumulates sums of absolute
   differences over bytes of V1, with offsets derived from MASK.
   NOTE(review): this listing is incomplete - the return type, the local
   declarations (ret, s, i, j, offs1, offs2), the braces and the return
   statement are not visible here, so the comments below describe only
   the statements that are shown. */
20 compute_mpsadbw (unsigned char *v1
, unsigned char *v2
, int mask
)
/* offs2 is 4 times the low two bits of MASK, i.e. 0, 4, 8 or 12.
   No visible line reads offs2; presumably it indexes V2 - TODO confirm. */
31 offs2
= 4 * (mask
& 3);
/* Four-iteration loop over i; its body is not visible in this listing.
   Presumably it fills s[] (read below) - TODO confirm. */
32 for (i
= 0; i
< 4; i
++)
/* offs1 is 4 times bit 2 of MASK, i.e. 0 or 4; it is the base index
   into V1 used by the accumulation below. */
35 offs1
= 4 * ((mask
& 4) >> 2);
/* For each of the 8 result slots j ... */
36 for (j
= 0; j
< 8; j
++)
/* ... add up four terms, one per i. */
39 for (i
= 0; i
< 4; i
++)
/* Accumulate |v1[offs1 + j + i] - s[i]| into ret.s[j].
   NOTE(review): the initial value of ret.s[j] is not set on any visible
   line; verify it is zeroed before this loop. */
40 ret
.s
[j
] += abs (v1
[offs1
+ j
+ i
] - s
[i
]);
/* Test operands. This closes a type definition whose head is not visible
   in this listing; the visible code accesses members .i (indexed 0..3),
   .x (passed to the intrinsic) and .c (passed to compute_mpsadbw).
   val3 is an array of 8 such objects. */
54 } val1
, val2
, val3
[8];
/* One mask per test iteration, read as masks[i] in the comparison loops.
   NOTE(review): no visible line stores into masks[]; confirm where it is
   filled. */
56 unsigned char masks
[8];
/* Fill the four .i elements of val1 with fixed constants. */
59 val1
.i
[0] = 0x35251505;
60 val1
.i
[1] = 0x75655545;
61 val1
.i
[2] = 0xB5A59585;
62 val1
.i
[3] = 0xF5E5D5C5;
/* Fill the four .i elements of val2 with fixed constants. */
64 val2
.i
[0] = 0x31211101;
65 val2
.i
[1] = 0x71615141;
66 val2
.i
[2] = 0xB1A19181;
67 val2
.i
[3] = 0xF1E1D1C1;
/* val3[i] receives the same four constants as val2, in reverse element
   order. The enclosing loop over i is not visible in this listing;
   presumably it runs over all 8 entries - TODO confirm. */
73 val3
[i
].i
[0] = 0xF1E1D1C1;
74 val3
[i
].i
[1] = 0xB1A19181;
75 val3
[i
].i
[2] = 0x71615141;
76 val3
[i
].i
[3] = 0x31211101;
83 /* Check mpsadbw imm8, xmm, xmm. */
/* Run the intrinsic on val1.x and val2.x once per mask constant
   msk0 .. msk7, storing each result in res[0] .. res[7]. The msk*
   names are defined outside the visible lines. The calls are written
   out one by one rather than looped; presumably because the mask
   argument must be a compile-time constant - TODO confirm. */
84 res
[0] = _mm_mpsadbw_epu8 (val1
.x
, val2
.x
, msk0
);
85 res
[1] = _mm_mpsadbw_epu8 (val1
.x
, val2
.x
, msk1
);
86 res
[2] = _mm_mpsadbw_epu8 (val1
.x
, val2
.x
, msk2
);
87 res
[3] = _mm_mpsadbw_epu8 (val1
.x
, val2
.x
, msk3
);
88 res
[4] = _mm_mpsadbw_epu8 (val1
.x
, val2
.x
, msk4
);
89 res
[5] = _mm_mpsadbw_epu8 (val1
.x
, val2
.x
, msk5
);
90 res
[6] = _mm_mpsadbw_epu8 (val1
.x
, val2
.x
, msk6
);
91 res
[7] = _mm_mpsadbw_epu8 (val1
.x
, val2
.x
, msk7
);
/* Compare each intrinsic result against the scalar reference. */
102 for (i
=0; i
< 8; i
++)
/* Reference value for this iteration, using masks[i].
   NOTE(review): for the comparison to be meaningful masks[i] must hold
   the same value as the msk<i> constant used for res[i]; the statements
   that set masks[] are not visible here - confirm. */
104 tmp
= compute_mpsadbw (val1
.c
, val2
.c
, masks
[i
]);
/* A non-zero memcmp means the two results differ byte-wise; the action
   taken on mismatch is not visible in this listing. */
105 if (memcmp (&tmp
, &res
[i
], sizeof (tmp
)))
109 /* Check mpsadbw imm8, m128, xmm. */
/* Second pass: the second operand now comes from the val3[] array, and
   every call uses the same mask constant msk4. */
110 for (i
=0; i
< 8; i
++)
112 res
[i
] = _mm_mpsadbw_epu8 (val1
.x
, val3
[i
].x
, msk4
);
/* Compare each result against the scalar reference. */
116 for (i
=0; i
< 8; i
++)
/* NOTE(review): the reference uses masks[i] while the intrinsic above
   always uses msk4. This only matches if masks[i] was set to msk4
   beforehand; no such assignment is visible in this listing - confirm. */
118 tmp
= compute_mpsadbw (val1
.c
, val3
[i
].c
, masks
[i
]);
/* A non-zero memcmp means the two results differ byte-wise; the action
   taken on mismatch is not visible in this listing. */
119 if (memcmp (&tmp
, &res
[i
], sizeof (tmp
)))