4 * Copyright (c) 2015 Chen Gang
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2.1 of the License, or (at your option) any later version.
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, see
18 * <http://www.gnu.org/licenses/lgpl-2.1.html>
21 #include "qemu/osdep.h"
23 #include "qemu-common.h"
24 #include "exec/helper-proto.h"
/*
 * Replicate a scalar into every lane of a 64-bit vector.
 *
 * V1 keeps the low 8 bits of X and copies them into all eight byte lanes;
 * V2 keeps the low 16 bits of X and copies them into all four 16-bit lanes.
 * The multiplier has a single 1 bit at the bottom of each lane, so one
 * multiplication places the masked value in every lane at once.
 */
#define V1(X)  (0x0101010101010101ull * ((X) & 0xff))
#define V2(X)  (0x0001000100010001ull * ((X) & 0xffff))
/*
 * Multiply the eight byte lanes of a and b pairwise.
 *
 * Each lane of the result holds the low 8 bits of the product of the
 * corresponding unsigned byte lanes of the two inputs.
 */
uint64_t helper_v1multu(uint64_t a, uint64_t b)
{
    uint64_t result = 0;
    unsigned shift;

    for (shift = 0; shift < 64; shift += 8) {
        unsigned lhs = (a >> shift) & 0xff;
        unsigned rhs = (b >> shift) & 0xff;
        uint64_t product = (lhs * rhs) & 0xff;

        /* Lanes never overlap, so OR-ing into a zeroed result is enough. */
        result |= product << shift;
    }
    return result;
}
/*
 * Multiply the four 16-bit lanes of a and b pairwise.
 *
 * Each lane of the result holds the low 16 bits of the product of the
 * corresponding lanes of the two inputs.
 */
uint64_t helper_v2mults(uint64_t a, uint64_t b)
{
    uint64_t result = 0;
    unsigned shift;

    /*
     * The operation is nominally signed, but only the low 16 bits of each
     * product are kept, and those bits are the same whether the inputs are
     * treated as signed or unsigned.
     */
    for (shift = 0; shift < 64; shift += 16) {
        /* Plain unsigned operands: 0xffff * 0xffff still fits in 32 bits. */
        unsigned lhs = (a >> shift) & 0xffff;
        unsigned rhs = (b >> shift) & 0xffff;
        uint64_t product = (lhs * rhs) & 0xffff;

        result |= product << shift;
    }
    return result;
}
60 uint64_t helper_v1shl(uint64_t a
, uint64_t b
)
69 uint64_t helper_v2shl(uint64_t a
, uint64_t b
)
78 uint64_t helper_v1shru(uint64_t a
, uint64_t b
)
87 uint64_t helper_v2shru(uint64_t a
, uint64_t b
)
/*
 * Arithmetic (sign-propagating) right shift of each of the eight byte
 * lanes of a by the shift count in b.
 *
 * Only the low 3 bits of b are used, so the count is always in 0..7.
 * Without that reduction a count of 8 or more would ask for a field of
 * non-positive width inside the lane, which is not a valid bit-field
 * extraction.
 * NOTE(review): reducing the count modulo the lane width is assumed to
 * match the guest instruction - confirm against the ISA manual.
 *
 * Returns the eight shifted lanes packed back into a 64-bit value.
 */
uint64_t helper_v1shrs(uint64_t a, uint64_t b)
{
    const unsigned count = b & 7;
    /* Bits vacated at the top of a lane; empty when count is 0. */
    const unsigned sign_fill = (0xffu << (8 - count)) & 0xffu;
    uint64_t result = 0;
    unsigned shift;

    for (shift = 0; shift < 64; shift += 8) {
        unsigned lane = (a >> shift) & 0xff;
        unsigned shifted = lane >> count;

        /* Negative lane: replicate the sign bit into the vacated bits. */
        if (lane & 0x80) {
            shifted |= sign_fill;
        }
        result |= (uint64_t)shifted << shift;
    }
    return result;
}
/*
 * Arithmetic (sign-propagating) right shift of each of the four 16-bit
 * lanes of a by the shift count in b.
 *
 * Only the low 4 bits of b are used, so the count is always in 0..15.
 * Without that reduction a count of 16 or more would ask for a field of
 * non-positive width inside the lane, which is not a valid bit-field
 * extraction.
 * NOTE(review): reducing the count modulo the lane width is assumed to
 * match the guest instruction - confirm against the ISA manual.
 *
 * Returns the four shifted lanes packed back into a 64-bit value.
 */
uint64_t helper_v2shrs(uint64_t a, uint64_t b)
{
    const unsigned count = b & 15;
    /*
     * Bits vacated at the top of a lane; empty when count is 0.  The
     * constant is unsigned so that shifting it by 16 cannot overflow int.
     */
    const unsigned sign_fill = (0xffffu << (16 - count)) & 0xffffu;
    uint64_t result = 0;
    unsigned shift;

    for (shift = 0; shift < 64; shift += 16) {
        unsigned lane = (a >> shift) & 0xffff;
        unsigned shifted = lane >> count;

        /* Negative lane: replicate the sign bit into the vacated bits. */
        if (lane & 0x8000) {
            shifted |= sign_fill;
        }
        result |= (uint64_t)shifted << shift;
    }
    return result;
}
/*
 * Interleave the four high bytes (bits 32..63) of a and b.
 *
 * For each of those byte positions the byte from b goes into the even
 * result lane and the byte from a into the odd lane directly above it, so
 * the result reads, most significant byte first: a7 b7 a6 b6 a5 b5 a4 b4.
 */
uint64_t helper_v1int_h(uint64_t a, uint64_t b)
{
    uint64_t result = 0;
    unsigned n;

    for (n = 0; n < 4; n++) {
        uint64_t from_a = (a >> (32 + 8 * n)) & 0xff;
        uint64_t from_b = (b >> (32 + 8 * n)) & 0xff;

        /* Each input byte pair fills one 16-bit slot of the result. */
        result |= ((from_a << 8) | from_b) << (16 * n);
    }
    return result;
}
/*
 * Interleave the four low bytes (bits 0..31) of a and b.
 *
 * For each of those byte positions the byte from b goes into the even
 * result lane and the byte from a into the odd lane directly above it, so
 * the result reads, most significant byte first: a3 b3 a2 b2 a1 b1 a0 b0.
 */
uint64_t helper_v1int_l(uint64_t a, uint64_t b)
{
    uint64_t result = 0;
    unsigned n;

    for (n = 0; n < 4; n++) {
        uint64_t from_a = (a >> (8 * n)) & 0xff;
        uint64_t from_b = (b >> (8 * n)) & 0xff;

        /* Each input byte pair fills one 16-bit slot of the result. */
        result |= ((from_a << 8) | from_b) << (16 * n);
    }
    return result;
}
/*
 * Interleave the two high 16-bit lanes (bits 32..63) of a and b.
 *
 * For each of those lane positions the halfword from b goes into the even
 * result lane and the halfword from a into the odd lane directly above
 * it, so the result reads, most significant halfword first: a3 b3 a2 b2.
 */
uint64_t helper_v2int_h(uint64_t a, uint64_t b)
{
    uint64_t result = 0;
    unsigned n;

    for (n = 0; n < 2; n++) {
        uint64_t from_a = (a >> (32 + 16 * n)) & 0xffff;
        uint64_t from_b = (b >> (32 + 16 * n)) & 0xffff;

        /* Each input halfword pair fills one 32-bit slot of the result. */
        result |= ((from_a << 16) | from_b) << (32 * n);
    }
    return result;
}
/*
 * Interleave the two low 16-bit lanes (bits 0..31) of a and b.
 *
 * For each of those lane positions the halfword from b goes into the even
 * result lane and the halfword from a into the odd lane directly above
 * it, so the result reads, most significant halfword first: a1 b1 a0 b0.
 */
uint64_t helper_v2int_l(uint64_t a, uint64_t b)
{
    uint64_t result = 0;
    unsigned n;

    for (n = 0; n < 2; n++) {
        uint64_t from_a = (a >> (16 * n)) & 0xffff;
        uint64_t from_b = (b >> (16 * n)) & 0xffff;

        /* Each input halfword pair fills one 32-bit slot of the result. */
        result |= ((from_a << 16) | from_b) << (32 * n);
    }
    return result;
}