Merge remote-tracking branch 'remotes/jasowang/tags/net-pull-request' into staging
[qemu/ar7.git] / target / tilegx / simd_helper.c
blob0fdfad2fa9cc77c8b5f68971a69ca8efdb876a95
/*
 * QEMU TILE-Gx helpers
 *
 *  Copyright (c) 2015 Chen Gang
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, see
 * <http://www.gnu.org/licenses/lgpl-2.1.html>
 */
21 #include "qemu/osdep.h"
22 #include "cpu.h"
23 #include "exec/helper-proto.h"
/*
 * Replicate a scalar into every lane of a 64-bit vector.
 *   V1(X): the low 8 bits of X copied into each of the eight byte lanes.
 *   V2(X): the low 16 bits of X copied into each of the four halfword lanes.
 * Bits of X above the lane width are masked off before replication.
 */
#define V1(X)      (0x0101010101010101ull * ((X) & 0xff))
#define V2(X)      (0x0001000100010001ull * ((X) & 0xffff))
/*
 * Lane-wise 8-bit multiply.
 *
 * Treats a and b as eight unsigned byte lanes, multiplies matching lanes
 * and keeps only the low 8 bits of each product.
 *
 * Returns the eight truncated products packed in the same lane order.
 */
uint64_t helper_v1multu(uint64_t a, uint64_t b)
{
    uint64_t result = 0;
    unsigned shift;

    for (shift = 0; shift < 64; shift += 8) {
        unsigned lhs = (a >> shift) & 0xff;
        unsigned rhs = (b >> shift) & 0xff;

        /* Truncate the product to the lane width before placing it. */
        result |= (uint64_t)((lhs * rhs) & 0xff) << shift;
    }
    return result;
}
/*
 * Lane-wise 16-bit multiply.
 *
 * Treats a and b as four halfword lanes, multiplies matching lanes and
 * keeps only the low 16 bits of each product.
 *
 * Returns the four truncated products packed in the same lane order.
 */
uint64_t helper_v2mults(uint64_t a, uint64_t b)
{
    uint64_t result = 0;
    unsigned shift;

    /*
     * The instruction is described in terms of signed inputs, but because
     * the result is truncated to the lane width the low bits are the same
     * whether the operands are taken as signed or unsigned.
     */
    for (shift = 0; shift < 64; shift += 16) {
        unsigned lhs = (a >> shift) & 0xffff;
        unsigned rhs = (b >> shift) & 0xffff;

        result |= (uint64_t)((lhs * rhs) & 0xffff) << shift;
    }
    return result;
}
/*
 * Lane-wise 8-bit shift left.
 *
 * Every byte lane of a is shifted left by the low three bits of b.
 * Bits pushed out of the top of a lane are dropped, not carried into
 * the neighbouring lane.
 */
uint64_t helper_v1shl(uint64_t a, uint64_t b)
{
    unsigned count = b & 7;
    /* Per-lane mask of the bits that remain inside the lane after shifting. */
    uint64_t keep = (uint64_t)(0xff >> count) * 0x0101010101010101ull;

    return (a & keep) << count;
}
/*
 * Lane-wise 16-bit shift left.
 *
 * Every halfword lane of a is shifted left by the low four bits of b.
 * Bits pushed out of the top of a lane are dropped, not carried into
 * the neighbouring lane.
 */
uint64_t helper_v2shl(uint64_t a, uint64_t b)
{
    unsigned count = b & 15;
    /* Per-lane mask of the bits that remain inside the lane after shifting. */
    uint64_t keep = (uint64_t)(0xffff >> count) * 0x0001000100010001ull;

    return (a & keep) << count;
}
/*
 * Lane-wise 8-bit logical shift right.
 *
 * Every byte lane of a is shifted right by the low three bits of b, with
 * zeros entering at the top of each lane.  Bits pushed out of the bottom
 * of a lane are dropped, not carried into the lane below.
 */
uint64_t helper_v1shru(uint64_t a, uint64_t b)
{
    unsigned count = b & 7;
    /* Per-lane mask that clears the low bits about to leave the lane. */
    uint64_t keep = (uint64_t)((0xff << count) & 0xff) * 0x0101010101010101ull;

    return (a & keep) >> count;
}
/*
 * Lane-wise 16-bit logical shift right.
 *
 * Every halfword lane of a is shifted right by the low four bits of b,
 * with zeros entering at the top of each lane.  Bits pushed out of the
 * bottom of a lane are dropped, not carried into the lane below.
 */
uint64_t helper_v2shru(uint64_t a, uint64_t b)
{
    unsigned count = b & 15;
    /* Per-lane mask that clears the low bits about to leave the lane. */
    uint64_t keep = (uint64_t)((0xffff << count) & 0xffff)
                    * 0x0001000100010001ull;

    return (a & keep) >> count;
}
/*
 * Lane-wise 8-bit arithmetic shift right.
 *
 * Every byte lane of a is shifted right by the low three bits of b, with
 * the lane's own top bit replicated into the vacated positions.
 */
uint64_t helper_v1shrs(uint64_t a, uint64_t b)
{
    unsigned count = b & 7;
    uint64_t result = 0;
    unsigned shift;

    for (shift = 0; shift < 64; shift += 8) {
        /* View the lane as signed so the right shift copies its sign bit. */
        int8_t lane = (int8_t)(a >> shift);

        result |= (uint64_t)((lane >> count) & 0xff) << shift;
    }
    return result;
}
/*
 * Lane-wise 16-bit arithmetic shift right.
 *
 * Every halfword lane of a is shifted right by the low four bits of b,
 * with the lane's own top bit replicated into the vacated positions.
 */
uint64_t helper_v2shrs(uint64_t a, uint64_t b)
{
    unsigned count = b & 15;
    uint64_t result = 0;
    unsigned shift;

    for (shift = 0; shift < 64; shift += 16) {
        /* View the lane as signed so the right shift copies its sign bit. */
        int16_t lane = (int16_t)(a >> shift);

        result |= (uint64_t)((lane >> count) & 0xffff) << shift;
    }
    return result;
}
/*
 * Interleave the high four bytes of a and b.
 *
 * Bytes 4..7 of each operand are merged pairwise into the result: each
 * 16-bit slot holds a byte from a in its upper half and the matching byte
 * from b in its lower half, in the same relative order as in the sources.
 */
uint64_t helper_v1int_h(uint64_t a, uint64_t b)
{
    uint64_t hi_a = a >> 32;
    uint64_t hi_b = b >> 32;
    uint64_t result = 0;
    unsigned n;

    for (n = 0; n < 4; n++) {
        uint64_t from_a = (hi_a >> (8 * n)) & 0xff;
        uint64_t from_b = (hi_b >> (8 * n)) & 0xff;

        /* One source byte pair fills one 16-bit slot: a on top, b below. */
        result |= ((from_a << 8) | from_b) << (16 * n);
    }
    return result;
}
/*
 * Interleave the low four bytes of a and b.
 *
 * Bytes 0..3 of each operand are merged pairwise into the result: each
 * 16-bit slot holds a byte from a in its upper half and the matching byte
 * from b in its lower half, in the same relative order as in the sources.
 */
uint64_t helper_v1int_l(uint64_t a, uint64_t b)
{
    uint64_t result = 0;
    unsigned n;

    for (n = 0; n < 4; n++) {
        uint64_t from_a = (a >> (8 * n)) & 0xff;
        uint64_t from_b = (b >> (8 * n)) & 0xff;

        /* One source byte pair fills one 16-bit slot: a on top, b below. */
        result |= ((from_a << 8) | from_b) << (16 * n);
    }
    return result;
}
/*
 * Interleave the high two halfwords of a and b.
 *
 * Halfwords 2..3 of each operand are merged pairwise into the result:
 * each 32-bit slot holds a halfword from a in its upper half and the
 * matching halfword from b in its lower half, in the same relative order
 * as in the sources.
 */
uint64_t helper_v2int_h(uint64_t a, uint64_t b)
{
    uint64_t hi_a = a >> 32;
    uint64_t hi_b = b >> 32;
    uint64_t result = 0;
    unsigned n;

    for (n = 0; n < 2; n++) {
        uint64_t from_a = (hi_a >> (16 * n)) & 0xffff;
        uint64_t from_b = (hi_b >> (16 * n)) & 0xffff;

        /* One source pair fills one 32-bit slot: a on top, b below. */
        result |= ((from_a << 16) | from_b) << (32 * n);
    }
    return result;
}
/*
 * Interleave the low two halfwords of a and b.
 *
 * Halfwords 0..1 of each operand are merged pairwise into the result:
 * each 32-bit slot holds a halfword from a in its upper half and the
 * matching halfword from b in its lower half, in the same relative order
 * as in the sources.
 */
uint64_t helper_v2int_l(uint64_t a, uint64_t b)
{
    uint64_t result = 0;
    unsigned n;

    for (n = 0; n < 2; n++) {
        uint64_t from_a = (a >> (16 * n)) & 0xffff;
        uint64_t from_b = (b >> (16 * n)) & 0xffff;

        /* One source pair fills one 32-bit slot: a on top, b below. */
        result |= ((from_a << 16) | from_b) << (32 * n);
    }
    return result;
}