xref: /openbmc/qemu/include/tcg/tcg-op-gvec.h (revision 0c4e9931)
1 /*
2  * Generic vector operation expansion
3  *
4  * Copyright (c) 2018 Linaro
5  *
6  * This library is free software; you can redistribute it and/or
7  * modify it under the terms of the GNU Lesser General Public
8  * License as published by the Free Software Foundation; either
9  * version 2.1 of the License, or (at your option) any later version.
10  *
11  * This library is distributed in the hope that it will be useful,
12  * but WITHOUT ANY WARRANTY; without even the implied warranty of
13  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
14  * Lesser General Public License for more details.
15  *
16  * You should have received a copy of the GNU Lesser General Public
17  * License along with this library; if not, see <http://www.gnu.org/licenses/>.
18  */
19 
20 #ifndef TCG_TCG_OP_GVEC_H
21 #define TCG_TCG_OP_GVEC_H
22 
23 /*
24  * "Generic" vectors.  All operands are given as offsets from ENV,
25  * and therefore cannot also be allocated via tcg_global_mem_new_*.
26  * OPRSZ is the byte size of the vector upon which the operation is performed.
27  * MAXSZ is the byte size of the full vector; bytes beyond OPSZ are cleared.
28  *
29  * All sizes must be 8 or any multiple of 16.
30  * When OPRSZ is 8, the alignment may be 8, otherwise must be 16.
31  * Operands may completely, but not partially, overlap.
32  */
33 
34 /* Expand a call to a gvec-style helper, with pointers to two vector
35    operands, and a descriptor (see tcg-gvec-desc.h).  */
36 typedef void gen_helper_gvec_2(TCGv_ptr, TCGv_ptr, TCGv_i32);
37 void tcg_gen_gvec_2_ool(uint32_t dofs, uint32_t aofs,
38                         uint32_t oprsz, uint32_t maxsz, int32_t data,
39                         gen_helper_gvec_2 *fn);
40 
41 /* Similarly, passing an extra data value.  */
42 typedef void gen_helper_gvec_2i(TCGv_ptr, TCGv_ptr, TCGv_i64, TCGv_i32);
43 void tcg_gen_gvec_2i_ool(uint32_t dofs, uint32_t aofs, TCGv_i64 c,
44                          uint32_t oprsz, uint32_t maxsz, int32_t data,
45                          gen_helper_gvec_2i *fn);
46 
47 /* Similarly, passing an extra pointer (e.g. env or float_status).  */
48 typedef void gen_helper_gvec_2_ptr(TCGv_ptr, TCGv_ptr, TCGv_ptr, TCGv_i32);
49 void tcg_gen_gvec_2_ptr(uint32_t dofs, uint32_t aofs,
50                         TCGv_ptr ptr, uint32_t oprsz, uint32_t maxsz,
51                         int32_t data, gen_helper_gvec_2_ptr *fn);
52 
53 /* Similarly, with three vector operands.  */
54 typedef void gen_helper_gvec_3(TCGv_ptr, TCGv_ptr, TCGv_ptr, TCGv_i32);
55 void tcg_gen_gvec_3_ool(uint32_t dofs, uint32_t aofs, uint32_t bofs,
56                         uint32_t oprsz, uint32_t maxsz, int32_t data,
57                         gen_helper_gvec_3 *fn);
58 
59 /* Similarly, with four vector operands.  */
60 typedef void gen_helper_gvec_4(TCGv_ptr, TCGv_ptr, TCGv_ptr,
61                                TCGv_ptr, TCGv_i32);
62 void tcg_gen_gvec_4_ool(uint32_t dofs, uint32_t aofs, uint32_t bofs,
63                         uint32_t cofs, uint32_t oprsz, uint32_t maxsz,
64                         int32_t data, gen_helper_gvec_4 *fn);
65 
66 /* Similarly, with five vector operands.  */
67 typedef void gen_helper_gvec_5(TCGv_ptr, TCGv_ptr, TCGv_ptr, TCGv_ptr,
68                                TCGv_ptr, TCGv_i32);
69 void tcg_gen_gvec_5_ool(uint32_t dofs, uint32_t aofs, uint32_t bofs,
70                         uint32_t cofs, uint32_t xofs, uint32_t oprsz,
71                         uint32_t maxsz, int32_t data, gen_helper_gvec_5 *fn);
72 
73 typedef void gen_helper_gvec_3_ptr(TCGv_ptr, TCGv_ptr, TCGv_ptr,
74                                    TCGv_ptr, TCGv_i32);
75 void tcg_gen_gvec_3_ptr(uint32_t dofs, uint32_t aofs, uint32_t bofs,
76                         TCGv_ptr ptr, uint32_t oprsz, uint32_t maxsz,
77                         int32_t data, gen_helper_gvec_3_ptr *fn);
78 
79 typedef void gen_helper_gvec_4_ptr(TCGv_ptr, TCGv_ptr, TCGv_ptr,
80                                    TCGv_ptr, TCGv_ptr, TCGv_i32);
81 void tcg_gen_gvec_4_ptr(uint32_t dofs, uint32_t aofs, uint32_t bofs,
82                         uint32_t cofs, TCGv_ptr ptr, uint32_t oprsz,
83                         uint32_t maxsz, int32_t data,
84                         gen_helper_gvec_4_ptr *fn);
85 
86 typedef void gen_helper_gvec_5_ptr(TCGv_ptr, TCGv_ptr, TCGv_ptr, TCGv_ptr,
87                                    TCGv_ptr, TCGv_ptr, TCGv_i32);
88 void tcg_gen_gvec_5_ptr(uint32_t dofs, uint32_t aofs, uint32_t bofs,
89                         uint32_t cofs, uint32_t eofs, TCGv_ptr ptr,
90                         uint32_t oprsz, uint32_t maxsz, int32_t data,
91                         gen_helper_gvec_5_ptr *fn);
92 
93 /* Expand a gvec operation.  Either inline or out-of-line depending on
94    the actual vector size and the operations supported by the host.  */
95 typedef struct {
96     /* Expand inline as a 64-bit or 32-bit integer.
97        Only one of these will be non-NULL.  */
98     void (*fni8)(TCGv_i64, TCGv_i64);
99     void (*fni4)(TCGv_i32, TCGv_i32);
100     /* Expand inline with a host vector type.  */
101     void (*fniv)(unsigned, TCGv_vec, TCGv_vec);
102     /* Expand out-of-line helper w/descriptor.  */
103     gen_helper_gvec_2 *fno;
104     /* The optional opcodes, if any, utilized by .fniv.  */
105     const TCGOpcode *opt_opc;
106     /* The data argument to the out-of-line helper.  */
107     int32_t data;
108     /* The vector element size, if applicable.  */
109     uint8_t vece;
110     /* Prefer i64 to v64.  */
111     bool prefer_i64;
112     /* Load dest as a 2nd source operand.  */
113     bool load_dest;
114 } GVecGen2;
115 
116 typedef struct {
117     /* Expand inline as a 64-bit or 32-bit integer.
118        Only one of these will be non-NULL.  */
119     void (*fni8)(TCGv_i64, TCGv_i64, int64_t);
120     void (*fni4)(TCGv_i32, TCGv_i32, int32_t);
121     /* Expand inline with a host vector type.  */
122     void (*fniv)(unsigned, TCGv_vec, TCGv_vec, int64_t);
123     /* Expand out-of-line helper w/descriptor, data in descriptor.  */
124     gen_helper_gvec_2 *fno;
125     /* Expand out-of-line helper w/descriptor, data as argument.  */
126     gen_helper_gvec_2i *fnoi;
127     /* The optional opcodes, if any, utilized by .fniv.  */
128     const TCGOpcode *opt_opc;
129     /* The vector element size, if applicable.  */
130     uint8_t vece;
131     /* Prefer i64 to v64.  */
132     bool prefer_i64;
133     /* Load dest as a 3rd source operand.  */
134     bool load_dest;
135 } GVecGen2i;
136 
137 typedef struct {
138     /* Expand inline as a 64-bit or 32-bit integer.
139        Only one of these will be non-NULL.  */
140     void (*fni8)(TCGv_i64, TCGv_i64, TCGv_i64);
141     void (*fni4)(TCGv_i32, TCGv_i32, TCGv_i32);
142     /* Expand inline with a host vector type.  */
143     void (*fniv)(unsigned, TCGv_vec, TCGv_vec, TCGv_vec);
144     /* Expand out-of-line helper w/descriptor.  */
145     gen_helper_gvec_2i *fno;
146     /* The optional opcodes, if any, utilized by .fniv.  */
147     const TCGOpcode *opt_opc;
148     /* The data argument to the out-of-line helper.  */
149     uint32_t data;
150     /* The vector element size, if applicable.  */
151     uint8_t vece;
152     /* Prefer i64 to v64.  */
153     bool prefer_i64;
154     /* Load scalar as 1st source operand.  */
155     bool scalar_first;
156 } GVecGen2s;
157 
158 typedef struct {
159     /* Expand inline as a 64-bit or 32-bit integer.
160        Only one of these will be non-NULL.  */
161     void (*fni8)(TCGv_i64, TCGv_i64, TCGv_i64);
162     void (*fni4)(TCGv_i32, TCGv_i32, TCGv_i32);
163     /* Expand inline with a host vector type.  */
164     void (*fniv)(unsigned, TCGv_vec, TCGv_vec, TCGv_vec);
165     /* Expand out-of-line helper w/descriptor.  */
166     gen_helper_gvec_3 *fno;
167     /* The optional opcodes, if any, utilized by .fniv.  */
168     const TCGOpcode *opt_opc;
169     /* The data argument to the out-of-line helper.  */
170     int32_t data;
171     /* The vector element size, if applicable.  */
172     uint8_t vece;
173     /* Prefer i64 to v64.  */
174     bool prefer_i64;
175     /* Load dest as a 3rd source operand.  */
176     bool load_dest;
177 } GVecGen3;
178 
179 typedef struct {
180     /*
181      * Expand inline as a 64-bit or 32-bit integer. Only one of these will be
182      * non-NULL.
183      */
184     void (*fni8)(TCGv_i64, TCGv_i64, TCGv_i64, int64_t);
185     void (*fni4)(TCGv_i32, TCGv_i32, TCGv_i32, int32_t);
186     /* Expand inline with a host vector type.  */
187     void (*fniv)(unsigned, TCGv_vec, TCGv_vec, TCGv_vec, int64_t);
188     /* Expand out-of-line helper w/descriptor, data in descriptor.  */
189     gen_helper_gvec_3 *fno;
190     /* The optional opcodes, if any, utilized by .fniv.  */
191     const TCGOpcode *opt_opc;
192     /* The vector element size, if applicable.  */
193     uint8_t vece;
194     /* Prefer i64 to v64.  */
195     bool prefer_i64;
196     /* Load dest as a 3rd source operand.  */
197     bool load_dest;
198 } GVecGen3i;
199 
200 typedef struct {
201     /* Expand inline as a 64-bit or 32-bit integer.
202        Only one of these will be non-NULL.  */
203     void (*fni8)(TCGv_i64, TCGv_i64, TCGv_i64, TCGv_i64);
204     void (*fni4)(TCGv_i32, TCGv_i32, TCGv_i32, TCGv_i32);
205     /* Expand inline with a host vector type.  */
206     void (*fniv)(unsigned, TCGv_vec, TCGv_vec, TCGv_vec, TCGv_vec);
207     /* Expand out-of-line helper w/descriptor.  */
208     gen_helper_gvec_4 *fno;
209     /* The optional opcodes, if any, utilized by .fniv.  */
210     const TCGOpcode *opt_opc;
211     /* The data argument to the out-of-line helper.  */
212     int32_t data;
213     /* The vector element size, if applicable.  */
214     uint8_t vece;
215     /* Prefer i64 to v64.  */
216     bool prefer_i64;
217     /* Write aofs as a 2nd dest operand.  */
218     bool write_aofs;
219 } GVecGen4;
220 
221 void tcg_gen_gvec_2(uint32_t dofs, uint32_t aofs,
222                     uint32_t oprsz, uint32_t maxsz, const GVecGen2 *);
223 void tcg_gen_gvec_2i(uint32_t dofs, uint32_t aofs, uint32_t oprsz,
224                      uint32_t maxsz, int64_t c, const GVecGen2i *);
225 void tcg_gen_gvec_2s(uint32_t dofs, uint32_t aofs, uint32_t oprsz,
226                      uint32_t maxsz, TCGv_i64 c, const GVecGen2s *);
227 void tcg_gen_gvec_3(uint32_t dofs, uint32_t aofs, uint32_t bofs,
228                     uint32_t oprsz, uint32_t maxsz, const GVecGen3 *);
229 void tcg_gen_gvec_3i(uint32_t dofs, uint32_t aofs, uint32_t bofs,
230                      uint32_t oprsz, uint32_t maxsz, int64_t c,
231                      const GVecGen3i *);
232 void tcg_gen_gvec_4(uint32_t dofs, uint32_t aofs, uint32_t bofs, uint32_t cofs,
233                     uint32_t oprsz, uint32_t maxsz, const GVecGen4 *);
234 
235 /* Expand a specific vector operation.  */
236 
237 void tcg_gen_gvec_mov(unsigned vece, uint32_t dofs, uint32_t aofs,
238                       uint32_t oprsz, uint32_t maxsz);
239 void tcg_gen_gvec_not(unsigned vece, uint32_t dofs, uint32_t aofs,
240                       uint32_t oprsz, uint32_t maxsz);
241 void tcg_gen_gvec_neg(unsigned vece, uint32_t dofs, uint32_t aofs,
242                       uint32_t oprsz, uint32_t maxsz);
243 void tcg_gen_gvec_abs(unsigned vece, uint32_t dofs, uint32_t aofs,
244                       uint32_t oprsz, uint32_t maxsz);
245 
246 void tcg_gen_gvec_add(unsigned vece, uint32_t dofs, uint32_t aofs,
247                       uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
248 void tcg_gen_gvec_sub(unsigned vece, uint32_t dofs, uint32_t aofs,
249                       uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
250 void tcg_gen_gvec_mul(unsigned vece, uint32_t dofs, uint32_t aofs,
251                       uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
252 
253 void tcg_gen_gvec_addi(unsigned vece, uint32_t dofs, uint32_t aofs,
254                        int64_t c, uint32_t oprsz, uint32_t maxsz);
255 void tcg_gen_gvec_muli(unsigned vece, uint32_t dofs, uint32_t aofs,
256                        int64_t c, uint32_t oprsz, uint32_t maxsz);
257 
258 void tcg_gen_gvec_adds(unsigned vece, uint32_t dofs, uint32_t aofs,
259                        TCGv_i64 c, uint32_t oprsz, uint32_t maxsz);
260 void tcg_gen_gvec_subs(unsigned vece, uint32_t dofs, uint32_t aofs,
261                        TCGv_i64 c, uint32_t oprsz, uint32_t maxsz);
262 void tcg_gen_gvec_muls(unsigned vece, uint32_t dofs, uint32_t aofs,
263                        TCGv_i64 c, uint32_t oprsz, uint32_t maxsz);
264 
265 /* Saturated arithmetic.  */
266 void tcg_gen_gvec_ssadd(unsigned vece, uint32_t dofs, uint32_t aofs,
267                         uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
268 void tcg_gen_gvec_sssub(unsigned vece, uint32_t dofs, uint32_t aofs,
269                         uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
270 void tcg_gen_gvec_usadd(unsigned vece, uint32_t dofs, uint32_t aofs,
271                         uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
272 void tcg_gen_gvec_ussub(unsigned vece, uint32_t dofs, uint32_t aofs,
273                         uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
274 
275 /* Min/max.  */
276 void tcg_gen_gvec_smin(unsigned vece, uint32_t dofs, uint32_t aofs,
277                        uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
278 void tcg_gen_gvec_umin(unsigned vece, uint32_t dofs, uint32_t aofs,
279                        uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
280 void tcg_gen_gvec_smax(unsigned vece, uint32_t dofs, uint32_t aofs,
281                        uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
282 void tcg_gen_gvec_umax(unsigned vece, uint32_t dofs, uint32_t aofs,
283                        uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
284 
285 void tcg_gen_gvec_and(unsigned vece, uint32_t dofs, uint32_t aofs,
286                       uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
287 void tcg_gen_gvec_or(unsigned vece, uint32_t dofs, uint32_t aofs,
288                      uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
289 void tcg_gen_gvec_xor(unsigned vece, uint32_t dofs, uint32_t aofs,
290                       uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
291 void tcg_gen_gvec_andc(unsigned vece, uint32_t dofs, uint32_t aofs,
292                        uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
293 void tcg_gen_gvec_orc(unsigned vece, uint32_t dofs, uint32_t aofs,
294                       uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
295 void tcg_gen_gvec_nand(unsigned vece, uint32_t dofs, uint32_t aofs,
296                        uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
297 void tcg_gen_gvec_nor(unsigned vece, uint32_t dofs, uint32_t aofs,
298                       uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
299 void tcg_gen_gvec_eqv(unsigned vece, uint32_t dofs, uint32_t aofs,
300                       uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
301 
302 void tcg_gen_gvec_andi(unsigned vece, uint32_t dofs, uint32_t aofs,
303                        int64_t c, uint32_t oprsz, uint32_t maxsz);
304 void tcg_gen_gvec_xori(unsigned vece, uint32_t dofs, uint32_t aofs,
305                        int64_t c, uint32_t oprsz, uint32_t maxsz);
306 void tcg_gen_gvec_ori(unsigned vece, uint32_t dofs, uint32_t aofs,
307                       int64_t c, uint32_t oprsz, uint32_t maxsz);
308 
309 void tcg_gen_gvec_ands(unsigned vece, uint32_t dofs, uint32_t aofs,
310                        TCGv_i64 c, uint32_t oprsz, uint32_t maxsz);
311 void tcg_gen_gvec_xors(unsigned vece, uint32_t dofs, uint32_t aofs,
312                        TCGv_i64 c, uint32_t oprsz, uint32_t maxsz);
313 void tcg_gen_gvec_ors(unsigned vece, uint32_t dofs, uint32_t aofs,
314                       TCGv_i64 c, uint32_t oprsz, uint32_t maxsz);
315 
316 void tcg_gen_gvec_dup_mem(unsigned vece, uint32_t dofs, uint32_t aofs,
317                           uint32_t s, uint32_t m);
318 void tcg_gen_gvec_dup_imm(unsigned vece, uint32_t dofs, uint32_t s,
319                           uint32_t m, uint64_t imm);
320 void tcg_gen_gvec_dup_i32(unsigned vece, uint32_t dofs, uint32_t s,
321                           uint32_t m, TCGv_i32);
322 void tcg_gen_gvec_dup_i64(unsigned vece, uint32_t dofs, uint32_t s,
323                           uint32_t m, TCGv_i64);
324 
325 #if TARGET_LONG_BITS == 64
326 # define tcg_gen_gvec_dup_tl  tcg_gen_gvec_dup_i64
327 #else
328 # define tcg_gen_gvec_dup_tl  tcg_gen_gvec_dup_i32
329 #endif
330 
331 void tcg_gen_gvec_shli(unsigned vece, uint32_t dofs, uint32_t aofs,
332                        int64_t shift, uint32_t oprsz, uint32_t maxsz);
333 void tcg_gen_gvec_shri(unsigned vece, uint32_t dofs, uint32_t aofs,
334                        int64_t shift, uint32_t oprsz, uint32_t maxsz);
335 void tcg_gen_gvec_sari(unsigned vece, uint32_t dofs, uint32_t aofs,
336                        int64_t shift, uint32_t oprsz, uint32_t maxsz);
337 
338 void tcg_gen_gvec_shls(unsigned vece, uint32_t dofs, uint32_t aofs,
339                        TCGv_i32 shift, uint32_t oprsz, uint32_t maxsz);
340 void tcg_gen_gvec_shrs(unsigned vece, uint32_t dofs, uint32_t aofs,
341                        TCGv_i32 shift, uint32_t oprsz, uint32_t maxsz);
342 void tcg_gen_gvec_sars(unsigned vece, uint32_t dofs, uint32_t aofs,
343                        TCGv_i32 shift, uint32_t oprsz, uint32_t maxsz);
344 
345 /*
346  * Perform vector shift by vector element, modulo the element size.
347  * E.g.  D[i] = A[i] << (B[i] % (8 << vece)).
348  */
349 void tcg_gen_gvec_shlv(unsigned vece, uint32_t dofs, uint32_t aofs,
350                        uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
351 void tcg_gen_gvec_shrv(unsigned vece, uint32_t dofs, uint32_t aofs,
352                        uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
353 void tcg_gen_gvec_sarv(unsigned vece, uint32_t dofs, uint32_t aofs,
354                        uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
355 
356 void tcg_gen_gvec_cmp(TCGCond cond, unsigned vece, uint32_t dofs,
357                       uint32_t aofs, uint32_t bofs,
358                       uint32_t oprsz, uint32_t maxsz);
359 
360 /*
361  * Perform vector bit select: d = (b & a) | (c & ~a).
362  */
363 void tcg_gen_gvec_bitsel(unsigned vece, uint32_t dofs, uint32_t aofs,
364                          uint32_t bofs, uint32_t cofs,
365                          uint32_t oprsz, uint32_t maxsz);
366 
367 /*
368  * 64-bit vector operations.  Use these when the register has been allocated
369  * with tcg_global_mem_new_i64, and so we cannot also address it via pointer.
370  * OPRSZ = MAXSZ = 8.
371  */
372 
373 void tcg_gen_vec_neg8_i64(TCGv_i64 d, TCGv_i64 a);
374 void tcg_gen_vec_neg16_i64(TCGv_i64 d, TCGv_i64 a);
375 void tcg_gen_vec_neg32_i64(TCGv_i64 d, TCGv_i64 a);
376 
377 void tcg_gen_vec_add8_i64(TCGv_i64 d, TCGv_i64 a, TCGv_i64 b);
378 void tcg_gen_vec_add16_i64(TCGv_i64 d, TCGv_i64 a, TCGv_i64 b);
379 void tcg_gen_vec_add32_i64(TCGv_i64 d, TCGv_i64 a, TCGv_i64 b);
380 
381 void tcg_gen_vec_sub8_i64(TCGv_i64 d, TCGv_i64 a, TCGv_i64 b);
382 void tcg_gen_vec_sub16_i64(TCGv_i64 d, TCGv_i64 a, TCGv_i64 b);
383 void tcg_gen_vec_sub32_i64(TCGv_i64 d, TCGv_i64 a, TCGv_i64 b);
384 
385 void tcg_gen_vec_shl8i_i64(TCGv_i64 d, TCGv_i64 a, int64_t);
386 void tcg_gen_vec_shl16i_i64(TCGv_i64 d, TCGv_i64 a, int64_t);
387 void tcg_gen_vec_shr8i_i64(TCGv_i64 d, TCGv_i64 a, int64_t);
388 void tcg_gen_vec_shr16i_i64(TCGv_i64 d, TCGv_i64 a, int64_t);
389 void tcg_gen_vec_sar8i_i64(TCGv_i64 d, TCGv_i64 a, int64_t);
390 void tcg_gen_vec_sar16i_i64(TCGv_i64 d, TCGv_i64 a, int64_t);
391 
392 #endif
393