tcg-op-gvec.h source code [qemu/tcg/tcg-op-gvec.h]

1	/*
2	* Generic vector operation expansion
3	*
4	* Copyright (c) 2018 Linaro
5	*
6	* This library is free software; you can redistribute it and/or
7	* modify it under the terms of the GNU Lesser General Public
8	* License as published by the Free Software Foundation; either
9	* version 2.1 of the License, or (at your option) any later version.
10	*
11	* This library is distributed in the hope that it will be useful,
12	* but WITHOUT ANY WARRANTY; without even the implied warranty of
13	* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14	* Lesser General Public License for more details.
15	*
16	* You should have received a copy of the GNU Lesser General Public
17	* License along with this library; if not, see <http://www.gnu.org/licenses/>.
18	*/
19
20	#ifndef TCG_TCG_OP_GVEC_H
21	#define TCG_TCG_OP_GVEC_H
22
/*
 * "Generic" vectors.  All operands are given as offsets from ENV,
 * and therefore cannot also be allocated via tcg_global_mem_new_*.
 * OPRSZ is the byte size of the vector upon which the operation is performed.
 * MAXSZ is the byte size of the full vector; bytes beyond OPRSZ are cleared.
 *
 * All sizes must be 8 or any multiple of 16.
 * When OPRSZ is 8, the alignment may be 8, otherwise must be 16.
 * Operands may completely, but not partially, overlap.
 */
33
/*
 * Expand a call to a gvec-style helper, with pointers to two vector
 * operands, and a descriptor (see tcg-gvec-desc.h).
 *
 * DOFS and AOFS are the offsets from ENV of the two vector operands.
 * OPRSZ and MAXSZ are the operation and full-vector sizes in bytes.
 * DATA is the extra value for the helper; presumably it is packed into
 * the descriptor alongside the sizes -- confirm in tcg-gvec-desc.h.
 * FN is the out-of-line helper to call.
 */
typedef void gen_helper_gvec_2(TCGv_ptr, TCGv_ptr, TCGv_i32);
void tcg_gen_gvec_2_ool(uint32_t dofs, uint32_t aofs,
                        uint32_t oprsz, uint32_t maxsz, int32_t data,
                        gen_helper_gvec_2 *fn);
40
41	/ Similarly, passing an extra data value. /
42	typedef void gen_helper_gvec_2i(TCGv_ptr, TCGv_ptr, TCGv_i64, TCGv_i32);
43	void tcg_gen_gvec_2i_ool(uint32_t dofs, uint32_t aofs, TCGv_i64 c,
44	uint32_t oprsz, uint32_t maxsz, int32_t data,
45	gen_helper_gvec_2i *fn);
46
47	/ Similarly, passing an extra pointer (e.g. env or float_status). /
48	typedef void gen_helper_gvec_2_ptr(TCGv_ptr, TCGv_ptr, TCGv_ptr, TCGv_i32);
49	void tcg_gen_gvec_2_ptr(uint32_t dofs, uint32_t aofs,
50	TCGv_ptr ptr, uint32_t oprsz, uint32_t maxsz,
51	int32_t data, gen_helper_gvec_2_ptr *fn);
52
/*
 * Similarly, with three vector operands.
 *
 * DOFS, AOFS and BOFS are the ENV offsets of the three vectors; the
 * helper receives one pointer per vector followed by the descriptor.
 */
typedef void gen_helper_gvec_3(TCGv_ptr, TCGv_ptr, TCGv_ptr, TCGv_i32);
void tcg_gen_gvec_3_ool(uint32_t dofs, uint32_t aofs, uint32_t bofs,
                        uint32_t oprsz, uint32_t maxsz, int32_t data,
                        gen_helper_gvec_3 *fn);
58
/*
 * Similarly, with four vector operands.
 *
 * DOFS, AOFS, BOFS and COFS are the ENV offsets of the four vectors; the
 * helper receives one pointer per vector followed by the descriptor.
 */
typedef void gen_helper_gvec_4(TCGv_ptr, TCGv_ptr, TCGv_ptr,
                               TCGv_ptr, TCGv_i32);
void tcg_gen_gvec_4_ool(uint32_t dofs, uint32_t aofs, uint32_t bofs,
                        uint32_t cofs, uint32_t oprsz, uint32_t maxsz,
                        int32_t data, gen_helper_gvec_4 *fn);
65
/*
 * Similarly, with five vector operands.
 *
 * DOFS, AOFS, BOFS, COFS and XOFS are the ENV offsets of the five
 * vectors; the helper receives one pointer per vector followed by the
 * descriptor.
 */
typedef void gen_helper_gvec_5(TCGv_ptr, TCGv_ptr, TCGv_ptr, TCGv_ptr,
                               TCGv_ptr, TCGv_i32);
void tcg_gen_gvec_5_ool(uint32_t dofs, uint32_t aofs, uint32_t bofs,
                        uint32_t cofs, uint32_t xofs, uint32_t oprsz,
                        uint32_t maxsz, int32_t data, gen_helper_gvec_5 *fn);
72
73	typedef void gen_helper_gvec_3_ptr(TCGv_ptr, TCGv_ptr, TCGv_ptr,
74	TCGv_ptr, TCGv_i32);
75	void tcg_gen_gvec_3_ptr(uint32_t dofs, uint32_t aofs, uint32_t bofs,
76	TCGv_ptr ptr, uint32_t oprsz, uint32_t maxsz,
77	int32_t data, gen_helper_gvec_3_ptr *fn);
78
79	typedef void gen_helper_gvec_4_ptr(TCGv_ptr, TCGv_ptr, TCGv_ptr,
80	TCGv_ptr, TCGv_ptr, TCGv_i32);
81	void tcg_gen_gvec_4_ptr(uint32_t dofs, uint32_t aofs, uint32_t bofs,
82	uint32_t cofs, TCGv_ptr ptr, uint32_t oprsz,
83	uint32_t maxsz, int32_t data,
84	gen_helper_gvec_4_ptr *fn);
85
86	/ Expand a gvec operation. Either inline or out-of-line depending on*
87	the actual vector size and the operations supported by the host. /*
88	typedef struct {
89	/ Expand inline as a 64-bit or 32-bit integer.*
90	Only one of these will be non-NULL. /*
91	void (*fni8)(TCGv_i64, TCGv_i64);
92	void (*fni4)(TCGv_i32, TCGv_i32);
93	/ Expand inline with a host vector type. /
94	void (fniv)(unsigned*, TCGv_vec, TCGv_vec);
95	/ Expand out-of-line helper w/descriptor. /
96	gen_helper_gvec_2 *fno;
97	/ The optional opcodes, if any, utilized by .fniv. /
98	const TCGOpcode *opt_opc;
99	/ The data argument to the out-of-line helper. /
100	int32_t data;
101	/ The vector element size, if applicable. /
102	uint8_t vece;
103	/ Prefer i64 to v64. /
104	bool prefer_i64;
105	} GVecGen2;
106
107	typedef struct {
108	/ Expand inline as a 64-bit or 32-bit integer.*
109	Only one of these will be non-NULL. /*
110	void (*fni8)(TCGv_i64, TCGv_i64, int64_t);
111	void (*fni4)(TCGv_i32, TCGv_i32, int32_t);
112	/ Expand inline with a host vector type. /
113	void (fniv)(unsigned*, TCGv_vec, TCGv_vec, int64_t);
114	/ Expand out-of-line helper w/descriptor, data in descriptor. /
115	gen_helper_gvec_2 *fno;
116	/ Expand out-of-line helper w/descriptor, data as argument. /
117	gen_helper_gvec_2i *fnoi;
118	/ The optional opcodes, if any, utilized by .fniv. /
119	const TCGOpcode *opt_opc;
120	/ The vector element size, if applicable. /
121	uint8_t vece;
122	/ Prefer i64 to v64. /
123	bool prefer_i64;
124	/ Load dest as a 3rd source operand. /
125	bool load_dest;
126	} GVecGen2i;
127
128	typedef struct {
129	/ Expand inline as a 64-bit or 32-bit integer.*
130	Only one of these will be non-NULL. /*
131	void (*fni8)(TCGv_i64, TCGv_i64, TCGv_i64);
132	void (*fni4)(TCGv_i32, TCGv_i32, TCGv_i32);
133	/ Expand inline with a host vector type. /
134	void (fniv)(unsigned*, TCGv_vec, TCGv_vec, TCGv_vec);
135	/ Expand out-of-line helper w/descriptor. /
136	gen_helper_gvec_2i *fno;
137	/ The optional opcodes, if any, utilized by .fniv. /
138	const TCGOpcode *opt_opc;
139	/ The data argument to the out-of-line helper. /
140	uint32_t data;
141	/ The vector element size, if applicable. /
142	uint8_t vece;
143	/ Prefer i64 to v64. /
144	bool prefer_i64;
145	/ Load scalar as 1st source operand. /
146	bool scalar_first;
147	} GVecGen2s;
148
149	typedef struct {
150	/ Expand inline as a 64-bit or 32-bit integer.*
151	Only one of these will be non-NULL. /*
152	void (*fni8)(TCGv_i64, TCGv_i64, TCGv_i64);
153	void (*fni4)(TCGv_i32, TCGv_i32, TCGv_i32);
154	/ Expand inline with a host vector type. /
155	void (fniv)(unsigned*, TCGv_vec, TCGv_vec, TCGv_vec);
156	/ Expand out-of-line helper w/descriptor. /
157	gen_helper_gvec_3 *fno;
158	/ The optional opcodes, if any, utilized by .fniv. /
159	const TCGOpcode *opt_opc;
160	/ The data argument to the out-of-line helper. /
161	int32_t data;
162	/ The vector element size, if applicable. /
163	uint8_t vece;
164	/ Prefer i64 to v64. /
165	bool prefer_i64;
166	/ Load dest as a 3rd source operand. /
167	bool load_dest;
168	} GVecGen3;
169
170	typedef struct {
171	/*
172	* Expand inline as a 64-bit or 32-bit integer. Only one of these will be
173	* non-NULL.
174	*/
175	void (*fni8)(TCGv_i64, TCGv_i64, TCGv_i64, int64_t);
176	void (*fni4)(TCGv_i32, TCGv_i32, TCGv_i32, int32_t);
177	/ Expand inline with a host vector type. /
178	void (fniv)(unsigned*, TCGv_vec, TCGv_vec, TCGv_vec, int64_t);
179	/ Expand out-of-line helper w/descriptor, data in descriptor. /
180	gen_helper_gvec_3 *fno;
181	/ The optional opcodes, if any, utilized by .fniv. /
182	const TCGOpcode *opt_opc;
183	/ The vector element size, if applicable. /
184	uint8_t vece;
185	/ Prefer i64 to v64. /
186	bool prefer_i64;
187	/ Load dest as a 3rd source operand. /
188	bool load_dest;
189	} GVecGen3i;
190
191	typedef struct {
192	/ Expand inline as a 64-bit or 32-bit integer.*
193	Only one of these will be non-NULL. /*
194	void (*fni8)(TCGv_i64, TCGv_i64, TCGv_i64, TCGv_i64);
195	void (*fni4)(TCGv_i32, TCGv_i32, TCGv_i32, TCGv_i32);
196	/ Expand inline with a host vector type. /
197	void (fniv)(unsigned*, TCGv_vec, TCGv_vec, TCGv_vec, TCGv_vec);
198	/ Expand out-of-line helper w/descriptor. /
199	gen_helper_gvec_4 *fno;
200	/ The optional opcodes, if any, utilized by .fniv. /
201	const TCGOpcode *opt_opc;
202	/ The data argument to the out-of-line helper. /
203	int32_t data;
204	/ The vector element size, if applicable. /
205	uint8_t vece;
206	/ Prefer i64 to v64. /
207	bool prefer_i64;
208	/ Write aofs as a 2nd dest operand. /
209	bool write_aofs;
210	} GVecGen4;
211
212	void tcg_gen_gvec_2(uint32_t dofs, uint32_t aofs,
213	uint32_t oprsz, uint32_t maxsz, const GVecGen2 *);
214	void tcg_gen_gvec_2i(uint32_t dofs, uint32_t aofs, uint32_t oprsz,
215	uint32_t maxsz, int64_t c, const GVecGen2i *);
216	void tcg_gen_gvec_2s(uint32_t dofs, uint32_t aofs, uint32_t oprsz,
217	uint32_t maxsz, TCGv_i64 c, const GVecGen2s *);
218	void tcg_gen_gvec_3(uint32_t dofs, uint32_t aofs, uint32_t bofs,
219	uint32_t oprsz, uint32_t maxsz, const GVecGen3 *);
220	void tcg_gen_gvec_3i(uint32_t dofs, uint32_t aofs, uint32_t bofs,
221	uint32_t oprsz, uint32_t maxsz, int64_t c,
222	const GVecGen3i *);
223	void tcg_gen_gvec_4(uint32_t dofs, uint32_t aofs, uint32_t bofs, uint32_t cofs,
224	uint32_t oprsz, uint32_t maxsz, const GVecGen4 *);
225
/* Expand a specific vector operation.  */

/*
 * Operations with one source vector (AOFS) and one result vector (DOFS),
 * both given as offsets from ENV.  VECE selects the element size; OPRSZ
 * and MAXSZ are the operation and full-vector sizes in bytes.  The
 * operation is the one named by the function suffix.
 */
void tcg_gen_gvec_mov(unsigned vece, uint32_t dofs, uint32_t aofs,
                      uint32_t oprsz, uint32_t maxsz);
void tcg_gen_gvec_not(unsigned vece, uint32_t dofs, uint32_t aofs,
                      uint32_t oprsz, uint32_t maxsz);
void tcg_gen_gvec_neg(unsigned vece, uint32_t dofs, uint32_t aofs,
                      uint32_t oprsz, uint32_t maxsz);
void tcg_gen_gvec_abs(unsigned vece, uint32_t dofs, uint32_t aofs,
                      uint32_t oprsz, uint32_t maxsz);
236
/*
 * Arithmetic on two source vectors (AOFS, BOFS) with the result at DOFS,
 * all given as offsets from ENV.  VECE selects the element size; OPRSZ
 * and MAXSZ are the operation and full-vector sizes in bytes.
 */
void tcg_gen_gvec_add(unsigned vece, uint32_t dofs, uint32_t aofs,
                      uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
void tcg_gen_gvec_sub(unsigned vece, uint32_t dofs, uint32_t aofs,
                      uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
void tcg_gen_gvec_mul(unsigned vece, uint32_t dofs, uint32_t aofs,
                      uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
243
/*
 * Arithmetic on one source vector (AOFS) and an immediate constant C,
 * with the result at DOFS.  VECE selects the element size; OPRSZ and
 * MAXSZ are the operation and full-vector sizes in bytes.
 */
void tcg_gen_gvec_addi(unsigned vece, uint32_t dofs, uint32_t aofs,
                       int64_t c, uint32_t oprsz, uint32_t maxsz);
void tcg_gen_gvec_muli(unsigned vece, uint32_t dofs, uint32_t aofs,
                       int64_t c, uint32_t oprsz, uint32_t maxsz);
248
249	void tcg_gen_gvec_adds(unsigned vece, uint32_t dofs, uint32_t aofs,
250	TCGv_i64 c, uint32_t oprsz, uint32_t maxsz);
251	void tcg_gen_gvec_subs(unsigned vece, uint32_t dofs, uint32_t aofs,
252	TCGv_i64 c, uint32_t oprsz, uint32_t maxsz);
253	void tcg_gen_gvec_muls(unsigned vece, uint32_t dofs, uint32_t aofs,
254	TCGv_i64 c, uint32_t oprsz, uint32_t maxsz);
255
/*
 * Saturated arithmetic.
 *
 * Two source vectors (AOFS, BOFS), result at DOFS.  The "ss" and "us"
 * prefixes presumably denote the signed and unsigned saturating forms --
 * confirm against the definitions.
 */
void tcg_gen_gvec_ssadd(unsigned vece, uint32_t dofs, uint32_t aofs,
                        uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
void tcg_gen_gvec_sssub(unsigned vece, uint32_t dofs, uint32_t aofs,
                        uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
void tcg_gen_gvec_usadd(unsigned vece, uint32_t dofs, uint32_t aofs,
                        uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
void tcg_gen_gvec_ussub(unsigned vece, uint32_t dofs, uint32_t aofs,
                        uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
265
/*
 * Min/max.
 *
 * Two source vectors (AOFS, BOFS), result at DOFS.  The "s" and "u"
 * prefixes presumably denote signed and unsigned element comparison --
 * confirm against the definitions.
 */
void tcg_gen_gvec_smin(unsigned vece, uint32_t dofs, uint32_t aofs,
                       uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
void tcg_gen_gvec_umin(unsigned vece, uint32_t dofs, uint32_t aofs,
                       uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
void tcg_gen_gvec_smax(unsigned vece, uint32_t dofs, uint32_t aofs,
                       uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
void tcg_gen_gvec_umax(unsigned vece, uint32_t dofs, uint32_t aofs,
                       uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
275
/*
 * Logical operations on two source vectors (AOFS, BOFS) with the result
 * at DOFS, all given as offsets from ENV.  OPRSZ and MAXSZ are the
 * operation and full-vector sizes in bytes.  Every function takes VECE
 * like the arithmetic expanders do.
 */
void tcg_gen_gvec_and(unsigned vece, uint32_t dofs, uint32_t aofs,
                      uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
void tcg_gen_gvec_or(unsigned vece, uint32_t dofs, uint32_t aofs,
                     uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
void tcg_gen_gvec_xor(unsigned vece, uint32_t dofs, uint32_t aofs,
                      uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
void tcg_gen_gvec_andc(unsigned vece, uint32_t dofs, uint32_t aofs,
                       uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
void tcg_gen_gvec_orc(unsigned vece, uint32_t dofs, uint32_t aofs,
                      uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
void tcg_gen_gvec_nand(unsigned vece, uint32_t dofs, uint32_t aofs,
                       uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
void tcg_gen_gvec_nor(unsigned vece, uint32_t dofs, uint32_t aofs,
                      uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
void tcg_gen_gvec_eqv(unsigned vece, uint32_t dofs, uint32_t aofs,
                      uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
292
/*
 * Logical operations on one source vector (AOFS) and an immediate
 * constant C, with the result at DOFS.  OPRSZ and MAXSZ are the
 * operation and full-vector sizes in bytes.
 */
void tcg_gen_gvec_andi(unsigned vece, uint32_t dofs, uint32_t aofs,
                       int64_t c, uint32_t oprsz, uint32_t maxsz);
void tcg_gen_gvec_xori(unsigned vece, uint32_t dofs, uint32_t aofs,
                       int64_t c, uint32_t oprsz, uint32_t maxsz);
void tcg_gen_gvec_ori(unsigned vece, uint32_t dofs, uint32_t aofs,
                      int64_t c, uint32_t oprsz, uint32_t maxsz);
299
300	void tcg_gen_gvec_ands(unsigned vece, uint32_t dofs, uint32_t aofs,
301	TCGv_i64 c, uint32_t oprsz, uint32_t maxsz);
302	void tcg_gen_gvec_xors(unsigned vece, uint32_t dofs, uint32_t aofs,
303	TCGv_i64 c, uint32_t oprsz, uint32_t maxsz);
304	void tcg_gen_gvec_ors(unsigned vece, uint32_t dofs, uint32_t aofs,
305	TCGv_i64 c, uint32_t oprsz, uint32_t maxsz);
306
/*
 * Duplicate into the vector at DOFS, taking the source from the ENV
 * offset AOFS.  VECE selects the element size.
 * NOTE(review): S and M presumably correspond to OPRSZ and MAXSZ of the
 * other expanders -- confirm against the definition.
 */
void tcg_gen_gvec_dup_mem(unsigned vece, uint32_t dofs, uint32_t aofs,
                          uint32_t s, uint32_t m);
309	void tcg_gen_gvec_dup_i32(unsigned vece, uint32_t dofs, uint32_t s,
310	uint32_t m, TCGv_i32);
311	void tcg_gen_gvec_dup_i64(unsigned vece, uint32_t dofs, uint32_t s,
312	uint32_t m, TCGv_i64);
313
/*
 * Duplicate the immediate X into the vector at DOFS.  The element width
 * is fixed by the function name and matches the type of X (8, 16, 32 or
 * 64 bits).
 * NOTE(review): S and M presumably correspond to OPRSZ and MAXSZ of the
 * other expanders -- confirm against the definition.
 */
void tcg_gen_gvec_dup8i(uint32_t dofs, uint32_t s, uint32_t m, uint8_t x);
void tcg_gen_gvec_dup16i(uint32_t dofs, uint32_t s, uint32_t m, uint16_t x);
void tcg_gen_gvec_dup32i(uint32_t dofs, uint32_t s, uint32_t m, uint32_t x);
void tcg_gen_gvec_dup64i(uint32_t dofs, uint32_t s, uint32_t m, uint64_t x);
318
/*
 * Shift each element of the vector at AOFS by the immediate SHIFT, with
 * the result at DOFS.  VECE selects the element size.  The shl/shr/sar
 * suffixes presumably denote left, logical right and arithmetic right
 * shifts -- confirm against the definitions.
 */
void tcg_gen_gvec_shli(unsigned vece, uint32_t dofs, uint32_t aofs,
                       int64_t shift, uint32_t oprsz, uint32_t maxsz);
void tcg_gen_gvec_shri(unsigned vece, uint32_t dofs, uint32_t aofs,
                       int64_t shift, uint32_t oprsz, uint32_t maxsz);
void tcg_gen_gvec_sari(unsigned vece, uint32_t dofs, uint32_t aofs,
                       int64_t shift, uint32_t oprsz, uint32_t maxsz);
325
326	void tcg_gen_gvec_shls(unsigned vece, uint32_t dofs, uint32_t aofs,
327	TCGv_i32 shift, uint32_t oprsz, uint32_t maxsz);
328	void tcg_gen_gvec_shrs(unsigned vece, uint32_t dofs, uint32_t aofs,
329	TCGv_i32 shift, uint32_t oprsz, uint32_t maxsz);
330	void tcg_gen_gvec_sars(unsigned vece, uint32_t dofs, uint32_t aofs,
331	TCGv_i32 shift, uint32_t oprsz, uint32_t maxsz);
332
/*
 * Perform vector shift by vector element, modulo the element size.
 * E.g.  D[i] = A[i] << (B[i] % (8 << vece)).
 *
 * The shift counts come from the vector at BOFS, the values from AOFS,
 * and the result is stored at DOFS.
 */
void tcg_gen_gvec_shlv(unsigned vece, uint32_t dofs, uint32_t aofs,
                       uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
void tcg_gen_gvec_shrv(unsigned vece, uint32_t dofs, uint32_t aofs,
                       uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
void tcg_gen_gvec_sarv(unsigned vece, uint32_t dofs, uint32_t aofs,
                       uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
343
344	void tcg_gen_gvec_cmp(TCGCond cond, unsigned vece, uint32_t dofs,
345	uint32_t aofs, uint32_t bofs,
346	uint32_t oprsz, uint32_t maxsz);
347
/*
 * Perform vector bit select: d = (b & a) | (c & ~a).
 *
 * The vector at AOFS is the selector: where a bit of A is set the result
 * bit comes from B (BOFS), otherwise from C (COFS).
 */
void tcg_gen_gvec_bitsel(unsigned vece, uint32_t dofs, uint32_t aofs,
                         uint32_t bofs, uint32_t cofs,
                         uint32_t oprsz, uint32_t maxsz);
354
355	/*
356	* 64-bit vector operations. Use these when the register has been allocated
357	* with tcg_global_mem_new_i64, and so we cannot also address it via pointer.
358	* OPRSZ = MAXSZ = 8.
359	*/
360
361	void tcg_gen_vec_neg8_i64(TCGv_i64 d, TCGv_i64 a);
362	void tcg_gen_vec_neg16_i64(TCGv_i64 d, TCGv_i64 a);
363	void tcg_gen_vec_neg32_i64(TCGv_i64 d, TCGv_i64 a);
364
365	void tcg_gen_vec_add8_i64(TCGv_i64 d, TCGv_i64 a, TCGv_i64 b);
366	void tcg_gen_vec_add16_i64(TCGv_i64 d, TCGv_i64 a, TCGv_i64 b);
367	void tcg_gen_vec_add32_i64(TCGv_i64 d, TCGv_i64 a, TCGv_i64 b);
368
369	void tcg_gen_vec_sub8_i64(TCGv_i64 d, TCGv_i64 a, TCGv_i64 b);
370	void tcg_gen_vec_sub16_i64(TCGv_i64 d, TCGv_i64 a, TCGv_i64 b);
371	void tcg_gen_vec_sub32_i64(TCGv_i64 d, TCGv_i64 a, TCGv_i64 b);
372
373	void tcg_gen_vec_shl8i_i64(TCGv_i64 d, TCGv_i64 a, int64_t);
374	void tcg_gen_vec_shl16i_i64(TCGv_i64 d, TCGv_i64 a, int64_t);
375	void tcg_gen_vec_shr8i_i64(TCGv_i64 d, TCGv_i64 a, int64_t);
376	void tcg_gen_vec_shr16i_i64(TCGv_i64 d, TCGv_i64 a, int64_t);
377	void tcg_gen_vec_sar8i_i64(TCGv_i64 d, TCGv_i64 a, int64_t);
378	void tcg_gen_vec_sar16i_i64(TCGv_i64 d, TCGv_i64 a, int64_t);
379
380	#endif
381

Browse the source code of qemu/tcg/tcg-op-gvec.h