mirror of
https://github.com/yuzu-emu/unicorn
synced 2024-11-25 06:49:24 +00:00
57bdf0faa2
No vector ops as yet. SSE only has direct support for 8- and 16-bit saturation; handling 32- and 64-bit saturation is much more expensive. Backports commit f49b12c6e6a75a5bd109bcbbda072b24e5fb8dfd from qemu
249 lines
12 KiB
C
249 lines
12 KiB
C
/*
|
|
* Generic vector operation expansion
|
|
*
|
|
* Copyright (c) 2018 Linaro
|
|
*
|
|
* This library is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
* License as published by the Free Software Foundation; either
|
|
* version 2 of the License, or (at your option) any later version.
|
|
*
|
|
* This library is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
* Lesser General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
* License along with this library; if not, see <http://www.gnu.org/licenses/>.
|
|
*/
|
|
|
|
/*
|
|
* "Generic" vectors. All operands are given as offsets from ENV,
|
|
* and therefore cannot also be allocated via tcg_global_mem_new_*.
|
|
* OPRSZ is the byte size of the vector upon which the operation is performed.
|
|
* MAXSZ is the byte size of the full vector; bytes beyond OPSZ are cleared.
|
|
*
|
|
* All sizes must be 8 or any multiple of 16.
|
|
* When OPRSZ is 8, the alignment may be 8, otherwise must be 16.
|
|
* Operands may completely, but not partially, overlap.
|
|
*/
|
|
|
|
/* Expand a call to a gvec-style helper, with pointers to two vector
|
|
operands, and a descriptor (see tcg-gvec-desc.h). */
|
|
typedef void gen_helper_gvec_2(TCGContext *s, TCGv_ptr, TCGv_ptr, TCGv_i32);
|
|
void tcg_gen_gvec_2_ool(TCGContext *, uint32_t dofs, uint32_t aofs,
|
|
uint32_t oprsz, uint32_t maxsz, int32_t data,
|
|
gen_helper_gvec_2 *fn);
|
|
|
|
/* Similarly, passing an extra pointer (e.g. env or float_status). */
|
|
typedef void gen_helper_gvec_2_ptr(TCGContext *s, TCGv_ptr, TCGv_ptr, TCGv_ptr, TCGv_i32);
|
|
void tcg_gen_gvec_2_ptr(TCGContext *, uint32_t dofs, uint32_t aofs,
|
|
TCGv_ptr ptr, uint32_t oprsz, uint32_t maxsz,
|
|
int32_t data, gen_helper_gvec_2_ptr *fn);
|
|
|
|
/* Similarly, with three vector operands. */
|
|
typedef void gen_helper_gvec_3(TCGContext *s, TCGv_ptr, TCGv_ptr, TCGv_ptr, TCGv_i32);
|
|
void tcg_gen_gvec_3_ool(TCGContext *, uint32_t dofs, uint32_t aofs, uint32_t bofs,
|
|
uint32_t oprsz, uint32_t maxsz, int32_t data,
|
|
gen_helper_gvec_3 *fn);
|
|
|
|
/* Similarly, with four vector operands. */
|
|
typedef void gen_helper_gvec_4(TCGContext *s, TCGv_ptr, TCGv_ptr, TCGv_ptr,
|
|
TCGv_ptr, TCGv_i32);
|
|
void tcg_gen_gvec_4_ool(TCGContext *, uint32_t dofs, uint32_t aofs, uint32_t bofs,
|
|
uint32_t cofs, uint32_t oprsz, uint32_t maxsz,
|
|
int32_t data, gen_helper_gvec_4 *fn);
|
|
|
|
/* Similarly, with five vector operands. */
|
|
typedef void gen_helper_gvec_5(TCGContext *s, TCGv_ptr, TCGv_ptr, TCGv_ptr, TCGv_ptr,
|
|
TCGv_ptr, TCGv_i32);
|
|
void tcg_gen_gvec_5_ool(TCGContext *, uint32_t dofs, uint32_t aofs, uint32_t bofs,
|
|
uint32_t cofs, uint32_t xofs, uint32_t oprsz,
|
|
uint32_t maxsz, int32_t data, gen_helper_gvec_5 *fn);
|
|
|
|
typedef void gen_helper_gvec_3_ptr(TCGContext *s, TCGv_ptr, TCGv_ptr, TCGv_ptr,
|
|
TCGv_ptr, TCGv_i32);
|
|
void tcg_gen_gvec_3_ptr(TCGContext *, uint32_t dofs, uint32_t aofs, uint32_t bofs,
|
|
TCGv_ptr ptr, uint32_t oprsz, uint32_t maxsz,
|
|
int32_t data, gen_helper_gvec_3_ptr *fn);
|
|
|
|
typedef void gen_helper_gvec_4_ptr(TCGContext *s, TCGv_ptr, TCGv_ptr, TCGv_ptr,
|
|
TCGv_ptr, TCGv_ptr, TCGv_i32);
|
|
void tcg_gen_gvec_4_ptr(TCGContext *s, uint32_t dofs, uint32_t aofs, uint32_t bofs,
|
|
uint32_t cofs, TCGv_ptr ptr, uint32_t oprsz,
|
|
uint32_t maxsz, int32_t data,
|
|
gen_helper_gvec_4_ptr *fn);
|
|
|
|
/* Expand a gvec operation. Either inline or out-of-line depending on
|
|
the actual vector size and the operations supported by the host. */
|
|
typedef struct {
|
|
/* Expand inline as a 64-bit or 32-bit integer.
|
|
Only one of these will be non-NULL. */
|
|
void (*fni8)(TCGContext *, TCGv_i64, TCGv_i64, int64_t);
|
|
void (*fni4)(TCGContext *, TCGv_i32, TCGv_i32, int32_t);
|
|
/* Expand inline with a host vector type. */
|
|
void (*fniv)(TCGContext *, unsigned, TCGv_vec, TCGv_vec, int64_t);
|
|
/* Expand out-of-line helper w/descriptor. */
|
|
gen_helper_gvec_2 *fno;
|
|
/* The opcode, if any, to which this corresponds. */
|
|
TCGOpcode opc;
|
|
/* The vector element size, if applicable. */
|
|
uint8_t vece;
|
|
/* Prefer i64 to v64. */
|
|
bool prefer_i64;
|
|
/* Load dest as a 3rd source operand. */
|
|
bool load_dest;
|
|
} GVecGen2i;
|
|
|
|
typedef struct {
|
|
/* Expand inline as a 64-bit or 32-bit integer.
|
|
Only one of these will be non-NULL. */
|
|
void (*fni8)(TCGContext *, TCGv_i64, TCGv_i64);
|
|
void (*fni4)(TCGContext *, TCGv_i32, TCGv_i32);
|
|
/* Expand inline with a host vector type. */
|
|
void (*fniv)(TCGContext *, unsigned, TCGv_vec, TCGv_vec);
|
|
/* Expand out-of-line helper w/descriptor. */
|
|
gen_helper_gvec_2 *fno;
|
|
/* The opcode, if any, to which this corresponds. */
|
|
TCGOpcode opc;
|
|
/* The data argument to the out-of-line helper. */
|
|
int32_t data;
|
|
/* The vector element size, if applicable. */
|
|
uint8_t vece;
|
|
/* Prefer i64 to v64. */
|
|
bool prefer_i64;
|
|
} GVecGen2;
|
|
|
|
typedef struct {
|
|
/* Expand inline as a 64-bit or 32-bit integer.
|
|
Only one of these will be non-NULL. */
|
|
void (*fni8)(TCGContext *, TCGv_i64, TCGv_i64, TCGv_i64);
|
|
void (*fni4)(TCGContext *, TCGv_i32, TCGv_i32, TCGv_i32);
|
|
/* Expand inline with a host vector type. */
|
|
void (*fniv)(TCGContext *, unsigned, TCGv_vec, TCGv_vec, TCGv_vec);
|
|
/* Expand out-of-line helper w/descriptor. */
|
|
gen_helper_gvec_3 *fno;
|
|
/* The opcode, if any, to which this corresponds. */
|
|
TCGOpcode opc;
|
|
/* The data argument to the out-of-line helper. */
|
|
int32_t data;
|
|
/* The vector element size, if applicable. */
|
|
uint8_t vece;
|
|
/* Prefer i64 to v64. */
|
|
bool prefer_i64;
|
|
/* Load dest as a 3rd source operand. */
|
|
bool load_dest;
|
|
} GVecGen3;
|
|
|
|
typedef struct {
|
|
/* Expand inline as a 64-bit or 32-bit integer.
|
|
Only one of these will be non-NULL. */
|
|
void (*fni8)(TCGContext *s, TCGv_i64, TCGv_i64, TCGv_i64, TCGv_i64);
|
|
void (*fni4)(TCGContext *s, TCGv_i32, TCGv_i32, TCGv_i32, TCGv_i32);
|
|
/* Expand inline with a host vector type. */
|
|
void (*fniv)(TCGContext *s, unsigned, TCGv_vec, TCGv_vec, TCGv_vec, TCGv_vec);
|
|
/* Expand out-of-line helper w/descriptor. */
|
|
gen_helper_gvec_4 *fno;
|
|
/* The opcode, if any, to which this corresponds. */
|
|
TCGOpcode opc;
|
|
/* The data argument to the out-of-line helper. */
|
|
int32_t data;
|
|
/* The vector element size, if applicable. */
|
|
uint8_t vece;
|
|
/* Prefer i64 to v64. */
|
|
bool prefer_i64;
|
|
} GVecGen4;
|
|
|
|
void tcg_gen_gvec_2(TCGContext *, uint32_t dofs, uint32_t aofs,
|
|
uint32_t oprsz, uint32_t maxsz, const GVecGen2 *);
|
|
void tcg_gen_gvec_2i(TCGContext *, uint32_t dofs, uint32_t aofs, uint32_t oprsz,
|
|
uint32_t maxsz, int64_t c, const GVecGen2i *);
|
|
void tcg_gen_gvec_3(TCGContext *, uint32_t dofs, uint32_t aofs, uint32_t bofs,
|
|
uint32_t oprsz, uint32_t maxsz, const GVecGen3 *);
|
|
void tcg_gen_gvec_4(TCGContext *, uint32_t dofs, uint32_t aofs, uint32_t bofs, uint32_t cofs,
|
|
uint32_t oprsz, uint32_t maxsz, const GVecGen4 *);
|
|
|
|
/* Expand a specific vector operation. */
|
|
|
|
void tcg_gen_gvec_mov(TCGContext *, unsigned vece, uint32_t dofs, uint32_t aofs,
|
|
uint32_t oprsz, uint32_t maxsz);
|
|
void tcg_gen_gvec_not(TCGContext *, unsigned vece, uint32_t dofs, uint32_t aofs,
|
|
uint32_t oprsz, uint32_t maxsz);
|
|
void tcg_gen_gvec_neg(TCGContext *, unsigned vece, uint32_t dofs, uint32_t aofs,
|
|
uint32_t oprsz, uint32_t maxsz);
|
|
|
|
void tcg_gen_gvec_add(TCGContext *, unsigned vece, uint32_t dofs, uint32_t aofs,
|
|
uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
|
|
void tcg_gen_gvec_sub(TCGContext *, unsigned vece, uint32_t dofs, uint32_t aofs,
|
|
uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
|
|
void tcg_gen_gvec_mul(TCGContext *, unsigned vece, uint32_t dofs, uint32_t aofs,
|
|
uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
|
|
|
|
/* Saturated arithmetic. */
|
|
void tcg_gen_gvec_ssadd(TCGContext *s, unsigned vece, uint32_t dofs, uint32_t aofs,
|
|
uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
|
|
void tcg_gen_gvec_sssub(TCGContext *s, unsigned vece, uint32_t dofs, uint32_t aofs,
|
|
uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
|
|
void tcg_gen_gvec_usadd(TCGContext *s, unsigned vece, uint32_t dofs, uint32_t aofs,
|
|
uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
|
|
void tcg_gen_gvec_ussub(TCGContext *s, unsigned vece, uint32_t dofs, uint32_t aofs,
|
|
uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
|
|
|
|
void tcg_gen_gvec_and(TCGContext *, unsigned vece, uint32_t dofs, uint32_t aofs,
|
|
uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
|
|
void tcg_gen_gvec_or(TCGContext *, unsigned vece, uint32_t dofs, uint32_t aofs,
|
|
uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
|
|
void tcg_gen_gvec_xor(TCGContext *, unsigned vece, uint32_t dofs, uint32_t aofs,
|
|
uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
|
|
void tcg_gen_gvec_andc(TCGContext *, unsigned vece, uint32_t dofs, uint32_t aofs,
|
|
uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
|
|
void tcg_gen_gvec_orc(TCGContext *, unsigned vece, uint32_t dofs, uint32_t aofs,
|
|
uint32_t bofs, uint32_t oprsz, uint32_t maxsz);
|
|
|
|
void tcg_gen_gvec_dup_mem(TCGContext *, unsigned vece, uint32_t dofs, uint32_t aofs,
|
|
uint32_t s, uint32_t m);
|
|
void tcg_gen_gvec_dup_i32(TCGContext *, unsigned vece, uint32_t dofs, uint32_t s,
|
|
uint32_t m, TCGv_i32);
|
|
void tcg_gen_gvec_dup_i64(TCGContext *, unsigned vece, uint32_t dofs, uint32_t s,
|
|
uint32_t m, TCGv_i64);
|
|
|
|
void tcg_gen_gvec_shli(TCGContext *s, unsigned vece, uint32_t dofs, uint32_t aofs,
|
|
int64_t shift, uint32_t oprsz, uint32_t maxsz);
|
|
void tcg_gen_gvec_shri(TCGContext *s, unsigned vece, uint32_t dofs, uint32_t aofs,
|
|
int64_t shift, uint32_t oprsz, uint32_t maxsz);
|
|
void tcg_gen_gvec_sari(TCGContext *s, unsigned vece, uint32_t dofs, uint32_t aofs,
|
|
int64_t shift, uint32_t oprsz, uint32_t maxsz);
|
|
|
|
void tcg_gen_gvec_cmp(TCGContext *s, TCGCond cond, unsigned vece, uint32_t dofs,
|
|
uint32_t aofs, uint32_t bofs,
|
|
uint32_t oprsz, uint32_t maxsz);
|
|
|
|
void tcg_gen_gvec_dup8i(TCGContext *, uint32_t dofs, uint32_t s, uint32_t m, uint8_t x);
|
|
void tcg_gen_gvec_dup16i(TCGContext *, uint32_t dofs, uint32_t s, uint32_t m, uint16_t x);
|
|
void tcg_gen_gvec_dup32i(TCGContext *, uint32_t dofs, uint32_t s, uint32_t m, uint32_t x);
|
|
void tcg_gen_gvec_dup64i(TCGContext *, uint32_t dofs, uint32_t s, uint32_t m, uint64_t x);
|
|
|
|
/*
|
|
* 64-bit vector operations. Use these when the register has been allocated
|
|
* with tcg_global_mem_new_i64, and so we cannot also address it via pointer.
|
|
* OPRSZ = MAXSZ = 8.
|
|
*/
|
|
|
|
void tcg_gen_vec_neg8_i64(TCGContext *, TCGv_i64 d, TCGv_i64 a);
|
|
void tcg_gen_vec_neg16_i64(TCGContext *, TCGv_i64 d, TCGv_i64 a);
|
|
void tcg_gen_vec_neg32_i64(TCGContext *, TCGv_i64 d, TCGv_i64 a);
|
|
|
|
void tcg_gen_vec_add8_i64(TCGContext *, TCGv_i64 d, TCGv_i64 a, TCGv_i64 b);
|
|
void tcg_gen_vec_add16_i64(TCGContext *, TCGv_i64 d, TCGv_i64 a, TCGv_i64 b);
|
|
void tcg_gen_vec_add32_i64(TCGContext *, TCGv_i64 d, TCGv_i64 a, TCGv_i64 b);
|
|
|
|
void tcg_gen_vec_sub8_i64(TCGContext *, TCGv_i64 d, TCGv_i64 a, TCGv_i64 b);
|
|
void tcg_gen_vec_sub16_i64(TCGContext *, TCGv_i64 d, TCGv_i64 a, TCGv_i64 b);
|
|
void tcg_gen_vec_sub32_i64(TCGContext *, TCGv_i64 d, TCGv_i64 a, TCGv_i64 b);
|
|
|
|
void tcg_gen_vec_shl8i_i64(TCGContext *, TCGv_i64 d, TCGv_i64 a, int64_t);
|
|
void tcg_gen_vec_shl16i_i64(TCGContext *, TCGv_i64 d, TCGv_i64 a, int64_t);
|
|
void tcg_gen_vec_shr8i_i64(TCGContext *, TCGv_i64 d, TCGv_i64 a, int64_t);
|
|
void tcg_gen_vec_shr16i_i64(TCGContext *, TCGv_i64 d, TCGv_i64 a, int64_t);
|
|
void tcg_gen_vec_sar8i_i64(TCGContext *, TCGv_i64 d, TCGv_i64 a, int64_t);
|
|
void tcg_gen_vec_sar16i_i64(TCGContext *, TCGv_i64 d, TCGv_i64 a, int64_t);
|