mirror of https://github.com/xemu-project/xemu.git
target/i386: Rework sse_op_table1
Add a flags field to each row in sse_op_table1. Initially this is only used as a replacement for the magic SSE_SPECIAL and SSE_DUMMY pointers, the other flags are mostly relevant for the AVX implementation but can be applied to SSE as well. Signed-off-by: Paul Brook <paul@nowt.org> Message-Id: <20220424220204.2493824-5-paul@nowt.org> Reviewed-by: Richard Henderson <richard.henderson@linaro.org> Signed-off-by: Paolo Bonzini <pbonzini@redhat.com>
This commit is contained in:
parent
36fc7ee299
commit
f2dbc28947
|
@ -2790,146 +2790,193 @@ typedef void (*SSEFunc_0_ppi)(TCGv_ptr reg_a, TCGv_ptr reg_b, TCGv_i32 val);
|
|||
typedef void (*SSEFunc_0_eppt)(TCGv_ptr env, TCGv_ptr reg_a, TCGv_ptr reg_b,
|
||||
TCGv val);
|
||||
|
||||
#define SSE_SPECIAL ((void *)1)
|
||||
#define SSE_DUMMY ((void *)2)
|
||||
#define SSE_OPF_CMP (1 << 1) /* does not write for first operand */
|
||||
#define SSE_OPF_SPECIAL (1 << 3) /* magic */
|
||||
#define SSE_OPF_3DNOW (1 << 4) /* 3DNow! instruction */
|
||||
#define SSE_OPF_MMX (1 << 5) /* MMX/integer/AVX2 instruction */
|
||||
#define SSE_OPF_SCALAR (1 << 6) /* Has SSE scalar variants */
|
||||
#define SSE_OPF_SHUF (1 << 9) /* pshufx/shufpx */
|
||||
|
||||
#define MMX_OP2(x) { gen_helper_ ## x ## _mmx, gen_helper_ ## x ## _xmm }
|
||||
#define SSE_FOP(x) { gen_helper_ ## x ## ps, gen_helper_ ## x ## pd, \
|
||||
gen_helper_ ## x ## ss, gen_helper_ ## x ## sd, }
|
||||
#define OP(op, flags, a, b, c, d) \
|
||||
{flags, {a, b, c, d} }
|
||||
|
||||
static const SSEFunc_0_epp sse_op_table1[256][4] = {
|
||||
#define MMX_OP(x) OP(op1, SSE_OPF_MMX, \
|
||||
gen_helper_ ## x ## _mmx, gen_helper_ ## x ## _xmm, NULL, NULL)
|
||||
|
||||
#define SSE_FOP(name) OP(op1, SSE_OPF_SCALAR, \
|
||||
gen_helper_##name##ps, gen_helper_##name##pd, \
|
||||
gen_helper_##name##ss, gen_helper_##name##sd)
|
||||
#define SSE_OP(sname, dname, op, flags) OP(op, flags, \
|
||||
gen_helper_##sname##_xmm, gen_helper_##dname##_xmm, NULL, NULL)
|
||||
|
||||
struct SSEOpHelper_table1 {
|
||||
int flags;
|
||||
SSEFunc_0_epp op[4];
|
||||
};
|
||||
|
||||
#define SSE_3DNOW { SSE_OPF_3DNOW }
|
||||
#define SSE_SPECIAL { SSE_OPF_SPECIAL }
|
||||
|
||||
static const struct SSEOpHelper_table1 sse_op_table1[256] = {
|
||||
/* 3DNow! extensions */
|
||||
[0x0e] = { SSE_DUMMY }, /* femms */
|
||||
[0x0f] = { SSE_DUMMY }, /* pf... */
|
||||
[0x0e] = SSE_SPECIAL, /* femms */
|
||||
[0x0f] = SSE_3DNOW, /* pf... (sse_op_table5) */
|
||||
/* pure SSE operations */
|
||||
[0x10] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movups, movupd, movss, movsd */
|
||||
[0x11] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movups, movupd, movss, movsd */
|
||||
[0x12] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movlps, movlpd, movsldup, movddup */
|
||||
[0x13] = { SSE_SPECIAL, SSE_SPECIAL }, /* movlps, movlpd */
|
||||
[0x14] = { gen_helper_punpckldq_xmm, gen_helper_punpcklqdq_xmm },
|
||||
[0x15] = { gen_helper_punpckhdq_xmm, gen_helper_punpckhqdq_xmm },
|
||||
[0x16] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movhps, movhpd, movshdup */
|
||||
[0x17] = { SSE_SPECIAL, SSE_SPECIAL }, /* movhps, movhpd */
|
||||
[0x10] = SSE_SPECIAL, /* movups, movupd, movss, movsd */
|
||||
[0x11] = SSE_SPECIAL, /* movups, movupd, movss, movsd */
|
||||
[0x12] = SSE_SPECIAL, /* movlps, movlpd, movsldup, movddup */
|
||||
[0x13] = SSE_SPECIAL, /* movlps, movlpd */
|
||||
[0x14] = SSE_OP(punpckldq, punpcklqdq, op1, 0), /* unpcklps, unpcklpd */
|
||||
[0x15] = SSE_OP(punpckhdq, punpckhqdq, op1, 0), /* unpckhps, unpckhpd */
|
||||
[0x16] = SSE_SPECIAL, /* movhps, movhpd, movshdup */
|
||||
[0x17] = SSE_SPECIAL, /* movhps, movhpd */
|
||||
|
||||
[0x28] = { SSE_SPECIAL, SSE_SPECIAL }, /* movaps, movapd */
|
||||
[0x29] = { SSE_SPECIAL, SSE_SPECIAL }, /* movaps, movapd */
|
||||
[0x2a] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* cvtpi2ps, cvtpi2pd, cvtsi2ss, cvtsi2sd */
|
||||
[0x2b] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movntps, movntpd, movntss, movntsd */
|
||||
[0x2c] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* cvttps2pi, cvttpd2pi, cvttsd2si, cvttss2si */
|
||||
[0x2d] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* cvtps2pi, cvtpd2pi, cvtsd2si, cvtss2si */
|
||||
[0x2e] = { gen_helper_ucomiss, gen_helper_ucomisd },
|
||||
[0x2f] = { gen_helper_comiss, gen_helper_comisd },
|
||||
[0x50] = { SSE_SPECIAL, SSE_SPECIAL }, /* movmskps, movmskpd */
|
||||
[0x51] = SSE_FOP(sqrt),
|
||||
[0x52] = { gen_helper_rsqrtps, NULL, gen_helper_rsqrtss, NULL },
|
||||
[0x53] = { gen_helper_rcpps, NULL, gen_helper_rcpss, NULL },
|
||||
[0x54] = { gen_helper_pand_xmm, gen_helper_pand_xmm }, /* andps, andpd */
|
||||
[0x55] = { gen_helper_pandn_xmm, gen_helper_pandn_xmm }, /* andnps, andnpd */
|
||||
[0x56] = { gen_helper_por_xmm, gen_helper_por_xmm }, /* orps, orpd */
|
||||
[0x57] = { gen_helper_pxor_xmm, gen_helper_pxor_xmm }, /* xorps, xorpd */
|
||||
[0x28] = SSE_SPECIAL, /* movaps, movapd */
|
||||
[0x29] = SSE_SPECIAL, /* movaps, movapd */
|
||||
[0x2a] = SSE_SPECIAL, /* cvtpi2ps, cvtpi2pd, cvtsi2ss, cvtsi2sd */
|
||||
[0x2b] = SSE_SPECIAL, /* movntps, movntpd, movntss, movntsd */
|
||||
[0x2c] = SSE_SPECIAL, /* cvttps2pi, cvttpd2pi, cvttsd2si, cvttss2si */
|
||||
[0x2d] = SSE_SPECIAL, /* cvtps2pi, cvtpd2pi, cvtsd2si, cvtss2si */
|
||||
[0x2e] = OP(op1, SSE_OPF_CMP | SSE_OPF_SCALAR,
|
||||
gen_helper_ucomiss, gen_helper_ucomisd, NULL, NULL),
|
||||
[0x2f] = OP(op1, SSE_OPF_CMP | SSE_OPF_SCALAR,
|
||||
gen_helper_comiss, gen_helper_comisd, NULL, NULL),
|
||||
[0x50] = SSE_SPECIAL, /* movmskps, movmskpd */
|
||||
[0x51] = OP(op1, SSE_OPF_SCALAR,
|
||||
gen_helper_sqrtps, gen_helper_sqrtpd,
|
||||
gen_helper_sqrtss, gen_helper_sqrtsd),
|
||||
[0x52] = OP(op1, SSE_OPF_SCALAR,
|
||||
gen_helper_rsqrtps, NULL, gen_helper_rsqrtss, NULL),
|
||||
[0x53] = OP(op1, SSE_OPF_SCALAR,
|
||||
gen_helper_rcpps, NULL, gen_helper_rcpss, NULL),
|
||||
[0x54] = SSE_OP(pand, pand, op1, 0), /* andps, andpd */
|
||||
[0x55] = SSE_OP(pandn, pandn, op1, 0), /* andnps, andnpd */
|
||||
[0x56] = SSE_OP(por, por, op1, 0), /* orps, orpd */
|
||||
[0x57] = SSE_OP(pxor, pxor, op1, 0), /* xorps, xorpd */
|
||||
[0x58] = SSE_FOP(add),
|
||||
[0x59] = SSE_FOP(mul),
|
||||
[0x5a] = { gen_helper_cvtps2pd, gen_helper_cvtpd2ps,
|
||||
gen_helper_cvtss2sd, gen_helper_cvtsd2ss },
|
||||
[0x5b] = { gen_helper_cvtdq2ps, gen_helper_cvtps2dq, gen_helper_cvttps2dq },
|
||||
[0x5a] = OP(op1, SSE_OPF_SCALAR,
|
||||
gen_helper_cvtps2pd, gen_helper_cvtpd2ps,
|
||||
gen_helper_cvtss2sd, gen_helper_cvtsd2ss),
|
||||
[0x5b] = OP(op1, 0,
|
||||
gen_helper_cvtdq2ps, gen_helper_cvtps2dq,
|
||||
gen_helper_cvttps2dq, NULL),
|
||||
[0x5c] = SSE_FOP(sub),
|
||||
[0x5d] = SSE_FOP(min),
|
||||
[0x5e] = SSE_FOP(div),
|
||||
[0x5f] = SSE_FOP(max),
|
||||
|
||||
[0xc2] = SSE_FOP(cmpeq),
|
||||
[0xc6] = { (SSEFunc_0_epp)gen_helper_shufps,
|
||||
(SSEFunc_0_epp)gen_helper_shufpd }, /* XXX: casts */
|
||||
[0xc2] = SSE_FOP(cmpeq), /* sse_op_table4 */
|
||||
[0xc6] = OP(dummy, SSE_OPF_SHUF, (SSEFunc_0_epp)gen_helper_shufps,
|
||||
(SSEFunc_0_epp)gen_helper_shufpd, NULL, NULL),
|
||||
|
||||
/* SSSE3, SSE4, MOVBE, CRC32, BMI1, BMI2, ADX. */
|
||||
[0x38] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL },
|
||||
[0x3a] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL },
|
||||
[0x38] = SSE_SPECIAL,
|
||||
[0x3a] = SSE_SPECIAL,
|
||||
|
||||
/* MMX ops and their SSE extensions */
|
||||
[0x60] = MMX_OP2(punpcklbw),
|
||||
[0x61] = MMX_OP2(punpcklwd),
|
||||
[0x62] = MMX_OP2(punpckldq),
|
||||
[0x63] = MMX_OP2(packsswb),
|
||||
[0x64] = MMX_OP2(pcmpgtb),
|
||||
[0x65] = MMX_OP2(pcmpgtw),
|
||||
[0x66] = MMX_OP2(pcmpgtl),
|
||||
[0x67] = MMX_OP2(packuswb),
|
||||
[0x68] = MMX_OP2(punpckhbw),
|
||||
[0x69] = MMX_OP2(punpckhwd),
|
||||
[0x6a] = MMX_OP2(punpckhdq),
|
||||
[0x6b] = MMX_OP2(packssdw),
|
||||
[0x6c] = { NULL, gen_helper_punpcklqdq_xmm },
|
||||
[0x6d] = { NULL, gen_helper_punpckhqdq_xmm },
|
||||
[0x6e] = { SSE_SPECIAL, SSE_SPECIAL }, /* movd mm, ea */
|
||||
[0x6f] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movq, movdqa, , movqdu */
|
||||
[0x70] = { (SSEFunc_0_epp)gen_helper_pshufw_mmx,
|
||||
(SSEFunc_0_epp)gen_helper_pshufd_xmm,
|
||||
(SSEFunc_0_epp)gen_helper_pshufhw_xmm,
|
||||
(SSEFunc_0_epp)gen_helper_pshuflw_xmm }, /* XXX: casts */
|
||||
[0x71] = { SSE_SPECIAL, SSE_SPECIAL }, /* shiftw */
|
||||
[0x72] = { SSE_SPECIAL, SSE_SPECIAL }, /* shiftd */
|
||||
[0x73] = { SSE_SPECIAL, SSE_SPECIAL }, /* shiftq */
|
||||
[0x74] = MMX_OP2(pcmpeqb),
|
||||
[0x75] = MMX_OP2(pcmpeqw),
|
||||
[0x76] = MMX_OP2(pcmpeql),
|
||||
[0x77] = { SSE_DUMMY }, /* emms */
|
||||
[0x78] = { NULL, SSE_SPECIAL, NULL, SSE_SPECIAL }, /* extrq_i, insertq_i */
|
||||
[0x79] = { NULL, gen_helper_extrq_r, NULL, gen_helper_insertq_r },
|
||||
[0x7c] = { NULL, gen_helper_haddpd, NULL, gen_helper_haddps },
|
||||
[0x7d] = { NULL, gen_helper_hsubpd, NULL, gen_helper_hsubps },
|
||||
[0x7e] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movd, movd, , movq */
|
||||
[0x7f] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movq, movdqa, movdqu */
|
||||
[0xc4] = { SSE_SPECIAL, SSE_SPECIAL }, /* pinsrw */
|
||||
[0xc5] = { SSE_SPECIAL, SSE_SPECIAL }, /* pextrw */
|
||||
[0xd0] = { NULL, gen_helper_addsubpd, NULL, gen_helper_addsubps },
|
||||
[0xd1] = MMX_OP2(psrlw),
|
||||
[0xd2] = MMX_OP2(psrld),
|
||||
[0xd3] = MMX_OP2(psrlq),
|
||||
[0xd4] = MMX_OP2(paddq),
|
||||
[0xd5] = MMX_OP2(pmullw),
|
||||
[0xd6] = { NULL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL },
|
||||
[0xd7] = { SSE_SPECIAL, SSE_SPECIAL }, /* pmovmskb */
|
||||
[0xd8] = MMX_OP2(psubusb),
|
||||
[0xd9] = MMX_OP2(psubusw),
|
||||
[0xda] = MMX_OP2(pminub),
|
||||
[0xdb] = MMX_OP2(pand),
|
||||
[0xdc] = MMX_OP2(paddusb),
|
||||
[0xdd] = MMX_OP2(paddusw),
|
||||
[0xde] = MMX_OP2(pmaxub),
|
||||
[0xdf] = MMX_OP2(pandn),
|
||||
[0xe0] = MMX_OP2(pavgb),
|
||||
[0xe1] = MMX_OP2(psraw),
|
||||
[0xe2] = MMX_OP2(psrad),
|
||||
[0xe3] = MMX_OP2(pavgw),
|
||||
[0xe4] = MMX_OP2(pmulhuw),
|
||||
[0xe5] = MMX_OP2(pmulhw),
|
||||
[0xe6] = { NULL, gen_helper_cvttpd2dq, gen_helper_cvtdq2pd, gen_helper_cvtpd2dq },
|
||||
[0xe7] = { SSE_SPECIAL , SSE_SPECIAL }, /* movntq, movntq */
|
||||
[0xe8] = MMX_OP2(psubsb),
|
||||
[0xe9] = MMX_OP2(psubsw),
|
||||
[0xea] = MMX_OP2(pminsw),
|
||||
[0xeb] = MMX_OP2(por),
|
||||
[0xec] = MMX_OP2(paddsb),
|
||||
[0xed] = MMX_OP2(paddsw),
|
||||
[0xee] = MMX_OP2(pmaxsw),
|
||||
[0xef] = MMX_OP2(pxor),
|
||||
[0xf0] = { NULL, NULL, NULL, SSE_SPECIAL }, /* lddqu */
|
||||
[0xf1] = MMX_OP2(psllw),
|
||||
[0xf2] = MMX_OP2(pslld),
|
||||
[0xf3] = MMX_OP2(psllq),
|
||||
[0xf4] = MMX_OP2(pmuludq),
|
||||
[0xf5] = MMX_OP2(pmaddwd),
|
||||
[0xf6] = MMX_OP2(psadbw),
|
||||
[0xf7] = { (SSEFunc_0_epp)gen_helper_maskmov_mmx,
|
||||
(SSEFunc_0_epp)gen_helper_maskmov_xmm }, /* XXX: casts */
|
||||
[0xf8] = MMX_OP2(psubb),
|
||||
[0xf9] = MMX_OP2(psubw),
|
||||
[0xfa] = MMX_OP2(psubl),
|
||||
[0xfb] = MMX_OP2(psubq),
|
||||
[0xfc] = MMX_OP2(paddb),
|
||||
[0xfd] = MMX_OP2(paddw),
|
||||
[0xfe] = MMX_OP2(paddl),
|
||||
[0x60] = MMX_OP(punpcklbw),
|
||||
[0x61] = MMX_OP(punpcklwd),
|
||||
[0x62] = MMX_OP(punpckldq),
|
||||
[0x63] = MMX_OP(packsswb),
|
||||
[0x64] = MMX_OP(pcmpgtb),
|
||||
[0x65] = MMX_OP(pcmpgtw),
|
||||
[0x66] = MMX_OP(pcmpgtl),
|
||||
[0x67] = MMX_OP(packuswb),
|
||||
[0x68] = MMX_OP(punpckhbw),
|
||||
[0x69] = MMX_OP(punpckhwd),
|
||||
[0x6a] = MMX_OP(punpckhdq),
|
||||
[0x6b] = MMX_OP(packssdw),
|
||||
[0x6c] = OP(op1, SSE_OPF_MMX,
|
||||
NULL, gen_helper_punpcklqdq_xmm, NULL, NULL),
|
||||
[0x6d] = OP(op1, SSE_OPF_MMX,
|
||||
NULL, gen_helper_punpckhqdq_xmm, NULL, NULL),
|
||||
[0x6e] = SSE_SPECIAL, /* movd mm, ea */
|
||||
[0x6f] = SSE_SPECIAL, /* movq, movdqa, , movqdu */
|
||||
[0x70] = OP(op1i, SSE_OPF_SHUF | SSE_OPF_MMX,
|
||||
(SSEFunc_0_epp)gen_helper_pshufw_mmx,
|
||||
(SSEFunc_0_epp)gen_helper_pshufd_xmm,
|
||||
(SSEFunc_0_epp)gen_helper_pshufhw_xmm,
|
||||
(SSEFunc_0_epp)gen_helper_pshuflw_xmm),
|
||||
[0x71] = SSE_SPECIAL, /* shiftw */
|
||||
[0x72] = SSE_SPECIAL, /* shiftd */
|
||||
[0x73] = SSE_SPECIAL, /* shiftq */
|
||||
[0x74] = MMX_OP(pcmpeqb),
|
||||
[0x75] = MMX_OP(pcmpeqw),
|
||||
[0x76] = MMX_OP(pcmpeql),
|
||||
[0x77] = SSE_SPECIAL, /* emms */
|
||||
[0x78] = SSE_SPECIAL, /* extrq_i, insertq_i (sse4a) */
|
||||
[0x79] = OP(op1, 0,
|
||||
NULL, gen_helper_extrq_r, NULL, gen_helper_insertq_r),
|
||||
[0x7c] = OP(op1, 0,
|
||||
NULL, gen_helper_haddpd, NULL, gen_helper_haddps),
|
||||
[0x7d] = OP(op1, 0,
|
||||
NULL, gen_helper_hsubpd, NULL, gen_helper_hsubps),
|
||||
[0x7e] = SSE_SPECIAL, /* movd, movd, , movq */
|
||||
[0x7f] = SSE_SPECIAL, /* movq, movdqa, movdqu */
|
||||
[0xc4] = SSE_SPECIAL, /* pinsrw */
|
||||
[0xc5] = SSE_SPECIAL, /* pextrw */
|
||||
[0xd0] = OP(op1, 0,
|
||||
NULL, gen_helper_addsubpd, NULL, gen_helper_addsubps),
|
||||
[0xd1] = MMX_OP(psrlw),
|
||||
[0xd2] = MMX_OP(psrld),
|
||||
[0xd3] = MMX_OP(psrlq),
|
||||
[0xd4] = MMX_OP(paddq),
|
||||
[0xd5] = MMX_OP(pmullw),
|
||||
[0xd6] = SSE_SPECIAL,
|
||||
[0xd7] = SSE_SPECIAL, /* pmovmskb */
|
||||
[0xd8] = MMX_OP(psubusb),
|
||||
[0xd9] = MMX_OP(psubusw),
|
||||
[0xda] = MMX_OP(pminub),
|
||||
[0xdb] = MMX_OP(pand),
|
||||
[0xdc] = MMX_OP(paddusb),
|
||||
[0xdd] = MMX_OP(paddusw),
|
||||
[0xde] = MMX_OP(pmaxub),
|
||||
[0xdf] = MMX_OP(pandn),
|
||||
[0xe0] = MMX_OP(pavgb),
|
||||
[0xe1] = MMX_OP(psraw),
|
||||
[0xe2] = MMX_OP(psrad),
|
||||
[0xe3] = MMX_OP(pavgw),
|
||||
[0xe4] = MMX_OP(pmulhuw),
|
||||
[0xe5] = MMX_OP(pmulhw),
|
||||
[0xe6] = OP(op1, 0,
|
||||
NULL, gen_helper_cvttpd2dq,
|
||||
gen_helper_cvtdq2pd, gen_helper_cvtpd2dq),
|
||||
[0xe7] = SSE_SPECIAL, /* movntq, movntq */
|
||||
[0xe8] = MMX_OP(psubsb),
|
||||
[0xe9] = MMX_OP(psubsw),
|
||||
[0xea] = MMX_OP(pminsw),
|
||||
[0xeb] = MMX_OP(por),
|
||||
[0xec] = MMX_OP(paddsb),
|
||||
[0xed] = MMX_OP(paddsw),
|
||||
[0xee] = MMX_OP(pmaxsw),
|
||||
[0xef] = MMX_OP(pxor),
|
||||
[0xf0] = SSE_SPECIAL, /* lddqu */
|
||||
[0xf1] = MMX_OP(psllw),
|
||||
[0xf2] = MMX_OP(pslld),
|
||||
[0xf3] = MMX_OP(psllq),
|
||||
[0xf4] = MMX_OP(pmuludq),
|
||||
[0xf5] = MMX_OP(pmaddwd),
|
||||
[0xf6] = MMX_OP(psadbw),
|
||||
[0xf7] = OP(op1t, SSE_OPF_MMX,
|
||||
(SSEFunc_0_epp)gen_helper_maskmov_mmx,
|
||||
(SSEFunc_0_epp)gen_helper_maskmov_xmm, NULL, NULL),
|
||||
[0xf8] = MMX_OP(psubb),
|
||||
[0xf9] = MMX_OP(psubw),
|
||||
[0xfa] = MMX_OP(psubl),
|
||||
[0xfb] = MMX_OP(psubq),
|
||||
[0xfc] = MMX_OP(paddb),
|
||||
[0xfd] = MMX_OP(paddw),
|
||||
[0xfe] = MMX_OP(paddl),
|
||||
};
|
||||
#undef MMX_OP
|
||||
#undef OP
|
||||
#undef SSE_FOP
|
||||
#undef SSE_OP
|
||||
#undef SSE_SPECIAL
|
||||
|
||||
#define MMX_OP2(x) { gen_helper_ ## x ## _mmx, gen_helper_ ## x ## _xmm }
|
||||
#define SSE_SPECIAL_FN ((void *)1)
|
||||
|
||||
static const SSEFunc_0_epp sse_op_table2[3 * 8][2] = {
|
||||
[0 + 2] = MMX_OP2(psrlw),
|
||||
|
@ -2972,6 +3019,8 @@ static const SSEFunc_l_ep sse_op_table3bq[] = {
|
|||
};
|
||||
#endif
|
||||
|
||||
#define SSE_FOP(x) { gen_helper_ ## x ## ps, gen_helper_ ## x ## pd, \
|
||||
gen_helper_ ## x ## ss, gen_helper_ ## x ## sd, }
|
||||
static const SSEFunc_0_epp sse_op_table4[8][4] = {
|
||||
SSE_FOP(cmpeq),
|
||||
SSE_FOP(cmplt),
|
||||
|
@ -2982,6 +3031,7 @@ static const SSEFunc_0_epp sse_op_table4[8][4] = {
|
|||
SSE_FOP(cmpnle),
|
||||
SSE_FOP(cmpord),
|
||||
};
|
||||
#undef SSE_FOP
|
||||
|
||||
static const SSEFunc_0_epp sse_op_table5[256] = {
|
||||
[0x0c] = gen_helper_pi2fw,
|
||||
|
@ -3023,7 +3073,7 @@ struct SSEOpHelper_eppi {
|
|||
#define SSSE3_OP(x) { MMX_OP2(x), CPUID_EXT_SSSE3 }
|
||||
#define SSE41_OP(x) { { NULL, gen_helper_ ## x ## _xmm }, CPUID_EXT_SSE41 }
|
||||
#define SSE42_OP(x) { { NULL, gen_helper_ ## x ## _xmm }, CPUID_EXT_SSE42 }
|
||||
#define SSE41_SPECIAL { { NULL, SSE_SPECIAL }, CPUID_EXT_SSE41 }
|
||||
#define SSE41_SPECIAL { { NULL, SSE_SPECIAL_FN }, CPUID_EXT_SSE41 }
|
||||
#define PCLMULQDQ_OP(x) { { NULL, gen_helper_ ## x ## _xmm }, \
|
||||
CPUID_EXT_PCLMULQDQ }
|
||||
#define AESNI_OP(x) { { NULL, gen_helper_ ## x ## _xmm }, CPUID_EXT_AES }
|
||||
|
@ -3114,6 +3164,7 @@ static void gen_sse(CPUX86State *env, DisasContext *s, int b,
|
|||
{
|
||||
int b1, op1_offset, op2_offset, is_xmm, val;
|
||||
int modrm, mod, rm, reg;
|
||||
int sse_op_flags;
|
||||
SSEFunc_0_epp sse_fn_epp;
|
||||
SSEFunc_0_eppi sse_fn_eppi;
|
||||
SSEFunc_0_ppi sse_fn_ppi;
|
||||
|
@ -3129,8 +3180,10 @@ static void gen_sse(CPUX86State *env, DisasContext *s, int b,
|
|||
b1 = 3;
|
||||
else
|
||||
b1 = 0;
|
||||
sse_fn_epp = sse_op_table1[b][b1];
|
||||
if (!sse_fn_epp) {
|
||||
sse_op_flags = sse_op_table1[b].flags;
|
||||
sse_fn_epp = sse_op_table1[b].op[b1];
|
||||
if ((sse_op_flags & (SSE_OPF_SPECIAL | SSE_OPF_3DNOW)) == 0
|
||||
&& !sse_fn_epp) {
|
||||
goto unknown_op;
|
||||
}
|
||||
if ((b <= 0x5f && b >= 0x10) || b == 0xc6 || b == 0xc2) {
|
||||
|
@ -3184,7 +3237,7 @@ static void gen_sse(CPUX86State *env, DisasContext *s, int b,
|
|||
reg |= REX_R(s);
|
||||
}
|
||||
mod = (modrm >> 6) & 3;
|
||||
if (sse_fn_epp == SSE_SPECIAL) {
|
||||
if (sse_op_flags & SSE_OPF_SPECIAL) {
|
||||
b |= (b1 << 8);
|
||||
switch(b) {
|
||||
case 0x0e7: /* movntq */
|
||||
|
@ -3819,7 +3872,7 @@ static void gen_sse(CPUX86State *env, DisasContext *s, int b,
|
|||
gen_ldq_env_A0(s, op2_offset);
|
||||
}
|
||||
}
|
||||
if (sse_fn_epp == SSE_SPECIAL) {
|
||||
if (sse_fn_epp == SSE_SPECIAL_FN) {
|
||||
goto unknown_op;
|
||||
}
|
||||
|
||||
|
@ -4205,7 +4258,7 @@ static void gen_sse(CPUX86State *env, DisasContext *s, int b,
|
|||
|
||||
s->rip_offset = 1;
|
||||
|
||||
if (sse_fn_eppi == SSE_SPECIAL) {
|
||||
if (sse_fn_eppi == SSE_SPECIAL_FN) {
|
||||
ot = mo_64_32(s->dflag);
|
||||
rm = (modrm & 7) | REX_B(s);
|
||||
if (mod != 3)
|
||||
|
|
Loading…
Reference in New Issue