From 91ebfd1b3c9df291031858663ee945eed0bce998 Mon Sep 17 00:00:00 2001 From: Peter Johnson Date: Thu, 5 Feb 2004 03:40:16 +0000 Subject: [PATCH] Fix SIMD VR/PR instruction encoding for the following instructions: - PEXTRW - MOVMSKPD - MOVMSKPS - PMOVMSKB Reported by: Vivek Mohan Also, while we're here, fix all CVT* SIMD instructions; they were variously incorrect (mostly with regards to accepted operands). New testcase, simd-2, tests all the above (output verified with GNU objdump). svn path=/trunk/yasm/; revision=1093 --- modules/arch/x86/tests/Makefile.inc | 3 + modules/arch/x86/tests/simd-2.asm | 104 ++++++ modules/arch/x86/tests/simd-2.errwarn | 0 modules/arch/x86/tests/simd-2.hex | 474 ++++++++++++++++++++++++++ modules/arch/x86/x86id.re | 116 +++++-- 5 files changed, 673 insertions(+), 24 deletions(-) create mode 100644 modules/arch/x86/tests/simd-2.asm create mode 100644 modules/arch/x86/tests/simd-2.errwarn create mode 100644 modules/arch/x86/tests/simd-2.hex diff --git a/modules/arch/x86/tests/Makefile.inc b/modules/arch/x86/tests/Makefile.inc index 073cafee..8a423108 100644 --- a/modules/arch/x86/tests/Makefile.inc +++ b/modules/arch/x86/tests/Makefile.inc @@ -110,6 +110,9 @@ EXTRA_DIST += modules/arch/x86/tests/shift.hex EXTRA_DIST += modules/arch/x86/tests/simd-1.asm EXTRA_DIST += modules/arch/x86/tests/simd-1.errwarn EXTRA_DIST += modules/arch/x86/tests/simd-1.hex +EXTRA_DIST += modules/arch/x86/tests/simd-2.asm +EXTRA_DIST += modules/arch/x86/tests/simd-2.errwarn +EXTRA_DIST += modules/arch/x86/tests/simd-2.hex EXTRA_DIST += modules/arch/x86/tests/stos.asm EXTRA_DIST += modules/arch/x86/tests/stos.errwarn EXTRA_DIST += modules/arch/x86/tests/stos.hex diff --git a/modules/arch/x86/tests/simd-2.asm b/modules/arch/x86/tests/simd-2.asm new file mode 100644 index 00000000..a3a351aa --- /dev/null +++ b/modules/arch/x86/tests/simd-2.asm @@ -0,0 +1,104 @@ +[bits 32] +pextrw ebx, mm5, 0 ; 0F C5 DD 00 +pextrw ecx, xmm0, 1 ; 66 0F C5 C8 01 + +pinsrw mm3, esi, 5 ; 0F C4 DE 05 +pinsrw mm3, [0], 4 ; 0F C4 1D 00 00 00 00 04 + +pinsrw xmm1, eax, 3 ; 66 0F C4 C8 03 +pinsrw xmm1, [0], 2 ; 66 0F C4 0D 00 00 00 00 02 + +movmskpd edx, xmm7 ; 66 0F 50 D7 +movmskps eax, xmm1 ; 0F 50 C1 + +pmovmskb edi, mm0 ; 0F D7 F8 +pmovmskb esi, xmm1 ; 66 0F D7 F1 + +cvtdq2pd xmm5, xmm4 ; F3 0F E6 EC +cvtdq2pd xmm3, [0] ; F3 0F E6 1D 00 00 00 00 +cvtdq2pd xmm2, qword [0] ; F3 0F E6 15 00 00 00 00 + +cvtdq2ps xmm1, xmm2 ; 0F 5B CA +cvtdq2ps xmm4, [0] ; 0F 5B 25 00 00 00 00 +cvtdq2ps xmm5, dqword [0] ; 0F 5B 2D 00 00 00 00 + +cvtpd2dq xmm0, xmm1 ; F2 0F E6 C1 +cvtpd2dq xmm2, [0] ; F2 0F E6 15 00 00 00 00 +cvtpd2dq xmm3, dqword [0] ; F2 0F E6 1D 00 00 00 00 + +cvtpd2pi mm4, xmm5 ; 66 0F 2D E5 +cvtpd2pi mm6, [0] ; 66 0F 2D 35 00 00 00 00 +cvtpd2pi mm7, dqword [0] ; 66 0F 2D 3D 00 00 00 00 + +cvtpd2ps xmm1, xmm2 ; 66 0F 5A CA +cvtpd2ps xmm3, [0] ; 66 0F 5A 1D 00 00 00 00 +cvtpd2ps xmm4, dqword [0] ; 66 0F 5A 25 00 00 00 00 + +cvtpi2pd xmm5, mm6 ; 66 0F 2A EE +cvtpi2pd xmm7, [0] ; 66 0F 2A 3D 00 00 00 00 +cvtpi2pd xmm0, qword [0] ; 66 0F 2A 05 00 00 00 00 + +cvtpi2ps xmm2, mm3 ; 0F 2A D3 +cvtpi2ps xmm4, [0] ; 0F 2A 25 00 00 00 00 +cvtpi2ps xmm5, qword [0] ; 0F 2A 2D 00 00 00 00 + +cvtps2dq xmm6, xmm7 ; 66 0F 5B F7 +cvtps2dq xmm0, [0] ; 66 0F 5B 05 00 00 00 00 +cvtps2dq xmm1, dqword [0] ; 66 0F 5B 0D 00 00 00 00 + +cvtps2pd xmm2, xmm3 ; 0F 5A D3 +cvtps2pd xmm4, [0] ; 0F 5A 25 00 00 00 00 +cvtps2pd xmm5, qword [0] ; 0F 5A 2D 00 00 00 00 + +cvtps2pi mm6, xmm7 ; 0F 2D F7 +cvtps2pi mm0, [0] ; 0F 2D 05 00 00 00 00 +cvtps2pi mm1, qword [0] ; 0F 2D 0D 00 00 00 00 + +cvtsd2si edx, xmm0 ; F2 0F 2D D0 +cvtsd2si eax, [0] ; F2 0F 2D 05 00 00 00 00 +cvtsd2si ebx, qword [0] ; F2 0F 2D 1D 00 00 00 00 + +cvtsd2ss xmm1, xmm2 ; F2 0F 5A CA +cvtsd2ss xmm3, [0] ; F2 0F 5A 1D 00 00 00 00 +cvtsd2ss xmm4, qword [0] ; F2 0F 5A 25 00 00 00 00 + +cvtsi2sd xmm5, eax ; F2 0F 2A E8 +cvtsi2sd xmm6, [0] ; F2 0F 2A 35 00 00 00 00 +cvtsi2sd xmm7, dword [0] ; F2 0F 2A 3D 00 00 00 00 + +cvtsi2ss xmm0, edx ; F3 0F 2A C2 +cvtsi2ss xmm1, [0] ; F3 0F 2A 0D 00 00 00 00 +cvtsi2ss xmm2, dword [0] ; F3 0F 2A 15 00 00 00 00 + +cvtss2sd xmm3, xmm4 ; F3 0F 5A DC +cvtss2sd xmm5, [0] ; F3 0F 5A 2D 00 00 00 00 +cvtss2sd xmm6, dword [0] ; F3 0F 5A 35 00 00 00 00 + +cvtss2si ebx, xmm7 ; F3 0F 2D DF +cvtss2si ecx, [0] ; F3 0F 2D 0D 00 00 00 00 +cvtss2si eax, dword [0] ; F3 0F 2D 05 00 00 00 00 + +cvttpd2pi mm0, xmm1 ; 66 0F 2C C1 +cvttpd2pi mm2, [0] ; 66 0F 2C 15 00 00 00 00 +cvttpd2pi mm3, dqword [0] ; 66 0F 2C 1D 00 00 00 00 + +cvttpd2dq xmm4, xmm5 ; 66 0F E6 E5 +cvttpd2dq xmm6, [0] ; 66 0F E6 35 00 00 00 00 +cvttpd2dq xmm7, dqword [0] ; 66 0F E6 3D 00 00 00 00 + +cvttps2dq xmm0, xmm1 ; F3 0F 5B C1 +cvttps2dq xmm2, [0] ; F3 0F 5B 15 00 00 00 00 +cvttps2dq xmm3, dqword [0] ; F3 0F 5B 1D 00 00 00 00 + +cvttps2pi mm4, xmm5 ; 0F 2C E5 +cvttps2pi mm6, [0] ; 0F 2C 35 00 00 00 00 +cvttps2pi mm7, qword [0] ; 0F 2C 3D 00 00 00 00 + +cvttsd2si ecx, xmm0 ; F2 0F 2C C8 +cvttsd2si ebx, [0] ; F2 0F 2C 1D 00 00 00 00 +cvttsd2si edi, qword [0] ; F2 0F 2C 3D 00 00 00 00 + +cvttss2si esi, xmm3 ; F3 0F 2C F3 +cvttss2si ebp, [0] ; F3 0F 2C 2D 00 00 00 00 +cvttss2si eax, dword [0] ; F3 0F 2C 05 00 00 00 00 + diff --git a/modules/arch/x86/tests/simd-2.errwarn b/modules/arch/x86/tests/simd-2.errwarn new file mode 100644 index 00000000..e69de29b diff --git a/modules/arch/x86/tests/simd-2.hex b/modules/arch/x86/tests/simd-2.hex new file mode 100644 index 00000000..a34ddc10 --- /dev/null +++ b/modules/arch/x86/tests/simd-2.hex @@ -0,0 +1,474 @@ +0f +c5 +dd +00 +66 +0f +c5 +c8 +01 +0f +c4 +de +05 +0f +c4 +1d +00 +00 +00 +00 +04 +66 +0f +c4 +c8 +03 +66 +0f +c4 +0d +00 +00 +00 +00 +02 +66 +0f +50 +d7 +0f +50 +c1 +0f +d7 +f8 +66 +0f +d7 +f1 +f3 +0f +e6 +ec +f3 +0f +e6 +1d +00 +00 +00 +00 +f3 +0f +e6 +15 +00 +00 +00 +00 +0f +5b +ca +0f +5b +25 +00 +00 +00 +00 +0f +5b +2d +00 +00 +00 +00 +f2 +0f +e6 +c1 +f2 +0f +e6 +15 +00 +00 +00 +00 +f2 +0f +e6 +1d +00 +00 +00 +00 +66 +0f +2d +e5 +66 +0f +2d +35 +00 +00 +00 +00 +66 +0f +2d +3d +00 +00 +00 +00 +66 +0f +5a +ca +66 +0f +5a +1d +00 +00 +00 +00 +66 +0f +5a +25 +00 +00 +00 +00 +66 +0f +2a +ee +66 +0f +2a +3d +00 +00 +00 +00 +66 +0f +2a +05 +00 +00 +00 +00 +0f +2a +d3 +0f +2a +25 +00 +00 +00 +00 +0f +2a +2d +00 +00 +00 +00 +66 +0f +5b +f7 +66 +0f +5b +05 +00 +00 +00 +00 +66 +0f +5b +0d +00 +00 +00 +00 +0f +5a +d3 +0f +5a +25 +00 +00 +00 +00 +0f +5a +2d +00 +00 +00 +00 +0f +2d +f7 +0f +2d +05 +00 +00 +00 +00 +0f +2d +0d +00 +00 +00 +00 +f2 +0f +2d +d0 +f2 +0f +2d +05 +00 +00 +00 +00 +f2 +0f +2d +1d +00 +00 +00 +00 +f2 +0f +5a +ca +f2 +0f +5a +1d +00 +00 +00 +00 +f2 +0f +5a +25 +00 +00 +00 +00 +f2 +0f +2a +e8 +f2 +0f +2a +35 +00 +00 +00 +00 +f2 +0f +2a +3d +00 +00 +00 +00 +f3 +0f +2a +c2 +f3 +0f +2a +0d +00 +00 +00 +00 +f3 +0f +2a +15 +00 +00 +00 +00 +f3 +0f +5a +dc +f3 +0f +5a +2d +00 +00 +00 +00 +f3 +0f +5a +35 +00 +00 +00 +00 +f3 +0f +2d +df +f3 +0f +2d +0d +00 +00 +00 +00 +f3 +0f +2d +05 +00 +00 +00 +00 +66 +0f +2c +c1 +66 +0f +2c +15 +00 +00 +00 +00 +66 +0f +2c +1d +00 +00 +00 +00 +66 +0f +e6 +e5 +66 +0f +e6 +35 +00 +00 +00 +00 +66 +0f +e6 +3d +00 +00 +00 +00 +f3 +0f +5b +c1 +f3 +0f +5b +15 +00 +00 +00 +00 +f3 +0f +5b +1d +00 +00 +00 +00 +0f +2c +e5 +0f +2c +35 +00 +00 +00 +00 +0f +2c +3d +00 +00 +00 +00 +f2 +0f +2c +c8 +f2 +0f +2c +1d +00 +00 +00 +00 +f2 +0f +2c +3d +00 +00 +00 +00 +f3 +0f +2c +f3 +f3 +0f +2c +2d +00 +00 +00 +00 +f3 +0f +2c +05 +00 +00 +00 +00 diff --git a/modules/arch/x86/x86id.re b/modules/arch/x86/x86id.re index 7dd6e43c..50d67631 100644 --- a/modules/arch/x86/x86id.re +++ b/modules/arch/x86/x86id.re @@ -1291,6 +1291,74 @@ static const x86_insn_info sseps_insn[] = { {OPT_SIMDReg|OPS_128|OPA_Spare, OPT_SIMDRM|OPS_128|OPS_Relaxed|OPA_EA, 0} } }; +static const x86_insn_info cvt_xmm_xmm64_ss_insn[] = { + { CPU_SSE, MOD_Op0Add|MOD_Op2Add, 0, 0, 3, {0x00, 0x0F, 0x00}, 0, 2, + {OPT_SIMDReg|OPS_128|OPA_Spare, OPT_SIMDReg|OPS_128|OPA_EA, 0} + }, + { CPU_SSE, MOD_Op0Add|MOD_Op2Add, 0, 0, 3, {0x00, 0x0F, 0x00}, 0, 2, + {OPT_SIMDReg|OPS_128|OPA_Spare, OPT_Mem|OPS_64|OPS_Relaxed|OPA_EA, 0} + } +}; +static const x86_insn_info cvt_xmm_xmm64_ps_insn[] = { + { CPU_SSE, MOD_Op1Add, 0, 0, 2, {0x0F, 0x00, 0x00}, 0, 2, + {OPT_SIMDReg|OPS_128|OPA_Spare, OPT_SIMDReg|OPS_128|OPA_EA, 0} + }, + { CPU_SSE, MOD_Op1Add, 0, 0, 2, {0x0F, 0x00, 0x00}, 0, 2, + {OPT_SIMDReg|OPS_128|OPA_Spare, OPT_Mem|OPS_64|OPS_Relaxed|OPA_EA, 0} + } +}; +static const x86_insn_info cvt_xmm_xmm32_insn[] = { + { CPU_SSE, MOD_Op0Add|MOD_Op2Add, 0, 0, 3, {0x00, 0x0F, 0x00}, 0, 2, + {OPT_SIMDReg|OPS_128|OPA_Spare, OPT_SIMDReg|OPS_128|OPA_EA, 0} + }, + { CPU_SSE, MOD_Op0Add|MOD_Op2Add, 0, 0, 3, {0x00, 0x0F, 0x00}, 0, 2, + {OPT_SIMDReg|OPS_128|OPA_Spare, OPT_Mem|OPS_32|OPS_Relaxed|OPA_EA, 0} + } +}; +static const x86_insn_info cvt_r32_xmm64_insn[] = { + { CPU_SSE, MOD_Op0Add|MOD_Op2Add, 0, 0, 3, {0x00, 0x0F, 0x00}, 0, 2, + {OPT_Reg|OPS_32|OPA_Spare, OPT_SIMDReg|OPS_128|OPA_EA, 0} + }, + { CPU_SSE, MOD_Op0Add|MOD_Op2Add, 0, 0, 3, {0x00, 0x0F, 0x00}, 0, 2, + {OPT_Reg|OPS_32|OPA_Spare, OPT_Mem|OPS_64|OPS_Relaxed|OPA_EA, 0} + } +}; +static const x86_insn_info cvt_r32_xmm32_insn[] = { + { CPU_SSE, MOD_Op0Add|MOD_Op2Add, 0, 0, 3, {0x00, 0x0F, 0x00}, 0, 2, + {OPT_Reg|OPS_32|OPA_Spare, OPT_SIMDReg|OPS_128|OPA_EA, 0} + }, + { CPU_SSE, MOD_Op0Add|MOD_Op2Add, 0, 0, 3, {0x00, 0x0F, 0x00}, 0, 2, + {OPT_Reg|OPS_32|OPA_Spare, OPT_Mem|OPS_32|OPS_Relaxed|OPA_EA, 0} + } +}; +static const x86_insn_info cvt_mm_xmm64_insn[] = { + { CPU_SSE, MOD_Op1Add, 0, 0, 2, {0x0F, 0x00, 0x00}, 0, 2, + {OPT_SIMDReg|OPS_64|OPA_Spare, OPT_SIMDReg|OPS_128|OPA_EA, 0} + }, + { CPU_SSE, MOD_Op1Add, 0, 0, 2, {0x0F, 0x00, 0x00}, 0, 2, + {OPT_SIMDReg|OPS_64|OPA_Spare, OPT_Mem|OPS_64|OPS_Relaxed|OPA_EA, 0} + } +}; +static const x86_insn_info cvt_mm_xmm_insn[] = { + { CPU_SSE, MOD_Op0Add|MOD_Op2Add, 0, 0, 3, {0x00, 0x0F, 0x00}, 0, 2, + {OPT_SIMDReg|OPS_64|OPA_Spare, OPT_SIMDRM|OPS_128|OPS_Relaxed|OPA_EA, 0} + } +}; +static const x86_insn_info cvt_xmm_mm_ss_insn[] = { + { CPU_SSE, MOD_Op0Add|MOD_Op2Add, 0, 0, 3, {0x00, 0x0F, 0x00}, 0, 2, + {OPT_SIMDReg|OPS_128|OPA_Spare, OPT_SIMDRM|OPS_64|OPS_Relaxed|OPA_EA, 0} + } +}; +static const x86_insn_info cvt_xmm_mm_ps_insn[] = { + { CPU_SSE, MOD_Op1Add, 0, 0, 2, {0x0F, 0x00, 0x00}, 0, 2, + {OPT_SIMDReg|OPS_128|OPA_Spare, OPT_SIMDRM|OPS_64|OPS_Relaxed|OPA_EA, 0} + } +}; +static const x86_insn_info cvt_xmm_rm32_insn[] = { + { CPU_SSE, MOD_Op0Add|MOD_Op2Add, 0, 0, 3, {0x00, 0x0F, 0x00}, 0, 2, + {OPT_SIMDReg|OPS_128|OPA_Spare, OPT_RM|OPS_32|OPS_Relaxed|OPA_EA, 0} + } +}; static const x86_insn_info ssess_insn[] = { { CPU_SSE, MOD_Op0Add|MOD_Op2Add, 0, 0, 3, {0x00, 0x0F, 0x00}, 0, 2, {OPT_SIMDReg|OPS_128|OPA_Spare, OPT_SIMDRM|OPS_128|OPS_Relaxed|OPA_EA, 0} @@ -1344,7 +1412,7 @@ static const x86_insn_info movhlps_insn[] = { }; static const x86_insn_info movmskps_insn[] = { { CPU_SSE, 0, 0, 0, 2, {0x0F, 0x50, 0}, 0, 2, - {OPT_Reg|OPS_32|OPA_EA, OPT_SIMDReg|OPS_128|OPA_Spare, 0} } + {OPT_Reg|OPS_32|OPA_Spare, OPT_SIMDReg|OPS_128|OPA_EA, 0} } }; static const x86_insn_info movntps_insn[] = { { CPU_SSE, 0, 0, 0, 2, {0x0F, 0x2B, 0}, 0, 2, @@ -1364,10 +1432,10 @@ static const x86_insn_info movss_insn[] = { }; static const x86_insn_info pextrw_insn[] = { { CPU_P3|CPU_MMX, 0, 0, 0, 2, {0x0F, 0xC5, 0}, 0, 3, - {OPT_Reg|OPS_32|OPA_EA, OPT_SIMDReg|OPS_64|OPA_Spare, + {OPT_Reg|OPS_32|OPA_Spare, OPT_SIMDReg|OPS_64|OPA_EA, OPT_Imm|OPS_8|OPS_Relaxed|OPA_Imm} }, { CPU_SSE2, 0, 0, 0, 3, {0x66, 0x0F, 0xC5}, 0, 3, - {OPT_Reg|OPS_32|OPA_EA, OPT_SIMDReg|OPS_128|OPA_Spare, + {OPT_Reg|OPS_32|OPA_Spare, OPT_SIMDReg|OPS_128|OPA_EA, OPT_Imm|OPS_8|OPS_Relaxed|OPA_Imm} } }; static const x86_insn_info pinsrw_insn[] = { @@ -1375,20 +1443,20 @@ static const x86_insn_info pinsrw_insn[] = { {OPT_SIMDReg|OPS_64|OPA_Spare, OPT_Reg|OPS_32|OPA_EA, OPT_Imm|OPS_8|OPS_Relaxed|OPA_Imm} }, { CPU_P3|CPU_MMX, 0, 0, 0, 2, {0x0F, 0xC4, 0}, 0, 3, - {OPT_SIMDReg|OPS_64|OPA_Spare, OPT_RM|OPS_16|OPS_Relaxed|OPA_EA, + {OPT_SIMDReg|OPS_64|OPA_Spare, OPT_Mem|OPS_16|OPS_Relaxed|OPA_EA, OPT_Imm|OPS_8|OPS_Relaxed|OPA_Imm} }, { CPU_SSE2, 0, 0, 0, 3, {0x66, 0x0F, 0xC4}, 0, 3, {OPT_SIMDReg|OPS_128|OPA_Spare, OPT_Reg|OPS_32|OPA_EA, OPT_Imm|OPS_8|OPS_Relaxed|OPA_Imm} }, { CPU_SSE2, 0, 0, 0, 3, {0x66, 0x0F, 0xC4}, 0, 3, - {OPT_SIMDReg|OPS_64|OPA_Spare, OPT_RM|OPS_16|OPS_Relaxed|OPA_EA, + {OPT_SIMDReg|OPS_128|OPA_Spare, OPT_Mem|OPS_16|OPS_Relaxed|OPA_EA, OPT_Imm|OPS_8|OPS_Relaxed|OPA_Imm} } }; static const x86_insn_info pmovmskb_insn[] = { { CPU_P3|CPU_MMX, 0, 0, 0, 2, {0x0F, 0xD7, 0}, 0, 2, - {OPT_Reg|OPS_32|OPA_EA, OPT_SIMDReg|OPS_64|OPA_Spare, 0} }, + {OPT_Reg|OPS_32|OPA_Spare, OPT_SIMDReg|OPS_64|OPA_EA, 0} }, { CPU_SSE2, 0, 0, 0, 3, {0x66, 0x0F, 0xD7}, 0, 2, - {OPT_Reg|OPS_32|OPA_EA, OPT_SIMDReg|OPS_128|OPA_Spare, 0} } + {OPT_Reg|OPS_32|OPA_Spare, OPT_SIMDReg|OPS_128|OPA_EA, 0} } }; static const x86_insn_info pshufw_insn[] = { { CPU_P3|CPU_MMX, 0, 0, 0, 2, {0x0F, 0x70, 0}, 0, 3, @@ -1419,7 +1487,7 @@ static const x86_insn_info movhlpd_insn[] = { }; static const x86_insn_info movmskpd_insn[] = { { CPU_SSE2, 0, 0, 0, 3, {0x66, 0x0F, 0x50}, 0, 2, - {OPT_Reg|OPS_32|OPA_EA, OPT_SIMDReg|OPS_128|OPA_Spare, 0} } + {OPT_Reg|OPS_32|OPA_Spare, OPT_SIMDReg|OPS_128|OPA_EA, 0} } }; static const x86_insn_info movntpddq_insn[] = { { CPU_SSE2, MOD_Op2Add, 0, 0, 3, {0x66, 0x0F, 0x00}, 0, 2, @@ -3399,12 +3467,12 @@ yasm_x86__parse_check_id(yasm_arch *arch, unsigned long data[4], C M P P S { RET_INSN(ssepsimm, 0xC2, CPU_SSE); } C M P S S { RET_INSN(ssessimm, 0xF3C2, CPU_SSE); } C O M I S S { RET_INSN(sseps, 0x2F, CPU_SSE); } - C V T P I "2" P S { RET_INSN(sseps, 0x2A, CPU_SSE); } - C V T P S "2" P I { RET_INSN(sseps, 0x2D, CPU_SSE); } - C V T S I "2" S S { RET_INSN(ssess, 0xF32A, CPU_SSE); } - C V T S S "2" S I { RET_INSN(ssess, 0xF32D, CPU_SSE); } - C V T T P S "2" P I { RET_INSN(sseps, 0x2C, CPU_SSE); } - C V T T S S "2" S I { RET_INSN(ssess, 0xF32C, CPU_SSE); } + C V T P I "2" P S { RET_INSN(cvt_xmm_mm_ps, 0x2A, CPU_SSE); } + C V T P S "2" P I { RET_INSN(cvt_mm_xmm64, 0x2D, CPU_SSE); } + C V T S I "2" S S { RET_INSN(cvt_xmm_rm32, 0xF32A, CPU_SSE); } + C V T S S "2" S I { RET_INSN(cvt_r32_xmm32, 0xF32D, CPU_SSE); } + C V T T P S "2" P I { RET_INSN(cvt_mm_xmm64, 0x2C, CPU_SSE); } + C V T T S S "2" S I { RET_INSN(cvt_r32_xmm32, 0xF32C, CPU_SSE); } D I V P S { RET_INSN(sseps, 0x5E, CPU_SSE); } D I V S S { RET_INSN(ssess, 0xF35E, CPU_SSE); } L D M X C S R { RET_INSN(ldstmxcsr, 0x02, CPU_SSE); } @@ -3481,8 +3549,8 @@ yasm_x86__parse_check_id(yasm_arch *arch, unsigned long data[4], C M P P D { RET_INSN(ssessimm, 0x66C2, CPU_SSE2); } /* C M P S D is in string instructions above */ C O M I S D { RET_INSN(ssess, 0x662F, CPU_SSE2); } - C V T P I "2" P D { RET_INSN(ssess, 0x662A, CPU_SSE2); } - C V T S I "2" S D { RET_INSN(ssess, 0xF22A, CPU_SSE2); } + C V T P I "2" P D { RET_INSN(cvt_xmm_mm_ss, 0x662A, CPU_SSE2); } + C V T S I "2" S D { RET_INSN(cvt_xmm_rm32, 0xF22A, CPU_SSE2); } D I V P D { RET_INSN(ssess, 0x665E, CPU_SSE2); } D I V S D { RET_INSN(ssess, 0xF25E, CPU_SSE2); } M A X P D { RET_INSN(ssess, 0x665F, CPU_SSE2); } @@ -3509,18 +3577,18 @@ yasm_x86__parse_check_id(yasm_arch *arch, unsigned long data[4], U N P C K H P D { RET_INSN(ssess, 0x6615, CPU_SSE2); } U N P C K L P D { RET_INSN(ssess, 0x6614, CPU_SSE2); } X O R P D { RET_INSN(ssess, 0x6657, CPU_SSE2); } - C V T D Q "2" P D { RET_INSN(ssess, 0xF3E6, CPU_SSE2); } + C V T D Q "2" P D { RET_INSN(cvt_xmm_xmm64_ss, 0xF3E6, CPU_SSE2); } C V T P D "2" D Q { RET_INSN(ssess, 0xF2E6, CPU_SSE2); } C V T D Q "2" P S { RET_INSN(sseps, 0x5B, CPU_SSE2); } - C V T P D "2" P I { RET_INSN(ssess, 0x662D, CPU_SSE2); } + C V T P D "2" P I { RET_INSN(cvt_mm_xmm, 0x662D, CPU_SSE2); } C V T P D "2" P S { RET_INSN(ssess, 0x665A, CPU_SSE2); } - C V T P S "2" P D { RET_INSN(sseps, 0x5A, CPU_SSE2); } + C V T P S "2" P D { RET_INSN(cvt_xmm_xmm64_ps, 0x5A, CPU_SSE2); } C V T P S "2" D Q { RET_INSN(ssess, 0x665B, CPU_SSE2); } - C V T S D "2" S I { RET_INSN(ssess, 0xF22D, CPU_SSE2); } - C V T S D "2" S S { RET_INSN(ssess, 0xF25A, CPU_SSE2); } - C V T S S "2" S D { RET_INSN(ssess, 0xF35A, CPU_SSE2); } - C V T T P D "2" P I { RET_INSN(ssess, 0x662C, CPU_SSE2); } - C V T T S D "2" S I { RET_INSN(ssess, 0xF22C, CPU_SSE2); } + C V T S D "2" S I { RET_INSN(cvt_r32_xmm64, 0xF22D, CPU_SSE2); } + C V T S D "2" S S { RET_INSN(cvt_xmm_xmm64_ss, 0xF25A, CPU_SSE2); } + C V T S S "2" S D { RET_INSN(cvt_xmm_xmm32, 0xF35A, CPU_SSE2); } + C V T T P D "2" P I { RET_INSN(cvt_mm_xmm, 0x662C, CPU_SSE2); } + C V T T S D "2" S I { RET_INSN(cvt_r32_xmm64, 0xF22C, CPU_SSE2); } C V T T P D "2" D Q { RET_INSN(ssess, 0x66E6, CPU_SSE2); } C V T T P S "2" D Q { RET_INSN(ssess, 0xF35B, CPU_SSE2); } M A S K M O V D Q U { RET_INSN(maskmovdqu, 0, CPU_SSE2); } -- 2.40.0