On 13.11.2024 09:44, Haochen Jiang wrote:
> --- /dev/null
> +++ b/gas/testsuite/gas/i386/x86-64-amx-movrs-inval.l
> @@ -0,0 +1,5 @@
> +.* Assembler messages:
> +.*:6: Error: `t2rpntlvwz0rs' is not supported on `x86_64.noamx_transpose'
> +.*:7: Error: `t2rpntlvwz0rst1' is not supported on `x86_64.noamx_transpose'
> +.*:8: Error: `t2rpntlvwz1rs' is not supported on `x86_64.noamx_transpose'
> +.*:9: Error: `t2rpntlvwz1rst1' is not supported on `x86_64.noamx_transpose'
> --- /dev/null
> +++ b/gas/testsuite/gas/i386/x86-64-amx-movrs-inval.s
> @@ -0,0 +1,9 @@
> +# Check Invalid 64bit AMX-MOVRS instructions
> +
> + .text
> + .arch .noamx_transpose
> +_start:
> + t2rpntlvwz0rs (%r9), %tmm3
> + t2rpntlvwz0rst1 (%r9), %tmm3
> + t2rpntlvwz1rs (%r9), %tmm3
> + t2rpntlvwz1rst1 (%r9), %tmm3
This is too little imo - the SIBMEM constraints also want checking.
> --- a/opcodes/i386-opc.tbl
> +++ b/opcodes/i386-opc.tbl
> @@ -3197,6 +3197,11 @@ t2rpntlvwz0t1, 0x6f, AMX_TRANSPOSE, TMMPairOperand1|Sibmem|Vex128|Space0F38|VexW
> t2rpntlvwz1, 0x666e, AMX_TRANSPOSE, TMMPairOperand1|Sibmem|Vex128|Space0F38|VexW0|NoSuf, { Unspecified|BaseIndex, RegTMM }
> t2rpntlvwz1t1, 0x666f, AMX_TRANSPOSE, TMMPairOperand1|Sibmem|Vex128|Space0F38|VexW0|NoSuf, { Unspecified|BaseIndex, RegTMM }
>
> +t2rpntlvwz0rs, 0xf8, AMX_MOVRS&AMX_TRANSPOSE, TMMPairOperand1|Sibmem|Vex128|xVexMap5|VexW0|NoSuf, { Unspecified|BaseIndex, RegTMM }
> +t2rpntlvwz0rst1, 0xf9, AMX_MOVRS&AMX_TRANSPOSE, TMMPairOperand1|Sibmem|Vex128|xVexMap5|VexW0|NoSuf, { Unspecified|BaseIndex, RegTMM }
> +t2rpntlvwz1rs, 0x66f8, AMX_MOVRS&AMX_TRANSPOSE, TMMPairOperand1|Sibmem|Vex128|xVexMap5|VexW0|NoSuf, { Unspecified|BaseIndex, RegTMM }
> +t2rpntlvwz1rst1, 0x66f9, AMX_MOVRS&AMX_TRANSPOSE, TMMPairOperand1|Sibmem|Vex128|xVexMap5|VexW0|NoSuf, { Unspecified|BaseIndex, RegTMM }
Judging from VMOVRS{B,W,D,Q}, shouldn't the RS infix move a little earlier,
ahead of the element width specifier: T2RPNTLVRSW{Z0,Z1}{,T1}?
> @@ -3230,6 +3235,8 @@ tdphf8ps, 0x66fd, AMX_FP8, Modrm|Vex128|xVexMap5|Src2VVVV|VexW0|NoSuf, { RegTMM,
>
> tileloadd, 0xf24b, APX_F(AMX_TILE), Sibmem|Vex128|EVex128|Space0F38|VexW0|NoSuf, { Unspecified|BaseIndex, RegTMM }
> tileloaddt1, 0x664b, APX_F(AMX_TILE), Sibmem|Vex128|EVex128|Space0F38|VexW0|NoSuf, { Unspecified|BaseIndex, RegTMM }
> +tileloaddrs, 0xf24a, AMX_MOVRS, Sibmem|Vex128|Space0F38|VexW0|NoSuf, { Unspecified|BaseIndex, RegTMM }
> +tileloaddrst1, 0x664a, AMX_MOVRS, Sibmem|Vex128|Space0F38|VexW0|NoSuf, { Unspecified|BaseIndex, RegTMM }
> tilemovrow, 0x664a, AMX_AVX512, Modrm|EVex512|Space0F38|Src2VVVV|VexW0|NoSuf, { Reg32, RegTMM, RegZMM }
> tilemovrow, 0x6607, AMX_AVX512, Modrm|EVex512|Space0F3A|VexW0|NoSuf, { Imm8, RegTMM, RegZMM }
> tilestored, 0xf34b, APX_F(AMX_TILE), Sibmem|Vex128|EVex128|Space0F38|VexW0|NoSuf, { RegTMM, Unspecified|BaseIndex }
Same here: TILELOADRSD{,T1} would seem like a better match for VMOVRS{B,W,D,Q}.
For all of these: What about their APX forms (presumably simply re-encoded as
EVEX at the same position in the opcode map)?
Jan
@@ -1,5 +1,7 @@
-*- text -*-
+* Add support for Intel AMX-MOVRS instructions.
+
* Add support for Intel AMX-FP8 instructions.
* Add support for Intel AMX-TF32 instructions.
@@ -1186,6 +1186,7 @@ static const arch_entry cpu_arch[] =
SUBARCH (amx_avx512, AMX_AVX512, ANY_AMX_AVX512, false),
SUBARCH (amx_tf32, AMX_TF32, ANY_AMX_TF32, false),
SUBARCH (amx_fp8, AMX_FP8, ANY_AMX_FP8, false),
+ SUBARCH (amx_movrs, AMX_MOVRS, ANY_AMX_MOVRS, false),
SUBARCH (amx_tile, AMX_TILE, ANY_AMX_TILE, false),
SUBARCH (movdiri, MOVDIRI, MOVDIRI, false),
SUBARCH (movdir64b, MOVDIR64B, MOVDIR64B, false),
@@ -232,6 +232,7 @@ accept various extension mnemonics. For example,
@code{amx_avx512},
@code{amx_tf32},
@code{amx_fp8}
+@code{amx_movrs},
@code{amx_tile},
@code{vmx},
@code{vmfunc},
@@ -1705,7 +1706,8 @@ supported on the CPU specified. The choices for @var{cpu_type} are:
@item @samp{.movdiri} @tab @samp{.movdir64b} @tab @samp{.enqcmd} @tab @samp{.tsxldtrk}
@item @samp{.amx_int8} @tab @samp{.amx_bf16} @tab @samp{.amx_fp16}
@item @samp{.amx_complex} @tab @samp{.amx_transpose} @tab @samp{.amx_avx512}
-@item @samp{.amx_tf32} @tab @samp {.amx_fp8} @tab @samp{.amx_tile}
+@item @samp{.amx_tf32} @tab @samp{.amx_tile} @tab @tab @samp{.amx_movrs}
+@item @samp{.amx_tile}
@item @samp{.kl} @tab @samp{.widekl} @tab @samp{.uintr} @tab @samp{.hreset}
@item @samp{.3dnow} @tab @samp{.3dnowa} @tab @samp{.sse4a} @tab @samp{.sse5}
@item @samp{.syscall} @tab @samp{.rdtscp} @tab @samp{.svme}
new file mode 100644
@@ -0,0 +1,7 @@
+.* Assembler messages:
+.*:6: Error: `t2rpntlvwz0rs' is only supported in 64-bit mode
+.*:7: Error: `t2rpntlvwz0rst1' is only supported in 64-bit mode
+.*:8: Error: `t2rpntlvwz1rs' is only supported in 64-bit mode
+.*:9: Error: `t2rpntlvwz1rst1' is only supported in 64-bit mode
+.*:10: Error: `tileloaddrs' is only supported in 64-bit mode
+.*:11: Error: `tileloaddrst1' is only supported in 64-bit mode
new file mode 100644
@@ -0,0 +1,11 @@
+# Check Illegal 32bit AMX-MOVRS instructions
+
+ .allow_index_reg
+ .text
+_start:
+ t2rpntlvwz0rs 0x10000000(%esp, %esi, 8), %tmm6
+ t2rpntlvwz0rst1 0x10000000(%esp, %esi, 8), %tmm6
+ t2rpntlvwz1rs 0x10000000(%esp, %esi, 8), %tmm6
+ t2rpntlvwz1rst1 0x10000000(%esp, %esi, 8), %tmm6
+ tileloaddrs 0x10000000(%esp, %esi, 8), %tmm6
+ tileloaddrst1 0x10000000(%esp, %esi, 8), %tmm6
@@ -550,6 +550,7 @@ if [gas_32_check] then {
run_list_test "amx-avx512-inval"
run_list_test "amx-tf32-inval"
run_list_test "amx-fp8-inval"
+ run_list_test "amx-movrs-inval"
run_list_test "sg"
run_dump_test "clzero"
run_dump_test "invlpgb"
new file mode 100644
@@ -0,0 +1,23 @@
+#objdump: -dw -Mintel
+#name: x86_64 AMX-MOVRS insns (Intel disassembly)
+#source: x86-64-amx-movrs.s
+
+.*: +file format .*
+
+Disassembly of section \.text:
+
+#...
+[a-f0-9]+ <_intel>:
+\s*[a-f0-9]+:\s*c4 a5 78 f8 b4 f5 00 00 00 10\s+t2rpntlvwz0rs tmm6,\[rbp\+r14\*8\+0x10000000\]
+\s*[a-f0-9]+:\s*c4 c5 78 f8 14 21\s+t2rpntlvwz0rs tmm2,\[r9\+riz\*1\]
+\s*[a-f0-9]+:\s*c4 a5 78 f9 b4 f5 00 00 00 10\s+t2rpntlvwz0rst1 tmm6,\[rbp\+r14\*8\+0x10000000\]
+\s*[a-f0-9]+:\s*c4 c5 78 f9 14 21\s+t2rpntlvwz0rst1 tmm2,\[r9\+riz\*1\]
+\s*[a-f0-9]+:\s*c4 a5 79 f8 b4 f5 00 00 00 10\s+t2rpntlvwz1rs tmm6,\[rbp\+r14\*8\+0x10000000\]
+\s*[a-f0-9]+:\s*c4 c5 79 f8 14 21\s+t2rpntlvwz1rs tmm2,\[r9\+riz\*1\]
+\s*[a-f0-9]+:\s*c4 a5 79 f9 b4 f5 00 00 00 10\s+t2rpntlvwz1rst1 tmm6,\[rbp\+r14\*8\+0x10000000\]
+\s*[a-f0-9]+:\s*c4 c5 79 f9 14 21\s+t2rpntlvwz1rst1 tmm2,\[r9\+riz\*1\]
+\s*[a-f0-9]+:\s*c4 a2 7b 4a b4 f5 00 00 00 10\s+tileloaddrs tmm6,\[rbp\+r14\*8\+0x10000000\]
+\s*[a-f0-9]+:\s*c4 c2 7b 4a 1c 21\s+tileloaddrs tmm3,\[r9\+riz\*1\]
+\s*[a-f0-9]+:\s*c4 a2 79 4a b4 f5 00 00 00 10\s+tileloaddrst1 tmm6,\[rbp\+r14\*8\+0x10000000\]
+\s*[a-f0-9]+:\s*c4 c2 79 4a 1c 21\s+tileloaddrst1 tmm3,\[r9\+riz\*1\]
+#pass
new file mode 100644
@@ -0,0 +1,5 @@
+.* Assembler messages:
+.*:6: Error: `t2rpntlvwz0rs' is not supported on `x86_64.noamx_transpose'
+.*:7: Error: `t2rpntlvwz0rst1' is not supported on `x86_64.noamx_transpose'
+.*:8: Error: `t2rpntlvwz1rs' is not supported on `x86_64.noamx_transpose'
+.*:9: Error: `t2rpntlvwz1rst1' is not supported on `x86_64.noamx_transpose'
new file mode 100644
@@ -0,0 +1,9 @@
+# Check Invalid 64bit AMX-MOVRS instructions
+
+ .text
+ .arch .noamx_transpose
+_start:
+ t2rpntlvwz0rs (%r9), %tmm3
+ t2rpntlvwz0rst1 (%r9), %tmm3
+ t2rpntlvwz1rs (%r9), %tmm3
+ t2rpntlvwz1rst1 (%r9), %tmm3
new file mode 100644
@@ -0,0 +1,21 @@
+#objdump: -dw
+#name: x86_64 AMX-MOVRS insns
+
+.*: +file format .*
+
+Disassembly of section \.text:
+
+0+ <_start>:
+\s*[a-f0-9]+:\s*c4 a5 78 f8 b4 f5 00 00 00 10\s+t2rpntlvwz0rs 0x10000000\(%rbp,%r14,8\),%tmm6
+\s*[a-f0-9]+:\s*c4 c5 78 f8 14 21\s+t2rpntlvwz0rs \(%r9,%riz,1\),%tmm2
+\s*[a-f0-9]+:\s*c4 a5 78 f9 b4 f5 00 00 00 10\s+t2rpntlvwz0rst1 0x10000000\(%rbp,%r14,8\),%tmm6
+\s*[a-f0-9]+:\s*c4 c5 78 f9 14 21\s+t2rpntlvwz0rst1 \(%r9,%riz,1\),%tmm2
+\s*[a-f0-9]+:\s*c4 a5 79 f8 b4 f5 00 00 00 10\s+t2rpntlvwz1rs 0x10000000\(%rbp,%r14,8\),%tmm6
+\s*[a-f0-9]+:\s*c4 c5 79 f8 14 21\s+t2rpntlvwz1rs \(%r9,%riz,1\),%tmm2
+\s*[a-f0-9]+:\s*c4 a5 79 f9 b4 f5 00 00 00 10\s+t2rpntlvwz1rst1 0x10000000\(%rbp,%r14,8\),%tmm6
+\s*[a-f0-9]+:\s*c4 c5 79 f9 14 21\s+t2rpntlvwz1rst1 \(%r9,%riz,1\),%tmm2
+\s*[a-f0-9]+:\s*c4 a2 7b 4a b4 f5 00 00 00 10\s+tileloaddrs 0x10000000\(%rbp,%r14,8\),%tmm6
+\s*[a-f0-9]+:\s*c4 c2 7b 4a 1c 21\s+tileloaddrs \(%r9,%riz,1\),%tmm3
+\s*[a-f0-9]+:\s*c4 a2 79 4a b4 f5 00 00 00 10\s+tileloaddrst1 0x10000000\(%rbp,%r14,8\),%tmm6
+\s*[a-f0-9]+:\s*c4 c2 79 4a 1c 21\s+tileloaddrst1 \(%r9,%riz,1\),%tmm3
+#pass
new file mode 100644
@@ -0,0 +1,31 @@
+# Check 64bit AMX-MOVRS instructions
+
+ .text
+_start:
+ t2rpntlvwz0rs 0x10000000(%rbp, %r14, 8), %tmm6
+ t2rpntlvwz0rs (%r9), %tmm3
+ t2rpntlvwz0rst1 0x10000000(%rbp, %r14, 8), %tmm6
+ t2rpntlvwz0rst1 (%r9), %tmm3
+ t2rpntlvwz1rs 0x10000000(%rbp, %r14, 8), %tmm6
+ t2rpntlvwz1rs (%r9), %tmm3
+ t2rpntlvwz1rst1 0x10000000(%rbp, %r14, 8), %tmm6
+ t2rpntlvwz1rst1 (%r9), %tmm3
+ tileloaddrs 0x10000000(%rbp, %r14, 8), %tmm6
+ tileloaddrs (%r9), %tmm3
+ tileloaddrst1 0x10000000(%rbp, %r14, 8), %tmm6
+ tileloaddrst1 (%r9), %tmm3
+
+_intel:
+ .intel_syntax noprefix
+ t2rpntlvwz0rs tmm6, [rbp+r14*8+0x10000000]
+ t2rpntlvwz0rs tmm3, [r9]
+ t2rpntlvwz0rst1 tmm6, [rbp+r14*8+0x10000000]
+ t2rpntlvwz0rst1 tmm3, [r9]
+ t2rpntlvwz1rs tmm6, [rbp+r14*8+0x10000000]
+ t2rpntlvwz1rs tmm3, [r9]
+ t2rpntlvwz1rst1 tmm6, [rbp+r14*8+0x10000000]
+ t2rpntlvwz1rst1 tmm3, [r9]
+ tileloaddrs tmm6, [rbp+r14*8+0x10000000]
+ tileloaddrs tmm3, [r9]
+ tileloaddrst1 tmm6, [rbp+r14*8+0x10000000]
+ tileloaddrst1 tmm3, [r9]
@@ -535,6 +535,9 @@ run_list_test "x86-64-amx-tf32-inval"
run_dump_test "x86-64-amx-fp8"
run_dump_test "x86-64-amx-fp8-intel"
run_list_test "x86-64-amx-fp8-inval"
+run_dump_test "x86-64-amx-movrs"
+run_dump_test "x86-64-amx-movrs-intel"
+run_list_test "x86-64-amx-movrs-inval"
run_dump_test "x86-64-clzero"
run_dump_test "x86-64-mwaitx-bdver4"
run_list_test "x86-64-mwaitx-reg"
@@ -964,8 +964,11 @@ enum
MOD_0F38F8,
MOD_VEX_0F3849_X86_64_L_0_W_0,
+ MOD_VEX_0F384A_X86_64,
MOD_VEX_0F386E_X86_64,
MOD_VEX_0F386F_X86_64,
+ MOD_VEX_MAP5_F8_X86_64,
+ MOD_VEX_MAP5_F9_X86_64,
MOD_EVEX_MAP4_60,
MOD_EVEX_MAP4_61,
@@ -1135,6 +1138,7 @@ enum
PREFIX_VEX_0F3848_X86_64_L_0_W_0,
PREFIX_VEX_0F3849_X86_64_L_0_W_0_M_0,
PREFIX_VEX_0F3849_X86_64_L_0_W_0_M_1,
+ PREFIX_VEX_0F384A_X86_64_M_0_L_0_W_0,
PREFIX_VEX_0F384B_X86_64_L_0_W_0,
PREFIX_VEX_0F3850_W_0,
PREFIX_VEX_0F3851_W_0,
@@ -1160,6 +1164,8 @@ enum
PREFIX_VEX_0F38F6_L_0,
PREFIX_VEX_0F38F7_L_0,
PREFIX_VEX_0F3AF0_L_0,
+ PREFIX_VEX_MAP5_F8_X86_64_M_0_L_0_W_0,
+ PREFIX_VEX_MAP5_F9_X86_64_M_0_L_0_W_0,
PREFIX_VEX_MAP5_FD_X86_64_L_0_W_0,
PREFIX_VEX_MAP7_F6_L_0_W_0_R_0_X86_64,
PREFIX_VEX_MAP7_F8_L_0_W_0_R_0_X86_64,
@@ -1358,6 +1364,7 @@ enum
X86_64_VEX_0F3848,
X86_64_VEX_0F3849,
+ X86_64_VEX_0F384A,
X86_64_VEX_0F384B,
X86_64_VEX_0F385C,
X86_64_VEX_0F385E,
@@ -1368,6 +1375,8 @@ enum
X86_64_VEX_0F386F,
X86_64_VEX_0F38Ex,
+ X86_64_VEX_MAP5_F8,
+ X86_64_VEX_MAP5_F9,
X86_64_VEX_MAP5_FD,
X86_64_VEX_MAP7_F6_L_0_W_0_R_0,
X86_64_VEX_MAP7_F8_L_0_W_0_R_0,
@@ -1453,6 +1462,7 @@ enum
VEX_LEN_0F3841,
VEX_LEN_0F3848_X86_64,
VEX_LEN_0F3849_X86_64,
+ VEX_LEN_0F384A_X86_64_M_0,
VEX_LEN_0F384B_X86_64,
VEX_LEN_0F385A,
VEX_LEN_0F385C_X86_64,
@@ -1500,6 +1510,8 @@ enum
VEX_LEN_0F3ADE_W_0,
VEX_LEN_0F3ADF,
VEX_LEN_0F3AF0,
+ VEX_LEN_MAP5_F8_X86_64_M_0,
+ VEX_LEN_MAP5_F9_X86_64_M_0,
VEX_LEN_MAP5_FD_X86_64,
VEX_LEN_MAP7_F6,
VEX_LEN_MAP7_F8,
@@ -1630,6 +1642,7 @@ enum
VEX_W_0F3846,
VEX_W_0F3848_X86_64_L_0,
VEX_W_0F3849_X86_64_L_0,
+ VEX_W_0F384A_X86_64_M_0_L_0,
VEX_W_0F384B_X86_64_L_0,
VEX_W_0F3850,
VEX_W_0F3851,
@@ -1677,6 +1690,8 @@ enum
VEX_W_0F3ACE,
VEX_W_0F3ACF,
VEX_W_0F3ADE,
+ VEX_W_MAP5_F8_X86_64_M_0_L_0,
+ VEX_W_MAP5_F9_X86_64_M_0_L_0,
VEX_W_MAP5_FD_X86_64_L_0,
VEX_W_MAP7_F6_L_0,
VEX_W_MAP7_F8_L_0,
@@ -4118,6 +4133,14 @@ static const struct dis386 prefix_table[][4] = {
{ RM_TABLE (RM_VEX_0F3849_X86_64_L_0_W_0_M_1_P_3) },
},
+ /* PREFIX_VEX_0F384A_X86_64_M_0_L_0_W_0 */
+ {
+ { Bad_Opcode },
+ { Bad_Opcode },
+ { "tileloaddrst1", { TMM, MVexSIBMEM }, 0 },
+ { "tileloaddrs", { TMM, MVexSIBMEM }, 0 },
+ },
+
/* PREFIX_VEX_0F384B_X86_64_L_0_W_0 */
{
{ Bad_Opcode },
@@ -4302,6 +4325,20 @@ static const struct dis386 prefix_table[][4] = {
{ "%XErorxS", { Gdq, Edq, Ib }, 0 },
},
+ /* PREFIX_VEX_MAP5_F8_X86_64_M_0_L_0_W_0 */
+ {
+ { "t2rpntlvwz0rs", { TMM, MVexSIBMEM }, 0 },
+ { Bad_Opcode },
+ { "t2rpntlvwz1rs", { TMM, MVexSIBMEM }, 0 },
+ },
+
+ /* PREFIX_VEX_MAP5_F9_X86_64_M_0_L_0_W_0 */
+ {
+ { "t2rpntlvwz0rst1", { TMM, MVexSIBMEM }, 0 },
+ { Bad_Opcode },
+ { "t2rpntlvwz1rst1", { TMM, MVexSIBMEM }, 0 },
+ },
+
/* PREFIX_VEX_MAP5_FD_X86_64_L_0_W_0 */
{
{ "tdpbf8ps", { TMM, Rtmm, VexTmm }, 0 },
@@ -4658,6 +4695,12 @@ static const struct dis386 x86_64_table[][2] = {
{ VEX_LEN_TABLE (VEX_LEN_0F3849_X86_64) },
},
+ /* X86_64_VEX_0F384A */
+ {
+ { Bad_Opcode },
+ { MOD_TABLE (MOD_VEX_0F384A_X86_64) },
+ },
+
/* X86_64_VEX_0F384B */
{
{ Bad_Opcode },
@@ -4712,6 +4755,18 @@ static const struct dis386 x86_64_table[][2] = {
{ "%XEcmp%CCxadd", { Mdq, Gdq, VexGdq }, PREFIX_DATA },
},
+ /* X86_64_VEX_MAP5_F8 */
+ {
+ { Bad_Opcode },
+ { MOD_TABLE (MOD_VEX_MAP5_F8_X86_64) },
+ },
+
+ /* X86_64_VEX_MAP5_F9 */
+ {
+ { Bad_Opcode },
+ { MOD_TABLE (MOD_VEX_MAP5_F9_X86_64) },
+ },
+
/* X86_64_VEX_MAP5_FD */
{
{ Bad_Opcode },
@@ -6573,7 +6628,7 @@ static const struct dis386 vex_table[][256] = {
/* 48 */
{ X86_64_TABLE (X86_64_VEX_0F3848) },
{ X86_64_TABLE (X86_64_VEX_0F3849) },
- { Bad_Opcode },
+ { X86_64_TABLE (X86_64_VEX_0F384A) },
{ X86_64_TABLE (X86_64_VEX_0F384B) },
{ Bad_Opcode },
{ Bad_Opcode },
@@ -7351,8 +7406,8 @@ static const struct dis386 vex_table[][256] = {
{ Bad_Opcode },
{ Bad_Opcode },
/* f8 */
- { Bad_Opcode },
- { Bad_Opcode },
+ { X86_64_TABLE (X86_64_VEX_MAP5_F8) },
+ { X86_64_TABLE (X86_64_VEX_MAP5_F9) },
{ Bad_Opcode },
{ Bad_Opcode },
{ Bad_Opcode },
@@ -7552,6 +7607,11 @@ static const struct dis386 vex_len_table[][2] = {
{ VEX_W_TABLE (VEX_W_0F3849_X86_64_L_0) },
},
+ /* VEX_LEN_0F384A_X86_64_M_0 */
+ {
+ { VEX_W_TABLE (VEX_W_0F384A_X86_64_M_0_L_0) },
+ },
+
/* VEX_LEN_0F384B_X86_64 */
{
{ VEX_W_TABLE (VEX_W_0F384B_X86_64_L_0) },
@@ -7799,6 +7859,16 @@ static const struct dis386 vex_len_table[][2] = {
{ PREFIX_TABLE (PREFIX_VEX_0F3AF0_L_0) },
},
+ /* VEX_LEN_MAP5_F8_X86_64_M_0 */
+ {
+ { VEX_W_TABLE (VEX_W_MAP5_F8_X86_64_M_0_L_0) },
+ },
+
+ /* VEX_LEN_MAP5_F9_X86_64_M_0 */
+ {
+ { VEX_W_TABLE (VEX_W_MAP5_F9_X86_64_M_0_L_0) },
+ },
+
/* VEX_LEN_MAP5_FD_X86_64 */
{
{ VEX_W_TABLE (VEX_W_MAP5_FD_X86_64_L_0) },
@@ -8246,6 +8316,10 @@ static const struct dis386 vex_w_table[][2] = {
/* VEX_W_0F3849_X86_64_L_0 */
{ MOD_TABLE (MOD_VEX_0F3849_X86_64_L_0_W_0) },
},
+ {
+ /* VEX_W_0F384A_X86_64_M_0_L_0 */
+ { PREFIX_TABLE (PREFIX_VEX_0F384A_X86_64_M_0_L_0_W_0) },
+ },
{
/* VEX_W_0F384B_X86_64_L_0 */
{ PREFIX_TABLE (PREFIX_VEX_0F384B_X86_64_L_0_W_0) },
@@ -8440,6 +8514,14 @@ static const struct dis386 vex_w_table[][2] = {
/* VEX_W_0F3ADE */
{ VEX_LEN_TABLE (VEX_LEN_0F3ADE_W_0) },
},
+ {
+ /* VEX_W_MAP5_F8_X86_64_M_0 */
+ { PREFIX_TABLE (PREFIX_VEX_MAP5_F8_X86_64_M_0_L_0_W_0) },
+ },
+ {
+ /* VEX_W_MAP5_F9_X86_64_M_0 */
+ { PREFIX_TABLE (PREFIX_VEX_MAP5_F9_X86_64_M_0_L_0_W_0) },
+ },
{
/* VEX_W_MAP5_FD_X86_64 */
{ PREFIX_TABLE (PREFIX_VEX_MAP5_FD_X86_64_L_0_W_0) },
@@ -8804,6 +8886,10 @@ static const struct dis386 mod_table[][2] = {
{ PREFIX_TABLE (PREFIX_VEX_0F3849_X86_64_L_0_W_0_M_0) },
{ PREFIX_TABLE (PREFIX_VEX_0F3849_X86_64_L_0_W_0_M_1) },
},
+ {
+ /* MOD_VEX_0F384A_X86_64 */
+ { VEX_LEN_TABLE (VEX_LEN_0F384A_X86_64_M_0) },
+ },
{
/* MOD_VEX_0F386E_X86_64 */
{ VEX_LEN_TABLE (VEX_LEN_0F386E_X86_64_M_0) },
@@ -8812,6 +8898,14 @@ static const struct dis386 mod_table[][2] = {
/* MOD_VEX_0F386F_X86_64 */
{ VEX_LEN_TABLE (VEX_LEN_0F386F_X86_64_M_0) },
},
+ {
+ /* MOD_VEX_MAP5_F8_X86_64 */
+ { VEX_LEN_TABLE (VEX_LEN_MAP5_F8_X86_64_M_0) },
+ },
+ {
+ /* MOD_VEX_MAP5_F9_X86_64 */
+ { VEX_LEN_TABLE (VEX_LEN_MAP5_F9_X86_64_M_0) },
+ },
#include "i386-dis-evex-mod.h"
};
@@ -271,6 +271,8 @@ static const dependency isa_dependencies[] =
"AMX_TILE" },
{ "AMX_FP8",
"AMX_TILE" },
+ { "AMX_MOVRS",
+ "AMX_TILE" },
{ "KL",
"SSE2" },
{ "WIDEKL",
@@ -441,6 +443,7 @@ static bitfield cpu_flags[] =
BITFIELD (AMX_AVX512),
BITFIELD (AMX_TF32),
BITFIELD (AMX_FP8),
+ BITFIELD (AMX_MOVRS),
BITFIELD (AMX_TILE),
BITFIELD (MOVDIRI),
BITFIELD (MOVDIR64B),
@@ -258,6 +258,8 @@ enum i386_cpu
CpuAMX_TF32,
/* AMX-FP8 instructions required */
CpuAMX_FP8,
+ /* Intel AMX-MOVRS Instructions support required. */
+ CpuAMX_MOVRS,
/* AMX-TILE instructions required */
CpuAMX_TILE,
/* GFNI instructions required */
@@ -509,6 +511,7 @@ typedef union i386_cpu_flags
unsigned int cpuamx_avx512:1;
unsigned int cpuamx_tf32:1;
unsigned int cpuamx_fp8:1;
+ unsigned int cpuamx_movrs:1;
unsigned int cpuamx_tile:1;
unsigned int cpugfni:1;
unsigned int cpuvaes:1;
@@ -3197,6 +3197,11 @@ t2rpntlvwz0t1, 0x6f, AMX_TRANSPOSE, TMMPairOperand1|Sibmem|Vex128|Space0F38|VexW
t2rpntlvwz1, 0x666e, AMX_TRANSPOSE, TMMPairOperand1|Sibmem|Vex128|Space0F38|VexW0|NoSuf, { Unspecified|BaseIndex, RegTMM }
t2rpntlvwz1t1, 0x666f, AMX_TRANSPOSE, TMMPairOperand1|Sibmem|Vex128|Space0F38|VexW0|NoSuf, { Unspecified|BaseIndex, RegTMM }
+t2rpntlvwz0rs, 0xf8, AMX_MOVRS&AMX_TRANSPOSE, TMMPairOperand1|Sibmem|Vex128|xVexMap5|VexW0|NoSuf, { Unspecified|BaseIndex, RegTMM }
+t2rpntlvwz0rst1, 0xf9, AMX_MOVRS&AMX_TRANSPOSE, TMMPairOperand1|Sibmem|Vex128|xVexMap5|VexW0|NoSuf, { Unspecified|BaseIndex, RegTMM }
+t2rpntlvwz1rs, 0x66f8, AMX_MOVRS&AMX_TRANSPOSE, TMMPairOperand1|Sibmem|Vex128|xVexMap5|VexW0|NoSuf, { Unspecified|BaseIndex, RegTMM }
+t2rpntlvwz1rst1, 0x66f9, AMX_MOVRS&AMX_TRANSPOSE, TMMPairOperand1|Sibmem|Vex128|xVexMap5|VexW0|NoSuf, { Unspecified|BaseIndex, RegTMM }
+
tcmmimfp16ps, 0x666c, AMX_COMPLEX, Modrm|Vex128|Space0F38|Src2VVVV|VexW0|NoSuf, { RegTMM, RegTMM, RegTMM }
tcmmrlfp16ps, 0x6c, AMX_COMPLEX, Modrm|Vex128|Space0F38|Src2VVVV|VexW0|NoSuf, { RegTMM, RegTMM, RegTMM }
@@ -3230,6 +3235,8 @@ tdphf8ps, 0x66fd, AMX_FP8, Modrm|Vex128|xVexMap5|Src2VVVV|VexW0|NoSuf, { RegTMM,
tileloadd, 0xf24b, APX_F(AMX_TILE), Sibmem|Vex128|EVex128|Space0F38|VexW0|NoSuf, { Unspecified|BaseIndex, RegTMM }
tileloaddt1, 0x664b, APX_F(AMX_TILE), Sibmem|Vex128|EVex128|Space0F38|VexW0|NoSuf, { Unspecified|BaseIndex, RegTMM }
+tileloaddrs, 0xf24a, AMX_MOVRS, Sibmem|Vex128|Space0F38|VexW0|NoSuf, { Unspecified|BaseIndex, RegTMM }
+tileloaddrst1, 0x664a, AMX_MOVRS, Sibmem|Vex128|Space0F38|VexW0|NoSuf, { Unspecified|BaseIndex, RegTMM }
tilemovrow, 0x664a, AMX_AVX512, Modrm|EVex512|Space0F38|Src2VVVV|VexW0|NoSuf, { Reg32, RegTMM, RegZMM }
tilemovrow, 0x6607, AMX_AVX512, Modrm|EVex512|Space0F3A|VexW0|NoSuf, { Imm8, RegTMM, RegZMM }
tilestored, 0xf34b, APX_F(AMX_TILE), Sibmem|Vex128|EVex128|Space0F38|VexW0|NoSuf, { RegTMM, Unspecified|BaseIndex }