@@ -1185,6 +1185,7 @@ static const arch_entry cpu_arch[] =
SUBARCH (amx_transpose, AMX_TRANSPOSE, ANY_AMX_TRANSPOSE, false),
SUBARCH (amx_tf32, AMX_TF32, ANY_AMX_TF32, false),
SUBARCH (amx_fp8, AMX_FP8, ANY_AMX_FP8, false),
+ SUBARCH (amx_movrs, AMX_MOVRS, ANY_AMX_MOVRS, false),
SUBARCH (amx_tile, AMX_TILE, ANY_AMX_TILE, false),
SUBARCH (movdiri, MOVDIRI, MOVDIRI, false),
SUBARCH (movdir64b, MOVDIR64B, MOVDIR64B, false),
@@ -2250,7 +2251,8 @@ cpu_flags_match (const insn_template *t)
|| any.bitfield.cpuavx512f || any.bitfield.cpuavx512bw
|| any.bitfield.cpuavx512dq || any.bitfield.cpuamx_tile
|| any.bitfield.cpucmpccxadd || any.bitfield.cpuuser_msr
- || any.bitfield.cpumsr_imm || any.bitfield.cpuamx_transpose))
+ || any.bitfield.cpumsr_imm || any.bitfield.cpuamx_transpose
+ || any.bitfield.cpuamx_movrs))
{
/* These checks (verifying that APX_F() was properly used in the
opcode table entry) make sure there's no need for an "else" to
@@ -4055,7 +4057,8 @@ install_template (const insn_template *t)
|| maybe_cpu (t, CpuAVX512F) || maybe_cpu (t, CpuAVX512DQ)
|| maybe_cpu (t, CpuAVX512BW) || maybe_cpu (t, CpuBMI)
|| maybe_cpu (t, CpuBMI2) || maybe_cpu (t, CpuUSER_MSR)
- || maybe_cpu (t, CpuMSR_IMM) || maybe_cpu (t, CpuAMX_TRANSPOSE))
+ || maybe_cpu (t, CpuMSR_IMM) || maybe_cpu (t, CpuAMX_TRANSPOSE)
+ || maybe_cpu (t, CpuAMX_MOVRS))
&& maybe_cpu (t, CpuAPX_F))
{
if (need_evex_encoding (t))
@@ -232,6 +232,7 @@ accept various extension mnemonics. For example,
@code{amx_transpose},
@code{amx_tf32},
@code{amx_fp8}
+@code{amx_movrs},
@code{amx_tile},
@code{vmx},
@code{vmfunc},
@@ -1706,7 +1707,7 @@ supported on the CPU specified. The choices for @var{cpu_type} are:
@item @samp{.movdiri} @tab @samp{.movdir64b} @tab @samp{.enqcmd} @tab @samp{.tsxldtrk}
@item @samp{.amx_int8} @tab @samp{.amx_bf16} @tab @samp{.amx_fp16}
@item @samp{.amx_complex} @tab @samp{.amx_transpose} @tab @samp{.amx_tf32}
-@item @samp{.amx_fp8} @tab @samp{.amx_tile}
+@item @samp{.amx_fp8} @tab @samp{.amx_movrs} @tab @samp{.amx_tile}
@item @samp{.kl} @tab @samp{.widekl} @tab @samp{.uintr} @tab @samp{.hreset}
@item @samp{.3dnow} @tab @samp{.3dnowa} @tab @samp{.sse4a} @tab @samp{.sse5}
@item @samp{.syscall} @tab @samp{.rdtscp} @tab @samp{.svme}
new file mode 100644
@@ -0,0 +1,23 @@
+#objdump: -dw -Mintel
+#name: x86_64 AMX-MOVRS insns (Intel disassembly)
+#source: x86-64-amx-movrs.s
+
+.*: +file format .*
+
+Disassembly of section \.text:
+
+#...
+[a-f0-9]+ <_intel>:
+\s*[a-f0-9]+:\s*c4 a5 78 f8 b4 f5 00 00 00 10\s+t2rpntlvwz0rs tmm6,\[rbp\+r14\*8\+0x10000000\]
+\s*[a-f0-9]+:\s*c4 c5 78 f8 14 21\s+t2rpntlvwz0rs tmm2,\[r9\+riz\*1\]
+\s*[a-f0-9]+:\s*c4 a5 78 f9 b4 f5 00 00 00 10\s+t2rpntlvwz0rst1 tmm6,\[rbp\+r14\*8\+0x10000000\]
+\s*[a-f0-9]+:\s*c4 c5 78 f9 14 21\s+t2rpntlvwz0rst1 tmm2,\[r9\+riz\*1\]
+\s*[a-f0-9]+:\s*c4 a5 79 f8 b4 f5 00 00 00 10\s+t2rpntlvwz1rs tmm6,\[rbp\+r14\*8\+0x10000000\]
+\s*[a-f0-9]+:\s*c4 c5 79 f8 14 21\s+t2rpntlvwz1rs tmm2,\[r9\+riz\*1\]
+\s*[a-f0-9]+:\s*c4 a5 79 f9 b4 f5 00 00 00 10\s+t2rpntlvwz1rst1 tmm6,\[rbp\+r14\*8\+0x10000000\]
+\s*[a-f0-9]+:\s*c4 c5 79 f9 14 21\s+t2rpntlvwz1rst1 tmm2,\[r9\+riz\*1\]
+\s*[a-f0-9]+:\s*c4 a2 7b 4a b4 f5 00 00 00 10\s+tileloaddrs tmm6,\[rbp\+r14\*8\+0x10000000\]
+\s*[a-f0-9]+:\s*c4 c2 7b 4a 1c 21\s+tileloaddrs tmm3,\[r9\+riz\*1\]
+\s*[a-f0-9]+:\s*c4 a2 79 4a b4 f5 00 00 00 10\s+tileloaddrst1 tmm6,\[rbp\+r14\*8\+0x10000000\]
+\s*[a-f0-9]+:\s*c4 c2 79 4a 1c 21\s+tileloaddrst1 tmm3,\[r9\+riz\*1\]
+#pass
new file mode 100644
@@ -0,0 +1,13 @@
+.* Assembler messages:
+.*:5: Error: `\(%rip\)' cannot be used here
+.*:6: Error: `\(%rip\)' cannot be used here
+.*:7: Error: `\(%rip\)' cannot be used here
+.*:8: Error: `\(%rip\)' cannot be used here
+.*:9: Warning: operand 2 `%tmm1' implicitly denotes `%tmm0' to `%tmm1' group in `t2rpntlvwz0rs'
+.*:10: Warning: operand 2 `%tmm3' implicitly denotes `%tmm2' to `%tmm3' group in `t2rpntlvwz0rst1'
+.*:11: Warning: operand 2 `%tmm5' implicitly denotes `%tmm4' to `%tmm5' group in `t2rpntlvwz1rs'
+.*:12: Warning: operand 2 `%tmm7' implicitly denotes `%tmm6' to `%tmm7' group in `t2rpntlvwz1rst1'
+.*:16: Error: `t2rpntlvwz0rs' is not supported on `x86_64.noamx_transpose'
+.*:17: Error: `t2rpntlvwz0rst1' is not supported on `x86_64.noamx_transpose'
+.*:18: Error: `t2rpntlvwz1rs' is not supported on `x86_64.noamx_transpose'
+.*:19: Error: `t2rpntlvwz1rst1' is not supported on `x86_64.noamx_transpose'
new file mode 100644
@@ -0,0 +1,19 @@
+# Check Invalid 64bit AMX-MOVRS instructions
+
+ .text
+_start:
+ t2rpntlvwz0rs (%rip), %tmm2
+ t2rpntlvwz0rst1 (%rip), %tmm2
+ t2rpntlvwz1rs (%rip), %tmm2
+ t2rpntlvwz1rst1 (%rip), %tmm2
+ t2rpntlvwz0rs (%r9), %tmm1
+ t2rpntlvwz0rst1 (%r9), %tmm3
+ t2rpntlvwz1rs (%r9), %tmm5
+ t2rpntlvwz1rst1 (%r9), %tmm7
+
+ .arch .noamx_transpose
+_transpose:
+ t2rpntlvwz0rs (%r9), %tmm2
+ t2rpntlvwz0rst1 (%r9), %tmm2
+ t2rpntlvwz1rs (%r9), %tmm2
+ t2rpntlvwz1rst1 (%r9), %tmm2
new file mode 100644
@@ -0,0 +1,21 @@
+#objdump: -dw
+#name: x86_64 AMX-MOVRS insns
+
+.*: +file format .*
+
+Disassembly of section \.text:
+
+0+ <_start>:
+\s*[a-f0-9]+:\s*c4 a5 78 f8 b4 f5 00 00 00 10\s+t2rpntlvwz0rs 0x10000000\(%rbp,%r14,8\),%tmm6
+\s*[a-f0-9]+:\s*c4 c5 78 f8 14 21\s+t2rpntlvwz0rs \(%r9,%riz,1\),%tmm2
+\s*[a-f0-9]+:\s*c4 a5 78 f9 b4 f5 00 00 00 10\s+t2rpntlvwz0rst1 0x10000000\(%rbp,%r14,8\),%tmm6
+\s*[a-f0-9]+:\s*c4 c5 78 f9 14 21\s+t2rpntlvwz0rst1 \(%r9,%riz,1\),%tmm2
+\s*[a-f0-9]+:\s*c4 a5 79 f8 b4 f5 00 00 00 10\s+t2rpntlvwz1rs 0x10000000\(%rbp,%r14,8\),%tmm6
+\s*[a-f0-9]+:\s*c4 c5 79 f8 14 21\s+t2rpntlvwz1rs \(%r9,%riz,1\),%tmm2
+\s*[a-f0-9]+:\s*c4 a5 79 f9 b4 f5 00 00 00 10\s+t2rpntlvwz1rst1 0x10000000\(%rbp,%r14,8\),%tmm6
+\s*[a-f0-9]+:\s*c4 c5 79 f9 14 21\s+t2rpntlvwz1rst1 \(%r9,%riz,1\),%tmm2
+\s*[a-f0-9]+:\s*c4 a2 7b 4a b4 f5 00 00 00 10\s+tileloaddrs 0x10000000\(%rbp,%r14,8\),%tmm6
+\s*[a-f0-9]+:\s*c4 c2 7b 4a 1c 21\s+tileloaddrs \(%r9,%riz,1\),%tmm3
+\s*[a-f0-9]+:\s*c4 a2 79 4a b4 f5 00 00 00 10\s+tileloaddrst1 0x10000000\(%rbp,%r14,8\),%tmm6
+\s*[a-f0-9]+:\s*c4 c2 79 4a 1c 21\s+tileloaddrst1 \(%r9,%riz,1\),%tmm3
+#pass
new file mode 100644
@@ -0,0 +1,31 @@
+# Check 64bit AMX-MOVRS instructions
+
+ .text
+_start:
+ t2rpntlvwz0rs 0x10000000(%rbp, %r14, 8), %tmm6
+ t2rpntlvwz0rs (%r9), %tmm2
+ t2rpntlvwz0rst1 0x10000000(%rbp, %r14, 8), %tmm6
+ t2rpntlvwz0rst1 (%r9), %tmm2
+ t2rpntlvwz1rs 0x10000000(%rbp, %r14, 8), %tmm6
+ t2rpntlvwz1rs (%r9), %tmm2
+ t2rpntlvwz1rst1 0x10000000(%rbp, %r14, 8), %tmm6
+ t2rpntlvwz1rst1 (%r9), %tmm2
+ tileloaddrs 0x10000000(%rbp, %r14, 8), %tmm6
+ tileloaddrs (%r9), %tmm3
+ tileloaddrst1 0x10000000(%rbp, %r14, 8), %tmm6
+ tileloaddrst1 (%r9), %tmm3
+
+_intel:
+ .intel_syntax noprefix
+ t2rpntlvwz0rs tmm6, [rbp+r14*8+0x10000000]
+ t2rpntlvwz0rs tmm2, [r9]
+ t2rpntlvwz0rst1 tmm6, [rbp+r14*8+0x10000000]
+ t2rpntlvwz0rst1 tmm2, [r9]
+ t2rpntlvwz1rs tmm6, [rbp+r14*8+0x10000000]
+ t2rpntlvwz1rs tmm2, [r9]
+ t2rpntlvwz1rst1 tmm6, [rbp+r14*8+0x10000000]
+ t2rpntlvwz1rst1 tmm2, [r9]
+ tileloaddrs tmm6, [rbp+r14*8+0x10000000]
+ tileloaddrs tmm3, [r9]
+ tileloaddrst1 tmm6, [rbp+r14*8+0x10000000]
+ tileloaddrst1 tmm3, [r9]
@@ -141,11 +141,19 @@ Disassembly of section \.text:
[ ]*[a-f0-9]+:[ ]*62 da 7d 08 49 84 87 23 01 00 00[ ]+sttilecfg[ ]+\[r31\+rax\*4\+0x123\]
[ ]*[a-f0-9]+:[ ]*62 da 7f 08 4b b4 87 23 01 00 00[ ]+tileloadd tmm6,\[r31\+rax\*4\+0x123\]
[ ]*[a-f0-9]+:[ ]*62 da 7d 08 4b b4 87 23 01 00 00[ ]+tileloaddt1 tmm6,\[r31\+rax\*4\+0x123\]
+[ ]*[a-f0-9]+:[ ]*62 b2 7b 08 4a b4 fd 00 00 00 10[ ]+tileloaddrs[ ]+tmm6,\[rbp\+r31\*8\+0x10000000\]
+[ ]*[a-f0-9]+:[ ]*62 fa 7f 08 4a 1c 20[ ]+tileloaddrs[ ]+tmm3,\[r16\+riz\*1\]
+[ ]*[a-f0-9]+:[ ]*62 9a 7d 08 4a b4 f7 00 00 00 10[ ]+tileloaddrst1[ ]+tmm6,\[r31\+r14\*8\+0x10000000\]
+[ ]*[a-f0-9]+:[ ]*62 fa 7d 08 4a 1c 20[ ]+tileloaddrst1[ ]+tmm3,\[r16\+riz\*1\]
[ ]*[a-f0-9]+:[ ]*62 da 7e 08 4b b4 87 23 01 00 00[ ]+tilestored[ ]+\[r31\+rax\*4\+0x123\],tmm6
[ ]*[a-f0-9]+:[ ]*62 da 7c 08 6e b4 c7 23 01 00 00[ ]+t2rpntlvwz0 tmm6,\[r31\+rax\*8\+0x123\]
[ ]*[a-f0-9]+:[ ]*62 da 7c 08 6f b4 c7 23 01 00 00[ ]+t2rpntlvwz0t1 tmm6,\[r31\+rax\*8\+0x123\]
[ ]*[a-f0-9]+:[ ]*62 da 7d 08 6e b4 c7 23 01 00 00[ ]+t2rpntlvwz1 tmm6,\[r31\+rax\*8\+0x123\]
[ ]*[a-f0-9]+:[ ]*62 da 7d 08 6f b4 c7 23 01 00 00[ ]+t2rpntlvwz1t1 tmm6,\[r31\+rax\*8\+0x123\]
+[ ]*[a-f0-9]+:[ ]*62 dd 7c 08 f8 b4 c7 23 01 00 00[ ]+t2rpntlvwz0rs tmm6,\[r31\+rax\*8\+0x123\]
+[ ]*[a-f0-9]+:[ ]*62 dd 7c 08 f9 b4 c7 23 01 00 00[ ]+t2rpntlvwz0rst1 tmm6,\[r31\+rax\*8\+0x123\]
+[ ]*[a-f0-9]+:[ ]*62 dd 7d 08 f8 b4 c7 23 01 00 00[ ]+t2rpntlvwz1rs tmm6,\[r31\+rax\*8\+0x123\]
+[ ]*[a-f0-9]+:[ ]*62 dd 7d 08 f9 b4 c7 23 01 00 00[ ]+t2rpntlvwz1rst1 tmm6,\[r31\+rax\*8\+0x123\]
[ ]*[a-f0-9]+:[ ]*62 4c 7c 08 66 8c 87 23 01 00 00[ ]+wrssd[ ]+\[r31\+rax\*4\+0x123\],r25d
[ ]*[a-f0-9]+:[ ]*62 4c fc 08 66 bc 87 23 01 00 00[ ]+wrssq[ ]+\[r31\+rax\*4\+0x123\],r31
[ ]*[a-f0-9]+:[ ]*62 4c 7d 08 65 8c 87 23 01 00 00[ ]+wrussd[ ]+\[r31\+rax\*4\+0x123\],r25d
@@ -280,11 +288,19 @@ Disassembly of section \.text:
[ ]*[a-f0-9]+:[ ]*62 da 7d 08 49 84 87 23 01 00 00[ ]+sttilecfg[ ]+\[r31\+rax\*4\+0x123\]
[ ]*[a-f0-9]+:[ ]*62 da 7f 08 4b b4 87 23 01 00 00[ ]+tileloadd tmm6,\[r31\+rax\*4\+0x123\]
[ ]*[a-f0-9]+:[ ]*62 da 7d 08 4b b4 87 23 01 00 00[ ]+tileloaddt1 tmm6,\[r31\+rax\*4\+0x123\]
+[ ]*[a-f0-9]+:[ ]*62 b2 7b 08 4a b4 fd 00 00 00 10[ ]+tileloaddrs[ ]+tmm6,\[rbp\+r31\*8\+0x10000000\]
+[ ]*[a-f0-9]+:[ ]*62 fa 7f 08 4a 1c 20[ ]+tileloaddrs[ ]+tmm3,\[r16\+riz\*1\]
+[ ]*[a-f0-9]+:[ ]*62 9a 7d 08 4a b4 f7 00 00 00 10[ ]+tileloaddrst1[ ]+tmm6,\[r31\+r14\*8\+0x10000000\]
+[ ]*[a-f0-9]+:[ ]*62 fa 7d 08 4a 1c 20[ ]+tileloaddrst1[ ]+tmm3,\[r16\+riz\*1\]
[ ]*[a-f0-9]+:[ ]*62 da 7e 08 4b b4 87 23 01 00 00[ ]+tilestored[ ]+\[r31\+rax\*4\+0x123\],tmm6
[ ]*[a-f0-9]+:[ ]*62 da 7c 08 6e b4 c7 23 01 00 00[ ]+t2rpntlvwz0 tmm6,\[r31\+rax\*8\+0x123\]
[ ]*[a-f0-9]+:[ ]*62 da 7c 08 6f b4 c7 23 01 00 00[ ]+t2rpntlvwz0t1 tmm6,\[r31\+rax\*8\+0x123\]
[ ]*[a-f0-9]+:[ ]*62 da 7d 08 6e b4 c7 23 01 00 00[ ]+t2rpntlvwz1 tmm6,\[r31\+rax\*8\+0x123\]
[ ]*[a-f0-9]+:[ ]*62 da 7d 08 6f b4 c7 23 01 00 00[ ]+t2rpntlvwz1t1 tmm6,\[r31\+rax\*8\+0x123\]
+[ ]*[a-f0-9]+:[ ]*62 dd 7c 08 f8 b4 c7 23 01 00 00[ ]+t2rpntlvwz0rs tmm6,\[r31\+rax\*8\+0x123\]
+[ ]*[a-f0-9]+:[ ]*62 dd 7c 08 f9 b4 c7 23 01 00 00[ ]+t2rpntlvwz0rst1 tmm6,\[r31\+rax\*8\+0x123\]
+[ ]*[a-f0-9]+:[ ]*62 dd 7d 08 f8 b4 c7 23 01 00 00[ ]+t2rpntlvwz1rs tmm6,\[r31\+rax\*8\+0x123\]
+[ ]*[a-f0-9]+:[ ]*62 dd 7d 08 f9 b4 c7 23 01 00 00[ ]+t2rpntlvwz1rst1 tmm6,\[r31\+rax\*8\+0x123\]
[ ]*[a-f0-9]+:[ ]*62 4c 7c 08 66 8c 87 23 01 00 00[ ]+wrssd[ ]+\[r31\+rax\*4\+0x123\],r25d
[ ]*[a-f0-9]+:[ ]*62 4c fc 08 66 bc 87 23 01 00 00[ ]+wrssq[ ]+\[r31\+rax\*4\+0x123\],r31
[ ]*[a-f0-9]+:[ ]*62 4c 7d 08 65 8c 87 23 01 00 00[ ]+wrussd[ ]+\[r31\+rax\*4\+0x123\],r25d
@@ -141,11 +141,19 @@ Disassembly of section \.text:
[ ]*[a-f0-9]+:[ ]*62 da 7d 08 49 84 87 23 01 00 00[ ]+sttilecfg[ ]+0x123\(%r31,%rax,4\)
[ ]*[a-f0-9]+:[ ]*62 da 7f 08 4b b4 87 23 01 00 00[ ]+tileloadd[ ]+0x123\(%r31,%rax,4\),%tmm6
[ ]*[a-f0-9]+:[ ]*62 da 7d 08 4b b4 87 23 01 00 00[ ]+tileloaddt1[ ]+0x123\(%r31,%rax,4\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 b2 7b 08 4a b4 fd 00 00 00 10[ ]+tileloaddrs[ ]+0x10000000\(%rbp,%r31,8\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 fa 7f 08 4a 1c 20[ ]+tileloaddrs[ ]+\(%r16,%riz,1\),%tmm3
+[ ]*[a-f0-9]+:[ ]*62 9a 7d 08 4a b4 f7 00 00 00 10[ ]+tileloaddrst1[ ]+0x10000000\(%r31,%r14,8\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 fa 7d 08 4a 1c 20[ ]+tileloaddrst1[ ]+\(%r16,%riz,1\),%tmm3
[ ]*[a-f0-9]+:[ ]*62 da 7e 08 4b b4 87 23 01 00 00[ ]+tilestored[ ]+%tmm6,0x123\(%r31,%rax,4\)
[ ]*[a-f0-9]+:[ ]*62 da 7c 08 6e b4 c7 23 01 00 00[ ]+t2rpntlvwz0[ ]+0x123\(%r31,%rax,8\),%tmm6
[ ]*[a-f0-9]+:[ ]*62 da 7c 08 6f b4 c7 23 01 00 00[ ]+t2rpntlvwz0t1[ ]+0x123\(%r31,%rax,8\),%tmm6
[ ]*[a-f0-9]+:[ ]*62 da 7d 08 6e b4 c7 23 01 00 00[ ]+t2rpntlvwz1[ ]+0x123\(%r31,%rax,8\),%tmm6
[ ]*[a-f0-9]+:[ ]*62 da 7d 08 6f b4 c7 23 01 00 00[ ]+t2rpntlvwz1t1[ ]+0x123\(%r31,%rax,8\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 dd 7c 08 f8 b4 c7 23 01 00 00[ ]+t2rpntlvwz0rs[ ]+0x123\(%r31,%rax,8\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 dd 7c 08 f9 b4 c7 23 01 00 00[ ]+t2rpntlvwz0rst1[ ]+0x123\(%r31,%rax,8\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 dd 7d 08 f8 b4 c7 23 01 00 00[ ]+t2rpntlvwz1rs[ ]+0x123\(%r31,%rax,8\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 dd 7d 08 f9 b4 c7 23 01 00 00[ ]+t2rpntlvwz1rst1[ ]+0x123\(%r31,%rax,8\),%tmm6
[ ]*[a-f0-9]+:[ ]*62 4c 7c 08 66 8c 87 23 01 00 00[ ]+wrssd[ ]+%r25d,0x123\(%r31,%rax,4\)
[ ]*[a-f0-9]+:[ ]*62 4c fc 08 66 bc 87 23 01 00 00[ ]+wrssq[ ]+%r31,0x123\(%r31,%rax,4\)
[ ]*[a-f0-9]+:[ ]*62 4c 7d 08 65 8c 87 23 01 00 00[ ]+wrussd[ ]+%r25d,0x123\(%r31,%rax,4\)
@@ -280,11 +288,19 @@ Disassembly of section \.text:
[ ]*[a-f0-9]+:[ ]*62 da 7d 08 49 84 87 23 01 00 00[ ]+sttilecfg[ ]+0x123\(%r31,%rax,4\)
[ ]*[a-f0-9]+:[ ]*62 da 7f 08 4b b4 87 23 01 00 00[ ]+tileloadd[ ]+0x123\(%r31,%rax,4\),%tmm6
[ ]*[a-f0-9]+:[ ]*62 da 7d 08 4b b4 87 23 01 00 00[ ]+tileloaddt1[ ]+0x123\(%r31,%rax,4\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 b2 7b 08 4a b4 fd 00 00 00 10[ ]+tileloaddrs[ ]+0x10000000\(%rbp,%r31,8\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 fa 7f 08 4a 1c 20[ ]+tileloaddrs[ ]+\(%r16,%riz,1\),%tmm3
+[ ]*[a-f0-9]+:[ ]*62 9a 7d 08 4a b4 f7 00 00 00 10[ ]+tileloaddrst1[ ]+0x10000000\(%r31,%r14,8\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 fa 7d 08 4a 1c 20[ ]+tileloaddrst1[ ]+\(%r16,%riz,1\),%tmm3
[ ]*[a-f0-9]+:[ ]*62 da 7e 08 4b b4 87 23 01 00 00[ ]+tilestored[ ]+%tmm6,0x123\(%r31,%rax,4\)
[ ]*[a-f0-9]+:[ ]*62 da 7c 08 6e b4 c7 23 01 00 00[ ]+t2rpntlvwz0[ ]+0x123\(%r31,%rax,8\),%tmm6
[ ]*[a-f0-9]+:[ ]*62 da 7c 08 6f b4 c7 23 01 00 00[ ]+t2rpntlvwz0t1[ ]+0x123\(%r31,%rax,8\),%tmm6
[ ]*[a-f0-9]+:[ ]*62 da 7d 08 6e b4 c7 23 01 00 00[ ]+t2rpntlvwz1[ ]+0x123\(%r31,%rax,8\),%tmm6
[ ]*[a-f0-9]+:[ ]*62 da 7d 08 6f b4 c7 23 01 00 00[ ]+t2rpntlvwz1t1[ ]+0x123\(%r31,%rax,8\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 dd 7c 08 f8 b4 c7 23 01 00 00[ ]+t2rpntlvwz0rs[ ]+0x123\(%r31,%rax,8\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 dd 7c 08 f9 b4 c7 23 01 00 00[ ]+t2rpntlvwz0rst1[ ]+0x123\(%r31,%rax,8\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 dd 7d 08 f8 b4 c7 23 01 00 00[ ]+t2rpntlvwz1rs[ ]+0x123\(%r31,%rax,8\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 dd 7d 08 f9 b4 c7 23 01 00 00[ ]+t2rpntlvwz1rst1[ ]+0x123\(%r31,%rax,8\),%tmm6
[ ]*[a-f0-9]+:[ ]*62 4c 7c 08 66 8c 87 23 01 00 00[ ]+wrssd[ ]+%r25d,0x123\(%r31,%rax,4\)
[ ]*[a-f0-9]+:[ ]*62 4c fc 08 66 bc 87 23 01 00 00[ ]+wrssq[ ]+%r31,0x123\(%r31,%rax,4\)
[ ]*[a-f0-9]+:[ ]*62 4c 7d 08 65 8c 87 23 01 00 00[ ]+wrussd[ ]+%r25d,0x123\(%r31,%rax,4\)
@@ -141,11 +141,19 @@ Disassembly of section \.text:
[ ]*[a-f0-9]+:[ ]*62 da 7d 08 49 84 87 23 01 00 00[ ]+sttilecfg[ ]+0x123\(%r31,%rax,4\)
[ ]*[a-f0-9]+:[ ]*62 da 7f 08 4b b4 87 23 01 00 00[ ]+tileloadd[ ]+0x123\(%r31,%rax,4\),%tmm6
[ ]*[a-f0-9]+:[ ]*62 da 7d 08 4b b4 87 23 01 00 00[ ]+tileloaddt1[ ]+0x123\(%r31,%rax,4\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 b2 7b 08 4a b4 fd 00 00 00 10[ ]+tileloaddrs[ ]+0x10000000\(%rbp,%r31,8\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 fa 7f 08 4a 1c 20[ ]+tileloaddrs[ ]+\(%r16,%riz,1\),%tmm3
+[ ]*[a-f0-9]+:[ ]*62 9a 7d 08 4a b4 f7 00 00 00 10[ ]+tileloaddrst1[ ]+0x10000000\(%r31,%r14,8\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 fa 7d 08 4a 1c 20[ ]+tileloaddrst1[ ]+\(%r16,%riz,1\),%tmm3
[ ]*[a-f0-9]+:[ ]*62 da 7e 08 4b b4 87 23 01 00 00[ ]+tilestored[ ]+%tmm6,0x123\(%r31,%rax,4\)
[ ]*[a-f0-9]+:[ ]*62 da 7c 08 6e b4 c7 23 01 00 00[ ]+t2rpntlvwz0[ ]+0x123\(%r31,%rax,8\),%tmm6
[ ]*[a-f0-9]+:[ ]*62 da 7c 08 6f b4 c7 23 01 00 00[ ]+t2rpntlvwz0t1[ ]+0x123\(%r31,%rax,8\),%tmm6
[ ]*[a-f0-9]+:[ ]*62 da 7d 08 6e b4 c7 23 01 00 00[ ]+t2rpntlvwz1[ ]+0x123\(%r31,%rax,8\),%tmm6
[ ]*[a-f0-9]+:[ ]*62 da 7d 08 6f b4 c7 23 01 00 00[ ]+t2rpntlvwz1t1[ ]+0x123\(%r31,%rax,8\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 dd 7c 08 f8 b4 c7 23 01 00 00[ ]+t2rpntlvwz0rs[ ]+0x123\(%r31,%rax,8\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 dd 7c 08 f9 b4 c7 23 01 00 00[ ]+t2rpntlvwz0rst1[ ]+0x123\(%r31,%rax,8\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 dd 7d 08 f8 b4 c7 23 01 00 00[ ]+t2rpntlvwz1rs[ ]+0x123\(%r31,%rax,8\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 dd 7d 08 f9 b4 c7 23 01 00 00[ ]+t2rpntlvwz1rst1[ ]+0x123\(%r31,%rax,8\),%tmm6
[ ]*[a-f0-9]+:[ ]*62 4c 7c 08 66 8c 87 23 01 00 00[ ]+wrssd[ ]+%r25d,0x123\(%r31,%rax,4\)
[ ]*[a-f0-9]+:[ ]*62 4c fc 08 66 bc 87 23 01 00 00[ ]+wrssq[ ]+%r31,0x123\(%r31,%rax,4\)
[ ]*[a-f0-9]+:[ ]*62 4c 7d 08 65 8c 87 23 01 00 00[ ]+wrussd[ ]+%r25d,0x123\(%r31,%rax,4\)
@@ -280,11 +288,19 @@ Disassembly of section \.text:
[ ]*[a-f0-9]+:[ ]*62 da 7d 08 49 84 87 23 01 00 00[ ]+sttilecfg[ ]+0x123\(%r31,%rax,4\)
[ ]*[a-f0-9]+:[ ]*62 da 7f 08 4b b4 87 23 01 00 00[ ]+tileloadd[ ]+0x123\(%r31,%rax,4\),%tmm6
[ ]*[a-f0-9]+:[ ]*62 da 7d 08 4b b4 87 23 01 00 00[ ]+tileloaddt1[ ]+0x123\(%r31,%rax,4\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 b2 7b 08 4a b4 fd 00 00 00 10[ ]+tileloaddrs[ ]+0x10000000\(%rbp,%r31,8\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 fa 7f 08 4a 1c 20[ ]+tileloaddrs[ ]+\(%r16,%riz,1\),%tmm3
+[ ]*[a-f0-9]+:[ ]*62 9a 7d 08 4a b4 f7 00 00 00 10[ ]+tileloaddrst1[ ]+0x10000000\(%r31,%r14,8\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 fa 7d 08 4a 1c 20[ ]+tileloaddrst1[ ]+\(%r16,%riz,1\),%tmm3
[ ]*[a-f0-9]+:[ ]*62 da 7e 08 4b b4 87 23 01 00 00[ ]+tilestored[ ]+%tmm6,0x123\(%r31,%rax,4\)
[ ]*[a-f0-9]+:[ ]*62 da 7c 08 6e b4 c7 23 01 00 00[ ]+t2rpntlvwz0[ ]+0x123\(%r31,%rax,8\),%tmm6
[ ]*[a-f0-9]+:[ ]*62 da 7c 08 6f b4 c7 23 01 00 00[ ]+t2rpntlvwz0t1[ ]+0x123\(%r31,%rax,8\),%tmm6
[ ]*[a-f0-9]+:[ ]*62 da 7d 08 6e b4 c7 23 01 00 00[ ]+t2rpntlvwz1[ ]+0x123\(%r31,%rax,8\),%tmm6
[ ]*[a-f0-9]+:[ ]*62 da 7d 08 6f b4 c7 23 01 00 00[ ]+t2rpntlvwz1t1[ ]+0x123\(%r31,%rax,8\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 dd 7c 08 f8 b4 c7 23 01 00 00[ ]+t2rpntlvwz0rs[ ]+0x123\(%r31,%rax,8\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 dd 7c 08 f9 b4 c7 23 01 00 00[ ]+t2rpntlvwz0rst1[ ]+0x123\(%r31,%rax,8\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 dd 7d 08 f8 b4 c7 23 01 00 00[ ]+t2rpntlvwz1rs[ ]+0x123\(%r31,%rax,8\),%tmm6
+[ ]*[a-f0-9]+:[ ]*62 dd 7d 08 f9 b4 c7 23 01 00 00[ ]+t2rpntlvwz1rst1[ ]+0x123\(%r31,%rax,8\),%tmm6
[ ]*[a-f0-9]+:[ ]*62 4c 7c 08 66 8c 87 23 01 00 00[ ]+wrssd[ ]+%r25d,0x123\(%r31,%rax,4\)
[ ]*[a-f0-9]+:[ ]*62 4c fc 08 66 bc 87 23 01 00 00[ ]+wrssq[ ]+%r31,0x123\(%r31,%rax,4\)
[ ]*[a-f0-9]+:[ ]*62 4c 7d 08 65 8c 87 23 01 00 00[ ]+wrussd[ ]+%r25d,0x123\(%r31,%rax,4\)
@@ -135,11 +135,19 @@ _start:
sttilecfg 0x123(%r31,%rax,4)
tileloadd 0x123(%r31,%rax,4),%tmm6
tileloaddt1 0x123(%r31,%rax,4),%tmm6
+ tileloaddrs 0x10000000(%rbp, %r31, 8), %tmm6
+ tileloaddrs (%r16), %tmm3
+ tileloaddrst1 0x10000000(%r31, %r14, 8), %tmm6
+ tileloaddrst1 (%r16), %tmm3
tilestored %tmm6,0x123(%r31,%rax,4)
t2rpntlvwz0 0x123(%r31,%rax,8),%tmm6
t2rpntlvwz0t1 0x123(%r31,%rax,8),%tmm6
t2rpntlvwz1 0x123(%r31,%rax,8),%tmm6
t2rpntlvwz1t1 0x123(%r31,%rax,8),%tmm6
+ t2rpntlvwz0rs 0x123(%r31,%rax,8),%tmm6
+ t2rpntlvwz0rst1 0x123(%r31,%rax,8),%tmm6
+ t2rpntlvwz1rs 0x123(%r31,%rax,8),%tmm6
+ t2rpntlvwz1rst1 0x123(%r31,%rax,8),%tmm6
wrssd %r25d,0x123(%r31,%rax,4)
wrssq %r31,0x123(%r31,%rax,4)
wrussd %r25d,0x123(%r31,%rax,4)
@@ -276,11 +284,19 @@ _start:
sttilecfg [r31+rax*4+0x123]
tileloadd tmm6,[r31+rax*4+0x123]
tileloaddt1 tmm6,[r31+rax*4+0x123]
+ tileloaddrs tmm6, [rbp+r31*8+0x10000000]
+ tileloaddrs tmm3, [r16]
+ tileloaddrst1 tmm6, [r31+r14*8+0x10000000]
+ tileloaddrst1 tmm3, [r16]
tilestored [r31+rax*4+0x123],tmm6
t2rpntlvwz0 tmm6,[r31+rax*8+0x123]
t2rpntlvwz0t1 tmm6,[r31+rax*8+0x123]
t2rpntlvwz1 tmm6,[r31+rax*8+0x123]
t2rpntlvwz1t1 tmm6,[r31+rax*8+0x123]
+ t2rpntlvwz0rs tmm6,[r31+rax*8+0x123]
+ t2rpntlvwz0rst1 tmm6,[r31+rax*8+0x123]
+ t2rpntlvwz1rs tmm6,[r31+rax*8+0x123]
+ t2rpntlvwz1rst1 tmm6,[r31+rax*8+0x123]
wrssd DWORD PTR [r31+rax*4+0x123],r25d
wrssq QWORD PTR [r31+rax*4+0x123],r31
wrussd DWORD PTR [r31+rax*4+0x123],r25d
@@ -535,6 +535,9 @@ run_dump_test "x86-64-amx-fp8"
run_dump_test "x86-64-amx-fp8-intel"
run_list_test "x86-64-amx-fp8-inval"
run_dump_test "x86-64-amx-fp8-bad"
+run_dump_test "x86-64-amx-movrs"
+run_dump_test "x86-64-amx-movrs-intel"
+run_list_test "x86-64-amx-movrs-inval"
run_dump_test "x86-64-movrs"
run_dump_test "x86-64-movrs-intel"
run_dump_test "x86-64-movrs-avx10_2-512"
@@ -44,6 +44,11 @@ static const struct dis386 evex_len_table[][3] = {
{ "vperm%DQ", { XM, Vex, EXx }, PREFIX_DATA },
},
+ /* EVEX_LEN_0F384A_X86_64_W_0 */
+ {
+ { X86_64_EVEX_PFX_TABLE (PREFIX_VEX_0F384A_X86_64_W_0_L_0) },
+ },
+
/* EVEX_LEN_0F385A */
{
{ Bad_Opcode },
@@ -346,6 +346,10 @@
{
{ "vpbroadcastmw2dY", { XM, MaskR }, 0 },
},
+ /* EVEX_W_0F384A_X86_64 */
+ {
+ { EVEX_LEN_TABLE (EVEX_LEN_0F384A_X86_64_W_0) },
+ },
/* EVEX_W_0F3859 */
{
{ "vbroadcasti32x2", { XM, EXq }, PREFIX_DATA },
@@ -1,3 +1,8 @@
+ /* X86_64_EVEX_0F384A */
+ {
+ { Bad_Opcode },
+ { VEX_W_TABLE (EVEX_W_0F384A_X86_64) },
+ },
/* X86_64_EVEX_MAP5_6F_M_0 */
{
{ Bad_Opcode },
@@ -376,7 +376,7 @@ static const struct dis386 evex_table[][256] = {
/* 48 */
{ Bad_Opcode },
{ X86_64_EVEX_MEM_W_TABLE (VEX_W_0F3849_X86_64_L_0) },
- { Bad_Opcode },
+ { X86_64_TABLE (X86_64_EVEX_0F384A) },
{ X86_64_EVEX_MEM_W_TABLE (VEX_W_0F384B_X86_64_L_0) },
{ "vrcp14p%XW", { XM, EXx }, PREFIX_DATA },
{ "vrcp14s%XW", { XMScalar, VexScalar, EXdq }, PREFIX_DATA },
@@ -1445,8 +1445,8 @@ static const struct dis386 evex_table[][256] = {
{ Bad_Opcode },
{ Bad_Opcode },
/* F8 */
- { Bad_Opcode },
- { Bad_Opcode },
+ { X86_64_EVEX_FROM_VEX_TABLE (X86_64_VEX_MAP5_F8) },
+ { X86_64_EVEX_FROM_VEX_TABLE (X86_64_VEX_MAP5_F9) },
{ Bad_Opcode },
{ Bad_Opcode },
{ Bad_Opcode },
@@ -968,6 +968,8 @@ enum
MOD_VEX_0F3849_X86_64_L_0_W_0,
MOD_VEX_0F386E_X86_64,
MOD_VEX_0F386F_X86_64,
+ MOD_VEX_MAP5_F8_X86_64,
+ MOD_VEX_MAP5_F9_X86_64,
MOD_EVEX_MAP4_60,
MOD_EVEX_MAP4_61,
@@ -1141,6 +1143,7 @@ enum
PREFIX_VEX_0F3848_X86_64_L_0_W_0,
PREFIX_VEX_0F3849_X86_64_L_0_W_0_M_0,
PREFIX_VEX_0F3849_X86_64_L_0_W_0_M_1,
+ PREFIX_VEX_0F384A_X86_64_W_0_L_0,
PREFIX_VEX_0F384B_X86_64_L_0_W_0,
PREFIX_VEX_0F3850_W_0,
PREFIX_VEX_0F3851_W_0,
@@ -1166,6 +1169,8 @@ enum
PREFIX_VEX_0F38F6_L_0,
PREFIX_VEX_0F38F7_L_0,
PREFIX_VEX_0F3AF0_L_0,
+ PREFIX_VEX_MAP5_F8_X86_64_M_0_L_0_W_0,
+ PREFIX_VEX_MAP5_F9_X86_64_M_0_L_0_W_0,
PREFIX_VEX_MAP5_FD_X86_64_L_0_W_0,
PREFIX_VEX_MAP7_F6_L_0_W_0_R_0_X86_64,
PREFIX_VEX_MAP7_F8_L_0_W_0_R_0_X86_64,
@@ -1361,6 +1366,7 @@ enum
X86_64_VEX_0F3848,
X86_64_VEX_0F3849,
+ X86_64_VEX_0F384A,
X86_64_VEX_0F384B,
X86_64_VEX_0F385C,
X86_64_VEX_0F385E,
@@ -1371,10 +1377,14 @@ enum
X86_64_VEX_0F386F,
X86_64_VEX_0F38Ex,
+ X86_64_VEX_MAP5_F8,
+ X86_64_VEX_MAP5_F9,
X86_64_VEX_MAP5_FD,
X86_64_VEX_MAP7_F6_L_0_W_0_R_0,
X86_64_VEX_MAP7_F8_L_0_W_0_R_0,
+ X86_64_EVEX_0F384A,
+
X86_64_EVEX_MAP5_6F_M_0,
};
@@ -1448,6 +1458,7 @@ enum
VEX_LEN_0F3841,
VEX_LEN_0F3848_X86_64,
VEX_LEN_0F3849_X86_64,
+ VEX_LEN_0F384A_X86_64_W_0,
VEX_LEN_0F384B_X86_64,
VEX_LEN_0F385A,
VEX_LEN_0F385C_X86_64,
@@ -1495,6 +1506,8 @@ enum
VEX_LEN_0F3ADE_W_0,
VEX_LEN_0F3ADF,
VEX_LEN_0F3AF0,
+ VEX_LEN_MAP5_F8_X86_64_M_0,
+ VEX_LEN_MAP5_F9_X86_64_M_0,
VEX_LEN_MAP5_FD_X86_64,
VEX_LEN_MAP7_F6,
VEX_LEN_MAP7_F8,
@@ -1567,6 +1580,7 @@ enum
EVEX_LEN_0F381A,
EVEX_LEN_0F381B,
EVEX_LEN_0F3836,
+ EVEX_LEN_0F384A_X86_64_W_0,
EVEX_LEN_0F385A,
EVEX_LEN_0F385B,
EVEX_LEN_0F38C6,
@@ -1621,6 +1635,7 @@ enum
VEX_W_0F3846,
VEX_W_0F3848_X86_64_L_0,
VEX_W_0F3849_X86_64_L_0,
+ VEX_W_0F384A_X86_64,
VEX_W_0F384B_X86_64_L_0,
VEX_W_0F3850,
VEX_W_0F3851,
@@ -1668,6 +1683,8 @@ enum
VEX_W_0F3ACE,
VEX_W_0F3ACF,
VEX_W_0F3ADE,
+ VEX_W_MAP5_F8_X86_64_M_0_L_0,
+ VEX_W_MAP5_F9_X86_64_M_0_L_0,
VEX_W_MAP5_FD_X86_64_L_0,
VEX_W_MAP7_F6_L_0,
VEX_W_MAP7_F8_L_0,
@@ -1795,6 +1812,7 @@ enum
EVEX_W_0F3835_P_2,
EVEX_W_0F3837,
EVEX_W_0F383A_P_1,
+ EVEX_W_0F384A_X86_64,
EVEX_W_0F3859,
EVEX_W_0F385A_L_n,
EVEX_W_0F385B_L_2,
@@ -4112,6 +4130,14 @@ static const struct dis386 prefix_table[][4] = {
{ RM_TABLE (RM_VEX_0F3849_X86_64_L_0_W_0_M_1_P_3) },
},
+ /* PREFIX_VEX_0F384A_X86_64_W_0_L_0 */
+ {
+ { Bad_Opcode },
+ { Bad_Opcode },
+ { "tileloaddrst1", { TMM, MVexSIBMEM }, 0 },
+ { "tileloaddrs", { TMM, MVexSIBMEM }, 0 },
+ },
+
/* PREFIX_VEX_0F384B_X86_64_L_0_W_0 */
{
{ Bad_Opcode },
@@ -4296,6 +4322,20 @@ static const struct dis386 prefix_table[][4] = {
{ "%XErorxS", { Gdq, Edq, Ib }, 0 },
},
+ /* PREFIX_VEX_MAP5_F8_X86_64_M_0_L_0_W_0 */
+ {
+ { "t2rpntlvwz0rs", { TMM, MVexSIBMEM }, 0 },
+ { Bad_Opcode },
+ { "t2rpntlvwz1rs", { TMM, MVexSIBMEM }, 0 },
+ },
+
+ /* PREFIX_VEX_MAP5_F9_X86_64_M_0_L_0_W_0 */
+ {
+ { "t2rpntlvwz0rst1", { TMM, MVexSIBMEM }, 0 },
+ { Bad_Opcode },
+ { "t2rpntlvwz1rst1", { TMM, MVexSIBMEM }, 0 },
+ },
+
/* PREFIX_VEX_MAP5_FD_X86_64_L_0_W_0 */
{
{ "tdpbf8ps", { TMM, Rtmm, VexTmm }, 0 },
@@ -4664,6 +4704,12 @@ static const struct dis386 x86_64_table[][2] = {
{ VEX_LEN_TABLE (VEX_LEN_0F3849_X86_64) },
},
+ /* X86_64_VEX_0F384A */
+ {
+ { Bad_Opcode },
+ { VEX_W_TABLE (VEX_W_0F384A_X86_64) },
+ },
+
/* X86_64_VEX_0F384B */
{
{ Bad_Opcode },
@@ -4718,6 +4764,18 @@ static const struct dis386 x86_64_table[][2] = {
{ "%XEcmp%CCxadd", { Mdq, Gdq, VexGdq }, PREFIX_DATA },
},
+ /* X86_64_VEX_MAP5_F8 */
+ {
+ { Bad_Opcode },
+ { MOD_TABLE (MOD_VEX_MAP5_F8_X86_64) },
+ },
+
+ /* X86_64_VEX_MAP5_F9 */
+ {
+ { Bad_Opcode },
+ { MOD_TABLE (MOD_VEX_MAP5_F9_X86_64) },
+ },
+
/* X86_64_VEX_MAP5_FD */
{
{ Bad_Opcode },
@@ -6579,7 +6637,7 @@ static const struct dis386 vex_table[][256] = {
/* 48 */
{ X86_64_TABLE (X86_64_VEX_0F3848) },
{ X86_64_TABLE (X86_64_VEX_0F3849) },
- { Bad_Opcode },
+ { X86_64_TABLE (X86_64_VEX_0F384A) },
{ X86_64_TABLE (X86_64_VEX_0F384B) },
{ Bad_Opcode },
{ Bad_Opcode },
@@ -7267,6 +7325,11 @@ static const struct dis386 vex_len_table[][2] = {
{ VEX_W_TABLE (VEX_W_0F3849_X86_64_L_0) },
},
+ /* VEX_LEN_0F384A_X86_64_W_0 */
+ {
+ { PREFIX_TABLE (PREFIX_VEX_0F384A_X86_64_W_0_L_0) },
+ },
+
/* VEX_LEN_0F384B_X86_64 */
{
{ VEX_W_TABLE (VEX_W_0F384B_X86_64_L_0) },
@@ -7514,6 +7577,16 @@ static const struct dis386 vex_len_table[][2] = {
{ PREFIX_TABLE (PREFIX_VEX_0F3AF0_L_0) },
},
+ /* VEX_LEN_MAP5_F8_X86_64_M_0 */
+ {
+ { VEX_W_TABLE (VEX_W_MAP5_F8_X86_64_M_0_L_0) },
+ },
+
+ /* VEX_LEN_MAP5_F9_X86_64_M_0 */
+ {
+ { VEX_W_TABLE (VEX_W_MAP5_F9_X86_64_M_0_L_0) },
+ },
+
/* VEX_LEN_MAP5_FD_X86_64 */
{
{ VEX_W_TABLE (VEX_W_MAP5_FD_X86_64_L_0) },
@@ -7961,6 +8034,10 @@ static const struct dis386 vex_w_table[][2] = {
/* VEX_W_0F3849_X86_64_L_0 */
{ MOD_TABLE (MOD_VEX_0F3849_X86_64_L_0_W_0) },
},
+ {
+ /* VEX_W_0F384A_X86_64 */
+ { VEX_LEN_TABLE (VEX_LEN_0F384A_X86_64_W_0) },
+ },
{
/* VEX_W_0F384B_X86_64_L_0 */
{ PREFIX_TABLE (PREFIX_VEX_0F384B_X86_64_L_0_W_0) },
@@ -8155,6 +8232,14 @@ static const struct dis386 vex_w_table[][2] = {
/* VEX_W_0F3ADE */
{ VEX_LEN_TABLE (VEX_LEN_0F3ADE_W_0) },
},
+ {
+ /* VEX_W_MAP5_F8_X86_64_M_0 */
+ { PREFIX_TABLE (PREFIX_VEX_MAP5_F8_X86_64_M_0_L_0_W_0) },
+ },
+ {
+ /* VEX_W_MAP5_F9_X86_64_M_0 */
+ { PREFIX_TABLE (PREFIX_VEX_MAP5_F9_X86_64_M_0_L_0_W_0) },
+ },
{
/* VEX_W_MAP5_FD_X86_64 */
{ PREFIX_TABLE (PREFIX_VEX_MAP5_FD_X86_64_L_0_W_0) },
@@ -8540,6 +8625,14 @@ static const struct dis386 mod_table[][2] = {
/* MOD_VEX_0F386F_X86_64 */
{ VEX_LEN_TABLE (VEX_LEN_0F386F_X86_64_M_0) },
},
+ {
+ /* MOD_VEX_MAP5_F8_X86_64 */
+ { VEX_LEN_TABLE (VEX_LEN_MAP5_F8_X86_64_M_0) },
+ },
+ {
+ /* MOD_VEX_MAP5_F9_X86_64 */
+ { VEX_LEN_TABLE (VEX_LEN_MAP5_F9_X86_64_M_0) },
+ },
#include "i386-dis-evex-mod.h"
};
@@ -8929,6 +9022,8 @@ static const struct dis386 bad_opcode = { "(bad)", { XX }, 0 };
/* Fetch error indicator. */
static const struct dis386 err_opcode = { NULL, { XX }, 0 };
+static const struct dis386 map5_f8_opcode = { X86_64_TABLE (X86_64_VEX_MAP5_F8) };
+static const struct dis386 map5_f9_opcode = { X86_64_TABLE (X86_64_VEX_MAP5_F9) };
static const struct dis386 map5_fd_opcode = { X86_64_TABLE (X86_64_VEX_MAP5_FD) };
static const struct dis386 map7_f6_opcode = { VEX_LEN_TABLE (VEX_LEN_MAP7_F6) };
static const struct dis386 map7_f8_opcode = { VEX_LEN_TABLE (VEX_LEN_MAP7_F8) };
@@ -9250,7 +9345,14 @@ get_valid_dis386 (const struct dis386 *dp, instr_info *ins)
else if (vindex == 0xf6)
dp = &map7_f6_opcode;
else if (vindex == 0xf8)
- dp = &map7_f8_opcode;
+ {
+ if (vex_table_index == VEX_MAP5)
+ dp = &map5_f8_opcode;
+ else
+ dp = &map7_f8_opcode;
+ }
+ else if (vindex == 0xf9)
+ dp = &map5_f9_opcode;
else if (vindex == 0xfd)
dp = &map5_fd_opcode;
else
@@ -271,6 +271,8 @@ static const dependency isa_dependencies[] =
"AMX_TILE" },
{ "AMX_FP8",
"AMX_TILE" },
+ { "AMX_MOVRS",
+ "AMX_TILE" },
{ "KL",
"SSE2" },
{ "WIDEKL",
@@ -441,6 +443,7 @@ static bitfield cpu_flags[] =
BITFIELD (AMX_TRANSPOSE),
BITFIELD (AMX_TF32),
BITFIELD (AMX_FP8),
+ BITFIELD (AMX_MOVRS),
BITFIELD (AMX_TILE),
BITFIELD (MOVDIRI),
BITFIELD (MOVDIR64B),
@@ -256,6 +256,8 @@ enum i386_cpu
CpuAMX_TF32,
/* AMX-FP8 instructions required */
CpuAMX_FP8,
+ /* AMX-MOVRS Instructions support required. */
+ CpuAMX_MOVRS,
/* AMX-TILE instructions required */
CpuAMX_TILE,
/* GFNI instructions required */
@@ -509,6 +511,7 @@ typedef union i386_cpu_flags
unsigned int cpuamx_complex:1;
unsigned int cpuamx_tf32:1;
unsigned int cpuamx_fp8:1;
+ unsigned int cpuamx_movrs:1;
unsigned int cpuamx_tile:1;
unsigned int cpugfni:1;
unsigned int cpuvaes:1;
@@ -3235,9 +3235,15 @@ tdpbhf8ps, 0xf2fd, AMX_FP8, Modrm|Vex128|Map5|Src2VVVV|VexW0|NoSuf, { RegTMM, Re
tdphbf8ps, 0xf3fd, AMX_FP8, Modrm|Vex128|Map5|Src2VVVV|VexW0|NoSuf, { RegTMM, RegTMM, RegTMM }
tdphf8ps, 0x66fd, AMX_FP8, Modrm|Vex128|Map5|Src2VVVV|VexW0|NoSuf, { RegTMM, RegTMM, RegTMM }
+t2rpntlvw<z>rs<loc>, 0x<z:opc>f8 | <loc:opc>, AMX_MOVRS&AMX_TRANSPOSE, Sibmem|Vex128|Map5|VexW0|NoSuf|ImplicitGroup, { Unspecified|BaseIndex, RegTMM }
+t2rpntlvw<z>rs<loc>, 0x<z:opc>f8 | <loc:opc>, APX_F&AMX_MOVRS&AMX_TRANSPOSE, Sibmem|EVex128|Map5|VexW0|NoSuf|ImplicitGroup, { Unspecified|BaseIndex, RegTMM }
+
<z>
<loc>
+tileloaddrs, 0xf24a, APX_F(AMX_MOVRS), Sibmem|Vex128|EVex128|Space0F38|VexW0|NoSuf, { Unspecified|BaseIndex, RegTMM }
+tileloaddrst1, 0x664a, APX_F(AMX_MOVRS), Sibmem|Vex128|EVex128|Space0F38|VexW0|NoSuf, { Unspecified|BaseIndex, RegTMM }
+
// AMX instructions end.
// KEYLOCKER instructions.