@@ -1186,6 +1186,7 @@ static const arch_entry cpu_arch[] =
SUBARCH (amx_tf32, AMX_TF32, ANY_AMX_TF32, false),
SUBARCH (amx_fp8, AMX_FP8, ANY_AMX_FP8, false),
SUBARCH (amx_movrs, AMX_MOVRS, ANY_AMX_MOVRS, false),
+ SUBARCH (amx_avx512, AMX_AVX512, ANY_AMX_AVX512, false),
SUBARCH (amx_tile, AMX_TILE, ANY_AMX_TILE, false),
SUBARCH (movdiri, MOVDIRI, MOVDIRI, false),
SUBARCH (movdir64b, MOVDIR64B, MOVDIR64B, false),
@@ -233,6 +233,7 @@ accept various extension mnemonics. For example,
@code{amx_tf32},
@code{amx_fp8}
@code{amx_movrs},
+@code{amx_avx512},
@code{amx_tile},
@code{vmx},
@code{vmfunc},
@@ -1707,7 +1708,8 @@ supported on the CPU specified. The choices for @var{cpu_type} are:
@item @samp{.movdiri} @tab @samp{.movdir64b} @tab @samp{.enqcmd} @tab @samp{.tsxldtrk}
@item @samp{.amx_int8} @tab @samp{.amx_bf16} @tab @samp{.amx_fp16}
@item @samp{.amx_complex} @tab @samp{.amx_transpose} @tab @samp{.amx_tf32}
-@item @samp{.amx_fp8} @tab @samp{.amx_movrs} @tab @samp{.amx_tile}
+@item @samp{.amx_fp8} @tab @samp{.amx_movrs} @tab @samp{.amx_avx512}
+@item @samp{.amx_tile}
@item @samp{.kl} @tab @samp{.widekl} @tab @samp{.uintr} @tab @samp{.hreset}
@item @samp{.3dnow} @tab @samp{.3dnowa} @tab @samp{.sse4a} @tab @samp{.sse5}
@item @samp{.syscall} @tab @samp{.rdtscp} @tab @samp{.svme}
new file mode 100644
@@ -0,0 +1,35 @@
+#objdump: -dw -Mintel
+#name: x86_64 AMX-AVX512 insns (Intel disassembly)
+#source: x86-64-amx-avx512.s
+
+.*: +file format .*
+
+Disassembly of section \.text:
+
+#...
+[a-f0-9]+ <_intel>:
+\s*[a-f0-9]+:\s*62 62 6e 48 4a f5\s+tcvtrowd2ps zmm30,tmm5,edx
+\s*[a-f0-9]+:\s*62 62 6e 48 4a f2\s+tcvtrowd2ps zmm30,tmm2,edx
+\s*[a-f0-9]+:\s*62 63 7e 48 07 f5 7b\s+tcvtrowd2ps zmm30,tmm5,0x7b
+\s*[a-f0-9]+:\s*62 63 7e 48 07 f2 7b\s+tcvtrowd2ps zmm30,tmm2,0x7b
+\s*[a-f0-9]+:\s*62 62 6f 48 6d f5\s+tcvtrowps2bf16h zmm30,tmm5,edx
+\s*[a-f0-9]+:\s*62 62 6f 48 6d f2\s+tcvtrowps2bf16h zmm30,tmm2,edx
+\s*[a-f0-9]+:\s*62 63 7f 48 07 f5 7b\s+tcvtrowps2bf16h zmm30,tmm5,0x7b
+\s*[a-f0-9]+:\s*62 63 7f 48 07 f2 7b\s+tcvtrowps2bf16h zmm30,tmm2,0x7b
+\s*[a-f0-9]+:\s*62 62 6e 48 6d f5\s+tcvtrowps2bf16l zmm30,tmm5,edx
+\s*[a-f0-9]+:\s*62 62 6e 48 6d f2\s+tcvtrowps2bf16l zmm30,tmm2,edx
+\s*[a-f0-9]+:\s*62 63 7e 48 77 f5 7b\s+tcvtrowps2bf16l zmm30,tmm5,0x7b
+\s*[a-f0-9]+:\s*62 63 7e 48 77 f2 7b\s+tcvtrowps2bf16l zmm30,tmm2,0x7b
+\s*[a-f0-9]+:\s*62 62 6c 48 6d f5\s+tcvtrowps2phh zmm30,tmm5,edx
+\s*[a-f0-9]+:\s*62 62 6c 48 6d f2\s+tcvtrowps2phh zmm30,tmm2,edx
+\s*[a-f0-9]+:\s*62 63 7c 48 07 f5 7b\s+tcvtrowps2phh zmm30,tmm5,0x7b
+\s*[a-f0-9]+:\s*62 63 7c 48 07 f2 7b\s+tcvtrowps2phh zmm30,tmm2,0x7b
+\s*[a-f0-9]+:\s*62 62 6d 48 6d f5\s+tcvtrowps2phl zmm30,tmm5,edx
+\s*[a-f0-9]+:\s*62 62 6d 48 6d f2\s+tcvtrowps2phl zmm30,tmm2,edx
+\s*[a-f0-9]+:\s*62 63 7f 48 77 f5 7b\s+tcvtrowps2phl zmm30,tmm5,0x7b
+\s*[a-f0-9]+:\s*62 63 7f 48 77 f2 7b\s+tcvtrowps2phl zmm30,tmm2,0x7b
+\s*[a-f0-9]+:\s*62 62 6d 48 4a f5\s+tilemovrow zmm30,tmm5,edx
+\s*[a-f0-9]+:\s*62 62 6d 48 4a f2\s+tilemovrow zmm30,tmm2,edx
+\s*[a-f0-9]+:\s*62 63 7d 48 07 f5 7b\s+tilemovrow zmm30,tmm5,0x7b
+\s*[a-f0-9]+:\s*62 63 7d 48 07 f2 7b\s+tilemovrow zmm30,tmm2,0x7b
+#pass
new file mode 100644
@@ -0,0 +1,34 @@
+#objdump: -dw
+#name: x86_64 AMX-AVX512 insns
+#source: x86-64-amx-avx512.s
+
+.*: +file format .*
+
+Disassembly of section \.text:
+
+0+ <_start>:
+\s*[a-f0-9]+:\s*62 62 6e 48 4a f5\s+tcvtrowd2ps %edx,%tmm5,%zmm30
+\s*[a-f0-9]+:\s*62 62 6e 48 4a f2\s+tcvtrowd2ps %edx,%tmm2,%zmm30
+\s*[a-f0-9]+:\s*62 63 7e 48 07 f5 7b\s+tcvtrowd2ps \$0x7b,%tmm5,%zmm30
+\s*[a-f0-9]+:\s*62 63 7e 48 07 f2 7b\s+tcvtrowd2ps \$0x7b,%tmm2,%zmm30
+\s*[a-f0-9]+:\s*62 62 6f 48 6d f5\s+tcvtrowps2bf16h %edx,%tmm5,%zmm30
+\s*[a-f0-9]+:\s*62 62 6f 48 6d f2\s+tcvtrowps2bf16h %edx,%tmm2,%zmm30
+\s*[a-f0-9]+:\s*62 63 7f 48 07 f5 7b\s+tcvtrowps2bf16h \$0x7b,%tmm5,%zmm30
+\s*[a-f0-9]+:\s*62 63 7f 48 07 f2 7b\s+tcvtrowps2bf16h \$0x7b,%tmm2,%zmm30
+\s*[a-f0-9]+:\s*62 62 6e 48 6d f5\s+tcvtrowps2bf16l %edx,%tmm5,%zmm30
+\s*[a-f0-9]+:\s*62 62 6e 48 6d f2\s+tcvtrowps2bf16l %edx,%tmm2,%zmm30
+\s*[a-f0-9]+:\s*62 63 7e 48 77 f5 7b\s+tcvtrowps2bf16l \$0x7b,%tmm5,%zmm30
+\s*[a-f0-9]+:\s*62 63 7e 48 77 f2 7b\s+tcvtrowps2bf16l \$0x7b,%tmm2,%zmm30
+\s*[a-f0-9]+:\s*62 62 6c 48 6d f5\s+tcvtrowps2phh %edx,%tmm5,%zmm30
+\s*[a-f0-9]+:\s*62 62 6c 48 6d f2\s+tcvtrowps2phh %edx,%tmm2,%zmm30
+\s*[a-f0-9]+:\s*62 63 7c 48 07 f5 7b\s+tcvtrowps2phh \$0x7b,%tmm5,%zmm30
+\s*[a-f0-9]+:\s*62 63 7c 48 07 f2 7b\s+tcvtrowps2phh \$0x7b,%tmm2,%zmm30
+\s*[a-f0-9]+:\s*62 62 6d 48 6d f5\s+tcvtrowps2phl %edx,%tmm5,%zmm30
+\s*[a-f0-9]+:\s*62 62 6d 48 6d f2\s+tcvtrowps2phl %edx,%tmm2,%zmm30
+\s*[a-f0-9]+:\s*62 63 7f 48 77 f5 7b\s+tcvtrowps2phl \$0x7b,%tmm5,%zmm30
+\s*[a-f0-9]+:\s*62 63 7f 48 77 f2 7b\s+tcvtrowps2phl \$0x7b,%tmm2,%zmm30
+\s*[a-f0-9]+:\s*62 62 6d 48 4a f5\s+tilemovrow %edx,%tmm5,%zmm30
+\s*[a-f0-9]+:\s*62 62 6d 48 4a f2\s+tilemovrow %edx,%tmm2,%zmm30
+\s*[a-f0-9]+:\s*62 63 7d 48 07 f5 7b\s+tilemovrow \$0x7b,%tmm5,%zmm30
+\s*[a-f0-9]+:\s*62 63 7d 48 07 f2 7b\s+tilemovrow \$0x7b,%tmm2,%zmm30
+#pass
new file mode 100644
@@ -0,0 +1,55 @@
+# Check 64bit AMX-AVX512 instructions
+
+ .text
+_start:
+ tcvtrowd2ps %edx, %tmm5, %zmm30
+ tcvtrowd2ps %edx, %tmm2, %zmm30
+ tcvtrowd2ps $123, %tmm5, %zmm30
+ tcvtrowd2ps $123, %tmm2, %zmm30
+ tcvtrowps2bf16h %edx, %tmm5, %zmm30
+ tcvtrowps2bf16h %edx, %tmm2, %zmm30
+ tcvtrowps2bf16h $123, %tmm5, %zmm30
+ tcvtrowps2bf16h $123, %tmm2, %zmm30
+ tcvtrowps2bf16l %edx, %tmm5, %zmm30
+ tcvtrowps2bf16l %edx, %tmm2, %zmm30
+ tcvtrowps2bf16l $123, %tmm5, %zmm30
+ tcvtrowps2bf16l $123, %tmm2, %zmm30
+ tcvtrowps2phh %edx, %tmm5, %zmm30
+ tcvtrowps2phh %edx, %tmm2, %zmm30
+ tcvtrowps2phh $123, %tmm5, %zmm30
+ tcvtrowps2phh $123, %tmm2, %zmm30
+ tcvtrowps2phl %edx, %tmm5, %zmm30
+ tcvtrowps2phl %edx, %tmm2, %zmm30
+ tcvtrowps2phl $123, %tmm5, %zmm30
+ tcvtrowps2phl $123, %tmm2, %zmm30
+ tilemovrow %edx, %tmm5, %zmm30
+ tilemovrow %edx, %tmm2, %zmm30
+ tilemovrow $123, %tmm5, %zmm30
+ tilemovrow $123, %tmm2, %zmm30
+
+_intel:
+ .intel_syntax noprefix
+ tcvtrowd2ps zmm30, tmm5, edx
+ tcvtrowd2ps zmm30, tmm2, edx
+ tcvtrowd2ps zmm30, tmm5, 123
+ tcvtrowd2ps zmm30, tmm2, 123
+ tcvtrowps2bf16h zmm30, tmm5, edx
+ tcvtrowps2bf16h zmm30, tmm2, edx
+ tcvtrowps2bf16h zmm30, tmm5, 123
+ tcvtrowps2bf16h zmm30, tmm2, 123
+ tcvtrowps2bf16l zmm30, tmm5, edx
+ tcvtrowps2bf16l zmm30, tmm2, edx
+ tcvtrowps2bf16l zmm30, tmm5, 123
+ tcvtrowps2bf16l zmm30, tmm2, 123
+ tcvtrowps2phh zmm30, tmm5, edx
+ tcvtrowps2phh zmm30, tmm2, edx
+ tcvtrowps2phh zmm30, tmm5, 123
+ tcvtrowps2phh zmm30, tmm2, 123
+ tcvtrowps2phl zmm30, tmm5, edx
+ tcvtrowps2phl zmm30, tmm2, edx
+ tcvtrowps2phl zmm30, tmm5, 123
+ tcvtrowps2phl zmm30, tmm2, 123
+ tilemovrow zmm30, tmm5, edx
+ tilemovrow zmm30, tmm2, edx
+ tilemovrow zmm30, tmm5, 123
+ tilemovrow zmm30, tmm2, 123
@@ -538,6 +538,8 @@ run_dump_test "x86-64-amx-fp8-bad"
run_dump_test "x86-64-amx-movrs"
run_dump_test "x86-64-amx-movrs-intel"
run_list_test "x86-64-amx-movrs-inval"
+run_dump_test "x86-64-amx-avx512"
+run_dump_test "x86-64-amx-avx512-intel"
run_dump_test "x86-64-movrs"
run_dump_test "x86-64-movrs-intel"
run_dump_test "x86-64-movrs-avx10_2-512"
@@ -47,6 +47,8 @@ static const struct dis386 evex_len_table[][3] = {
/* EVEX_LEN_0F384A_X86_64_W_0 */
{
{ X86_64_EVEX_PFX_TABLE (PREFIX_VEX_0F384A_X86_64_W_0_L_0) },
+ { Bad_Opcode },
+ { PREFIX_TABLE (PREFIX_EVEX_0F384A_X86_64_W_0_L_2) },
},
/* EVEX_LEN_0F385A */
@@ -63,6 +65,13 @@ static const struct dis386 evex_len_table[][3] = {
{ VEX_W_TABLE (EVEX_W_0F385B_L_2) },
},
+ /* EVEX_LEN_0F386D_X86_64_W_0_M_1 */
+ {
+ { Bad_Opcode },
+ { Bad_Opcode },
+ { PREFIX_TABLE (PREFIX_EVEX_0F386D_X86_64_W_0_L_2) },
+ },
+
/* EVEX_LEN_0F38C6 */
{
{ Bad_Opcode },
@@ -91,6 +100,13 @@ static const struct dis386 evex_len_table[][3] = {
{ VEX_W_TABLE (VEX_W_0F3A01_L_1) },
},
+ /* EVEX_LEN_0F3A07_X86_64_W_0 */
+ {
+ { Bad_Opcode },
+ { Bad_Opcode },
+ { PREFIX_TABLE (PREFIX_EVEX_0F3A07_X86_64_W_0_L_2) },
+ },
+
/* EVEX_LEN_0F3A18 */
{
{ Bad_Opcode },
@@ -161,6 +177,13 @@ static const struct dis386 evex_len_table[][3] = {
{ VEX_W_TABLE (EVEX_W_0F3A43_L_n) },
},
+ /* EVEX_LEN_0F3A77_X86_64_W_0 */
+ {
+ { Bad_Opcode },
+ { Bad_Opcode },
+ { PREFIX_TABLE (PREFIX_EVEX_0F3A77_X86_64_W_0_L_2) },
+ },
+
/* EVEX_LEN_MAP5_6E */
{
{ PREFIX_TABLE (PREFIX_EVEX_MAP5_6E_L_0) },
@@ -243,6 +243,12 @@
{ VEX_W_TABLE (EVEX_W_0F383A_P_1) },
{ "%XEvpminuw", { XM, Vex, EXx }, 0 },
},
+ /* PREFIX_EVEX_0F384A_W_0_L_2 */
+ {
+ { Bad_Opcode },
+ { "tcvtrowd2ps", { XM, Rtmm, VexGdq }, 0 },
+ { "tilemovrow", { XM, Rtmm, VexGdq }, 0 },
+ },
/* PREFIX_EVEX_0F3852 */
{
{ "vdpphp%XS", { XM, Vex, EXx }, 0 },
@@ -264,6 +270,13 @@
{ Bad_Opcode },
{ "vp2intersectY%DQ", { MaskG, Vex, EXx, EXxEVexS }, 0 },
},
+ /* PREFIX_EVEX_0F386D_W_0_L_2 */
+ {
+ { "tcvtrowps2phh", { XM, Rtmm, VexGdq }, 0 },
+ { "tcvtrowps2bf16l", { XM, Rtmm, VexGdq }, 0 },
+ { "tcvtrowps2phl", { XM, Rtmm, VexGdq }, 0 },
+ { "tcvtrowps2bf16h", { XM, Rtmm, VexGdq }, 0 },
+ },
/* PREFIX_EVEX_0F3872 */
{
{ Bad_Opcode },
@@ -306,6 +319,13 @@
{ "%XEvfmsub213s%XW", { XMScalar, VexScalar, EXdq, EXxEVexR }, 0 },
{ "v4fnmadds%XS", { XMScalar, VexScalar, Mxmm }, 0 },
},
+ /* PREFIX_EVEX_0F3A07_W_0_L_2 */
+ {
+ { "tcvtrowps2phh", { XM, Rtmm, Ib }, 0 },
+ { "tcvtrowd2ps", { XM, Rtmm, Ib }, 0 },
+ { "tilemovrow", { XM, Rtmm, Ib }, 0 },
+ { "tcvtrowps2bf16h", { XM, Rtmm, Ib }, 0 },
+ },
/* PREFIX_EVEX_0F3A08 */
{
{ "vrndscalep%XH", { XM, EXxh, EXxEVexS, Ib }, 0 },
@@ -377,6 +397,13 @@
{ Bad_Opcode },
{ "vfpclasss%XW", { MaskG, EXdq, Ib }, 0 },
},
+ /* PREFIX_EVEX_0F3A77_W_0_L_2 */
+ {
+ { Bad_Opcode },
+ { "tcvtrowps2bf16l", { XM, Rtmm, Ib }, 0 },
+ { Bad_Opcode },
+ { "tcvtrowps2phl", { XM, Rtmm, Ib }, 0 },
+ },
/* PREFIX_EVEX_0F3AC2 */
{
{ "vcmpp%XH", { MaskG, Vex, EXxh, EXxEVexS, CMP }, 0 },
@@ -365,6 +365,10 @@
{ "vbroadcasti32x8", { XM, Mymm }, PREFIX_DATA },
{ "vbroadcasti64x4", { XM, Mymm }, PREFIX_DATA },
},
+ /* EVEX_W_0F386D_X86_64 */
+ {
+ { EVEX_LEN_TABLE (EVEX_LEN_0F386D_X86_64_W_0) },
+ },
/* EVEX_W_0F3870 */
{
{ Bad_Opcode },
@@ -388,6 +392,10 @@
{ Bad_Opcode },
{ "vpmultishiftqb", { XM, Vex, EXx }, PREFIX_DATA },
},
+ /* EVEX_W_0F3A07_X86_64 */
+ {
+ { EVEX_LEN_TABLE (EVEX_LEN_0F3A07_X86_64_W_0) },
+ },
/* EVEX_W_0F3A18_L_n */
{
{ "vinsertf32x4", { XM, Vex, EXxmm, Ib }, PREFIX_DATA },
@@ -456,6 +464,10 @@
{ Bad_Opcode },
{ "vpshrdw", { XM, Vex, EXx, Ib }, 0 },
},
+ /* EVEX_W_0F3A77_X86_64 */
+ {
+ { EVEX_LEN_TABLE (EVEX_LEN_0F3A77_X86_64_W_0) },
+ },
/* EVEX_W_MAP4_8A */
{
{ MOD_TABLE (MOD_EVEX_MAP4_8A_W_0) },
@@ -3,6 +3,21 @@
{ Bad_Opcode },
{ VEX_W_TABLE (EVEX_W_0F384A_X86_64) },
},
+ /* X86_64_EVEX_0F386D */
+ {
+ { Bad_Opcode },
+ { VEX_W_TABLE (EVEX_W_0F386D_X86_64) },
+ },
+ /* X86_64_EVEX_0F3A07 */
+ {
+ { Bad_Opcode },
+ { VEX_W_TABLE (EVEX_W_0F3A07_X86_64) },
+ },
+ /* X86_64_EVEX_0F3A77 */
+ {
+ { Bad_Opcode },
+ { VEX_W_TABLE (EVEX_W_0F3A77_X86_64) },
+ },
/* X86_64_EVEX_MAP5_6F_M_0 */
{
{ Bad_Opcode },
@@ -415,7 +415,7 @@ static const struct dis386 evex_table[][256] = {
{ Bad_Opcode },
{ Bad_Opcode },
{ Bad_Opcode },
- { Bad_Opcode },
+ { X86_64_TABLE (X86_64_EVEX_0F386D) },
{ X86_64_EVEX_FROM_VEX_TABLE (X86_64_VEX_0F386E) },
{ X86_64_EVEX_FROM_VEX_TABLE (X86_64_VEX_0F386F) },
/* 70 */
@@ -591,7 +591,7 @@ static const struct dis386 evex_table[][256] = {
{ VEX_W_TABLE (VEX_W_0F3A04) },
{ "%XEvpermilp%XD", { XM, EXx, Ib }, PREFIX_DATA },
{ Bad_Opcode },
- { Bad_Opcode },
+ { X86_64_TABLE (X86_64_EVEX_0F3A07) },
/* 08 */
{ PREFIX_TABLE (PREFIX_EVEX_0F3A08) },
{ "vrndscalep%XD", { XM, EXx, EXxEVexS, Ib }, PREFIX_DATA },
@@ -717,7 +717,7 @@ static const struct dis386 evex_table[][256] = {
{ Bad_Opcode },
{ Bad_Opcode },
{ Bad_Opcode },
- { Bad_Opcode },
+ { X86_64_TABLE (X86_64_EVEX_0F3A77) },
/* 78 */
{ Bad_Opcode },
{ Bad_Opcode },
@@ -1214,9 +1214,11 @@ enum
PREFIX_EVEX_0F3838,
PREFIX_EVEX_0F3839,
PREFIX_EVEX_0F383A,
+ PREFIX_EVEX_0F384A_X86_64_W_0_L_2,
PREFIX_EVEX_0F3852,
PREFIX_EVEX_0F3853,
PREFIX_EVEX_0F3868,
+ PREFIX_EVEX_0F386D_X86_64_W_0_L_2,
PREFIX_EVEX_0F3872,
PREFIX_EVEX_0F3874,
PREFIX_EVEX_0F389A,
@@ -1224,6 +1226,7 @@ enum
PREFIX_EVEX_0F38AA,
PREFIX_EVEX_0F38AB,
+ PREFIX_EVEX_0F3A07_X86_64_W_0_L_2,
PREFIX_EVEX_0F3A08,
PREFIX_EVEX_0F3A0A,
PREFIX_EVEX_0F3A26,
@@ -1235,6 +1238,7 @@ enum
PREFIX_EVEX_0F3A57,
PREFIX_EVEX_0F3A66,
PREFIX_EVEX_0F3A67,
+ PREFIX_EVEX_0F3A77_X86_64_W_0_L_2,
PREFIX_EVEX_0F3AC2,
PREFIX_EVEX_MAP4_4x,
@@ -1384,6 +1388,9 @@ enum
X86_64_VEX_MAP7_F8_L_0_W_0_R_0,
X86_64_EVEX_0F384A,
+ X86_64_EVEX_0F386D,
+ X86_64_EVEX_0F3A07,
+ X86_64_EVEX_0F3A77,
X86_64_EVEX_MAP5_6F_M_0,
};
@@ -1583,10 +1590,12 @@ enum
EVEX_LEN_0F384A_X86_64_W_0,
EVEX_LEN_0F385A,
EVEX_LEN_0F385B,
+ EVEX_LEN_0F386D_X86_64_W_0,
EVEX_LEN_0F38C6,
EVEX_LEN_0F38C7,
EVEX_LEN_0F3A00,
EVEX_LEN_0F3A01,
+ EVEX_LEN_0F3A07_X86_64_W_0,
EVEX_LEN_0F3A18,
EVEX_LEN_0F3A19,
EVEX_LEN_0F3A1A,
@@ -1597,6 +1606,7 @@ enum
EVEX_LEN_0F3A3A,
EVEX_LEN_0F3A3B,
EVEX_LEN_0F3A43,
+ EVEX_LEN_0F3A77_X86_64_W_0,
EVEX_LEN_MAP5_6E,
EVEX_LEN_MAP5_7E,
@@ -1816,12 +1826,14 @@ enum
EVEX_W_0F3859,
EVEX_W_0F385A_L_n,
EVEX_W_0F385B_L_2,
+ EVEX_W_0F386D_X86_64,
EVEX_W_0F3870,
EVEX_W_0F3872_P_2,
EVEX_W_0F387A,
EVEX_W_0F387B,
EVEX_W_0F3883,
+ EVEX_W_0F3A07_X86_64,
EVEX_W_0F3A18_L_n,
EVEX_W_0F3A19_L_n,
EVEX_W_0F3A1A_L_2,
@@ -1836,6 +1848,7 @@ enum
EVEX_W_0F3A43_L_n,
EVEX_W_0F3A70,
EVEX_W_0F3A72,
+ EVEX_W_0F3A77_X86_64,
EVEX_W_MAP4_8A,
EVEX_W_MAP4_8F_R_0,
@@ -14070,6 +14083,29 @@ OP_VEX (instr_info *ins, int bytemode, int sizeflag ATTRIBUTE_UNUSED)
return true;
}
+ switch (bytemode)
+ {
+ case v_mode:
+ case dq_mode:
+ if (ins->rex & REX_W)
+ names = att_names64;
+ else if (bytemode == v_mode
+ && !(sizeflag & DFLAG))
+ names = att_names16;
+ else
+ names = att_names32;
+ oappend_register (ins, names[reg]);
+ return true;
+ case b_mode:
+ names = att_names8rex;
+ oappend_register (ins, names[reg]);
+ return true;
+ case q_mode:
+ names = att_names64;
+ oappend_register (ins, names[reg]);
+ return true;
+ }
+
switch (ins->vex.length)
{
case 128:
@@ -14079,22 +14115,6 @@ OP_VEX (instr_info *ins, int bytemode, int sizeflag ATTRIBUTE_UNUSED)
names = att_names_xmm;
ins->evex_used |= EVEX_len_used;
break;
- case v_mode:
- case dq_mode:
- if (ins->rex & REX_W)
- names = att_names64;
- else if (bytemode == v_mode
- && !(sizeflag & DFLAG))
- names = att_names16;
- else
- names = att_names32;
- break;
- case b_mode:
- names = att_names8rex;
- break;
- case q_mode:
- names = att_names64;
- break;
case mask_bd_mode:
case mask_mode:
if (reg > 0x7)
@@ -273,6 +273,8 @@ static const dependency isa_dependencies[] =
"AMX_TILE" },
{ "AMX_MOVRS",
"AMX_TILE" },
+ { "AMX_AVX512",
+ "AMX_TILE|AVX10_2" },
{ "KL",
"SSE2" },
{ "WIDEKL",
@@ -444,6 +446,7 @@ static bitfield cpu_flags[] =
BITFIELD (AMX_TF32),
BITFIELD (AMX_FP8),
BITFIELD (AMX_MOVRS),
+ BITFIELD (AMX_AVX512),
BITFIELD (AMX_TILE),
BITFIELD (MOVDIRI),
BITFIELD (MOVDIR64B),
@@ -258,6 +258,8 @@ enum i386_cpu
CpuAMX_FP8,
/* AMX-MOVRS Instructions support required. */
CpuAMX_MOVRS,
+ /* AMX-AVX512 Instructions support required. */
+ CpuAMX_AVX512,
/* AMX-TILE instructions required */
CpuAMX_TILE,
/* GFNI instructions required */
@@ -512,6 +514,7 @@ typedef union i386_cpu_flags
unsigned int cpuamx_tf32:1;
unsigned int cpuamx_fp8:1;
unsigned int cpuamx_movrs:1;
+ unsigned int cpuamx_avx512:1;
unsigned int cpuamx_tile:1;
unsigned int cpugfni:1;
unsigned int cpuvaes:1;
@@ -3243,6 +3243,21 @@ t2rpntlvw<z>rs<loc>, 0x<z:pfx>f8 | <loc:opc>, AMX_TRANSPOSE&APX_F(AMX_MOVRS), Si
tileloaddrs, 0xf24a, APX_F(AMX_MOVRS), Sibmem|Vex128|EVex128|Space0F38|VexW0|NoSuf, { Unspecified|BaseIndex, RegTMM }
tileloaddrst1, 0x664a, APX_F(AMX_MOVRS), Sibmem|Vex128|EVex128|Space0F38|VexW0|NoSuf, { Unspecified|BaseIndex, RegTMM }
+tcvtrowd2ps, 0xf34a, AMX_AVX512, Modrm|EVex512|Space0F38|Src2VVVV|VexW0|NoSuf, { Reg32, RegTMM, RegZMM }
+tcvtrowd2ps, 0xf307, AMX_AVX512, Modrm|EVex512|Space0F3A|VexW0|NoSuf, { Imm8, RegTMM, RegZMM }
+
+tcvtrowps2bf16h, 0xf26d, AMX_AVX512, Modrm|EVex512|Space0F38|Src2VVVV|VexW0|NoSuf, { Reg32, RegTMM, RegZMM }
+tcvtrowps2bf16h, 0xf207, AMX_AVX512, Modrm|EVex512|Space0F3A|VexW0|NoSuf, { Imm8, RegTMM, RegZMM }
+tcvtrowps2bf16l, 0xf36d, AMX_AVX512, Modrm|EVex512|Space0F38|Src2VVVV|VexW0|NoSuf, { Reg32, RegTMM, RegZMM }
+tcvtrowps2bf16l, 0xf377, AMX_AVX512, Modrm|EVex512|Space0F3A|VexW0|NoSuf, { Imm8, RegTMM, RegZMM }
+tcvtrowps2phh, 0x6d, AMX_AVX512, Modrm|EVex512|Space0F38|Src2VVVV|VexW0|NoSuf, { Reg32, RegTMM, RegZMM }
+tcvtrowps2phh, 0x07, AMX_AVX512, Modrm|EVex512|Space0F3A|VexW0|NoSuf, { Imm8, RegTMM, RegZMM }
+tcvtrowps2phl, 0x666d, AMX_AVX512, Modrm|EVex512|Space0F38|Src2VVVV|VexW0|NoSuf, { Reg32, RegTMM, RegZMM }
+tcvtrowps2phl, 0xf277, AMX_AVX512, Modrm|EVex512|Space0F3A|VexW0|NoSuf, { Imm8, RegTMM, RegZMM }
+
+tilemovrow, 0x664a, AMX_AVX512, Modrm|EVex512|Space0F38|Src2VVVV|VexW0|NoSuf, { Reg32, RegTMM, RegZMM }
+tilemovrow, 0x6607, AMX_AVX512, Modrm|EVex512|Space0F3A|VexW0|NoSuf, { Imm8, RegTMM, RegZMM }
+
// AMX instructions end.
// KEYLOCKER instructions.