Skip to content

Commit

Permalink
[NFC][X86] Reorg MC tests for APX promoted instrs (#76697)
Browse files Browse the repository at this point in the history
As suggested in #76210, this
patch re-organize the mc tests for apx promoted instrs, instr tests
within same cpuid would be listed in one test.
Also add explicit prefix {evex} tests and 8 displacement memory test,
promoted instrs need set No_CD8 to avoid AVX512 compress encoding.
  • Loading branch information
XinWang10 committed Jan 4, 2024
1 parent dd9681f commit ddf0096
Show file tree
Hide file tree
Showing 87 changed files with 1,911 additions and 777 deletions.
12 changes: 6 additions & 6 deletions llvm/lib/Target/X86/X86InstrMisc.td
Original file line number Diff line number Diff line change
Expand Up @@ -1353,22 +1353,22 @@ multiclass bmi_pdep_pext<string mnemonic, RegisterClass RC,
def rr#Suffix : I<0xF5, MRMSrcReg, (outs RC:$dst), (ins RC:$src1, RC:$src2),
!strconcat(mnemonic, "\t{$src2, $src1, $dst|$dst, $src1, $src2}"),
[(set RC:$dst, (OpNode RC:$src1, RC:$src2))]>,
VEX, VVVV, Sched<[WriteALU]>;
NoCD8, VVVV, Sched<[WriteALU]>;
def rm#Suffix : I<0xF5, MRMSrcMem, (outs RC:$dst), (ins RC:$src1, x86memop:$src2),
!strconcat(mnemonic, "\t{$src2, $src1, $dst|$dst, $src1, $src2}"),
[(set RC:$dst, (OpNode RC:$src1, (ld_frag addr:$src2)))]>,
VEX, VVVV, Sched<[WriteALU.Folded, WriteALU.ReadAfterFold]>;
NoCD8, VVVV, Sched<[WriteALU.Folded, WriteALU.ReadAfterFold]>;
}

let Predicates = [HasBMI2, NoEGPR] in {
defm PDEP32 : bmi_pdep_pext<"pdep{l}", GR32, i32mem,
X86pdep, loadi32>, T8, XD;
X86pdep, loadi32>, T8, XD, VEX;
defm PDEP64 : bmi_pdep_pext<"pdep{q}", GR64, i64mem,
X86pdep, loadi64>, T8, XD, REX_W;
X86pdep, loadi64>, T8, XD, REX_W, VEX;
defm PEXT32 : bmi_pdep_pext<"pext{l}", GR32, i32mem,
X86pext, loadi32>, T8, XS;
X86pext, loadi32>, T8, XS, VEX;
defm PEXT64 : bmi_pdep_pext<"pext{q}", GR64, i64mem,
X86pext, loadi64>, T8, XS, REX_W;
X86pext, loadi64>, T8, XS, REX_W, VEX;
}

let Predicates = [HasBMI2, HasEGPR] in {
Expand Down
2 changes: 1 addition & 1 deletion llvm/lib/Target/X86/X86InstrShiftRotate.td
Original file line number Diff line number Diff line change
Expand Up @@ -868,7 +868,7 @@ let Predicates = [HasBMI2, NoEGPR] in {
defm SHLX64 : bmi_shift<"shlx{q}", GR64, i64mem>, T8, PD, REX_W;
}

let Predicates = [HasBMI2, HasEGPR] in {
let Predicates = [HasBMI2, HasEGPR, In64BitMode] in {
defm RORX32 : bmi_rotate<"rorx{l}", GR32, i32mem, "_EVEX">, EVEX;
defm RORX64 : bmi_rotate<"rorx{q}", GR64, i64mem, "_EVEX">, REX_W, EVEX;
defm SARX32 : bmi_shift<"sarx{l}", GR32, i32mem, "_EVEX">, T8, XS, EVEX;
Expand Down
30 changes: 30 additions & 0 deletions llvm/test/MC/Disassembler/X86/apx/amx-tile.txt
Original file line number Diff line number Diff line change
@@ -1,22 +1,52 @@
# RUN: llvm-mc --disassemble %s -triple=x86_64 | FileCheck %s --check-prefixes=ATT
# RUN: llvm-mc --disassemble %s -triple=x86_64 -x86-asm-syntax=intel --output-asm-variant=1 | FileCheck %s --check-prefixes=INTEL

## ldtilecfg

# ATT: ldtilecfg 123(%rax,%rbx,4)
# INTEL: ldtilecfg [rax + 4*rbx + 123]
0x62,0xf2,0x7c,0x08,0x49,0x44,0x98,0x7b

# ATT: ldtilecfg 291(%r28,%r29,4)
# INTEL: ldtilecfg [r28 + 4*r29 + 291]
0x62,0x9a,0x78,0x08,0x49,0x84,0xac,0x23,0x01,0x00,0x00

## sttilecfg

# ATT: sttilecfg 123(%rax,%rbx,4)
# INTEL: sttilecfg [rax + 4*rbx + 123]
0x62,0xf2,0x7d,0x08,0x49,0x44,0x98,0x7b

# ATT: sttilecfg 291(%r28,%r29,4)
# INTEL: sttilecfg [r28 + 4*r29 + 291]
0x62,0x9a,0x79,0x08,0x49,0x84,0xac,0x23,0x01,0x00,0x00

## tileloadd

# ATT: tileloadd 123(%rax,%rbx,4), %tmm6
# INTEL: tileloadd tmm6, [rax + 4*rbx + 123]
0x62,0xf2,0x7f,0x08,0x4b,0x74,0x98,0x7b

# ATT: tileloadd 291(%r28,%r29,4), %tmm6
# INTEL: tileloadd tmm6, [r28 + 4*r29 + 291]
0x62,0x9a,0x7b,0x08,0x4b,0xb4,0xac,0x23,0x01,0x00,0x00

## tileloaddt1

# ATT: tileloaddt1 123(%rax,%rbx,4), %tmm6
# INTEL: tileloaddt1 tmm6, [rax + 4*rbx + 123]
0x62,0xf2,0x7d,0x08,0x4b,0x74,0x98,0x7b

# ATT: tileloaddt1 291(%r28,%r29,4), %tmm6
# INTEL: tileloaddt1 tmm6, [r28 + 4*r29 + 291]
0x62,0x9a,0x79,0x08,0x4b,0xb4,0xac,0x23,0x01,0x00,0x00

## tilestored

# ATT: tilestored %tmm6, 123(%rax,%rbx,4)
# INTEL: tilestored [rax + 4*rbx + 123], tmm6
0x62,0xf2,0x7e,0x08,0x4b,0x74,0x98,0x7b

# ATT: tilestored %tmm6, 291(%r28,%r29,4)
# INTEL: tilestored [r28 + 4*r29 + 291], tmm6
0x62,0x9a,0x7a,0x08,0x4b,0xb4,0xac,0x23,0x01,0x00,0x00
240 changes: 240 additions & 0 deletions llvm/test/MC/Disassembler/X86/apx/bmi2.txt
Original file line number Diff line number Diff line change
@@ -0,0 +1,240 @@
# RUN: llvm-mc --disassemble %s -triple=x86_64 | FileCheck %s --check-prefixes=ATT
# RUN: llvm-mc --disassemble %s -triple=x86_64 -x86-asm-syntax=intel --output-asm-variant=1 | FileCheck %s --check-prefixes=INTEL

## mulx

# ATT: mulxl %ecx, %edx, %r10d
# INTEL: mulx r10d, edx, ecx
0x62,0x72,0x6f,0x08,0xf6,0xd1

# ATT: mulxq %r9, %r15, %r11
# INTEL: mulx r11, r15, r9
0x62,0x52,0x87,0x08,0xf6,0xd9

# ATT: mulxl 123(%rax,%rbx,4), %ecx, %edx
# INTEL: mulx edx, ecx, dword ptr [rax + 4*rbx + 123]
0x62,0xf2,0x77,0x08,0xf6,0x94,0x98,0x7b,0x00,0x00,0x00

# ATT: mulxq 123(%rax,%rbx,4), %r9, %r15
# INTEL: mulx r15, r9, qword ptr [rax + 4*rbx + 123]
0x62,0x72,0xb7,0x08,0xf6,0xbc,0x98,0x7b,0x00,0x00,0x00

# ATT: mulxl %r18d, %r22d, %r26d
# INTEL: mulx r26d, r22d, r18d
0x62,0x6a,0x4f,0x00,0xf6,0xd2

# ATT: mulxq %r19, %r23, %r27
# INTEL: mulx r27, r23, r19
0x62,0x6a,0xc7,0x00,0xf6,0xdb

# ATT: mulxl 291(%r28,%r29,4), %r18d, %r22d
# INTEL: mulx r22d, r18d, dword ptr [r28 + 4*r29 + 291]
0x62,0x8a,0x6b,0x00,0xf6,0xb4,0xac,0x23,0x01,0x00,0x00

# ATT: mulxq 291(%r28,%r29,4), %r19, %r23
# INTEL: mulx r23, r19, qword ptr [r28 + 4*r29 + 291]
0x62,0x8a,0xe3,0x00,0xf6,0xbc,0xac,0x23,0x01,0x00,0x00

## pdep

# ATT: pdepl %ecx, %edx, %r10d
# INTEL: pdep r10d, edx, ecx
0x62,0x72,0x6f,0x08,0xf5,0xd1

# ATT: pdepq %r9, %r15, %r11
# INTEL: pdep r11, r15, r9
0x62,0x52,0x87,0x08,0xf5,0xd9

# ATT: pdepl 123(%rax,%rbx,4), %ecx, %edx
# INTEL: pdep edx, ecx, dword ptr [rax + 4*rbx + 123]
0x62,0xf2,0x77,0x08,0xf5,0x54,0x98,0x7b

# ATT: pdepq 123(%rax,%rbx,4), %r9, %r15
# INTEL: pdep r15, r9, qword ptr [rax + 4*rbx + 123]
0x62,0x72,0xb7,0x08,0xf5,0x7c,0x98,0x7b

# ATT: pdepl %r18d, %r22d, %r26d
# INTEL: pdep r26d, r22d, r18d
0x62,0x6a,0x4f,0x00,0xf5,0xd2

# ATT: pdepq %r19, %r23, %r27
# INTEL: pdep r27, r23, r19
0x62,0x6a,0xc7,0x00,0xf5,0xdb

# ATT: pdepl 291(%r28,%r29,4), %r18d, %r22d
# INTEL: pdep r22d, r18d, dword ptr [r28 + 4*r29 + 291]
0x62,0x8a,0x6b,0x00,0xf5,0xb4,0xac,0x23,0x01,0x00,0x00

# ATT: pdepq 291(%r28,%r29,4), %r19, %r23
# INTEL: pdep r23, r19, qword ptr [r28 + 4*r29 + 291]
0x62,0x8a,0xe3,0x00,0xf5,0xbc,0xac,0x23,0x01,0x00,0x00

## pext

# ATT: pextl %ecx, %edx, %r10d
# INTEL: pext r10d, edx, ecx
0x62,0x72,0x6e,0x08,0xf5,0xd1

# ATT: pextq %r9, %r15, %r11
# INTEL: pext r11, r15, r9
0x62,0x52,0x86,0x08,0xf5,0xd9

# ATT: pextl 123(%rax,%rbx,4), %ecx, %edx
# INTEL: pext edx, ecx, dword ptr [rax + 4*rbx + 123]
0x62,0xf2,0x76,0x08,0xf5,0x54,0x98,0x7b

# ATT: pextq 123(%rax,%rbx,4), %r9, %r15
# INTEL: pext r15, r9, qword ptr [rax + 4*rbx + 123]
0x62,0x72,0xb6,0x08,0xf5,0x7c,0x98,0x7b

# ATT: pextl %r18d, %r22d, %r26d
# INTEL: pext r26d, r22d, r18d
0x62,0x6a,0x4e,0x00,0xf5,0xd2

# ATT: pextq %r19, %r23, %r27
# INTEL: pext r27, r23, r19
0x62,0x6a,0xc6,0x00,0xf5,0xdb

# ATT: pextl 291(%r28,%r29,4), %r18d, %r22d
# INTEL: pext r22d, r18d, dword ptr [r28 + 4*r29 + 291]
0x62,0x8a,0x6a,0x00,0xf5,0xb4,0xac,0x23,0x01,0x00,0x00

# ATT: pextq 291(%r28,%r29,4), %r19, %r23
# INTEL: pext r23, r19, qword ptr [r28 + 4*r29 + 291]
0x62,0x8a,0xe2,0x00,0xf5,0xbc,0xac,0x23,0x01,0x00,0x00

## rorx

# ATT: rorxl $123, %ecx, %edx
# INTEL: rorx edx, ecx, 123
0x62,0xf3,0x7f,0x08,0xf0,0xd1,0x7b

# ATT: rorxq $123, %r9, %r15
# INTEL: rorx r15, r9, 123
0x62,0x53,0xff,0x08,0xf0,0xf9,0x7b

# ATT: rorxl $123, 123(%rax,%rbx,4), %ecx
# INTEL: rorx ecx, dword ptr [rax + 4*rbx + 123], 123
0x62,0xf3,0x7f,0x08,0xf0,0x8c,0x98,0x7b,0x00,0x00,0x00,0x7b

# ATT: rorxq $123, 123(%rax,%rbx,4), %r9
# INTEL: rorx r9, qword ptr [rax + 4*rbx + 123], 123
0x62,0x73,0xff,0x08,0xf0,0x8c,0x98,0x7b,0x00,0x00,0x00,0x7b

# ATT: rorxl $123, %r18d, %r22d
# INTEL: rorx r22d, r18d, 123
0x62,0xeb,0x7f,0x08,0xf0,0xf2,0x7b

# ATT: rorxq $123, %r19, %r23
# INTEL: rorx r23, r19, 123
0x62,0xeb,0xff,0x08,0xf0,0xfb,0x7b

# ATT: rorxl $123, 291(%r28,%r29,4), %r18d
# INTEL: rorx r18d, dword ptr [r28 + 4*r29 + 291], 123
0x62,0x8b,0x7b,0x08,0xf0,0x94,0xac,0x23,0x01,0x00,0x00,0x7b

# ATT: rorxq $123, 291(%r28,%r29,4), %r19
# INTEL: rorx r19, qword ptr [r28 + 4*r29 + 291], 123
0x62,0x8b,0xfb,0x08,0xf0,0x9c,0xac,0x23,0x01,0x00,0x00,0x7b

## sarx

# ATT: sarxl %ecx, %edx, %r10d
# INTEL: sarx r10d, edx, ecx
0x62,0x72,0x76,0x08,0xf7,0xd2

# ATT: sarxl %ecx, 123(%rax,%rbx,4), %edx
# INTEL: sarx edx, dword ptr [rax + 4*rbx + 123], ecx
0x62,0xf2,0x76,0x08,0xf7,0x94,0x98,0x7b,0x00,0x00,0x00

# ATT: sarxq %r9, %r15, %r11
# INTEL: sarx r11, r15, r9
0x62,0x52,0xb6,0x08,0xf7,0xdf

# ATT: sarxq %r9, 123(%rax,%rbx,4), %r15
# INTEL: sarx r15, qword ptr [rax + 4*rbx + 123], r9
0x62,0x72,0xb6,0x08,0xf7,0xbc,0x98,0x7b,0x00,0x00,0x00

# ATT: sarxl %r18d, %r22d, %r26d
# INTEL: sarx r26d, r22d, r18d
0x62,0x6a,0x6e,0x00,0xf7,0xd6

# ATT: sarxl %r18d, 291(%r28,%r29,4), %r22d
# INTEL: sarx r22d, dword ptr [r28 + 4*r29 + 291], r18d
0x62,0x8a,0x6a,0x00,0xf7,0xb4,0xac,0x23,0x01,0x00,0x00

# ATT: sarxq %r19, %r23, %r27
# INTEL: sarx r27, r23, r19
0x62,0x6a,0xe6,0x00,0xf7,0xdf

# ATT: sarxq %r19, 291(%r28,%r29,4), %r23
# INTEL: sarx r23, qword ptr [r28 + 4*r29 + 291], r19
0x62,0x8a,0xe2,0x00,0xf7,0xbc,0xac,0x23,0x01,0x00,0x00

## shlx

# ATT: shlxl %ecx, %edx, %r10d
# INTEL: shlx r10d, edx, ecx
0x62,0x72,0x75,0x08,0xf7,0xd2

# ATT: shlxl %ecx, 123(%rax,%rbx,4), %edx
# INTEL: shlx edx, dword ptr [rax + 4*rbx + 123], ecx
0x62,0xf2,0x75,0x08,0xf7,0x94,0x98,0x7b,0x00,0x00,0x00

# ATT: shlxq %r9, %r15, %r11
# INTEL: shlx r11, r15, r9
0x62,0x52,0xb5,0x08,0xf7,0xdf

# ATT: shlxq %r9, 123(%rax,%rbx,4), %r15
# INTEL: shlx r15, qword ptr [rax + 4*rbx + 123], r9
0x62,0x72,0xb5,0x08,0xf7,0xbc,0x98,0x7b,0x00,0x00,0x00

# ATT: shlxl %r18d, %r22d, %r26d
# INTEL: shlx r26d, r22d, r18d
0x62,0x6a,0x6d,0x00,0xf7,0xd6

# ATT: shlxl %r18d, 291(%r28,%r29,4), %r22d
# INTEL: shlx r22d, dword ptr [r28 + 4*r29 + 291], r18d
0x62,0x8a,0x69,0x00,0xf7,0xb4,0xac,0x23,0x01,0x00,0x00

# ATT: shlxq %r19, %r23, %r27
# INTEL: shlx r27, r23, r19
0x62,0x6a,0xe5,0x00,0xf7,0xdf

# ATT: shlxq %r19, 291(%r28,%r29,4), %r23
# INTEL: shlx r23, qword ptr [r28 + 4*r29 + 291], r19
0x62,0x8a,0xe1,0x00,0xf7,0xbc,0xac,0x23,0x01,0x00,0x00

## shrx

# ATT: shrxl %ecx, %edx, %r10d
# INTEL: shrx r10d, edx, ecx
0x62,0x72,0x77,0x08,0xf7,0xd2

# ATT: shrxl %ecx, 123(%rax,%rbx,4), %edx
# INTEL: shrx edx, dword ptr [rax + 4*rbx + 123], ecx
0x62,0xf2,0x77,0x08,0xf7,0x94,0x98,0x7b,0x00,0x00,0x00

# ATT: shrxq %r9, %r15, %r11
# INTEL: shrx r11, r15, r9
0x62,0x52,0xb7,0x08,0xf7,0xdf

# ATT: shrxq %r9, 123(%rax,%rbx,4), %r15
# INTEL: shrx r15, qword ptr [rax + 4*rbx + 123], r9
0x62,0x72,0xb7,0x08,0xf7,0xbc,0x98,0x7b,0x00,0x00,0x00

# ATT: shrxl %r18d, %r22d, %r26d
# INTEL: shrx r26d, r22d, r18d
0x62,0x6a,0x6f,0x00,0xf7,0xd6

# ATT: shrxl %r18d, 291(%r28,%r29,4), %r22d
# INTEL: shrx r22d, dword ptr [r28 + 4*r29 + 291], r18d
0x62,0x8a,0x6b,0x00,0xf7,0xb4,0xac,0x23,0x01,0x00,0x00

# ATT: shrxq %r19, %r23, %r27
# INTEL: shrx r27, r23, r19
0x62,0x6a,0xe7,0x00,0xf7,0xdf

# ATT: shrxq %r19, 291(%r28,%r29,4), %r23
# INTEL: shrx r23, qword ptr [r28 + 4*r29 + 291], r19
0x62,0x8a,0xe3,0x00,0xf7,0xbc,0xac,0x23,0x01,0x00,0x00
42 changes: 42 additions & 0 deletions llvm/test/MC/Disassembler/X86/apx/cet.txt
Original file line number Diff line number Diff line change
@@ -0,0 +1,42 @@
# RUN: llvm-mc --disassemble %s -triple=x86_64 | FileCheck %s --check-prefixes=ATT
# RUN: llvm-mc --disassemble %s -triple=x86_64 -x86-asm-syntax=intel --output-asm-variant=1 | FileCheck %s --check-prefixes=INTEL

## wrssd

# ATT: wrssd %ecx, 123(%rax,%rbx,4)
# INTEL: wrssd dword ptr [rax + 4*rbx + 123], ecx
0x62,0xf4,0x7c,0x08,0x66,0x4c,0x98,0x7b

# ATT: wrssd %r18d, 291(%r28,%r29,4)
# INTEL: wrssd dword ptr [r28 + 4*r29 + 291], r18d
0x62,0x8c,0x78,0x08,0x66,0x94,0xac,0x23,0x01,0x00,0x00

## wrssq

# ATT: wrssq %r9, 123(%rax,%rbx,4)
# INTEL: wrssq qword ptr [rax + 4*rbx + 123], r9
0x62,0x74,0xfc,0x08,0x66,0x4c,0x98,0x7b

# ATT: wrssq %r19, 291(%r28,%r29,4)
# INTEL: wrssq qword ptr [r28 + 4*r29 + 291], r19
0x62,0x8c,0xf8,0x08,0x66,0x9c,0xac,0x23,0x01,0x00,0x00

## wrussd

# ATT: wrussd %ecx, 123(%rax,%rbx,4)
# INTEL: wrussd dword ptr [rax + 4*rbx + 123], ecx
0x62,0xf4,0x7d,0x08,0x65,0x4c,0x98,0x7b

# ATT: wrussd %r18d, 291(%r28,%r29,4)
# INTEL: wrussd dword ptr [r28 + 4*r29 + 291], r18d
0x62,0x8c,0x79,0x08,0x65,0x94,0xac,0x23,0x01,0x00,0x00

## wrussq

# ATT: wrussq %r9, 123(%rax,%rbx,4)
# INTEL: wrussq qword ptr [rax + 4*rbx + 123], r9
0x62,0x74,0xfd,0x08,0x65,0x4c,0x98,0x7b

# ATT: wrussq %r19, 291(%r28,%r29,4)
# INTEL: wrussq qword ptr [r28 + 4*r29 + 291], r19
0x62,0x8c,0xf9,0x08,0x65,0x9c,0xac,0x23,0x01,0x00,0x00

0 comments on commit ddf0096

Please sign in to comment.