129 changes: 129 additions & 0 deletions llvm/test/tools/llvm-mca/X86/Znver4/resources-avx512vbmi.s
Original file line number Diff line number Diff line change
@@ -0,0 +1,129 @@
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver4 -instruction-tables < %s | FileCheck %s

# vpermb, 512-bit: register / memory source, each unmasked, write-masked
# by k1, and write-masked with zeroing.
vpermb %zmm16, %zmm17, %zmm19
vpermb (%rax), %zmm17, %zmm19
vpermb %zmm16, %zmm17, %zmm19 {%k1}
vpermb (%rax), %zmm17, %zmm19 {%k1}
vpermb %zmm16, %zmm17, %zmm19 {%k1} {z}
vpermb (%rax), %zmm17, %zmm19 {%k1} {z}

# vpermi2b, 512-bit: same six operand shapes as above.
vpermi2b %zmm16, %zmm17, %zmm19
vpermi2b (%rax), %zmm17, %zmm19
vpermi2b %zmm16, %zmm17, %zmm19 {%k1}
vpermi2b (%rax), %zmm17, %zmm19 {%k1}
vpermi2b %zmm16, %zmm17, %zmm19 {%k1} {z}
vpermi2b (%rax), %zmm17, %zmm19 {%k1} {z}

# vpermt2b, 512-bit: same six operand shapes as above.
vpermt2b %zmm16, %zmm17, %zmm19
vpermt2b (%rax), %zmm17, %zmm19
vpermt2b %zmm16, %zmm17, %zmm19 {%k1}
vpermt2b (%rax), %zmm17, %zmm19 {%k1}
vpermt2b %zmm16, %zmm17, %zmm19 {%k1} {z}
vpermt2b (%rax), %zmm17, %zmm19 {%k1} {z}

# vpmultishiftqb, 512-bit: register, full-width memory and {1to8}
# broadcast memory source, each unmasked, write-masked by k1, and
# write-masked with zeroing.
vpmultishiftqb %zmm16, %zmm17, %zmm19
vpmultishiftqb (%rax), %zmm17, %zmm19
vpmultishiftqb (%rax){1to8}, %zmm17, %zmm19
vpmultishiftqb %zmm16, %zmm17, %zmm19 {%k1}
vpmultishiftqb (%rax), %zmm17, %zmm19 {%k1}
vpmultishiftqb (%rax){1to8}, %zmm17, %zmm19 {%k1}
vpmultishiftqb %zmm16, %zmm17, %zmm19 {%k1} {z}
vpmultishiftqb (%rax), %zmm17, %zmm19 {%k1} {z}
vpmultishiftqb (%rax){1to8}, %zmm17, %zmm19 {%k1} {z}

# CHECK: Instruction Info:
# CHECK-NEXT: [1]: #uOps
# CHECK-NEXT: [2]: Latency
# CHECK-NEXT: [3]: RThroughput
# CHECK-NEXT: [4]: MayLoad
# CHECK-NEXT: [5]: MayStore
# CHECK-NEXT: [6]: HasSideEffects (U)

# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
# CHECK-NEXT: 1 5 1.00 vpermb %zmm16, %zmm17, %zmm19
# CHECK-NEXT: 2 8 0.50 * vpermb (%rax), %zmm17, %zmm19
# CHECK-NEXT: 1 5 1.00 vpermb %zmm16, %zmm17, %zmm19 {%k1}
# CHECK-NEXT: 2 8 0.50 * vpermb (%rax), %zmm17, %zmm19 {%k1}
# CHECK-NEXT: 1 5 1.00 vpermb %zmm16, %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: 2 8 0.50 * vpermb (%rax), %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: 1 5 1.00 vpermi2b %zmm16, %zmm17, %zmm19
# CHECK-NEXT: 2 8 0.50 * vpermi2b (%rax), %zmm17, %zmm19
# CHECK-NEXT: 1 5 1.00 vpermi2b %zmm16, %zmm17, %zmm19 {%k1}
# CHECK-NEXT: 2 8 0.50 * vpermi2b (%rax), %zmm17, %zmm19 {%k1}
# CHECK-NEXT: 1 5 1.00 vpermi2b %zmm16, %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: 2 8 0.50 * vpermi2b (%rax), %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: 1 5 1.00 vpermt2b %zmm16, %zmm17, %zmm19
# CHECK-NEXT: 2 8 0.50 * vpermt2b (%rax), %zmm17, %zmm19
# CHECK-NEXT: 1 5 1.00 vpermt2b %zmm16, %zmm17, %zmm19 {%k1}
# CHECK-NEXT: 2 8 0.50 * vpermt2b (%rax), %zmm17, %zmm19 {%k1}
# CHECK-NEXT: 1 5 1.00 vpermt2b %zmm16, %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: 2 8 0.50 * vpermt2b (%rax), %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: 1 1 0.50 vpmultishiftqb %zmm16, %zmm17, %zmm19
# CHECK-NEXT: 1 8 0.50 * vpmultishiftqb (%rax), %zmm17, %zmm19
# CHECK-NEXT: 1 8 0.50 * vpmultishiftqb (%rax){1to8}, %zmm17, %zmm19
# CHECK-NEXT: 1 1 0.50 vpmultishiftqb %zmm16, %zmm17, %zmm19 {%k1}
# CHECK-NEXT: 1 8 0.50 * vpmultishiftqb (%rax), %zmm17, %zmm19 {%k1}
# CHECK-NEXT: 1 8 0.50 * vpmultishiftqb (%rax){1to8}, %zmm17, %zmm19 {%k1}
# CHECK-NEXT: 1 1 0.50 vpmultishiftqb %zmm16, %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: 1 8 0.50 * vpmultishiftqb (%rax), %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: 1 8 0.50 * vpmultishiftqb (%rax){1to8}, %zmm17, %zmm19 {%k1} {z}

# CHECK: Resources:
# CHECK-NEXT: [0] - Zn4AGU0
# CHECK-NEXT: [1] - Zn4AGU1
# CHECK-NEXT: [2] - Zn4AGU2
# CHECK-NEXT: [3] - Zn4ALU0
# CHECK-NEXT: [4] - Zn4ALU1
# CHECK-NEXT: [5] - Zn4ALU2
# CHECK-NEXT: [6] - Zn4ALU3
# CHECK-NEXT: [7] - Zn4BRU1
# CHECK-NEXT: [8] - Zn4FP0
# CHECK-NEXT: [9] - Zn4FP1
# CHECK-NEXT: [10] - Zn4FP2
# CHECK-NEXT: [11] - Zn4FP3
# CHECK-NEXT: [12.0] - Zn4FP45
# CHECK-NEXT: [12.1] - Zn4FP45
# CHECK-NEXT: [13] - Zn4FPSt
# CHECK-NEXT: [14.0] - Zn4LSU
# CHECK-NEXT: [14.1] - Zn4LSU
# CHECK-NEXT: [14.2] - Zn4LSU
# CHECK-NEXT: [15.0] - Zn4Load
# CHECK-NEXT: [15.1] - Zn4Load
# CHECK-NEXT: [15.2] - Zn4Load
# CHECK-NEXT: [16.0] - Zn4Store
# CHECK-NEXT: [16.1] - Zn4Store

# CHECK: Resource pressure per iteration:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
# CHECK-NEXT: - - - - - - - - 4.50 18.00 18.00 4.50 7.50 7.50 - 5.00 5.00 5.00 5.00 5.00 5.00 - -

# CHECK: Resource pressure by instruction:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
# CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - vpermb %zmm16, %zmm17, %zmm19
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpermb (%rax), %zmm17, %zmm19
# CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - vpermb %zmm16, %zmm17, %zmm19 {%k1}
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpermb (%rax), %zmm17, %zmm19 {%k1}
# CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - vpermb %zmm16, %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpermb (%rax), %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - vpermi2b %zmm16, %zmm17, %zmm19
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpermi2b (%rax), %zmm17, %zmm19
# CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - vpermi2b %zmm16, %zmm17, %zmm19 {%k1}
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpermi2b (%rax), %zmm17, %zmm19 {%k1}
# CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - vpermi2b %zmm16, %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpermi2b (%rax), %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - vpermt2b %zmm16, %zmm17, %zmm19
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpermt2b (%rax), %zmm17, %zmm19
# CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - vpermt2b %zmm16, %zmm17, %zmm19 {%k1}
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpermt2b (%rax), %zmm17, %zmm19 {%k1}
# CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - vpermt2b %zmm16, %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpermt2b (%rax), %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - vpmultishiftqb %zmm16, %zmm17, %zmm19
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpmultishiftqb (%rax), %zmm17, %zmm19
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpmultishiftqb (%rax){1to8}, %zmm17, %zmm19
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - vpmultishiftqb %zmm16, %zmm17, %zmm19 {%k1}
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpmultishiftqb (%rax), %zmm17, %zmm19 {%k1}
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpmultishiftqb (%rax){1to8}, %zmm17, %zmm19 {%k1}
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - vpmultishiftqb %zmm16, %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpmultishiftqb (%rax), %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpmultishiftqb (%rax){1to8}, %zmm17, %zmm19 {%k1} {z}
408 changes: 408 additions & 0 deletions llvm/test/tools/llvm-mca/X86/Znver4/resources-avx512vbmi2.s

Large diffs are not rendered by default.

772 changes: 772 additions & 0 deletions llvm/test/tools/llvm-mca/X86/Znver4/resources-avx512vbmi2vl.s

Large diffs are not rendered by default.

214 changes: 214 additions & 0 deletions llvm/test/tools/llvm-mca/X86/Znver4/resources-avx512vbmivl.s

Large diffs are not rendered by default.

4,419 changes: 4,419 additions & 0 deletions llvm/test/tools/llvm-mca/X86/Znver4/resources-avx512vl.s

Large diffs are not rendered by default.

156 changes: 156 additions & 0 deletions llvm/test/tools/llvm-mca/X86/Znver4/resources-avx512vnni.s
Original file line number Diff line number Diff line change
@@ -0,0 +1,156 @@
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver4 -instruction-tables < %s | FileCheck %s

# Every group below covers the same nine operand shapes: register,
# full-width memory and {1to16} broadcast memory source, each unmasked,
# write-masked by k1, and write-masked with zeroing.

# vpdpbusd, 512-bit.
vpdpbusd %zmm16, %zmm17, %zmm19
vpdpbusd (%rax), %zmm17, %zmm19
vpdpbusd (%rax){1to16}, %zmm17, %zmm19
vpdpbusd %zmm16, %zmm17, %zmm19 {%k1}
vpdpbusd (%rax), %zmm17, %zmm19 {%k1}
vpdpbusd (%rax){1to16}, %zmm17, %zmm19 {%k1}
vpdpbusd %zmm16, %zmm17, %zmm19 {%k1} {z}
vpdpbusd (%rax), %zmm17, %zmm19 {%k1} {z}
vpdpbusd (%rax){1to16}, %zmm17, %zmm19 {%k1} {z}

# vpdpbusds, 512-bit.
vpdpbusds %zmm16, %zmm17, %zmm19
vpdpbusds (%rax), %zmm17, %zmm19
vpdpbusds (%rax){1to16}, %zmm17, %zmm19
vpdpbusds %zmm16, %zmm17, %zmm19 {%k1}
vpdpbusds (%rax), %zmm17, %zmm19 {%k1}
vpdpbusds (%rax){1to16}, %zmm17, %zmm19 {%k1}
vpdpbusds %zmm16, %zmm17, %zmm19 {%k1} {z}
vpdpbusds (%rax), %zmm17, %zmm19 {%k1} {z}
vpdpbusds (%rax){1to16}, %zmm17, %zmm19 {%k1} {z}

# vpdpwssd, 512-bit.
vpdpwssd %zmm16, %zmm17, %zmm19
vpdpwssd (%rax), %zmm17, %zmm19
vpdpwssd (%rax){1to16}, %zmm17, %zmm19
vpdpwssd %zmm16, %zmm17, %zmm19 {%k1}
vpdpwssd (%rax), %zmm17, %zmm19 {%k1}
vpdpwssd (%rax){1to16}, %zmm17, %zmm19 {%k1}
vpdpwssd %zmm16, %zmm17, %zmm19 {%k1} {z}
vpdpwssd (%rax), %zmm17, %zmm19 {%k1} {z}
vpdpwssd (%rax){1to16}, %zmm17, %zmm19 {%k1} {z}

# vpdpwssds, 512-bit.
vpdpwssds %zmm16, %zmm17, %zmm19
vpdpwssds (%rax), %zmm17, %zmm19
vpdpwssds (%rax){1to16}, %zmm17, %zmm19
vpdpwssds %zmm16, %zmm17, %zmm19 {%k1}
vpdpwssds (%rax), %zmm17, %zmm19 {%k1}
vpdpwssds (%rax){1to16}, %zmm17, %zmm19 {%k1}
vpdpwssds %zmm16, %zmm17, %zmm19 {%k1} {z}
vpdpwssds (%rax), %zmm17, %zmm19 {%k1} {z}
vpdpwssds (%rax){1to16}, %zmm17, %zmm19 {%k1} {z}

# CHECK: Instruction Info:
# CHECK-NEXT: [1]: #uOps
# CHECK-NEXT: [2]: Latency
# CHECK-NEXT: [3]: RThroughput
# CHECK-NEXT: [4]: MayLoad
# CHECK-NEXT: [5]: MayStore
# CHECK-NEXT: [6]: HasSideEffects (U)

# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
# CHECK-NEXT: 1 4 2.00 vpdpbusd %zmm16, %zmm17, %zmm19
# CHECK-NEXT: 1 10 1.00 * vpdpbusd (%rax), %zmm17, %zmm19
# CHECK-NEXT: 1 10 1.00 * vpdpbusd (%rax){1to16}, %zmm17, %zmm19
# CHECK-NEXT: 1 4 2.00 vpdpbusd %zmm16, %zmm17, %zmm19 {%k1}
# CHECK-NEXT: 1 10 1.00 * vpdpbusd (%rax), %zmm17, %zmm19 {%k1}
# CHECK-NEXT: 1 10 1.00 * vpdpbusd (%rax){1to16}, %zmm17, %zmm19 {%k1}
# CHECK-NEXT: 1 4 2.00 vpdpbusd %zmm16, %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: 1 10 1.00 * vpdpbusd (%rax), %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: 1 10 1.00 * vpdpbusd (%rax){1to16}, %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: 1 4 2.00 vpdpbusds %zmm16, %zmm17, %zmm19
# CHECK-NEXT: 1 10 1.00 * vpdpbusds (%rax), %zmm17, %zmm19
# CHECK-NEXT: 1 10 1.00 * vpdpbusds (%rax){1to16}, %zmm17, %zmm19
# CHECK-NEXT: 1 4 2.00 vpdpbusds %zmm16, %zmm17, %zmm19 {%k1}
# CHECK-NEXT: 1 10 1.00 * vpdpbusds (%rax), %zmm17, %zmm19 {%k1}
# CHECK-NEXT: 1 10 1.00 * vpdpbusds (%rax){1to16}, %zmm17, %zmm19 {%k1}
# CHECK-NEXT: 1 4 2.00 vpdpbusds %zmm16, %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: 1 10 1.00 * vpdpbusds (%rax), %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: 1 10 1.00 * vpdpbusds (%rax){1to16}, %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: 1 4 2.00 vpdpwssd %zmm16, %zmm17, %zmm19
# CHECK-NEXT: 1 10 1.00 * vpdpwssd (%rax), %zmm17, %zmm19
# CHECK-NEXT: 1 10 1.00 * vpdpwssd (%rax){1to16}, %zmm17, %zmm19
# CHECK-NEXT: 1 4 2.00 vpdpwssd %zmm16, %zmm17, %zmm19 {%k1}
# CHECK-NEXT: 1 10 1.00 * vpdpwssd (%rax), %zmm17, %zmm19 {%k1}
# CHECK-NEXT: 1 10 1.00 * vpdpwssd (%rax){1to16}, %zmm17, %zmm19 {%k1}
# CHECK-NEXT: 1 4 2.00 vpdpwssd %zmm16, %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: 1 10 1.00 * vpdpwssd (%rax), %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: 1 10 1.00 * vpdpwssd (%rax){1to16}, %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: 1 4 2.00 vpdpwssds %zmm16, %zmm17, %zmm19
# CHECK-NEXT: 1 10 1.00 * vpdpwssds (%rax), %zmm17, %zmm19
# CHECK-NEXT: 1 10 1.00 * vpdpwssds (%rax){1to16}, %zmm17, %zmm19
# CHECK-NEXT: 1 4 2.00 vpdpwssds %zmm16, %zmm17, %zmm19 {%k1}
# CHECK-NEXT: 1 10 1.00 * vpdpwssds (%rax), %zmm17, %zmm19 {%k1}
# CHECK-NEXT: 1 10 1.00 * vpdpwssds (%rax){1to16}, %zmm17, %zmm19 {%k1}
# CHECK-NEXT: 1 4 2.00 vpdpwssds %zmm16, %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: 1 10 1.00 * vpdpwssds (%rax), %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: 1 10 1.00 * vpdpwssds (%rax){1to16}, %zmm17, %zmm19 {%k1} {z}

# CHECK: Resources:
# CHECK-NEXT: [0] - Zn4AGU0
# CHECK-NEXT: [1] - Zn4AGU1
# CHECK-NEXT: [2] - Zn4AGU2
# CHECK-NEXT: [3] - Zn4ALU0
# CHECK-NEXT: [4] - Zn4ALU1
# CHECK-NEXT: [5] - Zn4ALU2
# CHECK-NEXT: [6] - Zn4ALU3
# CHECK-NEXT: [7] - Zn4BRU1
# CHECK-NEXT: [8] - Zn4FP0
# CHECK-NEXT: [9] - Zn4FP1
# CHECK-NEXT: [10] - Zn4FP2
# CHECK-NEXT: [11] - Zn4FP3
# CHECK-NEXT: [12.0] - Zn4FP45
# CHECK-NEXT: [12.1] - Zn4FP45
# CHECK-NEXT: [13] - Zn4FPSt
# CHECK-NEXT: [14.0] - Zn4LSU
# CHECK-NEXT: [14.1] - Zn4LSU
# CHECK-NEXT: [14.2] - Zn4LSU
# CHECK-NEXT: [15.0] - Zn4Load
# CHECK-NEXT: [15.1] - Zn4Load
# CHECK-NEXT: [15.2] - Zn4Load
# CHECK-NEXT: [16.0] - Zn4Store
# CHECK-NEXT: [16.1] - Zn4Store

# CHECK: Resource pressure per iteration:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
# CHECK-NEXT: - - - - - - - - 48.00 24.00 - 24.00 12.00 12.00 - 8.00 8.00 8.00 8.00 8.00 8.00 - -

# CHECK: Resource pressure by instruction:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpbusd %zmm16, %zmm17, %zmm19
# CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusd (%rax), %zmm17, %zmm19
# CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusd (%rax){1to16}, %zmm17, %zmm19
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpbusd %zmm16, %zmm17, %zmm19 {%k1}
# CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusd (%rax), %zmm17, %zmm19 {%k1}
# CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusd (%rax){1to16}, %zmm17, %zmm19 {%k1}
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpbusd %zmm16, %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusd (%rax), %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusd (%rax){1to16}, %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpbusds %zmm16, %zmm17, %zmm19
# CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusds (%rax), %zmm17, %zmm19
# CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusds (%rax){1to16}, %zmm17, %zmm19
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpbusds %zmm16, %zmm17, %zmm19 {%k1}
# CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusds (%rax), %zmm17, %zmm19 {%k1}
# CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusds (%rax){1to16}, %zmm17, %zmm19 {%k1}
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpbusds %zmm16, %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusds (%rax), %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusds (%rax){1to16}, %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpwssd %zmm16, %zmm17, %zmm19
# CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssd (%rax), %zmm17, %zmm19
# CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssd (%rax){1to16}, %zmm17, %zmm19
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpwssd %zmm16, %zmm17, %zmm19 {%k1}
# CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssd (%rax), %zmm17, %zmm19 {%k1}
# CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssd (%rax){1to16}, %zmm17, %zmm19 {%k1}
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpwssd %zmm16, %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssd (%rax), %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssd (%rax){1to16}, %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpwssds %zmm16, %zmm17, %zmm19
# CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssds (%rax), %zmm17, %zmm19
# CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssds (%rax){1to16}, %zmm17, %zmm19
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpwssds %zmm16, %zmm17, %zmm19 {%k1}
# CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssds (%rax), %zmm17, %zmm19 {%k1}
# CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssds (%rax){1to16}, %zmm17, %zmm19 {%k1}
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpwssds %zmm16, %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssds (%rax), %zmm17, %zmm19 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssds (%rax){1to16}, %zmm17, %zmm19 {%k1} {z}
268 changes: 268 additions & 0 deletions llvm/test/tools/llvm-mca/X86/Znver4/resources-avx512vnnivl.s

Large diffs are not rendered by default.

53 changes: 53 additions & 0 deletions llvm/test/tools/llvm-mca/X86/Znver4/resources-avx512vp2intersect.s
Original file line number Diff line number Diff line change
@@ -0,0 +1,53 @@
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=tigerlake -instruction-tables < %s | FileCheck %s

# NOTE(review): the llvm-mca command line at the top of this file passes
# -mcpu=tigerlake and the expected resource names below are ICX*, not Zn4*,
# so this input is not measured against the Znver4 model even though the
# file lives in the Znver4 test directory. Confirm whether that is intended
# before relying on it for Znver4 coverage.

# vp2intersectd, 512-bit: register, full-width memory and {1to16} broadcast
# memory source; destination is written as %k0.
vp2intersectd %zmm16, %zmm19, %k0
vp2intersectd (%rax), %zmm19, %k0
vp2intersectd (%rax){1to16}, %zmm19, %k0

# vp2intersectq, 512-bit: same three shapes, broadcast is {1to8}.
vp2intersectq %zmm16, %zmm19, %k0
vp2intersectq (%rax), %zmm19, %k0
vp2intersectq (%rax){1to8}, %zmm19, %k0

# CHECK: Instruction Info:
# CHECK-NEXT: [1]: #uOps
# CHECK-NEXT: [2]: Latency
# CHECK-NEXT: [3]: RThroughput
# CHECK-NEXT: [4]: MayLoad
# CHECK-NEXT: [5]: MayStore
# CHECK-NEXT: [6]: HasSideEffects (U)

# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
# CHECK-NEXT: 1 1 1.00 vp2intersectd %zmm16, %zmm19, %k0
# CHECK-NEXT: 2 8 1.00 * vp2intersectd (%rax), %zmm19, %k0
# CHECK-NEXT: 2 8 1.00 * vp2intersectd (%rax){1to16}, %zmm19, %k0
# CHECK-NEXT: 1 1 1.00 vp2intersectq %zmm16, %zmm19, %k0
# CHECK-NEXT: 2 8 1.00 * vp2intersectq (%rax), %zmm19, %k0
# CHECK-NEXT: 2 8 1.00 * vp2intersectq (%rax){1to8}, %zmm19, %k0

# CHECK: Resources:
# CHECK-NEXT: [0] - ICXDivider
# CHECK-NEXT: [1] - ICXFPDivider
# CHECK-NEXT: [2] - ICXPort0
# CHECK-NEXT: [3] - ICXPort1
# CHECK-NEXT: [4] - ICXPort2
# CHECK-NEXT: [5] - ICXPort3
# CHECK-NEXT: [6] - ICXPort4
# CHECK-NEXT: [7] - ICXPort5
# CHECK-NEXT: [8] - ICXPort6
# CHECK-NEXT: [9] - ICXPort7
# CHECK-NEXT: [10] - ICXPort8
# CHECK-NEXT: [11] - ICXPort9

# CHECK: Resource pressure per iteration:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11]
# CHECK-NEXT: - - 6.00 - 2.00 2.00 - - - - - -

# CHECK: Resource pressure by instruction:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] Instructions:
# CHECK-NEXT: - - 1.00 - - - - - - - - - vp2intersectd %zmm16, %zmm19, %k0
# CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - - - vp2intersectd (%rax), %zmm19, %k0
# CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - - - vp2intersectd (%rax){1to16}, %zmm19, %k0
# CHECK-NEXT: - - 1.00 - - - - - - - - - vp2intersectq %zmm16, %zmm19, %k0
# CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - - - vp2intersectq (%rax), %zmm19, %k0
# CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - - - vp2intersectq (%rax){1to8}, %zmm19, %k0
Original file line number Diff line number Diff line change
@@ -0,0 +1,73 @@
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=tigerlake -instruction-tables < %s | FileCheck %s

# NOTE(review): the llvm-mca command line at the top of this file passes
# -mcpu=tigerlake and the expected resource names below are ICX*. If this
# file sits in a Znver4 test directory (presumably, alongside its 512-bit
# sibling), it does not exercise the Znver4 model - confirm intent.

# vp2intersectd, 128-bit: register, full-width memory, {1to4} broadcast.
vp2intersectd %xmm16, %xmm19, %k0
vp2intersectd (%rax), %xmm19, %k0
vp2intersectd (%rax){1to4}, %xmm19, %k0

# vp2intersectd, 256-bit: register, full-width memory, {1to8} broadcast.
vp2intersectd %ymm16, %ymm19, %k0
vp2intersectd (%rax), %ymm19, %k0
vp2intersectd (%rax){1to8}, %ymm19, %k0

# vp2intersectq, 128-bit: register, full-width memory, {1to2} broadcast.
vp2intersectq %xmm16, %xmm19, %k0
vp2intersectq (%rax), %xmm19, %k0
vp2intersectq (%rax){1to2}, %xmm19, %k0

# vp2intersectq, 256-bit: register, full-width memory, {1to4} broadcast.
vp2intersectq %ymm16, %ymm19, %k0
vp2intersectq (%rax), %ymm19, %k0
vp2intersectq (%rax){1to4}, %ymm19, %k0

# CHECK: Instruction Info:
# CHECK-NEXT: [1]: #uOps
# CHECK-NEXT: [2]: Latency
# CHECK-NEXT: [3]: RThroughput
# CHECK-NEXT: [4]: MayLoad
# CHECK-NEXT: [5]: MayStore
# CHECK-NEXT: [6]: HasSideEffects (U)

# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
# CHECK-NEXT: 1 1 0.50 vp2intersectd %xmm16, %xmm19, %k0
# CHECK-NEXT: 2 7 0.50 * vp2intersectd (%rax), %xmm19, %k0
# CHECK-NEXT: 2 7 0.50 * vp2intersectd (%rax){1to4}, %xmm19, %k0
# CHECK-NEXT: 1 1 0.50 vp2intersectd %ymm16, %ymm19, %k0
# CHECK-NEXT: 2 8 0.50 * vp2intersectd (%rax), %ymm19, %k0
# CHECK-NEXT: 2 8 0.50 * vp2intersectd (%rax){1to8}, %ymm19, %k0
# CHECK-NEXT: 1 1 0.50 vp2intersectq %xmm16, %xmm19, %k0
# CHECK-NEXT: 2 7 0.50 * vp2intersectq (%rax), %xmm19, %k0
# CHECK-NEXT: 2 7 0.50 * vp2intersectq (%rax){1to2}, %xmm19, %k0
# CHECK-NEXT: 1 1 0.50 vp2intersectq %ymm16, %ymm19, %k0
# CHECK-NEXT: 2 8 0.50 * vp2intersectq (%rax), %ymm19, %k0
# CHECK-NEXT: 2 8 0.50 * vp2intersectq (%rax){1to4}, %ymm19, %k0

# CHECK: Resources:
# CHECK-NEXT: [0] - ICXDivider
# CHECK-NEXT: [1] - ICXFPDivider
# CHECK-NEXT: [2] - ICXPort0
# CHECK-NEXT: [3] - ICXPort1
# CHECK-NEXT: [4] - ICXPort2
# CHECK-NEXT: [5] - ICXPort3
# CHECK-NEXT: [6] - ICXPort4
# CHECK-NEXT: [7] - ICXPort5
# CHECK-NEXT: [8] - ICXPort6
# CHECK-NEXT: [9] - ICXPort7
# CHECK-NEXT: [10] - ICXPort8
# CHECK-NEXT: [11] - ICXPort9

# CHECK: Resource pressure per iteration:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11]
# CHECK-NEXT: - - 6.00 6.00 4.00 4.00 - - - - - -

# CHECK: Resource pressure by instruction:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] Instructions:
# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vp2intersectd %xmm16, %xmm19, %k0
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vp2intersectd (%rax), %xmm19, %k0
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vp2intersectd (%rax){1to4}, %xmm19, %k0
# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vp2intersectd %ymm16, %ymm19, %k0
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vp2intersectd (%rax), %ymm19, %k0
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vp2intersectd (%rax){1to8}, %ymm19, %k0
# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vp2intersectq %xmm16, %xmm19, %k0
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vp2intersectq (%rax), %xmm19, %k0
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vp2intersectq (%rax){1to2}, %xmm19, %k0
# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vp2intersectq %ymm16, %ymm19, %k0
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vp2intersectq (%rax), %ymm19, %k0
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vp2intersectq (%rax){1to4}, %ymm19, %k0
51 changes: 51 additions & 0 deletions llvm/test/tools/llvm-mca/X86/Znver4/resources-avx512vpclmulqdq.s
Original file line number Diff line number Diff line change
@@ -0,0 +1,51 @@
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver4 -instruction-tables < %s | FileCheck %s

# vpclmulqdq, 512-bit (EVEX registers zmm16+): one register-source and one
# memory-source form, both with the same immediate ($11).
vpclmulqdq $11, %zmm16, %zmm17, %zmm19
vpclmulqdq $11, (%rax), %zmm17, %zmm19

# CHECK: Instruction Info:
# CHECK-NEXT: [1]: #uOps
# CHECK-NEXT: [2]: Latency
# CHECK-NEXT: [3]: RThroughput
# CHECK-NEXT: [4]: MayLoad
# CHECK-NEXT: [5]: MayStore
# CHECK-NEXT: [6]: HasSideEffects (U)

# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
# CHECK-NEXT: 4 4 2.00 vpclmulqdq $11, %zmm16, %zmm17, %zmm19
# CHECK-NEXT: 4 11 2.00 * vpclmulqdq $11, (%rax), %zmm17, %zmm19

# CHECK: Resources:
# CHECK-NEXT: [0] - Zn4AGU0
# CHECK-NEXT: [1] - Zn4AGU1
# CHECK-NEXT: [2] - Zn4AGU2
# CHECK-NEXT: [3] - Zn4ALU0
# CHECK-NEXT: [4] - Zn4ALU1
# CHECK-NEXT: [5] - Zn4ALU2
# CHECK-NEXT: [6] - Zn4ALU3
# CHECK-NEXT: [7] - Zn4BRU1
# CHECK-NEXT: [8] - Zn4FP0
# CHECK-NEXT: [9] - Zn4FP1
# CHECK-NEXT: [10] - Zn4FP2
# CHECK-NEXT: [11] - Zn4FP3
# CHECK-NEXT: [12.0] - Zn4FP45
# CHECK-NEXT: [12.1] - Zn4FP45
# CHECK-NEXT: [13] - Zn4FPSt
# CHECK-NEXT: [14.0] - Zn4LSU
# CHECK-NEXT: [14.1] - Zn4LSU
# CHECK-NEXT: [14.2] - Zn4LSU
# CHECK-NEXT: [15.0] - Zn4Load
# CHECK-NEXT: [15.1] - Zn4Load
# CHECK-NEXT: [15.2] - Zn4Load
# CHECK-NEXT: [16.0] - Zn4Store
# CHECK-NEXT: [16.1] - Zn4Store

# CHECK: Resource pressure per iteration:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
# CHECK-NEXT: - - - - - - - - 4.00 4.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - -

# CHECK: Resource pressure by instruction:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpclmulqdq $11, %zmm16, %zmm17, %zmm19
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpclmulqdq $11, (%rax), %zmm17, %zmm19
58 changes: 58 additions & 0 deletions llvm/test/tools/llvm-mca/X86/Znver4/resources-avx512vpclmulqdqvl.s
Original file line number Diff line number Diff line change
@@ -0,0 +1,58 @@
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver4 -instruction-tables < %s | FileCheck %s

# vpclmulqdq, 128-bit using xmm16+ registers: register and memory source,
# both with the same immediate ($11).
vpclmulqdq $11, %xmm16, %xmm17, %xmm19
vpclmulqdq $11, (%rax), %xmm17, %xmm19

# vpclmulqdq, 256-bit using ymm16+ registers: register and memory source.
vpclmulqdq $11, %ymm16, %ymm17, %ymm19
vpclmulqdq $11, (%rax), %ymm17, %ymm19

# CHECK: Instruction Info:
# CHECK-NEXT: [1]: #uOps
# CHECK-NEXT: [2]: Latency
# CHECK-NEXT: [3]: RThroughput
# CHECK-NEXT: [4]: MayLoad
# CHECK-NEXT: [5]: MayStore
# CHECK-NEXT: [6]: HasSideEffects (U)

# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
# CHECK-NEXT: 4 4 2.00 vpclmulqdq $11, %xmm16, %xmm17, %xmm19
# CHECK-NEXT: 4 11 2.00 * vpclmulqdq $11, (%rax), %xmm17, %xmm19
# CHECK-NEXT: 4 4 2.00 vpclmulqdq $11, %ymm16, %ymm17, %ymm19
# CHECK-NEXT: 4 11 2.00 * vpclmulqdq $11, (%rax), %ymm17, %ymm19

# CHECK: Resources:
# CHECK-NEXT: [0] - Zn4AGU0
# CHECK-NEXT: [1] - Zn4AGU1
# CHECK-NEXT: [2] - Zn4AGU2
# CHECK-NEXT: [3] - Zn4ALU0
# CHECK-NEXT: [4] - Zn4ALU1
# CHECK-NEXT: [5] - Zn4ALU2
# CHECK-NEXT: [6] - Zn4ALU3
# CHECK-NEXT: [7] - Zn4BRU1
# CHECK-NEXT: [8] - Zn4FP0
# CHECK-NEXT: [9] - Zn4FP1
# CHECK-NEXT: [10] - Zn4FP2
# CHECK-NEXT: [11] - Zn4FP3
# CHECK-NEXT: [12.0] - Zn4FP45
# CHECK-NEXT: [12.1] - Zn4FP45
# CHECK-NEXT: [13] - Zn4FPSt
# CHECK-NEXT: [14.0] - Zn4LSU
# CHECK-NEXT: [14.1] - Zn4LSU
# CHECK-NEXT: [14.2] - Zn4LSU
# CHECK-NEXT: [15.0] - Zn4Load
# CHECK-NEXT: [15.1] - Zn4Load
# CHECK-NEXT: [15.2] - Zn4Load
# CHECK-NEXT: [16.0] - Zn4Store
# CHECK-NEXT: [16.1] - Zn4Store

# CHECK: Resource pressure per iteration:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
# CHECK-NEXT: - - - - - - - - 8.00 8.00 - - 1.00 1.00 - 0.67 0.67 0.67 0.67 0.67 0.67 - -

# CHECK: Resource pressure by instruction:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpclmulqdq $11, %xmm16, %xmm17, %xmm19
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpclmulqdq $11, (%rax), %xmm17, %xmm19
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpclmulqdq $11, %ymm16, %ymm17, %ymm19
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpclmulqdq $11, (%rax), %ymm17, %ymm19
104 changes: 104 additions & 0 deletions llvm/test/tools/llvm-mca/X86/Znver4/resources-avx512vpopcntdq.s
Original file line number Diff line number Diff line change
@@ -0,0 +1,104 @@
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver4 -instruction-tables < %s | FileCheck %s

# vpopcntd, 512-bit, unmasked: register, full-width memory and {1to16}
# broadcast memory source.
vpopcntd %zmm1, %zmm0
vpopcntd (%rdi), %zmm0
vpopcntd (%rdi){1to16}, %zmm0

# vpopcntd, 512-bit, write-masked by k1.
vpopcntd %zmm1, %zmm0 {%k1}
vpopcntd (%rdi), %zmm0 {%k1}
vpopcntd (%rdi){1to16}, %zmm0 {%k1}

# vpopcntd, 512-bit, write-masked by k1 with zeroing.
vpopcntd %zmm1, %zmm0 {%k1} {z}
vpopcntd (%rdi), %zmm0 {%k1} {z}
vpopcntd (%rdi){1to16}, %zmm0 {%k1} {z}

# vpopcntq, 512-bit, unmasked: register, full-width memory and {1to8}
# broadcast memory source.
vpopcntq %zmm1, %zmm0
vpopcntq (%rdi), %zmm0
vpopcntq (%rdi){1to8}, %zmm0

# vpopcntq, 512-bit, write-masked by k1.
vpopcntq %zmm1, %zmm0 {%k1}
vpopcntq (%rdi), %zmm0 {%k1}
vpopcntq (%rdi){1to8}, %zmm0 {%k1}

# vpopcntq, 512-bit, write-masked by k1 with zeroing.
vpopcntq %zmm1, %zmm0 {%k1} {z}
vpopcntq (%rdi), %zmm0 {%k1} {z}
vpopcntq (%rdi){1to8}, %zmm0 {%k1} {z}

# CHECK: Instruction Info:
# CHECK-NEXT: [1]: #uOps
# CHECK-NEXT: [2]: Latency
# CHECK-NEXT: [3]: RThroughput
# CHECK-NEXT: [4]: MayLoad
# CHECK-NEXT: [5]: MayStore
# CHECK-NEXT: [6]: HasSideEffects (U)

# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
# CHECK-NEXT: 1 1 0.50 vpopcntd %zmm1, %zmm0
# CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi), %zmm0
# CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi){1to16}, %zmm0
# CHECK-NEXT: 1 1 0.50 vpopcntd %zmm1, %zmm0 {%k1}
# CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi), %zmm0 {%k1}
# CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi){1to16}, %zmm0 {%k1}
# CHECK-NEXT: 1 1 0.50 vpopcntd %zmm1, %zmm0 {%k1} {z}
# CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi), %zmm0 {%k1} {z}
# CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi){1to16}, %zmm0 {%k1} {z}
# CHECK-NEXT: 1 1 0.50 vpopcntq %zmm1, %zmm0
# CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi), %zmm0
# CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi){1to8}, %zmm0
# CHECK-NEXT: 1 1 0.50 vpopcntq %zmm1, %zmm0 {%k1}
# CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi), %zmm0 {%k1}
# CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi){1to8}, %zmm0 {%k1}
# CHECK-NEXT: 1 1 0.50 vpopcntq %zmm1, %zmm0 {%k1} {z}
# CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi), %zmm0 {%k1} {z}
# CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi){1to8}, %zmm0 {%k1} {z}

# CHECK: Resources:
# CHECK-NEXT: [0] - Zn4AGU0
# CHECK-NEXT: [1] - Zn4AGU1
# CHECK-NEXT: [2] - Zn4AGU2
# CHECK-NEXT: [3] - Zn4ALU0
# CHECK-NEXT: [4] - Zn4ALU1
# CHECK-NEXT: [5] - Zn4ALU2
# CHECK-NEXT: [6] - Zn4ALU3
# CHECK-NEXT: [7] - Zn4BRU1
# CHECK-NEXT: [8] - Zn4FP0
# CHECK-NEXT: [9] - Zn4FP1
# CHECK-NEXT: [10] - Zn4FP2
# CHECK-NEXT: [11] - Zn4FP3
# CHECK-NEXT: [12.0] - Zn4FP45
# CHECK-NEXT: [12.1] - Zn4FP45
# CHECK-NEXT: [13] - Zn4FPSt
# CHECK-NEXT: [14.0] - Zn4LSU
# CHECK-NEXT: [14.1] - Zn4LSU
# CHECK-NEXT: [14.2] - Zn4LSU
# CHECK-NEXT: [15.0] - Zn4Load
# CHECK-NEXT: [15.1] - Zn4Load
# CHECK-NEXT: [15.2] - Zn4Load
# CHECK-NEXT: [16.0] - Zn4Store
# CHECK-NEXT: [16.1] - Zn4Store

# CHECK: Resource pressure per iteration:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
# CHECK-NEXT: - - - - - - - - 9.00 9.00 9.00 9.00 6.00 6.00 - 4.00 4.00 4.00 4.00 4.00 4.00 - -

# CHECK: Resource pressure by instruction:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - vpopcntd %zmm1, %zmm0
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi), %zmm0
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi){1to16}, %zmm0
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - vpopcntd %zmm1, %zmm0 {%k1}
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi), %zmm0 {%k1}
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi){1to16}, %zmm0 {%k1}
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - vpopcntd %zmm1, %zmm0 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi), %zmm0 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi){1to16}, %zmm0 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - vpopcntq %zmm1, %zmm0
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi), %zmm0
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi){1to8}, %zmm0
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - vpopcntq %zmm1, %zmm0 {%k1}
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi), %zmm0 {%k1}
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi){1to8}, %zmm0 {%k1}
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - vpopcntq %zmm1, %zmm0 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi), %zmm0 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi){1to8}, %zmm0 {%k1} {z}
164 changes: 164 additions & 0 deletions llvm/test/tools/llvm-mca/X86/Znver4/resources-avx512vpopcntdqvl.s
Original file line number Diff line number Diff line change
@@ -0,0 +1,164 @@
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver4 -instruction-tables < %s | FileCheck %s

# Input for the instruction tables: every vpopcntd/vpopcntq form on xmm and
# ymm destinations. Order matters; the expectation tables list the
# instructions in exactly this sequence.
#
# NOTE(review): the expectations further down give the xmm register forms
# latency 2 / rthroughput 1.00 while the ymm register forms get 1 / 0.25.
# That looks inconsistent; confirm against the Znver4 scheduling model.

# Doubleword counts, xmm, unmasked: register source, full-vector memory
# source, then {1to4} broadcast memory source.
vpopcntd %xmm1, %xmm0
vpopcntd (%rdi), %xmm0
vpopcntd (%rdi){1to4}, %xmm0

# Same three sources with the {%k1} write mask (merge-masking).
vpopcntd %xmm1, %xmm0 {%k1}
vpopcntd (%rdi), %xmm0 {%k1}
vpopcntd (%rdi){1to4}, %xmm0 {%k1}

# Same three sources with {%k1} {z} (zero-masking).
vpopcntd %xmm1, %xmm0 {%k1} {z}
vpopcntd (%rdi), %xmm0 {%k1} {z}
vpopcntd (%rdi){1to4}, %xmm0 {%k1} {z}

# Doubleword counts, ymm, unmasked; the broadcast form becomes {1to8}.
vpopcntd %ymm1, %ymm0
vpopcntd (%rdi), %ymm0
vpopcntd (%rdi){1to8}, %ymm0

# Doubleword counts, ymm, merge-masked.
vpopcntd %ymm1, %ymm0 {%k1}
vpopcntd (%rdi), %ymm0 {%k1}
vpopcntd (%rdi){1to8}, %ymm0 {%k1}

# Doubleword counts, ymm, zero-masked.
vpopcntd %ymm1, %ymm0 {%k1} {z}
vpopcntd (%rdi), %ymm0 {%k1} {z}
vpopcntd (%rdi){1to8}, %ymm0 {%k1} {z}

# Quadword counts, xmm, unmasked; the broadcast form is {1to2}.
vpopcntq %xmm1, %xmm0
vpopcntq (%rdi), %xmm0
vpopcntq (%rdi){1to2}, %xmm0

# Quadword counts, xmm, merge-masked.
vpopcntq %xmm1, %xmm0 {%k1}
vpopcntq (%rdi), %xmm0 {%k1}
vpopcntq (%rdi){1to2}, %xmm0 {%k1}

# Quadword counts, xmm, zero-masked.
vpopcntq %xmm1, %xmm0 {%k1} {z}
vpopcntq (%rdi), %xmm0 {%k1} {z}
vpopcntq (%rdi){1to2}, %xmm0 {%k1} {z}

# Quadword counts, ymm, unmasked; the broadcast form is {1to4}.
vpopcntq %ymm1, %ymm0
vpopcntq (%rdi), %ymm0
vpopcntq (%rdi){1to4}, %ymm0

# Quadword counts, ymm, merge-masked.
vpopcntq %ymm1, %ymm0 {%k1}
vpopcntq (%rdi), %ymm0 {%k1}
vpopcntq (%rdi){1to4}, %ymm0 {%k1}

# Quadword counts, ymm, zero-masked.
vpopcntq %ymm1, %ymm0 {%k1} {z}
vpopcntq (%rdi), %ymm0 {%k1} {z}
vpopcntq (%rdi){1to4}, %ymm0 {%k1} {z}

# CHECK: Instruction Info:
# CHECK-NEXT: [1]: #uOps
# CHECK-NEXT: [2]: Latency
# CHECK-NEXT: [3]: RThroughput
# CHECK-NEXT: [4]: MayLoad
# CHECK-NEXT: [5]: MayStore
# CHECK-NEXT: [6]: HasSideEffects (U)

# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
# CHECK-NEXT: 1 2 1.00 vpopcntd %xmm1, %xmm0
# CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi), %xmm0
# CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi){1to4}, %xmm0
# CHECK-NEXT: 1 2 1.00 vpopcntd %xmm1, %xmm0 {%k1}
# CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi), %xmm0 {%k1}
# CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi){1to4}, %xmm0 {%k1}
# CHECK-NEXT: 1 2 1.00 vpopcntd %xmm1, %xmm0 {%k1} {z}
# CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi), %xmm0 {%k1} {z}
# CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi){1to4}, %xmm0 {%k1} {z}
# CHECK-NEXT: 1 1 0.25 vpopcntd %ymm1, %ymm0
# CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi), %ymm0
# CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi){1to8}, %ymm0
# CHECK-NEXT: 1 1 0.25 vpopcntd %ymm1, %ymm0 {%k1}
# CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi), %ymm0 {%k1}
# CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi){1to8}, %ymm0 {%k1}
# CHECK-NEXT: 1 1 0.25 vpopcntd %ymm1, %ymm0 {%k1} {z}
# CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi), %ymm0 {%k1} {z}
# CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi){1to8}, %ymm0 {%k1} {z}
# CHECK-NEXT: 1 2 1.00 vpopcntq %xmm1, %xmm0
# CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi), %xmm0
# CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi){1to2}, %xmm0
# CHECK-NEXT: 1 2 1.00 vpopcntq %xmm1, %xmm0 {%k1}
# CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi), %xmm0 {%k1}
# CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi){1to2}, %xmm0 {%k1}
# CHECK-NEXT: 1 2 1.00 vpopcntq %xmm1, %xmm0 {%k1} {z}
# CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi), %xmm0 {%k1} {z}
# CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi){1to2}, %xmm0 {%k1} {z}
# CHECK-NEXT: 1 1 0.25 vpopcntq %ymm1, %ymm0
# CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi), %ymm0
# CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi){1to4}, %ymm0
# CHECK-NEXT: 1 1 0.25 vpopcntq %ymm1, %ymm0 {%k1}
# CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi), %ymm0 {%k1}
# CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi){1to4}, %ymm0 {%k1}
# CHECK-NEXT: 1 1 0.25 vpopcntq %ymm1, %ymm0 {%k1} {z}
# CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi), %ymm0 {%k1} {z}
# CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi){1to4}, %ymm0 {%k1} {z}

# CHECK: Resources:
# CHECK-NEXT: [0] - Zn4AGU0
# CHECK-NEXT: [1] - Zn4AGU1
# CHECK-NEXT: [2] - Zn4AGU2
# CHECK-NEXT: [3] - Zn4ALU0
# CHECK-NEXT: [4] - Zn4ALU1
# CHECK-NEXT: [5] - Zn4ALU2
# CHECK-NEXT: [6] - Zn4ALU3
# CHECK-NEXT: [7] - Zn4BRU1
# CHECK-NEXT: [8] - Zn4FP0
# CHECK-NEXT: [9] - Zn4FP1
# CHECK-NEXT: [10] - Zn4FP2
# CHECK-NEXT: [11] - Zn4FP3
# CHECK-NEXT: [12.0] - Zn4FP45
# CHECK-NEXT: [12.1] - Zn4FP45
# CHECK-NEXT: [13] - Zn4FPSt
# CHECK-NEXT: [14.0] - Zn4LSU
# CHECK-NEXT: [14.1] - Zn4LSU
# CHECK-NEXT: [14.2] - Zn4LSU
# CHECK-NEXT: [15.0] - Zn4Load
# CHECK-NEXT: [15.1] - Zn4Load
# CHECK-NEXT: [15.2] - Zn4Load
# CHECK-NEXT: [16.0] - Zn4Store
# CHECK-NEXT: [16.1] - Zn4Store

# CHECK: Resource pressure per iteration:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
# CHECK-NEXT: - - - - - - - - 13.50 13.50 7.50 7.50 12.00 12.00 - 8.00 8.00 8.00 8.00 8.00 8.00 - -

# CHECK: Resource pressure by instruction:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vpopcntd %xmm1, %xmm0
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi), %xmm0
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi){1to4}, %xmm0
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vpopcntd %xmm1, %xmm0 {%k1}
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi), %xmm0 {%k1}
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi){1to4}, %xmm0 {%k1}
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vpopcntd %xmm1, %xmm0 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi), %xmm0 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi){1to4}, %xmm0 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - vpopcntd %ymm1, %ymm0
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi), %ymm0
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi){1to8}, %ymm0
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - vpopcntd %ymm1, %ymm0 {%k1}
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi), %ymm0 {%k1}
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi){1to8}, %ymm0 {%k1}
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - vpopcntd %ymm1, %ymm0 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi), %ymm0 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi){1to8}, %ymm0 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vpopcntq %xmm1, %xmm0
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi), %xmm0
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi){1to2}, %xmm0
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vpopcntq %xmm1, %xmm0 {%k1}
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi), %xmm0 {%k1}
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi){1to2}, %xmm0 {%k1}
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vpopcntq %xmm1, %xmm0 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi), %xmm0 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi){1to2}, %xmm0 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - vpopcntq %ymm1, %ymm0
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi), %ymm0
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi){1to4}, %ymm0
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - vpopcntq %ymm1, %ymm0 {%k1}
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi), %ymm0 {%k1}
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi){1to4}, %ymm0 {%k1}
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - vpopcntq %ymm1, %ymm0 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi), %ymm0 {%k1} {z}
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi){1to4}, %ymm0 {%k1} {z}
86 changes: 86 additions & 0 deletions llvm/test/tools/llvm-mca/X86/Znver4/resources-avxgfni.s
Original file line number Diff line number Diff line change
@@ -0,0 +1,86 @@
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver4 -instruction-tables < %s | FileCheck %s

# Input for the instruction tables: the three GFNI operations on xmm and ymm
# operands. Each pair is the register-source form followed by the
# memory-source form; the expectation tables follow this exact order.

# Affine transform of the inverse, immediate $0, xmm operands.
vgf2p8affineinvqb $0, %xmm0, %xmm1, %xmm2
vgf2p8affineinvqb $0, (%rax), %xmm1, %xmm2

# Affine transform of the inverse, immediate $0, ymm operands.
vgf2p8affineinvqb $0, %ymm0, %ymm1, %ymm2
vgf2p8affineinvqb $0, (%rax), %ymm1, %ymm2

# Affine transform, immediate $0, xmm operands.
vgf2p8affineqb $0, %xmm0, %xmm1, %xmm2
vgf2p8affineqb $0, (%rax), %xmm1, %xmm2

# Affine transform, immediate $0, ymm operands.
vgf2p8affineqb $0, %ymm0, %ymm1, %ymm2
vgf2p8affineqb $0, (%rax), %ymm1, %ymm2

# Galois-field byte multiply, xmm operands.
vgf2p8mulb %xmm0, %xmm1, %xmm2
vgf2p8mulb (%rax), %xmm1, %xmm2

# Galois-field byte multiply, ymm operands.
vgf2p8mulb %ymm0, %ymm1, %ymm2
vgf2p8mulb (%rax), %ymm1, %ymm2

# CHECK: Instruction Info:
# CHECK-NEXT: [1]: #uOps
# CHECK-NEXT: [2]: Latency
# CHECK-NEXT: [3]: RThroughput
# CHECK-NEXT: [4]: MayLoad
# CHECK-NEXT: [5]: MayStore
# CHECK-NEXT: [6]: HasSideEffects (U)

# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
# CHECK-NEXT: 1 3 0.50 vgf2p8affineinvqb $0, %xmm0, %xmm1, %xmm2
# CHECK-NEXT: 1 10 0.50 * vgf2p8affineinvqb $0, (%rax), %xmm1, %xmm2
# CHECK-NEXT: 1 3 0.50 vgf2p8affineinvqb $0, %ymm0, %ymm1, %ymm2
# CHECK-NEXT: 1 10 0.50 * vgf2p8affineinvqb $0, (%rax), %ymm1, %ymm2
# CHECK-NEXT: 1 3 0.50 vgf2p8affineqb $0, %xmm0, %xmm1, %xmm2
# CHECK-NEXT: 1 10 0.50 * vgf2p8affineqb $0, (%rax), %xmm1, %xmm2
# CHECK-NEXT: 1 3 0.50 vgf2p8affineqb $0, %ymm0, %ymm1, %ymm2
# CHECK-NEXT: 1 10 0.50 * vgf2p8affineqb $0, (%rax), %ymm1, %ymm2
# CHECK-NEXT: 1 1 0.25 vgf2p8mulb %xmm0, %xmm1, %xmm2
# CHECK-NEXT: 1 8 0.50 * vgf2p8mulb (%rax), %xmm1, %xmm2
# CHECK-NEXT: 1 1 0.25 vgf2p8mulb %ymm0, %ymm1, %ymm2
# CHECK-NEXT: 1 8 0.50 * vgf2p8mulb (%rax), %ymm1, %ymm2

# CHECK: Resources:
# CHECK-NEXT: [0] - Zn4AGU0
# CHECK-NEXT: [1] - Zn4AGU1
# CHECK-NEXT: [2] - Zn4AGU2
# CHECK-NEXT: [3] - Zn4ALU0
# CHECK-NEXT: [4] - Zn4ALU1
# CHECK-NEXT: [5] - Zn4ALU2
# CHECK-NEXT: [6] - Zn4ALU3
# CHECK-NEXT: [7] - Zn4BRU1
# CHECK-NEXT: [8] - Zn4FP0
# CHECK-NEXT: [9] - Zn4FP1
# CHECK-NEXT: [10] - Zn4FP2
# CHECK-NEXT: [11] - Zn4FP3
# CHECK-NEXT: [12.0] - Zn4FP45
# CHECK-NEXT: [12.1] - Zn4FP45
# CHECK-NEXT: [13] - Zn4FPSt
# CHECK-NEXT: [14.0] - Zn4LSU
# CHECK-NEXT: [14.1] - Zn4LSU
# CHECK-NEXT: [14.2] - Zn4LSU
# CHECK-NEXT: [15.0] - Zn4Load
# CHECK-NEXT: [15.1] - Zn4Load
# CHECK-NEXT: [15.2] - Zn4Load
# CHECK-NEXT: [16.0] - Zn4Store
# CHECK-NEXT: [16.1] - Zn4Store

# CHECK: Resource pressure per iteration:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
# CHECK-NEXT: - - - - - - - - 5.00 1.00 1.00 5.00 3.00 3.00 - 2.00 2.00 2.00 2.00 2.00 2.00 - -

# CHECK: Resource pressure by instruction:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - vgf2p8affineinvqb $0, %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vgf2p8affineinvqb $0, (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - vgf2p8affineinvqb $0, %ymm0, %ymm1, %ymm2
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vgf2p8affineinvqb $0, (%rax), %ymm1, %ymm2
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - vgf2p8affineqb $0, %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vgf2p8affineqb $0, (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - vgf2p8affineqb $0, %ymm0, %ymm1, %ymm2
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vgf2p8affineqb $0, (%rax), %ymm1, %ymm2
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - vgf2p8mulb %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vgf2p8mulb (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - vgf2p8mulb %ymm0, %ymm1, %ymm2
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vgf2p8mulb (%rax), %ymm1, %ymm2
100 changes: 100 additions & 0 deletions llvm/test/tools/llvm-mca/X86/Znver4/resources-avxvnni.s
Original file line number Diff line number Diff line change
@@ -0,0 +1,100 @@
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver4 -instruction-tables < %s | FileCheck %s

# Input for the instruction tables: the four VNNI dot-product instructions on
# xmm and ymm operands. Each pair is the register-source form followed by the
# memory-source form; the expectation tables follow this exact order.
#
# NOTE(review): none of these carry an explicit {vex} prefix, so the assembler
# may be selecting the EVEX (AVX512-VNNI) encodings rather than the AVX-VNNI
# ones this file is named after. Confirm which opcodes are matched.
# NOTE(review): the expectations give every register form rthroughput 2.00 on
# FP0/FP1 but every memory form 0.50 on FP0/FP3. Presumably the two variants
# map to different scheduling classes; verify against the Znver4 model.

# Unsigned-by-signed byte dot product, xmm.
vpdpbusd %xmm0, %xmm1, %xmm2
vpdpbusd (%rax), %xmm1, %xmm2

# Unsigned-by-signed byte dot product, ymm.
vpdpbusd %ymm0, %ymm1, %ymm2
vpdpbusd (%rax), %ymm1, %ymm2

# Saturating variant of the byte dot product, xmm.
vpdpbusds %xmm0, %xmm1, %xmm2
vpdpbusds (%rax), %xmm1, %xmm2

# Saturating variant of the byte dot product, ymm.
vpdpbusds %ymm0, %ymm1, %ymm2
vpdpbusds (%rax), %ymm1, %ymm2

# Signed word dot product, xmm.
vpdpwssd %xmm0, %xmm1, %xmm2
vpdpwssd (%rax), %xmm1, %xmm2

# Signed word dot product, ymm.
vpdpwssd %ymm0, %ymm1, %ymm2
vpdpwssd (%rax), %ymm1, %ymm2

# Saturating variant of the word dot product, xmm.
vpdpwssds %xmm0, %xmm1, %xmm2
vpdpwssds (%rax), %xmm1, %xmm2

# Saturating variant of the word dot product, ymm.
vpdpwssds %ymm0, %ymm1, %ymm2
vpdpwssds (%rax), %ymm1, %ymm2

# CHECK: Instruction Info:
# CHECK-NEXT: [1]: #uOps
# CHECK-NEXT: [2]: Latency
# CHECK-NEXT: [3]: RThroughput
# CHECK-NEXT: [4]: MayLoad
# CHECK-NEXT: [5]: MayStore
# CHECK-NEXT: [6]: HasSideEffects (U)

# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
# CHECK-NEXT: 1 4 2.00 vpdpbusd %xmm0, %xmm1, %xmm2
# CHECK-NEXT: 1 10 0.50 * vpdpbusd (%rax), %xmm1, %xmm2
# CHECK-NEXT: 1 4 2.00 vpdpbusd %ymm0, %ymm1, %ymm2
# CHECK-NEXT: 1 10 0.50 * vpdpbusd (%rax), %ymm1, %ymm2
# CHECK-NEXT: 1 4 2.00 vpdpbusds %xmm0, %xmm1, %xmm2
# CHECK-NEXT: 1 10 0.50 * vpdpbusds (%rax), %xmm1, %xmm2
# CHECK-NEXT: 1 4 2.00 vpdpbusds %ymm0, %ymm1, %ymm2
# CHECK-NEXT: 1 10 0.50 * vpdpbusds (%rax), %ymm1, %ymm2
# CHECK-NEXT: 1 4 2.00 vpdpwssd %xmm0, %xmm1, %xmm2
# CHECK-NEXT: 1 10 0.50 * vpdpwssd (%rax), %xmm1, %xmm2
# CHECK-NEXT: 1 4 2.00 vpdpwssd %ymm0, %ymm1, %ymm2
# CHECK-NEXT: 1 10 0.50 * vpdpwssd (%rax), %ymm1, %ymm2
# CHECK-NEXT: 1 4 2.00 vpdpwssds %xmm0, %xmm1, %xmm2
# CHECK-NEXT: 1 10 0.50 * vpdpwssds (%rax), %xmm1, %xmm2
# CHECK-NEXT: 1 4 2.00 vpdpwssds %ymm0, %ymm1, %ymm2
# CHECK-NEXT: 1 10 0.50 * vpdpwssds (%rax), %ymm1, %ymm2

# CHECK: Resources:
# CHECK-NEXT: [0] - Zn4AGU0
# CHECK-NEXT: [1] - Zn4AGU1
# CHECK-NEXT: [2] - Zn4AGU2
# CHECK-NEXT: [3] - Zn4ALU0
# CHECK-NEXT: [4] - Zn4ALU1
# CHECK-NEXT: [5] - Zn4ALU2
# CHECK-NEXT: [6] - Zn4ALU3
# CHECK-NEXT: [7] - Zn4BRU1
# CHECK-NEXT: [8] - Zn4FP0
# CHECK-NEXT: [9] - Zn4FP1
# CHECK-NEXT: [10] - Zn4FP2
# CHECK-NEXT: [11] - Zn4FP3
# CHECK-NEXT: [12.0] - Zn4FP45
# CHECK-NEXT: [12.1] - Zn4FP45
# CHECK-NEXT: [13] - Zn4FPSt
# CHECK-NEXT: [14.0] - Zn4LSU
# CHECK-NEXT: [14.1] - Zn4LSU
# CHECK-NEXT: [14.2] - Zn4LSU
# CHECK-NEXT: [15.0] - Zn4Load
# CHECK-NEXT: [15.1] - Zn4Load
# CHECK-NEXT: [15.2] - Zn4Load
# CHECK-NEXT: [16.0] - Zn4Store
# CHECK-NEXT: [16.1] - Zn4Store

# CHECK: Resource pressure per iteration:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
# CHECK-NEXT: - - - - - - - - 20.00 16.00 - 4.00 4.00 4.00 - 2.67 2.67 2.67 2.67 2.67 2.67 - -

# CHECK: Resource pressure by instruction:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpbusd %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusd (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpbusd %ymm0, %ymm1, %ymm2
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusd (%rax), %ymm1, %ymm2
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpbusds %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusds (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpbusds %ymm0, %ymm1, %ymm2
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusds (%rax), %ymm1, %ymm2
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpwssd %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssd (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpwssd %ymm0, %ymm1, %ymm2
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssd (%rax), %ymm1, %ymm2
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpwssds %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssds (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpwssds %ymm0, %ymm1, %ymm2
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssds (%rax), %ymm1, %ymm2
135 changes: 135 additions & 0 deletions llvm/test/tools/llvm-mca/X86/Znver4/resources-bmi1.s
Original file line number Diff line number Diff line change
@@ -0,0 +1,135 @@
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver4 -instruction-tables < %s | FileCheck %s

# Input for the instruction tables: every BMI1 instruction, written without a
# size suffix (the expectations print the resolved l/q/w mnemonics). Each pair
# is the all-register form followed by the form with a memory operand; the
# expectation tables follow this exact order.
#
# NOTE(review): the expectations charge the tzcnt 16-bit register form 1.00 on
# each of the four ALUs (rthroughput 1.00), while its memory form and the
# 32/64-bit forms use 0.50 on ALU1/ALU2 only. Looks inconsistent; confirm
# against the Znver4 scheduling model.

# andn, 32-bit operands.
andn %eax, %ebx, %ecx
andn (%rax), %ebx, %ecx

# andn, 64-bit operands.
andn %rax, %rbx, %rcx
andn (%rax), %rbx, %rcx

# bextr, 32-bit operands; the memory operand sits in the middle position.
bextr %eax, %ebx, %ecx
bextr %eax, (%rbx), %ecx

# bextr, 64-bit operands.
bextr %rax, %rbx, %rcx
bextr %rax, (%rbx), %rcx

# blsi, 32-bit operands.
blsi %eax, %ecx
blsi (%rax), %ecx

# blsi, 64-bit operands.
blsi %rax, %rcx
blsi (%rax), %rcx

# blsmsk, 32-bit operands.
blsmsk %eax, %ecx
blsmsk (%rax), %ecx

# blsmsk, 64-bit operands.
blsmsk %rax, %rcx
blsmsk (%rax), %rcx

# blsr, 32-bit operands.
blsr %eax, %ecx
blsr (%rax), %ecx

# blsr, 64-bit operands.
blsr %rax, %rcx
blsr (%rax), %rcx

# tzcnt, 16-bit operands.
tzcnt %ax, %cx
tzcnt (%rax), %cx

# tzcnt, 32-bit operands.
tzcnt %eax, %ecx
tzcnt (%rax), %ecx

# tzcnt, 64-bit operands.
tzcnt %rax, %rcx
tzcnt (%rax), %rcx

# CHECK: Instruction Info:
# CHECK-NEXT: [1]: #uOps
# CHECK-NEXT: [2]: Latency
# CHECK-NEXT: [3]: RThroughput
# CHECK-NEXT: [4]: MayLoad
# CHECK-NEXT: [5]: MayStore
# CHECK-NEXT: [6]: HasSideEffects (U)

# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
# CHECK-NEXT: 1 1 0.25 andnl %eax, %ebx, %ecx
# CHECK-NEXT: 1 5 0.33 * andnl (%rax), %ebx, %ecx
# CHECK-NEXT: 1 1 0.25 andnq %rax, %rbx, %rcx
# CHECK-NEXT: 1 5 0.33 * andnq (%rax), %rbx, %rcx
# CHECK-NEXT: 1 1 0.50 bextrl %eax, %ebx, %ecx
# CHECK-NEXT: 2 5 0.50 * bextrl %eax, (%rbx), %ecx
# CHECK-NEXT: 1 1 0.50 bextrq %rax, %rbx, %rcx
# CHECK-NEXT: 2 5 0.50 * bextrq %rax, (%rbx), %rcx
# CHECK-NEXT: 1 1 0.25 blsil %eax, %ecx
# CHECK-NEXT: 2 5 0.33 * blsil (%rax), %ecx
# CHECK-NEXT: 1 1 0.25 blsiq %rax, %rcx
# CHECK-NEXT: 2 5 0.33 * blsiq (%rax), %rcx
# CHECK-NEXT: 1 1 0.25 blsmskl %eax, %ecx
# CHECK-NEXT: 2 5 0.33 * blsmskl (%rax), %ecx
# CHECK-NEXT: 1 1 0.25 blsmskq %rax, %rcx
# CHECK-NEXT: 2 5 0.33 * blsmskq (%rax), %rcx
# CHECK-NEXT: 1 1 0.25 blsrl %eax, %ecx
# CHECK-NEXT: 2 5 0.33 * blsrl (%rax), %ecx
# CHECK-NEXT: 1 1 0.25 blsrq %rax, %rcx
# CHECK-NEXT: 2 5 0.33 * blsrq (%rax), %rcx
# CHECK-NEXT: 2 2 1.00 tzcntw %ax, %cx
# CHECK-NEXT: 2 6 0.50 * tzcntw (%rax), %cx
# CHECK-NEXT: 2 2 0.50 tzcntl %eax, %ecx
# CHECK-NEXT: 2 6 0.50 * tzcntl (%rax), %ecx
# CHECK-NEXT: 2 2 0.50 tzcntq %rax, %rcx
# CHECK-NEXT: 2 6 0.50 * tzcntq (%rax), %rcx

# CHECK: Resources:
# CHECK-NEXT: [0] - Zn4AGU0
# CHECK-NEXT: [1] - Zn4AGU1
# CHECK-NEXT: [2] - Zn4AGU2
# CHECK-NEXT: [3] - Zn4ALU0
# CHECK-NEXT: [4] - Zn4ALU1
# CHECK-NEXT: [5] - Zn4ALU2
# CHECK-NEXT: [6] - Zn4ALU3
# CHECK-NEXT: [7] - Zn4BRU1
# CHECK-NEXT: [8] - Zn4FP0
# CHECK-NEXT: [9] - Zn4FP1
# CHECK-NEXT: [10] - Zn4FP2
# CHECK-NEXT: [11] - Zn4FP3
# CHECK-NEXT: [12.0] - Zn4FP45
# CHECK-NEXT: [12.1] - Zn4FP45
# CHECK-NEXT: [13] - Zn4FPSt
# CHECK-NEXT: [14.0] - Zn4LSU
# CHECK-NEXT: [14.1] - Zn4LSU
# CHECK-NEXT: [14.2] - Zn4LSU
# CHECK-NEXT: [15.0] - Zn4Load
# CHECK-NEXT: [15.1] - Zn4Load
# CHECK-NEXT: [15.2] - Zn4Load
# CHECK-NEXT: [16.0] - Zn4Store
# CHECK-NEXT: [16.1] - Zn4Store

# CHECK: Resource pressure per iteration:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
# CHECK-NEXT: 4.33 4.33 4.33 5.00 9.50 9.50 5.00 - - - - - - - - 4.33 4.33 4.33 4.33 4.33 4.33 - -

# CHECK: Resource pressure by instruction:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - andnl %eax, %ebx, %ecx
# CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - andnl (%rax), %ebx, %ecx
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - andnq %rax, %rbx, %rcx
# CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - andnq (%rax), %rbx, %rcx
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - bextrl %eax, %ebx, %ecx
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - bextrl %eax, (%rbx), %ecx
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - bextrq %rax, %rbx, %rcx
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - bextrq %rax, (%rbx), %rcx
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - blsil %eax, %ecx
# CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - blsil (%rax), %ecx
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - blsiq %rax, %rcx
# CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - blsiq (%rax), %rcx
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - blsmskl %eax, %ecx
# CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - blsmskl (%rax), %ecx
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - blsmskq %rax, %rcx
# CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - blsmskq (%rax), %rcx
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - blsrl %eax, %ecx
# CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - blsrl (%rax), %ecx
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - blsrq %rax, %rcx
# CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - blsrq (%rax), %rcx
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - tzcntw %ax, %cx
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - tzcntw (%rax), %cx
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - tzcntl %eax, %ecx
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - tzcntl (%rax), %ecx
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - tzcntq %rax, %rcx
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - tzcntq (%rax), %rcx
156 changes: 156 additions & 0 deletions llvm/test/tools/llvm-mca/X86/Znver4/resources-bmi2.s
Original file line number Diff line number Diff line change
@@ -0,0 +1,156 @@
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver4 -instruction-tables < %s | FileCheck %s

# Input for the instruction tables: every BMI2 instruction, written without a
# size suffix (the expectations print the resolved l/q mnemonics). Each pair
# is the all-register form followed by the form with a memory operand; the
# expectation tables follow this exact order.
#
# NOTE(review): the expectations give the pdep/pext register forms latency 3,
# rthroughput 1.00 on ALU1 only, while their memory forms are a single uop at
# rthroughput 0.33 spread over all four ALUs. A memory form cheaper than its
# register form looks wrong; confirm against the Znver4 scheduling model.

# bzhi, 32-bit operands; the memory operand sits in the middle position.
bzhi %eax, %ebx, %ecx
bzhi %eax, (%rbx), %ecx

# bzhi, 64-bit operands.
bzhi %rax, %rbx, %rcx
bzhi %rax, (%rbx), %rcx

# mulx, 32-bit operands.
mulx %eax, %ebx, %ecx
mulx (%rax), %ebx, %ecx

# mulx, 64-bit operands.
mulx %rax, %rbx, %rcx
mulx (%rax), %rbx, %rcx

# pdep, 32-bit operands.
pdep %eax, %ebx, %ecx
pdep (%rax), %ebx, %ecx

# pdep, 64-bit operands.
pdep %rax, %rbx, %rcx
pdep (%rax), %rbx, %rcx

# pext, 32-bit operands.
pext %eax, %ebx, %ecx
pext (%rax), %ebx, %ecx

# pext, 64-bit operands.
pext %rax, %rbx, %rcx
pext (%rax), %rbx, %rcx

# rorx with an immediate rotate count of 1, 32-bit operands.
rorx $1, %eax, %ecx
rorx $1, (%rax), %ecx

# rorx with an immediate rotate count of 1, 64-bit operands.
rorx $1, %rax, %rcx
rorx $1, (%rax), %rcx

# sarx, 32-bit operands; the memory operand sits in the middle position.
sarx %eax, %ebx, %ecx
sarx %eax, (%rbx), %ecx

# sarx, 64-bit operands.
sarx %rax, %rbx, %rcx
sarx %rax, (%rbx), %rcx

# shlx, 32-bit operands.
shlx %eax, %ebx, %ecx
shlx %eax, (%rbx), %ecx

# shlx, 64-bit operands.
shlx %rax, %rbx, %rcx
shlx %rax, (%rbx), %rcx

# shrx, 32-bit operands.
shrx %eax, %ebx, %ecx
shrx %eax, (%rbx), %ecx

# shrx, 64-bit operands.
shrx %rax, %rbx, %rcx
shrx %rax, (%rbx), %rcx

# CHECK: Instruction Info:
# CHECK-NEXT: [1]: #uOps
# CHECK-NEXT: [2]: Latency
# CHECK-NEXT: [3]: RThroughput
# CHECK-NEXT: [4]: MayLoad
# CHECK-NEXT: [5]: MayStore
# CHECK-NEXT: [6]: HasSideEffects (U)

# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
# CHECK-NEXT: 1 1 0.50 bzhil %eax, %ebx, %ecx
# CHECK-NEXT: 2 5 0.50 * bzhil %eax, (%rbx), %ecx
# CHECK-NEXT: 1 1 0.50 bzhiq %rax, %rbx, %rcx
# CHECK-NEXT: 2 5 0.50 * bzhiq %rax, (%rbx), %rcx
# CHECK-NEXT: 2 4 1.00 mulxl %eax, %ebx, %ecx
# CHECK-NEXT: 2 8 1.00 * mulxl (%rax), %ebx, %ecx
# CHECK-NEXT: 2 4 1.00 mulxq %rax, %rbx, %rcx
# CHECK-NEXT: 2 8 1.00 * mulxq (%rax), %rbx, %rcx
# CHECK-NEXT: 1 3 1.00 pdepl %eax, %ebx, %ecx
# CHECK-NEXT: 1 5 0.33 * pdepl (%rax), %ebx, %ecx
# CHECK-NEXT: 1 3 1.00 pdepq %rax, %rbx, %rcx
# CHECK-NEXT: 1 5 0.33 * pdepq (%rax), %rbx, %rcx
# CHECK-NEXT: 1 3 1.00 pextl %eax, %ebx, %ecx
# CHECK-NEXT: 1 5 0.33 * pextl (%rax), %ebx, %ecx
# CHECK-NEXT: 1 3 1.00 pextq %rax, %rbx, %rcx
# CHECK-NEXT: 1 5 0.33 * pextq (%rax), %rbx, %rcx
# CHECK-NEXT: 1 1 0.50 rorxl $1, %eax, %ecx
# CHECK-NEXT: 2 5 0.50 * rorxl $1, (%rax), %ecx
# CHECK-NEXT: 1 1 0.50 rorxq $1, %rax, %rcx
# CHECK-NEXT: 2 5 0.50 * rorxq $1, (%rax), %rcx
# CHECK-NEXT: 1 1 0.50 sarxl %eax, %ebx, %ecx
# CHECK-NEXT: 2 5 0.50 * sarxl %eax, (%rbx), %ecx
# CHECK-NEXT: 1 1 0.50 sarxq %rax, %rbx, %rcx
# CHECK-NEXT: 2 5 0.50 * sarxq %rax, (%rbx), %rcx
# CHECK-NEXT: 1 1 0.50 shlxl %eax, %ebx, %ecx
# CHECK-NEXT: 2 5 0.50 * shlxl %eax, (%rbx), %ecx
# CHECK-NEXT: 1 1 0.50 shlxq %rax, %rbx, %rcx
# CHECK-NEXT: 2 5 0.50 * shlxq %rax, (%rbx), %rcx
# CHECK-NEXT: 1 1 0.50 shrxl %eax, %ebx, %ecx
# CHECK-NEXT: 2 5 0.50 * shrxl %eax, (%rbx), %ecx
# CHECK-NEXT: 1 1 0.50 shrxq %rax, %rbx, %rcx
# CHECK-NEXT: 2 5 0.50 * shrxq %rax, (%rbx), %rcx

# CHECK: Resources:
# CHECK-NEXT: [0] - Zn4AGU0
# CHECK-NEXT: [1] - Zn4AGU1
# CHECK-NEXT: [2] - Zn4AGU2
# CHECK-NEXT: [3] - Zn4ALU0
# CHECK-NEXT: [4] - Zn4ALU1
# CHECK-NEXT: [5] - Zn4ALU2
# CHECK-NEXT: [6] - Zn4ALU3
# CHECK-NEXT: [7] - Zn4BRU1
# CHECK-NEXT: [8] - Zn4FP0
# CHECK-NEXT: [9] - Zn4FP1
# CHECK-NEXT: [10] - Zn4FP2
# CHECK-NEXT: [11] - Zn4FP3
# CHECK-NEXT: [12.0] - Zn4FP45
# CHECK-NEXT: [12.1] - Zn4FP45
# CHECK-NEXT: [13] - Zn4FPSt
# CHECK-NEXT: [14.0] - Zn4LSU
# CHECK-NEXT: [14.1] - Zn4LSU
# CHECK-NEXT: [14.2] - Zn4LSU
# CHECK-NEXT: [15.0] - Zn4Load
# CHECK-NEXT: [15.1] - Zn4Load
# CHECK-NEXT: [15.2] - Zn4Load
# CHECK-NEXT: [16.0] - Zn4Store
# CHECK-NEXT: [16.1] - Zn4Store

# CHECK: Resource pressure per iteration:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
# CHECK-NEXT: 5.33 5.33 5.33 1.00 19.00 11.00 1.00 - - - - - - - - 5.33 5.33 5.33 5.33 5.33 5.33 - -

# CHECK: Resource pressure by instruction:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - bzhil %eax, %ebx, %ecx
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - bzhil %eax, (%rbx), %ecx
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - bzhiq %rax, %rbx, %rcx
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - bzhiq %rax, (%rbx), %rcx
# CHECK-NEXT: - - - - 1.00 - - - - - - - - - - - - - - - - - - mulxl %eax, %ebx, %ecx
# CHECK-NEXT: 0.33 0.33 0.33 - 1.00 - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - mulxl (%rax), %ebx, %ecx
# CHECK-NEXT: - - - - 1.00 - - - - - - - - - - - - - - - - - - mulxq %rax, %rbx, %rcx
# CHECK-NEXT: 0.33 0.33 0.33 - 1.00 - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - mulxq (%rax), %rbx, %rcx
# CHECK-NEXT: - - - - 1.00 - - - - - - - - - - - - - - - - - - pdepl %eax, %ebx, %ecx
# CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - pdepl (%rax), %ebx, %ecx
# CHECK-NEXT: - - - - 1.00 - - - - - - - - - - - - - - - - - - pdepq %rax, %rbx, %rcx
# CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - pdepq (%rax), %rbx, %rcx
# CHECK-NEXT: - - - - 1.00 - - - - - - - - - - - - - - - - - - pextl %eax, %ebx, %ecx
# CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - pextl (%rax), %ebx, %ecx
# CHECK-NEXT: - - - - 1.00 - - - - - - - - - - - - - - - - - - pextq %rax, %rbx, %rcx
# CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - pextq (%rax), %rbx, %rcx
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - rorxl $1, %eax, %ecx
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - rorxl $1, (%rax), %ecx
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - rorxq $1, %rax, %rcx
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - rorxq $1, (%rax), %rcx
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - sarxl %eax, %ebx, %ecx
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - sarxl %eax, (%rbx), %ecx
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - sarxq %rax, %rbx, %rcx
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - sarxq %rax, (%rbx), %rcx
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - shlxl %eax, %ebx, %ecx
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - shlxl %eax, (%rbx), %ecx
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - shlxq %rax, %rbx, %rcx
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - shlxq %rax, (%rbx), %rcx
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - shrxl %eax, %ebx, %ecx
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - shrxl %eax, (%rbx), %ecx
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - shrxq %rax, %rbx, %rcx
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - shrxq %rax, (%rbx), %rcx
48 changes: 48 additions & 0 deletions llvm/test/tools/llvm-mca/X86/Znver4/resources-clflushopt.s
Original file line number Diff line number Diff line change
@@ -0,0 +1,48 @@
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver4 -instruction-tables < %s | FileCheck %s

# Instruction-table coverage for CLFLUSHOPT under the znver4 CPU model.
# The single memory-operand form below is the only input given to llvm-mca.
# The assertions that follow pin what the tool reports for it: uOps, latency,
# reciprocal throughput, the MayLoad/MayStore/HasSideEffects flags, and the
# per-resource pressure (spread evenly over the three AGU, LSU and Load slots).
# Those assertions are generated output (see the NOTE at the top of this file);
# presumably they should be regenerated with the script named there rather
# than edited by hand.
clflushopt (%rax)

# CHECK: Instruction Info:
# CHECK-NEXT: [1]: #uOps
# CHECK-NEXT: [2]: Latency
# CHECK-NEXT: [3]: RThroughput
# CHECK-NEXT: [4]: MayLoad
# CHECK-NEXT: [5]: MayStore
# CHECK-NEXT: [6]: HasSideEffects (U)

# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
# CHECK-NEXT: 1 5 0.33 * * U clflushopt (%rax)

# CHECK: Resources:
# CHECK-NEXT: [0] - Zn4AGU0
# CHECK-NEXT: [1] - Zn4AGU1
# CHECK-NEXT: [2] - Zn4AGU2
# CHECK-NEXT: [3] - Zn4ALU0
# CHECK-NEXT: [4] - Zn4ALU1
# CHECK-NEXT: [5] - Zn4ALU2
# CHECK-NEXT: [6] - Zn4ALU3
# CHECK-NEXT: [7] - Zn4BRU1
# CHECK-NEXT: [8] - Zn4FP0
# CHECK-NEXT: [9] - Zn4FP1
# CHECK-NEXT: [10] - Zn4FP2
# CHECK-NEXT: [11] - Zn4FP3
# CHECK-NEXT: [12.0] - Zn4FP45
# CHECK-NEXT: [12.1] - Zn4FP45
# CHECK-NEXT: [13] - Zn4FPSt
# CHECK-NEXT: [14.0] - Zn4LSU
# CHECK-NEXT: [14.1] - Zn4LSU
# CHECK-NEXT: [14.2] - Zn4LSU
# CHECK-NEXT: [15.0] - Zn4Load
# CHECK-NEXT: [15.1] - Zn4Load
# CHECK-NEXT: [15.2] - Zn4Load
# CHECK-NEXT: [16.0] - Zn4Store
# CHECK-NEXT: [16.1] - Zn4Store

# CHECK: Resource pressure per iteration:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - -

# CHECK: Resource pressure by instruction:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - clflushopt (%rax)
48 changes: 48 additions & 0 deletions llvm/test/tools/llvm-mca/X86/Znver4/resources-clwb.s
Original file line number Diff line number Diff line change
@@ -0,0 +1,48 @@
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver4 -instruction-tables < %s | FileCheck %s

# Instruction-table coverage for CLWB under the znver4 CPU model.
# The single memory-operand form below is the only input given to llvm-mca.
# The assertions that follow pin what the tool reports for it: uOps, latency,
# reciprocal throughput, the MayLoad/MayStore/HasSideEffects flags, and the
# per-resource pressure (spread evenly over the three AGU, LSU and Load slots).
# Those assertions are generated output (see the NOTE at the top of this file);
# presumably they should be regenerated with the script named there rather
# than edited by hand.
clwb (%rax)

# CHECK: Instruction Info:
# CHECK-NEXT: [1]: #uOps
# CHECK-NEXT: [2]: Latency
# CHECK-NEXT: [3]: RThroughput
# CHECK-NEXT: [4]: MayLoad
# CHECK-NEXT: [5]: MayStore
# CHECK-NEXT: [6]: HasSideEffects (U)

# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
# CHECK-NEXT: 1 5 0.33 * * U clwb (%rax)

# CHECK: Resources:
# CHECK-NEXT: [0] - Zn4AGU0
# CHECK-NEXT: [1] - Zn4AGU1
# CHECK-NEXT: [2] - Zn4AGU2
# CHECK-NEXT: [3] - Zn4ALU0
# CHECK-NEXT: [4] - Zn4ALU1
# CHECK-NEXT: [5] - Zn4ALU2
# CHECK-NEXT: [6] - Zn4ALU3
# CHECK-NEXT: [7] - Zn4BRU1
# CHECK-NEXT: [8] - Zn4FP0
# CHECK-NEXT: [9] - Zn4FP1
# CHECK-NEXT: [10] - Zn4FP2
# CHECK-NEXT: [11] - Zn4FP3
# CHECK-NEXT: [12.0] - Zn4FP45
# CHECK-NEXT: [12.1] - Zn4FP45
# CHECK-NEXT: [13] - Zn4FPSt
# CHECK-NEXT: [14.0] - Zn4LSU
# CHECK-NEXT: [14.1] - Zn4LSU
# CHECK-NEXT: [14.2] - Zn4LSU
# CHECK-NEXT: [15.0] - Zn4Load
# CHECK-NEXT: [15.1] - Zn4Load
# CHECK-NEXT: [15.2] - Zn4Load
# CHECK-NEXT: [16.0] - Zn4Store
# CHECK-NEXT: [16.1] - Zn4Store

# CHECK: Resource pressure per iteration:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - -

# CHECK: Resource pressure by instruction:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - clwb (%rax)
Loading