diff --git a/llvm/test/tools/llvm-mca/X86/Generic/resources-avx512cd.s b/llvm/test/tools/llvm-mca/X86/Generic/resources-avx512cd.s new file mode 100644 index 0000000000000..498e1422d32c0 --- /dev/null +++ b/llvm/test/tools/llvm-mca/X86/Generic/resources-avx512cd.s @@ -0,0 +1,149 @@ +# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py +# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=x86-64 -instruction-tables < %s | FileCheck %s + +vpbroadcastmb2q %k0, %zmm16 + +vpbroadcastmw2d %k0, %zmm16 + +vpconflictd %zmm16, %zmm19 +vpconflictd (%rax), %zmm19 +vpconflictd (%rax){1to16}, %zmm19 +vpconflictd %zmm16, %zmm19 {k1} +vpconflictd (%rax), %zmm19 {k1} +vpconflictd (%rax){1to16}, %zmm19 {k1} +vpconflictd %zmm16, %zmm19 {z}{k1} +vpconflictd (%rax), %zmm19 {z}{k1} +vpconflictd (%rax){1to16}, %zmm19 {z}{k1} + +vpconflictq %zmm16, %zmm19 +vpconflictq (%rax), %zmm19 +vpconflictq (%rax){1to8}, %zmm19 +vpconflictq %zmm16, %zmm19 {k1} +vpconflictq (%rax), %zmm19 {k1} +vpconflictq (%rax){1to8}, %zmm19 {k1} +vpconflictq %zmm16, %zmm19 {z}{k1} +vpconflictq (%rax), %zmm19 {z}{k1} +vpconflictq (%rax){1to8}, %zmm19 {z}{k1} + +vplzcntd %zmm16, %zmm19 +vplzcntd (%rax), %zmm19 +vplzcntd (%rax){1to16}, %zmm19 +vplzcntd %zmm16, %zmm19 {k1} +vplzcntd (%rax), %zmm19 {k1} +vplzcntd (%rax){1to16}, %zmm19 {k1} +vplzcntd %zmm16, %zmm19 {z}{k1} +vplzcntd (%rax), %zmm19 {z}{k1} +vplzcntd (%rax){1to16}, %zmm19 {z}{k1} + +vplzcntq %zmm16, %zmm19 +vplzcntq (%rax), %zmm19 +vplzcntq (%rax){1to8}, %zmm19 +vplzcntq %zmm16, %zmm19 {k1} +vplzcntq (%rax), %zmm19 {k1} +vplzcntq (%rax){1to8}, %zmm19 {k1} +vplzcntq %zmm16, %zmm19 {z}{k1} +vplzcntq (%rax), %zmm19 {z}{k1} +vplzcntq (%rax){1to8}, %zmm19 {z}{k1} + +# CHECK: Instruction Info: +# CHECK-NEXT: [1]: #uOps +# CHECK-NEXT: [2]: Latency +# CHECK-NEXT: [3]: RThroughput +# CHECK-NEXT: [4]: MayLoad +# CHECK-NEXT: [5]: MayStore +# CHECK-NEXT: [6]: HasSideEffects (U) + +# CHECK: [1] [2] [3] [4] [5] [6] Instructions: +# CHECK-NEXT: 1 1 1.00 vpbroadcastmb2q %k0, %zmm16 +# CHECK-NEXT: 1 1 1.00 vpbroadcastmw2d %k0, %zmm16 +# CHECK-NEXT: 1 1 0.50 vpconflictd %zmm16, %zmm19 +# CHECK-NEXT: 2 8 0.50 * vpconflictd (%rax), %zmm19 +# CHECK-NEXT: 2 8 0.50 * vpconflictd (%rax){1to16}, %zmm19 +# CHECK-NEXT: 1 1 0.50 vpconflictd %zmm16, %zmm19 {%k1} +# CHECK-NEXT: 2 8 0.50 * vpconflictd (%rax), %zmm19 {%k1} +# CHECK-NEXT: 2 8 0.50 * vpconflictd (%rax){1to16}, %zmm19 {%k1} +# CHECK-NEXT: 1 1 0.50 vpconflictd %zmm16, %zmm19 {%k1} {z} +# CHECK-NEXT: 2 8 0.50 * vpconflictd (%rax), %zmm19 {%k1} {z} +# CHECK-NEXT: 2 8 0.50 * vpconflictd (%rax){1to16}, %zmm19 {%k1} {z} +# CHECK-NEXT: 1 1 0.50 vpconflictq %zmm16, %zmm19 +# CHECK-NEXT: 2 8 0.50 * vpconflictq (%rax), %zmm19 +# CHECK-NEXT: 2 8 0.50 * vpconflictq (%rax){1to8}, %zmm19 +# CHECK-NEXT: 1 1 0.50 vpconflictq %zmm16, %zmm19 {%k1} +# CHECK-NEXT: 2 8 0.50 * vpconflictq (%rax), %zmm19 {%k1} +# CHECK-NEXT: 2 8 0.50 * vpconflictq (%rax){1to8}, %zmm19 {%k1} +# CHECK-NEXT: 1 1 0.50 vpconflictq %zmm16, %zmm19 {%k1} {z} +# CHECK-NEXT: 2 8 0.50 * vpconflictq (%rax), %zmm19 {%k1} {z} +# CHECK-NEXT: 2 8 0.50 * vpconflictq (%rax){1to8}, %zmm19 {%k1} {z} +# CHECK-NEXT: 1 5 1.00 vplzcntd %zmm16, %zmm19 +# CHECK-NEXT: 2 12 1.00 * vplzcntd (%rax), %zmm19 +# CHECK-NEXT: 2 12 1.00 * vplzcntd (%rax){1to16}, %zmm19 +# CHECK-NEXT: 1 5 1.00 vplzcntd %zmm16, %zmm19 {%k1} +# CHECK-NEXT: 2 12 1.00 * vplzcntd (%rax), %zmm19 {%k1} +# CHECK-NEXT: 2 12 1.00 * vplzcntd (%rax){1to16}, %zmm19 {%k1} +# CHECK-NEXT: 1 5 1.00 vplzcntd %zmm16, %zmm19 {%k1} {z} +# CHECK-NEXT: 2 12 1.00 * vplzcntd (%rax), %zmm19 {%k1} {z} +# CHECK-NEXT: 2 12 1.00 * vplzcntd (%rax){1to16}, %zmm19 {%k1} {z} +# CHECK-NEXT: 1 5 1.00 vplzcntq %zmm16, %zmm19 +# CHECK-NEXT: 2 12 1.00 * vplzcntq (%rax), %zmm19 +# CHECK-NEXT: 2 12 1.00 * vplzcntq (%rax){1to8}, %zmm19 +# CHECK-NEXT: 1 5 1.00 vplzcntq %zmm16, %zmm19 {%k1} +# CHECK-NEXT: 2 12 1.00 * vplzcntq (%rax), %zmm19 {%k1} +# CHECK-NEXT: 2 12 1.00 * vplzcntq (%rax){1to8}, %zmm19 {%k1} +# CHECK-NEXT: 1 5 1.00 vplzcntq %zmm16, %zmm19 {%k1} {z} +# CHECK-NEXT: 2 12 1.00 * vplzcntq (%rax), %zmm19 {%k1} {z} +# CHECK-NEXT: 2 12 1.00 * vplzcntq (%rax){1to8}, %zmm19 {%k1} {z} + +# CHECK: Resources: +# CHECK-NEXT: [0] - SBDivider +# CHECK-NEXT: [1] - SBFPDivider +# CHECK-NEXT: [2] - SBPort0 +# CHECK-NEXT: [3] - SBPort1 +# CHECK-NEXT: [4] - SBPort4 +# CHECK-NEXT: [5] - SBPort5 +# CHECK-NEXT: [6.0] - SBPort23 +# CHECK-NEXT: [6.1] - SBPort23 + +# CHECK: Resource pressure per iteration: +# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1] +# CHECK-NEXT: - - 18.00 9.00 - 11.00 12.00 12.00 + +# CHECK: Resource pressure by instruction: +# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1] Instructions: +# CHECK-NEXT: - - - - - 1.00 - - vpbroadcastmb2q %k0, %zmm16 +# CHECK-NEXT: - - - - - 1.00 - - vpbroadcastmw2d %k0, %zmm16 +# CHECK-NEXT: - - - 0.50 - 0.50 - - vpconflictd %zmm16, %zmm19 +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictd (%rax), %zmm19 +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictd (%rax){1to16}, %zmm19 +# CHECK-NEXT: - - - 0.50 - 0.50 - - vpconflictd %zmm16, %zmm19 {%k1} +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictd (%rax), %zmm19 {%k1} +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictd (%rax){1to16}, %zmm19 {%k1} +# CHECK-NEXT: - - - 0.50 - 0.50 - - vpconflictd %zmm16, %zmm19 {%k1} {z} +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictd (%rax), %zmm19 {%k1} {z} +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictd (%rax){1to16}, %zmm19 {%k1} {z} +# CHECK-NEXT: - - - 0.50 - 0.50 - - vpconflictq %zmm16, %zmm19 +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictq (%rax), %zmm19 +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictq (%rax){1to8}, %zmm19 +# CHECK-NEXT: - - - 0.50 - 0.50 - - vpconflictq %zmm16, %zmm19 {%k1} +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictq (%rax), %zmm19 {%k1} +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictq (%rax){1to8}, %zmm19 {%k1} +# CHECK-NEXT: - - - 0.50 - 0.50 - - vpconflictq %zmm16, %zmm19 {%k1} {z} +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictq (%rax), %zmm19 {%k1} {z} +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictq (%rax){1to8}, %zmm19 {%k1} {z} +# CHECK-NEXT: - - 1.00 - - - - - vplzcntd %zmm16, %zmm19 +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntd (%rax), %zmm19 +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntd (%rax){1to16}, %zmm19 +# CHECK-NEXT: - - 1.00 - - - - - vplzcntd %zmm16, %zmm19 {%k1} +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntd (%rax), %zmm19 {%k1} +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntd (%rax){1to16}, %zmm19 {%k1} +# CHECK-NEXT: - - 1.00 - - - - - vplzcntd %zmm16, %zmm19 {%k1} {z} +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntd (%rax), %zmm19 {%k1} {z} +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntd (%rax){1to16}, %zmm19 {%k1} {z} +# CHECK-NEXT: - - 1.00 - - - - - vplzcntq %zmm16, %zmm19 +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntq (%rax), %zmm19 +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntq (%rax){1to8}, %zmm19 +# CHECK-NEXT: - - 1.00 - - - - - vplzcntq %zmm16, %zmm19 {%k1} +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntq (%rax), %zmm19 {%k1} +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntq (%rax){1to8}, %zmm19 {%k1} +# CHECK-NEXT: - - 1.00 - - - - - vplzcntq %zmm16, %zmm19 {%k1} {z} +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntq (%rax), %zmm19 {%k1} {z} +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntq (%rax){1to8}, %zmm19 {%k1} {z} diff --git a/llvm/test/tools/llvm-mca/X86/Generic/resources-avx512cdvl.s b/llvm/test/tools/llvm-mca/X86/Generic/resources-avx512cdvl.s new file mode 100644 index 0000000000000..af926dc81161e --- /dev/null +++ b/llvm/test/tools/llvm-mca/X86/Generic/resources-avx512cdvl.s @@ -0,0 +1,267 @@ +# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py +# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=x86-64 -instruction-tables < %s | FileCheck %s + +vpbroadcastmb2q %k0, %xmm16 +vpbroadcastmb2q %k0, %ymm16 + +vpbroadcastmw2d %k0, %xmm16 +vpbroadcastmw2d %k0, %ymm16 + +vpconflictd %xmm16, %xmm19 +vpconflictd (%rax), %xmm19 +vpconflictd (%rax){1to4}, %xmm19 +vpconflictd %xmm16, %xmm19 {k1} +vpconflictd (%rax), %xmm19 {k1} +vpconflictd (%rax){1to4}, %xmm19 {k1} +vpconflictd %xmm16, %xmm19 {z}{k1} +vpconflictd (%rax), %xmm19 {z}{k1} +vpconflictd (%rax){1to4}, %xmm19 {z}{k1} + +vpconflictd %ymm16, %ymm19 +vpconflictd (%rax), %ymm19 +vpconflictd (%rax){1to8}, %ymm19 +vpconflictd %ymm16, %ymm19 {k1} +vpconflictd (%rax), %ymm19 {k1} +vpconflictd (%rax){1to8}, %ymm19 {k1} +vpconflictd %ymm16, %ymm19 {z}{k1} +vpconflictd (%rax), %ymm19 {z}{k1} +vpconflictd (%rax){1to8}, %ymm19 {z}{k1} + +vpconflictq %xmm16, %xmm19 +vpconflictq (%rax), %xmm19 +vpconflictq (%rax){1to2}, %xmm19 +vpconflictq %xmm16, %xmm19 {k1} +vpconflictq (%rax), %xmm19 {k1} +vpconflictq (%rax){1to2}, %xmm19 {k1} +vpconflictq %xmm16, %xmm19 {z}{k1} +vpconflictq (%rax), %xmm19 {z}{k1} +vpconflictq (%rax){1to2}, %xmm19 {z}{k1} + +vpconflictq %ymm16, %ymm19 +vpconflictq (%rax), %ymm19 +vpconflictq (%rax){1to4}, %ymm19 +vpconflictq %ymm16, %ymm19 {k1} +vpconflictq (%rax), %ymm19 {k1} +vpconflictq (%rax){1to4}, %ymm19 {k1} +vpconflictq %ymm16, %ymm19 {z}{k1} +vpconflictq (%rax), %ymm19 {z}{k1} +vpconflictq (%rax){1to4}, %ymm19 {z}{k1} + +vplzcntd %xmm16, %xmm19 +vplzcntd (%rax), %xmm19 +vplzcntd (%rax){1to4}, %xmm19 +vplzcntd %xmm16, %xmm19 {k1} +vplzcntd (%rax), %xmm19 {k1} +vplzcntd (%rax){1to4}, %xmm19 {k1} +vplzcntd %xmm16, %xmm19 {z}{k1} +vplzcntd (%rax), %xmm19 {z}{k1} +vplzcntd (%rax){1to4}, %xmm19 {z}{k1} + +vplzcntd %ymm16, %ymm19 +vplzcntd (%rax), %ymm19 +vplzcntd (%rax){1to8}, %ymm19 +vplzcntd %ymm16, %ymm19 {k1} +vplzcntd (%rax), %ymm19 {k1} +vplzcntd (%rax){1to8}, %ymm19 {k1} +vplzcntd %ymm16, %ymm19 {z}{k1} +vplzcntd (%rax), %ymm19 {z}{k1} +vplzcntd (%rax){1to8}, %ymm19 {z}{k1} + +vplzcntq %xmm16, %xmm19 +vplzcntq (%rax), %xmm19 +vplzcntq (%rax){1to2}, %xmm19 +vplzcntq %xmm16, %xmm19 {k1} +vplzcntq (%rax), %xmm19 {k1} +vplzcntq (%rax){1to2}, %xmm19 {k1} +vplzcntq %xmm16, %xmm19 {z}{k1} +vplzcntq (%rax), %xmm19 {z}{k1} +vplzcntq (%rax){1to2}, %xmm19 {z}{k1} + +vplzcntq %ymm16, %ymm19 +vplzcntq (%rax), %ymm19 +vplzcntq (%rax){1to4}, %ymm19 +vplzcntq %ymm16, %ymm19 {k1} +vplzcntq (%rax), %ymm19 {k1} +vplzcntq (%rax){1to4}, %ymm19 {k1} +vplzcntq %ymm16, %ymm19 {z}{k1} +vplzcntq (%rax), %ymm19 {z}{k1} +vplzcntq (%rax){1to4}, %ymm19 {z}{k1} + +# CHECK: Instruction Info: +# CHECK-NEXT: [1]: #uOps +# CHECK-NEXT: [2]: Latency +# CHECK-NEXT: [3]: RThroughput +# CHECK-NEXT: [4]: MayLoad +# CHECK-NEXT: [5]: MayStore +# CHECK-NEXT: [6]: HasSideEffects (U) + +# CHECK: [1] [2] [3] [4] [5] [6] Instructions: +# CHECK-NEXT: 1 1 1.00 vpbroadcastmb2q %k0, %xmm16 +# CHECK-NEXT: 1 1 1.00 vpbroadcastmb2q %k0, %ymm16 +# CHECK-NEXT: 1 1 1.00 vpbroadcastmw2d %k0, %xmm16 +# CHECK-NEXT: 1 1 1.00 vpbroadcastmw2d %k0, %ymm16 +# CHECK-NEXT: 1 1 0.50 vpconflictd %xmm16, %xmm19 +# CHECK-NEXT: 2 7 0.50 * vpconflictd (%rax), %xmm19 +# CHECK-NEXT: 2 7 0.50 * vpconflictd (%rax){1to4}, %xmm19 +# CHECK-NEXT: 1 1 0.50 vpconflictd %xmm16, %xmm19 {%k1} +# CHECK-NEXT: 2 7 0.50 * vpconflictd (%rax), %xmm19 {%k1} +# CHECK-NEXT: 2 7 0.50 * vpconflictd (%rax){1to4}, %xmm19 {%k1} +# CHECK-NEXT: 1 1 0.50 vpconflictd %xmm16, %xmm19 {%k1} {z} +# CHECK-NEXT: 2 7 0.50 * vpconflictd (%rax), %xmm19 {%k1} {z} +# CHECK-NEXT: 2 7 0.50 * vpconflictd (%rax){1to4}, %xmm19 {%k1} {z} +# CHECK-NEXT: 1 1 0.50 vpconflictd %ymm16, %ymm19 +# CHECK-NEXT: 2 8 0.50 * vpconflictd (%rax), %ymm19 +# CHECK-NEXT: 2 8 0.50 * vpconflictd (%rax){1to8}, %ymm19 +# CHECK-NEXT: 1 1 0.50 vpconflictd %ymm16, %ymm19 {%k1} +# CHECK-NEXT: 2 8 0.50 * vpconflictd (%rax), %ymm19 {%k1} +# CHECK-NEXT: 2 8 0.50 * vpconflictd (%rax){1to8}, %ymm19 {%k1} +# CHECK-NEXT: 1 1 0.50 vpconflictd %ymm16, %ymm19 {%k1} {z} +# CHECK-NEXT: 2 8 0.50 * vpconflictd (%rax), %ymm19 {%k1} {z} +# CHECK-NEXT: 2 8 0.50 * vpconflictd (%rax){1to8}, %ymm19 {%k1} {z} +# CHECK-NEXT: 1 1 0.50 vpconflictq %xmm16, %xmm19 +# CHECK-NEXT: 2 7 0.50 * vpconflictq (%rax), %xmm19 +# CHECK-NEXT: 2 7 0.50 * vpconflictq (%rax){1to2}, %xmm19 +# CHECK-NEXT: 1 1 0.50 vpconflictq %xmm16, %xmm19 {%k1} +# CHECK-NEXT: 2 7 0.50 * vpconflictq (%rax), %xmm19 {%k1} +# CHECK-NEXT: 2 7 0.50 * vpconflictq (%rax){1to2}, %xmm19 {%k1} +# CHECK-NEXT: 1 1 0.50 vpconflictq %xmm16, %xmm19 {%k1} {z} +# CHECK-NEXT: 2 7 0.50 * vpconflictq (%rax), %xmm19 {%k1} {z} +# CHECK-NEXT: 2 7 0.50 * vpconflictq (%rax){1to2}, %xmm19 {%k1} {z} +# CHECK-NEXT: 1 1 0.50 vpconflictq %ymm16, %ymm19 +# CHECK-NEXT: 2 8 0.50 * vpconflictq (%rax), %ymm19 +# CHECK-NEXT: 2 8 0.50 * vpconflictq (%rax){1to4}, %ymm19 +# CHECK-NEXT: 1 1 0.50 vpconflictq %ymm16, %ymm19 {%k1} +# CHECK-NEXT: 2 8 0.50 * vpconflictq (%rax), %ymm19 {%k1} +# CHECK-NEXT: 2 8 0.50 * vpconflictq (%rax){1to4}, %ymm19 {%k1} +# CHECK-NEXT: 1 1 0.50 vpconflictq %ymm16, %ymm19 {%k1} {z} +# CHECK-NEXT: 2 8 0.50 * vpconflictq (%rax), %ymm19 {%k1} {z} +# CHECK-NEXT: 2 8 0.50 * vpconflictq (%rax){1to4}, %ymm19 {%k1} {z} +# CHECK-NEXT: 1 5 1.00 vplzcntd %xmm16, %xmm19 +# CHECK-NEXT: 2 11 1.00 * vplzcntd (%rax), %xmm19 +# CHECK-NEXT: 2 11 1.00 * vplzcntd (%rax){1to4}, %xmm19 +# CHECK-NEXT: 1 5 1.00 vplzcntd %xmm16, %xmm19 {%k1} +# CHECK-NEXT: 2 11 1.00 * vplzcntd (%rax), %xmm19 {%k1} +# CHECK-NEXT: 2 11 1.00 * vplzcntd (%rax){1to4}, %xmm19 {%k1} +# CHECK-NEXT: 1 5 1.00 vplzcntd %xmm16, %xmm19 {%k1} {z} +# CHECK-NEXT: 2 11 1.00 * vplzcntd (%rax), %xmm19 {%k1} {z} +# CHECK-NEXT: 2 11 1.00 * vplzcntd (%rax){1to4}, %xmm19 {%k1} {z} +# CHECK-NEXT: 1 5 1.00 vplzcntd %ymm16, %ymm19 +# CHECK-NEXT: 2 12 1.00 * vplzcntd (%rax), %ymm19 +# CHECK-NEXT: 2 12 1.00 * vplzcntd (%rax){1to8}, %ymm19 +# CHECK-NEXT: 1 5 1.00 vplzcntd %ymm16, %ymm19 {%k1} +# CHECK-NEXT: 2 12 1.00 * vplzcntd (%rax), %ymm19 {%k1} +# CHECK-NEXT: 2 12 1.00 * vplzcntd (%rax){1to8}, %ymm19 {%k1} +# CHECK-NEXT: 1 5 1.00 vplzcntd %ymm16, %ymm19 {%k1} {z} +# CHECK-NEXT: 2 12 1.00 * vplzcntd (%rax), %ymm19 {%k1} {z} +# CHECK-NEXT: 2 12 1.00 * vplzcntd (%rax){1to8}, %ymm19 {%k1} {z} +# CHECK-NEXT: 1 5 1.00 vplzcntq %xmm16, %xmm19 +# CHECK-NEXT: 2 11 1.00 * vplzcntq (%rax), %xmm19 +# CHECK-NEXT: 2 11 1.00 * vplzcntq (%rax){1to2}, %xmm19 +# CHECK-NEXT: 1 5 1.00 vplzcntq %xmm16, %xmm19 {%k1} +# CHECK-NEXT: 2 11 1.00 * vplzcntq (%rax), %xmm19 {%k1} +# CHECK-NEXT: 2 11 1.00 * vplzcntq (%rax){1to2}, %xmm19 {%k1} +# CHECK-NEXT: 1 5 1.00 vplzcntq %xmm16, %xmm19 {%k1} {z} +# CHECK-NEXT: 2 11 1.00 * vplzcntq (%rax), %xmm19 {%k1} {z} +# CHECK-NEXT: 2 11 1.00 * vplzcntq (%rax){1to2}, %xmm19 {%k1} {z} +# CHECK-NEXT: 1 5 1.00 vplzcntq %ymm16, %ymm19 +# CHECK-NEXT: 2 12 1.00 * vplzcntq (%rax), %ymm19 +# CHECK-NEXT: 2 12 1.00 * vplzcntq (%rax){1to4}, %ymm19 +# CHECK-NEXT: 1 5 1.00 vplzcntq %ymm16, %ymm19 {%k1} +# CHECK-NEXT: 2 12 1.00 * vplzcntq (%rax), %ymm19 {%k1} +# CHECK-NEXT: 2 12 1.00 * vplzcntq (%rax){1to4}, %ymm19 {%k1} +# CHECK-NEXT: 1 5 1.00 vplzcntq %ymm16, %ymm19 {%k1} {z} +# CHECK-NEXT: 2 12 1.00 * vplzcntq (%rax), %ymm19 {%k1} {z} +# CHECK-NEXT: 2 12 1.00 * vplzcntq (%rax){1to4}, %ymm19 {%k1} {z} + +# CHECK: Resources: +# CHECK-NEXT: [0] - SBDivider +# CHECK-NEXT: [1] - SBFPDivider +# CHECK-NEXT: [2] - SBPort0 +# CHECK-NEXT: [3] - SBPort1 +# CHECK-NEXT: [4] - SBPort4 +# CHECK-NEXT: [5] - SBPort5 +# CHECK-NEXT: [6.0] - SBPort23 +# CHECK-NEXT: [6.1] - SBPort23 + +# CHECK: Resource pressure per iteration: +# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1] +# CHECK-NEXT: - - 36.00 18.00 - 22.00 24.00 24.00 + +# CHECK: Resource pressure by instruction: +# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6.0] [6.1] Instructions: +# CHECK-NEXT: - - - - - 1.00 - - vpbroadcastmb2q %k0, %xmm16 +# CHECK-NEXT: - - - - - 1.00 - - vpbroadcastmb2q %k0, %ymm16 +# CHECK-NEXT: - - - - - 1.00 - - vpbroadcastmw2d %k0, %xmm16 +# CHECK-NEXT: - - - - - 1.00 - - vpbroadcastmw2d %k0, %ymm16 +# CHECK-NEXT: - - - 0.50 - 0.50 - - vpconflictd %xmm16, %xmm19 +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictd (%rax), %xmm19 +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictd (%rax){1to4}, %xmm19 +# CHECK-NEXT: - - - 0.50 - 0.50 - - vpconflictd %xmm16, %xmm19 {%k1} +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictd (%rax), %xmm19 {%k1} +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictd (%rax){1to4}, %xmm19 {%k1} +# CHECK-NEXT: - - - 0.50 - 0.50 - - vpconflictd %xmm16, %xmm19 {%k1} {z} +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictd (%rax), %xmm19 {%k1} {z} +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictd (%rax){1to4}, %xmm19 {%k1} {z} +# CHECK-NEXT: - - - 0.50 - 0.50 - - vpconflictd %ymm16, %ymm19 +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictd (%rax), %ymm19 +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictd (%rax){1to8}, %ymm19 +# CHECK-NEXT: - - - 0.50 - 0.50 - - vpconflictd %ymm16, %ymm19 {%k1} +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictd (%rax), %ymm19 {%k1} +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictd (%rax){1to8}, %ymm19 {%k1} +# CHECK-NEXT: - - - 0.50 - 0.50 - - vpconflictd %ymm16, %ymm19 {%k1} {z} +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictd (%rax), %ymm19 {%k1} {z} +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictd (%rax){1to8}, %ymm19 {%k1} {z} +# CHECK-NEXT: - - - 0.50 - 0.50 - - vpconflictq %xmm16, %xmm19 +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictq (%rax), %xmm19 +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictq (%rax){1to2}, %xmm19 +# CHECK-NEXT: - - - 0.50 - 0.50 - - vpconflictq %xmm16, %xmm19 {%k1} +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictq (%rax), %xmm19 {%k1} +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictq (%rax){1to2}, %xmm19 {%k1} +# CHECK-NEXT: - - - 0.50 - 0.50 - - vpconflictq %xmm16, %xmm19 {%k1} {z} +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictq (%rax), %xmm19 {%k1} {z} +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictq (%rax){1to2}, %xmm19 {%k1} {z} +# CHECK-NEXT: - - - 0.50 - 0.50 - - vpconflictq %ymm16, %ymm19 +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictq (%rax), %ymm19 +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictq (%rax){1to4}, %ymm19 +# CHECK-NEXT: - - - 0.50 - 0.50 - - vpconflictq %ymm16, %ymm19 {%k1} +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictq (%rax), %ymm19 {%k1} +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictq (%rax){1to4}, %ymm19 {%k1} +# CHECK-NEXT: - - - 0.50 - 0.50 - - vpconflictq %ymm16, %ymm19 {%k1} {z} +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictq (%rax), %ymm19 {%k1} {z} +# CHECK-NEXT: - - - 0.50 - 0.50 0.50 0.50 vpconflictq (%rax){1to4}, %ymm19 {%k1} {z} +# CHECK-NEXT: - - 1.00 - - - - - vplzcntd %xmm16, %xmm19 +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntd (%rax), %xmm19 +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntd (%rax){1to4}, %xmm19 +# CHECK-NEXT: - - 1.00 - - - - - vplzcntd %xmm16, %xmm19 {%k1} +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntd (%rax), %xmm19 {%k1} +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntd (%rax){1to4}, %xmm19 {%k1} +# CHECK-NEXT: - - 1.00 - - - - - vplzcntd %xmm16, %xmm19 {%k1} {z} +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntd (%rax), %xmm19 {%k1} {z} +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntd (%rax){1to4}, %xmm19 {%k1} {z} +# CHECK-NEXT: - - 1.00 - - - - - vplzcntd %ymm16, %ymm19 +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntd (%rax), %ymm19 +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntd (%rax){1to8}, %ymm19 +# CHECK-NEXT: - - 1.00 - - - - - vplzcntd %ymm16, %ymm19 {%k1} +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntd (%rax), %ymm19 {%k1} +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntd (%rax){1to8}, %ymm19 {%k1} +# CHECK-NEXT: - - 1.00 - - - - - vplzcntd %ymm16, %ymm19 {%k1} {z} +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntd (%rax), %ymm19 {%k1} {z} +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntd (%rax){1to8}, %ymm19 {%k1} {z} +# CHECK-NEXT: - - 1.00 - - - - - vplzcntq %xmm16, %xmm19 +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntq (%rax), %xmm19 +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntq (%rax){1to2}, %xmm19 +# CHECK-NEXT: - - 1.00 - - - - - vplzcntq %xmm16, %xmm19 {%k1} +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntq (%rax), %xmm19 {%k1} +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntq (%rax){1to2}, %xmm19 {%k1} +# CHECK-NEXT: - - 1.00 - - - - - vplzcntq %xmm16, %xmm19 {%k1} {z} +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntq (%rax), %xmm19 {%k1} {z} +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntq (%rax){1to2}, %xmm19 {%k1} {z} +# CHECK-NEXT: - - 1.00 - - - - - vplzcntq %ymm16, %ymm19 +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntq (%rax), %ymm19 +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntq (%rax){1to4}, %ymm19 +# CHECK-NEXT: - - 1.00 - - - - - vplzcntq %ymm16, %ymm19 {%k1} +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntq (%rax), %ymm19 {%k1} +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntq (%rax){1to4}, %ymm19 {%k1} +# CHECK-NEXT: - - 1.00 - - - - - vplzcntq %ymm16, %ymm19 {%k1} {z} +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntq (%rax), %ymm19 {%k1} {z} +# CHECK-NEXT: - - 1.00 - - - 0.50 0.50 vplzcntq (%rax){1to4}, %ymm19 {%k1} {z} diff --git a/llvm/test/tools/llvm-mca/X86/IceLakeServer/resources-avx512cd.s b/llvm/test/tools/llvm-mca/X86/IceLakeServer/resources-avx512cd.s new file mode 100644 index 0000000000000..901646d909266 --- /dev/null +++ b/llvm/test/tools/llvm-mca/X86/IceLakeServer/resources-avx512cd.s @@ -0,0 +1,153 @@ +# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py +# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=icelake-server -instruction-tables < %s | FileCheck %s + +vpbroadcastmb2q %k0, %zmm16 + +vpbroadcastmw2d %k0, %zmm16 + +vpconflictd %zmm16, %zmm19 +vpconflictd (%rax), %zmm19 +vpconflictd (%rax){1to16}, %zmm19 +vpconflictd %zmm16, %zmm19 {k1} +vpconflictd (%rax), %zmm19 {k1} +vpconflictd (%rax){1to16}, %zmm19 {k1} +vpconflictd %zmm16, %zmm19 {z}{k1} +vpconflictd (%rax), %zmm19 {z}{k1} +vpconflictd (%rax){1to16}, %zmm19 {z}{k1} + +vpconflictq %zmm16, %zmm19 +vpconflictq (%rax), %zmm19 +vpconflictq (%rax){1to8}, %zmm19 +vpconflictq %zmm16, %zmm19 {k1} +vpconflictq (%rax), %zmm19 {k1} +vpconflictq (%rax){1to8}, %zmm19 {k1} +vpconflictq %zmm16, %zmm19 {z}{k1} +vpconflictq (%rax), %zmm19 {z}{k1} +vpconflictq (%rax){1to8}, %zmm19 {z}{k1} + +vplzcntd %zmm16, %zmm19 +vplzcntd (%rax), %zmm19 +vplzcntd (%rax){1to16}, %zmm19 +vplzcntd %zmm16, %zmm19 {k1} +vplzcntd (%rax), %zmm19 {k1} +vplzcntd (%rax){1to16}, %zmm19 {k1} +vplzcntd %zmm16, %zmm19 {z}{k1} +vplzcntd (%rax), %zmm19 {z}{k1} +vplzcntd (%rax){1to16}, %zmm19 {z}{k1} + +vplzcntq %zmm16, %zmm19 +vplzcntq (%rax), %zmm19 +vplzcntq (%rax){1to8}, %zmm19 +vplzcntq %zmm16, %zmm19 {k1} +vplzcntq (%rax), %zmm19 {k1} +vplzcntq (%rax){1to8}, %zmm19 {k1} +vplzcntq %zmm16, %zmm19 {z}{k1} +vplzcntq (%rax), %zmm19 {z}{k1} +vplzcntq (%rax){1to8}, %zmm19 {z}{k1} + +# CHECK: Instruction Info: +# CHECK-NEXT: [1]: #uOps +# CHECK-NEXT: [2]: Latency +# CHECK-NEXT: [3]: RThroughput +# CHECK-NEXT: [4]: MayLoad +# CHECK-NEXT: [5]: MayStore +# CHECK-NEXT: [6]: HasSideEffects (U) + +# CHECK: [1] [2] [3] [4] [5] [6] Instructions: +# CHECK-NEXT: 1 1 1.00 vpbroadcastmb2q %k0, %zmm16 +# CHECK-NEXT: 1 1 1.00 vpbroadcastmw2d %k0, %zmm16 +# CHECK-NEXT: 35 67 17.00 vpconflictd %zmm16, %zmm19 +# CHECK-NEXT: 36 74 17.00 * vpconflictd (%rax), %zmm19 +# CHECK-NEXT: 36 74 17.00 * vpconflictd (%rax){1to16}, %zmm19 +# CHECK-NEXT: 35 67 17.00 vpconflictd %zmm16, %zmm19 {%k1} +# CHECK-NEXT: 36 74 17.00 * vpconflictd (%rax), %zmm19 {%k1} +# CHECK-NEXT: 36 74 17.00 * vpconflictd (%rax){1to16}, %zmm19 {%k1} +# CHECK-NEXT: 35 67 17.00 vpconflictd %zmm16, %zmm19 {%k1} {z} +# CHECK-NEXT: 36 74 17.00 * vpconflictd (%rax), %zmm19 {%k1} {z} +# CHECK-NEXT: 36 74 17.00 * vpconflictd (%rax){1to16}, %zmm19 {%k1} {z} +# CHECK-NEXT: 21 37 9.00 vpconflictq %zmm16, %zmm19 +# CHECK-NEXT: 22 44 9.00 * vpconflictq (%rax), %zmm19 +# CHECK-NEXT: 22 44 9.00 * vpconflictq (%rax){1to8}, %zmm19 +# CHECK-NEXT: 21 37 9.00 vpconflictq %zmm16, %zmm19 {%k1} +# CHECK-NEXT: 22 44 9.00 * vpconflictq (%rax), %zmm19 {%k1} +# CHECK-NEXT: 22 44 9.00 * vpconflictq (%rax){1to8}, %zmm19 {%k1} +# CHECK-NEXT: 21 37 9.00 vpconflictq %zmm16, %zmm19 {%k1} {z} +# CHECK-NEXT: 22 44 9.00 * vpconflictq (%rax), %zmm19 {%k1} {z} +# CHECK-NEXT: 22 44 9.00 * vpconflictq (%rax){1to8}, %zmm19 {%k1} {z} +# CHECK-NEXT: 1 5 0.50 vplzcntd %zmm16, %zmm19 +# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax), %zmm19 +# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax){1to16}, %zmm19 +# CHECK-NEXT: 1 5 0.50 vplzcntd %zmm16, %zmm19 {%k1} +# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax), %zmm19 {%k1} +# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax){1to16}, %zmm19 {%k1} +# CHECK-NEXT: 1 5 0.50 vplzcntd %zmm16, %zmm19 {%k1} {z} +# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax), %zmm19 {%k1} {z} +# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax){1to16}, %zmm19 {%k1} {z} +# CHECK-NEXT: 1 5 0.50 vplzcntq %zmm16, %zmm19 +# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax), %zmm19 +# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax){1to8}, %zmm19 +# CHECK-NEXT: 1 5 0.50 vplzcntq %zmm16, %zmm19 {%k1} +# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax), %zmm19 {%k1} +# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax){1to8}, %zmm19 {%k1} +# CHECK-NEXT: 1 5 0.50 vplzcntq %zmm16, %zmm19 {%k1} {z} +# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax), %zmm19 {%k1} {z} +# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax){1to8}, %zmm19 {%k1} {z} + +# CHECK: Resources: +# CHECK-NEXT: [0] - ICXDivider +# CHECK-NEXT: [1] - ICXFPDivider +# CHECK-NEXT: [2] - ICXPort0 +# CHECK-NEXT: [3] - ICXPort1 +# CHECK-NEXT: [4] - ICXPort2 +# CHECK-NEXT: [5] - ICXPort3 +# CHECK-NEXT: [6] - ICXPort4 +# CHECK-NEXT: [7] - ICXPort5 +# CHECK-NEXT: [8] - ICXPort6 +# CHECK-NEXT: [9] - ICXPort7 +# CHECK-NEXT: [10] - ICXPort8 +# CHECK-NEXT: [11] - ICXPort9 + +# CHECK: Resource pressure per iteration: +# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] +# CHECK-NEXT: - - 126.00 117.00 12.00 12.00 - 281.00 - - - - + +# CHECK: Resource pressure by instruction: +# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] Instructions: +# CHECK-NEXT: - - - - - - - 1.00 - - - - vpbroadcastmb2q %k0, %zmm16 +# CHECK-NEXT: - - - - - - - 1.00 - - - - vpbroadcastmw2d %k0, %zmm16 +# CHECK-NEXT: - - 7.83 7.83 - - - 19.33 - - - - vpconflictd %zmm16, %zmm19 +# CHECK-NEXT: - - 7.83 7.83 0.50 0.50 - 19.33 - - - - vpconflictd (%rax), %zmm19 +# CHECK-NEXT: - - 7.83 7.83 0.50 0.50 - 19.33 - - - - vpconflictd (%rax){1to16}, %zmm19 +# CHECK-NEXT: - - 7.83 7.83 - - - 19.33 - - - - vpconflictd %zmm16, %zmm19 {%k1} +# CHECK-NEXT: - - 7.83 7.83 0.50 0.50 - 19.33 - - - - vpconflictd (%rax), %zmm19 {%k1} +# CHECK-NEXT: - - 7.83 7.83 0.50 0.50 - 19.33 - - - - vpconflictd (%rax){1to16}, %zmm19 {%k1} +# CHECK-NEXT: - - 7.83 7.83 - - - 19.33 - - - - vpconflictd %zmm16, %zmm19 {%k1} {z} +# CHECK-NEXT: - - 7.83 7.83 0.50 0.50 - 19.33 - - - - vpconflictd (%rax), %zmm19 {%k1} {z} +# CHECK-NEXT: - - 7.83 7.83 0.50 0.50 - 19.33 - - - - vpconflictd (%rax){1to16}, %zmm19 {%k1} {z} +# CHECK-NEXT: - - 5.17 5.17 - - - 10.67 - - - - vpconflictq %zmm16, %zmm19 +# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - - - vpconflictq (%rax), %zmm19 +# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - - - vpconflictq (%rax){1to8}, %zmm19 +# CHECK-NEXT: - - 5.17 5.17 - - - 10.67 - - - - vpconflictq %zmm16, %zmm19 {%k1} +# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - - - vpconflictq (%rax), %zmm19 {%k1} +# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - - - vpconflictq (%rax){1to8}, %zmm19 {%k1} +# CHECK-NEXT: - - 5.17 5.17 - - - 10.67 - - - - vpconflictq %zmm16, %zmm19 {%k1} {z} +# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - - - vpconflictq (%rax), %zmm19 {%k1} {z} +# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - - - vpconflictq (%rax){1to8}, %zmm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 - - - - 0.50 - - - - vplzcntd %zmm16, %zmm19 +# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - - - vplzcntd (%rax), %zmm19 +# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - - - vplzcntd (%rax){1to16}, %zmm19 +# CHECK-NEXT: - - 0.50 - - - - 0.50 - - - - vplzcntd %zmm16, %zmm19 {%k1} +# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - - - vplzcntd (%rax), %zmm19 {%k1} +# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - - - vplzcntd (%rax){1to16}, %zmm19 {%k1} +# CHECK-NEXT: - - 0.50 - - - - 0.50 - - - - vplzcntd %zmm16, %zmm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - - - vplzcntd (%rax), %zmm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - - - vplzcntd (%rax){1to16}, %zmm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 - - - - 0.50 - - - - vplzcntq %zmm16, %zmm19 +# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - - - vplzcntq (%rax), %zmm19 +# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - - - vplzcntq (%rax){1to8}, %zmm19 +# CHECK-NEXT: - - 0.50 - - - - 0.50 - - - - vplzcntq %zmm16, %zmm19 {%k1} +# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - - - vplzcntq (%rax), %zmm19 {%k1} +# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - - - vplzcntq (%rax){1to8}, %zmm19 {%k1} +# CHECK-NEXT: - - 0.50 - - - - 0.50 - - - - vplzcntq %zmm16, %zmm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - - - vplzcntq (%rax), %zmm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - - - vplzcntq (%rax){1to8}, %zmm19 {%k1} {z} diff --git a/llvm/test/tools/llvm-mca/X86/IceLakeServer/resources-avx512cdvl.s b/llvm/test/tools/llvm-mca/X86/IceLakeServer/resources-avx512cdvl.s new file mode 100644 index 0000000000000..77ef4b19fa9f4 --- /dev/null +++ b/llvm/test/tools/llvm-mca/X86/IceLakeServer/resources-avx512cdvl.s @@ -0,0 +1,271 @@ +# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py +# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=icelake-server -instruction-tables < %s | FileCheck %s + +vpbroadcastmb2q %k0, %xmm16 +vpbroadcastmb2q %k0, %ymm16 + +vpbroadcastmw2d %k0, %xmm16 +vpbroadcastmw2d %k0, %ymm16 + +vpconflictd %xmm16, %xmm19 +vpconflictd (%rax), %xmm19 +vpconflictd (%rax){1to4}, %xmm19 +vpconflictd %xmm16, %xmm19 {k1} +vpconflictd (%rax), %xmm19 {k1} +vpconflictd (%rax){1to4}, %xmm19 {k1} +vpconflictd %xmm16, %xmm19 {z}{k1} +vpconflictd (%rax), %xmm19 {z}{k1} +vpconflictd (%rax){1to4}, %xmm19 {z}{k1} + +vpconflictd %ymm16, %ymm19 +vpconflictd (%rax), %ymm19 +vpconflictd (%rax){1to8}, %ymm19 +vpconflictd %ymm16, %ymm19 {k1} +vpconflictd (%rax), %ymm19 {k1} +vpconflictd (%rax){1to8}, %ymm19 {k1} +vpconflictd %ymm16, %ymm19 {z}{k1} +vpconflictd (%rax), %ymm19 {z}{k1} +vpconflictd (%rax){1to8}, %ymm19 {z}{k1} + +vpconflictq %xmm16, %xmm19 +vpconflictq (%rax), %xmm19 +vpconflictq (%rax){1to2}, %xmm19 +vpconflictq %xmm16, %xmm19 {k1} +vpconflictq (%rax), %xmm19 {k1} +vpconflictq (%rax){1to2}, %xmm19 {k1} +vpconflictq %xmm16, %xmm19 {z}{k1} +vpconflictq (%rax), %xmm19 {z}{k1} +vpconflictq (%rax){1to2}, %xmm19 {z}{k1} + +vpconflictq %ymm16, %ymm19 +vpconflictq (%rax), %ymm19 +vpconflictq (%rax){1to4}, %ymm19 +vpconflictq %ymm16, %ymm19 {k1} +vpconflictq (%rax), %ymm19 {k1} +vpconflictq (%rax){1to4}, %ymm19 {k1} +vpconflictq %ymm16, %ymm19 {z}{k1} +vpconflictq (%rax), %ymm19 {z}{k1} +vpconflictq (%rax){1to4}, %ymm19 {z}{k1} + +vplzcntd %xmm16, %xmm19 +vplzcntd (%rax), %xmm19 +vplzcntd (%rax){1to4}, %xmm19 +vplzcntd %xmm16, %xmm19 {k1} +vplzcntd (%rax), %xmm19 {k1} +vplzcntd (%rax){1to4}, %xmm19 {k1} +vplzcntd %xmm16, %xmm19 {z}{k1} +vplzcntd (%rax), %xmm19 {z}{k1} +vplzcntd (%rax){1to4}, %xmm19 {z}{k1} + +vplzcntd %ymm16, %ymm19 +vplzcntd (%rax), %ymm19 +vplzcntd (%rax){1to8}, %ymm19 +vplzcntd %ymm16, %ymm19 {k1} +vplzcntd (%rax), %ymm19 {k1} +vplzcntd (%rax){1to8}, %ymm19 {k1} +vplzcntd %ymm16, %ymm19 {z}{k1} +vplzcntd (%rax), %ymm19 {z}{k1} +vplzcntd (%rax){1to8}, %ymm19 {z}{k1} + +vplzcntq %xmm16, %xmm19 +vplzcntq (%rax), %xmm19 +vplzcntq (%rax){1to2}, %xmm19 +vplzcntq %xmm16, %xmm19 {k1} +vplzcntq (%rax), %xmm19 {k1} +vplzcntq (%rax){1to2}, %xmm19 {k1} +vplzcntq %xmm16, %xmm19 {z}{k1} +vplzcntq (%rax), %xmm19 {z}{k1} +vplzcntq (%rax){1to2}, %xmm19 {z}{k1} + +vplzcntq %ymm16, %ymm19 +vplzcntq (%rax), %ymm19 +vplzcntq (%rax){1to4}, %ymm19 +vplzcntq %ymm16, %ymm19 {k1} +vplzcntq (%rax), %ymm19 {k1} +vplzcntq (%rax){1to4}, %ymm19 {k1} +vplzcntq %ymm16, %ymm19 {z}{k1} +vplzcntq (%rax), %ymm19 {z}{k1} +vplzcntq (%rax){1to4}, %ymm19 {z}{k1} + +# CHECK: Instruction Info: +# CHECK-NEXT: [1]: #uOps +# CHECK-NEXT: [2]: Latency +# CHECK-NEXT: [3]: RThroughput +# CHECK-NEXT: [4]: MayLoad +# CHECK-NEXT: [5]: MayStore +# CHECK-NEXT: [6]: HasSideEffects (U) + +# CHECK: [1] [2] [3] [4] [5] [6] Instructions: +# CHECK-NEXT: 1 1 1.00 vpbroadcastmb2q %k0, %xmm16 +# CHECK-NEXT: 1 1 1.00 vpbroadcastmb2q %k0, %ymm16 +# CHECK-NEXT: 1 1 1.00 vpbroadcastmw2d %k0, %xmm16 +# CHECK-NEXT: 1 1 1.00 vpbroadcastmw2d %k0, %ymm16 +# CHECK-NEXT: 14 22 5.00 vpconflictd %xmm16, %xmm19 +# CHECK-NEXT: 8 15 2.33 * vpconflictd (%rax), %xmm19 +# CHECK-NEXT: 8 15 2.33 * vpconflictd (%rax){1to4}, %xmm19 +# CHECK-NEXT: 14 22 5.00 vpconflictd %xmm16, %xmm19 {%k1} +# CHECK-NEXT: 8 15 2.33 * vpconflictd (%rax), %xmm19 {%k1} +# CHECK-NEXT: 8 15 2.33 * vpconflictd (%rax){1to4}, %xmm19 {%k1} +# CHECK-NEXT: 14 22 5.00 vpconflictd %xmm16, %xmm19 {%k1} {z} +# CHECK-NEXT: 8 15 2.33 * vpconflictd (%rax), %xmm19 {%k1} {z} +# CHECK-NEXT: 8 15 2.33 * vpconflictd (%rax){1to4}, %xmm19 {%k1} {z} +# CHECK-NEXT: 21 37 9.00 vpconflictd %ymm16, %ymm19 +# CHECK-NEXT: 22 44 9.00 * vpconflictd (%rax), %ymm19 +# CHECK-NEXT: 22 44 9.00 * vpconflictd (%rax){1to8}, %ymm19 +# CHECK-NEXT: 21 37 9.00 vpconflictd %ymm16, %ymm19 {%k1} +# CHECK-NEXT: 22 44 9.00 * vpconflictd (%rax), %ymm19 {%k1} +# CHECK-NEXT: 22 44 9.00 * vpconflictd (%rax){1to8}, %ymm19 {%k1} +# CHECK-NEXT: 21 37 9.00 vpconflictd %ymm16, %ymm19 {%k1} {z} +# CHECK-NEXT: 22 44 9.00 * vpconflictd (%rax), %ymm19 {%k1} {z} +# CHECK-NEXT: 22 44 9.00 * vpconflictd (%rax){1to8}, %ymm19 {%k1} {z} +# CHECK-NEXT: 3 5 2.00 vpconflictq %xmm16, %xmm19 +# CHECK-NEXT: 4 11 2.00 * vpconflictq (%rax), %xmm19 +# CHECK-NEXT: 4 11 2.00 * vpconflictq (%rax){1to2}, %xmm19 +# CHECK-NEXT: 3 5 2.00 vpconflictq %xmm16, %xmm19 {%k1} +# CHECK-NEXT: 4 11 2.00 * vpconflictq (%rax), %xmm19 {%k1} +# CHECK-NEXT: 4 11 2.00 * vpconflictq (%rax){1to2}, %xmm19 {%k1} +# CHECK-NEXT: 3 5 2.00 vpconflictq %xmm16, %xmm19 {%k1} {z} +# CHECK-NEXT: 4 11 2.00 * vpconflictq (%rax), %xmm19 {%k1} {z} +# CHECK-NEXT: 4 11 2.00 * vpconflictq (%rax){1to2}, %xmm19 {%k1} {z} +# CHECK-NEXT: 14 22 5.00 vpconflictq %ymm16, %ymm19 +# CHECK-NEXT: 15 29 5.00 * vpconflictq (%rax), %ymm19 +# CHECK-NEXT: 15 29 5.00 * vpconflictq (%rax){1to4}, %ymm19 +# CHECK-NEXT: 14 22 5.00 vpconflictq %ymm16, %ymm19 {%k1} +# CHECK-NEXT: 15 29 5.00 * vpconflictq (%rax), %ymm19 {%k1} +# CHECK-NEXT: 15 29 5.00 * vpconflictq (%rax){1to4}, %ymm19 {%k1} +# CHECK-NEXT: 14 22 5.00 vpconflictq %ymm16, %ymm19 {%k1} {z} +# CHECK-NEXT: 15 29 5.00 * vpconflictq (%rax), %ymm19 {%k1} {z} +# CHECK-NEXT: 15 29 5.00 * vpconflictq (%rax){1to4}, %ymm19 {%k1} {z} +# CHECK-NEXT: 1 5 0.50 vplzcntd %xmm16, %xmm19 +# CHECK-NEXT: 2 11 0.50 * vplzcntd (%rax), %xmm19 +# CHECK-NEXT: 2 11 0.50 * vplzcntd (%rax){1to4}, %xmm19 +# CHECK-NEXT: 1 5 0.50 vplzcntd %xmm16, %xmm19 {%k1} +# CHECK-NEXT: 2 11 0.50 * vplzcntd (%rax), %xmm19 {%k1} +# CHECK-NEXT: 2 11 0.50 * vplzcntd (%rax){1to4}, %xmm19 {%k1} +# CHECK-NEXT: 1 5 0.50 vplzcntd %xmm16, %xmm19 {%k1} {z} +# CHECK-NEXT: 2 11 0.50 * vplzcntd (%rax), %xmm19 {%k1} {z} +# CHECK-NEXT: 2 11 0.50 * vplzcntd (%rax){1to4}, %xmm19 {%k1} {z} +# CHECK-NEXT: 1 5 0.50 vplzcntd %ymm16, %ymm19 +# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax), %ymm19 +# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax){1to8}, %ymm19 +# CHECK-NEXT: 1 5 0.50 vplzcntd %ymm16, %ymm19 {%k1} +# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax), %ymm19 {%k1} +# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax){1to8}, %ymm19 {%k1} +# CHECK-NEXT: 1 5 0.50 vplzcntd %ymm16, %ymm19 {%k1} {z} +# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax), %ymm19 {%k1} {z} +# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax){1to8}, %ymm19 {%k1} {z} +# CHECK-NEXT: 1 5 0.50 vplzcntq %xmm16, %xmm19 +# CHECK-NEXT: 2 11 0.50 * vplzcntq (%rax), %xmm19 +# CHECK-NEXT: 2 11 0.50 * vplzcntq (%rax){1to2}, %xmm19 +# CHECK-NEXT: 1 5 0.50 vplzcntq %xmm16, %xmm19 {%k1} +# CHECK-NEXT: 2 11 0.50 * vplzcntq (%rax), %xmm19 {%k1} +# CHECK-NEXT: 2 11 0.50 * vplzcntq (%rax){1to2}, %xmm19 {%k1} +# CHECK-NEXT: 1 5 0.50 vplzcntq %xmm16, %xmm19 {%k1} {z} +# CHECK-NEXT: 2 11 0.50 * vplzcntq (%rax), %xmm19 {%k1} {z} +# CHECK-NEXT: 2 11 0.50 * vplzcntq (%rax){1to2}, %xmm19 {%k1} {z} +# CHECK-NEXT: 1 5 0.50 vplzcntq %ymm16, %ymm19 +# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax), %ymm19 +# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax){1to4}, %ymm19 +# CHECK-NEXT: 1 5 0.50 vplzcntq %ymm16, %ymm19 {%k1} +# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax), %ymm19 {%k1} +# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax){1to4}, %ymm19 {%k1} +# CHECK-NEXT: 1 5 0.50 vplzcntq %ymm16, %ymm19 {%k1} {z} +# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax), %ymm19 {%k1} {z} +# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax){1to4}, %ymm19 {%k1} {z} + +# CHECK: Resources: +# CHECK-NEXT: [0] - ICXDivider +# CHECK-NEXT: [1] - ICXFPDivider +# CHECK-NEXT: [2] - ICXPort0 +# CHECK-NEXT: [3] - ICXPort1 +# CHECK-NEXT: [4] - ICXPort2 +# CHECK-NEXT: [5] - ICXPort3 +# CHECK-NEXT: [6] - ICXPort4 +# CHECK-NEXT: [7] - ICXPort5 +# CHECK-NEXT: [8] - ICXPort6 +# CHECK-NEXT: [9] - ICXPort7 +# CHECK-NEXT: [10] - ICXPort8 +# CHECK-NEXT: [11] - ICXPort9 + +# CHECK: Resource pressure per iteration: +# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] +# CHECK-NEXT: - - 123.50 129.50 24.00 24.00 - 213.00 - - - - + +# CHECK: Resource pressure by instruction: +# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] Instructions: +# CHECK-NEXT: - - - - - - - 1.00 - - - - vpbroadcastmb2q %k0, %xmm16 +# CHECK-NEXT: - - - - - - - 1.00 - - - - vpbroadcastmb2q %k0, %ymm16 +# CHECK-NEXT: - - - - - - - 1.00 - - - - vpbroadcastmw2d %k0, %xmm16 +# CHECK-NEXT: - - - - - - - 1.00 - - - - vpbroadcastmw2d %k0, %ymm16 +# CHECK-NEXT: - - 3.83 3.83 - - - 6.33 - - - - vpconflictd %xmm16, %xmm19 +# CHECK-NEXT: - - 1.67 2.67 0.50 0.50 - 2.67 - - - - vpconflictd (%rax), %xmm19 +# CHECK-NEXT: - - 1.67 2.67 0.50 0.50 - 2.67 - - - - vpconflictd (%rax){1to4}, %xmm19 +# CHECK-NEXT: - - 3.83 3.83 - - - 6.33 - - - - vpconflictd %xmm16, %xmm19 {%k1} +# CHECK-NEXT: - - 1.67 2.67 0.50 0.50 - 2.67 - - - - vpconflictd (%rax), %xmm19 {%k1} +# CHECK-NEXT: - - 1.67 2.67 0.50 0.50 - 2.67 - - - - vpconflictd (%rax){1to4}, %xmm19 {%k1} +# CHECK-NEXT: - - 3.83 3.83 - - - 6.33 - - - - vpconflictd %xmm16, %xmm19 {%k1} {z} +# CHECK-NEXT: - - 1.67 2.67 0.50 0.50 - 2.67 - - - - vpconflictd (%rax), %xmm19 {%k1} {z} +# CHECK-NEXT: - - 1.67 2.67 0.50 0.50 - 2.67 - - - - vpconflictd (%rax){1to4}, %xmm19 {%k1} {z} +# CHECK-NEXT: - - 5.17 5.17 - - - 10.67 - - - - vpconflictd %ymm16, %ymm19 +# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - - - vpconflictd (%rax), %ymm19 +# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - - - vpconflictd (%rax){1to8}, %ymm19 +# CHECK-NEXT: - - 5.17 5.17 - - - 10.67 - - - - vpconflictd %ymm16, %ymm19 {%k1} +# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - - - vpconflictd (%rax), %ymm19 {%k1} +# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - - - vpconflictd (%rax){1to8}, %ymm19 {%k1} +# CHECK-NEXT: - - 5.17 5.17 - - - 10.67 - - - - vpconflictd %ymm16, %ymm19 {%k1} {z} +# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - - - vpconflictd (%rax), %ymm19 {%k1} {z} +# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - - - vpconflictd (%rax){1to8}, %ymm19 {%k1} {z} +# CHECK-NEXT: - - 0.33 0.33 - - - 2.33 - - - - vpconflictq %xmm16, %xmm19 +# CHECK-NEXT: - - 0.33 0.33 0.50 0.50 - 2.33 - - - - vpconflictq (%rax), %xmm19 +# CHECK-NEXT: - - 0.33 0.33 0.50 0.50 - 2.33 - - - - vpconflictq (%rax){1to2}, %xmm19 +# CHECK-NEXT: - - 0.33 0.33 - - - 2.33 - - - - vpconflictq %xmm16, %xmm19 {%k1} +# CHECK-NEXT: - - 0.33 0.33 0.50 0.50 - 2.33 - - - - vpconflictq (%rax), %xmm19 {%k1} +# CHECK-NEXT: - - 0.33 0.33 0.50 0.50 - 2.33 - - - - vpconflictq (%rax){1to2}, %xmm19 {%k1} +# CHECK-NEXT: - - 0.33 0.33 - - - 2.33 - - - - vpconflictq %xmm16, %xmm19 {%k1} {z} +# CHECK-NEXT: - - 0.33 0.33 0.50 0.50 - 2.33 - - - - vpconflictq (%rax), %xmm19 {%k1} {z} +# CHECK-NEXT: - - 0.33 0.33 0.50 0.50 - 2.33 - - - - vpconflictq (%rax){1to2}, %xmm19 {%k1} {z} +# CHECK-NEXT: - - 3.83 3.83 - - - 6.33 - - - - vpconflictq %ymm16, %ymm19 +# CHECK-NEXT: - - 3.83 3.83 0.50 0.50 - 6.33 - - - - vpconflictq (%rax), %ymm19 +# CHECK-NEXT: - - 3.83 3.83 0.50 0.50 - 6.33 - - - - vpconflictq (%rax){1to4}, %ymm19 +# CHECK-NEXT: - - 3.83 3.83 - - - 6.33 - - - - vpconflictq %ymm16, %ymm19 {%k1} +# CHECK-NEXT: - - 3.83 3.83 0.50 0.50 - 6.33 - - - - vpconflictq (%rax), %ymm19 {%k1} +# CHECK-NEXT: - - 3.83 3.83 0.50 0.50 - 6.33 - - - - vpconflictq (%rax){1to4}, %ymm19 {%k1} +# CHECK-NEXT: - - 3.83 3.83 - - - 6.33 - - - - vpconflictq %ymm16, %ymm19 {%k1} {z} +# CHECK-NEXT: - - 3.83 3.83 0.50 0.50 - 6.33 - - - - vpconflictq (%rax), %ymm19 {%k1} {z} +# CHECK-NEXT: - - 3.83 3.83 0.50 0.50 - 6.33 - - - - vpconflictq (%rax){1to4}, %ymm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vplzcntd %xmm16, %xmm19 +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vplzcntd (%rax), %xmm19 +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vplzcntd (%rax){1to4}, %xmm19 +# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vplzcntd %xmm16, %xmm19 {%k1} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vplzcntd (%rax), %xmm19 {%k1} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vplzcntd (%rax){1to4}, %xmm19 {%k1} +# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vplzcntd %xmm16, %xmm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vplzcntd (%rax), %xmm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vplzcntd (%rax){1to4}, %xmm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vplzcntd %ymm16, %ymm19 +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vplzcntd (%rax), %ymm19 +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vplzcntd (%rax){1to8}, %ymm19 +# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vplzcntd %ymm16, %ymm19 {%k1} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vplzcntd (%rax), %ymm19 {%k1} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vplzcntd (%rax){1to8}, %ymm19 {%k1} +# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vplzcntd %ymm16, %ymm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vplzcntd (%rax), %ymm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vplzcntd (%rax){1to8}, %ymm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vplzcntq %xmm16, %xmm19 +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vplzcntq (%rax), %xmm19 +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vplzcntq (%rax){1to2}, %xmm19 +# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vplzcntq %xmm16, %xmm19 {%k1} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vplzcntq (%rax), %xmm19 {%k1} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vplzcntq (%rax){1to2}, %xmm19 {%k1} +# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vplzcntq %xmm16, %xmm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vplzcntq (%rax), %xmm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vplzcntq (%rax){1to2}, %xmm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vplzcntq %ymm16, %ymm19 +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vplzcntq (%rax), %ymm19 +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vplzcntq (%rax){1to4}, %ymm19 +# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vplzcntq %ymm16, %ymm19 {%k1} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vplzcntq (%rax), %ymm19 {%k1} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vplzcntq (%rax){1to4}, %ymm19 {%k1} +# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vplzcntq %ymm16, %ymm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vplzcntq (%rax), %ymm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vplzcntq (%rax){1to4}, %ymm19 {%k1} {z} diff --git a/llvm/test/tools/llvm-mca/X86/SkylakeServer/resources-avx512cd.s b/llvm/test/tools/llvm-mca/X86/SkylakeServer/resources-avx512cd.s new file mode 100644 index 0000000000000..3ab21932d1391 --- /dev/null +++ b/llvm/test/tools/llvm-mca/X86/SkylakeServer/resources-avx512cd.s @@ -0,0 +1,151 @@ +# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py +# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=skylake-avx512 -instruction-tables < %s | FileCheck %s + +vpbroadcastmb2q %k0, %zmm16 + +vpbroadcastmw2d %k0, %zmm16 + +vpconflictd %zmm16, %zmm19 +vpconflictd (%rax), %zmm19 +vpconflictd (%rax){1to16}, %zmm19 +vpconflictd %zmm16, %zmm19 {k1} +vpconflictd (%rax), %zmm19 {k1} +vpconflictd (%rax){1to16}, %zmm19 {k1} +vpconflictd %zmm16, %zmm19 {z}{k1} +vpconflictd (%rax), %zmm19 {z}{k1} +vpconflictd (%rax){1to16}, %zmm19 {z}{k1} + +vpconflictq %zmm16, %zmm19 +vpconflictq (%rax), %zmm19 +vpconflictq (%rax){1to8}, %zmm19 +vpconflictq %zmm16, %zmm19 {k1} +vpconflictq (%rax), %zmm19 {k1} +vpconflictq (%rax){1to8}, %zmm19 {k1} +vpconflictq %zmm16, %zmm19 {z}{k1} +vpconflictq (%rax), %zmm19 {z}{k1} +vpconflictq (%rax){1to8}, %zmm19 {z}{k1} + +vplzcntd %zmm16, %zmm19 +vplzcntd (%rax), %zmm19 +vplzcntd (%rax){1to16}, %zmm19 +vplzcntd %zmm16, %zmm19 {k1} +vplzcntd (%rax), %zmm19 {k1} +vplzcntd (%rax){1to16}, %zmm19 {k1} +vplzcntd %zmm16, %zmm19 {z}{k1} +vplzcntd (%rax), %zmm19 {z}{k1} +vplzcntd (%rax){1to16}, %zmm19 {z}{k1} + +vplzcntq %zmm16, %zmm19 +vplzcntq (%rax), %zmm19 +vplzcntq (%rax){1to8}, %zmm19 +vplzcntq %zmm16, %zmm19 {k1} +vplzcntq (%rax), %zmm19 {k1} +vplzcntq (%rax){1to8}, %zmm19 {k1} +vplzcntq %zmm16, %zmm19 {z}{k1} +vplzcntq (%rax), %zmm19 {z}{k1} +vplzcntq (%rax){1to8}, %zmm19 {z}{k1} + +# CHECK: Instruction Info: +# CHECK-NEXT: [1]: #uOps +# CHECK-NEXT: [2]: Latency +# CHECK-NEXT: [3]: RThroughput +# CHECK-NEXT: [4]: MayLoad +# CHECK-NEXT: [5]: MayStore +# CHECK-NEXT: [6]: HasSideEffects (U) + +# CHECK: [1] [2] [3] [4] [5] [6] Instructions: +# CHECK-NEXT: 1 1 1.00 vpbroadcastmb2q %k0, %zmm16 +# CHECK-NEXT: 1 1 1.00 vpbroadcastmw2d %k0, %zmm16 +# CHECK-NEXT: 35 67 17.00 vpconflictd %zmm16, %zmm19 +# CHECK-NEXT: 36 74 17.00 * vpconflictd (%rax), %zmm19 +# CHECK-NEXT: 36 74 17.00 * vpconflictd (%rax){1to16}, %zmm19 +# CHECK-NEXT: 35 67 17.00 vpconflictd %zmm16, %zmm19 {%k1} +# CHECK-NEXT: 36 74 17.00 * vpconflictd (%rax), %zmm19 {%k1} +# CHECK-NEXT: 36 74 17.00 * vpconflictd (%rax){1to16}, %zmm19 {%k1} +# CHECK-NEXT: 35 67 17.00 vpconflictd %zmm16, %zmm19 {%k1} {z} +# CHECK-NEXT: 36 74 17.00 * vpconflictd (%rax), %zmm19 {%k1} {z} +# CHECK-NEXT: 36 74 17.00 * vpconflictd (%rax){1to16}, %zmm19 {%k1} {z} +# CHECK-NEXT: 21 37 9.00 vpconflictq %zmm16, %zmm19 +# CHECK-NEXT: 22 44 9.00 * vpconflictq (%rax), %zmm19 +# CHECK-NEXT: 22 44 9.00 * vpconflictq (%rax){1to8}, %zmm19 +# CHECK-NEXT: 21 37 9.00 vpconflictq %zmm16, %zmm19 {%k1} +# CHECK-NEXT: 22 44 9.00 * vpconflictq (%rax), %zmm19 {%k1} +# CHECK-NEXT: 22 44 9.00 * vpconflictq (%rax){1to8}, %zmm19 {%k1} +# CHECK-NEXT: 21 37 9.00 vpconflictq %zmm16, %zmm19 {%k1} {z} +# CHECK-NEXT: 22 44 9.00 * vpconflictq (%rax), %zmm19 {%k1} {z} +# CHECK-NEXT: 22 44 9.00 * vpconflictq (%rax){1to8}, %zmm19 {%k1} {z} +# CHECK-NEXT: 1 5 0.50 vplzcntd %zmm16, %zmm19 +# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax), %zmm19 +# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax){1to16}, %zmm19 +# CHECK-NEXT: 1 5 0.50 vplzcntd %zmm16, %zmm19 {%k1} +# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax), %zmm19 {%k1} +# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax){1to16}, %zmm19 {%k1} +# CHECK-NEXT: 1 5 0.50 vplzcntd %zmm16, %zmm19 {%k1} {z} +# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax), %zmm19 {%k1} {z} +# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax){1to16}, %zmm19 {%k1} {z} +# CHECK-NEXT: 1 5 0.50 vplzcntq %zmm16, %zmm19 +# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax), %zmm19 +# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax){1to8}, %zmm19 +# CHECK-NEXT: 1 5 0.50 vplzcntq %zmm16, %zmm19 {%k1} +# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax), %zmm19 {%k1} +# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax){1to8}, %zmm19 {%k1} +# CHECK-NEXT: 1 5 0.50 vplzcntq %zmm16, %zmm19 {%k1} {z} +# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax), %zmm19 {%k1} {z} +# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax){1to8}, %zmm19 {%k1} {z} + +# CHECK: Resources: +# CHECK-NEXT: [0] - SKXDivider +# CHECK-NEXT: [1] - SKXFPDivider +# CHECK-NEXT: [2] - SKXPort0 +# CHECK-NEXT: [3] - SKXPort1 +# CHECK-NEXT: [4] - SKXPort2 +# CHECK-NEXT: [5] - SKXPort3 +# CHECK-NEXT: [6] - SKXPort4 +# CHECK-NEXT: [7] - SKXPort5 +# CHECK-NEXT: [8] - SKXPort6 +# CHECK-NEXT: [9] - SKXPort7 + +# CHECK: Resource pressure per iteration: +# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] +# CHECK-NEXT: - - 126.00 117.00 12.00 12.00 - 281.00 - - + +# CHECK: Resource pressure by instruction: +# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] Instructions: +# CHECK-NEXT: - - - - - - - 1.00 - - vpbroadcastmb2q %k0, %zmm16 +# CHECK-NEXT: - - - - - - - 1.00 - - vpbroadcastmw2d %k0, %zmm16 +# CHECK-NEXT: - - 7.83 7.83 - - - 19.33 - - vpconflictd %zmm16, %zmm19 +# CHECK-NEXT: - - 7.83 7.83 0.50 0.50 - 19.33 - - vpconflictd (%rax), %zmm19 +# CHECK-NEXT: - - 7.83 7.83 0.50 0.50 - 19.33 - - vpconflictd (%rax){1to16}, %zmm19 +# CHECK-NEXT: - - 7.83 7.83 - - - 19.33 - - vpconflictd %zmm16, %zmm19 {%k1} +# CHECK-NEXT: - - 7.83 7.83 0.50 0.50 - 19.33 - - vpconflictd (%rax), %zmm19 {%k1} +# CHECK-NEXT: - - 7.83 7.83 0.50 0.50 - 19.33 - - vpconflictd (%rax){1to16}, %zmm19 {%k1} +# CHECK-NEXT: - - 7.83 7.83 - - - 19.33 - - vpconflictd %zmm16, %zmm19 {%k1} {z} +# CHECK-NEXT: - - 7.83 7.83 0.50 0.50 - 19.33 - - vpconflictd (%rax), %zmm19 {%k1} {z} +# CHECK-NEXT: - - 7.83 7.83 0.50 0.50 - 19.33 - - vpconflictd (%rax){1to16}, %zmm19 {%k1} {z} +# CHECK-NEXT: - - 5.17 5.17 - - - 10.67 - - vpconflictq %zmm16, %zmm19 +# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - vpconflictq (%rax), %zmm19 +# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - vpconflictq (%rax){1to8}, %zmm19 +# CHECK-NEXT: - - 5.17 5.17 - - - 10.67 - - vpconflictq %zmm16, %zmm19 {%k1} +# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - vpconflictq (%rax), %zmm19 {%k1} +# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - vpconflictq (%rax){1to8}, %zmm19 {%k1} +# CHECK-NEXT: - - 5.17 5.17 - - - 10.67 - - vpconflictq %zmm16, %zmm19 {%k1} {z} +# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - vpconflictq (%rax), %zmm19 {%k1} {z} +# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - vpconflictq (%rax){1to8}, %zmm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 - - - - 0.50 - - vplzcntd %zmm16, %zmm19 +# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - vplzcntd (%rax), %zmm19 +# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - vplzcntd (%rax){1to16}, %zmm19 +# CHECK-NEXT: - - 0.50 - - - - 0.50 - - vplzcntd %zmm16, %zmm19 {%k1} +# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - vplzcntd (%rax), %zmm19 {%k1} +# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - vplzcntd (%rax){1to16}, %zmm19 {%k1} +# CHECK-NEXT: - - 0.50 - - - - 0.50 - - vplzcntd %zmm16, %zmm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - vplzcntd (%rax), %zmm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - vplzcntd (%rax){1to16}, %zmm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 - - - - 0.50 - - vplzcntq %zmm16, %zmm19 +# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - vplzcntq (%rax), %zmm19 +# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - vplzcntq (%rax){1to8}, %zmm19 +# CHECK-NEXT: - - 0.50 - - - - 0.50 - - vplzcntq %zmm16, %zmm19 {%k1} +# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - vplzcntq (%rax), %zmm19 {%k1} +# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - vplzcntq (%rax){1to8}, %zmm19 {%k1} +# CHECK-NEXT: - - 0.50 - - - - 0.50 - - vplzcntq %zmm16, %zmm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - vplzcntq (%rax), %zmm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - vplzcntq (%rax){1to8}, %zmm19 {%k1} {z} diff --git a/llvm/test/tools/llvm-mca/X86/SkylakeServer/resources-avx512cdvl.s b/llvm/test/tools/llvm-mca/X86/SkylakeServer/resources-avx512cdvl.s new file mode 100644 index 0000000000000..90e4c38583ccc --- /dev/null +++ b/llvm/test/tools/llvm-mca/X86/SkylakeServer/resources-avx512cdvl.s @@ -0,0 +1,269 @@ +# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py +# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=skylake-avx512 -instruction-tables < %s | FileCheck %s + +vpbroadcastmb2q %k0, %xmm16 +vpbroadcastmb2q %k0, %ymm16 + +vpbroadcastmw2d %k0, %xmm16 +vpbroadcastmw2d %k0, %ymm16 + +vpconflictd %xmm16, %xmm19 +vpconflictd (%rax), %xmm19 +vpconflictd (%rax){1to4}, %xmm19 +vpconflictd %xmm16, %xmm19 {k1} +vpconflictd (%rax), %xmm19 {k1} +vpconflictd (%rax){1to4}, %xmm19 {k1} +vpconflictd %xmm16, %xmm19 {z}{k1} +vpconflictd (%rax), %xmm19 {z}{k1} +vpconflictd (%rax){1to4}, %xmm19 {z}{k1} + +vpconflictd %ymm16, %ymm19 +vpconflictd (%rax), %ymm19 +vpconflictd (%rax){1to8}, %ymm19 +vpconflictd %ymm16, %ymm19 {k1} +vpconflictd (%rax), %ymm19 {k1} +vpconflictd (%rax){1to8}, %ymm19 {k1} +vpconflictd %ymm16, %ymm19 {z}{k1} +vpconflictd (%rax), %ymm19 {z}{k1} +vpconflictd (%rax){1to8}, %ymm19 {z}{k1} + +vpconflictq %xmm16, %xmm19 +vpconflictq (%rax), %xmm19 +vpconflictq (%rax){1to2}, %xmm19 +vpconflictq %xmm16, %xmm19 {k1} +vpconflictq (%rax), %xmm19 {k1} +vpconflictq (%rax){1to2}, %xmm19 {k1} +vpconflictq %xmm16, %xmm19 {z}{k1} +vpconflictq (%rax), %xmm19 {z}{k1} +vpconflictq (%rax){1to2}, %xmm19 {z}{k1} + +vpconflictq %ymm16, %ymm19 +vpconflictq (%rax), %ymm19 +vpconflictq (%rax){1to4}, %ymm19 +vpconflictq %ymm16, %ymm19 {k1} +vpconflictq (%rax), %ymm19 {k1} +vpconflictq (%rax){1to4}, %ymm19 {k1} +vpconflictq %ymm16, %ymm19 {z}{k1} +vpconflictq (%rax), %ymm19 {z}{k1} +vpconflictq (%rax){1to4}, %ymm19 {z}{k1} + +vplzcntd %xmm16, %xmm19 +vplzcntd (%rax), %xmm19 +vplzcntd (%rax){1to4}, %xmm19 +vplzcntd %xmm16, %xmm19 {k1} +vplzcntd (%rax), %xmm19 {k1} +vplzcntd (%rax){1to4}, %xmm19 {k1} +vplzcntd %xmm16, %xmm19 {z}{k1} +vplzcntd (%rax), %xmm19 {z}{k1} +vplzcntd (%rax){1to4}, %xmm19 {z}{k1} + +vplzcntd %ymm16, %ymm19 +vplzcntd (%rax), %ymm19 +vplzcntd (%rax){1to8}, %ymm19 +vplzcntd %ymm16, %ymm19 {k1} +vplzcntd (%rax), %ymm19 {k1} +vplzcntd (%rax){1to8}, %ymm19 {k1} +vplzcntd %ymm16, %ymm19 {z}{k1} +vplzcntd (%rax), %ymm19 {z}{k1} +vplzcntd (%rax){1to8}, %ymm19 {z}{k1} + +vplzcntq %xmm16, %xmm19 +vplzcntq (%rax), %xmm19 +vplzcntq (%rax){1to2}, %xmm19 +vplzcntq %xmm16, %xmm19 {k1} +vplzcntq (%rax), %xmm19 {k1} +vplzcntq (%rax){1to2}, %xmm19 {k1} +vplzcntq %xmm16, %xmm19 {z}{k1} +vplzcntq (%rax), %xmm19 {z}{k1} +vplzcntq (%rax){1to2}, %xmm19 {z}{k1} + +vplzcntq %ymm16, %ymm19 +vplzcntq (%rax), %ymm19 +vplzcntq (%rax){1to4}, %ymm19 +vplzcntq %ymm16, %ymm19 {k1} +vplzcntq (%rax), %ymm19 {k1} +vplzcntq (%rax){1to4}, %ymm19 {k1} +vplzcntq %ymm16, %ymm19 {z}{k1} +vplzcntq (%rax), %ymm19 {z}{k1} +vplzcntq (%rax){1to4}, %ymm19 {z}{k1} + +# CHECK: Instruction Info: +# CHECK-NEXT: [1]: #uOps +# CHECK-NEXT: [2]: Latency +# CHECK-NEXT: [3]: RThroughput +# CHECK-NEXT: [4]: MayLoad +# CHECK-NEXT: [5]: MayStore +# CHECK-NEXT: [6]: HasSideEffects (U) + +# CHECK: [1] [2] [3] [4] [5] [6] Instructions: +# CHECK-NEXT: 1 1 1.00 vpbroadcastmb2q %k0, %xmm16 +# CHECK-NEXT: 1 1 1.00 vpbroadcastmb2q %k0, %ymm16 +# CHECK-NEXT: 1 1 1.00 vpbroadcastmw2d %k0, %xmm16 +# CHECK-NEXT: 1 1 1.00 vpbroadcastmw2d %k0, %ymm16 +# CHECK-NEXT: 14 22 5.00 vpconflictd %xmm16, %xmm19 +# CHECK-NEXT: 8 15 2.33 * vpconflictd (%rax), %xmm19 +# CHECK-NEXT: 8 15 2.33 * vpconflictd (%rax){1to4}, %xmm19 +# CHECK-NEXT: 14 22 5.00 vpconflictd %xmm16, %xmm19 {%k1} +# CHECK-NEXT: 8 15 2.33 * vpconflictd (%rax), %xmm19 {%k1} +# CHECK-NEXT: 8 15 2.33 * vpconflictd (%rax){1to4}, %xmm19 {%k1} +# CHECK-NEXT: 14 22 5.00 vpconflictd %xmm16, %xmm19 {%k1} {z} +# CHECK-NEXT: 8 15 2.33 * vpconflictd (%rax), %xmm19 {%k1} {z} +# CHECK-NEXT: 8 15 2.33 * vpconflictd (%rax){1to4}, %xmm19 {%k1} {z} +# CHECK-NEXT: 21 37 9.00 vpconflictd %ymm16, %ymm19 +# CHECK-NEXT: 22 44 9.00 * vpconflictd (%rax), %ymm19 +# CHECK-NEXT: 22 44 9.00 * vpconflictd (%rax){1to8}, %ymm19 +# CHECK-NEXT: 21 37 9.00 vpconflictd %ymm16, %ymm19 {%k1} +# CHECK-NEXT: 22 44 9.00 * vpconflictd (%rax), %ymm19 {%k1} +# CHECK-NEXT: 22 44 9.00 * vpconflictd (%rax){1to8}, %ymm19 {%k1} +# CHECK-NEXT: 21 37 9.00 vpconflictd %ymm16, %ymm19 {%k1} {z} +# CHECK-NEXT: 22 44 9.00 * vpconflictd (%rax), %ymm19 {%k1} {z} +# CHECK-NEXT: 22 44 9.00 * vpconflictd (%rax){1to8}, %ymm19 {%k1} {z} +# CHECK-NEXT: 3 5 2.00 vpconflictq %xmm16, %xmm19 +# CHECK-NEXT: 4 11 2.00 * vpconflictq (%rax), %xmm19 +# CHECK-NEXT: 4 11 2.00 * vpconflictq (%rax){1to2}, %xmm19 +# CHECK-NEXT: 3 5 2.00 vpconflictq %xmm16, %xmm19 {%k1} +# CHECK-NEXT: 4 11 2.00 * vpconflictq (%rax), %xmm19 {%k1} +# CHECK-NEXT: 4 11 2.00 * vpconflictq (%rax){1to2}, %xmm19 {%k1} +# CHECK-NEXT: 3 5 2.00 vpconflictq %xmm16, %xmm19 {%k1} {z} +# CHECK-NEXT: 4 11 2.00 * vpconflictq (%rax), %xmm19 {%k1} {z} +# CHECK-NEXT: 4 11 2.00 * vpconflictq (%rax){1to2}, %xmm19 {%k1} {z} +# CHECK-NEXT: 14 22 5.00 vpconflictq %ymm16, %ymm19 +# CHECK-NEXT: 15 29 5.00 * vpconflictq (%rax), %ymm19 +# CHECK-NEXT: 15 29 5.00 * vpconflictq (%rax){1to4}, %ymm19 +# CHECK-NEXT: 14 22 5.00 vpconflictq %ymm16, %ymm19 {%k1} +# CHECK-NEXT: 15 29 5.00 * vpconflictq (%rax), %ymm19 {%k1} +# CHECK-NEXT: 15 29 5.00 * vpconflictq (%rax){1to4}, %ymm19 {%k1} +# CHECK-NEXT: 14 22 5.00 vpconflictq %ymm16, %ymm19 {%k1} {z} +# CHECK-NEXT: 15 29 5.00 * vpconflictq (%rax), %ymm19 {%k1} {z} +# CHECK-NEXT: 15 29 5.00 * vpconflictq (%rax){1to4}, %ymm19 {%k1} {z} +# CHECK-NEXT: 1 5 0.50 vplzcntd %xmm16, %xmm19 +# CHECK-NEXT: 2 11 0.50 * vplzcntd (%rax), %xmm19 +# CHECK-NEXT: 2 11 0.50 * vplzcntd (%rax){1to4}, %xmm19 +# CHECK-NEXT: 1 5 0.50 vplzcntd %xmm16, %xmm19 {%k1} +# CHECK-NEXT: 2 11 0.50 * vplzcntd (%rax), %xmm19 {%k1} +# CHECK-NEXT: 2 11 0.50 * vplzcntd (%rax){1to4}, %xmm19 {%k1} +# CHECK-NEXT: 1 5 0.50 vplzcntd %xmm16, %xmm19 {%k1} {z} +# CHECK-NEXT: 2 11 0.50 * vplzcntd (%rax), %xmm19 {%k1} {z} +# CHECK-NEXT: 2 11 0.50 * vplzcntd (%rax){1to4}, %xmm19 {%k1} {z} +# CHECK-NEXT: 1 5 0.50 vplzcntd %ymm16, %ymm19 +# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax), %ymm19 +# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax){1to8}, %ymm19 +# CHECK-NEXT: 1 5 0.50 vplzcntd %ymm16, %ymm19 {%k1} +# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax), %ymm19 {%k1} +# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax){1to8}, %ymm19 {%k1} +# CHECK-NEXT: 1 5 0.50 vplzcntd %ymm16, %ymm19 {%k1} {z} +# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax), %ymm19 {%k1} {z} +# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax){1to8}, %ymm19 {%k1} {z} +# CHECK-NEXT: 1 5 0.50 vplzcntq %xmm16, %xmm19 +# CHECK-NEXT: 2 11 0.50 * vplzcntq (%rax), %xmm19 +# CHECK-NEXT: 2 11 0.50 * vplzcntq (%rax){1to2}, %xmm19 +# CHECK-NEXT: 1 5 0.50 vplzcntq %xmm16, %xmm19 {%k1} +# CHECK-NEXT: 2 11 0.50 * vplzcntq (%rax), %xmm19 {%k1} +# CHECK-NEXT: 2 11 0.50 * vplzcntq (%rax){1to2}, %xmm19 {%k1} +# CHECK-NEXT: 1 5 0.50 vplzcntq %xmm16, %xmm19 {%k1} {z} +# CHECK-NEXT: 2 11 0.50 * vplzcntq (%rax), %xmm19 {%k1} {z} +# CHECK-NEXT: 2 11 0.50 * vplzcntq (%rax){1to2}, %xmm19 {%k1} {z} +# CHECK-NEXT: 1 5 0.50 vplzcntq %ymm16, %ymm19 +# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax), %ymm19 +# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax){1to4}, %ymm19 +# CHECK-NEXT: 1 5 0.50 vplzcntq %ymm16, %ymm19 {%k1} +# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax), %ymm19 {%k1} +# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax){1to4}, %ymm19 {%k1} +# CHECK-NEXT: 1 5 0.50 vplzcntq %ymm16, %ymm19 {%k1} {z} +# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax), %ymm19 {%k1} {z} +# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax){1to4}, %ymm19 {%k1} {z} + +# CHECK: Resources: +# CHECK-NEXT: [0] - SKXDivider +# CHECK-NEXT: [1] - SKXFPDivider +# CHECK-NEXT: [2] - SKXPort0 +# CHECK-NEXT: [3] - SKXPort1 +# CHECK-NEXT: [4] - SKXPort2 +# CHECK-NEXT: [5] - SKXPort3 +# CHECK-NEXT: [6] - SKXPort4 +# CHECK-NEXT: [7] - SKXPort5 +# CHECK-NEXT: [8] - SKXPort6 +# CHECK-NEXT: [9] - SKXPort7 + +# CHECK: Resource pressure per iteration: +# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] +# CHECK-NEXT: - - 123.50 129.50 24.00 24.00 - 213.00 - - + +# CHECK: Resource pressure by instruction: +# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] Instructions: +# CHECK-NEXT: - - - - - - - 1.00 - - vpbroadcastmb2q %k0, %xmm16 +# CHECK-NEXT: - - - - - - - 1.00 - - vpbroadcastmb2q %k0, %ymm16 +# CHECK-NEXT: - - - - - - - 1.00 - - vpbroadcastmw2d %k0, %xmm16 +# CHECK-NEXT: - - - - - - - 1.00 - - vpbroadcastmw2d %k0, %ymm16 +# CHECK-NEXT: - - 3.83 3.83 - - - 6.33 - - vpconflictd %xmm16, %xmm19 +# CHECK-NEXT: - - 1.67 2.67 0.50 0.50 - 2.67 - - vpconflictd (%rax), %xmm19 +# CHECK-NEXT: - - 1.67 2.67 0.50 0.50 - 2.67 - - vpconflictd (%rax){1to4}, %xmm19 +# CHECK-NEXT: - - 3.83 3.83 - - - 6.33 - - vpconflictd %xmm16, %xmm19 {%k1} +# CHECK-NEXT: - - 1.67 2.67 0.50 0.50 - 2.67 - - vpconflictd (%rax), %xmm19 {%k1} +# CHECK-NEXT: - - 1.67 2.67 0.50 0.50 - 2.67 - - vpconflictd (%rax){1to4}, %xmm19 {%k1} +# CHECK-NEXT: - - 3.83 3.83 - - - 6.33 - - vpconflictd %xmm16, %xmm19 {%k1} {z} +# CHECK-NEXT: - - 1.67 2.67 0.50 0.50 - 2.67 - - vpconflictd (%rax), %xmm19 {%k1} {z} +# CHECK-NEXT: - - 1.67 2.67 0.50 0.50 - 2.67 - - vpconflictd (%rax){1to4}, %xmm19 {%k1} {z} +# CHECK-NEXT: - - 5.17 5.17 - - - 10.67 - - vpconflictd %ymm16, %ymm19 +# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - vpconflictd (%rax), %ymm19 +# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - vpconflictd (%rax){1to8}, %ymm19 +# CHECK-NEXT: - - 5.17 5.17 - - - 10.67 - - vpconflictd %ymm16, %ymm19 {%k1} +# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - vpconflictd (%rax), %ymm19 {%k1} +# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - vpconflictd (%rax){1to8}, %ymm19 {%k1} +# CHECK-NEXT: - - 5.17 5.17 - - - 10.67 - - vpconflictd %ymm16, %ymm19 {%k1} {z} +# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - vpconflictd (%rax), %ymm19 {%k1} {z} +# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - vpconflictd (%rax){1to8}, %ymm19 {%k1} {z} +# CHECK-NEXT: - - 0.33 0.33 - - - 2.33 - - vpconflictq %xmm16, %xmm19 +# CHECK-NEXT: - - 0.33 0.33 0.50 0.50 - 2.33 - - vpconflictq (%rax), %xmm19 +# CHECK-NEXT: - - 0.33 0.33 0.50 0.50 - 2.33 - - vpconflictq (%rax){1to2}, %xmm19 +# CHECK-NEXT: - - 0.33 0.33 - - - 2.33 - - vpconflictq %xmm16, %xmm19 {%k1} +# CHECK-NEXT: - - 0.33 0.33 0.50 0.50 - 2.33 - - vpconflictq (%rax), %xmm19 {%k1} +# CHECK-NEXT: - - 0.33 0.33 0.50 0.50 - 2.33 - - vpconflictq (%rax){1to2}, %xmm19 {%k1} +# CHECK-NEXT: - - 0.33 0.33 - - - 2.33 - - vpconflictq %xmm16, %xmm19 {%k1} {z} +# CHECK-NEXT: - - 0.33 0.33 0.50 0.50 - 2.33 - - vpconflictq (%rax), %xmm19 {%k1} {z} +# CHECK-NEXT: - - 0.33 0.33 0.50 0.50 - 2.33 - - vpconflictq (%rax){1to2}, %xmm19 {%k1} {z} +# CHECK-NEXT: - - 3.83 3.83 - - - 6.33 - - vpconflictq %ymm16, %ymm19 +# CHECK-NEXT: - - 3.83 3.83 0.50 0.50 - 6.33 - - vpconflictq (%rax), %ymm19 +# CHECK-NEXT: - - 3.83 3.83 0.50 0.50 - 6.33 - - vpconflictq (%rax){1to4}, %ymm19 +# CHECK-NEXT: - - 3.83 3.83 - - - 6.33 - - vpconflictq %ymm16, %ymm19 {%k1} +# CHECK-NEXT: - - 3.83 3.83 0.50 0.50 - 6.33 - - vpconflictq (%rax), %ymm19 {%k1} +# CHECK-NEXT: - - 3.83 3.83 0.50 0.50 - 6.33 - - vpconflictq (%rax){1to4}, %ymm19 {%k1} +# CHECK-NEXT: - - 3.83 3.83 - - - 6.33 - - vpconflictq %ymm16, %ymm19 {%k1} {z} +# CHECK-NEXT: - - 3.83 3.83 0.50 0.50 - 6.33 - - vpconflictq (%rax), %ymm19 {%k1} {z} +# CHECK-NEXT: - - 3.83 3.83 0.50 0.50 - 6.33 - - vpconflictq (%rax){1to4}, %ymm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 0.50 - - - - - - vplzcntd %xmm16, %xmm19 +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - vplzcntd (%rax), %xmm19 +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - vplzcntd (%rax){1to4}, %xmm19 +# CHECK-NEXT: - - 0.50 0.50 - - - - - - vplzcntd %xmm16, %xmm19 {%k1} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - vplzcntd (%rax), %xmm19 {%k1} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - vplzcntd (%rax){1to4}, %xmm19 {%k1} +# CHECK-NEXT: - - 0.50 0.50 - - - - - - vplzcntd %xmm16, %xmm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - vplzcntd (%rax), %xmm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - vplzcntd (%rax){1to4}, %xmm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 0.50 - - - - - - vplzcntd %ymm16, %ymm19 +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - vplzcntd (%rax), %ymm19 +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - vplzcntd (%rax){1to8}, %ymm19 +# CHECK-NEXT: - - 0.50 0.50 - - - - - - vplzcntd %ymm16, %ymm19 {%k1} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - vplzcntd (%rax), %ymm19 {%k1} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - vplzcntd (%rax){1to8}, %ymm19 {%k1} +# CHECK-NEXT: - - 0.50 0.50 - - - - - - vplzcntd %ymm16, %ymm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - vplzcntd (%rax), %ymm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - vplzcntd (%rax){1to8}, %ymm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 0.50 - - - - - - vplzcntq %xmm16, %xmm19 +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - vplzcntq (%rax), %xmm19 +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - vplzcntq (%rax){1to2}, %xmm19 +# CHECK-NEXT: - - 0.50 0.50 - - - - - - vplzcntq %xmm16, %xmm19 {%k1} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - vplzcntq (%rax), %xmm19 {%k1} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - vplzcntq (%rax){1to2}, %xmm19 {%k1} +# CHECK-NEXT: - - 0.50 0.50 - - - - - - vplzcntq %xmm16, %xmm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - vplzcntq (%rax), %xmm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - vplzcntq (%rax){1to2}, %xmm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 0.50 - - - - - - vplzcntq %ymm16, %ymm19 +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - vplzcntq (%rax), %ymm19 +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - vplzcntq (%rax){1to4}, %ymm19 +# CHECK-NEXT: - - 0.50 0.50 - - - - - - vplzcntq %ymm16, %ymm19 {%k1} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - vplzcntq (%rax), %ymm19 {%k1} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - vplzcntq (%rax){1to4}, %ymm19 {%k1} +# CHECK-NEXT: - - 0.50 0.50 - - - - - - vplzcntq %ymm16, %ymm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - vplzcntq (%rax), %ymm19 {%k1} {z} +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - vplzcntq (%rax){1to4}, %ymm19 {%k1} {z}