| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,129 @@ | ||
| # NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py | ||
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver4 -instruction-tables < %s | FileCheck %s | ||
|
|
||
| vpermb %zmm16, %zmm17, %zmm19 | ||
| vpermb (%rax), %zmm17, %zmm19 | ||
| vpermb %zmm16, %zmm17, %zmm19 {k1} | ||
| vpermb (%rax), %zmm17, %zmm19 {k1} | ||
| vpermb %zmm16, %zmm17, %zmm19 {k1}{z} | ||
| vpermb (%rax), %zmm17, %zmm19 {k1}{z} | ||
|
|
||
| vpermi2b %zmm16, %zmm17, %zmm19 | ||
| vpermi2b (%rax), %zmm17, %zmm19 | ||
| vpermi2b %zmm16, %zmm17, %zmm19 {k1} | ||
| vpermi2b (%rax), %zmm17, %zmm19 {k1} | ||
| vpermi2b %zmm16, %zmm17, %zmm19 {k1}{z} | ||
| vpermi2b (%rax), %zmm17, %zmm19 {k1}{z} | ||
|
|
||
| vpermt2b %zmm16, %zmm17, %zmm19 | ||
| vpermt2b (%rax), %zmm17, %zmm19 | ||
| vpermt2b %zmm16, %zmm17, %zmm19 {k1} | ||
| vpermt2b (%rax), %zmm17, %zmm19 {k1} | ||
| vpermt2b %zmm16, %zmm17, %zmm19 {k1}{z} | ||
| vpermt2b (%rax), %zmm17, %zmm19 {k1}{z} | ||
|
|
||
| vpmultishiftqb %zmm16, %zmm17, %zmm19 | ||
| vpmultishiftqb (%rax), %zmm17, %zmm19 | ||
| vpmultishiftqb (%rax){1to8}, %zmm17, %zmm19 | ||
| vpmultishiftqb %zmm16, %zmm17, %zmm19 {k1} | ||
| vpmultishiftqb (%rax), %zmm17, %zmm19 {k1} | ||
| vpmultishiftqb (%rax){1to8}, %zmm17, %zmm19 {k1} | ||
| vpmultishiftqb %zmm16, %zmm17, %zmm19 {k1}{z} | ||
| vpmultishiftqb (%rax), %zmm17, %zmm19 {k1}{z} | ||
| vpmultishiftqb (%rax){1to8}, %zmm17, %zmm19 {k1}{z} | ||
|
|
||
| # CHECK: Instruction Info: | ||
| # CHECK-NEXT: [1]: #uOps | ||
| # CHECK-NEXT: [2]: Latency | ||
| # CHECK-NEXT: [3]: RThroughput | ||
| # CHECK-NEXT: [4]: MayLoad | ||
| # CHECK-NEXT: [5]: MayStore | ||
| # CHECK-NEXT: [6]: HasSideEffects (U) | ||
|
|
||
| # CHECK: [1] [2] [3] [4] [5] [6] Instructions: | ||
| # CHECK-NEXT: 1 5 1.00 vpermb %zmm16, %zmm17, %zmm19 | ||
| # CHECK-NEXT: 2 8 0.50 * vpermb (%rax), %zmm17, %zmm19 | ||
| # CHECK-NEXT: 1 5 1.00 vpermb %zmm16, %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: 2 8 0.50 * vpermb (%rax), %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: 1 5 1.00 vpermb %zmm16, %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: 2 8 0.50 * vpermb (%rax), %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: 1 5 1.00 vpermi2b %zmm16, %zmm17, %zmm19 | ||
| # CHECK-NEXT: 2 8 0.50 * vpermi2b (%rax), %zmm17, %zmm19 | ||
| # CHECK-NEXT: 1 5 1.00 vpermi2b %zmm16, %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: 2 8 0.50 * vpermi2b (%rax), %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: 1 5 1.00 vpermi2b %zmm16, %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: 2 8 0.50 * vpermi2b (%rax), %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: 1 5 1.00 vpermt2b %zmm16, %zmm17, %zmm19 | ||
| # CHECK-NEXT: 2 8 0.50 * vpermt2b (%rax), %zmm17, %zmm19 | ||
| # CHECK-NEXT: 1 5 1.00 vpermt2b %zmm16, %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: 2 8 0.50 * vpermt2b (%rax), %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: 1 5 1.00 vpermt2b %zmm16, %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: 2 8 0.50 * vpermt2b (%rax), %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: 1 1 0.50 vpmultishiftqb %zmm16, %zmm17, %zmm19 | ||
| # CHECK-NEXT: 1 8 0.50 * vpmultishiftqb (%rax), %zmm17, %zmm19 | ||
| # CHECK-NEXT: 1 8 0.50 * vpmultishiftqb (%rax){1to8}, %zmm17, %zmm19 | ||
| # CHECK-NEXT: 1 1 0.50 vpmultishiftqb %zmm16, %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: 1 8 0.50 * vpmultishiftqb (%rax), %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: 1 8 0.50 * vpmultishiftqb (%rax){1to8}, %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: 1 1 0.50 vpmultishiftqb %zmm16, %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: 1 8 0.50 * vpmultishiftqb (%rax), %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: 1 8 0.50 * vpmultishiftqb (%rax){1to8}, %zmm17, %zmm19 {%k1} {z} | ||
|
|
||
| # CHECK: Resources: | ||
| # CHECK-NEXT: [0] - Zn4AGU0 | ||
| # CHECK-NEXT: [1] - Zn4AGU1 | ||
| # CHECK-NEXT: [2] - Zn4AGU2 | ||
| # CHECK-NEXT: [3] - Zn4ALU0 | ||
| # CHECK-NEXT: [4] - Zn4ALU1 | ||
| # CHECK-NEXT: [5] - Zn4ALU2 | ||
| # CHECK-NEXT: [6] - Zn4ALU3 | ||
| # CHECK-NEXT: [7] - Zn4BRU1 | ||
| # CHECK-NEXT: [8] - Zn4FP0 | ||
| # CHECK-NEXT: [9] - Zn4FP1 | ||
| # CHECK-NEXT: [10] - Zn4FP2 | ||
| # CHECK-NEXT: [11] - Zn4FP3 | ||
| # CHECK-NEXT: [12.0] - Zn4FP45 | ||
| # CHECK-NEXT: [12.1] - Zn4FP45 | ||
| # CHECK-NEXT: [13] - Zn4FPSt | ||
| # CHECK-NEXT: [14.0] - Zn4LSU | ||
| # CHECK-NEXT: [14.1] - Zn4LSU | ||
| # CHECK-NEXT: [14.2] - Zn4LSU | ||
| # CHECK-NEXT: [15.0] - Zn4Load | ||
| # CHECK-NEXT: [15.1] - Zn4Load | ||
| # CHECK-NEXT: [15.2] - Zn4Load | ||
| # CHECK-NEXT: [16.0] - Zn4Store | ||
| # CHECK-NEXT: [16.1] - Zn4Store | ||
|
|
||
| # CHECK: Resource pressure per iteration: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] | ||
| # CHECK-NEXT: - - - - - - - - 4.50 18.00 18.00 4.50 7.50 7.50 - 5.00 5.00 5.00 5.00 5.00 5.00 - - | ||
|
|
||
| # CHECK: Resource pressure by instruction: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions: | ||
| # CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - vpermb %zmm16, %zmm17, %zmm19 | ||
| # CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpermb (%rax), %zmm17, %zmm19 | ||
| # CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - vpermb %zmm16, %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpermb (%rax), %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - vpermb %zmm16, %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpermb (%rax), %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - vpermi2b %zmm16, %zmm17, %zmm19 | ||
| # CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpermi2b (%rax), %zmm17, %zmm19 | ||
| # CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - vpermi2b %zmm16, %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpermi2b (%rax), %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - vpermi2b %zmm16, %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpermi2b (%rax), %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - vpermt2b %zmm16, %zmm17, %zmm19 | ||
| # CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpermt2b (%rax), %zmm17, %zmm19 | ||
| # CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - vpermt2b %zmm16, %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpermt2b (%rax), %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - vpermt2b %zmm16, %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpermt2b (%rax), %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - vpmultishiftqb %zmm16, %zmm17, %zmm19 | ||
| # CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpmultishiftqb (%rax), %zmm17, %zmm19 | ||
| # CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpmultishiftqb (%rax){1to8}, %zmm17, %zmm19 | ||
| # CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - vpmultishiftqb %zmm16, %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpmultishiftqb (%rax), %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpmultishiftqb (%rax){1to8}, %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - vpmultishiftqb %zmm16, %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpmultishiftqb (%rax), %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpmultishiftqb (%rax){1to8}, %zmm17, %zmm19 {%k1} {z} |
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,156 @@ | ||
| # NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py | ||
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver4 -instruction-tables < %s | FileCheck %s | ||
|
|
||
| vpdpbusd %zmm16, %zmm17, %zmm19 | ||
| vpdpbusd (%rax), %zmm17, %zmm19 | ||
| vpdpbusd (%rax){1to16}, %zmm17, %zmm19 | ||
| vpdpbusd %zmm16, %zmm17, %zmm19 {k1} | ||
| vpdpbusd (%rax), %zmm17, %zmm19 {k1} | ||
| vpdpbusd (%rax){1to16}, %zmm17, %zmm19 {k1} | ||
| vpdpbusd %zmm16, %zmm17, %zmm19 {z}{k1} | ||
| vpdpbusd (%rax), %zmm17, %zmm19 {z}{k1} | ||
| vpdpbusd (%rax){1to16}, %zmm17, %zmm19 {z}{k1} | ||
|
|
||
| vpdpbusds %zmm16, %zmm17, %zmm19 | ||
| vpdpbusds (%rax), %zmm17, %zmm19 | ||
| vpdpbusds (%rax){1to16}, %zmm17, %zmm19 | ||
| vpdpbusds %zmm16, %zmm17, %zmm19 {k1} | ||
| vpdpbusds (%rax), %zmm17, %zmm19 {k1} | ||
| vpdpbusds (%rax){1to16}, %zmm17, %zmm19 {k1} | ||
| vpdpbusds %zmm16, %zmm17, %zmm19 {z}{k1} | ||
| vpdpbusds (%rax), %zmm17, %zmm19 {z}{k1} | ||
| vpdpbusds (%rax){1to16}, %zmm17, %zmm19 {z}{k1} | ||
|
|
||
| vpdpwssd %zmm16, %zmm17, %zmm19 | ||
| vpdpwssd (%rax), %zmm17, %zmm19 | ||
| vpdpwssd (%rax){1to16}, %zmm17, %zmm19 | ||
| vpdpwssd %zmm16, %zmm17, %zmm19 {k1} | ||
| vpdpwssd (%rax), %zmm17, %zmm19 {k1} | ||
| vpdpwssd (%rax){1to16}, %zmm17, %zmm19 {k1} | ||
| vpdpwssd %zmm16, %zmm17, %zmm19 {z}{k1} | ||
| vpdpwssd (%rax), %zmm17, %zmm19 {z}{k1} | ||
| vpdpwssd (%rax){1to16}, %zmm17, %zmm19 {z}{k1} | ||
|
|
||
| vpdpwssds %zmm16, %zmm17, %zmm19 | ||
| vpdpwssds (%rax), %zmm17, %zmm19 | ||
| vpdpwssds (%rax){1to16}, %zmm17, %zmm19 | ||
| vpdpwssds %zmm16, %zmm17, %zmm19 {k1} | ||
| vpdpwssds (%rax), %zmm17, %zmm19 {k1} | ||
| vpdpwssds (%rax){1to16}, %zmm17, %zmm19 {k1} | ||
| vpdpwssds %zmm16, %zmm17, %zmm19 {z}{k1} | ||
| vpdpwssds (%rax), %zmm17, %zmm19 {z}{k1} | ||
| vpdpwssds (%rax){1to16}, %zmm17, %zmm19 {z}{k1} | ||
|
|
||
| # CHECK: Instruction Info: | ||
| # CHECK-NEXT: [1]: #uOps | ||
| # CHECK-NEXT: [2]: Latency | ||
| # CHECK-NEXT: [3]: RThroughput | ||
| # CHECK-NEXT: [4]: MayLoad | ||
| # CHECK-NEXT: [5]: MayStore | ||
| # CHECK-NEXT: [6]: HasSideEffects (U) | ||
|
|
||
| # CHECK: [1] [2] [3] [4] [5] [6] Instructions: | ||
| # CHECK-NEXT: 1 4 2.00 vpdpbusd %zmm16, %zmm17, %zmm19 | ||
| # CHECK-NEXT: 1 10 1.00 * vpdpbusd (%rax), %zmm17, %zmm19 | ||
| # CHECK-NEXT: 1 10 1.00 * vpdpbusd (%rax){1to16}, %zmm17, %zmm19 | ||
| # CHECK-NEXT: 1 4 2.00 vpdpbusd %zmm16, %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: 1 10 1.00 * vpdpbusd (%rax), %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: 1 10 1.00 * vpdpbusd (%rax){1to16}, %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: 1 4 2.00 vpdpbusd %zmm16, %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: 1 10 1.00 * vpdpbusd (%rax), %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: 1 10 1.00 * vpdpbusd (%rax){1to16}, %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: 1 4 2.00 vpdpbusds %zmm16, %zmm17, %zmm19 | ||
| # CHECK-NEXT: 1 10 1.00 * vpdpbusds (%rax), %zmm17, %zmm19 | ||
| # CHECK-NEXT: 1 10 1.00 * vpdpbusds (%rax){1to16}, %zmm17, %zmm19 | ||
| # CHECK-NEXT: 1 4 2.00 vpdpbusds %zmm16, %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: 1 10 1.00 * vpdpbusds (%rax), %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: 1 10 1.00 * vpdpbusds (%rax){1to16}, %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: 1 4 2.00 vpdpbusds %zmm16, %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: 1 10 1.00 * vpdpbusds (%rax), %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: 1 10 1.00 * vpdpbusds (%rax){1to16}, %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: 1 4 2.00 vpdpwssd %zmm16, %zmm17, %zmm19 | ||
| # CHECK-NEXT: 1 10 1.00 * vpdpwssd (%rax), %zmm17, %zmm19 | ||
| # CHECK-NEXT: 1 10 1.00 * vpdpwssd (%rax){1to16}, %zmm17, %zmm19 | ||
| # CHECK-NEXT: 1 4 2.00 vpdpwssd %zmm16, %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: 1 10 1.00 * vpdpwssd (%rax), %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: 1 10 1.00 * vpdpwssd (%rax){1to16}, %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: 1 4 2.00 vpdpwssd %zmm16, %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: 1 10 1.00 * vpdpwssd (%rax), %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: 1 10 1.00 * vpdpwssd (%rax){1to16}, %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: 1 4 2.00 vpdpwssds %zmm16, %zmm17, %zmm19 | ||
| # CHECK-NEXT: 1 10 1.00 * vpdpwssds (%rax), %zmm17, %zmm19 | ||
| # CHECK-NEXT: 1 10 1.00 * vpdpwssds (%rax){1to16}, %zmm17, %zmm19 | ||
| # CHECK-NEXT: 1 4 2.00 vpdpwssds %zmm16, %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: 1 10 1.00 * vpdpwssds (%rax), %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: 1 10 1.00 * vpdpwssds (%rax){1to16}, %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: 1 4 2.00 vpdpwssds %zmm16, %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: 1 10 1.00 * vpdpwssds (%rax), %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: 1 10 1.00 * vpdpwssds (%rax){1to16}, %zmm17, %zmm19 {%k1} {z} | ||
|
|
||
| # CHECK: Resources: | ||
| # CHECK-NEXT: [0] - Zn4AGU0 | ||
| # CHECK-NEXT: [1] - Zn4AGU1 | ||
| # CHECK-NEXT: [2] - Zn4AGU2 | ||
| # CHECK-NEXT: [3] - Zn4ALU0 | ||
| # CHECK-NEXT: [4] - Zn4ALU1 | ||
| # CHECK-NEXT: [5] - Zn4ALU2 | ||
| # CHECK-NEXT: [6] - Zn4ALU3 | ||
| # CHECK-NEXT: [7] - Zn4BRU1 | ||
| # CHECK-NEXT: [8] - Zn4FP0 | ||
| # CHECK-NEXT: [9] - Zn4FP1 | ||
| # CHECK-NEXT: [10] - Zn4FP2 | ||
| # CHECK-NEXT: [11] - Zn4FP3 | ||
| # CHECK-NEXT: [12.0] - Zn4FP45 | ||
| # CHECK-NEXT: [12.1] - Zn4FP45 | ||
| # CHECK-NEXT: [13] - Zn4FPSt | ||
| # CHECK-NEXT: [14.0] - Zn4LSU | ||
| # CHECK-NEXT: [14.1] - Zn4LSU | ||
| # CHECK-NEXT: [14.2] - Zn4LSU | ||
| # CHECK-NEXT: [15.0] - Zn4Load | ||
| # CHECK-NEXT: [15.1] - Zn4Load | ||
| # CHECK-NEXT: [15.2] - Zn4Load | ||
| # CHECK-NEXT: [16.0] - Zn4Store | ||
| # CHECK-NEXT: [16.1] - Zn4Store | ||
|
|
||
| # CHECK: Resource pressure per iteration: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] | ||
| # CHECK-NEXT: - - - - - - - - 48.00 24.00 - 24.00 12.00 12.00 - 8.00 8.00 8.00 8.00 8.00 8.00 - - | ||
|
|
||
| # CHECK: Resource pressure by instruction: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions: | ||
| # CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpbusd %zmm16, %zmm17, %zmm19 | ||
| # CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusd (%rax), %zmm17, %zmm19 | ||
| # CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusd (%rax){1to16}, %zmm17, %zmm19 | ||
| # CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpbusd %zmm16, %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusd (%rax), %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusd (%rax){1to16}, %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpbusd %zmm16, %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusd (%rax), %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusd (%rax){1to16}, %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpbusds %zmm16, %zmm17, %zmm19 | ||
| # CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusds (%rax), %zmm17, %zmm19 | ||
| # CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusds (%rax){1to16}, %zmm17, %zmm19 | ||
| # CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpbusds %zmm16, %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusds (%rax), %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusds (%rax){1to16}, %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpbusds %zmm16, %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusds (%rax), %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusds (%rax){1to16}, %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpwssd %zmm16, %zmm17, %zmm19 | ||
| # CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssd (%rax), %zmm17, %zmm19 | ||
| # CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssd (%rax){1to16}, %zmm17, %zmm19 | ||
| # CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpwssd %zmm16, %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssd (%rax), %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssd (%rax){1to16}, %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpwssd %zmm16, %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssd (%rax), %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssd (%rax){1to16}, %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpwssds %zmm16, %zmm17, %zmm19 | ||
| # CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssds (%rax), %zmm17, %zmm19 | ||
| # CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssds (%rax){1to16}, %zmm17, %zmm19 | ||
| # CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpwssds %zmm16, %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssds (%rax), %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssds (%rax){1to16}, %zmm17, %zmm19 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpwssds %zmm16, %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssds (%rax), %zmm17, %zmm19 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 1.00 - - 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssds (%rax){1to16}, %zmm17, %zmm19 {%k1} {z} |
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,53 @@ | ||
| # NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py | ||
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=tigerlake -instruction-tables < %s | FileCheck %s | ||
|
|
||
| vp2intersectd %zmm16, %zmm19, %k0 | ||
| vp2intersectd (%rax), %zmm19, %k0 | ||
| vp2intersectd (%rax){1to16}, %zmm19, %k0 | ||
|
|
||
| vp2intersectq %zmm16, %zmm19, %k0 | ||
| vp2intersectq (%rax), %zmm19, %k0 | ||
| vp2intersectq (%rax){1to8}, %zmm19, %k0 | ||
|
|
||
| # CHECK: Instruction Info: | ||
| # CHECK-NEXT: [1]: #uOps | ||
| # CHECK-NEXT: [2]: Latency | ||
| # CHECK-NEXT: [3]: RThroughput | ||
| # CHECK-NEXT: [4]: MayLoad | ||
| # CHECK-NEXT: [5]: MayStore | ||
| # CHECK-NEXT: [6]: HasSideEffects (U) | ||
|
|
||
| # CHECK: [1] [2] [3] [4] [5] [6] Instructions: | ||
| # CHECK-NEXT: 1 1 1.00 vp2intersectd %zmm16, %zmm19, %k0 | ||
| # CHECK-NEXT: 2 8 1.00 * vp2intersectd (%rax), %zmm19, %k0 | ||
| # CHECK-NEXT: 2 8 1.00 * vp2intersectd (%rax){1to16}, %zmm19, %k0 | ||
| # CHECK-NEXT: 1 1 1.00 vp2intersectq %zmm16, %zmm19, %k0 | ||
| # CHECK-NEXT: 2 8 1.00 * vp2intersectq (%rax), %zmm19, %k0 | ||
| # CHECK-NEXT: 2 8 1.00 * vp2intersectq (%rax){1to8}, %zmm19, %k0 | ||
|
|
||
| # CHECK: Resources: | ||
| # CHECK-NEXT: [0] - ICXDivider | ||
| # CHECK-NEXT: [1] - ICXFPDivider | ||
| # CHECK-NEXT: [2] - ICXPort0 | ||
| # CHECK-NEXT: [3] - ICXPort1 | ||
| # CHECK-NEXT: [4] - ICXPort2 | ||
| # CHECK-NEXT: [5] - ICXPort3 | ||
| # CHECK-NEXT: [6] - ICXPort4 | ||
| # CHECK-NEXT: [7] - ICXPort5 | ||
| # CHECK-NEXT: [8] - ICXPort6 | ||
| # CHECK-NEXT: [9] - ICXPort7 | ||
| # CHECK-NEXT: [10] - ICXPort8 | ||
| # CHECK-NEXT: [11] - ICXPort9 | ||
|
|
||
| # CHECK: Resource pressure per iteration: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] | ||
| # CHECK-NEXT: - - 6.00 - 2.00 2.00 - - - - - - | ||
|
|
||
| # CHECK: Resource pressure by instruction: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] Instructions: | ||
| # CHECK-NEXT: - - 1.00 - - - - - - - - - vp2intersectd %zmm16, %zmm19, %k0 | ||
| # CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - - - vp2intersectd (%rax), %zmm19, %k0 | ||
| # CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - - - vp2intersectd (%rax){1to16}, %zmm19, %k0 | ||
| # CHECK-NEXT: - - 1.00 - - - - - - - - - vp2intersectq %zmm16, %zmm19, %k0 | ||
| # CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - - - vp2intersectq (%rax), %zmm19, %k0 | ||
| # CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - - - vp2intersectq (%rax){1to8}, %zmm19, %k0 |
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,73 @@ | ||
| # NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py | ||
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=tigerlake -instruction-tables < %s | FileCheck %s | ||
|
|
||
| vp2intersectd %xmm16, %xmm19, %k0 | ||
| vp2intersectd (%rax), %xmm19, %k0 | ||
| vp2intersectd (%rax){1to4}, %xmm19, %k0 | ||
|
|
||
| vp2intersectd %ymm16, %ymm19, %k0 | ||
| vp2intersectd (%rax), %ymm19, %k0 | ||
| vp2intersectd (%rax){1to8}, %ymm19, %k0 | ||
|
|
||
| vp2intersectq %xmm16, %xmm19, %k0 | ||
| vp2intersectq (%rax), %xmm19, %k0 | ||
| vp2intersectq (%rax){1to2}, %xmm19, %k0 | ||
|
|
||
| vp2intersectq %ymm16, %ymm19, %k0 | ||
| vp2intersectq (%rax), %ymm19, %k0 | ||
| vp2intersectq (%rax){1to4}, %ymm19, %k0 | ||
|
|
||
| # CHECK: Instruction Info: | ||
| # CHECK-NEXT: [1]: #uOps | ||
| # CHECK-NEXT: [2]: Latency | ||
| # CHECK-NEXT: [3]: RThroughput | ||
| # CHECK-NEXT: [4]: MayLoad | ||
| # CHECK-NEXT: [5]: MayStore | ||
| # CHECK-NEXT: [6]: HasSideEffects (U) | ||
|
|
||
| # CHECK: [1] [2] [3] [4] [5] [6] Instructions: | ||
| # CHECK-NEXT: 1 1 0.50 vp2intersectd %xmm16, %xmm19, %k0 | ||
| # CHECK-NEXT: 2 7 0.50 * vp2intersectd (%rax), %xmm19, %k0 | ||
| # CHECK-NEXT: 2 7 0.50 * vp2intersectd (%rax){1to4}, %xmm19, %k0 | ||
| # CHECK-NEXT: 1 1 0.50 vp2intersectd %ymm16, %ymm19, %k0 | ||
| # CHECK-NEXT: 2 8 0.50 * vp2intersectd (%rax), %ymm19, %k0 | ||
| # CHECK-NEXT: 2 8 0.50 * vp2intersectd (%rax){1to8}, %ymm19, %k0 | ||
| # CHECK-NEXT: 1 1 0.50 vp2intersectq %xmm16, %xmm19, %k0 | ||
| # CHECK-NEXT: 2 7 0.50 * vp2intersectq (%rax), %xmm19, %k0 | ||
| # CHECK-NEXT: 2 7 0.50 * vp2intersectq (%rax){1to2}, %xmm19, %k0 | ||
| # CHECK-NEXT: 1 1 0.50 vp2intersectq %ymm16, %ymm19, %k0 | ||
| # CHECK-NEXT: 2 8 0.50 * vp2intersectq (%rax), %ymm19, %k0 | ||
| # CHECK-NEXT: 2 8 0.50 * vp2intersectq (%rax){1to4}, %ymm19, %k0 | ||
|
|
||
| # CHECK: Resources: | ||
| # CHECK-NEXT: [0] - ICXDivider | ||
| # CHECK-NEXT: [1] - ICXFPDivider | ||
| # CHECK-NEXT: [2] - ICXPort0 | ||
| # CHECK-NEXT: [3] - ICXPort1 | ||
| # CHECK-NEXT: [4] - ICXPort2 | ||
| # CHECK-NEXT: [5] - ICXPort3 | ||
| # CHECK-NEXT: [6] - ICXPort4 | ||
| # CHECK-NEXT: [7] - ICXPort5 | ||
| # CHECK-NEXT: [8] - ICXPort6 | ||
| # CHECK-NEXT: [9] - ICXPort7 | ||
| # CHECK-NEXT: [10] - ICXPort8 | ||
| # CHECK-NEXT: [11] - ICXPort9 | ||
|
|
||
| # CHECK: Resource pressure per iteration: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] | ||
| # CHECK-NEXT: - - 6.00 6.00 4.00 4.00 - - - - - - | ||
|
|
||
| # CHECK: Resource pressure by instruction: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] Instructions: | ||
| # CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vp2intersectd %xmm16, %xmm19, %k0 | ||
| # CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vp2intersectd (%rax), %xmm19, %k0 | ||
| # CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vp2intersectd (%rax){1to4}, %xmm19, %k0 | ||
| # CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vp2intersectd %ymm16, %ymm19, %k0 | ||
| # CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vp2intersectd (%rax), %ymm19, %k0 | ||
| # CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vp2intersectd (%rax){1to8}, %ymm19, %k0 | ||
| # CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vp2intersectq %xmm16, %xmm19, %k0 | ||
| # CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vp2intersectq (%rax), %xmm19, %k0 | ||
| # CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vp2intersectq (%rax){1to2}, %xmm19, %k0 | ||
| # CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vp2intersectq %ymm16, %ymm19, %k0 | ||
| # CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vp2intersectq (%rax), %ymm19, %k0 | ||
| # CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vp2intersectq (%rax){1to4}, %ymm19, %k0 |
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,51 @@ | ||
| # NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py | ||
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver4 -instruction-tables < %s | FileCheck %s | ||
|
|
||
| vpclmulqdq $11, %zmm16, %zmm17, %zmm19 | ||
| vpclmulqdq $11, (%rax), %zmm17, %zmm19 | ||
|
|
||
| # CHECK: Instruction Info: | ||
| # CHECK-NEXT: [1]: #uOps | ||
| # CHECK-NEXT: [2]: Latency | ||
| # CHECK-NEXT: [3]: RThroughput | ||
| # CHECK-NEXT: [4]: MayLoad | ||
| # CHECK-NEXT: [5]: MayStore | ||
| # CHECK-NEXT: [6]: HasSideEffects (U) | ||
|
|
||
| # CHECK: [1] [2] [3] [4] [5] [6] Instructions: | ||
| # CHECK-NEXT: 4 4 2.00 vpclmulqdq $11, %zmm16, %zmm17, %zmm19 | ||
| # CHECK-NEXT: 4 11 2.00 * vpclmulqdq $11, (%rax), %zmm17, %zmm19 | ||
|
|
||
| # CHECK: Resources: | ||
| # CHECK-NEXT: [0] - Zn4AGU0 | ||
| # CHECK-NEXT: [1] - Zn4AGU1 | ||
| # CHECK-NEXT: [2] - Zn4AGU2 | ||
| # CHECK-NEXT: [3] - Zn4ALU0 | ||
| # CHECK-NEXT: [4] - Zn4ALU1 | ||
| # CHECK-NEXT: [5] - Zn4ALU2 | ||
| # CHECK-NEXT: [6] - Zn4ALU3 | ||
| # CHECK-NEXT: [7] - Zn4BRU1 | ||
| # CHECK-NEXT: [8] - Zn4FP0 | ||
| # CHECK-NEXT: [9] - Zn4FP1 | ||
| # CHECK-NEXT: [10] - Zn4FP2 | ||
| # CHECK-NEXT: [11] - Zn4FP3 | ||
| # CHECK-NEXT: [12.0] - Zn4FP45 | ||
| # CHECK-NEXT: [12.1] - Zn4FP45 | ||
| # CHECK-NEXT: [13] - Zn4FPSt | ||
| # CHECK-NEXT: [14.0] - Zn4LSU | ||
| # CHECK-NEXT: [14.1] - Zn4LSU | ||
| # CHECK-NEXT: [14.2] - Zn4LSU | ||
| # CHECK-NEXT: [15.0] - Zn4Load | ||
| # CHECK-NEXT: [15.1] - Zn4Load | ||
| # CHECK-NEXT: [15.2] - Zn4Load | ||
| # CHECK-NEXT: [16.0] - Zn4Store | ||
| # CHECK-NEXT: [16.1] - Zn4Store | ||
|
|
||
| # CHECK: Resource pressure per iteration: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] | ||
| # CHECK-NEXT: - - - - - - - - 4.00 4.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - | ||
|
|
||
| # CHECK: Resource pressure by instruction: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions: | ||
| # CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpclmulqdq $11, %zmm16, %zmm17, %zmm19 | ||
| # CHECK-NEXT: - - - - - - - - 2.00 2.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpclmulqdq $11, (%rax), %zmm17, %zmm19 |
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,58 @@ | ||
| # NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py | ||
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver4 -instruction-tables < %s | FileCheck %s | ||
|
|
||
| vpclmulqdq $11, %xmm16, %xmm17, %xmm19 | ||
| vpclmulqdq $11, (%rax), %xmm17, %xmm19 | ||
|
|
||
| vpclmulqdq $11, %ymm16, %ymm17, %ymm19 | ||
| vpclmulqdq $11, (%rax), %ymm17, %ymm19 | ||
|
|
||
| # CHECK: Instruction Info: | ||
| # CHECK-NEXT: [1]: #uOps | ||
| # CHECK-NEXT: [2]: Latency | ||
| # CHECK-NEXT: [3]: RThroughput | ||
| # CHECK-NEXT: [4]: MayLoad | ||
| # CHECK-NEXT: [5]: MayStore | ||
| # CHECK-NEXT: [6]: HasSideEffects (U) | ||
|
|
||
| # CHECK: [1] [2] [3] [4] [5] [6] Instructions: | ||
| # CHECK-NEXT: 4 4 2.00 vpclmulqdq $11, %xmm16, %xmm17, %xmm19 | ||
| # CHECK-NEXT: 4 11 2.00 * vpclmulqdq $11, (%rax), %xmm17, %xmm19 | ||
| # CHECK-NEXT: 4 4 2.00 vpclmulqdq $11, %ymm16, %ymm17, %ymm19 | ||
| # CHECK-NEXT: 4 11 2.00 * vpclmulqdq $11, (%rax), %ymm17, %ymm19 | ||
|
|
||
| # CHECK: Resources: | ||
| # CHECK-NEXT: [0] - Zn4AGU0 | ||
| # CHECK-NEXT: [1] - Zn4AGU1 | ||
| # CHECK-NEXT: [2] - Zn4AGU2 | ||
| # CHECK-NEXT: [3] - Zn4ALU0 | ||
| # CHECK-NEXT: [4] - Zn4ALU1 | ||
| # CHECK-NEXT: [5] - Zn4ALU2 | ||
| # CHECK-NEXT: [6] - Zn4ALU3 | ||
| # CHECK-NEXT: [7] - Zn4BRU1 | ||
| # CHECK-NEXT: [8] - Zn4FP0 | ||
| # CHECK-NEXT: [9] - Zn4FP1 | ||
| # CHECK-NEXT: [10] - Zn4FP2 | ||
| # CHECK-NEXT: [11] - Zn4FP3 | ||
| # CHECK-NEXT: [12.0] - Zn4FP45 | ||
| # CHECK-NEXT: [12.1] - Zn4FP45 | ||
| # CHECK-NEXT: [13] - Zn4FPSt | ||
| # CHECK-NEXT: [14.0] - Zn4LSU | ||
| # CHECK-NEXT: [14.1] - Zn4LSU | ||
| # CHECK-NEXT: [14.2] - Zn4LSU | ||
| # CHECK-NEXT: [15.0] - Zn4Load | ||
| # CHECK-NEXT: [15.1] - Zn4Load | ||
| # CHECK-NEXT: [15.2] - Zn4Load | ||
| # CHECK-NEXT: [16.0] - Zn4Store | ||
| # CHECK-NEXT: [16.1] - Zn4Store | ||
|
|
||
| # CHECK: Resource pressure per iteration: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] | ||
| # CHECK-NEXT: - - - - - - - - 8.00 8.00 - - 1.00 1.00 - 0.67 0.67 0.67 0.67 0.67 0.67 - - | ||
|
|
||
| # CHECK: Resource pressure by instruction: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions: | ||
| # CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpclmulqdq $11, %xmm16, %xmm17, %xmm19 | ||
| # CHECK-NEXT: - - - - - - - - 2.00 2.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpclmulqdq $11, (%rax), %xmm17, %xmm19 | ||
| # CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpclmulqdq $11, %ymm16, %ymm17, %ymm19 | ||
| # CHECK-NEXT: - - - - - - - - 2.00 2.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpclmulqdq $11, (%rax), %ymm17, %ymm19 |
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,104 @@ | ||
| # NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py | ||
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver4 -instruction-tables < %s | FileCheck %s | ||
|
|
||
| vpopcntd %zmm1, %zmm0 | ||
| vpopcntd (%rdi), %zmm0 | ||
| vpopcntd (%rdi){1to16}, %zmm0 | ||
|
|
||
| vpopcntd %zmm1, %zmm0 {%k1} | ||
| vpopcntd (%rdi), %zmm0 {%k1} | ||
| vpopcntd (%rdi){1to16}, %zmm0 {%k1} | ||
|
|
||
| vpopcntd %zmm1, %zmm0 {%k1} {z} | ||
| vpopcntd (%rdi), %zmm0 {%k1} {z} | ||
| vpopcntd (%rdi){1to16}, %zmm0 {%k1} {z} | ||
|
|
||
| vpopcntq %zmm1, %zmm0 | ||
| vpopcntq (%rdi), %zmm0 | ||
| vpopcntq (%rdi){1to8}, %zmm0 | ||
|
|
||
| vpopcntq %zmm1, %zmm0 {%k1} | ||
| vpopcntq (%rdi), %zmm0 {%k1} | ||
| vpopcntq (%rdi){1to8}, %zmm0 {%k1} | ||
|
|
||
| vpopcntq %zmm1, %zmm0 {%k1} {z} | ||
| vpopcntq (%rdi), %zmm0 {%k1} {z} | ||
| vpopcntq (%rdi){1to8}, %zmm0 {%k1} {z} | ||
|
|
||
| # CHECK: Instruction Info: | ||
| # CHECK-NEXT: [1]: #uOps | ||
| # CHECK-NEXT: [2]: Latency | ||
| # CHECK-NEXT: [3]: RThroughput | ||
| # CHECK-NEXT: [4]: MayLoad | ||
| # CHECK-NEXT: [5]: MayStore | ||
| # CHECK-NEXT: [6]: HasSideEffects (U) | ||
|
|
||
| # CHECK: [1] [2] [3] [4] [5] [6] Instructions: | ||
| # CHECK-NEXT: 1 1 0.50 vpopcntd %zmm1, %zmm0 | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi), %zmm0 | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi){1to16}, %zmm0 | ||
| # CHECK-NEXT: 1 1 0.50 vpopcntd %zmm1, %zmm0 {%k1} | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi), %zmm0 {%k1} | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi){1to16}, %zmm0 {%k1} | ||
| # CHECK-NEXT: 1 1 0.50 vpopcntd %zmm1, %zmm0 {%k1} {z} | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi), %zmm0 {%k1} {z} | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi){1to16}, %zmm0 {%k1} {z} | ||
| # CHECK-NEXT: 1 1 0.50 vpopcntq %zmm1, %zmm0 | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi), %zmm0 | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi){1to8}, %zmm0 | ||
| # CHECK-NEXT: 1 1 0.50 vpopcntq %zmm1, %zmm0 {%k1} | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi), %zmm0 {%k1} | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi){1to8}, %zmm0 {%k1} | ||
| # CHECK-NEXT: 1 1 0.50 vpopcntq %zmm1, %zmm0 {%k1} {z} | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi), %zmm0 {%k1} {z} | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi){1to8}, %zmm0 {%k1} {z} | ||
|
|
||
| # CHECK: Resources: | ||
| # CHECK-NEXT: [0] - Zn4AGU0 | ||
| # CHECK-NEXT: [1] - Zn4AGU1 | ||
| # CHECK-NEXT: [2] - Zn4AGU2 | ||
| # CHECK-NEXT: [3] - Zn4ALU0 | ||
| # CHECK-NEXT: [4] - Zn4ALU1 | ||
| # CHECK-NEXT: [5] - Zn4ALU2 | ||
| # CHECK-NEXT: [6] - Zn4ALU3 | ||
| # CHECK-NEXT: [7] - Zn4BRU1 | ||
| # CHECK-NEXT: [8] - Zn4FP0 | ||
| # CHECK-NEXT: [9] - Zn4FP1 | ||
| # CHECK-NEXT: [10] - Zn4FP2 | ||
| # CHECK-NEXT: [11] - Zn4FP3 | ||
| # CHECK-NEXT: [12.0] - Zn4FP45 | ||
| # CHECK-NEXT: [12.1] - Zn4FP45 | ||
| # CHECK-NEXT: [13] - Zn4FPSt | ||
| # CHECK-NEXT: [14.0] - Zn4LSU | ||
| # CHECK-NEXT: [14.1] - Zn4LSU | ||
| # CHECK-NEXT: [14.2] - Zn4LSU | ||
| # CHECK-NEXT: [15.0] - Zn4Load | ||
| # CHECK-NEXT: [15.1] - Zn4Load | ||
| # CHECK-NEXT: [15.2] - Zn4Load | ||
| # CHECK-NEXT: [16.0] - Zn4Store | ||
| # CHECK-NEXT: [16.1] - Zn4Store | ||
|
|
||
| # CHECK: Resource pressure per iteration: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] | ||
| # CHECK-NEXT: - - - - - - - - 9.00 9.00 9.00 9.00 6.00 6.00 - 4.00 4.00 4.00 4.00 4.00 4.00 - - | ||
|
|
||
| # CHECK: Resource pressure by instruction: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions: | ||
| # CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - vpopcntd %zmm1, %zmm0 | ||
| # CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi), %zmm0 | ||
| # CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi){1to16}, %zmm0 | ||
| # CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - vpopcntd %zmm1, %zmm0 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi), %zmm0 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi){1to16}, %zmm0 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - vpopcntd %zmm1, %zmm0 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi), %zmm0 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi){1to16}, %zmm0 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - vpopcntq %zmm1, %zmm0 | ||
| # CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi), %zmm0 | ||
| # CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi){1to8}, %zmm0 | ||
| # CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - vpopcntq %zmm1, %zmm0 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi), %zmm0 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi){1to8}, %zmm0 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - vpopcntq %zmm1, %zmm0 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi), %zmm0 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi){1to8}, %zmm0 {%k1} {z} |
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,164 @@ | ||
| # NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py | ||
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver4 -instruction-tables < %s | FileCheck %s | ||
|
|
||
| vpopcntd %xmm1, %xmm0 | ||
| vpopcntd (%rdi), %xmm0 | ||
| vpopcntd (%rdi){1to4}, %xmm0 | ||
|
|
||
| vpopcntd %xmm1, %xmm0 {%k1} | ||
| vpopcntd (%rdi), %xmm0 {%k1} | ||
| vpopcntd (%rdi){1to4}, %xmm0 {%k1} | ||
|
|
||
| vpopcntd %xmm1, %xmm0 {%k1} {z} | ||
| vpopcntd (%rdi), %xmm0 {%k1} {z} | ||
| vpopcntd (%rdi){1to4}, %xmm0 {%k1} {z} | ||
|
|
||
| vpopcntd %ymm1, %ymm0 | ||
| vpopcntd (%rdi), %ymm0 | ||
| vpopcntd (%rdi){1to8}, %ymm0 | ||
|
|
||
| vpopcntd %ymm1, %ymm0 {%k1} | ||
| vpopcntd (%rdi), %ymm0 {%k1} | ||
| vpopcntd (%rdi){1to8}, %ymm0 {%k1} | ||
|
|
||
| vpopcntd %ymm1, %ymm0 {%k1} {z} | ||
| vpopcntd (%rdi), %ymm0 {%k1} {z} | ||
| vpopcntd (%rdi){1to8}, %ymm0 {%k1} {z} | ||
|
|
||
| vpopcntq %xmm1, %xmm0 | ||
| vpopcntq (%rdi), %xmm0 | ||
| vpopcntq (%rdi){1to2}, %xmm0 | ||
|
|
||
| vpopcntq %xmm1, %xmm0 {%k1} | ||
| vpopcntq (%rdi), %xmm0 {%k1} | ||
| vpopcntq (%rdi){1to2}, %xmm0 {%k1} | ||
|
|
||
| vpopcntq %xmm1, %xmm0 {%k1} {z} | ||
| vpopcntq (%rdi), %xmm0 {%k1} {z} | ||
| vpopcntq (%rdi){1to2}, %xmm0 {%k1} {z} | ||
|
|
||
| vpopcntq %ymm1, %ymm0 | ||
| vpopcntq (%rdi), %ymm0 | ||
| vpopcntq (%rdi){1to4}, %ymm0 | ||
|
|
||
| vpopcntq %ymm1, %ymm0 {%k1} | ||
| vpopcntq (%rdi), %ymm0 {%k1} | ||
| vpopcntq (%rdi){1to4}, %ymm0 {%k1} | ||
|
|
||
| vpopcntq %ymm1, %ymm0 {%k1} {z} | ||
| vpopcntq (%rdi), %ymm0 {%k1} {z} | ||
| vpopcntq (%rdi){1to4}, %ymm0 {%k1} {z} | ||
|
|
||
| # CHECK: Instruction Info: | ||
| # CHECK-NEXT: [1]: #uOps | ||
| # CHECK-NEXT: [2]: Latency | ||
| # CHECK-NEXT: [3]: RThroughput | ||
| # CHECK-NEXT: [4]: MayLoad | ||
| # CHECK-NEXT: [5]: MayStore | ||
| # CHECK-NEXT: [6]: HasSideEffects (U) | ||
|
|
||
| # CHECK: [1] [2] [3] [4] [5] [6] Instructions: | ||
| # CHECK-NEXT: 1 2 1.00 vpopcntd %xmm1, %xmm0 | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi), %xmm0 | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi){1to4}, %xmm0 | ||
| # CHECK-NEXT: 1 2 1.00 vpopcntd %xmm1, %xmm0 {%k1} | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi), %xmm0 {%k1} | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi){1to4}, %xmm0 {%k1} | ||
| # CHECK-NEXT: 1 2 1.00 vpopcntd %xmm1, %xmm0 {%k1} {z} | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi), %xmm0 {%k1} {z} | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi){1to4}, %xmm0 {%k1} {z} | ||
| # CHECK-NEXT: 1 1 0.25 vpopcntd %ymm1, %ymm0 | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi), %ymm0 | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi){1to8}, %ymm0 | ||
| # CHECK-NEXT: 1 1 0.25 vpopcntd %ymm1, %ymm0 {%k1} | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi), %ymm0 {%k1} | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi){1to8}, %ymm0 {%k1} | ||
| # CHECK-NEXT: 1 1 0.25 vpopcntd %ymm1, %ymm0 {%k1} {z} | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi), %ymm0 {%k1} {z} | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntd (%rdi){1to8}, %ymm0 {%k1} {z} | ||
| # CHECK-NEXT: 1 2 1.00 vpopcntq %xmm1, %xmm0 | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi), %xmm0 | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi){1to2}, %xmm0 | ||
| # CHECK-NEXT: 1 2 1.00 vpopcntq %xmm1, %xmm0 {%k1} | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi), %xmm0 {%k1} | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi){1to2}, %xmm0 {%k1} | ||
| # CHECK-NEXT: 1 2 1.00 vpopcntq %xmm1, %xmm0 {%k1} {z} | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi), %xmm0 {%k1} {z} | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi){1to2}, %xmm0 {%k1} {z} | ||
| # CHECK-NEXT: 1 1 0.25 vpopcntq %ymm1, %ymm0 | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi), %ymm0 | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi){1to4}, %ymm0 | ||
| # CHECK-NEXT: 1 1 0.25 vpopcntq %ymm1, %ymm0 {%k1} | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi), %ymm0 {%k1} | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi){1to4}, %ymm0 {%k1} | ||
| # CHECK-NEXT: 1 1 0.25 vpopcntq %ymm1, %ymm0 {%k1} {z} | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi), %ymm0 {%k1} {z} | ||
| # CHECK-NEXT: 1 8 0.50 * vpopcntq (%rdi){1to4}, %ymm0 {%k1} {z} | ||
|
|
||
| # CHECK: Resources: | ||
| # CHECK-NEXT: [0] - Zn4AGU0 | ||
| # CHECK-NEXT: [1] - Zn4AGU1 | ||
| # CHECK-NEXT: [2] - Zn4AGU2 | ||
| # CHECK-NEXT: [3] - Zn4ALU0 | ||
| # CHECK-NEXT: [4] - Zn4ALU1 | ||
| # CHECK-NEXT: [5] - Zn4ALU2 | ||
| # CHECK-NEXT: [6] - Zn4ALU3 | ||
| # CHECK-NEXT: [7] - Zn4BRU1 | ||
| # CHECK-NEXT: [8] - Zn4FP0 | ||
| # CHECK-NEXT: [9] - Zn4FP1 | ||
| # CHECK-NEXT: [10] - Zn4FP2 | ||
| # CHECK-NEXT: [11] - Zn4FP3 | ||
| # CHECK-NEXT: [12.0] - Zn4FP45 | ||
| # CHECK-NEXT: [12.1] - Zn4FP45 | ||
| # CHECK-NEXT: [13] - Zn4FPSt | ||
| # CHECK-NEXT: [14.0] - Zn4LSU | ||
| # CHECK-NEXT: [14.1] - Zn4LSU | ||
| # CHECK-NEXT: [14.2] - Zn4LSU | ||
| # CHECK-NEXT: [15.0] - Zn4Load | ||
| # CHECK-NEXT: [15.1] - Zn4Load | ||
| # CHECK-NEXT: [15.2] - Zn4Load | ||
| # CHECK-NEXT: [16.0] - Zn4Store | ||
| # CHECK-NEXT: [16.1] - Zn4Store | ||
|
|
||
| # CHECK: Resource pressure per iteration: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] | ||
| # CHECK-NEXT: - - - - - - - - 13.50 13.50 7.50 7.50 12.00 12.00 - 8.00 8.00 8.00 8.00 8.00 8.00 - - | ||
|
|
||
| # CHECK: Resource pressure by instruction: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions: | ||
| # CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vpopcntd %xmm1, %xmm0 | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi), %xmm0 | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi){1to4}, %xmm0 | ||
| # CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vpopcntd %xmm1, %xmm0 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi), %xmm0 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi){1to4}, %xmm0 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vpopcntd %xmm1, %xmm0 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi), %xmm0 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi){1to4}, %xmm0 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - vpopcntd %ymm1, %ymm0 | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi), %ymm0 | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi){1to8}, %ymm0 | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - vpopcntd %ymm1, %ymm0 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi), %ymm0 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi){1to8}, %ymm0 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - vpopcntd %ymm1, %ymm0 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi), %ymm0 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntd (%rdi){1to8}, %ymm0 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vpopcntq %xmm1, %xmm0 | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi), %xmm0 | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi){1to2}, %xmm0 | ||
| # CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vpopcntq %xmm1, %xmm0 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi), %xmm0 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi){1to2}, %xmm0 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vpopcntq %xmm1, %xmm0 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi), %xmm0 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi){1to2}, %xmm0 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - vpopcntq %ymm1, %ymm0 | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi), %ymm0 | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi){1to4}, %ymm0 | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - vpopcntq %ymm1, %ymm0 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi), %ymm0 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi){1to4}, %ymm0 {%k1} | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - vpopcntq %ymm1, %ymm0 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi), %ymm0 {%k1} {z} | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpopcntq (%rdi){1to4}, %ymm0 {%k1} {z} |
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,86 @@ | ||
| # NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py | ||
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver4 -instruction-tables < %s | FileCheck %s | ||
|
|
||
| vgf2p8affineinvqb $0, %xmm0, %xmm1, %xmm2 | ||
| vgf2p8affineinvqb $0, (%rax), %xmm1, %xmm2 | ||
|
|
||
| vgf2p8affineinvqb $0, %ymm0, %ymm1, %ymm2 | ||
| vgf2p8affineinvqb $0, (%rax), %ymm1, %ymm2 | ||
|
|
||
| vgf2p8affineqb $0, %xmm0, %xmm1, %xmm2 | ||
| vgf2p8affineqb $0, (%rax), %xmm1, %xmm2 | ||
|
|
||
| vgf2p8affineqb $0, %ymm0, %ymm1, %ymm2 | ||
| vgf2p8affineqb $0, (%rax), %ymm1, %ymm2 | ||
|
|
||
| vgf2p8mulb %xmm0, %xmm1, %xmm2 | ||
| vgf2p8mulb (%rax), %xmm1, %xmm2 | ||
|
|
||
| vgf2p8mulb %ymm0, %ymm1, %ymm2 | ||
| vgf2p8mulb (%rax), %ymm1, %ymm2 | ||
|
|
||
| # CHECK: Instruction Info: | ||
| # CHECK-NEXT: [1]: #uOps | ||
| # CHECK-NEXT: [2]: Latency | ||
| # CHECK-NEXT: [3]: RThroughput | ||
| # CHECK-NEXT: [4]: MayLoad | ||
| # CHECK-NEXT: [5]: MayStore | ||
| # CHECK-NEXT: [6]: HasSideEffects (U) | ||
|
|
||
| # CHECK: [1] [2] [3] [4] [5] [6] Instructions: | ||
| # CHECK-NEXT: 1 3 0.50 vgf2p8affineinvqb $0, %xmm0, %xmm1, %xmm2 | ||
| # CHECK-NEXT: 1 10 0.50 * vgf2p8affineinvqb $0, (%rax), %xmm1, %xmm2 | ||
| # CHECK-NEXT: 1 3 0.50 vgf2p8affineinvqb $0, %ymm0, %ymm1, %ymm2 | ||
| # CHECK-NEXT: 1 10 0.50 * vgf2p8affineinvqb $0, (%rax), %ymm1, %ymm2 | ||
| # CHECK-NEXT: 1 3 0.50 vgf2p8affineqb $0, %xmm0, %xmm1, %xmm2 | ||
| # CHECK-NEXT: 1 10 0.50 * vgf2p8affineqb $0, (%rax), %xmm1, %xmm2 | ||
| # CHECK-NEXT: 1 3 0.50 vgf2p8affineqb $0, %ymm0, %ymm1, %ymm2 | ||
| # CHECK-NEXT: 1 10 0.50 * vgf2p8affineqb $0, (%rax), %ymm1, %ymm2 | ||
| # CHECK-NEXT: 1 1 0.25 vgf2p8mulb %xmm0, %xmm1, %xmm2 | ||
| # CHECK-NEXT: 1 8 0.50 * vgf2p8mulb (%rax), %xmm1, %xmm2 | ||
| # CHECK-NEXT: 1 1 0.25 vgf2p8mulb %ymm0, %ymm1, %ymm2 | ||
| # CHECK-NEXT: 1 8 0.50 * vgf2p8mulb (%rax), %ymm1, %ymm2 | ||
|
|
||
| # CHECK: Resources: | ||
| # CHECK-NEXT: [0] - Zn4AGU0 | ||
| # CHECK-NEXT: [1] - Zn4AGU1 | ||
| # CHECK-NEXT: [2] - Zn4AGU2 | ||
| # CHECK-NEXT: [3] - Zn4ALU0 | ||
| # CHECK-NEXT: [4] - Zn4ALU1 | ||
| # CHECK-NEXT: [5] - Zn4ALU2 | ||
| # CHECK-NEXT: [6] - Zn4ALU3 | ||
| # CHECK-NEXT: [7] - Zn4BRU1 | ||
| # CHECK-NEXT: [8] - Zn4FP0 | ||
| # CHECK-NEXT: [9] - Zn4FP1 | ||
| # CHECK-NEXT: [10] - Zn4FP2 | ||
| # CHECK-NEXT: [11] - Zn4FP3 | ||
| # CHECK-NEXT: [12.0] - Zn4FP45 | ||
| # CHECK-NEXT: [12.1] - Zn4FP45 | ||
| # CHECK-NEXT: [13] - Zn4FPSt | ||
| # CHECK-NEXT: [14.0] - Zn4LSU | ||
| # CHECK-NEXT: [14.1] - Zn4LSU | ||
| # CHECK-NEXT: [14.2] - Zn4LSU | ||
| # CHECK-NEXT: [15.0] - Zn4Load | ||
| # CHECK-NEXT: [15.1] - Zn4Load | ||
| # CHECK-NEXT: [15.2] - Zn4Load | ||
| # CHECK-NEXT: [16.0] - Zn4Store | ||
| # CHECK-NEXT: [16.1] - Zn4Store | ||
|
|
||
| # CHECK: Resource pressure per iteration: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] | ||
| # CHECK-NEXT: - - - - - - - - 5.00 1.00 1.00 5.00 3.00 3.00 - 2.00 2.00 2.00 2.00 2.00 2.00 - - | ||
|
|
||
| # CHECK: Resource pressure by instruction: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions: | ||
| # CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - vgf2p8affineinvqb $0, %xmm0, %xmm1, %xmm2 | ||
| # CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vgf2p8affineinvqb $0, (%rax), %xmm1, %xmm2 | ||
| # CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - vgf2p8affineinvqb $0, %ymm0, %ymm1, %ymm2 | ||
| # CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vgf2p8affineinvqb $0, (%rax), %ymm1, %ymm2 | ||
| # CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - vgf2p8affineqb $0, %xmm0, %xmm1, %xmm2 | ||
| # CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vgf2p8affineqb $0, (%rax), %xmm1, %xmm2 | ||
| # CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - vgf2p8affineqb $0, %ymm0, %ymm1, %ymm2 | ||
| # CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vgf2p8affineqb $0, (%rax), %ymm1, %ymm2 | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - vgf2p8mulb %xmm0, %xmm1, %xmm2 | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vgf2p8mulb (%rax), %xmm1, %xmm2 | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - vgf2p8mulb %ymm0, %ymm1, %ymm2 | ||
| # CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vgf2p8mulb (%rax), %ymm1, %ymm2 |
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,100 @@ | ||
| # NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py | ||
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver4 -instruction-tables < %s | FileCheck %s | ||
|
|
||
| vpdpbusd %xmm0, %xmm1, %xmm2 | ||
| vpdpbusd (%rax), %xmm1, %xmm2 | ||
|
|
||
| vpdpbusd %ymm0, %ymm1, %ymm2 | ||
| vpdpbusd (%rax), %ymm1, %ymm2 | ||
|
|
||
| vpdpbusds %xmm0, %xmm1, %xmm2 | ||
| vpdpbusds (%rax), %xmm1, %xmm2 | ||
|
|
||
| vpdpbusds %ymm0, %ymm1, %ymm2 | ||
| vpdpbusds (%rax), %ymm1, %ymm2 | ||
|
|
||
| vpdpwssd %xmm0, %xmm1, %xmm2 | ||
| vpdpwssd (%rax), %xmm1, %xmm2 | ||
|
|
||
| vpdpwssd %ymm0, %ymm1, %ymm2 | ||
| vpdpwssd (%rax), %ymm1, %ymm2 | ||
|
|
||
| vpdpwssds %xmm0, %xmm1, %xmm2 | ||
| vpdpwssds (%rax), %xmm1, %xmm2 | ||
|
|
||
| vpdpwssds %ymm0, %ymm1, %ymm2 | ||
| vpdpwssds (%rax), %ymm1, %ymm2 | ||
|
|
||
| # CHECK: Instruction Info: | ||
| # CHECK-NEXT: [1]: #uOps | ||
| # CHECK-NEXT: [2]: Latency | ||
| # CHECK-NEXT: [3]: RThroughput | ||
| # CHECK-NEXT: [4]: MayLoad | ||
| # CHECK-NEXT: [5]: MayStore | ||
| # CHECK-NEXT: [6]: HasSideEffects (U) | ||
|
|
||
| # CHECK: [1] [2] [3] [4] [5] [6] Instructions: | ||
| # CHECK-NEXT: 1 4 2.00 vpdpbusd %xmm0, %xmm1, %xmm2 | ||
| # CHECK-NEXT: 1 10 0.50 * vpdpbusd (%rax), %xmm1, %xmm2 | ||
| # CHECK-NEXT: 1 4 2.00 vpdpbusd %ymm0, %ymm1, %ymm2 | ||
| # CHECK-NEXT: 1 10 0.50 * vpdpbusd (%rax), %ymm1, %ymm2 | ||
| # CHECK-NEXT: 1 4 2.00 vpdpbusds %xmm0, %xmm1, %xmm2 | ||
| # CHECK-NEXT: 1 10 0.50 * vpdpbusds (%rax), %xmm1, %xmm2 | ||
| # CHECK-NEXT: 1 4 2.00 vpdpbusds %ymm0, %ymm1, %ymm2 | ||
| # CHECK-NEXT: 1 10 0.50 * vpdpbusds (%rax), %ymm1, %ymm2 | ||
| # CHECK-NEXT: 1 4 2.00 vpdpwssd %xmm0, %xmm1, %xmm2 | ||
| # CHECK-NEXT: 1 10 0.50 * vpdpwssd (%rax), %xmm1, %xmm2 | ||
| # CHECK-NEXT: 1 4 2.00 vpdpwssd %ymm0, %ymm1, %ymm2 | ||
| # CHECK-NEXT: 1 10 0.50 * vpdpwssd (%rax), %ymm1, %ymm2 | ||
| # CHECK-NEXT: 1 4 2.00 vpdpwssds %xmm0, %xmm1, %xmm2 | ||
| # CHECK-NEXT: 1 10 0.50 * vpdpwssds (%rax), %xmm1, %xmm2 | ||
| # CHECK-NEXT: 1 4 2.00 vpdpwssds %ymm0, %ymm1, %ymm2 | ||
| # CHECK-NEXT: 1 10 0.50 * vpdpwssds (%rax), %ymm1, %ymm2 | ||
|
|
||
| # CHECK: Resources: | ||
| # CHECK-NEXT: [0] - Zn4AGU0 | ||
| # CHECK-NEXT: [1] - Zn4AGU1 | ||
| # CHECK-NEXT: [2] - Zn4AGU2 | ||
| # CHECK-NEXT: [3] - Zn4ALU0 | ||
| # CHECK-NEXT: [4] - Zn4ALU1 | ||
| # CHECK-NEXT: [5] - Zn4ALU2 | ||
| # CHECK-NEXT: [6] - Zn4ALU3 | ||
| # CHECK-NEXT: [7] - Zn4BRU1 | ||
| # CHECK-NEXT: [8] - Zn4FP0 | ||
| # CHECK-NEXT: [9] - Zn4FP1 | ||
| # CHECK-NEXT: [10] - Zn4FP2 | ||
| # CHECK-NEXT: [11] - Zn4FP3 | ||
| # CHECK-NEXT: [12.0] - Zn4FP45 | ||
| # CHECK-NEXT: [12.1] - Zn4FP45 | ||
| # CHECK-NEXT: [13] - Zn4FPSt | ||
| # CHECK-NEXT: [14.0] - Zn4LSU | ||
| # CHECK-NEXT: [14.1] - Zn4LSU | ||
| # CHECK-NEXT: [14.2] - Zn4LSU | ||
| # CHECK-NEXT: [15.0] - Zn4Load | ||
| # CHECK-NEXT: [15.1] - Zn4Load | ||
| # CHECK-NEXT: [15.2] - Zn4Load | ||
| # CHECK-NEXT: [16.0] - Zn4Store | ||
| # CHECK-NEXT: [16.1] - Zn4Store | ||
|
|
||
| # CHECK: Resource pressure per iteration: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] | ||
| # CHECK-NEXT: - - - - - - - - 20.00 16.00 - 4.00 4.00 4.00 - 2.67 2.67 2.67 2.67 2.67 2.67 - - | ||
|
|
||
| # CHECK: Resource pressure by instruction: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions: | ||
| # CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpbusd %xmm0, %xmm1, %xmm2 | ||
| # CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusd (%rax), %xmm1, %xmm2 | ||
| # CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpbusd %ymm0, %ymm1, %ymm2 | ||
| # CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusd (%rax), %ymm1, %ymm2 | ||
| # CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpbusds %xmm0, %xmm1, %xmm2 | ||
| # CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusds (%rax), %xmm1, %xmm2 | ||
| # CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpbusds %ymm0, %ymm1, %ymm2 | ||
| # CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpbusds (%rax), %ymm1, %ymm2 | ||
| # CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpwssd %xmm0, %xmm1, %xmm2 | ||
| # CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssd (%rax), %xmm1, %xmm2 | ||
| # CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpwssd %ymm0, %ymm1, %ymm2 | ||
| # CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssd (%rax), %ymm1, %ymm2 | ||
| # CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpwssds %xmm0, %xmm1, %xmm2 | ||
| # CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssds (%rax), %xmm1, %xmm2 | ||
| # CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - vpdpwssds %ymm0, %ymm1, %ymm2 | ||
| # CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpdpwssds (%rax), %ymm1, %ymm2 |
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,135 @@ | ||
| # NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py | ||
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver4 -instruction-tables < %s | FileCheck %s | ||
|
|
||
| andn %eax, %ebx, %ecx | ||
| andn (%rax), %ebx, %ecx | ||
|
|
||
| andn %rax, %rbx, %rcx | ||
| andn (%rax), %rbx, %rcx | ||
|
|
||
| bextr %eax, %ebx, %ecx | ||
| bextr %eax, (%rbx), %ecx | ||
|
|
||
| bextr %rax, %rbx, %rcx | ||
| bextr %rax, (%rbx), %rcx | ||
|
|
||
| blsi %eax, %ecx | ||
| blsi (%rax), %ecx | ||
|
|
||
| blsi %rax, %rcx | ||
| blsi (%rax), %rcx | ||
|
|
||
| blsmsk %eax, %ecx | ||
| blsmsk (%rax), %ecx | ||
|
|
||
| blsmsk %rax, %rcx | ||
| blsmsk (%rax), %rcx | ||
|
|
||
| blsr %eax, %ecx | ||
| blsr (%rax), %ecx | ||
|
|
||
| blsr %rax, %rcx | ||
| blsr (%rax), %rcx | ||
|
|
||
| tzcnt %ax, %cx | ||
| tzcnt (%rax), %cx | ||
|
|
||
| tzcnt %eax, %ecx | ||
| tzcnt (%rax), %ecx | ||
|
|
||
| tzcnt %rax, %rcx | ||
| tzcnt (%rax), %rcx | ||
|
|
||
| # CHECK: Instruction Info: | ||
| # CHECK-NEXT: [1]: #uOps | ||
| # CHECK-NEXT: [2]: Latency | ||
| # CHECK-NEXT: [3]: RThroughput | ||
| # CHECK-NEXT: [4]: MayLoad | ||
| # CHECK-NEXT: [5]: MayStore | ||
| # CHECK-NEXT: [6]: HasSideEffects (U) | ||
|
|
||
| # CHECK: [1] [2] [3] [4] [5] [6] Instructions: | ||
| # CHECK-NEXT: 1 1 0.25 andnl %eax, %ebx, %ecx | ||
| # CHECK-NEXT: 1 5 0.33 * andnl (%rax), %ebx, %ecx | ||
| # CHECK-NEXT: 1 1 0.25 andnq %rax, %rbx, %rcx | ||
| # CHECK-NEXT: 1 5 0.33 * andnq (%rax), %rbx, %rcx | ||
| # CHECK-NEXT: 1 1 0.50 bextrl %eax, %ebx, %ecx | ||
| # CHECK-NEXT: 2 5 0.50 * bextrl %eax, (%rbx), %ecx | ||
| # CHECK-NEXT: 1 1 0.50 bextrq %rax, %rbx, %rcx | ||
| # CHECK-NEXT: 2 5 0.50 * bextrq %rax, (%rbx), %rcx | ||
| # CHECK-NEXT: 1 1 0.25 blsil %eax, %ecx | ||
| # CHECK-NEXT: 2 5 0.33 * blsil (%rax), %ecx | ||
| # CHECK-NEXT: 1 1 0.25 blsiq %rax, %rcx | ||
| # CHECK-NEXT: 2 5 0.33 * blsiq (%rax), %rcx | ||
| # CHECK-NEXT: 1 1 0.25 blsmskl %eax, %ecx | ||
| # CHECK-NEXT: 2 5 0.33 * blsmskl (%rax), %ecx | ||
| # CHECK-NEXT: 1 1 0.25 blsmskq %rax, %rcx | ||
| # CHECK-NEXT: 2 5 0.33 * blsmskq (%rax), %rcx | ||
| # CHECK-NEXT: 1 1 0.25 blsrl %eax, %ecx | ||
| # CHECK-NEXT: 2 5 0.33 * blsrl (%rax), %ecx | ||
| # CHECK-NEXT: 1 1 0.25 blsrq %rax, %rcx | ||
| # CHECK-NEXT: 2 5 0.33 * blsrq (%rax), %rcx | ||
| # CHECK-NEXT: 2 2 1.00 tzcntw %ax, %cx | ||
| # CHECK-NEXT: 2 6 0.50 * tzcntw (%rax), %cx | ||
| # CHECK-NEXT: 2 2 0.50 tzcntl %eax, %ecx | ||
| # CHECK-NEXT: 2 6 0.50 * tzcntl (%rax), %ecx | ||
| # CHECK-NEXT: 2 2 0.50 tzcntq %rax, %rcx | ||
| # CHECK-NEXT: 2 6 0.50 * tzcntq (%rax), %rcx | ||
|
|
||
| # CHECK: Resources: | ||
| # CHECK-NEXT: [0] - Zn4AGU0 | ||
| # CHECK-NEXT: [1] - Zn4AGU1 | ||
| # CHECK-NEXT: [2] - Zn4AGU2 | ||
| # CHECK-NEXT: [3] - Zn4ALU0 | ||
| # CHECK-NEXT: [4] - Zn4ALU1 | ||
| # CHECK-NEXT: [5] - Zn4ALU2 | ||
| # CHECK-NEXT: [6] - Zn4ALU3 | ||
| # CHECK-NEXT: [7] - Zn4BRU1 | ||
| # CHECK-NEXT: [8] - Zn4FP0 | ||
| # CHECK-NEXT: [9] - Zn4FP1 | ||
| # CHECK-NEXT: [10] - Zn4FP2 | ||
| # CHECK-NEXT: [11] - Zn4FP3 | ||
| # CHECK-NEXT: [12.0] - Zn4FP45 | ||
| # CHECK-NEXT: [12.1] - Zn4FP45 | ||
| # CHECK-NEXT: [13] - Zn4FPSt | ||
| # CHECK-NEXT: [14.0] - Zn4LSU | ||
| # CHECK-NEXT: [14.1] - Zn4LSU | ||
| # CHECK-NEXT: [14.2] - Zn4LSU | ||
| # CHECK-NEXT: [15.0] - Zn4Load | ||
| # CHECK-NEXT: [15.1] - Zn4Load | ||
| # CHECK-NEXT: [15.2] - Zn4Load | ||
| # CHECK-NEXT: [16.0] - Zn4Store | ||
| # CHECK-NEXT: [16.1] - Zn4Store | ||
|
|
||
| # CHECK: Resource pressure per iteration: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] | ||
| # CHECK-NEXT: 4.33 4.33 4.33 5.00 9.50 9.50 5.00 - - - - - - - - 4.33 4.33 4.33 4.33 4.33 4.33 - - | ||
|
|
||
| # CHECK: Resource pressure by instruction: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions: | ||
| # CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - andnl %eax, %ebx, %ecx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - andnl (%rax), %ebx, %ecx | ||
| # CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - andnq %rax, %rbx, %rcx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - andnq (%rax), %rbx, %rcx | ||
| # CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - bextrl %eax, %ebx, %ecx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - bextrl %eax, (%rbx), %ecx | ||
| # CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - bextrq %rax, %rbx, %rcx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - bextrq %rax, (%rbx), %rcx | ||
| # CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - blsil %eax, %ecx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - blsil (%rax), %ecx | ||
| # CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - blsiq %rax, %rcx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - blsiq (%rax), %rcx | ||
| # CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - blsmskl %eax, %ecx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - blsmskl (%rax), %ecx | ||
| # CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - blsmskq %rax, %rcx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - blsmskq (%rax), %rcx | ||
| # CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - blsrl %eax, %ecx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - blsrl (%rax), %ecx | ||
| # CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - blsrq %rax, %rcx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - blsrq (%rax), %rcx | ||
| # CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - tzcntw %ax, %cx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - tzcntw (%rax), %cx | ||
| # CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - tzcntl %eax, %ecx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - tzcntl (%rax), %ecx | ||
| # CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - tzcntq %rax, %rcx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - tzcntq (%rax), %rcx |
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,156 @@ | ||
| # NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py | ||
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver4 -instruction-tables < %s | FileCheck %s | ||
|
|
||
| bzhi %eax, %ebx, %ecx | ||
| bzhi %eax, (%rbx), %ecx | ||
|
|
||
| bzhi %rax, %rbx, %rcx | ||
| bzhi %rax, (%rbx), %rcx | ||
|
|
||
| mulx %eax, %ebx, %ecx | ||
| mulx (%rax), %ebx, %ecx | ||
|
|
||
| mulx %rax, %rbx, %rcx | ||
| mulx (%rax), %rbx, %rcx | ||
|
|
||
| pdep %eax, %ebx, %ecx | ||
| pdep (%rax), %ebx, %ecx | ||
|
|
||
| pdep %rax, %rbx, %rcx | ||
| pdep (%rax), %rbx, %rcx | ||
|
|
||
| pext %eax, %ebx, %ecx | ||
| pext (%rax), %ebx, %ecx | ||
|
|
||
| pext %rax, %rbx, %rcx | ||
| pext (%rax), %rbx, %rcx | ||
|
|
||
| rorx $1, %eax, %ecx | ||
| rorx $1, (%rax), %ecx | ||
|
|
||
| rorx $1, %rax, %rcx | ||
| rorx $1, (%rax), %rcx | ||
|
|
||
| sarx %eax, %ebx, %ecx | ||
| sarx %eax, (%rbx), %ecx | ||
|
|
||
| sarx %rax, %rbx, %rcx | ||
| sarx %rax, (%rbx), %rcx | ||
|
|
||
| shlx %eax, %ebx, %ecx | ||
| shlx %eax, (%rbx), %ecx | ||
|
|
||
| shlx %rax, %rbx, %rcx | ||
| shlx %rax, (%rbx), %rcx | ||
|
|
||
| shrx %eax, %ebx, %ecx | ||
| shrx %eax, (%rbx), %ecx | ||
|
|
||
| shrx %rax, %rbx, %rcx | ||
| shrx %rax, (%rbx), %rcx | ||
|
|
||
| # CHECK: Instruction Info: | ||
| # CHECK-NEXT: [1]: #uOps | ||
| # CHECK-NEXT: [2]: Latency | ||
| # CHECK-NEXT: [3]: RThroughput | ||
| # CHECK-NEXT: [4]: MayLoad | ||
| # CHECK-NEXT: [5]: MayStore | ||
| # CHECK-NEXT: [6]: HasSideEffects (U) | ||
|
|
||
| # CHECK: [1] [2] [3] [4] [5] [6] Instructions: | ||
| # CHECK-NEXT: 1 1 0.50 bzhil %eax, %ebx, %ecx | ||
| # CHECK-NEXT: 2 5 0.50 * bzhil %eax, (%rbx), %ecx | ||
| # CHECK-NEXT: 1 1 0.50 bzhiq %rax, %rbx, %rcx | ||
| # CHECK-NEXT: 2 5 0.50 * bzhiq %rax, (%rbx), %rcx | ||
| # CHECK-NEXT: 2 4 1.00 mulxl %eax, %ebx, %ecx | ||
| # CHECK-NEXT: 2 8 1.00 * mulxl (%rax), %ebx, %ecx | ||
| # CHECK-NEXT: 2 4 1.00 mulxq %rax, %rbx, %rcx | ||
| # CHECK-NEXT: 2 8 1.00 * mulxq (%rax), %rbx, %rcx | ||
| # CHECK-NEXT: 1 3 1.00 pdepl %eax, %ebx, %ecx | ||
| # CHECK-NEXT: 1 5 0.33 * pdepl (%rax), %ebx, %ecx | ||
| # CHECK-NEXT: 1 3 1.00 pdepq %rax, %rbx, %rcx | ||
| # CHECK-NEXT: 1 5 0.33 * pdepq (%rax), %rbx, %rcx | ||
| # CHECK-NEXT: 1 3 1.00 pextl %eax, %ebx, %ecx | ||
| # CHECK-NEXT: 1 5 0.33 * pextl (%rax), %ebx, %ecx | ||
| # CHECK-NEXT: 1 3 1.00 pextq %rax, %rbx, %rcx | ||
| # CHECK-NEXT: 1 5 0.33 * pextq (%rax), %rbx, %rcx | ||
| # CHECK-NEXT: 1 1 0.50 rorxl $1, %eax, %ecx | ||
| # CHECK-NEXT: 2 5 0.50 * rorxl $1, (%rax), %ecx | ||
| # CHECK-NEXT: 1 1 0.50 rorxq $1, %rax, %rcx | ||
| # CHECK-NEXT: 2 5 0.50 * rorxq $1, (%rax), %rcx | ||
| # CHECK-NEXT: 1 1 0.50 sarxl %eax, %ebx, %ecx | ||
| # CHECK-NEXT: 2 5 0.50 * sarxl %eax, (%rbx), %ecx | ||
| # CHECK-NEXT: 1 1 0.50 sarxq %rax, %rbx, %rcx | ||
| # CHECK-NEXT: 2 5 0.50 * sarxq %rax, (%rbx), %rcx | ||
| # CHECK-NEXT: 1 1 0.50 shlxl %eax, %ebx, %ecx | ||
| # CHECK-NEXT: 2 5 0.50 * shlxl %eax, (%rbx), %ecx | ||
| # CHECK-NEXT: 1 1 0.50 shlxq %rax, %rbx, %rcx | ||
| # CHECK-NEXT: 2 5 0.50 * shlxq %rax, (%rbx), %rcx | ||
| # CHECK-NEXT: 1 1 0.50 shrxl %eax, %ebx, %ecx | ||
| # CHECK-NEXT: 2 5 0.50 * shrxl %eax, (%rbx), %ecx | ||
| # CHECK-NEXT: 1 1 0.50 shrxq %rax, %rbx, %rcx | ||
| # CHECK-NEXT: 2 5 0.50 * shrxq %rax, (%rbx), %rcx | ||
|
|
||
| # CHECK: Resources: | ||
| # CHECK-NEXT: [0] - Zn4AGU0 | ||
| # CHECK-NEXT: [1] - Zn4AGU1 | ||
| # CHECK-NEXT: [2] - Zn4AGU2 | ||
| # CHECK-NEXT: [3] - Zn4ALU0 | ||
| # CHECK-NEXT: [4] - Zn4ALU1 | ||
| # CHECK-NEXT: [5] - Zn4ALU2 | ||
| # CHECK-NEXT: [6] - Zn4ALU3 | ||
| # CHECK-NEXT: [7] - Zn4BRU1 | ||
| # CHECK-NEXT: [8] - Zn4FP0 | ||
| # CHECK-NEXT: [9] - Zn4FP1 | ||
| # CHECK-NEXT: [10] - Zn4FP2 | ||
| # CHECK-NEXT: [11] - Zn4FP3 | ||
| # CHECK-NEXT: [12.0] - Zn4FP45 | ||
| # CHECK-NEXT: [12.1] - Zn4FP45 | ||
| # CHECK-NEXT: [13] - Zn4FPSt | ||
| # CHECK-NEXT: [14.0] - Zn4LSU | ||
| # CHECK-NEXT: [14.1] - Zn4LSU | ||
| # CHECK-NEXT: [14.2] - Zn4LSU | ||
| # CHECK-NEXT: [15.0] - Zn4Load | ||
| # CHECK-NEXT: [15.1] - Zn4Load | ||
| # CHECK-NEXT: [15.2] - Zn4Load | ||
| # CHECK-NEXT: [16.0] - Zn4Store | ||
| # CHECK-NEXT: [16.1] - Zn4Store | ||
|
|
||
| # CHECK: Resource pressure per iteration: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] | ||
| # CHECK-NEXT: 5.33 5.33 5.33 1.00 19.00 11.00 1.00 - - - - - - - - 5.33 5.33 5.33 5.33 5.33 5.33 - - | ||
|
|
||
| # CHECK: Resource pressure by instruction: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions: | ||
| # CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - bzhil %eax, %ebx, %ecx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - bzhil %eax, (%rbx), %ecx | ||
| # CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - bzhiq %rax, %rbx, %rcx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - bzhiq %rax, (%rbx), %rcx | ||
| # CHECK-NEXT: - - - - 1.00 - - - - - - - - - - - - - - - - - - mulxl %eax, %ebx, %ecx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 - 1.00 - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - mulxl (%rax), %ebx, %ecx | ||
| # CHECK-NEXT: - - - - 1.00 - - - - - - - - - - - - - - - - - - mulxq %rax, %rbx, %rcx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 - 1.00 - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - mulxq (%rax), %rbx, %rcx | ||
| # CHECK-NEXT: - - - - 1.00 - - - - - - - - - - - - - - - - - - pdepl %eax, %ebx, %ecx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - pdepl (%rax), %ebx, %ecx | ||
| # CHECK-NEXT: - - - - 1.00 - - - - - - - - - - - - - - - - - - pdepq %rax, %rbx, %rcx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - pdepq (%rax), %rbx, %rcx | ||
| # CHECK-NEXT: - - - - 1.00 - - - - - - - - - - - - - - - - - - pextl %eax, %ebx, %ecx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - pextl (%rax), %ebx, %ecx | ||
| # CHECK-NEXT: - - - - 1.00 - - - - - - - - - - - - - - - - - - pextq %rax, %rbx, %rcx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - pextq (%rax), %rbx, %rcx | ||
| # CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - rorxl $1, %eax, %ecx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - rorxl $1, (%rax), %ecx | ||
| # CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - rorxq $1, %rax, %rcx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - rorxq $1, (%rax), %rcx | ||
| # CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - sarxl %eax, %ebx, %ecx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - sarxl %eax, (%rbx), %ecx | ||
| # CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - sarxq %rax, %rbx, %rcx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - sarxq %rax, (%rbx), %rcx | ||
| # CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - shlxl %eax, %ebx, %ecx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - shlxl %eax, (%rbx), %ecx | ||
| # CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - shlxq %rax, %rbx, %rcx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - shlxq %rax, (%rbx), %rcx | ||
| # CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - shrxl %eax, %ebx, %ecx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - shrxl %eax, (%rbx), %ecx | ||
| # CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - shrxq %rax, %rbx, %rcx | ||
| # CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - shrxq %rax, (%rbx), %rcx |
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,48 @@ | ||
| # NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py | ||
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver4 -instruction-tables < %s | FileCheck %s | ||
|
|
||
| clflushopt (%rax) | ||
|
|
||
| # CHECK: Instruction Info: | ||
| # CHECK-NEXT: [1]: #uOps | ||
| # CHECK-NEXT: [2]: Latency | ||
| # CHECK-NEXT: [3]: RThroughput | ||
| # CHECK-NEXT: [4]: MayLoad | ||
| # CHECK-NEXT: [5]: MayStore | ||
| # CHECK-NEXT: [6]: HasSideEffects (U) | ||
|
|
||
| # CHECK: [1] [2] [3] [4] [5] [6] Instructions: | ||
| # CHECK-NEXT: 1 5 0.33 * * U clflushopt (%rax) | ||
|
|
||
| # CHECK: Resources: | ||
| # CHECK-NEXT: [0] - Zn4AGU0 | ||
| # CHECK-NEXT: [1] - Zn4AGU1 | ||
| # CHECK-NEXT: [2] - Zn4AGU2 | ||
| # CHECK-NEXT: [3] - Zn4ALU0 | ||
| # CHECK-NEXT: [4] - Zn4ALU1 | ||
| # CHECK-NEXT: [5] - Zn4ALU2 | ||
| # CHECK-NEXT: [6] - Zn4ALU3 | ||
| # CHECK-NEXT: [7] - Zn4BRU1 | ||
| # CHECK-NEXT: [8] - Zn4FP0 | ||
| # CHECK-NEXT: [9] - Zn4FP1 | ||
| # CHECK-NEXT: [10] - Zn4FP2 | ||
| # CHECK-NEXT: [11] - Zn4FP3 | ||
| # CHECK-NEXT: [12.0] - Zn4FP45 | ||
| # CHECK-NEXT: [12.1] - Zn4FP45 | ||
| # CHECK-NEXT: [13] - Zn4FPSt | ||
| # CHECK-NEXT: [14.0] - Zn4LSU | ||
| # CHECK-NEXT: [14.1] - Zn4LSU | ||
| # CHECK-NEXT: [14.2] - Zn4LSU | ||
| # CHECK-NEXT: [15.0] - Zn4Load | ||
| # CHECK-NEXT: [15.1] - Zn4Load | ||
| # CHECK-NEXT: [15.2] - Zn4Load | ||
| # CHECK-NEXT: [16.0] - Zn4Store | ||
| # CHECK-NEXT: [16.1] - Zn4Store | ||
|
|
||
| # CHECK: Resource pressure per iteration: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] | ||
| # CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - | ||
|
|
||
| # CHECK: Resource pressure by instruction: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions: | ||
| # CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - clflushopt (%rax) |
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,48 @@ | ||
| # NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py | ||
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver4 -instruction-tables < %s | FileCheck %s | ||
|
|
||
| clwb (%rax) | ||
|
|
||
| # CHECK: Instruction Info: | ||
| # CHECK-NEXT: [1]: #uOps | ||
| # CHECK-NEXT: [2]: Latency | ||
| # CHECK-NEXT: [3]: RThroughput | ||
| # CHECK-NEXT: [4]: MayLoad | ||
| # CHECK-NEXT: [5]: MayStore | ||
| # CHECK-NEXT: [6]: HasSideEffects (U) | ||
|
|
||
| # CHECK: [1] [2] [3] [4] [5] [6] Instructions: | ||
| # CHECK-NEXT: 1 5 0.33 * * U clwb (%rax) | ||
|
|
||
| # CHECK: Resources: | ||
| # CHECK-NEXT: [0] - Zn4AGU0 | ||
| # CHECK-NEXT: [1] - Zn4AGU1 | ||
| # CHECK-NEXT: [2] - Zn4AGU2 | ||
| # CHECK-NEXT: [3] - Zn4ALU0 | ||
| # CHECK-NEXT: [4] - Zn4ALU1 | ||
| # CHECK-NEXT: [5] - Zn4ALU2 | ||
| # CHECK-NEXT: [6] - Zn4ALU3 | ||
| # CHECK-NEXT: [7] - Zn4BRU1 | ||
| # CHECK-NEXT: [8] - Zn4FP0 | ||
| # CHECK-NEXT: [9] - Zn4FP1 | ||
| # CHECK-NEXT: [10] - Zn4FP2 | ||
| # CHECK-NEXT: [11] - Zn4FP3 | ||
| # CHECK-NEXT: [12.0] - Zn4FP45 | ||
| # CHECK-NEXT: [12.1] - Zn4FP45 | ||
| # CHECK-NEXT: [13] - Zn4FPSt | ||
| # CHECK-NEXT: [14.0] - Zn4LSU | ||
| # CHECK-NEXT: [14.1] - Zn4LSU | ||
| # CHECK-NEXT: [14.2] - Zn4LSU | ||
| # CHECK-NEXT: [15.0] - Zn4Load | ||
| # CHECK-NEXT: [15.1] - Zn4Load | ||
| # CHECK-NEXT: [15.2] - Zn4Load | ||
| # CHECK-NEXT: [16.0] - Zn4Store | ||
| # CHECK-NEXT: [16.1] - Zn4Store | ||
|
|
||
| # CHECK: Resource pressure per iteration: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] | ||
| # CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - | ||
|
|
||
| # CHECK: Resource pressure by instruction: | ||
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions: | ||
| # CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - clwb (%rax) |