130 lines
11 KiB
ArmAsm
130 lines
11 KiB
ArmAsm
|
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||
|
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver4 -instruction-tables < %s | FileCheck %s
|
||
|
|
||
|
# vpermb, zmm operands: register-source and (%rax) memory-source forms, each
# written unmasked, with a {k1} mask, and with {k1}{z}. The order of these
# lines must match the order of the autogenerated assertion rows in this file.
vpermb %zmm16, %zmm17, %zmm19
|
||
|
vpermb (%rax), %zmm17, %zmm19
|
||
|
vpermb %zmm16, %zmm17, %zmm19 {k1}
|
||
|
vpermb (%rax), %zmm17, %zmm19 {k1}
|
||
|
vpermb %zmm16, %zmm17, %zmm19 {k1}{z}
|
||
|
vpermb (%rax), %zmm17, %zmm19 {k1}{z}
|
||
|
|
||
|
# vpermi2b, zmm operands: register-source and (%rax) memory-source forms, each
# written unmasked, with a {k1} mask, and with {k1}{z}. The order of these
# lines must match the order of the autogenerated assertion rows in this file.
vpermi2b %zmm16, %zmm17, %zmm19
|
||
|
vpermi2b (%rax), %zmm17, %zmm19
|
||
|
vpermi2b %zmm16, %zmm17, %zmm19 {k1}
|
||
|
vpermi2b (%rax), %zmm17, %zmm19 {k1}
|
||
|
vpermi2b %zmm16, %zmm17, %zmm19 {k1}{z}
|
||
|
vpermi2b (%rax), %zmm17, %zmm19 {k1}{z}
|
||
|
|
||
|
# vpermt2b, zmm operands: register-source and (%rax) memory-source forms, each
# written unmasked, with a {k1} mask, and with {k1}{z}. The order of these
# lines must match the order of the autogenerated assertion rows in this file.
vpermt2b %zmm16, %zmm17, %zmm19
|
||
|
vpermt2b (%rax), %zmm17, %zmm19
|
||
|
vpermt2b %zmm16, %zmm17, %zmm19 {k1}
|
||
|
vpermt2b (%rax), %zmm17, %zmm19 {k1}
|
||
|
vpermt2b %zmm16, %zmm17, %zmm19 {k1}{z}
|
||
|
vpermt2b (%rax), %zmm17, %zmm19 {k1}{z}
|
||
|
|
||
|
# vpmultishiftqb, zmm operands: register-source, (%rax) memory-source, and
# (%rax){1to8} memory-source forms, each written unmasked, with a {k1} mask,
# and with {k1}{z}. The order of these lines must match the order of the
# autogenerated assertion rows in this file.
vpmultishiftqb %zmm16, %zmm17, %zmm19
|
||
|
vpmultishiftqb (%rax), %zmm17, %zmm19
|
||
|
vpmultishiftqb (%rax){1to8}, %zmm17, %zmm19
|
||
|
vpmultishiftqb %zmm16, %zmm17, %zmm19 {k1}
|
||
|
vpmultishiftqb (%rax), %zmm17, %zmm19 {k1}
|
||
|
vpmultishiftqb (%rax){1to8}, %zmm17, %zmm19 {k1}
|
||
|
vpmultishiftqb %zmm16, %zmm17, %zmm19 {k1}{z}
|
||
|
vpmultishiftqb (%rax), %zmm17, %zmm19 {k1}{z}
|
||
|
vpmultishiftqb (%rax){1to8}, %zmm17, %zmm19 {k1}{z}
|
||
|
|
||
|
# CHECK: Instruction Info:
|
||
|
# CHECK-NEXT: [1]: #uOps
|
||
|
# CHECK-NEXT: [2]: Latency
|
||
|
# CHECK-NEXT: [3]: RThroughput
|
||
|
# CHECK-NEXT: [4]: MayLoad
|
||
|
# CHECK-NEXT: [5]: MayStore
|
||
|
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||
|
|
||
|
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||
|
# CHECK-NEXT: 1 5 1.00 vpermb %zmm16, %zmm17, %zmm19
|
||
|
# CHECK-NEXT: 2 8 0.50 * vpermb (%rax), %zmm17, %zmm19
|
||
|
# CHECK-NEXT: 1 5 1.00 vpermb %zmm16, %zmm17, %zmm19 {%k1}
|
||
|
# CHECK-NEXT: 2 8 0.50 * vpermb (%rax), %zmm17, %zmm19 {%k1}
|
||
|
# CHECK-NEXT: 1 5 1.00 vpermb %zmm16, %zmm17, %zmm19 {%k1} {z}
|
||
|
# CHECK-NEXT: 2 8 0.50 * vpermb (%rax), %zmm17, %zmm19 {%k1} {z}
|
||
|
# CHECK-NEXT: 1 5 1.00 vpermi2b %zmm16, %zmm17, %zmm19
|
||
|
# CHECK-NEXT: 2 8 0.50 * vpermi2b (%rax), %zmm17, %zmm19
|
||
|
# CHECK-NEXT: 1 5 1.00 vpermi2b %zmm16, %zmm17, %zmm19 {%k1}
|
||
|
# CHECK-NEXT: 2 8 0.50 * vpermi2b (%rax), %zmm17, %zmm19 {%k1}
|
||
|
# CHECK-NEXT: 1 5 1.00 vpermi2b %zmm16, %zmm17, %zmm19 {%k1} {z}
|
||
|
# CHECK-NEXT: 2 8 0.50 * vpermi2b (%rax), %zmm17, %zmm19 {%k1} {z}
|
||
|
# CHECK-NEXT: 1 5 1.00 vpermt2b %zmm16, %zmm17, %zmm19
|
||
|
# CHECK-NEXT: 2 8 0.50 * vpermt2b (%rax), %zmm17, %zmm19
|
||
|
# CHECK-NEXT: 1 5 1.00 vpermt2b %zmm16, %zmm17, %zmm19 {%k1}
|
||
|
# CHECK-NEXT: 2 8 0.50 * vpermt2b (%rax), %zmm17, %zmm19 {%k1}
|
||
|
# CHECK-NEXT: 1 5 1.00 vpermt2b %zmm16, %zmm17, %zmm19 {%k1} {z}
|
||
|
# CHECK-NEXT: 2 8 0.50 * vpermt2b (%rax), %zmm17, %zmm19 {%k1} {z}
|
||
|
# CHECK-NEXT: 1 1 0.50 vpmultishiftqb %zmm16, %zmm17, %zmm19
|
||
|
# CHECK-NEXT: 1 8 0.50 * vpmultishiftqb (%rax), %zmm17, %zmm19
|
||
|
# CHECK-NEXT: 1 8 0.50 * vpmultishiftqb (%rax){1to8}, %zmm17, %zmm19
|
||
|
# CHECK-NEXT: 1 1 0.50 vpmultishiftqb %zmm16, %zmm17, %zmm19 {%k1}
|
||
|
# CHECK-NEXT: 1 8 0.50 * vpmultishiftqb (%rax), %zmm17, %zmm19 {%k1}
|
||
|
# CHECK-NEXT: 1 8 0.50 * vpmultishiftqb (%rax){1to8}, %zmm17, %zmm19 {%k1}
|
||
|
# CHECK-NEXT: 1 1 0.50 vpmultishiftqb %zmm16, %zmm17, %zmm19 {%k1} {z}
|
||
|
# CHECK-NEXT: 1 8 0.50 * vpmultishiftqb (%rax), %zmm17, %zmm19 {%k1} {z}
|
||
|
# CHECK-NEXT: 1 8 0.50 * vpmultishiftqb (%rax){1to8}, %zmm17, %zmm19 {%k1} {z}
|
||
|
|
||
|
# CHECK: Resources:
|
||
|
# CHECK-NEXT: [0] - Zn4AGU0
|
||
|
# CHECK-NEXT: [1] - Zn4AGU1
|
||
|
# CHECK-NEXT: [2] - Zn4AGU2
|
||
|
# CHECK-NEXT: [3] - Zn4ALU0
|
||
|
# CHECK-NEXT: [4] - Zn4ALU1
|
||
|
# CHECK-NEXT: [5] - Zn4ALU2
|
||
|
# CHECK-NEXT: [6] - Zn4ALU3
|
||
|
# CHECK-NEXT: [7] - Zn4BRU1
|
||
|
# CHECK-NEXT: [8] - Zn4FP0
|
||
|
# CHECK-NEXT: [9] - Zn4FP1
|
||
|
# CHECK-NEXT: [10] - Zn4FP2
|
||
|
# CHECK-NEXT: [11] - Zn4FP3
|
||
|
# CHECK-NEXT: [12.0] - Zn4FP45
|
||
|
# CHECK-NEXT: [12.1] - Zn4FP45
|
||
|
# CHECK-NEXT: [13] - Zn4FPSt
|
||
|
# CHECK-NEXT: [14.0] - Zn4LSU
|
||
|
# CHECK-NEXT: [14.1] - Zn4LSU
|
||
|
# CHECK-NEXT: [14.2] - Zn4LSU
|
||
|
# CHECK-NEXT: [15.0] - Zn4Load
|
||
|
# CHECK-NEXT: [15.1] - Zn4Load
|
||
|
# CHECK-NEXT: [15.2] - Zn4Load
|
||
|
# CHECK-NEXT: [16.0] - Zn4Store
|
||
|
# CHECK-NEXT: [16.1] - Zn4Store
|
||
|
|
||
|
# CHECK: Resource pressure per iteration:
|
||
|
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||
|
# CHECK-NEXT: - - - - - - - - 4.50 18.00 18.00 4.50 7.50 7.50 - 5.00 5.00 5.00 5.00 5.00 5.00 - -
|
||
|
|
||
|
# CHECK: Resource pressure by instruction:
|
||
|
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||
|
# CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - vpermb %zmm16, %zmm17, %zmm19
|
||
|
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpermb (%rax), %zmm17, %zmm19
|
||
|
# CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - vpermb %zmm16, %zmm17, %zmm19 {%k1}
|
||
|
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpermb (%rax), %zmm17, %zmm19 {%k1}
|
||
|
# CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - vpermb %zmm16, %zmm17, %zmm19 {%k1} {z}
|
||
|
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpermb (%rax), %zmm17, %zmm19 {%k1} {z}
|
||
|
# CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - vpermi2b %zmm16, %zmm17, %zmm19
|
||
|
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpermi2b (%rax), %zmm17, %zmm19
|
||
|
# CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - vpermi2b %zmm16, %zmm17, %zmm19 {%k1}
|
||
|
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpermi2b (%rax), %zmm17, %zmm19 {%k1}
|
||
|
# CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - vpermi2b %zmm16, %zmm17, %zmm19 {%k1} {z}
|
||
|
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpermi2b (%rax), %zmm17, %zmm19 {%k1} {z}
|
||
|
# CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - vpermt2b %zmm16, %zmm17, %zmm19
|
||
|
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpermt2b (%rax), %zmm17, %zmm19
|
||
|
# CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - vpermt2b %zmm16, %zmm17, %zmm19 {%k1}
|
||
|
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpermt2b (%rax), %zmm17, %zmm19 {%k1}
|
||
|
# CHECK-NEXT: - - - - - - - - - 1.00 1.00 - - - - - - - - - - - - vpermt2b %zmm16, %zmm17, %zmm19 {%k1} {z}
|
||
|
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpermt2b (%rax), %zmm17, %zmm19 {%k1} {z}
|
||
|
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - vpmultishiftqb %zmm16, %zmm17, %zmm19
|
||
|
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpmultishiftqb (%rax), %zmm17, %zmm19
|
||
|
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpmultishiftqb (%rax){1to8}, %zmm17, %zmm19
|
||
|
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - vpmultishiftqb %zmm16, %zmm17, %zmm19 {%k1}
|
||
|
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpmultishiftqb (%rax), %zmm17, %zmm19 {%k1}
|
||
|
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpmultishiftqb (%rax){1to8}, %zmm17, %zmm19 {%k1}
|
||
|
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - vpmultishiftqb %zmm16, %zmm17, %zmm19 {%k1} {z}
|
||
|
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpmultishiftqb (%rax), %zmm17, %zmm19 {%k1} {z}
|
||
|
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vpmultishiftqb (%rax){1to8}, %zmm17, %zmm19 {%k1} {z}
|