# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=skylake-avx512 -instruction-tables < %s | FileCheck %s

# vpbroadcastmb2q / vpbroadcastmw2d: %k0 and %zmm16 operands.
vpbroadcastmb2q %k0, %zmm16

vpbroadcastmw2d %k0, %zmm16

# vpconflictd: %zmm16, (%rax) and (%rax){1to16} first operands, each written
# without a mask, with {k1}, and with {z}{k1}.
vpconflictd %zmm16, %zmm19
vpconflictd (%rax), %zmm19
vpconflictd (%rax){1to16}, %zmm19
vpconflictd %zmm16, %zmm19 {k1}
vpconflictd (%rax), %zmm19 {k1}
vpconflictd (%rax){1to16}, %zmm19 {k1}
vpconflictd %zmm16, %zmm19 {z}{k1}
vpconflictd (%rax), %zmm19 {z}{k1}
vpconflictd (%rax){1to16}, %zmm19 {z}{k1}

# vpconflictq: %zmm16, (%rax) and (%rax){1to8} first operands, each written
# without a mask, with {k1}, and with {z}{k1}.
vpconflictq %zmm16, %zmm19
vpconflictq (%rax), %zmm19
vpconflictq (%rax){1to8}, %zmm19
vpconflictq %zmm16, %zmm19 {k1}
vpconflictq (%rax), %zmm19 {k1}
vpconflictq (%rax){1to8}, %zmm19 {k1}
vpconflictq %zmm16, %zmm19 {z}{k1}
vpconflictq (%rax), %zmm19 {z}{k1}
vpconflictq (%rax){1to8}, %zmm19 {z}{k1}

# vplzcntd: %zmm16, (%rax) and (%rax){1to16} first operands, each written
# without a mask, with {k1}, and with {z}{k1}.
vplzcntd %zmm16, %zmm19
vplzcntd (%rax), %zmm19
vplzcntd (%rax){1to16}, %zmm19
vplzcntd %zmm16, %zmm19 {k1}
vplzcntd (%rax), %zmm19 {k1}
vplzcntd (%rax){1to16}, %zmm19 {k1}
vplzcntd %zmm16, %zmm19 {z}{k1}
vplzcntd (%rax), %zmm19 {z}{k1}
vplzcntd (%rax){1to16}, %zmm19 {z}{k1}

# vplzcntq: %zmm16, (%rax) and (%rax){1to8} first operands, each written
# without a mask, with {k1}, and with {z}{k1}.
vplzcntq %zmm16, %zmm19
vplzcntq (%rax), %zmm19
vplzcntq (%rax){1to8}, %zmm19
vplzcntq %zmm16, %zmm19 {k1}
vplzcntq (%rax), %zmm19 {k1}
vplzcntq (%rax){1to8}, %zmm19 {k1}
vplzcntq %zmm16, %zmm19 {z}{k1}
vplzcntq (%rax), %zmm19 {z}{k1}
vplzcntq (%rax){1to8}, %zmm19 {z}{k1}

# CHECK: Instruction Info:
# CHECK-NEXT: [1]: #uOps
# CHECK-NEXT: [2]: Latency
# CHECK-NEXT: [3]: RThroughput
# CHECK-NEXT: [4]: MayLoad
# CHECK-NEXT: [5]: MayStore
# CHECK-NEXT: [6]: HasSideEffects (U)

# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
# CHECK-NEXT: 1 1 1.00 vpbroadcastmb2q %k0, %zmm16
# CHECK-NEXT: 1 1 1.00 vpbroadcastmw2d %k0, %zmm16
# CHECK-NEXT: 35 67 17.00 vpconflictd %zmm16, %zmm19
# CHECK-NEXT: 36 74 17.00 * vpconflictd (%rax), %zmm19
# CHECK-NEXT: 36 74 17.00 * vpconflictd (%rax){1to16}, %zmm19
# CHECK-NEXT: 35 67 17.00 vpconflictd %zmm16, %zmm19 {%k1}
# CHECK-NEXT: 36 74 17.00 * vpconflictd (%rax), %zmm19 {%k1}
# CHECK-NEXT: 36 74 17.00 * vpconflictd (%rax){1to16}, %zmm19 {%k1}
# CHECK-NEXT: 35 67 17.00 vpconflictd %zmm16, %zmm19 {%k1} {z}
# CHECK-NEXT: 36 74 17.00 * vpconflictd (%rax), %zmm19 {%k1} {z}
# CHECK-NEXT: 36 74 17.00 * vpconflictd (%rax){1to16}, %zmm19 {%k1} {z}
# CHECK-NEXT: 21 37 9.00 vpconflictq %zmm16, %zmm19
# CHECK-NEXT: 22 44 9.00 * vpconflictq (%rax), %zmm19
# CHECK-NEXT: 22 44 9.00 * vpconflictq (%rax){1to8}, %zmm19
# CHECK-NEXT: 21 37 9.00 vpconflictq %zmm16, %zmm19 {%k1}
# CHECK-NEXT: 22 44 9.00 * vpconflictq (%rax), %zmm19 {%k1}
# CHECK-NEXT: 22 44 9.00 * vpconflictq (%rax){1to8}, %zmm19 {%k1}
# CHECK-NEXT: 21 37 9.00 vpconflictq %zmm16, %zmm19 {%k1} {z}
# CHECK-NEXT: 22 44 9.00 * vpconflictq (%rax), %zmm19 {%k1} {z}
# CHECK-NEXT: 22 44 9.00 * vpconflictq (%rax){1to8}, %zmm19 {%k1} {z}
# CHECK-NEXT: 1 5 0.50 vplzcntd %zmm16, %zmm19
# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax), %zmm19
# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax){1to16}, %zmm19
# CHECK-NEXT: 1 5 0.50 vplzcntd %zmm16, %zmm19 {%k1}
# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax), %zmm19 {%k1}
# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax){1to16}, %zmm19 {%k1}
# CHECK-NEXT: 1 5 0.50 vplzcntd %zmm16, %zmm19 {%k1} {z}
# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax), %zmm19 {%k1} {z}
# CHECK-NEXT: 2 12 0.50 * vplzcntd (%rax){1to16}, %zmm19 {%k1} {z}
# CHECK-NEXT: 1 5 0.50 vplzcntq %zmm16, %zmm19
# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax), %zmm19
# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax){1to8}, %zmm19
# CHECK-NEXT: 1 5 0.50 vplzcntq %zmm16, %zmm19 {%k1}
# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax), %zmm19 {%k1}
# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax){1to8}, %zmm19 {%k1}
# CHECK-NEXT: 1 5 0.50 vplzcntq %zmm16, %zmm19 {%k1} {z}
# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax), %zmm19 {%k1} {z}
# CHECK-NEXT: 2 12 0.50 * vplzcntq (%rax){1to8}, %zmm19 {%k1} {z}

# CHECK: Resources:
# CHECK-NEXT: [0] - SKXDivider
# CHECK-NEXT: [1] - SKXFPDivider
# CHECK-NEXT: [2] - SKXPort0
# CHECK-NEXT: [3] - SKXPort1
# CHECK-NEXT: [4] - SKXPort2
# CHECK-NEXT: [5] - SKXPort3
# CHECK-NEXT: [6] - SKXPort4
# CHECK-NEXT: [7] - SKXPort5
# CHECK-NEXT: [8] - SKXPort6
# CHECK-NEXT: [9] - SKXPort7

# CHECK: Resource pressure per iteration:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9]
# CHECK-NEXT: - - 126.00 117.00 12.00 12.00 - 281.00 - -

# CHECK: Resource pressure by instruction:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] Instructions:
# CHECK-NEXT: - - - - - - - 1.00 - - vpbroadcastmb2q %k0, %zmm16
# CHECK-NEXT: - - - - - - - 1.00 - - vpbroadcastmw2d %k0, %zmm16
# CHECK-NEXT: - - 7.83 7.83 - - - 19.33 - - vpconflictd %zmm16, %zmm19
# CHECK-NEXT: - - 7.83 7.83 0.50 0.50 - 19.33 - - vpconflictd (%rax), %zmm19
# CHECK-NEXT: - - 7.83 7.83 0.50 0.50 - 19.33 - - vpconflictd (%rax){1to16}, %zmm19
# CHECK-NEXT: - - 7.83 7.83 - - - 19.33 - - vpconflictd %zmm16, %zmm19 {%k1}
# CHECK-NEXT: - - 7.83 7.83 0.50 0.50 - 19.33 - - vpconflictd (%rax), %zmm19 {%k1}
# CHECK-NEXT: - - 7.83 7.83 0.50 0.50 - 19.33 - - vpconflictd (%rax){1to16}, %zmm19 {%k1}
# CHECK-NEXT: - - 7.83 7.83 - - - 19.33 - - vpconflictd %zmm16, %zmm19 {%k1} {z}
# CHECK-NEXT: - - 7.83 7.83 0.50 0.50 - 19.33 - - vpconflictd (%rax), %zmm19 {%k1} {z}
# CHECK-NEXT: - - 7.83 7.83 0.50 0.50 - 19.33 - - vpconflictd (%rax){1to16}, %zmm19 {%k1} {z}
# CHECK-NEXT: - - 5.17 5.17 - - - 10.67 - - vpconflictq %zmm16, %zmm19
# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - vpconflictq (%rax), %zmm19
# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - vpconflictq (%rax){1to8}, %zmm19
# CHECK-NEXT: - - 5.17 5.17 - - - 10.67 - - vpconflictq %zmm16, %zmm19 {%k1}
# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - vpconflictq (%rax), %zmm19 {%k1}
# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - vpconflictq (%rax){1to8}, %zmm19 {%k1}
# CHECK-NEXT: - - 5.17 5.17 - - - 10.67 - - vpconflictq %zmm16, %zmm19 {%k1} {z}
# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - vpconflictq (%rax), %zmm19 {%k1} {z}
# CHECK-NEXT: - - 5.17 5.17 0.50 0.50 - 10.67 - - vpconflictq (%rax){1to8}, %zmm19 {%k1} {z}
# CHECK-NEXT: - - 0.50 - - - - 0.50 - - vplzcntd %zmm16, %zmm19
# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - vplzcntd (%rax), %zmm19
# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - vplzcntd (%rax){1to16}, %zmm19
# CHECK-NEXT: - - 0.50 - - - - 0.50 - - vplzcntd %zmm16, %zmm19 {%k1}
# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - vplzcntd (%rax), %zmm19 {%k1}
# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - vplzcntd (%rax){1to16}, %zmm19 {%k1}
# CHECK-NEXT: - - 0.50 - - - - 0.50 - - vplzcntd %zmm16, %zmm19 {%k1} {z}
# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - vplzcntd (%rax), %zmm19 {%k1} {z}
# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - vplzcntd (%rax){1to16}, %zmm19 {%k1} {z}
# CHECK-NEXT: - - 0.50 - - - - 0.50 - - vplzcntq %zmm16, %zmm19
# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - vplzcntq (%rax), %zmm19
# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - vplzcntq (%rax){1to8}, %zmm19
# CHECK-NEXT: - - 0.50 - - - - 0.50 - - vplzcntq %zmm16, %zmm19 {%k1}
# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - vplzcntq (%rax), %zmm19 {%k1}
# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - vplzcntq (%rax){1to8}, %zmm19 {%k1}
# CHECK-NEXT: - - 0.50 - - - - 0.50 - - vplzcntq %zmm16, %zmm19 {%k1} {z}
# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - vplzcntq (%rax), %zmm19 {%k1} {z}
# CHECK-NEXT: - - 0.50 - 0.50 0.50 - 0.50 - - vplzcntq (%rax){1to8}, %zmm19 {%k1} {z}