# Source-viewer banner (not part of the test input): 268 lines, 20 KiB, labelled "ArmAsm" by the viewer.
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s

# Test input (x86-64, AT&T operand order: source first, destination last).
# The lit command above pipes this whole file into llvm-mca for -mcpu=znver3
# with -instruction-tables and hands the report to FileCheck, so every
# non-comment line below must be a valid assembler statement.
#
# Each mnemonic appears in four forms, always writing register 2:
#   %mm0   -> %mm2     register source
#   (%rax) -> %mm2     memory source
#   %xmm0  -> %xmm2    register source
#   (%rax) -> %xmm2    memory source
# The expected tables list the instructions in exactly this order, so do not
# reorder or remove lines without regenerating the assertions.

# pabsb / pabsd / pabsw: packed absolute value.
pabsb %mm0, %mm2
pabsb (%rax), %mm2

pabsb %xmm0, %xmm2
pabsb (%rax), %xmm2

pabsd %mm0, %mm2
pabsd (%rax), %mm2

pabsd %xmm0, %xmm2
pabsd (%rax), %xmm2

pabsw %mm0, %mm2
pabsw (%rax), %mm2

pabsw %xmm0, %xmm2
pabsw (%rax), %xmm2

# palignr: packed align right; the only instruction here taking an immediate.
palignr $1, %mm0, %mm2
palignr $1, (%rax), %mm2

palignr $1, %xmm0, %xmm2
palignr $1, (%rax), %xmm2

# phaddd / phaddsw / phaddw: packed horizontal add.
phaddd %mm0, %mm2
phaddd (%rax), %mm2

phaddd %xmm0, %xmm2
phaddd (%rax), %xmm2

phaddsw %mm0, %mm2
phaddsw (%rax), %mm2

phaddsw %xmm0, %xmm2
phaddsw (%rax), %xmm2

phaddw %mm0, %mm2
phaddw (%rax), %mm2

phaddw %xmm0, %xmm2
phaddw (%rax), %xmm2

# phsubd / phsubsw / phsubw: packed horizontal subtract.
phsubd %mm0, %mm2
phsubd (%rax), %mm2

phsubd %xmm0, %xmm2
phsubd (%rax), %xmm2

phsubsw %mm0, %mm2
phsubsw (%rax), %mm2

phsubsw %xmm0, %xmm2
phsubsw (%rax), %xmm2

phsubw %mm0, %mm2
phsubw (%rax), %mm2

phsubw %xmm0, %xmm2
phsubw (%rax), %xmm2

# pmaddubsw / pmulhrsw: packed multiply forms.
pmaddubsw %mm0, %mm2
pmaddubsw (%rax), %mm2

pmaddubsw %xmm0, %xmm2
pmaddubsw (%rax), %xmm2

pmulhrsw %mm0, %mm2
pmulhrsw (%rax), %mm2

pmulhrsw %xmm0, %xmm2
pmulhrsw (%rax), %xmm2

# pshufb: packed shuffle bytes.
pshufb %mm0, %mm2
pshufb (%rax), %mm2

pshufb %xmm0, %xmm2
pshufb (%rax), %xmm2

# psignb / psignd / psignw: packed sign.
psignb %mm0, %mm2
psignb (%rax), %mm2

psignb %xmm0, %xmm2
psignb (%rax), %xmm2

psignd %mm0, %mm2
psignd (%rax), %mm2

psignd %xmm0, %xmm2
psignd (%rax), %xmm2

psignw %mm0, %mm2
psignw (%rax), %mm2

psignw %xmm0, %xmm2
psignw (%rax), %xmm2

# Expected "Instruction Info" table of the llvm-mca report. The legend names
# the six columns; after the column header there is one row per input
# instruction, in input order. Rows carrying '*' in the MayLoad column are the
# (%rax) memory-source forms. These assertions are autogenerated (see the NOTE
# at the top of the file); regenerate them instead of editing values by hand.
# CHECK: Instruction Info:
# CHECK-NEXT: [1]: #uOps
# CHECK-NEXT: [2]: Latency
# CHECK-NEXT: [3]: RThroughput
# CHECK-NEXT: [4]: MayLoad
# CHECK-NEXT: [5]: MayStore
# CHECK-NEXT: [6]: HasSideEffects (U)

# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
# CHECK-NEXT: 1 1 0.50 pabsb %mm0, %mm2
# CHECK-NEXT: 1 8 0.50 * pabsb (%rax), %mm2
# CHECK-NEXT: 1 1 0.50 pabsb %xmm0, %xmm2
# CHECK-NEXT: 1 8 0.50 * pabsb (%rax), %xmm2
# CHECK-NEXT: 1 1 0.50 pabsd %mm0, %mm2
# CHECK-NEXT: 1 8 0.50 * pabsd (%rax), %mm2
# CHECK-NEXT: 1 1 0.50 pabsd %xmm0, %xmm2
# CHECK-NEXT: 1 8 0.50 * pabsd (%rax), %xmm2
# CHECK-NEXT: 1 1 0.50 pabsw %mm0, %mm2
# CHECK-NEXT: 1 8 0.50 * pabsw (%rax), %mm2
# CHECK-NEXT: 1 1 0.50 pabsw %xmm0, %xmm2
# CHECK-NEXT: 1 8 0.50 * pabsw (%rax), %xmm2
# CHECK-NEXT: 1 1 0.50 palignr $1, %mm0, %mm2
# CHECK-NEXT: 1 8 0.50 * palignr $1, (%rax), %mm2
# CHECK-NEXT: 1 1 0.50 palignr $1, %xmm0, %xmm2
# CHECK-NEXT: 1 8 0.50 * palignr $1, (%rax), %xmm2
# CHECK-NEXT: 3 2 2.00 phaddd %mm0, %mm2
# CHECK-NEXT: 4 9 2.00 * phaddd (%rax), %mm2
# CHECK-NEXT: 4 2 2.00 phaddd %xmm0, %xmm2
# CHECK-NEXT: 4 9 2.00 * phaddd (%rax), %xmm2
# CHECK-NEXT: 3 2 2.00 phaddsw %mm0, %mm2
# CHECK-NEXT: 4 9 2.00 * phaddsw (%rax), %mm2
# CHECK-NEXT: 4 2 2.00 phaddsw %xmm0, %xmm2
# CHECK-NEXT: 4 9 2.00 * phaddsw (%rax), %xmm2
# CHECK-NEXT: 3 2 2.00 phaddw %mm0, %mm2
# CHECK-NEXT: 4 9 2.00 * phaddw (%rax), %mm2
# CHECK-NEXT: 4 2 2.00 phaddw %xmm0, %xmm2
# CHECK-NEXT: 4 9 2.00 * phaddw (%rax), %xmm2
# CHECK-NEXT: 3 2 2.00 phsubd %mm0, %mm2
# CHECK-NEXT: 4 9 2.00 * phsubd (%rax), %mm2
# CHECK-NEXT: 4 2 2.00 phsubd %xmm0, %xmm2
# CHECK-NEXT: 4 9 2.00 * phsubd (%rax), %xmm2
# CHECK-NEXT: 3 2 2.00 phsubsw %mm0, %mm2
# CHECK-NEXT: 4 9 2.00 * phsubsw (%rax), %mm2
# CHECK-NEXT: 4 2 2.00 phsubsw %xmm0, %xmm2
# CHECK-NEXT: 4 9 2.00 * phsubsw (%rax), %xmm2
# CHECK-NEXT: 3 2 2.00 phsubw %mm0, %mm2
# CHECK-NEXT: 4 9 2.00 * phsubw (%rax), %mm2
# CHECK-NEXT: 4 2 2.00 phsubw %xmm0, %xmm2
# CHECK-NEXT: 4 9 2.00 * phsubw (%rax), %xmm2
# CHECK-NEXT: 1 3 0.50 pmaddubsw %mm0, %mm2
# CHECK-NEXT: 1 10 0.50 * pmaddubsw (%rax), %mm2
# CHECK-NEXT: 1 3 0.50 pmaddubsw %xmm0, %xmm2
# CHECK-NEXT: 1 10 0.50 * pmaddubsw (%rax), %xmm2
# CHECK-NEXT: 1 3 0.50 pmulhrsw %mm0, %mm2
# CHECK-NEXT: 1 10 0.50 * pmulhrsw (%rax), %mm2
# CHECK-NEXT: 1 3 0.50 pmulhrsw %xmm0, %xmm2
# CHECK-NEXT: 1 10 0.50 * pmulhrsw (%rax), %xmm2
# CHECK-NEXT: 1 1 0.50 pshufb %mm0, %mm2
# CHECK-NEXT: 1 8 0.50 * pshufb (%rax), %mm2
# CHECK-NEXT: 1 1 0.50 pshufb %xmm0, %xmm2
# CHECK-NEXT: 1 8 0.50 * pshufb (%rax), %xmm2
# CHECK-NEXT: 1 1 0.50 psignb %mm0, %mm2
# CHECK-NEXT: 1 8 0.50 * psignb (%rax), %mm2
# CHECK-NEXT: 1 1 0.50 psignb %xmm0, %xmm2
# CHECK-NEXT: 1 8 0.50 * psignb (%rax), %xmm2
# CHECK-NEXT: 1 1 0.50 psignd %mm0, %mm2
# CHECK-NEXT: 1 8 0.50 * psignd (%rax), %mm2
# CHECK-NEXT: 1 1 0.50 psignd %xmm0, %xmm2
# CHECK-NEXT: 1 8 0.50 * psignd (%rax), %xmm2
# CHECK-NEXT: 1 1 0.50 psignw %mm0, %mm2
# CHECK-NEXT: 1 8 0.50 * psignw (%rax), %mm2
# CHECK-NEXT: 1 1 0.50 psignw %xmm0, %xmm2
# CHECK-NEXT: 1 8 0.50 * psignw (%rax), %xmm2

# Expected "Resources" legend of the llvm-mca report: it maps each bracketed
# column index used by the resource-pressure tables to a resource name.
# Indices with a ".N" suffix repeat the same resource name once per listed
# entry (e.g. [14.0]..[14.2] are all Zn3LSU).
# CHECK: Resources:
# CHECK-NEXT: [0] - Zn3AGU0
# CHECK-NEXT: [1] - Zn3AGU1
# CHECK-NEXT: [2] - Zn3AGU2
# CHECK-NEXT: [3] - Zn3ALU0
# CHECK-NEXT: [4] - Zn3ALU1
# CHECK-NEXT: [5] - Zn3ALU2
# CHECK-NEXT: [6] - Zn3ALU3
# CHECK-NEXT: [7] - Zn3BRU1
# CHECK-NEXT: [8] - Zn3FPP0
# CHECK-NEXT: [9] - Zn3FPP1
# CHECK-NEXT: [10] - Zn3FPP2
# CHECK-NEXT: [11] - Zn3FPP3
# CHECK-NEXT: [12.0] - Zn3FPP45
# CHECK-NEXT: [12.1] - Zn3FPP45
# CHECK-NEXT: [13] - Zn3FPSt
# CHECK-NEXT: [14.0] - Zn3LSU
# CHECK-NEXT: [14.1] - Zn3LSU
# CHECK-NEXT: [14.2] - Zn3LSU
# CHECK-NEXT: [15.0] - Zn3Load
# CHECK-NEXT: [15.1] - Zn3Load
# CHECK-NEXT: [15.2] - Zn3Load
# CHECK-NEXT: [16.0] - Zn3Store
# CHECK-NEXT: [16.1] - Zn3Store

# Expected "Resource pressure per iteration" row: one value per resource
# column, indexed as in the Resources legend; '-' marks a resource with no
# recorded pressure. The values agree (up to two-decimal rounding) with the
# column sums of the per-instruction pressure table that follows in this file.
# CHECK: Resource pressure per iteration:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
# CHECK-NEXT: - - - - - - - - 61.00 13.00 7.00 7.00 16.00 16.00 - 10.67 10.67 10.67 10.67 10.67 10.67 - -

# Expected "Resource pressure by instruction" table: one row per input
# instruction, in input order, with one value per resource column (indexed as
# in the Resources legend); '-' marks no recorded pressure. Only the (%rax)
# memory-source rows show values in the [12.x], [14.x] and [15.x] columns.
# Autogenerated; regenerate rather than hand-editing the numbers.
# CHECK: Resource pressure by instruction:
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - pabsb %mm0, %mm2
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pabsb (%rax), %mm2
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - pabsb %xmm0, %xmm2
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pabsb (%rax), %xmm2
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - pabsd %mm0, %mm2
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pabsd (%rax), %mm2
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - pabsd %xmm0, %xmm2
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pabsd (%rax), %xmm2
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - pabsw %mm0, %mm2
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pabsw (%rax), %mm2
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - pabsw %xmm0, %xmm2
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pabsw (%rax), %xmm2
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - palignr $1, %mm0, %mm2
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - palignr $1, (%rax), %mm2
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - palignr $1, %xmm0, %xmm2
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - palignr $1, (%rax), %xmm2
# CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phaddd %mm0, %mm2
# CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phaddd (%rax), %mm2
# CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phaddd %xmm0, %xmm2
# CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phaddd (%rax), %xmm2
# CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phaddsw %mm0, %mm2
# CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phaddsw (%rax), %mm2
# CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phaddsw %xmm0, %xmm2
# CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phaddsw (%rax), %xmm2
# CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phaddw %mm0, %mm2
# CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phaddw (%rax), %mm2
# CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phaddw %xmm0, %xmm2
# CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phaddw (%rax), %xmm2
# CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phsubd %mm0, %mm2
# CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phsubd (%rax), %mm2
# CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phsubd %xmm0, %xmm2
# CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phsubd (%rax), %xmm2
# CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phsubsw %mm0, %mm2
# CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phsubsw (%rax), %mm2
# CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phsubsw %xmm0, %xmm2
# CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phsubsw (%rax), %xmm2
# CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phsubw %mm0, %mm2
# CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phsubw (%rax), %mm2
# CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phsubw %xmm0, %xmm2
# CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phsubw (%rax), %xmm2
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - pmaddubsw %mm0, %mm2
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmaddubsw (%rax), %mm2
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - pmaddubsw %xmm0, %xmm2
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmaddubsw (%rax), %xmm2
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - pmulhrsw %mm0, %mm2
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmulhrsw (%rax), %mm2
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - pmulhrsw %xmm0, %xmm2
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmulhrsw (%rax), %xmm2
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - pshufb %mm0, %mm2
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pshufb (%rax), %mm2
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - pshufb %xmm0, %xmm2
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pshufb (%rax), %xmm2
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - psignb %mm0, %mm2
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psignb (%rax), %mm2
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - psignb %xmm0, %xmm2
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psignb (%rax), %xmm2
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - psignd %mm0, %mm2
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psignd (%rax), %mm2
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - psignd %xmm0, %xmm2
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psignd (%rax), %xmm2
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - psignw %mm0, %mm2
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psignw (%rax), %mm2
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - psignw %xmm0, %xmm2
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psignw (%rax), %xmm2