| # NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py |
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=skylake -timeline -register-file-stats -iterations=1 < %s | FileCheck %s |
| |
| # On SKL (Skylake), renamer-based zeroing does not work for: |
| # - 16 and 8-bit GPRs |
| # - MMX |
| # - ANDN variants |
| |
| # Input instruction stream for llvm-mca. Every instruction below uses one |
| # register for all of its source operands (sub/xor/pcmpgt/psub/andn of a |
| # value with itself), so the result is zero whatever the register holds. |
| # AT&T operand order: the last operand is the destination. |
| |
| # 32-bit and 64-bit GPR sub/xor of a register with itself. |
| subl %eax, %eax |
| subq %rax, %rax |
| xorl %eax, %eax |
| xorq %rax, %rax |
| |
| # pcmpgt{b,d,w} on an %mm register compared with itself. |
| pcmpgtb %mm2, %mm2 |
| pcmpgtd %mm2, %mm2 |
| # pcmpgtq %mm2, %mm2 # invalid operand for instruction |
| pcmpgtw %mm2, %mm2 |
| |
| # pcmpgt{b,d,q,w} on an %xmm register compared with itself (two-operand form). |
| pcmpgtb %xmm2, %xmm2 |
| pcmpgtd %xmm2, %xmm2 |
| pcmpgtq %xmm2, %xmm2 |
| pcmpgtw %xmm2, %xmm2 |
| |
| # Three-operand vpcmpgt* on %xmm: destination is the same register as the sources. |
| vpcmpgtb %xmm3, %xmm3, %xmm3 |
| vpcmpgtd %xmm3, %xmm3, %xmm3 |
| vpcmpgtq %xmm3, %xmm3, %xmm3 |
| vpcmpgtw %xmm3, %xmm3, %xmm3 |
| |
| # Three-operand vpcmpgt* on %xmm: identical sources, different destination (%xmm5). |
| vpcmpgtb %xmm3, %xmm3, %xmm5 |
| vpcmpgtd %xmm3, %xmm3, %xmm5 |
| vpcmpgtq %xmm3, %xmm3, %xmm5 |
| vpcmpgtw %xmm3, %xmm3, %xmm5 |
| |
| # Three-operand vpcmpgt* on %ymm: destination is the same register as the sources. |
| vpcmpgtb %ymm3, %ymm3, %ymm3 |
| vpcmpgtd %ymm3, %ymm3, %ymm3 |
| vpcmpgtq %ymm3, %ymm3, %ymm3 |
| vpcmpgtw %ymm3, %ymm3, %ymm3 |
| |
| # Three-operand vpcmpgt* on %ymm: identical sources, different destination (%ymm5). |
| vpcmpgtb %ymm3, %ymm3, %ymm5 |
| vpcmpgtd %ymm3, %ymm3, %ymm5 |
| vpcmpgtq %ymm3, %ymm3, %ymm5 |
| vpcmpgtw %ymm3, %ymm3, %ymm5 |
| |
| # psub*/vpsub* of a register with itself, result written back to that same |
| # register: %mm, then %xmm (two-operand), then three-operand %xmm and %ymm. |
| psubb %mm2, %mm2 |
| psubd %mm2, %mm2 |
| psubq %mm2, %mm2 |
| psubw %mm2, %mm2 |
| psubb %xmm2, %xmm2 |
| psubd %xmm2, %xmm2 |
| psubq %xmm2, %xmm2 |
| psubw %xmm2, %xmm2 |
| vpsubb %xmm3, %xmm3, %xmm3 |
| vpsubd %xmm3, %xmm3, %xmm3 |
| vpsubq %xmm3, %xmm3, %xmm3 |
| vpsubw %xmm3, %xmm3, %xmm3 |
| vpsubb %ymm3, %ymm3, %ymm3 |
| vpsubd %ymm3, %ymm3, %ymm3 |
| vpsubq %ymm3, %ymm3, %ymm3 |
| vpsubw %ymm3, %ymm3, %ymm3 |
| |
| # vpsub* with identical sources but a different destination (%xmm5 / %ymm5). |
| vpsubb %xmm3, %xmm3, %xmm5 |
| vpsubd %xmm3, %xmm3, %xmm5 |
| vpsubq %xmm3, %xmm3, %xmm5 |
| vpsubw %xmm3, %xmm3, %xmm5 |
| vpsubb %ymm3, %ymm3, %ymm5 |
| vpsubd %ymm3, %ymm3, %ymm5 |
| vpsubq %ymm3, %ymm3, %ymm5 |
| vpsubw %ymm3, %ymm3, %ymm5 |
| |
| # ANDN variants (andnps/andnpd/pandn and their v-prefixed forms) of a register |
| # with itself, result written back to that same register. |
| andnps %xmm0, %xmm0 |
| andnpd %xmm1, %xmm1 |
| vandnps %xmm2, %xmm2, %xmm2 |
| vandnpd %xmm1, %xmm1, %xmm1 |
| vandnps %ymm2, %ymm2, %ymm2 |
| vandnpd %ymm1, %ymm1, %ymm1 |
| pandn %mm2, %mm2 |
| pandn %xmm2, %xmm2 |
| vpandn %xmm3, %xmm3, %xmm3 |
| vpandn %ymm3, %ymm3, %ymm3 |
| |
| # ANDN variants with identical sources but a different destination (%xmm5 / %ymm5). |
| vandnps %xmm2, %xmm2, %xmm5 |
| vandnpd %xmm1, %xmm1, %xmm5 |
| vpandn %xmm3, %xmm3, %xmm5 |
| vandnps %ymm2, %ymm2, %ymm5 |
| vandnpd %ymm1, %ymm1, %ymm5 |
| vpandn %ymm3, %ymm3, %ymm5 |
| |
| # XOR variants (xorps/xorpd/pxor and their v-prefixed forms) of a register |
| # with itself, result written back to that same register. |
| xorps %xmm0, %xmm0 |
| xorpd %xmm1, %xmm1 |
| vxorps %xmm2, %xmm2, %xmm2 |
| vxorpd %xmm1, %xmm1, %xmm1 |
| vxorps %ymm2, %ymm2, %ymm2 |
| vxorpd %ymm1, %ymm1, %ymm1 |
| pxor %mm2, %mm2 |
| pxor %xmm2, %xmm2 |
| vpxor %xmm3, %xmm3, %xmm3 |
| vpxor %ymm3, %ymm3, %ymm3 |
| |
| # XOR variants with identical sources but a different destination register. |
| vxorps %xmm4, %xmm4, %xmm5 |
| vxorpd %xmm1, %xmm1, %xmm3 |
| vxorps %ymm4, %ymm4, %ymm5 |
| vxorpd %ymm1, %ymm1, %ymm3 |
| vpxor %xmm3, %xmm3, %xmm5 |
| vpxor %ymm3, %ymm3, %ymm5 |
| |
| # CHECK: Iterations: 1 |
| # CHECK-NEXT: Instructions: 83 |
| # CHECK-NEXT: Total Cycles: 34 |
| # CHECK-NEXT: Total uOps: 83 |
| |
| # CHECK: Dispatch Width: 6 |
| # CHECK-NEXT: uOps Per Cycle: 2.44 |
| # CHECK-NEXT: IPC: 2.44 |
| # CHECK-NEXT: Block RThroughput: 16.7 |
| |
| # CHECK: Instruction Info: |
| # CHECK-NEXT: [1]: #uOps |
| # CHECK-NEXT: [2]: Latency |
| # CHECK-NEXT: [3]: RThroughput |
| # CHECK-NEXT: [4]: MayLoad |
| # CHECK-NEXT: [5]: MayStore |
| # CHECK-NEXT: [6]: HasSideEffects (U) |
| |
| # CHECK: [1] [2] [3] [4] [5] [6] Instructions: |
| # CHECK-NEXT: 1 1 0.25 subl %eax, %eax |
| # CHECK-NEXT: 1 1 0.25 subq %rax, %rax |
| # CHECK-NEXT: 1 1 0.25 xorl %eax, %eax |
| # CHECK-NEXT: 1 1 0.25 xorq %rax, %rax |
| # CHECK-NEXT: 1 1 1.00 pcmpgtb %mm2, %mm2 |
| # CHECK-NEXT: 1 1 1.00 pcmpgtd %mm2, %mm2 |
| # CHECK-NEXT: 1 1 1.00 pcmpgtw %mm2, %mm2 |
| # CHECK-NEXT: 1 1 0.50 pcmpgtb %xmm2, %xmm2 |
| # CHECK-NEXT: 1 1 0.50 pcmpgtd %xmm2, %xmm2 |
| # CHECK-NEXT: 1 3 1.00 pcmpgtq %xmm2, %xmm2 |
| # CHECK-NEXT: 1 1 0.50 pcmpgtw %xmm2, %xmm2 |
| # CHECK-NEXT: 1 1 0.50 vpcmpgtb %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: 1 1 0.50 vpcmpgtd %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: 1 3 1.00 vpcmpgtq %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: 1 1 0.50 vpcmpgtw %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: 1 1 0.50 vpcmpgtb %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: 1 1 0.50 vpcmpgtd %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: 1 3 1.00 vpcmpgtq %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: 1 1 0.50 vpcmpgtw %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: 1 1 0.50 vpcmpgtb %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: 1 1 0.50 vpcmpgtd %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: 1 3 1.00 vpcmpgtq %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: 1 1 0.50 vpcmpgtw %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: 1 1 0.50 vpcmpgtb %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: 1 1 0.50 vpcmpgtd %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: 1 3 1.00 vpcmpgtq %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: 1 1 0.50 vpcmpgtw %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: 1 1 0.50 psubb %mm2, %mm2 |
| # CHECK-NEXT: 1 1 0.50 psubd %mm2, %mm2 |
| # CHECK-NEXT: 1 1 0.50 psubq %mm2, %mm2 |
| # CHECK-NEXT: 1 1 0.50 psubw %mm2, %mm2 |
| # CHECK-NEXT: 1 1 0.33 psubb %xmm2, %xmm2 |
| # CHECK-NEXT: 1 1 0.33 psubd %xmm2, %xmm2 |
| # CHECK-NEXT: 1 1 0.33 psubq %xmm2, %xmm2 |
| # CHECK-NEXT: 1 1 0.33 psubw %xmm2, %xmm2 |
| # CHECK-NEXT: 1 1 0.33 vpsubb %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: 1 1 0.33 vpsubd %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: 1 1 0.33 vpsubq %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: 1 1 0.33 vpsubw %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: 1 1 0.33 vpsubb %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: 1 1 0.33 vpsubd %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: 1 1 0.33 vpsubq %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: 1 1 0.33 vpsubw %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: 1 1 0.33 vpsubb %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: 1 1 0.33 vpsubd %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: 1 1 0.33 vpsubq %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: 1 1 0.33 vpsubw %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: 1 1 0.33 vpsubb %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: 1 1 0.33 vpsubd %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: 1 1 0.33 vpsubq %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: 1 1 0.33 vpsubw %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: 1 1 0.33 andnps %xmm0, %xmm0 |
| # CHECK-NEXT: 1 1 0.33 andnpd %xmm1, %xmm1 |
| # CHECK-NEXT: 1 1 0.33 vandnps %xmm2, %xmm2, %xmm2 |
| # CHECK-NEXT: 1 1 0.33 vandnpd %xmm1, %xmm1, %xmm1 |
| # CHECK-NEXT: 1 1 0.33 vandnps %ymm2, %ymm2, %ymm2 |
| # CHECK-NEXT: 1 1 0.33 vandnpd %ymm1, %ymm1, %ymm1 |
| # CHECK-NEXT: 1 1 0.50 pandn %mm2, %mm2 |
| # CHECK-NEXT: 1 1 0.33 pandn %xmm2, %xmm2 |
| # CHECK-NEXT: 1 1 0.33 vpandn %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: 1 1 0.33 vpandn %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: 1 1 0.33 vandnps %xmm2, %xmm2, %xmm5 |
| # CHECK-NEXT: 1 1 0.33 vandnpd %xmm1, %xmm1, %xmm5 |
| # CHECK-NEXT: 1 1 0.33 vpandn %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: 1 1 0.33 vandnps %ymm2, %ymm2, %ymm5 |
| # CHECK-NEXT: 1 1 0.33 vandnpd %ymm1, %ymm1, %ymm5 |
| # CHECK-NEXT: 1 1 0.33 vpandn %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: 1 1 0.33 xorps %xmm0, %xmm0 |
| # CHECK-NEXT: 1 1 0.33 xorpd %xmm1, %xmm1 |
| # CHECK-NEXT: 1 1 0.33 vxorps %xmm2, %xmm2, %xmm2 |
| # CHECK-NEXT: 1 1 0.33 vxorpd %xmm1, %xmm1, %xmm1 |
| # CHECK-NEXT: 1 1 0.33 vxorps %ymm2, %ymm2, %ymm2 |
| # CHECK-NEXT: 1 1 0.33 vxorpd %ymm1, %ymm1, %ymm1 |
| # CHECK-NEXT: 1 1 0.50 pxor %mm2, %mm2 |
| # CHECK-NEXT: 1 1 0.33 pxor %xmm2, %xmm2 |
| # CHECK-NEXT: 1 1 0.33 vpxor %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: 1 1 0.33 vpxor %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: 1 1 0.33 vxorps %xmm4, %xmm4, %xmm5 |
| # CHECK-NEXT: 1 1 0.33 vxorpd %xmm1, %xmm1, %xmm3 |
| # CHECK-NEXT: 1 1 0.33 vxorps %ymm4, %ymm4, %ymm5 |
| # CHECK-NEXT: 1 1 0.33 vxorpd %ymm1, %ymm1, %ymm3 |
| # CHECK-NEXT: 1 1 0.33 vpxor %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: 1 1 0.33 vpxor %ymm3, %ymm3, %ymm5 |
| |
| # CHECK: Register File statistics: |
| # CHECK-NEXT: Total number of mappings created: 87 |
| # CHECK-NEXT: Max number of mappings used: 66 |
| |
| # CHECK: Resources: |
| # CHECK-NEXT: [0] - SKLDivider |
| # CHECK-NEXT: [1] - SKLFPDivider |
| # CHECK-NEXT: [2] - SKLPort0 |
| # CHECK-NEXT: [3] - SKLPort1 |
| # CHECK-NEXT: [4] - SKLPort2 |
| # CHECK-NEXT: [5] - SKLPort3 |
| # CHECK-NEXT: [6] - SKLPort4 |
| # CHECK-NEXT: [7] - SKLPort5 |
| # CHECK-NEXT: [8] - SKLPort6 |
| # CHECK-NEXT: [9] - SKLPort7 |
| |
| # CHECK: Resource pressure per iteration: |
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] |
| # CHECK-NEXT: - - 28.00 26.00 - - - 27.00 2.00 - |
| |
| # CHECK: Resource pressure by instruction: |
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] Instructions: |
| # CHECK-NEXT: - - - - - - - - 1.00 - subl %eax, %eax |
| # CHECK-NEXT: - - - - - - - 1.00 - - subq %rax, %rax |
| # CHECK-NEXT: - - - - - - - - 1.00 - xorl %eax, %eax |
| # CHECK-NEXT: - - - - - - - 1.00 - - xorq %rax, %rax |
| # CHECK-NEXT: - - 1.00 - - - - - - - pcmpgtb %mm2, %mm2 |
| # CHECK-NEXT: - - 1.00 - - - - - - - pcmpgtd %mm2, %mm2 |
| # CHECK-NEXT: - - 1.00 - - - - - - - pcmpgtw %mm2, %mm2 |
| # CHECK-NEXT: - - - 1.00 - - - - - - pcmpgtb %xmm2, %xmm2 |
| # CHECK-NEXT: - - - 1.00 - - - - - - pcmpgtd %xmm2, %xmm2 |
| # CHECK-NEXT: - - - - - - - 1.00 - - pcmpgtq %xmm2, %xmm2 |
| # CHECK-NEXT: - - - 1.00 - - - - - - pcmpgtw %xmm2, %xmm2 |
| # CHECK-NEXT: - - - 1.00 - - - - - - vpcmpgtb %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: - - 1.00 - - - - - - - vpcmpgtd %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: - - - - - - - 1.00 - - vpcmpgtq %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: - - - 1.00 - - - - - - vpcmpgtw %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: - - - 1.00 - - - - - - vpcmpgtb %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: - - 1.00 - - - - - - - vpcmpgtd %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: - - - - - - - 1.00 - - vpcmpgtq %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: - - 1.00 - - - - - - - vpcmpgtw %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: - - - 1.00 - - - - - - vpcmpgtb %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: - - - 1.00 - - - - - - vpcmpgtd %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: - - - - - - - 1.00 - - vpcmpgtq %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: - - - 1.00 - - - - - - vpcmpgtw %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: - - - 1.00 - - - - - - vpcmpgtb %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: - - 1.00 - - - - - - - vpcmpgtd %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: - - - - - - - 1.00 - - vpcmpgtq %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: - - - 1.00 - - - - - - vpcmpgtw %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: - - 1.00 - - - - - - - psubb %mm2, %mm2 |
| # CHECK-NEXT: - - - - - - - 1.00 - - psubd %mm2, %mm2 |
| # CHECK-NEXT: - - 1.00 - - - - - - - psubq %mm2, %mm2 |
| # CHECK-NEXT: - - 1.00 - - - - - - - psubw %mm2, %mm2 |
| # CHECK-NEXT: - - - - - - - 1.00 - - psubb %xmm2, %xmm2 |
| # CHECK-NEXT: - - - - - - - 1.00 - - psubd %xmm2, %xmm2 |
| # CHECK-NEXT: - - - - - - - 1.00 - - psubq %xmm2, %xmm2 |
| # CHECK-NEXT: - - - 1.00 - - - - - - psubw %xmm2, %xmm2 |
| # CHECK-NEXT: - - - - - - - 1.00 - - vpsubb %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: - - - - - - - 1.00 - - vpsubd %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: - - - - - - - 1.00 - - vpsubq %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: - - - - - - - 1.00 - - vpsubw %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: - - - - - - - 1.00 - - vpsubb %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: - - - - - - - 1.00 - - vpsubd %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: - - - - - - - 1.00 - - vpsubq %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: - - - - - - - 1.00 - - vpsubw %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: - - - - - - - 1.00 - - vpsubb %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: - - - 1.00 - - - - - - vpsubd %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: - - 1.00 - - - - - - - vpsubq %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: - - - - - - - 1.00 - - vpsubw %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: - - - 1.00 - - - - - - vpsubb %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: - - 1.00 - - - - - - - vpsubd %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: - - - - - - - 1.00 - - vpsubq %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: - - - 1.00 - - - - - - vpsubw %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: - - 1.00 - - - - - - - andnps %xmm0, %xmm0 |
| # CHECK-NEXT: - - 1.00 - - - - - - - andnpd %xmm1, %xmm1 |
| # CHECK-NEXT: - - - - - - - 1.00 - - vandnps %xmm2, %xmm2, %xmm2 |
| # CHECK-NEXT: - - - 1.00 - - - - - - vandnpd %xmm1, %xmm1, %xmm1 |
| # CHECK-NEXT: - - - 1.00 - - - - - - vandnps %ymm2, %ymm2, %ymm2 |
| # CHECK-NEXT: - - - - - - - 1.00 - - vandnpd %ymm1, %ymm1, %ymm1 |
| # CHECK-NEXT: - - 1.00 - - - - - - - pandn %mm2, %mm2 |
| # CHECK-NEXT: - - - - - - - 1.00 - - pandn %xmm2, %xmm2 |
| # CHECK-NEXT: - - 1.00 - - - - - - - vpandn %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: - - - - - - - 1.00 - - vpandn %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: - - 1.00 - - - - - - - vandnps %xmm2, %xmm2, %xmm5 |
| # CHECK-NEXT: - - 1.00 - - - - - - - vandnpd %xmm1, %xmm1, %xmm5 |
| # CHECK-NEXT: - - 1.00 - - - - - - - vpandn %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: - - - 1.00 - - - - - - vandnps %ymm2, %ymm2, %ymm5 |
| # CHECK-NEXT: - - 1.00 - - - - - - - vandnpd %ymm1, %ymm1, %ymm5 |
| # CHECK-NEXT: - - - - - - - 1.00 - - vpandn %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: - - 1.00 - - - - - - - xorps %xmm0, %xmm0 |
| # CHECK-NEXT: - - - 1.00 - - - - - - xorpd %xmm1, %xmm1 |
| # CHECK-NEXT: - - 1.00 - - - - - - - vxorps %xmm2, %xmm2, %xmm2 |
| # CHECK-NEXT: - - - 1.00 - - - - - - vxorpd %xmm1, %xmm1, %xmm1 |
| # CHECK-NEXT: - - 1.00 - - - - - - - vxorps %ymm2, %ymm2, %ymm2 |
| # CHECK-NEXT: - - - 1.00 - - - - - - vxorpd %ymm1, %ymm1, %ymm1 |
| # CHECK-NEXT: - - 1.00 - - - - - - - pxor %mm2, %mm2 |
| # CHECK-NEXT: - - - 1.00 - - - - - - pxor %xmm2, %xmm2 |
| # CHECK-NEXT: - - - 1.00 - - - - - - vpxor %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: - - 1.00 - - - - - - - vpxor %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: - - - 1.00 - - - - - - vxorps %xmm4, %xmm4, %xmm5 |
| # CHECK-NEXT: - - 1.00 - - - - - - - vxorpd %xmm1, %xmm1, %xmm3 |
| # CHECK-NEXT: - - - 1.00 - - - - - - vxorps %ymm4, %ymm4, %ymm5 |
| # CHECK-NEXT: - - 1.00 - - - - - - - vxorpd %ymm1, %ymm1, %ymm3 |
| # CHECK-NEXT: - - 1.00 - - - - - - - vpxor %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: - - - 1.00 - - - - - - vpxor %ymm3, %ymm3, %ymm5 |
| |
| # CHECK: Timeline view: |
| # CHECK-NEXT: 0123456789 0123 |
| # CHECK-NEXT: Index 0123456789 0123456789 |
| |
| # CHECK: [0,0] DeER . . . . . . . subl %eax, %eax |
| # CHECK-NEXT: [0,1] D=eER. . . . . . . subq %rax, %rax |
| # CHECK-NEXT: [0,2] D==eER . . . . . . xorl %eax, %eax |
| # CHECK-NEXT: [0,3] D===eER . . . . . . xorq %rax, %rax |
| # CHECK-NEXT: [0,4] DeE---R . . . . . . pcmpgtb %mm2, %mm2 |
| # CHECK-NEXT: [0,5] D=eE--R . . . . . . pcmpgtd %mm2, %mm2 |
| # CHECK-NEXT: [0,6] .D=eE-R . . . . . . pcmpgtw %mm2, %mm2 |
| # CHECK-NEXT: [0,7] .DeE--R . . . . . . pcmpgtb %xmm2, %xmm2 |
| # CHECK-NEXT: [0,8] .D=eE-R . . . . . . pcmpgtd %xmm2, %xmm2 |
| # CHECK-NEXT: [0,9] .D===eeeER. . . . . . pcmpgtq %xmm2, %xmm2 |
| # CHECK-NEXT: [0,10] .D======eER . . . . . pcmpgtw %xmm2, %xmm2 |
| # CHECK-NEXT: [0,11] .D==eE----R . . . . . vpcmpgtb %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: [0,12] . D==eE---R . . . . . vpcmpgtd %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: [0,13] . D===eeeER . . . . . vpcmpgtq %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: [0,14] . D======eER . . . . . vpcmpgtw %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: [0,15] . D=======eER . . . . . vpcmpgtb %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: [0,16] . D=======eER . . . . . vpcmpgtd %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: [0,17] . D=======eeeER. . . . . vpcmpgtq %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: [0,18] . D=======eE-R. . . . . vpcmpgtw %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: [0,19] . D=======eE-R. . . . . vpcmpgtb %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: [0,20] . D========eER. . . . . vpcmpgtd %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: [0,21] . D=========eeeER . . . . vpcmpgtq %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: [0,22] . D============eER . . . . vpcmpgtw %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: [0,23] . D=============eER. . . . vpcmpgtb %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: [0,24] . D============eER. . . . vpcmpgtd %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: [0,25] . D============eeeER . . . vpcmpgtq %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: [0,26] . D=============eE-R . . . vpcmpgtw %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: [0,27] . D=eE-------------R . . . psubb %mm2, %mm2 |
| # CHECK-NEXT: [0,28] . D==eE------------R . . . psubd %mm2, %mm2 |
| # CHECK-NEXT: [0,29] . D===eE-----------R . . . psubq %mm2, %mm2 |
| # CHECK-NEXT: [0,30] . D===eE----------R . . . psubw %mm2, %mm2 |
| # CHECK-NEXT: [0,31] . D===eE----------R . . . psubb %xmm2, %xmm2 |
| # CHECK-NEXT: [0,32] . D=====eE--------R . . . psubd %xmm2, %xmm2 |
| # CHECK-NEXT: [0,33] . D======eE-------R . . . psubq %xmm2, %xmm2 |
| # CHECK-NEXT: [0,34] . D=======eE------R . . . psubw %xmm2, %xmm2 |
| # CHECK-NEXT: [0,35] . D============eE-R . . . vpsubb %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: [0,36] . .D============eER . . . vpsubd %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: [0,37] . .D=============eER . . . vpsubq %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: [0,38] . .D==============eER . . . vpsubw %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: [0,39] . .D===============eER. . . vpsubb %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: [0,40] . .D================eER . . vpsubd %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: [0,41] . .D=================eER . . vpsubq %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: [0,42] . . D=================eER . . vpsubw %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: [0,43] . . D==================eER . . vpsubb %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: [0,44] . . D==================eER . . vpsubd %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: [0,45] . . D==================eER . . vpsubq %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: [0,46] . . D===================eER. . vpsubw %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: [0,47] . . D===================eER. . vpsubb %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: [0,48] . . D==================eER. . vpsubd %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: [0,49] . . D===================eER . vpsubq %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: [0,50] . . D===================eER . vpsubw %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: [0,51] . . D===eE----------------R . andnps %xmm0, %xmm0 |
| # CHECK-NEXT: [0,52] . . D====eE---------------R . andnpd %xmm1, %xmm1 |
| # CHECK-NEXT: [0,53] . . D=====eE--------------R . vandnps %xmm2, %xmm2, %xmm2 |
| # CHECK-NEXT: [0,54] . . D====eE--------------R . vandnpd %xmm1, %xmm1, %xmm1 |
| # CHECK-NEXT: [0,55] . . D=====eE-------------R . vandnps %ymm2, %ymm2, %ymm2 |
| # CHECK-NEXT: [0,56] . . D=====eE-------------R . vandnpd %ymm1, %ymm1, %ymm1 |
| # CHECK-NEXT: [0,57] . . D====eE--------------R . pandn %mm2, %mm2 |
| # CHECK-NEXT: [0,58] . . D======eE------------R . pandn %xmm2, %xmm2 |
| # CHECK-NEXT: [0,59] . . D==================eER . vpandn %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: [0,60] . . D==================eER . vpandn %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: [0,61] . . D=======eE-----------R . vandnps %xmm2, %xmm2, %xmm5 |
| # CHECK-NEXT: [0,62] . . D=====eE-------------R . vandnpd %xmm1, %xmm1, %xmm5 |
| # CHECK-NEXT: [0,63] . . D===================eER. vpandn %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: [0,64] . . D========eE-----------R. vandnps %ymm2, %ymm2, %ymm5 |
| # CHECK-NEXT: [0,65] . . D========eE-----------R. vandnpd %ymm1, %ymm1, %ymm5 |
| # CHECK-NEXT: [0,66] . . .D==================eER. vpandn %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: [0,67] . . .D===eE---------------R. xorps %xmm0, %xmm0 |
| # CHECK-NEXT: [0,68] . . .D========eE----------R. xorpd %xmm1, %xmm1 |
| # CHECK-NEXT: [0,69] . . .D========eE----------R. vxorps %xmm2, %xmm2, %xmm2 |
| # CHECK-NEXT: [0,70] . . .D=========eE---------R. vxorpd %xmm1, %xmm1, %xmm1 |
| # CHECK-NEXT: [0,71] . . .D=========eE---------R. vxorps %ymm2, %ymm2, %ymm2 |
| # CHECK-NEXT: [0,72] . . . D=========eE--------R. vxorpd %ymm1, %ymm1, %ymm1 |
| # CHECK-NEXT: [0,73] . . . D=========eE--------R. pxor %mm2, %mm2 |
| # CHECK-NEXT: [0,74] . . . D==========eE-------R. pxor %xmm2, %xmm2 |
| # CHECK-NEXT: [0,75] . . . D=================eER. vpxor %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: [0,76] . . . D==================eER vpxor %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: [0,77] . . . D===========eE-------R vxorps %xmm4, %xmm4, %xmm5 |
| # CHECK-NEXT: [0,78] . . . D==========eE-------R vxorpd %xmm1, %xmm1, %xmm3 |
| # CHECK-NEXT: [0,79] . . . D===========eE------R vxorps %ymm4, %ymm4, %ymm5 |
| # CHECK-NEXT: [0,80] . . . D=========eE--------R vxorpd %ymm1, %ymm1, %ymm3 |
| # CHECK-NEXT: [0,81] . . . D===========eE------R vpxor %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: [0,82] . . . D===============eE--R vpxor %ymm3, %ymm3, %ymm5 |
| |
| # CHECK: Average Wait times (based on the timeline view): |
| # CHECK-NEXT: [0]: Executions |
| # CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue |
| # CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready |
| # CHECK-NEXT: [3]: Average time elapsed from WB until retire stage |
| |
| # CHECK: [0] [1] [2] [3] |
| # CHECK-NEXT: 0. 1 1.0 1.0 0.0 subl %eax, %eax |
| # CHECK-NEXT: 1. 1 2.0 0.0 0.0 subq %rax, %rax |
| # CHECK-NEXT: 2. 1 3.0 0.0 0.0 xorl %eax, %eax |
| # CHECK-NEXT: 3. 1 4.0 0.0 0.0 xorq %rax, %rax |
| # CHECK-NEXT: 4. 1 1.0 1.0 3.0 pcmpgtb %mm2, %mm2 |
| # CHECK-NEXT: 5. 1 2.0 0.0 2.0 pcmpgtd %mm2, %mm2 |
| # CHECK-NEXT: 6. 1 2.0 0.0 1.0 pcmpgtw %mm2, %mm2 |
| # CHECK-NEXT: 7. 1 1.0 1.0 2.0 pcmpgtb %xmm2, %xmm2 |
| # CHECK-NEXT: 8. 1 2.0 0.0 1.0 pcmpgtd %xmm2, %xmm2 |
| # CHECK-NEXT: 9. 1 4.0 1.0 0.0 pcmpgtq %xmm2, %xmm2 |
| # CHECK-NEXT: 10. 1 7.0 0.0 0.0 pcmpgtw %xmm2, %xmm2 |
| # CHECK-NEXT: 11. 1 3.0 3.0 4.0 vpcmpgtb %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: 12. 1 3.0 0.0 3.0 vpcmpgtd %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: 13. 1 4.0 0.0 0.0 vpcmpgtq %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: 14. 1 7.0 0.0 0.0 vpcmpgtw %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: 15. 1 8.0 0.0 0.0 vpcmpgtb %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: 16. 1 8.0 0.0 0.0 vpcmpgtd %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: 17. 1 8.0 0.0 0.0 vpcmpgtq %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: 18. 1 8.0 1.0 1.0 vpcmpgtw %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: 19. 1 8.0 1.0 1.0 vpcmpgtb %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: 20. 1 9.0 0.0 0.0 vpcmpgtd %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: 21. 1 10.0 0.0 0.0 vpcmpgtq %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: 22. 1 13.0 0.0 0.0 vpcmpgtw %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: 23. 1 14.0 0.0 0.0 vpcmpgtb %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: 24. 1 13.0 0.0 0.0 vpcmpgtd %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: 25. 1 13.0 0.0 0.0 vpcmpgtq %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: 26. 1 14.0 1.0 1.0 vpcmpgtw %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: 27. 1 2.0 2.0 13.0 psubb %mm2, %mm2 |
| # CHECK-NEXT: 28. 1 3.0 0.0 12.0 psubd %mm2, %mm2 |
| # CHECK-NEXT: 29. 1 4.0 0.0 11.0 psubq %mm2, %mm2 |
| # CHECK-NEXT: 30. 1 4.0 0.0 10.0 psubw %mm2, %mm2 |
| # CHECK-NEXT: 31. 1 4.0 0.0 10.0 psubb %xmm2, %xmm2 |
| # CHECK-NEXT: 32. 1 6.0 1.0 8.0 psubd %xmm2, %xmm2 |
| # CHECK-NEXT: 33. 1 7.0 0.0 7.0 psubq %xmm2, %xmm2 |
| # CHECK-NEXT: 34. 1 8.0 0.0 6.0 psubw %xmm2, %xmm2 |
| # CHECK-NEXT: 35. 1 13.0 1.0 1.0 vpsubb %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: 36. 1 13.0 0.0 0.0 vpsubd %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: 37. 1 14.0 0.0 0.0 vpsubq %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: 38. 1 15.0 0.0 0.0 vpsubw %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: 39. 1 16.0 0.0 0.0 vpsubb %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: 40. 1 17.0 0.0 0.0 vpsubd %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: 41. 1 18.0 0.0 0.0 vpsubq %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: 42. 1 18.0 0.0 0.0 vpsubw %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: 43. 1 19.0 0.0 0.0 vpsubb %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: 44. 1 19.0 0.0 0.0 vpsubd %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: 45. 1 19.0 0.0 0.0 vpsubq %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: 46. 1 20.0 1.0 0.0 vpsubw %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: 47. 1 20.0 1.0 0.0 vpsubb %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: 48. 1 19.0 1.0 0.0 vpsubd %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: 49. 1 20.0 2.0 0.0 vpsubq %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: 50. 1 20.0 2.0 0.0 vpsubw %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: 51. 1 4.0 4.0 16.0 andnps %xmm0, %xmm0 |
| # CHECK-NEXT: 52. 1 5.0 5.0 15.0 andnpd %xmm1, %xmm1 |
| # CHECK-NEXT: 53. 1 6.0 0.0 14.0 vandnps %xmm2, %xmm2, %xmm2 |
| # CHECK-NEXT: 54. 1 5.0 0.0 14.0 vandnpd %xmm1, %xmm1, %xmm1 |
| # CHECK-NEXT: 55. 1 6.0 0.0 13.0 vandnps %ymm2, %ymm2, %ymm2 |
| # CHECK-NEXT: 56. 1 6.0 0.0 13.0 vandnpd %ymm1, %ymm1, %ymm1 |
| # CHECK-NEXT: 57. 1 5.0 4.0 14.0 pandn %mm2, %mm2 |
| # CHECK-NEXT: 58. 1 7.0 0.0 12.0 pandn %xmm2, %xmm2 |
| # CHECK-NEXT: 59. 1 19.0 2.0 0.0 vpandn %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: 60. 1 19.0 0.0 0.0 vpandn %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: 61. 1 8.0 1.0 11.0 vandnps %xmm2, %xmm2, %xmm5 |
| # CHECK-NEXT: 62. 1 6.0 0.0 13.0 vandnpd %xmm1, %xmm1, %xmm5 |
| # CHECK-NEXT: 63. 1 20.0 0.0 0.0 vpandn %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: 64. 1 9.0 2.0 11.0 vandnps %ymm2, %ymm2, %ymm5 |
| # CHECK-NEXT: 65. 1 9.0 3.0 11.0 vandnpd %ymm1, %ymm1, %ymm5 |
| # CHECK-NEXT: 66. 1 19.0 0.0 0.0 vpandn %ymm3, %ymm3, %ymm5 |
| # CHECK-NEXT: 67. 1 4.0 2.0 15.0 xorps %xmm0, %xmm0 |
| # CHECK-NEXT: 68. 1 9.0 4.0 10.0 xorpd %xmm1, %xmm1 |
| # CHECK-NEXT: 69. 1 9.0 3.0 10.0 vxorps %xmm2, %xmm2, %xmm2 |
| # CHECK-NEXT: 70. 1 10.0 0.0 9.0 vxorpd %xmm1, %xmm1, %xmm1 |
| # CHECK-NEXT: 71. 1 10.0 0.0 9.0 vxorps %ymm2, %ymm2, %ymm2 |
| # CHECK-NEXT: 72. 1 10.0 0.0 8.0 vxorpd %ymm1, %ymm1, %ymm1 |
| # CHECK-NEXT: 73. 1 10.0 7.0 8.0 pxor %mm2, %mm2 |
| # CHECK-NEXT: 74. 1 11.0 1.0 7.0 pxor %xmm2, %xmm2 |
| # CHECK-NEXT: 75. 1 18.0 0.0 0.0 vpxor %xmm3, %xmm3, %xmm3 |
| # CHECK-NEXT: 76. 1 19.0 0.0 0.0 vpxor %ymm3, %ymm3, %ymm3 |
| # CHECK-NEXT: 77. 1 12.0 12.0 7.0 vxorps %xmm4, %xmm4, %xmm5 |
| # CHECK-NEXT: 78. 1 11.0 1.0 7.0 vxorpd %xmm1, %xmm1, %xmm3 |
| # CHECK-NEXT: 79. 1 12.0 12.0 6.0 vxorps %ymm4, %ymm4, %ymm5 |
| # CHECK-NEXT: 80. 1 10.0 0.0 8.0 vxorpd %ymm1, %ymm1, %ymm3 |
| # CHECK-NEXT: 81. 1 12.0 1.0 6.0 vpxor %xmm3, %xmm3, %xmm5 |
| # CHECK-NEXT: 82. 1 16.0 5.0 2.0 vpxor %ymm3, %ymm3, %ymm5 |