| # NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py |
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=slm -instruction-tables < %s | FileCheck %s |
| |
| pabsb %mm0, %mm2 |
| pabsb (%rax), %mm2 |
| |
| pabsb %xmm0, %xmm2 |
| pabsb (%rax), %xmm2 |
| |
| pabsd %mm0, %mm2 |
| pabsd (%rax), %mm2 |
| |
| pabsd %xmm0, %xmm2 |
| pabsd (%rax), %xmm2 |
| |
| pabsw %mm0, %mm2 |
| pabsw (%rax), %mm2 |
| |
| pabsw %xmm0, %xmm2 |
| pabsw (%rax), %xmm2 |
| |
| palignr $1, %mm0, %mm2 |
| palignr $1, (%rax), %mm2 |
| |
| palignr $1, %xmm0, %xmm2 |
| palignr $1, (%rax), %xmm2 |
| |
| phaddd %mm0, %mm2 |
| phaddd (%rax), %mm2 |
| |
| phaddd %xmm0, %xmm2 |
| phaddd (%rax), %xmm2 |
| |
| phaddsw %mm0, %mm2 |
| phaddsw (%rax), %mm2 |
| |
| phaddsw %xmm0, %xmm2 |
| phaddsw (%rax), %xmm2 |
| |
| phaddw %mm0, %mm2 |
| phaddw (%rax), %mm2 |
| |
| phaddw %xmm0, %xmm2 |
| phaddw (%rax), %xmm2 |
| |
| phsubd %mm0, %mm2 |
| phsubd (%rax), %mm2 |
| |
| phsubd %xmm0, %xmm2 |
| phsubd (%rax), %xmm2 |
| |
| phsubsw %mm0, %mm2 |
| phsubsw (%rax), %mm2 |
| |
| phsubsw %xmm0, %xmm2 |
| phsubsw (%rax), %xmm2 |
| |
| phsubw %mm0, %mm2 |
| phsubw (%rax), %mm2 |
| |
| phsubw %xmm0, %xmm2 |
| phsubw (%rax), %xmm2 |
| |
| pmaddubsw %mm0, %mm2 |
| pmaddubsw (%rax), %mm2 |
| |
| pmaddubsw %xmm0, %xmm2 |
| pmaddubsw (%rax), %xmm2 |
| |
| pmulhrsw %mm0, %mm2 |
| pmulhrsw (%rax), %mm2 |
| |
| pmulhrsw %xmm0, %xmm2 |
| pmulhrsw (%rax), %xmm2 |
| |
| pshufb %mm0, %mm2 |
| pshufb (%rax), %mm2 |
| |
| pshufb %xmm0, %xmm2 |
| pshufb (%rax), %xmm2 |
| |
| psignb %mm0, %mm2 |
| psignb (%rax), %mm2 |
| |
| psignb %xmm0, %xmm2 |
| psignb (%rax), %xmm2 |
| |
| psignd %mm0, %mm2 |
| psignd (%rax), %mm2 |
| |
| psignd %xmm0, %xmm2 |
| psignd (%rax), %xmm2 |
| |
| psignw %mm0, %mm2 |
| psignw (%rax), %mm2 |
| |
| psignw %xmm0, %xmm2 |
| psignw (%rax), %xmm2 |
| |
| # CHECK: Instruction Info: |
| # CHECK-NEXT: [1]: #uOps |
| # CHECK-NEXT: [2]: Latency |
| # CHECK-NEXT: [3]: RThroughput |
| # CHECK-NEXT: [4]: MayLoad |
| # CHECK-NEXT: [5]: MayStore |
| # CHECK-NEXT: [6]: HasSideEffects (U) |
| |
| # CHECK: [1] [2] [3] [4] [5] [6] Instructions: |
| # CHECK-NEXT: 1 1 0.50 pabsb %mm0, %mm2 |
| # CHECK-NEXT: 1 4 1.00 * pabsb (%rax), %mm2 |
| # CHECK-NEXT: 1 1 0.50 pabsb %xmm0, %xmm2 |
| # CHECK-NEXT: 1 4 1.00 * pabsb (%rax), %xmm2 |
| # CHECK-NEXT: 1 1 0.50 pabsd %mm0, %mm2 |
| # CHECK-NEXT: 1 4 1.00 * pabsd (%rax), %mm2 |
| # CHECK-NEXT: 1 1 0.50 pabsd %xmm0, %xmm2 |
| # CHECK-NEXT: 1 4 1.00 * pabsd (%rax), %xmm2 |
| # CHECK-NEXT: 1 1 0.50 pabsw %mm0, %mm2 |
| # CHECK-NEXT: 1 4 1.00 * pabsw (%rax), %mm2 |
| # CHECK-NEXT: 1 1 0.50 pabsw %xmm0, %xmm2 |
| # CHECK-NEXT: 1 4 1.00 * pabsw (%rax), %xmm2 |
| # CHECK-NEXT: 1 1 1.00 palignr $1, %mm0, %mm2 |
| # CHECK-NEXT: 1 4 1.00 * palignr $1, (%rax), %mm2 |
| # CHECK-NEXT: 1 1 1.00 palignr $1, %xmm0, %xmm2 |
| # CHECK-NEXT: 1 4 1.00 * palignr $1, (%rax), %xmm2 |
| # CHECK-NEXT: 3 6 3.00 phaddd %mm0, %mm2 |
| # CHECK-NEXT: 4 9 3.00 * phaddd (%rax), %mm2 |
| # CHECK-NEXT: 3 6 3.00 phaddd %xmm0, %xmm2 |
| # CHECK-NEXT: 4 9 3.00 * phaddd (%rax), %xmm2 |
| # CHECK-NEXT: 3 6 3.00 phaddsw %mm0, %mm2 |
| # CHECK-NEXT: 4 9 3.00 * phaddsw (%rax), %mm2 |
| # CHECK-NEXT: 3 6 3.00 phaddsw %xmm0, %xmm2 |
| # CHECK-NEXT: 4 9 3.00 * phaddsw (%rax), %xmm2 |
| # CHECK-NEXT: 3 6 3.00 phaddw %mm0, %mm2 |
| # CHECK-NEXT: 4 9 3.00 * phaddw (%rax), %mm2 |
| # CHECK-NEXT: 3 6 3.00 phaddw %xmm0, %xmm2 |
| # CHECK-NEXT: 4 9 3.00 * phaddw (%rax), %xmm2 |
| # CHECK-NEXT: 3 6 3.00 phsubd %mm0, %mm2 |
| # CHECK-NEXT: 4 9 3.00 * phsubd (%rax), %mm2 |
| # CHECK-NEXT: 3 6 3.00 phsubd %xmm0, %xmm2 |
| # CHECK-NEXT: 4 9 3.00 * phsubd (%rax), %xmm2 |
| # CHECK-NEXT: 3 6 3.00 phsubsw %mm0, %mm2 |
| # CHECK-NEXT: 4 9 3.00 * phsubsw (%rax), %mm2 |
| # CHECK-NEXT: 3 6 3.00 phsubsw %xmm0, %xmm2 |
| # CHECK-NEXT: 4 9 3.00 * phsubsw (%rax), %xmm2 |
| # CHECK-NEXT: 3 6 3.00 phsubw %mm0, %mm2 |
| # CHECK-NEXT: 4 9 3.00 * phsubw (%rax), %mm2 |
| # CHECK-NEXT: 3 6 3.00 phsubw %xmm0, %xmm2 |
| # CHECK-NEXT: 4 9 3.00 * phsubw (%rax), %xmm2 |
| # CHECK-NEXT: 1 4 1.00 pmaddubsw %mm0, %mm2 |
| # CHECK-NEXT: 1 7 1.00 * pmaddubsw (%rax), %mm2 |
| # CHECK-NEXT: 1 5 2.00 pmaddubsw %xmm0, %xmm2 |
| # CHECK-NEXT: 1 8 2.00 * pmaddubsw (%rax), %xmm2 |
| # CHECK-NEXT: 1 4 1.00 pmulhrsw %mm0, %mm2 |
| # CHECK-NEXT: 1 7 1.00 * pmulhrsw (%rax), %mm2 |
| # CHECK-NEXT: 1 5 2.00 pmulhrsw %xmm0, %xmm2 |
| # CHECK-NEXT: 1 8 2.00 * pmulhrsw (%rax), %xmm2 |
| # CHECK-NEXT: 1 1 1.00 pshufb %mm0, %mm2 |
| # CHECK-NEXT: 1 4 1.00 * pshufb (%rax), %mm2 |
| # CHECK-NEXT: 4 5 5.00 pshufb %xmm0, %xmm2 |
| # CHECK-NEXT: 5 8 5.00 * pshufb (%rax), %xmm2 |
| # CHECK-NEXT: 1 1 0.50 psignb %mm0, %mm2 |
| # CHECK-NEXT: 1 4 1.00 * psignb (%rax), %mm2 |
| # CHECK-NEXT: 1 1 0.50 psignb %xmm0, %xmm2 |
| # CHECK-NEXT: 1 4 1.00 * psignb (%rax), %xmm2 |
| # CHECK-NEXT: 1 1 0.50 psignd %mm0, %mm2 |
| # CHECK-NEXT: 1 4 1.00 * psignd (%rax), %mm2 |
| # CHECK-NEXT: 1 1 0.50 psignd %xmm0, %xmm2 |
| # CHECK-NEXT: 1 4 1.00 * psignd (%rax), %xmm2 |
| # CHECK-NEXT: 1 1 0.50 psignw %mm0, %mm2 |
| # CHECK-NEXT: 1 4 1.00 * psignw (%rax), %mm2 |
| # CHECK-NEXT: 1 1 0.50 psignw %xmm0, %xmm2 |
| # CHECK-NEXT: 1 4 1.00 * psignw (%rax), %xmm2 |
| |
| # CHECK: Resources: |
| # CHECK-NEXT: [0] - SLMDivider |
| # CHECK-NEXT: [1] - SLMFPDivider |
| # CHECK-NEXT: [2] - SLMFPMultiplier |
| # CHECK-NEXT: [3] - SLM_FPC_RSV0 |
| # CHECK-NEXT: [4] - SLM_FPC_RSV1 |
| # CHECK-NEXT: [5] - SLM_IEC_RSV0 |
| # CHECK-NEXT: [6] - SLM_IEC_RSV1 |
| # CHECK-NEXT: [7] - SLM_MEC_RSV |
| |
| # CHECK: Resource pressure per iteration: |
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] |
| # CHECK-NEXT: - - - 112.00 84.00 - - 32.00 |
| |
| # CHECK: Resource pressure by instruction: |
| # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] Instructions: |
| # CHECK-NEXT: - - - 0.50 0.50 - - - pabsb %mm0, %mm2 |
| # CHECK-NEXT: - - - 0.50 0.50 - - 1.00 pabsb (%rax), %mm2 |
| # CHECK-NEXT: - - - 0.50 0.50 - - - pabsb %xmm0, %xmm2 |
| # CHECK-NEXT: - - - 0.50 0.50 - - 1.00 pabsb (%rax), %xmm2 |
| # CHECK-NEXT: - - - 0.50 0.50 - - - pabsd %mm0, %mm2 |
| # CHECK-NEXT: - - - 0.50 0.50 - - 1.00 pabsd (%rax), %mm2 |
| # CHECK-NEXT: - - - 0.50 0.50 - - - pabsd %xmm0, %xmm2 |
| # CHECK-NEXT: - - - 0.50 0.50 - - 1.00 pabsd (%rax), %xmm2 |
| # CHECK-NEXT: - - - 0.50 0.50 - - - pabsw %mm0, %mm2 |
| # CHECK-NEXT: - - - 0.50 0.50 - - 1.00 pabsw (%rax), %mm2 |
| # CHECK-NEXT: - - - 0.50 0.50 - - - pabsw %xmm0, %xmm2 |
| # CHECK-NEXT: - - - 0.50 0.50 - - 1.00 pabsw (%rax), %xmm2 |
| # CHECK-NEXT: - - - 1.00 - - - - palignr $1, %mm0, %mm2 |
| # CHECK-NEXT: - - - 1.00 - - - 1.00 palignr $1, (%rax), %mm2 |
| # CHECK-NEXT: - - - 1.00 - - - - palignr $1, %xmm0, %xmm2 |
| # CHECK-NEXT: - - - 1.00 - - - 1.00 palignr $1, (%rax), %xmm2 |
| # CHECK-NEXT: - - - 3.00 3.00 - - - phaddd %mm0, %mm2 |
| # CHECK-NEXT: - - - 3.00 3.00 - - 1.00 phaddd (%rax), %mm2 |
| # CHECK-NEXT: - - - 3.00 3.00 - - - phaddd %xmm0, %xmm2 |
| # CHECK-NEXT: - - - 3.00 3.00 - - 1.00 phaddd (%rax), %xmm2 |
| # CHECK-NEXT: - - - 3.00 3.00 - - - phaddsw %mm0, %mm2 |
| # CHECK-NEXT: - - - 3.00 3.00 - - 1.00 phaddsw (%rax), %mm2 |
| # CHECK-NEXT: - - - 3.00 3.00 - - - phaddsw %xmm0, %xmm2 |
| # CHECK-NEXT: - - - 3.00 3.00 - - 1.00 phaddsw (%rax), %xmm2 |
| # CHECK-NEXT: - - - 3.00 3.00 - - - phaddw %mm0, %mm2 |
| # CHECK-NEXT: - - - 3.00 3.00 - - 1.00 phaddw (%rax), %mm2 |
| # CHECK-NEXT: - - - 3.00 3.00 - - - phaddw %xmm0, %xmm2 |
| # CHECK-NEXT: - - - 3.00 3.00 - - 1.00 phaddw (%rax), %xmm2 |
| # CHECK-NEXT: - - - 3.00 3.00 - - - phsubd %mm0, %mm2 |
| # CHECK-NEXT: - - - 3.00 3.00 - - 1.00 phsubd (%rax), %mm2 |
| # CHECK-NEXT: - - - 3.00 3.00 - - - phsubd %xmm0, %xmm2 |
| # CHECK-NEXT: - - - 3.00 3.00 - - 1.00 phsubd (%rax), %xmm2 |
| # CHECK-NEXT: - - - 3.00 3.00 - - - phsubsw %mm0, %mm2 |
| # CHECK-NEXT: - - - 3.00 3.00 - - 1.00 phsubsw (%rax), %mm2 |
| # CHECK-NEXT: - - - 3.00 3.00 - - - phsubsw %xmm0, %xmm2 |
| # CHECK-NEXT: - - - 3.00 3.00 - - 1.00 phsubsw (%rax), %xmm2 |
| # CHECK-NEXT: - - - 3.00 3.00 - - - phsubw %mm0, %mm2 |
| # CHECK-NEXT: - - - 3.00 3.00 - - 1.00 phsubw (%rax), %mm2 |
| # CHECK-NEXT: - - - 3.00 3.00 - - - phsubw %xmm0, %xmm2 |
| # CHECK-NEXT: - - - 3.00 3.00 - - 1.00 phsubw (%rax), %xmm2 |
| # CHECK-NEXT: - - - 1.00 - - - - pmaddubsw %mm0, %mm2 |
| # CHECK-NEXT: - - - 1.00 - - - 1.00 pmaddubsw (%rax), %mm2 |
| # CHECK-NEXT: - - - 2.00 - - - - pmaddubsw %xmm0, %xmm2 |
| # CHECK-NEXT: - - - 2.00 - - - 1.00 pmaddubsw (%rax), %xmm2 |
| # CHECK-NEXT: - - - 1.00 - - - - pmulhrsw %mm0, %mm2 |
| # CHECK-NEXT: - - - 1.00 - - - 1.00 pmulhrsw (%rax), %mm2 |
| # CHECK-NEXT: - - - 2.00 - - - - pmulhrsw %xmm0, %xmm2 |
| # CHECK-NEXT: - - - 2.00 - - - 1.00 pmulhrsw (%rax), %xmm2 |
| # CHECK-NEXT: - - - 1.00 - - - - pshufb %mm0, %mm2 |
| # CHECK-NEXT: - - - 1.00 - - - 1.00 pshufb (%rax), %mm2 |
| # CHECK-NEXT: - - - 5.00 - - - - pshufb %xmm0, %xmm2 |
| # CHECK-NEXT: - - - 5.00 - - - 1.00 pshufb (%rax), %xmm2 |
| # CHECK-NEXT: - - - 0.50 0.50 - - - psignb %mm0, %mm2 |
| # CHECK-NEXT: - - - 0.50 0.50 - - 1.00 psignb (%rax), %mm2 |
| # CHECK-NEXT: - - - 0.50 0.50 - - - psignb %xmm0, %xmm2 |
| # CHECK-NEXT: - - - 0.50 0.50 - - 1.00 psignb (%rax), %xmm2 |
| # CHECK-NEXT: - - - 0.50 0.50 - - - psignd %mm0, %mm2 |
| # CHECK-NEXT: - - - 0.50 0.50 - - 1.00 psignd (%rax), %mm2 |
| # CHECK-NEXT: - - - 0.50 0.50 - - - psignd %xmm0, %xmm2 |
| # CHECK-NEXT: - - - 0.50 0.50 - - 1.00 psignd (%rax), %xmm2 |
| # CHECK-NEXT: - - - 0.50 0.50 - - - psignw %mm0, %mm2 |
| # CHECK-NEXT: - - - 0.50 0.50 - - 1.00 psignw (%rax), %mm2 |
| # CHECK-NEXT: - - - 0.50 0.50 - - - psignw %xmm0, %xmm2 |
| # CHECK-NEXT: - - - 0.50 0.50 - - 1.00 psignw (%rax), %xmm2 |