| # NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py |
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=sandybridge -iterations=1 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,SANDY |
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=haswell -iterations=1 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,HASWELL |
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=broadwell -iterations=1 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,BDWELL |
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=skylake -iterations=1 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,SKYLAKE |
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=icelake-server -iterations=1 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,SKYLAKE |
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=x86-64 -iterations=1 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,BARCELONA |
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=bdver2 -iterations=1 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,BDVER2 |
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=btver2 -iterations=1 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,BTVER2 |
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver1 -iterations=1 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,ZNVER1 |
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver2 -iterations=1 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,ZNVER2 |
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -iterations=1 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,ZNVER3 |
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver4 -iterations=1 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,ZNVER4 |
| |
| # Test input: a two-instruction dependency chain through %xmm1. |
| #   vdivps writes %xmm1 (%xmm1 / %xmm0, AT&T operand order). |
| #   vaddps reads that %xmm1 result and also folds a load from (%rax). |
| # In the expected timelines below, vaddps begins executing before vdivps has |
| # finished on every checked CPU. Presumably the scheduling models let the |
| # folded load start ahead of the register operand (ReadAfterLd-style read |
| # advance) - TODO confirm against the X86 scheduling models. |
| # Changing either instruction requires regenerating the assertions with |
| # utils/update_mca_test_checks.py. |
| vdivps %xmm0, %xmm1, %xmm1 |
| vaddps (%rax), %xmm1, %xmm1 |
| |
| # ALL: Iterations: 1 |
| # ALL-NEXT: Instructions: 2 |
| |
| # BARCELONA-NEXT: Total Cycles: 20 |
| # BARCELONA-NEXT: Total uOps: 3 |
| |
| # BDVER2-NEXT: Total Cycles: 17 |
| # BDVER2-NEXT: Total uOps: 2 |
| |
| # BDWELL-NEXT: Total Cycles: 17 |
| # BDWELL-NEXT: Total uOps: 3 |
| |
| # BTVER2-NEXT: Total Cycles: 25 |
| # BTVER2-NEXT: Total uOps: 2 |
| |
| # HASWELL-NEXT: Total Cycles: 19 |
| # HASWELL-NEXT: Total uOps: 3 |
| |
| # SANDY-NEXT: Total Cycles: 20 |
| # SANDY-NEXT: Total uOps: 3 |
| |
| # SKYLAKE-NEXT: Total Cycles: 18 |
| # SKYLAKE-NEXT: Total uOps: 3 |
| |
| # ZNVER1-NEXT: Total Cycles: 15 |
| # ZNVER1-NEXT: Total uOps: 2 |
| |
| # ZNVER2-NEXT: Total Cycles: 16 |
| # ZNVER2-NEXT: Total uOps: 2 |
| |
| # ZNVER3-NEXT: Total Cycles: 17 |
| # ZNVER3-NEXT: Total uOps: 2 |
| |
| # ZNVER4-NEXT: Total Cycles: 17 |
| # ZNVER4-NEXT: Total uOps: 2 |
| |
| # BARCELONA: Dispatch Width: 4 |
| # BARCELONA-NEXT: uOps Per Cycle: 0.15 |
| # BARCELONA-NEXT: IPC: 0.10 |
| # BARCELONA-NEXT: Block RThroughput: 14.0 |
| |
| # BDVER2: Dispatch Width: 4 |
| # BDVER2-NEXT: uOps Per Cycle: 0.12 |
| # BDVER2-NEXT: IPC: 0.12 |
| # BDVER2-NEXT: Block RThroughput: 5.0 |
| |
| # BDWELL: Dispatch Width: 4 |
| # BDWELL-NEXT: uOps Per Cycle: 0.18 |
| # BDWELL-NEXT: IPC: 0.12 |
| # BDWELL-NEXT: Block RThroughput: 5.0 |
| |
| # BTVER2: Dispatch Width: 2 |
| # BTVER2-NEXT: uOps Per Cycle: 0.08 |
| # BTVER2-NEXT: IPC: 0.08 |
| # BTVER2-NEXT: Block RThroughput: 19.0 |
| |
| # HASWELL: Dispatch Width: 4 |
| # HASWELL-NEXT: uOps Per Cycle: 0.16 |
| # HASWELL-NEXT: IPC: 0.11 |
| # HASWELL-NEXT: Block RThroughput: 7.0 |
| |
| # SANDY: Dispatch Width: 4 |
| # SANDY-NEXT: uOps Per Cycle: 0.15 |
| # SANDY-NEXT: IPC: 0.10 |
| # SANDY-NEXT: Block RThroughput: 14.0 |
| |
| # SKYLAKE: Dispatch Width: 6 |
| # SKYLAKE-NEXT: uOps Per Cycle: 0.17 |
| # SKYLAKE-NEXT: IPC: 0.11 |
| # SKYLAKE-NEXT: Block RThroughput: 3.0 |
| |
| # ZNVER1: Dispatch Width: 4 |
| # ZNVER1-NEXT: uOps Per Cycle: 0.13 |
| # ZNVER1-NEXT: IPC: 0.13 |
| # ZNVER1-NEXT: Block RThroughput: 3.0 |
| |
| # ZNVER2: Dispatch Width: 4 |
| # ZNVER2-NEXT: uOps Per Cycle: 0.13 |
| # ZNVER2-NEXT: IPC: 0.13 |
| # ZNVER2-NEXT: Block RThroughput: 5.0 |
| |
| # ZNVER3: Dispatch Width: 6 |
| # ZNVER3-NEXT: uOps Per Cycle: 0.12 |
| # ZNVER3-NEXT: IPC: 0.12 |
| # ZNVER3-NEXT: Block RThroughput: 3.0 |
| |
| # ZNVER4: Dispatch Width: 6 |
| # ZNVER4-NEXT: uOps Per Cycle: 0.12 |
| # ZNVER4-NEXT: IPC: 0.12 |
| # ZNVER4-NEXT: Block RThroughput: 3.0 |
| |
| # ALL: Timeline view: |
| |
| # BARCELONA-NEXT: 0123456789 |
| # BARCELONA-NEXT: Index 0123456789 |
| |
| # BDVER2-NEXT: 0123456 |
| # BDVER2-NEXT: Index 0123456789 |
| |
| # BDWELL-NEXT: 0123456 |
| # BDWELL-NEXT: Index 0123456789 |
| |
| # BTVER2-NEXT: 0123456789 |
| # BTVER2-NEXT: Index 0123456789 01234 |
| |
| # HASWELL-NEXT: 012345678 |
| # HASWELL-NEXT: Index 0123456789 |
| |
| # SANDY-NEXT: 0123456789 |
| # SANDY-NEXT: Index 0123456789 |
| |
| # SKYLAKE-NEXT: 01234567 |
| # SKYLAKE-NEXT: Index 0123456789 |
| |
| # ZNVER1-NEXT: 01234 |
| # ZNVER1-NEXT: Index 0123456789 |
| |
| # ZNVER2-NEXT: 012345 |
| # ZNVER2-NEXT: Index 0123456789 |
| |
| # ZNVER3-NEXT: 0123456 |
| # ZNVER3-NEXT: Index 0123456789 |
| |
| # ZNVER4-NEXT: 0123456 |
| # ZNVER4-NEXT: Index 0123456789 |
| |
| # BARCELONA: [0,0] DeeeeeeeeeeeeeeER . vdivps %xmm0, %xmm1, %xmm1 |
| # BARCELONA-NEXT: [0,1] D========eeeeeeeeeER vaddps (%rax), %xmm1, %xmm1 |
| |
| # BDVER2: [0,0] DeeeeeeeeeER .. vdivps %xmm0, %xmm1, %xmm1 |
| # BDVER2-NEXT: [0,1] D====eeeeeeeeeeER vaddps (%rax), %xmm1, %xmm1 |
| |
| # BDWELL: [0,0] DeeeeeeeeeeeER .. vdivps %xmm0, %xmm1, %xmm1 |
| # BDWELL-NEXT: [0,1] D======eeeeeeeeER vaddps (%rax), %xmm1, %xmm1 |
| |
| # BTVER2: [0,0] DeeeeeeeeeeeeeeeeeeeER . vdivps %xmm0, %xmm1, %xmm1 |
| # BTVER2-NEXT: [0,1] D==============eeeeeeeeER vaddps (%rax), %xmm1, %xmm1 |
| |
| # HASWELL: [0,0] DeeeeeeeeeeeeeER . vdivps %xmm0, %xmm1, %xmm1 |
| # HASWELL-NEXT: [0,1] D=======eeeeeeeeeER vaddps (%rax), %xmm1, %xmm1 |
| |
| # SANDY: [0,0] DeeeeeeeeeeeeeeER . vdivps %xmm0, %xmm1, %xmm1 |
| # SANDY-NEXT: [0,1] D========eeeeeeeeeER vaddps (%rax), %xmm1, %xmm1 |
| |
| # SKYLAKE: [0,0] DeeeeeeeeeeeER . . vdivps %xmm0, %xmm1, %xmm1 |
| # SKYLAKE-NEXT: [0,1] D=====eeeeeeeeeeER vaddps (%rax), %xmm1, %xmm1 |
| |
| # ZNVER1: [0,0] DeeeeeeeeeeER . vdivps %xmm0, %xmm1, %xmm1 |
| # ZNVER1-NEXT: [0,1] D==eeeeeeeeeeER vaddps (%rax), %xmm1, %xmm1 |
| |
| # ZNVER2: [0,0] DeeeeeeeeeeER . vdivps %xmm0, %xmm1, %xmm1 |
| # ZNVER2-NEXT: [0,1] D===eeeeeeeeeeER vaddps (%rax), %xmm1, %xmm1 |
| |
| # ZNVER3: [0,0] DeeeeeeeeeeeER .. vdivps %xmm0, %xmm1, %xmm1 |
| # ZNVER3-NEXT: [0,1] D====eeeeeeeeeeER vaddps (%rax), %xmm1, %xmm1 |
| |
| # ZNVER4: [0,0] DeeeeeeeeeeeER .. vdivps %xmm0, %xmm1, %xmm1 |
| # ZNVER4-NEXT: [0,1] D====eeeeeeeeeeER vaddps (%rax), %xmm1, %xmm1 |
| |
| # ALL: Average Wait times (based on the timeline view): |
| # ALL-NEXT: [0]: Executions |
| # ALL-NEXT: [1]: Average time spent waiting in a scheduler's queue |
| # ALL-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready |
| # ALL-NEXT: [3]: Average time elapsed from WB until retire stage |
| |
| # ALL: [0] [1] [2] [3] |
| # ALL-NEXT: 0. 1 1.0 1.0 0.0 vdivps %xmm0, %xmm1, %xmm1 |
| |
| # BARCELONA-NEXT: 1. 1 9.0 0.0 0.0 vaddps (%rax), %xmm1, %xmm1 |
| # BARCELONA-NEXT: 1 5.0 0.5 0.0 <total> |
| |
| # BDVER2-NEXT: 1. 1 5.0 0.0 0.0 vaddps (%rax), %xmm1, %xmm1 |
| # BDVER2-NEXT: 1 3.0 0.5 0.0 <total> |
| |
| # BDWELL-NEXT: 1. 1 7.0 0.0 0.0 vaddps (%rax), %xmm1, %xmm1 |
| # BDWELL-NEXT: 1 4.0 0.5 0.0 <total> |
| |
| # BTVER2-NEXT: 1. 1 15.0 0.0 0.0 vaddps (%rax), %xmm1, %xmm1 |
| # BTVER2-NEXT: 1 8.0 0.5 0.0 <total> |
| |
| # HASWELL-NEXT: 1. 1 8.0 0.0 0.0 vaddps (%rax), %xmm1, %xmm1 |
| # HASWELL-NEXT: 1 4.5 0.5 0.0 <total> |
| |
| # SANDY-NEXT: 1. 1 9.0 0.0 0.0 vaddps (%rax), %xmm1, %xmm1 |
| # SANDY-NEXT: 1 5.0 0.5 0.0 <total> |
| |
| # SKYLAKE-NEXT: 1. 1 6.0 0.0 0.0 vaddps (%rax), %xmm1, %xmm1 |
| # SKYLAKE-NEXT: 1 3.5 0.5 0.0 <total> |
| |
| # ZNVER1-NEXT: 1. 1 3.0 0.0 0.0 vaddps (%rax), %xmm1, %xmm1 |
| # ZNVER1-NEXT: 1 2.0 0.5 0.0 <total> |
| |
| # ZNVER2-NEXT: 1. 1 4.0 0.0 0.0 vaddps (%rax), %xmm1, %xmm1 |
| # ZNVER2-NEXT: 1 2.5 0.5 0.0 <total> |
| |
| # ZNVER3-NEXT: 1. 1 5.0 0.0 0.0 vaddps (%rax), %xmm1, %xmm1 |
| # ZNVER3-NEXT: 1 3.0 0.5 0.0 <total> |
| |
| # ZNVER4-NEXT: 1. 1 5.0 0.0 0.0 vaddps (%rax), %xmm1, %xmm1 |
| # ZNVER4-NEXT: 1 3.0 0.5 0.0 <total> |