| # NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py |
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=haswell -iterations=100 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,HASWELL |
| |
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=broadwell -iterations=100 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,BDWELL |
| |
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=skylake -iterations=100 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,SKYLAKE |
| |
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=icelake-server -iterations=100 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,SKYLAKE |
| |
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver1 -iterations=100 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,ZNVER1 |
| |
| # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver2 -iterations=100 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,ZNVER2 |
| |
| # Code Snippet from "Ithemal: Accurate, Portable and Fast Basic Block Throughput Estimation using Deep Neural Networks" |
| # Charith Mendis, Saman Amarasinghe, Michael Carbin |
| add $1, %edx |
| vpaddd (%r8), %ymm0, %ymm0 |
| add $32, %r8 |
| cmp %edi, %edx |
| |
| # ALL: Iterations: 100 |
| # ALL-NEXT: Instructions: 400 |
| |
| # BDWELL-NEXT: Total Cycles: 142 |
| # BDWELL-NEXT: Total uOps: 500 |
| |
| # HASWELL-NEXT: Total Cycles: 143 |
| # HASWELL-NEXT: Total uOps: 500 |
| |
| # SKYLAKE-NEXT: Total Cycles: 110 |
| # SKYLAKE-NEXT: Total uOps: 500 |
| |
| # ZNVER1-NEXT: Total Cycles: 143 |
| # ZNVER1-NEXT: Total uOps: 500 |
| |
| # ZNVER2-NEXT: Total Cycles: 110 |
| # ZNVER2-NEXT: Total uOps: 400 |
| |
| # BDWELL: Dispatch Width: 4 |
| # BDWELL-NEXT: uOps Per Cycle: 3.52 |
| # BDWELL-NEXT: IPC: 2.82 |
| # BDWELL-NEXT: Block RThroughput: 1.3 |
| |
| # HASWELL: Dispatch Width: 4 |
| # HASWELL-NEXT: uOps Per Cycle: 3.50 |
| # HASWELL-NEXT: IPC: 2.80 |
| # HASWELL-NEXT: Block RThroughput: 1.3 |
| |
| # SKYLAKE: Dispatch Width: 6 |
| # SKYLAKE-NEXT: uOps Per Cycle: 4.55 |
| # SKYLAKE-NEXT: IPC: 3.64 |
| # SKYLAKE-NEXT: Block RThroughput: 0.8 |
| |
| # ZNVER1: Dispatch Width: 4 |
| # ZNVER1-NEXT: uOps Per Cycle: 3.50 |
| # ZNVER1-NEXT: IPC: 2.80 |
| # ZNVER1-NEXT: Block RThroughput: 1.3 |
| |
| # ZNVER2: Dispatch Width: 4 |
| # ZNVER2-NEXT: uOps Per Cycle: 3.64 |
| # ZNVER2-NEXT: IPC: 3.64 |
| # ZNVER2-NEXT: Block RThroughput: 1.0 |
| |
| # ALL: Timeline view: |
| |
| # BDWELL-NEXT: 0123456789 |
| # BDWELL-NEXT: Index 0123456789 01 |
| |
| # HASWELL-NEXT: 0123456789 |
| # HASWELL-NEXT: Index 0123456789 012 |
| |
| # SKYLAKE-NEXT: 0123456789 |
| # SKYLAKE-NEXT: Index 0123456789 |
| |
| # ZNVER1-NEXT: 0123456789 |
| # ZNVER1-NEXT: Index 0123456789 012 |
| |
| # ZNVER2-NEXT: 0123456789 |
| # ZNVER2-NEXT: Index 0123456789 |
| |
| # BDWELL: [0,0] DeER . . . .. addl $1, %edx |
| # BDWELL-NEXT: [0,1] DeeeeeeeER. . .. vpaddd (%r8), %ymm0, %ymm0 |
| # BDWELL-NEXT: [0,2] DeE------R. . .. addq $32, %r8 |
| # BDWELL-NEXT: [0,3] .DeE-----R. . .. cmpl %edi, %edx |
| # BDWELL-NEXT: [1,0] .DeE-----R. . .. addl $1, %edx |
| # BDWELL-NEXT: [1,1] .DeeeeeeeER . .. vpaddd (%r8), %ymm0, %ymm0 |
| # BDWELL-NEXT: [1,2] . DeE-----R . .. addq $32, %r8 |
| # BDWELL-NEXT: [1,3] . DeE-----R . .. cmpl %edi, %edx |
| # BDWELL-NEXT: [2,0] . DeE-----R . .. addl $1, %edx |
| # BDWELL-NEXT: [2,1] . DeeeeeeeER . .. vpaddd (%r8), %ymm0, %ymm0 |
| # BDWELL-NEXT: [2,2] . DeE------R . .. addq $32, %r8 |
| # BDWELL-NEXT: [2,3] . DeE------R . .. cmpl %edi, %edx |
| # BDWELL-NEXT: [3,0] . DeE-----R . .. addl $1, %edx |
| # BDWELL-NEXT: [3,1] . DeeeeeeeER . .. vpaddd (%r8), %ymm0, %ymm0 |
| # BDWELL-NEXT: [3,2] . DeE------R . .. addq $32, %r8 |
| # BDWELL-NEXT: [3,3] . DeE-----R . .. cmpl %edi, %edx |
| # BDWELL-NEXT: [4,0] . DeE-----R . .. addl $1, %edx |
| # BDWELL-NEXT: [4,1] . DeeeeeeeER. .. vpaddd (%r8), %ymm0, %ymm0 |
| # BDWELL-NEXT: [4,2] . .DeE-----R. .. addq $32, %r8 |
| # BDWELL-NEXT: [4,3] . .DeE-----R. .. cmpl %edi, %edx |
| # BDWELL-NEXT: [5,0] . .DeE-----R. .. addl $1, %edx |
| # BDWELL-NEXT: [5,1] . . DeeeeeeeER .. vpaddd (%r8), %ymm0, %ymm0 |
| # BDWELL-NEXT: [5,2] . . DeE------R .. addq $32, %r8 |
| # BDWELL-NEXT: [5,3] . . DeE------R .. cmpl %edi, %edx |
| # BDWELL-NEXT: [6,0] . . DeE-----R .. addl $1, %edx |
| # BDWELL-NEXT: [6,1] . . DeeeeeeeER .. vpaddd (%r8), %ymm0, %ymm0 |
| # BDWELL-NEXT: [6,2] . . DeE------R .. addq $32, %r8 |
| # BDWELL-NEXT: [6,3] . . DeE-----R .. cmpl %edi, %edx |
| # BDWELL-NEXT: [7,0] . . DeE-----R .. addl $1, %edx |
| # BDWELL-NEXT: [7,1] . . DeeeeeeeER .. vpaddd (%r8), %ymm0, %ymm0 |
| # BDWELL-NEXT: [7,2] . . DeE-----R .. addq $32, %r8 |
| # BDWELL-NEXT: [7,3] . . DeE-----R .. cmpl %edi, %edx |
| # BDWELL-NEXT: [8,0] . . DeE-----R .. addl $1, %edx |
| # BDWELL-NEXT: [8,1] . . .DeeeeeeeER. vpaddd (%r8), %ymm0, %ymm0 |
| # BDWELL-NEXT: [8,2] . . .DeE------R. addq $32, %r8 |
| # BDWELL-NEXT: [8,3] . . .DeE------R. cmpl %edi, %edx |
| # BDWELL-NEXT: [9,0] . . . DeE-----R. addl $1, %edx |
| # BDWELL-NEXT: [9,1] . . . DeeeeeeeER vpaddd (%r8), %ymm0, %ymm0 |
| # BDWELL-NEXT: [9,2] . . . DeE------R addq $32, %r8 |
| # BDWELL-NEXT: [9,3] . . . DeE-----R cmpl %edi, %edx |
| |
| # HASWELL: [0,0] DeER . . . . . addl $1, %edx |
| # HASWELL-NEXT: [0,1] DeeeeeeeeER . . . vpaddd (%r8), %ymm0, %ymm0 |
| # HASWELL-NEXT: [0,2] DeE-------R . . . addq $32, %r8 |
| # HASWELL-NEXT: [0,3] .DeE------R . . . cmpl %edi, %edx |
| # HASWELL-NEXT: [1,0] .DeE------R . . . addl $1, %edx |
| # HASWELL-NEXT: [1,1] .DeeeeeeeeER . . . vpaddd (%r8), %ymm0, %ymm0 |
| # HASWELL-NEXT: [1,2] . DeE------R . . . addq $32, %r8 |
| # HASWELL-NEXT: [1,3] . DeE------R . . . cmpl %edi, %edx |
| # HASWELL-NEXT: [2,0] . DeE------R . . . addl $1, %edx |
| # HASWELL-NEXT: [2,1] . DeeeeeeeeER . . . vpaddd (%r8), %ymm0, %ymm0 |
| # HASWELL-NEXT: [2,2] . DeE-------R . . . addq $32, %r8 |
| # HASWELL-NEXT: [2,3] . DeE-------R . . . cmpl %edi, %edx |
| # HASWELL-NEXT: [3,0] . DeE------R . . . addl $1, %edx |
| # HASWELL-NEXT: [3,1] . DeeeeeeeeER. . . vpaddd (%r8), %ymm0, %ymm0 |
| # HASWELL-NEXT: [3,2] . DeE-------R. . . addq $32, %r8 |
| # HASWELL-NEXT: [3,3] . DeE------R. . . cmpl %edi, %edx |
| # HASWELL-NEXT: [4,0] . DeE------R. . . addl $1, %edx |
| # HASWELL-NEXT: [4,1] . DeeeeeeeeER . . vpaddd (%r8), %ymm0, %ymm0 |
| # HASWELL-NEXT: [4,2] . .DeE------R . . addq $32, %r8 |
| # HASWELL-NEXT: [4,3] . .DeE------R . . cmpl %edi, %edx |
| # HASWELL-NEXT: [5,0] . .DeE------R . . addl $1, %edx |
| # HASWELL-NEXT: [5,1] . . DeeeeeeeeER . . vpaddd (%r8), %ymm0, %ymm0 |
| # HASWELL-NEXT: [5,2] . . DeE-------R . . addq $32, %r8 |
| # HASWELL-NEXT: [5,3] . . DeE-------R . . cmpl %edi, %edx |
| # HASWELL-NEXT: [6,0] . . DeE------R . . addl $1, %edx |
| # HASWELL-NEXT: [6,1] . . DeeeeeeeeER . . vpaddd (%r8), %ymm0, %ymm0 |
| # HASWELL-NEXT: [6,2] . . DeE-------R . . addq $32, %r8 |
| # HASWELL-NEXT: [6,3] . . DeE------R . . cmpl %edi, %edx |
| # HASWELL-NEXT: [7,0] . . DeE------R . . addl $1, %edx |
| # HASWELL-NEXT: [7,1] . . DeeeeeeeeER. . vpaddd (%r8), %ymm0, %ymm0 |
| # HASWELL-NEXT: [7,2] . . DeE------R. . addq $32, %r8 |
| # HASWELL-NEXT: [7,3] . . DeE------R. . cmpl %edi, %edx |
| # HASWELL-NEXT: [8,0] . . DeE------R. . addl $1, %edx |
| # HASWELL-NEXT: [8,1] . . .DeeeeeeeeER. vpaddd (%r8), %ymm0, %ymm0 |
| # HASWELL-NEXT: [8,2] . . .DeE-------R. addq $32, %r8 |
| # HASWELL-NEXT: [8,3] . . .DeE-------R. cmpl %edi, %edx |
| # HASWELL-NEXT: [9,0] . . . DeE------R. addl $1, %edx |
| # HASWELL-NEXT: [9,1] . . . DeeeeeeeeER vpaddd (%r8), %ymm0, %ymm0 |
| # HASWELL-NEXT: [9,2] . . . DeE-------R addq $32, %r8 |
| # HASWELL-NEXT: [9,3] . . . DeE------R cmpl %edi, %edx |
| |
| # SKYLAKE: [0,0] DeER . . . . addl $1, %edx |
| # SKYLAKE-NEXT: [0,1] DeeeeeeeeER . . vpaddd (%r8), %ymm0, %ymm0 |
| # SKYLAKE-NEXT: [0,2] DeE-------R . . addq $32, %r8 |
| # SKYLAKE-NEXT: [0,3] D=eE------R . . cmpl %edi, %edx |
| # SKYLAKE-NEXT: [1,0] D=eE------R . . addl $1, %edx |
| # SKYLAKE-NEXT: [1,1] .DeeeeeeeeER . . vpaddd (%r8), %ymm0, %ymm0 |
| # SKYLAKE-NEXT: [1,2] .DeE-------R . . addq $32, %r8 |
| # SKYLAKE-NEXT: [1,3] .D=eE------R . . cmpl %edi, %edx |
| # SKYLAKE-NEXT: [2,0] .D=eE------R . . addl $1, %edx |
| # SKYLAKE-NEXT: [2,1] . DeeeeeeeeER . . vpaddd (%r8), %ymm0, %ymm0 |
| # SKYLAKE-NEXT: [2,2] . DeE-------R . . addq $32, %r8 |
| # SKYLAKE-NEXT: [2,3] . D=eE------R . . cmpl %edi, %edx |
| # SKYLAKE-NEXT: [3,0] . D=eE------R . . addl $1, %edx |
| # SKYLAKE-NEXT: [3,1] . DeeeeeeeeER . . vpaddd (%r8), %ymm0, %ymm0 |
| # SKYLAKE-NEXT: [3,2] . DeE-------R . . addq $32, %r8 |
| # SKYLAKE-NEXT: [3,3] . D=eE------R . . cmpl %edi, %edx |
| # SKYLAKE-NEXT: [4,0] . D=eE------R . . addl $1, %edx |
| # SKYLAKE-NEXT: [4,1] . DeeeeeeeeER. . vpaddd (%r8), %ymm0, %ymm0 |
| # SKYLAKE-NEXT: [4,2] . DeE-------R. . addq $32, %r8 |
| # SKYLAKE-NEXT: [4,3] . D=eE------R. . cmpl %edi, %edx |
| # SKYLAKE-NEXT: [5,0] . D=eE------R. . addl $1, %edx |
| # SKYLAKE-NEXT: [5,1] . DeeeeeeeeER . vpaddd (%r8), %ymm0, %ymm0 |
| # SKYLAKE-NEXT: [5,2] . DeE-------R . addq $32, %r8 |
| # SKYLAKE-NEXT: [5,3] . D=eE------R . cmpl %edi, %edx |
| # SKYLAKE-NEXT: [6,0] . D=eE------R . addl $1, %edx |
| # SKYLAKE-NEXT: [6,1] . .DeeeeeeeeER . vpaddd (%r8), %ymm0, %ymm0 |
| # SKYLAKE-NEXT: [6,2] . .DeE-------R . addq $32, %r8 |
| # SKYLAKE-NEXT: [6,3] . .D=eE------R . cmpl %edi, %edx |
| # SKYLAKE-NEXT: [7,0] . .D=eE------R . addl $1, %edx |
| # SKYLAKE-NEXT: [7,1] . . DeeeeeeeeER . vpaddd (%r8), %ymm0, %ymm0 |
| # SKYLAKE-NEXT: [7,2] . . DeE-------R . addq $32, %r8 |
| # SKYLAKE-NEXT: [7,3] . . D=eE------R . cmpl %edi, %edx |
| # SKYLAKE-NEXT: [8,0] . . D=eE------R . addl $1, %edx |
| # SKYLAKE-NEXT: [8,1] . . DeeeeeeeeER. vpaddd (%r8), %ymm0, %ymm0 |
| # SKYLAKE-NEXT: [8,2] . . DeE-------R. addq $32, %r8 |
| # SKYLAKE-NEXT: [8,3] . . D=eE------R. cmpl %edi, %edx |
| # SKYLAKE-NEXT: [9,0] . . D=eE------R. addl $1, %edx |
| # SKYLAKE-NEXT: [9,1] . . DeeeeeeeeER vpaddd (%r8), %ymm0, %ymm0 |
| # SKYLAKE-NEXT: [9,2] . . DeE-------R addq $32, %r8 |
| # SKYLAKE-NEXT: [9,3] . . D=eE------R cmpl %edi, %edx |
| |
| # ZNVER1: [0,0] DeER . . . . . addl $1, %edx |
| # ZNVER1-NEXT: [0,1] DeeeeeeeeER . . . vpaddd (%r8), %ymm0, %ymm0 |
| # ZNVER1-NEXT: [0,2] DeE-------R . . . addq $32, %r8 |
| # ZNVER1-NEXT: [0,3] .DeE------R . . . cmpl %edi, %edx |
| # ZNVER1-NEXT: [1,0] .DeE------R . . . addl $1, %edx |
| # ZNVER1-NEXT: [1,1] .DeeeeeeeeER . . . vpaddd (%r8), %ymm0, %ymm0 |
| # ZNVER1-NEXT: [1,2] . DeE------R . . . addq $32, %r8 |
| # ZNVER1-NEXT: [1,3] . DeE------R . . . cmpl %edi, %edx |
| # ZNVER1-NEXT: [2,0] . DeE------R . . . addl $1, %edx |
| # ZNVER1-NEXT: [2,1] . DeeeeeeeeER . . . vpaddd (%r8), %ymm0, %ymm0 |
| # ZNVER1-NEXT: [2,2] . DeE-------R . . . addq $32, %r8 |
| # ZNVER1-NEXT: [2,3] . DeE-------R . . . cmpl %edi, %edx |
| # ZNVER1-NEXT: [3,0] . DeE------R . . . addl $1, %edx |
| # ZNVER1-NEXT: [3,1] . DeeeeeeeeER. . . vpaddd (%r8), %ymm0, %ymm0 |
| # ZNVER1-NEXT: [3,2] . DeE-------R. . . addq $32, %r8 |
| # ZNVER1-NEXT: [3,3] . DeE------R. . . cmpl %edi, %edx |
| # ZNVER1-NEXT: [4,0] . DeE------R. . . addl $1, %edx |
| # ZNVER1-NEXT: [4,1] . DeeeeeeeeER . . vpaddd (%r8), %ymm0, %ymm0 |
| # ZNVER1-NEXT: [4,2] . .DeE------R . . addq $32, %r8 |
| # ZNVER1-NEXT: [4,3] . .DeE------R . . cmpl %edi, %edx |
| # ZNVER1-NEXT: [5,0] . .DeE------R . . addl $1, %edx |
| # ZNVER1-NEXT: [5,1] . . DeeeeeeeeER . . vpaddd (%r8), %ymm0, %ymm0 |
| # ZNVER1-NEXT: [5,2] . . DeE-------R . . addq $32, %r8 |
| # ZNVER1-NEXT: [5,3] . . DeE-------R . . cmpl %edi, %edx |
| # ZNVER1-NEXT: [6,0] . . DeE------R . . addl $1, %edx |
| # ZNVER1-NEXT: [6,1] . . DeeeeeeeeER . . vpaddd (%r8), %ymm0, %ymm0 |
| # ZNVER1-NEXT: [6,2] . . DeE-------R . . addq $32, %r8 |
| # ZNVER1-NEXT: [6,3] . . DeE------R . . cmpl %edi, %edx |
| # ZNVER1-NEXT: [7,0] . . DeE------R . . addl $1, %edx |
| # ZNVER1-NEXT: [7,1] . . DeeeeeeeeER. . vpaddd (%r8), %ymm0, %ymm0 |
| # ZNVER1-NEXT: [7,2] . . DeE------R. . addq $32, %r8 |
| # ZNVER1-NEXT: [7,3] . . DeE------R. . cmpl %edi, %edx |
| # ZNVER1-NEXT: [8,0] . . DeE------R. . addl $1, %edx |
| # ZNVER1-NEXT: [8,1] . . .DeeeeeeeeER. vpaddd (%r8), %ymm0, %ymm0 |
| # ZNVER1-NEXT: [8,2] . . .DeE-------R. addq $32, %r8 |
| # ZNVER1-NEXT: [8,3] . . .DeE-------R. cmpl %edi, %edx |
| # ZNVER1-NEXT: [9,0] . . . DeE------R. addl $1, %edx |
| # ZNVER1-NEXT: [9,1] . . . DeeeeeeeeER vpaddd (%r8), %ymm0, %ymm0 |
| # ZNVER1-NEXT: [9,2] . . . DeE-------R addq $32, %r8 |
| # ZNVER1-NEXT: [9,3] . . . DeE------R cmpl %edi, %edx |
| |
| # ZNVER2: [0,0] DeER . . . . addl $1, %edx |
| # ZNVER2-NEXT: [0,1] DeeeeeeeeER . . vpaddd (%r8), %ymm0, %ymm0 |
| # ZNVER2-NEXT: [0,2] DeE-------R . . addq $32, %r8 |
| # ZNVER2-NEXT: [0,3] D=eE------R . . cmpl %edi, %edx |
| # ZNVER2-NEXT: [1,0] .DeE------R . . addl $1, %edx |
| # ZNVER2-NEXT: [1,1] .DeeeeeeeeER . . vpaddd (%r8), %ymm0, %ymm0 |
| # ZNVER2-NEXT: [1,2] .DeE-------R . . addq $32, %r8 |
| # ZNVER2-NEXT: [1,3] .D=eE------R . . cmpl %edi, %edx |
| # ZNVER2-NEXT: [2,0] . DeE------R . . addl $1, %edx |
| # ZNVER2-NEXT: [2,1] . DeeeeeeeeER . . vpaddd (%r8), %ymm0, %ymm0 |
| # ZNVER2-NEXT: [2,2] . DeE-------R . . addq $32, %r8 |
| # ZNVER2-NEXT: [2,3] . D=eE------R . . cmpl %edi, %edx |
| # ZNVER2-NEXT: [3,0] . DeE------R . . addl $1, %edx |
| # ZNVER2-NEXT: [3,1] . DeeeeeeeeER . . vpaddd (%r8), %ymm0, %ymm0 |
| # ZNVER2-NEXT: [3,2] . DeE-------R . . addq $32, %r8 |
| # ZNVER2-NEXT: [3,3] . D=eE------R . . cmpl %edi, %edx |
| # ZNVER2-NEXT: [4,0] . DeE------R . . addl $1, %edx |
| # ZNVER2-NEXT: [4,1] . DeeeeeeeeER. . vpaddd (%r8), %ymm0, %ymm0 |
| # ZNVER2-NEXT: [4,2] . DeE-------R. . addq $32, %r8 |
| # ZNVER2-NEXT: [4,3] . D=eE------R. . cmpl %edi, %edx |
| # ZNVER2-NEXT: [5,0] . DeE------R. . addl $1, %edx |
| # ZNVER2-NEXT: [5,1] . DeeeeeeeeER . vpaddd (%r8), %ymm0, %ymm0 |
| # ZNVER2-NEXT: [5,2] . DeE-------R . addq $32, %r8 |
| # ZNVER2-NEXT: [5,3] . D=eE------R . cmpl %edi, %edx |
| # ZNVER2-NEXT: [6,0] . .DeE------R . addl $1, %edx |
| # ZNVER2-NEXT: [6,1] . .DeeeeeeeeER . vpaddd (%r8), %ymm0, %ymm0 |
| # ZNVER2-NEXT: [6,2] . .DeE-------R . addq $32, %r8 |
| # ZNVER2-NEXT: [6,3] . .D=eE------R . cmpl %edi, %edx |
| # ZNVER2-NEXT: [7,0] . . DeE------R . addl $1, %edx |
| # ZNVER2-NEXT: [7,1] . . DeeeeeeeeER . vpaddd (%r8), %ymm0, %ymm0 |
| # ZNVER2-NEXT: [7,2] . . DeE-------R . addq $32, %r8 |
| # ZNVER2-NEXT: [7,3] . . D=eE------R . cmpl %edi, %edx |
| # ZNVER2-NEXT: [8,0] . . DeE------R . addl $1, %edx |
| # ZNVER2-NEXT: [8,1] . . DeeeeeeeeER. vpaddd (%r8), %ymm0, %ymm0 |
| # ZNVER2-NEXT: [8,2] . . DeE-------R. addq $32, %r8 |
| # ZNVER2-NEXT: [8,3] . . D=eE------R. cmpl %edi, %edx |
| # ZNVER2-NEXT: [9,0] . . DeE------R. addl $1, %edx |
| # ZNVER2-NEXT: [9,1] . . DeeeeeeeeER vpaddd (%r8), %ymm0, %ymm0 |
| # ZNVER2-NEXT: [9,2] . . DeE-------R addq $32, %r8 |
| # ZNVER2-NEXT: [9,3] . . D=eE------R cmpl %edi, %edx |
| |
| # ALL: Average Wait times (based on the timeline view): |
| # ALL-NEXT: [0]: Executions |
| # ALL-NEXT: [1]: Average time spent waiting in a scheduler's queue |
| # ALL-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready |
| # ALL-NEXT: [3]: Average time elapsed from WB until retire stage |
| |
| # ALL: [0] [1] [2] [3] |
| |
| # BDWELL-NEXT: 0. 10 1.0 0.4 4.5 addl $1, %edx |
| # HASWELL-NEXT: 0. 10 1.0 0.4 5.4 addl $1, %edx |
| # SKYLAKE-NEXT: 0. 10 1.9 0.1 5.4 addl $1, %edx |
| # ZNVER1-NEXT: 0. 10 1.0 0.4 5.4 addl $1, %edx |
| # ZNVER2-NEXT: 0. 10 1.0 0.1 5.4 addl $1, %edx |
| |
| # ALL-NEXT: 1. 10 1.0 0.1 0.0 vpaddd (%r8), %ymm0, %ymm0 |
| |
| # BDWELL-NEXT: 2. 10 1.0 0.4 5.7 addq $32, %r8 |
| # BDWELL-NEXT: 3. 10 1.0 0.0 5.3 cmpl %edi, %edx |
| # BDWELL-NEXT: 10 1.0 0.2 3.9 <total> |
| |
| # HASWELL-NEXT: 2. 10 1.0 0.4 6.7 addq $32, %r8 |
| # HASWELL-NEXT: 3. 10 1.0 0.0 6.3 cmpl %edi, %edx |
| # HASWELL-NEXT: 10 1.0 0.2 4.6 <total> |
| |
| # SKYLAKE-NEXT: 2. 10 1.0 0.1 7.0 addq $32, %r8 |
| # SKYLAKE-NEXT: 3. 10 2.0 0.0 6.0 cmpl %edi, %edx |
| # SKYLAKE-NEXT: 10 1.5 0.1 4.6 <total> |
| |
| # ZNVER1-NEXT: 2. 10 1.0 0.4 6.7 addq $32, %r8 |
| # ZNVER1-NEXT: 3. 10 1.0 0.0 6.3 cmpl %edi, %edx |
| # ZNVER1-NEXT: 10 1.0 0.2 4.6 <total> |
| |
| # ZNVER2-NEXT: 2. 10 1.0 0.1 7.0 addq $32, %r8 |
| # ZNVER2-NEXT: 3. 10 2.0 0.0 6.0 cmpl %edi, %edx |
| # ZNVER2-NEXT: 10 1.3 0.1 4.6 <total> |