181 lines
7.9 KiB
ArmAsm
181 lines
7.9 KiB
ArmAsm
|
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||
|
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=sandybridge -iterations=1 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,SANDY
|
||
|
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=haswell -iterations=1 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,HASWELL
|
||
|
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=broadwell -iterations=1 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,BDWELL
|
||
|
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=skylake -iterations=1 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,SKYLAKE
|
||
|
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=x86-64 -iterations=1 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,BARCELONA
|
||
|
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=bdver2 -iterations=1 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,BDVER2
|
||
|
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=btver2 -iterations=1 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,BTVER2
|
||
|
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver1 -iterations=1 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,ZNVER1
|
||
|
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver2 -iterations=1 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,ZNVER2
|
||
|
|
||
|
# Sequence under test: vdivps writes %xmm1, and the following vaddps reads
# %xmm1 together with a memory operand loaded from (%rax), so the second
# instruction depends on the result of the first.
# In the expected timelines below, vaddps enters execution on every target
# while vdivps is still executing (its wait in the scheduler is shorter than
# the divide's execution time).
# NOTE(review): presumably this exercises the scheduling models' read-advance
# on the register operand of an instruction with a folded load - confirm
# against the target scheduling models.
vdivps %xmm0, %xmm1, %xmm1
|
||
|
vaddps (%rax), %xmm1, %xmm1
|
||
|
|
||
|
# ALL: Iterations: 1
|
||
|
# ALL-NEXT: Instructions: 2
|
||
|
|
||
|
# BARCELONA-NEXT: Total Cycles: 20
|
||
|
# BARCELONA-NEXT: Total uOps: 3
|
||
|
|
||
|
# BDVER2-NEXT: Total Cycles: 17
|
||
|
# BDVER2-NEXT: Total uOps: 2
|
||
|
|
||
|
# BDWELL-NEXT: Total Cycles: 17
|
||
|
# BDWELL-NEXT: Total uOps: 3
|
||
|
|
||
|
# BTVER2-NEXT: Total Cycles: 25
|
||
|
# BTVER2-NEXT: Total uOps: 2
|
||
|
|
||
|
# HASWELL-NEXT: Total Cycles: 19
|
||
|
# HASWELL-NEXT: Total uOps: 3
|
||
|
|
||
|
# SANDY-NEXT: Total Cycles: 20
|
||
|
# SANDY-NEXT: Total uOps: 3
|
||
|
|
||
|
# SKYLAKE-NEXT: Total Cycles: 18
|
||
|
# SKYLAKE-NEXT: Total uOps: 3
|
||
|
|
||
|
# ZNVER1-NEXT: Total Cycles: 20
|
||
|
# ZNVER1-NEXT: Total uOps: 2
|
||
|
|
||
|
# ZNVER2-NEXT: Total Cycles: 21
|
||
|
# ZNVER2-NEXT: Total uOps: 2
|
||
|
|
||
|
# BARCELONA: Dispatch Width: 4
|
||
|
# BARCELONA-NEXT: uOps Per Cycle: 0.15
|
||
|
# BARCELONA-NEXT: IPC: 0.10
|
||
|
# BARCELONA-NEXT: Block RThroughput: 14.0
|
||
|
|
||
|
# BDVER2: Dispatch Width: 4
|
||
|
# BDVER2-NEXT: uOps Per Cycle: 0.12
|
||
|
# BDVER2-NEXT: IPC: 0.12
|
||
|
# BDVER2-NEXT: Block RThroughput: 5.0
|
||
|
|
||
|
# BDWELL: Dispatch Width: 4
|
||
|
# BDWELL-NEXT: uOps Per Cycle: 0.18
|
||
|
# BDWELL-NEXT: IPC: 0.12
|
||
|
# BDWELL-NEXT: Block RThroughput: 5.0
|
||
|
|
||
|
# BTVER2: Dispatch Width: 2
|
||
|
# BTVER2-NEXT: uOps Per Cycle: 0.08
|
||
|
# BTVER2-NEXT: IPC: 0.08
|
||
|
# BTVER2-NEXT: Block RThroughput: 19.0
|
||
|
|
||
|
# HASWELL: Dispatch Width: 4
|
||
|
# HASWELL-NEXT: uOps Per Cycle: 0.16
|
||
|
# HASWELL-NEXT: IPC: 0.11
|
||
|
# HASWELL-NEXT: Block RThroughput: 7.0
|
||
|
|
||
|
# SANDY: Dispatch Width: 4
|
||
|
# SANDY-NEXT: uOps Per Cycle: 0.15
|
||
|
# SANDY-NEXT: IPC: 0.10
|
||
|
# SANDY-NEXT: Block RThroughput: 14.0
|
||
|
|
||
|
# SKYLAKE: Dispatch Width: 6
|
||
|
# SKYLAKE-NEXT: uOps Per Cycle: 0.17
|
||
|
# SKYLAKE-NEXT: IPC: 0.11
|
||
|
# SKYLAKE-NEXT: Block RThroughput: 3.0
|
||
|
|
||
|
# ZNVER1: Dispatch Width: 4
|
||
|
# ZNVER1-NEXT: uOps Per Cycle: 0.10
|
||
|
# ZNVER1-NEXT: IPC: 0.10
|
||
|
# ZNVER1-NEXT: Block RThroughput: 1.0
|
||
|
|
||
|
# ZNVER2: Dispatch Width: 4
|
||
|
# ZNVER2-NEXT: uOps Per Cycle: 0.10
|
||
|
# ZNVER2-NEXT: IPC: 0.10
|
||
|
# ZNVER2-NEXT: Block RThroughput: 1.0
|
||
|
|
||
|
# ALL: Timeline view:
|
||
|
|
||
|
# BARCELONA-NEXT: 0123456789
|
||
|
# BARCELONA-NEXT: Index 0123456789
|
||
|
|
||
|
# BDVER2-NEXT: 0123456
|
||
|
# BDVER2-NEXT: Index 0123456789
|
||
|
|
||
|
# BDWELL-NEXT: 0123456
|
||
|
# BDWELL-NEXT: Index 0123456789
|
||
|
|
||
|
# BTVER2-NEXT: 0123456789
|
||
|
# BTVER2-NEXT: Index 0123456789 01234
|
||
|
|
||
|
# HASWELL-NEXT: 012345678
|
||
|
# HASWELL-NEXT: Index 0123456789
|
||
|
|
||
|
# SANDY-NEXT: 0123456789
|
||
|
# SANDY-NEXT: Index 0123456789
|
||
|
|
||
|
# SKYLAKE-NEXT: 01234567
|
||
|
# SKYLAKE-NEXT: Index 0123456789
|
||
|
|
||
|
# ZNVER1-NEXT: 0123456789
|
||
|
# ZNVER1-NEXT: Index 0123456789
|
||
|
|
||
|
# ZNVER2-NEXT: 0123456789
|
||
|
# ZNVER2-NEXT: Index 0123456789 0
|
||
|
|
||
|
# BARCELONA: [0,0] DeeeeeeeeeeeeeeER . vdivps %xmm0, %xmm1, %xmm1
|
||
|
# BARCELONA-NEXT: [0,1] D========eeeeeeeeeER vaddps (%rax), %xmm1, %xmm1
|
||
|
|
||
|
# BDVER2: [0,0] DeeeeeeeeeER .. vdivps %xmm0, %xmm1, %xmm1
|
||
|
# BDVER2-NEXT: [0,1] D====eeeeeeeeeeER vaddps (%rax), %xmm1, %xmm1
|
||
|
|
||
|
# BDWELL: [0,0] DeeeeeeeeeeeER .. vdivps %xmm0, %xmm1, %xmm1
|
||
|
# BDWELL-NEXT: [0,1] D======eeeeeeeeER vaddps (%rax), %xmm1, %xmm1
|
||
|
|
||
|
# BTVER2: [0,0] DeeeeeeeeeeeeeeeeeeeER . vdivps %xmm0, %xmm1, %xmm1
|
||
|
# BTVER2-NEXT: [0,1] D==============eeeeeeeeER vaddps (%rax), %xmm1, %xmm1
|
||
|
|
||
|
# HASWELL: [0,0] DeeeeeeeeeeeeeER . vdivps %xmm0, %xmm1, %xmm1
|
||
|
# HASWELL-NEXT: [0,1] D=======eeeeeeeeeER vaddps (%rax), %xmm1, %xmm1
|
||
|
|
||
|
# SANDY: [0,0] DeeeeeeeeeeeeeeER . vdivps %xmm0, %xmm1, %xmm1
|
||
|
# SANDY-NEXT: [0,1] D========eeeeeeeeeER vaddps (%rax), %xmm1, %xmm1
|
||
|
|
||
|
# SKYLAKE: [0,0] DeeeeeeeeeeeER . . vdivps %xmm0, %xmm1, %xmm1
|
||
|
# SKYLAKE-NEXT: [0,1] D=====eeeeeeeeeeER vaddps (%rax), %xmm1, %xmm1
|
||
|
|
||
|
# ZNVER1: [0,0] DeeeeeeeeeeeeeeeER . vdivps %xmm0, %xmm1, %xmm1
|
||
|
# ZNVER1-NEXT: [0,1] D=======eeeeeeeeeeER vaddps (%rax), %xmm1, %xmm1
|
||
|
|
||
|
# ZNVER2: [0,0] DeeeeeeeeeeeeeeeER . vdivps %xmm0, %xmm1, %xmm1
|
||
|
# ZNVER2-NEXT: [0,1] D========eeeeeeeeeeER vaddps (%rax), %xmm1, %xmm1
|
||
|
|
||
|
# ALL: Average Wait times (based on the timeline view):
|
||
|
# ALL-NEXT: [0]: Executions
|
||
|
# ALL-NEXT: [1]: Average time spent waiting in a scheduler's queue
|
||
|
# ALL-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
|
||
|
# ALL-NEXT: [3]: Average time elapsed from WB until retire stage
|
||
|
|
||
|
# ALL: [0] [1] [2] [3]
|
||
|
# ALL-NEXT: 0. 1 1.0 1.0 0.0 vdivps %xmm0, %xmm1, %xmm1
|
||
|
|
||
|
# BARCELONA-NEXT: 1. 1 9.0 0.0 0.0 vaddps (%rax), %xmm1, %xmm1
|
||
|
# BARCELONA-NEXT: 1 5.0 0.5 0.0 <total>
|
||
|
|
||
|
# BDVER2-NEXT: 1. 1 5.0 0.0 0.0 vaddps (%rax), %xmm1, %xmm1
|
||
|
# BDVER2-NEXT: 1 3.0 0.5 0.0 <total>
|
||
|
|
||
|
# BDWELL-NEXT: 1. 1 7.0 0.0 0.0 vaddps (%rax), %xmm1, %xmm1
|
||
|
# BDWELL-NEXT: 1 4.0 0.5 0.0 <total>
|
||
|
|
||
|
# BTVER2-NEXT: 1. 1 15.0 0.0 0.0 vaddps (%rax), %xmm1, %xmm1
|
||
|
# BTVER2-NEXT: 1 8.0 0.5 0.0 <total>
|
||
|
|
||
|
# HASWELL-NEXT: 1. 1 8.0 0.0 0.0 vaddps (%rax), %xmm1, %xmm1
|
||
|
# HASWELL-NEXT: 1 4.5 0.5 0.0 <total>
|
||
|
|
||
|
# SANDY-NEXT: 1. 1 9.0 0.0 0.0 vaddps (%rax), %xmm1, %xmm1
|
||
|
# SANDY-NEXT: 1 5.0 0.5 0.0 <total>
|
||
|
|
||
|
# SKYLAKE-NEXT: 1. 1 6.0 0.0 0.0 vaddps (%rax), %xmm1, %xmm1
|
||
|
# SKYLAKE-NEXT: 1 3.5 0.5 0.0 <total>
|
||
|
|
||
|
# ZNVER1-NEXT: 1. 1 8.0 0.0 0.0 vaddps (%rax), %xmm1, %xmm1
|
||
|
# ZNVER1-NEXT: 1 4.5 0.5 0.0 <total>
|
||
|
|
||
|
# ZNVER2-NEXT: 1. 1 9.0 0.0 0.0 vaddps (%rax), %xmm1, %xmm1
|
||
|
# ZNVER2-NEXT: 1 5.0 0.5 0.0 <total>
|