You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
344 lines
15 KiB
344 lines
15 KiB
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
|
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=x86-64 -iterations=1 -all-views=false -timeline < %s | FileCheck %s -check-prefixes=ALL,BARCELONA
|
|
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=bdver2 -iterations=1 -all-views=false -timeline < %s | FileCheck %s -check-prefixes=ALL,BDVER2
|
|
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=btver2 -iterations=1 -all-views=false -timeline < %s | FileCheck %s -check-prefixes=ALL,BTVER2
|
|
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver1 -iterations=1 -all-views=false -timeline < %s | FileCheck %s -check-prefixes=ALL,ZNVER1
|
|
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver2 -iterations=1 -all-views=false -timeline < %s | FileCheck %s -check-prefixes=ALL,ZNVER2
|
|
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=haswell -iterations=1 -all-views=false -timeline < %s | FileCheck %s -check-prefixes=ALL,HASWELL
|
|
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=broadwell -iterations=1 -all-views=false -timeline < %s | FileCheck %s -check-prefixes=ALL,BROADWELL
|
|
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=skylake -iterations=1 -all-views=false -timeline < %s | FileCheck %s -check-prefixes=ALL,SKYLAKE
|
|
|
|
# Region test_sqrtss: scalar single-precision square root whose source is a
# memory operand.
# The leaq only computes an address (rax = rsp + rdi*2 + 8); the sqrtss then
# loads from (%rax). The sole link between the two instructions is therefore
# the address register %rax written by the leaq.
# The expected timelines further down show the sqrtss sitting in the
# scheduler ('=') until the leaq result is available before it starts
# executing.
#LLVM-MCA-BEGIN test_sqrtss
|
|
leaq 8(%rsp, %rdi, 2), %rax
|
|
sqrtss (%rax), %xmm1
|
|
#LLVM-MCA-END
|
|
|
|
# Region test_sqrtsd: scalar double-precision square root whose source is a
# memory operand.
# Same two-instruction shape as the sqrtss region: the leaq produces the
# address in %rax (rsp + rdi*2 + 8) and the sqrtsd loads from (%rax), so the
# second instruction depends on the first only through that address register.
#LLVM-MCA-BEGIN test_sqrtsd
|
|
leaq 8(%rsp, %rdi, 2), %rax
|
|
sqrtsd (%rax), %xmm1
|
|
#LLVM-MCA-END
|
|
|
|
# Region test_rsqrtss: scalar single-precision reciprocal square root
# estimate whose source is a memory operand.
# The leaq produces the address in %rax (rsp + rdi*2 + 8) and the rsqrtss
# loads from (%rax), so the second instruction depends on the first only
# through that address register.
#LLVM-MCA-BEGIN test_rsqrtss
|
|
leaq 8(%rsp, %rdi, 2), %rax
|
|
rsqrtss (%rax), %xmm1
|
|
#LLVM-MCA-END
|
|
|
|
# Region test_rcp: scalar single-precision reciprocal estimate (rcpss) whose
# source is a memory operand.
# The leaq produces the address in %rax (rsp + rdi*2 + 8) and the rcpss loads
# from (%rax), so the second instruction depends on the first only through
# that address register.
# NOTE(review): the other regions in this file are named after their exact
# mnemonic, while this one is "test_rcp" rather than "test_rcpss". The region
# name is echoed in the expected output, so renaming it means regenerating
# the assertions with utils/update_mca_test_checks.py.
#LLVM-MCA-BEGIN test_rcp
|
|
leaq 8(%rsp, %rdi, 2), %rax
|
|
rcpss (%rax), %xmm1
|
|
#LLVM-MCA-END
|
|
|
|
# ALL: [0] Code Region - test_sqrtss
|
|
|
|
# ALL: Timeline view:
|
|
|
|
# BARCELONA-NEXT: 0123456789
|
|
# BARCELONA-NEXT: Index 0123456789 0123
|
|
|
|
# BDVER2-NEXT: 012345678
|
|
# BDVER2-NEXT: Index 0123456789
|
|
|
|
# BROADWELL-NEXT: 0123456789
|
|
# BROADWELL-NEXT: Index 0123456789
|
|
|
|
# BTVER2-NEXT: 0123456789 0
|
|
# BTVER2-NEXT: Index 0123456789 0123456789
|
|
|
|
# HASWELL-NEXT: 0123456789
|
|
# HASWELL-NEXT: Index 0123456789
|
|
|
|
# SKYLAKE-NEXT: 0123456789
|
|
# SKYLAKE-NEXT: Index 0123456789 0
|
|
|
|
# ZNVER1-NEXT: 0123456789 0
|
|
# ZNVER1-NEXT: Index 0123456789 0123456789
|
|
|
|
# ZNVER2-NEXT: 0123456789 0
|
|
# ZNVER2-NEXT: Index 0123456789 0123456789
|
|
|
|
# BARCELONA: [0,0] DeER . . . . . leaq 8(%rsp,%rdi,2), %rax
|
|
# BARCELONA-NEXT: [0,1] D=eeeeeeeeeeeeeeeeeeeeER sqrtss (%rax), %xmm1
|
|
|
|
# BDVER2: [0,0] DeeER. . . . leaq 8(%rsp,%rdi,2), %rax
|
|
# BDVER2-NEXT: [0,1] D==eeeeeeeeeeeeeeER sqrtss (%rax), %xmm1
|
|
|
|
# BROADWELL: [0,0] DeER . . . . leaq 8(%rsp,%rdi,2), %rax
|
|
# BROADWELL-NEXT: [0,1] D=eeeeeeeeeeeeeeeeER sqrtss (%rax), %xmm1
|
|
|
|
# BTVER2: [0,0] DeeER. . . . . . leaq 8(%rsp,%rdi,2), %rax
|
|
# BTVER2-NEXT: [0,1] D==eeeeeeeeeeeeeeeeeeeeeeeeeeER sqrtss (%rax), %xmm1
|
|
|
|
# HASWELL: [0,0] DeER . . . . leaq 8(%rsp,%rdi,2), %rax
|
|
# HASWELL-NEXT: [0,1] D=eeeeeeeeeeeeeeeeER sqrtss (%rax), %xmm1
|
|
|
|
# SKYLAKE: [0,0] DeER . . . . leaq 8(%rsp,%rdi,2), %rax
|
|
# SKYLAKE-NEXT: [0,1] D=eeeeeeeeeeeeeeeeeER sqrtss (%rax), %xmm1
|
|
|
|
# ZNVER1: [0,0] DeER . . . . . . leaq 8(%rsp,%rdi,2), %rax
|
|
# ZNVER1-NEXT: [0,1] D=eeeeeeeeeeeeeeeeeeeeeeeeeeeER sqrtss (%rax), %xmm1
|
|
|
|
# ZNVER2: [0,0] DeER . . . . . . leaq 8(%rsp,%rdi,2), %rax
|
|
# ZNVER2-NEXT: [0,1] D=eeeeeeeeeeeeeeeeeeeeeeeeeeeER sqrtss (%rax), %xmm1
|
|
|
|
# ALL: Average Wait times (based on the timeline view):
|
|
# ALL-NEXT: [0]: Executions
|
|
# ALL-NEXT: [1]: Average time spent waiting in a scheduler's queue
|
|
# ALL-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
|
|
# ALL-NEXT: [3]: Average time elapsed from WB until retire stage
|
|
|
|
# ALL: [0] [1] [2] [3]
|
|
# ALL-NEXT: 0. 1 1.0 1.0 0.0 leaq 8(%rsp,%rdi,2), %rax
|
|
|
|
# BARCELONA-NEXT: 1. 1 2.0 0.0 0.0 sqrtss (%rax), %xmm1
|
|
# BARCELONA-NEXT: 1 1.5 0.5 0.0 <total>
|
|
|
|
# BDVER2-NEXT: 1. 1 3.0 0.0 0.0 sqrtss (%rax), %xmm1
|
|
# BDVER2-NEXT: 1 2.0 0.5 0.0 <total>
|
|
|
|
# BROADWELL-NEXT: 1. 1 2.0 0.0 0.0 sqrtss (%rax), %xmm1
|
|
# BROADWELL-NEXT: 1 1.5 0.5 0.0 <total>
|
|
|
|
# BTVER2-NEXT: 1. 1 3.0 0.0 0.0 sqrtss (%rax), %xmm1
|
|
# BTVER2-NEXT: 1 2.0 0.5 0.0 <total>
|
|
|
|
# HASWELL-NEXT: 1. 1 2.0 0.0 0.0 sqrtss (%rax), %xmm1
|
|
# HASWELL-NEXT: 1 1.5 0.5 0.0 <total>
|
|
|
|
# SKYLAKE-NEXT: 1. 1 2.0 0.0 0.0 sqrtss (%rax), %xmm1
|
|
# SKYLAKE-NEXT: 1 1.5 0.5 0.0 <total>
|
|
|
|
# ZNVER1-NEXT: 1. 1 2.0 0.0 0.0 sqrtss (%rax), %xmm1
|
|
# ZNVER1-NEXT: 1 1.5 0.5 0.0 <total>
|
|
|
|
# ZNVER2-NEXT: 1. 1 2.0 0.0 0.0 sqrtss (%rax), %xmm1
|
|
# ZNVER2-NEXT: 1 1.5 0.5 0.0 <total>
|
|
|
|
# ALL: [1] Code Region - test_sqrtsd
|
|
|
|
# ALL: Timeline view:
|
|
|
|
# BARCELONA-NEXT: 0123456789 0
|
|
# BARCELONA-NEXT: Index 0123456789 0123456789
|
|
|
|
# BDVER2-NEXT: 012345678
|
|
# BDVER2-NEXT: Index 0123456789
|
|
|
|
# BROADWELL-NEXT: 0123456789
|
|
# BROADWELL-NEXT: Index 0123456789 01234
|
|
|
|
# BTVER2-NEXT: 0123456789 0123456
|
|
# BTVER2-NEXT: Index 0123456789 0123456789
|
|
|
|
# HASWELL-NEXT: 0123456789
|
|
# HASWELL-NEXT: Index 0123456789 01234
|
|
|
|
# SKYLAKE-NEXT: 0123456789
|
|
# SKYLAKE-NEXT: Index 0123456789 0123456
|
|
|
|
# ZNVER1-NEXT: 0123456789 0
|
|
# ZNVER1-NEXT: Index 0123456789 0123456789
|
|
|
|
# ZNVER2-NEXT: 0123456789 0
|
|
# ZNVER2-NEXT: Index 0123456789 0123456789
|
|
|
|
# BARCELONA: [0,0] DeER . . . . . . leaq 8(%rsp,%rdi,2), %rax
|
|
# BARCELONA-NEXT: [0,1] D=eeeeeeeeeeeeeeeeeeeeeeeeeeeER sqrtsd (%rax), %xmm1
|
|
|
|
# BDVER2: [0,0] DeeER. . . . leaq 8(%rsp,%rdi,2), %rax
|
|
# BDVER2-NEXT: [0,1] D==eeeeeeeeeeeeeeER sqrtsd (%rax), %xmm1
|
|
|
|
# BROADWELL: [0,0] DeER . . . . . leaq 8(%rsp,%rdi,2), %rax
|
|
# BROADWELL-NEXT: [0,1] D=eeeeeeeeeeeeeeeeeeeeeER sqrtsd (%rax), %xmm1
|
|
|
|
# BTVER2: [0,0] DeeER. . . . . . .. leaq 8(%rsp,%rdi,2), %rax
|
|
# BTVER2-NEXT: [0,1] D==eeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeeER sqrtsd (%rax), %xmm1
|
|
|
|
# HASWELL: [0,0] DeER . . . . . leaq 8(%rsp,%rdi,2), %rax
|
|
# HASWELL-NEXT: [0,1] D=eeeeeeeeeeeeeeeeeeeeeER sqrtsd (%rax), %xmm1
|
|
|
|
# SKYLAKE: [0,0] DeER . . . . .. leaq 8(%rsp,%rdi,2), %rax
|
|
# SKYLAKE-NEXT: [0,1] D=eeeeeeeeeeeeeeeeeeeeeeeER sqrtsd (%rax), %xmm1
|
|
|
|
# ZNVER1: [0,0] DeER . . . . . . leaq 8(%rsp,%rdi,2), %rax
|
|
# ZNVER1-NEXT: [0,1] D=eeeeeeeeeeeeeeeeeeeeeeeeeeeER sqrtsd (%rax), %xmm1
|
|
|
|
# ZNVER2: [0,0] DeER . . . . . . leaq 8(%rsp,%rdi,2), %rax
|
|
# ZNVER2-NEXT: [0,1] D=eeeeeeeeeeeeeeeeeeeeeeeeeeeER sqrtsd (%rax), %xmm1
|
|
|
|
# ALL: Average Wait times (based on the timeline view):
|
|
# ALL-NEXT: [0]: Executions
|
|
# ALL-NEXT: [1]: Average time spent waiting in a scheduler's queue
|
|
# ALL-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
|
|
# ALL-NEXT: [3]: Average time elapsed from WB until retire stage
|
|
|
|
# ALL: [0] [1] [2] [3]
|
|
# ALL-NEXT: 0. 1 1.0 1.0 0.0 leaq 8(%rsp,%rdi,2), %rax
|
|
|
|
# BARCELONA-NEXT: 1. 1 2.0 0.0 0.0 sqrtsd (%rax), %xmm1
|
|
# BARCELONA-NEXT: 1 1.5 0.5 0.0 <total>
|
|
|
|
# BDVER2-NEXT: 1. 1 3.0 0.0 0.0 sqrtsd (%rax), %xmm1
|
|
# BDVER2-NEXT: 1 2.0 0.5 0.0 <total>
|
|
|
|
# BROADWELL-NEXT: 1. 1 2.0 0.0 0.0 sqrtsd (%rax), %xmm1
|
|
# BROADWELL-NEXT: 1 1.5 0.5 0.0 <total>
|
|
|
|
# BTVER2-NEXT: 1. 1 3.0 0.0 0.0 sqrtsd (%rax), %xmm1
|
|
# BTVER2-NEXT: 1 2.0 0.5 0.0 <total>
|
|
|
|
# HASWELL-NEXT: 1. 1 2.0 0.0 0.0 sqrtsd (%rax), %xmm1
|
|
# HASWELL-NEXT: 1 1.5 0.5 0.0 <total>
|
|
|
|
# SKYLAKE-NEXT: 1. 1 2.0 0.0 0.0 sqrtsd (%rax), %xmm1
|
|
# SKYLAKE-NEXT: 1 1.5 0.5 0.0 <total>
|
|
|
|
# ZNVER1-NEXT: 1. 1 2.0 0.0 0.0 sqrtsd (%rax), %xmm1
|
|
# ZNVER1-NEXT: 1 1.5 0.5 0.0 <total>
|
|
|
|
# ZNVER2-NEXT: 1. 1 2.0 0.0 0.0 sqrtsd (%rax), %xmm1
|
|
# ZNVER2-NEXT: 1 1.5 0.5 0.0 <total>
|
|
|
|
# ALL: [2] Code Region - test_rsqrtss
|
|
|
|
# ALL: Timeline view:
|
|
|
|
# BARCELONA-NEXT: 01234
|
|
# BDVER2-NEXT: 01234
|
|
# BROADWELL-NEXT: 0123
|
|
# BTVER2-NEXT: 01
|
|
# HASWELL-NEXT: 0123
|
|
# SKYLAKE-NEXT: 012
|
|
# ZNVER1-NEXT: 012345
|
|
# ZNVER2-NEXT: 012345
|
|
|
|
# ALL-NEXT: Index 0123456789
|
|
|
|
# BARCELONA: [0,0] DeER . . . leaq 8(%rsp,%rdi,2), %rax
|
|
# BARCELONA-NEXT: [0,1] D=eeeeeeeeeeeER rsqrtss (%rax), %xmm1
|
|
|
|
# BDVER2: [0,0] DeeER. . . leaq 8(%rsp,%rdi,2), %rax
|
|
# BDVER2-NEXT: [0,1] D==eeeeeeeeeeER rsqrtss (%rax), %xmm1
|
|
|
|
# BROADWELL: [0,0] DeER . . . leaq 8(%rsp,%rdi,2), %rax
|
|
# BROADWELL-NEXT: [0,1] D=eeeeeeeeeeER rsqrtss (%rax), %xmm1
|
|
|
|
# BTVER2: [0,0] DeeER. .. leaq 8(%rsp,%rdi,2), %rax
|
|
# BTVER2-NEXT: [0,1] D==eeeeeeeER rsqrtss (%rax), %xmm1
|
|
|
|
# HASWELL: [0,0] DeER . . . leaq 8(%rsp,%rdi,2), %rax
|
|
# HASWELL-NEXT: [0,1] D=eeeeeeeeeeER rsqrtss (%rax), %xmm1
|
|
|
|
# SKYLAKE: [0,0] DeER . . . leaq 8(%rsp,%rdi,2), %rax
|
|
# SKYLAKE-NEXT: [0,1] D=eeeeeeeeeER rsqrtss (%rax), %xmm1
|
|
|
|
# ZNVER1: [0,0] DeER . . . leaq 8(%rsp,%rdi,2), %rax
|
|
# ZNVER1-NEXT: [0,1] D=eeeeeeeeeeeeER rsqrtss (%rax), %xmm1
|
|
|
|
# ZNVER2: [0,0] DeER . . . leaq 8(%rsp,%rdi,2), %rax
|
|
# ZNVER2-NEXT: [0,1] D=eeeeeeeeeeeeER rsqrtss (%rax), %xmm1
|
|
|
|
# ALL: Average Wait times (based on the timeline view):
|
|
# ALL-NEXT: [0]: Executions
|
|
# ALL-NEXT: [1]: Average time spent waiting in a scheduler's queue
|
|
# ALL-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
|
|
# ALL-NEXT: [3]: Average time elapsed from WB until retire stage
|
|
|
|
# ALL: [0] [1] [2] [3]
|
|
# ALL-NEXT: 0. 1 1.0 1.0 0.0 leaq 8(%rsp,%rdi,2), %rax
|
|
|
|
# BARCELONA-NEXT: 1. 1 2.0 0.0 0.0 rsqrtss (%rax), %xmm1
|
|
# BARCELONA-NEXT: 1 1.5 0.5 0.0 <total>
|
|
|
|
# BDVER2-NEXT: 1. 1 3.0 0.0 0.0 rsqrtss (%rax), %xmm1
|
|
# BDVER2-NEXT: 1 2.0 0.5 0.0 <total>
|
|
|
|
# BROADWELL-NEXT: 1. 1 2.0 0.0 0.0 rsqrtss (%rax), %xmm1
|
|
# BROADWELL-NEXT: 1 1.5 0.5 0.0 <total>
|
|
|
|
# BTVER2-NEXT: 1. 1 3.0 0.0 0.0 rsqrtss (%rax), %xmm1
|
|
# BTVER2-NEXT: 1 2.0 0.5 0.0 <total>
|
|
|
|
# HASWELL-NEXT: 1. 1 2.0 0.0 0.0 rsqrtss (%rax), %xmm1
|
|
# HASWELL-NEXT: 1 1.5 0.5 0.0 <total>
|
|
|
|
# SKYLAKE-NEXT: 1. 1 2.0 0.0 0.0 rsqrtss (%rax), %xmm1
|
|
# SKYLAKE-NEXT: 1 1.5 0.5 0.0 <total>
|
|
|
|
# ZNVER1-NEXT: 1. 1 2.0 0.0 0.0 rsqrtss (%rax), %xmm1
|
|
# ZNVER1-NEXT: 1 1.5 0.5 0.0 <total>
|
|
|
|
# ZNVER2-NEXT: 1. 1 2.0 0.0 0.0 rsqrtss (%rax), %xmm1
|
|
# ZNVER2-NEXT: 1 1.5 0.5 0.0 <total>
|
|
|
|
# ALL: [3] Code Region - test_rcp
|
|
|
|
# ALL: Timeline view:
|
|
|
|
# BARCELONA-NEXT: 01234
|
|
# BDVER2-NEXT: 01234
|
|
# BROADWELL-NEXT: 0123
|
|
# BTVER2-NEXT: 01
|
|
# HASWELL-NEXT: 0123
|
|
# SKYLAKE-NEXT: 012
|
|
# ZNVER1-NEXT: 012345
|
|
# ZNVER2-NEXT: 012345
|
|
|
|
# ALL-NEXT: Index 0123456789
|
|
|
|
# BARCELONA: [0,0] DeER . . . leaq 8(%rsp,%rdi,2), %rax
|
|
# BARCELONA-NEXT: [0,1] D=eeeeeeeeeeeER rcpss (%rax), %xmm1
|
|
|
|
# BDVER2: [0,0] DeeER. . . leaq 8(%rsp,%rdi,2), %rax
|
|
# BDVER2-NEXT: [0,1] D==eeeeeeeeeeER rcpss (%rax), %xmm1
|
|
|
|
# BROADWELL: [0,0] DeER . . . leaq 8(%rsp,%rdi,2), %rax
|
|
# BROADWELL-NEXT: [0,1] D=eeeeeeeeeeER rcpss (%rax), %xmm1
|
|
|
|
# BTVER2: [0,0] DeeER. .. leaq 8(%rsp,%rdi,2), %rax
|
|
# BTVER2-NEXT: [0,1] D==eeeeeeeER rcpss (%rax), %xmm1
|
|
|
|
# HASWELL: [0,0] DeER . . . leaq 8(%rsp,%rdi,2), %rax
|
|
# HASWELL-NEXT: [0,1] D=eeeeeeeeeeER rcpss (%rax), %xmm1
|
|
|
|
# SKYLAKE: [0,0] DeER . . . leaq 8(%rsp,%rdi,2), %rax
|
|
# SKYLAKE-NEXT: [0,1] D=eeeeeeeeeER rcpss (%rax), %xmm1
|
|
|
|
# ZNVER1: [0,0] DeER . . . leaq 8(%rsp,%rdi,2), %rax
|
|
# ZNVER1-NEXT: [0,1] D=eeeeeeeeeeeeER rcpss (%rax), %xmm1
|
|
|
|
# ZNVER2: [0,0] DeER . . . leaq 8(%rsp,%rdi,2), %rax
|
|
# ZNVER2-NEXT: [0,1] D=eeeeeeeeeeeeER rcpss (%rax), %xmm1
|
|
|
|
# ALL: Average Wait times (based on the timeline view):
|
|
# ALL-NEXT: [0]: Executions
|
|
# ALL-NEXT: [1]: Average time spent waiting in a scheduler's queue
|
|
# ALL-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
|
|
# ALL-NEXT: [3]: Average time elapsed from WB until retire stage
|
|
|
|
# ALL: [0] [1] [2] [3]
|
|
# ALL-NEXT: 0. 1 1.0 1.0 0.0 leaq 8(%rsp,%rdi,2), %rax
|
|
|
|
# BARCELONA-NEXT: 1. 1 2.0 0.0 0.0 rcpss (%rax), %xmm1
|
|
# BARCELONA-NEXT: 1 1.5 0.5 0.0 <total>
|
|
|
|
# BDVER2-NEXT: 1. 1 3.0 0.0 0.0 rcpss (%rax), %xmm1
|
|
# BDVER2-NEXT: 1 2.0 0.5 0.0 <total>
|
|
|
|
# BROADWELL-NEXT: 1. 1 2.0 0.0 0.0 rcpss (%rax), %xmm1
|
|
# BROADWELL-NEXT: 1 1.5 0.5 0.0 <total>
|
|
|
|
# BTVER2-NEXT: 1. 1 3.0 0.0 0.0 rcpss (%rax), %xmm1
|
|
# BTVER2-NEXT: 1 2.0 0.5 0.0 <total>
|
|
|
|
# HASWELL-NEXT: 1. 1 2.0 0.0 0.0 rcpss (%rax), %xmm1
|
|
# HASWELL-NEXT: 1 1.5 0.5 0.0 <total>
|
|
|
|
# SKYLAKE-NEXT: 1. 1 2.0 0.0 0.0 rcpss (%rax), %xmm1
|
|
# SKYLAKE-NEXT: 1 1.5 0.5 0.0 <total>
|
|
|
|
# ZNVER1-NEXT: 1. 1 2.0 0.0 0.0 rcpss (%rax), %xmm1
|
|
# ZNVER1-NEXT: 1 1.5 0.5 0.0 <total>
|
|
|
|
# ZNVER2-NEXT: 1. 1 2.0 0.0 0.0 rcpss (%rax), %xmm1
|
|
# ZNVER2-NEXT: 1 1.5 0.5 0.0 <total>
|