diff options
Diffstat (limited to 'llvm/test/tools/llvm-mca/X86/Broadwell/resources-sse1.s')
| -rw-r--r-- | llvm/test/tools/llvm-mca/X86/Broadwell/resources-sse1.s | 464 |
1 files changed, 464 insertions, 0 deletions
diff --git a/llvm/test/tools/llvm-mca/X86/Broadwell/resources-sse1.s b/llvm/test/tools/llvm-mca/X86/Broadwell/resources-sse1.s new file mode 100644 index 00000000000..c4df3ab8a44 --- /dev/null +++ b/llvm/test/tools/llvm-mca/X86/Broadwell/resources-sse1.s @@ -0,0 +1,464 @@ +# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py +# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=broadwell -instruction-tables < %s | FileCheck %s + +addps %xmm0, %xmm2 +addps (%rax), %xmm2 + +addss %xmm0, %xmm2 +addss (%rax), %xmm2 + +andnps %xmm0, %xmm2 +andnps (%rax), %xmm2 + +andps %xmm0, %xmm2 +andps (%rax), %xmm2 + +cmpps $0, %xmm0, %xmm2 +cmpps $0, (%rax), %xmm2 + +cmpss $0, %xmm0, %xmm2 +cmpss $0, (%rax), %xmm2 + +comiss %xmm0, %xmm1 +comiss (%rax), %xmm1 + +cvtpi2ps %mm0, %xmm2 +cvtpi2ps (%rax), %xmm2 + +cvtps2pi %xmm0, %mm2 +cvtps2pi (%rax), %mm2 + +cvtsi2ss %ecx, %xmm2 +cvtsi2ss %rcx, %xmm2 +cvtsi2ss (%rax), %xmm2 +cvtsi2ss (%rax), %xmm2 + +cvtss2si %xmm0, %ecx +cvtss2si %xmm0, %rcx +cvtss2si (%rax), %ecx +cvtss2si (%rax), %rcx + +cvttps2pi %xmm0, %mm2 +cvttps2pi (%rax), %mm2 + +cvttss2si %xmm0, %ecx +cvttss2si %xmm0, %rcx +cvttss2si (%rax), %ecx +cvttss2si (%rax), %rcx + +divps %xmm0, %xmm2 +divps (%rax), %xmm2 + +divss %xmm0, %xmm2 +divss (%rax), %xmm2 + +ldmxcsr (%rax) + +maskmovq %mm0, %mm1 + +maxps %xmm0, %xmm2 +maxps (%rax), %xmm2 + +maxss %xmm0, %xmm2 +maxss (%rax), %xmm2 + +minps %xmm0, %xmm2 +minps (%rax), %xmm2 + +minss %xmm0, %xmm2 +minss (%rax), %xmm2 + +movaps %xmm0, %xmm2 +movaps %xmm0, (%rax) +movaps (%rax), %xmm2 + +movhlps %xmm0, %xmm2 +movlhps %xmm0, %xmm2 + +movhps %xmm0, (%rax) +movhps (%rax), %xmm2 + +movlps %xmm0, (%rax) +movlps (%rax), %xmm2 + +movmskps %xmm0, %rcx + +movntps %xmm0, (%rax) +movntq %mm0, (%rax) + +movss %xmm0, %xmm2 +movss %xmm0, (%rax) +movss (%rax), %xmm2 + +movups %xmm0, %xmm2 +movups %xmm0, (%rax) +movups (%rax), %xmm2 + +mulps %xmm0, %xmm2 +mulps (%rax), %xmm2 + +mulss %xmm0, %xmm2 +mulss (%rax), %xmm2 + +orps %xmm0, %xmm2 +orps (%rax), %xmm2 + +pavgb %mm0, %mm2 +pavgb (%rax), %mm2 + +pavgw %mm0, %mm2 +pavgw (%rax), %mm2 + +pextrw $1, %mm0, %rcx + +pinsrw $1, %rax, %mm2 +pinsrw $1, (%rax), %mm2 + +pmaxsw %mm0, %mm2 +pmaxsw (%rax), %mm2 + +pmaxub %mm0, %mm2 +pmaxub (%rax), %mm2 + +pminsw %mm0, %mm2 +pminsw (%rax), %mm2 + +pminub %mm0, %mm2 +pminub (%rax), %mm2 + +pmovmskb %xmm0, %rcx + +pmulhuw %mm0, %mm2 +pmulhuw (%rax), %mm2 + +prefetcht0 (%rax) +prefetcht1 (%rax) +prefetcht2 (%rax) +prefetchnta (%rax) + +psadbw %mm0, %mm2 +psadbw (%rax), %mm2 + +pshufw $1, %mm0, %mm2 +pshufw $1, (%rax), %mm2 + +rcpps %xmm0, %xmm2 +rcpps (%rax), %xmm2 + +rcpss %xmm0, %xmm2 +rcpss (%rax), %xmm2 + +rsqrtps %xmm0, %xmm2 +rsqrtps (%rax), %xmm2 + +rsqrtss %xmm0, %xmm2 +rsqrtss (%rax), %xmm2 + +sfence + +shufps $1, %xmm0, %xmm2 +shufps $1, (%rax), %xmm2 + +sqrtps %xmm0, %xmm2 +sqrtps (%rax), %xmm2 + +sqrtss %xmm0, %xmm2 +sqrtss (%rax), %xmm2 + +stmxcsr (%rax) + +subps %xmm0, %xmm2 +subps (%rax), %xmm2 + +subss %xmm0, %xmm2 +subss (%rax), %xmm2 + +ucomiss %xmm0, %xmm1 +ucomiss (%rax), %xmm1 + +unpckhps %xmm0, %xmm2 +unpckhps (%rax), %xmm2 + +unpcklps %xmm0, %xmm2 +unpcklps (%rax), %xmm2 + +xorps %xmm0, %xmm2 +xorps (%rax), %xmm2 + +# CHECK: Instruction Info: +# CHECK-NEXT: [1]: #uOps +# CHECK-NEXT: [2]: Latency +# CHECK-NEXT: [3]: RThroughput +# CHECK-NEXT: [4]: MayLoad +# CHECK-NEXT: [5]: MayStore +# CHECK-NEXT: [6]: HasSideEffects + +# CHECK: [1] [2] [3] [4] [5] [6] Instructions: +# CHECK-NEXT: 1 3 1.00 addps %xmm0, %xmm2 +# CHECK-NEXT: 2 8 1.00 * addps (%rax), %xmm2 +# CHECK-NEXT: 1 3 1.00 addss %xmm0, %xmm2 +# CHECK-NEXT: 2 8 1.00 * addss (%rax), %xmm2 +# CHECK-NEXT: 1 1 1.00 andnps %xmm0, %xmm2 +# CHECK-NEXT: 2 6 1.00 * andnps (%rax), %xmm2 +# CHECK-NEXT: 1 1 1.00 andps %xmm0, %xmm2 +# CHECK-NEXT: 2 6 1.00 * andps (%rax), %xmm2 +# CHECK-NEXT: 1 3 1.00 cmpps $0, %xmm0, %xmm2 +# CHECK-NEXT: 2 8 1.00 * cmpps $0, (%rax), %xmm2 +# CHECK-NEXT: 1 3 1.00 cmpss $0, %xmm0, %xmm2 +# CHECK-NEXT: 2 8 1.00 * cmpss $0, (%rax), %xmm2 +# CHECK-NEXT: 1 3 1.00 comiss %xmm0, %xmm1 +# CHECK-NEXT: 2 8 1.00 * comiss (%rax), %xmm1 +# CHECK-NEXT: 1 3 1.00 cvtpi2ps %mm0, %xmm2 +# CHECK-NEXT: 2 8 1.00 * cvtpi2ps (%rax), %xmm2 +# CHECK-NEXT: 2 4 1.00 cvtps2pi %xmm0, %mm2 +# CHECK-NEXT: 2 8 1.00 * cvtps2pi (%rax), %mm2 +# CHECK-NEXT: 2 4 1.00 cvtsi2ssl %ecx, %xmm2 +# CHECK-NEXT: 3 5 2.00 cvtsi2ssq %rcx, %xmm2 +# CHECK-NEXT: 2 9 1.00 * cvtsi2ssl (%rax), %xmm2 +# CHECK-NEXT: 2 9 1.00 * cvtsi2ssl (%rax), %xmm2 +# CHECK-NEXT: 2 4 1.00 cvtss2si %xmm0, %ecx +# CHECK-NEXT: 2 4 1.00 cvtss2si %xmm0, %rcx +# CHECK-NEXT: 3 9 1.00 * cvtss2si (%rax), %ecx +# CHECK-NEXT: 3 9 1.00 * cvtss2si (%rax), %rcx +# CHECK-NEXT: 2 4 1.00 cvttps2pi %xmm0, %mm2 +# CHECK-NEXT: 2 8 1.00 * cvttps2pi (%rax), %mm2 +# CHECK-NEXT: 2 4 1.00 cvttss2si %xmm0, %ecx +# CHECK-NEXT: 2 4 1.00 cvttss2si %xmm0, %rcx +# CHECK-NEXT: 3 9 1.00 * cvttss2si (%rax), %ecx +# CHECK-NEXT: 4 10 1.00 * cvttss2si (%rax), %rcx +# CHECK-NEXT: 1 11 5.00 divps %xmm0, %xmm2 +# CHECK-NEXT: 2 16 5.00 * divps (%rax), %xmm2 +# CHECK-NEXT: 1 11 3.00 divss %xmm0, %xmm2 +# CHECK-NEXT: 2 16 5.00 * divss (%rax), %xmm2 +# CHECK-NEXT: 3 7 1.00 * * * ldmxcsr (%rax) +# CHECK-NEXT: 1 1 1.00 * * * maskmovq %mm0, %mm1 +# CHECK-NEXT: 1 3 1.00 maxps %xmm0, %xmm2 +# CHECK-NEXT: 2 8 1.00 * maxps (%rax), %xmm2 +# CHECK-NEXT: 1 3 1.00 maxss %xmm0, %xmm2 +# CHECK-NEXT: 2 8 1.00 * maxss (%rax), %xmm2 +# CHECK-NEXT: 1 3 1.00 minps %xmm0, %xmm2 +# CHECK-NEXT: 2 8 1.00 * minps (%rax), %xmm2 +# CHECK-NEXT: 1 3 1.00 minss %xmm0, %xmm2 +# CHECK-NEXT: 2 8 1.00 * minss (%rax), %xmm2 +# CHECK-NEXT: 1 1 1.00 movaps %xmm0, %xmm2 +# CHECK-NEXT: 2 1 1.00 * movaps %xmm0, (%rax) +# CHECK-NEXT: 1 5 0.50 * movaps (%rax), %xmm2 +# CHECK-NEXT: 1 1 1.00 movhlps %xmm0, %xmm2 +# CHECK-NEXT: 1 1 1.00 movlhps %xmm0, %xmm2 +# CHECK-NEXT: 2 1 1.00 * movhps %xmm0, (%rax) +# CHECK-NEXT: 2 6 1.00 * movhps (%rax), %xmm2 +# CHECK-NEXT: 2 1 1.00 * movlps %xmm0, (%rax) +# CHECK-NEXT: 2 6 1.00 * movlps (%rax), %xmm2 +# CHECK-NEXT: 1 3 1.00 movmskps %xmm0, %ecx +# CHECK-NEXT: 2 1 1.00 * movntps %xmm0, (%rax) +# CHECK-NEXT: 2 1 1.00 * * * movntq %mm0, (%rax) +# CHECK-NEXT: 1 1 1.00 movss %xmm0, %xmm2 +# CHECK-NEXT: 2 1 1.00 * movss %xmm0, (%rax) +# CHECK-NEXT: 1 5 0.50 * movss (%rax), %xmm2 +# CHECK-NEXT: 1 1 1.00 movups %xmm0, %xmm2 +# CHECK-NEXT: 2 1 1.00 * movups %xmm0, (%rax) +# CHECK-NEXT: 1 5 0.50 * movups (%rax), %xmm2 +# CHECK-NEXT: 1 3 0.50 mulps %xmm0, %xmm2 +# CHECK-NEXT: 2 8 0.50 * mulps (%rax), %xmm2 +# CHECK-NEXT: 1 3 0.50 mulss %xmm0, %xmm2 +# CHECK-NEXT: 2 8 0.50 * mulss (%rax), %xmm2 +# CHECK-NEXT: 1 1 1.00 orps %xmm0, %xmm2 +# CHECK-NEXT: 2 6 1.00 * orps (%rax), %xmm2 +# CHECK-NEXT: 1 1 0.50 pavgb %mm0, %mm2 +# CHECK-NEXT: 2 6 0.50 * pavgb (%rax), %mm2 +# CHECK-NEXT: 1 1 0.50 pavgw %mm0, %mm2 +# CHECK-NEXT: 2 6 0.50 * pavgw (%rax), %mm2 +# CHECK-NEXT: 2 2 1.00 pextrw $1, %mm0, %ecx +# CHECK-NEXT: 2 2 2.00 pinsrw $1, %eax, %mm2 +# CHECK-NEXT: 2 6 1.00 * pinsrw $1, (%rax), %mm2 +# CHECK-NEXT: 1 1 0.50 pmaxsw %mm0, %mm2 +# CHECK-NEXT: 2 6 0.50 * pmaxsw (%rax), %mm2 +# CHECK-NEXT: 1 1 0.50 pmaxub %mm0, %mm2 +# CHECK-NEXT: 2 6 0.50 * pmaxub (%rax), %mm2 +# CHECK-NEXT: 1 1 0.50 pminsw %mm0, %mm2 +# CHECK-NEXT: 2 6 0.50 * pminsw (%rax), %mm2 +# CHECK-NEXT: 1 1 0.50 pminub %mm0, %mm2 +# CHECK-NEXT: 2 6 0.50 * pminub (%rax), %mm2 +# CHECK-NEXT: 1 3 1.00 pmovmskb %xmm0, %ecx +# CHECK-NEXT: 1 5 1.00 pmulhuw %mm0, %mm2 +# CHECK-NEXT: 2 10 1.00 * pmulhuw (%rax), %mm2 +# CHECK-NEXT: 1 5 0.50 * * prefetcht0 (%rax) +# CHECK-NEXT: 1 5 0.50 * * prefetcht1 (%rax) +# CHECK-NEXT: 1 5 0.50 * * prefetcht2 (%rax) +# CHECK-NEXT: 1 5 0.50 * * prefetchnta (%rax) +# CHECK-NEXT: 1 5 1.00 psadbw %mm0, %mm2 +# CHECK-NEXT: 2 10 1.00 * psadbw (%rax), %mm2 +# CHECK-NEXT: 1 1 1.00 pshufw $1, %mm0, %mm2 +# CHECK-NEXT: 2 6 1.00 * pshufw $1, (%rax), %mm2 +# CHECK-NEXT: 1 5 1.00 rcpps %xmm0, %xmm2 +# CHECK-NEXT: 2 10 1.00 * rcpps (%rax), %xmm2 +# CHECK-NEXT: 1 5 1.00 rcpss %xmm0, %xmm2 +# CHECK-NEXT: 2 10 1.00 * rcpss (%rax), %xmm2 +# CHECK-NEXT: 1 5 1.00 rsqrtps %xmm0, %xmm2 +# CHECK-NEXT: 2 10 1.00 * rsqrtps (%rax), %xmm2 +# CHECK-NEXT: 1 5 1.00 rsqrtss %xmm0, %xmm2 +# CHECK-NEXT: 2 10 1.00 * rsqrtss (%rax), %xmm2 +# CHECK-NEXT: 2 2 0.33 * * * sfence +# CHECK-NEXT: 1 1 1.00 shufps $1, %xmm0, %xmm2 +# CHECK-NEXT: 2 6 1.00 * shufps $1, (%rax), %xmm2 +# CHECK-NEXT: 1 11 7.00 sqrtps %xmm0, %xmm2 +# CHECK-NEXT: 2 16 7.00 * sqrtps (%rax), %xmm2 +# CHECK-NEXT: 1 11 4.00 sqrtss %xmm0, %xmm2 +# CHECK-NEXT: 2 16 7.00 * sqrtss (%rax), %xmm2 +# CHECK-NEXT: 3 2 1.00 * * * stmxcsr (%rax) +# CHECK-NEXT: 1 3 1.00 subps %xmm0, %xmm2 +# CHECK-NEXT: 2 8 1.00 * subps (%rax), %xmm2 +# CHECK-NEXT: 1 3 1.00 subss %xmm0, %xmm2 +# CHECK-NEXT: 2 8 1.00 * subss (%rax), %xmm2 +# CHECK-NEXT: 1 3 1.00 ucomiss %xmm0, %xmm1 +# CHECK-NEXT: 2 8 1.00 * ucomiss (%rax), %xmm1 +# CHECK-NEXT: 1 1 1.00 unpckhps %xmm0, %xmm2 +# CHECK-NEXT: 2 6 1.00 * unpckhps (%rax), %xmm2 +# CHECK-NEXT: 1 1 1.00 unpcklps %xmm0, %xmm2 +# CHECK-NEXT: 2 6 1.00 * unpcklps (%rax), %xmm2 +# CHECK-NEXT: 1 1 1.00 xorps %xmm0, %xmm2 +# CHECK-NEXT: 2 6 1.00 * xorps (%rax), %xmm2 + +# CHECK: Resources: +# CHECK-NEXT: [0] - BWDivider +# CHECK-NEXT: [1] - BWFPDivider +# CHECK-NEXT: [2] - BWPort0 +# CHECK-NEXT: [3] - BWPort1 +# CHECK-NEXT: [4] - BWPort2 +# CHECK-NEXT: [5] - BWPort3 +# CHECK-NEXT: [6] - BWPort4 +# CHECK-NEXT: [7] - BWPort5 +# CHECK-NEXT: [8] - BWPort6 +# CHECK-NEXT: [9] - BWPort7 + +# CHECK: Resource pressure per iteration: +# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] +# CHECK-NEXT: - 43.00 34.50 50.50 32.00 32.00 8.00 41.50 0.50 3.00 + +# CHECK: Resource pressure by instruction: +# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] Instructions: +# CHECK-NEXT: - - - 1.00 - - - - - - addps %xmm0, %xmm2 +# CHECK-NEXT: - - - 1.00 0.50 0.50 - - - - addps (%rax), %xmm2 +# CHECK-NEXT: - - - 1.00 - - - - - - addss %xmm0, %xmm2 +# CHECK-NEXT: - - - 1.00 0.50 0.50 - - - - addss (%rax), %xmm2 +# CHECK-NEXT: - - - - - - - 1.00 - - andnps %xmm0, %xmm2 +# CHECK-NEXT: - - - - 0.50 0.50 - 1.00 - - andnps (%rax), %xmm2 +# CHECK-NEXT: - - - - - - - 1.00 - - andps %xmm0, %xmm2 +# CHECK-NEXT: - - - - 0.50 0.50 - 1.00 - - andps (%rax), %xmm2 +# CHECK-NEXT: - - - 1.00 - - - - - - cmpps $0, %xmm0, %xmm2 +# CHECK-NEXT: - - - 1.00 0.50 0.50 - - - - cmpps $0, (%rax), %xmm2 +# CHECK-NEXT: - - - 1.00 - - - - - - cmpss $0, %xmm0, %xmm2 +# CHECK-NEXT: - - - 1.00 0.50 0.50 - - - - cmpss $0, (%rax), %xmm2 +# CHECK-NEXT: - - - 1.00 - - - - - - comiss %xmm0, %xmm1 +# CHECK-NEXT: - - - 1.00 0.50 0.50 - - - - comiss (%rax), %xmm1 +# CHECK-NEXT: - - - 1.00 - - - - - - cvtpi2ps %mm0, %xmm2 +# CHECK-NEXT: - - - 1.00 0.50 0.50 - - - - cvtpi2ps (%rax), %xmm2 +# CHECK-NEXT: - - - 1.00 - - - 1.00 - - cvtps2pi %xmm0, %mm2 +# CHECK-NEXT: - - - 1.00 0.50 0.50 - - - - cvtps2pi (%rax), %mm2 +# CHECK-NEXT: - - - 1.00 - - - 1.00 - - cvtsi2ssl %ecx, %xmm2 +# CHECK-NEXT: - - - 1.00 - - - 2.00 - - cvtsi2ssq %rcx, %xmm2 +# CHECK-NEXT: - - - 1.00 0.50 0.50 - - - - cvtsi2ssl (%rax), %xmm2 +# CHECK-NEXT: - - - 1.00 0.50 0.50 - - - - cvtsi2ssl (%rax), %xmm2 +# CHECK-NEXT: - - 1.00 1.00 - - - - - - cvtss2si %xmm0, %ecx +# CHECK-NEXT: - - 1.00 1.00 - - - - - - cvtss2si %xmm0, %rcx +# CHECK-NEXT: - - 1.00 1.00 0.50 0.50 - - - - cvtss2si (%rax), %ecx +# CHECK-NEXT: - - 1.00 1.00 0.50 0.50 - - - - cvtss2si (%rax), %rcx +# CHECK-NEXT: - - - 1.00 - - - 1.00 - - cvttps2pi %xmm0, %mm2 +# CHECK-NEXT: - - - 1.00 0.50 0.50 - - - - cvttps2pi (%rax), %mm2 +# CHECK-NEXT: - - 1.00 1.00 - - - - - - cvttss2si %xmm0, %ecx +# CHECK-NEXT: - - 1.00 1.00 - - - - - - cvttss2si %xmm0, %rcx +# CHECK-NEXT: - - 1.00 1.00 0.50 0.50 - - - - cvttss2si (%rax), %ecx +# CHECK-NEXT: - - 1.00 1.00 0.50 0.50 - 1.00 - - cvttss2si (%rax), %rcx +# CHECK-NEXT: - 5.00 1.00 - - - - - - - divps %xmm0, %xmm2 +# CHECK-NEXT: - 5.00 1.00 - 0.50 0.50 - - - - divps (%rax), %xmm2 +# CHECK-NEXT: - 3.00 1.00 - - - - - - - divss %xmm0, %xmm2 +# CHECK-NEXT: - 5.00 1.00 - 0.50 0.50 - - - - divss (%rax), %xmm2 +# CHECK-NEXT: - - 1.25 0.25 0.50 0.50 - 0.25 0.25 - ldmxcsr (%rax) +# CHECK-NEXT: - - - - - - - 1.00 - - maskmovq %mm0, %mm1 +# CHECK-NEXT: - - - 1.00 - - - - - - maxps %xmm0, %xmm2 +# CHECK-NEXT: - - - 1.00 0.50 0.50 - - - - maxps (%rax), %xmm2 +# CHECK-NEXT: - - - 1.00 - - - - - - maxss %xmm0, %xmm2 +# CHECK-NEXT: - - - 1.00 0.50 0.50 - - - - maxss (%rax), %xmm2 +# CHECK-NEXT: - - - 1.00 - - - - - - minps %xmm0, %xmm2 +# CHECK-NEXT: - - - 1.00 0.50 0.50 - - - - minps (%rax), %xmm2 +# CHECK-NEXT: - - - 1.00 - - - - - - minss %xmm0, %xmm2 +# CHECK-NEXT: - - - 1.00 0.50 0.50 - - - - minss (%rax), %xmm2 +# CHECK-NEXT: - - - - - - - 1.00 - - movaps %xmm0, %xmm2 +# CHECK-NEXT: - - - - 0.33 0.33 1.00 - - 0.33 movaps %xmm0, (%rax) +# CHECK-NEXT: - - - - 0.50 0.50 - - - - movaps (%rax), %xmm2 +# CHECK-NEXT: - - - - - - - 1.00 - - movhlps %xmm0, %xmm2 +# CHECK-NEXT: - - - - - - - 1.00 - - movlhps %xmm0, %xmm2 +# CHECK-NEXT: - - - - 0.33 0.33 1.00 - - 0.33 movhps %xmm0, (%rax) +# CHECK-NEXT: - - - - 0.50 0.50 - 1.00 - - movhps (%rax), %xmm2 +# CHECK-NEXT: - - - - 0.33 0.33 1.00 - - 0.33 movlps %xmm0, (%rax) +# CHECK-NEXT: - - - - 0.50 0.50 - 1.00 - - movlps (%rax), %xmm2 +# CHECK-NEXT: - - 1.00 - - - - - - - movmskps %xmm0, %ecx +# CHECK-NEXT: - - - - 0.33 0.33 1.00 - - 0.33 movntps %xmm0, (%rax) +# CHECK-NEXT: - - - - 0.33 0.33 1.00 - - 0.33 movntq %mm0, (%rax) +# CHECK-NEXT: - - - - - - - 1.00 - - movss %xmm0, %xmm2 +# CHECK-NEXT: - - - - 0.33 0.33 1.00 - - 0.33 movss %xmm0, (%rax) +# CHECK-NEXT: - - - - 0.50 0.50 - - - - movss (%rax), %xmm2 +# CHECK-NEXT: - - - - - - - 1.00 - - movups %xmm0, %xmm2 +# CHECK-NEXT: - - - - 0.33 0.33 1.00 - - 0.33 movups %xmm0, (%rax) +# CHECK-NEXT: - - - - 0.50 0.50 - - - - movups (%rax), %xmm2 +# CHECK-NEXT: - - 0.50 0.50 - - - - - - mulps %xmm0, %xmm2 +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - mulps (%rax), %xmm2 +# CHECK-NEXT: - - 0.50 0.50 - - - - - - mulss %xmm0, %xmm2 +# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - mulss (%rax), %xmm2 +# CHECK-NEXT: - - - - - - - 1.00 - - orps %xmm0, %xmm2 +# CHECK-NEXT: - - - - 0.50 0.50 - 1.00 - - orps (%rax), %xmm2 +# CHECK-NEXT: - - - 0.50 - - - 0.50 - - pavgb %mm0, %mm2 +# CHECK-NEXT: - - - 0.50 0.50 0.50 - 0.50 - - pavgb (%rax), %mm2 +# CHECK-NEXT: - - - 0.50 - - - 0.50 - - pavgw %mm0, %mm2 +# CHECK-NEXT: - - - 0.50 0.50 0.50 - 0.50 - - pavgw (%rax), %mm2 +# CHECK-NEXT: - - 1.00 - - - - 1.00 - - pextrw $1, %mm0, %ecx +# CHECK-NEXT: - - - - - - - 2.00 - - pinsrw $1, %eax, %mm2 +# CHECK-NEXT: - - - - 0.50 0.50 - 1.00 - - pinsrw $1, (%rax), %mm2 +# CHECK-NEXT: - - - 0.50 - - - 0.50 - - pmaxsw %mm0, %mm2 +# CHECK-NEXT: - - - 0.50 0.50 0.50 - 0.50 - - pmaxsw (%rax), %mm2 +# CHECK-NEXT: - - - 0.50 - - - 0.50 - - pmaxub %mm0, %mm2 +# CHECK-NEXT: - - - 0.50 0.50 0.50 - 0.50 - - pmaxub (%rax), %mm2 +# CHECK-NEXT: - - - 0.50 - - - 0.50 - - pminsw %mm0, %mm2 +# CHECK-NEXT: - - - 0.50 0.50 0.50 - 0.50 - - pminsw (%rax), %mm2 +# CHECK-NEXT: - - - 0.50 - - - 0.50 - - pminub %mm0, %mm2 +# CHECK-NEXT: - - - 0.50 0.50 0.50 - 0.50 - - pminub (%rax), %mm2 +# CHECK-NEXT: - - 1.00 - - - - - - - pmovmskb %xmm0, %ecx +# CHECK-NEXT: - - 1.00 - - - - - - - pmulhuw %mm0, %mm2 +# CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - pmulhuw (%rax), %mm2 +# CHECK-NEXT: - - - - 0.50 0.50 - - - - prefetcht0 (%rax) +# CHECK-NEXT: - - - - 0.50 0.50 - - - - prefetcht1 (%rax) +# CHECK-NEXT: - - - - 0.50 0.50 - - - - prefetcht2 (%rax) +# CHECK-NEXT: - - - - 0.50 0.50 - - - - prefetchnta (%rax) +# CHECK-NEXT: - - 1.00 - - - - - - - psadbw %mm0, %mm2 +# CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - psadbw (%rax), %mm2 +# CHECK-NEXT: - - - - - - - 1.00 - - pshufw $1, %mm0, %mm2 +# CHECK-NEXT: - - - - 0.50 0.50 - 1.00 - - pshufw $1, (%rax), %mm2 +# CHECK-NEXT: - - 1.00 - - - - - - - rcpps %xmm0, %xmm2 +# CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - rcpps (%rax), %xmm2 +# CHECK-NEXT: - - 1.00 - - - - - - - rcpss %xmm0, %xmm2 +# CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - rcpss (%rax), %xmm2 +# CHECK-NEXT: - - 1.00 - - - - - - - rsqrtps %xmm0, %xmm2 +# CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - rsqrtps (%rax), %xmm2 +# CHECK-NEXT: - - 1.00 - - - - - - - rsqrtss %xmm0, %xmm2 +# CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - rsqrtss (%rax), %xmm2 +# CHECK-NEXT: - - 0.25 0.25 0.33 0.33 - 0.25 0.25 0.33 sfence +# CHECK-NEXT: - - - - - - - 1.00 - - shufps $1, %xmm0, %xmm2 +# CHECK-NEXT: - - - - 0.50 0.50 - 1.00 - - shufps $1, (%rax), %xmm2 +# CHECK-NEXT: - 7.00 1.00 - - - - - - - sqrtps %xmm0, %xmm2 +# CHECK-NEXT: - 7.00 1.00 - 0.50 0.50 - - - - sqrtps (%rax), %xmm2 +# CHECK-NEXT: - 4.00 1.00 - - - - - - - sqrtss %xmm0, %xmm2 +# CHECK-NEXT: - 7.00 1.00 - 0.50 0.50 - - - - sqrtss (%rax), %xmm2 +# CHECK-NEXT: - - - - 0.33 0.33 1.00 1.00 - 0.33 stmxcsr (%rax) +# CHECK-NEXT: - - - 1.00 - - - - - - subps %xmm0, %xmm2 +# CHECK-NEXT: - - - 1.00 0.50 0.50 - - - - subps (%rax), %xmm2 +# CHECK-NEXT: - - - 1.00 - - - - - - subss %xmm0, %xmm2 +# CHECK-NEXT: - - - 1.00 0.50 0.50 - - - - subss (%rax), %xmm2 +# CHECK-NEXT: - - - 1.00 - - - - - - ucomiss %xmm0, %xmm1 +# CHECK-NEXT: - - - 1.00 0.50 0.50 - - - - ucomiss (%rax), %xmm1 +# CHECK-NEXT: - - - - - - - 1.00 - - unpckhps %xmm0, %xmm2 +# CHECK-NEXT: - - - - 0.50 0.50 - 1.00 - - unpckhps (%rax), %xmm2 +# CHECK-NEXT: - - - - - - - 1.00 - - unpcklps %xmm0, %xmm2 +# CHECK-NEXT: - - - - 0.50 0.50 - 1.00 - - unpcklps (%rax), %xmm2 +# CHECK-NEXT: - - - - - - - 1.00 - - xorps %xmm0, %xmm2 +# CHECK-NEXT: - - - - 0.50 0.50 - 1.00 - - xorps (%rax), %xmm2 + |

