diff options
author | Jatin Bhateja <jatin.bhateja@gmail.com> | 2017-09-08 09:15:36 +0000 |
---|---|---|
committer | Jatin Bhateja <jatin.bhateja@gmail.com> | 2017-09-08 09:15:36 +0000 |
commit | a2513127193b445afcfacd3529f3693fff3c1b30 (patch) | |
tree | 5027143e5b5e0c9385696e434e308ab532d6c61b | |
parent | 5f37541c7396cf4759cf79b8fd8b1a4a64a29c80 (diff) | |
download | bcm5719-llvm-a2513127193b445afcfacd3529f3693fff3c1b30.tar.gz bcm5719-llvm-a2513127193b445afcfacd3529f3693fff3c1b30.zip |
[X86] Adding a test point for PR34149 'Suboptimal codegen for "fast" minnum and maxnum'
Differential Revision: https://reviews.llvm.org/D37614
llvm-svn: 312778
-rw-r--r-- | llvm/test/CodeGen/X86/pr34149.ll | 40 |
1 file changed, 40 insertions, 0 deletions
```diff
diff --git a/llvm/test/CodeGen/X86/pr34149.ll b/llvm/test/CodeGen/X86/pr34149.ll
new file mode 100644
index 00000000000..3875c2fa47d
--- /dev/null
+++ b/llvm/test/CodeGen/X86/pr34149.ll
@@ -0,0 +1,40 @@
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
+
+; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu -mcpu=haswell | FileCheck %s
+
+declare <4 x double> @llvm.minnum.v4f64(<4 x double> %x, <4 x double> %y)
+declare <4 x double> @llvm.maxnum.v4f64(<4 x double> %x, <4 x double> %y)
+
+define <4 x double> @via_minnum(<4 x double> %x, <4 x double> %y) {
+; CHECK-LABEL: via_minnum:
+; CHECK: # BB#0:
+; CHECK-NEXT: vminpd %ymm0, %ymm1, %ymm2
+; CHECK-NEXT: vcmpunordpd %ymm0, %ymm0, %ymm0
+; CHECK-NEXT: vblendvpd %ymm0, %ymm1, %ymm2, %ymm0
+; CHECK-NEXT: retq
+  %z = call fast <4 x double> @llvm.minnum.v4f64(<4 x double> %x, <4 x double> %y) readnone
+  ret <4 x double> %z
+}
+
+define <4 x double> @via_maxnum(<4 x double> %x, <4 x double> %y) {
+; CHECK-LABEL: via_maxnum:
+; CHECK: # BB#0:
+; CHECK-NEXT: vmaxpd %ymm0, %ymm1, %ymm2
+; CHECK-NEXT: vcmpunordpd %ymm0, %ymm0, %ymm0
+; CHECK-NEXT: vblendvpd %ymm0, %ymm1, %ymm2, %ymm0
+; CHECK-NEXT: retq
+  %z = call fast <4 x double> @llvm.maxnum.v4f64(<4 x double> %x, <4 x double> %y) readnone
+  ret <4 x double> %z
+}
+
+define <4 x double> @via_fcmp(<4 x double> %x, <4 x double> %y) {
+; CHECK-LABEL: via_fcmp:
+; CHECK: # BB#0:
+; CHECK-NEXT: vminpd %ymm0, %ymm1, %ymm0
+; CHECK-NEXT: retq
+  %c = fcmp ule <4 x double> %x, %y
+  %z = select <4 x i1> %c, <4 x double> %x, <4 x double> %y
+  ret <4 x double> %z
+}
+
+
```