diff options
| author | Sameer AbuAsal <sabuasal@codeaurora.org> | 2018-03-08 23:41:40 +0000 |
|---|---|---|
| committer | Sameer AbuAsal <sabuasal@codeaurora.org> | 2018-03-08 23:41:40 +0000 |
| commit | 986865c090a9cef1b41a3a9cdddf9576a5610dd1 (patch) | |
| tree | a283fec798d19fed2903993fff5f921af009336d /llvm/test | |
| parent | 69fce12c38ff605b2c65747746e4c635a9fac900 (diff) | |
| download | bcm5719-llvm-986865c090a9cef1b41a3a9cdddf9576a5610dd1.tar.gz bcm5719-llvm-986865c090a9cef1b41a3a9cdddf9576a5610dd1.zip | |
Propagate flags to SDValue in SplitVecOp_VECREDUCE
This patch is a fix for PR36642.
While legalizing long vector types, make sure the smaller types get the
flags of the wider type.
bugzilla link: https://bugs.llvm.org/show_bug.cgi?id=36642
Change-Id: I0c2829639f094c862c10a6b51b342d4c2563e1fa
llvm-svn: 327079
Diffstat (limited to 'llvm/test')
| -rw-r--r-- | llvm/test/CodeGen/AArch64/vecreduce-propagate-sd-flags.ll | 31 |
1 files changed, 31 insertions, 0 deletions
diff --git a/llvm/test/CodeGen/AArch64/vecreduce-propagate-sd-flags.ll b/llvm/test/CodeGen/AArch64/vecreduce-propagate-sd-flags.ll new file mode 100644 index 00000000000..32adf513e47 --- /dev/null +++ b/llvm/test/CodeGen/AArch64/vecreduce-propagate-sd-flags.ll @@ -0,0 +1,31 @@ +; REQUIRES: arm-registered-target +; REQUIRES: asserts +; RUN: llc %s -debug-only=legalize-types 2>&1 | FileCheck %s + +; This test check that when v4f64 gets broken down to two v2f64 it maintains +; the "nnan" flags. + +; CHECK: Legalizing node: [[VFOUR:t.*]]: v4f64 = BUILD_VECTOR +; CHECK-NEXT: Analyzing result type: v4f64 +; CHECK-NEXT: Split node result: [[VFOUR]]: v4f64 = BUILD_VECTOR + +; CHECK: Legalizing node: [[VTWO:t.*]]: v2f64 = BUILD_VECTOR +; CHECK: Legally typed node: [[VTWO]]: v2f64 = BUILD_VECTOR +; CHECK: Legalizing node: t26: v2f64 = fmaxnum nnan [[VTWO]], [[VTWO]] + +target datalayout = "e-m:e-i8:8:32-i16:16:32-i64:64-i128:128-n32:64-S128" +target triple = "aarch64--linux-gnu" + + +; Function Attrs: norecurse nounwind +define fastcc double @test() unnamed_addr #1 { +entry: + %0 = insertelement <4 x double> undef, double 1.0, i32 0 + %1 = insertelement <4 x double> %0, double 1.0, i32 1 + %2 = insertelement <4 x double> %1, double 1.0, i32 2 + %3 = insertelement <4 x double> %2, double 1.0, i32 3 + %4 = call nnan double @llvm.experimental.vector.reduce.fmax.f64.v4f64(<4 x double> %3) + ret double %4 +} + +declare double @llvm.experimental.vector.reduce.fmax.f64.v4f64(<4 x double>) |

