Support generic expansion of ordered vector reduction (PR36732)

Without the fast math flags, the llvm.experimental.vector.reduce.fadd/fmul intrinsic expansions must be expanded in order. This patch scalarizes the reduction, applying the accumulator at the start of the sequence: ((((Acc + Scl[0]) + Scl[1]) + Scl[2]) + ) ... + Scl[NumElts-1] Differential Revision: https://reviews.llvm.org/D45366 llvm-svn: 329585
author: Simon Pilgrim <llvm-dev@redking.me.uk> 2018-04-09 15:44:20 +0000
committer: Simon Pilgrim <llvm-dev@redking.me.uk> 2018-04-09 15:44:20 +0000
commit: 23c2182c2bfcd145b2c33cf5ca831a7348e6adce (patch)
tree: 539213fa47e89fc0f31e62c647aceda93c205cb5 /llvm/lib/CodeGen/ExpandReductions.cpp
parent: bec8a66454882285db4c98311ba430adec2c8dac (diff)
download: bcm5719-llvm-23c2182c2bfcd145b2c33cf5ca831a7348e6adce.tar.gz
bcm5719-llvm-23c2182c2bfcd145b2c33cf5ca831a7348e6adce.zip
1 files changed, 9 insertions, 6 deletions
diff --git a/llvm/lib/CodeGen/ExpandReductions.cpp b/llvm/lib/CodeGen/ExpandReductions.cpp
index abf487a4f19..7552ba8cd85 100644
--- a/llvm/lib/CodeGen/ExpandReductions.cpp
+++ b/llvm/lib/CodeGen/ExpandReductions.cpp
@@ -78,13 +78,15 @@ RecurrenceDescriptor::MinMaxRecurrenceKind getMRK(Intrinsic::ID ID) {
 
 bool expandReductions(Function &F, const TargetTransformInfo *TTI) {
   bool Changed = false;
-  SmallVector<IntrinsicInst*, 4> Worklist;
+  SmallVector<IntrinsicInst *, 4> Worklist;
   for (inst_iterator I = inst_begin(F), E = inst_end(F); I != E; ++I)
     if (auto II = dyn_cast<IntrinsicInst>(&*I))
       Worklist.push_back(II);
 
   for (auto *II : Worklist) {
     IRBuilder<> Builder(II);
+    bool IsOrdered = false;
+    Value *Acc = nullptr;
     Value *Vec = nullptr;
     auto ID = II->getIntrinsicID();
     auto MRK = RecurrenceDescriptor::MRK_Invalid;
@@ -92,11 +94,10 @@ bool expandReductions(Function &F, const TargetTransformInfo *TTI) {
     case Intrinsic::experimental_vector_reduce_fadd:
     case Intrinsic::experimental_vector_reduce_fmul:
       // FMFs must be attached to the call, otherwise it's an ordered reduction
-      // and it can't be handled by generating this shuffle sequence.
-      // TODO: Implement scalarization of ordered reductions here for targets
-      // without native support.
+      // and it can't be handled by generating a shuffle sequence.
       if (!II->getFastMathFlags().isFast())
-        continue;
+        IsOrdered = true;
+      Acc = II->getArgOperand(0);
       Vec = II->getArgOperand(1);
       break;
     case Intrinsic::experimental_vector_reduce_add:
@@ -118,7 +119,9 @@ bool expandReductions(Function &F, const TargetTransformInfo *TTI) {
     }
     if (!TTI->shouldExpandReduction(II))
       continue;
-    auto Rdx = getShuffleReduction(Builder, Vec, getOpcode(ID), MRK);
+    Value *Rdx =
+        IsOrdered ? getOrderedReduction(Builder, Acc, Vec, getOpcode(ID), MRK)
+                  : getShuffleReduction(Builder, Vec, getOpcode(ID), MRK);
     II->replaceAllUsesWith(Rdx);
     II->eraseFromParent();
     Changed = true;
author	Simon Pilgrim <llvm-dev@redking.me.uk>	2018-04-09 15:44:20 +0000
committer	Simon Pilgrim <llvm-dev@redking.me.uk>	2018-04-09 15:44:20 +0000
commit	23c2182c2bfcd145b2c33cf5ca831a7348e6adce (patch)
tree	539213fa47e89fc0f31e62c647aceda93c205cb5 /llvm/lib/CodeGen/ExpandReductions.cpp
parent	bec8a66454882285db4c98311ba430adec2c8dac (diff)
download	bcm5719-llvm-23c2182c2bfcd145b2c33cf5ca831a7348e6adce.tar.gz bcm5719-llvm-23c2182c2bfcd145b2c33cf5ca831a7348e6adce.zip