summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
-rw-r--r--polly/lib/CodeGeneration.cpp21
-rw-r--r--polly/test/CodeGen/simple_vec_cast.ll33
2 files changed, 53 insertions, 1 deletions
diff --git a/polly/lib/CodeGeneration.cpp b/polly/lib/CodeGeneration.cpp
index cb8a01f4ed4..10e96baa20b 100644
--- a/polly/lib/CodeGeneration.cpp
+++ b/polly/lib/CodeGeneration.cpp
@@ -409,6 +409,21 @@ public:
vectorMap[load] = newLoad;
}
+ void copyUnaryInst(const UnaryInstruction *Inst, ValueMapT &BBMap,
+ ValueMapT &VectorMap, int VectorDimension,
+ int VectorWidth) {
+ Value *NewOperand = getOperand(Inst->getOperand(0), BBMap, &VectorMap);
+ NewOperand = makeVectorOperand(NewOperand, VectorWidth);
+
+ if (const CastInst *Cast = dyn_cast<CastInst>(Inst)) {
+ VectorType *DestType = VectorType::get(Inst->getType(), VectorWidth);
+ VectorMap[Inst] = Builder.CreateCast(Cast->getOpcode(), NewOperand,
+ DestType);
+ } else
+ llvm_unreachable("Can not generate vector code for instruction");
+ return;
+ }
+
void copyBinInst(const BinaryOperator *Inst, ValueMapT &BBMap,
ValueMapT &vectorMap, int vectorDimension, int vectorWidth) {
Value *opZero = Inst->getOperand(0);
@@ -529,7 +544,11 @@ public:
}
if (isVectorBlock() && hasVectorOperands(Inst, vectorMap)) {
- if (const BinaryOperator *binaryInst = dyn_cast<BinaryOperator>(Inst))
+ if (const UnaryInstruction *UnaryInst = dyn_cast<UnaryInstruction>(Inst))
+ copyUnaryInst(UnaryInst, BBMap, vectorMap, vectorDimension,
+ vectorWidth);
+ else if
+ (const BinaryOperator *binaryInst = dyn_cast<BinaryOperator>(Inst))
copyBinInst(binaryInst, BBMap, vectorMap, vectorDimension, vectorWidth);
else if (const StoreInst *store = dyn_cast<StoreInst>(Inst))
copyVectorStore(store, BBMap, vectorMap, scalarMaps, vectorDimension,
diff --git a/polly/test/CodeGen/simple_vec_cast.ll b/polly/test/CodeGen/simple_vec_cast.ll
new file mode 100644
index 00000000000..949ecd43187
--- /dev/null
+++ b/polly/test/CodeGen/simple_vec_cast.ll
@@ -0,0 +1,33 @@
+; RUN: opt %loadPolly -basicaa -polly-codegen -enable-polly-vector -dce -S %s | FileCheck %s
+target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64"
+target triple = "x86_64-unknown-linux-gnu"
+
+@A = common global [1024 x float] zeroinitializer, align 16
+@B = common global [1024 x double] zeroinitializer, align 16
+
+define void @simple_vec_const() nounwind {
+bb:
+ br label %bb1
+
+bb1: ; preds = %bb3, %bb
+ %indvar = phi i64 [ %indvar.next, %bb3 ], [ 0, %bb ]
+ %scevgep = getelementptr [1024 x double]* @B, i64 0, i64 %indvar
+ %exitcond = icmp ne i64 %indvar, 4
+ br i1 %exitcond, label %bb2, label %bb4
+
+bb2: ; preds = %bb1
+ %tmp = load float* getelementptr inbounds ([1024 x float]* @A, i64 0, i64 0), align 16
+ %tmp2 = fpext float %tmp to double
+ store double %tmp2, double* %scevgep, align 4
+ br label %bb3
+
+bb3: ; preds = %bb2
+ %indvar.next = add i64 %indvar, 1
+ br label %bb1
+
+bb4: ; preds = %bb1
+ ret void
+}
+
+; CHECK: fpext <4 x float> %tmp_p_splat to <4 x double>
+
OpenPOWER on IntegriCloud