summaryrefslogtreecommitdiffstats
path: root/llvm/test/CodeGen/Hexagon
diff options
context:
space:
mode:
authorKrzysztof Parzyszek <kparzysz@codeaurora.org>2017-08-24 11:59:53 +0000
committerKrzysztof Parzyszek <kparzysz@codeaurora.org>2017-08-24 11:59:53 +0000
commitc09a14eeb251988c8dbdb753d845436faddb82e1 (patch)
tree8f85dc736ab99b6f311ff4720ebc75d439f47919 /llvm/test/CodeGen/Hexagon
parent540a39adf7f0c1190249e6a3c9b5a13bd20d80d9 (diff)
downloadbcm5719-llvm-c09a14eeb251988c8dbdb753d845436faddb82e1.tar.gz
bcm5719-llvm-c09a14eeb251988c8dbdb753d845436faddb82e1.zip
[Hexagon] Generate correct runtime check when recognizing memmove
The check (assuming positive stride) for validity of memmove should be (a) the destination is at a lower address than the source, or (b) the distance between the source and destination is greater than or equal the number of bytes copied. For the second part it is sufficient to assume that the destination is at a higher address, since the opposite case is covered by (a). The distance calculation was previously done by subtracting the pointers in the wrong order. llvm-svn: 311650
Diffstat (limited to 'llvm/test/CodeGen/Hexagon')
-rw-r--r--llvm/test/CodeGen/Hexagon/loop-idiom/memmove-rt-check.ll45
1 files changed, 45 insertions, 0 deletions
diff --git a/llvm/test/CodeGen/Hexagon/loop-idiom/memmove-rt-check.ll b/llvm/test/CodeGen/Hexagon/loop-idiom/memmove-rt-check.ll
new file mode 100644
index 00000000000..ce2c17e4198
--- /dev/null
+++ b/llvm/test/CodeGen/Hexagon/loop-idiom/memmove-rt-check.ll
@@ -0,0 +1,45 @@
+; RUN: opt -hexagon-loop-idiom -S < %s | FileCheck %s
+
+; Make sure that we generate correct runtime checks.
+
+; CHECK: b7.old:
+; CHECK: [[LEN:%[0-9]+]] = shl i32 %len, 3
+; CHECK: [[SRC:%[0-9]+]] = ptrtoint i8* %src to i32
+; CHECK: [[DST:%[0-9]+]] = ptrtoint i8* %dst to i32
+; CHECK: [[ULT:%[0-9]+]] = icmp ult i32 [[DST]], [[SRC]]
+; CHECK: [[SUB:%[0-9]+]] = sub i32 [[DST]], [[SRC]]
+; CHECK: [[SLT:%[0-9]+]] = icmp sle i32 [[LEN]], [[SUB]]
+; CHECK: [[CND:%[0-9]+]] = or i1 [[ULT]], [[SLT]]
+; CHECK: br i1 [[CND]], label %b8.rtli, label %b8.rtli.ph
+
+target datalayout = "e-m:e-p:32:32:32-a:0-n16:32-i64:64:64-i32:32:32-i16:16:16-i1:8:8-f32:32:32-f64:64:64-v32:32:32-v64:64:64-v512:512:512-v1024:1024:1024-v2048:2048:2048"
+target triple = "hexagon"
+
+define void @fred(i8* %dst, i8* %src, i32 %len) #0 {
+b3:
+ %v4 = bitcast i8* %src to i64*
+ %v5 = bitcast i8* %dst to i64*
+ %v6 = icmp slt i32 0, %len
+ br i1 %v6, label %b7, label %b16
+
+b7: ; preds = %b3
+ br label %b8
+
+b8: ; preds = %b13, %b7
+ %v9 = phi i32 [ 0, %b7 ], [ %v14, %b13 ]
+ %v10 = getelementptr inbounds i64, i64* %v4, i32 %v9
+ %v11 = load i64, i64* %v10, align 8
+ %v12 = getelementptr inbounds i64, i64* %v5, i32 %v9
+ store i64 %v11, i64* %v12, align 8
+ br label %b13
+
+b13: ; preds = %b8
+ %v14 = add nsw i32 %v9, 1
+ %v15 = icmp slt i32 %v14, %len
+ br i1 %v15, label %b8, label %b16
+
+b16: ; preds = %b13, %b3
+ ret void
+}
+
+attributes #0 = { noinline nounwind "target-cpu"="hexagonv60" }
OpenPOWER on IntegriCloud