summaryrefslogtreecommitdiffstats
path: root/llvm/test/CodeGen/XCore/memcpy.ll
diff options
context:
space:
mode:
authorRichard Osborne <richard@xmos.com>2014-02-27 13:39:07 +0000
committerRichard Osborne <richard@xmos.com>2014-02-27 13:39:07 +0000
commita283d24ad9afdf0136595dae3b9fd4c0fc087ec8 (patch)
treef38ad90d1ed9b704129f71c9f405dd2daf1aa178 /llvm/test/CodeGen/XCore/memcpy.ll
parentd6e85018c5f21381db8b8fab9416488c9c970d4d (diff)
downloadbcm5719-llvm-a283d24ad9afdf0136595dae3b9fd4c0fc087ec8.tar.gz
bcm5719-llvm-a283d24ad9afdf0136595dae3b9fd4c0fc087ec8.zip
[XCore] Target optimized library function __memcpy_4()
Summary: If the src, dst and size of a memcpy are known to be 4 byte aligned we can call __memcpy_4() instead of memcpy(). Reviewers: robertlytton Reviewed By: robertlytton CC: llvm-commits Differential Revision: http://llvm-reviews.chandlerc.com/D2871 llvm-svn: 202395
Diffstat (limited to 'llvm/test/CodeGen/XCore/memcpy.ll')
-rw-r--r--llvm/test/CodeGen/XCore/memcpy.ll32
1 files changed, 32 insertions, 0 deletions
diff --git a/llvm/test/CodeGen/XCore/memcpy.ll b/llvm/test/CodeGen/XCore/memcpy.ll
new file mode 100644
index 00000000000..fe424c50cb2
--- /dev/null
+++ b/llvm/test/CodeGen/XCore/memcpy.ll
@@ -0,0 +1,32 @@
+; RUN: llc < %s -march=xcore | FileCheck %s
+
+; Optimize memcpy to __memcpy_4 if src, dst and size are all 4 byte aligned.
+define void @f1(i8* %dst, i8* %src, i32 %n) nounwind {
+; CHECK-LABEL: f1:
+; CHECK: bl __memcpy_4
+entry:
+ %0 = shl i32 %n, 2
+ call void @llvm.memcpy.p0i8.p0i8.i32(i8* %dst, i8* %src, i32 %0, i32 4, i1 false)
+ ret void
+}
+
+; Can't optimize - size is not a multiple of 4.
+define void @f2(i8* %dst, i8* %src, i32 %n) nounwind {
+; CHECK-LABEL: f2:
+; CHECK: bl memcpy
+entry:
+ call void @llvm.memcpy.p0i8.p0i8.i32(i8* %dst, i8* %src, i32 %n, i32 4, i1 false)
+ ret void
+}
+
+; Can't optimize - alignment is not a multiple of 4.
+define void @f3(i8* %dst, i8* %src, i32 %n) nounwind {
+; CHECK-LABEL: f3:
+; CHECK: bl memcpy
+entry:
+ %0 = shl i32 %n, 2
+ call void @llvm.memcpy.p0i8.p0i8.i32(i8* %dst, i8* %src, i32 %0, i32 2, i1 false)
+ ret void
+}
+
+declare void @llvm.memcpy.p0i8.p0i8.i32(i8* nocapture, i8* nocapture, i32, i32, i1) nounwind
OpenPOWER on IntegriCloud