summary | refs | log | tree | commit | diff | stats
path: root/llvm/test
diff options
context:
space:
mode:
author: Roman Tereshin <rtereshin@apple.com> 2018-04-23 22:28:36 +0000
committer: Roman Tereshin <rtereshin@apple.com> 2018-04-23 22:28:36 +0000
commit: 3c6ea7e28c957bdaf03df8a3a4ff00c46e9315f6 (patch)
tree: a28696867a28b68a9a3621e7f49fe96dbb61467f /llvm/test
parent: eb6090941c49ccaf48715f49c89eef07409a7cf2 (diff)
download: bcm5719-llvm-3c6ea7e28c957bdaf03df8a3a4ff00c46e9315f6.tar.gz
download: bcm5719-llvm-3c6ea7e28c957bdaf03df8a3a4ff00c46e9315f6.zip
[GlobalISel][Legalizer] Look thro copies while combining G_UNMERGE's
As we're becoming stricter with respect to not allowing vregs to have both LLTs and register classes assigned mid-GlobalISel pipeline, the number of extra copies grows. Some of these copies separate G_UNMERGE's from their corresponding G_MERGE's, which is becoming a performance concern.

It's worth mentioning that we're already looking through copies while combining legalization artifacts for every kind of artifact but G_UNMERGE.

Reviewed By: aditya_nandakumar
Reviewers: ab, t.p.northover, volkan, javed.absar
Subscribers: rovka, kristof.beyls, llvm-commits
Differential Revision: https://reviews.llvm.org/D45644
llvm-svn: 330660
Diffstat (limited to 'llvm/test')
-rw-r--r-- llvm/test/CodeGen/AArch64/GlobalISel/legalize-combines.mir | 34
-rw-r--r-- llvm/test/CodeGen/AArch64/GlobalISel/legalize-nonpowerof2eltsvec.mir | 9
2 files changed, 37 insertions, 6 deletions
diff --git a/llvm/test/CodeGen/AArch64/GlobalISel/legalize-combines.mir b/llvm/test/CodeGen/AArch64/GlobalISel/legalize-combines.mir
index 9dd68eb4a46..f9b54defeab 100644
--- a/llvm/test/CodeGen/AArch64/GlobalISel/legalize-combines.mir
+++ b/llvm/test/CodeGen/AArch64/GlobalISel/legalize-combines.mir
@@ -8,6 +8,7 @@
define void @test_combines_3() { ret void }
define void @test_combines_4() { ret void }
define void @test_combines_5() { ret void }
+ define void @test_combines_6() { ret void }
...
---
@@ -85,7 +86,38 @@ body: |
%1:_(s32) = G_ADD %0, %0
%2:_(s64) = G_MERGE_VALUES %0, %1
- %3:_(s32), %4:_(s32) = G_UNMERGE_VALUES %2
+ %6:_(s64) = COPY %2
+ %7:_(s64) = COPY %6
+ %8:_(s64) = COPY %7
+ %3:_(s32), %4:_(s32) = G_UNMERGE_VALUES %8
+ %5:_(s32) = G_ADD %3, %4
+ $w0 = COPY %5
+...
+
+---
+name: test_combines_6
+body: |
+ bb.0:
+ liveins: $w0
+
+ ; CHECK-LABEL: name: test_combines_6
+ ; CHECK: [[COPY:%[0-9]+]]:_(s32) = COPY $w0
+ ; CHECK: [[ADD:%[0-9]+]]:_(s32) = G_ADD [[COPY]], [[COPY]]
+ ; CHECK: [[MV:%[0-9]+]]:_(s64) = G_MERGE_VALUES [[COPY]](s32), [[ADD]](s32)
+ ; CHECK: [[COPY1:%[0-9]+]]:_(s64) = COPY [[MV]](s64)
+ ; CHECK: [[COPY2:%[0-9]+]]:_(s64) = COPY [[COPY1]](s64)
+ ; CHECK: [[ADD1:%[0-9]+]]:_(s32) = G_ADD [[COPY]], [[ADD]]
+ ; CHECK: $w0 = COPY [[ADD1]](s32)
+ ; CHECK: $x0 = COPY [[COPY2]](s64)
+ %0:_(s32) = COPY $w0
+
+ %1:_(s32) = G_ADD %0, %0
+ %2:_(s64) = G_MERGE_VALUES %0, %1
+ %6:_(s64) = COPY %2
+ %7:_(s64) = COPY %6
+ %8:_(s64) = COPY %7
+ %3:_(s32), %4:_(s32) = G_UNMERGE_VALUES %8
%5:_(s32) = G_ADD %3, %4
$w0 = COPY %5
+ $x0 = COPY %7
...
diff --git a/llvm/test/CodeGen/AArch64/GlobalISel/legalize-nonpowerof2eltsvec.mir b/llvm/test/CodeGen/AArch64/GlobalISel/legalize-nonpowerof2eltsvec.mir
index 72e53b5f43c..0f8e07c2235 100644
--- a/llvm/test/CodeGen/AArch64/GlobalISel/legalize-nonpowerof2eltsvec.mir
+++ b/llvm/test/CodeGen/AArch64/GlobalISel/legalize-nonpowerof2eltsvec.mir
@@ -23,12 +23,11 @@ body: |
; CHECK-LABEL: name: test_legalize_merge_v3s64
; CHECK: [[COPY:%[0-9]+]]:_(s64) = COPY $x0
; CHECK: [[MV:%[0-9]+]]:_(<3 x s64>) = G_MERGE_VALUES [[COPY]](s64), [[COPY]](s64), [[COPY]](s64)
- ; CHECK: [[COPY1:%[0-9]+]]:_(<3 x s64>) = COPY [[MV]](<3 x s64>)
- ; CHECK: [[UV:%[0-9]+]]:_(s64), [[UV1:%[0-9]+]]:_(s64), [[UV2:%[0-9]+]]:_(s64) = G_UNMERGE_VALUES [[COPY1]](<3 x s64>)
- ; CHECK: $x0 = COPY [[UV]](s64)
+ ; CHECK: $x0 = COPY [[COPY]](s64)
+ ; CHECK: $noreg = PATCHABLE_RET [[MV]](<3 x s64>)
%0(s64) = COPY $x0
%1(<3 x s64>) = G_MERGE_VALUES %0(s64), %0(s64), %0(s64)
- %2(<3 x s64>) = COPY %1(<3 x s64>)
- %3(s64), %4(s64), %5(s64) = G_UNMERGE_VALUES %2(<3 x s64>)
+ %2(s64), %3(s64), %4(s64) = G_UNMERGE_VALUES %1(<3 x s64>)
$x0 = COPY %3(s64)
+ $noreg = PATCHABLE_RET %1(<3 x s64>)
...
OpenPOWER on IntegriCloud