diff options
| author | Simon Pilgrim <llvm-dev@redking.me.uk> | 2016-12-02 17:16:21 +0000 |
|---|---|---|
| committer | Simon Pilgrim <llvm-dev@redking.me.uk> | 2016-12-02 17:16:21 +0000 |
| commit | b2116d9b94be5b99713f20147377d83be79661c6 (patch) | |
| tree | a1647c37fa1c68787e2c9142dbe7b0304d4b55a5 | |
| parent | 43bc269ffa9e0bf0b1850fef642962d6da0f8f8c (diff) | |
| download | bcm5719-llvm-b2116d9b94be5b99713f20147377d83be79661c6.tar.gz bcm5719-llvm-b2116d9b94be5b99713f20147377d83be79661c6.zip | |
[InstCombine] Add vector urem tests
Demonstrate missed opportunity for urem -> and combine for powerof2 or zero non-uniform constant dividers
llvm-svn: 288510
| -rw-r--r-- | llvm/test/Transforms/InstCombine/vector-urem.ll | 29 |
1 files changed, 29 insertions, 0 deletions
diff --git a/llvm/test/Transforms/InstCombine/vector-urem.ll b/llvm/test/Transforms/InstCombine/vector-urem.ll new file mode 100644 index 00000000000..6cecc16069d --- /dev/null +++ b/llvm/test/Transforms/InstCombine/vector-urem.ll @@ -0,0 +1,29 @@ +; NOTE: Assertions have been autogenerated by utils/update_test_checks.py +; RUN: opt < %s -instcombine -S | FileCheck %s + +define <4 x i32> @test_v4i32_splatconst_pow2(<4 x i32> %a0) { +; CHECK-LABEL: @test_v4i32_splatconst_pow2( +; CHECK-NEXT: [[TMP1:%.*]] = and <4 x i32> %a0, <i32 1, i32 1, i32 1, i32 1> +; CHECK-NEXT: ret <4 x i32> [[TMP1]] +; + %1 = urem <4 x i32> %a0, <i32 2, i32 2, i32 2, i32 2> + ret <4 x i32> %1 +} + +define <4 x i32> @test_v4i32_const_pow2(<4 x i32> %a0) { +; CHECK-LABEL: @test_v4i32_const_pow2( +; CHECK-NEXT: [[TMP1:%.*]] = urem <4 x i32> %a0, <i32 1, i32 2, i32 4, i32 8> +; CHECK-NEXT: ret <4 x i32> [[TMP1]] +; + %1 = urem <4 x i32> %a0, <i32 1, i32 2, i32 4, i32 8> + ret <4 x i32> %1 +} + +define <4 x i32> @test_v4i32_const_pow2_or_zero(<4 x i32> %a0) { +; CHECK-LABEL: @test_v4i32_const_pow2_or_zero( +; CHECK-NEXT: [[TMP1:%.*]] = urem <4 x i32> %a0, <i32 1, i32 2, i32 0, i32 8> +; CHECK-NEXT: ret <4 x i32> [[TMP1]] +; + %1 = urem <4 x i32> %a0, <i32 1, i32 2, i32 0, i32 8> + ret <4 x i32> %1 +} |

