summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorEvgeniy Stepanov <eugeni.stepanov@gmail.com>2018-01-31 22:55:19 +0000
committerEvgeniy Stepanov <eugeni.stepanov@gmail.com>2018-01-31 22:55:19 +0000
commit7746899f48031664084c29389e62399569883c71 (patch)
treef922e6b865343e6534824dfc9155d03af83f16df
parent06dfbb50d70eea4ae38d655842626a0b9b224d5c (diff)
downloadbcm5719-llvm-7746899f48031664084c29389e62399569883c71.tar.gz
bcm5719-llvm-7746899f48031664084c29389e62399569883c71.zip
Revert "[ARM] Lower lower saturate to 0 and lower saturate to -1 using bit-operations"
Miscompiles code. Testcase pending. This reverts commit r323869. llvm-svn: 323929
-rw-r--r--llvm/lib/Target/ARM/ARMISelLowering.cpp20
-rw-r--r--llvm/test/CodeGen/ARM/atomic-op.ll5
-rw-r--r--llvm/test/CodeGen/ARM/sat-to-bitop.ll132
-rw-r--r--llvm/test/CodeGen/ARM/select.ll2
-rw-r--r--llvm/test/CodeGen/Thumb/select.ll4
5 files changed, 5 insertions, 158 deletions
diff --git a/llvm/lib/Target/ARM/ARMISelLowering.cpp b/llvm/lib/Target/ARM/ARMISelLowering.cpp
index 90a228f19ab..cddd957417e 100644
--- a/llvm/lib/Target/ARM/ARMISelLowering.cpp
+++ b/llvm/lib/Target/ARM/ARMISelLowering.cpp
@@ -4407,26 +4407,6 @@ SDValue ARMTargetLowering::LowerSELECT_CC(SDValue Op, SelectionDAG &DAG) const {
SDValue TrueVal = Op.getOperand(2);
SDValue FalseVal = Op.getOperand(3);
- // Try to convert expressions of the form x < k ? k : x (and similar forms) into
- // more efficient bit operations, which is possible when k is 0 or -1
- // On ARM and Thumb-2 which has flexible operand 2 this will result in single
- // instructions. On Thumb the shift and the bit operation will be two instructions.
- SDValue *K = isa<ConstantSDNode>(LHS) ? &LHS : isa<ConstantSDNode>(RHS)
- ? &RHS
- : nullptr;
- SDValue KTmp = isa<ConstantSDNode>(TrueVal) ? TrueVal : FalseVal;
- SDValue V = (KTmp == TrueVal) ? FalseVal : TrueVal;
-
- if (K && isLowerSaturate(LHS, RHS, TrueVal, FalseVal, CC, *K) && *K == KTmp) {
- SDValue ShiftV = DAG.getNode(ISD::SRA, dl, VT, V, DAG.getConstant(31, dl, VT));
- if (isNullConstant(*K)) {
- SDValue NotShiftV = DAG.getNode(ISD::XOR, dl, VT, ShiftV, DAG.getConstant(-1, dl, VT));
- return DAG.getNode(ISD::AND, dl, VT, V, NotShiftV);
- } else if (isAllOnesConstant(*K)) {
- return DAG.getNode(ISD::OR, dl, VT, V, ShiftV);
- }
- }
-
if (Subtarget->isFPOnlySP() && LHS.getValueType() == MVT::f64) {
DAG.getTargetLoweringInfo().softenSetCCOperands(DAG, MVT::f64, LHS, RHS, CC,
dl);
diff --git a/llvm/test/CodeGen/ARM/atomic-op.ll b/llvm/test/CodeGen/ARM/atomic-op.ll
index 77c022f03e0..644a7fbf8d9 100644
--- a/llvm/test/CodeGen/ARM/atomic-op.ll
+++ b/llvm/test/CodeGen/ARM/atomic-op.ll
@@ -129,12 +129,11 @@ entry:
store i32 %9, i32* %old
call void asm sideeffect "", "~{memory},~{dirflag},~{fpsr},~{flags}"()
; CHECK: ldrex
- ; CHECK: bic
- ; CHECK-NOT: cmp
+ ; CHECK: cmp
; CHECK: strex
; CHECK-T1: bl ___sync_fetch_and_max_4
; CHECK-T1-M0: bl ___sync_fetch_and_max_4
- ; CHECK-BAREMETAL: bic
+ ; CHECK-BAREMETAL: cmp
; CHECK-BAREMETAL-NOT: __sync
%10 = atomicrmw max i32* %val2, i32 0 monotonic
store i32 %10, i32* %old
diff --git a/llvm/test/CodeGen/ARM/sat-to-bitop.ll b/llvm/test/CodeGen/ARM/sat-to-bitop.ll
deleted file mode 100644
index 35e2300ba87..00000000000
--- a/llvm/test/CodeGen/ARM/sat-to-bitop.ll
+++ /dev/null
@@ -1,132 +0,0 @@
-; RUN: llc -mtriple=arm %s -o - | FileCheck %s --check-prefix=CHECK --check-prefix=CHECK-ARM --check-prefix=CHECK-CMP
-; RUN: llc -mtriple=thumb-eabi %s -o - | FileCheck %s --check-prefix=CHECK --check-prefix=CHECK-T --check-prefix=CHECK-CMP
-; RUN: llc -mtriple=thumb-eabi -mcpu=arm1156t2-s -mattr=+thumb2 %s -o - | FileCheck %s --check-prefix=CHECK --check-prefix=CHECK-T2 --check-prefix=CHECK-CMP
-
-
-; Check for clipping against 0 that should result in bic
-;
-; Base tests with different bit widths
-;
-
-; x < 0 ? 0 : x
-; 32-bit base test
-define i32 @sat0_base_32bit(i32 %x) #0 {
-; CHECK-LABEL: sat0_base_32bit:
-; CHECK-CMP-NOT: cmp
-; CHECK-ARM: bic {{r[0-9]}}, [[INPUT:r[0-9]]], [[INPUT]], asr #31
-; CHECK-T2: bic.w {{r[0-9]}}, [[INPUT:r[0-9]]], [[INPUT]], asr #31
-; CHECK-T: asrs [[IM:r[0-9]]], {{r[0-9]}}, #31
-; CHECK-T-NEXT: bics {{r[0-9]}}, [[IM]]
-entry:
- %cmpLow = icmp slt i32 %x, 0
- %saturateLow = select i1 %cmpLow, i32 0, i32 %x
- ret i32 %saturateLow
-}
-
-; x < 0 ? 0 : x
-; 16-bit base test
-define i16 @sat0_base_16bit(i16 %x) #0 {
-; CHECK-LABEL: sat0_base_16bit:
-; CHECK-CMP-NOT: cmp
-; CHECK-ARM: bic {{r[0-9]}}, [[INPUT:r[0-9]]], [[INPUT]], asr #31
-; CHECK-T2: bic.w {{r[0-9]}}, [[INPUT:r[0-9]]], [[INPUT]], asr #31
-; CHECK-T: asrs [[IM:r[0-9]]], {{r[0-9]}}, #31
-; CHECK-T-NEXT: bics {{r[0-9]}}, [[IM]]
-entry:
- %cmpLow = icmp slt i16 %x, 0
- %saturateLow = select i1 %cmpLow, i16 0, i16 %x
- ret i16 %saturateLow
-}
-
-; x < 0 ? 0 : x
-; 8-bit base test
-define i8 @sat0_base_8bit(i8 %x) #0 {
-; CHECK-LABEL: sat0_base_8bit:
-; CHECK-CMP-NOT: cmp
-; CHECK-ARM: bic {{r[0-9]}}, [[INPUT:r[0-9]]], [[INPUT]], asr #31
-; CHECK-T2: bic.w {{r[0-9]}}, [[INPUT:r[0-9]]], [[INPUT]], asr #31
-; CHECK-T: asrs [[IM:r[0-9]]], {{r[0-9]}}, #31
-; CHECK-T-NEXT: bics {{r[0-9]}}, [[IM]]
-entry:
- %cmpLow = icmp slt i8 %x, 0
- %saturateLow = select i1 %cmpLow, i8 0, i8 %x
- ret i8 %saturateLow
-}
-
-; Test where the conditional is formed in a different way
-
-; x > 0 ? x : 0
-define i32 @sat0_lower_1(i32 %x) #0 {
-; CHECK-LABEL: sat0_lower_1:
-; CHECK-CMP-NOT: cmp
-; CHECK-ARM: bic {{r[0-9]}}, [[INPUT:r[0-9]]], [[INPUT]], asr #31
-; CHECK-T2: bic.w {{r[0-9]}}, [[INPUT:r[0-9]]], [[INPUT]], asr #31
-; CHECK-T: asrs [[IM:r[0-9]]], {{r[0-9]}}, #31
-; CHECK-T-NEXT: bics {{r[0-9]}}, [[IM]]
-entry:
- %cmpGt = icmp sgt i32 %x, 0
- %saturateLow = select i1 %cmpGt, i32 %x, i32 0
- ret i32 %saturateLow
-}
-
-
-; Check for clipping against -1 that should result in orr
-;
-; Base tests with different bit widths
-;
-
-; x < -1 ? -1 : x
-; 32-bit base test
-define i32 @sat1_base_32bit(i32 %x) #0 {
-; CHECK-LABEL: sat1_base_32bit:
-; CHECK-CMP-NOT: cmp
-; CHECK-ARM: orr {{r[0-9]}}, [[INPUT:r[0-9]]], [[INPUT]], asr #31
-; CHECK-T2: orr.w {{r[0-9]}}, [[INPUT:r[0-9]]], [[INPUT]], asr #31
-; CHECK-T: asrs [[IM:r[0-9]]], {{r[0-9]}}, #31
-; CHECK-T-NEXT: orrs {{r[0-9]}}, [[IM]]
-entry:
- %cmpLow = icmp slt i32 %x, -1
- %saturateLow = select i1 %cmpLow, i32 -1, i32 %x
- ret i32 %saturateLow
-}
-
-; x < -1 ? -1 : x
-; 16-bit base test
-; Note this currently fails due to combination of constant hoisting and bitcasts
-define i16 @sat1_base_16bit(i16 %x) #0 {
-; CHECK-LABEL: sat1_base_16bit:
-entry:
- %cmpLow = icmp slt i16 %x, -1
- %saturateLow = select i1 %cmpLow, i16 -1, i16 %x
- ret i16 %saturateLow
-}
-
-; x < -1 ? -1 : x
-; 8-bit base test
-define i8 @sat1_base_8bit(i8 %x) #0 {
-; CHECK-LABEL: sat1_base_8bit:
-; CHECK-ARM: orr {{r[0-9]}}, [[INPUT:r[0-9]]], [[INPUT]], asr #31
-; CHECK-ARM-NOT: cmp
-; CHECK-T2: orr.w {{r[0-9]}}, [[INPUT:r[0-9]]], [[INPUT]], asr #31
-; CHECK-T2-NOT: cmp
-entry:
- %cmpLow = icmp slt i8 %x, -1
- %saturateLow = select i1 %cmpLow, i8 -1, i8 %x
- ret i8 %saturateLow
-}
-
-; Test where the conditional is formed in a different way
-
-; x > -1 ? x : -1
-define i32 @sat1_lower_1(i32 %x) #0 {
-; CHECK-LABEL: sat1_lower_1:
-; CHECK-ARM: orr {{r[0-9]}}, [[INPUT:r[0-9]]], [[INPUT]], asr #31
-; CHECK-T2: orr.w {{r[0-9]}}, [[INPUT:r[0-9]]], [[INPUT]], asr #31
-; CHECK-T: asrs [[IM:r[0-9]]], {{r[0-9]}}, #31
-; CHECK-T-NEXT: orrs {{r[0-9]}}, [[IM]]
-; CHECK-CMP-NOT: cmp
-entry:
- %cmpGt = icmp sgt i32 %x, -1
- %saturateLow = select i1 %cmpGt, i32 %x, i32 -1
- ret i32 %saturateLow
-}
diff --git a/llvm/test/CodeGen/ARM/select.ll b/llvm/test/CodeGen/ARM/select.ll
index 7b1855e432b..e9394a72073 100644
--- a/llvm/test/CodeGen/ARM/select.ll
+++ b/llvm/test/CodeGen/ARM/select.ll
@@ -62,7 +62,7 @@ entry:
define double @f7(double %a, double %b) {
;CHECK-LABEL: f7:
-;CHECK: bic
+;CHECK: movlt
;CHECK: movge
;CHECK-VFP-LABEL: f7:
;CHECK-VFP: vmovmi
diff --git a/llvm/test/CodeGen/Thumb/select.ll b/llvm/test/CodeGen/Thumb/select.ll
index 91d0453304c..75dbeab5ad0 100644
--- a/llvm/test/CodeGen/Thumb/select.ll
+++ b/llvm/test/CodeGen/Thumb/select.ll
@@ -73,8 +73,8 @@ define double @f7(double %a, double %b) {
ret double %tmp1
}
; CHECK-LABEL: f7:
-; CHECK: bge
-; CHECK: bic
+; CHECK: blt
+; CHECK: {{blt|bge}}
; CHECK: __ltdf2
; CHECK-EABI-LABEL: f7:
; CHECK-EABI: __aeabi_dcmplt
OpenPOWER on IntegriCloud