diff options
author | Matt Arsenault <Matthew.Arsenault@amd.com> | 2016-02-27 09:38:05 +0000 |
---|---|---|
committer | Matt Arsenault <Matthew.Arsenault@amd.com> | 2016-02-27 09:38:05 +0000 |
commit | 360d244d5befb9b8270d93a4aa0e3f0744c796e1 (patch) | |
tree | 637ca80707fe6fa9fdfa780e6d6b3fd83a357727 | |
parent | 5e020b2628522d086bb49bcc80f8f4ac0c978d8b (diff) | |
download | bcm5719-llvm-360d244d5befb9b8270d93a4aa0e3f0744c796e1.tar.gz bcm5719-llvm-360d244d5befb9b8270d93a4aa0e3f0744c796e1.zip |
DAGCombiner: Relax sqrt NaN folding check
This is OK for +0 since compares to +/-0 give the same result.
llvm-svn: 262125
-rw-r--r-- | llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp | 14 | ||||
-rw-r--r-- | llvm/test/CodeGen/AMDGPU/llvm.sqrt.ll | 16 |
2 files changed, 21 insertions, 9 deletions
diff --git a/llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp b/llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp index 1425ff3c1db..9178aefac49 100644 --- a/llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp +++ b/llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp @@ -13814,33 +13814,33 @@ SDValue DAGCombiner::SimplifySelect(SDLoc DL, SDValue N0, bool DAGCombiner::SimplifySelectOps(SDNode *TheSelect, SDValue LHS, SDValue RHS) { - // fold (select (setcc x, -0.0, *lt), NaN, (fsqrt x)) - // The select + setcc is redundant, because fsqrt returns NaN for X < -0. + // fold (select (setcc x, [+-]0.0, *lt), NaN, (fsqrt x)) + // The select + setcc is redundant, because fsqrt returns NaN for X < 0. if (const ConstantFPSDNode *NaN = isConstOrConstSplatFP(LHS)) { if (NaN->isNaN() && RHS.getOpcode() == ISD::FSQRT) { // We have: (select (setcc ?, ?, ?), NaN, (fsqrt ?)) SDValue Sqrt = RHS; ISD::CondCode CC; SDValue CmpLHS; - const ConstantFPSDNode *NegZero = nullptr; + const ConstantFPSDNode *Zero = nullptr; if (TheSelect->getOpcode() == ISD::SELECT_CC) { CC = dyn_cast<CondCodeSDNode>(TheSelect->getOperand(4))->get(); CmpLHS = TheSelect->getOperand(0); - NegZero = isConstOrConstSplatFP(TheSelect->getOperand(1)); + Zero = isConstOrConstSplatFP(TheSelect->getOperand(1)); } else { // SELECT or VSELECT SDValue Cmp = TheSelect->getOperand(0); if (Cmp.getOpcode() == ISD::SETCC) { CC = dyn_cast<CondCodeSDNode>(Cmp.getOperand(2))->get(); CmpLHS = Cmp.getOperand(0); - NegZero = isConstOrConstSplatFP(Cmp.getOperand(1)); + Zero = isConstOrConstSplatFP(Cmp.getOperand(1)); } } - if (NegZero && NegZero->isNegative() && NegZero->isZero() && + if (Zero && Zero->isZero() && Sqrt.getOperand(0) == CmpLHS && (CC == ISD::SETOLT || CC == ISD::SETULT || CC == ISD::SETLT)) { - // We have: (select (setcc x, -0.0, *lt), NaN, (fsqrt x)) + // We have: (select (setcc x, [+-]0.0, *lt), NaN, (fsqrt x)) CombineTo(TheSelect, Sqrt); return true; } diff --git a/llvm/test/CodeGen/AMDGPU/llvm.sqrt.ll b/llvm/test/CodeGen/AMDGPU/llvm.sqrt.ll index c6da047f539..c8ac196e659 100644 --- a/llvm/test/CodeGen/AMDGPU/llvm.sqrt.ll +++ b/llvm/test/CodeGen/AMDGPU/llvm.sqrt.ll @@ -50,10 +50,10 @@ entry: ret void } -; SI-LABEL: {{^}}elim_redun_check: +; SI-LABEL: {{^}}elim_redun_check_neg0: ; SI: v_sqrt_f32_e32 ; SI-NOT: v_cndmask -define void @elim_redun_check(float addrspace(1)* %out, float %in) { +define void @elim_redun_check_neg0(float addrspace(1)* %out, float %in) { entry: %sqrt = call float @llvm.sqrt.f32(float %in) %cmp = fcmp olt float %in, -0.000000e+00 @@ -62,6 +62,18 @@ entry: ret void } +; SI-LABEL: {{^}}elim_redun_check_pos0: +; SI: v_sqrt_f32_e32 +; SI-NOT: v_cndmask +define void @elim_redun_check_pos0(float addrspace(1)* %out, float %in) { +entry: + %sqrt = call float @llvm.sqrt.f32(float %in) + %cmp = fcmp olt float %in, 0.000000e+00 + %res = select i1 %cmp, float 0x7FF8000000000000, float %sqrt + store float %res, float addrspace(1)* %out + ret void +} + ; SI-LABEL: {{^}}elim_redun_check_ult: ; SI: v_sqrt_f32_e32 ; SI-NOT: v_cndmask |