[DAGCombiner] Preserve the exact bit when simplifying SRA to SRL.

Allows more aggressive folding of ashr/shl pairs.

llvm-svn: 240788

commit: c2ae76737753a55f18a290f1e64f8bca60423449 [log] [tgz]
author: Benjamin Kramer <benny.kra@googlemail.com> Fri Jun 26 14:51:49 2015 +0000
committer: Benjamin Kramer <benny.kra@googlemail.com> Fri Jun 26 14:51:49 2015 +0000
tree: fdcb984129d8ef3720dfbdc54a2793c5510fe65a
parent: 07e70b4fa4d6e2504fcd3d6c0b0415e378b937eb [diff]
diff --git a/llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp b/llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp
index c70c3a27..b40025b 100644
--- a/llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp
+++ b/llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp

@@ -771,10 +771,13 @@
 
       // If the input sign bit is known to be zero, or if none of the top bits
       // are demanded, turn this into an unsigned shift right.
-      if (KnownZero.intersects(SignBit) || (HighBits & ~NewMask) == HighBits)
-        return TLO.CombineTo(Op, TLO.DAG.getNode(ISD::SRL, dl, VT,
-                                                 Op.getOperand(0),
-                                                 Op.getOperand(1)));
+      if (KnownZero.intersects(SignBit) || (HighBits & ~NewMask) == HighBits) {
+        SDNodeFlags Flags;
+        Flags.setExact(cast<BinaryWithFlagsSDNode>(Op)->Flags.hasExact());
+        return TLO.CombineTo(Op,
+                             TLO.DAG.getNode(ISD::SRL, dl, VT, Op.getOperand(0),
+                                             Op.getOperand(1), &Flags));
+      }
 
       int Log2 = NewMask.exactLogBase2();
       if (Log2 >= 0) {

diff --git a/llvm/test/CodeGen/X86/shift-combine.ll b/llvm/test/CodeGen/X86/shift-combine.ll
index 7fb19a6..4330104 100644
--- a/llvm/test/CodeGen/X86/shift-combine.ll
+++ b/llvm/test/CodeGen/X86/shift-combine.ll

@@ -37,6 +37,16 @@
   ret i32* %gep
 }
 
+define i32* @test_exact3(i32 %a, i32 %b, i32* %x)  {
+; CHECK-LABEL: test_exact3:
+; CHECK-NOT: sarl
+
+  %sub = sub i32 %b, %a
+  %shr = ashr exact i32 %sub, 2
+  %gep = getelementptr inbounds i32, i32* %x, i32 %shr
+  ret i32* %gep
+}
+
 define i32* @test_exact4(i32 %a, i32 %b, i32* %x)  {
 ; CHECK-LABEL: test_exact4:
 ; CHECK: shrl %
commit	c2ae76737753a55f18a290f1e64f8bca60423449	[log] [tgz]
author	Benjamin Kramer <benny.kra@googlemail.com>	Fri Jun 26 14:51:49 2015 +0000
committer	Benjamin Kramer <benny.kra@googlemail.com>	Fri Jun 26 14:51:49 2015 +0000
tree	fdcb984129d8ef3720dfbdc54a2793c5510fe65a
parent	07e70b4fa4d6e2504fcd3d6c0b0415e378b937eb [diff]