[InstCombine] fold sub of low-bit masked value from offset of same value

author Sanjay Patel <spatel@rotateright.com>

Fri, 13 Nov 2020 00:59:56 +0000 (19:59 -0500)

committer Sanjay Patel <spatel@rotateright.com>

Fri, 13 Nov 2020 01:10:28 +0000 (20:10 -0500)
author Sanjay Patel <spatel@rotateright.com>
Fri, 13 Nov 2020 00:59:56 +0000 (19:59 -0500)
committer Sanjay Patel <spatel@rotateright.com>
Fri, 13 Nov 2020 01:10:28 +0000 (20:10 -0500)
diff --git a/llvm/lib/Transforms/InstCombine/InstCombineAddSub.cpp b/llvm/lib/Transforms/InstCombine/InstCombineAddSub.cpp

index e78df30..abeddf4 100644 (file)
--- a/llvm/lib/Transforms/InstCombine/InstCombineAddSub.cpp
+++ b/llvm/lib/Transforms/InstCombine/InstCombineAddSub.cpp
@@ -2051,6 +2051,20 @@ Instruction *InstCombinerImpl::visitSub(BinaryOperator &I) {
      return SelectInst::Create(Cmp, Neg, A);
    }
  
+  // If we are subtracting a low-bit masked subset of some value from an add
+  // of that same value with no low bits changed, that is clearing some low bits
+  // of the sum:
+  // sub (X + AddC), (X & AndC) --> and (X + AddC), ~AndC
+  const APInt *AddC, *AndC;
+  if (match(Op0, m_Add(m_Value(X), m_APInt(AddC))) &&
+      match(Op1, m_And(m_Specific(X), m_APInt(AndC)))) {
+    unsigned BitWidth = Ty->getScalarSizeInBits();
+    unsigned Cttz = AddC->countTrailingZeros();
+    APInt HighMask(APInt::getHighBitsSet(BitWidth, BitWidth - Cttz));
+    if ((HighMask & *AndC).isNullValue())
+      return BinaryOperator::CreateAnd(Op0, ConstantInt::get(Ty, ~(*AndC)));
+  }
+
    if (Instruction *V =
            canonicalizeCondSignextOfHighBitExtractToSignextHighBitExtract(I))
      return V;
diff --git a/llvm/test/Transforms/InstCombine/sub.ll b/llvm/test/Transforms/InstCombine/sub.ll

index d703004..3e9c066 100644 (file)
--- a/llvm/test/Transforms/InstCombine/sub.ll
+++ b/llvm/test/Transforms/InstCombine/sub.ll
@@ -1464,8 +1464,7 @@ define i8 @sub_add_sub_reassoc_use2(i8 %w, i8 %x, i8 %y, i8 %z) {
  define i8 @sub_mask_lowbits(i8 %x) {
  ; CHECK-LABEL: @sub_mask_lowbits(
  ; CHECK-NEXT:    [[A1:%.*]] = add i8 [[X:%.*]], -108
-; CHECK-NEXT:    [[A2:%.*]] = and i8 [[X]], 3
-; CHECK-NEXT:    [[R:%.*]] = sub i8 [[A1]], [[A2]]
+; CHECK-NEXT:    [[R:%.*]] = and i8 [[A1]], -4
  ; CHECK-NEXT:    ret i8 [[R]]
  ;
    %a1 = add i8 %x, 148 ; 0x94
@@ -1474,6 +1473,8 @@ define i8 @sub_mask_lowbits(i8 %x) {
    ret i8 %r
  }
  
+; Negative test - low-bit mask must not overlap with offset
+
  define i8 @sub_not_mask_lowbits(i8 %x) {
  ; CHECK-LABEL: @sub_not_mask_lowbits(
  ; CHECK-NEXT:    [[A1:%.*]] = add i8 [[X:%.*]], 4
@@ -1492,7 +1493,7 @@ define <2 x i8> @sub_mask_lowbits_splat_extra_use(<2 x i8> %x, <2 x i8>* %p) {
  ; CHECK-NEXT:    [[A1:%.*]] = add <2 x i8> [[X:%.*]], <i8 -64, i8 -64>
  ; CHECK-NEXT:    [[A2:%.*]] = and <2 x i8> [[X]], <i8 10, i8 10>
  ; CHECK-NEXT:    store <2 x i8> [[A2]], <2 x i8>* [[P:%.*]], align 2
-; CHECK-NEXT:    [[R:%.*]] = sub <2 x i8> [[A1]], [[A2]]
+; CHECK-NEXT:    [[R:%.*]] = and <2 x i8> [[A1]], <i8 -11, i8 -11>
  ; CHECK-NEXT:    ret <2 x i8> [[R]]
  ;
    %a1 = add <2 x i8> %x, <i8 192, i8 192> ; 0xc0
author	Sanjay Patel <spatel@rotateright.com>
	Fri, 13 Nov 2020 00:59:56 +0000 (19:59 -0500)
committer	Sanjay Patel <spatel@rotateright.com>
	Fri, 13 Nov 2020 01:10:28 +0000 (20:10 -0500)
llvm/lib/Transforms/InstCombine/InstCombineAddSub.cpp		patch | blob | history
llvm/test/Transforms/InstCombine/sub.ll		patch | blob | history