Summary:
https://bugs.llvm.org/show_bug.cgi?id=38123
This pattern will be produced by the Implicit Integer Truncation sanitizer
(https://reviews.llvm.org/D48958, https://bugs.llvm.org/show_bug.cgi?id=21530)
in the unsigned case, so it is probably a good idea to improve it.
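For illustration, here is a hedged source-level sketch of the kind of check the
sanitizer conceptually emits (the function and names are mine, for exposition;
they are not taken from the sanitizer itself):

  #include <cstdint>

  // Truncating X to DstBits bits is lossless iff no set bits are discarded.
  // With Mask being the low-bit mask of DstBits bits, this is exactly the
  //   x & (-1 >> y) == x
  // pattern that this patch teaches InstCombine to fold to  x u<= Mask.
  // DstBits must be in [1, 64].
  bool isLosslessTruncation(uint64_t X, unsigned DstBits) {
    uint64_t Mask = UINT64_MAX >> (64 - DstBits); // low-bit mask
    return (X & Mask) == X; // after this patch: icmp ule X, Mask
  }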
https://rise4fun.com/Alive/Rny
^ There are more opportunities for folds; I will follow up with them afterwards.
Caveat: this somehow exposes missed fold opportunities
in `test/Transforms/InstCombine/icmp-logical.ll`.
It seems the problem is in `foldLogOpOfMaskedICmps()` in `InstCombineAndOrXor.cpp`,
but I'm not quite sure what is wrong, because it calls `getMaskedTypeForICmpPair()`,
which calls `decomposeBitTestICmp()`, which should already handle these cases...
As @spatel notes in https://reviews.llvm.org/D49179#1158760,
that code is a rather complex mess, so we'll let it slide.
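For reference, the regressing pattern looks roughly like this at the source
level (a sketch of the @masked_or_A test updated below; the function name is
illustrative):

  #include <cstdint>

  // (A & 7) == A implies (A & 39) == A, since 7 is a submask of 39, so
  // foldLogOpOfMaskedICmps() used to collapse the disjunction to just the
  // second compare. With this patch, the first compare is rewritten to
  // A < 8u before that combine sees the pair, and the fold is missed.
  bool maskedOr(uint32_t A) {
    return (A & 7) == A || (A & 39) == A;
  }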
Reviewers: spatel, craig.topper
Reviewed By: spatel
Subscribers: yamauchi, majnemer, t.p.northover, llvm-commits
Differential Revision: https://reviews.llvm.org/D49179
llvm-svn: 336834
return cst_pred_ty<is_sign_mask>();
}
+struct is_lowbit_mask {
+  bool isValue(const APInt &C) { return C.isMask(); }
+};
+/// Match an integer or vector with only the low bit(s) set.
+/// For vectors, this includes constants with undefined elements.
+inline cst_pred_ty<is_lowbit_mask> m_LowBitMask() {
+  return cst_pred_ty<is_lowbit_mask>();
+}
+
struct is_nan {
bool isValue(const APFloat &C) { return C.isNaN(); }
};
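For reference, a minimal sketch of how the new matcher composes with the
existing combinators (this mirrors its use in foldICmpWithLowBitMaskedVal
below; the helper name is mine):

  #include "llvm/IR/PatternMatch.h"
  #include "llvm/IR/Value.h"
  using namespace llvm;
  using namespace llvm::PatternMatch;

  // Matches either a variable low-bit mask (-1 >> y) or a constant one
  // (0b0..01..1, including vector splats with undef elements).
  static bool isLowBitMaskValue(Value *V) {
    return match(V, m_CombineOr(m_LShr(m_AllOnes(), m_Value()),
                                m_LowBitMask()));
  }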
return nullptr;
}
+/// Some comparisons can be simplified.
+/// In this case, we are looking for comparisons that look like
+/// a check for a lossy truncation.
+/// Folds:
+///   x & (-1 >> y) SrcPred x    to    x DstPred (-1 >> y)
+/// The Mask can be a constant, too.
+static Value *foldICmpWithLowBitMaskedVal(ICmpInst &I,
+                                          InstCombiner::BuilderTy &Builder) {
+  ICmpInst::Predicate SrcPred;
+  Value *X, *M;
+  auto m_Mask = m_CombineOr(m_LShr(m_AllOnes(), m_Value()), m_LowBitMask());
+  if (!match(&I, m_c_ICmp(SrcPred,
+                          m_c_And(m_CombineAnd(m_Mask, m_Value(M)), m_Value(X)),
+                          m_Deferred(X))))
+    return nullptr;
+
+  ICmpInst::Predicate DstPred;
+  switch (SrcPred) {
+  case ICmpInst::Predicate::ICMP_EQ:
+    //  x & (-1 >> y) == x    ->    x u<= (-1 >> y)
+    DstPred = ICmpInst::Predicate::ICMP_ULE;
+    break;
+  // TODO: more folds are possible, https://bugs.llvm.org/show_bug.cgi?id=38123
+  default:
+    return nullptr;
+  }
+
+  return Builder.CreateICmp(DstPred, X, M);
+}
+
/// Try to fold icmp (binop), X or icmp X, (binop).
/// TODO: A large part of this logic is duplicated in InstSimplify's
/// simplifyICmpWithBinOp(). We should be able to share that and avoid the code
}
}
+  if (Value *V = foldICmpWithLowBitMaskedVal(I, Builder))
+    return replaceInstUsesWith(I, V);
+
return nullptr;
}
if (match(Op1, m_Add(m_Value(X), m_ConstantInt(Cst))) && Op0 == X)
return foldICmpAddOpConst(X, Cst, I.getSwappedPredicate());
}
+
return Changed ? &I : nullptr;
}
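Independently of the Alive proof above, the fold can be verified exhaustively
for i8 with a small standalone program (my own sanity check, not part of the
patch):

  #include <cassert>
  #include <cstdint>

  // Check  x & (-1 >> y) == x  <=>  x u<= (-1 >> y)  for every 8-bit x
  // and every shift amount y in [0, 7].
  int main() {
    for (unsigned Y = 0; Y < 8; ++Y) {
      uint8_t M = uint8_t(0xFFu >> Y); // the low-bit mask (-1 >> y)
      for (unsigned X = 0; X <= 0xFF; ++X) {
        bool Src = (uint8_t(X) & M) == uint8_t(X); // original compare
        bool Dst = uint8_t(X) <= M;                // folded compare
        assert(Src == Dst);
      }
    }
    return 0;
  }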
define i1 @p0(i8 %x) {
; CHECK-LABEL: @p0(
-; CHECK-NEXT: [[TMP0:%.*]] = and i8 [[X:%.*]], 3
-; CHECK-NEXT: [[RET:%.*]] = icmp eq i8 [[TMP0]], [[X]]
-; CHECK-NEXT: ret i1 [[RET]]
+; CHECK-NEXT: [[TMP1:%.*]] = icmp ult i8 [[X:%.*]], 4
+; CHECK-NEXT: ret i1 [[TMP1]]
;
%tmp0 = and i8 %x, 3
%ret = icmp eq i8 %tmp0, %x
define <2 x i1> @p1_vec_splat(<2 x i8> %x) {
; CHECK-LABEL: @p1_vec_splat(
-; CHECK-NEXT: [[TMP0:%.*]] = and <2 x i8> [[X:%.*]], <i8 3, i8 3>
-; CHECK-NEXT: [[RET:%.*]] = icmp eq <2 x i8> [[TMP0]], [[X]]
-; CHECK-NEXT: ret <2 x i1> [[RET]]
+; CHECK-NEXT: [[TMP1:%.*]] = icmp ult <2 x i8> [[X:%.*]], <i8 4, i8 4>
+; CHECK-NEXT: ret <2 x i1> [[TMP1]]
;
%tmp0 = and <2 x i8> %x, <i8 3, i8 3>
%ret = icmp eq <2 x i8> %tmp0, %x
define <2 x i1> @p2_vec_nonsplat(<2 x i8> %x) {
; CHECK-LABEL: @p2_vec_nonsplat(
-; CHECK-NEXT: [[TMP0:%.*]] = and <2 x i8> [[X:%.*]], <i8 3, i8 15>
-; CHECK-NEXT: [[RET:%.*]] = icmp eq <2 x i8> [[TMP0]], [[X]]
-; CHECK-NEXT: ret <2 x i1> [[RET]]
+; CHECK-NEXT: [[TMP1:%.*]] = icmp ult <2 x i8> [[X:%.*]], <i8 4, i8 16>
+; CHECK-NEXT: ret <2 x i1> [[TMP1]]
;
%tmp0 = and <2 x i8> %x, <i8 3, i8 15> ; doesn't have to be splat.
%ret = icmp eq <2 x i8> %tmp0, %x
define <3 x i1> @p3_vec_splat_undef(<3 x i8> %x) {
; CHECK-LABEL: @p3_vec_splat_undef(
-; CHECK-NEXT: [[TMP0:%.*]] = and <3 x i8> [[X:%.*]], <i8 3, i8 undef, i8 3>
-; CHECK-NEXT: [[RET:%.*]] = icmp eq <3 x i8> [[TMP0]], [[X]]
-; CHECK-NEXT: ret <3 x i1> [[RET]]
+; CHECK-NEXT: [[TMP1:%.*]] = icmp ult <3 x i8> [[X:%.*]], <i8 4, i8 undef, i8 4>
+; CHECK-NEXT: ret <3 x i1> [[TMP1]]
;
%tmp0 = and <3 x i8> %x, <i8 3, i8 undef, i8 3>
%ret = icmp eq <3 x i8> %tmp0, %x
define i1 @c0() {
; CHECK-LABEL: @c0(
; CHECK-NEXT: [[X:%.*]] = call i8 @gen8()
-; CHECK-NEXT: [[TMP0:%.*]] = and i8 [[X]], 3
-; CHECK-NEXT: [[RET:%.*]] = icmp eq i8 [[X]], [[TMP0]]
-; CHECK-NEXT: ret i1 [[RET]]
+; CHECK-NEXT: [[TMP1:%.*]] = icmp ult i8 [[X]], 4
+; CHECK-NEXT: ret i1 [[TMP1]]
;
%x = call i8 @gen8()
%tmp0 = and i8 %x, 3
; CHECK-LABEL: @oneuse0(
; CHECK-NEXT: [[TMP0:%.*]] = and i8 [[X:%.*]], 3
; CHECK-NEXT: call void @use8(i8 [[TMP0]])
-; CHECK-NEXT: [[RET:%.*]] = icmp eq i8 [[TMP0]], [[X]]
-; CHECK-NEXT: ret i1 [[RET]]
+; CHECK-NEXT: [[TMP1:%.*]] = icmp ult i8 [[X]], 4
+; CHECK-NEXT: ret i1 [[TMP1]]
;
%tmp0 = and i8 %x, 3
call void @use8(i8 %tmp0)
define i1 @p0(i8 %x, i8 %y) {
; CHECK-LABEL: @p0(
; CHECK-NEXT: [[TMP0:%.*]] = lshr i8 -1, [[Y:%.*]]
-; CHECK-NEXT: [[TMP1:%.*]] = and i8 [[TMP0]], [[X:%.*]]
-; CHECK-NEXT: [[RET:%.*]] = icmp eq i8 [[TMP1]], [[X]]
-; CHECK-NEXT: ret i1 [[RET]]
+; CHECK-NEXT: [[TMP1:%.*]] = icmp uge i8 [[TMP0]], [[X:%.*]]
+; CHECK-NEXT: ret i1 [[TMP1]]
;
%tmp0 = lshr i8 -1, %y
%tmp1 = and i8 %tmp0, %x
define <2 x i1> @p1_vec(<2 x i8> %x, <2 x i8> %y) {
; CHECK-LABEL: @p1_vec(
; CHECK-NEXT: [[TMP0:%.*]] = lshr <2 x i8> <i8 -1, i8 -1>, [[Y:%.*]]
-; CHECK-NEXT: [[TMP1:%.*]] = and <2 x i8> [[TMP0]], [[X:%.*]]
-; CHECK-NEXT: [[RET:%.*]] = icmp eq <2 x i8> [[TMP1]], [[X]]
-; CHECK-NEXT: ret <2 x i1> [[RET]]
+; CHECK-NEXT: [[TMP1:%.*]] = icmp uge <2 x i8> [[TMP0]], [[X:%.*]]
+; CHECK-NEXT: ret <2 x i1> [[TMP1]]
;
%tmp0 = lshr <2 x i8> <i8 -1, i8 -1>, %y
%tmp1 = and <2 x i8> %tmp0, %x
define <3 x i1> @p2_vec_undef(<3 x i8> %x, <3 x i8> %y) {
; CHECK-LABEL: @p2_vec_undef(
; CHECK-NEXT: [[TMP0:%.*]] = lshr <3 x i8> <i8 -1, i8 undef, i8 -1>, [[Y:%.*]]
-; CHECK-NEXT: [[TMP1:%.*]] = and <3 x i8> [[TMP0]], [[X:%.*]]
-; CHECK-NEXT: [[RET:%.*]] = icmp eq <3 x i8> [[TMP1]], [[X]]
-; CHECK-NEXT: ret <3 x i1> [[RET]]
+; CHECK-NEXT: [[TMP1:%.*]] = icmp uge <3 x i8> [[TMP0]], [[X:%.*]]
+; CHECK-NEXT: ret <3 x i1> [[TMP1]]
;
%tmp0 = lshr <3 x i8> <i8 -1, i8 undef, i8 -1>, %y
%tmp1 = and <3 x i8> %tmp0, %x
; CHECK-LABEL: @c0(
; CHECK-NEXT: [[TMP0:%.*]] = lshr i8 -1, [[Y:%.*]]
; CHECK-NEXT: [[X:%.*]] = call i8 @gen8()
-; CHECK-NEXT: [[TMP1:%.*]] = and i8 [[X]], [[TMP0]]
-; CHECK-NEXT: [[RET:%.*]] = icmp eq i8 [[TMP1]], [[X]]
-; CHECK-NEXT: ret i1 [[RET]]
+; CHECK-NEXT: [[TMP1:%.*]] = icmp ule i8 [[X]], [[TMP0]]
+; CHECK-NEXT: ret i1 [[TMP1]]
;
%tmp0 = lshr i8 -1, %y
%x = call i8 @gen8()
; CHECK-LABEL: @c1(
; CHECK-NEXT: [[TMP0:%.*]] = lshr i8 -1, [[Y:%.*]]
; CHECK-NEXT: [[X:%.*]] = call i8 @gen8()
-; CHECK-NEXT: [[TMP1:%.*]] = and i8 [[TMP0]], [[X]]
-; CHECK-NEXT: [[RET:%.*]] = icmp eq i8 [[X]], [[TMP1]]
-; CHECK-NEXT: ret i1 [[RET]]
+; CHECK-NEXT: [[TMP1:%.*]] = icmp ule i8 [[X]], [[TMP0]]
+; CHECK-NEXT: ret i1 [[TMP1]]
;
%tmp0 = lshr i8 -1, %y
%x = call i8 @gen8()
; CHECK-LABEL: @c2(
; CHECK-NEXT: [[TMP0:%.*]] = lshr i8 -1, [[Y:%.*]]
; CHECK-NEXT: [[X:%.*]] = call i8 @gen8()
-; CHECK-NEXT: [[TMP1:%.*]] = and i8 [[X]], [[TMP0]]
-; CHECK-NEXT: [[RET:%.*]] = icmp eq i8 [[X]], [[TMP1]]
-; CHECK-NEXT: ret i1 [[RET]]
+; CHECK-NEXT: [[TMP1:%.*]] = icmp ule i8 [[X]], [[TMP0]]
+; CHECK-NEXT: ret i1 [[TMP1]]
;
%tmp0 = lshr i8 -1, %y
%x = call i8 @gen8()
; CHECK-LABEL: @oneuse0(
; CHECK-NEXT: [[TMP0:%.*]] = lshr i8 -1, [[Y:%.*]]
; CHECK-NEXT: call void @use8(i8 [[TMP0]])
-; CHECK-NEXT: [[TMP1:%.*]] = and i8 [[TMP0]], [[X:%.*]]
-; CHECK-NEXT: [[RET:%.*]] = icmp eq i8 [[TMP1]], [[X]]
-; CHECK-NEXT: ret i1 [[RET]]
+; CHECK-NEXT: [[TMP1:%.*]] = icmp uge i8 [[TMP0]], [[X:%.*]]
+; CHECK-NEXT: ret i1 [[TMP1]]
;
%tmp0 = lshr i8 -1, %y
call void @use8(i8 %tmp0)
; CHECK-NEXT: [[TMP0:%.*]] = lshr i8 -1, [[Y:%.*]]
; CHECK-NEXT: [[TMP1:%.*]] = and i8 [[TMP0]], [[X:%.*]]
; CHECK-NEXT: call void @use8(i8 [[TMP1]])
-; CHECK-NEXT: [[RET:%.*]] = icmp eq i8 [[TMP1]], [[X]]
-; CHECK-NEXT: ret i1 [[RET]]
+; CHECK-NEXT: [[TMP2:%.*]] = icmp uge i8 [[TMP0]], [[X]]
+; CHECK-NEXT: ret i1 [[TMP2]]
;
%tmp0 = lshr i8 -1, %y
%tmp1 = and i8 %tmp0, %x
; CHECK-NEXT: call void @use8(i8 [[TMP0]])
; CHECK-NEXT: [[TMP1:%.*]] = and i8 [[TMP0]], [[X:%.*]]
; CHECK-NEXT: call void @use8(i8 [[TMP1]])
-; CHECK-NEXT: [[RET:%.*]] = icmp eq i8 [[TMP1]], [[X]]
-; CHECK-NEXT: ret i1 [[RET]]
+; CHECK-NEXT: [[TMP2:%.*]] = icmp uge i8 [[TMP0]], [[X]]
+; CHECK-NEXT: ret i1 [[TMP2]]
;
%tmp0 = lshr i8 -1, %y
call void @use8(i8 %tmp0)
define i1 @masked_or_A(i32 %A) {
; CHECK-LABEL: @masked_or_A(
-; CHECK-NEXT: [[MASK2:%.*]] = and i32 [[A:%.*]], 39
+; CHECK-NEXT: [[TMP1:%.*]] = icmp ult i32 [[A:%.*]], 8
+; CHECK-NEXT: [[MASK2:%.*]] = and i32 [[A]], 39
; CHECK-NEXT: [[TST2:%.*]] = icmp eq i32 [[MASK2]], [[A]]
-; CHECK-NEXT: ret i1 [[TST2]]
+; CHECK-NEXT: [[RES:%.*]] = or i1 [[TMP1]], [[TST2]]
+; CHECK-NEXT: ret i1 [[RES]]
;
%mask1 = and i32 %A, 7
%tst1 = icmp eq i32 %mask1, %A
; CHECK-NEXT: [[SHR:%.*]] = lshr i32 [[MUL]], [[SH_PROM]]
; CHECK-NEXT: [[CONV2:%.*]] = zext i32 [[SHR]] to i64
; CHECK-NEXT: [[MUL3:%.*]] = mul nuw nsw i64 [[CONV]], [[CONV2]]
-; CHECK-NEXT: [[CONV6:%.*]] = and i64 [[MUL3]], 4294967295
-; CHECK-NEXT: [[TOBOOL:%.*]] = icmp eq i64 [[CONV6]], [[MUL3]]
-; CHECK-NEXT: br i1 [[TOBOOL]], label [[LOR_RHS:%.*]], label [[LOR_END:%.*]]
+; CHECK-NEXT: [[TMP3:%.*]] = icmp ugt i64 [[MUL3]], 4294967295
+; CHECK-NEXT: br i1 [[TMP3]], label [[LOR_END:%.*]], label [[LOR_RHS:%.*]]
; CHECK: lor.rhs:
; CHECK-NEXT: [[AND:%.*]] = and i64 [[MUL3]], [[TMP2]]
; CHECK-NEXT: [[CONV4:%.*]] = trunc i64 [[AND]] to i32
; CHECK-NEXT: [[PHITMP:%.*]] = zext i1 [[TOBOOL7]] to i32
; CHECK-NEXT: br label [[LOR_END]]
; CHECK: lor.end:
-; CHECK-NEXT: [[TMP3:%.*]] = phi i32 [ 1, [[ENTRY:%.*]] ], [ [[PHITMP]], [[LOR_RHS]] ]
-; CHECK-NEXT: ret i32 [[TMP3]]
+; CHECK-NEXT: [[TMP4:%.*]] = phi i32 [ 1, [[ENTRY:%.*]] ], [ [[PHITMP]], [[LOR_RHS]] ]
+; CHECK-NEXT: ret i32 [[TMP4]]
;
entry:
%conv = zext i32 %0 to i64