[X86] Improve detection of unneeded shift amount masking to also handle the case...

author Craig Topper <craig.topper@intel.com>

Mon, 25 Feb 2019 19:42:47 +0000 (19:42 +0000)

committer Craig Topper <craig.topper@intel.com>

Mon, 25 Feb 2019 19:42:47 +0000 (19:42 +0000)
author Craig Topper <craig.topper@intel.com>
Mon, 25 Feb 2019 19:42:47 +0000 (19:42 +0000)
committer Craig Topper <craig.topper@intel.com>
Mon, 25 Feb 2019 19:42:47 +0000 (19:42 +0000)
diff --git a/llvm/lib/Target/X86/X86ISelDAGToDAG.cpp b/llvm/lib/Target/X86/X86ISelDAGToDAG.cpp

index 5f051b3..e29c8dc 100644 (file)
--- a/llvm/lib/Target/X86/X86ISelDAGToDAG.cpp
+++ b/llvm/lib/Target/X86/X86ISelDAGToDAG.cpp
@@ -399,6 +399,19 @@ namespace {
        return getI8Imm((Index * VecVT.getScalarSizeInBits()) / VecWidth, DL);
      }
  
+    // Helper to detect unneeded and instructions on shift amounts. Called
+    // from PatFrags in tablegen.
+    bool isUnneededShiftMask(SDNode *N, unsigned Width) const {
+      assert(N->getOpcode() == ISD::AND && "Unexpected opcode");
+      const APInt &Val = cast<ConstantSDNode>(N->getOperand(1))->getAPIntValue();
+
+      if (Val.countTrailingOnes() >= Width)
+        return true;
+
+      APInt Mask = Val | CurDAG->computeKnownBits(N->getOperand(0)).Zero;
+      return Mask.countTrailingOnes() >= Width;
+    }
+
      /// Return an SDNode that returns the value of the global base register.
      /// Output instructions required to initialize the global base register,
      /// if necessary.
diff --git a/llvm/lib/Target/X86/X86InstrCompiler.td b/llvm/lib/Target/X86/X86InstrCompiler.td

index 55e87aa..fe826c4 100644 (file)
--- a/llvm/lib/Target/X86/X86InstrCompiler.td
+++ b/llvm/lib/Target/X86/X86InstrCompiler.td
@@ -1715,40 +1715,43 @@ def : Pat<(shl GR16:$src1, (i8 1)), (ADD16rr GR16:$src1, GR16:$src1)>;
  def : Pat<(shl GR32:$src1, (i8 1)), (ADD32rr GR32:$src1, GR32:$src1)>;
  def : Pat<(shl GR64:$src1, (i8 1)), (ADD64rr GR64:$src1, GR64:$src1)>;
  
-// Helper imms to check if a mask doesn't change significant shift/rotate bits.
-def immShift8 : ImmLeaf<i8, [{
-  return countTrailingOnes<uint64_t>(Imm) >= 3;
+def shiftMask8 : PatFrag<(ops node:$lhs), (and node:$lhs, imm), [{
+  return isUnneededShiftMask(N, 3);
  }]>;
-def immShift16 : ImmLeaf<i8, [{
-  return countTrailingOnes<uint64_t>(Imm) >= 4;
+
+def shiftMask16 : PatFrag<(ops node:$lhs), (and node:$lhs, imm), [{
+  return isUnneededShiftMask(N, 4);
  }]>;
-def immShift32 : ImmLeaf<i8, [{
-  return countTrailingOnes<uint64_t>(Imm) >= 5;
+
+def shiftMask32 : PatFrag<(ops node:$lhs), (and node:$lhs, imm), [{
+  return isUnneededShiftMask(N, 5);
  }]>;
-def immShift64 : ImmLeaf<i8, [{
-  return countTrailingOnes<uint64_t>(Imm) >= 6;
+
+def shiftMask64 : PatFrag<(ops node:$lhs), (and node:$lhs, imm), [{
+  return isUnneededShiftMask(N, 6);
  }]>;
  
+
  // Shift amount is implicitly masked.
  multiclass MaskedShiftAmountPats<SDNode frag, string name> {
    // (shift x (and y, 31)) ==> (shift x, y)
-  def : Pat<(frag GR8:$src1, (and CL, immShift32)),
+  def : Pat<(frag GR8:$src1, (shiftMask32 CL)),
              (!cast<Instruction>(name # "8rCL") GR8:$src1)>;
-  def : Pat<(frag GR16:$src1, (and CL, immShift32)),
+  def : Pat<(frag GR16:$src1, (shiftMask32 CL)),
              (!cast<Instruction>(name # "16rCL") GR16:$src1)>;
-  def : Pat<(frag GR32:$src1, (and CL, immShift32)),
+  def : Pat<(frag GR32:$src1, (shiftMask32 CL)),
              (!cast<Instruction>(name # "32rCL") GR32:$src1)>;
-  def : Pat<(store (frag (loadi8 addr:$dst), (and CL, immShift32)), addr:$dst),
+  def : Pat<(store (frag (loadi8 addr:$dst), (shiftMask32 CL)), addr:$dst),
              (!cast<Instruction>(name # "8mCL") addr:$dst)>;
-  def : Pat<(store (frag (loadi16 addr:$dst), (and CL, immShift32)), addr:$dst),
+  def : Pat<(store (frag (loadi16 addr:$dst), (shiftMask32 CL)), addr:$dst),
              (!cast<Instruction>(name # "16mCL") addr:$dst)>;
-  def : Pat<(store (frag (loadi32 addr:$dst), (and CL, immShift32)), addr:$dst),
+  def : Pat<(store (frag (loadi32 addr:$dst), (shiftMask32 CL)), addr:$dst),
              (!cast<Instruction>(name # "32mCL") addr:$dst)>;
  
    // (shift x (and y, 63)) ==> (shift x, y)
-  def : Pat<(frag GR64:$src1, (and CL, immShift64)),
+  def : Pat<(frag GR64:$src1, (shiftMask64 CL)),
              (!cast<Instruction>(name # "64rCL") GR64:$src1)>;
-  def : Pat<(store (frag (loadi64 addr:$dst), (and CL, immShift64)), addr:$dst),
+  def : Pat<(store (frag (loadi64 addr:$dst), (shiftMask64 CL)), addr:$dst),
              (!cast<Instruction>(name # "64mCL") addr:$dst)>;
  }
  
@@ -1764,23 +1767,23 @@ defm : MaskedShiftAmountPats<sra, "SAR">;
  // not tracking flags for these nodes.
  multiclass MaskedRotateAmountPats<SDNode frag, string name> {
    // (rot x (and y, BitWidth - 1)) ==> (rot x, y)
-  def : Pat<(frag GR8:$src1, (and CL, immShift8)),
+  def : Pat<(frag GR8:$src1, (shiftMask8 CL)),
    (!cast<Instruction>(name # "8rCL") GR8:$src1)>;
-  def : Pat<(frag GR16:$src1, (and CL, immShift16)),
+  def : Pat<(frag GR16:$src1, (shiftMask16 CL)),
    (!cast<Instruction>(name # "16rCL") GR16:$src1)>;
-  def : Pat<(frag GR32:$src1, (and CL, immShift32)),
+  def : Pat<(frag GR32:$src1, (shiftMask32 CL)),
    (!cast<Instruction>(name # "32rCL") GR32:$src1)>;
-  def : Pat<(store (frag (loadi8 addr:$dst), (and CL, immShift8)), addr:$dst),
+  def : Pat<(store (frag (loadi8 addr:$dst), (shiftMask8 CL)), addr:$dst),
    (!cast<Instruction>(name # "8mCL") addr:$dst)>;
-  def : Pat<(store (frag (loadi16 addr:$dst), (and CL, immShift16)), addr:$dst),
+  def : Pat<(store (frag (loadi16 addr:$dst), (shiftMask16 CL)), addr:$dst),
    (!cast<Instruction>(name # "16mCL") addr:$dst)>;
-  def : Pat<(store (frag (loadi32 addr:$dst), (and CL, immShift32)), addr:$dst),
+  def : Pat<(store (frag (loadi32 addr:$dst), (shiftMask32 CL)), addr:$dst),
    (!cast<Instruction>(name # "32mCL") addr:$dst)>;
  
    // (rot x (and y, 63)) ==> (rot x, y)
-  def : Pat<(frag GR64:$src1, (and CL, immShift64)),
+  def : Pat<(frag GR64:$src1, (shiftMask64 CL)),
    (!cast<Instruction>(name # "64rCL") GR64:$src1)>;
-  def : Pat<(store (frag (loadi64 addr:$dst), (and CL, immShift64)), addr:$dst),
+  def : Pat<(store (frag (loadi64 addr:$dst), (shiftMask64 CL)), addr:$dst),
    (!cast<Instruction>(name # "64mCL") addr:$dst)>;
  }
  
@@ -1791,13 +1794,13 @@ defm : MaskedRotateAmountPats<rotr, "ROR">;
  // Double shift amount is implicitly masked.
  multiclass MaskedDoubleShiftAmountPats<SDNode frag, string name> {
    // (shift x (and y, 31)) ==> (shift x, y)
-  def : Pat<(frag GR16:$src1, GR16:$src2, (and CL, immShift32)),
+  def : Pat<(frag GR16:$src1, GR16:$src2, (shiftMask32 CL)),
              (!cast<Instruction>(name # "16rrCL") GR16:$src1, GR16:$src2)>;
-  def : Pat<(frag GR32:$src1, GR32:$src2, (and CL, immShift32)),
+  def : Pat<(frag GR32:$src1, GR32:$src2, (shiftMask32 CL)),
              (!cast<Instruction>(name # "32rrCL") GR32:$src1, GR32:$src2)>;
  
    // (shift x (and y, 63)) ==> (shift x, y)
-  def : Pat<(frag GR64:$src1, GR64:$src2, (and CL, immShift64)),
+  def : Pat<(frag GR64:$src1, GR64:$src2, (shiftMask32 CL)),
              (!cast<Instruction>(name # "64rrCL") GR64:$src1, GR64:$src2)>;
  }
  
@@ -1806,57 +1809,57 @@ defm : MaskedDoubleShiftAmountPats<X86shrd, "SHRD">;
  
  let Predicates = [HasBMI2] in {
    let AddedComplexity = 1 in {
-    def : Pat<(sra GR32:$src1, (and GR8:$src2, immShift32)),
+    def : Pat<(sra GR32:$src1, (shiftMask32 GR8:$src2)),
                (SARX32rr GR32:$src1,
                          (INSERT_SUBREG
                            (i32 (IMPLICIT_DEF)), GR8:$src2, sub_8bit))>;
-    def : Pat<(sra GR64:$src1, (and GR8:$src2, immShift64)),
+    def : Pat<(sra GR64:$src1, (shiftMask64 GR8:$src2)),
                (SARX64rr GR64:$src1,
                          (INSERT_SUBREG
                            (i64 (IMPLICIT_DEF)), GR8:$src2, sub_8bit))>;
  
-    def : Pat<(srl GR32:$src1, (and GR8:$src2, immShift32)),
+    def : Pat<(srl GR32:$src1, (shiftMask32 GR8:$src2)),
                (SHRX32rr GR32:$src1,
                          (INSERT_SUBREG
                            (i32 (IMPLICIT_DEF)), GR8:$src2, sub_8bit))>;
-    def : Pat<(srl GR64:$src1, (and GR8:$src2, immShift64)),
+    def : Pat<(srl GR64:$src1, (shiftMask64 GR8:$src2)),
                (SHRX64rr GR64:$src1,
                          (INSERT_SUBREG
                            (i64 (IMPLICIT_DEF)), GR8:$src2, sub_8bit))>;
  
-    def : Pat<(shl GR32:$src1, (and GR8:$src2, immShift32)),
+    def : Pat<(shl GR32:$src1, (shiftMask32 GR8:$src2)),
                (SHLX32rr GR32:$src1,
                          (INSERT_SUBREG
                            (i32 (IMPLICIT_DEF)), GR8:$src2, sub_8bit))>;
-    def : Pat<(shl GR64:$src1, (and GR8:$src2, immShift64)),
+    def : Pat<(shl GR64:$src1, (shiftMask64 GR8:$src2)),
                (SHLX64rr GR64:$src1,
                          (INSERT_SUBREG
                            (i64 (IMPLICIT_DEF)), GR8:$src2, sub_8bit))>;
    }
  
-  def : Pat<(sra (loadi32 addr:$src1), (and GR8:$src2, immShift32)),
+  def : Pat<(sra (loadi32 addr:$src1), (shiftMask32 GR8:$src2)),
              (SARX32rm addr:$src1,
                        (INSERT_SUBREG
                          (i32 (IMPLICIT_DEF)), GR8:$src2, sub_8bit))>;
-  def : Pat<(sra (loadi64 addr:$src1), (and GR8:$src2, immShift64)),
+  def : Pat<(sra (loadi64 addr:$src1), (shiftMask64 GR8:$src2)),
              (SARX64rm addr:$src1,
                        (INSERT_SUBREG
                          (i64 (IMPLICIT_DEF)), GR8:$src2, sub_8bit))>;
  
-  def : Pat<(srl (loadi32 addr:$src1), (and GR8:$src2, immShift32)),
+  def : Pat<(srl (loadi32 addr:$src1), (shiftMask32 GR8:$src2)),
              (SHRX32rm addr:$src1,
                        (INSERT_SUBREG
                          (i32 (IMPLICIT_DEF)), GR8:$src2, sub_8bit))>;
-  def : Pat<(srl (loadi64 addr:$src1), (and GR8:$src2, immShift64)),
+  def : Pat<(srl (loadi64 addr:$src1), (shiftMask64 GR8:$src2)),
              (SHRX64rm addr:$src1,
                        (INSERT_SUBREG
                          (i64 (IMPLICIT_DEF)), GR8:$src2, sub_8bit))>;
  
-  def : Pat<(shl (loadi32 addr:$src1), (and GR8:$src2, immShift32)),
+  def : Pat<(shl (loadi32 addr:$src1), (shiftMask32 GR8:$src2)),
              (SHLX32rm addr:$src1,
                        (INSERT_SUBREG
                          (i32 (IMPLICIT_DEF)), GR8:$src2, sub_8bit))>;
-  def : Pat<(shl (loadi64 addr:$src1), (and GR8:$src2, immShift64)),
+  def : Pat<(shl (loadi64 addr:$src1), (shiftMask64 GR8:$src2)),
              (SHLX64rm addr:$src1,
                        (INSERT_SUBREG
                          (i64 (IMPLICIT_DEF)), GR8:$src2, sub_8bit))>;
@@ -1865,7 +1868,7 @@ let Predicates = [HasBMI2] in {
  // Use BTR/BTS/BTC for clearing/setting/toggling a bit in a variable location.
  multiclass one_bit_patterns<RegisterClass RC, ValueType VT, Instruction BTR,
                              Instruction BTS, Instruction BTC,
-                            ImmLeaf ImmShift> {
+                            PatFrag ShiftMask> {
    def : Pat<(and RC:$src1, (rotl -2, GR8:$src2)),
              (BTR RC:$src1,
                   (INSERT_SUBREG (VT (IMPLICIT_DEF)), GR8:$src2, sub_8bit))>;
@@ -1877,20 +1880,20 @@ multiclass one_bit_patterns<RegisterClass RC, ValueType VT, Instruction BTR,
                   (INSERT_SUBREG (VT (IMPLICIT_DEF)), GR8:$src2, sub_8bit))>;
  
    // Similar to above, but removing unneeded masking of the shift amount.
-  def : Pat<(and RC:$src1, (rotl -2, (and GR8:$src2, ImmShift))),
+  def : Pat<(and RC:$src1, (rotl -2, (ShiftMask GR8:$src2))),
              (BTR RC:$src1,
                   (INSERT_SUBREG (VT (IMPLICIT_DEF)), GR8:$src2, sub_8bit))>;
-  def : Pat<(or RC:$src1, (shl 1, (and GR8:$src2, ImmShift))),
+  def : Pat<(or RC:$src1, (shl 1, (ShiftMask GR8:$src2))),
              (BTS RC:$src1,
                  (INSERT_SUBREG (VT (IMPLICIT_DEF)), GR8:$src2, sub_8bit))>;
-  def : Pat<(xor RC:$src1, (shl 1, (and GR8:$src2, ImmShift))),
+  def : Pat<(xor RC:$src1, (shl 1, (ShiftMask GR8:$src2))),
              (BTC RC:$src1,
                  (INSERT_SUBREG (VT (IMPLICIT_DEF)), GR8:$src2, sub_8bit))>;
  }
  
-defm : one_bit_patterns<GR16, i16, BTR16rr, BTS16rr, BTC16rr, immShift16>;
-defm : one_bit_patterns<GR32, i32, BTR32rr, BTS32rr, BTC32rr, immShift32>;
-defm : one_bit_patterns<GR64, i64, BTR64rr, BTS64rr, BTC64rr, immShift64>;
+defm : one_bit_patterns<GR16, i16, BTR16rr, BTS16rr, BTC16rr, shiftMask16>;
+defm : one_bit_patterns<GR32, i32, BTR32rr, BTS32rr, BTC32rr, shiftMask32>;
+defm : one_bit_patterns<GR64, i64, BTR64rr, BTS64rr, BTC64rr, shiftMask64>;
  
  
  // (anyext (setcc_carry)) -> (setcc_carry)
diff --git a/llvm/test/CodeGen/X86/btc_bts_btr.ll b/llvm/test/CodeGen/X86/btc_bts_btr.ll

index 7459e87..6f43cf7 100644 (file)
--- a/llvm/test/CodeGen/X86/btc_bts_btr.ll
+++ b/llvm/test/CodeGen/X86/btc_bts_btr.ll
@@ -955,7 +955,6 @@ define i32 @btr_32_mask_zeros(i32 %x, i32 %n) {
  ; X64:       # %bb.0:
  ; X64-NEXT:    movl %edi, %eax
  ; X64-NEXT:    shlb $2, %sil
-; X64-NEXT:    andb $28, %sil
  ; X64-NEXT:    btrl %esi, %eax
  ; X64-NEXT:    retq
  ;
@@ -964,7 +963,6 @@ define i32 @btr_32_mask_zeros(i32 %x, i32 %n) {
  ; X86-NEXT:    movl {{[0-9]+}}(%esp), %eax
  ; X86-NEXT:    movb {{[0-9]+}}(%esp), %cl
  ; X86-NEXT:    shlb $2, %cl
-; X86-NEXT:    andb $28, %cl
  ; X86-NEXT:    btrl %ecx, %eax
  ; X86-NEXT:    retl
    %1 = shl i32 %n, 2
@@ -980,7 +978,6 @@ define i32 @bts_32_mask_zeros(i32 %x, i32 %n) {
  ; X64:       # %bb.0:
  ; X64-NEXT:    movl %edi, %eax
  ; X64-NEXT:    shlb $2, %sil
-; X64-NEXT:    andb $28, %sil
  ; X64-NEXT:    btsl %esi, %eax
  ; X64-NEXT:    retq
  ;
@@ -989,7 +986,6 @@ define i32 @bts_32_mask_zeros(i32 %x, i32 %n) {
  ; X86-NEXT:    movl {{[0-9]+}}(%esp), %eax
  ; X86-NEXT:    movb {{[0-9]+}}(%esp), %cl
  ; X86-NEXT:    shlb $2, %cl
-; X86-NEXT:    andb $28, %cl
  ; X86-NEXT:    btsl %ecx, %eax
  ; X86-NEXT:    retl
    %1 = shl i32 %n, 2
@@ -1004,7 +1000,6 @@ define i32 @btc_32_mask_zeros(i32 %x, i32 %n) {
  ; X64:       # %bb.0:
  ; X64-NEXT:    movl %edi, %eax
  ; X64-NEXT:    shlb $2, %sil
-; X64-NEXT:    andb $28, %sil
  ; X64-NEXT:    btcl %esi, %eax
  ; X64-NEXT:    retq
  ;
@@ -1013,7 +1008,6 @@ define i32 @btc_32_mask_zeros(i32 %x, i32 %n) {
  ; X86-NEXT:    movl {{[0-9]+}}(%esp), %eax
  ; X86-NEXT:    movb {{[0-9]+}}(%esp), %cl
  ; X86-NEXT:    shlb $2, %cl
-; X86-NEXT:    andb $28, %cl
  ; X86-NEXT:    btcl %ecx, %eax
  ; X86-NEXT:    retl
    %1 = shl i32 %n, 2
@@ -1028,23 +1022,18 @@ define i64 @btr_64_mask_zeros(i64 %x, i64 %n) {
  ; X64:       # %bb.0:
  ; X64-NEXT:    movq %rdi, %rax
  ; X64-NEXT:    shlb $2, %sil
-; X64-NEXT:    andb $60, %sil
  ; X64-NEXT:    btrq %rsi, %rax
  ; X64-NEXT:    retq
  ;
  ; X86-LABEL: btr_64_mask_zeros:
  ; X86:       # %bb.0:
-; X86-NEXT:    movb {{[0-9]+}}(%esp), %ch
-; X86-NEXT:    shlb $2, %ch
-; X86-NEXT:    movb %ch, %cl
-; X86-NEXT:    andb $60, %cl
+; X86-NEXT:    movb {{[0-9]+}}(%esp), %cl
+; X86-NEXT:    shlb $2, %cl
  ; X86-NEXT:    movl $1, %eax
  ; X86-NEXT:    xorl %edx, %edx
  ; X86-NEXT:    shldl %cl, %eax, %edx
-; X86-NEXT:    movb %ch, %cl
-; X86-NEXT:    andb $28, %cl
  ; X86-NEXT:    shll %cl, %eax
-; X86-NEXT:    testb $32, %ch
+; X86-NEXT:    testb $32, %cl
  ; X86-NEXT:    je .LBB39_2
  ; X86-NEXT:  # %bb.1:
  ; X86-NEXT:    movl %eax, %edx
@@ -1068,23 +1057,18 @@ define i64 @bts_64_mask_zeros(i64 %x, i64 %n) {
  ; X64:       # %bb.0:
  ; X64-NEXT:    movq %rdi, %rax
  ; X64-NEXT:    shlb $2, %sil
-; X64-NEXT:    andb $60, %sil
  ; X64-NEXT:    btsq %rsi, %rax
  ; X64-NEXT:    retq
  ;
  ; X86-LABEL: bts_64_mask_zeros:
  ; X86:       # %bb.0:
-; X86-NEXT:    movb {{[0-9]+}}(%esp), %ch
-; X86-NEXT:    shlb $2, %ch
-; X86-NEXT:    movb %ch, %cl
-; X86-NEXT:    andb $60, %cl
+; X86-NEXT:    movb {{[0-9]+}}(%esp), %cl
+; X86-NEXT:    shlb $2, %cl
  ; X86-NEXT:    movl $1, %eax
  ; X86-NEXT:    xorl %edx, %edx
  ; X86-NEXT:    shldl %cl, %eax, %edx
-; X86-NEXT:    movb %ch, %cl
-; X86-NEXT:    andb $28, %cl
  ; X86-NEXT:    shll %cl, %eax
-; X86-NEXT:    testb $32, %ch
+; X86-NEXT:    testb $32, %cl
  ; X86-NEXT:    je .LBB40_2
  ; X86-NEXT:  # %bb.1:
  ; X86-NEXT:    movl %eax, %edx
@@ -1105,23 +1089,18 @@ define i64 @btc_64_mask_zeros(i64 %x, i64 %n) {
  ; X64:       # %bb.0:
  ; X64-NEXT:    movq %rdi, %rax
  ; X64-NEXT:    shlb $2, %sil
-; X64-NEXT:    andb $60, %sil
  ; X64-NEXT:    btcq %rsi, %rax
  ; X64-NEXT:    retq
  ;
  ; X86-LABEL: btc_64_mask_zeros:
  ; X86:       # %bb.0:
-; X86-NEXT:    movb {{[0-9]+}}(%esp), %ch
-; X86-NEXT:    shlb $2, %ch
-; X86-NEXT:    movb %ch, %cl
-; X86-NEXT:    andb $60, %cl
+; X86-NEXT:    movb {{[0-9]+}}(%esp), %cl
+; X86-NEXT:    shlb $2, %cl
  ; X86-NEXT:    movl $1, %eax
  ; X86-NEXT:    xorl %edx, %edx
  ; X86-NEXT:    shldl %cl, %eax, %edx
-; X86-NEXT:    movb %ch, %cl
-; X86-NEXT:    andb $28, %cl
  ; X86-NEXT:    shll %cl, %eax
-; X86-NEXT:    testb $32, %ch
+; X86-NEXT:    testb $32, %cl
  ; X86-NEXT:    je .LBB41_2
  ; X86-NEXT:  # %bb.1:
  ; X86-NEXT:    movl %eax, %edx
diff --git a/llvm/test/CodeGen/X86/rotate4.ll b/llvm/test/CodeGen/X86/rotate4.ll

index 91edff1..7f5e426 100644 (file)
--- a/llvm/test/CodeGen/X86/rotate4.ll
+++ b/llvm/test/CodeGen/X86/rotate4.ll
@@ -636,7 +636,6 @@ define i32 @rotate_demanded_bits_3(i32, i32) {
  ; X86-NEXT:    movl {{[0-9]+}}(%esp), %eax
  ; X86-NEXT:    movb {{[0-9]+}}(%esp), %cl
  ; X86-NEXT:    addb %cl, %cl
-; X86-NEXT:    andb $30, %cl
  ; X86-NEXT:    roll %cl, %eax
  ; X86-NEXT:    retl
  ;
@@ -645,7 +644,6 @@ define i32 @rotate_demanded_bits_3(i32, i32) {
  ; X64-NEXT:    # kill: def $esi killed $esi def $rsi
  ; X64-NEXT:    movl %edi, %eax
  ; X64-NEXT:    leal (%rsi,%rsi), %ecx
-; X64-NEXT:    andb $30, %cl
  ; X64-NEXT:    # kill: def $cl killed $cl killed $ecx
  ; X64-NEXT:    roll %cl, %eax
  ; X64-NEXT:    retq
author	Craig Topper <craig.topper@intel.com>
	Mon, 25 Feb 2019 19:42:47 +0000 (19:42 +0000)
committer	Craig Topper <craig.topper@intel.com>
	Mon, 25 Feb 2019 19:42:47 +0000 (19:42 +0000)
llvm/lib/Target/X86/X86ISelDAGToDAG.cpp		patch \| blob \| history
llvm/lib/Target/X86/X86InstrCompiler.td		patch \| blob \| history
llvm/test/CodeGen/X86/btc_bts_btr.ll		patch \| blob \| history
llvm/test/CodeGen/X86/rotate4.ll		patch \| blob \| history