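[AArch64] Fix incorrect getSetCCInverse usage within trySwapVSelectOperands.

ISD::getSetCCInverse expects the type of the values being compared, but trySwapVSelectOperands passed the SetCC result type; the inverse condition code is now computed from SetCC.getOperand(0).getValueType().
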
author Paul Walker <paul.walker@arm.com>
Thu, 17 Mar 2022 21:55:55 +0000 (21:55 +0000)
committer Paul Walker <paul.walker@arm.com>
Sat, 19 Mar 2022 12:36:14 +0000 (12:36 +0000)
diff --git a/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp b/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp

index c30a5ea..9e49ccb 100644 (file)
--- a/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp
+++ b/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp
@@ -17623,10 +17623,12 @@ static SDValue trySwapVSelectOperands(SDNode *N, SelectionDAG &DAG) {
    if (SelectA != SelectB.getOperand(0))
      return SDValue();
  
-  ISD::CondCode CC = cast<CondCodeSDNode>(SetCC->getOperand(2))->get();
-  auto InverseSetCC = DAG.getSetCC(
-      SDLoc(SetCC), SetCC.getValueType(), SetCC.getOperand(0),
-      SetCC.getOperand(1), ISD::getSetCCInverse(CC, SetCC.getValueType()));
+  ISD::CondCode CC = cast<CondCodeSDNode>(SetCC.getOperand(2))->get();
+  ISD::CondCode InverseCC =
+      ISD::getSetCCInverse(CC, SetCC.getOperand(0).getValueType());
+  auto InverseSetCC =
+      DAG.getSetCC(SDLoc(SetCC), SetCC.getValueType(), SetCC.getOperand(0),
+                   SetCC.getOperand(1), InverseCC);
  
    return DAG.getNode(ISD::VSELECT, SDLoc(N), NTy,
                       {InverseSetCC, SelectB, SelectA});
diff --git a/llvm/test/CodeGen/AArch64/sve-select.ll b/llvm/test/CodeGen/AArch64/sve-select.ll

index 3183e1e..4e4c659 100644 (file)
--- a/llvm/test/CodeGen/AArch64/sve-select.ll
+++ b/llvm/test/CodeGen/AArch64/sve-select.ll
@@ -547,7 +547,8 @@ define <vscale x 4 x float> @select_f32_invert_fmul(<vscale x 4 x float> %a, <vs
  ; CHECK-LABEL: select_f32_invert_fmul:
  ; CHECK:       // %bb.0:
  ; CHECK-NEXT:    ptrue p0.s
-; CHECK-NEXT:    fcmne p0.s, p0/z, z0.s, #0.0
+; CHECK-NEXT:    fcmeq p1.s, p0/z, z0.s, #0.0
+; CHECK-NEXT:    not p0.b, p0/z, p1.b
  ; CHECK-NEXT:    fmul z0.s, p0/m, z0.s, z1.s
  ; CHECK-NEXT:    ret
    %p = fcmp oeq <vscale x 4 x float> %a, zeroinitializer
@@ -560,7 +561,8 @@ define <vscale x 4 x float> @select_f32_invert_fadd(<vscale x 4 x float> %a, <vs
  ; CHECK-LABEL: select_f32_invert_fadd:
  ; CHECK:       // %bb.0:
  ; CHECK-NEXT:    ptrue p0.s
-; CHECK-NEXT:    fcmne p0.s, p0/z, z0.s, #0.0
+; CHECK-NEXT:    fcmeq p1.s, p0/z, z0.s, #0.0
+; CHECK-NEXT:    not p0.b, p0/z, p1.b
  ; CHECK-NEXT:    fadd z0.s, p0/m, z0.s, z1.s
  ; CHECK-NEXT:    ret
    %p = fcmp oeq <vscale x 4 x float> %a, zeroinitializer
@@ -569,14 +571,14 @@ define <vscale x 4 x float> @select_f32_invert_fadd(<vscale x 4 x float> %a, <vs
    ret <vscale x 4 x float> %sel
  }
  
-define <vscale x 4 x float> @select_f32_invert_fsub(<vscale x 4 x float> %a, <vscale x 4 x float> %b) {
+define <vscale x 4 x float> @select_f32_invert_fsub(<vscale x 4 x float> %a, <vscale x 4 x float> %b, <vscale x 4 x i32> %c) {
  ; CHECK-LABEL: select_f32_invert_fsub:
  ; CHECK:       // %bb.0:
  ; CHECK-NEXT:    ptrue p0.s
-; CHECK-NEXT:    fcmne p0.s, p0/z, z0.s, #0.0
+; CHECK-NEXT:    cmpne p0.s, p0/z, z2.s, #0
  ; CHECK-NEXT:    fsub z0.s, p0/m, z0.s, z1.s
  ; CHECK-NEXT:    ret
-  %p = fcmp oeq <vscale x 4 x float> %a, zeroinitializer
+  %p = icmp eq <vscale x 4 x i32> %c, zeroinitializer
    %fsub = fsub <vscale x 4 x float> %a, %b
    %sel = select <vscale x 4 x i1> %p, <vscale x 4 x float> %a, <vscale x 4 x float> %fsub
    ret <vscale x 4 x float> %sel
author	Paul Walker <paul.walker@arm.com>
	Thu, 17 Mar 2022 21:55:55 +0000 (21:55 +0000)
committer	Paul Walker <paul.walker@arm.com>
	Sat, 19 Mar 2022 12:36:14 +0000 (12:36 +0000)
llvm/lib/Target/AArch64/AArch64ISelLowering.cpp		patch | blob | history
llvm/test/CodeGen/AArch64/sve-select.ll		patch | blob | history