From: Sanjay Patel Date: Tue, 17 Dec 2019 17:07:28 +0000 (-0500) Subject: [SDAG] remove use restriction in isNegatibleForFree() when called from getNegatedExpr... X-Git-Tag: llvmorg-11-init~1929 X-Git-Url: http://review.tizen.org/git/?a=commitdiff_plain;h=36b1232ec5f370ab9fe8fcff0458d2fca5ca9b7f;p=platform%2Fupstream%2Fllvm.git [SDAG] remove use restriction in isNegatibleForFree() when called from getNegatedExpression() This is an alternate fix for the bug discussed in D70595. This also includes minimal tests for other in-tree targets to show the problem more generally. We check the number of uses as a predicate for whether some value is free to negate, but that use count can change as we rewrite the expression in getNegatedExpression(). So something that was marked free to negate during the cost evaluation phase becomes not free to negate during the rewrite phase (or the inverse - something that was not free becomes free). This can lead to a crash/assert because we expect that everything in an expression that is negatible to be handled in the corresponding code within getNegatedExpression(). This patch adds a hack to work-around the case where we probably no longer detect that either multiply operand of an FMA isNegatibleForFree which is assumed to be true when we started rewriting the expression. Differential Revision: https://reviews.llvm.org/D70975 --- diff --git a/llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp b/llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp index 53cbe9d..c3d6d32 100644 --- a/llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp +++ b/llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp @@ -5631,7 +5631,14 @@ SDValue TargetLowering::getNegatedExpression(SDValue Op, SelectionDAG &DAG, ForCodeSize, Depth + 1); char V1 = isNegatibleForFree(Op.getOperand(1), DAG, LegalOperations, ForCodeSize, Depth + 1); - if (V0 >= V1) { + // TODO: This is a hack. It is possible that costs have changed between now + // and the initial calls to isNegatibleForFree(). 
That is because we + // are rewriting the expression, and that may change the number of + // uses (and therefore the cost) of values. If the negation costs are + // equal, only negate this value if it is a constant. Otherwise, try + // operand 1. A better fix would eliminate uses as a cost factor or + // track the change in uses as we rewrite the expression. + if (V0 > V1 || (V0 == V1 && isa<ConstantFPSDNode>(Op.getOperand(0)))) { // fold (fneg (fma X, Y, Z)) -> (fma (fneg X), Y, (fneg Z)) SDValue Neg0 = getNegatedExpression( Op.getOperand(0), DAG, LegalOperations, ForCodeSize, Depth + 1); diff --git a/llvm/test/CodeGen/AArch64/arm64-fmadd.ll b/llvm/test/CodeGen/AArch64/arm64-fmadd.ll index 203ce62..dffa83a 100644 --- a/llvm/test/CodeGen/AArch64/arm64-fmadd.ll +++ b/llvm/test/CodeGen/AArch64/arm64-fmadd.ll @@ -88,5 +88,23 @@ entry: ret double %0 } +; This would crash while trying getNegatedExpression(). + +define float @negated_constant(float %x) { +; CHECK-LABEL: negated_constant: +; CHECK: // %bb.0: +; CHECK-NEXT: mov w8, #-1037565952 +; CHECK-NEXT: mov w9, #1109917696 +; CHECK-NEXT: fmov s1, w8 +; CHECK-NEXT: fmul s1, s0, s1 +; CHECK-NEXT: fmov s2, w9 +; CHECK-NEXT: fmadd s0, s0, s2, s1 +; CHECK-NEXT: ret + %m = fmul float %x, 42.0 + %fma = call nsz float @llvm.fma.f32(float %x, float -42.0, float %m) + %nfma = fneg float %fma + ret float %nfma +} + declare float @llvm.fma.f32(float, float, float) nounwind readnone declare double @llvm.fma.f64(double, double, double) nounwind readnone diff --git a/llvm/test/CodeGen/X86/fma-fneg-combine-2.ll b/llvm/test/CodeGen/X86/fma-fneg-combine-2.ll index f9e8795..bc1e1be 100644 --- a/llvm/test/CodeGen/X86/fma-fneg-combine-2.ll +++ b/llvm/test/CodeGen/X86/fma-fneg-combine-2.ll @@ -45,15 +45,15 @@ entry: define float @test_fneg_fma_subx_suby_negz_f32(float %w, float %x, float %y, float %z) { ; FMA3-LABEL: test_fneg_fma_subx_suby_negz_f32: ; FMA3: # %bb.0: # %entry -; FMA3-NEXT: vsubss %xmm0, %xmm1, %xmm1 -; FMA3-NEXT: vsubss %xmm2, %xmm0, %xmm0 
+; FMA3-NEXT: vsubss %xmm1, %xmm0, %xmm1 +; FMA3-NEXT: vsubss %xmm0, %xmm2, %xmm0 ; FMA3-NEXT: vfmadd213ss {{.*#+}} xmm0 = (xmm1 * xmm0) + xmm3 ; FMA3-NEXT: retq ; ; FMA4-LABEL: test_fneg_fma_subx_suby_negz_f32: ; FMA4: # %bb.0: # %entry -; FMA4-NEXT: vsubss %xmm0, %xmm1, %xmm1 -; FMA4-NEXT: vsubss %xmm2, %xmm0, %xmm0 +; FMA4-NEXT: vsubss %xmm1, %xmm0, %xmm1 +; FMA4-NEXT: vsubss %xmm0, %xmm2, %xmm0 ; FMA4-NEXT: vfmaddss %xmm3, %xmm0, %xmm1, %xmm0 ; FMA4-NEXT: retq entry: @@ -86,4 +86,24 @@ entry: ret float %1 } +; This would crash while trying getNegatedExpression(). + +define float @negated_constant(float %x) { +; FMA3-LABEL: negated_constant: +; FMA3: # %bb.0: +; FMA3-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm1 +; FMA3-NEXT: vfmadd132ss {{.*#+}} xmm0 = (xmm0 * mem) + xmm1 +; FMA3-NEXT: retq +; +; FMA4-LABEL: negated_constant: +; FMA4: # %bb.0: +; FMA4-NEXT: vmulss {{.*}}(%rip), %xmm0, %xmm1 +; FMA4-NEXT: vfmaddss %xmm1, {{.*}}(%rip), %xmm0, %xmm0 +; FMA4-NEXT: retq + %m = fmul float %x, 42.0 + %fma = call nsz float @llvm.fma.f32(float %x, float -42.0, float %m) + %nfma = fneg float %fma + ret float %nfma +} + declare float @llvm.fma.f32(float, float, float)