[X86] Recognize constant splats in LowerFCOPYSIGN.

author Craig Topper <craig.topper@intel.com>
Sun, 28 Oct 2018 23:51:35 +0000 (23:51 +0000)

committer Craig Topper <craig.topper@intel.com>
Sun, 28 Oct 2018 23:51:35 +0000 (23:51 +0000)
diff --git a/llvm/lib/Target/X86/X86ISelLowering.cpp b/llvm/lib/Target/X86/X86ISelLowering.cpp

index 060b36c868ec54a4b5106b8f96c01027102c5223..f2c5040b89e0718003a5e394116743fff8e089b8 100644 (file)
--- a/llvm/lib/Target/X86/X86ISelLowering.cpp
+++ b/llvm/lib/Target/X86/X86ISelLowering.cpp
@@ -18060,7 +18060,7 @@ static SDValue LowerFCOPYSIGN(SDValue Op, SelectionDAG &DAG) {
    // TODO: If we had general constant folding for FP logic ops, this check
    // wouldn't be necessary.
    SDValue MagBits;
-  if (ConstantFPSDNode *Op0CN = dyn_cast<ConstantFPSDNode>(Mag)) {
+  if (ConstantFPSDNode *Op0CN = isConstOrConstSplatFP(Mag)) {
      APFloat APF = Op0CN->getValueAPF();
      APF.clearSign();
      MagBits = DAG.getConstantFP(APF, dl, LogicVT);
diff --git a/llvm/test/CodeGen/X86/sse1-fcopysign.ll b/llvm/test/CodeGen/X86/sse1-fcopysign.ll

index 59598ecd5df6a116485fb6c02680e50defa52149..ed7f31e444cf3d6c30472759404e0cda8366a661 100644 (file)
--- a/llvm/test/CodeGen/X86/sse1-fcopysign.ll
+++ b/llvm/test/CodeGen/X86/sse1-fcopysign.ll
@@ -71,18 +71,16 @@ define <4 x float> @v4f32_neg(<4 x float> %a, <4 x float> %b) nounwind {
  define <4 x float> @v4f32_const_mag(<4 x float> %a, <4 x float> %b) nounwind {
  ; X86-LABEL: v4f32_const_mag:
  ; X86:       # %bb.0:
-; X86-NEXT:    andps {{\.LCPI.*}}, %xmm1
-; X86-NEXT:    movaps {{.*#+}} xmm0 = [1,1,1,1]
+; X86-NEXT:    movaps %xmm1, %xmm0
  ; X86-NEXT:    andps {{\.LCPI.*}}, %xmm0
-; X86-NEXT:    orps %xmm1, %xmm0
+; X86-NEXT:    orps {{\.LCPI.*}}, %xmm0
  ; X86-NEXT:    retl
  ;
  ; X64-LABEL: v4f32_const_mag:
  ; X64:       # %bb.0:
-; X64-NEXT:    andps {{.*}}(%rip), %xmm1
-; X64-NEXT:    movaps {{.*#+}} xmm0 = [1,1,1,1]
+; X64-NEXT:    movaps %xmm1, %xmm0
  ; X64-NEXT:    andps {{.*}}(%rip), %xmm0
-; X64-NEXT:    orps %xmm1, %xmm0
+; X64-NEXT:    orps {{.*}}(%rip), %xmm0
  ; X64-NEXT:    retq
    %tmp = tail call <4 x float> @llvm.copysign.v4f32(<4 x float> <float 1.0, float 1.0, float 1.0, float 1.0>, <4 x float> %b )
    ret <4 x float> %tmp
author	Craig Topper <craig.topper@intel.com>
	Sun, 28 Oct 2018 23:51:35 +0000 (23:51 +0000)
committer	Craig Topper <craig.topper@intel.com>
	Sun, 28 Oct 2018 23:51:35 +0000 (23:51 +0000)
llvm/lib/Target/X86/X86ISelLowering.cpp		patch | blob | history
llvm/test/CodeGen/X86/sse1-fcopysign.ll		patch | blob | history