DAG: Fix not legalizing vector fcanonicalizes

author Matt Arsenault <Matthew.Arsenault@amd.com>

Thu, 26 Apr 2018 19:21:37 +0000 (19:21 +0000)

committer Matt Arsenault <Matthew.Arsenault@amd.com>

Thu, 26 Apr 2018 19:21:37 +0000 (19:21 +0000)
author Matt Arsenault <Matthew.Arsenault@amd.com>
Thu, 26 Apr 2018 19:21:37 +0000 (19:21 +0000)
committer Matt Arsenault <Matthew.Arsenault@amd.com>
Thu, 26 Apr 2018 19:21:37 +0000 (19:21 +0000)
diff --git a/llvm/lib/CodeGen/SelectionDAG/LegalizeVectorOps.cpp b/llvm/lib/CodeGen/SelectionDAG/LegalizeVectorOps.cpp

index f8c2db0..a481acd 100644 (file)
--- a/llvm/lib/CodeGen/SelectionDAG/LegalizeVectorOps.cpp
+++ b/llvm/lib/CodeGen/SelectionDAG/LegalizeVectorOps.cpp
@@ -366,6 +366,7 @@ SDValue VectorLegalizer::LegalizeOp(SDValue Op) {
    case ISD::UMAX:
    case ISD::SMUL_LOHI:
    case ISD::UMUL_LOHI:
+  case ISD::FCANONICALIZE:
      QueryType = Node->getValueType(0);
      break;
    case ISD::FP_ROUND_INREG:
diff --git a/llvm/lib/Target/AMDGPU/SIISelLowering.cpp b/llvm/lib/Target/AMDGPU/SIISelLowering.cpp

index 0d71bdd..925fdce 100644 (file)
--- a/llvm/lib/Target/AMDGPU/SIISelLowering.cpp
+++ b/llvm/lib/Target/AMDGPU/SIISelLowering.cpp
@@ -479,6 +479,7 @@ SITargetLowering::SITargetLowering(const TargetMachine &TM,
      setOperationAction(ISD::FMA, MVT::v2f16, Legal);
      setOperationAction(ISD::FMINNUM, MVT::v2f16, Legal);
      setOperationAction(ISD::FMAXNUM, MVT::v2f16, Legal);
+    setOperationAction(ISD::FCANONICALIZE, MVT::v2f16, Legal);
  
      // This isn't really legal, but this avoids the legalizer unrolling it (and
      // allows matching fneg (fabs x) patterns)
diff --git a/llvm/test/CodeGen/AMDGPU/fcanonicalize.ll b/llvm/test/CodeGen/AMDGPU/fcanonicalize.ll

index c0ac659..1c6d176 100644 (file)
--- a/llvm/test/CodeGen/AMDGPU/fcanonicalize.ll
+++ b/llvm/test/CodeGen/AMDGPU/fcanonicalize.ll
@@ -7,6 +7,7 @@ declare double @llvm.canonicalize.f64(double) #0
  declare half @llvm.canonicalize.f16(half) #0
  declare <2 x half> @llvm.canonicalize.v2f16(<2 x half>) #0
  declare i32 @llvm.amdgcn.workitem.id.x() #0
+declare <2 x double> @llvm.canonicalize.v2f64(<2 x double>) #0
  
  ; GCN-LABEL: {{^}}v_test_canonicalize_var_f32:
  ; GCN: v_mul_f32_e32 [[REG:v[0-9]+]], 1.0, {{v[0-9]+}}
@@ -528,6 +529,18 @@ define amdgpu_kernel void @test_canonicalize_value_v2f16_denorm(<2 x half> addrs
    ret void
  }
  
+; GCN-LABEL: {{^}}v_test_canonicalize_var_v2f64:
+; GCN: v_max_f64
+; GCN: v_max_f64
+define amdgpu_kernel void @v_test_canonicalize_var_v2f64(<2 x double> addrspace(1)* %out) #1 {
+  %tid = call i32 @llvm.amdgcn.workitem.id.x()
+  %gep = getelementptr <2 x double>, <2 x double> addrspace(1)* %out, i32 %tid
+  %val = load <2 x double>, <2 x double> addrspace(1)* %gep
+  %canonicalized = call <2 x double> @llvm.canonicalize.v2f64(<2 x double> %val)
+  store <2 x double> %canonicalized, <2 x double> addrspace(1)* %out
+  ret void
+}
+
  attributes #0 = { nounwind readnone }
  attributes #1 = { nounwind }
  attributes #2 = { nounwind "target-features"="-fp32-denormals,-fp64-fp16-denormals" }
author	Matt Arsenault <Matthew.Arsenault@amd.com>
	Thu, 26 Apr 2018 19:21:37 +0000 (19:21 +0000)
committer	Matt Arsenault <Matthew.Arsenault@amd.com>
	Thu, 26 Apr 2018 19:21:37 +0000 (19:21 +0000)
llvm/lib/CodeGen/SelectionDAG/LegalizeVectorOps.cpp		patch | blob | history
llvm/lib/Target/AMDGPU/SIISelLowering.cpp		patch | blob | history
llvm/test/CodeGen/AMDGPU/fcanonicalize.ll		patch | blob | history