Allow targets to prefer TypeSplitVector over TypePromoteInteger when computing the...

author Justin Holewinski <jholewinski@nvidia.com>

Thu, 29 Nov 2012 14:26:24 +0000 (14:26 +0000)

committer Justin Holewinski <jholewinski@nvidia.com>

Thu, 29 Nov 2012 14:26:24 +0000 (14:26 +0000)
author Justin Holewinski <jholewinski@nvidia.com>
Thu, 29 Nov 2012 14:26:24 +0000 (14:26 +0000)
committer Justin Holewinski <jholewinski@nvidia.com>
Thu, 29 Nov 2012 14:26:24 +0000 (14:26 +0000)
diff --git a/llvm/include/llvm/Target/TargetLowering.h b/llvm/include/llvm/Target/TargetLowering.h

index 580a30f..aaa5f51 100644 (file)
--- a/llvm/include/llvm/Target/TargetLowering.h
+++ b/llvm/include/llvm/Target/TargetLowering.h
@@ -159,6 +159,11 @@ public:
  
    virtual bool isSelectSupported(SelectSupportKind kind) const { return true; }
  
+  /// shouldSplitVectorElementType - Return true if a vector of the given type
+  /// should be split (TypeSplitVector) instead of promoted
+  /// (TypePromoteInteger) during type legalization.
+  virtual bool shouldSplitVectorElementType(EVT VT) const { return false; }
+
    /// isIntDivCheap() - Return true if integer divide is usually cheaper than
    /// a sequence of several shifts, adds, and multiplies for this target.
    bool isIntDivCheap() const { return IntDivIsCheap; }
diff --git a/llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp b/llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp

index 794935d..9ddcf7a 100644 (file)
--- a/llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp
+++ b/llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp
@@ -825,7 +825,7 @@ void TargetLowering::computeRegisterProperties() {
      // that wider vector type.
      EVT EltVT = VT.getVectorElementType();
      unsigned NElts = VT.getVectorNumElements();
-    if (NElts != 1) {
+    if (NElts != 1 && !shouldSplitVectorElementType(EltVT)) {
        bool IsLegalWiderType = false;
        // First try to promote the elements of integer vectors. If no legal
        // promotion was found, fallback to the widen-vector method.
diff --git a/llvm/lib/Target/NVPTX/NVPTXISelLowering.cpp b/llvm/lib/Target/NVPTX/NVPTXISelLowering.cpp

index f1a99d7..a6f7e25 100644 (file)
--- a/llvm/lib/Target/NVPTX/NVPTXISelLowering.cpp
+++ b/llvm/lib/Target/NVPTX/NVPTXISelLowering.cpp
@@ -271,6 +271,9 @@ const char *NVPTXTargetLowering::getTargetNodeName(unsigned Opcode) const {
    }
  }
  
+bool NVPTXTargetLowering::shouldSplitVectorElementType(EVT VT) const {
+  return VT == MVT::i1;
+}
  
  SDValue
  NVPTXTargetLowering::LowerGlobalAddress(SDValue Op, SelectionDAG &DAG) const {
diff --git a/llvm/lib/Target/NVPTX/NVPTXISelLowering.h b/llvm/lib/Target/NVPTX/NVPTXISelLowering.h

index 94a177c..0a1833a 100644 (file)
--- a/llvm/lib/Target/NVPTX/NVPTXISelLowering.h
+++ b/llvm/lib/Target/NVPTX/NVPTXISelLowering.h
@@ -92,6 +92,8 @@ public:
    virtual unsigned getFunctionAlignment(const Function *F) const;
  
    virtual EVT getSetCCResultType(EVT VT) const {
+    if (VT.isVector())
+      return MVT::getVectorVT(MVT::i1, VT.getVectorNumElements());
      return MVT::i1;
    }
  
@@ -129,6 +131,8 @@ public:
      return MVT::i32;
    }
  
+  virtual bool shouldSplitVectorElementType(EVT VT) const;
+
  private:
    const NVPTXSubtarget &nvptxSubtarget;  // cache the subtarget here
  
diff --git a/llvm/test/CodeGen/NVPTX/vector-compare.ll b/llvm/test/CodeGen/NVPTX/vector-compare.ll

new file mode 100644 (file)

index 0000000..2180499
--- /dev/null
+++ b/llvm/test/CodeGen/NVPTX/vector-compare.ll
@@ -0,0 +1,19 @@
+; RUN: llc < %s -march=nvptx -mcpu=sm_20
+; RUN: llc < %s -march=nvptx64 -mcpu=sm_20
+
+; This test makes sure that the result of vector compares are properly
+; scalarized.  If codegen fails, then the type legalizer incorrectly
+; tried to promote <2 x i1> to <2 x i8> and instruction selection failed.
+
+define void @foo(<2 x i32>* %a, <2 x i32>* %b, i32* %r1, i32* %r2) {
+  %aval = load <2 x i32>* %a
+  %bval = load <2 x i32>* %b
+  %res = icmp slt <2 x i32> %aval, %bval
+  %t1 = extractelement <2 x i1> %res, i32 0
+  %t2 = extractelement <2 x i1> %res, i32 1
+  %t1a = zext i1 %t1 to i32
+  %t2a = zext i1 %t2 to i32
+  store i32 %t1a, i32* %r1
+  store i32 %t2a, i32* %r2
+  ret void
+}
author	Justin Holewinski <jholewinski@nvidia.com>
	Thu, 29 Nov 2012 14:26:24 +0000 (14:26 +0000)
committer	Justin Holewinski <jholewinski@nvidia.com>
	Thu, 29 Nov 2012 14:26:24 +0000 (14:26 +0000)
llvm/include/llvm/Target/TargetLowering.h		patch \| blob \| history
llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp		patch \| blob \| history
llvm/lib/Target/NVPTX/NVPTXISelLowering.cpp		patch \| blob \| history
llvm/lib/Target/NVPTX/NVPTXISelLowering.h		patch \| blob \| history
llvm/test/CodeGen/NVPTX/vector-compare.ll	[new file with mode: 0644]	patch \| blob