Don't claim the udiv created in BypassSlowDivision is exact.

author Justin Lebar <jlebar@google.com>

Fri, 28 Oct 2016 21:43:51 +0000 (21:43 +0000)

committer Justin Lebar <jlebar@google.com>

Fri, 28 Oct 2016 21:43:51 +0000 (21:43 +0000)
author Justin Lebar <jlebar@google.com>
Fri, 28 Oct 2016 21:43:51 +0000 (21:43 +0000)
committer Justin Lebar <jlebar@google.com>
Fri, 28 Oct 2016 21:43:51 +0000 (21:43 +0000)
diff --git a/llvm/lib/Transforms/Utils/BypassSlowDivision.cpp b/llvm/lib/Transforms/Utils/BypassSlowDivision.cpp

index 42287d3..41a8543 100644 (file)
--- a/llvm/lib/Transforms/Utils/BypassSlowDivision.cpp
+++ b/llvm/lib/Transforms/Utils/BypassSlowDivision.cpp
@@ -120,8 +120,7 @@ static bool insertFastDiv(Instruction *I, IntegerType *BypassType,
                                                   BypassType);
  
    // udiv/urem because optimization only handles positive numbers
-  Value *ShortQuotientV = FastBuilder.CreateExactUDiv(ShortDividendV,
-                                                      ShortDivisorV);
+  Value *ShortQuotientV = FastBuilder.CreateUDiv(ShortDividendV, ShortDivisorV);
    Value *ShortRemainderV = FastBuilder.CreateURem(ShortDividendV,
                                                    ShortDivisorV);
    Value *FastQuotientV = FastBuilder.CreateCast(Instruction::ZExt,
diff --git a/llvm/test/Transforms/CodeGenPrepare/NVPTX/bypass-slow-div-not-exact.ll b/llvm/test/Transforms/CodeGenPrepare/NVPTX/bypass-slow-div-not-exact.ll

new file mode 100644 (file)

index 0000000..9db23d6
--- /dev/null
+++ b/llvm/test/Transforms/CodeGenPrepare/NVPTX/bypass-slow-div-not-exact.ll
@@ -0,0 +1,16 @@
+; RUN: opt -S -codegenprepare < %s | FileCheck %s
+
+target datalayout = "e-i64:64-v16:16-v32:32-n16:32:64"
+target triple = "nvptx64-nvidia-cuda"
+
+; Check that the smaller-width division that the BypassSlowDivision pass
+; creates is not marked as "exact" (that is, it doesn't claim that the
+; numerator is a multiple of the denominator).
+;
+; CHECK-LABEL: @test
+define void @test(i64 %a, i64 %b, i64* %retptr) {
+  ; CHECK: udiv i32
+  %d = sdiv i64 %a, %b
+  store i64 %d, i64* %retptr
+  ret void
+}
author	Justin Lebar <jlebar@google.com>
	Fri, 28 Oct 2016 21:43:51 +0000 (21:43 +0000)
committer	Justin Lebar <jlebar@google.com>
	Fri, 28 Oct 2016 21:43:51 +0000 (21:43 +0000)
llvm/lib/Transforms/Utils/BypassSlowDivision.cpp		patch \| blob \| history
llvm/test/Transforms/CodeGenPrepare/NVPTX/bypass-slow-div-not-exact.ll	[new file with mode: 0644]	patch \| blob