projects
/
platform
/
upstream
/
tvm.git
/ commitdiff
commit
grep
author
committer
pickaxe
?
search:
re
summary
|
shortlog
|
log
|
commit
| commitdiff |
tree
raw
|
patch
| inline |
side by side
(parent:
4332b0a
)
add more syncs (#3151)
author
Leyuan Wang
<laurawly@gmail.com>
Thu, 9 May 2019 15:44:47 +0000
(08:44 -0700)
committer
Tianqi Chen
<tqchen@users.noreply.github.com>
Thu, 9 May 2019 15:44:47 +0000
(08:44 -0700)
topi/python/topi/cuda/nms.py
patch
|
blob
|
history
diff --git
a/topi/python/topi/cuda/nms.py
b/topi/python/topi/cuda/nms.py
index
5d04d72
..
0c27bd2
100644
(file)
--- a/
topi/python/topi/cuda/nms.py
+++ b/
topi/python/topi/cuda/nms.py
@@
-133,6
+133,9
@@
def get_valid_counts_upsweep(data, idx_in, idx, partial):
idx[bx * num_anchors + tx * elem_per_thread + i] = \
idx[bx * num_anchors + tx * elem_per_thread + i - 1] + \
idx_in[bx * num_anchors + tx * elem_per_thread + i]
+ ib.emit(tvm.make.Call(None, 'tvm_storage_sync',
+ tvm.convert(['shared']),
+ tvm.expr.Call.Intrinsic, None, 0))
return ib.get()
def get_valid_counts_scan(data, partial_in, partial):