Adjust launch_bounds annotation for AMD hardware. (#17555)

author Johannes M Dieterich <johannes.dieterich@amd.com>
Fri, 1 Mar 2019 06:53:34 +0000 (22:53 -0800)
committer Facebook Github Bot <facebook-github-bot@users.noreply.github.com>
Fri, 1 Mar 2019 06:59:11 +0000 (22:59 -0800)
diff --git a/aten/src/THCUNN/SpatialDilatedMaxPooling.cu b/aten/src/THCUNN/SpatialDilatedMaxPooling.cu
index d0213b1..e1202e0 100644
--- a/aten/src/THCUNN/SpatialDilatedMaxPooling.cu
+++ b/aten/src/THCUNN/SpatialDilatedMaxPooling.cu
@@ -48,7 +48,11 @@ __global__ void MaxPoolForward(const int nthreads, const Dtype* bottom_data,
  const int BACKWARD_THREADS = 256;
  
  template <typename Dtype, typename AccType>
+#if defined (__HIP_PLATFORM_HCC__)
+C10_LAUNCH_BOUNDS(BACKWARD_THREADS, 4)
+#else
  C10_LAUNCH_BOUNDS(BACKWARD_THREADS, 8)
+#endif
  __global__ void MaxPoolBackward(const int nthreads, const Dtype* top_diff,
      const int64_t* top_mask, const int num, const int channels,
      const int height, const int width, const int pooled_height,
author	Johannes M Dieterich <johannes.dieterich@amd.com>
	Fri, 1 Mar 2019 06:53:34 +0000 (22:53 -0800)
committer	Facebook Github Bot <facebook-github-bot@users.noreply.github.com>
	Fri, 1 Mar 2019 06:59:11 +0000 (22:59 -0800)