[libomptarget][nvptx] Fix build, second symbol reordering

author JonChesterfield <jonathanchesterfield@gmail.com>

Thu, 19 Dec 2019 02:00:26 +0000 (02:00 +0000)

committer JonChesterfield <jonathanchesterfield@gmail.com>

Thu, 19 Dec 2019 02:02:44 +0000 (02:02 +0000)
author JonChesterfield <jonathanchesterfield@gmail.com>
Thu, 19 Dec 2019 02:00:26 +0000 (02:00 +0000)
committer JonChesterfield <jonathanchesterfield@gmail.com>
Thu, 19 Dec 2019 02:02:44 +0000 (02:02 +0000)
diff --git a/openmp/libomptarget/deviceRTLs/amdgcn/src/target_impl.h b/openmp/libomptarget/deviceRTLs/amdgcn/src/target_impl.h

index 4e82329..9b7b8e3 100644 (file)
--- a/openmp/libomptarget/deviceRTLs/amdgcn/src/target_impl.h
+++ b/openmp/libomptarget/deviceRTLs/amdgcn/src/target_impl.h
@@ -124,8 +124,6 @@ INLINE __kmpc_impl_lanemask_t __kmpc_impl_activemask() {
    return __ballot64(1);
  }
  
-EXTERN bool __kmpc_impl_is_first_active_thread();
-
  EXTERN int32_t __kmpc_impl_shfl_sync(__kmpc_impl_lanemask_t, int32_t Var,
                                       int32_t SrcLane);
  
@@ -157,6 +155,8 @@ INLINE int GetBlockIdInKernel() { return __builtin_amdgcn_workgroup_id_x(); }
  INLINE int GetNumberOfBlocksInKernel() { return __ockl_get_num_groups(0); }
  INLINE int GetNumberOfThreadsInBlock() { return __ockl_get_local_size(0); }
  
+EXTERN bool __kmpc_impl_is_first_active_thread();
+
  // Locks
  EXTERN void __kmpc_impl_init_lock(omp_lock_t *lock);
  EXTERN void __kmpc_impl_destroy_lock(omp_lock_t *lock);
diff --git a/openmp/libomptarget/deviceRTLs/nvptx/src/target_impl.h b/openmp/libomptarget/deviceRTLs/nvptx/src/target_impl.h

index 8461a93..6d58528 100644 (file)
--- a/openmp/libomptarget/deviceRTLs/nvptx/src/target_impl.h
+++ b/openmp/libomptarget/deviceRTLs/nvptx/src/target_impl.h
@@ -133,15 +133,6 @@ INLINE __kmpc_impl_lanemask_t __kmpc_impl_activemask() {
  #endif
  }
  
-// Return true if this is the first active thread in the warp.
-INLINE bool __kmpc_impl_is_first_active_thread() {
-  unsigned long long Mask = __kmpc_impl_activemask();
-  unsigned long long ShNum = WARPSIZE - (GetThreadIdInBlock() % WARPSIZE);
-  unsigned long long Sh = Mask << ShNum;
-  // Truncate Sh to the 32 lower bits
-  return (unsigned)Sh == 0;
-}
-
  // In Cuda 9.0, the *_sync() version takes an extra argument 'mask'.
  
  INLINE int32_t __kmpc_impl_shfl_sync(__kmpc_impl_lanemask_t Mask, int32_t Var,
@@ -197,6 +188,15 @@ INLINE int GetBlockIdInKernel() { return blockIdx.x; }
  INLINE int GetNumberOfBlocksInKernel() { return gridDim.x; }
  INLINE int GetNumberOfThreadsInBlock() { return blockDim.x; }
  
+// Return true if this is the first active thread in the warp.
+INLINE bool __kmpc_impl_is_first_active_thread() {
+  unsigned long long Mask = __kmpc_impl_activemask();
+  unsigned long long ShNum = WARPSIZE - (GetThreadIdInBlock() % WARPSIZE);
+  unsigned long long Sh = Mask << ShNum;
+  // Truncate Sh to the 32 lower bits
+  return (unsigned)Sh == 0;
+}
+
  // Locks
  EXTERN void __kmpc_impl_init_lock(omp_lock_t *lock);
  EXTERN void __kmpc_impl_destroy_lock(omp_lock_t *lock);
author	JonChesterfield <jonathanchesterfield@gmail.com>
	Thu, 19 Dec 2019 02:00:26 +0000 (02:00 +0000)
committer	JonChesterfield <jonathanchesterfield@gmail.com>
	Thu, 19 Dec 2019 02:02:44 +0000 (02:02 +0000)
openmp/libomptarget/deviceRTLs/amdgcn/src/target_impl.h		patch \| blob \| history
openmp/libomptarget/deviceRTLs/nvptx/src/target_impl.h		patch \| blob \| history