[HIP][NFC] Use correct max in cuda_complex_builtins

author Aaron En Ye Shi <enye.shi@gmail.com>

Tue, 27 Oct 2020 19:08:58 +0000 (19:08 +0000)

committer Aaron En Ye Shi <enye.shi@gmail.com>

Tue, 27 Oct 2020 19:35:09 +0000 (19:35 +0000)
author Aaron En Ye Shi <enye.shi@gmail.com>
Tue, 27 Oct 2020 19:08:58 +0000 (19:08 +0000)
committer Aaron En Ye Shi <enye.shi@gmail.com>
Tue, 27 Oct 2020 19:35:09 +0000 (19:35 +0000)
diff --git a/clang/lib/Headers/__clang_cuda_complex_builtins.h b/clang/lib/Headers/__clang_cuda_complex_builtins.h

index 8c10ff6..9b254f7 100644 (file)
--- a/clang/lib/Headers/__clang_cuda_complex_builtins.h
+++ b/clang/lib/Headers/__clang_cuda_complex_builtins.h
@@ -41,6 +41,27 @@
  #define _ABSf std::abs
  #define _LOGBd std::logb
  #define _LOGBf std::logb
+// Rather than pulling in std::max from algorithm everytime, use available ::max.
+#define _fmaxd max
+#define _fmaxf max
+#else
+#ifdef __AMDGCN__
+#define _ISNANd __ocml_isnan_f64
+#define _ISNANf __ocml_isnan_f32
+#define _ISINFd __ocml_isinf_f64
+#define _ISINFf __ocml_isinf_f32
+#define _ISFINITEd __ocml_isfinite_f64
+#define _ISFINITEf __ocml_isfinite_f32
+#define _COPYSIGNd __ocml_copysign_f64
+#define _COPYSIGNf __ocml_copysign_f32
+#define _SCALBNd __ocml_scalbn_f64
+#define _SCALBNf __ocml_scalbn_f32
+#define _ABSd __ocml_fabs_f64
+#define _ABSf __ocml_fabs_f32
+#define _LOGBd __ocml_logb_f64
+#define _LOGBf __ocml_logb_f32
+#define _fmaxd __ocml_fmax_f64
+#define _fmaxf __ocml_fmax_f32
  #else
  #define _ISNANd __nv_isnand
  #define _ISNANf __nv_isnanf
@@ -56,6 +77,9 @@
  #define _ABSf __nv_fabsf
  #define _LOGBd __nv_logb
  #define _LOGBf __nv_logbf
+#define _fmaxd __nv_fmax
+#define _fmaxf __nv_fmaxf
+#endif
  #endif
  
  #if defined(__cplusplus)
@@ -167,7 +191,7 @@ __DEVICE__ double _Complex __divdc3(double __a, double __b, double __c,
    // Can't use std::max, because that's defined in <algorithm>, and we don't
    // want to pull that in for every compile.  The CUDA headers define
    // ::max(float, float) and ::max(double, double), which is sufficient for us.
-  double __logbw = _LOGBd(max(_ABSd(__c), _ABSd(__d)));
+  double __logbw = _LOGBd(_fmaxd(_ABSd(__c), _ABSd(__d)));
    if (_ISFINITEd(__logbw)) {
      __ilogbw = (int)__logbw;
      __c = _SCALBNd(__c, -__ilogbw);
@@ -200,7 +224,7 @@ __DEVICE__ double _Complex __divdc3(double __a, double __b, double __c,
  
  __DEVICE__ float _Complex __divsc3(float __a, float __b, float __c, float __d) {
    int __ilogbw = 0;
-  float __logbw = _LOGBf(max(_ABSf(__c), _ABSf(__d)));
+  float __logbw = _LOGBf(_fmaxf(_ABSf(__c), _ABSf(__d)));
    if (_ISFINITEf(__logbw)) {
      __ilogbw = (int)__logbw;
      __c = _SCALBNf(__c, -__ilogbw);
@@ -249,6 +273,8 @@ __DEVICE__ float _Complex __divsc3(float __a, float __b, float __c, float __d) {
  #undef _ABSf
  #undef _LOGBd
  #undef _LOGBf
+#undef _fmaxd
+#undef _fmaxf
  
  #ifdef _OPENMP
  #pragma omp end declare target
author	Aaron En Ye Shi <enye.shi@gmail.com>
	Tue, 27 Oct 2020 19:08:58 +0000 (19:08 +0000)
committer	Aaron En Ye Shi <enye.shi@gmail.com>
	Tue, 27 Oct 2020 19:35:09 +0000 (19:35 +0000)