[x86] Fix bugs of some intrinsic functions in CLANG : _mm512_stream_ps, _mm512_stream_pd, _mm512_stream_si512

author Pengfei Wang <pengfei.wang@intel.com>

Tue, 3 Sep 2019 02:06:15 +0000 (02:06 +0000)

committer Pengfei Wang <pengfei.wang@intel.com>

Tue, 3 Sep 2019 02:06:15 +0000 (02:06 +0000)
author Pengfei Wang <pengfei.wang@intel.com>
Tue, 3 Sep 2019 02:06:15 +0000 (02:06 +0000)
committer Pengfei Wang <pengfei.wang@intel.com>
Tue, 3 Sep 2019 02:06:15 +0000 (02:06 +0000)
diff --git a/clang/lib/Headers/avx512fintrin.h b/clang/lib/Headers/avx512fintrin.h

index 5748c1e..4e341a1 100644 (file)
--- a/clang/lib/Headers/avx512fintrin.h
+++ b/clang/lib/Headers/avx512fintrin.h
@@ -8436,7 +8436,7 @@ _store_mask16(__mmask16 *__A, __mmask16 __B) {
  }
  
  static __inline__ void __DEFAULT_FN_ATTRS512
-_mm512_stream_si512 (__m512i * __P, __m512i __A)
+_mm512_stream_si512 (void * __P, __m512i __A)
  {
    typedef __v8di __v8di_aligned __attribute__((aligned(64)));
    __builtin_nontemporal_store((__v8di_aligned)__A, (__v8di_aligned*)__P);
@@ -8450,14 +8450,14 @@ _mm512_stream_load_si512 (void const *__P)
  }
  
  static __inline__ void __DEFAULT_FN_ATTRS512
-_mm512_stream_pd (double *__P, __m512d __A)
+_mm512_stream_pd (void *__P, __m512d __A)
  {
    typedef __v8df __v8df_aligned __attribute__((aligned(64)));
    __builtin_nontemporal_store((__v8df_aligned)__A, (__v8df_aligned*)__P);
  }
  
  static __inline__ void __DEFAULT_FN_ATTRS512
-_mm512_stream_ps (float *__P, __m512 __A)
+_mm512_stream_ps (void *__P, __m512 __A)
  {
    typedef __v16sf __v16sf_aligned __attribute__((aligned(64)));
    __builtin_nontemporal_store((__v16sf_aligned)__A, (__v16sf_aligned*)__P);
diff --git a/clang/test/CodeGen/avx512f-builtins.c b/clang/test/CodeGen/avx512f-builtins.c

index aaf3157..2a083e3 100644 (file)
--- a/clang/test/CodeGen/avx512f-builtins.c
+++ b/clang/test/CodeGen/avx512f-builtins.c
@@ -8575,6 +8575,12 @@ void test_mm512_stream_si512(__m512i * __P, __m512i __A) {
    _mm512_stream_si512(__P, __A); 
  }
  
+void test_mm512_stream_si512_2(void * __P, __m512i __A) {
+  // CHECK-LABEL: @test_mm512_stream_si512
+  // CHECK: store <8 x i64> %{{.*}}, <8 x i64>* %{{.*}}, align 64, !nontemporal
+  _mm512_stream_si512(__P, __A); 
+}
+
  __m512i test_mm512_stream_load_si512(void *__P) {
    // CHECK-LABEL: @test_mm512_stream_load_si512
    // CHECK: load <8 x i64>, <8 x i64>* %{{.*}}, align 64, !nontemporal
@@ -8593,12 +8599,23 @@ void test_mm512_stream_pd(double *__P, __m512d __A) {
    return _mm512_stream_pd(__P, __A); 
  }
  
+void test_mm512_stream_pd_2(void *__P, __m512d __A) {
+  // CHECK-LABEL: @test_mm512_stream_pd
+  // CHECK: store <8 x double> %{{.*}}, <8 x double>* %{{.*}}, align 64, !nontemporal
+  return _mm512_stream_pd(__P, __A); 
+}
+
  void test_mm512_stream_ps(float *__P, __m512 __A) {
    // CHECK-LABEL: @test_mm512_stream_ps
    // CHECK: store <16 x float> %{{.*}}, <16 x float>* %{{.*}}, align 64, !nontemporal
    _mm512_stream_ps(__P, __A); 
  }
  
+void test_mm512_stream_ps_2(void *__P, __m512 __A) {
+  // CHECK-LABEL: @test_mm512_stream_ps
+  // CHECK: store <16 x float> %{{.*}}, <16 x float>* %{{.*}}, align 64, !nontemporal
+  _mm512_stream_ps(__P, __A); 
+}
  __m512d test_mm512_mask_compress_pd(__m512d __W, __mmask8 __U, __m512d __A) {
    // CHECK-LABEL: @test_mm512_mask_compress_pd
    // CHECK: @llvm.x86.avx512.mask.compress
author	Pengfei Wang <pengfei.wang@intel.com>
	Tue, 3 Sep 2019 02:06:15 +0000 (02:06 +0000)
committer	Pengfei Wang <pengfei.wang@intel.com>
	Tue, 3 Sep 2019 02:06:15 +0000 (02:06 +0000)
clang/lib/Headers/avx512fintrin.h		patch | blob | history
clang/test/CodeGen/avx512f-builtins.c		patch | blob | history