[PPC] altivec.h functions for converting half precision to single precision.

author Sean Fertile <sfertile@ca.ibm.com>

Mon, 14 Nov 2016 18:47:15 +0000 (18:47 +0000)

committer Sean Fertile <sfertile@ca.ibm.com>

Mon, 14 Nov 2016 18:47:15 +0000 (18:47 +0000)
author Sean Fertile <sfertile@ca.ibm.com>
Mon, 14 Nov 2016 18:47:15 +0000 (18:47 +0000)
committer Sean Fertile <sfertile@ca.ibm.com>
Mon, 14 Nov 2016 18:47:15 +0000 (18:47 +0000)
diff --git a/clang/include/clang/Basic/BuiltinsPPC.def b/clang/include/clang/Basic/BuiltinsPPC.def

index c258e43187932528a6ec794e2fef9548af6fc6d8..f87a892b003d9c09ccd5a9861b2e9318dfe6f07f 100644 (file)
--- a/clang/include/clang/Basic/BuiltinsPPC.def
+++ b/clang/include/clang/Basic/BuiltinsPPC.def
@@ -402,6 +402,7 @@ BUILTIN(__builtin_vsx_xvcvuxdsp, "V4fV2ULLi", "")
  BUILTIN(__builtin_vsx_xvcvdpsp, "V4fV2d", "")
  
  BUILTIN(__builtin_vsx_xvcvsphp, "V4fV4f", "")
+BUILTIN(__builtin_vsx_xvcvhpsp, "V4fV8Us", "") // vector of 8 unsigned short in, vector of 4 float out
  
  // Vector Test Data Class builtins
  BUILTIN(__builtin_vsx_xvtstdcdp, "V2ULLiV2dIi", "")
diff --git a/clang/lib/Headers/altivec.h b/clang/lib/Headers/altivec.h

index 8a5312bd141d42d5d89b5f50ae400fd5de5cf8ea..66e0359d37fda28e2ce8f712cb595ae22f0dda20 100644 (file)
--- a/clang/lib/Headers/altivec.h
+++ b/clang/lib/Headers/altivec.h
@@ -12322,6 +12322,27 @@ vec_extract_sig (vector double __a) {
    return __builtin_vsx_xvxsigdp(__a);
  }
  
+static __inline__ vector float __ATTRS_o_ai /* Convert elements 0-3 of __a from half to single precision. */
+vec_extract_fp32_from_shorth(vector unsigned short __a) {
+  vector unsigned short __b = /* the four selected elements, one in every other lane */
+#ifdef __LITTLE_ENDIAN__ /* sources go to even lanes; index -1 leaves a lane unspecified */
+            __builtin_shufflevector(__a, __a, 0, -1, 1, -1, 2, -1, 3, -1);
+#else /* !__LITTLE_ENDIAN__: sources go to odd lanes instead */
+            __builtin_shufflevector(__a, __a, -1, 0, -1, 1, -1, 2, -1, 3);
+#endif /* __LITTLE_ENDIAN__ */
+  return __builtin_vsx_xvcvhpsp(__b); /* builtin maps the 8 x short vector to a 4 x float vector */
+}
+
+static __inline__ vector float __ATTRS_o_ai /* Convert elements 4-7 of __a from half to single precision. */
+vec_extract_fp32_from_shortl(vector unsigned short __a) {
+  vector unsigned short __b = /* the four selected elements, one in every other lane */
+#ifdef __LITTLE_ENDIAN__ /* sources go to even lanes; index -1 leaves a lane unspecified */
+            __builtin_shufflevector(__a, __a, 4, -1, 5, -1, 6, -1, 7, -1);
+#else /* !__LITTLE_ENDIAN__: sources go to odd lanes instead */
+            __builtin_shufflevector(__a, __a, -1, 4, -1, 5, -1, 6, -1, 7);
+#endif /* __LITTLE_ENDIAN__ */
+  return __builtin_vsx_xvcvhpsp(__b); /* builtin maps the 8 x short vector to a 4 x float vector */
+}
  #endif /* __POWER9_VECTOR__ */
  
  /* vec_insert */
diff --git a/clang/test/CodeGen/builtins-ppc-p9vector.c b/clang/test/CodeGen/builtins-ppc-p9vector.c

index c14ad71ea5e98c424e65548bafb925b68929a48d..80c6a43e1f03b8a6b678b2b00230ecdac4c01d50 100644 (file)
--- a/clang/test/CodeGen/builtins-ppc-p9vector.c
+++ b/clang/test/CodeGen/builtins-ppc-p9vector.c
@@ -967,3 +967,21 @@ vector bool long long test87(void) {
  // CHECK-NEXT: ret <2 x i64>
    return vec_test_data_class(vda, __VEC_CLASS_FP_NOT_NORMAL);
  }
+vector float test88(void) { // verifies the IR emitted for vec_extract_fp32_from_shorth
+// CHECK-BE: shufflevector <8 x i16> {{.+}}, <8 x i16> {{.+}}, <8 x i32> <i32 undef, i32 0, i32 undef, i32 1, i32 undef, i32 2, i32 undef, i32 3>
+// CHECK-BE: @llvm.ppc.vsx.xvcvhpsp(<8 x i16> {{.+}})
+// CHECK-BE-NEXT: ret <4 x float>
+// CHECK-LE: shufflevector <8 x i16> {{.+}}, <8 x i16> {{.+}}, <8 x i32> <i32 0, i32 undef, i32 1, i32 undef, i32 2, i32 undef, i32 3, i32 undef>
+// CHECK-LE: @llvm.ppc.vsx.xvcvhpsp(<8 x i16> {{.+}})
+// CHECK-LE-NEXT: ret <4 x float>
+  return vec_extract_fp32_from_shorth(vusa); // vusa is declared outside this hunk
+}
+vector float test89(void) { // verifies the IR emitted for vec_extract_fp32_from_shortl
+// CHECK-BE: shufflevector <8 x i16> {{.+}}, <8 x i16> {{.+}}, <8 x i32> <i32 undef, i32 4, i32 undef, i32 5, i32 undef, i32 6, i32 undef, i32 7>
+// CHECK-BE: @llvm.ppc.vsx.xvcvhpsp(<8 x i16> {{.+}})
+// CHECK-BE-NEXT: ret <4 x float>
+// CHECK-LE: shufflevector <8 x i16> {{.+}}, <8 x i16> {{.+}}, <8 x i32> <i32 4, i32 undef, i32 5, i32 undef, i32 6, i32 undef, i32 7, i32 undef>
+// CHECK-LE: @llvm.ppc.vsx.xvcvhpsp(<8 x i16> {{.+}})
+// CHECK-LE-NEXT: ret <4 x float>
+  return vec_extract_fp32_from_shortl(vusa); // vusa is declared outside this hunk
+}
author	Sean Fertile <sfertile@ca.ibm.com>
	Mon, 14 Nov 2016 18:47:15 +0000 (18:47 +0000)
committer	Sean Fertile <sfertile@ca.ibm.com>
	Mon, 14 Nov 2016 18:47:15 +0000 (18:47 +0000)
clang/include/clang/Basic/BuiltinsPPC.def		patch \| blob \| history
clang/lib/Headers/altivec.h		patch \| blob \| history
clang/test/CodeGen/builtins-ppc-p9vector.c		patch \| blob \| history