powerpc: Optimized strcat for POWER8/PPC64
author: Adhemerval Zanella <azanella@linux.vnet.ibm.com>
Tue, 23 Dec 2014 18:36:34 +0000 (13:36 -0500)
committer: Adhemerval Zanella <azanella@linux.vnet.ibm.com>
Tue, 13 Jan 2015 16:28:36 +0000 (11:28 -0500)
With the new optimized strcpy for POWER8, this patch adds an optimized
strcat which uses it along with the default implementation at strings/.

ChangeLog
sysdeps/powerpc/powerpc64/multiarch/Makefile
sysdeps/powerpc/powerpc64/multiarch/ifunc-impl-list.c
sysdeps/powerpc/powerpc64/multiarch/strcat-power8.c [new file with mode: 0644]
sysdeps/powerpc/powerpc64/multiarch/strcat.c

index 7204573..744632a 100644 (file)
--- a/ChangeLog
+++ b/ChangeLog
@@ -1,6 +1,15 @@
 2015-01-13  Adhemerval Zanella  <azanella@linux.vnet.ibm.com>
 
        * sysdeps/powerpc/powerpc64/multiarch/Makefile [sysdep_routines]: Add
+       strcat-power8 object.
+       * sysdeps/powerpc/powerpc64/multiarch/strcat.c (strcat): Add
+       __strcat_power8 implementation.
+       * sysdeps/powerpc/powerpc64/multiarch/ifunc-impl-list.c
+       (__libc_ifunc_impl_list): Add __strcat_power8 implementation.
+       * sysdeps/powerpc/powerpc64/multiarch/strcat-power8.c: New file:
+       optimized strcat for power8.
+
+       * sysdeps/powerpc/powerpc64/multiarch/Makefile [sysdep_routines]: Add
        strcpy-power8 and stpcpy-power8 objects.
        * sysdeps/powerpc/powerpc64/multiarch/ifunc-impl-list.c
        (__libc_ifunc_impl_list): Add __strcpy_power8 and __stpcpy_power8
index f170551..74b2daa 100644 (file)
@@ -18,8 +18,8 @@ sysdep_routines += memcpy-power7 memcpy-a2 memcpy-power6 memcpy-cell \
                   strrchr-power7 strrchr-ppc64 strncat-power7 strncat-ppc64 \
                   strncpy-power7 strncpy-ppc64 \
                   stpncpy-power7 stpncpy-ppc64 strcmp-power7 strcmp-ppc64 \
-                  strcat-power7 strcat-ppc64 memmove-power7 memmove-ppc64 \
-                  bcopy-ppc64
+                  strcat-power8 strcat-power7 strcat-ppc64 memmove-power7 \
+                  memmove-ppc64 bcopy-ppc64
 
 CFLAGS-strncase-power7.c += -mcpu=power7 -funroll-loops
 CFLAGS-strncase_l-power7.c += -mcpu=power7 -funroll-loops
index 88c8234..dbb21fd 100644 (file)
@@ -303,6 +303,9 @@ __libc_ifunc_impl_list (const char *name, struct libc_ifunc_impl *array,
   /* Support sysdeps/powerpc/powerpc64/multiarch/strcat.c.  */
   IFUNC_IMPL (i, name, strcat,
              IFUNC_IMPL_ADD (array, i, strcat,
+                             hwcap2 & PPC_FEATURE2_ARCH_2_07,
+                             __strcat_power8)
+             IFUNC_IMPL_ADD (array, i, strcat,
                              hwcap & PPC_FEATURE_HAS_VSX,
                              __strcat_power7)
              IFUNC_IMPL_ADD (array, i, strcat, 1,
diff --git a/sysdeps/powerpc/powerpc64/multiarch/strcat-power8.c b/sysdeps/powerpc/powerpc64/multiarch/strcat-power8.c
new file mode 100644 (file)
index 0000000..6c7544c
--- /dev/null
@@ -0,0 +1,30 @@
+/* Copyright (C) 2015 Free Software Foundation, Inc.
+   This file is part of the GNU C Library.
+
+   The GNU C Library is free software; you can redistribute it and/or
+   modify it under the terms of the GNU Lesser General Public
+   License as published by the Free Software Foundation; either
+   version 2.1 of the License, or (at your option) any later version.
+
+   The GNU C Library is distributed in the hope that it will be useful,
+   but WITHOUT ANY WARRANTY; without even the implied warranty of
+   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+   Lesser General Public License for more details.
+
+   You should have received a copy of the GNU Lesser General Public
+   License along with the GNU C Library; if not, see
+   <http://www.gnu.org/licenses/>.  */
+
+#include <string.h>
+
+#define STRCAT __strcat_power8
+
+#undef libc_hidden_def
+#define libc_hidden_def(name)
+
+extern typeof (strcpy) __strcpy_power8;
+extern typeof (strlen) __strlen_power7;
+
+#define strcpy __strcpy_power8
+#define strlen __strlen_power7
+#include <sysdeps/powerpc/strcat.c>
index af188d3..4708a9a 100644 (file)
 
 extern __typeof (strcat) __strcat_ppc attribute_hidden;
 extern __typeof (strcat) __strcat_power7 attribute_hidden;
+extern __typeof (strcat) __strcat_power8 attribute_hidden;
 
 libc_ifunc (strcat,
-            (hwcap & PPC_FEATURE_HAS_VSX)
-            ? __strcat_power7
+            (hwcap2 & PPC_FEATURE2_ARCH_2_07)
+            ? __strcat_power8 :
+              (hwcap & PPC_FEATURE_HAS_VSX)
+              ? __strcat_power7
             : __strcat_ppc);
 #endif