From: wernsaar Date: Thu, 21 Aug 2014 11:02:53 +0000 (+0200) Subject: added optimized dsymv_L kernel for bulldozer X-Git-Tag: v0.2.12^2~11^2~23 X-Git-Url: http://review.tizen.org/git/?a=commitdiff_plain;h=f6f9122660ee8be175b61dd91abc1a86e9bb4a7e;p=platform%2Fupstream%2Fopenblas.git added optimized dsymv_L kernel for bulldozer --- diff --git a/kernel/x86_64/dsymv_L.c b/kernel/x86_64/dsymv_L.c new file mode 100644 index 0000000..29e3aa2 --- /dev/null +++ b/kernel/x86_64/dsymv_L.c @@ -0,0 +1,299 @@ +/*************************************************************************** +Copyright (c) 2013, The OpenBLAS Project +All rights reserved. +Redistribution and use in source and binary forms, with or without +modification, are permitted provided that the following conditions are +met: +1. Redistributions of source code must retain the above copyright +notice, this list of conditions and the following disclaimer. +2. Redistributions in binary form must reproduce the above copyright +notice, this list of conditions and the following disclaimer in +the documentation and/or other materials provided with the +distribution. +3. Neither the name of the OpenBLAS project nor the names of +its contributors may be used to endorse or promote products +derived from this software without specific prior written permission. +THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" +AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE +IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE +ARE DISCLAIMED. IN NO EVENT SHALL THE OPENBLAS PROJECT OR CONTRIBUTORS BE +LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL +DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR +SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER +CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, +OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE +USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. +*****************************************************************************/ + + +#include "common.h" + +#if defined(BULLDOZER) +#include "dsymv_L_microk_bulldozer-2.c" +#elif defined(NEHALEM) +#include "dsymv_U_microk_nehalem-2.c" +#endif + + +#ifndef HAVE_KERNEL_4x4 + +static void dsymv_kernel_4x4(BLASLONG from, BLASLONG to, FLOAT **ap, FLOAT *x, FLOAT *y, FLOAT *tmp1, FLOAT *temp2) +{ + FLOAT tmp2[4] = { 0.0, 0.0, 0.0, 0.0 }; + BLASLONG i; + + for (i=from; i=12 ) + { + BLASLONG m2 = (m/4)*4; + for (i=j+1; i j+4 ) + dsymv_kernel_4x4(j+4,m2,ap,x,y,tmp1,tmp2); + + + for (i=m2; i=8 ) + { + BLASLONG j1 = ((from + 4)/4)*4; + BLASLONG j2 = (m/4)*4; + for (i=from; i