Fixed #395. Enable optimized cgemm for Sandybridge. Added optimized sdot kernel.
[platform/upstream/openblas.git] / kernel / x86_64 / KERNEL.BARCELONA
# GEMV kernel selection: each variable names the assembly source file used for
# one GEMV variant (the N and T forms are set separately).
# Only S- and Z-prefixed GEMV variables are assigned in the visible lines.
# NOTE(review): S/Z presumably mean single-precision real / double-precision
# complex, following the usual BLAS naming — confirm against the consuming makefile.
1 SGEMVNKERNEL = sgemv_n.S
2 SGEMVTKERNEL = sgemv_t.S
3
# The Z "N" variant points at a "_dup" file while the "T" variant does not;
# the reason is not visible here.
4 ZGEMVNKERNEL = zgemv_n_dup.S
5 ZGEMVTKERNEL = zgemv_t.S
6
# SGEMM configuration: the kernel source, four copy-routine sources
# (INCOPY / ITCOPY / ONCOPY / OTCOPY), and the object file name for each copy routine.
# The IN/IT copy routines are C sources taken from ../generic (names end in _8);
# the ON/OT copy routines are opteron assembly sources (names end in _4).
# NOTE(review): the _8 / _4 suffixes presumably correspond to the 8x4 in the
# kernel file name — confirm.
7 SGEMMKERNEL    =  gemm_kernel_8x4_barcelona.S
8 SGEMMINCOPY    =  ../generic/gemm_ncopy_8.c
9 SGEMMITCOPY    =  ../generic/gemm_tcopy_8.c
10 SGEMMONCOPY    =  gemm_ncopy_4_opteron.S
11 SGEMMOTCOPY    =  gemm_tcopy_4_opteron.S
# Object names are composed from $(TSUFFIX) and $(SUFFIX); neither is defined in
# the visible lines, so they are presumably provided by whatever includes this file.
12 SGEMMINCOPYOBJ =  sgemm_incopy$(TSUFFIX).$(SUFFIX)
13 SGEMMITCOPYOBJ =  sgemm_itcopy$(TSUFFIX).$(SUFFIX)
14 SGEMMONCOPYOBJ =  sgemm_oncopy$(TSUFFIX).$(SUFFIX)
15 SGEMMOTCOPYOBJ =  sgemm_otcopy$(TSUFFIX).$(SUFFIX)
# DGEMM configuration: the kernel source, copy-routine sources, and copy-routine object names.
# The IN/IT copy sources and their object names are deliberately assigned empty
# values; only the ON/OT copy routines are set.
# NOTE(review): presumably no separate inner copy is needed for the 4x4 kernel
# because both dimensions match the _4 outer copy routines — confirm.
16 DGEMMKERNEL    =  gemm_kernel_4x4_barcelona.S
17 DGEMMINCOPY    =
18 DGEMMITCOPY    =
19 DGEMMONCOPY    =  gemm_ncopy_4_opteron.S
20 DGEMMOTCOPY    =  gemm_tcopy_4_opteron.S
21 DGEMMINCOPYOBJ =
22 DGEMMITCOPYOBJ =
# $(TSUFFIX) and $(SUFFIX) are not defined in the visible lines.
23 DGEMMONCOPYOBJ =  dgemm_oncopy$(TSUFFIX).$(SUFFIX)
24 DGEMMOTCOPYOBJ =  dgemm_otcopy$(TSUFFIX).$(SUFFIX)
# CGEMM configuration: the kernel source, four copy-routine sources, and copy-routine object names.
# Every source assigned here is a zgemm_* file even though the variables are C-prefixed.
# NOTE(review): presumably the zgemm_* sources are shared between the C and Z
# variants and specialized at build time — confirm.
25 CGEMMKERNEL    =  zgemm_kernel_4x2_barcelona.S
# IN/IT copy routines are C sources from ../generic (names end in _4);
# ON/OT copy routines are assembly sources (names end in _2).
26 CGEMMINCOPY    =  ../generic/zgemm_ncopy_4.c
27 CGEMMITCOPY    =  ../generic/zgemm_tcopy_4.c
28 CGEMMONCOPY    =  zgemm_ncopy_2.S
29 CGEMMOTCOPY    =  zgemm_tcopy_2.S
# Object names use the cgemm_ prefix; $(TSUFFIX) and $(SUFFIX) are not defined
# in the visible lines.
30 CGEMMINCOPYOBJ =  cgemm_incopy$(TSUFFIX).$(SUFFIX)
31 CGEMMITCOPYOBJ =  cgemm_itcopy$(TSUFFIX).$(SUFFIX)
32 CGEMMONCOPYOBJ =  cgemm_oncopy$(TSUFFIX).$(SUFFIX)
33 CGEMMOTCOPYOBJ =  cgemm_otcopy$(TSUFFIX).$(SUFFIX)
# ZGEMM configuration: the kernel source, copy-routine sources, and copy-routine object names.
# The IN/IT copy sources and their object names are assigned empty values;
# only the ON/OT copy routines are set.
# NOTE(review): presumably no separate inner copy is needed for the 2x2 kernel
# because both dimensions match the _2 outer copy routines — confirm.
34 ZGEMMKERNEL    =  zgemm_kernel_2x2_barcelona.S
35 ZGEMMINCOPY    =
36 ZGEMMITCOPY    =
37 ZGEMMONCOPY    =  zgemm_ncopy_2.S
38 ZGEMMOTCOPY    =  zgemm_tcopy_2.S
39 ZGEMMINCOPYOBJ =
40 ZGEMMITCOPYOBJ =
# $(TSUFFIX) and $(SUFFIX) are not defined in the visible lines.
41 ZGEMMONCOPYOBJ =  zgemm_oncopy$(TSUFFIX).$(SUFFIX)
42 ZGEMMOTCOPYOBJ =  zgemm_otcopy$(TSUFFIX).$(SUFFIX)
43
# STRSM kernel sources for the four variants LN, LT, RN, RT (8x4 SSE assembly files).
# RN is assigned the same source file as LT; no separate RN file is referenced.
# NOTE(review): presumably the shared LT source is compiled differently for RN — confirm.
44 STRSMKERNEL_LN  =  trsm_kernel_LN_8x4_sse.S
45 STRSMKERNEL_LT  =  trsm_kernel_LT_8x4_sse.S
46 STRSMKERNEL_RN  =  trsm_kernel_LT_8x4_sse.S
47 STRSMKERNEL_RT  =  trsm_kernel_RT_8x4_sse.S
48
# DTRSM kernel sources for the four variants LN, LT, RN, RT (4x4 barcelona assembly files).
# RN is assigned the same source file as LT; no separate RN file is referenced.
# NOTE(review): presumably the shared LT source is compiled differently for RN — confirm.
49 DTRSMKERNEL_LN  =  trsm_kernel_LN_4x4_barcelona.S
50 DTRSMKERNEL_LT  =  trsm_kernel_LT_4x4_barcelona.S
51 DTRSMKERNEL_RN  =  trsm_kernel_LT_4x4_barcelona.S
52 DTRSMKERNEL_RT  =  trsm_kernel_RT_4x4_barcelona.S
53
# CTRSM kernel sources for the four variants LN, LT, RN, RT.
# All four point at ztrsm_* 4x2 SSE files even though the variables are C-prefixed.
# RN is assigned the same source file as LT; no separate RN file is referenced.
# NOTE(review): presumably the ztrsm_* sources are shared with the Z variant and
# the LT source is reused for RN via build-time flags — confirm.
54 CTRSMKERNEL_LN  =  ztrsm_kernel_LN_4x2_sse.S
55 CTRSMKERNEL_LT  =  ztrsm_kernel_LT_4x2_sse.S
56 CTRSMKERNEL_RN  =  ztrsm_kernel_LT_4x2_sse.S
57 CTRSMKERNEL_RT  =  ztrsm_kernel_RT_4x2_sse.S
58
# ZTRSM kernel sources for the four variants LN, LT, RN, RT (2x2 SSE2 assembly files).
# RN is assigned the same source file as LT; no separate RN file is referenced.
# NOTE(review): presumably the shared LT source is compiled differently for RN — confirm.
59 ZTRSMKERNEL_LN  =  ztrsm_kernel_LN_2x2_sse2.S
60 ZTRSMKERNEL_LT  =  ztrsm_kernel_LT_2x2_sse2.S
61 ZTRSMKERNEL_RN  =  ztrsm_kernel_LT_2x2_sse2.S
62 ZTRSMKERNEL_RT  =  ztrsm_kernel_RT_2x2_sse2.S
63
# GEMM3M kernel sources for the C and Z variants.
# Both point at zgemm3m_kernel_* barcelona files: 8x4 for C, 4x4 for Z.
# NOTE(review): these sizes match the 8x4 / 4x4 in the SGEMM / DGEMM kernel file
# names, which presumably is intentional — confirm.
64 CGEMM3MKERNEL    =  zgemm3m_kernel_8x4_barcelona.S
65 ZGEMM3MKERNEL    =  zgemm3m_kernel_4x4_barcelona.S