2 # Beginning of user configuration
5 # This library's version
8 # If you set the suffix, the library name will be libopenblas_$(LIBNAMESUFFIX).a
9 # and libopenblas_$(LIBNAMESUFFIX).so. Meanwhile, the soname in shared library
10 # is libopenblas_$(LIBNAMESUFFIX).so.0.
13 # You can specify the target architecture, otherwise it's
14 # automatically detected.
17 # If you want to support multiple architectures in one binary
20 # C compiler including binary type(32bit / 64bit). Default is gcc.
21 # Don't use Intel Compiler or PGI, it won't generate right codes as I expect.
24 # Fortran compiler. Default is g77.
27 # You can even specify a cross compiler. In that case, please set HOSTCC.
29 # cross compiler for Windows
30 # CC = x86_64-w64-mingw32-gcc
31 # FC = x86_64-w64-mingw32-gfortran
33 # cross compiler for 32bit ARM
34 # CC = arm-linux-gnueabihf-gcc
35 # FC = arm-linux-gnueabihf-gfortran
37 # cross compiler for 64bit ARM
38 # CC = aarch64-linux-gnu-gcc
39 # FC = aarch64-linux-gnu-gfortran
42 # If you use the cross compiler, please set this host compiler.
45 # If you need 32bit binary, define BINARY=32, otherwise define BINARY=64
48 # About threaded BLAS. It will be automatically detected if you don't
50 # For force setting for single threaded, specify USE_THREAD = 0
51 # For force setting for multi threaded, specify USE_THREAD = 1
54 # If you're going to use this library with OpenMP, please comment it in.
55 # This flag is always set for POWER8. Don't modify the flag
58 # You can define maximum number of threads. Basically it should be
59 # less than actual number of cores. If you don't specify one, it's
60 # automatically detected by the script.
63 # if you don't need to install the static library, please comment it in.
66 # if you don't need to generate the shared library, please comment it in.
69 # If you don't need CBLAS interface, please comment it in.
72 # If you only want CBLAS interface without installing Fortran compiler,
73 # please comment it in.
76 # If you don't need LAPACK, please comment it in.
77 # If you set NO_LAPACK=1, the library automatically sets NO_LAPACKE=1.
80 # If you don't need LAPACKE (C Interface to LAPACK), please comment it in.
83 # Build LAPACK Deprecated functions since LAPACK 3.6.0
84 BUILD_LAPACK_DEPRECATED = 1
86 # Build RecursiveLAPACK on top of LAPACK
89 # If you want to use legacy threaded Level 3 implementation.
90 # USE_SIMPLE_THREADED_LEVEL3 = 1
92 # If you want to drive whole 64bit region by BLAS. Not all Fortran
93 # compilers support this. It's safe to keep it commented out if you
94 # are not sure(equivalent to "-i8" option).
97 # Unfortunately most of kernel won't give us high quality buffer.
98 # BLAS tries to find the best region before entering main function,
99 # but it will consume time. If you don't like it, you can disable one.
102 # If you want to disable CPU/Memory affinity on Linux.
105 # if you are compiling for Linux and you have more than 16 numa nodes or more than 256 cpus
108 # Don't use AVX kernel on Sandy Bridge. It is compatible with old compilers
109 # and OS. However, the performance is low.
112 # Don't use Haswell optimizations if binutils is too old (e.g. RHEL6)
115 # Don't use parallel make.
116 # NO_PARALLEL_MAKE = 1
118 # Force number of make jobs. The default is the number of logical CPU of the host.
119 # This is particularly useful when using distcc.
120 # A negative value will disable adding a -j flag to make, allowing to use a parent
121 # make -j value. This is useful to call OpenBLAS make from another project
125 # If you would like to know minute performance report of GotoBLAS.
126 # FUNCTION_PROFILE = 1
128 # Support for IEEE quad precision(it's *real* REAL*16)( under testing)
131 # Threads are still working for a while after finishing BLAS operation
132 # to reduce thread activate/deactivate overhead. You can determine
133 # time out to improve performance. This number should be from 4 to 30
134 # which corresponds to (1 << n) cycles. For example, if you set to 26,
135 # thread will be running for (1 << 26) cycles(about 25ms on 3.0GHz
136 # system). Also you can control this number by THREAD_TIMEOUT
137 # CCOMMON_OPT += -DTHREAD_TIMEOUT=26
139 # Using special device driver for mapping physically contiguous memory
140 # to the user space. If bigphysarea is enabled, it will use it.
141 # DEVICEDRIVER_ALLOCATION = 1
143 # If you need to synchronize FP CSR between threads (for x86/x86_64 only).
144 # CONSISTENT_FPCSR = 1
146 # If any gemm argument m, n or k is less than or equal to this threshold, gemm will be executed
147 # with single thread. You can use this flag to avoid the overhead of multi-threading
148 # in small matrix sizes. The default value is 4.
149 # GEMM_MULTITHREAD_THRESHOLD = 4
151 # If you need sanity check by comparing reference BLAS. It'll be very
152 # slow (Not implemented yet).
155 # The installation directory.
156 # PREFIX = /opt/OpenBLAS
158 # Common Optimization Flag;
159 # The default -O2 is enough.
160 # Flags for POWER8 are defined in Makefile.power. Don't modify COMMON_OPT
163 # gfortran option for LAPACK
164 # enable this flag only on 64bit Linux and if you need a thread safe lapack library
165 # Flags for POWER8 are defined in Makefile.power. Don't modify FCOMMON_OPT
166 # FCOMMON_OPT = -frecursive
171 # Build Debug version
174 # Set maximum stack allocation.
175 # The default value is 2048. 0 disables stack allocation and may reduce GER and GEMV
176 # performance. For details, https://github.com/xianyi/OpenBLAS/pull/482
178 # MAX_STACK_ALLOC = 0
180 # Add a prefix or suffix to all exported symbol names in the shared library.
181 # Avoid conflicts with other BLAS libraries, especially when using
182 # 64 bit integer interfaces in OpenBLAS.
183 # For details, https://github.com/xianyi/OpenBLAS/pull/459
185 # The same prefix and suffix are also added to the library name,
186 # i.e. you get lib$(SYMBOLPREFIX)openblas$(SYMBOLSUFFIX) rather than libopenblas
192 # End of user configuration