2 # Include user definition
5 # TO suppress recursive includes
12 NETLIB_LAPACK_DIR = $(TOPDIR)/lapack-netlib
15 # - Only set if not specified on the command line or inherited from the environment.
16 # - CC is an implicit variable so neither '?=' or 'ifndef' can be used.
17 # http://stackoverflow.com/questions/4029274/mingw-and-make-variables
18 # - Default value is 'cc' which is not always a valid command (e.g. MinGW).
19 ifeq ($(origin CC),default)
21 # Change the default compile to clang on Mac OSX.
22 # http://stackoverflow.com/questions/714100/os-detecting-makefile
23 UNAME_S := $(shell uname -s)
24 ifeq ($(UNAME_S),Darwin)
29 # Default Fortran compiler (FC) is selected by f_check.
32 include $(TOPDIR)/Makefile.rule
34 include $(TOPDIR)/$(MAKEFILE_RULE)
38 # Beginning of system configuration
46 GETARCH_FLAGS := -DFORCE_$(TARGET)
49 #TARGET_CORE will override TARGET which is used in DYNAMIC_ARCH=1.
52 GETARCH_FLAGS := -DFORCE_$(TARGET_CORE)
56 GETARCH_FLAGS += -DUSE64BITINT
59 ifndef GEMM_MULTITHREAD_THRESHOLD
60 GEMM_MULTITHREAD_THRESHOLD=4
62 GETARCH_FLAGS += -DGEMM_MULTITHREAD_THRESHOLD=$(GEMM_MULTITHREAD_THRESHOLD)
65 GETARCH_FLAGS += -DNO_AVX
72 ifeq ($(QUIET_MAKE), 1)
76 ifndef NO_PARALLEL_MAKE
79 GETARCH_FLAGS += -DNO_PARALLEL_MAKE=$(NO_PARALLEL_MAKE)
81 ifeq ($(HOSTCC), loongcc)
82 GETARCH_FLAGS += -static
85 # This operation is expensive, so execution should be once.
86 ifndef GOTOBLAS_MAKEFILE
87 export GOTOBLAS_MAKEFILE = 1
89 # Generating Makefile.conf and config.h
90 DUMMY := $(shell $(MAKE) -C $(TOPDIR) -f Makefile.prebuild CC="$(CC)" FC="$(FC)" HOSTCC="$(HOSTCC)" CFLAGS="$(GETARCH_FLAGS)" BINARY=$(BINARY) USE_OPENMP=$(USE_OPENMP) TARGET_CORE=$(TARGET_CORE) all)
93 include $(TOPDIR)/Makefile.conf
95 include $(TOPDIR)/Makefile_kernel.conf
101 NUM_THREADS = $(NUM_CORES)
104 ifeq ($(NUM_THREADS), 1)
105 override USE_THREAD = 0
109 ifeq ($(USE_THREAD), 0)
115 ifeq ($(NUM_THREAD), 1)
128 AR = $(CROSS_SUFFIX)ar
129 AS = $(CROSS_SUFFIX)as
130 LD = $(CROSS_SUFFIX)ld
131 RANLIB = $(CROSS_SUFFIX)ranlib
132 NM = $(CROSS_SUFFIX)nm
133 DLLWRAP = $(CROSS_SUFFIX)dllwrap
136 # OS dependent settings
139 ifeq ($(OSNAME), Darwin)
140 export MACOSX_DEPLOYMENT_TARGET=10.2
144 ifeq ($(OSNAME), FreeBSD)
148 ifeq ($(OSNAME), NetBSD)
152 ifeq ($(OSNAME), Linux)
156 ifeq ($(OSNAME), AIX)
160 ifeq ($(OSNAME), WINNT)
164 EXTRALIB += -defaultlib:advapi32
170 ifeq ($(C_COMPILER), CLANG)
171 CCOMMON_OPT += -DMS_ABI
174 ifeq ($(C_COMPILER), GCC)
175 #Test for supporting MS_ABI
176 GCCVERSIONGTEQ4 := $(shell expr `$(CC) -dumpversion | cut -f1 -d.` \>= 4)
177 GCCVERSIONGT4 := $(shell expr `$(CC) -dumpversion | cut -f1 -d.` \> 4)
178 GCCMINORVERSIONGTEQ7 := $(shell expr `$(CC) -dumpversion | cut -f2 -d.` \>= 7)
179 ifeq ($(GCCVERSIONGT4), 1)
180 # GCC Majar version > 4
181 # It is compatible with MSVC ABI.
182 CCOMMON_OPT += -DMS_ABI
185 ifeq ($(GCCVERSIONGTEQ4), 1)
186 ifeq ($(GCCMINORVERSIONGTEQ7), 1)
188 # It is compatible with MSVC ABI.
189 CCOMMON_OPT += -DMS_ABI
194 # Ensure the correct stack alignment on Win32
195 # http://permalink.gmane.org/gmane.comp.lib.openblas.general/97
197 CCOMMON_OPT += -mincoming-stack-boundary=2
198 FCOMMON_OPT += -mincoming-stack-boundary=2
203 ifeq ($(OSNAME), Interix)
207 INTERIX_TOOL_DIR = /opt/gcc.3.3/i586-pc-interix3/bin
210 ifeq ($(OSNAME), CYGWIN_NT)
215 ifneq ($(OSNAME), WINNT)
216 ifneq ($(OSNAME), CYGWIN_NT)
217 ifneq ($(OSNAME), Interix)
219 EXTRALIB += -lpthread
226 CCOMMON_OPT += -DQUAD_PRECISION
231 ifneq ($(ARCH), x86_64)
237 CCOMMON_OPT += -DUTEST_CHECK
242 CCOMMON_OPT += -DSANITY_CHECK -DREFNAME=$(*F)f$(BU)
246 # Architecture dependent settings
253 ifndef NO_EXPRECISION
254 ifeq ($(F_COMPILER), GFORTRAN)
255 # ifeq logical or. GCC or LSB
256 ifeq ($(C_COMPILER), $(filter $(C_COMPILER),GCC LSB))
258 CCOMMON_OPT += -DEXPRECISION -m128bit-long-double
259 FCOMMON_OPT += -m128bit-long-double
261 ifeq ($(C_COMPILER), CLANG)
263 CCOMMON_OPT += -DEXPRECISION
264 FCOMMON_OPT += -m128bit-long-double
270 ifeq ($(ARCH), x86_64)
271 ifndef NO_EXPRECISION
272 ifeq ($(F_COMPILER), GFORTRAN)
273 # ifeq logical or. GCC or LSB
274 ifeq ($(C_COMPILER), $(filter $(C_COMPILER),GCC LSB))
276 CCOMMON_OPT += -DEXPRECISION -m128bit-long-double
277 FCOMMON_OPT += -m128bit-long-double
279 ifeq ($(C_COMPILER), CLANG)
281 CCOMMON_OPT += -DEXPRECISION
282 FCOMMON_OPT += -m128bit-long-double
288 ifeq ($(C_COMPILER), INTEL)
289 CCOMMON_OPT += -wd981
292 ifeq ($(USE_OPENMP), 1)
293 # ifeq logical or. GCC or LSB
294 ifeq ($(C_COMPILER), $(filter $(C_COMPILER),GCC LSB))
295 CCOMMON_OPT += -fopenmp
298 ifeq ($(C_COMPILER), CLANG)
299 $(error OpenBLAS: Clang didn't support OpenMP yet.)
300 CCOMMON_OPT += -fopenmp
303 ifeq ($(C_COMPILER), INTEL)
304 CCOMMON_OPT += -openmp
307 ifeq ($(C_COMPILER), PGI)
311 ifeq ($(C_COMPILER), OPEN64)
313 CEXTRALIB += -lstdc++
316 ifeq ($(C_COMPILER), PATHSCALE)
322 ifeq ($(DYNAMIC_ARCH), 1)
324 DYNAMIC_CORE = KATMAI COPPERMINE NORTHWOOD PRESCOTT BANIAS \
325 CORE2 PENRYN DUNNINGTON NEHALEM ATHLON OPTERON OPTERON_SSE3 BARCELONA BOBCAT ATOM NANO
327 DYNAMIC_CORE += SANDYBRIDGE
328 #BULLDOZER PILEDRIVER
332 ifeq ($(ARCH), x86_64)
333 DYNAMIC_CORE = PRESCOTT CORE2 PENRYN DUNNINGTON NEHALEM OPTERON OPTERON_SSE3 BARCELONA BOBCAT ATOM NANO
335 DYNAMIC_CORE += SANDYBRIDGE
336 #BULLDOZER PILEDRIVER
349 ifeq ($(F_COMPILER), GFORTRAN)
350 ifeq ($(C_COMPILER), GCC)
352 # CCOMMON_OPT += -DEXPRECISION
357 ifeq ($(ARCH), mips64)
361 ifeq ($(ARCH), alpha)
371 ifeq ($(ARCH), arm64)
379 # C Compiler dependent settings
383 # ifeq logical or. GCC or CLANG or LSB
384 # http://stackoverflow.com/questions/7656425/makefile-ifeq-logical-or
385 ifeq ($(C_COMPILER), $(filter $(C_COMPILER),GCC CLANG LSB))
387 COMMON_PROF += -fno-inline
388 NO_UNINITIALIZED_WARN = -Wno-uninitialized
390 ifeq ($(QUIET_MAKE), 1)
391 CCOMMON_OPT += $(NO_UNINITIALIZED_WARN) -Wno-unused
396 ifeq ($(ARCH), mips64)
398 CCOMMON_OPT += -mabi=64
400 CCOMMON_OPT += -mabi=n32
405 ifeq ($(CORE), LOONGSON3A)
406 CCOMMON_OPT += -march=mips64
407 FCOMMON_OPT += -march=mips64
410 ifeq ($(CORE), LOONGSON3B)
411 CCOMMON_OPT += -march=mips64
412 FCOMMON_OPT += -march=mips64
415 ifeq ($(OSNAME), AIX)
421 ifndef BINARY_DEFINED
431 ifeq ($(C_COMPILER), PGI)
433 CCOMMON_OPT += -tp p7-64
435 CCOMMON_OPT += -tp p7
439 ifeq ($(C_COMPILER), PATHSCALE)
448 # Fortran Compiler dependent settings
451 ifeq ($(F_COMPILER), G77)
452 CCOMMON_OPT += -DF_INTERFACE_G77
454 ifndef NO_BINARY_MODE
463 ifeq ($(F_COMPILER), G95)
464 CCOMMON_OPT += -DF_INTERFACE_G95
466 ifndef NO_BINARY_MODE
475 ifeq ($(F_COMPILER), GFORTRAN)
476 CCOMMON_OPT += -DF_INTERFACE_GFORT
478 #Don't include -lgfortran, when NO_LAPACK=1 or lsbcc
479 ifneq ($(NO_LAPACK), 1)
480 ifneq ($(C_COMPILER), LSB)
481 EXTRALIB += -lgfortran
485 ifeq ($(ARCH), mips64)
487 FCOMMON_OPT += -mabi=64
489 FCOMMON_OPT += -mabi=n32
496 FCOMMON_OPT += -fdefault-integer-8
503 FCOMMON_OPT += -fopenmp
507 ifeq ($(F_COMPILER), INTEL)
508 CCOMMON_OPT += -DF_INTERFACE_INTEL
513 FCOMMON_OPT += -openmp
517 ifeq ($(F_COMPILER), FUJITSU)
518 CCOMMON_OPT += -DF_INTERFACE_FUJITSU
520 FCOMMON_OPT += -openmp
524 ifeq ($(F_COMPILER), IBM)
525 CCOMMON_OPT += -DF_INTERFACE_IBM
526 # FCOMMON_OPT += -qarch=440
530 FCOMMON_OPT += -qintsize=8
536 FCOMMON_OPT += -openmp
540 ifeq ($(F_COMPILER), PGI)
541 CCOMMON_OPT += -DF_INTERFACE_PGI
542 COMMON_PROF += -DPGICOMPILER
547 FCOMMON_OPT += -tp p7-64
549 FCOMMON_OPT += -tp p7
556 ifeq ($(F_COMPILER), PATHSCALE)
557 CCOMMON_OPT += -DF_INTERFACE_PATHSCALE
564 ifneq ($(ARCH), mips64)
572 FCOMMON_OPT += -mabi=64
574 FCOMMON_OPT += -mabi=n32
583 ifeq ($(F_COMPILER), OPEN64)
584 CCOMMON_OPT += -DF_INTERFACE_OPEN64
591 ifeq ($(ARCH), mips64)
597 ifeq ($(CORE), LOONGSON3A)
598 FCOMMON_OPT += -loongson3 -static
601 ifeq ($(CORE), LOONGSON3B)
602 FCOMMON_OPT += -loongson3 -static
614 FEXTRALIB += -lstdc++
619 ifeq ($(C_COMPILER), OPEN64)
621 ifeq ($(ARCH), mips64)
627 ifeq ($(CORE), LOONGSON3A)
628 CCOMMON_OPT += -loongson3 -static
631 ifeq ($(CORE), LOONGSON3B)
632 CCOMMON_OPT += -loongson3 -static
645 ifeq ($(C_COMPILER), SUN)
654 ifeq ($(F_COMPILER), SUN)
655 CCOMMON_OPT += -DF_INTERFACE_SUN
662 FCOMMON_OPT += -xopenmp=parallel
666 ifeq ($(F_COMPILER), COMPAQ)
667 CCOMMON_OPT += -DF_INTERFACE_COMPAQ
669 FCOMMON_OPT += -openmp
680 ifeq ($(NEED_PIC), 1)
681 ifeq ($(C_COMPILER), IBM)
682 CCOMMON_OPT += -qpic=large
686 ifeq ($(F_COMPILER), SUN)
693 ifeq ($(DYNAMIC_ARCH), 1)
694 CCOMMON_OPT += -DDYNAMIC_ARCH
697 ifeq ($(NO_LAPACK), 1)
698 CCOMMON_OPT += -DNO_LAPACK
699 #Disable LAPACK C interface
703 ifeq ($(NO_LAPACKE), 1)
704 CCOMMON_OPT += -DNO_LAPACKE
708 CCOMMON_OPT += -DNO_AVX
712 CCOMMON_OPT += -DSMP_SERVER
714 ifeq ($(ARCH), mips64)
715 ifneq ($(CORE), LOONGSON3B)
716 USE_SIMPLE_THREADED_LEVEL3 = 1
720 ifeq ($(USE_OPENMP), 1)
721 # USE_SIMPLE_THREADED_LEVEL3 = 1
723 CCOMMON_OPT += -DUSE_OPENMP
728 ifeq ($(NO_WARMUP), 1)
729 CCOMMON_OPT += -DNO_WARMUP
732 ifeq ($(CONSISTENT_FPCSR), 1)
733 CCOMMON_OPT += -DCONSISTENT_FPCSR
736 # Only for development
737 # CCOMMON_OPT += -DPARAMTEST
738 # CCOMMON_OPT += -DPREFETCHTEST
739 # CCOMMON_OPT += -DNO_SWITCHING
743 CCOMMON_OPT += -DUSE_PAPI
744 EXTRALIB += -lpapi -lperfctr
747 ifdef DYNAMIC_THREADS
748 CCOMMON_OPT += -DDYNAMIC_THREADS
751 CCOMMON_OPT += -DMAX_CPU_NUMBER=$(NUM_THREADS)
753 ifdef USE_SIMPLE_THREADED_LEVEL3
754 CCOMMON_OPT += -DUSE_SIMPLE_THREADED_LEVEL3
758 LIBPREFIX = libopenblas
760 LIBPREFIX = libopenblas_$(LIBNAMESUFFIX)
763 KERNELDIR = $(TOPDIR)/kernel/$(ARCH)
765 include $(TOPDIR)/Makefile.$(ARCH)
767 CCOMMON_OPT += -DASMNAME=$(FU)$(*F) -DASMFNAME=$(FU)$(*F)$(BU) -DNAME=$(*F)$(BU) -DCNAME=$(*F) -DCHAR_NAME=\"$(*F)$(BU)\" -DCHAR_CNAME=\"$(*F)\"
769 ifeq ($(CORE), PPC440)
770 CCOMMON_OPT += -DALLOC_QALLOC
773 ifeq ($(CORE), PPC440FP2)
774 STATIC_ALLOCATION = 1
777 ifneq ($(OSNAME), Linux)
781 ifneq ($(ARCH), x86_64)
783 ifneq ($(CORE), LOONGSON3B)
790 CCOMMON_OPT += -DNO_AFFINITY
793 ifdef FUNCTION_PROFILE
794 CCOMMON_OPT += -DFUNCTION_PROFILE
797 ifdef HUGETLB_ALLOCATION
798 CCOMMON_OPT += -DALLOC_HUGETLB
801 ifdef HUGETLBFILE_ALLOCATION
802 CCOMMON_OPT += -DALLOC_HUGETLBFILE -DHUGETLB_FILE_NAME=$(HUGETLBFILE_ALLOCATION)
805 ifdef STATIC_ALLOCATION
806 CCOMMON_OPT += -DALLOC_STATIC
809 ifdef DEVICEDRIVER_ALLOCATION
810 CCOMMON_OPT += -DALLOC_DEVICEDRIVER -DDEVICEDRIVER_NAME=\"/dev/mapper\"
813 ifdef MIXED_MEMORY_ALLOCATION
814 CCOMMON_OPT += -DMIXED_MEMORY_ALLOCATION
817 ifeq ($(OSNAME), SunOS)
833 REVISION = -r$(VERSION)
834 MAJOR_VERSION = $(word 1,$(subst ., ,$(VERSION)))
847 ifeq ($(ARCH), arm64)
857 override CFLAGS += $(COMMON_OPT) $(CCOMMON_OPT) -I$(TOPDIR)
858 override PFLAGS += $(COMMON_OPT) $(CCOMMON_OPT) -I$(TOPDIR) -DPROFILE $(COMMON_PROF)
860 override FFLAGS += $(COMMON_OPT) $(FCOMMON_OPT)
861 override FPFLAGS += $(COMMON_OPT) $(FCOMMON_OPT) $(COMMON_PROF)
864 LAPACK_CFLAGS = $(CFLAGS)
865 LAPACK_CFLAGS += -DHAVE_LAPACK_CONFIG_H
867 LAPACK_CFLAGS += -DLAPACK_ILP64
869 ifeq ($(C_COMPILER), LSB)
870 LAPACK_CFLAGS += -DLAPACK_COMPLEX_STRUCTURE
885 ifneq ($(DYNAMIC_ARCH), 1)
887 LIBNAME = $(LIBPREFIX)_$(LIBCORE)$(REVISION).$(LIBSUFFIX)
888 LIBNAME_P = $(LIBPREFIX)_$(LIBCORE)$(REVISION)_p.$(LIBSUFFIX)
890 LIBNAME = $(LIBPREFIX)_$(LIBCORE)p$(REVISION).$(LIBSUFFIX)
891 LIBNAME_P = $(LIBPREFIX)_$(LIBCORE)p$(REVISION)_p.$(LIBSUFFIX)
895 LIBNAME = $(LIBPREFIX)$(REVISION).$(LIBSUFFIX)
896 LIBNAME_P = $(LIBPREFIX)$(REVISION)_p.$(LIBSUFFIX)
898 LIBNAME = $(LIBPREFIX)p$(REVISION).$(LIBSUFFIX)
899 LIBNAME_P = $(LIBPREFIX)p$(REVISION)_p.$(LIBSUFFIX)
904 LIBDLLNAME = $(LIBPREFIX).dll
905 LIBSONAME = $(LIBNAME:.$(LIBSUFFIX)=.so)
906 LIBDYNNAME = $(LIBNAME:.$(LIBSUFFIX)=.dylib)
907 LIBDEFNAME = $(LIBNAME:.$(LIBSUFFIX)=.def)
908 LIBEXPNAME = $(LIBNAME:.$(LIBSUFFIX)=.exp)
909 LIBZIPNAME = $(LIBNAME:.$(LIBSUFFIX)=.zip)
911 LIBS = $(TOPDIR)/$(LIBNAME)
912 LIBS_P = $(TOPDIR)/$(LIBNAME_P)
924 export NEED2UNDERSCORES
957 export FUNCTION_PROFILE
960 export SGEMM_UNROLL_M
961 export SGEMM_UNROLL_N
962 export DGEMM_UNROLL_M
963 export DGEMM_UNROLL_N
964 export QGEMM_UNROLL_M
965 export QGEMM_UNROLL_N
966 export CGEMM_UNROLL_M
967 export CGEMM_UNROLL_N
968 export ZGEMM_UNROLL_M
969 export ZGEMM_UNROLL_N
970 export XGEMM_UNROLL_M
971 export XGEMM_UNROLL_N
972 export CGEMM3M_UNROLL_M
973 export CGEMM3M_UNROLL_N
974 export ZGEMM3M_UNROLL_M
975 export ZGEMM3M_UNROLL_N
976 export XGEMM3M_UNROLL_M
977 export XGEMM3M_UNROLL_N
987 .SUFFIXES: .$(PSUFFIX) .$(SUFFIX) .f
990 $(FC) $(FFLAGS) -c $< -o $(@F)
993 $(FC) $(FPFLAGS) -pg -c $< -o $(@F)
997 PATHSCALEPATH = /opt/pathscale/lib/3.1
998 PGIPATH = /opt/pgi/linux86-64/7.1-5/lib
1000 PATHSCALEPATH = /opt/pathscale/lib/3.1/32
1001 PGIPATH = /opt/pgi/linux86/7.1-5/lib
1004 ACMLPATH = /opt/acml/4.3.0
1005 ifneq ($(OSNAME), Darwin)
1006 MKLPATH = /opt/intel/mkl/10.2.2.025/lib
1008 MKLPATH = /Library/Frameworks/Intel_MKL.framework/Versions/10.0.1.014/lib
1010 ATLASPATH = /opt/atlas/3.9.17/opteron
1011 FLAMEPATH = $(HOME)/flame/lib
1012 ifneq ($(OSNAME), SunOS)
1013 SUNPATH = /opt/sunstudio12.1
1015 SUNPATH = /opt/SUNWspro