blob: b7a438f40f1283e8a94cff4501088d000303a235 [file] [log] [blame]
Austin Schuh9a24b372018-01-28 16:12:29 -08001###################################################################################################
2# #
3# This file is part of BLASFEO. #
4# #
5# BLASFEO -- BLAS For Embedded Optimization. #
6# Copyright (C) 2016-2017 by Gianluca Frison. #
7# Developed at IMTEK (University of Freiburg) under the supervision of Moritz Diehl. #
8# All rights reserved. #
9# #
10# HPMPC is free software; you can redistribute it and/or #
11# modify it under the terms of the GNU Lesser General Public #
12# License as published by the Free Software Foundation; either #
13# version 2.1 of the License, or (at your option) any later version. #
14# #
15# HPMPC is distributed in the hope that it will be useful, #
16# but WITHOUT ANY WARRANTY; without even the implied warranty of #
17# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. #
18# See the GNU Lesser General Public License for more details. #
19# #
20# You should have received a copy of the GNU Lesser General Public #
21# License along with HPMPC; if not, write to the Free Software #
22# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA #
23# #
24# Author: Gianluca Frison, giaf (at) dtu.dk #
25# gianluca.frison (at) imtek.uni-freiburg.de #
26# #
27###################################################################################################
28
29include ./Makefile.rule
30
31OBJS =
32
33ifeq ($(LA), HIGH_PERFORMANCE)
34
35ifeq ($(TARGET), X64_INTEL_HASWELL)
36# aux
37OBJS += ./auxiliary/d_aux_lib4.o ./auxiliary/avx/kernel_dgecp_lib4.o ./auxiliary/avx2/kernel_dgetr_lib4.o
38OBJS += ./auxiliary/s_aux_lib8.o
39OBJS += ./auxiliary/m_aux_lib48.o
40# kernels
41OBJS += ./kernel/avx2/kernel_dgemm_12x4_lib4.o ./kernel/avx2/kernel_dgemm_8x8_lib4.o ./kernel/avx2/kernel_dgemm_8x4_lib4.o ./kernel/avx2/kernel_dgemm_4x4_lib4.o ./kernel/avx/kernel_dgemm_diag_lib4.o ./kernel/avx2/kernel_dgemv_8_lib4.o ./kernel/avx/kernel_dgemv_4_lib4.o ./kernel/avx2/kernel_dsymv_6_lib4.o ./kernel/avx2/kernel_dgetrf_pivot_4_lib4.o ./kernel/avx/kernel_dgeqrf_4_lib4.o kernel/avx2/kernel_dgebp_lib4.o kernel/avx2/kernel_dgelqf_4_lib4.o
42OBJS += ./kernel/avx2/kernel_sgemm_24x4_lib8.o ./kernel/avx2/kernel_sgemm_16x4_lib8.o ./kernel/avx2/kernel_sgemm_8x8_lib8.o ./kernel/avx2/kernel_sgemm_8x4_lib8.o ./kernel/avx/kernel_sgemm_diag_lib8.o ./kernel/avx/kernel_sgecp_lib8.o ./kernel/avx/kernel_sgetr_lib8.o ./kernel/avx/kernel_sgead_lib8.o ./kernel/avx/kernel_sgesc_lib8.o ./kernel/avx/kernel_sgemv_8_lib8.o ./kernel/avx/kernel_sgemv_4_lib8.o
43# blas
44OBJS += ./blas/d_blas1_lib4.o ./blas/d_blas2_lib4.o ./blas/d_blas2_diag_lib.o ./blas/d_blas3_lib4.o ./blas/d_blas3_diag_lib4.o ./blas/d_lapack_lib4.o
45OBJS += ./blas/s_blas1_lib8.o ./blas/s_blas2_lib8.o ./blas/s_blas2_diag_lib.o ./blas/s_blas3_lib8.o ./blas/s_blas3_diag_lib8.o ./blas/s_lapack_lib8.o
46endif
47
48ifeq ($(TARGET), X64_INTEL_SANDY_BRIDGE)
49# aux
50OBJS += ./auxiliary/d_aux_lib4.o ./auxiliary/avx/kernel_dgecp_lib4.o ./auxiliary/avx/kernel_dgetr_lib4.o
51OBJS += ./auxiliary/s_aux_lib8.o
52OBJS += ./auxiliary/m_aux_lib48.o
53# kernels
54OBJS += ./kernel/avx/kernel_dgemm_8x4_lib4.o ./kernel/avx/kernel_dgemm_4x4_lib4.o ./kernel/avx/kernel_dgemm_diag_lib4.o ./kernel/avx/kernel_dgemv_12_lib4.o ./kernel/avx/kernel_dgemv_8_lib4.o ./kernel/avx/kernel_dgemv_4_lib4.o ./kernel/avx/kernel_dsymv_6_lib4.o ./kernel/avx/kernel_dgetrf_pivot_4_lib4.o ./kernel/avx/kernel_dgeqrf_4_lib4.o kernel/avx/kernel_dgebp_lib4.o
55OBJS += ./kernel/avx/kernel_sgemm_16x4_lib8.o ./kernel/avx/kernel_sgemm_8x8_lib8.o ./kernel/avx/kernel_sgemm_8x4_lib8.o ./kernel/avx/kernel_sgecp_lib8.o ./kernel/avx/kernel_sgemm_diag_lib8.o ./kernel/avx/kernel_sgetr_lib8.o ./kernel/avx/kernel_sgead_lib8.o ./kernel/avx/kernel_sgesc_lib8.o ./kernel/avx/kernel_sgemv_8_lib8.o ./kernel/avx/kernel_sgemv_4_lib8.o
56# blas
57OBJS += ./blas/d_blas1_lib4.o ./blas/d_blas2_lib4.o ./blas/d_blas2_diag_lib.o ./blas/d_blas3_lib4.o ./blas/d_blas3_diag_lib4.o ./blas/d_lapack_lib4.o
58OBJS += ./blas/s_blas1_lib8.o ./blas/s_blas2_lib8.o ./blas/s_blas2_diag_lib.o ./blas/s_blas3_lib8.o ./blas/s_blas3_diag_lib8.o ./blas/s_lapack_lib8.o
59endif
60
61ifeq ($(TARGET), X64_INTEL_CORE)
62# aux
63OBJS += ./auxiliary/d_aux_lib4.o ./auxiliary/c99/kernel_dgecp_lib4.o ./auxiliary/c99/kernel_dgetr_lib4.o
64OBJS += ./auxiliary/s_aux_lib4.o ./auxiliary/c99/kernel_sgetr_lib4.o
65OBJS += ./auxiliary/m_aux_lib44.o
66# kernels
67OBJS += ./kernel/sse3/kernel_dgemm_4x4_lib4.o ./kernel/c99/kernel_dgemm_4x4_lib4.o ./kernel/c99/kernel_dgemm_diag_lib4.o ./kernel/c99/kernel_dgemv_4_lib4.o ./kernel/c99/kernel_dsymv_4_lib4.o ./kernel/c99/kernel_dgetrf_pivot_4_lib4.o ./kernel/c99/kernel_dgeqrf_4_lib4.o
68OBJS += ./kernel/c99/kernel_sgemm_4x4_lib4.o ./kernel/c99/kernel_sgemm_diag_lib4.o ./kernel/c99/kernel_sgemv_4_lib4.o ./kernel/c99/kernel_ssymv_4_lib4.o ./kernel/c99/kernel_sgetrf_pivot_4_lib4.o ./kernel/c99/kernel_sgecp_lib4.o
69# blas
70OBJS += ./blas/d_blas1_lib4.o ./blas/d_blas2_lib4.o ./blas/d_blas2_diag_lib.o ./blas/d_blas3_lib4.o ./blas/d_blas3_diag_lib4.o ./blas/d_lapack_lib4.o
71OBJS += ./blas/s_blas1_lib4.o ./blas/s_blas2_lib4.o ./blas/s_blas2_diag_lib.o ./blas/s_blas3_lib4.o ./blas/s_blas3_diag_lib4.o ./blas/s_lapack_lib4.o
72endif
73
74ifeq ($(TARGET), X64_AMD_BULLDOZER)
75# aux
76OBJS += ./auxiliary/d_aux_lib4.o ./auxiliary/c99/kernel_dgecp_lib4.o ./auxiliary/c99/kernel_dgetr_lib4.o
77OBJS += ./auxiliary/s_aux_lib4.o ./auxiliary/c99/kernel_sgetr_lib4.o
78OBJS += ./auxiliary/m_aux_lib44.o
79# kernels
80OBJS += ./kernel/fma/kernel_dgemm_4x4_lib4.o ./kernel/c99/kernel_dgemm_4x4_lib4.o ./kernel/c99/kernel_dgemm_diag_lib4.o ./kernel/c99/kernel_dgemv_4_lib4.o ./kernel/c99/kernel_dsymv_4_lib4.o ./kernel/c99/kernel_dgetrf_pivot_4_lib4.o ./kernel/c99/kernel_dgeqrf_4_lib4.o
81OBJS += ./kernel/c99/kernel_sgemm_4x4_lib4.o ./kernel/c99/kernel_sgemm_diag_lib4.o ./kernel/c99/kernel_sgemv_4_lib4.o ./kernel/c99/kernel_ssymv_4_lib4.o ./kernel/c99/kernel_sgetrf_pivot_4_lib4.o ./kernel/c99/kernel_sgecp_lib4.o
82# blas
83OBJS += ./blas/d_blas1_lib4.o ./blas/d_blas2_lib4.o ./blas/d_blas2_diag_lib.o ./blas/d_blas3_lib4.o ./blas/d_blas3_diag_lib4.o ./blas/d_lapack_lib4.o
84OBJS += ./blas/s_blas1_lib4.o ./blas/s_blas2_lib4.o ./blas/s_blas2_diag_lib.o ./blas/s_blas3_lib4.o ./blas/s_blas3_diag_lib4.o ./blas/s_lapack_lib4.o
85endif
86
87ifeq ($(TARGET), ARMV8A_ARM_CORTEX_A57)
88# aux
89OBJS += ./auxiliary/d_aux_lib4.o ./auxiliary/c99/kernel_dgecp_lib4.o ./auxiliary/c99/kernel_dgetr_lib4.o
90OBJS += ./auxiliary/s_aux_lib4.o ./auxiliary/c99/kernel_sgetr_lib4.o
91OBJS += ./auxiliary/m_aux_lib44.o
92# kernels
93OBJS += ./kernel/armv8a/kernel_dgemm_8x4_lib4.o ./kernel/armv8a/kernel_dgemm_4x4_lib4.o ./kernel/c99/kernel_dgemm_4x4_lib4.o ./kernel/c99/kernel_dgemm_diag_lib4.o ./kernel/c99/kernel_dgemv_4_lib4.o ./kernel/c99/kernel_dsymv_4_lib4.o ./kernel/c99/kernel_dgetrf_pivot_4_lib4.o ./kernel/c99/kernel_dgeqrf_4_lib4.o
94OBJS += ./kernel/armv8a/kernel_sgemm_16x4_lib4.o ./kernel/armv8a/kernel_sgemm_12x4_lib4.o ./kernel/armv8a/kernel_sgemm_8x8_lib4.o ./kernel/armv8a/kernel_sgemm_8x4_lib4.o ./kernel/armv8a/kernel_sgemm_4x4_lib4.o ./kernel/c99/kernel_sgemm_4x4_lib4.o ./kernel/c99/kernel_sgemm_diag_lib4.o ./kernel/c99/kernel_sgemv_4_lib4.o ./kernel/c99/kernel_ssymv_4_lib4.o ./kernel/c99/kernel_sgetrf_pivot_4_lib4.o ./kernel/c99/kernel_sgecp_lib4.o
95# blas
96OBJS += ./blas/d_blas1_lib4.o ./blas/d_blas2_lib4.o ./blas/d_blas2_diag_lib.o ./blas/d_blas3_lib4.o ./blas/d_blas3_diag_lib4.o ./blas/d_lapack_lib4.o
97OBJS += ./blas/s_blas1_lib4.o ./blas/s_blas2_lib4.o ./blas/s_blas2_diag_lib.o ./blas/s_blas3_lib4.o ./blas/s_blas3_diag_lib4.o ./blas/s_lapack_lib4.o
98endif
99
100ifeq ($(TARGET), ARMV7A_ARM_CORTEX_A15)
101# aux
102OBJS += ./auxiliary/d_aux_lib4.o ./auxiliary/c99/kernel_dgecp_lib4.o ./auxiliary/c99/kernel_dgetr_lib4.o
103OBJS += ./auxiliary/s_aux_lib4.o ./auxiliary/c99/kernel_sgetr_lib4.o
104OBJS += ./auxiliary/m_aux_lib44.o
105# kernels
106OBJS += ./kernel/armv7a/kernel_dgemm_4x4_lib4.o ./kernel/c99/kernel_dgemm_4x4_lib4.o ./kernel/c99/kernel_dgemm_diag_lib4.o ./kernel/c99/kernel_dgemv_4_lib4.o ./kernel/c99/kernel_dsymv_4_lib4.o ./kernel/c99/kernel_dgetrf_pivot_4_lib4.o ./kernel/c99/kernel_dgeqrf_4_lib4.o
107OBJS += ./kernel/armv7a/kernel_sgemm_12x4_lib4.o ./kernel/armv7a/kernel_sgemm_8x4_lib4.o ./kernel/armv7a/kernel_sgemm_4x4_lib4.o ./kernel/c99/kernel_sgemm_4x4_lib4.o ./kernel/c99/kernel_sgemm_diag_lib4.o ./kernel/c99/kernel_sgemv_4_lib4.o ./kernel/c99/kernel_ssymv_4_lib4.o ./kernel/c99/kernel_sgetrf_pivot_4_lib4.o ./kernel/c99/kernel_sgecp_lib4.o
108# blas
109OBJS += ./blas/d_blas1_lib4.o ./blas/d_blas2_lib4.o ./blas/d_blas2_diag_lib.o ./blas/d_blas3_lib4.o ./blas/d_blas3_diag_lib4.o ./blas/d_lapack_lib4.o
110OBJS += ./blas/s_blas1_lib4.o ./blas/s_blas2_lib4.o ./blas/s_blas2_diag_lib.o ./blas/s_blas3_lib4.o ./blas/s_blas3_diag_lib4.o ./blas/s_lapack_lib4.o
111endif
112
113ifeq ($(TARGET), GENERIC)
114# aux
115OBJS += ./auxiliary/d_aux_lib4.o ./auxiliary/c99/kernel_dgecp_lib4.o ./auxiliary/c99/kernel_dgetr_lib4.o
116OBJS += ./auxiliary/s_aux_lib4.o ./auxiliary/c99/kernel_sgetr_lib4.o
117OBJS += ./auxiliary/m_aux_lib44.o
118# kernels
119OBJS += ./kernel/c99/kernel_dgemm_4x4_lib4.o ./kernel/c99/kernel_dgemm_diag_lib4.o ./kernel/c99/kernel_dgemv_4_lib4.o ./kernel/c99/kernel_dsymv_4_lib4.o ./kernel/c99/kernel_dgetrf_pivot_4_lib4.o ./kernel/c99/kernel_dgeqrf_4_lib4.o
120OBJS += ./kernel/c99/kernel_sgemm_4x4_lib4.o ./kernel/c99/kernel_sgemm_diag_lib4.o ./kernel/c99/kernel_sgemv_4_lib4.o ./kernel/c99/kernel_ssymv_4_lib4.o ./kernel/c99/kernel_sgetrf_pivot_4_lib4.o ./kernel/c99/kernel_sgecp_lib4.o
121# blas
122OBJS += ./blas/d_blas1_lib4.o ./blas/d_blas2_lib4.o ./blas/d_blas2_diag_lib.o ./blas/d_blas3_lib4.o ./blas/d_blas3_diag_lib4.o ./blas/d_lapack_lib4.o
123OBJS += ./blas/s_blas1_lib4.o ./blas/s_blas2_lib4.o ./blas/s_blas2_diag_lib.o ./blas/s_blas3_lib4.o ./blas/s_blas3_diag_lib4.o ./blas/s_lapack_lib4.o
124endif
125
126else # LA_REFERENCE | LA_BLAS
127
128# aux
129OBJS += ./auxiliary/d_aux_lib.o
130OBJS += ./auxiliary/s_aux_lib.o
131OBJS += ./auxiliary/m_aux_lib.o
132# blas
133OBJS += ./blas/d_blas1_lib.o ./blas/d_blas2_lib.o ./blas/d_blas2_diag_lib.o ./blas/d_blas3_lib.o ./blas/d_blas3_diag_lib.o ./blas/d_lapack_lib.o
134OBJS += ./blas/s_blas1_lib.o ./blas/s_blas2_lib.o ./blas/s_blas2_diag_lib.o ./blas/s_blas3_lib.o ./blas/s_blas3_diag_lib.o ./blas/s_lapack_lib.o
135
136endif # LA choice
137
138ifeq ($(EXT_DEP), 1)
139# ext dep
140OBJS += ./auxiliary/d_aux_ext_dep_lib.o
141OBJS += ./auxiliary/s_aux_ext_dep_lib.o
142OBJS += ./auxiliary/v_aux_ext_dep_lib.o
143OBJS += ./auxiliary/i_aux_ext_dep_lib.o
144endif
145
146
147
148all: clean static_library
149
150static_library: target
151 ( cd auxiliary; $(MAKE) obj)
152 ( cd kernel; $(MAKE) obj)
153 ( cd blas; $(MAKE) obj)
154 ar rcs libblasfeo.a $(OBJS)
155 cp libblasfeo.a ./lib/
156 @echo
157 @echo " libblasfeo.a static library build complete."
158 @echo
159
160shared_library: target
161 ( cd auxiliary; $(MAKE) obj)
162 ( cd kernel; $(MAKE) obj)
163 ( cd blas; $(MAKE) obj)
164 gcc -shared -o libblasfeo.so $(OBJS)
165 cp libblasfeo.so ./lib/
166 @echo
167 @echo " libblasfeo.so shared library build complete."
168 @echo
169
170target:
171 touch ./include/blasfeo_target.h
172ifeq ($(TARGET), X64_INTEL_HASWELL)
173 echo "#ifndef TARGET_X64_INTEL_HASWELL" > ./include/blasfeo_target.h
174 echo "#define TARGET_X64_INTEL_HASWELL" >> ./include/blasfeo_target.h
175 echo "#endif" >> ./include/blasfeo_target.h
176endif
177ifeq ($(TARGET), X64_INTEL_SANDY_BRIDGE)
178 echo "#ifndef TARGET_X64_INTEL_SANDY_BRIDGE" > ./include/blasfeo_target.h
179 echo "#define TARGET_X64_INTEL_SANDY_BRIDGE" >> ./include/blasfeo_target.h
180 echo "#endif" >> ./include/blasfeo_target.h
181endif
182ifeq ($(TARGET), X64_INTEL_CORE)
183 echo "#ifndef TARGET_X64_INTEL_CORE" > ./include/blasfeo_target.h
184 echo "#define TARGET_X64_INTEL_CORE" >> ./include/blasfeo_target.h
185 echo "#endif" >> ./include/blasfeo_target.h
186endif
187ifeq ($(TARGET), X64_AMD_BULLDOZER)
188 echo "#ifndef TARGET_X64_AMD_BULLDOZER" > ./include/blasfeo_target.h
189 echo "#define TARGET_X64_AMD_BULLDOZER" >> ./include/blasfeo_target.h
190 echo "#endif" >> ./include/blasfeo_target.h
191endif
192ifeq ($(TARGET), GENERIC)
193 echo "#ifndef TARGET_GENERIC" > ./include/blasfeo_target.h
194 echo "#define TARGET_GENERIC" >> ./include/blasfeo_target.h
195 echo "#endif" >> ./include/blasfeo_target.h
196endif
197ifeq ($(TARGET), ARMV7A_ARM_CORTEX_A15)
198 echo "#ifndef TARGET_ARMV7A_ARM_CORTEX_A15" > ./include/blasfeo_target.h
199 echo "#define TARGET_ARMV7A_ARM_CORTEX_A15" >> ./include/blasfeo_target.h
200 echo "#endif" >> ./include/blasfeo_target.h
201endif
202ifeq ($(LA), HIGH_PERFORMANCE)
203 echo "#ifndef LA_HIGH_PERFORMANCE" >> ./include/blasfeo_target.h
204 echo "#define LA_HIGH_PERFORMANCE" >> ./include/blasfeo_target.h
205 echo "#endif" >> ./include/blasfeo_target.h
206endif
207ifeq ($(LA), BLAS)
208 echo "#ifndef LA_BLAS" >> ./include/blasfeo_target.h
209 echo "#define LA_BLAS" >> ./include/blasfeo_target.h
210 echo "#endif" >> ./include/blasfeo_target.h
211endif
212ifeq ($(LA), REFERENCE)
213 echo "#ifndef LA_REFERENCE" >> ./include/blasfeo_target.h
214 echo "#define LA_REFERENCE" >> ./include/blasfeo_target.h
215 echo "#endif" >> ./include/blasfeo_target.h
216endif
217ifeq ($(EXT_DEP), 1)
218 echo "#ifndef EXT_DEP" >> ./include/blasfeo_target.h
219 echo "#define EXT_DEP" >> ./include/blasfeo_target.h
220 echo "#endif" >> ./include/blasfeo_target.h
221endif
222
223install_static:
224 mkdir -p $(PREFIX)/blasfeo
225 mkdir -p $(PREFIX)/blasfeo/lib
226 cp -f libblasfeo.a $(PREFIX)/blasfeo/lib/
227 mkdir -p $(PREFIX)/blasfeo/include
228 cp -f ./include/*.h $(PREFIX)/blasfeo/include/
229
230install_shared:
231 mkdir -p $(PREFIX)/blasfeo
232 mkdir -p $(PREFIX)/blasfeo/lib
233 cp -f libblasfeo.so $(PREFIX)/blasfeo/lib/
234 mkdir -p $(PREFIX)/blasfeo/include
235 cp -f ./include/*.h $(PREFIX)/blasfeo/include/
236
237test_problem:
238 cp libblasfeo.a ./test_problems/libblasfeo.a
239 make -C test_problems obj
240 @echo
241 @echo " Test problem build complete."
242 @echo
243
244run:
245 ./test_problems/test.out
246
247clean:
248 rm -f libblasfeo.a
249 rm -f libblasfeo.so
250 rm -f ./lib/libblasfeo.a
251 rm -f ./lib/libblasfeo.so
252 make -C auxiliary clean
253 make -C kernel clean
254 make -C blas clean
255 make -C test_problems clean
256 make -C examples clean
257