/**************************************************************************************************
* *
* This file is part of BLASFEO. *
* *
* BLASFEO -- BLAS For Embedded Optimization. *
* Copyright (C) 2016-2017 by Gianluca Frison. *
* Developed at IMTEK (University of Freiburg) under the supervision of Moritz Diehl. *
* All rights reserved. *
* *
* HPMPC is free software; you can redistribute it and/or *
* modify it under the terms of the GNU Lesser General Public *
* License as published by the Free Software Foundation; either *
* version 2.1 of the License, or (at your option) any later version. *
* *
* HPMPC is distributed in the hope that it will be useful, *
* but WITHOUT ANY WARRANTY; without even the implied warranty of *
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. *
* See the GNU Lesser General Public License for more details. *
* *
* You should have received a copy of the GNU Lesser General Public *
* License along with HPMPC; if not, write to the Free Software *
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA *
* *
* Author: Gianluca Frison, giaf (at) dtu.dk *
*         gianluca.frison (at) imtek.uni-freiburg.de *
* *
**************************************************************************************************/

#ifndef BLASFEO_BLOCK_SIZE
#define BLASFEO_BLOCK_SIZE

/*
 * Per-target block-size constants.
 *
 * The build is expected to define one TARGET_* macro. The first matching
 * branch of the chain below defines the four constants; if none of the
 * known TARGET_* macros is defined, compilation stops with
 * "Unknown architecture".
 *
 *   D_PS, D_NC   constants with the D_ prefix
 *   S_PS, S_NC   constants with the S_ prefix
 *
 * NOTE(review): presumably D_/S_ stand for double/single precision and
 * PS is the panel size used by the kernels; the exact meaning of NC is
 * not visible from this header -- confirm against the code that uses it.
 *
 * Where a value carries the trailing note "2 // until the smaller kernel
 * is 4x4", the original author recorded 2 as an alternative value; 4 is
 * the value actually in effect.
 */

#if defined(TARGET_X64_INTEL_HASWELL)

#define D_PS 4
#define S_PS 8
#define D_NC 4 // 2 // until the smaller kernel is 4x4
#define S_NC 4 // 2

#elif defined(TARGET_X64_INTEL_SANDY_BRIDGE)

#define D_PS 4
#define S_PS 8
#define D_NC 4 // 2 // until the smaller kernel is 4x4
#define S_NC 4 // 2

#elif defined(TARGET_X64_INTEL_CORE)

#define D_PS 4
#define S_PS 4
#define D_NC 4 // 2 // until the smaller kernel is 4x4
#define S_NC 4 // 2

#elif defined(TARGET_X64_AMD_BULLDOZER)

#define D_PS 4
#define S_PS 4
#define D_NC 4 // 2 // until the smaller kernel is 4x4
#define S_NC 4 // 2

#elif defined(TARGET_ARMV8A_ARM_CORTEX_A57)

#define D_PS 4
#define S_PS 4
#define D_NC 4
#define S_NC 4

#elif defined(TARGET_ARMV7A_ARM_CORTEX_A15)

#define D_PS 4
#define S_PS 4
#define D_NC 4 // 2 // until the smaller kernel is 4x4
#define S_NC 4 // 2

#elif defined(TARGET_GENERIC)

#define D_PS 4
#define S_PS 4
#define D_NC 4 // 2 // until the smaller kernel is 4x4
#define S_NC 4 // 2

#else
#error "Unknown architecture"
#endif

#endif // BLASFEO_BLOCK_SIZE