@@ -87,13 +87,18 @@ endif ()
87
87
# Cannot run getarch on target if we are cross-compiling
88
88
if (DEFINED CORE AND CMAKE_CROSSCOMPILING AND NOT (${HOST_OS} STREQUAL "WINDOWSSTORE" ))
89
89
# Write to config as getarch would
90
+ if (DEFINED TARGET_CORE )
91
+ set (TCORE ${TARGET_CORE} )
92
+ else ()
93
+ set (TCORE ${CORE} )
94
+ endif ()
90
95
91
96
# TODO: Set up defines that getarch sets up based on every other target
92
97
# Perhaps this should be inside a different file as it grows larger
93
98
file (APPEND ${TARGET_CONF_TEMP}
94
- "#define ${CORE } \n "
95
- "#define CHAR_CORENAME \" ${CORE } \"\n " )
96
- if ("${CORE } " STREQUAL "ARMV7" )
99
+ "#define ${TCORE } \n "
100
+ "#define CHAR_CORENAME \" ${TCORE } \"\n " )
101
+ if ("${TCORE } " STREQUAL "ARMV7" )
97
102
file (APPEND ${TARGET_CONF_TEMP}
98
103
"#define L1_DATA_SIZE\t 65536\n "
99
104
"#define L1_DATA_LINESIZE\t 32\n "
@@ -108,7 +113,7 @@ if (DEFINED CORE AND CMAKE_CROSSCOMPILING AND NOT (${HOST_OS} STREQUAL "WINDOWSS
108
113
set (SGEMM_UNROLL_N 4 )
109
114
set (DGEMM_UNROLL_M 4 )
110
115
set (DGEMM_UNROLL_N 4 )
111
- elseif ("${CORE } " STREQUAL "ARMV8" )
116
+ elseif ("${TCORE } " STREQUAL "ARMV8" )
112
117
file (APPEND ${TARGET_CONF_TEMP}
113
118
"#define L1_DATA_SIZE\t 32768\n "
114
119
"#define L1_DATA_LINESIZE\t 64\n "
@@ -118,9 +123,16 @@ if (DEFINED CORE AND CMAKE_CROSSCOMPILING AND NOT (${HOST_OS} STREQUAL "WINDOWSS
118
123
"#define DTB_SIZE\t 4096\n "
119
124
"#define L2_ASSOCIATIVE\t 32\n "
120
125
"#define ARMV8\n " )
121
- set (SGEMM_UNROLL_M 4 )
126
+ set (SGEMM_UNROLL_M 16 )
122
127
set (SGEMM_UNROLL_N 4 )
123
- elseif ("${CORE} " STREQUAL "CORTEXA57" OR "${CORE} " STREQUAL "CORTEXA53" )
128
+ set (DGEMM_UNROLL_M 8 )
129
+ set (DGEMM_UNROLL_N 4 )
130
+ set (CGEMM_UNROLL_M 8 )
131
+ set (CGEMM_UNROLL_N 4 )
132
+ set (ZGEMM_UNROLL_M 4 )
133
+ set (ZGEMM_UNROLL_N 4 )
134
+ set (SYMV_P 16 )
135
+ elseif ("${TCORE} " STREQUAL "CORTEXA57" OR "${TCORE} " STREQUAL "CORTEXA53" )
124
136
file (APPEND ${TARGET_CONF_TEMP}
125
137
"#define L1_CODE_SIZE\t 32768\n "
126
138
"#define L1_CODE_LINESIZE\t 64\n "
@@ -144,9 +156,10 @@ if (DEFINED CORE AND CMAKE_CROSSCOMPILING AND NOT (${HOST_OS} STREQUAL "WINDOWSS
144
156
set (DGEMM_UNROLL_N 4 )
145
157
set (CGEMM_UNROLL_M 8 )
146
158
set (CGEMM_UNROLL_N 4 )
147
- set (ZGEMM_UNROLL_M 8 )
159
+ set (ZGEMM_UNROLL_M 4 )
148
160
set (ZGEMM_UNROLL_N 4 )
149
- elseif ("${CORE} " STREQUAL "CORTEXA72" OR "${CORE} " STREQUAL "CORTEXA73" )
161
+ set (SYMV_P 16 )
162
+ elseif ("${TCORE} " STREQUAL "CORTEXA72" OR "${TCORE} " STREQUAL "CORTEXA73" )
150
163
file (APPEND ${TARGET_CONF_TEMP}
151
164
"#define L1_CODE_SIZE\t 49152\n "
152
165
"#define L1_CODE_LINESIZE\t 64\n "
@@ -170,9 +183,10 @@ if (DEFINED CORE AND CMAKE_CROSSCOMPILING AND NOT (${HOST_OS} STREQUAL "WINDOWSS
170
183
set (DGEMM_UNROLL_N 4 )
171
184
set (CGEMM_UNROLL_M 8 )
172
185
set (CGEMM_UNROLL_N 4 )
173
- set (ZGEMM_UNROLL_M 8 )
186
+ set (ZGEMM_UNROLL_M 4 )
174
187
set (ZGEMM_UNROLL_N 4 )
175
- elseif ("${CORE} " STREQUAL "FALKOR" )
188
+ set (SYMV_P 16 )
189
+ elseif ("${TCORE} " STREQUAL "FALKOR" )
176
190
file (APPEND ${TARGET_CONF_TEMP}
177
191
"#define L1_CODE_SIZE\t 65536\n "
178
192
"#define L1_CODE_LINESIZE\t 64\n "
@@ -196,9 +210,10 @@ if (DEFINED CORE AND CMAKE_CROSSCOMPILING AND NOT (${HOST_OS} STREQUAL "WINDOWSS
196
210
set (DGEMM_UNROLL_N 4 )
197
211
set (CGEMM_UNROLL_M 8 )
198
212
set (CGEMM_UNROLL_N 4 )
199
- set (ZGEMM_UNROLL_M 8 )
213
+ set (ZGEMM_UNROLL_M 4 )
200
214
set (ZGEMM_UNROLL_N 4 )
201
- elseif ("${CORE} " STREQUAL "THUNDERX" )
215
+ set (SYMV_P 16 )
216
+ elseif ("${TCORE} " STREQUAL "THUNDERX" )
202
217
file (APPEND ${TARGET_CONF_TEMP}
203
218
"#define L1_CODE_SIZE\t 32768\n "
204
219
"#define L1_CODE_LINESIZE\t 64\n "
@@ -224,7 +239,8 @@ if (DEFINED CORE AND CMAKE_CROSSCOMPILING AND NOT (${HOST_OS} STREQUAL "WINDOWSS
224
239
set (CGEMM_UNROLL_N 2 )
225
240
set (ZGEMM_UNROLL_M 2 )
226
241
set (ZGEMM_UNROLL_N 2 )
227
- elseif ("${CORE} " STREQUAL "THUNDERX2T99" )
242
+ set (SYMV_P 16 )
243
+ elseif ("${TCORE} " STREQUAL "THUNDERX2T99" )
228
244
file (APPEND ${TARGET_CONF_TEMP}
229
245
"#define L1_CODE_SIZE\t 32768\n "
230
246
"#define L1_CODE_LINESIZE\t 64\n "
@@ -240,7 +256,7 @@ if (DEFINED CORE AND CMAKE_CROSSCOMPILING AND NOT (${HOST_OS} STREQUAL "WINDOWSS
240
256
"#define L3_ASSOCIATIVE\t 32\n "
241
257
"#define DTB_DEFAULT_ENTRIES\t 64\n "
242
258
"#define DTB_SIZE\t 4096\n "
243
- "#define VULCAN \n " )
259
+ "#define ARMV8 \n " )
244
260
set (SGEMM_UNROLL_M 16 )
245
261
set (SGEMM_UNROLL_N 4 )
246
262
set (DGEMM_UNROLL_M 8 )
@@ -249,6 +265,7 @@ if (DEFINED CORE AND CMAKE_CROSSCOMPILING AND NOT (${HOST_OS} STREQUAL "WINDOWSS
249
265
set (CGEMM_UNROLL_N 4 )
250
266
set (ZGEMM_UNROLL_M 4 )
251
267
set (ZGEMM_UNROLL_N 4 )
268
+ set (SYMV_P 16 )
252
269
endif ()
253
270
254
271
# Or should this actually be NUM_CORES?
0 commit comments