#!/usr/bin/python
# -*- coding: utf-8 -*-

# Copyright (c) 2016-2023 Arm Limited.
#
# SPDX-License-Identifier: MIT
#
# Permission is hereby granted, free of charge, to any person obtaining a copy
# of this software and associated documentation files (the "Software"), to
# deal in the Software without restriction, including without limitation the
# rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
# sell copies of the Software, and to permit persons to whom the Software is
# furnished to do so, subject to the following conditions:
#
# The above copyright notice and this permission notice shall be included in all
# copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
# SOFTWARE.
Renato Grottesi777c45c2023-05-08 13:04:07 +000025
Anthony Barbierdbdab852017-06-23 15:42:00 +010026import collections
27import os.path
28import re
29import subprocess
Renato Grottesi777c45c2023-05-08 13:04:07 +000030import zlib
31import json
32import codecs
Anthony Barbierdbdab852017-06-23 15:42:00 +010033
# Release name and semantic version of the library
VERSION = "v23.02.1"
LIBRARY_VERSION_MAJOR = 30
LIBRARY_VERSION_MINOR = 0
LIBRARY_VERSION_PATCH = 1
# Version suffix of the shared objects: "<major>.<minor>.<patch>"
SONAME_VERSION = ".".join(str(part) for part in (LIBRARY_VERSION_MAJOR,
                                                 LIBRARY_VERSION_MINOR,
                                                 LIBRARY_VERSION_PATCH))
Anthony Barbierdbdab852017-06-23 15:42:00 +010039
# Variables exported by the calling SConstruct
Import('env', 'vars', 'install_lib')
Anthony Barbierdbdab852017-06-23 15:42:00 +010043
# @brief Assemble the bootcode sources and register the installed objects as default targets.
#
# @param sources A list of bootcode assembly files to build
#
# @return The object nodes as returned by install_lib().
def build_bootcode_objs(sources):
    # Let the assembler resolve includes relative to the bootcode folder
    arm_compute_env.Append(ASFLAGS = "-I bootcode/")
    installed_objs = install_lib(arm_compute_env.Object(sources))
    Default(installed_objs)
    return installed_objs
50
Renato Grottesi777c45c2023-05-08 13:04:07 +000051
52
53
# @brief Create a list of objects from a given file list.
#
# @param  arch_info A dictionary representing the architecture info such as the
#                   compiler flags and defines (filedefs.json).
#
# @param  sources   A list of files to build
#
# @param  static    Build static objects when True, shared objects otherwise
#
# @return A list of objects for the corresponding architecture.
def build_obj_list(arch_info, sources, static=False):
    # Architecture flags are applied to a clone, never to arm_compute_env itself
    arch_env = arm_compute_env.Clone()

    # Append architecture spec
    if 'cxxflags' in arch_info:
        arch_cxxflags = arch_info['cxxflags']
        if len(arch_cxxflags) > 0:
            arch_env.Append(CXXFLAGS = arch_cxxflags)

    # Build and return objects
    make_objects = arch_env.StaticObject if static else arch_env.SharedObject
    built_objs = make_objects(sources)

    arch_env.Default(built_objs)
    return built_objs
80
# @brief Build multi-ISA files with the respective architecture.
#
# @return Two distinct lists:
#         A list of static objects
#         A list of shared objects
def build_lib_objects():
    static_objs = []
    shared_objs = []

    # Build one file list for one architecture, first as static then as shared objects
    def build_for_arch(arch_name, sources):
        arch_info = filedefs[arch_name]
        static_objs.extend(build_obj_list(arch_info, sources, static=True))
        shared_objs.extend(build_obj_list(arch_info, sources, static=False))

    arm_compute_env.Append(CPPDEFINES = ['ENABLE_NEON', 'ARM_COMPUTE_ENABLE_NEON',
                                         'ENABLE_SVE', 'ARM_COMPUTE_ENABLE_SVE',
                                         'ARM_COMPUTE_ENABLE_FP16', 'ARM_COMPUTE_ENABLE_BF16',
                                         'ARM_COMPUTE_ENABLE_I8MM', 'ARM_COMPUTE_ENABLE_SVEF32MM'])

    # Common files for the base architecture
    build_for_arch("armv8.2-a", lib_files)

    # SVE specific files
    build_for_arch("armv8.2-a-sve", lib_files_sve)

    # SVE2 specific files. The define is appended only now because
    # build_obj_list() clones arm_compute_env at call time, so the objects
    # built above do not see it.
    arm_compute_env.Append(CPPDEFINES = ['ARM_COMPUTE_ENABLE_SVE2'])
    build_for_arch("armv8.6-a-sve2", lib_files_sve2)

    return static_objs, shared_objs
110
111
112
# @brief Build a static or shared library, install it and make it a default target.
#
# @param  name      Name of the library handed to the SCons library builder
#
# @param  build_env Environment that gets cloned to build this library
#
# @param  sources   Sources (or objects) the library is made of
#
# @param  static    Build a static library when True, a shared one otherwise
#
# @param  libs      Optional list of libraries linked in addition to arm_compute_env["LIBS"]
#
# @return The node(s) returned by install_lib() for the library.
def build_library(name, build_env, sources, static=False, libs=None):
    extra_libs = [] if libs is None else libs

    cloned_build_env = build_env.Clone()
    if env['os'] == 'android' and not static:
        # list.remove() raises ValueError if the flag is not part of LINKFLAGS
        cloned_build_env["LINKFLAGS"].remove('-pie')
        cloned_build_env["LINKFLAGS"].remove('-static-libstdc++')

    link_libs = arm_compute_env["LIBS"] + extra_libs
    if static:
        obj = cloned_build_env.StaticLibrary(name, source=sources, LIBS = link_libs)
    elif env['set_soname']:
        obj = cloned_build_env.SharedLibrary(name, source=sources, SHLIBVERSION = SONAME_VERSION, LIBS = link_libs)
    else:
        obj = cloned_build_env.SharedLibrary(name, source=sources, LIBS = link_libs)

    # NOTE(review): the map-file flag is added after the builder call; this
    # presumably works because SCons expands LINKFLAGS at build time - confirm.
    if env['mapfile']:
        if 'windows' not in env['os'] and 'macos' not in env['os']:
            cloned_build_env['LINKFLAGS'].append('"-Wl,-Map='+ name + '.map"')
        else:
            cloned_build_env['LINKFLAGS'].append('-Wl,-map,' + name + '.map')

    obj = install_lib(obj)
    build_env.Default(obj)
    return obj
136
Renato Grottesi777c45c2023-05-08 13:04:07 +0000137
# @brief Replace C-style comments by a single space, leaving string and character literals untouched.
#
# @param  code Source text to process
#
# @return The text without // and /* */ comments.
def remove_incode_comments(code):
    # Alternatives, in order: line comment, block comment, character literal,
    # string literal. Literals are matched only so that comment markers inside
    # them are consumed as part of the literal and returned unchanged.
    token_regex = re.compile(r'//.*?$|/\*.*?\*/|\'(?:\\.|[^\\\'])*\'|"(?:\\.|[^\\"])*"', re.DOTALL | re.MULTILINE)

    def blank_out_comment(match):
        text = match.group(0)
        # Only the two comment alternatives can start with a slash
        return " " if text.startswith('/') else text

    return token_regex.sub(blank_out_comment, code)
148
149
# @brief SCons action that writes each source, with its local includes inlined, as an embeddable string literal.
#
# Comments are stripped from every source, then each line matching
# #include "..." is replaced by the (comment-stripped) contents of the file
# with the same base name in the source list, repeatedly, until no include is
# left. The result is optionally zlib-compressed and base64-encoded, wrapped
# in a raw string literal R"(...)" and written to the target at the same index.
#
# @param  target List of output nodes, one per entry of source
#
# @param  source List of input nodes; every included file must be part of it
#
# @param  env    Environment of the action; env['compress_kernels'] is read
#
# Raises KeyError when an included file is not part of source and
# RuntimeError when the includes are circular.
def resolve_includes(target, source, env):
    # File collection
    FileEntry = collections.namedtuple('FileEntry', 'target_name file_contents')

    # Include pattern
    pattern = re.compile(r'#include "(.*)"')

    # Get file contents
    files = []
    for index, src in enumerate(source):
        dst = target[index]
        contents = src.get_contents().decode('utf-8')
        contents = remove_incode_comments(contents).splitlines()
        entry = FileEntry(target_name=dst, file_contents=contents)
        files.append((os.path.basename(src.get_path()), entry))

    # Lookup by base name: includes can only refer to files of the source list
    files_dict = dict(files)

    # A non-circular chain of includes cannot be longer than the number of
    # known files, so needing more expansion passes than that means a cycle
    max_passes = len(files_dict) + 1

    # Expand the includes of every file
    final_files = []
    for file_name, entry in files:
        expanded = entry.file_contents
        passes = 0
        while True:
            passes += 1
            if passes > max_passes:
                raise RuntimeError('Circular #include detected while expanding "%s"' % file_name)

            found_include = False
            next_pass = []
            for line in expanded:
                found = pattern.search(line)
                if not found:
                    next_pass.append(line)
                    continue

                # Only get the header file name and discard the relative path.
                # E.g. "common/experimental/gemm_fused_post_ops/fp_mixed_precision_helpers.h" -> "fp_mixed_precision_helpers.h"
                include_file = found.group(1).split('/')[-1]
                if include_file not in files_dict:
                    raise KeyError('"%s" included by "%s" is not part of the embedded file list'
                                   % (include_file, file_name))
                next_pass.extend(files_dict[include_file].file_contents)
                found_include = True

            expanded = next_pass

            # Done once a whole pass did not replace any include
            if not found_include:
                break

        final_files.append((file_name, FileEntry(target_name=entry.target_name, file_contents=expanded)))

    # Write output files. The sources were decoded as UTF-8, so the output is
    # written as UTF-8 as well instead of depending on the locale encoding.
    for file_name, entry in final_files:
        with open(entry.target_name.get_path(), 'w', encoding='utf-8') as out_file:
            file_to_write = "\n".join(entry.file_contents)
            if env['compress_kernels']:
                file_to_write = zlib.compress(file_to_write.encode('utf-8'), 9)
                file_to_write = codecs.encode(file_to_write, "base64").decode('utf-8').replace("\n", "")
            # Wrap into a raw string literal
            file_to_write = "R\"(" + file_to_write + ")\""
            out_file.write(file_to_write)
210
Jenkins91ee4d02021-11-15 14:37:16 +0000211
# @brief SCons action that writes the build information string embedded in the library.
#
# The string holds the library version, the build options (vars.args) and the
# git hash of HEAD, or "unknown" when git cannot be run or fails.
#
# @param  target List of output nodes; the string is written to target[0]
#
# @param  source Unused
#
# @param  env    Unused
def create_version_file(target, source, env):
    # Generate string with build options library version to embed in the library:
    try:
        git_hash = subprocess.check_output(["git", "rev-parse", "HEAD"])
    except (OSError, subprocess.CalledProcessError):
        git_hash = "unknown"
    else:
        # check_output() returns bytes on Python 3; decode so that the string
        # reads "Git hash=<sha>" instead of "Git hash=b'<sha>'"
        if isinstance(git_hash, bytes):
            git_hash = git_hash.decode('utf-8')

    build_info = "\"arm_compute_version=%s Build options: %s Git hash=%s\"" % (VERSION, vars.args, git_hash.strip())
    with open(target[0].get_path(), "w") as fd:
        fd.write(build_info)
222
Renato Grottesi777c45c2023-05-08 13:04:07 +0000223
# @brief Create the list of file attributes (data types, data layouts, execution state) to build.
#
# @param  env          Build options; 'estate' and 'arch' are read
#
# @param  data_types   Requested data types, or a collection containing 'all'
#
# @param  data_layouts Requested data layouts, or a collection containing 'all'
#
# @return A list of attribute names: data types first, then data layouts,
#         then either 'estate32' or 'estate64'.
def get_attrs_list(env, data_types, data_layouts):
    known_types = ['fp16', 'fp32', 'integer', 'qasymm8', 'qasymm8_signed', 'qsymm16']
    known_layouts = ['nhwc', 'nchw']

    # Manage data-types
    if 'all' in data_types:
        attrs = list(known_types)
    else:
        attrs = [data_type for data_type in known_types if data_type in data_types]

    # Manage data-layouts
    if 'all' in data_layouts:
        attrs.extend(known_layouts)
    else:
        attrs.extend(layout for layout in known_layouts if layout in data_layouts)

    # Manage execution state
    if env['estate'] == 'auto' and 'v7a' in env['arch']:
        estate = 'estate32'
    elif '32' in env['estate']:
        estate = 'estate32'
    else:
        estate = 'estate64'
    attrs.append(estate)

    return attrs
248
249
# @brief Collect the files to compile for a list of operators of one backend.
#
# @param  filelist  Dictionary describing the files of each backend (filelist.json)
#
# @param  operators Operators to collect the files for; operators unknown to the backend are skipped
#
# @param  backend   Name of the backend inside filelist
#
# @param  techs     Technologies whose specific files are collected as well
#
# @param  attrs     Attributes selecting additional files of each technology
#
# @return A dictionary with the key "common" and one key per technology that
#         has files, each mapping to a list of files without duplicates in
#         first-seen order.
def get_operator_backend_files(filelist, operators, backend='', techs=(), attrs=()):
    # Drop duplicates while keeping the first-seen order. Going through a set
    # would reorder the sources differently on every run (string hashing is
    # randomised), which makes the build non-reproducible.
    def unique_in_order(items):
        seen = set()
        unique = []
        for item in items:
            if item not in seen:
                seen.add(item)
                unique.append(item)
        return unique

    files = { "common" : [] }

    # Early return if the backend is not described in filelist
    if backend not in filelist:
        return files

    # Iterate over operators and create the file lists to compile
    for operator in operators:
        backend_operators = filelist[backend]['operators']
        if operator not in backend_operators:
            continue

        operator_files = backend_operators[operator]["files"]
        files['common'].extend(operator_files["common"])

        for tech in techs:
            if tech not in operator_files:
                continue

            # Add tech as a key to dictionary if not there, then add its files
            tech_files = operator_files[tech]
            tech_list = files.setdefault(tech, [])
            tech_list.extend(tech_files.get('common', []))
            for attr in attrs:
                tech_list.extend(tech_files.get(attr, []))

    # Remove duplicates if they exist
    return {k: unique_in_order(v) for k, v in files.items()}
275
# @brief Collect the supported operators of a list together with their direct dependencies.
#
# @param  filelist  Dictionary describing the operators of each backend (filelist.json)
#
# @param  operators Operators to look up; a message is printed for each one the backend does not list
#
# @param  backend   Name of the backend inside filelist
#
# @return A set with the supported operators and the entries of their 'deps' lists.
def collect_operators(filelist, operators, backend=''):
    collected = set()
    for operator in operators:
        backend_operators = filelist[backend]['operators']
        if operator not in backend_operators:
            print("Operator {0} is unsupported on {1} backend!".format(operator, backend))
            continue

        collected.add(operator)
        operator_entry = backend_operators[operator]
        if 'deps' in operator_entry:
            collected.update(operator_entry['deps'])

    return collected
287
288
# @brief Collect a list of operators together with all their transitive dependencies.
#
# @param  filelist  Dictionary describing the operators of each backend (filelist.json)
#
# @param  operators Operators to resolve
#
# @param  backend   Name of the backend inside filelist
#
# @return A set of operators, as produced by repeated calls to collect_operators().
def resolve_operator_dependencies(filelist, operators, backend=''):
    resolved = collect_operators(filelist, operators, backend)

    # Keep collecting until a pass does not bring in any new operator
    while True:
        expanded = collect_operators(filelist, resolved, backend)
        if len(expanded) == len(resolved):
            return resolved
        resolved.update(expanded)
301
# @brief Read the custom build configuration from a JSON file or a JSON string.
#
# @param  build_config Path of a JSON file or, if no such file exists, the JSON text itself
#
# @return Three lists: the values of "operators", "data_types" and
#         "data_layouts". A list is empty when its key is missing or when the
#         configuration is not a valid JSON object (a warning is printed).
def read_build_config_json(build_config):
    build_config_contents = {}
    if os.path.isfile(build_config):
        with open(build_config) as f:
            try:
                build_config_contents = json.load(f)
            except ValueError:
                # json raises ValueError (JSONDecodeError) on malformed input
                print("Warning: Build configuration file is of invalid JSON format!")
    else:
        try:
            build_config_contents = json.loads(build_config)
        except (TypeError, ValueError):
            print("Warning: Build configuration string is of invalid JSON format!")

    # Valid JSON that is not an object (e.g. a list) has no keys to read
    if not isinstance(build_config_contents, dict):
        print("Warning: Build configuration is not a JSON object!")
        build_config_contents = {}

    custom_operators = build_config_contents.get("operators", [])
    custom_types = build_config_contents.get("data_types", [])
    custom_layouts = build_config_contents.get("data_layouts", [])
    return custom_operators, custom_types, custom_layouts
323
arm_compute_env = env.Clone()

# The version file is always rebuilt
version_file = arm_compute_env.Command("src/core/arm_compute_version.embed", "", action=create_version_file)
arm_compute_env.AlwaysBuild(version_file)

# C++ compiler: CXX from the environment, otherwise a per-OS default
if env['os'] in ['android', 'macos', 'openbsd']:
    default_cpp_compiler = 'clang++'
else:
    default_cpp_compiler = 'g++'
cpp_compiler = os.environ.get('CXX', default_cpp_compiler)

# Generate embed files
generate_embed = [ version_file ]
if env['opencl'] and env['embed_kernels']:

    # Header files
    cl_helper_files = [
        'src/core/CL/cl_kernels/activation_float_helpers.h',
        'src/core/CL/cl_kernels/activation_quant_helpers.h',
        'src/core/CL/cl_kernels/gemm_helpers.h',
        'src/core/CL/cl_kernels/helpers_asymm.h',
        'src/core/CL/cl_kernels/helpers.h',
        'src/core/CL/cl_kernels/load_store_utility.h',
        'src/core/CL/cl_kernels/repeat.h',
        'src/core/CL/cl_kernels/tile_helpers.h',
        'src/core/CL/cl_kernels/types.h',
        'src/core/CL/cl_kernels/warp_helpers.h',
        'src/core/CL/cl_kernels/common/experimental/gemm_fused_post_ops/act_eltwise_op_act/fp_post_ops_act_eltwise_op_act.h',
        'src/core/CL/cl_kernels/common/experimental/gemm_fused_post_ops/fp_mixed_precision_helpers.h',
        'src/core/CL/cl_kernels/common/experimental/gemm_fused_post_ops/fp_elementwise_op_helpers.h',
    ]

    # Common kernels
    cl_files_common = [
        'src/core/CL/cl_kernels/common/activation_layer.cl',
        'src/core/CL/cl_kernels/common/activation_layer_quant.cl',
        'src/core/CL/cl_kernels/common/arg_min_max.cl',
        'src/core/CL/cl_kernels/common/batchnormalization_layer.cl',
        'src/core/CL/cl_kernels/common/bounding_box_transform.cl',
        'src/core/CL/cl_kernels/common/bounding_box_transform_quantized.cl',
        'src/core/CL/cl_kernels/common/bitwise_op.cl',
        'src/core/CL/cl_kernels/common/cast.cl',
        'src/core/CL/cl_kernels/common/comparisons.cl',
        'src/core/CL/cl_kernels/common/concatenate.cl',
        'src/core/CL/cl_kernels/common/col2im.cl',
        'src/core/CL/cl_kernels/common/convert_fc_weights.cl',
        'src/core/CL/cl_kernels/common/copy_tensor.cl',
        'src/core/CL/cl_kernels/common/crop_tensor.cl',
        'src/core/CL/cl_kernels/common/deconvolution_layer.cl',
        'src/core/CL/cl_kernels/common/dequantization_layer.cl',
        'src/core/CL/cl_kernels/common/elementwise_operation.cl',
        'src/core/CL/cl_kernels/common/elementwise_operation_quantized.cl',
        'src/core/CL/cl_kernels/common/elementwise_unary.cl',
        'src/core/CL/cl_kernels/common/fft_digit_reverse.cl',
        'src/core/CL/cl_kernels/common/fft.cl',
        'src/core/CL/cl_kernels/common/fft_scale.cl',
        'src/core/CL/cl_kernels/common/fill_border.cl',
        'src/core/CL/cl_kernels/common/floor.cl',
        'src/core/CL/cl_kernels/common/gather.cl',
        'src/core/CL/cl_kernels/common/gemm.cl',
        'src/core/CL/cl_kernels/common/gemm_reshaped_only_rhs_mmul.cl',
        'src/core/CL/cl_kernels/common/gemm_utils.cl',
        'src/core/CL/cl_kernels/common/experimental/gemm_fused_post_ops/act_eltwise_op_act/gemm_mm_native.cl',
        'src/core/CL/cl_kernels/common/experimental/gemm_fused_post_ops/act_eltwise_op_act/gemm_mm_reshaped.cl',
        'src/core/CL/cl_kernels/common/experimental/gemm_fused_post_ops/act_eltwise_op_act/gemm_mm_reshaped_only_rhs.cl',
        'src/core/CL/cl_kernels/common/gemv.cl',
        'src/core/CL/cl_kernels/common/gemmlowp.cl',
        'src/core/CL/cl_kernels/common/gemmlowp_reshaped_only_rhs_mmul.cl',
        'src/core/CL/cl_kernels/common/generate_proposals.cl',
        'src/core/CL/cl_kernels/common/generate_proposals_quantized.cl',
        'src/core/CL/cl_kernels/common/instance_normalization.cl',
        'src/core/CL/cl_kernels/common/l2_normalize.cl',
        'src/core/CL/cl_kernels/common/mean_stddev_normalization.cl',
        'src/core/CL/cl_kernels/common/unpooling_layer.cl',
        'src/core/CL/cl_kernels/common/memset.cl',
        'src/core/CL/cl_kernels/common/nonmax.cl',
        'src/core/CL/cl_kernels/common/minmax_layer.cl',
        'src/core/CL/cl_kernels/common/pad_layer.cl',
        'src/core/CL/cl_kernels/common/permute.cl',
        'src/core/CL/cl_kernels/common/pixelwise_mul_float.cl',
        'src/core/CL/cl_kernels/common/pixelwise_mul_int.cl',
        'src/core/CL/cl_kernels/common/qlstm_layer_normalization.cl',
        'src/core/CL/cl_kernels/common/quantization_layer.cl',
        'src/core/CL/cl_kernels/common/range.cl',
        'src/core/CL/cl_kernels/common/reduction_operation.cl',
        'src/core/CL/cl_kernels/common/reshape_layer.cl',
        'src/core/CL/cl_kernels/common/convolution_layer.cl',
        'src/core/CL/cl_kernels/common/reverse.cl',
        'src/core/CL/cl_kernels/common/roi_align_layer.cl',
        'src/core/CL/cl_kernels/common/roi_align_layer_quantized.cl',
        'src/core/CL/cl_kernels/common/roi_pooling_layer.cl',
        'src/core/CL/cl_kernels/common/select.cl',
        'src/core/CL/cl_kernels/common/softmax_layer.cl',
        'src/core/CL/cl_kernels/common/softmax_layer_quantized.cl',
        'src/core/CL/cl_kernels/common/stack_layer.cl',
        'src/core/CL/cl_kernels/common/slice_ops.cl',
        'src/core/CL/cl_kernels/common/tile.cl',
        'src/core/CL/cl_kernels/common/transpose.cl',
    ]

    # NCHW kernels
    cl_files_nchw = [
        'src/core/CL/cl_kernels/nchw/batch_to_space.cl',
        'src/core/CL/cl_kernels/nchw/batchnormalization_layer.cl',
        'src/core/CL/cl_kernels/nchw/channel_shuffle.cl',
        'src/core/CL/cl_kernels/nchw/depth_to_space.cl',
        'src/core/CL/cl_kernels/nchw/direct_convolution.cl',
        'src/core/CL/cl_kernels/nchw/dequantization_layer.cl',
        'src/core/CL/cl_kernels/nchw/im2col.cl',
        'src/core/CL/cl_kernels/nchw/normalization_layer.cl',
        'src/core/CL/cl_kernels/nchw/normalize_planar_yuv_layer.cl',
        'src/core/CL/cl_kernels/nchw/normalize_planar_yuv_layer_quantized.cl',
        'src/core/CL/cl_kernels/nchw/pooling_layer.cl',
        'src/core/CL/cl_kernels/nchw/prior_box_layer.cl',
        'src/core/CL/cl_kernels/nchw/reorg_layer.cl',
        'src/core/CL/cl_kernels/nchw/scale.cl',
        'src/core/CL/cl_kernels/nchw/space_to_batch.cl',
        'src/core/CL/cl_kernels/nchw/space_to_depth.cl',
        'src/core/CL/cl_kernels/nchw/upsample_layer.cl',
        'src/core/CL/cl_kernels/nchw/winograd_filter_transform.cl',
        'src/core/CL/cl_kernels/nchw/winograd_input_transform.cl',
        'src/core/CL/cl_kernels/nchw/winograd_output_transform.cl',
    ]

    # NHWC kernels
    cl_files_nhwc = [
        'src/core/CL/cl_kernels/nhwc/batch_to_space.cl',
        'src/core/CL/cl_kernels/nhwc/batchnormalization_layer.cl',
        'src/core/CL/cl_kernels/nhwc/channel_shuffle.cl',
        'src/core/CL/cl_kernels/nhwc/direct_convolution.cl',
        'src/core/CL/cl_kernels/nhwc/direct_convolution3d.cl',
        'src/core/CL/cl_kernels/nhwc/depth_to_space.cl',
        'src/core/CL/cl_kernels/nhwc/dequantization_layer.cl',
        'src/core/CL/cl_kernels/nhwc/dwc_native_fp_nhwc.cl',
        'src/core/CL/cl_kernels/nhwc/dwc_native_quantized_nhwc.cl',
        'src/core/CL/cl_kernels/nhwc/im2col.cl',
        'src/core/CL/cl_kernels/nhwc/indirect_convolution.cl',
        'src/core/CL/cl_kernels/nhwc/normalization_layer.cl',
        'src/core/CL/cl_kernels/nhwc/normalize_planar_yuv_layer.cl',
        'src/core/CL/cl_kernels/nhwc/normalize_planar_yuv_layer_quantized.cl',
        'src/core/CL/cl_kernels/nhwc/pooling_layer.cl',
        'src/core/CL/cl_kernels/nhwc/pooling_3d_layer.cl',
        'src/core/CL/cl_kernels/nhwc/pooling_3d_layer_quantized.cl',
        'src/core/CL/cl_kernels/nhwc/pooling_layer_quantized.cl',
        'src/core/CL/cl_kernels/nhwc/reorg_layer.cl',
        'src/core/CL/cl_kernels/nhwc/scale.cl',
        'src/core/CL/cl_kernels/nhwc/space_to_batch.cl',
        'src/core/CL/cl_kernels/nhwc/space_to_depth.cl',
        'src/core/CL/cl_kernels/nhwc/transposed_convolution.cl',
        'src/core/CL/cl_kernels/nhwc/upsample_layer.cl',
        'src/core/CL/cl_kernels/nhwc/winograd_filter_transform.cl',
        'src/core/CL/cl_kernels/nhwc/winograd_input_transform.cl',
        'src/core/CL/cl_kernels/nhwc/winograd_output_transform.cl',
    ]

    cl_files = cl_helper_files + cl_files_common + cl_files_nchw + cl_files_nhwc

    # Each input gets an output of the same name with "embed" appended (foo.cl -> foo.clembed)
    embed_files = [ cl_file + "embed" for cl_file in cl_files ]
    arm_compute_env.Append(CPPPATH =[Dir("./src/core/CL/").path] )

    generate_embed.append(arm_compute_env.Command(embed_files, cl_files, action=resolve_includes))

Default(generate_embed)

# Nothing else to set up when only the embed files are requested
if env["build"] == "embed_only":
    Return()
481
# Append version defines for semantic versioning
version_defines = [('ARM_COMPUTE_VERSION_MAJOR', LIBRARY_VERSION_MAJOR),
                   ('ARM_COMPUTE_VERSION_MINOR', LIBRARY_VERSION_MINOR),
                   ('ARM_COMPUTE_VERSION_PATCH', LIBRARY_VERSION_PATCH)]
arm_compute_env.Append(CPPDEFINES = version_defines)

# Don't allow undefined references in the libraries:
if 'macos' in arm_compute_env["os"]:
    undefined_flag = '-Wl,-undefined,error'
else:
    undefined_flag = '-Wl,--no-undefined'
arm_compute_env.Append(LINKFLAGS=[undefined_flag])
arm_compute_env.Append(CPPPATH =[Dir("./src/core/").path] )

# Link against libdl everywhere except on windows and openbsd. The (empty)
# Append on windows is kept on purpose: it is a no-op for the value of LIBS.
if env['os'] != 'openbsd':
    platform_libs = [] if env['os'] == 'windows' else ['dl']
    arm_compute_env.Append(LIBS = platform_libs)
Jenkinsf8f7ede2023-02-16 15:41:23 +0000497
Renato Grottesi777c45c2023-05-08 13:04:07 +0000498
# Load build definitions file
with open(Dir('#').path + '/filedefs.json') as fd:
    filedefs = json.load(fd)['cpu']['arch']

# Load the list of source files of every backend
with open(Dir('#').path + '/filelist.json') as fp:
    filelist = json.load(fp)

# Common backend files. The list is copied so that extending lib_files below
# does not modify the contents of filelist.
lib_files = list(filelist['common'])

# Experimental files
# Dynamic fusion
if env['experimental_dynamic_fusion']:
    lib_files += filelist['experimental']['dynamic_fusion']

# Fixed format GEMM kernels.
if env['experimental_fixed_format_kernels']:
    arm_compute_env.Append(CPPDEFINES = ['ARM_COMPUTE_ENABLE_FIXED_FORMAT_KERNELS'])

# Logging files
if env["logging"]:
    lib_files += filelist['logging']

# C API files
lib_files += filelist['c_api']['common']
lib_files += filelist['c_api']['operators']

# Scheduler infrastructure
lib_files += filelist['scheduler']['single']
if env['cppthreads']:
    lib_files += filelist['scheduler']['threads']
if env['openmp']:
    lib_files += filelist['scheduler']['omp']

# Graph files
graph_files = Glob('src/graph/*.cpp')
graph_files += Glob('src/graph/*/*.cpp')

# Specify user-defined priority operators
custom_operators = []
custom_types = []
custom_layouts = []

use_custom_ops = env['high_priority'] or env['build_config']

if env['high_priority']:
    custom_operators = filelist['high_priority']
    custom_types = ['all']
    custom_layouts = ['all']

# A build configuration takes precedence over the high priority list
if env['build_config']:
    custom_operators, custom_types, custom_layouts = read_build_config_json(env['build_config'])

if env['opencl']:
    lib_files += filelist['c_api']['gpu']
    lib_files += filelist['gpu']['common']

    # Build either the requested operators or all the operators of the backend
    cl_operators = custom_operators if use_custom_ops else filelist['gpu']['operators'].keys()
    cl_ops_to_build = resolve_operator_dependencies(filelist, cl_operators, 'gpu')
    lib_files += get_operator_backend_files(filelist, cl_ops_to_build, 'gpu')['common']

    graph_files += Glob('src/graph/backends/CL/*.cpp')
564
Jenkins8f587de2022-02-26 12:23:41 +0000565
# Files that need SVE / SVE2 specific flags; they stay empty without Neon
lib_files_sve = []
lib_files_sve2 = []

if env['neon']:
    # build winograd/depthwise sources for either v7a / v8a
    neon_include_paths = ["src/core/NEON/kernels/convolution/common/",
                          "src/core/NEON/kernels/convolution/winograd/",
                          "src/core/NEON/kernels/arm_conv/depthwise/",
                          "src/core/NEON/kernels/arm_conv/pooling/",
                          "src/core/NEON/kernels/arm_conv/",
                          "src/core/NEON/kernels/assembly/",
                          "arm_compute/core/NEON/kernels/assembly/",
                          "src/cpu/kernels/assembly/"]
    arm_compute_env.Append(CPPPATH = neon_include_paths)

    lib_files += filelist['cpu']['common']

    # Setup SIMD file list to include
    simd = ['neon']
    if env['multi_isa']:
        simd += ['sve', 'sve2']
    else:
        simd += [isa for isa in ('sve', 'sve2') if isa in env['arch']]

    # Get attributes
    if use_custom_ops:
        attr_types, attr_layouts = custom_types, custom_layouts
    else:
        attr_types, attr_layouts = env['data_type_support'], env['data_layout_support']
    attrs = get_attrs_list(env, attr_types, attr_layouts)

    if env['experimental_fixed_format_kernels']:
        attrs.append("experimental_fixed_format_kernels")

    # Setup data-type and data-layout files to include
    if use_custom_ops:
        cpu_operators = custom_operators
    else:
        cpu_operators = filelist['cpu']['operators'].keys()
    cpu_ops_to_build = resolve_operator_dependencies(filelist, cpu_operators, 'cpu')

    cpu_files = get_operator_backend_files(filelist, cpu_ops_to_build, 'cpu', simd, attrs)

    # Shared among ALL CPU files, followed by the Arm® Neon™ specific files
    lib_files += cpu_files.get('common', [])
    lib_files += cpu_files.get('neon', [])

    # SVE files only
    lib_files_sve = cpu_files.get('sve', [])

    # SVE2 files only
    lib_files_sve2 = cpu_files.get('sve2', [])

    graph_files += Glob('src/graph/backends/NEON/*.cpp')
618
# Restrict from building graph API if a reduced operator list has been provided
if use_custom_ops:
    print("WARNING: Graph library requires all operators to be built")
    graph_files = []

# Build bootcode in case of bare-metal
if env['os'] == 'bare_metal':
    bootcode_files = Glob('bootcode/*.s')
    bootcode_o = build_bootcode_objs(bootcode_files)
else:
    bootcode_o = []
Export('bootcode_o')
630
Renato Grottesi777c45c2023-05-08 13:04:07 +0000631
# Shared libraries are built neither for bare-metal nor for standalone builds
build_shared_libs = env['os'] != 'bare_metal' and not env['standalone']

# STATIC library build.
if env['multi_isa']:
    # Objects are compiled per architecture first and then archived
    lib_static_objs, lib_shared_objs = build_lib_objects()
    static_sources = lib_static_objs
else:
    # Single ISA: the SVE / SVE2 files are built like any other file
    if 'sve2' in env['arch']:
        lib_files += lib_files_sve
        lib_files += lib_files_sve2
    elif 'sve' in env['arch']:
        lib_files += lib_files_sve
    static_sources = lib_files

arm_compute_a = build_library('arm_compute-static', arm_compute_env, static_sources, static=True)
Export('arm_compute_a')

# SHARED library build.
if build_shared_libs:
    shared_sources = lib_shared_objs if env['multi_isa'] else lib_files
    arm_compute_so = build_library('arm_compute', arm_compute_env, shared_sources, static=False)
    Export('arm_compute_so')

# Generate dummy core lib for backwards compatibility
# (macos static library archiver fails if given an empty list of files)
core_static_sources = lib_files if env['os'] == 'macos' else []
arm_compute_core_a = build_library('arm_compute_core-static', arm_compute_env, core_static_sources, static=True)
Export('arm_compute_core_a')

if build_shared_libs:
    arm_compute_core_a_so = build_library('arm_compute_core', arm_compute_env, [], static=False)
    Export('arm_compute_core_a_so')
Anthony Barbierdbdab852017-06-23 15:42:00 +0100672
arm_compute_graph_env = arm_compute_env.Clone()

# Build graph libraries
arm_compute_graph_env.Append(CXXFLAGS = ['-Wno-redundant-move', '-Wno-pessimizing-move'])

arm_compute_graph_a = build_library('arm_compute_graph-static', arm_compute_graph_env, graph_files, static=True, libs = [ arm_compute_a ])
Export('arm_compute_graph_a')

# The shared libraries (arm_compute_so included) only exist for builds that
# are neither bare-metal nor standalone
has_shared_libs = env['os'] != 'bare_metal' and not env['standalone']

if has_shared_libs:
    arm_compute_graph_so = build_library('arm_compute_graph', arm_compute_graph_env, graph_files, static=False, libs = [ "arm_compute" ])
    Depends(arm_compute_graph_so, arm_compute_so)
    Export('arm_compute_graph_so')

# The alias refers to the shared library only when it has been built, so a
# bare-metal build without standalone=1 no longer fails with a NameError
alias_targets = [arm_compute_a]
if has_shared_libs:
    alias_targets.append(arm_compute_so)
alias = arm_compute_env.Alias("arm_compute", alias_targets)

Default(alias)

# The libraries embed the generated files, whatever the kind of build
Depends([alias], generate_embed)
Renato Grottesi777c45c2023-05-08 13:04:07 +0000696 Depends([alias], generate_embed)