#!/usr/bin/python
# -*- coding: utf-8 -*-

# Copyright (c) 2016-2023 Arm Limited.
#
# SPDX-License-Identifier: MIT
#
# Permission is hereby granted, free of charge, to any person obtaining a copy
# of this software and associated documentation files (the "Software"), to
# deal in the Software without restriction, including without limitation the
# rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
# sell copies of the Software, and to permit persons to whom the Software is
# furnished to do so, subject to the following conditions:
#
# The above copyright notice and this permission notice shall be included in all
# copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
# SOFTWARE.

import collections
import os.path
import re
import subprocess
import zlib
import json
import codecs

# Release tag embedded in the version file, and the semantic version used for
# the shared-library SONAME and the ARM_COMPUTE_VERSION_* defines.
VERSION = "v23.02.1"
LIBRARY_VERSION_MAJOR = 30
LIBRARY_VERSION_MINOR = 0
LIBRARY_VERSION_PATCH = 1
SONAME_VERSION = ".".join(str(part) for part in (LIBRARY_VERSION_MAJOR,
                                                 LIBRARY_VERSION_MINOR,
                                                 LIBRARY_VERSION_PATCH))

Import('env')
Import('vars')
Import('install_lib')


# @brief Build the bootcode sources into objects and make them default targets.
#
# @param sources A list of bootcode source files to build.
#
# @return The value returned by install_lib() for the built objects.

def build_bootcode_objs(sources):
    # The bootcode sources are assembled with bootcode/ on the include path.
    arm_compute_env.Append(ASFLAGS = "-I bootcode/")
    bootcode_objs = install_lib(arm_compute_env.Object(sources))
    Default(bootcode_objs)
    return bootcode_objs


# @brief Create a list of objects from a given file list.
#
# @param arch_info A dictionary represents the architecture info such as the
#                  compiler flags and defines (filedefs.json).
#
# @param sources A list of files to build
#
# @param static Build static objects when True, shared objects otherwise.
#
# @return A list of objects for the corresponding architecture.

def build_obj_list(arch_info, sources, static=False):

    # Clone the environment so the architecture flags stay local to these objects
    tmp_env = arm_compute_env.Clone()

    # Append architecture spec (skipped when the entry is missing or empty)
    if 'cxxflags' in arch_info and arch_info['cxxflags']:
        tmp_env.Append(CXXFLAGS = arch_info['cxxflags'])

    # Build and return objects
    if static:
        objs = tmp_env.StaticObject(sources)
    else:
        objs = tmp_env.SharedObject(sources)

    tmp_env.Default(objs)
    return objs


# @brief Build multi-ISA files with the respective architecture.
#
# Reads the module-level lib_files, lib_files_sve, lib_files_sve2 and filedefs,
# and appends the ISA feature defines to the shared arm_compute_env.
#
# @return Two distinct lists:
#         A list of static objects
#         A list of shared objects

def build_lib_objects():
    lib_static_objs = [] # static objects
    lib_shared_objs = [] # shared objects

    arm_compute_env.Append(CPPDEFINES = ['ENABLE_NEON', 'ARM_COMPUTE_ENABLE_NEON',
                                         'ENABLE_SVE', 'ARM_COMPUTE_ENABLE_SVE',
                                         'ARM_COMPUTE_ENABLE_FP16', 'ARM_COMPUTE_ENABLE_BF16',
                                         'ARM_COMPUTE_ENABLE_I8MM', 'ARM_COMPUTE_ENABLE_SVEF32MM'])

    # Build all the common files for the base architecture
    lib_static_objs += build_obj_list(filedefs["armv8.2-a"], lib_files, static=True)
    lib_shared_objs += build_obj_list(filedefs["armv8.2-a"], lib_files, static=False)

    # Build the SVE specific files
    lib_static_objs += build_obj_list(filedefs["armv8.2-a-sve"], lib_files_sve, static=True)
    lib_shared_objs += build_obj_list(filedefs["armv8.2-a-sve"], lib_files_sve, static=False)

    # Build the SVE2 specific files.
    # build_obj_list() clones arm_compute_env at call time, so appending the
    # SVE2 define only now keeps it out of the clones used for the objects above.
    arm_compute_env.Append(CPPDEFINES = ['ARM_COMPUTE_ENABLE_SVE2'])
    lib_static_objs += build_obj_list(filedefs["armv8.6-a-sve2"], lib_files_sve2, static=True)
    lib_shared_objs += build_obj_list(filedefs["armv8.6-a-sve2"], lib_files_sve2, static=False)

    return lib_static_objs, lib_shared_objs


# @brief Build a static or shared library and make it a default target.
#
# @param name      Library name handed to the SCons library builder.
# @param build_env Environment to clone for the build.
# @param sources   Sources or objects that make up the library.
# @param static    Build a static library when True, a shared one otherwise.
# @param libs      Extra libraries appended to arm_compute_env["LIBS"]
#                  (None, the default, means no extra libraries).
#
# @return The value returned by install_lib() for the library.

def build_library(name, build_env, sources, static=False, libs=None):
    # A None sentinel replaces the former mutable default argument.
    extra_libs = [] if libs is None else libs
    link_libs = arm_compute_env["LIBS"] + extra_libs

    cloned_build_env = build_env.Clone()
    if env['os'] == 'android' and not static:
        # Executable-only link flags are dropped from Android shared libraries.
        cloned_build_env["LINKFLAGS"].remove('-pie')
        cloned_build_env["LINKFLAGS"].remove('-static-libstdc++')

    if static:
        obj = cloned_build_env.StaticLibrary(name, source=sources, LIBS = link_libs)
    elif env['set_soname']:
        obj = cloned_build_env.SharedLibrary(name, source=sources, SHLIBVERSION = SONAME_VERSION, LIBS = link_libs)
    else:
        obj = cloned_build_env.SharedLibrary(name, source=sources, LIBS = link_libs)

    if env['mapfile']:
        if not 'windows' in env['os'] and not 'macos' in env['os']:
            cloned_build_env['LINKFLAGS'].append('"-Wl,-Map='+ name + '.map"')
        else:
            cloned_build_env['LINKFLAGS'].append('-Wl,-map,' + name + '.map')

    obj = install_lib(obj)
    build_env.Default(obj)
    return obj


# @brief Replace C-style comments in a source string with a single space.
#
# String and character literals are matched by the same pattern and returned
# unchanged, so comment markers inside literals are preserved.
#
# @param code Source text to process.
#
# @return The source text with // and /* */ comments replaced by " ".

def remove_incode_comments(code):
    def replace_with_empty(match):
        matched_text = match.group(0)
        # Only comments start with '/'; literals start with a quote character.
        if matched_text.startswith('/'):
            return " "
        return matched_text

    comment_regex = re.compile(r'//.*?$|/\*.*?\*/|\'(?:\\.|[^\\\'])*\'|"(?:\\.|[^\\"])*"', re.DOTALL | re.MULTILINE)
    return re.sub(comment_regex, replace_with_empty, code)


# @brief SCons action: strip comments, inline local #include "..." directives
#        and write each source out as a C++ raw string literal.
#
# @param target Output nodes, paired by position with source.
# @param source Input nodes; included headers must be part of this list.
# @param env    Construction environment; 'compress_kernels' selects
#               zlib + base64 encoding of the written contents.
#
# Raises KeyError when an included file name is not among the sources.

def resolve_includes(target, source, env):
    # File collection
    FileEntry = collections.namedtuple('FileEntry', 'target_name file_contents')

    # Include pattern
    pattern = re.compile(r'#include "(.*)"')

    # Get file contents, keyed by base name
    files = []
    for src, dst in zip(source, target):
        contents = src.get_contents().decode('utf-8')
        contents = remove_incode_comments(contents).splitlines()
        entry = FileEntry(target_name=dst, file_contents=contents)
        files.append((os.path.basename(src.get_path()), entry))

    # Create dictionary of tupled list
    files_dict = dict(files)

    # Check for includes (can only be files in the same folder)
    final_files = []
    for file_name, file_entry in files:
        lines = file_entry.file_contents
        # Expand repeatedly until a pass replaces no include, because an
        # inlined header may itself contain further includes.
        while True:
            expanded = []
            replaced_include = False
            for line in lines:
                found = pattern.search(line)
                if found:
                    # Only get the header file name and discard the relative path.
                    # E.g. "common/experimental/gemm_fused_post_ops/fp_mixed_precision_helpers.h" -> "fp_mixed_precision_helpers.h"
                    include_file = found.group(1).split('/')[-1]
                    expanded.extend(files_dict[include_file].file_contents)
                    replaced_include = True
                else:
                    expanded.append(line)

            lines = expanded
            if not replaced_include:
                break

        final_files.append((file_name, FileEntry(target_name=file_entry.target_name, file_contents=lines)))

    # Write output files wrapped in string literal identifiers
    for _, file_entry in final_files:
        file_to_write = "\n".join(file_entry.file_contents)
        if env['compress_kernels']:
            file_to_write = zlib.compress(file_to_write.encode('utf-8'), 9)
            file_to_write = codecs.encode(file_to_write, "base64").decode('utf-8').replace("\n", "")
        file_to_write = "R\"(" + file_to_write + ")\""
        with open(file_entry.target_name.get_path(), 'w') as out_file:
            out_file.write(file_to_write)


# @brief SCons action: write the build-information string embedded in the library.
#
# The string holds VERSION, the build options (vars.args) and the git hash of
# HEAD, or "unknown" when git cannot be run or fails.
#
# @param target Output nodes; only target[0] is written.
# @param source Unused.
# @param env    Unused.

def create_version_file(target, source, env):
    # Generate string with build options library version to embed in the library:
    try:
        git_hash = subprocess.check_output(["git", "rev-parse", "HEAD"])
    except (OSError, subprocess.CalledProcessError):
        git_hash = "unknown"

    # check_output() returns bytes; decode so that the hash is not formatted
    # as a bytes repr (b'...') in the embedded string.
    if isinstance(git_hash, bytes):
        git_hash = git_hash.decode('utf-8', 'replace')

    build_info = "\"arm_compute_version=%s Build options: %s Git hash=%s\"" % (VERSION, vars.args, git_hash.strip())
    with open(target[0].get_path(), "w") as fd:
        fd.write(build_info)


# @brief Build the attribute list used to select operator source files.
#
# @param env          Build environment; 'estate' and 'arch' are read.
# @param data_types   Requested data types, or a collection containing 'all'.
# @param data_layouts Requested data layouts, or a collection containing 'all'.
#
# @return Data-type attributes, then data-layout attributes, then one
#         execution-state attribute ('estate32' or 'estate64').

def get_attrs_list(env, data_types, data_layouts):
    known_types = ['fp16', 'fp32', 'integer', 'qasymm8', 'qasymm8_signed', 'qsymm16']
    known_layouts = ['nhwc', 'nchw']
    attrs = []

    # Manage data-types
    if 'all' in data_types:
        attrs += known_types
    else:
        attrs += [data_type for data_type in known_types if data_type in data_types]

    # Manage data-layouts
    if 'all' in data_layouts:
        attrs += known_layouts
    else:
        attrs += [layout for layout in known_layouts if layout in data_layouts]

    # Manage execution state
    attrs += ['estate32' if (env['estate'] == 'auto' and 'v7a' in env['arch']) or '32' in env['estate'] else 'estate64']

    return attrs


# @brief Return the items of a list without duplicates, keeping first-seen order.

def _unique_in_order(items):
    seen = set()
    unique = []
    for item in items:
        if item not in seen:
            seen.add(item)
            unique.append(item)
    return unique


# @brief Collect the source files needed by a set of operators on one backend.
#
# @param filelist  Parsed file list (filelist.json).
# @param operators Operators to collect files for; unknown ones are ignored.
# @param backend   Key of the backend inside filelist.
# @param techs     Technology keys whose files are collected
#                  (None, the default, means none).
# @param attrs     Attribute keys selecting extra per-technology files
#                  (None, the default, means none).
#
# @return A dictionary with a "common" entry plus one entry per technology
#         that was found; each value is a duplicate-free list of files.

def get_operator_backend_files(filelist, operators, backend='', techs=None, attrs=None):
    techs = [] if techs is None else techs
    attrs = [] if attrs is None else attrs
    files = { "common" : [] }

    # Early return if the backend has no entry in the file list
    if backend not in filelist:
        return files

    backend_operators = filelist[backend]['operators']

    # Iterate over operators and create the file lists to compile
    for operator in operators:
        if operator not in backend_operators:
            continue

        operator_files = backend_operators[operator]["files"]
        files['common'] += operator_files["common"]
        for tech in techs:
            if tech in operator_files:
                # Add tech files to the tech file list, creating it on first use
                tech_files = operator_files[tech]
                tech_list = files.setdefault(tech, [])
                tech_list += tech_files.get('common', [])
                for attr in attrs:
                    tech_list += tech_files.get(attr, [])

    # Remove duplicates if they exist. First-seen order is kept so that the
    # source order handed to SCons does not depend on set iteration order.
    return {k: _unique_in_order(v) for k, v in files.items()}


# @brief Return the supported operators from a list plus their direct 'deps'.
#
# Prints a message for every operator missing from the backend.
#
# @return A set of operator names.

def collect_operators(filelist, operators, backend=''):
    backend_operators = filelist[backend]['operators']
    ops = set()
    for operator in operators:
        if operator in backend_operators:
            ops.add(operator)
            if 'deps' in backend_operators[operator]:
                ops.update(backend_operators[operator]['deps'])
        else:
            print("Operator {0} is unsupported on {1} backend!".format(operator, backend))

    return ops


# @brief Expand a list of operators with their dependencies, transitively.
#
# @return A set of operator names.

def resolve_operator_dependencies(filelist, operators, backend=''):
    resolved_operators = collect_operators(filelist, operators, backend)

    # Repeat until a pass no longer changes the number of operators
    while True:
        resolution_pass = collect_operators(filelist, resolved_operators, backend)
        if len(resolution_pass) == len(resolved_operators):
            break
        resolved_operators.update(resolution_pass)

    return resolved_operators


# @brief Read a build configuration given as a JSON file path or a JSON string.
#
# Invalid JSON only produces a warning; the result is then three empty lists.
#
# @param build_config Path to a JSON file, or the JSON text itself.
#
# @return The "operators", "data_types" and "data_layouts" entries, each
#         defaulting to an empty list.

def read_build_config_json(build_config):
    build_config_contents = {}
    custom_operators = []
    custom_types = []
    custom_layouts = []
    if os.path.isfile(build_config):
        with open(build_config) as f:
            try:
                build_config_contents = json.load(f)
            # Malformed JSON raises a ValueError subclass; a narrow clause
            # keeps KeyboardInterrupt and SystemExit from being swallowed.
            except (ValueError, TypeError):
                print("Warning: Build configuration file is of invalid JSON format!")
    else:
        try:
            build_config_contents = json.loads(build_config)
        except (ValueError, TypeError):
            print("Warning: Build configuration string is of invalid JSON format!")
    if build_config_contents:
        custom_operators = build_config_contents.get("operators", [])
        custom_types = build_config_contents.get("data_types", [])
        custom_layouts = build_config_contents.get("data_layouts", [])
    return custom_operators, custom_types, custom_layouts


arm_compute_env = env.Clone()

# The version file is regenerated on every build
version_file = arm_compute_env.Command("src/core/arm_compute_version.embed", "", action=create_version_file)
arm_compute_env.AlwaysBuild(version_file)

default_cpp_compiler = 'g++' if env['os'] not in ['android', 'macos', 'openbsd'] else 'clang++'
cpp_compiler = os.environ.get('CXX', default_cpp_compiler)

# Generate embed files
generate_embed = [version_file]
if env['opencl'] and env['embed_kernels']:

    # Header files
    cl_helper_files = [
        'src/core/CL/cl_kernels/activation_float_helpers.h',
        'src/core/CL/cl_kernels/activation_quant_helpers.h',
        'src/core/CL/cl_kernels/gemm_helpers.h',
        'src/core/CL/cl_kernels/helpers_asymm.h',
        'src/core/CL/cl_kernels/helpers.h',
        'src/core/CL/cl_kernels/load_store_utility.h',
        'src/core/CL/cl_kernels/repeat.h',
        'src/core/CL/cl_kernels/tile_helpers.h',
        'src/core/CL/cl_kernels/types.h',
        'src/core/CL/cl_kernels/warp_helpers.h',
        'src/core/CL/cl_kernels/common/experimental/gemm_fused_post_ops/act_eltwise_op_act/fp_post_ops_act_eltwise_op_act.h',
        'src/core/CL/cl_kernels/common/experimental/gemm_fused_post_ops/fp_mixed_precision_helpers.h',
        'src/core/CL/cl_kernels/common/experimental/gemm_fused_post_ops/fp_elementwise_op_helpers.h',
    ]

    # Common kernels
    cl_files_common = [
        'src/core/CL/cl_kernels/common/activation_layer.cl',
        'src/core/CL/cl_kernels/common/activation_layer_quant.cl',
        'src/core/CL/cl_kernels/common/arg_min_max.cl',
        'src/core/CL/cl_kernels/common/batchnormalization_layer.cl',
        'src/core/CL/cl_kernels/common/bounding_box_transform.cl',
        'src/core/CL/cl_kernels/common/bounding_box_transform_quantized.cl',
        'src/core/CL/cl_kernels/common/bitwise_op.cl',
        'src/core/CL/cl_kernels/common/cast.cl',
        'src/core/CL/cl_kernels/common/comparisons.cl',
        'src/core/CL/cl_kernels/common/concatenate.cl',
        'src/core/CL/cl_kernels/common/col2im.cl',
        'src/core/CL/cl_kernels/common/convert_fc_weights.cl',
        'src/core/CL/cl_kernels/common/copy_tensor.cl',
        'src/core/CL/cl_kernels/common/crop_tensor.cl',
        'src/core/CL/cl_kernels/common/deconvolution_layer.cl',
        'src/core/CL/cl_kernels/common/dequantization_layer.cl',
        'src/core/CL/cl_kernels/common/elementwise_operation.cl',
        'src/core/CL/cl_kernels/common/elementwise_operation_quantized.cl',
        'src/core/CL/cl_kernels/common/elementwise_unary.cl',
        'src/core/CL/cl_kernels/common/fft_digit_reverse.cl',
        'src/core/CL/cl_kernels/common/fft.cl',
        'src/core/CL/cl_kernels/common/fft_scale.cl',
        'src/core/CL/cl_kernels/common/fill_border.cl',
        'src/core/CL/cl_kernels/common/floor.cl',
        'src/core/CL/cl_kernels/common/gather.cl',
        'src/core/CL/cl_kernels/common/gemm.cl',
        'src/core/CL/cl_kernels/common/gemm_reshaped_only_rhs_mmul.cl',
        'src/core/CL/cl_kernels/common/gemm_utils.cl',
        'src/core/CL/cl_kernels/common/experimental/gemm_fused_post_ops/act_eltwise_op_act/gemm_mm_native.cl',
        'src/core/CL/cl_kernels/common/experimental/gemm_fused_post_ops/act_eltwise_op_act/gemm_mm_reshaped.cl',
        'src/core/CL/cl_kernels/common/experimental/gemm_fused_post_ops/act_eltwise_op_act/gemm_mm_reshaped_only_rhs.cl',
        'src/core/CL/cl_kernels/common/gemv.cl',
        'src/core/CL/cl_kernels/common/gemmlowp.cl',
        'src/core/CL/cl_kernels/common/gemmlowp_reshaped_only_rhs_mmul.cl',
        'src/core/CL/cl_kernels/common/generate_proposals.cl',
        'src/core/CL/cl_kernels/common/generate_proposals_quantized.cl',
        'src/core/CL/cl_kernels/common/instance_normalization.cl',
        'src/core/CL/cl_kernels/common/l2_normalize.cl',
        'src/core/CL/cl_kernels/common/mean_stddev_normalization.cl',
        'src/core/CL/cl_kernels/common/unpooling_layer.cl',
        'src/core/CL/cl_kernels/common/memset.cl',
        'src/core/CL/cl_kernels/common/nonmax.cl',
        'src/core/CL/cl_kernels/common/minmax_layer.cl',
        'src/core/CL/cl_kernels/common/pad_layer.cl',
        'src/core/CL/cl_kernels/common/permute.cl',
        'src/core/CL/cl_kernels/common/pixelwise_mul_float.cl',
        'src/core/CL/cl_kernels/common/pixelwise_mul_int.cl',
        'src/core/CL/cl_kernels/common/qlstm_layer_normalization.cl',
        'src/core/CL/cl_kernels/common/quantization_layer.cl',
        'src/core/CL/cl_kernels/common/range.cl',
        'src/core/CL/cl_kernels/common/reduction_operation.cl',
        'src/core/CL/cl_kernels/common/reshape_layer.cl',
        'src/core/CL/cl_kernels/common/convolution_layer.cl',
        'src/core/CL/cl_kernels/common/reverse.cl',
        'src/core/CL/cl_kernels/common/roi_align_layer.cl',
        'src/core/CL/cl_kernels/common/roi_align_layer_quantized.cl',
        'src/core/CL/cl_kernels/common/roi_pooling_layer.cl',
        'src/core/CL/cl_kernels/common/select.cl',
        'src/core/CL/cl_kernels/common/softmax_layer.cl',
        'src/core/CL/cl_kernels/common/softmax_layer_quantized.cl',
        'src/core/CL/cl_kernels/common/stack_layer.cl',
        'src/core/CL/cl_kernels/common/slice_ops.cl',
        'src/core/CL/cl_kernels/common/tile.cl',
        'src/core/CL/cl_kernels/common/transpose.cl',
    ]

    # NCHW kernels
    cl_files_nchw = [
        'src/core/CL/cl_kernels/nchw/batch_to_space.cl',
        'src/core/CL/cl_kernels/nchw/batchnormalization_layer.cl',
        'src/core/CL/cl_kernels/nchw/channel_shuffle.cl',
        'src/core/CL/cl_kernels/nchw/depth_to_space.cl',
        'src/core/CL/cl_kernels/nchw/direct_convolution.cl',
        'src/core/CL/cl_kernels/nchw/dequantization_layer.cl',
        'src/core/CL/cl_kernels/nchw/im2col.cl',
        'src/core/CL/cl_kernels/nchw/normalization_layer.cl',
        'src/core/CL/cl_kernels/nchw/normalize_planar_yuv_layer.cl',
        'src/core/CL/cl_kernels/nchw/normalize_planar_yuv_layer_quantized.cl',
        'src/core/CL/cl_kernels/nchw/pooling_layer.cl',
        'src/core/CL/cl_kernels/nchw/prior_box_layer.cl',
        'src/core/CL/cl_kernels/nchw/reorg_layer.cl',
        'src/core/CL/cl_kernels/nchw/scale.cl',
        'src/core/CL/cl_kernels/nchw/space_to_batch.cl',
        'src/core/CL/cl_kernels/nchw/space_to_depth.cl',
        'src/core/CL/cl_kernels/nchw/upsample_layer.cl',
        'src/core/CL/cl_kernels/nchw/winograd_filter_transform.cl',
        'src/core/CL/cl_kernels/nchw/winograd_input_transform.cl',
        'src/core/CL/cl_kernels/nchw/winograd_output_transform.cl',
    ]

    # NHWC kernels
    cl_files_nhwc = [
        'src/core/CL/cl_kernels/nhwc/batch_to_space.cl',
        'src/core/CL/cl_kernels/nhwc/batchnormalization_layer.cl',
        'src/core/CL/cl_kernels/nhwc/channel_shuffle.cl',
        'src/core/CL/cl_kernels/nhwc/direct_convolution.cl',
        'src/core/CL/cl_kernels/nhwc/direct_convolution3d.cl',
        'src/core/CL/cl_kernels/nhwc/depth_to_space.cl',
        'src/core/CL/cl_kernels/nhwc/dequantization_layer.cl',
        'src/core/CL/cl_kernels/nhwc/dwc_native_fp_nhwc.cl',
        'src/core/CL/cl_kernels/nhwc/dwc_native_quantized_nhwc.cl',
        'src/core/CL/cl_kernels/nhwc/im2col.cl',
        'src/core/CL/cl_kernels/nhwc/indirect_convolution.cl',
        'src/core/CL/cl_kernels/nhwc/normalization_layer.cl',
        'src/core/CL/cl_kernels/nhwc/normalize_planar_yuv_layer.cl',
        'src/core/CL/cl_kernels/nhwc/normalize_planar_yuv_layer_quantized.cl',
        'src/core/CL/cl_kernels/nhwc/pooling_layer.cl',
        'src/core/CL/cl_kernels/nhwc/pooling_3d_layer.cl',
        'src/core/CL/cl_kernels/nhwc/pooling_3d_layer_quantized.cl',
        'src/core/CL/cl_kernels/nhwc/pooling_layer_quantized.cl',
        'src/core/CL/cl_kernels/nhwc/reorg_layer.cl',
        'src/core/CL/cl_kernels/nhwc/scale.cl',
        'src/core/CL/cl_kernels/nhwc/space_to_batch.cl',
        'src/core/CL/cl_kernels/nhwc/space_to_depth.cl',
        'src/core/CL/cl_kernels/nhwc/transposed_convolution.cl',
        'src/core/CL/cl_kernels/nhwc/upsample_layer.cl',
        'src/core/CL/cl_kernels/nhwc/winograd_filter_transform.cl',
        'src/core/CL/cl_kernels/nhwc/winograd_input_transform.cl',
        'src/core/CL/cl_kernels/nhwc/winograd_output_transform.cl',
    ]

    cl_files = cl_helper_files + cl_files_common + cl_files_nchw + cl_files_nhwc

    # Every input gets an output named after it with an "embed" suffix
    embed_files = [cl_file + "embed" for cl_file in cl_files]
    arm_compute_env.Append(CPPPATH =[Dir("./src/core/CL/").path] )

    embed_command = arm_compute_env.Command(embed_files, cl_files, action=resolve_includes)
    generate_embed.append(embed_command)

Default(generate_embed)

# Nothing but the embed files is wanted for an "embed_only" build
if env["build"] == "embed_only":
    Return()

# Append version defines for semantic versioning
arm_compute_env.Append(CPPDEFINES = [('ARM_COMPUTE_VERSION_MAJOR', LIBRARY_VERSION_MAJOR),
                                     ('ARM_COMPUTE_VERSION_MINOR', LIBRARY_VERSION_MINOR),
                                     ('ARM_COMPUTE_VERSION_PATCH', LIBRARY_VERSION_PATCH)])

# Don't allow undefined references in the libraries:
if 'macos' in arm_compute_env["os"]:
    undefined_flag = '-Wl,-undefined,error'
else:
    undefined_flag = '-Wl,--no-undefined'
arm_compute_env.Append(LINKFLAGS=[undefined_flag])
arm_compute_env.Append(CPPPATH =[Dir("./src/core/").path] )

# 'dl' is linked everywhere except on openbsd (no LIBS change) and windows (empty list)
if env['os'] != 'openbsd':
    arm_compute_env.Append(LIBS = [] if env['os'] == 'windows' else ['dl'])


# Load build definitions file, keeping only the CPU architecture table
with (open(Dir('#').path + '/filedefs.json')) as fd:
    filedefs = json.load(fd)['cpu']['arch']


# Load the list of source files
with (open(Dir('#').path + '/filelist.json')) as fp:
    filelist = json.load(fp)

# Common backend files
lib_files = filelist['common']

# Experimental files
# Dynamic fusion
if env['experimental_dynamic_fusion']:
    lib_files += filelist['experimental']['dynamic_fusion']

# Fixed format GEMM kernels.
if env['experimental_fixed_format_kernels']:
    arm_compute_env.Append(CPPDEFINES = ['ARM_COMPUTE_ENABLE_FIXED_FORMAT_KERNELS'])


# Logging files
if env["logging"]:
    lib_files += filelist['logging']

# C API files
c_api_files = filelist['c_api']
lib_files += c_api_files['common']
lib_files += c_api_files['operators']

# Scheduler infrastructure: the single-threaded scheduler is always built,
# the threaded ones depend on the build options
scheduler_files = filelist['scheduler']
lib_files += scheduler_files['single']
if env['cppthreads']:
    lib_files += scheduler_files['threads']
if env['openmp']:
    lib_files += scheduler_files['omp']

# Graph files
graph_files = Glob('src/graph/*.cpp')
graph_files += Glob('src/graph/*/*.cpp')

# Specify user-defined priority operators
custom_operators = []
custom_types = []
custom_layouts = []

use_custom_ops = env['high_priority'] or env['build_config']

if env['high_priority']:
    custom_operators = filelist['high_priority']
    custom_types = ['all']
    custom_layouts = ['all']

# A build configuration replaces the high-priority selection when both are given
if env['build_config']:
    custom_operators, custom_types, custom_layouts = read_build_config_json(env['build_config'])

if env['opencl']:
    lib_files += filelist['c_api']['gpu']
    lib_files += filelist['gpu']['common']

    if use_custom_ops:
        cl_operators = custom_operators
    else:
        cl_operators = filelist['gpu']['operators'].keys()
    cl_ops_to_build = resolve_operator_dependencies(filelist, cl_operators, 'gpu')
    lib_files += get_operator_backend_files(filelist, cl_ops_to_build, 'gpu')['common']

    graph_files += Glob('src/graph/backends/CL/*.cpp')


lib_files_sve = []
lib_files_sve2 = []

if env['neon']:
    # build winograd/depthwise sources for either v7a / v8a
    arm_compute_env.Append(CPPPATH = ["src/core/NEON/kernels/convolution/common/",
                                      "src/core/NEON/kernels/convolution/winograd/",
                                      "src/core/NEON/kernels/arm_conv/depthwise/",
                                      "src/core/NEON/kernels/arm_conv/pooling/",
                                      "src/core/NEON/kernels/arm_conv/",
                                      "src/core/NEON/kernels/assembly/",
                                      "arm_compute/core/NEON/kernels/assembly/",
                                      "src/cpu/kernels/assembly/"])

    lib_files += filelist['cpu']['common']

    # Setup SIMD file list to include
    if env['multi_isa']:
        simd = ['neon', 'sve', 'sve2']
    else:
        simd = ['neon'] + [isa for isa in ('sve', 'sve2') if isa in env['arch']]

    # Get attributes
    if use_custom_ops:
        attrs = get_attrs_list(env, custom_types, custom_layouts)
    else:
        attrs = get_attrs_list(env, env['data_type_support'], env['data_layout_support'])

    if env['experimental_fixed_format_kernels']:
        attrs.append("experimental_fixed_format_kernels")

    # Setup data-type and data-layout files to include
    if use_custom_ops:
        cpu_operators = custom_operators
    else:
        cpu_operators = filelist['cpu']['operators'].keys()
    cpu_ops_to_build = resolve_operator_dependencies(filelist, cpu_operators, 'cpu')

    cpu_files = get_operator_backend_files(filelist, cpu_ops_to_build, 'cpu', simd, attrs)

    # Shared among ALL CPU files
    lib_files += cpu_files.get('common', [])

    # Arm® Neon™ specific files
    lib_files += cpu_files.get('neon', [])

    # SVE files only
    lib_files_sve = cpu_files.get('sve', [])

    # SVE2 files only
    lib_files_sve2 = cpu_files.get('sve2', [])

    graph_files += Glob('src/graph/backends/NEON/*.cpp')

# Restrict from building graph API if a reduced operator list has been provided
if use_custom_ops:
    print("WARNING: Graph library requires all operators to be built")
    graph_files = []

# Build bootcode in case of bare-metal
bootcode_o = []
if env['os'] == 'bare_metal':
    bootcode_files = Glob('bootcode/*.s')
    bootcode_o = build_bootcode_objs(bootcode_files)
Export('bootcode_o')


# Multi-ISA builds compile per-architecture object lists up front
if env['multi_isa']:
    lib_static_objs, lib_shared_objs = build_lib_objects()


# STATIC library build.
if env['multi_isa']:
    arm_compute_a = build_library('arm_compute-static', arm_compute_env, lib_static_objs, static=True)
else:
    # Single-ISA build: fold the SVE/SVE2 sources selected by 'arch' into the
    # common file list (SVE2 also takes the SVE files)
    if 'sve2' in env['arch']:
        lib_files += lib_files_sve
        lib_files += lib_files_sve2
    elif 'sve' in env['arch']:
        lib_files += lib_files_sve

    arm_compute_a = build_library('arm_compute-static', arm_compute_env, lib_files, static=True)

Export('arm_compute_a')

# Shared libraries are built for neither bare-metal nor standalone builds.
# The condition is computed once so that every user of the shared targets
# below agrees on whether they exist.
build_shared_libs = env['os'] != 'bare_metal' and not env['standalone']

# SHARED library build.
if build_shared_libs:
    if env['multi_isa']:
        arm_compute_so = build_library('arm_compute', arm_compute_env, lib_shared_objs, static=False)
    else:
        arm_compute_so = build_library('arm_compute', arm_compute_env, lib_files, static=False)

    Export('arm_compute_so')

# Generate dummy core lib for backwards compatibility
if env['os'] == 'macos':
    # macos static library archiver fails if given an empty list of files
    arm_compute_core_a = build_library('arm_compute_core-static', arm_compute_env, lib_files, static=True)
else:
    arm_compute_core_a = build_library('arm_compute_core-static', arm_compute_env, [], static=True)

Export('arm_compute_core_a')

if build_shared_libs:
    arm_compute_core_a_so = build_library('arm_compute_core', arm_compute_env, [], static=False)
    Export('arm_compute_core_a_so')

arm_compute_graph_env = arm_compute_env.Clone()

# Build graph libraries
arm_compute_graph_env.Append(CXXFLAGS = ['-Wno-redundant-move', '-Wno-pessimizing-move'])

arm_compute_graph_a = build_library('arm_compute_graph-static', arm_compute_graph_env, graph_files, static=True, libs = [ arm_compute_a ])
Export('arm_compute_graph_a')

if build_shared_libs:
    arm_compute_graph_so = build_library('arm_compute_graph', arm_compute_graph_env, graph_files, static=False, libs = [ "arm_compute" ])
    # The shared graph library links against "arm_compute", so build that first
    Depends(arm_compute_graph_so, arm_compute_so)
    Export('arm_compute_graph_so')

# The alias only lists the shared library when it was built. Previously a
# bare-metal build without standalone referenced the undefined arm_compute_so.
alias_targets = [arm_compute_a]
if build_shared_libs:
    alias_targets.append(arm_compute_so)
alias = arm_compute_env.Alias("arm_compute", alias_targets)

Default(alias)

# The embed files must exist before the libraries are built
Depends([alias], generate_embed)