307 lines
		
	
	
		
			12 KiB
		
	
	
	
		
			Python
		
	
	
	
			
		
		
	
	
			307 lines
		
	
	
		
			12 KiB
		
	
	
	
		
			Python
		
	
	
	
# Copyright (c) 2016, 2017 Arm Limited.
 | 
						|
#
 | 
						|
# SPDX-License-Identifier: MIT
 | 
						|
#
 | 
						|
# Permission is hereby granted, free of charge, to any person obtaining a copy
 | 
						|
# of this software and associated documentation files (the "Software"), to
 | 
						|
# deal in the Software without restriction, including without limitation the
 | 
						|
# rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
 | 
						|
# sell copies of the Software, and to permit persons to whom the Software is
 | 
						|
# furnished to do so, subject to the following conditions:
 | 
						|
#
 | 
						|
# The above copyright notice and this permission notice shall be included in all
 | 
						|
# copies or substantial portions of the Software.
 | 
						|
#
 | 
						|
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 | 
						|
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 | 
						|
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 | 
						|
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 | 
						|
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 | 
						|
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 | 
						|
# SOFTWARE.
 | 
						|
import collections
 | 
						|
import os.path
 | 
						|
import re
 | 
						|
import subprocess
 | 
						|
 | 
						|
VERSION = "v20.11"
 | 
						|
LIBRARY_VERSION_MAJOR = 21
 | 
						|
LIBRARY_VERSION_MINOR =  0
 | 
						|
LIBRARY_VERSION_PATCH =  0
 | 
						|
SONAME_VERSION = str(LIBRARY_VERSION_MAJOR) + "." + str(LIBRARY_VERSION_MINOR) + "." + str(LIBRARY_VERSION_PATCH)
 | 
						|
 | 
						|
Import('env')
 | 
						|
Import('vars')
 | 
						|
Import('install_lib')
 | 
						|
 | 
						|
def build_bootcode_objs(sources):
 | 
						|
 | 
						|
    arm_compute_env.Append(ASFLAGS = "-I bootcode/")
 | 
						|
    obj = arm_compute_env.Object(sources)
 | 
						|
    obj = install_lib(obj)
 | 
						|
    Default(obj)
 | 
						|
    return obj
 | 
						|
 | 
						|
def build_library(name, sources, static=False, libs=[]):
 | 
						|
    if static:
 | 
						|
        obj = arm_compute_env.StaticLibrary(name, source=sources, LIBS = arm_compute_env["LIBS"] + libs)
 | 
						|
    else:
 | 
						|
        if env['set_soname']:
 | 
						|
            obj = arm_compute_env.SharedLibrary(name, source=sources, SHLIBVERSION = SONAME_VERSION, LIBS = arm_compute_env["LIBS"] + libs)
 | 
						|
        else:
 | 
						|
            obj = arm_compute_env.SharedLibrary(name, source=sources, LIBS = arm_compute_env["LIBS"] + libs)
 | 
						|
 | 
						|
    obj = install_lib(obj)
 | 
						|
    Default(obj)
 | 
						|
    return obj
 | 
						|
 | 
						|
def resolve_includes(target, source, env):
 | 
						|
    # File collection
 | 
						|
    FileEntry = collections.namedtuple('FileEntry', 'target_name file_contents')
 | 
						|
 | 
						|
    # Include pattern
 | 
						|
    pattern = re.compile("#include \"(.*)\"")
 | 
						|
 | 
						|
    # Get file contents
 | 
						|
    files = []
 | 
						|
    for i in range(len(source)):
 | 
						|
        src = source[i]
 | 
						|
        dst = target[i]
 | 
						|
        contents = src.get_contents().decode('utf-8').splitlines()
 | 
						|
        entry = FileEntry(target_name=dst, file_contents=contents)
 | 
						|
        files.append((os.path.basename(src.get_path()),entry))
 | 
						|
 | 
						|
    # Create dictionary of tupled list
 | 
						|
    files_dict = dict(files)
 | 
						|
 | 
						|
    # Check for includes (can only be files in the same folder)
 | 
						|
    final_files = []
 | 
						|
    for file in files:
 | 
						|
        done = False
 | 
						|
        tmp_file = file[1].file_contents
 | 
						|
        while not done:
 | 
						|
            file_count = 0
 | 
						|
            updated_file = []
 | 
						|
            for line in tmp_file:
 | 
						|
                found = pattern.search(line)
 | 
						|
                if found:
 | 
						|
                    include_file = found.group(1)
 | 
						|
                    data = files_dict[include_file].file_contents
 | 
						|
                    updated_file.extend(data)
 | 
						|
                else:
 | 
						|
                    updated_file.append(line)
 | 
						|
                    file_count += 1
 | 
						|
 | 
						|
            # Check if all include are replaced.
 | 
						|
            if file_count == len(tmp_file):
 | 
						|
                done = True
 | 
						|
 | 
						|
            # Update temp file
 | 
						|
            tmp_file = updated_file
 | 
						|
 | 
						|
        # Append and prepend string literal identifiers and add expanded file to final list
 | 
						|
        tmp_file.insert(0, "R\"(\n")
 | 
						|
        tmp_file.append("\n)\"")
 | 
						|
        entry = FileEntry(target_name=file[1].target_name, file_contents=tmp_file)
 | 
						|
        final_files.append((file[0], entry))
 | 
						|
 | 
						|
    # Write output files
 | 
						|
    for file in final_files:
 | 
						|
        with open(file[1].target_name.get_path(), 'w+') as out_file:
 | 
						|
            out_file.write( "\n".join( file[1].file_contents ))
 | 
						|
 | 
						|
def create_version_file(target, source, env):
 | 
						|
# Generate string with build options library version to embed in the library:
 | 
						|
    try:
 | 
						|
        git_hash = subprocess.check_output(["git", "rev-parse", "HEAD"])
 | 
						|
    except (OSError, subprocess.CalledProcessError):
 | 
						|
        git_hash="unknown"
 | 
						|
 | 
						|
    build_info = "\"arm_compute_version=%s Build options: %s Git hash=%s\"" % (VERSION, vars.args, git_hash.strip())
 | 
						|
    with open(target[0].get_path(), "w") as fd:
 | 
						|
        fd.write(build_info)
 | 
						|
 | 
						|
arm_compute_env = env.Clone()
 | 
						|
version_file = arm_compute_env.Command("src/core/arm_compute_version.embed", "", action=create_version_file)
 | 
						|
arm_compute_env.AlwaysBuild(version_file)
 | 
						|
 | 
						|
# Generate embed files
 | 
						|
generate_embed = [ version_file ]
 | 
						|
if env['opencl'] and env['embed_kernels']:
 | 
						|
    cl_files = Glob('src/core/CL/cl_kernels/*.cl')
 | 
						|
    cl_files += Glob('src/core/CL/cl_kernels/*.h')
 | 
						|
 | 
						|
    embed_files = [ f.get_path()+"embed" for f in cl_files ]
 | 
						|
    arm_compute_env.Append(CPPPATH =[Dir("./src/core/CL/").path] )
 | 
						|
 | 
						|
    generate_embed.append(arm_compute_env.Command(embed_files, cl_files, action=resolve_includes))
 | 
						|
 | 
						|
if env['gles_compute'] and env['embed_kernels']:
 | 
						|
    cs_files = Glob('src/core/GLES_COMPUTE/cs_shaders/*.cs')
 | 
						|
    cs_files += Glob('src/core/GLES_COMPUTE/cs_shaders/*.h')
 | 
						|
 | 
						|
    embed_files = [ f.get_path()+"embed" for f in cs_files ]
 | 
						|
    arm_compute_env.Append(CPPPATH =[Dir("./src/core/GLES_COMPUTE/").path] )
 | 
						|
 | 
						|
    generate_embed.append(arm_compute_env.Command(embed_files, cs_files, action=resolve_includes))
 | 
						|
 | 
						|
Default(generate_embed)
 | 
						|
if env["build"] == "embed_only":
 | 
						|
    Return()
 | 
						|
 | 
						|
# Append version defines for semantic versioning
 | 
						|
arm_compute_env.Append(CPPDEFINES = [('ARM_COMPUTE_VERSION_MAJOR', LIBRARY_VERSION_MAJOR),
 | 
						|
                                     ('ARM_COMPUTE_VERSION_MINOR', LIBRARY_VERSION_MINOR),
 | 
						|
                                     ('ARM_COMPUTE_VERSION_PATCH', LIBRARY_VERSION_PATCH)])
 | 
						|
 | 
						|
 | 
						|
# Don't allow undefined references in the libraries:
 | 
						|
arm_compute_env.Append(LINKFLAGS=['-Wl,--no-undefined'])
 | 
						|
arm_compute_env.Append(CPPPATH =[Dir("./src/core/").path] )
 | 
						|
 | 
						|
arm_compute_env.Append(LIBS = ['dl'])
 | 
						|
 | 
						|
core_files = Glob('src/core/*.cpp')
 | 
						|
core_files += Glob('src/core/CPP/*.cpp')
 | 
						|
core_files += Glob('src/core/CPP/kernels/*.cpp')
 | 
						|
core_files += Glob('src/core/helpers/*.cpp')
 | 
						|
core_files += Glob('src/core/utils/*.cpp')
 | 
						|
core_files += Glob('src/core/utils/helpers/*.cpp')
 | 
						|
core_files += Glob('src/core/utils/io/*.cpp')
 | 
						|
core_files += Glob('src/core/utils/quantization/*.cpp')
 | 
						|
core_files += Glob('src/core/utils/misc/*.cpp')
 | 
						|
if env["logging"]:
 | 
						|
    core_files += Glob('src/core/utils/logging/*.cpp')
 | 
						|
 | 
						|
runtime_files = Glob('src/runtime/*.cpp')
 | 
						|
runtime_files += Glob('src/runtime/CPP/ICPPSimpleFunction.cpp')
 | 
						|
runtime_files += Glob('src/runtime/CPP/functions/*.cpp')
 | 
						|
 | 
						|
# CLHarrisCorners uses the Scheduler to run CPP kernels
 | 
						|
runtime_files += Glob('src/runtime/CPP/SingleThreadScheduler.cpp')
 | 
						|
 | 
						|
graph_files = Glob('src/graph/*.cpp')
 | 
						|
graph_files += Glob('src/graph/*/*.cpp')
 | 
						|
 | 
						|
if env['cppthreads']:
 | 
						|
     runtime_files += Glob('src/runtime/CPP/CPPScheduler.cpp')
 | 
						|
 | 
						|
if env['openmp']:
 | 
						|
     runtime_files += Glob('src/runtime/OMP/OMPScheduler.cpp')
 | 
						|
 | 
						|
if env['opencl']:
 | 
						|
    core_files += Glob('src/core/CL/*.cpp')
 | 
						|
    core_files += Glob('src/core/CL/kernels/*.cpp')
 | 
						|
    core_files += Glob('src/core/CL/gemm/*.cpp')
 | 
						|
    core_files += Glob('src/core/CL/gemm/native/*.cpp')
 | 
						|
    core_files += Glob('src/core/CL/gemm/reshaped/*.cpp')
 | 
						|
    core_files += Glob('src/core/CL/gemm/reshaped_only_rhs/*.cpp')
 | 
						|
 | 
						|
    runtime_files += Glob('src/runtime/CL/*.cpp')
 | 
						|
    runtime_files += Glob('src/runtime/CL/functions/*.cpp')
 | 
						|
    runtime_files += Glob('src/runtime/CL/gemm/*.cpp')
 | 
						|
    runtime_files += Glob('src/runtime/CL/tuners/*.cpp')
 | 
						|
 | 
						|
    graph_files += Glob('src/graph/backends/CL/*.cpp')
 | 
						|
 | 
						|
 | 
						|
if env['neon']:
 | 
						|
    core_files += Glob('src/core/NEON/*.cpp')
 | 
						|
    core_files += Glob('src/core/NEON/kernels/*.cpp')
 | 
						|
    core_files += Glob('src/core/NEON/kernels/assembly/*.cpp')
 | 
						|
 | 
						|
    core_files += Glob('src/core/NEON/kernels/arm_gemm/*.cpp')
 | 
						|
 | 
						|
    # build winograd/depthwise sources for either v7a / v8a
 | 
						|
    core_files += Glob('src/core/NEON/kernels/convolution/*/*.cpp')
 | 
						|
    core_files += Glob('src/core/NEON/kernels/convolution/winograd/*/*.cpp')
 | 
						|
    arm_compute_env.Append(CPPPATH = ["src/core/NEON/kernels/convolution/common/",
 | 
						|
                                      "src/core/NEON/kernels/convolution/winograd/",
 | 
						|
                                      "src/core/NEON/kernels/convolution/depthwise/",
 | 
						|
                                      "src/core/NEON/kernels/assembly/",
 | 
						|
                                      "arm_compute/core/NEON/kernels/assembly/"])
 | 
						|
 | 
						|
    graph_files += Glob('src/graph/backends/NEON/*.cpp')
 | 
						|
 | 
						|
    if env['estate'] == '32':
 | 
						|
        core_files += Glob('src/core/NEON/kernels/arm_gemm/kernels/a32_*/*.cpp')
 | 
						|
 | 
						|
    if env['estate'] == '64':
 | 
						|
        core_files += Glob('src/core/NEON/kernels/arm_gemm/kernels/a64_*/*.cpp')
 | 
						|
        if "sve" in env['arch']:
 | 
						|
             core_files += Glob('src/core/NEON/kernels/arm_gemm/kernels/sve_*/*.cpp')
 | 
						|
 | 
						|
    if any(i in env['data_type_support'] for i in ['all', 'fp16']):
 | 
						|
        core_files += Glob('src/core/NEON/kernels/*/impl/fp16_*.cpp')
 | 
						|
    if any(i in env['data_type_support'] for i in ['all', 'fp32']):
 | 
						|
        core_files += Glob('src/core/NEON/kernels/*/impl/fp32_*.cpp')
 | 
						|
    if any(i in env['data_type_support'] for i in ['all', 'qasymm8']):
 | 
						|
        core_files += Glob('src/core/NEON/kernels/*/impl/qasymm8_neon*.cpp')
 | 
						|
    if any(i in env['data_type_support'] for i in ['all', 'qasymm8_signed']):
 | 
						|
        core_files += Glob('src/core/NEON/kernels/*/impl/qasymm8_signed_*.cpp')
 | 
						|
    if any(i in env['data_type_support'] for i in ['all', 'qsymm16']):
 | 
						|
        core_files += Glob('src/core/NEON/kernels/*/impl/qsymm16_*.cpp')
 | 
						|
 | 
						|
    runtime_files += Glob('src/runtime/NEON/*.cpp')
 | 
						|
    runtime_files += Glob('src/runtime/NEON/functions/*.cpp')
 | 
						|
    runtime_files += Glob('src/runtime/NEON/functions/assembly/*.cpp')
 | 
						|
 | 
						|
if env['gles_compute']:
 | 
						|
    if env['os'] != 'android':
 | 
						|
        arm_compute_env.Append(CPPPATH = ["#opengles-3.1/include", "#opengles-3.1/mali_include"])
 | 
						|
 | 
						|
    core_files += Glob('src/core/GLES_COMPUTE/*.cpp')
 | 
						|
    core_files += Glob('src/core/GLES_COMPUTE/kernels/*.cpp')
 | 
						|
 | 
						|
    runtime_files += Glob('src/runtime/GLES_COMPUTE/*.cpp')
 | 
						|
    runtime_files += Glob('src/runtime/GLES_COMPUTE/functions/*.cpp')
 | 
						|
 | 
						|
    graph_files += Glob('src/graph/backends/GLES/*.cpp')
 | 
						|
if env['tracing']:
 | 
						|
    arm_compute_env.Append(CPPDEFINES = ['ARM_COMPUTE_TRACING_ENABLED'])
 | 
						|
else:
 | 
						|
    # Remove TracePoint files if tracing is disabled:
 | 
						|
    core_files = [ f for f in core_files if not "TracePoint" in str(f)]
 | 
						|
    runtime_files = [ f for f in runtime_files if not "TracePoint" in str(f)]
 | 
						|
 | 
						|
bootcode_o = []
 | 
						|
if env['os'] == 'bare_metal':
 | 
						|
    bootcode_files = Glob('bootcode/*.s')
 | 
						|
    bootcode_o = build_bootcode_objs(bootcode_files)
 | 
						|
Export('bootcode_o')
 | 
						|
 | 
						|
arm_compute_core_a = build_library('arm_compute_core-static', core_files, static=True)
 | 
						|
Export('arm_compute_core_a')
 | 
						|
 | 
						|
if env['os'] != 'bare_metal' and not env['standalone']:
 | 
						|
    arm_compute_core_so = build_library('arm_compute_core', core_files, static=False)
 | 
						|
    Export('arm_compute_core_so')
 | 
						|
 | 
						|
arm_compute_a = build_library('arm_compute-static', runtime_files, static=True, libs = [ arm_compute_core_a ])
 | 
						|
Export('arm_compute_a')
 | 
						|
 | 
						|
if env['os'] != 'bare_metal' and not env['standalone']:
 | 
						|
    arm_compute_so = build_library('arm_compute', runtime_files, static=False, libs = [ "arm_compute_core" ])
 | 
						|
    Depends(arm_compute_so, arm_compute_core_so)
 | 
						|
    Export('arm_compute_so')
 | 
						|
 | 
						|
arm_compute_graph_a = build_library('arm_compute_graph-static', graph_files, static=True, libs = [ arm_compute_a])
 | 
						|
Export('arm_compute_graph_a')
 | 
						|
 | 
						|
if env['os'] != 'bare_metal' and not env['standalone']:
 | 
						|
    arm_compute_graph_so = build_library('arm_compute_graph', graph_files, static=False, libs = [ "arm_compute" , "arm_compute_core"])
 | 
						|
    Depends(arm_compute_graph_so, arm_compute_so)
 | 
						|
    Export('arm_compute_graph_so')
 | 
						|
 | 
						|
if env['standalone']:
 | 
						|
    alias = arm_compute_env.Alias("arm_compute", [arm_compute_a])
 | 
						|
else:
 | 
						|
    alias = arm_compute_env.Alias("arm_compute", [arm_compute_a, arm_compute_so])
 | 
						|
 | 
						|
Default(alias)
 | 
						|
 | 
						|
if env['standalone']:
 | 
						|
    Depends([alias,arm_compute_core_a], generate_embed)
 | 
						|
else:
 | 
						|
    Depends([alias,arm_compute_core_so, arm_compute_core_a], generate_embed)
 |