|  | #!/usr/bin/env python3 | 
|  | # | 
|  | # Copyright (c) 2017 Intel Corporation | 
|  | # | 
|  | # SPDX-License-Identifier: Apache-2.0 | 
|  |  | 
|  | """ | 
|  | Script to scan Zephyr include directories and emit system call and subsystem metadata | 
|  |  | 
|  | System calls require a great deal of boilerplate code in order to implement | 
|  | completely. This script is the first step in the build system's process of | 
|  | auto-generating this code by doing a text scan of directories containing | 
|  | C or header files, and building up a database of system calls and their | 
|  | function call prototypes. This information is emitted to a generated | 
|  | JSON file for further processing. | 
|  |  | 
|  | This script also scans for struct definitions such as __subsystem and | 
|  | __net_socket, emitting a JSON dictionary mapping tags to all the struct | 
|  | declarations found that were tagged with them. | 
|  |  | 
|  | If the output JSON file already exists, its contents are checked against | 
|  | what information this script would have outputted; if the result is that the | 
|  | file would be unchanged, it is not modified to prevent unnecessary | 
|  | incremental builds. | 
|  | """ | 
|  |  | 
|  | import sys | 
|  | import re | 
|  | import argparse | 
|  | import os | 
|  | import json | 
|  | from pathlib import PurePath | 
|  |  | 
|  | regex_flags = re.MULTILINE | re.VERBOSE | 
|  |  | 
|  | syscall_regex = re.compile(r''' | 
|  | (?:__syscall|__syscall_always_inline)\s+   # __syscall attribute, must be first | 
|  | ([^(]+)                                    # type and name of system call (split later) | 
|  | [(]                                        # Function opening parenthesis | 
|  | ([^)]*)                                    # Arg list (split later) | 
|  | [)]                                        # Closing parenthesis | 
|  | ''', regex_flags) | 
|  |  | 
|  | struct_tags = ["__subsystem", "__net_socket"] | 
|  |  | 
|  | tagged_struct_decl_template = r''' | 
|  | %s\s+                           # tag, must be first | 
|  | struct\s+                       # struct keyword is next | 
|  | ([^{]+)                         # name of subsystem | 
|  | [{]                             # Open curly bracket | 
|  | ''' | 
|  |  | 
|  | def tagged_struct_update(target_list, tag, contents): | 
|  | regex = re.compile(tagged_struct_decl_template % tag, regex_flags) | 
|  | items = [mo.groups()[0].strip() for mo in regex.finditer(contents)] | 
|  | target_list.extend(items) | 
|  |  | 
|  |  | 
|  | def analyze_headers(include_dir, scan_dir, file_list): | 
|  | syscall_ret = [] | 
|  | tagged_ret = {} | 
|  |  | 
|  | for tag in struct_tags: | 
|  | tagged_ret[tag] = [] | 
|  |  | 
|  | syscall_files = dict() | 
|  |  | 
|  | # Get the list of header files which contains syscalls to be emitted. | 
|  | # If file_list does not exist, we emit all syscalls. | 
|  | if file_list: | 
|  | with open(file_list, "r", encoding="utf-8") as fp: | 
|  | contents = fp.read() | 
|  |  | 
|  | for one_file in contents.split(";"): | 
|  | if os.path.isfile(one_file): | 
|  | syscall_files[one_file] = {"emit": True} | 
|  | else: | 
|  | sys.stderr.write(f"{one_file} does not exists!\n") | 
|  | sys.exit(1) | 
|  |  | 
|  | multiple_directories = set() | 
|  | if include_dir: | 
|  | multiple_directories |= set(include_dir) | 
|  | if scan_dir: | 
|  | multiple_directories |= set(scan_dir) | 
|  |  | 
|  | # Convert to a list to keep the output deterministic | 
|  | multiple_directories = sorted(multiple_directories) | 
|  |  | 
|  | # Look for source files under various directories. | 
|  | # Due to "syscalls/*.h" being included unconditionally in various | 
|  | # other header files. We must generate the associated syscall | 
|  | # header files (e.g. for function stubs). | 
|  | for base_path in multiple_directories: | 
|  | for root, dirs, files in os.walk(base_path, topdown=True): | 
|  | dirs.sort() | 
|  | files.sort() | 
|  | for fn in files: | 
|  |  | 
|  | # toolchain/common.h has the definitions of these tags which we | 
|  | # don't want to trip over | 
|  | path = os.path.join(root, fn) | 
|  | if (not (path.endswith(".h") or path.endswith(".c")) or | 
|  | path.endswith(os.path.join(os.sep, 'toolchain', | 
|  | 'common.h'))): | 
|  | continue | 
|  |  | 
|  | path = PurePath(os.path.normpath(path)).as_posix() | 
|  |  | 
|  | if path not in syscall_files: | 
|  | if include_dir and base_path in include_dir: | 
|  | syscall_files[path] = {"emit" : True} | 
|  | else: | 
|  | syscall_files[path] = {"emit" : False} | 
|  |  | 
|  | # Parse files to extract syscall functions | 
|  | for one_file in syscall_files: | 
|  | with open(one_file, "r", encoding="utf-8") as fp: | 
|  | try: | 
|  | contents = fp.read() | 
|  | except Exception: | 
|  | sys.stderr.write("Error decoding %s\n" % path) | 
|  | raise | 
|  |  | 
|  | fn = os.path.basename(one_file) | 
|  |  | 
|  | try: | 
|  | to_emit = syscall_files[one_file]["emit"] | args.emit_all_syscalls | 
|  |  | 
|  | syscall_result = [(mo.groups(), fn, to_emit) | 
|  | for mo in syscall_regex.finditer(contents)] | 
|  | for tag in struct_tags: | 
|  | tagged_struct_update(tagged_ret[tag], tag, contents) | 
|  | except Exception: | 
|  | sys.stderr.write("While parsing %s\n" % fn) | 
|  | raise | 
|  |  | 
|  | syscall_ret.extend(syscall_result) | 
|  |  | 
|  | return syscall_ret, tagged_ret | 
|  |  | 
|  |  | 
|  | def update_file_if_changed(path, new): | 
|  | if os.path.exists(path): | 
|  | with open(path, 'r') as fp: | 
|  | old = fp.read() | 
|  |  | 
|  | if new != old: | 
|  | with open(path, 'w') as fp: | 
|  | fp.write(new) | 
|  | else: | 
|  | with open(path, 'w') as fp: | 
|  | fp.write(new) | 
|  |  | 
|  |  | 
|  | def parse_args(): | 
|  | global args | 
|  | parser = argparse.ArgumentParser( | 
|  | description=__doc__, | 
|  | formatter_class=argparse.RawDescriptionHelpFormatter, allow_abbrev=False) | 
|  |  | 
|  | parser.add_argument( | 
|  | "-i", "--include", required=False, action="append", | 
|  | help="Include directories recursively scanned for .h files " | 
|  | "containing syscalls that must be present in final binary. " | 
|  | "Can be specified multiple times: -i topdir1 -i topdir2 ...") | 
|  | parser.add_argument( | 
|  | "--scan", required=False, action="append", | 
|  | help="Scan directories recursively for .h files containing " | 
|  | "syscalls that need stubs generated but may not need to " | 
|  | "be present in final binary. Can be specified multiple " | 
|  | "times.") | 
|  | parser.add_argument( | 
|  | "-j", "--json-file", required=True, | 
|  | help="Write system call prototype information as json to file") | 
|  | parser.add_argument( | 
|  | "-t", "--tag-struct-file", required=True, | 
|  | help="Write tagged struct name information as json to file") | 
|  | parser.add_argument( | 
|  | "--file-list", required=False, | 
|  | help="Text file containing semi-colon separated list of " | 
|  | "header file where only syscalls in these files " | 
|  | "are emitted.") | 
|  | parser.add_argument( | 
|  | "--emit-all-syscalls", required=False, action="store_true", | 
|  | help="Emit all potential syscalls in the tree") | 
|  |  | 
|  | args = parser.parse_args() | 
|  |  | 
|  |  | 
|  | def main(): | 
|  | parse_args() | 
|  |  | 
|  | syscalls, tagged = analyze_headers(args.include, args.scan, | 
|  | args.file_list) | 
|  |  | 
|  | # Only write json files if they don't exist or have changes since | 
|  | # they will force an incremental rebuild. | 
|  |  | 
|  | syscalls_in_json = json.dumps( | 
|  | syscalls, | 
|  | indent=4, | 
|  | sort_keys=True | 
|  | ) | 
|  | update_file_if_changed(args.json_file, syscalls_in_json) | 
|  |  | 
|  | tagged_struct_in_json = json.dumps( | 
|  | tagged, | 
|  | indent=4, | 
|  | sort_keys=True | 
|  | ) | 
|  | update_file_if_changed(args.tag_struct_file, tagged_struct_in_json) | 
|  |  | 
|  |  | 
|  | if __name__ == "__main__": | 
|  | main() |