214 lines
7.3 KiB
Python
214 lines
7.3 KiB
Python
#!/usr/bin/env python3
|
|
#
|
|
# Copyright (c) 2017 Intel Corporation
|
|
#
|
|
# SPDX-License-Identifier: Apache-2.0
|
|
|
|
"""
|
|
Script to scan Zephyr include directories and emit system call and subsystem metadata
|
|
|
|
System calls require a great deal of boilerplate code in order to implement
|
|
completely. This script is the first step in the build system's process of
|
|
auto-generating this code by doing a text scan of directories containing
|
|
C or header files, and building up a database of system calls and their
|
|
function call prototypes. This information is emitted to a generated
|
|
JSON file for further processing.
|
|
|
|
This script also scans for struct definitions such as __subsystem and
|
|
__net_socket, emitting a JSON dictionary mapping tags to all the struct
|
|
declarations found that were tagged with them.
|
|
|
|
If the output JSON file already exists, its contents are checked against
|
|
what information this script would have outputted; if the result is that the
|
|
file would be unchanged, it is not modified to prevent unnecessary
|
|
incremental builds.
|
|
"""
|
|
|
|
import sys
|
|
import re
|
|
import argparse
|
|
import os
|
|
import json
|
|
from pathlib import PurePath
|
|
|
|
regex_flags = re.MULTILINE | re.VERBOSE
|
|
|
|
syscall_regex = re.compile(r'''
|
|
(?:__syscall|__syscall_always_inline)\s+ # __syscall attribute, must be first
|
|
([^(]+) # type and name of system call (split later)
|
|
[(] # Function opening parenthesis
|
|
([^)]*) # Arg list (split later)
|
|
[)] # Closing parenthesis
|
|
''', regex_flags)
|
|
|
|
struct_tags = ["__subsystem", "__net_socket"]
|
|
|
|
tagged_struct_decl_template = r'''
|
|
%s\s+ # tag, must be first
|
|
struct\s+ # struct keyword is next
|
|
([^{]+) # name of subsystem
|
|
[{] # Open curly bracket
|
|
'''
|
|
|
|
def tagged_struct_update(target_list, tag, contents):
|
|
regex = re.compile(tagged_struct_decl_template % tag, regex_flags)
|
|
items = [mo.groups()[0].strip() for mo in regex.finditer(contents)]
|
|
target_list.extend(items)
|
|
|
|
|
|
def analyze_headers(include_dir, scan_dir, file_list):
|
|
syscall_ret = []
|
|
tagged_ret = {}
|
|
|
|
for tag in struct_tags:
|
|
tagged_ret[tag] = []
|
|
|
|
syscall_files = dict()
|
|
|
|
# Get the list of header files which contains syscalls to be emitted.
|
|
# If file_list does not exist, we emit all syscalls.
|
|
if file_list:
|
|
with open(file_list, "r", encoding="utf-8") as fp:
|
|
contents = fp.read()
|
|
|
|
for one_file in contents.split(";"):
|
|
if os.path.isfile(one_file):
|
|
syscall_files[one_file] = {"emit": True}
|
|
else:
|
|
sys.stderr.write(f"{one_file} does not exists!\n")
|
|
sys.exit(1)
|
|
|
|
multiple_directories = set()
|
|
if include_dir:
|
|
multiple_directories |= set(include_dir)
|
|
if scan_dir:
|
|
multiple_directories |= set(scan_dir)
|
|
|
|
# Look for source files under various directories.
|
|
# Due to "syscalls/*.h" being included unconditionally in various
|
|
# other header files. We must generate the associated syscall
|
|
# header files (e.g. for function stubs).
|
|
for base_path in multiple_directories:
|
|
for root, dirs, files in os.walk(base_path, topdown=True):
|
|
dirs.sort()
|
|
files.sort()
|
|
for fn in files:
|
|
|
|
# toolchain/common.h has the definitions of these tags which we
|
|
# don't want to trip over
|
|
path = os.path.join(root, fn)
|
|
if (not (path.endswith(".h") or path.endswith(".c")) or
|
|
path.endswith(os.path.join(os.sep, 'toolchain',
|
|
'common.h'))):
|
|
continue
|
|
|
|
path = PurePath(os.path.normpath(path)).as_posix()
|
|
|
|
if path not in syscall_files:
|
|
if include_dir and base_path in include_dir:
|
|
syscall_files[path] = {"emit" : True}
|
|
else:
|
|
syscall_files[path] = {"emit" : False}
|
|
|
|
# Parse files to extract syscall functions
|
|
for one_file in syscall_files:
|
|
with open(one_file, "r", encoding="utf-8") as fp:
|
|
try:
|
|
contents = fp.read()
|
|
except Exception:
|
|
sys.stderr.write("Error decoding %s\n" % path)
|
|
raise
|
|
|
|
fn = os.path.basename(one_file)
|
|
|
|
try:
|
|
to_emit = syscall_files[one_file]["emit"] | args.emit_all_syscalls
|
|
|
|
syscall_result = [(mo.groups(), fn, to_emit)
|
|
for mo in syscall_regex.finditer(contents)]
|
|
for tag in struct_tags:
|
|
tagged_struct_update(tagged_ret[tag], tag, contents)
|
|
except Exception:
|
|
sys.stderr.write("While parsing %s\n" % fn)
|
|
raise
|
|
|
|
syscall_ret.extend(syscall_result)
|
|
|
|
return syscall_ret, tagged_ret
|
|
|
|
|
|
def update_file_if_changed(path, new):
|
|
if os.path.exists(path):
|
|
with open(path, 'r') as fp:
|
|
old = fp.read()
|
|
|
|
if new != old:
|
|
with open(path, 'w') as fp:
|
|
fp.write(new)
|
|
else:
|
|
with open(path, 'w') as fp:
|
|
fp.write(new)
|
|
|
|
|
|
def parse_args():
|
|
global args
|
|
parser = argparse.ArgumentParser(
|
|
description=__doc__,
|
|
formatter_class=argparse.RawDescriptionHelpFormatter, allow_abbrev=False)
|
|
|
|
parser.add_argument(
|
|
"-i", "--include", required=False, action="append",
|
|
help="Include directories recursively scanned for .h files "
|
|
"containing syscalls that must be present in final binary. "
|
|
"Can be specified multiple times: -i topdir1 -i topdir2 ...")
|
|
parser.add_argument(
|
|
"--scan", required=False, action="append",
|
|
help="Scan directories recursively for .h files containing "
|
|
"syscalls that need stubs generated but may not need to "
|
|
"be present in final binary. Can be specified multiple "
|
|
"times.")
|
|
parser.add_argument(
|
|
"-j", "--json-file", required=True,
|
|
help="Write system call prototype information as json to file")
|
|
parser.add_argument(
|
|
"-t", "--tag-struct-file", required=True,
|
|
help="Write tagged struct name information as json to file")
|
|
parser.add_argument(
|
|
"--file-list", required=False,
|
|
help="Text file containing semi-colon separated list of "
|
|
"header file where only syscalls in these files "
|
|
"are emitted.")
|
|
parser.add_argument(
|
|
"--emit-all-syscalls", required=False, action="store_true",
|
|
help="Emit all potential syscalls in the tree")
|
|
|
|
args = parser.parse_args()
|
|
|
|
|
|
def main():
|
|
parse_args()
|
|
|
|
syscalls, tagged = analyze_headers(args.include, args.scan,
|
|
args.file_list)
|
|
|
|
# Only write json files if they don't exist or have changes since
|
|
# they will force an incremental rebuild.
|
|
|
|
syscalls_in_json = json.dumps(
|
|
syscalls,
|
|
indent=4,
|
|
sort_keys=True
|
|
)
|
|
update_file_if_changed(args.json_file, syscalls_in_json)
|
|
|
|
tagged_struct_in_json = json.dumps(
|
|
tagged,
|
|
indent=4,
|
|
sort_keys=True
|
|
)
|
|
update_file_if_changed(args.tag_struct_file, tagged_struct_in_json)
|
|
|
|
|
|
if __name__ == "__main__":
|
|
main()
|