diff options
Diffstat (limited to 'build-aux/stack.c.gen')
-rwxr-xr-x | build-aux/stack.c.gen | 269 |
1 files changed, 5 insertions, 264 deletions
diff --git a/build-aux/stack.c.gen b/build-aux/stack.c.gen index 06612ac..713630a 100755 --- a/build-aux/stack.c.gen +++ b/build-aux/stack.c.gen @@ -1,273 +1,14 @@ #!/usr/bin/env python3 # build-aux/stack.c.gen - Analyze stack sizes for compiled objects # -# Copyright (C) 2024 Luke T. Shumaker <lukeshu@lukeshu.com> +# Copyright (C) 2024-2025 Luke T. Shumaker <lukeshu@lukeshu.com> # SPDX-License-Identifier: AGPL-3.0-or-later -import re +import os.path import sys -import typing - -################################################################################ -# -# Parse the "VCG" language -# -# https://www.rw.cdl.uni-saarland.de/people/sander/private/html/gsvcg1.html -# -# The formal syntax is found at -# ftp://ftp.cs.uni-sb.de/pub/graphics/vcg/vcg.tgz `doc/grammar.txt`. - - -class VCGElem: - typ: str - lineno: int - attrs: dict[str, str] - - -def parse_vcg(reader: typing.TextIO) -> typing.Iterator[VCGElem]: - re_beg = re.compile(r"(edge|node):\s*\{\s*") - _re_tok = r"[a-zA-Z_][a-zA-Z0-9_]*" - _re_str = r'"(?:[^\"]|\\.)*"' - re_attr = re.compile( - "(" + _re_tok + r")\s*:\s*(" + _re_tok + "|" + _re_str + r")\s*" - ) - re_end = re.compile(r"\}\s*$") - re_skip = re.compile(r"(graph:\s*\{\s*title\s*:\s*" + _re_str + r"\s*|\})\s*") - re_esc = re.compile(r"\\.") - - for lineno, line in enumerate(reader): - pos = 0 - - def _raise(msg: str) -> typing.NoReturn: - nonlocal lineno - nonlocal line - nonlocal pos - e = SyntaxError(msg) - e.lineno = lineno - e.offset = pos - e.text = line - raise e - - if re_skip.fullmatch(line): - continue - - elem = VCGElem() - elem.lineno = lineno - - m = re_beg.match(line, pos=pos) - if not m: - _raise("does not look like a VCG line") - elem.typ = m.group(1) - pos = m.end() - - elem.attrs = {} - while True: - if re_end.match(line, pos=pos): - break - m = re_attr.match(line, pos=pos) - if not m: - _raise("unexpected character") - k = m.group(1) - v = m.group(2) - if k in elem.attrs: - _raise(f"duplicate key: {repr(k)}") - if v.startswith('"'): - - def unesc(esc: re.Match[str]) -> str: - match esc.group(0)[1:]: - case "n": - return "\n" - case '"': - return '"' - case "\\": - return "\\" - case _: - _raise(f"invalid escape code {repr(esc.group(0))}") - - v = re_esc.sub(unesc, v[1:-1]) - elem.attrs[k] = v - pos = m.end() - - yield elem - - -################################################################################ -# Main application - - -class Node: - # from .title (`static` and `__weak` functions are prefixed with - # the compilation unit .c file. For static functions that's fine, - # but we'll have to handle it specially for __weak.). - funcname: str - # .label is "{funcname}\n{location}\n{nstatic} bytes (static}\n{ndynamic} dynamic objects" - location: str - nstatic: int - ndynamic: int - - # edges with .sourcename set to this node - calls: set[str] - - -re_location = re.compile(r"(?P<filename>.+):(?P<row>[0-9]+):(?P<col>[0-9]+)") - - -def read_source(location: str) -> str: - m = re_location.fullmatch(location) - if not m: - raise ValueError(f"unexpected label value {repr(location)}") - filename = m.group("filename") - row = int(m.group("row")) - 1 - col = int(m.group("col")) - 1 - with open(m.group("filename"), "r") as fh: - return fh.readlines()[row][col:].rstrip() - - -def main(ci_fnames: list[str]) -> None: - re_node_label = re.compile( - r"(?P<funcname>[^\n]+)\n" - + r"(?P<location>[^\n]+:[0-9]+:[0-9]+)\n" - + r"(?P<nstatic>[0-9]+) bytes \(static\)\n" - + r"(?P<ndynamic>[0-9]+) dynamic objects", - flags=re.MULTILINE, - ) - re_call_vcall = re.compile(r"VCALL\((?P<obj>[^,]+), (?P<meth>[^,)]+)[,)].*") - re_call_other = re.compile(r"(?P<func>[^(]+)\(.*") - - graph: dict[str, Node] = dict() - qualified: dict[str, set[str]] = dict() - - def handle_elem(elem: VCGElem) -> None: - match elem.typ: - case "node": - node = Node() - node.calls = set() - skip = False - for k, v in elem.attrs.items(): - match k: - case "title": - node.funcname = v - case "label": - if elem.attrs.get("shape", "") != "ellipse": - m = re_node_label.fullmatch(v) - if not m: - raise ValueError( - f"unexpected label value {repr(v)}" - ) - node.location = m.group("location") - node.nstatic = int(m.group("nstatic")) - node.ndynamic = int(m.group("ndynamic")) - case "shape": - if v != "ellipse": - raise ValueError(f"unexpected shape value {repr(v)}") - skip = True - case _: - raise ValueError(f"unknown edge key {repr(k)}") - if not skip: - if node.funcname in graph: - raise ValueError(f"duplicate node {repr(node.funcname)}") - graph[node.funcname] = node - if ":" in node.funcname: - _, shortname = node.funcname.rsplit(":", 1) - if shortname not in qualified: - qualified[shortname] = set() - qualified[shortname].add(node.funcname) - case "edge": - caller: str | None = None - callee: str | None = None - for k, v in elem.attrs.items(): - match k: - case "sourcename": - caller = v - case "targetname": - callee = v - case "label": - pass - case _: - raise ValueError(f"unknown edge key {repr(k)}") - if caller is None or callee is None: - raise ValueError(f"incomplete edge: {repr(elem.attrs)}") - if caller not in graph: - raise ValueError(f"unknown caller: {caller}") - if callee == "__indirect_call": - callstr = read_source(elem.attrs.get("label", "")) - if m := re_call_vcall.fullmatch(callstr): - callee += f":{m.group('obj')}->vtable->{m.group('meth')}" - elif m := re_call_other.fullmatch(callstr): - callee += f":{m.group('func')}" - else: - callee += f':{elem.attrs.get("label", "")}' - graph[caller].calls.add(callee) - case _: - raise ValueError(f"unknown elem type {repr(elem.typ)}") - - for ci_fname in ci_fnames: - with open(ci_fname, "r") as fh: - for elem in parse_vcg(fh): - handle_elem(elem) - - missing: set[str] = set() - cycles: set[str] = set() - - print("/*") - - dbg = False - - def nstatic(funcname: str, chain: list[str] = []) -> int: - nonlocal dbg - if funcname not in graph: - if f"__wrap_{funcname}" in graph: - # Handle `ld --wrap` functions - funcname = f"__wrap_{funcname}" - elif funcname in qualified and len(qualified[funcname]) == 1: - # Handle `__weak` functions - funcname = sorted(qualified[funcname])[0] - else: - missing.add(funcname) - return 0 - if funcname in chain: - if "__assert_msg_fail" in chain: - if funcname == "__wrap_printf": - return 0 - pass - else: - cycles.add(f"{chain[chain.index(funcname):] + [funcname]}") - return 9999999 - node = graph[funcname] - if dbg: - print(f"//dbg: {funcname}\t{node.nstatic}") - return node.nstatic + max( - [0, *[nstatic(call, chain + [funcname]) for call in node.calls]] - ) - - def thread_filter(name: str) -> bool: - return name.endswith("_cr") or name == "main" - - namelen = max(len(name) for name in graph if thread_filter(name)) - numlen = max(len(str(nstatic(name))) for name in graph if name.endswith("_cr")) - print(("=" * namelen) + " " + "=" * numlen) - - for funcname in graph: - if thread_filter(funcname): - # dbg = "dhcp" in funcname - print(f"{funcname.ljust(namelen)} {str(nstatic(funcname)).rjust(numlen)}") - - print(("=" * namelen) + " " + "=" * numlen) - - for funcname in sorted(missing): - print(f"warning: missing: {funcname}") - for cycle in sorted(cycles): - print(f"warning: cycle: {cycle}") - - print("*/") +sys.path.insert(0, os.path.normpath(os.path.join(__file__, ".."))) +import measurestack # pylint: disable=wrong-import-position if __name__ == "__main__": - re_suffix = re.compile(r"\.c\.o(bj)?$") - main( - [ - re_suffix.sub(".c.ci", fname) - for fname in sys.argv[1:] - if re_suffix.search(fname) - ] - ) + measurestack.main() |