#!/usr/bin/env python3 # # Script to find stack usage at the function level. Will detect recursion and # report as infinite stack usage. # # Example: # ./scripts/stack.py lfs.ci lfs_util.ci -Slimit # # Copyright (c) 2022, The littlefs authors. # SPDX-License-Identifier: BSD-3-Clause # import collections as co import csv import itertools as it import math as m import os import re # integer fields class Int(co.namedtuple('Int', 'x')): __slots__ = () def __new__(cls, x=0): if isinstance(x, Int): return x if isinstance(x, str): try: x = int(x, 0) except ValueError: # also accept +-∞ and +-inf if re.match('^\s*\+?\s*(?:∞|inf)\s*$', x): x = m.inf elif re.match('^\s*-\s*(?:∞|inf)\s*$', x): x = -m.inf else: raise assert isinstance(x, int) or m.isinf(x), x return super().__new__(cls, x) def __str__(self): if self.x == m.inf: return '∞' elif self.x == -m.inf: return '-∞' else: return str(self.x) def __int__(self): assert not m.isinf(self.x) return self.x def __float__(self): return float(self.x) none = '%7s' % '-' def table(self): return '%7s' % (self,) diff_none = '%7s' % '-' diff_table = table def diff_diff(self, other): new = self.x if self else 0 old = other.x if other else 0 diff = new - old if diff == +m.inf: return '%7s' % '+∞' elif diff == -m.inf: return '%7s' % '-∞' else: return '%+7d' % diff def ratio(self, other): new = self.x if self else 0 old = other.x if other else 0 if m.isinf(new) and m.isinf(old): return 0.0 elif m.isinf(new): return +m.inf elif m.isinf(old): return -m.inf elif not old and not new: return 0.0 elif not old: return 1.0 else: return (new-old) / old def __add__(self, other): return self.__class__(self.x + other.x) def __sub__(self, other): return self.__class__(self.x - other.x) def __mul__(self, other): return self.__class__(self.x * other.x) # size results class StackResult(co.namedtuple('StackResult', [ 'file', 'function', 'frame', 'limit', 'children'])): _by = ['file', 'function'] _fields = ['frame', 'limit'] _sort = ['limit', 'frame'] _types = {'frame': Int, 'limit': Int} __slots__ = () def __new__(cls, file='', function='', frame=0, limit=0, children=set()): return super().__new__(cls, file, function, Int(frame), Int(limit), children) def __add__(self, other): return StackResult(self.file, self.function, self.frame + other.frame, max(self.limit, other.limit), self.children | other.children) def openio(path, mode='r', buffering=-1): # allow '-' for stdin/stdout if path == '-': if mode == 'r': return os.fdopen(os.dup(sys.stdin.fileno()), mode, buffering) else: return os.fdopen(os.dup(sys.stdout.fileno()), mode, buffering) else: return open(path, mode, buffering) def collect(ci_paths, *, sources=None, everything=False, **args): # parse the vcg format k_pattern = re.compile('([a-z]+)\s*:', re.DOTALL) v_pattern = re.compile('(?:"(.*?)"|([a-z]+))', re.DOTALL) def parse_vcg(rest): def parse_vcg(rest): node = [] while True: rest = rest.lstrip() m_ = k_pattern.match(rest) if not m_: return (node, rest) k, rest = m_.group(1), rest[m_.end(0):] rest = rest.lstrip() if rest.startswith('{'): v, rest = parse_vcg(rest[1:]) assert rest[0] == '}', "unexpected %r" % rest[0:1] rest = rest[1:] node.append((k, v)) else: m_ = v_pattern.match(rest) assert m_, "unexpected %r" % rest[0:1] v, rest = m_.group(1) or m_.group(2), rest[m_.end(0):] node.append((k, v)) node, rest = parse_vcg(rest) assert rest == '', "unexpected %r" % rest[0:1] return node # collect into functions callgraph = co.defaultdict(lambda: (None, None, 0, set())) f_pattern = re.compile( r'([^\\]*)\\n([^:]*)[^\\]*\\n([0-9]+) bytes \((.*)\)') for path in ci_paths: with open(path) as f: vcg = parse_vcg(f.read()) for k, graph in vcg: if k != 'graph': continue for k, info in graph: if k == 'node': info = dict(info) m_ = f_pattern.match(info['label']) if m_: function, file, size, type = m_.groups() if (not args.get('quiet') and 'static' not in type and 'bounded' not in type): print("warning: " "found non-static stack for %s (%s, %s)" % ( function, type, size)) _, _, _, targets = callgraph[info['title']] callgraph[info['title']] = ( file, function, int(size), targets) elif k == 'edge': info = dict(info) _, _, _, targets = callgraph[info['sourcename']] targets.add(info['targetname']) else: continue callgraph_ = co.defaultdict(lambda: (None, None, 0, set())) for source, (s_file, s_function, frame, targets) in callgraph.items(): # discard internal functions if not everything and s_function.startswith('__'): continue # ignore filtered sources if sources is not None: if not any( os.path.abspath(s_file) == os.path.abspath(s) for s in sources): continue else: # default to only cwd if not everything and not os.path.commonpath([ os.getcwd(), os.path.abspath(s_file)]) == os.getcwd(): continue # smiplify path if os.path.commonpath([ os.getcwd(), os.path.abspath(s_file)]) == os.getcwd(): s_file = os.path.relpath(s_file) else: s_file = os.path.abspath(s_file) callgraph_[source] = (s_file, s_function, frame, targets) callgraph = callgraph_ if not everything: callgraph_ = co.defaultdict(lambda: (None, None, 0, set())) for source, (s_file, s_function, frame, targets) in callgraph.items(): # discard filtered sources if sources is not None and not any( os.path.abspath(s_file) == os.path.abspath(s) for s in sources): continue # discard internal functions if s_function.startswith('__'): continue callgraph_[source] = (s_file, s_function, frame, targets) callgraph = callgraph_ # find maximum stack size recursively, this requires also detecting cycles # (in case of recursion) def find_limit(source, seen=None): seen = seen or set() if source not in callgraph: return 0 _, _, frame, targets = callgraph[source] limit = 0 for target in targets: if target in seen: # found a cycle return m.inf limit_ = find_limit(target, seen | {target}) limit = max(limit, limit_) return frame + limit def find_children(targets): children = set() for target in targets: if target in callgraph: t_file, t_function, _, _ = callgraph[target] children.add((t_file, t_function)) return children # build results results = [] for source, (s_file, s_function, frame, targets) in callgraph.items(): limit = find_limit(source) children = find_children(targets) results.append(StackResult(s_file, s_function, frame, limit, children)) return results def fold(Result, results, *, by=None, defines=None, **_): if by is None: by = Result._by for k in it.chain(by or [], (k for k, _ in defines or [])): if k not in Result._by and k not in Result._fields: print("error: could not find field %r?" % k) sys.exit(-1) # filter by matching defines if defines is not None: results_ = [] for r in results: if all(getattr(r, k) in vs for k, vs in defines): results_.append(r) results = results_ # organize results into conflicts folding = co.OrderedDict() for r in results: name = tuple(getattr(r, k) for k in by) if name not in folding: folding[name] = [] folding[name].append(r) # merge conflicts folded = [] for name, rs in folding.items(): folded.append(sum(rs[1:], start=rs[0])) return folded def table(Result, results, diff_results=None, *, by=None, fields=None, sort=None, summary=False, all=False, percent=False, tree=False, depth=1, **_): all_, all = all, __builtins__.all if by is None: by = Result._by if fields is None: fields = Result._fields types = Result._types # fold again results = fold(Result, results, by=by) if diff_results is not None: diff_results = fold(Result, diff_results, by=by) # organize by name table = { ','.join(str(getattr(r, k) or '') for k in by): r for r in results} diff_table = { ','.join(str(getattr(r, k) or '') for k in by): r for r in diff_results or []} names = list(table.keys() | diff_table.keys()) # sort again, now with diff info, note that python's sort is stable names.sort() if diff_results is not None: names.sort(key=lambda n: tuple( types[k].ratio( getattr(table.get(n), k, None), getattr(diff_table.get(n), k, None)) for k in fields), reverse=True) if sort: for k, reverse in reversed(sort): names.sort( key=lambda n: tuple( (getattr(table[n], k),) if getattr(table.get(n), k, None) is not None else () for k in ([k] if k else [ k for k in Result._sort if k in fields])), reverse=reverse ^ (not k or k in Result._fields)) # build up our lines lines = [] # header header = [] header.append('%s%s' % ( ','.join(by), ' (%d added, %d removed)' % ( sum(1 for n in table if n not in diff_table), sum(1 for n in diff_table if n not in table)) if diff_results is not None and not percent else '') if not summary else '') if diff_results is None: for k in fields: header.append(k) elif percent: for k in fields: header.append(k) else: for k in fields: header.append('o'+k) for k in fields: header.append('n'+k) for k in fields: header.append('d'+k) header.append('') lines.append(header) def table_entry(name, r, diff_r=None, ratios=[]): entry = [] entry.append(name) if diff_results is None: for k in fields: entry.append(getattr(r, k).table() if getattr(r, k, None) is not None else types[k].none) elif percent: for k in fields: entry.append(getattr(r, k).diff_table() if getattr(r, k, None) is not None else types[k].diff_none) else: for k in fields: entry.append(getattr(diff_r, k).diff_table() if getattr(diff_r, k, None) is not None else types[k].diff_none) for k in fields: entry.append(getattr(r, k).diff_table() if getattr(r, k, None) is not None else types[k].diff_none) for k in fields: entry.append(types[k].diff_diff( getattr(r, k, None), getattr(diff_r, k, None))) if diff_results is None: entry.append('') elif percent: entry.append(' (%s)' % ', '.join( '+∞%' if t == +m.inf else '-∞%' if t == -m.inf else '%+.1f%%' % (100*t) for t in ratios)) else: entry.append(' (%s)' % ', '.join( '+∞%' if t == +m.inf else '-∞%' if t == -m.inf else '%+.1f%%' % (100*t) for t in ratios if t) if any(ratios) else '') return entry # entries if not summary: for name in names: r = table.get(name) if diff_results is None: diff_r = None ratios = None else: diff_r = diff_table.get(name) ratios = [ types[k].ratio( getattr(r, k, None), getattr(diff_r, k, None)) for k in fields] if not all_ and not any(ratios): continue lines.append(table_entry(name, r, diff_r, ratios)) # total r = next(iter(fold(Result, results, by=[])), None) if diff_results is None: diff_r = None ratios = None else: diff_r = next(iter(fold(Result, diff_results, by=[])), None) ratios = [ types[k].ratio( getattr(r, k, None), getattr(diff_r, k, None)) for k in fields] lines.append(table_entry('TOTAL', r, diff_r, ratios)) # find the best widths, note that column 0 contains the names and column -1 # the ratios, so those are handled a bit differently widths = [ ((max(it.chain([w], (len(l[i]) for l in lines)))+1+4-1)//4)*4-1 for w, i in zip( it.chain([23], it.repeat(7)), range(len(lines[0])-1))] # adjust the name width based on the expected call depth, though # note this doesn't really work with unbounded recursion if not summary and not m.isinf(depth): widths[0] += 4*(depth-1) # print the tree recursively if not tree: print('%-*s %s%s' % ( widths[0], lines[0][0], ' '.join('%*s' % (w, x) for w, x in zip(widths[1:], lines[0][1:-1])), lines[0][-1])) if not summary: line_table = {n: l for n, l in zip(names, lines[1:-1])} def recurse(names_, depth_, prefixes=('', '', '', '')): for i, name in enumerate(names_): if name not in line_table: continue line = line_table[name] is_last = (i == len(names_)-1) print('%s%-*s ' % ( prefixes[0+is_last], widths[0] - ( len(prefixes[0+is_last]) if not m.isinf(depth) else 0), line[0]), end='') if not tree: print(' %s%s' % ( ' '.join('%*s' % (w, x) for w, x in zip(widths[1:], line[1:-1])), line[-1]), end='') print() # recurse? if name in table and depth_ > 1: children = { ','.join(str(getattr(Result(*c), k) or '') for k in by) for c in table[name].children} recurse( # note we're maintaining sort order [n for n in names if n in children], depth_-1, (prefixes[2+is_last] + "|-> ", prefixes[2+is_last] + "'-> ", prefixes[2+is_last] + "| ", prefixes[2+is_last] + " ")) recurse(names, depth) if not tree: print('%-*s %s%s' % ( widths[0], lines[-1][0], ' '.join('%*s' % (w, x) for w, x in zip(widths[1:], lines[-1][1:-1])), lines[-1][-1])) def main(ci_paths, by=None, fields=None, defines=None, sort=None, **args): # it doesn't really make sense to not have a depth with tree, # so assume depth=inf if tree by default if args.get('depth') is None: args['depth'] = m.inf if args['tree'] else 1 elif args.get('depth') == 0: args['depth'] = m.inf # find sizes if not args.get('use', None): results = collect(ci_paths, **args) else: results = [] with openio(args['use']) as f: reader = csv.DictReader(f, restval='') for r in reader: if not any('stack_'+k in r and r['stack_'+k].strip() for k in StackResult._fields): continue try: results.append(StackResult( **{k: r[k] for k in StackResult._by if k in r and r[k].strip()}, **{k: r['stack_'+k] for k in StackResult._fields if 'stack_'+k in r and r['stack_'+k].strip()})) except TypeError: pass # fold results = fold(StackResult, results, by=by, defines=defines) # sort, note that python's sort is stable results.sort() if sort: for k, reverse in reversed(sort): results.sort( key=lambda r: tuple( (getattr(r, k),) if getattr(r, k) is not None else () for k in ([k] if k else StackResult._sort)), reverse=reverse ^ (not k or k in StackResult._fields)) # write results to CSV if args.get('output'): with openio(args['output'], 'w') as f: writer = csv.DictWriter(f, (by if by is not None else StackResult._by) + ['stack_'+k for k in ( fields if fields is not None else StackResult._fields)]) writer.writeheader() for r in results: writer.writerow( {k: getattr(r, k) for k in ( by if by is not None else StackResult._by)} | {'stack_'+k: getattr(r, k) for k in ( fields if fields is not None else StackResult._fields)}) # find previous results? if args.get('diff'): diff_results = [] try: with openio(args['diff']) as f: reader = csv.DictReader(f, restval='') for r in reader: if not any('stack_'+k in r and r['stack_'+k].strip() for k in StackResult._fields): continue try: diff_results.append(StackResult( **{k: r[k] for k in StackResult._by if k in r and r[k].strip()}, **{k: r['stack_'+k] for k in StackResult._fields if 'stack_'+k in r and r['stack_'+k].strip()})) except TypeError: raise except FileNotFoundError: pass # fold diff_results = fold(StackResult, diff_results, by=by, defines=defines) # print table if not args.get('quiet'): table(StackResult, results, diff_results if args.get('diff') else None, by=by if by is not None else ['function'], fields=fields, sort=sort, **args) # error on recursion if args.get('error_on_recursion') and any( m.isinf(float(r.limit)) for r in results): sys.exit(2) if __name__ == "__main__": import argparse import sys parser = argparse.ArgumentParser( description="Find stack usage at the function level.", allow_abbrev=False) parser.add_argument( 'ci_paths', nargs='*', help="Input *.ci files.") parser.add_argument( '-v', '--verbose', action='store_true', help="Output commands that run behind the scenes.") parser.add_argument( '-q', '--quiet', action='store_true', help="Don't show anything, useful with -o.") parser.add_argument( '-o', '--output', help="Specify CSV file to store results.") parser.add_argument( '-u', '--use', help="Don't parse anything, use this CSV file.") parser.add_argument( '-d', '--diff', help="Specify CSV file to diff against.") parser.add_argument( '-a', '--all', action='store_true', help="Show all, not just the ones that changed.") parser.add_argument( '-p', '--percent', action='store_true', help="Only show percentage change, not a full diff.") parser.add_argument( '-b', '--by', action='append', choices=StackResult._by, help="Group by this field.") parser.add_argument( '-f', '--field', dest='fields', action='append', choices=StackResult._fields, help="Show this field.") parser.add_argument( '-D', '--define', dest='defines', action='append', type=lambda x: (lambda k,v: (k, set(v.split(','))))(*x.split('=', 1)), help="Only include results where this field is this value.") class AppendSort(argparse.Action): def __call__(self, parser, namespace, value, option): if namespace.sort is None: namespace.sort = [] namespace.sort.append((value, True if option == '-S' else False)) parser.add_argument( '-s', '--sort', nargs='?', action=AppendSort, help="Sort by this field.") parser.add_argument( '-S', '--reverse-sort', nargs='?', action=AppendSort, help="Sort by this field, but backwards.") parser.add_argument( '-Y', '--summary', action='store_true', help="Only show the total.") parser.add_argument( '-F', '--source', dest='sources', action='append', help="Only consider definitions in this file. Defaults to anything " "in the current directory.") parser.add_argument( '--everything', action='store_true', help="Include builtin and libc specific symbols.") parser.add_argument( '--tree', action='store_true', help="Only show the function call tree.") parser.add_argument( '-Z', '--depth', nargs='?', type=lambda x: int(x, 0), const=0, help="Depth of function calls to show. 0 shows all calls but may not " "terminate!") parser.add_argument( '-e', '--error-on-recursion', action='store_true', help="Error if any functions are recursive.") sys.exit(main(**{k: v for k, v in vars(parser.parse_intermixed_args()).items() if v is not None}))