stack.py 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393
  1. #!/usr/bin/env python3
  2. #
  3. # Script to find stack usage at the function level. Will detect recursion and
  4. # report as infinite stack usage.
  5. #
  6. import os
  7. import glob
  8. import itertools as it
  9. import re
  10. import csv
  11. import collections as co
  12. import math as m
  13. CI_PATHS = ['*.ci']
  14. def collect(paths, **args):
  15. # parse the vcg format
  16. k_pattern = re.compile('([a-z]+)\s*:', re.DOTALL)
  17. v_pattern = re.compile('(?:"(.*?)"|([a-z]+))', re.DOTALL)
  18. def parse_vcg(rest):
  19. def parse_vcg(rest):
  20. node = []
  21. while True:
  22. rest = rest.lstrip()
  23. m = k_pattern.match(rest)
  24. if not m:
  25. return (node, rest)
  26. k, rest = m.group(1), rest[m.end(0):]
  27. rest = rest.lstrip()
  28. if rest.startswith('{'):
  29. v, rest = parse_vcg(rest[1:])
  30. assert rest[0] == '}', "unexpected %r" % rest[0:1]
  31. rest = rest[1:]
  32. node.append((k, v))
  33. else:
  34. m = v_pattern.match(rest)
  35. assert m, "unexpected %r" % rest[0:1]
  36. v, rest = m.group(1) or m.group(2), rest[m.end(0):]
  37. node.append((k, v))
  38. node, rest = parse_vcg(rest)
  39. assert rest == '', "unexpected %r" % rest[0:1]
  40. return node
  41. # collect into functions
  42. results = co.defaultdict(lambda: (None, None, 0, set()))
  43. f_pattern = re.compile(
  44. r'([^\\]*)\\n([^:]*)[^\\]*\\n([0-9]+) bytes \((.*)\)')
  45. for path in paths:
  46. with open(path) as f:
  47. vcg = parse_vcg(f.read())
  48. for k, graph in vcg:
  49. if k != 'graph':
  50. continue
  51. for k, info in graph:
  52. if k == 'node':
  53. info = dict(info)
  54. m = f_pattern.match(info['label'])
  55. if m:
  56. function, file, size, type = m.groups()
  57. if not args.get('quiet') and type != 'static':
  58. print('warning: found non-static stack for %s (%s)'
  59. % (function, type))
  60. _, _, _, targets = results[info['title']]
  61. results[info['title']] = (
  62. file, function, int(size), targets)
  63. elif k == 'edge':
  64. info = dict(info)
  65. _, _, _, targets = results[info['sourcename']]
  66. targets.add(info['targetname'])
  67. else:
  68. continue
  69. if not args.get('everything'):
  70. for source, (s_file, s_function, _, _) in list(results.items()):
  71. # discard internal functions
  72. if s_file.startswith('<') or s_file.startswith('/usr/include'):
  73. del results[source]
  74. # find maximum stack size recursively, this requires also detecting cycles
  75. # (in case of recursion)
  76. def find_limit(source, seen=None):
  77. seen = seen or set()
  78. if source not in results:
  79. return 0
  80. _, _, frame, targets = results[source]
  81. limit = 0
  82. for target in targets:
  83. if target in seen:
  84. # found a cycle
  85. return float('inf')
  86. limit_ = find_limit(target, seen | {target})
  87. limit = max(limit, limit_)
  88. return frame + limit
  89. def find_deps(targets):
  90. deps = set()
  91. for target in targets:
  92. if target in results:
  93. t_file, t_function, _, _ = results[target]
  94. deps.add((t_file, t_function))
  95. return deps
  96. # flatten into a list
  97. flat_results = []
  98. for source, (s_file, s_function, frame, targets) in results.items():
  99. limit = find_limit(source)
  100. deps = find_deps(targets)
  101. flat_results.append((s_file, s_function, frame, limit, deps))
  102. return flat_results
  103. def main(**args):
  104. # find sizes
  105. if not args.get('use', None):
  106. # find .ci files
  107. paths = []
  108. for path in args['ci_paths']:
  109. if os.path.isdir(path):
  110. path = path + '/*.ci'
  111. for path in glob.glob(path):
  112. paths.append(path)
  113. if not paths:
  114. print('no .ci files found in %r?' % args['ci_paths'])
  115. sys.exit(-1)
  116. results = collect(paths, **args)
  117. else:
  118. with open(args['use']) as f:
  119. r = csv.DictReader(f)
  120. results = [
  121. ( result['file'],
  122. result['function'],
  123. int(result['stack_frame']),
  124. float(result['stack_limit']), # note limit can be inf
  125. set())
  126. for result in r]
  127. total_frame = 0
  128. total_limit = 0
  129. for _, _, frame, limit, _ in results:
  130. total_frame += frame
  131. total_limit = max(total_limit, limit)
  132. # find previous results?
  133. if args.get('diff'):
  134. try:
  135. with open(args['diff']) as f:
  136. r = csv.DictReader(f)
  137. prev_results = [
  138. ( result['file'],
  139. result['function'],
  140. int(result['stack_frame']),
  141. float(result['stack_limit']),
  142. set())
  143. for result in r]
  144. except FileNotFoundError:
  145. prev_results = []
  146. prev_total_frame = 0
  147. prev_total_limit = 0
  148. for _, _, frame, limit, _ in prev_results:
  149. prev_total_frame += frame
  150. prev_total_limit = max(prev_total_limit, limit)
  151. # write results to CSV
  152. if args.get('output'):
  153. with open(args['output'], 'w') as f:
  154. w = csv.writer(f)
  155. w.writerow(['file', 'function', 'stack_frame', 'stack_limit'])
  156. for file, func, frame, limit, _ in sorted(results):
  157. w.writerow((file, func, frame, limit))
  158. # print results
  159. def dedup_entries(results, by='function'):
  160. entries = co.defaultdict(lambda: (0, 0, set()))
  161. for file, func, frame, limit, deps in results:
  162. entry = (file if by == 'file' else func)
  163. entry_frame, entry_limit, entry_deps = entries[entry]
  164. entries[entry] = (
  165. entry_frame + frame,
  166. max(entry_limit, limit),
  167. entry_deps | {file if by == 'file' else func
  168. for file, func in deps})
  169. return entries
  170. def diff_entries(olds, news):
  171. diff = co.defaultdict(lambda: (None, None, None, None, 0, 0, 0, set()))
  172. for name, (new_frame, new_limit, deps) in news.items():
  173. diff[name] = (
  174. None, None,
  175. new_frame, new_limit,
  176. new_frame, new_limit,
  177. 1.0,
  178. deps)
  179. for name, (old_frame, old_limit, _) in olds.items():
  180. _, _, new_frame, new_limit, _, _, _, deps = diff[name]
  181. diff[name] = (
  182. old_frame, old_limit,
  183. new_frame, new_limit,
  184. (new_frame or 0) - (old_frame or 0),
  185. 0 if m.isinf(new_limit or 0) and m.isinf(old_limit or 0)
  186. else (new_limit or 0) - (old_limit or 0),
  187. 0.0 if m.isinf(new_limit or 0) and m.isinf(old_limit or 0)
  188. else +float('inf') if m.isinf(new_limit or 0)
  189. else -float('inf') if m.isinf(old_limit or 0)
  190. else +0.0 if not old_limit and not new_limit
  191. else +1.0 if not old_limit
  192. else ((new_limit or 0) - (old_limit or 0))/(old_limit or 0),
  193. deps)
  194. return diff
  195. def sorted_entries(entries):
  196. if args.get('limit_sort'):
  197. return sorted(entries, key=lambda x: (-x[1][1], x))
  198. elif args.get('reverse_limit_sort'):
  199. return sorted(entries, key=lambda x: (+x[1][1], x))
  200. elif args.get('frame_sort'):
  201. return sorted(entries, key=lambda x: (-x[1][0], x))
  202. elif args.get('reverse_frame_sort'):
  203. return sorted(entries, key=lambda x: (+x[1][0], x))
  204. else:
  205. return sorted(entries)
  206. def sorted_diff_entries(entries):
  207. if args.get('limit_sort'):
  208. return sorted(entries, key=lambda x: (-(x[1][3] or 0), x))
  209. elif args.get('reverse_limit_sort'):
  210. return sorted(entries, key=lambda x: (+(x[1][3] or 0), x))
  211. elif args.get('frame_sort'):
  212. return sorted(entries, key=lambda x: (-(x[1][2] or 0), x))
  213. elif args.get('reverse_frame_sort'):
  214. return sorted(entries, key=lambda x: (+(x[1][2] or 0), x))
  215. else:
  216. return sorted(entries, key=lambda x: (-x[1][6], x))
  217. def print_header(by=''):
  218. if not args.get('diff'):
  219. print('%-36s %7s %7s' % (by, 'frame', 'limit'))
  220. else:
  221. print('%-36s %15s %15s %15s' % (by, 'old', 'new', 'diff'))
  222. def print_entry(name, frame, limit):
  223. print("%-36s %7d %7s" % (name,
  224. frame, '∞' if m.isinf(limit) else int(limit)))
  225. def print_diff_entry(name,
  226. old_frame, old_limit,
  227. new_frame, new_limit,
  228. diff_frame, diff_limit,
  229. ratio):
  230. print('%-36s %7s %7s %7s %7s %+7d %7s%s' % (name,
  231. old_frame if old_frame is not None else "-",
  232. ('∞' if m.isinf(old_limit) else int(old_limit))
  233. if old_limit is not None else "-",
  234. new_frame if new_frame is not None else "-",
  235. ('∞' if m.isinf(new_limit) else int(new_limit))
  236. if new_limit is not None else "-",
  237. diff_frame,
  238. ('+∞' if diff_limit > 0 and m.isinf(diff_limit)
  239. else '-∞' if diff_limit < 0 and m.isinf(diff_limit)
  240. else '%+d' % diff_limit),
  241. '' if not ratio
  242. else ' (+∞%)' if ratio > 0 and m.isinf(ratio)
  243. else ' (-∞%)' if ratio < 0 and m.isinf(ratio)
  244. else ' (%+.1f%%)' % (100*ratio)))
  245. def print_entries(by='function'):
  246. # build optional tree of dependencies
  247. def print_deps(entries, depth, print,
  248. filter=lambda _: True,
  249. prefixes=('', '', '', '')):
  250. entries = entries if isinstance(entries, list) else list(entries)
  251. filtered_entries = [(name, entry)
  252. for name, entry in entries
  253. if filter(name)]
  254. for i, (name, entry) in enumerate(filtered_entries):
  255. last = (i == len(filtered_entries)-1)
  256. print(prefixes[0+last] + name, entry)
  257. if depth > 0:
  258. deps = entry[-1]
  259. print_deps(entries, depth-1, print,
  260. lambda name: name in deps,
  261. ( prefixes[2+last] + "|-> ",
  262. prefixes[2+last] + "'-> ",
  263. prefixes[2+last] + "| ",
  264. prefixes[2+last] + " "))
  265. entries = dedup_entries(results, by=by)
  266. if not args.get('diff'):
  267. print_header(by=by)
  268. print_deps(
  269. sorted_entries(entries.items()),
  270. args.get('depth') or 0,
  271. lambda name, entry: print_entry(name, *entry[:-1]))
  272. else:
  273. prev_entries = dedup_entries(prev_results, by=by)
  274. diff = diff_entries(prev_entries, entries)
  275. print_header(by='%s (%d added, %d removed)' % (by,
  276. sum(1 for _, old, _, _, _, _, _, _ in diff.values() if old is None),
  277. sum(1 for _, _, _, new, _, _, _, _ in diff.values() if new is None)))
  278. print_deps(
  279. filter(
  280. lambda x: x[1][6] or args.get('all'),
  281. sorted_diff_entries(diff.items())),
  282. args.get('depth') or 0,
  283. lambda name, entry: print_diff_entry(name, *entry[:-1]))
  284. def print_totals():
  285. if not args.get('diff'):
  286. print_entry('TOTAL', total_frame, total_limit)
  287. else:
  288. diff_frame = total_frame - prev_total_frame
  289. diff_limit = (
  290. 0 if m.isinf(total_limit or 0) and m.isinf(prev_total_limit or 0)
  291. else (total_limit or 0) - (prev_total_limit or 0))
  292. ratio = (
  293. 0.0 if m.isinf(total_limit or 0) and m.isinf(prev_total_limit or 0)
  294. else +float('inf') if m.isinf(total_limit or 0)
  295. else -float('inf') if m.isinf(prev_total_limit or 0)
  296. else 0.0 if not prev_total_limit and not total_limit
  297. else 1.0 if not prev_total_limit
  298. else ((total_limit or 0) - (prev_total_limit or 0))/(prev_total_limit or 0))
  299. print_diff_entry('TOTAL',
  300. prev_total_frame, prev_total_limit,
  301. total_frame, total_limit,
  302. diff_frame, diff_limit,
  303. ratio)
  304. if args.get('quiet'):
  305. pass
  306. elif args.get('summary'):
  307. print_header()
  308. print_totals()
  309. elif args.get('files'):
  310. print_entries(by='file')
  311. print_totals()
  312. else:
  313. print_entries(by='function')
  314. print_totals()
  315. if __name__ == "__main__":
  316. import argparse
  317. import sys
  318. parser = argparse.ArgumentParser(
  319. description="Find stack usage at the function level.")
  320. parser.add_argument('ci_paths', nargs='*', default=CI_PATHS,
  321. help="Description of where to find *.ci files. May be a directory \
  322. or a list of paths. Defaults to %r." % CI_PATHS)
  323. parser.add_argument('-v', '--verbose', action='store_true',
  324. help="Output commands that run behind the scenes.")
  325. parser.add_argument('-o', '--output',
  326. help="Specify CSV file to store results.")
  327. parser.add_argument('-u', '--use',
  328. help="Don't parse callgraph files, instead use this CSV file.")
  329. parser.add_argument('-d', '--diff',
  330. help="Specify CSV file to diff against.")
  331. parser.add_argument('-a', '--all', action='store_true',
  332. help="Show all functions, not just the ones that changed.")
  333. parser.add_argument('-A', '--everything', action='store_true',
  334. help="Include builtin and libc specific symbols.")
  335. parser.add_argument('-s', '--limit-sort', action='store_true',
  336. help="Sort by stack limit.")
  337. parser.add_argument('-S', '--reverse-limit-sort', action='store_true',
  338. help="Sort by stack limit, but backwards.")
  339. parser.add_argument('-f', '--frame-sort', action='store_true',
  340. help="Sort by stack frame size.")
  341. parser.add_argument('-F', '--reverse-frame-sort', action='store_true',
  342. help="Sort by stack frame size, but backwards.")
  343. parser.add_argument('-L', '--depth', default=0, type=lambda x: int(x, 0),
  344. nargs='?', const=float('inf'),
  345. help="Depth of dependencies to show.")
  346. parser.add_argument('--files', action='store_true',
  347. help="Show file-level calls.")
  348. parser.add_argument('--summary', action='store_true',
  349. help="Only show the total stack size.")
  350. parser.add_argument('-q', '--quiet', action='store_true',
  351. help="Don't show anything, useful with -o.")
  352. parser.add_argument('--build-dir',
  353. help="Specify the relative build directory. Used to map object files \
  354. to the correct source files.")
  355. sys.exit(main(**vars(parser.parse_args())))