stack.py 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439
  1. #!/usr/bin/env python3
  2. #
  3. # Script to find stack usage at the function level. Will detect recursion and
  4. # report as infinite stack usage.
  5. #
  6. import os
  7. import glob
  8. import itertools as it
  9. import re
  10. import csv
  11. import collections as co
  12. import math as m
  13. CI_PATHS = ['*.ci']
  14. def openio(path, mode='r'):
  15. if path == '-':
  16. if 'r' in mode:
  17. return os.fdopen(os.dup(sys.stdin.fileno()), 'r')
  18. else:
  19. return os.fdopen(os.dup(sys.stdout.fileno()), 'w')
  20. else:
  21. return open(path, mode)
  22. def collect(paths, **args):
  23. # parse the vcg format
  24. k_pattern = re.compile('([a-z]+)\s*:', re.DOTALL)
  25. v_pattern = re.compile('(?:"(.*?)"|([a-z]+))', re.DOTALL)
  26. def parse_vcg(rest):
  27. def parse_vcg(rest):
  28. node = []
  29. while True:
  30. rest = rest.lstrip()
  31. m = k_pattern.match(rest)
  32. if not m:
  33. return (node, rest)
  34. k, rest = m.group(1), rest[m.end(0):]
  35. rest = rest.lstrip()
  36. if rest.startswith('{'):
  37. v, rest = parse_vcg(rest[1:])
  38. assert rest[0] == '}', "unexpected %r" % rest[0:1]
  39. rest = rest[1:]
  40. node.append((k, v))
  41. else:
  42. m = v_pattern.match(rest)
  43. assert m, "unexpected %r" % rest[0:1]
  44. v, rest = m.group(1) or m.group(2), rest[m.end(0):]
  45. node.append((k, v))
  46. node, rest = parse_vcg(rest)
  47. assert rest == '', "unexpected %r" % rest[0:1]
  48. return node
  49. # collect into functions
  50. results = co.defaultdict(lambda: (None, None, 0, set()))
  51. f_pattern = re.compile(
  52. r'([^\\]*)\\n([^:]*)[^\\]*\\n([0-9]+) bytes \((.*)\)')
  53. for path in paths:
  54. with open(path) as f:
  55. vcg = parse_vcg(f.read())
  56. for k, graph in vcg:
  57. if k != 'graph':
  58. continue
  59. for k, info in graph:
  60. if k == 'node':
  61. info = dict(info)
  62. m = f_pattern.match(info['label'])
  63. if m:
  64. function, file, size, type = m.groups()
  65. if not args.get('quiet') and type != 'static':
  66. print('warning: found non-static stack for %s (%s)'
  67. % (function, type))
  68. _, _, _, targets = results[info['title']]
  69. results[info['title']] = (
  70. file, function, int(size), targets)
  71. elif k == 'edge':
  72. info = dict(info)
  73. _, _, _, targets = results[info['sourcename']]
  74. targets.add(info['targetname'])
  75. else:
  76. continue
  77. if not args.get('everything'):
  78. for source, (s_file, s_function, _, _) in list(results.items()):
  79. # discard internal functions
  80. if s_file.startswith('<') or s_file.startswith('/usr/include'):
  81. del results[source]
  82. # find maximum stack size recursively, this requires also detecting cycles
  83. # (in case of recursion)
  84. def find_limit(source, seen=None):
  85. seen = seen or set()
  86. if source not in results:
  87. return 0
  88. _, _, frame, targets = results[source]
  89. limit = 0
  90. for target in targets:
  91. if target in seen:
  92. # found a cycle
  93. return float('inf')
  94. limit_ = find_limit(target, seen | {target})
  95. limit = max(limit, limit_)
  96. return frame + limit
  97. def find_deps(targets):
  98. deps = set()
  99. for target in targets:
  100. if target in results:
  101. t_file, t_function, _, _ = results[target]
  102. deps.add((t_file, t_function))
  103. return deps
  104. # flatten into a list
  105. flat_results = []
  106. for source, (s_file, s_function, frame, targets) in results.items():
  107. limit = find_limit(source)
  108. deps = find_deps(targets)
  109. flat_results.append((s_file, s_function, frame, limit, deps))
  110. return flat_results
  111. def main(**args):
  112. # find sizes
  113. if not args.get('use', None):
  114. # find .ci files
  115. paths = []
  116. for path in args['ci_paths']:
  117. if os.path.isdir(path):
  118. path = path + '/*.ci'
  119. for path in glob.glob(path):
  120. paths.append(path)
  121. if not paths:
  122. print('no .ci files found in %r?' % args['ci_paths'])
  123. sys.exit(-1)
  124. results = collect(paths, **args)
  125. else:
  126. with openio(args['use']) as f:
  127. r = csv.DictReader(f)
  128. results = [
  129. ( result['file'],
  130. result['name'],
  131. int(result['stack_frame']),
  132. float(result['stack_limit']), # note limit can be inf
  133. set())
  134. for result in r
  135. if result.get('stack_frame') not in {None, ''}
  136. if result.get('stack_limit') not in {None, ''}]
  137. total_frame = 0
  138. total_limit = 0
  139. for _, _, frame, limit, _ in results:
  140. total_frame += frame
  141. total_limit = max(total_limit, limit)
  142. # find previous results?
  143. if args.get('diff'):
  144. try:
  145. with openio(args['diff']) as f:
  146. r = csv.DictReader(f)
  147. prev_results = [
  148. ( result['file'],
  149. result['name'],
  150. int(result['stack_frame']),
  151. float(result['stack_limit']),
  152. set())
  153. for result in r
  154. if result.get('stack_frame') not in {None, ''}
  155. if result.get('stack_limit') not in {None, ''}]
  156. except FileNotFoundError:
  157. prev_results = []
  158. prev_total_frame = 0
  159. prev_total_limit = 0
  160. for _, _, frame, limit, _ in prev_results:
  161. prev_total_frame += frame
  162. prev_total_limit = max(prev_total_limit, limit)
  163. # write results to CSV
  164. if args.get('output'):
  165. merged_results = co.defaultdict(lambda: {})
  166. other_fields = []
  167. # merge?
  168. if args.get('merge'):
  169. try:
  170. with openio(args['merge']) as f:
  171. r = csv.DictReader(f)
  172. for result in r:
  173. file = result.pop('file', '')
  174. func = result.pop('name', '')
  175. result.pop('stack_frame', None)
  176. result.pop('stack_limit', None)
  177. merged_results[(file, func)] = result
  178. other_fields = result.keys()
  179. except FileNotFoundError:
  180. pass
  181. for file, func, frame, limit, _ in results:
  182. merged_results[(file, func)]['stack_frame'] = frame
  183. merged_results[(file, func)]['stack_limit'] = limit
  184. with openio(args['output'], 'w') as f:
  185. w = csv.DictWriter(f, ['file', 'name', *other_fields, 'stack_frame', 'stack_limit'])
  186. w.writeheader()
  187. for (file, func), result in sorted(merged_results.items()):
  188. w.writerow({'file': file, 'name': func, **result})
  189. # print results
  190. def dedup_entries(results, by='name'):
  191. entries = co.defaultdict(lambda: (0, 0, set()))
  192. for file, func, frame, limit, deps in results:
  193. entry = (file if by == 'file' else func)
  194. entry_frame, entry_limit, entry_deps = entries[entry]
  195. entries[entry] = (
  196. entry_frame + frame,
  197. max(entry_limit, limit),
  198. entry_deps | {file if by == 'file' else func
  199. for file, func in deps})
  200. return entries
  201. def diff_entries(olds, news):
  202. diff = co.defaultdict(lambda: (None, None, None, None, 0, 0, 0, set()))
  203. for name, (new_frame, new_limit, deps) in news.items():
  204. diff[name] = (
  205. None, None,
  206. new_frame, new_limit,
  207. new_frame, new_limit,
  208. 1.0,
  209. deps)
  210. for name, (old_frame, old_limit, _) in olds.items():
  211. _, _, new_frame, new_limit, _, _, _, deps = diff[name]
  212. diff[name] = (
  213. old_frame, old_limit,
  214. new_frame, new_limit,
  215. (new_frame or 0) - (old_frame or 0),
  216. 0 if m.isinf(new_limit or 0) and m.isinf(old_limit or 0)
  217. else (new_limit or 0) - (old_limit or 0),
  218. 0.0 if m.isinf(new_limit or 0) and m.isinf(old_limit or 0)
  219. else +float('inf') if m.isinf(new_limit or 0)
  220. else -float('inf') if m.isinf(old_limit or 0)
  221. else +0.0 if not old_limit and not new_limit
  222. else +1.0 if not old_limit
  223. else ((new_limit or 0) - (old_limit or 0))/(old_limit or 0),
  224. deps)
  225. return diff
  226. def sorted_entries(entries):
  227. if args.get('limit_sort'):
  228. return sorted(entries, key=lambda x: (-x[1][1], x))
  229. elif args.get('reverse_limit_sort'):
  230. return sorted(entries, key=lambda x: (+x[1][1], x))
  231. elif args.get('frame_sort'):
  232. return sorted(entries, key=lambda x: (-x[1][0], x))
  233. elif args.get('reverse_frame_sort'):
  234. return sorted(entries, key=lambda x: (+x[1][0], x))
  235. else:
  236. return sorted(entries)
  237. def sorted_diff_entries(entries):
  238. if args.get('limit_sort'):
  239. return sorted(entries, key=lambda x: (-(x[1][3] or 0), x))
  240. elif args.get('reverse_limit_sort'):
  241. return sorted(entries, key=lambda x: (+(x[1][3] or 0), x))
  242. elif args.get('frame_sort'):
  243. return sorted(entries, key=lambda x: (-(x[1][2] or 0), x))
  244. elif args.get('reverse_frame_sort'):
  245. return sorted(entries, key=lambda x: (+(x[1][2] or 0), x))
  246. else:
  247. return sorted(entries, key=lambda x: (-x[1][6], x))
  248. def print_header(by=''):
  249. if not args.get('diff'):
  250. print('%-36s %7s %7s' % (by, 'frame', 'limit'))
  251. else:
  252. print('%-36s %15s %15s %15s' % (by, 'old', 'new', 'diff'))
  253. def print_entry(name, frame, limit):
  254. print("%-36s %7d %7s" % (name,
  255. frame, '∞' if m.isinf(limit) else int(limit)))
  256. def print_diff_entry(name,
  257. old_frame, old_limit,
  258. new_frame, new_limit,
  259. diff_frame, diff_limit,
  260. ratio):
  261. print('%-36s %7s %7s %7s %7s %+7d %7s%s' % (name,
  262. old_frame if old_frame is not None else "-",
  263. ('∞' if m.isinf(old_limit) else int(old_limit))
  264. if old_limit is not None else "-",
  265. new_frame if new_frame is not None else "-",
  266. ('∞' if m.isinf(new_limit) else int(new_limit))
  267. if new_limit is not None else "-",
  268. diff_frame,
  269. ('+∞' if diff_limit > 0 and m.isinf(diff_limit)
  270. else '-∞' if diff_limit < 0 and m.isinf(diff_limit)
  271. else '%+d' % diff_limit),
  272. '' if not ratio
  273. else ' (+∞%)' if ratio > 0 and m.isinf(ratio)
  274. else ' (-∞%)' if ratio < 0 and m.isinf(ratio)
  275. else ' (%+.1f%%)' % (100*ratio)))
  276. def print_entries(by='name'):
  277. # build optional tree of dependencies
  278. def print_deps(entries, depth, print,
  279. filter=lambda _: True,
  280. prefixes=('', '', '', '')):
  281. entries = entries if isinstance(entries, list) else list(entries)
  282. filtered_entries = [(name, entry)
  283. for name, entry in entries
  284. if filter(name)]
  285. for i, (name, entry) in enumerate(filtered_entries):
  286. last = (i == len(filtered_entries)-1)
  287. print(prefixes[0+last] + name, entry)
  288. if depth > 0:
  289. deps = entry[-1]
  290. print_deps(entries, depth-1, print,
  291. lambda name: name in deps,
  292. ( prefixes[2+last] + "|-> ",
  293. prefixes[2+last] + "'-> ",
  294. prefixes[2+last] + "| ",
  295. prefixes[2+last] + " "))
  296. entries = dedup_entries(results, by=by)
  297. if not args.get('diff'):
  298. print_header(by=by)
  299. print_deps(
  300. sorted_entries(entries.items()),
  301. args.get('depth') or 0,
  302. lambda name, entry: print_entry(name, *entry[:-1]))
  303. else:
  304. prev_entries = dedup_entries(prev_results, by=by)
  305. diff = diff_entries(prev_entries, entries)
  306. print_header(by='%s (%d added, %d removed)' % (by,
  307. sum(1 for _, old, _, _, _, _, _, _ in diff.values() if old is None),
  308. sum(1 for _, _, _, new, _, _, _, _ in diff.values() if new is None)))
  309. print_deps(
  310. filter(
  311. lambda x: x[1][6] or args.get('all'),
  312. sorted_diff_entries(diff.items())),
  313. args.get('depth') or 0,
  314. lambda name, entry: print_diff_entry(name, *entry[:-1]))
  315. def print_totals():
  316. if not args.get('diff'):
  317. print_entry('TOTAL', total_frame, total_limit)
  318. else:
  319. diff_frame = total_frame - prev_total_frame
  320. diff_limit = (
  321. 0 if m.isinf(total_limit or 0) and m.isinf(prev_total_limit or 0)
  322. else (total_limit or 0) - (prev_total_limit or 0))
  323. ratio = (
  324. 0.0 if m.isinf(total_limit or 0) and m.isinf(prev_total_limit or 0)
  325. else +float('inf') if m.isinf(total_limit or 0)
  326. else -float('inf') if m.isinf(prev_total_limit or 0)
  327. else 0.0 if not prev_total_limit and not total_limit
  328. else 1.0 if not prev_total_limit
  329. else ((total_limit or 0) - (prev_total_limit or 0))/(prev_total_limit or 0))
  330. print_diff_entry('TOTAL',
  331. prev_total_frame, prev_total_limit,
  332. total_frame, total_limit,
  333. diff_frame, diff_limit,
  334. ratio)
  335. if args.get('quiet'):
  336. pass
  337. elif args.get('summary'):
  338. print_header()
  339. print_totals()
  340. elif args.get('files'):
  341. print_entries(by='file')
  342. print_totals()
  343. else:
  344. print_entries(by='name')
  345. print_totals()
  346. # catch recursion
  347. if args.get('error_on_recursion') and any(
  348. m.isinf(limit) for _, _, _, limit, _ in results):
  349. sys.exit(2)
  350. if __name__ == "__main__":
  351. import argparse
  352. import sys
  353. parser = argparse.ArgumentParser(
  354. description="Find stack usage at the function level.")
  355. parser.add_argument('ci_paths', nargs='*', default=CI_PATHS,
  356. help="Description of where to find *.ci files. May be a directory \
  357. or a list of paths. Defaults to %r." % CI_PATHS)
  358. parser.add_argument('-v', '--verbose', action='store_true',
  359. help="Output commands that run behind the scenes.")
  360. parser.add_argument('-q', '--quiet', action='store_true',
  361. help="Don't show anything, useful with -o.")
  362. parser.add_argument('-o', '--output',
  363. help="Specify CSV file to store results.")
  364. parser.add_argument('-u', '--use',
  365. help="Don't parse callgraph files, instead use this CSV file.")
  366. parser.add_argument('-d', '--diff',
  367. help="Specify CSV file to diff against.")
  368. parser.add_argument('-m', '--merge',
  369. help="Merge with an existing CSV file when writing to output.")
  370. parser.add_argument('-a', '--all', action='store_true',
  371. help="Show all functions, not just the ones that changed.")
  372. parser.add_argument('-A', '--everything', action='store_true',
  373. help="Include builtin and libc specific symbols.")
  374. parser.add_argument('-s', '--limit-sort', action='store_true',
  375. help="Sort by stack limit.")
  376. parser.add_argument('-S', '--reverse-limit-sort', action='store_true',
  377. help="Sort by stack limit, but backwards.")
  378. parser.add_argument('--frame-sort', action='store_true',
  379. help="Sort by stack frame size.")
  380. parser.add_argument('--reverse-frame-sort', action='store_true',
  381. help="Sort by stack frame size, but backwards.")
  382. parser.add_argument('-L', '--depth', default=0, type=lambda x: int(x, 0),
  383. nargs='?', const=float('inf'),
  384. help="Depth of dependencies to show.")
  385. parser.add_argument('-F', '--files', action='store_true',
  386. help="Show file-level calls.")
  387. parser.add_argument('-Y', '--summary', action='store_true',
  388. help="Only show the total stack size.")
  389. parser.add_argument('-e', '--error-on-recursion', action='store_true',
  390. help="Error if any functions are recursive.")
  391. parser.add_argument('--build-dir',
  392. help="Specify the relative build directory. Used to map object files \
  393. to the correct source files.")
  394. sys.exit(main(**{k: v
  395. for k, v in vars(parser.parse_args()).items()
  396. if v is not None}))