buildstats-diff 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324
  1. #!/usr/bin/env python3
  2. #
  3. # Script for comparing buildstats from two different builds
  4. #
  5. # Copyright (c) 2016, Intel Corporation.
  6. #
  7. # SPDX-License-Identifier: GPL-2.0-only
  8. #
  9. import argparse
  10. import glob
  11. import logging
  12. import math
  13. import os
  14. import pathlib
  15. import sys
  16. from operator import attrgetter
  17. # Import oe libs
  18. scripts_path = os.path.dirname(os.path.realpath(__file__))
  19. sys.path.append(os.path.join(scripts_path, 'lib'))
  20. from buildstats import BuildStats, diff_buildstats, taskdiff_fields, BSVerDiff
  21. # Setup logging
  22. logging.basicConfig(level=logging.INFO, format="%(levelname)s: %(message)s")
  23. log = logging.getLogger()
  24. class ScriptError(Exception):
  25. """Exception for internal error handling of this script"""
  26. pass
  27. def read_buildstats(path, multi):
  28. """Read buildstats"""
  29. if not os.path.exists(path):
  30. raise ScriptError("No such file or directory: {}".format(path))
  31. if os.path.isfile(path):
  32. return BuildStats.from_file_json(path)
  33. if os.path.isfile(os.path.join(path, 'build_stats')):
  34. return BuildStats.from_dir(path)
  35. # Handle a non-buildstat directory
  36. subpaths = sorted(glob.glob(path + '/*'))
  37. if len(subpaths) > 1:
  38. if multi:
  39. log.info("Averaging over {} buildstats from {}".format(
  40. len(subpaths), path))
  41. else:
  42. raise ScriptError("Multiple buildstats found in '{}'. Please give "
  43. "a single buildstat directory of use the --multi "
  44. "option".format(path))
  45. bs = None
  46. for subpath in subpaths:
  47. if os.path.isfile(subpath):
  48. _bs = BuildStats.from_file_json(subpath)
  49. else:
  50. _bs = BuildStats.from_dir(subpath)
  51. if bs is None:
  52. bs = _bs
  53. else:
  54. bs.aggregate(_bs)
  55. if not bs:
  56. raise ScriptError("No buildstats found under {}".format(path))
  57. return bs
  58. def print_ver_diff(bs1, bs2):
  59. """Print package version differences"""
  60. diff = BSVerDiff(bs1, bs2)
  61. maxlen = max([len(r) for r in set(bs1.keys()).union(set(bs2.keys()))])
  62. fmt_str = " {:{maxlen}} ({})"
  63. if diff.new:
  64. print("\nNEW RECIPES:")
  65. print("------------")
  66. for name, val in sorted(diff.new.items()):
  67. print(fmt_str.format(name, val.nevr, maxlen=maxlen))
  68. if diff.dropped:
  69. print("\nDROPPED RECIPES:")
  70. print("----------------")
  71. for name, val in sorted(diff.dropped.items()):
  72. print(fmt_str.format(name, val.nevr, maxlen=maxlen))
  73. fmt_str = " {0:{maxlen}} {1:<20} ({2})"
  74. if diff.rchanged:
  75. print("\nREVISION CHANGED:")
  76. print("-----------------")
  77. for name, val in sorted(diff.rchanged.items()):
  78. field1 = "{} -> {}".format(val.left.revision, val.right.revision)
  79. field2 = "{} -> {}".format(val.left.nevr, val.right.nevr)
  80. print(fmt_str.format(name, field1, field2, maxlen=maxlen))
  81. if diff.vchanged:
  82. print("\nVERSION CHANGED:")
  83. print("----------------")
  84. for name, val in sorted(diff.vchanged.items()):
  85. field1 = "{} -> {}".format(val.left.version, val.right.version)
  86. field2 = "{} -> {}".format(val.left.nevr, val.right.nevr)
  87. print(fmt_str.format(name, field1, field2, maxlen=maxlen))
  88. if diff.echanged:
  89. print("\nEPOCH CHANGED:")
  90. print("--------------")
  91. for name, val in sorted(diff.echanged.items()):
  92. field1 = "{} -> {}".format(val.left.epoch, val.right.epoch)
  93. field2 = "{} -> {}".format(val.left.nevr, val.right.nevr)
  94. print(fmt_str.format(name, field1, field2, maxlen=maxlen))
  95. def print_task_diff(bs1, bs2, val_type, min_val=0, min_absdiff=0, sort_by=('absdiff',), only_tasks=[]):
  96. """Diff task execution times"""
  97. def val_to_str(val, human_readable=False):
  98. """Convert raw value to printable string"""
  99. def hms_time(secs):
  100. """Get time in human-readable HH:MM:SS format"""
  101. h = int(secs / 3600)
  102. m = int((secs % 3600) / 60)
  103. s = secs % 60
  104. if h == 0:
  105. return "{:02d}:{:04.1f}".format(m, s)
  106. else:
  107. return "{:d}:{:02d}:{:04.1f}".format(h, m, s)
  108. if 'time' in val_type:
  109. if human_readable:
  110. return hms_time(val)
  111. else:
  112. return "{:.1f}s".format(val)
  113. elif 'bytes' in val_type and human_readable:
  114. prefix = ['', 'Ki', 'Mi', 'Gi', 'Ti', 'Pi']
  115. dec = int(math.log(val, 2) / 10)
  116. prec = 1 if dec > 0 else 0
  117. return "{:.{prec}f}{}B".format(val / (2 ** (10 * dec)),
  118. prefix[dec], prec=prec)
  119. elif 'ops' in val_type and human_readable:
  120. prefix = ['', 'k', 'M', 'G', 'T', 'P']
  121. dec = int(math.log(val, 1000))
  122. prec = 1 if dec > 0 else 0
  123. return "{:.{prec}f}{}ops".format(val / (1000 ** dec),
  124. prefix[dec], prec=prec)
  125. return str(int(val))
  126. def sum_vals(buildstats):
  127. """Get cumulative sum of all tasks"""
  128. total = 0.0
  129. for recipe_data in buildstats.values():
  130. for name, bs_task in recipe_data.tasks.items():
  131. if not only_tasks or name in only_tasks:
  132. total += getattr(bs_task, val_type)
  133. return total
  134. if min_val:
  135. print("Ignoring tasks less than {} ({})".format(
  136. val_to_str(min_val, True), val_to_str(min_val)))
  137. if min_absdiff:
  138. print("Ignoring differences less than {} ({})".format(
  139. val_to_str(min_absdiff, True), val_to_str(min_absdiff)))
  140. # Prepare the data
  141. tasks_diff = diff_buildstats(bs1, bs2, val_type, min_val, min_absdiff, only_tasks)
  142. # Sort our list
  143. for field in reversed(sort_by):
  144. if field.startswith('-'):
  145. field = field[1:]
  146. reverse = True
  147. else:
  148. reverse = False
  149. tasks_diff = sorted(tasks_diff, key=attrgetter(field), reverse=reverse)
  150. linedata = [(' ', 'PKG', ' ', 'TASK', 'ABSDIFF', 'RELDIFF',
  151. val_type.upper() + '1', val_type.upper() + '2')]
  152. field_lens = dict([('len_{}'.format(i), len(f)) for i, f in enumerate(linedata[0])])
  153. # Prepare fields in string format and measure field lengths
  154. for diff in tasks_diff:
  155. task_prefix = diff.task_op if diff.pkg_op == ' ' else ' '
  156. linedata.append((diff.pkg_op, diff.pkg, task_prefix, diff.task,
  157. val_to_str(diff.absdiff),
  158. '{:+.1f}%'.format(diff.reldiff),
  159. val_to_str(diff.value1),
  160. val_to_str(diff.value2)))
  161. for i, field in enumerate(linedata[-1]):
  162. key = 'len_{}'.format(i)
  163. if len(field) > field_lens[key]:
  164. field_lens[key] = len(field)
  165. # Print data
  166. print()
  167. for fields in linedata:
  168. print("{:{len_0}}{:{len_1}} {:{len_2}}{:{len_3}} {:>{len_4}} {:>{len_5}} {:>{len_6}} -> {:{len_7}}".format(
  169. *fields, **field_lens))
  170. # Print summary of the diffs
  171. total1 = sum_vals(bs1)
  172. total2 = sum_vals(bs2)
  173. print("\nCumulative {}:".format(val_type))
  174. print (" {} {:+.1f}% {} ({}) -> {} ({})".format(
  175. val_to_str(total2 - total1), 100 * (total2-total1) / total1,
  176. val_to_str(total1, True), val_to_str(total1),
  177. val_to_str(total2, True), val_to_str(total2)))
  178. def parse_args(argv):
  179. """Parse cmdline arguments"""
  180. description="""
  181. Script for comparing buildstats of two separate builds."""
  182. parser = argparse.ArgumentParser(
  183. formatter_class=argparse.ArgumentDefaultsHelpFormatter,
  184. description=description)
  185. min_val_defaults = {'cputime': 3.0,
  186. 'read_bytes': 524288,
  187. 'write_bytes': 524288,
  188. 'read_ops': 500,
  189. 'write_ops': 500,
  190. 'walltime': 5}
  191. min_absdiff_defaults = {'cputime': 1.0,
  192. 'read_bytes': 131072,
  193. 'write_bytes': 131072,
  194. 'read_ops': 50,
  195. 'write_ops': 50,
  196. 'walltime': 2}
  197. parser.add_argument('--debug', '-d', action='store_true',
  198. help="Verbose logging")
  199. parser.add_argument('--ver-diff', action='store_true',
  200. help="Show package version differences and exit")
  201. parser.add_argument('--diff-attr', default='cputime',
  202. choices=min_val_defaults.keys(),
  203. help="Buildstat attribute which to compare")
  204. parser.add_argument('--min-val', default=min_val_defaults, type=float,
  205. help="Filter out tasks less than MIN_VAL. "
  206. "Default depends on --diff-attr.")
  207. parser.add_argument('--min-absdiff', default=min_absdiff_defaults, type=float,
  208. help="Filter out tasks whose difference is less than "
  209. "MIN_ABSDIFF, Default depends on --diff-attr.")
  210. parser.add_argument('--sort-by', default='absdiff',
  211. help="Comma-separated list of field sort order. "
  212. "Prepend the field name with '-' for reversed sort. "
  213. "Available fields are: {}".format(', '.join(taskdiff_fields)))
  214. parser.add_argument('--multi', action='store_true',
  215. help="Read all buildstats from the given paths and "
  216. "average over them")
  217. parser.add_argument('--only-task', dest='only_tasks', metavar='TASK', action='append', default=[],
  218. help="Only include TASK in report. May be specified multiple times")
  219. parser.add_argument('buildstats1', metavar='BUILDSTATS1', nargs="?", help="'Left' buildstat")
  220. parser.add_argument('buildstats2', metavar='BUILDSTATS2', nargs="?", help="'Right' buildstat")
  221. args = parser.parse_args(argv)
  222. if args.buildstats1 and args.buildstats2:
  223. # Both paths specified
  224. pass
  225. elif args.buildstats1 or args.buildstats2:
  226. # Just one path specified, this is an error
  227. parser.print_usage(sys.stderr)
  228. print("Either specify two buildstats paths, or none to use the last two paths.", file=sys.stderr)
  229. sys.exit(1)
  230. else:
  231. # No paths specified, try to find the last two buildstats
  232. try:
  233. buildstats_dir = pathlib.Path(os.environ["BUILDDIR"]) / "tmp" / "buildstats"
  234. paths = sorted(buildstats_dir.iterdir())
  235. args.buildstats2 = paths.pop()
  236. args.buildstats1 = paths.pop()
  237. print(f"Comparing {args.buildstats1} -> {args.buildstats2}\n")
  238. except KeyError:
  239. parser.print_usage(sys.stderr)
  240. print("Build environment has not been configured, cannot find buildstats", file=sys.stderr)
  241. sys.exit(1)
  242. # We do not nedd/want to read all buildstats if we just want to look at the
  243. # package versions
  244. if args.ver_diff:
  245. args.multi = False
  246. # Handle defaults for the filter arguments
  247. if args.min_val is min_val_defaults:
  248. args.min_val = min_val_defaults[args.diff_attr]
  249. if args.min_absdiff is min_absdiff_defaults:
  250. args.min_absdiff = min_absdiff_defaults[args.diff_attr]
  251. return args
  252. def main(argv=None):
  253. """Script entry point"""
  254. args = parse_args(argv)
  255. if args.debug:
  256. log.setLevel(logging.DEBUG)
  257. # Validate sort fields
  258. sort_by = []
  259. for field in args.sort_by.split(','):
  260. if field.lstrip('-') not in taskdiff_fields:
  261. log.error("Invalid sort field '%s' (must be one of: %s)" %
  262. (field, ', '.join(taskdiff_fields)))
  263. sys.exit(1)
  264. sort_by.append(field)
  265. try:
  266. bs1 = read_buildstats(args.buildstats1, args.multi)
  267. bs2 = read_buildstats(args.buildstats2, args.multi)
  268. if args.ver_diff:
  269. print_ver_diff(bs1, bs2)
  270. else:
  271. print_task_diff(bs1, bs2, args.diff_attr, args.min_val,
  272. args.min_absdiff, sort_by, args.only_tasks)
  273. except ScriptError as err:
  274. log.error(str(err))
  275. return 1
  276. return 0
  277. if __name__ == "__main__":
  278. sys.exit(main())