CbC/CbC_llvm: lldb/scripts/analyze-project-deps.py annotate

annotate lldb/scripts/analyze-project-deps.py @ 220:42394fc6a535

Added tag llvm12 for changeset 0572611fdcc8

author	Shinji KONO <kono@ie.u-ryukyu.ac.jp>
date	Tue, 15 Jun 2021 19:13:43 +0900
parents	1d019706d866
children	2e18cbf3894f

rev	line source
150 1d019706d866 LLVM10 anatofuz parents: diff changeset	1 #! /usr/bin/env python
1d019706d866 LLVM10 anatofuz parents: diff changeset	2
1d019706d866 LLVM10 anatofuz parents: diff changeset	3 import argparse
1d019706d866 LLVM10 anatofuz parents: diff changeset	4 import itertools
1d019706d866 LLVM10 anatofuz parents: diff changeset	5 import os
1d019706d866 LLVM10 anatofuz parents: diff changeset	6 import re
1d019706d866 LLVM10 anatofuz parents: diff changeset	7 import sys
1d019706d866 LLVM10 anatofuz parents: diff changeset	8 from collections import defaultdict
1d019706d866 LLVM10 anatofuz parents: diff changeset	9
1d019706d866 LLVM10 anatofuz parents: diff changeset	10 from use_lldb_suite import lldb_root
1d019706d866 LLVM10 anatofuz parents: diff changeset	11
# Command-line interface: both options are plain boolean switches.
parser = argparse.ArgumentParser(
    description='Analyze LLDB project #include dependencies.')
parser.add_argument('--show-counts', default=False, action='store_true',
    help='When true, show the number of dependencies from each subproject')
# The two adjacent literals are concatenated by the parser, so the first one
# must end with a space to avoid rendering "Note,this option".
parser.add_argument('--discover-cycles', default=False, action='store_true',
    help='When true, find and display all project dependency cycles. Note, '
         'this option is very slow')

args = parser.parse_args()
1d019706d866 LLVM10 anatofuz parents: diff changeset	21
# Roots of the two trees that are scanned for #include lines.
src_dir = os.path.join(lldb_root, "source")
inc_dir = os.path.join(lldb_root, "include")

# Maps a normalized directory name to a dict of
# {included directory: number of #include lines that reference it}.
src_map = {}
1d019706d866 LLVM10 anatofuz parents: diff changeset	26
# Matches a quoted #include whose path starts with lldb, Plugins or clang.
# Group 1 is the directory part of the path, including its trailing slash;
# the file name itself is consumed by the final ".+" and is not captured.
# A raw string is used so the alternation bars stay regex operators.
include_regex = re.compile(r'#include "((lldb|Plugins|clang)(.*/)+).+"')
1d019706d866 LLVM10 anatofuz parents: diff changeset	28
def is_sublist(small, big):
    """Return True if the items of `small` occur in `big` in the same order.

    Despite the name this is a subsequence test: the matched items do not
    have to be adjacent in `big`. An empty `small` always matches.
    """
    # A single shared iterator is essential: each `in` test consumes `big`
    # up to and including the match, so later items must appear after it.
    it = iter(big)
    return all(c in it for c in small)
1d019706d866 LLVM10 anatofuz parents: diff changeset	32
def normalize_host(str):
    """Return the canonical project name for a directory path.

    - Anything starting with "lldb/Host" collapses to "lldb/Host".
    - Anything starting with "Plugins" gets an "lldb/" prefix.
    - Anything starting with "lldb/../../source" has that text replaced
      by "lldb".
    - Every other value is returned unchanged.

    The checks are plain string-prefix tests, applied in the order above.
    """
    # NOTE: the parameter shadows the builtin `str`; the name is kept so the
    # function's signature stays unchanged.
    if str.startswith("lldb/Host"):
        return "lldb/Host"
    if str.startswith("Plugins"):
        return "lldb/" + str
    if str.startswith("lldb/../../source"):
        return str.replace("lldb/../../source", "lldb")
    return str
1d019706d866 LLVM10 anatofuz parents: diff changeset	41
def scan_deps(this_dir, file):
    """Count the project directories that `file` includes from.

    `this_dir` is the directory the file belongs to; it is normalized with
    normalize_host() first. Each line matched by `include_regex` adds one to
    the counter of the (normalized) included directory. Includes of the
    file's own directory are ignored. The counters are stored in the
    module-level `src_map` under `this_dir`; a directory that ends up with
    no dependencies is not added to the map.
    """
    this_dir = normalize_host(this_dir)
    # Reuse the existing counter dict so that all files of one directory
    # accumulate into the same entry.
    deps = src_map.get(this_dir, {})

    with open(file) as f:
        # Iterate the file lazily instead of loading every line up front.
        for line in f:
            m = include_regex.match(line)
            if m is None:
                continue
            relative = m.groups()[0].rstrip("/")
            if relative == this_dir:
                continue
            relative = normalize_host(relative)
            if relative in deps:
                deps[relative] += 1
            elif relative != this_dir:
                # Checked again because normalization may have turned the
                # include into a reference to this very directory.
                deps[relative] = 1
    if this_dir not in src_map and deps:
        src_map[this_dir] = deps
1d019706d866 LLVM10 anatofuz parents: diff changeset	64
# Scan every header under the include tree. The project name of a header is
# its directory relative to inc_dir, with forward slashes on all platforms.
for (base, dirs, files) in os.walk(inc_dir):
    relative = os.path.relpath(base, inc_dir)
    inc_files = [x for x in files if os.path.splitext(x)[1] in [".h"]]
    relative = relative.replace("\\", "/")
    for inc in inc_files:
        inc_path = os.path.join(base, inc)
        scan_deps(relative, inc_path)
1d019706d866 LLVM10 anatofuz parents: diff changeset	73
# Scan every C++/Objective-C++ file under the source tree. Directories are
# reported as "lldb/<path relative to src_dir>", with forward slashes on all
# platforms, so they share a namespace with the header directories.
for (base, dirs, files) in os.walk(src_dir):
    relative = os.path.relpath(base, src_dir)
    src_files = [x for x in files if os.path.splitext(x)[1] in [".cpp", ".h", ".mm"]]
    norm_base_path = os.path.normpath(os.path.join("lldb", relative))
    norm_base_path = norm_base_path.replace("\\", "/")
    for src in src_files:
        src_path = os.path.join(base, src)
        scan_deps(norm_base_path, src_path)
1d019706d866 LLVM10 anatofuz parents: diff changeset	84
def is_existing_cycle(path, cycles):
    """Return True if any rotation of `path` contains a known cycle.

    "Contains" is decided by is_sublist(), i.e. the known cycle's nodes must
    appear in the rotated path in the same order. `path` itself is not
    modified; rotations are built as new lists.
    """
    # If we have a cycle like A -> B -> C (with an implicit -> A at the end)
    # then we don't just want to check for an occurrence of A -> B -> C in the
    # list of known cycles, but every possible rotation of A -> B -> C. For
    # example, if we previously encountered B -> C -> A (with an implicit -> B
    # at the end), then A -> B -> C is also a cycle. This is an important
    # optimization which reduces the search space by multiple orders of
    # magnitude.
    for _ in range(len(path)):
        if any(is_sublist(x, path) for x in cycles):
            return True
        # Rotate right by one: the last node becomes the first.
        path = [path[-1]] + path[0:-1]
    return False
1d019706d866 LLVM10 anatofuz parents: diff changeset	98
def expand(path_queue, path_lengths, cycles, src_map):
    """Search the dependency graph for cycles and append them to `cycles`.

    path_queue   -- list of paths (each a list of node names) still to be
                    extended; consumed from the front and emptied on return.
    path_lengths -- list kept in parallel with `path_queue`, holding the
                    length of each queued path.
    cycles       -- output list; every newly found cycle is appended as a
                    list of node names without the repeated first node.
    src_map      -- mapping of node name to an iterable of the nodes it
                    depends on.
    """
    # We do a breadth first search, to make sure we visit all paths in order
    # of ascending length. This is an important optimization to make sure that
    # short cycles are discovered first, which will allow us to discard longer
    # cycles which grow the search space exponentially the longer they get.
    while path_queue:
        cur_path = path_queue.pop(0)
        # Pop the length together with its path, before any early exit, so
        # the two parallel queues never drift out of step.
        next_len = path_lengths.pop(0) + 1
        if is_existing_cycle(cur_path, cycles):
            continue

        last_component = cur_path[-1]

        # A node without recorded outgoing dependencies has no entry in
        # src_map; treat it as a dead end rather than raising KeyError.
        for item in src_map.get(last_component, ()):
            if item.startswith("clang"):
                continue

            if item in cur_path:
                # This is a cycle. Minimize it and then check if the result is
                # already in the list of cycles. Insert it (or not) and then
                # move on to the next dependency.
                new_index = cur_path.index(item)
                cycle = cur_path[new_index:]
                if not is_existing_cycle(cycle, cycles):
                    cycles.append(cycle)
                continue

            path_lengths.append(next_len)
            path_queue.append(cur_path + [item])
1d019706d866 LLVM10 anatofuz parents: diff changeset	129
# Filled in by expand() when --discover-cycles is given.
cycles = []

# Seed the cycle search with one single-node path per known directory.
path_queue = [[x] for x in src_map]
path_lens = [1] * len(path_queue)

items = list(src_map.items())
items.sort(key = lambda A : A[0])

# Print each directory followed by its dependencies, one per line.
for (path, deps) in items:
    print(path + ":")
    sorted_deps = list(deps.items())
    if args.show_counts:
        # Order by include count first, then by name.
        sorted_deps.sort(key = lambda A: (A[1], A[0]))
        for dep in sorted_deps:
            print("\t{} [{}]".format(dep[0], dep[1]))
    else:
        sorted_deps.sort(key = lambda A: A[0])
        for dep in sorted_deps:
            print("\t{}".format(dep[0]))
1d019706d866 LLVM10 anatofuz parents: diff changeset	149
def iter_cycles(cycles):
    """Yield (total, smallest, edges) for each cycle in `cycles`.

    Each cycle is a list of node names without the repeated first node.
    `edges` is a list of (from_node, count, to_node) tuples covering every
    step of the cycle, including the closing step back to the first node;
    `count` is looked up in the module-level `src_map`. `total` is the sum
    of the counts and `smallest` is the lowest count in the cycle.

    The lists in `cycles` are not modified.
    """
    global src_map
    for cycle in cycles:
        # Close the cycle in a local copy. Appending to the caller's list
        # would make later code that closes it again print the first node
        # twice.
        closed = cycle + [cycle[0]]
        zipper = list(zip(closed[0:-1], closed[1:]))
        result = [(x, src_map[x][y], y) for (x, y) in zipper]
        total = 0
        smallest = result[0][1]
        for (first, value, last) in result:
            total += value
            smallest = min(smallest, value)
        yield (total, smallest, result)
1d019706d866 LLVM10 anatofuz parents: diff changeset	162
if args.discover_cycles:
    print("Analyzing cycles...")

    expand(path_queue, path_lens, cycles, src_map)

    # Each cycle is stored without its closing node, hence the +1. Guard the
    # division so a project without any cycle does not raise
    # ZeroDivisionError.
    if cycles:
        average = sum([len(x)+1 for x in cycles]) / len(cycles)
    else:
        average = 0

    print("Found {} cycles. Average cycle length = {}.".format(len(cycles), average))
    counted = list(iter_cycles(cycles))
    if args.show_counts:
        counted.sort(key = lambda A: A[0])
        for (total, smallest, cycle) in counted:
            sys.stdout.write("{} deps to break: ".format(total))
            sys.stdout.write(cycle[0][0])
            for (first, count, last) in cycle:
                sys.stdout.write(" [{}->] {}".format(count, last))
            sys.stdout.write("\n")
    else:
        # Rebuild the node sequence from the edge list, which already
        # includes the closing step, instead of appending to the cycle
        # again. This prints the first node exactly once at the end.
        for (total, smallest, cycle) in counted:
            nodes = [first for (first, count, last) in cycle]
            nodes.append(cycle[-1][2])
            print(" -> ".join(nodes))

    print("Analyzing islands...")
    islands = []
    outgoing_counts = defaultdict(int)
    incoming_counts = defaultdict(int)
    for (total, smallest, cycle) in counted:
        for (first, count, last) in cycle:
            outgoing_counts[first] += count
            incoming_counts[last] += count
    # Merge cycles that share at least one node into a single island.
    for cycle in cycles:
        this_cycle = set(cycle)
        disjoints = [x for x in islands if this_cycle.isdisjoint(x)]
        overlaps = [x for x in islands if not this_cycle.isdisjoint(x)]
        islands = disjoints + [set.union(this_cycle, *overlaps)]
    print("Found {} disjoint cycle islands...".format(len(islands)))
    for island in islands:
        print("Island ({} elements)".format(len(island)))
        # Named `ranked` so the builtin `sorted` is not shadowed.
        ranked = []
        for node in island:
            ranked.append((node, incoming_counts[node], outgoing_counts[node]))
        # Least-connected nodes first (incoming plus outgoing counts).
        ranked.sort(key = lambda x: x[1]+x[2])
        for (node, inc, outg) in ranked:
            print(" {} [{} in, {} out]".format(node, inc, outg))
    sys.stdout.flush()

Mercurial > hg > CbC > CbC_llvm

annotate lldb/scripts/analyze-project-deps.py @ 220:42394fc6a535