123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208 |
- #! /usr/bin/python
- import argparse
- import ast
- import os
- import re
- import sys
- import yaml
- class DefinitionVisitor(ast.NodeVisitor):
- def __init__(self):
- super().__init__()
- self.functions = {}
- self.classes = {}
- self.names = {}
- self.attrs = set()
- self.definitions = {
- "def": self.functions,
- "class": self.classes,
- "names": self.names,
- "attrs": self.attrs,
- }
- def visit_Name(self, node):
- self.names.setdefault(type(node.ctx).__name__, set()).add(node.id)
- def visit_Attribute(self, node):
- self.attrs.add(node.attr)
- for child in ast.iter_child_nodes(node):
- self.visit(child)
- def visit_ClassDef(self, node):
- visitor = DefinitionVisitor()
- self.classes[node.name] = visitor.definitions
- for child in ast.iter_child_nodes(node):
- visitor.visit(child)
- def visit_FunctionDef(self, node):
- visitor = DefinitionVisitor()
- self.functions[node.name] = visitor.definitions
- for child in ast.iter_child_nodes(node):
- visitor.visit(child)
- def non_empty(defs):
- functions = {name: non_empty(f) for name, f in defs["def"].items()}
- classes = {name: non_empty(f) for name, f in defs["class"].items()}
- result = {}
- if functions:
- result["def"] = functions
- if classes:
- result["class"] = classes
- names = defs["names"]
- uses = []
- for name in names.get("Load", ()):
- if name not in names.get("Param", ()) and name not in names.get("Store", ()):
- uses.append(name)
- uses.extend(defs["attrs"])
- if uses:
- result["uses"] = uses
- result["names"] = names
- result["attrs"] = defs["attrs"]
- return result
- def definitions_in_code(input_code):
- input_ast = ast.parse(input_code)
- visitor = DefinitionVisitor()
- visitor.visit(input_ast)
- definitions = non_empty(visitor.definitions)
- return definitions
- def definitions_in_file(filepath):
- with open(filepath) as f:
- return definitions_in_code(f.read())
- def defined_names(prefix, defs, names):
- for name, funcs in defs.get("def", {}).items():
- names.setdefault(name, {"defined": []})["defined"].append(prefix + name)
- defined_names(prefix + name + ".", funcs, names)
- for name, funcs in defs.get("class", {}).items():
- names.setdefault(name, {"defined": []})["defined"].append(prefix + name)
- defined_names(prefix + name + ".", funcs, names)
- def used_names(prefix, item, defs, names):
- for name, funcs in defs.get("def", {}).items():
- used_names(prefix + name + ".", name, funcs, names)
- for name, funcs in defs.get("class", {}).items():
- used_names(prefix + name + ".", name, funcs, names)
- path = prefix.rstrip(".")
- for used in defs.get("uses", ()):
- if used in names:
- if item:
- names[item].setdefault("uses", []).append(used)
- names[used].setdefault("used", {}).setdefault(item, []).append(path)
- if __name__ == "__main__":
- parser = argparse.ArgumentParser(description="Find definitions.")
- parser.add_argument(
- "--unused", action="store_true", help="Only list unused definitions"
- )
- parser.add_argument(
- "--ignore", action="append", metavar="REGEXP", help="Ignore a pattern"
- )
- parser.add_argument(
- "--pattern", action="append", metavar="REGEXP", help="Search for a pattern"
- )
- parser.add_argument(
- "directories",
- nargs="+",
- metavar="DIR",
- help="Directories to search for definitions",
- )
- parser.add_argument(
- "--referrers",
- default=0,
- type=int,
- help="Include referrers up to the given depth",
- )
- parser.add_argument(
- "--referred",
- default=0,
- type=int,
- help="Include referred down to the given depth",
- )
- parser.add_argument(
- "--format", default="yaml", help="Output format, one of 'yaml' or 'dot'"
- )
- args = parser.parse_args()
- definitions = {}
- for directory in args.directories:
- for root, _, files in os.walk(directory):
- for filename in files:
- if filename.endswith(".py"):
- filepath = os.path.join(root, filename)
- definitions[filepath] = definitions_in_file(filepath)
- names = {}
- for filepath, defs in definitions.items():
- defined_names(filepath + ":", defs, names)
- for filepath, defs in definitions.items():
- used_names(filepath + ":", None, defs, names)
- patterns = [re.compile(pattern) for pattern in args.pattern or ()]
- ignore = [re.compile(pattern) for pattern in args.ignore or ()]
- result = {}
- for name, definition in names.items():
- if patterns and not any(pattern.match(name) for pattern in patterns):
- continue
- if ignore and any(pattern.match(name) for pattern in ignore):
- continue
- if args.unused and definition.get("used"):
- continue
- result[name] = definition
- referrer_depth = args.referrers
- referrers = set()
- while referrer_depth:
- referrer_depth -= 1
- for entry in result.values():
- for used_by in entry.get("used", ()):
- referrers.add(used_by)
- for name, definition in names.items():
- if name not in referrers:
- continue
- if ignore and any(pattern.match(name) for pattern in ignore):
- continue
- result[name] = definition
- referred_depth = args.referred
- referred = set()
- while referred_depth:
- referred_depth -= 1
- for entry in result.values():
- for uses in entry.get("uses", ()):
- referred.add(uses)
- for name, definition in names.items():
- if name not in referred:
- continue
- if ignore and any(pattern.match(name) for pattern in ignore):
- continue
- result[name] = definition
- if args.format == "yaml":
- yaml.dump(result, sys.stdout, default_flow_style=False)
- elif args.format == "dot":
- print("digraph {")
- for name, entry in result.items():
- print(name)
- for used_by in entry.get("used", ()):
- if used_by in result:
- print(used_by, "->", name)
- print("}")
- else:
- raise ValueError("Unknown format %r" % (args.format))
|