summary refs log blame commit diff
path: root/scripts-dev/definitions.py
blob: 313860df139aa16a1ef6a4037db892d0735838da (plain) (tree)
1
2
3
4
5
6
7
8
9
10
                  
               
          


          
           
 
                                         
                          



                            


                                  






















                                                                          
                                                                       
               
                 
                                 
               
                                 
             
                                                                                     
                             
                              
            

                                   















                                                
                                                                                
                                                        
                                                                                

                                                        
                                          
                                                   
                                                           
 
                                                     
                                                           
 
                                     
                         
                    
                                                                                
 
                          
 
                                                                     





                                                                              
                                                                                   
                        
                      
                  
                                                     
     
                        


                                                       
                        


                                                        
                        
                                                                                
     
                              
                    




                                                                         




                                                  
                                                     
 







                                                                             
                                                  

                                 



                                     
                                                 
                                              
                                     



                                                                         






                                              
                                    



                                                                         
                             
                                                               
                              
                          
                                          
                       
                                                 
                                              
                                                             
#! /usr/bin/python

import argparse
import ast
import os
import re
import sys

import yaml


class DefinitionVisitor(ast.NodeVisitor):
    def __init__(self):
        super().__init__()
        self.functions = {}
        self.classes = {}
        self.names = {}
        self.attrs = set()
        self.definitions = {
            "def": self.functions,
            "class": self.classes,
            "names": self.names,
            "attrs": self.attrs,
        }

    def visit_Name(self, node):
        self.names.setdefault(type(node.ctx).__name__, set()).add(node.id)

    def visit_Attribute(self, node):
        self.attrs.add(node.attr)
        for child in ast.iter_child_nodes(node):
            self.visit(child)

    def visit_ClassDef(self, node):
        visitor = DefinitionVisitor()
        self.classes[node.name] = visitor.definitions
        for child in ast.iter_child_nodes(node):
            visitor.visit(child)

    def visit_FunctionDef(self, node):
        visitor = DefinitionVisitor()
        self.functions[node.name] = visitor.definitions
        for child in ast.iter_child_nodes(node):
            visitor.visit(child)


def non_empty(defs):
    functions = {name: non_empty(f) for name, f in defs["def"].items()}
    classes = {name: non_empty(f) for name, f in defs["class"].items()}
    result = {}
    if functions:
        result["def"] = functions
    if classes:
        result["class"] = classes
    names = defs["names"]
    uses = []
    for name in names.get("Load", ()):
        if name not in names.get("Param", ()) and name not in names.get("Store", ()):
            uses.append(name)
    uses.extend(defs["attrs"])
    if uses:
        result["uses"] = uses
    result["names"] = names
    result["attrs"] = defs["attrs"]
    return result


def definitions_in_code(input_code):
    input_ast = ast.parse(input_code)
    visitor = DefinitionVisitor()
    visitor.visit(input_ast)
    definitions = non_empty(visitor.definitions)
    return definitions


def definitions_in_file(filepath):
    with open(filepath) as f:
        return definitions_in_code(f.read())


def defined_names(prefix, defs, names):
    for name, funcs in defs.get("def", {}).items():
        names.setdefault(name, {"defined": []})["defined"].append(prefix + name)
        defined_names(prefix + name + ".", funcs, names)

    for name, funcs in defs.get("class", {}).items():
        names.setdefault(name, {"defined": []})["defined"].append(prefix + name)
        defined_names(prefix + name + ".", funcs, names)


def used_names(prefix, item, defs, names):
    for name, funcs in defs.get("def", {}).items():
        used_names(prefix + name + ".", name, funcs, names)

    for name, funcs in defs.get("class", {}).items():
        used_names(prefix + name + ".", name, funcs, names)

    path = prefix.rstrip(".")
    for used in defs.get("uses", ()):
        if used in names:
            if item:
                names[item].setdefault("uses", []).append(used)
            names[used].setdefault("used", {}).setdefault(item, []).append(path)


if __name__ == "__main__":

    parser = argparse.ArgumentParser(description="Find definitions.")
    parser.add_argument(
        "--unused", action="store_true", help="Only list unused definitions"
    )
    parser.add_argument(
        "--ignore", action="append", metavar="REGEXP", help="Ignore a pattern"
    )
    parser.add_argument(
        "--pattern", action="append", metavar="REGEXP", help="Search for a pattern"
    )
    parser.add_argument(
        "directories",
        nargs="+",
        metavar="DIR",
        help="Directories to search for definitions",
    )
    parser.add_argument(
        "--referrers",
        default=0,
        type=int,
        help="Include referrers up to the given depth",
    )
    parser.add_argument(
        "--referred",
        default=0,
        type=int,
        help="Include referred down to the given depth",
    )
    parser.add_argument(
        "--format", default="yaml", help="Output format, one of 'yaml' or 'dot'"
    )
    args = parser.parse_args()

    definitions = {}
    for directory in args.directories:
        for root, dirs, files in os.walk(directory):
            for filename in files:
                if filename.endswith(".py"):
                    filepath = os.path.join(root, filename)
                    definitions[filepath] = definitions_in_file(filepath)

    names = {}
    for filepath, defs in definitions.items():
        defined_names(filepath + ":", defs, names)

    for filepath, defs in definitions.items():
        used_names(filepath + ":", None, defs, names)

    patterns = [re.compile(pattern) for pattern in args.pattern or ()]
    ignore = [re.compile(pattern) for pattern in args.ignore or ()]

    result = {}
    for name, definition in names.items():
        if patterns and not any(pattern.match(name) for pattern in patterns):
            continue
        if ignore and any(pattern.match(name) for pattern in ignore):
            continue
        if args.unused and definition.get("used"):
            continue
        result[name] = definition

    referrer_depth = args.referrers
    referrers = set()
    while referrer_depth:
        referrer_depth -= 1
        for entry in result.values():
            for used_by in entry.get("used", ()):
                referrers.add(used_by)
        for name, definition in names.items():
            if name not in referrers:
                continue
            if ignore and any(pattern.match(name) for pattern in ignore):
                continue
            result[name] = definition

    referred_depth = args.referred
    referred = set()
    while referred_depth:
        referred_depth -= 1
        for entry in result.values():
            for uses in entry.get("uses", ()):
                referred.add(uses)
        for name, definition in names.items():
            if name not in referred:
                continue
            if ignore and any(pattern.match(name) for pattern in ignore):
                continue
            result[name] = definition

    if args.format == "yaml":
        yaml.dump(result, sys.stdout, default_flow_style=False)
    elif args.format == "dot":
        print("digraph {")
        for name, entry in result.items():
            print(name)
            for used_by in entry.get("used", ()):
                if used_by in result:
                    print(used_by, "->", name)
        print("}")
    else:
        raise ValueError("Unknown format %r" % (args.format))