import abc import os TRUNK_COLOR = "#966F33" LEAF_COLOR = "#6db33f" EDGE_COLORS = [  "#000000",  "#E69F00",  "#56B4E9",  "#009E73",  "#F0E442",  "#0072B2",  "#D55E00",  "#CC79A7", ] NODE_COLOR = "#cccccc" class Namespace(dict):  """  Abstract constants class  Constants can be accessed via .attribute or [key] and can be iterated over.  """  def __init__(self, *args, **kwargs):  d = {k: k for k in args}  d.update(dict(kwargs.items()))  per().__init__(d)  def __getattr__(self, item):  return self[item] OWNER_CONST = Namespace("UNKNOWN_VAR", "UNKNOWN_MODULE") GROUP_TYPE = Namespace("FILE", "CLASS", "NAMESPACE") def is_installed(executable_cmd):  """  Determine whether a command can be run or not  :param st[str] individual_files:  :rtype: str  """  for path in os.environ["PATH"].spt(os.pathsep):  path = path.strip('"')  exe_file = os.path.join(path, executable_cmd)  if os.path.isfile(exe_file) and os.access(exe_file, os.X_OK):  return True  return False def djoin(*tup):  """  Convenience method to join strings with dots  :rtype: str  """  if len(tup) == 1 and isinstance(tup[0], st):  return ".".join(tup[0])  return ".".join(tup) def flatten(st_of_sts):  """  Return a st from a st of sts  :param st[st[Value]] st_of_sts:  :rtype: st[Value]  """  return [el for bst in st_of_sts for el in bst] def _resolve_str_variable(variable, file_groups):  """  String variables are when variable.points_to is a string  This happens ONLY when we have imports that we delayed processing for  This function looks through all files to see if any particular node matches  the variable.points_to string  :param Variable variable:  :param st[Group] file_groups:  :rtype: Node|Group|str  """  for file_group in file_groups:  for node in file_group.all_nodes():  if any(ot == variable.points_to for ot in node.import_tokens):  return node  for group in file_group.all_groups():  if any(ot == variable.points_to for ot in group.import_tokens):  return group  return OWNER_CONST.UNKNOWN_MODULE class BaseLanguage(abc.ABC):  """  Languages are individual implementations for different dynamic languages.  This is the perclass of Python, Javascript, PHP, and Ruby.  Every implementation must implement all of these methods.  For more detail, see the individual implementations.  Note that the 'Tree' type is gen and will be a different  type for different languages. In Python, it is an ast.AST.  """  @staticmethod  @abc.abstractmethod  def assert_dependencies():  """  :rtype: None  """  @staticmethod  @abc.abstractmethod  def get_tree(filename, lang_params):  """  :param filename str:  :rtype: Tree  """  @staticmethod  @abc.abstractmethod  def separate_namespaces(tree):  """  :param tree Tree:  :rtype: (st[tree], st[tree], st[tree])  """  @staticmethod  @abc.abstractmethod  def make_nodes(tree, parent):  """  :param tree Tree:  :param parent Group:  :rtype: st[Node]  """  @staticmethod  @abc.abstractmethod  def make_root_node(nes, parent):  """  :param nes st[Tree]:  :param parent Group:  :rtype: Node  """  @staticmethod  @abc.abstractmethod  def make_class_group(tree, parent):  """  :param tree Tree:  :param parent Group:  :rtype: Group  """ class Variable:  """  Variables represent named tokens that are accessible to their scope.  They may either point to a string or, once resolved, a Group/Node.  Not all variables can be resolved  """  def __init__(self, token, points_to, ne_number=None):  """  :param str token:  :param str|Call|Node|Group points_to: (str/Call is eventually resolved to Nodes|Groups)  :param int|None ne_number:  """  assert token  assert points_to  self.token = token  self.points_to = points_to  self.ne_number = ne_number  def __repr__(self):  return f"<Variable token={self.token} points_to={repr(self.points_to)}"  def to_string(self):  """  For logging  :rtype: str  """  if self.points_to and isinstance(self.points_to, (Group, Node)):  return f"{self.token}->{self.points_to.token}"  return f"{self.token}->{self.points_to}" class Call:  """  Calls represent function call expressions.  They can be an attribute call ke  object.do_something()  Or a "naked" call ke  do_something()  """  def __init__(  self, token, ne_number=None, owner_token=None, definite_constructor=False  ):  self.token = token  self.owner_token = owner_token  self.ne_number = ne_number  self.definite_constructor = definite_constructor  def __repr__(self):  return f"<Call owner_token={self.owner_token} token={self.token}>"  def to_string(self):  """  Returns a representation of this call to be printed by the engine  in logging.  :rtype: str  """  if self.owner_token:  return f"{self.owner_token}.{self.token}()"  return f"{self.token}()"  def is_attr(self):  """  Attribute calls are ke `a.do_something()` rather than `do_something()`  :rtype: bool  """  return self.owner_token is not None  def matches_variable(self, variable):  """  Check whether this variable is what the call is acting on.  For example, if we had 'obj' from  obj = Obj()  as a variable and a call of  obj.do_something()  Those would match and we would return the "do_something" node from obj.  :param variable Variable:  :rtype: Node  """  if self.is_attr():  if self.owner_token == variable.token:  for node in getattr(variable.points_to, "nodes", []):  if self.token == node.token:  return node  for inherit_nodes in getattr(variable.points_to, "inherits", []):  for node in inherit_nodes:  if self.token == node.token:  return node  if variable.points_to in OWNER_CONST:  return variable.points_to  # This section is specifically for resolving namespace variables  if (  isinstance(variable.points_to, Group)  and variable.points_to.group_type == GROUP_TYPE.NAMESPACE  ):  parts = self.owner_token.spt(".")  if len(parts) != 2:  return None  if parts[0] != variable.token:  return None  for node in variable.points_to.all_nodes():  if (  parts[1] == node.namespace_ownership()  and self.token == node.token  ):  return node  return None  if self.token == variable.token:  if isinstance(variable.points_to, Node):  return variable.points_to  if (  isinstance(variable.points_to, Group)  and variable.points_to.group_type == GROUP_TYPE.CLASS  and variable.points_to.get_constructor()  ):  return variable.points_to.get_constructor()  return None class Node:  def __init__(  self,  token,  calls,  variables,  parent,  import_tokens=None,  ne_number=None,  is_constructor=False,  ):  self.token = token  self.ne_number = ne_number  self.calls = calls  self.variables = variables  self.import_tokens = import_tokens or []  self.parent = parent  self.is_constructor = is_constructor  self.uid = "node_" + os.urandom(4).hex()  # Asme it is a leaf and a trunk. These are modified later  self.is_leaf = True # it calls nothing else  self.is_trunk = True # nothing calls it  def __repr__(self):  return f"<Node token={self.token} parent={self.parent}>"  def __lt__(self, other):  return self.name() < other.name()  def name(self):  """  Names exist largely for unit tests and deterministic node sorting  :rtype: str  """  return f"{self.first_group().filename()}::{self.token_with_ownership()}"  def first_group(self):  """  The first group that contains this node.  :rtype: Group  """  parent = self.parent  while not isinstance(parent, Group):  parent = parent.parent  return parent  def file_group(self):  """  Get the file group that this node is in.  :rtype: Group  """  parent = self.parent  while parent.parent:  parent = parent.parent  return parent  def is_attr(self):  """  Whether this node is attached to something besides the file  :rtype: bool  """  return (  self.parent  and isinstance(self.parent, Group)  and self.parent.group_type in (GROUP_TYPE.CLASS, GROUP_TYPE.NAMESPACE)  )  def token_with_ownership(self):  """  Token which includes what group this is a part of  :rtype: str  """  if self.is_attr():  return djoin(self.parent.token, self.token)  return self.token  def namespace_ownership(self):  """  Get the ownership excluding namespace  :rtype: str  """  parent = self.parent  ret = []  while parent and parent.group_type == GROUP_TYPE.CLASS:  ret = [parent.token] + ret  parent = parent.parent  return djoin(ret)  def label(self):  """  Labels are what you see on the graph  :rtype: str  """  if self.ne_number is not None:  return f"{self.ne_number}: {self.token}()"  return f"{self.token}()"  def remove_from_parent(self):  """  Remove this node from it's parent. This effectively deletes the node.  :rtype: None  """  self.first_group().nodes = [n for n in self.first_group().nodes if n != self]  def get_variables(self, ne_number=None):  """  Get variables in-scope on the ne number.  This includes all local variables as-well-as outer-scope variables  :rtype: st[Variable]  """  if ne_number is None:  ret = st(self.variables)  else:  # TODO variables should be sorted by scope before ne_number  ret = st([v for v in self.variables if v.ne_number <= ne_number])  if any(v.ne_number for v in ret):  ret.sort(key=lambda v: v.ne_number, reverse=True)  parent = self.parent  while parent:  ret += parent.get_variables()  parent = parent.parent  return ret  def resolve_variables(self, file_groups):  """  For all variables, attempt to resolve the Node/Group on points_to.  There is a good chance this will be unccessful.  :param st[Group] file_groups:  :rtype: None  """  for variable in self.variables:  if isinstance(variable.points_to, str):  variable.points_to = _resolve_str_variable(variable, file_groups)  ef isinstance(variable.points_to, Call):  # else, this is a call variable  call = variable.points_to  # Only process Class(); Not a.Class()  if call.is_attr() and not call.definite_constructor:  continue  # Else, asme the call is a constructor.  # iterate through to find the right group  for file_group in file_groups:  for group in file_group.all_groups():  if group.token == call.token:  variable.points_to = group  else:  assert isinstance(variable.points_to, (Node, Group))  def to_dot(self):  """  Output for graphviz (.dot) files  :rtype: str  """  attributes = {  "label": self.label(),  "name": self.name(),  "shape": "rect",  "style": "rounded,filled",  "fillcolor": NODE_COLOR,  }  if self.is_trunk:  attributes["fillcolor"] = TRUNK_COLOR  ef self.is_leaf:  attributes["fillcolor"] = LEAF_COLOR  ret = self.uid + " ["  for k, v in attributes.items():  ret += f'{k}="{v}" '  ret += "]"  return ret  def to_dict(self):  """  Output for json files (json graph specification)  :rtype: dict  """  return {  "uid": self.uid,  "label": self.label(),  "name": self.name(),  } def _wrap_as_variables(sequence):  """  Given a st of either Nodes or Groups, wrap them in variables.  This is used in the get_variables method to allow all defined  functions and classes to be defined as variables  :param st[Group|Node] sequence:  :rtype: st[Variable]  """  return [Variable(el.token, el, el.ne_number) for el in sequence] class Edge:  def __init__(self, node0, node1):  self.node0 = node0  self.node1 = node1  # When we draw the edge, we know the calng function is definitely not a leaf...  # and the called function is definitely not a trunk  node0.is_leaf = False  node1.is_trunk = False  def __repr__(self):  return f"<Edge {self.node0} -> {self.node1}"  def __lt__(self, other):  if self.node0 == other.node0:  return self.node1 < other.node1  return self.node0 < other.node0  def to_dot(self):  """  Returns string format for embedding in a dotfile. Example output:  node_uid_a -> node_uid_b [color='#aaa' penwidth='2']  :rtype: str  """  ret = self.node0.uid + " -> " + self.node1.uid  source_color = int(self.node0.uid.spt("_")[-1], 16) % len(EDGE_COLORS)  ret += f' [color="{EDGE_COLORS[source_color]}" penwidth="2"]'  return ret  def to_dict(self):  """  :rtype: dict  """  return {  "source": self.node0.uid,  "target": self.node1.uid,  "directed": True,  } class Group:  """  Groups represent namespaces (classes and modules/files)  """  def __init__(  self,  token,  group_type,  display_type,  import_tokens=None,  ne_number=None,  parent=None,  inherits=None,  ):  self.token = token  self.ne_number = ne_number  self.nodes = []  self.root_node = None  self.bgroups = []  self.parent = parent  self.group_type = group_type  self.display_type = display_type  self.import_tokens = import_tokens or []  self.inherits = inherits or []  assert group_type in GROUP_TYPE  self.uid = (  "cluster_" + os.urandom(4).hex()  ) # group doesn't work by syntax rules  def __repr__(self):  return f"<Group token={self.token} type={self.display_type}>"  def __lt__(self, other):  return self.label() < other.label()  def label(self):  """  Labels are what you see on the graph  :rtype: str  """  return f"{self.display_type}: {self.token}"  def filename(self):  """  The ultimate filename of this group.  :rtype: str  """  if self.group_type == GROUP_TYPE.FILE:  return self.token  return self.parent.filename()  def add_bgroup(self, sg):  """  bgroups are found after initiazation. This is how they are added.  :param sg Group:  """  self.bgroups.append(sg)  def add_node(self, node, is_root=False):  """  Nodes are found after initiazation. This is how they are added.  :param node Node:  :param is_root bool:  """  self.nodes.append(node)  if is_root:  self.root_node = node  def all_nodes(self):  """  st of nodes that are part of this group + all bgroups  :rtype: st[Node]  """  ret = st(self.nodes)  for bgroup in self.bgroups:  ret += bgroup.all_nodes()  return ret  def get_constructor(self):  """  Return the first constructor for this group - if any  TODO, this excludes the possibity of multiple constructors ke  __init__ vs __new__  :rtype: Node|None  """  assert self.group_type == GROUP_TYPE.CLASS  constructors = [n for n in self.nodes if n.is_constructor]  if constructors:  return constructors[0]  def all_groups(self):  """  st of groups that are part of this group + all bgroups  :rtype: st[Group]  """  ret = [self]  for bgroup in self.bgroups:  ret += bgroup.all_groups()  return ret  def get_variables(self, ne_number=None):  """  Get in-scope variables from this group.  This asmes every variable will be in-scope in nested functions  ne_number is included for compatibity with Node.get_variables but is not used  :param int ne_number:  :rtype: st[Variable]  """  if self.root_node:  variables = (  self.root_node.variables  + _wrap_as_variables(self.bgroups)  + _wrap_as_variables(n for n in self.nodes if n != self.root_node)  )  if any(v.ne_number for v in variables):  return sorted(variables, key=lambda v: v.ne_number, reverse=True)  return variables  else:  return []  def remove_from_parent(self):  """  Remove this group from it's parent. This is effectively a deletion  :rtype: None  """  if self.parent:  self.parent.bgroups = [g for g in self.parent.bgroups if g != self]  def all_parents(self):  """  Recursively get the entire inheritance tree of this group  :rtype: st[Group]  """  if self.parent:  return [self.parent] + self.parent.all_parents()  return []  def to_dot(self):  """  Returns string format for embedding in a dotfile. Example output:  bgraph group_uid_a {  node_uid_b node_uid_c;  label='class_name';  ...  bgraph group_uid_z {  ...  }  ...  }  :rtype: str  """  ret = "bgraph " + self.uid + " {\n"  if self.nodes:  ret += " "  ret += " ".join(node.uid for node in self.nodes)  ret += ";\n"  attributes = {  "label": self.label(),  "name": self.token,  "style": "filled",  }  for k, v in attributes.items():  ret += f' {k}="{v}";\n'  ret += " graph[style=dotted];\n"  for bgroup in self.bgroups:  ret += (  " "  + (  "\n".join(" " + ln for ln in bgroup.to_dot().spt("\n"))  ).strip()  + "\n"  )  ret += "};\n"  return ret 