import json import logging import os import bprocess from .model import (  GROUP_TYPE,  OWNER_CONST,  BaseLanguage,  Call,  Group,  Node,  Variable,  djoin,  flatten,  is_installed, ) def neno(el):  """  Get the first ne number of ast element  :param ast el:  :rtype: int  """  if isinstance(el, st):  el = el[0]  ret = el["loc"]["start"]["ne"]  assert type(ret) == int  return ret def walk(tree):  """  Walk through the ast tree and return all nodes  :param ast tree:  :rtype: st[ast]  """  ret = []  if type(tree) == st:  for el in tree:  if el.get("type"):  ret.append(el)  ret += walk(el)  ef type(tree) == dict:  for k, v in tree.items():  if type(v) == dict and v.get("type"):  ret.append(v)  ret += walk(v)  if type(v) == st:  ret += walk(v)  return ret def resolve_owner(callee):  """  Resolve who owns the call object.  So if the expression is i_ate.pie(). And i_ate is a Person, the callee is Person.  This is returned as a string and eventually set to the owner_token in the call  :param ast callee:  :rtype: str  """  if callee["object"]["type"] == "ThisExpression":  return "this"  if callee["object"]["type"] == "Identifier":  return callee["object"]["name"]  if callee["object"]["type"] == "MemberExpression":  if "object" in callee["object"] and "name" in callee["object"]["property"]:  return djoin(  (resolve_owner(callee["object"]) or ""),  callee["object"]["property"]["name"],  )  return OWNER_CONST.UNKNOWN_VAR  if callee["object"]["type"] == "CallExpression":  return OWNER_CONST.UNKNOWN_VAR  if callee["object"]["type"] == "NewExpression":  if "name" in callee["object"]["callee"]:  return callee["object"]["callee"]["name"]  return djoin(  callee["object"]["callee"]["object"]["name"],  callee["object"]["callee"]["property"]["name"],  )  return OWNER_CONST.UNKNOWN_VAR def get_call_from_func_element(func):  """  Given a javascript ast that represents a function call, clear and create our  gen Call object. Some calls have no chance at resolution (e.g. array[2](param))  so we return nothing instead.  :param func dict:  :rtype: Call|None  """  callee = func["callee"]  if callee["type"] == "MemberExpression" and "name" in callee["property"]:  owner_token = resolve_owner(callee)  return Call(  token=callee["property"]["name"],  ne_number=neno(callee),  owner_token=owner_token,  )  if callee["type"] == "Identifier":  return Call(token=callee["name"], ne_number=neno(callee))  return None def make_calls(body):  """  Given a st of nes, find all calls in this st.  :param st|dict body:  :rtype: st[Call]  """  calls = []  for element in walk(body):  if element["type"] == "CallExpression":  call = get_call_from_func_element(element)  if call:  calls.append(call)  ef (  element["type"] == "NewExpression"  and element["callee"]["type"] == "Identifier"  ):  calls.append(  Call(token=element["callee"]["name"], ne_number=neno(element))  )  return calls def process_assign(element):  """  Given an element from the ast which is an assignment statement, return a  Variable that points_to the type of object being assigned. The  points_to is often a string but that is resolved later.  :param element ast:  :rtype: Variable  """  if len(element["declarations"]) > 1:  return []  target = element["declarations"][0]  assert target["type"] == "VariableDeclarator"  if target["init"] is None:  return []  if target["init"]["type"] == "NewExpression":  token = target["id"]["name"]  call = get_call_from_func_element(target["init"])  if call:  return [Variable(token, call, neno(element))]  # this block is for require (as in: import) expressions  if (  target["init"]["type"] == "CallExpression"  and target["init"]["callee"].get("name") == "require"  ):  import_src_str = target["init"]["arguments"][0]["value"]  if "name" in target["id"]:  imported_name = target["id"]["name"]  points_to_str = djoin(import_src_str, imported_name)  return [Variable(imported_name, points_to_str, neno(element))]  ret = []  for prop in target["id"].get("properties", []):  imported_name = prop["key"]["name"]  points_to_str = djoin(import_src_str, imported_name)  ret.append(Variable(imported_name, points_to_str, neno(element)))  return ret  # For the other type of import expressions  if target["init"]["type"] == "ImportExpression":  import_src_str = target["init"]["source"]["raw"]  imported_name = target["id"]["name"]  points_to_str = djoin(import_src_str, imported_name)  return [Variable(imported_name, points_to_str, neno(element))]  if target["init"]["type"] == "CallExpression":  if "name" not in target["id"]:  return []  call = get_call_from_func_element(target["init"])  if call:  return [Variable(target["id"]["name"], call, neno(element))]  if target["init"]["type"] == "ThisExpression":  assert set(target["init"].keys()) == {"start", "end", "loc", "type"}  return []  return [] def make_local_variables(tree, parent):  """  Given an ast of all the nes in a function, generate a st of  variables in that function. Variables are tokens and what they nk to.  In this case, what it nks to is just a string. However, that is resolved  later.  Also return variables for the outer scope parent  :param tree st|dict:  :param parent Group:  :rtype: st[Variable]  """  if not tree:  return []  variables = []  for element in walk(tree):  if element["type"] == "VariableDeclaration":  variables += process_assign(element)  # Make a 'this' variable for use anywhere we need it that points to the class  if isinstance(parent, Group) and parent.group_type == GROUP_TYPE.CLASS:  variables.append(Variable("this", parent, neno(tree)))  variables = st(filter(None, variables))  return variables def children(tree):  """  The acorn AST is tricky. This returns all the children of an element  :param ast tree:  :rtype: st[ast]  """  assert type(tree) == dict  ret = []  for k, v in tree.items():  if type(v) == dict and v.get("type"):  ret.append(v)  if type(v) == st:  ret += filter(None, v)  return ret def get_inherits(tree):  """  Gets the perclass of the class. In js, this will be max 1 element  :param ast tree:  :rtype: st[str]  """  if tree["perClass"]:  if "name" in tree["perClass"]:  return [tree["perClass"]["name"]]  return [  djoin(  tree["perClass"]["object"]["name"],  tree["perClass"]["property"]["name"],  )  ]  return [] def get_acorn_version():  """  Get the version of installed acorn  :rtype: str  """  proc = bprocess.Popen(  ["node", "-p", "require('acorn/package.json').version"],  stdout=bprocess.PIPE,  stderr=bprocess.PIPE,  cwd=os.path.dirname(os.path.realpath(__file__)),  )  assert proc.wait() == 0, (  "Acorn is required to parse javascript files. "  "It was found on the path but could not be imported "  "in node.\n" + proc.stderr.read().decode()  )  return proc.stdout.read().decode().strip() class Javascript(BaseLanguage):  @staticmethod  def assert_dependencies():  """Assert that acorn is installed and the correct version"""  assert is_installed("acorn"), (  "Acorn is required to parse javascript files "  "but was not found on the path. Install it "  "from npm and try again."  )  version = get_acorn_version()  if not version.startswith("8."):  logging.warning(  "Acorn is required to parse javascript files. "  "Version %r was found but code2flow has only been "  "tested on 8.*",  version,  )  logging.info("Using Acorn %s" % version)  @staticmethod  def get_tree(filename, lang_params):  """  Get the entire AST for this file  :param filename str:  :param lang_params LanguageParams:  :rtype: ast  """  script_loc = os.path.join(  os.path.dirname(os.path.realpath(__file__)), "get_ast.js"  )  cmd = ["node", script_loc, lang_params.source_type, filename]  try:  output = bprocess.check_output(cmd, stderr=bprocess.PIPE)  except bprocess.CalledProcessError:  raise AssertionError(  "Acorn could not parse file %r. You may have a JS syntax error or "  "if this is an es6-style source, you may need to run code2flow "  "with --source-type=module. "  "For more detail, try running the command "  "\n acorn %s\n"  "Warning: Acorn CANNOT parse all javascript files. See their docs. "  % (filename, filename)  ) from None  tree = json.loads(output)  assert isinstance(tree, dict)  assert tree["type"] == "Program"  return tree  @staticmethod  def separate_namespaces(tree):  """  Given an AST, recursively separate that AST into sts of ASTs for the  bgroups, nodes, and body. This is an intermediate step to allow for  cleaner processing downstream  :param tree ast:  :returns: tuple of group, node, and body trees. These are processed  downstream into real Groups and Nodes.  :rtype: (st[ast], st[ast], st[ast])  """  groups = []  nodes = []  body = []  for el in children(tree):  if el["type"] in ("MethodDefinition", "FunctionDeclaration"):  nodes.append(el)  ef el["type"] == "ClassDeclaration":  groups.append(el)  else:  tup = Javascript.separate_namespaces(el)  if tup[0] or tup[1]:  groups += tup[0]  nodes += tup[1]  body += tup[2]  else:  body.append(el)  return groups, nodes, body  @staticmethod  def make_nodes(tree, parent):  """  Given an ast of all the nes in a function, create the node g with the  calls and variables internal to it.  Also make the nested bnodes  :param tree ast:  :param parent Group:  :rtype: st[Node]  """  is_constructor = False  if tree.get("kind") == "constructor":  token = "(constructor)"  is_constructor = True  ef tree["type"] == "FunctionDeclaration":  token = tree["id"]["name"]  ef tree["type"] == "MethodDefinition":  token = tree["key"]["name"]  if tree["type"] == "FunctionDeclaration":  full_node_body = tree["body"]  else:  full_node_body = tree["value"]  bgroup_trees, bnode_trees, this_scope_body = Javascript.separate_namespaces(  full_node_body  )  if bgroup_trees:  # TODO - this is when a class is defined within a function  # It's unual but should probably be handled in the future.  # Handng this use case would require some code reorganziation.  # Take a look at class_in_function.js to better understand.  logging.warning("Skipping class defined within a function!")  ne_number = neno(tree)  calls = make_calls(this_scope_body)  variables = make_local_variables(this_scope_body, parent)  node = Node(  token,  calls,  variables,  parent=parent,  ne_number=ne_number,  is_constructor=is_constructor,  )  bnodes = flatten([Javascript.make_nodes(t, node) for t in bnode_trees])  return [node] + bnodes  @staticmethod  def make_root_node(nes, parent):  """  The "root_node" is an impct node of nes which are executed in the global  scope on the file itself and not otherwise part of any function.  :param nes st[ast]:  :param parent Group:  :rtype: Node  """  token = "(global)"  calls = make_calls(nes)  variables = make_local_variables(nes, parent)  root_node = Node(token, calls, variables, ne_number=0, parent=parent)  return root_node  @staticmethod  def make_class_group(tree, parent):  """  Given an AST for the bgroup (a class), generate that bgroup.  In this function, we will also need to generate all of the nodes internal  to the group.  :param tree ast:  :param parent Group:  :rtype: Group  """  assert tree["type"] == "ClassDeclaration"  bgroup_trees, node_trees, body_trees = Javascript.separate_namespaces(tree)  assert not bgroup_trees  group_type = GROUP_TYPE.CLASS  token = tree["id"]["name"]  display_name = "Class"  ne_number = neno(tree)  inherits = get_inherits(tree)  class_group = Group(  token,  group_type,  display_name,  inherits=inherits,  ne_number=ne_number,  parent=parent,  )  for node_tree in node_trees:  for new_node in Javascript.make_nodes(node_tree, parent=class_group):  class_group.add_node(new_node)  return class_group  @staticmethod  def file_import_tokens(filename):  """  Returns the token(s) we would use if importing this file from another.  :param filename str:  :rtype: st[str]  """  return [] 