You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

parser.py 22 kB

5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609
  1. # This is the Python adaptation and derivative work of Myia (https://github.com/mila-iqia/myia/).
  2. #
  3. # Copyright 2020 Huawei Technologies Co., Ltd
  4. #
  5. # Licensed under the Apache License, Version 2.0 (the "License");
  6. # you may not use this file except in compliance with the License.
  7. # You may obtain a copy of the License at
  8. #
  9. # http://www.apache.org/licenses/LICENSE-2.0
  10. #
  11. # Unless required by applicable law or agreed to in writing, software
  12. # distributed under the License is distributed on an "AS IS" BASIS,
  13. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  14. # See the License for the specific language governing permissions and
  15. # limitations under the License.
  16. # ============================================================================
  17. """The module of parser python object, called by c++."""
  18. import ast
  19. import hashlib
  20. import inspect
  21. import types
  22. from dataclasses import is_dataclass
  23. from textwrap import dedent
  24. import asttokens
  25. from mindspore import Tensor as MsTensor
  26. from mindspore import context
  27. from mindspore import log as logger
  28. from mindspore import nn
  29. from mindspore import ops
  30. from mindspore.common.api import _MindSporeFunction
  31. from mindspore.common.dtype import pytype_to_dtype
  32. from .namespace import CellNamespace, ClosureNamespace, ClassMemberNamespace
  33. from .resources import parse_object_map, convert_object_map, trope_ns, SYMBOL_UNDEFINE, NO_IMPLEMENT
# define return value
RET_SUCCESS = 0
RET_FAILURE = 0xFF

# define resolve type: the codes returned by get_obj_type()
RESOLVE_TYPE_NONE = 0  # resolve None
RESOLVE_TYPE_FUNCTION = 1  # resolve function
RESOLVE_TYPE_METHOD = 2  # resolve class method
RESOLVE_TYPE_CLASS_TYPE = 3  # resolve class type
RESOLVE_TYPE_CLASS_INSTANCE = 4  # resolve the class instance of common class
RESOLVE_TYPE_INVALID = 0xFF

# define the class instance detail type: the codes returned by get_class_instance_type()
# When the type is RESOLVE_TYPE_CLASS_INSTANCE
CLASS_INSTANCE_TYPE_CELL = 0  # class instance type is Cell
CLASS_INSTANCE_TYPE_PRIMITIVE = 1  # class instance type is Primitive
CLASS_INSTANCE_TYPE_INVALID = 0xFF

# Ast main type: the second element of the list returned by get_node_type()
AST_MAIN_TYPE_STMT = 0  # ast.stmt
AST_MAIN_TYPE_EXPR = 1  # ast.expr (get_node_type() also reports ast.slice and None as this)
AST_MAIN_TYPE_SLICE = 2  # ast.Slice
AST_MAIN_TYPE_UNKNOWN = 0xFF  # unknown

# Ast sub type: the codes returned by get_ast_type()
AST_SUB_TYPE_AND = 3  # ast.And
AST_SUB_TYPE_OR = 4  # ast.Or
AST_SUB_TYPE_NAME = 5  # ast.Name
AST_SUB_TYPE_TUPLE = 6  # ast.Tuple
AST_SUB_TYPE_SUBSCRIPT = 7  # ast.Subscript
AST_SUB_TYPE_STARRED = 8  # ast.Starred
AST_SUB_TYPE_ATTRIBUTE = 9  # ast.Attribute
AST_SUB_TYPE_UNKNOWN = 0xFF  # unknown

# Process expr statement white list: method names for which expand_expr_statement()
# also returns the call target (the object the method is invoked on).
# add as needed, eg: "clear", "extend", "insert", "remove", "reverse"
parse_expr_statement_white_list = (
    "append",
)
  68. def create_slice_obj(start, end, step):
  69. """Create slice object"""
  70. return slice(start, end, step)
  71. def parse_cb(func, parse_method=None):
  72. """Implements the function of parse."""
  73. return Parser(func, parse_method)
  74. def get_parse_method_of_class(obj, parse_method=None):
  75. """
  76. Het parse method of class.
  77. Args:
  78. obj(Object): Instance of class.
  79. parse_method(str): Save the method name. Cell object has default method named 'construct'.
  80. Returns:
  81. Function, obj's method.
  82. """
  83. method = None
  84. method_name = None
  85. if parse_method is not None:
  86. method_name = parse_method
  87. else:
  88. if isinstance(obj, nn.Cell):
  89. if obj.enable_hook:
  90. if context.get_context("mode") == context.GRAPH_MODE:
  91. raise ValueError("The graph mode does not support hook function.")
  92. method_name = "_hook_construct"
  93. else:
  94. method_name = "construct"
  95. if method_name is not None:
  96. if hasattr(obj, method_name):
  97. method = getattr(obj, method_name)
  98. return method
  99. def get_bprop_method_of_class(obj, parse_method=None):
  100. """
  101. Get bprop method of class.
  102. Args:
  103. obj (Object): Instance of class.
  104. parse_method(str): Save the method name. Cell object has default method named 'bprop'.
  105. Returns:
  106. Function, obj's method.
  107. """
  108. method = None
  109. if isinstance(obj, nn.Cell):
  110. method_name = "bprop"
  111. if hasattr(obj, method_name):
  112. method = getattr(obj, method_name)
  113. return method
  114. def resolve_symbol(namespace, symbol):
  115. """
  116. Resolve a symbol.
  117. Note:
  118. Can't get function when use closure function. So save the fn on namespace.
  119. Args:
  120. namespace (Object): Symbol's namespace.
  121. symbol (str): Need resolve symbol.
  122. Returns:
  123. Object, resolve result of symbol.
  124. """
  125. # All exceptions need to be caught in this function
  126. try:
  127. resolve_ = namespace[symbol]
  128. # list and dict is not hashable ,it can not be key for the map, just return the result
  129. if isinstance(resolve_, (tuple, list, dict)):
  130. return resolve_
  131. # dataclass may not be hashable
  132. if getattr(resolve_, "__hash__") is None:
  133. return resolve_
  134. # If need trope the obj
  135. if resolve_ in convert_object_map:
  136. resolve_ = convert_object_map.get(resolve_)
  137. logger.debug("convert resolve = %r", resolve_)
  138. if resolve_ == NO_IMPLEMENT:
  139. raise NotImplementedError("not implemented for ", str(symbol))
  140. except Exception as e:
  141. if isinstance(e, NotImplementedError):
  142. raise e
  143. resolve_ = None
  144. logger.debug("resolve exception occurred, value = %r", e)
  145. logger.debug("resolve type is invalid, namespace = %s, symbol = %s",
  146. namespace.__str__(), symbol)
  147. if isinstance(resolve_, _MindSporeFunction):
  148. logger.debug("resolve class _MindSporeFunction, resolve fn instead.")
  149. resolve_ = resolve_.fn
  150. return resolve_
  151. def generate_scope(obj):
  152. """Generate the scope for every cell object in the network."""
  153. if isinstance(obj, nn.Cell):
  154. obj.generate_scope()
  155. def get_scope_name(obj):
  156. """Returns the scope of a cell object in one network."""
  157. if isinstance(obj, nn.Cell):
  158. return obj.get_scope()
  159. return None
  160. def get_object_key(obj):
  161. """Return the function key: module + name."""
  162. obj_key = ""
  163. if hasattr(obj, "__name__"):
  164. if hasattr(obj, "cell_init_args"):
  165. obj_key = "%s_ID" % (str(obj.__class__.__name__) + str(obj.__name__) + obj.cell_init_args)
  166. obj_id = "%s_ID%d" % (str(obj.__class__.__name__) + str(obj.__name__), id(obj))
  167. else:
  168. # `<class 'xxxxxxx'>`
  169. # -> `xxxxxxx`
  170. tag = str(obj.__class__)[8:-2]
  171. if hasattr(obj, "cell_init_args"):
  172. obj_key = "%s_ID" % (tag + obj.cell_init_args)
  173. obj_id = "%s_ID%d" % (tag, id(obj))
  174. logger.debug("obj_key %s obj_id = %s", obj_key, obj_id)
  175. # method has same id of different instance
  176. if isinstance(obj, types.MethodType):
  177. method_instance = obj.__self__
  178. instance_id = "%s_ID%d" % (str(method_instance.__class__.__name__), id(method_instance))
  179. obj_id = instance_id + obj_id + str(obj.__hash__())
  180. return obj_id, obj_key
  181. def is_class_member(node):
  182. """Check the attr is class member variable."""
  183. type_ = node.__class__.__name__
  184. if type_ == "Attribute":
  185. if not hasattr(node.value, "id"):
  186. return False
  187. id_ = node.value.id
  188. if id_ == "self":
  189. return True
  190. return False
  191. def get_obj_id(obj):
  192. """Get the obj id."""
  193. return str(id(obj))
  194. def get_obj_type(obj):
  195. """Get the obj type."""
  196. obj_type = RESOLVE_TYPE_INVALID
  197. if obj is None:
  198. obj_type = RESOLVE_TYPE_NONE
  199. elif isinstance(obj, types.FunctionType):
  200. obj_type = RESOLVE_TYPE_FUNCTION
  201. elif isinstance(obj, types.MethodType):
  202. obj_type = RESOLVE_TYPE_METHOD
  203. elif isinstance(obj, type):
  204. obj_type = RESOLVE_TYPE_CLASS_TYPE
  205. elif _is_class_instance(obj):
  206. obj_type = RESOLVE_TYPE_CLASS_INSTANCE
  207. else:
  208. # here for ndarray, just print its shape (in case of the array to large and print many data in screen)
  209. is_ndarray = type(obj).__name__ == 'ndarray' and hasattr(obj, 'shape')
  210. raise TypeError(f'Invalid object with type `{type(obj)}` and {"shape" if is_ndarray else "value"} '
  211. f'`{obj.shape if is_ndarray else obj}`.')
  212. return obj_type
  213. def get_class_instance_type(obj):
  214. """Get the class instance detail type."""
  215. # check the obj type
  216. logger.debug("Get the class type(%r)", obj)
  217. class_type = CLASS_INSTANCE_TYPE_INVALID
  218. if _is_class_instance(obj):
  219. if isinstance(obj, nn.Cell):
  220. class_type = CLASS_INSTANCE_TYPE_CELL
  221. elif isinstance(obj, ops.Primitive):
  222. class_type = CLASS_INSTANCE_TYPE_PRIMITIVE
  223. # Add the other type base requirement
  224. return class_type
  225. def _is_class_instance(obj):
  226. """Confirm the obj is class instance."""
  227. return isinstance(obj, (nn.Cell, ops.Primitive)) or _is_dataclass_instance(obj)
  228. def _is_dataclass_instance(obj):
  229. """check whether a class is an instance of a dataclass (and not a dataclass itself)"""
  230. return is_dataclass(obj) and not isinstance(obj, type)
  231. def _convert_tuple_to_args_kwargs(params):
  232. args = tuple()
  233. kwargs = dict()
  234. for param in params:
  235. if isinstance(param, dict):
  236. kwargs.update(param)
  237. else:
  238. args += (param,)
  239. return (args, kwargs)
  240. def create_obj_instance(cls_type, params=None):
  241. """Create python instance."""
  242. if not isinstance(cls_type, type):
  243. logger.warning(f"create_obj_instance(), cls_type is not a type, cls_type: {cls_type}")
  244. return None
  245. # Check the type, now only support nn.Cell and Primitive.
  246. obj = None
  247. if issubclass(cls_type, (nn.Cell, ops.Primitive)):
  248. # Check arguments, only support *args or **kwargs.
  249. if params is None:
  250. obj = cls_type()
  251. elif isinstance(params, tuple):
  252. args, kwargs = _convert_tuple_to_args_kwargs(params)
  253. logger.debug(f"create_obj_instance(), args: {args}, kwargs: {kwargs}")
  254. if args and kwargs:
  255. obj = cls_type(*args, **kwargs)
  256. elif args:
  257. obj = cls_type(*args)
  258. elif kwargs:
  259. obj = cls_type(**kwargs)
  260. # If invalid parameters.
  261. if obj is None:
  262. raise ValueError(f"When call 'create_instance', the parameter should be *args or **kwargs, "
  263. f"but got {params.__class__.__name__}, params: {params}")
  264. return obj
  265. def get_module_namespace(obj):
  266. """Get the module's namespace."""
  267. logger.debug("get module namespace, module = %r", obj)
  268. mod_namespace = None
  269. if isinstance(obj, types.ModuleType):
  270. mod_namespace = CellNamespace(obj.__name__)
  271. else:
  272. logger.warning("Module(%r) is invalid, get namespace failure!", obj)
  273. return mod_namespace
  274. def get_class_member_namespace_symbol(obj):
  275. """Get obj class member type."""
  276. logger.debug("get class instance namespace, object = %r", obj)
  277. class_namespace = ClassMemberNamespace(obj)
  278. logger.debug("class namesapce = %r", class_namespace)
  279. return class_namespace
  280. def get_dataclass_attributes(cls):
  281. """Get attributes of dataclass."""
  282. fields = cls.__dataclass_fields__
  283. attributes = {name: pytype_to_dtype(field.type)
  284. for name, field in fields.items()}
  285. return attributes
  286. def get_dataclass_methods(cls):
  287. """Get functions of dataclass."""
  288. methods = {name: getattr(cls, name)
  289. for name in dir(cls)
  290. if isinstance(getattr(cls, name), (types.FunctionType,))}
  291. return methods
  292. def convert_to_ms_tensor(data):
  293. """Convert C++ tensor to mindspore tensor."""
  294. return MsTensor(data)
  295. def get_object_description(obj, fname, fline):
  296. """return method or funcition description for error report, include location, class name, etc."""
  297. if isinstance(obj, types.MethodType):
  298. obj_cls = obj.__self__.__class__
  299. class_name = f'{obj_cls.__module__}.{obj_cls.__qualname__}'
  300. cls_fname = inspect.getfile(obj_cls)
  301. _, cls_fline = inspect.getsourcelines(obj_cls)
  302. class_loc = f'{cls_fname}:{cls_fline}'
  303. return f"bound method '{obj.__name__}' at {fname}:{fline} of <{class_name} at {class_loc} object>"
  304. if isinstance(obj, types.FunctionType):
  305. return f"function '{obj.__name__}' at {fname}:{fline}"
  306. if isinstance(obj, ast.FunctionDef):
  307. return f"function '{obj.name}' at {fname}:{fline}"
  308. return str(obj)
  309. def expand_expr_statement(node):
  310. """
  311. Process the expr statement and expand it.
  312. Returns:
  313. tuple, (True, expr.value, x)/(False, None, None).
  314. """
  315. if isinstance(node, ast.Expr):
  316. expr_value = node.value
  317. if isinstance(expr_value, ast.Call):
  318. func = expr_value.func
  319. if isinstance(func, ast.Attribute) and \
  320. hasattr(func, "attr") and \
  321. hasattr(func, "value"):
  322. method = func.attr
  323. target = func.value
  324. if method in parse_expr_statement_white_list:
  325. logger.debug("Expand expr, target:%s, method:%s", target, method)
  326. return True, expr_value, target
  327. if not isinstance(expr_value, ast.Str):
  328. return True, expr_value
  329. return (False,)
  330. def get_ast_namespace_symbol(obj):
  331. """Get obj type and namespace and symbol."""
  332. # step 1:get symbol from object map
  333. ops_info = parse_object_map.get(type(obj), SYMBOL_UNDEFINE)
  334. logger.debug("ops info = %r", ops_info)
  335. return ops_info
  336. def get_operation_namespace_symbol(var: str):
  337. """Get operation namespace and symbol."""
  338. ops_info = (trope_ns, var)
  339. logger.debug("get operation ops info = %r", ops_info)
  340. return ops_info
  341. def get_ast_type(node):
  342. """Get the ast type."""
  343. ast_type = AST_SUB_TYPE_UNKNOWN
  344. if isinstance(node, ast.And):
  345. ast_type = AST_SUB_TYPE_AND
  346. elif isinstance(node, ast.Or):
  347. ast_type = AST_SUB_TYPE_OR
  348. elif isinstance(node, ast.Name):
  349. ast_type = AST_SUB_TYPE_NAME
  350. elif isinstance(node, ast.Tuple):
  351. ast_type = AST_SUB_TYPE_TUPLE
  352. elif isinstance(node, ast.Subscript):
  353. ast_type = AST_SUB_TYPE_SUBSCRIPT
  354. elif isinstance(node, ast.Starred):
  355. ast_type = AST_SUB_TYPE_STARRED
  356. elif isinstance(node, ast.Attribute):
  357. ast_type = AST_SUB_TYPE_ATTRIBUTE
  358. else:
  359. ast_type = AST_SUB_TYPE_UNKNOWN
  360. return ast_type
  361. def get_node_type(node):
  362. """Process an ast node."""
  363. method_name = f'{node.__class__.__name__}'
  364. node_type = [method_name]
  365. # judge the ast main type
  366. if isinstance(node, ast.stmt):
  367. node_type.append(AST_MAIN_TYPE_STMT)
  368. elif isinstance(node, (ast.expr, ast.slice)) or node is None:
  369. # ast.slice and ast.expr should be expr
  370. node_type.append(AST_MAIN_TYPE_EXPR)
  371. else:
  372. node_type.append(AST_MAIN_TYPE_UNKNOWN)
  373. return node_type
  374. def get_args_default_values(node):
  375. """get the args'default values of parse object."""
  376. nondefaults = [None] * (len(node.args.args) - len(node.args.defaults))
  377. defaults = nondefaults + node.args.defaults + node.args.kw_defaults
  378. if node.args.vararg:
  379. defaults.append(None)
  380. if node.args.kwarg:
  381. defaults.append(None)
  382. return defaults
  383. def get_args(node):
  384. """Get the arg of parse object."""
  385. args = []
  386. # process position args
  387. for arg in node.args.args:
  388. args.append(arg)
  389. # process kwonlyargs: kwonlyargs is append after position args
  390. if node.args.kwonlyargs:
  391. for kwarg in node.args.kwonlyargs:
  392. args.append(kwarg)
  393. # process vararg: vararg is append after kwonlyargs
  394. if node.args.vararg:
  395. args.append(node.args.vararg)
  396. # process kwarg: kwarg is append after vararg
  397. if node.args.kwarg:
  398. args.append(node.args.kwarg)
  399. return args
  400. class Parser:
  401. """
  402. Parser python code to ast tree.
  403. Args:
  404. fn(FunctionType/MethodType): Need parse object instance.
  405. parse_method(ExtendInfoOfParseObj): Extend information for parse the function.
  406. ast_cache: Dictionary for caching ast tree.
  407. """
  408. ast_cache = {}
  409. def __init__(self, fn: (types.FunctionType, types.MethodType), parse_method=None) -> None:
  410. self.fn = fn
  411. self.parse_method = parse_method
  412. self.line_offset = 0
  413. self.filename: str = inspect.getfile(self.fn)
  414. # Used to resolve the function's globals Namespace.
  415. self.global_namespace = CellNamespace(fn.__module__)
  416. self.function_module = fn.__module__
  417. # Used to resolve the function's nonlocals.
  418. self.closure_namespace = ClosureNamespace(fn)
  419. self.function_name = fn.__name__
  420. self.col_offset = 0
  421. def parse(self):
  422. """Parse the function or method."""
  423. logger.debug("fn = %r", self.fn)
  424. tree = None
  425. if isinstance(self.fn, (types.FunctionType, types.MethodType)):
  426. lines, self.line_offset = inspect.getsourcelines(self.fn)
  427. original_src = ''.join(lines)
  428. hexstr = hashlib.sha256(original_src.encode()).hexdigest()
  429. tree = Parser.ast_cache.get(hexstr)
  430. if not tree:
  431. src = dedent(original_src)
  432. self.col_offset = \
  433. len(original_src.split('\n')[0]) - len(src.split('\n')[0])
  434. logger.debug("get source = %s", src)
  435. try:
  436. tree = asttokens.ASTTokens(src, parse=True).tree
  437. except IndentationError as idt_err:
  438. idt_err.filename = self.filename
  439. idt_err.lineno = self.line_offset
  440. idt_err.msg = f"There are incorrect indentations in definition or comment of function: " \
  441. f"'{self.fn.__qualname__}'."
  442. raise idt_err
  443. Parser.ast_cache[hexstr] = tree
  444. else:
  445. logger.error("Fn type is invalid")
  446. return tree
  447. def get_namespace_symbol(self, var: str):
  448. """Get symbol type and namespace and symbol."""
  449. if var in self.closure_namespace:
  450. logger.debug("in closure_namespace")
  451. return self.closure_namespace, var
  452. if var in self.global_namespace:
  453. logger.debug("in global_namespace")
  454. value = self.global_namespace[var]
  455. if isinstance(value, type(abs)) and self.global_namespace[var] not in convert_object_map:
  456. error_info = f"The builtin function '{var}' is not supported in graph mode."
  457. return None, var, error_info
  458. return self.global_namespace, var
  459. error_info = f"The name '{var}' is not defined."
  460. return None, var, error_info
  461. def analyze_super(self, class_type_node, subclass_instance):
  462. """Analyze super and return a class instance."""
  463. sub_class = type(subclass_instance)
  464. if class_type_node is None:
  465. return super(sub_class, subclass_instance)
  466. if isinstance(class_type_node, ast.Name):
  467. class_name = getattr(class_type_node, 'id')
  468. elif isinstance(class_type_node, ast.Attribute):
  469. class_name = getattr(class_type_node, 'attr')
  470. else:
  471. raise ValueError(f"When call 'super', the first arg should be a class type, "
  472. f"but got {class_type_node.__class__.__name__}.")
  473. target_father_class = None
  474. for class_element in sub_class.mro():
  475. if class_element.__name__ == class_name:
  476. target_father_class = class_element
  477. break
  478. if target_father_class is None:
  479. raise ValueError("When call 'super', the second arg should be an instance of first arg.")
  480. return super(target_father_class, subclass_instance)
  481. def get_location(self, node):
  482. """
  483. Get location of node start and end line no.
  484. Args:
  485. node: AST op node or tuple or List. This is a node in the ANF diagram,
  486. here is the code location to get this node.
  487. Returns:
  488. List, [fileName, linestart, colstart, lineend, colend].
  489. """
  490. ret = [self.filename]
  491. err_exit = 0
  492. if isinstance(node, (list, tuple)):
  493. node_size = len(node)
  494. if node_size == 0:
  495. err_exit = 1
  496. else:
  497. start_node = node[0]
  498. end_node = node[-1]
  499. else:
  500. start_node = node
  501. end_node = node
  502. if err_exit == 0:
  503. if hasattr(start_node, "lineno") and \
  504. hasattr(end_node, "col_offset"):
  505. start_lineno, start_colno = start_node.first_token.start
  506. end_lineno, end_colno = end_node.last_token.end
  507. start_lineno += self.line_offset - 1
  508. start_colno += self.col_offset
  509. end_lineno += self.line_offset - 1
  510. end_colno += self.col_offset
  511. ret = ret + [start_lineno, start_colno, end_lineno, end_colno]
  512. else:
  513. ret = ret + [0, 0, 0, 0]
  514. return ret