You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

parser.py 17 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493
  1. # This is the Python adaptation and derivative work of Myia (https://github.com/mila-iqia/myia/).
  2. #
  3. # Copyright 2020 Huawei Technologies Co., Ltd
  4. #
  5. # Licensed under the Apache License, Version 2.0 (the "License");
  6. # you may not use this file except in compliance with the License.
  7. # You may obtain a copy of the License at
  8. #
  9. # http://www.apache.org/licenses/LICENSE-2.0
  10. #
  11. # Unless required by applicable law or agreed to in writing, software
  12. # distributed under the License is distributed on an "AS IS" BASIS,
  13. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  14. # See the License for the specific language governing permissions and
  15. # limitations under the License.
  16. # ============================================================================
  17. """The module of parser python object, called by c++."""
  18. import ast
  19. import types
  20. import inspect
  21. from textwrap import dedent
  22. from dataclasses import is_dataclass
  23. import asttokens
  24. import mindspore.nn as nn
  25. from mindspore import log as logger
  26. from mindspore import ops
  27. from mindspore.common.dtype import pytype_to_dtype
  28. from mindspore.common.api import _MindSporeFunction
  29. from .namespace import CellNamespace, ClosureNamespace, ClassMemberNamespace
  30. from .resources import parse_object_map, convert_object_map, trope_ns, SYMBOL_UNDEFINE, NO_IMPLEMENT
  31. from ..utils import Slice
# NOTE(review): the module docstring says this module is called by c++, so
# these numeric codes are presumably mirrored on the C++ side — confirm before
# renumbering any of them.

# define return value
RET_SUCCESS = 0
RET_FAILURE = 0xFF

# define resolve type (the codes returned by get_obj_type)
RESOLVE_TYPE_NONE = 0 # resolve None
RESOLVE_TYPE_FUNCTION = 1 # resolve function
RESOLVE_TYPE_METHOD = 2 # resolve class method
RESOLVE_TYPE_CLASS_TYPE = 3 # resolve class type
RESOLVE_TYPE_CLASS_INSTANCE = 4 # resolve the class instance of common class
RESOLVE_TYPE_INVALID = 0xFF

# define the class instance detail type
# When the type is RESOLVE_TYPE_CLASS_INSTANCE
# (the codes returned by get_class_instance_type)
CLASS_INSTANCE_TYPE_CELL = 0 # class instance type is Cell
CLASS_INSTANCE_TYPE_PRIMITIVE = 1 # class instance type is Primitive
CLASS_INSTANCE_TYPE_INVALID = 0xFF

# Ast main type (second element of the list built by Parser.get_node_type)
AST_MAIN_TYPE_STMT = 0 # ast.Stmt
AST_MAIN_TYPE_EXPR = 1 # ast.Expr
AST_MAIN_TYPE_SLICE = 2 # ast.Slice
AST_MAIN_TYPE_UNKNOWN = 0xFF # unknown

# Ast sub type (the codes returned by Parser.get_ast_type)
AST_SUB_TYPE_AND = 3 # ast.And
AST_SUB_TYPE_OR = 4 # ast.Or
AST_SUB_TYPE_NAME = 5 # ast.Name
AST_SUB_TYPE_TUPLE = 6 # ast.Tuple
AST_SUB_TYPE_SUBSCRIPT = 7 # ast.Subscript
AST_SUB_TYPE_STARRED = 8 # ast.Starred
AST_SUB_TYPE_UNKNOWN = 0xFF # unknown

# Process expr statement white list: method names for which
# Parser.expand_expr_statement also returns the call's target object.
# add as needed, eg: "clear", "extend", "insert", "remove", "reverse"
parse_expr_statement_white_list = (
    "append",
)
  65. def create_slice_obj(start, end, step):
  66. """Create Slice object"""
  67. return Slice(start, end, step)
  68. def parse_cb(func, parse_method=None):
  69. """Implements the function of parse."""
  70. return Parser(func, parse_method)
  71. def get_parse_method_of_class(obj, parse_method=None):
  72. """
  73. Het parse method of class.
  74. Args:
  75. obj(Object): Instance of class.
  76. parse_method(str): Save the method name. Cell object has default method named 'construct'.
  77. Returns:
  78. Function, obj's method.
  79. """
  80. method = None
  81. method_name = None
  82. if parse_method is not None:
  83. method_name = parse_method
  84. else:
  85. if isinstance(obj, nn.Cell):
  86. method_name = "construct"
  87. if method_name is not None:
  88. if hasattr(obj, method_name):
  89. method = getattr(obj, method_name)
  90. return method
  91. def get_bprop_method_of_class(obj, parse_method=None):
  92. """
  93. Get bprop method of class.
  94. Args:
  95. obj (Object): Instance of class.
  96. parse_method(str): Save the method name. Cell object has default method named 'bprop'.
  97. Returns:
  98. Function, obj's method.
  99. """
  100. method = None
  101. if isinstance(obj, nn.Cell):
  102. method_name = "bprop"
  103. if hasattr(obj, method_name):
  104. method = getattr(obj, method_name)
  105. return method
  106. def resolve_symbol(namespace, symbol):
  107. """
  108. Resolve a symbol.
  109. Note:
  110. Can't get function when use closure function. So save the fn on namespace.
  111. Args:
  112. namespace (Object): Symbol's namespace.
  113. symbol (str): Need resolve symbol.
  114. Returns:
  115. Object, resolve result of symbol.
  116. """
  117. # All exceptions need to be caught in this function
  118. try:
  119. resolve_ = namespace[symbol]
  120. # list and dict is not hashable ,it can not be key for the map, just return the result
  121. if isinstance(resolve_, (list, dict)):
  122. return resolve_
  123. # dataclass may not be hashable
  124. if getattr(resolve_, "__hash__") is None:
  125. return resolve_
  126. # If need trope the obj
  127. if resolve_ in convert_object_map:
  128. resolve_ = convert_object_map.get(resolve_)
  129. logger.debug("convert resolve = %r", resolve_)
  130. if resolve_ == NO_IMPLEMENT:
  131. raise NotImplementedError("not implemented for ", str(symbol))
  132. except Exception as e:
  133. if isinstance(e, NotImplementedError):
  134. raise e
  135. resolve_ = None
  136. logger.debug("resolve exception occurred, value = %r", e)
  137. logger.debug("resolve type is invalid, namespace = %s, symbol = %s",
  138. namespace.__str__(), symbol)
  139. if isinstance(resolve_, _MindSporeFunction):
  140. logger.debug("resolve class _MindSporeFunction, resolve fn instead.")
  141. resolve_ = resolve_.fn
  142. return resolve_
  143. def generate_scope(obj):
  144. """Generate the scope for every cell object in the network."""
  145. if isinstance(obj, nn.Cell):
  146. obj.generate_scope()
  147. def get_scope_name(obj):
  148. """Returns the scope of a cell object in one network."""
  149. if isinstance(obj, nn.Cell):
  150. return obj.get_scope()
  151. return None
  152. def get_object_key(obj):
  153. """Return the function key: module + name."""
  154. obj_key = ""
  155. if hasattr(obj, "__name__"):
  156. if hasattr(obj, "cell_init_args"):
  157. obj_key = "%s_ID" % (str(obj.__class__.__name__) + str(obj.__name__) + obj.cell_init_args)
  158. obj_id = "%s_ID%d" % (str(obj.__class__.__name__) + str(obj.__name__), id(obj))
  159. else:
  160. if hasattr(obj, "cell_init_args"):
  161. obj_key = "%s_ID" % (str(obj.__class__.__name__) + obj.cell_init_args)
  162. obj_id = "%s_ID%d" % (str(obj.__class__.__name__), id(obj))
  163. logger.debug("obj_key %s obj_id = %s", obj_key, obj_id)
  164. # method has same id of different instance
  165. if isinstance(obj, types.MethodType):
  166. method_instance = obj.__self__
  167. instance_id = "%s_ID%d" % (str(method_instance.__class__.__name__), id(method_instance))
  168. obj_id = instance_id + obj_id
  169. return obj_id, obj_key
  170. def is_class_member(node):
  171. """Check the attr is class member variable."""
  172. type_ = node.__class__.__name__
  173. if type_ == "Attribute":
  174. if not hasattr(node.value, "id"):
  175. return False
  176. id_ = node.value.id
  177. if id_ == "self":
  178. return True
  179. return False
  180. def get_obj_type(obj):
  181. """Get the obj type."""
  182. obj_type = RESOLVE_TYPE_INVALID
  183. if obj is None:
  184. obj_type = RESOLVE_TYPE_NONE
  185. elif isinstance(obj, types.FunctionType):
  186. obj_type = RESOLVE_TYPE_FUNCTION
  187. elif isinstance(obj, types.MethodType):
  188. obj_type = RESOLVE_TYPE_METHOD
  189. elif isinstance(obj, type):
  190. obj_type = RESOLVE_TYPE_CLASS_TYPE
  191. elif _is_class_instance(obj):
  192. obj_type = RESOLVE_TYPE_CLASS_INSTANCE
  193. else:
  194. # here for ndarray, just print its shape (in case of the array to large and print many data in screen)
  195. is_ndarray = type(obj).__name__ == 'ndarray' and hasattr(obj, 'shape')
  196. raise TypeError(f'Invalid object with type `{type(obj)}` and {"shape" if is_ndarray else "value"} '
  197. f'`{obj.shape if is_ndarray else obj}`.')
  198. return obj_type
  199. def get_class_instance_type(obj):
  200. """Get the class instance detail type."""
  201. # check the obj type
  202. logger.debug("Get the class type(%r)", obj)
  203. class_type = CLASS_INSTANCE_TYPE_INVALID
  204. if _is_class_instance(obj):
  205. if isinstance(obj, nn.Cell):
  206. class_type = CLASS_INSTANCE_TYPE_CELL
  207. elif isinstance(obj, ops.Primitive):
  208. class_type = CLASS_INSTANCE_TYPE_PRIMITIVE
  209. # Add the other type base requirement
  210. return class_type
  211. def _is_class_instance(obj):
  212. """Confirm the obj is class instance."""
  213. return isinstance(obj, (nn.Cell, ops.Primitive)) or _is_dataclass_instance(obj)
  214. def _is_dataclass_instance(obj):
  215. """check whether a class is an instance of a dataclass (and not a dataclass itself)"""
  216. return is_dataclass(obj) and not isinstance(obj, type)
  217. def create_obj_instance(cls_type, args_tuple=None):
  218. """Create python instance."""
  219. obj = None
  220. if isinstance(cls_type, type):
  221. # check the type, now only support nn.Cell and Primitive
  222. if issubclass(cls_type, (nn.Cell, ops.Primitive)):
  223. if args_tuple is not None:
  224. obj = cls_type(*args_tuple)
  225. else:
  226. obj = cls_type()
  227. return obj
  228. def get_module_namespace(obj):
  229. """Get the module's namespace."""
  230. logger.debug("get module namespace, module = %r", obj)
  231. mod_namespace = None
  232. if isinstance(obj, types.ModuleType):
  233. mod_namespace = CellNamespace(obj.__name__)
  234. else:
  235. logger.warning("Module(%r) is invalid, get namespace failure!", obj)
  236. return mod_namespace
  237. def get_class_member_namespace_symbol(obj):
  238. """Get obj class member type."""
  239. logger.debug("get class instance namespace, object = %r", obj)
  240. class_namespace = ClassMemberNamespace(obj)
  241. logger.debug("class namesapce = %r", class_namespace)
  242. return class_namespace
  243. def get_dataclass_attributes(cls):
  244. """Get attributes of dataclass."""
  245. fields = cls.__dataclass_fields__
  246. attributes = {name: pytype_to_dtype(field.type)
  247. for name, field in fields.items()}
  248. return attributes
  249. def get_dataclass_methods(cls):
  250. """Get functions of dataclass."""
  251. methods = {name: getattr(cls, name)
  252. for name in dir(cls)
  253. if isinstance(getattr(cls, name), (types.FunctionType,))}
  254. return methods
  255. class Parser:
  256. """
  257. Parser python code to ast tree.
  258. Args:
  259. fn(FunctionType/MethodType): Need parse object instance.
  260. parse_method(ExtendInfoOfParseObj): Extend information for parse the function.
  261. """
  262. def __init__(self, fn: (types.FunctionType, types.MethodType), parse_method=None) -> None:
  263. self.fn = fn
  264. self.parse_method = parse_method
  265. _, self.line_offset = inspect.getsourcelines(self.fn)
  266. self.filename: str = inspect.getfile(self.fn)
  267. # Used to resolve the function's globals Namespace.
  268. self.global_namespace = CellNamespace(fn.__module__)
  269. self.function_module = fn.__module__
  270. # Used to resolve the function's nonlocals.
  271. self.closure_namespace = ClosureNamespace(fn)
  272. self.function_name = fn.__name__
  273. self.col_offset = 0
  274. def parse(self):
  275. """Parse the function or method."""
  276. logger.debug("fn = %r", self.fn)
  277. tree = None
  278. if isinstance(self.fn, (types.FunctionType, types.MethodType)):
  279. original_src = inspect.getsource(self.fn)
  280. src = dedent(original_src)
  281. self.col_offset = \
  282. len(original_src.split('\n')[0]) - len(src.split('\n')[0])
  283. logger.debug("get source = %s", src)
  284. tree = asttokens.ASTTokens(src, parse=True).tree
  285. else:
  286. logger.error("Fn type is invalid")
  287. return tree
  288. def get_args(self, node):
  289. """Get the arg of parse object."""
  290. args = []
  291. # process position args
  292. for arg in node.args.args:
  293. args.append(arg)
  294. # process kwonlyargs: kwonlyargs is append after position args
  295. if node.args.kwonlyargs:
  296. for kwarg in node.args.kwonlyargs:
  297. args.append(kwarg)
  298. # process vararg: vararg is append after kwonlyargs
  299. if node.args.vararg:
  300. args.append(node.args.vararg)
  301. # process kwarg: kwarg is append after vararg
  302. if node.args.kwarg:
  303. args.append(node.args.kwarg)
  304. return args
  305. def get_args_default_values(self, node):
  306. """get the args'default values of parse object."""
  307. nondefaults = [None] * (len(node.args.args) - len(node.args.defaults))
  308. defaults = nondefaults + node.args.defaults + node.args.kw_defaults
  309. if node.args.vararg:
  310. defaults.append(None)
  311. if node.args.kwarg:
  312. defaults.append(None)
  313. return defaults
  314. def get_node_type(self, node):
  315. """Process an ast node."""
  316. method_name = f'{node.__class__.__name__}'
  317. node_type = [method_name]
  318. # judge the ast main type
  319. if isinstance(node, ast.stmt):
  320. node_type.append(AST_MAIN_TYPE_STMT)
  321. elif isinstance(node, (ast.expr, ast.slice)) or node is None:
  322. # ast.slice and ast.expr should be expr
  323. node_type.append(AST_MAIN_TYPE_EXPR)
  324. else:
  325. node_type.append(AST_MAIN_TYPE_UNKNOWN)
  326. return node_type
  327. def get_ast_type(self, node):
  328. """Get the ast type."""
  329. ast_type = AST_SUB_TYPE_UNKNOWN
  330. if isinstance(node, ast.And):
  331. ast_type = AST_SUB_TYPE_AND
  332. elif isinstance(node, ast.Or):
  333. ast_type = AST_SUB_TYPE_OR
  334. elif isinstance(node, ast.Name):
  335. ast_type = AST_SUB_TYPE_NAME
  336. elif isinstance(node, ast.Tuple):
  337. ast_type = AST_SUB_TYPE_TUPLE
  338. elif isinstance(node, ast.Subscript):
  339. ast_type = AST_SUB_TYPE_SUBSCRIPT
  340. elif isinstance(node, ast.Starred):
  341. ast_type = AST_SUB_TYPE_STARRED
  342. else:
  343. ast_type = AST_SUB_TYPE_UNKNOWN
  344. return ast_type
  345. def get_namespace_symbol(self, var: str):
  346. """Get symbol type and namespace and symbol."""
  347. if var in self.closure_namespace:
  348. ops_info = (self.closure_namespace, var)
  349. logger.debug("in closure_namespace")
  350. elif var in self.global_namespace:
  351. ops_info = (self.global_namespace, var)
  352. logger.debug("in global_namespace")
  353. else:
  354. ops_info = parse_object_map.get(SYMBOL_UNDEFINE)
  355. ops_info = [ops_info[0], var]
  356. return ops_info
  357. def get_operation_namespace_symbol(self, var: str):
  358. """Get operation namespace and symbol."""
  359. ops_info = (trope_ns, var)
  360. logger.debug("get operation ops info = %r", ops_info)
  361. return ops_info
  362. def get_ast_namespace_symbol(self, obj):
  363. """Get obj type and namespace and symbol."""
  364. # step 1:get symbol from object map
  365. ops_info = parse_object_map.get(type(obj), SYMBOL_UNDEFINE)
  366. logger.debug("ops info = %r", ops_info)
  367. return ops_info
  368. def get_location(self, node):
  369. """
  370. Get location of node start and end line no.
  371. Args:
  372. node: AST op node or tuple or List. This is a node in the ANF diagram,
  373. here is the code location to get this node.
  374. Returns:
  375. List, [fileName, linestart, colstart, lineend, colend].
  376. """
  377. ret = [self.filename]
  378. err_exit = 0
  379. if isinstance(node, (list, tuple)):
  380. node_size = len(node)
  381. if node_size == 0:
  382. err_exit = 1
  383. else:
  384. start_node = node[0]
  385. end_node = node[-1]
  386. else:
  387. start_node = node
  388. end_node = node
  389. if err_exit == 0:
  390. if hasattr(start_node, "lineno") and \
  391. hasattr(end_node, "col_offset"):
  392. start_lineno, start_colno = start_node.first_token.start
  393. end_lineno, end_colno = end_node.last_token.end
  394. start_lineno += self.line_offset - 1
  395. start_colno += self.col_offset
  396. end_lineno += self.line_offset - 1
  397. end_colno += self.col_offset
  398. ret = ret + [start_lineno, start_colno, end_lineno, end_colno]
  399. else:
  400. ret = ret + [0, 0, 0, 0]
  401. return ret
  402. def expand_expr_statement(self, node):
  403. """
  404. Process the expr statement and expand it.
  405. Returns:
  406. tuple, (True, expr.value, x)/(False, None, None).
  407. """
  408. if isinstance(node, ast.Expr) and hasattr(node, "value"):
  409. expr_value = node.value
  410. if isinstance(expr_value, ast.Call):
  411. func = expr_value.func
  412. if isinstance(func, ast.Attribute) and \
  413. hasattr(func, "attr") and \
  414. hasattr(func, "value"):
  415. method = func.attr
  416. target = func.value
  417. if method in parse_expr_statement_white_list:
  418. logger.debug("Expand expr, target:%s, method:%s", target, method)
  419. return True, expr_value, target
  420. return True, expr_value
  421. return False, None, None