You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

execution_tree.cc 8.6 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219
  1. /**
  2. * Copyright 2019 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include "dataset/engine/execution_tree.h"
  17. #include <iostream>
  18. #include <string>
  19. #include "dataset/engine/datasetops/dataset_op.h"
  20. #include "dataset/engine/datasetops/shuffle_op.h"
  21. #include "dataset/util/task_manager.h"
  22. namespace mindspore {
  23. namespace dataset {
  24. // Constructor
  25. ExecutionTree::ExecutionTree() : id_count_(0) {
  26. tg_ = std::make_unique<TaskGroup>();
  27. tree_state_ = kDeTStateInit;
  28. prepare_flags_ = kDePrepNone;
  29. }
  30. // Destructor
  31. ExecutionTree::~ExecutionTree() { (void)tg_->ServiceStop(); }
  32. // Associates a DatasetOp with this tree. This assigns a valid node id to the operator and
  33. // provides it with a link to the tree. A node cannot form any relationships (parent/child) with
  34. // other nodes unless they are associated with the same tree.
  35. Status ExecutionTree::AssociateNode(const std::shared_ptr<DatasetOp> &op) {
  36. if (tree_state_ != kDeTStateInit && tree_state_ != kDeTStateBuilding) {
  37. std::string err_msg =
  38. "Invalid tree state for adding a node. Current state: " + std::to_string(static_cast<int>(tree_state_)) +
  39. " Expected states: " + std::to_string(static_cast<int>(kDeTStateInit)) + " or " +
  40. std::to_string(static_cast<int>(kDeTStateBuilding));
  41. RETURN_STATUS_UNEXPECTED(err_msg);
  42. }
  43. // Enter the building state if we were not already there
  44. tree_state_ = kDeTStateBuilding;
  45. // Assign an id to the operator
  46. op->set_id(id_count_);
  47. id_count_++;
  48. // Assign our tree into the op so that each op has a link back to the tree
  49. op->set_tree(this);
  50. return Status::OK();
  51. }
  52. // Sets the root node of the tree
  53. Status ExecutionTree::AssignRoot(const std::shared_ptr<DatasetOp> &op) {
  54. // Tree must be in building state before we can assign root to it
  55. if (tree_state_ != kDeTStateBuilding) {
  56. std::string err_msg =
  57. "Invalid tree state for assigning a root node. Current state: " + std::to_string(static_cast<int>(tree_state_)) +
  58. " Expected state: " + std::to_string(static_cast<int>(kDeTStateBuilding));
  59. RETURN_STATUS_UNEXPECTED(err_msg);
  60. }
  61. // If they didn't already call AssociateNode for this node before calling AssignRoot,
  62. // then do so now.
  63. if (op->operator_id_ == DatasetOp::kInvalidOperatorId) {
  64. RETURN_IF_NOT_OK(this->AssociateNode(op));
  65. }
  66. // Then add it as the root.
  67. root_ = op;
  68. // The tree has an assigned root now and it's ready to be prepared.
  69. tree_state_ = kDeTStatePrepare;
  70. return Status::OK();
  71. }
  72. // A print method typically used for debugging
  73. void ExecutionTree::Print(std::ostream &out) const {
  74. out << "Execution tree summary:\n"
  75. << "-----------------------\n";
  76. this->PrintNode(out, root_, "", true, false);
  77. out << "\nExecution tree operator details:\n"
  78. << "--------------------------------\n";
  79. this->PrintNode(out, root_, "", true, true);
  80. }
  81. // A helper functions for doing the recursive printing
  82. void ExecutionTree::PrintNode(std::ostream &out, const std::shared_ptr<DatasetOp> &dataset_op, std::string indent,
  83. bool last, bool detailed) const {
  84. // Decide which printer to use based on detailed arg.
  85. if (!detailed) {
  86. out << indent << "+- " << *dataset_op;
  87. indent += (last ? " " : "| ");
  88. } else {
  89. dataset_op->Print(out, detailed);
  90. }
  91. // Descend to children
  92. for (int32_t i = 0; i < dataset_op->child_.size(); ++i) {
  93. this->PrintNode(out, dataset_op->child_[i], indent, (i == (dataset_op->child_.size() - 1)), detailed);
  94. }
  95. }
  96. // Start the execution of the tree
  97. Status ExecutionTree::Launch() {
  98. // Tree must be built and prepared before it can be launched!
  99. if (tree_state_ != kDeTStateReady) {
  100. std::string err_msg =
  101. "Invalid tree state for launching tree. Current state: " + std::to_string(static_cast<int>(tree_state_)) +
  102. " Expected state: " + std::to_string(static_cast<int>(kDeTStateReady));
  103. RETURN_STATUS_UNEXPECTED(err_msg);
  104. }
  105. std::ostringstream ss;
  106. ss << *this;
  107. MS_LOG(INFO) << "Printing the tree before launch tasks:\n" << ss.str();
  108. for (auto itr = this->begin(); itr != this->end(); ++itr) {
  109. // An inlined operator is one that has an output connector size of 0, and it does not
  110. // require a thread to execute. Instead, the work of this operator is executed inlined
  111. // from the tree node directly above it (or in the case of a root node, it runs from within
  112. // the launching tree/user thread. Do not exec any thread for an inlined op.
  113. itr->state_ = DatasetOp::OpState::kDeOpRunning;
  114. if (!itr->inlined()) {
  115. RETURN_IF_NOT_OK(tg_->CreateAsyncTask("Op launched, OperatorId:" + std::to_string(itr->id()), std::ref(*itr)));
  116. // Set the state of the Operator as running. This only matters in Leaf ops, CacheOp and TakeOp
  117. }
  118. }
  119. tree_state_ = kDeTStateExecuting;
  120. return Status::OK();
  121. }
  122. // A function that traverse the tree in postorder then save the results in nodes
  123. void ExecutionTree::Iterator::PostOrderTraverse(const std::shared_ptr<DatasetOp> &node) {
  124. if (node == nullptr) {
  125. return;
  126. }
  127. for (int32_t i = 0; i < node->child_.size(); ++i) {
  128. PostOrderTraverse(node->child_[i]);
  129. }
  130. nodes_.push_back(node);
  131. }
  132. ExecutionTree::Iterator::Iterator(const std::shared_ptr<DatasetOp> &root) : ind_(0) {
  133. // post-order traverse the tree, if root is null, it return
  134. PostOrderTraverse(root);
  135. nodes_.emplace_back(nullptr);
  136. }
  137. // Given the number of workers, launches the worker entry function for each. Essentially a
  138. // wrapper for the TaskGroup handling that is stored inside the execution tree.
  139. Status ExecutionTree::LaunchWorkers(int32_t num_workers, std::function<Status(uint32_t)> func) {
  140. // Launch the workers
  141. for (int32_t i = 0; i < num_workers; ++i) {
  142. RETURN_IF_NOT_OK(tg_->CreateAsyncTask("Parallel Op Worker", std::bind(func, i)));
  143. }
  144. return Status::OK();
  145. }
  146. // The driver of the prepare phase of the execution tree. The prepare phase will recursively
  147. // walk the tree to perform modifications to the tree or specific nodes within the tree to get
  148. // it ready for execution.
  149. Status ExecutionTree::Prepare() {
  150. // Tree must be in pending prepare state before we can assign root to it
  151. if (tree_state_ != kDeTStatePrepare) {
  152. std::string err_msg =
  153. "Invalid tree state for preparing the tree. Current state: " + std::to_string(static_cast<int>(tree_state_)) +
  154. " Expected state: " + std::to_string(static_cast<int>(kDeTStatePrepare));
  155. RETURN_STATUS_UNEXPECTED(err_msg);
  156. }
  157. // Start the recursive prepare
  158. RETURN_IF_NOT_OK(this->PrepareNode(root_));
  159. tree_state_ = kDeTStateReady;
  160. return Status::OK();
  161. }
  162. // Recursive function used during prepare phase to visit a node and drive any pre- and post-
  163. // node actions during a tree walk.
  164. Status ExecutionTree::PrepareNode(const std::shared_ptr<DatasetOp> &dataset_op) {
  165. // execute PreAction
  166. RETURN_IF_NOT_OK(dataset_op->PrepareNodePreAction());
  167. // Before going down into children, make any prepare flags updates based on this operator.
  168. uint32_t op_prep_flags = dataset_op->PrepareFlags();
  169. BitSet(&prepare_flags_, op_prep_flags);
  170. // Now, descend to children
  171. for (const auto &i : dataset_op->child_) {
  172. RETURN_IF_NOT_OK(this->PrepareNode(i));
  173. }
  174. // Then clear the flags from this op now that we have prepared it.
  175. BitClear(&prepare_flags_, op_prep_flags);
  176. // No more children, now we execute any prepare actions before going back up the
  177. // the tree on recursive function
  178. RETURN_IF_NOT_OK(dataset_op->PrepareNodePostAction());
  179. return Status::OK();
  180. }
  181. // Adds an operator to the repeat stack during prepare phase.
  182. void ExecutionTree::AddToRepeatStack(std::shared_ptr<DatasetOp> dataset_op) { repeat_stack_.push(dataset_op); }
  183. // Pops an operator from the repeat stack during prepare phase.
  184. std::shared_ptr<DatasetOp> ExecutionTree::PopFromRepeatStack() {
  185. std::shared_ptr<DatasetOp> top_op = nullptr;
  186. if (!repeat_stack_.empty()) {
  187. top_op = repeat_stack_.top();
  188. repeat_stack_.pop();
  189. }
  190. return top_op;
  191. }
  192. } // namespace dataset
  193. } // namespace mindspore