/** * Copyright 2019 Huawei Technologies Co., Ltd * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ #ifndef DATASET_ENGINE_DATASETOPS_PARALLEL_OP_H_ #define DATASET_ENGINE_DATASETOPS_PARALLEL_OP_H_ #include #include #include "dataset/core/constants.h" #include "dataset/engine/datasetops/dataset_op.h" #include "dataset/util/status.h" namespace mindspore { namespace dataset { // global const in our namespace constexpr int32_t kEndOfActions = -1; // Forward declares class DataBuffer; class DbConnector; // A ParallelOp provides a multi-threaded DatasetOp class ParallelOp : public DatasetOp { public: // Constructor // @param num_workers // @param op_connector_size - size of the output connector for this operator // @param sampler - The sampler for the op ParallelOp(int32_t num_workers, int32_t op_connector_size, std::shared_ptr sampler = nullptr); // Destructor ~ParallelOp() = default; // Creates the internal worker connector for the parallel op if the derived class wants to use it. // @notes This changes the number of producers of this op to 1, since it establishes a master/worker // relationship within the op, making all production flow through a single master. // @return Status - The error return code Status CreateWorkerConnector(int32_t worker_connector_size); // A print method typically used for debugging // @param out - The output stream to write output to // @param show_all - A bool to control if you want to show all info or just a summary void Print(std::ostream &out, bool show_all) const override; // << Stream output operator overload // @notes This allows you to write the debug print info using stream operators // @param out - reference to the output stream being overloaded // @param pO - reference to the ParallelOp to display // @return - the output stream must be returned friend std::ostream &operator<<(std::ostream &out, const ParallelOp &po) { po.Print(out, false); return out; } // During tree prepare phase, operators may have specific pre-operations to perform depending on // their role. // @notes Derived versions of this function should always call it's superclass version first // before providing their own implementations. // @return Status - The error return code Status PrepareNodePreAction() override { // Run common code from super class before adding ParallelOp specific logic return (DatasetOp::PrepareNodePreAction()); } // During tree prepare phase, operators may have specific post-operations to perform depending on // their role. // @notes Derived versions of this function should always call it's superclass version first // before providing their own implementations. // @return Status - The error return code Status PrepareNodePostAction() override { // Run common code from super class before adding ParallelOp specific logic return (DatasetOp::PrepareNodePostAction()); } // Override base class reset to provide reset actions specific to the ParallelOp class. // @return Status - The error code return Status Reset() override; // Getter // @return the number of workers int32_t num_workers() const override { return num_workers_; } // Getter // @return the number of threads consuming from the previous Connector int32_t num_consumers() const override { return num_workers_; } // Getter // @return the number of producers pushing to the output Connector // @notes The number of producers is commonly the same as number of workers, except in the case // when a worker connector is set up. In that case, there are n workers, and a single master // such that only 1 thread is a producer rather than the n workers. // @return the number of producers int32_t num_producers() const override { return num_producers_; } // Register the internal worker connectors. // @return Status Status RegisterWorkerConnectors() override; protected: // Interface for derived classes to implement. All derived classes must provide the entry // function with the main execution loop for worker threads. // @return Status - The error code return virtual Status WorkerEntry(int32_t workerId) = 0; int32_t num_workers_; // The number of worker threads int32_t num_producers_; // The number of threads pushing to the out_connector_ int32_t worker_connector_size_; std::unique_ptr worker_connector_; // The internal connector for worker threads }; } // namespace dataset } // namespace mindspore #endif // DATASET_ENGINE_DATASETOPS_PARALLEL_OP_H_