|
- /**
- * Copyright 2020 Huawei Technologies Co., Ltd
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- * http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
- #include "kernel/cpu/allgather_cpu_kernel.h"
- #include "device/cpu/cpu_device_address.h"
- #include "device/cpu/mpi/mpi_adapter.h"
- #include "ir/primitive.h"
- #include "utils/log_adapter.h"
-
- namespace mindspore {
- namespace kernel {
- namespace {
- constexpr auto kRanksGroup = "group";
- constexpr auto kAllGatherInputNum = 1;
- } // namespace
-
- AllGatherCPUKernel::AllGatherCPUKernel() : input_data_number_(0) {}
-
- void AllGatherCPUKernel::InitKernel(const CNodePtr &kernel_node) {
- size_t input_num = AnfAlgo::GetInputTensorNum(kernel_node);
- if (input_num != kAllGatherInputNum) {
- MS_LOG(EXCEPTION) << "allgather input num:" << input_num;
- }
- for (size_t i = 0; i < input_num; ++i) {
- auto shape = AnfAlgo::GetPrevNodeOutputInferShape(kernel_node, i);
- size_t count = 1;
- for (size_t j = 0; j < shape.size(); j++) {
- count *= IntToSize(shape[j]);
- }
- input_data_number_ += count;
- }
-
- auto ranks_group = AnfAlgo::GetCNodePrimitive(kernel_node)->GetAttr(kRanksGroup);
- if (ranks_group != nullptr) {
- ranks_group_ = GetValue<std::vector<int>>(ranks_group);
- } else {
- MS_LOG(EXCEPTION) << "Miss attribute " << kRanksGroup;
- }
- }
-
- bool AllGatherCPUKernel::Launch(const std::vector<kernel::AddressPtr> &inputs,
- const std::vector<kernel::AddressPtr> & /*workspace*/,
- const std::vector<kernel::AddressPtr> &outputs) {
- auto input_addr = reinterpret_cast<float *>(inputs[0]->addr);
- auto output_addr = reinterpret_cast<float *>(outputs[0]->addr);
-
- return device::cpu::MPIAdapter::Instance().AllGather(input_addr, output_addr, ranks_group_, input_data_number_);
- }
- } // namespace kernel
- } // namespace mindspore
|