/** * Copyright 2019 Huawei Technologies Co., Ltd * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ #include "device/gpu/cuda_driver.h" #include #include "utils/log_adapter.h" #include "utils/convert_utils.h" namespace mindspore { namespace device { namespace gpu { size_t CudaDriver::AllocDeviceMem(size_t size, DeviceMemPtr *addr) { size_t retreat_count = 0; auto ret = cudaMalloc(reinterpret_cast(addr), size); // If free memory is not enough, then retry with mem_malloc_retry_rate_. while (ret == cudaErrorMemoryAllocation) { size = FloatToSize(size * mem_malloc_retry_rate_); size = (size / mem_malloc_align_size_) * mem_malloc_align_size_; ret = cudaMalloc(reinterpret_cast(addr), size); retreat_count++; if (retreat_count > mem_malloc_retry_conut_max_) { break; } } if (ret != cudaSuccess) { MS_LOG(ERROR) << "cudaMalloc failed, ret[" << static_cast(ret) << "], " << cudaGetErrorString(ret); return 0; } return size; } bool CudaDriver::FreeDeviceMem(const DeviceMemPtr &addr) { auto ret = cudaFree(addr); if (ret != cudaSuccess) { MS_LOG(ERROR) << "cudaFree failed, ret[" << static_cast(ret) << "], " << cudaGetErrorString(ret); return false; } return true; } bool CudaDriver::CopyHostMemToDevice(const DeviceMemPtr &dst, const void *src, size_t size) { auto ret = cudaMemcpy(dst, src, size, cudaMemcpyHostToDevice); if (ret != cudaSuccess) { MS_LOG(ERROR) << "cudaMemcpy failed, ret[" << static_cast(ret) << "], " << cudaGetErrorString(ret); return false; } return true; } bool CudaDriver::CopyDeviceMemToHost(const HostMemPtr &dst, const DeviceMemPtr &src, size_t size) { auto ret = cudaMemcpy(dst, src, size, cudaMemcpyDeviceToHost); if (ret != cudaSuccess) { MS_LOG(ERROR) << "cudaMemcpy failed, ret[" << static_cast(ret) << "], " << cudaGetErrorString(ret); return false; } return true; } size_t CudaDriver::total_mem_size() { size_t free; size_t total; auto ret = cudaMemGetInfo(&free, &total); if (ret != cudaSuccess) { MS_LOG(ERROR) << "cudaMemGetInfo failed, ret[" << static_cast(ret) << "], " << cudaGetErrorString(ret); return 0; } return total; } size_t CudaDriver::free_mem_size() { size_t free; size_t total; auto ret = cudaMemGetInfo(&free, &total); if (ret != cudaSuccess) { MS_LOG(ERROR) << "cudaMemGetInfo failed, ret[" << static_cast(ret) << "], " << cudaGetErrorString(ret); return 0; } return free; } bool CudaDriver::CreateStream(DeviceStream *stream) { auto ret = cudaStreamCreateWithFlags(reinterpret_cast(stream), cudaStreamNonBlocking); if (ret != cudaSuccess) { MS_LOG(ERROR) << "cudaStreamCreate failed, ret[" << static_cast(ret) << "], " << cudaGetErrorString(ret); return false; } return true; } bool CudaDriver::DestroyStream(const DeviceStream &stream) { auto ret = cudaStreamDestroy((cudaStream_t)stream); if (ret != cudaSuccess) { MS_LOG(ERROR) << "cudaStreamDestroy failed, ret[" << static_cast(ret) << "], " << cudaGetErrorString(ret); return false; } return true; } bool CudaDriver::SyncStream(const DeviceStream &stream) { auto ret = cudaStreamSynchronize((cudaStream_t)stream); if (ret != cudaSuccess) { MS_LOG(ERROR) << "cudaStreamSynchronize failed, ret[" << static_cast(ret) << "], " << cudaGetErrorString(ret); return false; } return true; } int CudaDriver::device_count() { int dev_count; auto ret = cudaGetDeviceCount(&dev_count); if (ret != cudaSuccess) { MS_LOG(ERROR) << "cudaGetDeviceCount failed, ret[" << static_cast(ret) << "], " << cudaGetErrorString(ret); } return dev_count; } bool CudaDriver::set_current_device(int index) { auto ret = cudaSetDevice(index); if (ret != cudaSuccess) { MS_LOG(ERROR) << "cudaSetDevice failed, ret[" << static_cast(ret) << "], " << cudaGetErrorString(ret); return false; } return true; } } // namespace gpu } // namespace device } // namespace mindspore