You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

api_cache.h 3.4 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109
  1. /**
  2. * \file dnn/src/cuda/api_cache.h
  3. * MegEngine is Licensed under the Apache License, Version 2.0 (the "License")
  4. *
  5. * Copyright (c) 2014-2021 Megvii Inc. All rights reserved.
  6. *
  7. * Unless required by applicable law or agreed to in writing,
  8. * software distributed under the License is distributed on an
  9. * "AS IS" BASIS, WITHOUT ARRANTIES OR CONDITIONS OF ANY KIND, either express or
  10. * implied.
  11. */
  12. #pragma once
  13. #include "src/common/api_cache.h"
  14. #include "src/cuda/cudnn_wrapper.h"
  15. namespace megdnn {
  16. class CudnnConvDescParam {
  17. public:
  18. cudnnConvolutionDescriptor_t value;
  19. Empty serialize(StringSerializer& ser, Empty) {
  20. constexpr int maxNbDims = CUDNN_DIM_MAX - 2;
  21. int nbDims = maxNbDims;
  22. int padA[maxNbDims];
  23. int strideA[maxNbDims];
  24. int dilationA[maxNbDims];
  25. cudnnConvolutionMode_t mode;
  26. cudnnDataType_t computeType;
  27. cudnnGetConvolutionNdDescriptor(value, maxNbDims, &nbDims, padA,
  28. strideA, dilationA, &mode,
  29. &computeType);
  30. ser.write_plain(nbDims);
  31. for (int i = 0; i < nbDims; ++i) {
  32. ser.write_plain(padA[i]);
  33. ser.write_plain(strideA[i]);
  34. ser.write_plain(dilationA[i]);
  35. }
  36. ser.write_plain(mode);
  37. ser.write_plain(computeType);
  38. return Empty{};
  39. }
  40. };
  41. class CudnnTensorDescParam {
  42. public:
  43. cudnnTensorDescriptor_t value;
  44. Empty serialize(StringSerializer& ser, Empty) {
  45. int nbDims = MEGDNN_MAX_NDIM;
  46. cudnnDataType_t dataType;
  47. int dimA[MEGDNN_MAX_NDIM];
  48. int strideA[MEGDNN_MAX_NDIM];
  49. cudnnGetTensorNdDescriptor(value, MEGDNN_MAX_NDIM, &dataType, &nbDims,
  50. dimA, strideA);
  51. ser.write_plain(nbDims);
  52. for (int i = 0; i < nbDims; ++i) {
  53. ser.write_plain(dimA[i]);
  54. ser.write_plain(strideA[i]);
  55. }
  56. ser.write_plain(dataType);
  57. return Empty{};
  58. }
  59. };
  60. class CudnnFilterDescParam {
  61. public:
  62. cudnnFilterDescriptor_t value;
  63. Empty serialize(StringSerializer& ser, Empty) {
  64. int nbDims = MEGDNN_MAX_NDIM;
  65. cudnnDataType_t dataType;
  66. cudnnTensorFormat_t format;
  67. int filterDimA[MEGDNN_MAX_NDIM];
  68. cudnnGetFilterNdDescriptor(value, nbDims, &dataType, &format, &nbDims,
  69. filterDimA);
  70. ser.write_plain(nbDims);
  71. for (int i = 0; i < nbDims; ++i) {
  72. ser.write_plain(filterDimA[i]);
  73. }
  74. ser.write_plain(dataType);
  75. ser.write_plain(format);
  76. return Empty{};
  77. }
  78. };
  79. template <typename T>
  80. class CudnnConvAlgoPerfParam {
  81. public:
  82. T value;
  83. Empty serialize(StringSerializer& ser, Empty) {
  84. ser.write_plain(value.algo);
  85. ser.write_plain(value.status);
  86. ser.write_plain(value.time);
  87. ser.write_plain(value.memory);
  88. ser.write_plain(value.determinism);
  89. ser.write_plain(value.mathType);
  90. return Empty{};
  91. }
  92. Empty deserialize(StringSerializer& ser, Empty) {
  93. ser.read_plain(&value.algo);
  94. ser.read_plain(&value.status);
  95. ser.read_plain(&value.time);
  96. ser.read_plain(&value.memory);
  97. ser.read_plain(&value.determinism);
  98. ser.read_plain(&value.mathType);
  99. return Empty{};
  100. }
  101. };
  102. } // namespace megdnn

MegEngine 安装包中集成了使用 GPU 运行代码所需的 CUDA 环境,不用区分 CPU 和 GPU 版。 如果想要运行 GPU 程序,请确保机器本身配有 GPU 硬件设备并安装好驱动。 如果你想体验在云端 GPU 算力平台进行深度学习开发的感觉,欢迎访问 MegStudio 平台