You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

sgd.py 2.7 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354
  1. # Copyright 2020 Huawei Technologies Co., Ltd
  2. #
  3. # Licensed under the Apache License, Version 2.0 (the "License");
  4. # you may not use this file except in compliance with the License.
  5. # You may obtain a copy of the License at
  6. #
  7. # http://www.apache.org/licenses/LICENSE-2.0
  8. #
  9. # Unless required by applicable law or agreed to in writing, software
  10. # distributed under the License is distributed on an "AS IS" BASIS,
  11. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. # See the License for the specific language governing permissions and
  13. # limitations under the License.
  14. # ============================================================================
  15. """SGD op"""
  16. from mindspore.ops.op_info_register import op_info_register, TBERegOp, DataType
  17. sgd_op_info = TBERegOp("SGD") \
  18. .fusion_type("OPAQUE") \
  19. .async_flag(False) \
  20. .binfile_name("sgd.so") \
  21. .compute_cost(10) \
  22. .kernel_name("sgd") \
  23. .partial_flag(True) \
  24. .attr("dampening", "optional", "float", "all") \
  25. .attr("weight_decay", "optional", "float", "all") \
  26. .attr("nesterov", "optional", "bool", "all") \
  27. .input(0, "parameters", False, "required", "all") \
  28. .input(1, "gradient", False, "required", "all") \
  29. .input(2, "learning_rate", False, "required", "all") \
  30. .input(3, "accum", False, "required", "all") \
  31. .input(4, "momentum", False, "required", "all") \
  32. .input(5, "stat", False, "required", "all") \
  33. .output(0, "parameters", False, "required", "all") \
  34. .dtype_format(DataType.F16_5HD, DataType.F16_5HD, DataType.F16_Default, DataType.F16_5HD,
  35. DataType.F16_Default, DataType.F16_5HD, DataType.F16_5HD) \
  36. .dtype_format(DataType.F16_Default, DataType.F16_Default, DataType.F16_Default, DataType.F16_Default,
  37. DataType.F16_Default, DataType.F16_Default, DataType.F16_Default) \
  38. .dtype_format(DataType.F16_FracZ, DataType.F16_FracZ, DataType.F16_Default, DataType.F16_FracZ,
  39. DataType.F16_Default, DataType.F16_FracZ, DataType.F16_FracZ) \
  40. .dtype_format(DataType.F32_5HD, DataType.F32_5HD, DataType.F32_Default, DataType.F32_5HD,
  41. DataType.F32_Default, DataType.F32_5HD, DataType.F32_5HD) \
  42. .dtype_format(DataType.F32_Default, DataType.F32_Default, DataType.F32_Default, DataType.F32_Default,
  43. DataType.F32_Default, DataType.F32_Default, DataType.F32_Default) \
  44. .dtype_format(DataType.F32_FracZ, DataType.F32_FracZ, DataType.F32_Default, DataType.F32_FracZ,
  45. DataType.F32_Default, DataType.F32_FracZ, DataType.F32_FracZ) \
  46. .get_op_info()
  47. @op_info_register(sgd_op_info)
  48. def _sgd_tbe():
  49. """SGD TBE register"""
  50. return