You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

transforms.cc 29 kB

5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843
  1. /**
  2. * Copyright 2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include "minddata/dataset/include/transforms.h"
  17. #include "minddata/dataset/kernels/image/image_utils.h"
  18. #include "minddata/dataset/kernels/image/center_crop_op.h"
  19. #include "minddata/dataset/kernels/image/crop_op.h"
  20. #include "minddata/dataset/kernels/image/cut_out_op.h"
  21. #include "minddata/dataset/kernels/image/decode_op.h"
  22. #include "minddata/dataset/kernels/image/hwc_to_chw_op.h"
  23. #include "minddata/dataset/kernels/image/mixup_batch_op.h"
  24. #include "minddata/dataset/kernels/image/normalize_op.h"
  25. #include "minddata/dataset/kernels/data/one_hot_op.h"
  26. #include "minddata/dataset/kernels/image/pad_op.h"
  27. #include "minddata/dataset/kernels/image/random_affine_op.h"
  28. #include "minddata/dataset/kernels/image/random_color_op.h"
  29. #include "minddata/dataset/kernels/image/random_color_adjust_op.h"
  30. #include "minddata/dataset/kernels/image/random_crop_op.h"
  31. #include "minddata/dataset/kernels/image/random_horizontal_flip_op.h"
  32. #include "minddata/dataset/kernels/image/random_rotation_op.h"
  33. #include "minddata/dataset/kernels/image/random_sharpness_op.h"
  34. #include "minddata/dataset/kernels/image/random_solarize_op.h"
  35. #include "minddata/dataset/kernels/image/random_vertical_flip_op.h"
  36. #include "minddata/dataset/kernels/image/resize_op.h"
  37. #include "minddata/dataset/kernels/image/rgba_to_bgr_op.h"
  38. #include "minddata/dataset/kernels/image/rgba_to_rgb_op.h"
  39. #include "minddata/dataset/kernels/image/swap_red_blue_op.h"
  40. #include "minddata/dataset/kernels/image/uniform_aug_op.h"
  41. namespace mindspore {
  42. namespace dataset {
  43. namespace api {
  44. TensorOperation::TensorOperation() {}
  45. // Transform operations for computer vision.
  46. namespace vision {
  47. // Function to create CenterCropOperation.
  48. std::shared_ptr<CenterCropOperation> CenterCrop(std::vector<int32_t> size) {
  49. auto op = std::make_shared<CenterCropOperation>(size);
  50. // Input validation
  51. if (!op->ValidateParams()) {
  52. return nullptr;
  53. }
  54. return op;
  55. }
  56. // Function to create CropOperation.
  57. std::shared_ptr<CropOperation> Crop(std::vector<int32_t> coordinates, std::vector<int32_t> size) {
  58. auto op = std::make_shared<CropOperation>(coordinates, size);
  59. // Input validation
  60. if (!op->ValidateParams()) {
  61. return nullptr;
  62. }
  63. return op;
  64. }
  65. // Function to create CutOutOp.
  66. std::shared_ptr<CutOutOperation> CutOut(int32_t length, int32_t num_patches) {
  67. auto op = std::make_shared<CutOutOperation>(length, num_patches);
  68. // Input validation
  69. if (!op->ValidateParams()) {
  70. return nullptr;
  71. }
  72. return op;
  73. }
  74. // Function to create DecodeOperation.
  75. std::shared_ptr<DecodeOperation> Decode(bool rgb) {
  76. auto op = std::make_shared<DecodeOperation>(rgb);
  77. // Input validation
  78. if (!op->ValidateParams()) {
  79. return nullptr;
  80. }
  81. return op;
  82. }
  83. // Function to create HwcToChwOperation.
  84. std::shared_ptr<HwcToChwOperation> HWC2CHW() {
  85. auto op = std::make_shared<HwcToChwOperation>();
  86. // Input validation
  87. if (!op->ValidateParams()) {
  88. return nullptr;
  89. }
  90. return op;
  91. }
  92. // Function to create MixUpBatchOperation.
  93. std::shared_ptr<MixUpBatchOperation> MixUpBatch(float alpha) {
  94. auto op = std::make_shared<MixUpBatchOperation>(alpha);
  95. // Input validation
  96. if (!op->ValidateParams()) {
  97. return nullptr;
  98. }
  99. return op;
  100. }
  101. // Function to create NormalizeOperation.
  102. std::shared_ptr<NormalizeOperation> Normalize(std::vector<float> mean, std::vector<float> std) {
  103. auto op = std::make_shared<NormalizeOperation>(mean, std);
  104. // Input validation
  105. if (!op->ValidateParams()) {
  106. return nullptr;
  107. }
  108. return op;
  109. }
  110. // Function to create OneHotOperation.
  111. std::shared_ptr<OneHotOperation> OneHot(int32_t num_classes) {
  112. auto op = std::make_shared<OneHotOperation>(num_classes);
  113. // Input validation
  114. if (!op->ValidateParams()) {
  115. return nullptr;
  116. }
  117. return op;
  118. }
  119. // Function to create PadOperation.
  120. std::shared_ptr<PadOperation> Pad(std::vector<int32_t> padding, std::vector<uint8_t> fill_value,
  121. BorderType padding_mode) {
  122. auto op = std::make_shared<PadOperation>(padding, fill_value, padding_mode);
  123. // Input validation
  124. if (!op->ValidateParams()) {
  125. return nullptr;
  126. }
  127. return op;
  128. }
  129. // Function to create RandomColorOperation.
  130. std::shared_ptr<RandomColorOperation> RandomColor(float t_lb, float t_ub) {
  131. auto op = std::make_shared<RandomColorOperation>(t_lb, t_ub);
  132. // Input validation
  133. if (!op->ValidateParams()) {
  134. return nullptr;
  135. }
  136. return op;
  137. }
  138. std::shared_ptr<TensorOp> RandomColorOperation::Build() {
  139. std::shared_ptr<RandomColorOp> tensor_op = std::make_shared<RandomColorOp>(t_lb_, t_ub_);
  140. return tensor_op;
  141. }
  142. // Function to create RandomColorAdjustOperation.
  143. std::shared_ptr<RandomColorAdjustOperation> RandomColorAdjust(std::vector<float> brightness,
  144. std::vector<float> contrast,
  145. std::vector<float> saturation, std::vector<float> hue) {
  146. auto op = std::make_shared<RandomColorAdjustOperation>(brightness, contrast, saturation, hue);
  147. // Input validation
  148. if (!op->ValidateParams()) {
  149. return nullptr;
  150. }
  151. return op;
  152. }
  153. // Function to create RandomAffineOperation.
  154. std::shared_ptr<RandomAffineOperation> RandomAffine(const std::vector<float_t> &degrees,
  155. const std::vector<float_t> &translate_range,
  156. const std::vector<float_t> &scale_range,
  157. const std::vector<float_t> &shear_ranges,
  158. InterpolationMode interpolation,
  159. const std::vector<uint8_t> &fill_value) {
  160. auto op = std::make_shared<RandomAffineOperation>(degrees, translate_range, scale_range, shear_ranges, interpolation,
  161. fill_value);
  162. // Input validation
  163. if (!op->ValidateParams()) {
  164. return nullptr;
  165. }
  166. return op;
  167. }
  168. // Function to create RandomCropOperation.
  169. std::shared_ptr<RandomCropOperation> RandomCrop(std::vector<int32_t> size, std::vector<int32_t> padding,
  170. bool pad_if_needed, std::vector<uint8_t> fill_value,
  171. BorderType padding_mode) {
  172. auto op = std::make_shared<RandomCropOperation>(size, padding, pad_if_needed, fill_value, padding_mode);
  173. // Input validation
  174. if (!op->ValidateParams()) {
  175. return nullptr;
  176. }
  177. return op;
  178. }
  179. // Function to create RandomHorizontalFlipOperation.
  180. std::shared_ptr<RandomHorizontalFlipOperation> RandomHorizontalFlip(float prob) {
  181. auto op = std::make_shared<RandomHorizontalFlipOperation>(prob);
  182. // Input validation
  183. if (!op->ValidateParams()) {
  184. return nullptr;
  185. }
  186. return op;
  187. }
  188. // Function to create RandomRotationOperation.
  189. std::shared_ptr<RandomRotationOperation> RandomRotation(std::vector<float> degrees, InterpolationMode resample,
  190. bool expand, std::vector<float> center,
  191. std::vector<uint8_t> fill_value) {
  192. auto op = std::make_shared<RandomRotationOperation>(degrees, resample, expand, center, fill_value);
  193. // Input validation
  194. if (!op->ValidateParams()) {
  195. return nullptr;
  196. }
  197. return op;
  198. }
  199. // Function to create RandomSolarizeOperation.
  200. std::shared_ptr<RandomSolarizeOperation> RandomSolarize(uint8_t threshold_min, uint8_t threshold_max) {
  201. auto op = std::make_shared<RandomSolarizeOperation>(threshold_min, threshold_max);
  202. // Input validation
  203. if (!op->ValidateParams()) {
  204. return nullptr;
  205. }
  206. return op;
  207. }
  208. // Function to create RandomSharpnessOperation.
  209. std::shared_ptr<RandomSharpnessOperation> RandomSharpness(std::vector<float> degrees) {
  210. auto op = std::make_shared<RandomSharpnessOperation>(degrees);
  211. // Input validation
  212. if (!op->ValidateParams()) {
  213. return nullptr;
  214. }
  215. return op;
  216. }
  217. // Function to create RandomVerticalFlipOperation.
  218. std::shared_ptr<RandomVerticalFlipOperation> RandomVerticalFlip(float prob) {
  219. auto op = std::make_shared<RandomVerticalFlipOperation>(prob);
  220. // Input validation
  221. if (!op->ValidateParams()) {
  222. return nullptr;
  223. }
  224. return op;
  225. }
  226. // Function to create ResizeOperation.
  227. std::shared_ptr<ResizeOperation> Resize(std::vector<int32_t> size, InterpolationMode interpolation) {
  228. auto op = std::make_shared<ResizeOperation>(size, interpolation);
  229. // Input validation
  230. if (!op->ValidateParams()) {
  231. return nullptr;
  232. }
  233. return op;
  234. }
  235. // Function to create RgbaToBgrOperation.
  236. std::shared_ptr<RgbaToBgrOperation> RGBA2BGR() {
  237. auto op = std::make_shared<RgbaToBgrOperation>();
  238. // Input validation
  239. if (!op->ValidateParams()) {
  240. return nullptr;
  241. }
  242. return op;
  243. }
  244. // Function to create RgbaToRgbOperation.
  245. std::shared_ptr<RgbaToRgbOperation> RGBA2RGB() {
  246. auto op = std::make_shared<RgbaToRgbOperation>();
  247. // Input validation
  248. if (!op->ValidateParams()) {
  249. return nullptr;
  250. }
  251. return op;
  252. }
  253. // Function to create SwapRedBlueOperation.
  254. std::shared_ptr<SwapRedBlueOperation> SwapRedBlue() {
  255. auto op = std::make_shared<SwapRedBlueOperation>();
  256. // Input validation
  257. if (!op->ValidateParams()) {
  258. return nullptr;
  259. }
  260. return op;
  261. }
  262. // Function to create UniformAugOperation.
  263. std::shared_ptr<UniformAugOperation> UniformAugment(std::vector<std::shared_ptr<TensorOperation>> transforms,
  264. int32_t num_ops) {
  265. auto op = std::make_shared<UniformAugOperation>(transforms, num_ops);
  266. // Input validation
  267. if (!op->ValidateParams()) {
  268. return nullptr;
  269. }
  270. return op;
  271. }
  272. /* ####################################### Derived TensorOperation classes ################################# */
  273. // CenterCropOperation
  274. CenterCropOperation::CenterCropOperation(std::vector<int32_t> size) : size_(size) {}
  275. bool CenterCropOperation::ValidateParams() {
  276. if (size_.empty() || size_.size() > 2) {
  277. MS_LOG(ERROR) << "CenterCrop: size vector has incorrect size.";
  278. return false;
  279. }
  280. return true;
  281. }
  282. std::shared_ptr<TensorOp> CenterCropOperation::Build() {
  283. int32_t crop_height = size_[0];
  284. int32_t crop_width = 0;
  285. // User has specified crop_width.
  286. if (size_.size() == 2) {
  287. crop_width = size_[1];
  288. }
  289. std::shared_ptr<CenterCropOp> tensor_op = std::make_shared<CenterCropOp>(crop_height, crop_width);
  290. return tensor_op;
  291. }
  292. // CropOperation.
  293. CropOperation::CropOperation(std::vector<int32_t> coordinates, std::vector<int32_t> size)
  294. : coordinates_(coordinates), size_(size) {}
  295. bool CropOperation::ValidateParams() {
  296. // Do some input validation.
  297. if (coordinates_.empty() || coordinates_.size() > 2) {
  298. MS_LOG(ERROR) << "Crop: coordinates must be a vector of one or two values";
  299. return false;
  300. }
  301. if (size_.empty() || size_.size() > 2) {
  302. MS_LOG(ERROR) << "Crop: size must be a vector of one or two values";
  303. return false;
  304. }
  305. return true;
  306. }
  307. std::shared_ptr<TensorOp> CropOperation::Build() {
  308. int32_t x, y, height, width;
  309. x = coordinates_[0];
  310. y = coordinates_[1];
  311. height = size_[0];
  312. width = size_[1];
  313. std::shared_ptr<CropOp> tensor_op = std::make_shared<CropOp>(x, y, height, width);
  314. return tensor_op;
  315. }
  316. // CutOutOperation
  317. CutOutOperation::CutOutOperation(int32_t length, int32_t num_patches) : length_(length), num_patches_(num_patches) {}
  318. bool CutOutOperation::ValidateParams() {
  319. if (length_ < 0) {
  320. MS_LOG(ERROR) << "CutOut: length cannot be negative";
  321. return false;
  322. }
  323. if (num_patches_ < 0) {
  324. MS_LOG(ERROR) << "CutOut: number of patches cannot be negative";
  325. return false;
  326. }
  327. return true;
  328. }
  329. std::shared_ptr<TensorOp> CutOutOperation::Build() {
  330. std::shared_ptr<CutOutOp> tensor_op = std::make_shared<CutOutOp>(length_, length_, num_patches_, false, 0, 0, 0);
  331. return tensor_op;
  332. }
  333. // DecodeOperation
  334. DecodeOperation::DecodeOperation(bool rgb) : rgb_(rgb) {}
  335. bool DecodeOperation::ValidateParams() { return true; }
  336. std::shared_ptr<TensorOp> DecodeOperation::Build() { return std::make_shared<DecodeOp>(rgb_); }
  337. // HwcToChwOperation
  338. bool HwcToChwOperation::ValidateParams() { return true; }
  339. std::shared_ptr<TensorOp> HwcToChwOperation::Build() { return std::make_shared<HwcToChwOp>(); }
  340. // MixUpOperation
  341. MixUpBatchOperation::MixUpBatchOperation(float alpha) : alpha_(alpha) {}
  342. bool MixUpBatchOperation::ValidateParams() {
  343. if (alpha_ < 0) {
  344. MS_LOG(ERROR) << "MixUpBatch: alpha must be a positive floating value however it is: " << alpha_;
  345. return false;
  346. }
  347. return true;
  348. }
  349. std::shared_ptr<TensorOp> MixUpBatchOperation::Build() { return std::make_shared<MixUpBatchOp>(alpha_); }
  350. // NormalizeOperation
  351. NormalizeOperation::NormalizeOperation(std::vector<float> mean, std::vector<float> std) : mean_(mean), std_(std) {}
  352. bool NormalizeOperation::ValidateParams() {
  353. if (mean_.size() != 3) {
  354. MS_LOG(ERROR) << "Normalize: mean vector has incorrect size: " << mean_.size();
  355. return false;
  356. }
  357. if (std_.size() != 3) {
  358. MS_LOG(ERROR) << "Normalize: std vector has incorrect size: " << std_.size();
  359. return false;
  360. }
  361. return true;
  362. }
  363. std::shared_ptr<TensorOp> NormalizeOperation::Build() {
  364. return std::make_shared<NormalizeOp>(mean_[0], mean_[1], mean_[2], std_[0], std_[1], std_[2]);
  365. }
  366. // OneHotOperation
  367. OneHotOperation::OneHotOperation(int32_t num_classes) : num_classes_(num_classes) {}
  368. bool OneHotOperation::ValidateParams() {
  369. if (num_classes_ < 0) {
  370. MS_LOG(ERROR) << "OneHot: Number of classes cannot be negative. Number of classes: " << num_classes_;
  371. return false;
  372. }
  373. return true;
  374. }
  375. std::shared_ptr<TensorOp> OneHotOperation::Build() { return std::make_shared<OneHotOp>(num_classes_); }
  376. // PadOperation
  377. PadOperation::PadOperation(std::vector<int32_t> padding, std::vector<uint8_t> fill_value, BorderType padding_mode)
  378. : padding_(padding), fill_value_(fill_value), padding_mode_(padding_mode) {}
  379. bool PadOperation::ValidateParams() {
  380. if (padding_.empty() || padding_.size() == 3 || padding_.size() > 4) {
  381. MS_LOG(ERROR) << "Pad: padding vector has incorrect size: padding.size()";
  382. return false;
  383. }
  384. if (fill_value_.empty() || (fill_value_.size() != 1 && fill_value_.size() != 3)) {
  385. MS_LOG(ERROR) << "Pad: fill_value vector has incorrect size: fill_value.size()";
  386. return false;
  387. }
  388. return true;
  389. }
  390. std::shared_ptr<TensorOp> PadOperation::Build() {
  391. int32_t pad_top, pad_bottom, pad_left, pad_right;
  392. switch (padding_.size()) {
  393. case 1:
  394. pad_left = padding_[0];
  395. pad_top = padding_[0];
  396. pad_right = padding_[0];
  397. pad_bottom = padding_[0];
  398. break;
  399. case 2:
  400. pad_left = padding_[0];
  401. pad_top = padding_[1];
  402. pad_right = padding_[0];
  403. pad_bottom = padding_[1];
  404. break;
  405. default:
  406. pad_left = padding_[0];
  407. pad_top = padding_[1];
  408. pad_right = padding_[2];
  409. pad_bottom = padding_[3];
  410. }
  411. uint8_t fill_r, fill_g, fill_b;
  412. fill_r = fill_value_[0];
  413. fill_g = fill_value_[0];
  414. fill_b = fill_value_[0];
  415. if (fill_value_.size() == 3) {
  416. fill_r = fill_value_[0];
  417. fill_g = fill_value_[1];
  418. fill_b = fill_value_[2];
  419. }
  420. std::shared_ptr<PadOp> tensor_op =
  421. std::make_shared<PadOp>(pad_top, pad_bottom, pad_left, pad_right, padding_mode_, fill_r, fill_g, fill_b);
  422. return tensor_op;
  423. }
  424. // RandomColorOperation.
  425. RandomColorOperation::RandomColorOperation(float t_lb, float t_ub) : t_lb_(t_lb), t_ub_(t_ub) {}
  426. bool RandomColorOperation::ValidateParams() {
  427. // Do some input validation.
  428. if (t_lb_ > t_ub_) {
  429. MS_LOG(ERROR) << "RandomColor: lower bound must be less or equal to upper bound";
  430. return false;
  431. }
  432. return true;
  433. }
  434. // RandomColorAdjustOperation.
  435. RandomColorAdjustOperation::RandomColorAdjustOperation(std::vector<float> brightness, std::vector<float> contrast,
  436. std::vector<float> saturation, std::vector<float> hue)
  437. : brightness_(brightness), contrast_(contrast), saturation_(saturation), hue_(hue) {}
  438. bool RandomColorAdjustOperation::ValidateParams() {
  439. // Do some input validation.
  440. if (brightness_.empty() || brightness_.size() > 2) {
  441. MS_LOG(ERROR) << "RandomColorAdjust: brightness must be a vector of one or two values";
  442. return false;
  443. }
  444. if (contrast_.empty() || contrast_.size() > 2) {
  445. MS_LOG(ERROR) << "RandomColorAdjust: contrast must be a vector of one or two values";
  446. return false;
  447. }
  448. if (saturation_.empty() || saturation_.size() > 2) {
  449. MS_LOG(ERROR) << "RandomColorAdjust: saturation must be a vector of one or two values";
  450. return false;
  451. }
  452. if (hue_.empty() || hue_.size() > 2) {
  453. MS_LOG(ERROR) << "RandomColorAdjust: hue must be a vector of one or two values";
  454. return false;
  455. }
  456. return true;
  457. }
  458. std::shared_ptr<TensorOp> RandomColorAdjustOperation::Build() {
  459. float brightness_lb, brightness_ub, contrast_lb, contrast_ub, saturation_lb, saturation_ub, hue_lb, hue_ub;
  460. brightness_lb = brightness_[0];
  461. brightness_ub = brightness_[0];
  462. if (brightness_.size() == 2) brightness_ub = brightness_[1];
  463. contrast_lb = contrast_[0];
  464. contrast_ub = contrast_[0];
  465. if (contrast_.size() == 2) contrast_ub = contrast_[1];
  466. saturation_lb = saturation_[0];
  467. saturation_ub = saturation_[0];
  468. if (saturation_.size() == 2) saturation_ub = saturation_[1];
  469. hue_lb = hue_[0];
  470. hue_ub = hue_[0];
  471. if (hue_.size() == 2) hue_ub = hue_[1];
  472. std::shared_ptr<RandomColorAdjustOp> tensor_op = std::make_shared<RandomColorAdjustOp>(
  473. brightness_lb, brightness_ub, contrast_lb, contrast_ub, saturation_lb, saturation_ub, hue_lb, hue_ub);
  474. return tensor_op;
  475. }
  476. // RandomAffineOperation
  477. RandomAffineOperation::RandomAffineOperation(const std::vector<float_t> &degrees,
  478. const std::vector<float_t> &translate_range,
  479. const std::vector<float_t> &scale_range,
  480. const std::vector<float_t> &shear_ranges, InterpolationMode interpolation,
  481. const std::vector<uint8_t> &fill_value)
  482. : degrees_(degrees),
  483. translate_range_(translate_range),
  484. scale_range_(scale_range),
  485. shear_ranges_(shear_ranges),
  486. interpolation_(interpolation),
  487. fill_value_(fill_value) {}
  488. bool RandomAffineOperation::ValidateParams() {
  489. // Degrees
  490. if (degrees_.size() != 2) {
  491. MS_LOG(ERROR) << "RandomAffine: degrees vector has incorrect size: degrees.size() = " << degrees_.size();
  492. return false;
  493. }
  494. if (degrees_[0] > degrees_[1]) {
  495. MS_LOG(ERROR) << "RandomAffine: minimum of degrees range is greater than maximum: min = " << degrees_[0]
  496. << ", max = " << degrees_[1];
  497. return false;
  498. }
  499. // Translate
  500. if (translate_range_.size() != 2) {
  501. MS_LOG(ERROR) << "RandomAffine: translate_range vector has incorrect size: translate_range.size() = "
  502. << translate_range_.size();
  503. return false;
  504. }
  505. if (translate_range_[0] > translate_range_[1]) {
  506. MS_LOG(ERROR) << "RandomAffine: minimum of translate range is greater than maximum: min = " << translate_range_[0]
  507. << ", max = " << translate_range_[1];
  508. return false;
  509. }
  510. // Scale
  511. if (scale_range_.size() != 2) {
  512. MS_LOG(ERROR) << "RandomAffine: scale_range vector has incorrect size: scale_range.size() = "
  513. << scale_range_.size();
  514. return false;
  515. }
  516. if (scale_range_[0] > scale_range_[1]) {
  517. MS_LOG(ERROR) << "RandomAffine: minimum of scale range is greater than maximum: min = " << scale_range_[0]
  518. << ", max = " << scale_range_[1];
  519. return false;
  520. }
  521. // Shear
  522. if (shear_ranges_.size() != 4) {
  523. MS_LOG(ERROR) << "RandomAffine: shear_ranges vector has incorrect size: shear_ranges.size() = "
  524. << shear_ranges_.size();
  525. return false;
  526. }
  527. if (shear_ranges_[0] > shear_ranges_[1]) {
  528. MS_LOG(ERROR) << "RandomAffine: minimum of horizontal shear range is greater than maximum: min = "
  529. << shear_ranges_[0] << ", max = " << shear_ranges_[1];
  530. return false;
  531. }
  532. if (shear_ranges_[2] > shear_ranges_[3]) {
  533. MS_LOG(ERROR) << "RandomAffine: minimum of vertical shear range is greater than maximum: min = " << shear_ranges_[2]
  534. << ", max = " << scale_range_[3];
  535. return false;
  536. }
  537. // Fill Value
  538. if (fill_value_.size() != 3) {
  539. MS_LOG(ERROR) << "RandomAffine: fill_value vector has incorrect size: fill_value.size() = " << fill_value_.size();
  540. return false;
  541. }
  542. return true;
  543. }
  544. std::shared_ptr<TensorOp> RandomAffineOperation::Build() {
  545. auto tensor_op = std::make_shared<RandomAffineOp>(degrees_, translate_range_, scale_range_, shear_ranges_,
  546. interpolation_, fill_value_);
  547. return tensor_op;
  548. }
  549. // RandomCropOperation
  550. RandomCropOperation::RandomCropOperation(std::vector<int32_t> size, std::vector<int32_t> padding, bool pad_if_needed,
  551. std::vector<uint8_t> fill_value, BorderType padding_mode)
  552. : size_(size),
  553. padding_(padding),
  554. pad_if_needed_(pad_if_needed),
  555. fill_value_(fill_value),
  556. padding_mode_(padding_mode) {}
  557. bool RandomCropOperation::ValidateParams() {
  558. if (size_.empty() || size_.size() > 2) {
  559. MS_LOG(ERROR) << "RandomCrop: size vector has incorrect size: " << size_.size();
  560. return false;
  561. }
  562. if (padding_.empty() || padding_.size() != 4) {
  563. MS_LOG(ERROR) << "RandomCrop: padding vector has incorrect size: padding.size()";
  564. return false;
  565. }
  566. if (fill_value_.empty() || fill_value_.size() != 3) {
  567. MS_LOG(ERROR) << "RandomCrop: fill_value vector has incorrect size: fill_value.size()";
  568. return false;
  569. }
  570. return true;
  571. }
  572. std::shared_ptr<TensorOp> RandomCropOperation::Build() {
  573. int32_t crop_height = size_[0];
  574. int32_t crop_width = 0;
  575. int32_t pad_top = padding_[0];
  576. int32_t pad_bottom = padding_[1];
  577. int32_t pad_left = padding_[2];
  578. int32_t pad_right = padding_[3];
  579. uint8_t fill_r = fill_value_[0];
  580. uint8_t fill_g = fill_value_[1];
  581. uint8_t fill_b = fill_value_[2];
  582. // User has specified the crop_width value.
  583. if (size_.size() == 2) {
  584. crop_width = size_[1];
  585. }
  586. auto tensor_op = std::make_shared<RandomCropOp>(crop_height, crop_width, pad_top, pad_bottom, pad_left, pad_right,
  587. padding_mode_, pad_if_needed_, fill_r, fill_g, fill_b);
  588. return tensor_op;
  589. }
  590. // RandomHorizontalFlipOperation
  591. RandomHorizontalFlipOperation::RandomHorizontalFlipOperation(float probability) : probability_(probability) {}
  592. bool RandomHorizontalFlipOperation::ValidateParams() { return true; }
  593. std::shared_ptr<TensorOp> RandomHorizontalFlipOperation::Build() {
  594. std::shared_ptr<RandomHorizontalFlipOp> tensor_op = std::make_shared<RandomHorizontalFlipOp>(probability_);
  595. return tensor_op;
  596. }
  597. // Function to create RandomRotationOperation.
  598. RandomRotationOperation::RandomRotationOperation(std::vector<float> degrees, InterpolationMode interpolation_mode,
  599. bool expand, std::vector<float> center,
  600. std::vector<uint8_t> fill_value)
  601. : degrees_(degrees),
  602. interpolation_mode_(interpolation_mode),
  603. expand_(expand),
  604. center_(center),
  605. fill_value_(fill_value) {}
  606. bool RandomRotationOperation::ValidateParams() {
  607. if (degrees_.empty() || degrees_.size() != 2) {
  608. MS_LOG(ERROR) << "RandomRotation: degrees vector has incorrect size: degrees.size()";
  609. return false;
  610. }
  611. if (center_.empty() || center_.size() != 2) {
  612. MS_LOG(ERROR) << "RandomRotation: center vector has incorrect size: center.size()";
  613. return false;
  614. }
  615. if (fill_value_.empty() || fill_value_.size() != 3) {
  616. MS_LOG(ERROR) << "RandomRotation: fill_value vector has incorrect size: fill_value.size()";
  617. return false;
  618. }
  619. return true;
  620. }
  621. std::shared_ptr<TensorOp> RandomRotationOperation::Build() {
  622. std::shared_ptr<RandomRotationOp> tensor_op =
  623. std::make_shared<RandomRotationOp>(degrees_[0], degrees_[1], center_[0], center_[1], interpolation_mode_, expand_,
  624. fill_value_[0], fill_value_[1], fill_value_[2]);
  625. return tensor_op;
  626. }
  627. // Function to create RandomSharpness.
  628. RandomSharpnessOperation::RandomSharpnessOperation(std::vector<float> degrees) : degrees_(degrees) {}
  629. bool RandomSharpnessOperation::ValidateParams() {
  630. if (degrees_.empty() || degrees_.size() != 2) {
  631. MS_LOG(ERROR) << "RandomSharpness: degrees vector has incorrect size: degrees.size()";
  632. return false;
  633. }
  634. return true;
  635. }
  636. std::shared_ptr<TensorOp> RandomSharpnessOperation::Build() {
  637. std::shared_ptr<RandomSharpnessOp> tensor_op = std::make_shared<RandomSharpnessOp>(degrees_[0], degrees_[1]);
  638. return tensor_op;
  639. }
  640. // RandomSolarizeOperation.
  641. RandomSolarizeOperation::RandomSolarizeOperation(uint8_t threshold_min, uint8_t threshold_max)
  642. : threshold_min_(threshold_min), threshold_max_(threshold_max) {}
  643. bool RandomSolarizeOperation::ValidateParams() {
  644. if (threshold_max_ < threshold_min_) {
  645. MS_LOG(ERROR) << "RandomSolarize: threshold_max must be greater or equal to threshold_min";
  646. return false;
  647. }
  648. return true;
  649. }
  650. std::shared_ptr<TensorOp> RandomSolarizeOperation::Build() {
  651. std::shared_ptr<RandomSolarizeOp> tensor_op = std::make_shared<RandomSolarizeOp>(threshold_min_, threshold_max_);
  652. return tensor_op;
  653. }
  654. // RandomVerticalFlipOperation
  655. RandomVerticalFlipOperation::RandomVerticalFlipOperation(float probability) : probability_(probability) {}
  656. bool RandomVerticalFlipOperation::ValidateParams() { return true; }
  657. std::shared_ptr<TensorOp> RandomVerticalFlipOperation::Build() {
  658. std::shared_ptr<RandomVerticalFlipOp> tensor_op = std::make_shared<RandomVerticalFlipOp>(probability_);
  659. return tensor_op;
  660. }
  661. // ResizeOperation
  662. ResizeOperation::ResizeOperation(std::vector<int32_t> size, InterpolationMode interpolation)
  663. : size_(size), interpolation_(interpolation) {}
  664. bool ResizeOperation::ValidateParams() {
  665. if (size_.empty() || size_.size() > 2) {
  666. MS_LOG(ERROR) << "Resize: size vector has incorrect size: " << size_.size();
  667. return false;
  668. }
  669. return true;
  670. }
  671. std::shared_ptr<TensorOp> ResizeOperation::Build() {
  672. int32_t height = size_[0];
  673. int32_t width = 0;
  674. // User specified the width value.
  675. if (size_.size() == 2) {
  676. width = size_[1];
  677. }
  678. return std::make_shared<ResizeOp>(height, width, interpolation_);
  679. }
  680. // RgbaToBgrOperation.
  681. RgbaToBgrOperation::RgbaToBgrOperation() {}
  682. bool RgbaToBgrOperation::ValidateParams() { return true; }
  683. std::shared_ptr<TensorOp> RgbaToBgrOperation::Build() {
  684. std::shared_ptr<RgbaToBgrOp> tensor_op = std::make_shared<RgbaToBgrOp>();
  685. return tensor_op;
  686. }
  687. // RgbaToRgbOperation.
  688. RgbaToRgbOperation::RgbaToRgbOperation() {}
  689. bool RgbaToRgbOperation::ValidateParams() { return true; }
  690. std::shared_ptr<TensorOp> RgbaToRgbOperation::Build() {
  691. std::shared_ptr<RgbaToRgbOp> tensor_op = std::make_shared<RgbaToRgbOp>();
  692. return tensor_op;
  693. }
  694. // SwapRedBlueOperation.
  695. SwapRedBlueOperation::SwapRedBlueOperation() {}
  696. bool SwapRedBlueOperation::ValidateParams() { return true; }
  697. std::shared_ptr<TensorOp> SwapRedBlueOperation::Build() {
  698. std::shared_ptr<SwapRedBlueOp> tensor_op = std::make_shared<SwapRedBlueOp>();
  699. return tensor_op;
  700. }
  701. // UniformAugOperation
  702. UniformAugOperation::UniformAugOperation(std::vector<std::shared_ptr<TensorOperation>> transforms, int32_t num_ops)
  703. : transforms_(transforms), num_ops_(num_ops) {}
  704. bool UniformAugOperation::ValidateParams() { return true; }
  705. std::shared_ptr<TensorOp> UniformAugOperation::Build() {
  706. std::vector<std::shared_ptr<TensorOp>> tensor_ops;
  707. (void)std::transform(transforms_.begin(), transforms_.end(), std::back_inserter(tensor_ops),
  708. [](std::shared_ptr<TensorOperation> op) -> std::shared_ptr<TensorOp> { return op->Build(); });
  709. std::shared_ptr<UniformAugOp> tensor_op = std::make_shared<UniformAugOp>(tensor_ops, num_ops_);
  710. return tensor_op;
  711. }
  712. } // namespace vision
  713. } // namespace api
  714. } // namespace dataset
  715. } // namespace mindspore