|
- /**
- * Copyright 2020-2021 Huawei Technologies Co., Ltd
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- * http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
- #include "minddata/dataset/include/vision.h"
- #ifdef ENABLE_ACL
- #include "minddata/dataset/include/vision_ascend.h"
- #include "minddata/dataset/kernels/ir/vision/ascend_vision_ir.h"
- #endif
-
- #include "minddata/dataset/include/transforms.h"
- #include "minddata/dataset/kernels/ir/vision/vision_ir.h"
-
- #ifndef ENABLE_ANDROID
- #include "utils/log_adapter.h"
- #else
- #include "mindspore/lite/src/common/log_adapter.h"
- #endif
- #include "minddata/dataset/kernels/ir/validators.h"
-
- // Kernel image headers (in alphabetical order)
-
- namespace mindspore {
- namespace dataset {
-
- // Transform operations for computer vision.
- namespace vision {
- // CONSTRUCTORS FOR API CLASSES TO CREATE VISION TENSOR TRANSFORM OPERATIONS
- // (In alphabetical order)
-
- // Affine Transform Operation.
- struct Affine::Data {
- Data(float_t degrees, const std::vector<float> &translation, float scale, const std::vector<float> &shear,
- InterpolationMode interpolation, const std::vector<uint8_t> &fill_value)
- : degrees_(degrees),
- translation_(translation),
- scale_(scale),
- shear_(shear),
- interpolation_(interpolation),
- fill_value_(fill_value) {}
- float degrees_;
- std::vector<float> translation_;
- float scale_;
- std::vector<float> shear_;
- InterpolationMode interpolation_;
- std::vector<uint8_t> fill_value_;
- };
-
- Affine::Affine(float_t degrees, const std::vector<float> &translation, float scale, const std::vector<float> &shear,
- InterpolationMode interpolation, const std::vector<uint8_t> &fill_value)
- : data_(std::make_shared<Data>(degrees, translation, scale, shear, interpolation, fill_value)) {}
-
- std::shared_ptr<TensorOperation> Affine::Parse() {
- return std::make_shared<AffineOperation>(data_->degrees_, data_->translation_, data_->scale_, data_->shear_,
- data_->interpolation_, data_->fill_value_);
- }
-
- #ifndef ENABLE_ANDROID
- // AutoContrast Transform Operation.
- struct AutoContrast::Data {
- Data(float cutoff, const std::vector<uint32_t> &ignore) : cutoff_(cutoff), ignore_(ignore) {}
- float cutoff_;
- std::vector<uint32_t> ignore_;
- };
-
- AutoContrast::AutoContrast(float cutoff, std::vector<uint32_t> ignore)
- : data_(std::make_shared<Data>(cutoff, ignore)) {}
-
- std::shared_ptr<TensorOperation> AutoContrast::Parse() {
- return std::make_shared<AutoContrastOperation>(data_->cutoff_, data_->ignore_);
- }
-
- // BoundingBoxAugment Transform Operation.
- struct BoundingBoxAugment::Data {
- std::shared_ptr<TensorOperation> transform_;
- float ratio_;
- };
-
- BoundingBoxAugment::BoundingBoxAugment(TensorTransform *transform, float ratio) : data_(std::make_shared<Data>()) {
- data_->transform_ = transform ? transform->Parse() : nullptr;
- data_->ratio_ = ratio;
- }
-
- BoundingBoxAugment::BoundingBoxAugment(const std::shared_ptr<TensorTransform> &transform, float ratio)
- : data_(std::make_shared<Data>()) {
- data_->transform_ = transform ? transform->Parse() : nullptr;
- data_->ratio_ = ratio;
- }
-
- BoundingBoxAugment::BoundingBoxAugment(const std::reference_wrapper<TensorTransform> transform, float ratio)
- : data_(std::make_shared<Data>()) {
- data_->transform_ = transform.get().Parse();
- data_->ratio_ = ratio;
- }
-
- std::shared_ptr<TensorOperation> BoundingBoxAugment::Parse() {
- return std::make_shared<BoundingBoxAugmentOperation>(data_->transform_, data_->ratio_);
- }
- #endif // not ENABLE_ANDROID
-
- // CenterCrop Transform Operation.
- struct CenterCrop::Data {
- explicit Data(const std::vector<int32_t> &size) : size_(size) {}
- std::vector<int32_t> size_;
- };
-
- CenterCrop::CenterCrop(std::vector<int32_t> size) : data_(std::make_shared<Data>(size)) {}
-
- std::shared_ptr<TensorOperation> CenterCrop::Parse() { return std::make_shared<CenterCropOperation>(data_->size_); }
-
- std::shared_ptr<TensorOperation> CenterCrop::Parse(const MapTargetDevice &env) {
- if (env == MapTargetDevice::kAscend310) {
- #ifdef ENABLE_ACL
- std::vector<uint32_t> usize_;
- usize_.reserve(data_->size_.size());
- std::transform(data_->size_.begin(), data_->size_.end(), std::back_inserter(usize_),
- [](int32_t i) { return (uint32_t)i; });
- return std::make_shared<DvppCropJpegOperation>(usize_);
- #endif // ENABLE_ACL
- }
- return std::make_shared<CenterCropOperation>(data_->size_);
- }
-
- // RGB2GRAY Transform Operation.
- std::shared_ptr<TensorOperation> RGB2GRAY::Parse() { return std::make_shared<RgbToGrayOperation>(); }
-
- // Crop Transform Operation.
- struct Crop::Data {
- Data(const std::vector<int32_t> &coordinates, const std::vector<int32_t> &size)
- : coordinates_(coordinates), size_(size) {}
- std::vector<int32_t> coordinates_;
- std::vector<int32_t> size_;
- };
-
- Crop::Crop(std::vector<int32_t> coordinates, std::vector<int32_t> size)
- : data_(std::make_shared<Data>(coordinates, size)) {}
-
- std::shared_ptr<TensorOperation> Crop::Parse() {
- return std::make_shared<CropOperation>(data_->coordinates_, data_->size_);
- }
-
- #ifndef ENABLE_ANDROID
- // CutMixBatch Transform Operation.
- struct CutMixBatch::Data {
- Data(ImageBatchFormat image_batch_format, float alpha, float prob)
- : image_batch_format_(image_batch_format), alpha_(alpha), prob_(prob) {}
- float alpha_;
- float prob_;
- ImageBatchFormat image_batch_format_;
- };
-
- CutMixBatch::CutMixBatch(ImageBatchFormat image_batch_format, float alpha, float prob)
- : data_(std::make_shared<Data>(image_batch_format, alpha, prob)) {}
-
- std::shared_ptr<TensorOperation> CutMixBatch::Parse() {
- return std::make_shared<CutMixBatchOperation>(data_->image_batch_format_, data_->alpha_, data_->prob_);
- }
-
- // CutOutOp.
- struct CutOut::Data {
- Data(int32_t length, int32_t num_patches) : length_(length), num_patches_(num_patches) {}
- int32_t length_;
- int32_t num_patches_;
- };
-
- CutOut::CutOut(int32_t length, int32_t num_patches) : data_(std::make_shared<Data>(length, num_patches)) {}
-
- std::shared_ptr<TensorOperation> CutOut::Parse() {
- return std::make_shared<CutOutOperation>(data_->length_, data_->num_patches_);
- }
- #endif // not ENABLE_ANDROID
-
- // Decode Transform Operation.
- struct Decode::Data {
- explicit Data(bool rgb) : rgb_(rgb) {}
- bool rgb_;
- };
-
- Decode::Decode(bool rgb) : data_(std::make_shared<Data>(rgb)) {}
-
- std::shared_ptr<TensorOperation> Decode::Parse() { return std::make_shared<DecodeOperation>(data_->rgb_); }
-
- std::shared_ptr<TensorOperation> Decode::Parse(const MapTargetDevice &env) {
- if (env == MapTargetDevice::kAscend310) {
- #ifdef ENABLE_ACL
- return std::make_shared<DvppDecodeJpegOperation>();
- #endif // ENABLE_ACL
- }
- return std::make_shared<DecodeOperation>(data_->rgb_);
- }
-
- #ifdef ENABLE_ACL
- // DvppDecodeResize Transform Operation.
- struct DvppDecodeResizeJpeg::Data {
- explicit Data(const std::vector<uint32_t> &resize) : resize_(resize) {}
- std::vector<uint32_t> resize_;
- };
-
- DvppDecodeResizeJpeg::DvppDecodeResizeJpeg(std::vector<uint32_t> resize) : data_(std::make_shared<Data>(resize)) {}
-
- std::shared_ptr<TensorOperation> DvppDecodeResizeJpeg::Parse() {
- return std::make_shared<DvppDecodeResizeOperation>(data_->resize_);
- }
-
- std::shared_ptr<TensorOperation> DvppDecodeResizeJpeg::Parse(const MapTargetDevice &env) {
- return std::make_shared<DvppDecodeResizeOperation>(data_->resize_);
- }
-
- // DvppDecodeResizeCrop Transform Operation.
- struct DvppDecodeResizeCropJpeg::Data {
- Data(const std::vector<uint32_t> &crop, const std::vector<uint32_t> &resize) : crop_(crop), resize_(resize) {}
- std::vector<uint32_t> crop_;
- std::vector<uint32_t> resize_;
- };
-
- DvppDecodeResizeCropJpeg::DvppDecodeResizeCropJpeg(std::vector<uint32_t> crop, std::vector<uint32_t> resize)
- : data_(std::make_shared<Data>(crop, resize)) {}
-
- std::shared_ptr<TensorOperation> DvppDecodeResizeCropJpeg::Parse() {
- return std::make_shared<DvppDecodeResizeCropOperation>(data_->crop_, data_->resize_);
- }
-
- std::shared_ptr<TensorOperation> DvppDecodeResizeCropJpeg::Parse(const MapTargetDevice &env) {
- return std::make_shared<DvppDecodeResizeCropOperation>(data_->crop_, data_->resize_);
- }
-
- // DvppDecodePng Transform Operation.
- DvppDecodePng::DvppDecodePng() {}
-
- std::shared_ptr<TensorOperation> DvppDecodePng::Parse() { return std::make_shared<DvppDecodePngOperation>(); }
-
- std::shared_ptr<TensorOperation> DvppDecodePng::Parse(const MapTargetDevice &env) {
- return std::make_shared<DvppDecodePngOperation>();
- }
- #endif // ENABLE_ACL
-
- #ifndef ENABLE_ANDROID
- // Equalize Transform Operation.
- Equalize::Equalize() {}
-
- std::shared_ptr<TensorOperation> Equalize::Parse() { return std::make_shared<EqualizeOperation>(); }
- // HwcToChw Transform Operation.
- HWC2CHW::HWC2CHW() {}
-
- std::shared_ptr<TensorOperation> HWC2CHW::Parse() { return std::make_shared<HwcToChwOperation>(); }
-
- // Invert Transform Operation.
- Invert::Invert() {}
-
- std::shared_ptr<TensorOperation> Invert::Parse() { return std::make_shared<InvertOperation>(); }
-
- // MixUpBatch Transform Operation.
- struct MixUpBatch::Data {
- explicit Data(float alpha) : alpha_(alpha) {}
- float alpha_;
- };
-
- MixUpBatch::MixUpBatch(float alpha) : data_(std::make_shared<Data>(alpha)) {}
-
- std::shared_ptr<TensorOperation> MixUpBatch::Parse() { return std::make_shared<MixUpBatchOperation>(data_->alpha_); }
- #endif // not ENABLE_ANDROID
-
- // Normalize Transform Operation.
- struct Normalize::Data {
- Data(const std::vector<float> &mean, const std::vector<float> &std) : mean_(mean), std_(std) {}
- std::vector<float> mean_;
- std::vector<float> std_;
- };
-
- Normalize::Normalize(std::vector<float> mean, std::vector<float> std) : data_(std::make_shared<Data>(mean, std)) {}
-
- std::shared_ptr<TensorOperation> Normalize::Parse() {
- return std::make_shared<NormalizeOperation>(data_->mean_, data_->std_);
- }
-
- std::shared_ptr<TensorOperation> Normalize::Parse(const MapTargetDevice &env) {
- if (env == MapTargetDevice::kAscend310) {
- #ifdef ENABLE_ACL
- return std::make_shared<DvppNormalizeOperation>(data_->mean_, data_->std_);
- #endif // ENABLE_ACL
- }
- return std::make_shared<NormalizeOperation>(data_->mean_, data_->std_);
- }
-
- #ifndef ENABLE_ANDROID
- // NormalizePad Transform Operation.
- struct NormalizePad::Data {
- Data(const std::vector<float> &mean, const std::vector<float> &std, const std::string &dtype)
- : mean_(mean), std_(std), dtype_(dtype) {}
- std::vector<float> mean_;
- std::vector<float> std_;
- std::string dtype_;
- };
-
- NormalizePad::NormalizePad(const std::vector<float> &mean, const std::vector<float> &std,
- const std::vector<char> &dtype)
- : data_(std::make_shared<Data>(mean, std, CharToString(dtype))) {}
-
- std::shared_ptr<TensorOperation> NormalizePad::Parse() {
- return std::make_shared<NormalizePadOperation>(data_->mean_, data_->std_, data_->dtype_);
- }
-
- // Pad Transform Operation.
- struct Pad::Data {
- Data(const std::vector<int32_t> &padding, const std::vector<uint8_t> &fill_value, BorderType padding_mode)
- : padding_(padding), fill_value_(fill_value), padding_mode_(padding_mode) {}
- std::vector<int32_t> padding_;
- std::vector<uint8_t> fill_value_;
- BorderType padding_mode_;
- };
-
- Pad::Pad(std::vector<int32_t> padding, std::vector<uint8_t> fill_value, BorderType padding_mode)
- : data_(std::make_shared<Data>(padding, fill_value, padding_mode)) {}
-
- std::shared_ptr<TensorOperation> Pad::Parse() {
- return std::make_shared<PadOperation>(data_->padding_, data_->fill_value_, data_->padding_mode_);
- }
- #endif // not ENABLE_ANDROID
-
- // RandomAffine Transform Operation.
- struct RandomAffine::Data {
- Data(const std::vector<float_t> °rees, const std::vector<float_t> &translate_range,
- const std::vector<float_t> &scale_range, const std::vector<float_t> &shear_ranges,
- InterpolationMode interpolation, const std::vector<uint8_t> &fill_value)
- : degrees_(degrees),
- translate_range_(translate_range),
- scale_range_(scale_range),
- shear_ranges_(shear_ranges),
- interpolation_(interpolation),
- fill_value_(fill_value) {}
- std::vector<float_t> degrees_; // min_degree, max_degree
- std::vector<float_t> translate_range_; // maximum x translation percentage, maximum y translation percentage
- std::vector<float_t> scale_range_; // min_scale, max_scale
- std::vector<float_t> shear_ranges_; // min_x_shear, max_x_shear, min_y_shear, max_y_shear
- InterpolationMode interpolation_;
- std::vector<uint8_t> fill_value_;
- };
-
- RandomAffine::RandomAffine(const std::vector<float_t> °rees, const std::vector<float_t> &translate_range,
- const std::vector<float_t> &scale_range, const std::vector<float_t> &shear_ranges,
- InterpolationMode interpolation, const std::vector<uint8_t> &fill_value)
- : data_(std::make_shared<Data>(degrees, translate_range, scale_range, shear_ranges, interpolation, fill_value)) {}
-
- std::shared_ptr<TensorOperation> RandomAffine::Parse() {
- return std::make_shared<RandomAffineOperation>(data_->degrees_, data_->translate_range_, data_->scale_range_,
- data_->shear_ranges_, data_->interpolation_, data_->fill_value_);
- }
-
- #ifndef ENABLE_ANDROID
- // RandomColor Transform Operation.
- struct RandomColor::Data {
- Data(float t_lb, float t_ub) : t_lb_(t_lb), t_ub_(t_ub) {}
- float t_lb_;
- float t_ub_;
- };
-
- RandomColor::RandomColor(float t_lb, float t_ub) : data_(std::make_shared<Data>(t_lb, t_ub)) {}
-
- std::shared_ptr<TensorOperation> RandomColor::Parse() {
- return std::make_shared<RandomColorOperation>(data_->t_lb_, data_->t_ub_);
- }
-
- // RandomColorAdjust Transform Operation.
- struct RandomColorAdjust::Data {
- Data(const std::vector<float> &brightness, const std::vector<float> &contrast, const std::vector<float> &saturation,
- const std::vector<float> &hue)
- : brightness_(brightness), contrast_(contrast), saturation_(saturation), hue_(hue) {}
- std::vector<float> brightness_;
- std::vector<float> contrast_;
- std::vector<float> saturation_;
- std::vector<float> hue_;
- };
-
- RandomColorAdjust::RandomColorAdjust(std::vector<float> brightness, std::vector<float> contrast,
- std::vector<float> saturation, std::vector<float> hue)
- : data_(std::make_shared<Data>(brightness, contrast, saturation, hue)) {}
-
- std::shared_ptr<TensorOperation> RandomColorAdjust::Parse() {
- return std::make_shared<RandomColorAdjustOperation>(data_->brightness_, data_->contrast_, data_->saturation_,
- data_->hue_);
- }
-
- // RandomCrop Transform Operation.
- struct RandomCrop::Data {
- Data(const std::vector<int32_t> &size, const std::vector<int32_t> &padding, bool pad_if_needed,
- const std::vector<uint8_t> &fill_value, BorderType padding_mode)
- : size_(size),
- padding_(padding),
- pad_if_needed_(pad_if_needed),
- fill_value_(fill_value),
- padding_mode_(padding_mode) {}
- std::vector<int32_t> size_;
- std::vector<int32_t> padding_;
- bool pad_if_needed_;
- std::vector<uint8_t> fill_value_;
- BorderType padding_mode_;
- };
-
- RandomCrop::RandomCrop(std::vector<int32_t> size, std::vector<int32_t> padding, bool pad_if_needed,
- std::vector<uint8_t> fill_value, BorderType padding_mode)
- : data_(std::make_shared<Data>(size, padding, pad_if_needed, fill_value, padding_mode)) {}
-
- std::shared_ptr<TensorOperation> RandomCrop::Parse() {
- return std::make_shared<RandomCropOperation>(data_->size_, data_->padding_, data_->pad_if_needed_, data_->fill_value_,
- data_->padding_mode_);
- }
-
- // RandomCropDecodeResize Transform Operation.
- struct RandomCropDecodeResize::Data {
- Data(const std::vector<int32_t> &size, const std::vector<float> &scale, const std::vector<float> &ratio,
- InterpolationMode interpolation, int32_t max_attempts)
- : size_(size), scale_(scale), ratio_(ratio), interpolation_(interpolation), max_attempts_(max_attempts) {}
- std::vector<int32_t> size_;
- std::vector<float> scale_;
- std::vector<float> ratio_;
- InterpolationMode interpolation_;
- int32_t max_attempts_;
- };
-
- RandomCropDecodeResize::RandomCropDecodeResize(std::vector<int32_t> size, std::vector<float> scale,
- std::vector<float> ratio, InterpolationMode interpolation,
- int32_t max_attempts)
- : data_(std::make_shared<Data>(size, scale, ratio, interpolation, max_attempts)) {}
-
- std::shared_ptr<TensorOperation> RandomCropDecodeResize::Parse() {
- return std::make_shared<RandomCropDecodeResizeOperation>(data_->size_, data_->scale_, data_->ratio_,
- data_->interpolation_, data_->max_attempts_);
- }
-
- // RandomCropWithBBox Transform Operation.
- struct RandomCropWithBBox::Data {
- Data(const std::vector<int32_t> &size, const std::vector<int32_t> &padding, bool pad_if_needed,
- const std::vector<uint8_t> &fill_value, BorderType padding_mode)
- : size_(size),
- padding_(padding),
- pad_if_needed_(pad_if_needed),
- fill_value_(fill_value),
- padding_mode_(padding_mode) {}
- std::vector<int32_t> size_;
- std::vector<int32_t> padding_;
- bool pad_if_needed_;
- std::vector<uint8_t> fill_value_;
- BorderType padding_mode_;
- };
-
- RandomCropWithBBox::RandomCropWithBBox(std::vector<int32_t> size, std::vector<int32_t> padding, bool pad_if_needed,
- std::vector<uint8_t> fill_value, BorderType padding_mode)
- : data_(std::make_shared<Data>(size, padding, pad_if_needed, fill_value, padding_mode)) {}
-
- std::shared_ptr<TensorOperation> RandomCropWithBBox::Parse() {
- return std::make_shared<RandomCropWithBBoxOperation>(data_->size_, data_->padding_, data_->pad_if_needed_,
- data_->fill_value_, data_->padding_mode_);
- }
-
- // RandomHorizontalFlip.
- struct RandomHorizontalFlip::Data {
- explicit Data(float prob) : probability_(prob) {}
- float probability_;
- };
-
- RandomHorizontalFlip::RandomHorizontalFlip(float prob) : data_(std::make_shared<Data>(prob)) {}
-
- std::shared_ptr<TensorOperation> RandomHorizontalFlip::Parse() {
- return std::make_shared<RandomHorizontalFlipOperation>(data_->probability_);
- }
-
- // RandomHorizontalFlipWithBBox
- struct RandomHorizontalFlipWithBBox::Data {
- explicit Data(float prob) : probability_(prob) {}
- float probability_;
- };
-
- RandomHorizontalFlipWithBBox::RandomHorizontalFlipWithBBox(float prob) : data_(std::make_shared<Data>(prob)) {}
-
- std::shared_ptr<TensorOperation> RandomHorizontalFlipWithBBox::Parse() {
- return std::make_shared<RandomHorizontalFlipWithBBoxOperation>(data_->probability_);
- }
-
- // RandomPosterize Transform Operation.
- struct RandomPosterize::Data {
- explicit Data(const std::vector<uint8_t> &bit_range) : bit_range_(bit_range) {}
- std::vector<uint8_t> bit_range_;
- };
-
- RandomPosterize::RandomPosterize(const std::vector<uint8_t> &bit_range) : data_(std::make_shared<Data>(bit_range)) {}
-
- std::shared_ptr<TensorOperation> RandomPosterize::Parse() {
- return std::make_shared<RandomPosterizeOperation>(data_->bit_range_);
- }
-
- // RandomResize Transform Operation.
- struct RandomResize::Data {
- explicit Data(const std::vector<int32_t> &size) : size_(size) {}
- std::vector<int32_t> size_;
- };
-
- RandomResize::RandomResize(std::vector<int32_t> size) : data_(std::make_shared<Data>(size)) {}
-
- std::shared_ptr<TensorOperation> RandomResize::Parse() { return std::make_shared<RandomResizeOperation>(data_->size_); }
-
- // RandomResizeWithBBox Transform Operation.
- struct RandomResizeWithBBox::Data {
- explicit Data(const std::vector<int32_t> &size) : size_(size) {}
- std::vector<int32_t> size_;
- };
-
- RandomResizeWithBBox::RandomResizeWithBBox(std::vector<int32_t> size) : data_(std::make_shared<Data>(size)) {}
-
- std::shared_ptr<TensorOperation> RandomResizeWithBBox::Parse() {
- return std::make_shared<RandomResizeWithBBoxOperation>(data_->size_);
- }
-
- // RandomResizedCrop Transform Operation.
- struct RandomResizedCrop::Data {
- Data(const std::vector<int32_t> &size, const std::vector<float> &scale, const std::vector<float> &ratio,
- InterpolationMode interpolation, int32_t max_attempts)
- : size_(size), scale_(scale), ratio_(ratio), interpolation_(interpolation), max_attempts_(max_attempts) {}
- std::vector<int32_t> size_;
- std::vector<float> scale_;
- std::vector<float> ratio_;
- InterpolationMode interpolation_;
- int32_t max_attempts_;
- };
-
- RandomResizedCrop::RandomResizedCrop(std::vector<int32_t> size, std::vector<float> scale, std::vector<float> ratio,
- InterpolationMode interpolation, int32_t max_attempts)
- : data_(std::make_shared<Data>(size, scale, ratio, interpolation, max_attempts)) {}
-
- std::shared_ptr<TensorOperation> RandomResizedCrop::Parse() {
- return std::make_shared<RandomResizedCropOperation>(data_->size_, data_->scale_, data_->ratio_, data_->interpolation_,
- data_->max_attempts_);
- }
-
- // RandomResizedCrop Transform Operation.
- struct RandomResizedCropWithBBox::Data {
- Data(const std::vector<int32_t> &size, const std::vector<float> &scale, const std::vector<float> &ratio,
- InterpolationMode interpolation, int32_t max_attempts)
- : size_(size), scale_(scale), ratio_(ratio), interpolation_(interpolation), max_attempts_(max_attempts) {}
- std::vector<int32_t> size_;
- std::vector<float> scale_;
- std::vector<float> ratio_;
- InterpolationMode interpolation_;
- int32_t max_attempts_;
- };
-
- RandomResizedCropWithBBox::RandomResizedCropWithBBox(std::vector<int32_t> size, std::vector<float> scale,
- std::vector<float> ratio, InterpolationMode interpolation,
- int32_t max_attempts)
- : data_(std::make_shared<Data>(size, scale, ratio, interpolation, max_attempts)) {}
-
- std::shared_ptr<TensorOperation> RandomResizedCropWithBBox::Parse() {
- return std::make_shared<RandomResizedCropWithBBoxOperation>(data_->size_, data_->scale_, data_->ratio_,
- data_->interpolation_, data_->max_attempts_);
- }
-
- // RandomRotation Transform Operation.
- struct RandomRotation::Data {
- Data(const std::vector<float> °rees, InterpolationMode interpolation_mode, bool expand,
- const std::vector<float> ¢er, const std::vector<uint8_t> &fill_value)
- : degrees_(degrees),
- interpolation_mode_(interpolation_mode),
- expand_(expand),
- center_(center),
- fill_value_(fill_value) {}
- std::vector<float> degrees_;
- InterpolationMode interpolation_mode_;
- std::vector<float> center_;
- bool expand_;
- std::vector<uint8_t> fill_value_;
- };
-
- RandomRotation::RandomRotation(std::vector<float> degrees, InterpolationMode interpolation_mode, bool expand,
- std::vector<float> center, std::vector<uint8_t> fill_value)
- : data_(std::make_shared<Data>(degrees, interpolation_mode, expand, center, fill_value)) {}
-
- std::shared_ptr<TensorOperation> RandomRotation::Parse() {
- return std::make_shared<RandomRotationOperation>(data_->degrees_, data_->interpolation_mode_, data_->expand_,
- data_->center_, data_->fill_value_);
- }
-
- // RandomSelectSubpolicy Transform Operation.
- struct RandomSelectSubpolicy::Data {
- std::vector<std::vector<std::pair<std::shared_ptr<TensorOperation>, double>>> policy_;
- };
-
- RandomSelectSubpolicy::RandomSelectSubpolicy(
- const std::vector<std::vector<std::pair<TensorTransform *, double>>> &policy)
- : data_(std::make_shared<Data>()) {
- for (int32_t i = 0; i < policy.size(); i++) {
- std::vector<std::pair<std::shared_ptr<TensorOperation>, double>> subpolicy;
-
- for (int32_t j = 0; j < policy[i].size(); j++) {
- TensorTransform *op = policy[i][j].first;
- std::shared_ptr<TensorOperation> operation = (op ? op->Parse() : nullptr);
- double prob = policy[i][j].second;
- subpolicy.emplace_back(std::move(std::make_pair(operation, prob)));
- }
- data_->policy_.emplace_back(subpolicy);
- }
- }
-
- RandomSelectSubpolicy::RandomSelectSubpolicy(
- const std::vector<std::vector<std::pair<std::shared_ptr<TensorTransform>, double>>> &policy)
- : data_(std::make_shared<Data>()) {
- for (int32_t i = 0; i < policy.size(); i++) {
- std::vector<std::pair<std::shared_ptr<TensorOperation>, double>> subpolicy;
-
- for (int32_t j = 0; j < policy[i].size(); j++) {
- std::shared_ptr<TensorTransform> op = policy[i][j].first;
- std::shared_ptr<TensorOperation> operation = (op ? op->Parse() : nullptr);
- double prob = policy[i][j].second;
- subpolicy.emplace_back(std::move(std::make_pair(operation, prob)));
- }
- data_->policy_.emplace_back(subpolicy);
- }
- }
-
- RandomSelectSubpolicy::RandomSelectSubpolicy(
- const std::vector<std::vector<std::pair<std::reference_wrapper<TensorTransform>, double>>> &policy)
- : data_(std::make_shared<Data>()) {
- for (int32_t i = 0; i < policy.size(); i++) {
- std::vector<std::pair<std::shared_ptr<TensorOperation>, double>> subpolicy;
-
- for (int32_t j = 0; j < policy[i].size(); j++) {
- TensorTransform &op = policy[i][j].first;
- std::shared_ptr<TensorOperation> operation = op.Parse();
- double prob = policy[i][j].second;
- subpolicy.emplace_back(std::move(std::make_pair(operation, prob)));
- }
- data_->policy_.emplace_back(subpolicy);
- }
- }
-
- std::shared_ptr<TensorOperation> RandomSelectSubpolicy::Parse() {
- return std::make_shared<RandomSelectSubpolicyOperation>(data_->policy_);
- }
-
- // RandomSharpness Transform Operation.
- struct RandomSharpness::Data {
- explicit Data(const std::vector<float> °rees) : degrees_(degrees) {}
- std::vector<float> degrees_;
- };
-
- RandomSharpness::RandomSharpness(std::vector<float> degrees) : data_(std::make_shared<Data>(degrees)) {}
-
- std::shared_ptr<TensorOperation> RandomSharpness::Parse() {
- return std::make_shared<RandomSharpnessOperation>(data_->degrees_);
- }
-
- // RandomSolarize Transform Operation.
- struct RandomSolarize::Data {
- explicit Data(const std::vector<uint8_t> &threshold) : threshold_(threshold) {}
- std::vector<uint8_t> threshold_;
- };
-
- RandomSolarize::RandomSolarize(std::vector<uint8_t> threshold) : data_(std::make_shared<Data>(threshold)) {}
-
- std::shared_ptr<TensorOperation> RandomSolarize::Parse() {
- return std::make_shared<RandomSolarizeOperation>(data_->threshold_);
- }
-
- // RandomVerticalFlip Transform Operation.
- struct RandomVerticalFlip::Data {
- explicit Data(float prob) : probability_(prob) {}
- float probability_;
- };
-
- RandomVerticalFlip::RandomVerticalFlip(float prob) : data_(std::make_shared<Data>(prob)) {}
-
- std::shared_ptr<TensorOperation> RandomVerticalFlip::Parse() {
- return std::make_shared<RandomVerticalFlipOperation>(data_->probability_);
- }
-
- // RandomVerticalFlipWithBBox Transform Operation.
- struct RandomVerticalFlipWithBBox::Data {
- explicit Data(float prob) : probability_(prob) {}
- float probability_;
- };
-
- RandomVerticalFlipWithBBox::RandomVerticalFlipWithBBox(float prob) : data_(std::make_shared<Data>(prob)) {}
-
- std::shared_ptr<TensorOperation> RandomVerticalFlipWithBBox::Parse() {
- return std::make_shared<RandomVerticalFlipWithBBoxOperation>(data_->probability_);
- }
-
- // Rescale Transform Operation.
- struct Rescale::Data {
- Data(float rescale, float shift) : rescale_(rescale), shift_(shift) {}
- float rescale_;
- float shift_;
- };
-
- Rescale::Rescale(float rescale, float shift) : data_(std::make_shared<Data>(rescale, shift)) {}
-
- std::shared_ptr<TensorOperation> Rescale::Parse() {
- return std::make_shared<RescaleOperation>(data_->rescale_, data_->shift_);
- }
- #endif // not ENABLE_ANDROID
-
- // Resize Transform Operation.
- struct Resize::Data {
- Data(const std::vector<int32_t> &size, InterpolationMode interpolation)
- : size_(size), interpolation_(interpolation) {}
- std::vector<int32_t> size_;
- InterpolationMode interpolation_;
- };
-
- Resize::Resize(std::vector<int32_t> size, InterpolationMode interpolation)
- : data_(std::make_shared<Data>(size, interpolation)) {}
-
- std::shared_ptr<TensorOperation> Resize::Parse() {
- return std::make_shared<ResizeOperation>(data_->size_, data_->interpolation_);
- }
-
- std::shared_ptr<TensorOperation> Resize::Parse(const MapTargetDevice &env) {
- if (env == MapTargetDevice::kAscend310) {
- #ifdef ENABLE_ACL
- std::vector<uint32_t> usize_;
- usize_.reserve(data_->size_.size());
- std::transform(data_->size_.begin(), data_->size_.end(), std::back_inserter(usize_),
- [](int32_t i) { return (uint32_t)i; });
- return std::make_shared<DvppResizeJpegOperation>(usize_);
- #endif // ENABLE_ACL
- }
- return std::make_shared<ResizeOperation>(data_->size_, data_->interpolation_);
- }
-
- // ResizePreserveAR Transform Operation.
- struct ResizePreserveAR::Data {
- Data(int32_t height, int32_t width, int32_t img_orientation)
- : height_(height), width_(width), img_orientation_(img_orientation) {}
- int32_t height_;
- int32_t width_;
- int32_t img_orientation_;
- };
-
- ResizePreserveAR::ResizePreserveAR(int32_t height, int32_t width, int32_t img_orientation)
- : data_(std::make_shared<Data>(height, width, img_orientation)) {}
-
- std::shared_ptr<TensorOperation> ResizePreserveAR::Parse() {
- return std::make_shared<ResizePreserveAROperation>(data_->height_, data_->width_, data_->img_orientation_);
- }
-
- #ifdef ENABLE_ANDROID
- // Rotate Transform Operation.
- Rotate::Rotate() {}
-
- std::shared_ptr<TensorOperation> Rotate::Parse() { return std::make_shared<RotateOperation>(); }
- #endif // ENABLE_ANDROID
-
- #ifndef ENABLE_ANDROID
- // ResizeWithBBox Transform Operation.
- struct ResizeWithBBox::Data {
- Data(const std::vector<int32_t> &size, InterpolationMode interpolation)
- : size_(size), interpolation_(interpolation) {}
- std::vector<int32_t> size_;
- InterpolationMode interpolation_;
- };
-
- ResizeWithBBox::ResizeWithBBox(std::vector<int32_t> size, InterpolationMode interpolation)
- : data_(std::make_shared<Data>(size, interpolation)) {}
-
- std::shared_ptr<TensorOperation> ResizeWithBBox::Parse() {
- return std::make_shared<ResizeWithBBoxOperation>(data_->size_, data_->interpolation_);
- }
-
- // RgbaToBgr Transform Operation.
- RGBA2BGR::RGBA2BGR() {}
-
- std::shared_ptr<TensorOperation> RGBA2BGR::Parse() { return std::make_shared<RgbaToBgrOperation>(); }
-
- // RgbaToRgb Transform Operation.
- RGBA2RGB::RGBA2RGB() {}
-
- std::shared_ptr<TensorOperation> RGBA2RGB::Parse() { return std::make_shared<RgbaToRgbOperation>(); }
-
- // SoftDvppDecodeRandomCropResizeJpeg Transform Operation.
- struct SoftDvppDecodeRandomCropResizeJpeg::Data {
- Data(const std::vector<int32_t> &size, const std::vector<float> &scale, const std::vector<float> &ratio,
- int32_t max_attempts)
- : size_(size), scale_(scale), ratio_(ratio), max_attempts_(max_attempts) {}
- std::vector<int32_t> size_;
- std::vector<float> scale_;
- std::vector<float> ratio_;
- int32_t max_attempts_;
- };
-
- SoftDvppDecodeRandomCropResizeJpeg::SoftDvppDecodeRandomCropResizeJpeg(std::vector<int32_t> size,
- std::vector<float> scale,
- std::vector<float> ratio, int32_t max_attempts)
- : data_(std::make_shared<Data>(size, scale, ratio, max_attempts)) {}
-
- std::shared_ptr<TensorOperation> SoftDvppDecodeRandomCropResizeJpeg::Parse() {
- return std::make_shared<SoftDvppDecodeRandomCropResizeJpegOperation>(data_->size_, data_->scale_, data_->ratio_,
- data_->max_attempts_);
- }
-
- // SoftDvppDecodeResizeJpeg Transform Operation.
- struct SoftDvppDecodeResizeJpeg::Data {
- explicit Data(const std::vector<int32_t> &size) : size_(size) {}
- std::vector<int32_t> size_;
- };
-
- SoftDvppDecodeResizeJpeg::SoftDvppDecodeResizeJpeg(std::vector<int32_t> size) : data_(std::make_shared<Data>(size)) {}
-
- std::shared_ptr<TensorOperation> SoftDvppDecodeResizeJpeg::Parse() {
- return std::make_shared<SoftDvppDecodeResizeJpegOperation>(data_->size_);
- }
-
- // SwapRedBlue Transform Operation.
- SwapRedBlue::SwapRedBlue() {}
-
- std::shared_ptr<TensorOperation> SwapRedBlue::Parse() { return std::make_shared<SwapRedBlueOperation>(); }
-
- // UniformAug Transform Operation.
- struct UniformAugment::Data {
- std::vector<std::shared_ptr<TensorOperation>> transforms_;
- int32_t num_ops_;
- };
-
- UniformAugment::UniformAugment(const std::vector<TensorTransform *> &transforms, int32_t num_ops)
- : data_(std::make_shared<Data>()) {
- (void)std::transform(
- transforms.begin(), transforms.end(), std::back_inserter(data_->transforms_),
- [](TensorTransform *const op) -> std::shared_ptr<TensorOperation> { return op ? op->Parse() : nullptr; });
- data_->num_ops_ = num_ops;
- }
-
- UniformAugment::UniformAugment(const std::vector<std::shared_ptr<TensorTransform>> &transforms, int32_t num_ops)
- : data_(std::make_shared<Data>()) {
- (void)std::transform(
- transforms.begin(), transforms.end(), std::back_inserter(data_->transforms_),
- [](std::shared_ptr<TensorTransform> op) -> std::shared_ptr<TensorOperation> { return op ? op->Parse() : nullptr; });
- data_->num_ops_ = num_ops;
- }
-
- UniformAugment::UniformAugment(const std::vector<std::reference_wrapper<TensorTransform>> &transforms, int32_t num_ops)
- : data_(std::make_shared<Data>()) {
- (void)std::transform(transforms.begin(), transforms.end(), std::back_inserter(data_->transforms_),
- [](TensorTransform &op) -> std::shared_ptr<TensorOperation> { return op.Parse(); });
- data_->num_ops_ = num_ops;
- }
-
- std::shared_ptr<TensorOperation> UniformAugment::Parse() {
- return std::make_shared<UniformAugOperation>(data_->transforms_, data_->num_ops_);
- }
- #endif // not ENABLE_ANDROID
-
- } // namespace vision
- } // namespace dataset
- } // namespace mindspore
|