From bf69444b3aa519bf6b9f0df35c09137bb6f90b50 Mon Sep 17 00:00:00 2001
From: Xiao Tianci
Date: Thu, 4 Mar 2021 22:25:10 +0800
Subject: [PATCH] fix the examples in docs of minddata

---
 mindspore/dataset/core/config.py              |   5 +-
 mindspore/dataset/engine/datasets.py          | 228 +++++++++---------
 mindspore/dataset/engine/graphdata.py         |  22 +-
 mindspore/dataset/engine/samplers.py          |  20 +-
 mindspore/dataset/transforms/c_transforms.py  |   9 +-
 mindspore/dataset/transforms/py_transforms.py |   2 +-
 6 files changed, 144 insertions(+), 142 deletions(-)

diff --git a/mindspore/dataset/core/config.py b/mindspore/dataset/core/config.py
index ae81997e2b..59f76ef3e4 100644
--- a/mindspore/dataset/core/config.py
+++ b/mindspore/dataset/core/config.py
@@ -340,8 +340,7 @@ def load(file):
RuntimeError: If file is invalid and parsing fails.

Examples:
- >>> # Set new default configuration values according to values in the configuration file.
- >>> ds.config.load("/path/to/config_directory/config.cfg")
+ >>> # Set new default configuration according to values in the configuration file.
>>> # example config file:
>>> # {
>>> #     "logFilePath": "/tmp",
>>> #     "numParallelWorkers": 4,
>>> #     "seed": 5489,
>>> #     "monitorSamplingInterval": 30
>>> # }
+ >>> config_file = "/path/to/config/file"
+ >>> ds.config.load(config_file)
"""
_config.load(file)
diff --git a/mindspore/dataset/engine/datasets.py b/mindspore/dataset/engine/datasets.py
index 8a4636e4cb..e53d5bf4e1 100644
--- a/mindspore/dataset/engine/datasets.py
+++ b/mindspore/dataset/engine/datasets.py
@@ -506,14 +506,18 @@ class Dataset:
Dataset, dataset applied by the function.

Examples:
- >>> # Declare a function which returns a Dataset object
- >>> def flat_map_func(x):
- ...     image_folder_dataset_dir = text.to_str(x[0])
- ...     d = ds.ImageFolderDataset(image_folder_dataset_dir)
- ...     return d
- >>> # dataset is an instance of a Dataset object.
- >>> dataset = ds.TextFileDataset(text_file_dataset_dir)
+ >>> # use NumpySlicesDataset as an example
+ >>> dataset = ds.NumpySlicesDataset([[0, 1], [2, 3]])
+ >>>
+ >>> def flat_map_func(array):
+ ...     # create a NumpySlicesDataset with the array
+ ...     dataset = ds.NumpySlicesDataset(array)
+ ...     # repeat the dataset twice
+ ...     dataset = dataset.repeat(2)
+ ...     return dataset
+ >>>
>>> dataset = dataset.flat_map(flat_map_func)
+ >>> # [0, 1, 0, 1, 2, 3, 2, 3]

Raises:
TypeError: If `func` is not a function.
@@ -588,60 +592,40 @@ class Dataset:

Examples:
>>> # dataset is an instance of Dataset which has 2 columns, "image" and "label".
- >>> # ds_pyfunc is an instance of Dataset which has 3 columns, "col0", "col1", and "col2".
- >>> # Each column is a 2D array of integers.
- >>> # Set the global configuration value for num_parallel_workers to be 2.
- >>> # Operations which use this configuration value will use 2 worker threads,
- >>> # unless otherwise specified in the operator's constructor.
- >>> # set_num_parallel_workers can be called again later if a different
- >>> # global configuration value for the number of worker threads is desired.
- >>> ds.config.set_num_parallel_workers(2)
>>>
>>> # Define two operations, where each operation accepts 1 input column and outputs 1 column.
- >>> decode_op = c_vision.Decode(rgb_format=True)
- >>> random_jitter_op = c_vision.RandomColorAdjust((0.8, 0.8), (1, 1), (1, 1), (0, 0))
+ >>> decode_op = c_vision.Decode(rgb=True)
+ >>> random_jitter_op = c_vision.RandomColorAdjust(brightness=(0.8, 0.8), contrast=(1, 1),
+ ...                                               saturation=(1, 1), hue=(0, 0))
>>>
- >>> # 1) Simple map example
- >>>
- >>> operations = [decode_op]
- >>> input_columns = ["image"]
+ >>> # 1) Simple map example.
>>>
>>> # Apply decode_op on column "image". This column will be replaced by the outputted
>>> # column of decode_op. Since column_order is not provided, both columns "image"
>>> # and "label" will be propagated to the child node in their original order.
- >>> dataset = dataset.map(operations, input_columns)
+ >>> dataset = dataset.map(operations=[decode_op], input_columns=["image"])
>>>
- >>> # Rename column "image" to "decoded_image".
- >>> output_columns = ["decoded_image"]
- >>> dataset = dataset.map(operations, input_columns, output_columns)
+ >>> # Decode and rename column "image" to "decoded_image".
+ >>> dataset = dataset.map(operations=[decode_op], input_columns=["image"], output_columns=["decoded_image"])
>>>
- >>> # Specify the order of the columns.
- >>> column_order ["label", "image"]
- >>> dataset = dataset.map(operations, input_columns, None, column_order)
+ >>> # Specify the order of the output columns.
+ >>> dataset = dataset.map(operations=[decode_op], input_columns=["image"],
+ ...                       output_columns=None, column_order=["label", "image"])
>>>
- >>> # Rename column "image" to "decoded_image" and also specify the order of the columns.
- >>> column_order ["label", "decoded_image"]
- >>> output_columns = ["decoded_image"]
- >>> dataset = dataset.map(operations, input_columns, output_columns, column_order)
+ >>> # Rename column "image" to "decoded_image" and also specify the order of the output columns.
+ >>> dataset = dataset.map(operations=[decode_op], input_columns=["image"],
+ ...                       output_columns=["decoded_image"], column_order=["label", "decoded_image"])
>>>
>>> # Rename column "image" to "decoded_image" and keep only this column.
- >>> column_order ["decoded_image"]
- >>> output_columns = ["decoded_image"]
- >>> dataset = dataset.map(operations, input_columns, output_columns, column_order)
+ >>> dataset = dataset.map(operations=[decode_op], input_columns=["image"],
+ ...                       output_columns=["decoded_image"], column_order=["decoded_image"])
>>>
- >>> # A simple example using pyfunc: Renaming columns and specifying column order
+ >>> # A simple example of mapping a pyfunc. Renaming columns and specifying column order
>>> # work in the same way as the previous examples.
- >>> input_columns = ["col0"]
- >>> operations = [(lambda x: x + 1)]
- >>> dataset = dataset.map(operations, input_columns)
- >>>
- >>> # 2) Map example with more than one operation
+ >>> dataset = ds.NumpySlicesDataset(data=[[0, 1, 2]], column_names=["data"])
+ >>> dataset = dataset.map(operations=[(lambda x: x + 1)], input_columns=["data"])
>>>
- >>> # If this list of operations is used with map, decode_op will be applied
- >>> # first, then random_jitter_op will be applied.
- >>> operations = [decode_op, random_jitter_op]
- >>>
- >>> input_columns = ["image"]
+ >>> # 2) Map example with more than one operation.
>>>
>>> # Create a dataset where the images are decoded, then randomly color jittered.
>>> # decode_op takes column "image" as input and outputs one column. The column
>>> # outputted by decode_op is passed as input to random_jitter_op.
>>> # random_jitter_op will output one column. Column "image" will be replaced by
>>> # the column outputted by random_jitter_op (the very last operation). All other
>>> # columns are unchanged. Since column_order is not specified, the order of the
>>> # columns will remain the same.
- >>> dataset = dataset.map(operations, input_columns)
+ >>> dataset = dataset.map(operations=[decode_op, random_jitter_op], input_columns=["image"])
>>>
- >>> # Create a dataset that is identical to ds_mapped, except the column "image"
- >>> # that is outputted by random_jitter_op is renamed to "image_transformed".
+ >>> # Rename the column outputted by random_jitter_op to "image_mapped".
>>> # Specifying column order works in the same way as examples in 1).
- >>> output_columns = ["image_transformed"]
- >>> dataset = dataset.map(operation, input_columns, output_columns)
+ >>> dataset = dataset.map(operations=[decode_op, random_jitter_op], input_columns=["image"],
+ ...                       output_columns=["image_mapped"])
>>>
- >>> # Multiple operations using pyfunc: Renaming columns and specifying column order
+ >>> # Map with multiple operations using pyfunc. Renaming columns and specifying column order
>>> # work in the same way as examples in 1).
- >>> input_columns = ["col0"]
- >>> operations = [(lambda x: x + x), (lambda x: x - 1)]
- >>> output_columns = ["col0_mapped"]
- >>> dataset = dataset.map(operations, input_columns, output_columns)
+ >>> dataset = ds.NumpySlicesDataset(data=[[0, 1, 2]], column_names=["data"])
+ >>> dataset = dataset.map(operations=[(lambda x: x * x), (lambda x: x - 1)], input_columns=["data"],
+ ...                       output_columns=["data_mapped"])
>>>
- >>> # 3) Example where number of input columns is not equal to number of output columns
+ >>> # 3) Example where number of input columns is not equal to number of output columns.
>>>
>>> # operations[0] is a lambda that takes 2 columns as input and outputs 3 columns.
>>> # operations[1] is a lambda that takes 3 columns as input and outputs 1 column.
- >>> # operations[1] is a lambda that takes 1 column as input and outputs 4 columns.
+ >>> # operations[2] is a lambda that takes 1 column as input and outputs 4 columns.
>>> #
>>> # Note: The number of output columns of operation[i] must equal the number of
>>> # input columns of operation[i+1]. Otherwise, this map call will also result
>>> # in an error.
- >>> operations = [(lambda x y: (x, x + y, x + y + 1)),
- >>>               (lambda x y z: x * y * z),
- >>>               (lambda x: (x % 2, x % 3, x % 5, x % 7))]
+ >>> operations = [(lambda x, y: (x, x + y, x + y + 1)),
+ ...               (lambda x, y, z: x * y * z),
+ ...               (lambda x: (x % 2, x % 3, x % 5, x % 7))]
>>>
>>> # Note: Since the number of input columns is not the same as the number of
>>> # output columns, the output_columns and column_order parameters must be
>>> # specified. Otherwise, this map call will also result in an error.
- >>> input_columns = ["col2", "col0"]
- >>> output_columns = ["mod2", "mod3", "mod5", "mod7"]
+ >>>
+ >>> dataset = ds.NumpySlicesDataset(data=([[0, 1, 2]], [[3, 4, 5]]), column_names=["x", "y"])
>>>
>>> # Propagate all columns to the child node in this order:
- >>> column_order = ["col0", "col2", "mod2", "mod3", "mod5", "mod7", "col1"]
- >>> dataset = dataset.map(operations, input_columns, output_columns, column_order)
+ >>> dataset = dataset.map(operations, input_columns=["x", "y"],
+ ...                       output_columns=["mod2", "mod3", "mod5", "mod7"],
+ ...                       column_order=["mod2", "mod3", "mod5", "mod7"])
>>>
>>> # Propagate some columns to the child node in this order:
- >>> column_order = ["mod7", "mod3", "col1"]
- >>> dataset = dataset.map(operations, input_columns, output_columns, column_order)
+ >>> dataset = dataset.map(operations, input_columns=["x", "y"],
+ ...                       output_columns=["mod2", "mod3", "mod5", "mod7"],
+ ...                       column_order=["mod7", "mod3"])
column_order=["mod7", "mod3", "col2"]) """ return MapDataset(self, operations, input_columns, output_columns, column_order, num_parallel_workers, @@ -1066,7 +1050,7 @@ class Dataset: ... corpus = {"Z": 4, "Y": 4, "X": 4, "W": 3, "U": 3, "V": 2, "T": 1} ... for k, v in corpus.items(): ... yield (np.array([k] * v, dtype='S'),) - >>> column_names = ["column1","column2","column3"] + >>> column_names = ["column1", "column2", "column3"] >>> dataset = ds.GeneratorDataset(gen_corpus, column_names) >>> dataset = dataset.build_vocab(columns=["column3", "column1", "column2"], ... freq_range=(1, 10), top_k=5, @@ -1344,13 +1328,12 @@ class Dataset: Examples: >>> # dataset is an instance of Dataset object - >>> - >>> # Create an iterator - >>> # The columns in the dataset obtained by the iterator will not be changed. >>> iterator = dataset.create_tuple_iterator() >>> for item in iterator: - ... # convert the returned tuple to a list and print - ... print(list(item)) + ... # item is a list + ... print(type(item)) + ... break + """ if output_numpy is None: output_numpy = False @@ -1377,13 +1360,12 @@ class Dataset: Examples: >>> # dataset is an instance of Dataset object - >>> - >>> # create an iterator - >>> # The columns in the data obtained by the iterator might be changed. >>> iterator = dataset.create_dict_iterator() >>> for item in iterator: - ... # print the data in column1 - ... print(item["column1"]) + ... # item is a dict + ... print(type(item)) + ... break + """ if output_numpy is None: output_numpy = False @@ -1406,8 +1388,10 @@ class Dataset: Examples: >>> # dataset is an instance of Dataset object - >>> dataset = ds.NumpySlicesDataset([1, 2, 3], column_names=["col_1"]) + >>> # set input_indexs + >>> dataset.input_indexs = 10 >>> print(dataset.input_indexs) + 10 """ if self._input_indexs != (): return self._input_indexs @@ -3432,38 +3416,59 @@ class GeneratorDataset(MappableDataset): option could be beneficial if the Python operation is computational heavy (default=True). Examples: - >>> # 1) Multidimensional generator function as callable input - >>> def GeneratorMD(): + >>> # 1) Multidimensional generator function as callable input. + >>> def generator_multidimensional(): ... for i in range(64): ... yield (np.array([[i, i + 1], [i + 2, i + 3]]),) - >>> # Create multi_dimension_generator_dataset with GeneratorMD and column name "multi_dimensional_data" - >>> multi_dimension_generator_dataset = ds.GeneratorDataset(GeneratorMD, ["multi_dimensional_data"]) >>> - >>> # 2) Multi-column generator function as callable input - >>> def GeneratorMC(maxid = 64): - ... for i in range(maxid): - ... yield (np.array([i]), np.array([[i, i + 1], [i + 2, i + 3]])) - >>> # Create multi_column_generator_dataset with GeneratorMC and column names "col1" and "col2" - >>> multi_column_generator_dataset = ds.GeneratorDataset(GeneratorMC, ["col1", "col2"]) + >>> dataset = ds.GeneratorDataset(generator_multidimensional, ["multi_dimensional_data"]) + >>> + >>> # 2) Multi-column generator function as callable input. + >>> def generator_multi_column(): + ... for i in range(64): + ... yield (np.array([i]), np.array([[i, i + 1], [i + 2, i + 3]]) + >>> + >>> dataset = ds.GeneratorDataset(generator_multi_column, ["col1", "col2"]) >>> - >>> # 3) Iterable dataset as iterable input + >>> # 3) Iterable dataset as iterable input. >>> class MyIterable: + ... def __init__(self): + ... self._index = 0 + ... self._data = np.random.sample((5, 2)) + ... self._label = np.random.sample((5, 1)) + ... + ... def __next__(self): + ... 
+ ...         if self._index >= len(self._data):
+ ...             raise StopIteration
+ ...         else:
+ ...             item = (self._data[self._index], self._label[self._index])
+ ...             self._index += 1
+ ...             return item
+ ...
...     def __iter__(self):
- ...         return # User implementation
- >>> # Create iterable_generator_dataset with MyIterable object
- >>> iterable_generator_dataset = ds.GeneratorDataset(MyIterable(), ["col1"])
+ ...         return self
+ ...
+ ...     def __len__(self):
+ ...         return len(self._data)
>>>
- >>> # 4) Random accessible dataset as random accessible input
- >>> class MyRA:
+ >>> dataset = ds.GeneratorDataset(MyIterable(), ["data", "label"])
+ >>>
+ >>> # 4) Random accessible dataset as random accessible input.
+ >>> class MyAccessible:
+ ...     def __init__(self):
+ ...         self._data = np.random.sample((5, 2))
+ ...         self._label = np.random.sample((5, 1))
+ ...
...     def __getitem__(self, index):
- ...         return # User implementation
- >>> # Create ra_generator_dataset with MyRA object
- >>> ra_generator_dataset = ds.GeneratorDataset(MyRA(), ["col1"])
- >>> # List/Dict/Tuple is also random accessible
- >>> list_generator = ds.GeneratorDataset([(np.array(0),), (np.array(1)), (np.array(2))], ["col1"])
+ ...         return self._data[index], self._label[index]
+ ...
+ ...     def __len__(self):
+ ...         return len(self._data)
+ >>>
+ >>> dataset = ds.GeneratorDataset(MyAccessible(), ["data", "label"])
>>>
- >>> # 5) Built-in Sampler
- >>> my_generator = ds.GeneratorDataset(my_ds, ["img", "label"], sampler=samplers.RandomSampler())
+ >>> # Python lists, dicts and tuples are also random accessible
+ >>> dataset = ds.GeneratorDataset([(np.array(0),), (np.array(1),), (np.array(2),)], ["col"])
"""

@check_generatordataset
@@ -3582,18 +3587,19 @@ class TFRecordDataset(SourceDataset):
>>> import mindspore.common.dtype as mstype
>>>
>>> tfrecord_dataset_dir = ["/path/to/tfrecord_dataset_file"] # contains 1 or multiple tf data files
+ >>> tfrecord_schema_file = "/path/to/tfrecord_schema_file"
>>>
- >>> # 1) Get all rows from tfrecord_dataset_dir with no explicit schema
+ >>> # 1) Get all rows from tfrecord_dataset_dir with no explicit schema.
>>> # The meta-data in the first row will be used as a schema.
- >>> dataset = ds.TFRecordDataset(dataset_files=tfrecord_dataset_dir)
+ >>> dataset = ds.TFRecordDataset(tfrecord_dataset_dir)
>>>
- >>> # 2) Get all rows from tfrecord_dataset_dir with user-defined schema
- >>> schema = ds.Schema("/path/to/tfrecord_schema_file")
- >>> schema.add_column('col_1d', de_type=mindspore.int64, shape=[2])
- >>> dataset = ds.TFRecordDataset(dataset_files=tfrecord_dataset_dir, schema=schema)
+ >>> # 2) Get all rows from tfrecord_dataset_dir with user-defined schema.
+ >>> schema = ds.Schema()
+ >>> schema.add_column('col_1d', de_type=mstype.int64, shape=[2])
+ >>> dataset = ds.TFRecordDataset(tfrecord_dataset_dir, schema=schema)
>>>
- >>> # 3) Get all rows from tfrecord_dataset_dir with schema file "./schema.json"
- >>> dataset = ds.TFRecordDataset(dataset_files=tfrecord_dataset_dir, schema="./schema.json")
+ >>> # 3) Get all rows from tfrecord_dataset_dir with schema file.
+ >>> dataset = ds.TFRecordDataset(dataset_files=tfrecord_dataset_dir, schema=tfrecord_schema_file) """ @check_tfrecorddataset @@ -4835,7 +4841,7 @@ class NumpySlicesDataset(GeneratorDataset): >>> >>> # 4) Load data from CSV file >>> import pandas as pd - >>> df = pd.read_csv(csv_dataset_dir) + >>> df = pd.read_csv(csv_dataset_dir[0]) >>> dataset = ds.NumpySlicesDataset(dict(df), shuffle=False) """ diff --git a/mindspore/dataset/engine/graphdata.py b/mindspore/dataset/engine/graphdata.py index 31d6d6a3c0..a8a29ccdbe 100644 --- a/mindspore/dataset/engine/graphdata.py +++ b/mindspore/dataset/engine/graphdata.py @@ -73,7 +73,7 @@ class GraphData: Examples: >>> graph_dataset = ds.GraphData(graph_dataset_dir, 2) - >>> nodes = graph_dataset.get_all_nodes(0) + >>> nodes = graph_dataset.get_all_nodes(1) >>> features = graph_dataset.get_node_feature(nodes, [1]) """ @@ -114,7 +114,7 @@ class GraphData: numpy.ndarray, array of nodes. Examples: - >>> nodes = graph_dataset.get_all_nodes(0) + >>> nodes = graph_dataset.get_all_nodes(1) Raises: TypeError: If `node_type` is not integer. @@ -175,8 +175,8 @@ class GraphData: numpy.ndarray, array of neighbors. Examples: - >>> nodes = graph_dataset.get_all_nodes(0) - >>> neighbors = graph_dataset.get_all_neighbors(nodes, 0) + >>> nodes = graph_dataset.get_all_nodes(1) + >>> neighbors = graph_dataset.get_all_neighbors(nodes, 2) Raises: TypeError: If `node_list` is not list or ndarray. @@ -211,8 +211,8 @@ class GraphData: numpy.ndarray, array of neighbors. Examples: - >>> nodes = graph_dataset.get_all_nodes(0) - >>> neighbors = graph_dataset.get_sampled_neighbors(nodes, [2, 2], [0, 0]) + >>> nodes = graph_dataset.get_all_nodes(1) + >>> neighbors = graph_dataset.get_sampled_neighbors(nodes, [2, 2], [2, 1]) Raises: TypeError: If `node_list` is not list or ndarray. @@ -240,8 +240,8 @@ class GraphData: numpy.ndarray, array of neighbors. Examples: - >>> nodes = graph_dataset.get_all_nodes(0) - >>> neg_neighbors = graph_dataset.get_neg_sampled_neighbors(nodes, 5, 0) + >>> nodes = graph_dataset.get_all_nodes(1) + >>> neg_neighbors = graph_dataset.get_neg_sampled_neighbors(nodes, 5, 2) Raises: TypeError: If `node_list` is not list or ndarray. @@ -266,8 +266,8 @@ class GraphData: numpy.ndarray, array of features. Examples: - >>> nodes = graph_dataset.get_all_nodes(0) - >>> features = graph_dataset.get_node_feature(nodes, [1]) + >>> nodes = graph_dataset.get_all_nodes(1) + >>> features = graph_dataset.get_node_feature(nodes, [2, 3]) Raises: TypeError: If `node_list` is not list or ndarray. @@ -347,7 +347,7 @@ class GraphData: numpy.ndarray, array of nodes. Examples: - >>> nodes = graph_dataset.random_walk([1,2], [1,2,1,2,1]) + >>> nodes = graph_dataset.random_walk([1, 2], [1, 2, 1, 2, 1]) Raises: TypeError: If `target_nodes` is not list or ndarray. diff --git a/mindspore/dataset/engine/samplers.py b/mindspore/dataset/engine/samplers.py index 39f9651216..748e20dda9 100644 --- a/mindspore/dataset/engine/samplers.py +++ b/mindspore/dataset/engine/samplers.py @@ -203,14 +203,12 @@ class Sampler(BuiltinSampler): dataset_size and num_samples will be set by dataset once a dataset iterator is created. Examples: - >>> import mindspore.dataset as ds + >>> class ReverseSampler(ds.Sampler): + ... def __iter__(self): + ... for i in range(self.dataset_size - 1, -1, -1): + ... 
yield i
>>>
- >>> class ReverseSampler(ds,Sampler):
- >>>     def __iter__(self):
- >>>         for i in range(self.dataset_size - 1, -1, -1):
- >>>             yield i
- >>>
- >>> ds = ds.ImageFolderDataset(path, sampler=ReverseSampler())
+ >>> dataset = ds.ImageFolderDataset(image_folder_dataset_dir, sampler=ReverseSampler())
"""

def __init__(self, num_samples=None):
@@ -698,15 +696,11 @@ class SubsetRandomSampler(SubsetSampler):
num_samples (int, optional): Number of elements to sample (default=None, all elements).

Examples:
- >>> import mindspore.dataset as ds
- >>>
- >>> dataset_dir = "path/to/imagefolder_directory"
- >>>
>>> indices = [0, 1, 2, 3, 7, 88, 119]
>>>
- >>> # creates a SubsetRandomSampler, will sample from the provided indices
+ >>> # create a SubsetRandomSampler, will sample from the provided indices
>>> sampler = ds.SubsetRandomSampler(indices)
- >>> data = ds.ImageFolderDataset(dataset_dir, num_parallel_workers=8, sampler=sampler)
+ >>> data = ds.ImageFolderDataset(image_folder_dataset_dir, num_parallel_workers=8, sampler=sampler)

Raises:
TypeError: If type of indices element is not a number.
diff --git a/mindspore/dataset/transforms/c_transforms.py b/mindspore/dataset/transforms/c_transforms.py
index 39005d5c40..f168cf4382 100644
--- a/mindspore/dataset/transforms/c_transforms.py
+++ b/mindspore/dataset/transforms/c_transforms.py
@@ -106,14 +106,15 @@ class TypeCast(cde.TypeCastOp):
Examples:
>>> import numpy as np
>>> import mindspore.common.dtype as mstype
- >>> from mindspore.dataset import GeneratorDataset
+ >>>
>>> # Generate 1d int numpy array from 0 - 63
>>> def generator_1d():
- >>>     for i in range(64):
+ ...     for i in range(64):
...         yield (np.array([i]),)
- >>> generator_dataset = GeneratorDataset(generator_1d,column_names='col')
+ >>>
+ >>> dataset = ds.GeneratorDataset(generator_1d, column_names='col')
>>> type_cast_op = c_transforms.TypeCast(mstype.int32)
- >>> generator_dataset = generator_dataset.map(operations=type_cast_op)
+ >>> dataset = dataset.map(operations=type_cast_op)
"""

@check_de_type
diff --git a/mindspore/dataset/transforms/py_transforms.py b/mindspore/dataset/transforms/py_transforms.py
index 22011393f2..b60ba57329 100644
--- a/mindspore/dataset/transforms/py_transforms.py
+++ b/mindspore/dataset/transforms/py_transforms.py
@@ -40,7 +40,7 @@ class OneHotOp:
>>> # Assume that dataset has 10 classes, thus the label ranges from 0 to 9
>>> transforms_list = [py_transforms.OneHotOp(num_classes=10, smoothing_rate=0.1)]
>>> transform = py_transforms.Compose(transforms_list)
- >>> mnist_dataset = mnist_dataset(input_columns=["label"], operations=transform)
+ >>> mnist_dataset = mnist_dataset.map(input_columns=["label"], operations=transform)
"""

@check_one_hot_op