You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

test_datasets_coco.py 11 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254
  1. # Copyright 2020 Huawei Technologies Co., Ltd
  2. #
  3. # Licensed under the Apache License, Version 2.0 (the "License");
  4. # you may not use this file except in compliance with the License.
  5. # You may obtain a copy of the License at
  6. #
  7. # http://www.apache.org/licenses/LICENSE-2.0
  8. #
  9. # Unless required by applicable law or agreed to in writing, software
  10. # distributed under the License is distributed on an "AS IS" BASIS,
  11. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. # See the License for the specific language governing permissions and
  13. # limitations under the License.
  14. # ==============================================================================
  15. import numpy as np
  16. import mindspore.dataset as ds
  17. import mindspore.dataset.transforms.vision.c_transforms as vision
# Dataset directory passed as the first argument of ds.CocoDataset in these tests.
DATA_DIR = "../data/dataset/testCOCO/train/"
# Annotation file used by the "Detection" and "Stuff" task tests.
ANNOTATION_FILE = "../data/dataset/testCOCO/annotations/train.json"
# Annotation file used by the "Keypoint" task test.
KEYPOINT_FILE = "../data/dataset/testCOCO/annotations/key_point.json"
# Annotation file used by the "Panoptic" task tests.
PANOPTIC_FILE = "../data/dataset/testCOCO/annotations/panoptic.json"
# Annotation file that test_coco_case_exception expects to fail with a json parse error.
INVALID_FILE = "../data/dataset/testCOCO/annotations/invalid.json"
# Annotation file that test_coco_case_exception expects to fail with "Invalid node found in json".
LACKOFIMAGE_FILE = "../data/dataset/testCOCO/annotations/lack_of_images.json"
  24. def test_coco_detection():
  25. data1 = ds.CocoDataset(DATA_DIR, annotation_file=ANNOTATION_FILE, task="Detection",
  26. decode=True, shuffle=False)
  27. num_iter = 0
  28. image_shape = []
  29. bbox = []
  30. category_id = []
  31. for data in data1.create_dict_iterator():
  32. image_shape.append(data["image"].shape)
  33. bbox.append(data["bbox"])
  34. category_id.append(data["category_id"])
  35. num_iter += 1
  36. assert num_iter == 6
  37. assert image_shape[0] == (2268, 4032, 3)
  38. assert image_shape[1] == (561, 595, 3)
  39. assert image_shape[2] == (607, 585, 3)
  40. assert image_shape[3] == (642, 675, 3)
  41. assert image_shape[4] == (2268, 4032, 3)
  42. assert image_shape[5] == (2268, 4032, 3)
  43. assert np.array_equal(np.array([[10., 10., 10., 10.], [70., 70., 70., 70.]]), bbox[0])
  44. assert np.array_equal(np.array([[20., 20., 20., 20.], [80., 80., 80.0, 80.]]), bbox[1])
  45. assert np.array_equal(np.array([[30.0, 30.0, 30.0, 30.]]), bbox[2])
  46. assert np.array_equal(np.array([[40., 40., 40., 40.]]), bbox[3])
  47. assert np.array_equal(np.array([[50., 50., 50., 50.]]), bbox[4])
  48. assert np.array_equal(np.array([[60., 60., 60., 60.]]), bbox[5])
  49. assert np.array_equal(np.array([[1], [7]]), category_id[0])
  50. assert np.array_equal(np.array([[2], [8]]), category_id[1])
  51. assert np.array_equal(np.array([[3]]), category_id[2])
  52. assert np.array_equal(np.array([[4]]), category_id[3])
  53. assert np.array_equal(np.array([[5]]), category_id[4])
  54. assert np.array_equal(np.array([[6]]), category_id[5])
  55. def test_coco_stuff():
  56. data1 = ds.CocoDataset(DATA_DIR, annotation_file=ANNOTATION_FILE, task="Stuff",
  57. decode=True, shuffle=False)
  58. num_iter = 0
  59. image_shape = []
  60. segmentation = []
  61. iscrowd = []
  62. for data in data1.create_dict_iterator():
  63. image_shape.append(data["image"].shape)
  64. segmentation.append(data["segmentation"])
  65. iscrowd.append(data["iscrowd"])
  66. num_iter += 1
  67. assert num_iter == 6
  68. assert image_shape[0] == (2268, 4032, 3)
  69. assert image_shape[1] == (561, 595, 3)
  70. assert image_shape[2] == (607, 585, 3)
  71. assert image_shape[3] == (642, 675, 3)
  72. assert image_shape[4] == (2268, 4032, 3)
  73. assert image_shape[5] == (2268, 4032, 3)
  74. assert np.array_equal(np.array([[10., 12., 13., 14., 15., 16., 17., 18., 19., 20.],
  75. [70., 72., 73., 74., 75., -1., -1., -1., -1., -1.]]),
  76. segmentation[0])
  77. assert np.array_equal(np.array([[0], [0]]), iscrowd[0])
  78. assert np.array_equal(np.array([[20.0, 22.0, 23.0, 24.0, 25.0, 26.0, 27.0, 28.0, 29.0, 30.0, 31.0],
  79. [10.0, 12.0, 13.0, 14.0, 15.0, 16.0, 17.0, 18.0, 19.0, 20.0, -1.0]]),
  80. segmentation[1])
  81. assert np.array_equal(np.array([[0], [1]]), iscrowd[1])
  82. assert np.array_equal(np.array([[40., 42., 43., 44., 45., 46., 47., 48., 49., 40., 41., 42.]]), segmentation[2])
  83. assert np.array_equal(np.array([[0]]), iscrowd[2])
  84. assert np.array_equal(np.array([[50., 52., 53., 54., 55., 56., 57., 58., 59., 60., 61., 62., 63.]]),
  85. segmentation[3])
  86. assert np.array_equal(np.array([[0]]), iscrowd[3])
  87. assert np.array_equal(np.array([[60., 62., 63., 64., 65., 66., 67., 68., 69., 70., 71., 72., 73., 74.]]),
  88. segmentation[4])
  89. assert np.array_equal(np.array([[0]]), iscrowd[4])
  90. assert np.array_equal(np.array([[60., 62., 63., 64., 65., 66., 67.], [68., 69., 70., 71., 72., 73., 74.]]),
  91. segmentation[5])
  92. assert np.array_equal(np.array([[0]]), iscrowd[5])
  93. def test_coco_keypoint():
  94. data1 = ds.CocoDataset(DATA_DIR, annotation_file=KEYPOINT_FILE, task="Keypoint",
  95. decode=True, shuffle=False)
  96. num_iter = 0
  97. image_shape = []
  98. keypoints = []
  99. num_keypoints = []
  100. for data in data1.create_dict_iterator():
  101. image_shape.append(data["image"].shape)
  102. keypoints.append(data["keypoints"])
  103. num_keypoints.append(data["num_keypoints"])
  104. num_iter += 1
  105. assert num_iter == 2
  106. assert image_shape[0] == (2268, 4032, 3)
  107. assert image_shape[1] == (561, 595, 3)
  108. assert np.array_equal(np.array([[368., 61., 1., 369., 52., 2., 0., 0., 0., 382., 48., 2., 0., 0., 0., 368., 84., 2.,
  109. 435., 81., 2., 362., 125., 2., 446., 125., 2., 360., 153., 2., 0., 0., 0., 397.,
  110. 167., 1., 439., 166., 1., 369., 193., 2., 461., 234., 2., 361., 246., 2., 474.,
  111. 287., 2.]]), keypoints[0])
  112. assert np.array_equal(np.array([[14]]), num_keypoints[0])
  113. assert np.array_equal(np.array([[244., 139., 2., 0., 0., 0., 226., 118., 2., 0., 0., 0., 154., 159., 2., 143., 261.,
  114. 2., 135., 312., 2., 271., 423., 2., 184., 530., 2., 261., 280., 2., 347., 592., 2.,
  115. 0., 0., 0., 123., 596., 2., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0.]]),
  116. keypoints[1])
  117. assert np.array_equal(np.array([[10]]), num_keypoints[1])
  118. def test_coco_panoptic():
  119. data1 = ds.CocoDataset(DATA_DIR, annotation_file=PANOPTIC_FILE, task="Panoptic", decode=True, shuffle=False)
  120. num_iter = 0
  121. image_shape = []
  122. bbox = []
  123. category_id = []
  124. iscrowd = []
  125. area = []
  126. for data in data1.create_dict_iterator():
  127. image_shape.append(data["image"].shape)
  128. bbox.append(data["bbox"])
  129. category_id.append(data["category_id"])
  130. iscrowd.append(data["iscrowd"])
  131. area.append(data["area"])
  132. num_iter += 1
  133. assert num_iter == 2
  134. assert image_shape[0] == (2268, 4032, 3)
  135. assert np.array_equal(np.array([[472, 173, 36, 48], [340, 22, 154, 301], [486, 183, 30, 35]]), bbox[0])
  136. assert np.array_equal(np.array([[1], [1], [2]]), category_id[0])
  137. assert np.array_equal(np.array([[0], [0], [0]]), iscrowd[0])
  138. assert np.array_equal(np.array([[705], [14062], [626]]), area[0])
  139. assert image_shape[1] == (642, 675, 3)
  140. assert np.array_equal(np.array([[103, 133, 229, 422], [243, 175, 93, 164]]), bbox[1])
  141. assert np.array_equal(np.array([[1], [3]]), category_id[1])
  142. assert np.array_equal(np.array([[0], [0]]), iscrowd[1])
  143. assert np.array_equal(np.array([[43102], [6079]]), area[1])
  144. def test_coco_detection_classindex():
  145. data1 = ds.CocoDataset(DATA_DIR, annotation_file=ANNOTATION_FILE, task="Detection", decode=True)
  146. class_index = data1.get_class_indexing()
  147. assert class_index == {'person': [1], 'bicycle': [2], 'car': [3], 'cat': [4], 'dog': [5], 'monkey': [7]}
  148. num_iter = 0
  149. for _ in data1.__iter__():
  150. num_iter += 1
  151. assert num_iter == 6
  152. def test_coco_panootic_classindex():
  153. data1 = ds.CocoDataset(DATA_DIR, annotation_file=PANOPTIC_FILE, task="Panoptic", decode=True)
  154. class_index = data1.get_class_indexing()
  155. assert class_index == {'person': [1, 1], 'bicycle': [2, 1], 'car': [3, 1]}
  156. num_iter = 0
  157. for _ in data1.__iter__():
  158. num_iter += 1
  159. assert num_iter == 2
  160. def test_coco_case_0():
  161. data1 = ds.CocoDataset(DATA_DIR, annotation_file=ANNOTATION_FILE, task="Detection", decode=True)
  162. data1 = data1.shuffle(10)
  163. data1 = data1.batch(3, pad_info={})
  164. num_iter = 0
  165. for _ in data1.create_dict_iterator():
  166. num_iter += 1
  167. assert num_iter == 2
  168. def test_coco_case_1():
  169. data1 = ds.CocoDataset(DATA_DIR, annotation_file=ANNOTATION_FILE, task="Detection", decode=True)
  170. sizes = [0.5, 0.5]
  171. randomize = False
  172. dataset1, dataset2 = data1.split(sizes=sizes, randomize=randomize)
  173. num_iter = 0
  174. for _ in dataset1.create_dict_iterator():
  175. num_iter += 1
  176. assert num_iter == 3
  177. num_iter = 0
  178. for _ in dataset2.create_dict_iterator():
  179. num_iter += 1
  180. assert num_iter == 3
  181. def test_coco_case_2():
  182. data1 = ds.CocoDataset(DATA_DIR, annotation_file=ANNOTATION_FILE, task="Detection", decode=True)
  183. resize_op = vision.Resize((224, 224))
  184. data1 = data1.map(input_columns=["image"], operations=resize_op)
  185. data1 = data1.repeat(4)
  186. num_iter = 0
  187. for _ in data1.__iter__():
  188. num_iter += 1
  189. assert num_iter == 24
  190. def test_coco_case_exception():
  191. try:
  192. data1 = ds.CocoDataset("path_not_exist/", annotation_file=ANNOTATION_FILE, task="Detection")
  193. for _ in data1.__iter__():
  194. pass
  195. assert False
  196. except ValueError as e:
  197. assert "does not exist or permission denied" in str(e)
  198. try:
  199. data1 = ds.CocoDataset(DATA_DIR, annotation_file="./file_not_exist", task="Detection")
  200. for _ in data1.__iter__():
  201. pass
  202. assert False
  203. except ValueError as e:
  204. assert "does not exist or permission denied" in str(e)
  205. try:
  206. data1 = ds.CocoDataset(DATA_DIR, annotation_file=ANNOTATION_FILE, task="Invalid task")
  207. for _ in data1.__iter__():
  208. pass
  209. assert False
  210. except ValueError as e:
  211. assert "Invalid task type" in str(e)
  212. try:
  213. data1 = ds.CocoDataset(DATA_DIR, annotation_file=LACKOFIMAGE_FILE, task="Detection")
  214. for _ in data1.__iter__():
  215. pass
  216. assert False
  217. except RuntimeError as e:
  218. assert "Invalid node found in json" in str(e)
  219. try:
  220. data1 = ds.CocoDataset(DATA_DIR, annotation_file=INVALID_FILE, task="Detection")
  221. for _ in data1.__iter__():
  222. pass
  223. assert False
  224. except RuntimeError as e:
  225. assert "json.exception.parse_error" in str(e)
  226. if __name__ == '__main__':
  227. test_coco_detection()
  228. test_coco_stuff()
  229. test_coco_keypoint()
  230. test_coco_panoptic()
  231. test_coco_detection_classindex()
  232. test_coco_panootic_classindex()
  233. test_coco_case_0()
  234. test_coco_case_1()
  235. test_coco_case_2()
  236. test_coco_case_exception()