|
|
|
@@ -47,7 +47,9 @@ def add_and_remove_cv_file(): |
|
|
|
os.remove("{}.db".format(x)) if os.path.exists("{}.db".format(x)) else None |
|
|
|
writer = FileWriter(CV_FILE_NAME, FILES_NUM) |
|
|
|
data = get_data(CV_DIR_NAME) |
|
|
|
cv_schema_json = {"file_name": {"type": "string"}, "label": {"type": "int32"}, |
|
|
|
cv_schema_json = {"id": {"type": "int32"}, |
|
|
|
"file_name": {"type": "string"}, |
|
|
|
"label": {"type": "int32"}, |
|
|
|
"data": {"type": "bytes"}} |
|
|
|
writer.add_schema(cv_schema_json, "img_schema") |
|
|
|
writer.add_index(["file_name", "label"]) |
|
|
|
@@ -226,6 +228,24 @@ def test_cv_minddataset_blockreader_tutorial(add_and_remove_cv_file): |
|
|
|
num_iter += 1 |
|
|
|
assert num_iter == 20 |
|
|
|
|
|
|
|
def test_cv_minddataset_blockreader_some_field_not_in_index_tutorial(add_and_remove_cv_file): |
|
|
|
"""tutorial for cv minddataset.""" |
|
|
|
columns_list = ["id", "data", "label"] |
|
|
|
num_readers = 4 |
|
|
|
data_set = ds.MindDataset(CV_FILE_NAME + "0", columns_list, num_readers, shuffle=False, |
|
|
|
block_reader=True) |
|
|
|
assert data_set.get_dataset_size() == 10 |
|
|
|
repeat_num = 2 |
|
|
|
data_set = data_set.repeat(repeat_num) |
|
|
|
num_iter = 0 |
|
|
|
for item in data_set.create_dict_iterator(): |
|
|
|
logger.info("-------------- block reader repeat tow {} -----------------".format(num_iter)) |
|
|
|
logger.info("-------------- item[id]: {} ----------------------------".format(item["id"])) |
|
|
|
logger.info("-------------- item[label]: {} ----------------------------".format(item["label"])) |
|
|
|
logger.info("-------------- item[data]: {} -----------------------------".format(item["data"])) |
|
|
|
num_iter += 1 |
|
|
|
assert num_iter == 20 |
|
|
|
|
|
|
|
|
|
|
|
def test_cv_minddataset_reader_basic_tutorial(add_and_remove_cv_file): |
|
|
|
"""tutorial for cv minderdataset.""" |
|
|
|
@@ -359,13 +379,14 @@ def get_data(dir_name): |
|
|
|
lines = file_reader.readlines() |
|
|
|
|
|
|
|
data_list = [] |
|
|
|
for line in lines: |
|
|
|
for i, line in enumerate(lines): |
|
|
|
try: |
|
|
|
filename, label = line.split(",") |
|
|
|
label = label.strip("\n") |
|
|
|
with open(os.path.join(img_dir, filename), "rb") as file_reader: |
|
|
|
img = file_reader.read() |
|
|
|
data_json = {"file_name": filename, |
|
|
|
data_json = {"id": i, |
|
|
|
"file_name": filename, |
|
|
|
"data": img, |
|
|
|
"label": int(label)} |
|
|
|
data_list.append(data_json) |
|
|
|
|