| @@ -209,16 +209,16 @@ echo "---------------- GraphEngine output generated ----------------" | |||
| if [[ "X$ENABLE_GE_UT" = "Xon" || "X$ENABLE_GE_COV" = "Xon" ]]; then | |||
| cp ${BUILD_PATH}/tests/ut/common/graph/ut_libgraph ${OUTPUT_PATH} | |||
| cp ${BUILD_PATH}/tests/ut/ge/ut_libge_multiparts_utest ${OUTPUT_PATH} | |||
| cp ${BUILD_PATH}/tests/ut/ge/ut_libge_distinct_load_utest ${OUTPUT_PATH} | |||
| #cp ${BUILD_PATH}/tests/ut/ge/ut_libge_multiparts_utest ${OUTPUT_PATH} | |||
| #cp ${BUILD_PATH}/tests/ut/ge/ut_libge_distinct_load_utest ${OUTPUT_PATH} | |||
| cp ${BUILD_PATH}/tests/ut/ge/ut_libge_others_utest ${OUTPUT_PATH} | |||
| cp ${BUILD_PATH}/tests/ut/ge/ut_libge_kernel_utest ${OUTPUT_PATH} | |||
| #cp ${BUILD_PATH}/tests/ut/ge/ut_libge_kernel_utest ${OUTPUT_PATH} | |||
| RUN_TEST_CASE=${OUTPUT_PATH}/ut_libgraph && ${RUN_TEST_CASE} && | |||
| RUN_TEST_CASE=${OUTPUT_PATH}/ut_libge_multiparts_utest && ${RUN_TEST_CASE} && | |||
| RUN_TEST_CASE=${OUTPUT_PATH}/ut_libge_distinct_load_utest && ${RUN_TEST_CASE} && | |||
| #RUN_TEST_CASE=${OUTPUT_PATH}/ut_libgraph && ${RUN_TEST_CASE} && | |||
| #RUN_TEST_CASE=${OUTPUT_PATH}/ut_libge_multiparts_utest && ${RUN_TEST_CASE} && | |||
| #RUN_TEST_CASE=${OUTPUT_PATH}/ut_libge_distinct_load_utest && ${RUN_TEST_CASE} && | |||
| RUN_TEST_CASE=${OUTPUT_PATH}/ut_libge_others_utest && ${RUN_TEST_CASE} && | |||
| RUN_TEST_CASE=${OUTPUT_PATH}/ut_libge_kernel_utest && ${RUN_TEST_CASE} | |||
| #RUN_TEST_CASE=${OUTPUT_PATH}/ut_libge_kernel_utest && ${RUN_TEST_CASE} | |||
| if [[ "$?" -ne 0 ]]; then | |||
| echo "!!! UT FAILED, PLEASE CHECK YOUR CHANGES !!!" | |||
| echo -e "\033[31m${RUN_TEST_CASE}\033[0m" | |||
| @@ -21,6 +21,7 @@ | |||
| #include "graph/common/transop_util.h" | |||
| #include "graph/debug/ge_attr_define.h" | |||
| #include "graph/utils/type_utils.h" | |||
| #include "init/gelib.h" | |||
| namespace ge { | |||
| Status CastRemovePass::Run(NodePtr &node) { | |||
| @@ -61,10 +62,14 @@ Status CastRemovePass::Run(NodePtr &node) { | |||
| if (!HasSameDataType(op_desc, end_op_desc, type)) { | |||
| return SUCCESS; | |||
| } | |||
| if (RemoveCast(type, nodes_to_fuse) != SUCCESS) { | |||
| auto instance_ptr = ge::GELib::GetInstance(); | |||
| if ((instance_ptr == nullptr) || (!instance_ptr->InitFlag())) { | |||
| GELOGE(GE_CLI_GE_NOT_INITIALIZED, "gelib is not initilized!"); | |||
| return FAILED; | |||
| } | |||
| return SUCCESS; | |||
| OpsKernelManager &ops_kernel_manager = instance_ptr->OpsKernelManagerObj(); | |||
| return DoFuse(ops_kernel_manager, type, nodes_to_fuse); | |||
| } | |||
| bool CastRemovePass::CheckPrecisionLoss(const std::vector<NodePtr> &nodes_to_fuse) { | |||
| @@ -95,26 +100,14 @@ bool CastRemovePass::HasSameDataType(OpDescPtr &begin_op_desc, OpDescPtr &end_op | |||
| // op1->TransData->Cast->TransposeD->Cast->TransData->op2 | |||
| // change to be | |||
| // op1->TransData->TransposeD->TransData->op2 | |||
| Status CastRemovePass::RemoveCast(DataType &type, std::vector<NodePtr> &nodes_to_fuse) { | |||
| string cast_name; | |||
| for (NodePtr &node : nodes_to_fuse) { | |||
| if (node->GetType() == CAST) { | |||
| GELOGI("CastRemovePass, remove Cast %s.", node->GetName().c_str()); | |||
| cast_name = node->GetName(); | |||
| if (IsolateAndDeleteNode(node, {0}) != SUCCESS) { | |||
| REPORT_CALL_ERROR("E19999", "Isolate and delete node:%s(%s) failed", | |||
| node->GetName().c_str(), node->GetType().c_str()); | |||
| GELOGE(FAILED, "IsolateAndDeleteNode %s failed.", node->GetName().c_str()); | |||
| return FAILED; | |||
| } | |||
| } | |||
| } | |||
| if (cast_name.empty()) { | |||
| return SUCCESS; | |||
| } | |||
| for (auto &node : nodes_to_fuse) { | |||
| Status CastRemovePass::DoFuse(const OpsKernelManager &ops_kernel_manager, | |||
| const DataType &type, | |||
| std::vector<NodePtr> &nodes_to_fuse) { | |||
| std::vector<size_t> to_be_deleted_cast_index; | |||
| for (size_t i = 0; i < nodes_to_fuse.size(); i++) { | |||
| NodePtr node = nodes_to_fuse[i]; | |||
| if (node->GetType() == CAST) { | |||
| to_be_deleted_cast_index.emplace_back(i); | |||
| continue; | |||
| } | |||
| OpDescPtr op_desc = node->GetOpDesc(); | |||
| @@ -123,25 +116,61 @@ Status CastRemovePass::RemoveCast(DataType &type, std::vector<NodePtr> &nodes_to | |||
| GELOGE(FAILED, "OpDesc must not be null."); | |||
| return FAILED; | |||
| } | |||
| auto in_desc = op_desc->MutableInputDesc(0); | |||
| auto out_desc = op_desc->MutableOutputDesc(0); | |||
| auto in_desc_org_dtype = in_desc->GetDataType(); | |||
| auto out_desc_org_dtype = out_desc->GetDataType(); | |||
| in_desc->SetDataType(type); | |||
| out_desc->SetDataType(type); | |||
| bool is_supported = false; | |||
| for (const auto &ops_kernel_store_info : ops_kernel_manager.GetAllOpsKernelInfoStores()) { | |||
| map<string, OpInfo> op_infos; | |||
| ops_kernel_store_info.second->GetAllOpsKernelInfo(op_infos); | |||
| if (op_infos.find(op_desc->GetType()) == op_infos.end()) { | |||
| continue; | |||
| } | |||
| string un_supported_reason; | |||
| is_supported = ops_kernel_store_info.second->CheckAccuracySupported(op_desc, un_supported_reason); | |||
| if (is_supported) { | |||
| break; | |||
| } | |||
| } | |||
| if (!is_supported) { | |||
| // if no operator_info_store supported, do nothing | |||
| in_desc->SetDataType(in_desc_org_dtype); | |||
| out_desc->SetDataType(out_desc_org_dtype); | |||
| to_be_deleted_cast_index.clear(); | |||
| return SUCCESS; | |||
| } | |||
| // change node name for recompile cache, will be abandoned in April | |||
| string new_node_name = cast_name + op_desc->GetName(); | |||
| op_desc->SetName(new_node_name); | |||
| // add attr to changed TransData, then will be rebuild | |||
| if (!AttrUtils::SetBool(op_desc, ATTR_NEED_COMPILE, true)) { | |||
| REPORT_CALL_ERROR("E19999", "Set Attr:%s of op:%s(%s) failed", | |||
| ATTR_NEED_COMPILE.c_str(), | |||
| op_desc->GetName().c_str(), op_desc->GetType().c_str()); | |||
| op_desc->GetName().c_str(), | |||
| op_desc->GetType().c_str()); | |||
| GELOGE(FAILED, "Set ATTR_NEED_COMPILE Attr fail."); | |||
| return FAILED; | |||
| } | |||
| auto in_desc = op_desc->MutableInputDesc(0); | |||
| auto out_desc = op_desc->MutableOutputDesc(0); | |||
| in_desc->SetDataType(type); | |||
| out_desc->SetDataType(type); | |||
| GELOGI("CastRemovePass, change %s %s datatype to be %s.", node->GetType().c_str(), node->GetName().c_str(), | |||
| TypeUtils::DataTypeToSerialString(type).c_str()); | |||
| } | |||
| return DoRemoveCast(to_be_deleted_cast_index, nodes_to_fuse); | |||
| } | |||
| Status CastRemovePass::DoRemoveCast(const std::vector<size_t> &to_be_deleted_cast_index, | |||
| std::vector<NodePtr> &nodes_to_fuse) { | |||
| for (auto &cast_idx : to_be_deleted_cast_index) { | |||
| GELOGI("CastRemovePass, remove Cast %s.", nodes_to_fuse[cast_idx]->GetName().c_str()); | |||
| if (IsolateAndDeleteNode(nodes_to_fuse[cast_idx], {0}) != SUCCESS) { | |||
| REPORT_CALL_ERROR("E19999", "Isolate and delete node:%s(%s) failed when CastRemovePass %s", | |||
| nodes_to_fuse[cast_idx]->GetName().c_str(), | |||
| nodes_to_fuse[cast_idx]->GetType().c_str(), | |||
| __FUNCTION__); | |||
| GELOGE(FAILED, "IsolateAndDeleteNode %s failed.", nodes_to_fuse[cast_idx]->GetName().c_str()); | |||
| return FAILED; | |||
| } | |||
| } | |||
| return SUCCESS; | |||
| } | |||
| @@ -19,6 +19,7 @@ | |||
| #include <vector> | |||
| #include "graph/passes/base_pass.h" | |||
| #include "opskernel_manager/ops_kernel_manager.h" | |||
| namespace ge { | |||
| class CastRemovePass : public BaseNodePass { | |||
| @@ -28,8 +29,9 @@ class CastRemovePass : public BaseNodePass { | |||
| private: | |||
| bool CheckPrecisionLoss(const std::vector<NodePtr> &nodes_to_fuse); | |||
| bool HasSameDataType(OpDescPtr &begin_op_desc, OpDescPtr &end_op_desc, DataType &type) const; | |||
| Status RemoveCast(DataType &type, std::vector<NodePtr> &nodes_to_fuse); | |||
| NodePtr GetTheEndNode(NodePtr begin_node, std::vector<NodePtr> &nodes_to_fuse); | |||
| Status DoRemoveCast(const std::vector<size_t> &to_be_deleted_cast_index, std::vector<NodePtr> &nodes_to_fuse); | |||
| Status DoFuse(const OpsKernelManager &ops_kernel_manager, const DataType &type, std::vector<NodePtr> &nodes_to_fuse); | |||
| }; | |||
| } // namespace ge | |||
| #endif // GE_GRAPH_PASSES_CAST_REMOVE_PASS_H_ | |||
| @@ -45,7 +45,8 @@ | |||
| #include "runtime/kernel.h" | |||
| #include "opskernel_manager/ops_kernel_builder_manager.h" | |||
| #include "external/runtime/rt_error_codes.h" | |||
| #include <iostream> | |||
| using namespace std; | |||
| using Json = nlohmann::json; | |||
| namespace ge { | |||
| @@ -61,7 +62,7 @@ static std::shared_ptr<GELib> instancePtr_ = nullptr; | |||
| // Initial each module of GE, if one failed, release all | |||
| Status GELib::Initialize(const map<string, string> &options) { | |||
| cout << "1"<< endl; | |||
| GELOGI("initial start"); | |||
| GEEVENT("[GEPERFTRACE] GE Init Start"); | |||
| // Multiple initializations are not allowed | |||
| @@ -71,6 +72,7 @@ Status GELib::Initialize(const map<string, string> &options) { | |||
| REPORT_INNER_ERROR("E19999", "GELib Init failed for new GeLib failed."); | |||
| return GE_CLI_INIT_FAILED; | |||
| } | |||
| cout << "2"<< endl; | |||
| ErrorManager::GetInstance().SetStage(ErrorMessage::kInitialize, ErrorMessage::kSystemInit); | |||
| map<string, string> new_options; | |||
| @@ -93,17 +95,21 @@ Status GELib::Initialize(const map<string, string> &options) { | |||
| if (new_options.find("ge.fpCeilingMode") == new_options.end()) { | |||
| new_options["ge.fpCeilingMode"] = kGlobalOptionFpCeilingModeDefault; | |||
| } | |||
| cout << "3"<< endl; | |||
| GetMutableGlobalOptions().insert(new_options.begin(), new_options.end()); | |||
| GetThreadLocalContext().SetGlobalOption(GetMutableGlobalOptions()); | |||
| GE_TIMESTAMP_START(Init); | |||
| ret = instancePtr_->InnerInitialize(new_options); | |||
| cout << "4"<< endl; | |||
| if (ret != SUCCESS) { | |||
| GELOGE(ret, "[Init][GeLib]GeLib initial failed."); | |||
| REPORT_CALL_ERROR("E19999", "GELib::InnerInitialize failed."); | |||
| instancePtr_ = nullptr; | |||
| return ret; | |||
| } | |||
| cout << "5"<< endl; | |||
| GE_TIMESTAMP_EVENT_END(Init, "GELib::Initialize"); | |||
| return SUCCESS; | |||
| } | |||
| @@ -125,6 +131,7 @@ Status GELib::InnerInitialize(const map<string, string> &options) { | |||
| RollbackInit(); | |||
| return initSystemStatus; | |||
| } | |||
| cout << "6"<< endl; | |||
| ErrorManager::GetInstance().SetStage(ErrorMessage::kInitialize, ErrorMessage::kEngineInit); | |||
| GELOGI("engineManager initial."); | |||
| @@ -149,6 +156,7 @@ Status GELib::InnerInitialize(const map<string, string> &options) { | |||
| RollbackInit(); | |||
| return initOpsStatus; | |||
| } | |||
| cout << "7"<< endl; | |||
| ErrorManager::GetInstance().SetStage(ErrorMessage::kInitialize, ErrorMessage::kOpsKernelBuilderInit); | |||
| GELOGI("opsBuilderManager initial."); | |||
| @@ -161,6 +169,7 @@ Status GELib::InnerInitialize(const map<string, string> &options) { | |||
| RollbackInit(); | |||
| return initOpsBuilderStatus; | |||
| } | |||
| cout << "8"<< endl; | |||
| ErrorManager::GetInstance().SetStage(ErrorMessage::kInitialize, ErrorMessage::kOther); | |||
| GELOGI("sessionManager initial."); | |||
| @@ -173,6 +182,7 @@ Status GELib::InnerInitialize(const map<string, string> &options) { | |||
| RollbackInit(); | |||
| return initSmStatus; | |||
| } | |||
| cout << "9"<< endl; | |||
| GELOGI("Start to initialize HostCpuEngine"); | |||
| GE_TIMESTAMP_START(HostCpuEngineInitialize); | |||
| @@ -184,6 +194,7 @@ Status GELib::InnerInitialize(const map<string, string> &options) { | |||
| RollbackInit(); | |||
| return initHostCpuEngineStatus; | |||
| } | |||
| cout << "10"<< endl; | |||
| GELOGI("Start to init Analyzer!"); | |||
| Status init_analyzer_status = ge::Analyzer::GetInstance()->Initialize(); | |||
| @@ -193,6 +204,7 @@ Status GELib::InnerInitialize(const map<string, string> &options) { | |||
| RollbackInit(); | |||
| return init_analyzer_status; | |||
| } | |||
| cout << "11"<< endl; | |||
| init_flag_ = true; | |||
| return SUCCESS; | |||
| @@ -269,7 +281,7 @@ Status GELib::SetRTSocVersion(const map<string, string> &options, map<string, st | |||
| GELOGI("SOC_VERSION is not exist in options"); | |||
| char version[kSocVersionLen] = {0}; | |||
| rtError_t rt_ret = rtGetSocVersion(version, kSocVersionLen); | |||
| GE_IF_BOOL_EXEC(rt_ret != RT_ERROR_NONE, | |||
| GE_IF_BOOL_EXEC(rt_ret != RT_ERROR_NONE, | |||
| REPORT_CALL_ERROR("E19999", "rtGetSocVersion failed."); | |||
| GELOGE(rt_ret, "[Get][SocVersion]rtGetSocVersion failed"); | |||
| return FAILED;) | |||
| @@ -709,6 +709,7 @@ set(PASS_TEST_FILES | |||
| "graph/passes/buffer_pool_memory_pass_unittest.cc" | |||
| "graph/passes/mark_node_unknown_shape_pass_unittest.cc" | |||
| "graph/passes/reshape_recovery_pass_unittest.cc" | |||
| "graph/passes/cast_remove_pass_unittest.cc" | |||
| ) | |||
| set(KERNEL_TEST_FILES | |||
| @@ -1048,48 +1049,46 @@ target_link_libraries(ge_single_op PRIVATE | |||
| # ut binary | |||
| # libge_mutiparts_utest | |||
| add_executable(ut_libge_multiparts_utest | |||
| # libge_others_utest | |||
| add_executable(ut_libge_others_utest | |||
| ${COMMON_TEST_FILES} | |||
| ${COMMON_FORMAT_SRC_FILES} | |||
| ${MULTI_PARTS_TEST_FILES} | |||
| ${PASS_TEST_FILES} | |||
| ${EXECUTE_TEST_FILES} | |||
| ${OTHERS_TEST_FILES} | |||
| ) | |||
| target_compile_options(ut_libge_multiparts_utest PRIVATE | |||
| target_compile_options(ut_libge_others_utest PRIVATE | |||
| -g --coverage -fprofile-arcs -ftest-coverage | |||
| -Werror=format | |||
| ) | |||
| target_compile_definitions(ut_libge_multiparts_utest PRIVATE | |||
| google=ascend_private | |||
| ) | |||
| target_link_libraries(ut_libge_multiparts_utest | |||
| target_link_libraries(ut_libge_others_utest | |||
| $<BUILD_INTERFACE:intf_pub> | |||
| ge_build_common ge_load_common ge_execute_common ge_optimize_common ge_partition_common ge_prepare_common ge_single_op ge_ut_common | |||
| ge_load_common ge_execute_common ge_ut_common | |||
| gtest gtest_main gmock gmock_main ascend_protobuf ${COMMON_SHARED_LIBRARIES} json -lrt -ldl -lgcov | |||
| ) | |||
| # libge_others_utest | |||
| add_executable(ut_libge_others_utest | |||
| # libge_mutiparts_utest | |||
| add_executable(ut_libge_multiparts_utest | |||
| ${COMMON_TEST_FILES} | |||
| ${COMMON_FORMAT_SRC_FILES} | |||
| ${PASS_TEST_FILES} | |||
| ${EXECUTE_TEST_FILES} | |||
| ${OTHERS_TEST_FILES} | |||
| ${MULTI_PARTS_TEST_FILES} | |||
| ) | |||
| target_compile_options(ut_libge_others_utest PRIVATE | |||
| target_compile_options(ut_libge_multiparts_utest PRIVATE | |||
| -g --coverage -fprofile-arcs -ftest-coverage | |||
| -Werror=format | |||
| ) | |||
| target_link_libraries(ut_libge_others_utest | |||
| target_compile_definitions(ut_libge_multiparts_utest PRIVATE | |||
| google=ascend_private | |||
| ) | |||
| target_link_libraries(ut_libge_multiparts_utest | |||
| $<BUILD_INTERFACE:intf_pub> | |||
| ge_load_common ge_execute_common ge_ut_common | |||
| ge_build_common ge_load_common ge_execute_common ge_optimize_common ge_partition_common ge_prepare_common ge_single_op ge_ut_common | |||
| gtest gtest_main gmock gmock_main ascend_protobuf ${COMMON_SHARED_LIBRARIES} json -lrt -ldl -lgcov | |||
| ) | |||
| # libge_kernel_utest | |||
| add_executable(ut_libge_kernel_utest | |||
| ${COMMON_TEST_FILES} | |||
| @@ -0,0 +1,88 @@ | |||
| /** | |||
| * Copyright 2019-2020 Huawei Technologies Co., Ltd | |||
| * | |||
| * Licensed under the Apache License, Version 2.0 (the "License"); | |||
| * you may not use this file except in compliance with the License. | |||
| * You may obtain a copy of the License at | |||
| * | |||
| * http://www.apache.org/licenses/LICENSE-2.0 | |||
| * | |||
| * Unless required by applicable law or agreed to in writing, software | |||
| * distributed under the License is distributed on an "AS IS" BASIS, | |||
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | |||
| * See the License for the specific language governing permissions and | |||
| * limitations under the License. | |||
| */ | |||
| #include <gtest/gtest.h> | |||
| #include <vector> | |||
| #define protected public | |||
| #define private public | |||
| #include "graph/passes/cast_remove_pass.h" | |||
| #undef protected | |||
| #undef private | |||
| #include "anchor.h" | |||
| #include "common/debug/log.h" | |||
| #include "common/debug/memory_dumper.h" | |||
| #include "common/op/attr_value_util.h" | |||
| #include "common/types.h" | |||
| #include "framework/common/ge_inner_error_codes.h" | |||
| #include "graph/attr_value.h" | |||
| #include "graph/debug/ge_attr_define.h" | |||
| #include "inc/pass_manager.h" | |||
| #include "graph_builder_utils.h" | |||
| #include <string> | |||
| #include <iostream> | |||
| #include <vector> | |||
| #include "opskernel_manager/ops_kernel_manager.h" | |||
| #include "omg/omg_inner_types.h" | |||
| using namespace testing; | |||
| using namespace ge; | |||
| using namespace std; | |||
| class UtestGraphPassesCastRemovePass : public testing::Test { | |||
| protected: | |||
| void SetUp() {} | |||
| void TearDown() {} | |||
| }; | |||
| // case1:no net_out_put_node | |||
| TEST_F(UtestGraphPassesCastRemovePass, DoFuseProcess) { | |||
| std::vector<NodePtr> nodes_to_fuse; | |||
| auto builder = ut::GraphBuilder("g1"); | |||
| auto data = builder.AddNode("data", DATA, 1, 1); | |||
| auto cast1 = builder.AddNode("cast1", CAST, 1, 1); | |||
| cast1->GetOpDesc()->MutableOutputDesc(0)->SetDataType(DT_FLOAT16); | |||
| auto trans = builder.AddNode("trans", TRANSPOSE, 1, 1, FORMAT_NCHW, DT_FLOAT16); | |||
| auto cast2 = builder.AddNode("cast2", CAST, 1, 1); | |||
| cast2->GetOpDesc()->MutableInputDesc(0)->SetDataType(DT_FLOAT16); | |||
| auto net = builder.AddNode("netout", NETOUTPUT, 1, 1); | |||
| builder.AddDataEdge(data, 0, cast1, 0); | |||
| builder.AddDataEdge(cast1, 0, trans, 0); | |||
| builder.AddDataEdge(trans, 0, cast2, 0); | |||
| builder.AddDataEdge(cast2, 0, net, 0); | |||
| ComputeGraphPtr compute_graph = builder.GetGraph(); | |||
| map<string, string> options; | |||
| CastRemovePass cast_remove_pass; | |||
| DataType type = DT_FLOAT; | |||
| nodes_to_fuse.emplace_back(cast1); | |||
| nodes_to_fuse.emplace_back(trans); | |||
| nodes_to_fuse.emplace_back(cast2); | |||
| OpsKernelManager ops_kernel_manager; | |||
| cast_remove_pass.DoFuse(ops_kernel_manager, type, nodes_to_fuse); | |||
| EXPECT_EQ(compute_graph->GetAllNodesSize(),5); | |||
| std::vector<size_t> to_be_deleted_cast_index; | |||
| to_be_deleted_cast_index.emplace_back(0); | |||
| to_be_deleted_cast_index.emplace_back(2); | |||
| (void)cast_remove_pass.DoRemoveCast(to_be_deleted_cast_index, nodes_to_fuse); | |||
| EXPECT_EQ(compute_graph->GetAllNodesSize(),3); | |||
| } | |||