Browse Source

Optimize interface performance needed when running

pull/1004/head
wxl 5 years ago
parent
commit
a197177a3c
1 changed files with 23 additions and 0 deletions
  1. +23
    -0
      ge/hybrid/model/hybrid_model_builder.cc

+ 23
- 0
ge/hybrid/model/hybrid_model_builder.cc View File

@@ -28,6 +28,8 @@
#include "graph/manager/graph_mem_allocator.h"
#include "graph/manager/host_mem_allocator.h"
#include "graph/utils/graph_utils.h"
#include "graph/utils/op_desc_utils.h"
#include "graph/utils/tensor_utils.h"
#include "hybrid/common/npu_memory_allocator.h"
#include "hybrid/node_executor/node_executor.h"

@@ -1530,6 +1532,27 @@ Status HybridModelBuilder::RecoverGraphUnknownFlag() {
break;
}
}
// for performance
for (auto &subgraph : root_graph->GetAllSubgraphs()) {
GE_CHECK_NOTNULL(sub_graph);
for (const auto &node : sub_graph->GetDirectNode()) {
auto op_desc = node->GetOpDesc();
GE_CHECK_NOTNULL(op_desc);
OpDescUtils::TransformRunAttrToMember(*op_desc);
for (auto &tensor_desc : op_desc->GetAllInputsDescPtr()) {
if (tensor_desc == nullptr) {
continue;
}
TensorUtils::TransformRunAttrToMember(*tensor_desc);
}
for (auto &tensor_desc : op_desc->GetAllOutputsDescPtr()) {
if (tensor_desc == nullptr) {
continue;
}
TensorUtils::TransformRunAttrToMember(*tensor_desc);
}
}
}
return SUCCESS;
}



Loading…
Cancel
Save