| @@ -62,14 +62,12 @@ int CoderGraph::ConvertTensors() { | |||
| MS_CHECK_PTR_WITH_EXE(origin_tensor, clear_tensors()); | |||
| // tensor dims | |||
| std::vector<int> shape; | |||
| if (origin_tensor->nodeType() == NodeType_ValueNode) { | |||
| if (origin_tensor->dims() != nullptr) { | |||
| for (uint32_t j = 0; j < origin_tensor->dims()->size(); j++) { | |||
| MS_CHECK_PTR(origin_tensor->dims()->data()); | |||
| int dim = static_cast<int>(origin_tensor->dims()->data()[j]); | |||
| MS_CHECK_RET_CODE_WITH_EXE(check_dim(dim), "parse shape failed!", clear_tensors()); | |||
| shape.push_back(dim); | |||
| } | |||
| if (origin_tensor->dims() != nullptr) { | |||
| for (uint32_t j = 0; j < origin_tensor->dims()->size(); j++) { | |||
| MS_CHECK_PTR(origin_tensor->dims()->data()); | |||
| int dim = static_cast<int>(origin_tensor->dims()->data()[j]); | |||
| MS_CHECK_RET_CODE_WITH_EXE(check_dim(dim), "parse shape failed!", clear_tensors()); | |||
| shape.push_back(dim); | |||
| } | |||
| } | |||
| // tensor Datatype | |||
| @@ -130,8 +128,8 @@ int CoderGraph::InitGraphInOutTensors() { | |||
| for (uint32_t i = 0; i < in_node->input_indices_.size(); i++) { | |||
| auto in_tensor_index = size_t(in_node->input_indices_.at(i)); | |||
| bool is_graph_input = false; | |||
| for (uint32_t j = 0; j < model_->sub_graphs_.at(0)->input_indices_.size(); j++) { | |||
| if (in_tensor_index == size_t(model_->sub_graphs_.at(0)->input_indices_.at(j))) { | |||
| for (uint32_t j = 0; j < model_->input_indices_.size(); j++) { | |||
| if (in_tensor_index == size_t(model_->input_indices_.at(j))) { | |||
| input_indices.push_back(static_cast<uint32_t>(in_tensor_index)); | |||
| is_graph_input = true; | |||
| break; | |||
| @@ -155,8 +153,8 @@ int CoderGraph::InitGraphInOutTensors() { | |||
| for (uint32_t i = 0; i < out_node->output_indices_.size(); i++) { | |||
| auto out_tensor_index = size_t(out_node->output_indices_.at(i)); | |||
| bool is_graph_output = false; | |||
| for (uint32_t j = 0; j < model_->sub_graphs_.at(0)->output_indices_.size(); j++) { | |||
| if (out_tensor_index == size_t(model_->sub_graphs_.at(0)->output_indices_.at(j))) { | |||
| for (uint32_t j = 0; j < model_->output_indices_.size(); j++) { | |||
| if (out_tensor_index == size_t(model_->output_indices_.at(j))) { | |||
| output_indices.push_back(static_cast<uint32_t>(out_tensor_index)); | |||
| is_graph_output = true; | |||
| break; | |||
| @@ -117,6 +117,10 @@ class InnerKernel : public Kernel { | |||
| OpParameter *op_parameter() const { return op_parameter_; } | |||
| bool InferShapeDone() const { | |||
| if (std::any_of(in_tensors_.begin(), in_tensors_.end(), | |||
| [](lite::Tensor *input) { return input->data_type() == kObjectTypeTensorType; })) { | |||
| return false; | |||
| } | |||
| auto shape = out_tensors_.front()->shape(); | |||
| if (std::find(shape.begin(), shape.end(), -1) != shape.end()) { | |||
| return false; | |||
| @@ -15,11 +15,13 @@ | |||
| */ | |||
| #include <utility> | |||
| #include <algorithm> | |||
| #include "src/lite_mindrt.h" | |||
| #include "mindrt/include/mindrt.hpp" | |||
| #include "src/lite_kernel_util.h" | |||
| #include "nnacl/partial_fusion_parameter.h" | |||
| #include "src/common/tensor_util.h" | |||
| #include "src/runtime/inner_allocator.h" | |||
| #include "src/runtime/kernel/arm/base/partial_fusion.h" | |||
| #ifdef ENABLE_FP16 | |||
| #include "src/runtime/kernel/arm/fp16/fp16_op_handler.h" | |||
| #endif | |||
| @@ -55,11 +57,32 @@ void LiteOpActor::RunOpData(OpData<lite::Tensor> *inputs, OpContext<lite::Tensor | |||
| return; | |||
| } | |||
| bool IsOtherOutput(const std::vector<kernel::LiteKernel *> &kernels, const kernel::LiteKernel &this_kernel, | |||
| const lite::Tensor &this_input_tensor) { | |||
| for (auto &kernel : kernels) { | |||
| if (kernel == &this_kernel) { | |||
| continue; | |||
| } | |||
| if (std::any_of(kernel->out_tensors().begin(), kernel->out_tensors().end(), | |||
| [&this_input_tensor](lite::Tensor *tensor) { return tensor == &this_input_tensor; })) { | |||
| return true; | |||
| } | |||
| } | |||
| return false; | |||
| } | |||
| void LiteOpActor::IsolateInputData(std::vector<std::shared_ptr<LiteOpActor>> *actors) { | |||
| std::vector<kernel::LiteKernel *> kernels{}; | |||
| std::transform(actors->begin(), actors->end(), std::back_inserter(kernels), | |||
| [](std::shared_ptr<LiteOpActor> actor) { return actor->kernel_; }); | |||
| size_t in_tensor_size = kernel_->in_tensors().size(); | |||
| for (size_t i = 0; i < in_tensor_size; i++) { | |||
| Tensor *old_tensor = kernel_->in_tensors()[i]; | |||
| if (!IsOtherOutput(kernels, *kernel_, *old_tensor)) { | |||
| continue; | |||
| } | |||
| TypeId new_data_type = old_tensor->data_type(); | |||
| if (old_tensor->data_type() == kNumberTypeFloat16 || old_tensor->data_type() == kNumberTypeFloat32) { | |||
| new_data_type = kernel_->desc().data_type; | |||
| @@ -103,7 +126,6 @@ int LiteOpActor::LiteActorInit(std::vector<std::shared_ptr<LiteOpActor>> *actors | |||
| /* subgraph transaction isolation */ | |||
| IsolateInputData(actors); | |||
| return RET_OK; | |||
| } | |||
| @@ -169,9 +191,9 @@ int LiteOpActor::CompileArrowThroughPartialCall() { | |||
| continue; | |||
| } | |||
| partial_node_ = partial_node; | |||
| auto subgraph = reinterpret_cast<kernel::PartialFusionKernel *>(partial_node->kernel())->subgraph_kernel(); | |||
| auto out_actor_id = subgraph_to_actor_.at(subgraph); | |||
| auto partial_para = reinterpret_cast<PartialParameter *>(partial_node->op_parameter()); | |||
| auto out_actor_id = subgraph_index_to_actor.at(partial_para->sub_graph_index_); | |||
| kernel_->set_out_tensors(partial_node->in_tensors()); | |||
| for (size_t i = 0; i < partial_node->in_tensors().size(); ++i) { | |||
| auto arrow = std::make_shared<DataArrow>(i, out_actor_id, i); | |||
| @@ -209,45 +231,87 @@ int LiteOpActor::CompileArrow() { | |||
| return ret; | |||
| } | |||
| void LiteOpActor::MoveInputData(Tensor *dst_tensor, Tensor *src_tensor) { | |||
| void LiteOpActor::MoveTensorInputData(Tensor *dst_tensor, Tensor *src_tensor) { | |||
| MS_ASSERT(src_tensor != dst_tensor); | |||
| dst_tensor->FreeData(); | |||
| dst_tensor->ResetRefCount(); | |||
| if (src_tensor->allocator() == nullptr && !(src_tensor->IsConst()) && !(src_tensor->IsGraphInput())) { | |||
| // delegate graph kernel output tensor | |||
| dst_tensor->MallocData(); | |||
| memcpy(dst_tensor->data(), src_tensor->data(), src_tensor->Size()); | |||
| return; | |||
| } | |||
| dst_tensor->set_allocator(src_tensor->allocator()); | |||
| if (src_tensor->allocator() != nullptr) { | |||
| src_tensor->allocator()->IncRefCount(src_tensor->data(), dst_tensor->ref_count()); | |||
| } | |||
| // todo fix tensorlist | |||
| dst_tensor->set_data(src_tensor->MutableData()); /* using MutableData to sync GPU data */ | |||
| if (src_tensor->data_c() != nullptr) { | |||
| dst_tensor->set_data(src_tensor->MutableData()); /* using MutableData to sync GPU data */ | |||
| } | |||
| dst_tensor->set_own_data(src_tensor->own_data()); | |||
| if (src_tensor->IsConst() || src_tensor->IsGraphInput()) { | |||
| dst_tensor->set_own_data(false); | |||
| } else { | |||
| dst_tensor->set_own_data(true); | |||
| src_tensor->DecRefCount(); | |||
| } | |||
| } | |||
| void LiteOpActor::MoveTensorListInputData(TensorList *dst_tensorlist, TensorList *src_tensorlist) { | |||
| MS_ASSERT(src_tensorlist != nullptr); | |||
| MS_ASSERT(dst_tensorlist != nullptr); | |||
| dst_tensorlist->FreeData(); | |||
| dst_tensorlist->ResetRefCount(); | |||
| dst_tensorlist->set_allocator(src_tensorlist->allocator()); | |||
| auto src_tensorlist_tensors_size = src_tensorlist->tensors().size(); | |||
| auto dst_tensorlist_tensors_size = dst_tensorlist->tensors().size(); | |||
| if (src_tensorlist_tensors_size != dst_tensorlist_tensors_size) { | |||
| MS_LOG(ERROR) << "src tensorlist: " << src_tensorlist->tensor_name() | |||
| << " tesnors size: " << src_tensorlist_tensors_size | |||
| << " vs dst tensorlist: " << src_tensorlist->tensor_name() | |||
| << " tensors size: " << dst_tensorlist_tensors_size; | |||
| return; | |||
| } | |||
| dst_tensorlist->set_own_data(src_tensorlist->own_data()); | |||
| for (size_t i = 0; i < src_tensorlist_tensors_size; ++i) { | |||
| auto &src_tensor = src_tensorlist->tensors()[i]; | |||
| auto &dst_tensor = dst_tensorlist->tensors()[i]; | |||
| if (src_tensor->allocator() != nullptr) { | |||
| src_tensor->allocator()->IncRefCount(src_tensor->data(), dst_tensor->ref_count()); | |||
| } | |||
| dst_tensor->set_own_data(src_tensor->own_data()); | |||
| if (src_tensor->data_c() != nullptr) { | |||
| dst_tensor->set_data(src_tensor->MutableData()); /* using MutableData to sync GPU data */ | |||
| } | |||
| dst_tensor->set_shape(src_tensor->shape()); | |||
| } | |||
| if (src_tensorlist->IsConst() || src_tensorlist->IsGraphInput()) { | |||
| dst_tensorlist->set_own_data(false); | |||
| } else { | |||
| src_tensorlist->DecRefCount(); | |||
| } | |||
| } | |||
| void LiteOpActor::MoveInputData(Tensor *dst_tensor, Tensor *src_tensor) { | |||
| if (src_tensor == dst_tensor) { | |||
| MS_LOG(INFO) << "no need to move."; | |||
| return; | |||
| } | |||
| if (src_tensor->data_type() == kObjectTypeTensorType) { | |||
| MoveTensorListInputData(reinterpret_cast<TensorList *>(dst_tensor), reinterpret_cast<TensorList *>(src_tensor)); | |||
| } else { | |||
| MoveTensorInputData(dst_tensor, src_tensor); | |||
| } | |||
| return; | |||
| } | |||
| void LiteOpActor::CopyInputData(Tensor *dst_tensor, Tensor *src_tensor) { | |||
| dst_tensor->ResetRefCount(); | |||
| dst_tensor->MallocData(); | |||
| CastTensorData(dst_tensor, src_tensor); | |||
| src_tensor->DecRefCount(); | |||
| memcpy(dst_tensor->data(), src_tensor->data(), src_tensor->Size()); | |||
| } | |||
| int LiteOpActor::CastTensorData(Tensor *dst, Tensor *src) { | |||
| int LiteOpActor::CastInputData(Tensor *dst, Tensor *src) { | |||
| dst->ResetRefCount(); | |||
| dst->MallocData(); | |||
| #if defined(ENABLE_ARM) && defined(ENABLE_FP16) | |||
| if (dst->shape() != src->shape()) { | |||
| MS_LOG(ERROR) << "dst tensor: " << dst->tensor_name() << " shape: " << dst->shape() << " vs " | |||
| @@ -270,20 +334,53 @@ int LiteOpActor::CastTensorData(Tensor *dst, Tensor *src) { | |||
| } | |||
| return RET_OK; | |||
| #endif | |||
| src->DecRefCount(); | |||
| return RET_ERROR; | |||
| } | |||
| void LiteOpActor::SetInputShape() { | |||
| for (size_t i = 0; i < inputs_data_.size(); ++i) { | |||
| auto &input_tensor = kernel_->in_tensors()[i]; | |||
| if (input_tensor->shape() == inputs_data_[i]->shape()) { | |||
| continue; | |||
| } | |||
| MS_LOG(DEBUG) << "inputs_data_[" << i << "].shape: " << inputs_data_[i]->shape() << " vs kernel_->in_tensors()[" | |||
| << i << "].shape: " << kernel_->in_tensors()[i]->shape() << " are not equal."; | |||
| MS_LOG(DEBUG) << "this->kernel_->name(): " << this->kernel_->name(); | |||
| if (input_tensor->data_type() == kObjectTypeTensorType) { | |||
| auto input_tensorlist = reinterpret_cast<TensorList *>(input_tensor); | |||
| auto input_data_tensorlist = reinterpret_cast<TensorList *>(inputs_data_[i]); | |||
| input_tensorlist->FreeTensorListData(); | |||
| input_tensorlist->set_element_shape(input_data_tensorlist->element_shape()); | |||
| input_tensorlist->set_shape(input_data_tensorlist->shape()); | |||
| std::vector<std::vector<int>> tensor_shape{}; | |||
| std::transform(input_data_tensorlist->tensors().begin(), input_data_tensorlist->tensors().end(), | |||
| std::back_inserter(tensor_shape), [](Tensor *tensor_item) { return tensor_item->shape(); }); | |||
| input_tensorlist->MallocTensorListData(input_data_tensorlist->tensors_data_type(), tensor_shape); | |||
| } else { | |||
| input_tensor->set_shape(inputs_data_[i]->shape()); | |||
| input_tensor->set_format(inputs_data_[i]->format()); | |||
| } | |||
| } | |||
| } | |||
| int LiteOpActor::SetInputData() { | |||
| SetInputShape(); | |||
| for (size_t i = 0; i < inputs_data_.size(); ++i) { | |||
| auto dst_tensor = kernel_->in_tensors()[i]; | |||
| auto src_tensor = inputs_data_[i]; | |||
| /* infershape done in runtime */ | |||
| dst_tensor->set_shape(src_tensor->shape()); | |||
| dst_tensor->set_format(src_tensor->format()); | |||
| dst_tensor->ResetRefCount(); | |||
| if (dst_tensor->init_ref_count() == 0) { | |||
| src_tensor->DecRefCount(); | |||
| continue; | |||
| } | |||
| if (src_tensor->data_type() != dst_tensor->data_type()) { | |||
| CastInputData(dst_tensor, src_tensor); | |||
| } else if (src_tensor->allocator() == nullptr && !(src_tensor->IsConst()) && !(src_tensor->IsGraphInput()) && | |||
| src_tensor->own_data()) { | |||
| // delegate graph kernel output tensor | |||
| CopyInputData(dst_tensor, src_tensor); | |||
| } else { | |||
| MoveInputData(dst_tensor, src_tensor); | |||
| @@ -309,7 +406,6 @@ void LiteOpActor::SetOutputData(OpContext<Tensor> *context) { | |||
| int LiteOpActor::PrepareOutputData() { | |||
| outputs_data_.resize(output_data_arrows_.size()); | |||
| for (size_t i = 0; i < output_data_arrows_.size(); i++) { | |||
| auto &arrow = output_data_arrows_[i]; | |||
| auto data = std::make_shared<OpData<Tensor>>(arrow->to_op_id_, kernel_->out_tensors().at(arrow->from_output_index_), | |||
| @@ -319,58 +415,13 @@ int LiteOpActor::PrepareOutputData() { | |||
| return RET_OK; | |||
| } | |||
| std::vector<std::shared_ptr<LiteOpActor>> CreateOpActor(const std::vector<kernel::LiteKernel *> &kernels, | |||
| const lite::InnerContext *ctx) { | |||
| std::vector<std::shared_ptr<LiteOpActor>> actors; | |||
| std::unordered_map<size_t, AID> partial_map{}; | |||
| auto thread_pool = ctx->thread_pool(); | |||
| if (thread_pool == nullptr) { | |||
| MS_LOG(ERROR) << "thread pool is nullptr"; | |||
| return actors; | |||
| } | |||
| for (size_t i = 0; i < kernels.size(); ++i) { | |||
| if ((kernel::LiteKernelUtil::IsSwitchCall(kernels[i]))) { | |||
| auto switch_actor = std::make_shared<LiteSwitchOpActor>(kernels[i]); | |||
| if (switch_actor == nullptr) { | |||
| MS_LOG(ERROR) << "create LiteSwitchOpActor failed: " << kernels[i]->name(); | |||
| actors.clear(); | |||
| return actors; | |||
| } | |||
| switch_actor->set_thread_pool(thread_pool); | |||
| partial_map[i] = switch_actor->GetAID(); | |||
| actors.push_back(switch_actor); | |||
| } else { | |||
| auto actor = std::make_shared<LiteOpActor>(kernels[i]); | |||
| if (actor == nullptr) { | |||
| MS_LOG(ERROR) << "create LiteOpActor failed: " << kernels[i]->name(); | |||
| actors.clear(); | |||
| return actors; | |||
| } | |||
| actor->set_thread_pool(thread_pool); | |||
| partial_map[i] = actor->GetAID(); | |||
| actors.push_back(actor); | |||
| } | |||
| } | |||
| for (auto &actor : actors) { | |||
| actor->SetPartialMap(partial_map); | |||
| auto aid = mindspore::Spawn(actor); | |||
| } | |||
| return actors; | |||
| } | |||
| int LiteSwitchOpActor::CompileTrueBranchArrow() { | |||
| true_branch_output_data_arrows_.clear(); | |||
| if (true_partial_node_ == nullptr) { | |||
| MS_LOG(ERROR) << "true_partial_node_ is nullptr."; | |||
| return RET_NULL_PTR; | |||
| } | |||
| auto true_partial_para = reinterpret_cast<PartialParameter *>(true_partial_node_->op_parameter()); | |||
| if (true_partial_para == nullptr) { | |||
| MS_LOG(ERROR) << "true_partial_node_->op_parameter() is nullptr."; | |||
| return RET_NULL_PTR; | |||
| } | |||
| auto true_branch_actor_id = subgraph_index_to_actor.at(true_partial_para->sub_graph_index_); | |||
| auto subgraph = static_cast<kernel::PartialFusionKernel *>(true_partial_node_->kernel())->subgraph_kernel(); | |||
| auto true_branch_actor_id = subgraph_to_actor_.at(subgraph); | |||
| for (size_t i = 0; i < true_partial_node_->in_tensors().size(); ++i) { | |||
| int out_tensor_size = static_cast<int>(kernel_->out_tensors().size()); | |||
| @@ -390,17 +441,12 @@ int LiteSwitchOpActor::CompileTrueBranchArrow() { | |||
| } | |||
| int LiteSwitchOpActor::CompileFalseBranchArrow() { | |||
| false_branch_output_data_arrows_.clear(); | |||
| if (false_partial_node_ == nullptr) { | |||
| MS_LOG(ERROR) << "false_partial_node_ is nullptr."; | |||
| return RET_NULL_PTR; | |||
| } | |||
| auto false_partial_para = reinterpret_cast<PartialParameter *>(false_partial_node_->op_parameter()); | |||
| if (false_partial_para == nullptr) { | |||
| MS_LOG(ERROR) << "false_partial_para->op_parameter() is nullptr."; | |||
| return RET_NULL_PTR; | |||
| } | |||
| auto false_branch_actor_id = subgraph_index_to_actor.at(false_partial_para->sub_graph_index_); | |||
| auto subgraph = static_cast<kernel::PartialFusionKernel *>(false_partial_node_->kernel())->subgraph_kernel(); | |||
| auto false_branch_actor_id = subgraph_to_actor_.at(subgraph); | |||
| for (size_t i = 0; i < false_partial_node_->in_tensors().size(); ++i) { | |||
| int out_tensor_size = static_cast<int>(kernel_->out_tensors().size()); | |||
| @@ -430,21 +476,33 @@ int LiteSwitchOpActor::GetSwitchAndCallNode(kernel::SubGraphKernel *subgraph_ker | |||
| continue; | |||
| } | |||
| switch_node_ = switch_node; | |||
| if (switch_node->in_kernels().size() != kSwitchInputsSize) { | |||
| MS_LOG(ERROR) << "switch input size: " << switch_node->in_kernels().size(); | |||
| return RET_MEMORY_FAILED; | |||
| if (switch_node->in_kernels().size() == kSwitchMaxInputsSize) { | |||
| bool_node_ = switch_node->in_kernels().at(kSwitchCondInputIndex); | |||
| true_partial_node_ = switch_node->in_kernels().at(kSwitchTruePartialInputIndex); | |||
| false_partial_node_ = switch_node->in_kernels().at(kSwitchFalsePartialInputIndex); | |||
| } | |||
| if (switch_node->in_kernels().size() == kSwitchMinInputsSize) { | |||
| if (!switch_node->in_tensors()[0]->IsConst()) { | |||
| MS_LOG(ERROR) << "actor name: " << this->GetAID() << " ;s switch node " << switch_node->name() | |||
| << " input size: " << switch_node->in_kernels().size() | |||
| << " but switch_node->in_tensors()[0] is not const"; | |||
| return RET_MEMORY_FAILED; | |||
| } | |||
| true_partial_node_ = switch_node->in_kernels().at(kSwitchTruePartialInputIndex - 1); | |||
| false_partial_node_ = switch_node->in_kernels().at(kSwitchFalsePartialInputIndex - 1); | |||
| } | |||
| bool_node_ = switch_node->in_kernels().at(kSwitchCondInputIndex); | |||
| true_partial_node_ = switch_node->in_kernels().at(kSwitchTruePartialInputIndex); | |||
| false_partial_node_ = switch_node->in_kernels().at(kSwitchFalsePartialInputIndex); | |||
| break; | |||
| } | |||
| return RET_OK; | |||
| } | |||
| void LiteSwitchOpActor::AppendOutputTensors() { | |||
| output_tensors_.push_back(bool_node_->out_tensors().front()); | |||
| if (bool_node_ != nullptr) { | |||
| output_tensors_.push_back(bool_node_->out_tensors().front()); | |||
| } | |||
| for (auto &tensor : true_partial_node_->in_tensors()) { | |||
| if (std::find(output_tensors_.begin(), output_tensors_.end(), tensor) == output_tensors_.end()) { | |||
| output_tensors_.push_back(tensor); | |||
| @@ -518,16 +576,25 @@ int LiteSwitchOpActor::CompileArrow() { | |||
| } | |||
| int LiteSwitchOpActor::PrepareOutputData() { | |||
| for (auto &arrow : true_branch_output_data_arrows_) { | |||
| true_branch_outputs_data_.resize(true_branch_output_data_arrows_.size()); | |||
| for (size_t i = 0; i < true_branch_output_data_arrows_.size(); i++) { | |||
| auto &arrow = true_branch_output_data_arrows_[i]; | |||
| auto data = std::make_shared<OpData<Tensor>>(arrow->to_op_id_, kernel_->out_tensors().at(arrow->from_output_index_), | |||
| static_cast<int>(arrow->to_input_index_)); | |||
| true_branch_outputs_data_.emplace_back(data); | |||
| true_branch_outputs_data_.at(i) = data; | |||
| } | |||
| for (auto &arrow : false_branch_output_data_arrows_) { | |||
| false_branch_outputs_data_.resize(false_branch_output_data_arrows_.size()); | |||
| for (size_t i = 0; i < false_branch_output_data_arrows_.size(); i++) { | |||
| auto &arrow = false_branch_output_data_arrows_[i]; | |||
| auto data = std::make_shared<OpData<Tensor>>(arrow->to_op_id_, kernel_->out_tensors().at(arrow->from_output_index_), | |||
| static_cast<int>(arrow->to_input_index_)); | |||
| false_branch_outputs_data_.emplace_back(data); | |||
| auto iter = std::find_if(true_branch_outputs_data_.begin(), true_branch_outputs_data_.end(), | |||
| [&data](const auto &true_branch_data) { return true_branch_data->data_ == data->data_; }); | |||
| if (iter != true_branch_outputs_data_.end() && !data->data_->IsConst()) { | |||
| data->data_->set_init_ref_count(data->data_->init_ref_count() - 1); | |||
| } | |||
| false_branch_outputs_data_.at(i) = data; | |||
| } | |||
| return RET_OK; | |||
| } | |||
| @@ -548,6 +615,83 @@ void LiteSwitchOpActor::AsyncFalseBranchOutput(OpContext<Tensor> *context) { | |||
| } | |||
| } | |||
| void LiteSwitchOpActor::RunOpData(OpData<Tensor> *inputs, OpContext<Tensor> *context) { | |||
| auto op_uuid = context->sequential_num_; | |||
| input_op_datas_[op_uuid].push_back(inputs); | |||
| inputs_data_[inputs->index_] = inputs->data_; | |||
| if (input_op_datas_[op_uuid].size() < kernel_->in_tensors().size()) { | |||
| return; | |||
| } | |||
| int ret = SetInputData(); | |||
| if (ret != RET_OK) { | |||
| input_op_datas_.erase(op_uuid); | |||
| context->SetFailed(ret); | |||
| return; | |||
| } | |||
| ret = RunKernel(*(reinterpret_cast<const KernelCallBack *>(context->kernel_call_back_before_)), | |||
| *(reinterpret_cast<const KernelCallBack *>(context->kernel_call_back_after_))); | |||
| if (ret != RET_OK) { | |||
| input_op_datas_.erase(op_uuid); | |||
| context->SetFailed(ret); | |||
| return; | |||
| } | |||
| input_op_datas_.erase(op_uuid); | |||
| bool *cond = nullptr; | |||
| if (bool_node_ != nullptr) { | |||
| cond = reinterpret_cast<bool *>(output_tensors_[0]->data()); | |||
| } else { | |||
| cond = reinterpret_cast<bool *>(switch_node_->in_tensors()[0]->data()); | |||
| } | |||
| if (*cond) { | |||
| AsyncTrueBranchOutput(context); | |||
| } else { | |||
| AsyncFalseBranchOutput(context); | |||
| } | |||
| } | |||
| std::vector<std::shared_ptr<LiteOpActor>> CreateOpActor(const std::vector<kernel::LiteKernel *> &kernels, | |||
| const lite::InnerContext *ctx) { | |||
| std::vector<std::shared_ptr<LiteOpActor>> actors; | |||
| std::unordered_map<kernel::LiteKernel *, AID> subgraph_name_AID_map{}; | |||
| auto thread_pool = ctx->thread_pool(); | |||
| if (thread_pool == nullptr) { | |||
| MS_LOG(ERROR) << "thread pool is nullptr"; | |||
| return actors; | |||
| } | |||
| for (auto &kernel : kernels) { | |||
| if ((kernel::LiteKernelUtil::IsSwitchCall(kernel))) { | |||
| auto switch_actor = std::make_shared<LiteSwitchOpActor>(kernel); | |||
| if (switch_actor == nullptr) { | |||
| MS_LOG(ERROR) << "create LiteSwitchOpActor failed: " << kernel->name(); | |||
| actors.clear(); | |||
| return actors; | |||
| } | |||
| switch_actor->set_thread_pool(thread_pool); | |||
| subgraph_name_AID_map[kernel] = switch_actor->GetAID(); | |||
| actors.push_back(switch_actor); | |||
| } else { | |||
| auto actor = std::make_shared<LiteOpActor>(kernel); | |||
| if (actor == nullptr) { | |||
| MS_LOG(ERROR) << "create LiteOpActor failed: " << kernel->name(); | |||
| actors.clear(); | |||
| return actors; | |||
| } | |||
| actor->set_thread_pool(thread_pool); | |||
| subgraph_name_AID_map[kernel] = actor->GetAID(); | |||
| actors.push_back(actor); | |||
| } | |||
| } | |||
| for (auto &actor : actors) { | |||
| actor->SetSubgraphAIDMap(subgraph_name_AID_map); | |||
| auto aid = mindspore::Spawn(actor); | |||
| } | |||
| return actors; | |||
| } | |||
| int MindrtInit() { return mindspore::Initialize("tcp://127.0.0.1:8080", "", "", ""); } | |||
| void MindrtTerminate(const std::vector<std::shared_ptr<LiteOpActor>> &actor_list) { | |||
| @@ -27,11 +27,13 @@ | |||
| #include "async/future.h" | |||
| #include "src/sub_graph_kernel.h" | |||
| #include "src/cpu_info.h" | |||
| #include "src/tensorlist.h" | |||
| namespace mindspore::lite { | |||
| typedef enum { GRAPH, OP_BY_OP } MindRTMode; | |||
| const constexpr int kSwitchInputsSize = 3; | |||
| const constexpr int kSwitchMaxInputsSize = 3; | |||
| const constexpr int kSwitchMinInputsSize = 2; | |||
| const constexpr int kSwitchCondInputIndex = 0; | |||
| const constexpr int kSwitchTruePartialInputIndex = 1; | |||
| const constexpr int kSwitchFalsePartialInputIndex = 2; | |||
| @@ -53,7 +55,6 @@ class LiteOpActor : public OpActor<lite::Tensor> { | |||
| } | |||
| } | |||
| void RunOpData(OpData<lite::Tensor> *input_data, OpContext<lite::Tensor> *context = nullptr) override; | |||
| int CastTensorData(Tensor *dst, Tensor *src); | |||
| virtual int CompileArrow(); | |||
| int RunKernel(const KernelCallBack &before, const KernelCallBack &after) { | |||
| auto ret = kernel_->Execute(before, after); | |||
| @@ -69,9 +70,12 @@ class LiteOpActor : public OpActor<lite::Tensor> { | |||
| public: | |||
| void AddResultIndex(size_t index); | |||
| void SetPartialMap(const std::unordered_map<size_t, AID> &partial_map) { subgraph_index_to_actor = partial_map; } | |||
| void SetSubgraphAIDMap(const std::unordered_map<kernel::LiteKernel *, AID> &partial_map) { | |||
| subgraph_to_actor_ = partial_map; | |||
| } | |||
| protected: | |||
| void SetInputShape(); | |||
| int SetInputData(); | |||
| void SetOutputData(OpContext<Tensor> *context); | |||
| void AsyncOutput(OpContext<Tensor> *context); | |||
| @@ -81,19 +85,22 @@ class LiteOpActor : public OpActor<lite::Tensor> { | |||
| kernel::LiteKernel *kernel_; | |||
| std::vector<size_t> results_index_{}; | |||
| std::unordered_map<size_t, AID> subgraph_index_to_actor{}; | |||
| std::unordered_map<kernel::LiteKernel *, AID> subgraph_to_actor_{}; | |||
| std::vector<OpDataPtr<Tensor>> outputs_data_{}; | |||
| std::vector<Tensor *> inputs_data_{}; | |||
| std::unordered_map<Tensor *, Tensor *> isolate_input_map_{}; /* <calculate-tensor, src-input-tensor> */ | |||
| private: | |||
| void IsolateInputData(std::vector<std::shared_ptr<LiteOpActor>> *actors); | |||
| void MoveTensorInputData(Tensor *dst_tensor, Tensor *src_tensor); | |||
| void MoveTensorListInputData(TensorList *dst_tensor, TensorList *src_tensor); | |||
| void MoveInputData(Tensor *dst_tensor, Tensor *src_tensor); | |||
| void CopyInputData(Tensor *dst_tensor, Tensor *src_tensor); | |||
| int CastInputData(Tensor *dst_tensor, Tensor *src_tensor); | |||
| private: | |||
| kernel::LiteKernel *partial_node_ = nullptr; | |||
| kernel::LiteKernel *call_node_ = nullptr; | |||
| std::unordered_map<Tensor *, Tensor *> isolate_input_map_; /* <calculate-tensor, src-input-tensor> */ | |||
| #if defined(ENABLE_ARM) && defined(ENABLE_FP16) | |||
| bool support_fp16_ = false; | |||
| #endif | |||
| @@ -103,70 +110,18 @@ class LiteSwitchOpActor : public LiteOpActor { | |||
| public: | |||
| explicit LiteSwitchOpActor(kernel::LiteKernel *kernel) : LiteOpActor(kernel) {} | |||
| ~LiteSwitchOpActor() override = default; | |||
| void RunOpData(OpData<Tensor> *inputs, OpContext<Tensor> *context = nullptr) override { | |||
| auto op_uuid = context->sequential_num_; | |||
| input_op_datas_[op_uuid].push_back(inputs); | |||
| inputs_data_.push_back(inputs->data_); | |||
| if (input_op_datas_[op_uuid].size() < kernel_->in_tensors().size()) { | |||
| return; | |||
| } | |||
| auto ret = SetInputData(); | |||
| if (ret != RET_OK) { | |||
| input_op_datas_.erase(op_uuid); | |||
| context->SetFailed(ret); | |||
| return; | |||
| } | |||
| ret = RunKernel(*(reinterpret_cast<const KernelCallBack *>(context->kernel_call_back_before_)), | |||
| *(reinterpret_cast<const KernelCallBack *>(context->kernel_call_back_after_))); | |||
| if (ret != RET_OK) { | |||
| input_op_datas_.erase(op_uuid); | |||
| context->SetFailed(ret); | |||
| return; | |||
| } | |||
| input_op_datas_.erase(op_uuid); | |||
| inputs_data_.clear(); | |||
| bool *cond = reinterpret_cast<bool *>(output_tensors_[0]->data()); | |||
| if (*cond) { | |||
| for (auto &arrow : true_branch_output_data_arrows_) { | |||
| kernel_->out_tensors().at(arrow->from_output_index_)->IncRefCount(); | |||
| } | |||
| AsyncTrueBranchOutput(context); | |||
| } else { | |||
| for (auto &arrow : false_branch_output_data_arrows_) { | |||
| kernel_->out_tensors().at(arrow->from_output_index_)->IncRefCount(); | |||
| } | |||
| AsyncFalseBranchOutput(context); | |||
| } | |||
| } | |||
| void Init() override { | |||
| auto ret = CompileArrow(); | |||
| if (ret != RET_OK) { | |||
| MS_LOG(ERROR) << "CompileArrow failed, name: " << kernel_->name(); | |||
| // do not support return error | |||
| } | |||
| ret = PrepareOutputData(); | |||
| if (ret != RET_OK) { | |||
| MS_LOG(ERROR) << "PrepareOutputData failed, name: " << kernel_->name(); | |||
| // do not support return error | |||
| } | |||
| } | |||
| void RunOpData(OpData<Tensor> *inputs, OpContext<Tensor> *context = nullptr) override; | |||
| int CompileArrow() override; | |||
| int PrepareOutputData() override; | |||
| private: | |||
| void AsyncTrueBranchOutput(OpContext<Tensor> *context); | |||
| void AsyncFalseBranchOutput(OpContext<Tensor> *context); | |||
| int GetSwitchAndCallNode(kernel::SubGraphKernel *subgraph_kernel); | |||
| void AppendOutputTensors(); | |||
| int CompileTrueBranchArrow(); | |||
| int CompileFalseBranchArrow(); | |||
| int CompileArrowThroughSwitchCall(); | |||
| int PrepareOutputData() override; | |||
| std::vector<DataArrowPtr> true_branch_output_data_arrows_; | |||
| std::vector<DataArrowPtr> false_branch_output_data_arrows_; | |||
| @@ -118,10 +118,8 @@ int LiteSession::ConvertTensorsData(const lite::Model *model, size_t tensor_inde | |||
| lite::Tensor *dst_tensor) { | |||
| MS_ASSERT(src_tensor != nullptr); | |||
| MS_ASSERT(dst_tensor != nullptr); | |||
| auto src_category = TensorCategory(src_tensor); | |||
| if ((src_category == Tensor::Category::CONST_TENSOR || src_category == Tensor::Category::CONST_SCALAR) && | |||
| src_tensor->data() != nullptr && src_tensor->data()->size() > 0) { | |||
| if (src_tensor->dataType() == kObjectTypeTensorType) { | |||
| if (src_tensor->data() != nullptr && src_tensor->data()->size() > 0) { | |||
| if (dst_tensor->data_type() == kObjectTypeTensorType) { | |||
| auto tensor_list = reinterpret_cast<TensorList *>(dst_tensor); | |||
| if (tensor_list->Decode(reinterpret_cast<const int *>(src_tensor->data()->data())) != RET_OK) { | |||
| MS_LOG(ERROR) << "Decode tensorlist data failed"; | |||
| @@ -147,7 +145,7 @@ lite::Tensor *LiteSession::ConvertTensor(const schema::Tensor &src_tensor) { | |||
| if (src_tensor.dims() == nullptr) { | |||
| MS_LOG(DEBUG) << "Dims of src_tensor is nullptr"; | |||
| } | |||
| if (src_tensor.dims() != nullptr && src_category == Tensor::Category::CONST_TENSOR) { | |||
| if (src_tensor.dims() != nullptr) { | |||
| if (src_tensor.dataType() == kObjectTypeString && src_tensor.data() != nullptr) { | |||
| shape.push_back(src_tensor.data()->size()); | |||
| } else { | |||
| @@ -62,11 +62,15 @@ int KernelInferShape(const std::vector<lite::Tensor *> &inputs, const std::vecto | |||
| int KernelInferShape(const std::vector<lite::Tensor *> &inputs, const std::vector<lite::Tensor *> &outputs, | |||
| OpParameter *parameter) { | |||
| MS_ASSERT(parameter != nullptr); | |||
| std::vector<TensorC *> in_tensors; | |||
| std::vector<TensorC *> out_tensors; | |||
| int ret = 0; | |||
| ret = GenerateInTensorC(parameter, inputs, outputs, &in_tensors); | |||
| if (parameter->type_ == schema::PrimitiveType_PartialFusion || parameter->type_ == schema::PrimitiveType_Switch || | |||
| parameter->type_ == schema::PrimitiveType_Call) { | |||
| MS_LOG(INFO) << "no need infer shape."; | |||
| return RET_OK; | |||
| } | |||
| int ret = GenerateInTensorC(parameter, inputs, outputs, &in_tensors); | |||
| if (ret != RET_OK) { | |||
| FreeAllTensorC(&in_tensors); | |||
| return RET_ERROR; | |||
| @@ -32,8 +32,8 @@ class PartialFusionKernel : public InnerKernel { | |||
| int Init() override; | |||
| int ReSize() override; | |||
| int Run() override; | |||
| void SetSubgraph(LiteKernel *subgraph_kernel) { subgraph_kernel_ = subgraph_kernel; } | |||
| LiteKernel *GetSubgraph() { return subgraph_kernel_; } | |||
| void set_subgraph_kernel(LiteKernel *subgraph_kernel) { subgraph_kernel_ = subgraph_kernel; } | |||
| LiteKernel *subgraph_kernel() { return subgraph_kernel_; } | |||
| private: | |||
| LiteKernel *subgraph_kernel_ = nullptr; | |||
| @@ -99,6 +99,7 @@ int TensorListFromTensorCPUKernel::Run() { | |||
| out_ptr->set_data_type(dtype_); | |||
| in_data += data_offset; | |||
| } | |||
| output0->set_own_data(true); | |||
| output0->set_tensors_data_type(dtype_); | |||
| return RET_OK; | |||
| } | |||
| @@ -41,7 +41,6 @@ int TensorListSetItemCPUKernel::CheckParam() { | |||
| } | |||
| int TensorListSetItemCPUKernel::IncrementOutputSize(int origin_size) { | |||
| output0_ = reinterpret_cast<lite::TensorList *>(out_tensors_[0]); | |||
| int new_tensors_size = origin_size + 1; | |||
| output0_->set_shape({new_tensors_size}); | |||
| std::vector<std::vector<int>> out_shape; | |||
| @@ -56,15 +55,16 @@ int TensorListSetItemCPUKernel::IncrementOutputSize(int origin_size) { | |||
| int TensorListSetItemCPUKernel::Run() { | |||
| input0_ = reinterpret_cast<lite::TensorList *>(in_tensors_[0]); | |||
| output0_ = reinterpret_cast<lite::TensorList *>(out_tensors_[0]); | |||
| if (CheckParam() != RET_OK) { | |||
| MS_LOG(ERROR) << "check param failed."; | |||
| return RET_ERROR; | |||
| } | |||
| int dim0 = input0_->ElementsNum() - 1; | |||
| int dim0 = output0_->ElementsNum() - 1; | |||
| index_ = reinterpret_cast<int *>(in_tensors_[1]->data_c())[0]; | |||
| if (index_ < 0 || index_ > dim0) { | |||
| if (IncrementOutputSize(output0_->shape()[0]) != RET_OK) { | |||
| if (IncrementOutputSize(output0_->tensors().size()) != RET_OK) { | |||
| MS_LOG(ERROR) << "Resizeoutput Error ,index tensor:[" << index_ << "] must be in [0, " << dim0 << "]!"; | |||
| return RET_ERROR; | |||
| } | |||
| @@ -76,6 +76,7 @@ int TensorListSetItemCPUKernel::Run() { | |||
| } | |||
| output0_ = reinterpret_cast<lite::TensorList *>(out_tensors_[0]); | |||
| MS_ASSERT(output0_ != nullptr); | |||
| output0_->set_allocator(context_->allocator); | |||
| // new loop count | |||
| if (output0_->tensors().empty() && input0_->tensors().empty()) { | |||
| if (IncrementOutputSize(0) != RET_OK) { | |||
| @@ -88,11 +89,14 @@ int TensorListSetItemCPUKernel::Run() { | |||
| input0_->set_element_shape(input2_->shape()); | |||
| output0_->set_element_shape(input2_->shape()); | |||
| } | |||
| if (output0_->allocator() == nullptr) { | |||
| output0_->set_allocator(context_->allocator); | |||
| } | |||
| for (int i = 0; i < output0_->ElementsNum(); ++i) { | |||
| if (i == index_) { | |||
| auto dst = output0_->GetTensor(i); | |||
| if (dst == nullptr) { | |||
| dst = lite::Tensor::CopyTensor(*input2_, true); | |||
| dst = lite::Tensor::CopyTensor(*input2_, true, context_->allocator); | |||
| auto &tensors = output0_->tensors(); | |||
| tensors.emplace_back(dst); | |||
| } else { | |||
| @@ -100,8 +104,6 @@ int TensorListSetItemCPUKernel::Run() { | |||
| dst->set_shape(input2_->shape()); | |||
| dst->set_format(input2_->format()); | |||
| dst->set_category(input2_->category()); | |||
| dst->set_root_tensor(input2_->root_tensor()); | |||
| dst->set_tensor_name(input2_->tensor_name()); | |||
| dst->set_quant_clusters(input2_->quant_clusters()); | |||
| auto ret = lite::Tensor::CopyTensorData(*input2_, dst); | |||
| if (ret != RET_OK) { | |||
| @@ -115,7 +117,7 @@ int TensorListSetItemCPUKernel::Run() { | |||
| MS_ASSERT(src != nullptr); | |||
| // merge move data will delete tensors | |||
| if (dst == nullptr) { | |||
| dst = lite::Tensor::CopyTensor(*src, src->data_c() != nullptr); | |||
| dst = lite::Tensor::CopyTensor(*src, src->data_c() != nullptr, context_->allocator); | |||
| auto &tensors = output0_->tensors(); | |||
| tensors.emplace_back(dst); | |||
| continue; | |||
| @@ -135,6 +135,7 @@ int TensorListStackCPUKernel::MergeSubShape(const std::vector<int> &shape) { | |||
| } | |||
| int TensorListStackCPUKernel::Run() { | |||
| output0_ = out_tensors_[0]; | |||
| if (CheckParam() != RET_OK) { | |||
| MS_LOG(ERROR) << "CheckParam failed!"; | |||
| return RET_ERROR; | |||
| @@ -16,6 +16,7 @@ | |||
| #include "src/scheduler.h" | |||
| #include <map> | |||
| #include <set> | |||
| #include <queue> | |||
| #include <string> | |||
| #include <vector> | |||
| @@ -41,6 +42,7 @@ | |||
| #include "src/runtime/gpu/opencl/opencl_runtime.h" | |||
| #endif | |||
| #include "include/registry/kernel_interface.h" | |||
| #include "src/runtime/kernel/arm/base/partial_fusion.h" | |||
| namespace mindspore::lite { | |||
| namespace { | |||
| @@ -58,6 +60,40 @@ kernel::SubGraphKernel *CreateCustomSubGraph(std::vector<kernel::LiteKernel *> & | |||
| } | |||
| } // namespace | |||
| void Scheduler::SetSubgraphForPartialNode() { | |||
| for (auto &pair : partial_kernel_subgraph_index_map_) { | |||
| auto &partial_kernel = pair.first; | |||
| auto &subgraph_index = pair.second; | |||
| static_cast<kernel::PartialFusionKernel *>(partial_kernel->kernel()) | |||
| ->set_subgraph_kernel(subgraph_index_subgraph_kernel_map_.at(subgraph_index)); | |||
| } | |||
| } | |||
| int Scheduler::InitKernels(std::vector<kernel::LiteKernel *> dst_kernels) { | |||
| if (is_train_session_) { | |||
| return RET_OK; | |||
| } | |||
| for (auto kernel : dst_kernels) { | |||
| // delegate graph kernel | |||
| if (kernel->desc().delegate != nullptr) { | |||
| continue; | |||
| } | |||
| if (kernel->subgraph_type() == kernel::kNotSubGraph) { | |||
| MS_LOG(ERROR) << "construct subgraph failed."; | |||
| return RET_ERROR; | |||
| } | |||
| auto subgraph_nodes = reinterpret_cast<kernel::SubGraphKernel *>(kernel)->nodes(); | |||
| for (auto node : subgraph_nodes) { | |||
| auto ret = node->Init(); | |||
| if (ret != RET_OK) { | |||
| MS_LOG(ERROR) << "Kernel " << node->name() << " Init failed."; | |||
| return ret; | |||
| } | |||
| } | |||
| } | |||
| return RET_OK; | |||
| } | |||
| int Scheduler::Schedule(std::vector<kernel::LiteKernel *> *dst_kernels) { | |||
| if (dst_kernels == nullptr) { | |||
| return RET_ERROR; | |||
| @@ -85,12 +121,14 @@ int Scheduler::Schedule(std::vector<kernel::LiteKernel *> *dst_kernels) { | |||
| search_sub_graph.SubGraphSplit(); | |||
| } | |||
| int ret = ScheduleSubGraphToKernels(kMainSubGraphIndex, dst_kernels, nullptr, nullptr); | |||
| int ret = ScheduleGraphToKernels(dst_kernels); | |||
| op_parameters_.clear(); | |||
| if (ret != RET_OK) { | |||
| MS_LOG(ERROR) << "Schedule main subgraph to kernels failed."; | |||
| MS_LOG(ERROR) << "Schedule graph to kernels failed."; | |||
| return ret; | |||
| } | |||
| SetSubgraphForPartialNode(); | |||
| if (delegate_ != nullptr) { | |||
| ret = ReplaceDelegateKernels(dst_kernels); | |||
| if (ret != RET_OK) { | |||
| @@ -99,12 +137,6 @@ int Scheduler::Schedule(std::vector<kernel::LiteKernel *> *dst_kernels) { | |||
| } | |||
| } | |||
| FindAllInoutKernels(*dst_kernels); | |||
| ret = InitKernels(*dst_kernels); | |||
| if (ret != RET_OK) { | |||
| MS_LOG(ERROR) << "InitKernels failed."; | |||
| return ret; | |||
| } | |||
| auto src_kernel = *dst_kernels; | |||
| dst_kernels->clear(); | |||
| std::map<const kernel::LiteKernel *, bool> is_kernel_finish; | |||
| @@ -113,37 +145,14 @@ int Scheduler::Schedule(std::vector<kernel::LiteKernel *> *dst_kernels) { | |||
| MS_LOG(ERROR) << "ConstructSubGraphs failed."; | |||
| return ret; | |||
| } | |||
| MS_LOG(DEBUG) << "schedule kernels success."; | |||
| return RET_OK; | |||
| } | |||
| int Scheduler::InitKernels(std::vector<kernel::LiteKernel *> dst_kernels) { | |||
| if (is_train_session_) { | |||
| return RET_OK; | |||
| } | |||
| for (auto kernel : dst_kernels) { | |||
| if (kernel->subgraph_type() != kernel::kNotSubGraph) { | |||
| auto subgraph_nodes = reinterpret_cast<kernel::SubGraphKernel *>(kernel)->nodes(); | |||
| for (auto node : subgraph_nodes) { | |||
| auto ret = node->Init(); | |||
| if (ret != RET_OK) { | |||
| MS_LOG(ERROR) << "Kernel " << node->name() << " Init failed."; | |||
| return ret; | |||
| } | |||
| } | |||
| continue; | |||
| } | |||
| // delegate graph kernel | |||
| if (kernel->desc().delegate != nullptr) { | |||
| continue; | |||
| } | |||
| // origin inner kernel | |||
| auto ret = kernel->Init(); | |||
| if (ret != RET_OK) { | |||
| MS_LOG(ERROR) << "Kernel " << kernel->name() << " Init failed."; | |||
| return ret; | |||
| } | |||
| ret = InitKernels(*dst_kernels); | |||
| if (ret != RET_OK) { | |||
| MS_LOG(ERROR) << "InitKernels failed."; | |||
| return ret; | |||
| } | |||
| MS_LOG(DEBUG) << "schedule kernels success."; | |||
| return RET_OK; | |||
| } | |||
| @@ -225,9 +234,6 @@ int Scheduler::InferNodeShape(const lite::Model::Node *node) { | |||
| MS_ASSERT(node != nullptr); | |||
| auto primitive = node->primitive_; | |||
| MS_ASSERT(primitive != nullptr); | |||
| if (IsPartialNode(primitive)) { | |||
| return InferPartialShape(node); | |||
| } | |||
| std::vector<Tensor *> inputs; | |||
| std::vector<Tensor *> outputs; | |||
| FindNodeInoutTensors(*node, &inputs, &outputs); | |||
| @@ -252,7 +258,26 @@ int Scheduler::InferNodeShape(const lite::Model::Node *node) { | |||
| parameter->thread_num_ = context_->thread_num_; | |||
| op_parameters_[node->output_indices_.at(0)] = parameter; | |||
| if (IsCallNode(primitive)) { | |||
| return InferCallShape(node); | |||
| } | |||
| ret = KernelInferShape(inputs, outputs, parameter); | |||
| bool not_able_to_infer = false; | |||
| for (auto &input : inputs) { | |||
| if (input->data_type() == kObjectTypeTensorType) { | |||
| not_able_to_infer = true; | |||
| break; | |||
| } | |||
| } | |||
| if (not_able_to_infer) { | |||
| for (auto &output : outputs) { | |||
| output->set_shape({-1}); | |||
| } | |||
| return RET_INFER_INVALID; | |||
| } | |||
| if (ret == RET_OK) { | |||
| for (auto &output : outputs) { | |||
| if (output->ElementsNum() >= MAX_MALLOC_SIZE / static_cast<int>(sizeof(int64_t))) { | |||
| @@ -267,6 +292,66 @@ int Scheduler::InferNodeShape(const lite::Model::Node *node) { | |||
| return ret; | |||
| } | |||
| int Scheduler::RestoreSubGraphInput(const lite::Model::Node *partial_node) { | |||
| auto subgraph_index = GetPartialGraphIndex(partial_node->primitive_); | |||
| auto subgraph = src_model_->sub_graphs_.at(subgraph_index); | |||
| for (size_t i = 0; i < subgraph->input_indices_.size(); ++i) { | |||
| auto &subgraph_input = src_tensors_->at(subgraph->input_indices_[i]); | |||
| subgraph_input->set_data(nullptr); | |||
| } | |||
| return RET_OK; | |||
| } | |||
| void CopyTensorList(TensorList *dst_tensor, TensorList *src_tensor) { | |||
| dst_tensor->set_data_type(src_tensor->data_type()); | |||
| dst_tensor->set_format(src_tensor->format()); | |||
| dst_tensor->set_element_shape(src_tensor->element_shape()); | |||
| dst_tensor->set_shape(src_tensor->shape()); | |||
| std::vector<Tensor *> cpy_tensors{}; | |||
| for (auto &tensor : src_tensor->tensors()) { | |||
| auto new_tensor = Tensor::CopyTensor(*tensor, false); | |||
| cpy_tensors.push_back(new_tensor); | |||
| } | |||
| dst_tensor->set_tensors(cpy_tensors); | |||
| } | |||
| void CopyCommonTensor(Tensor *dst_tensor, Tensor *src_tensor) { | |||
| dst_tensor->set_data_type(src_tensor->data_type()); | |||
| dst_tensor->set_shape(src_tensor->shape()); | |||
| dst_tensor->set_format(src_tensor->format()); | |||
| dst_tensor->set_data(src_tensor->data()); | |||
| } | |||
| int Scheduler::CopyPartialShapeToSubGraph(const lite::Model::Node *partial_node) { | |||
| auto subgraph_index = GetPartialGraphIndex(partial_node->primitive_); | |||
| auto subgraph = src_model_->sub_graphs_.at(subgraph_index); | |||
| if (subgraph->input_indices_.size() != partial_node->input_indices_.size()) { | |||
| MS_LOG(ERROR) << "partial node " << partial_node->name_ << " inputs size: " << partial_node->input_indices_.size() | |||
| << " vs " | |||
| << " subgraph input size: " << subgraph->input_indices_.size(); | |||
| return RET_PARAM_INVALID; | |||
| } | |||
| for (size_t i = 0; i < partial_node->input_indices_.size(); ++i) { | |||
| auto &subgraph_input = src_tensors_->at(subgraph->input_indices_[i]); | |||
| auto &partial_input = src_tensors_->at(partial_node->input_indices_[i]); | |||
| switch (partial_input->data_type()) { | |||
| case kObjectTypeTensorType: { | |||
| auto partial_input_tensorlist = reinterpret_cast<TensorList *>(partial_input); | |||
| auto subgraph_input_tensorlist = reinterpret_cast<TensorList *>(subgraph_input); | |||
| CopyTensorList(subgraph_input_tensorlist, partial_input_tensorlist); | |||
| break; | |||
| } | |||
| default: { | |||
| CopyCommonTensor(subgraph_input, partial_input); | |||
| break; | |||
| } | |||
| } | |||
| } | |||
| return RET_OK; | |||
| } | |||
| int Scheduler::InferPartialShape(const lite::Model::Node *node) { | |||
| MS_ASSERT(src_model_ != nullptr); | |||
| MS_ASSERT(node != nullptr); | |||
| @@ -274,7 +359,96 @@ int Scheduler::InferPartialShape(const lite::Model::Node *node) { | |||
| MS_LOG(ERROR) << "Node is not a partial"; | |||
| return RET_PARAM_INVALID; | |||
| } | |||
| return InferSubGraphShape(GetPartialGraphIndex(node->primitive_)); | |||
| CopyPartialShapeToSubGraph(node); | |||
| int subgraph_index = GetPartialGraphIndex(node->primitive_); | |||
| auto ret = InferSubGraphShape(subgraph_index); | |||
| if (ret != RET_OK) { | |||
| MS_LOG(WARNING) << "infer subgraph: " << subgraph_index << " failed, ret:" << ret; | |||
| } | |||
| RestoreSubGraphInput(node); | |||
| return ret; | |||
| } | |||
| int Scheduler::InferSwitchShape(const lite::Model::Node *switch_node) { | |||
| MS_ASSERT(src_model_ != nullptr); | |||
| MS_ASSERT(switch_node != nullptr); | |||
| if (!IsSwitchNode(switch_node->primitive_)) { | |||
| MS_LOG(ERROR) << "Node is not a switch"; | |||
| return RET_PARAM_INVALID; | |||
| } | |||
| std::deque<lite::Model::Node *> partial_cnode_to_infer{}; | |||
| auto true_branch_output_index = switch_node->input_indices_.at(1); | |||
| auto false_branch_output_index = switch_node->input_indices_.at(2); | |||
| for (auto &node : src_model_->all_nodes_) { | |||
| if ((IsContain(node->output_indices_, true_branch_output_index) || | |||
| IsContain(node->output_indices_, false_branch_output_index)) && | |||
| IsPartialNode(node->primitive_) && partial_cnode_inferred_.find(node) == partial_cnode_inferred_.end()) { | |||
| partial_cnode_inferred_.insert(node); | |||
| partial_cnode_to_infer.push_back(node); | |||
| } | |||
| } | |||
| while (!partial_cnode_to_infer.empty()) { | |||
| auto &node = partial_cnode_to_infer.front(); | |||
| partial_cnode_to_infer.pop_front(); | |||
| int ret = InferPartialShape(node); | |||
| if (ret != RET_OK) { | |||
| MS_LOG(WARNING) << "partial infer not ok, ret: " << ret; | |||
| } | |||
| } | |||
| return RET_OK; | |||
| } | |||
| Model::Node *Scheduler::NodeInputIsPartial(const lite::Model::Node *node) { | |||
| MS_ASSERT(src_model_ != nullptr); | |||
| MS_ASSERT(node != nullptr); | |||
| for (auto &iter : src_model_->all_nodes_) { | |||
| if (iter->output_indices_ == node->input_indices_) { | |||
| if (IsPartialNode(iter->primitive_)) { | |||
| return iter; | |||
| } else { | |||
| return nullptr; | |||
| } | |||
| } | |||
| } | |||
| return nullptr; | |||
| } | |||
| Model::Node *Scheduler::NodeInputIsSwitch(const lite::Model::Node *node) { | |||
| MS_ASSERT(src_model_ != nullptr); | |||
| MS_ASSERT(node != nullptr); | |||
| for (auto &iter : src_model_->all_nodes_) { | |||
| if (iter->output_indices_ == node->input_indices_) { | |||
| if (IsSwitchNode(iter->primitive_)) { | |||
| return iter; | |||
| } else { | |||
| return nullptr; | |||
| } | |||
| } | |||
| } | |||
| return nullptr; | |||
| } | |||
| int Scheduler::InferCallShape(const lite::Model::Node *node) { | |||
| MS_ASSERT(src_model_ != nullptr); | |||
| MS_ASSERT(node != nullptr); | |||
| if (!IsCallNode(node->primitive_)) { | |||
| MS_LOG(ERROR) << "Node is not a call cnode"; | |||
| return RET_PARAM_INVALID; | |||
| } | |||
| auto partial_input = NodeInputIsPartial(node); | |||
| if (partial_input) { | |||
| return InferPartialShape(partial_input); | |||
| } | |||
| auto switch_input = NodeInputIsSwitch(node); | |||
| if (switch_input) { | |||
| return InferSwitchShape(switch_input); | |||
| } | |||
| MS_LOG(ERROR) << "call input is not partial and also not switch."; | |||
| return RET_ERROR; | |||
| } | |||
| int Scheduler::InferSubGraphShape(size_t subgraph_index) { | |||
| @@ -664,6 +838,31 @@ kernel::LiteKernel *Scheduler::SchedulePartialToKernel(const lite::Model::Node * | |||
| return subgraph; | |||
| } | |||
| std::vector<kernel::LiteKernel *> Scheduler::ScheduleSubGraphToSubGraphKernels(const int &subgraph_index) { | |||
| std::vector<kernel::LiteKernel *> kernels; | |||
| std::vector<lite::Tensor *> in_tensors; | |||
| std::vector<lite::Tensor *> out_tensors; | |||
| auto ret = ScheduleSubGraphToKernels(subgraph_index, &kernels, &in_tensors, &out_tensors); | |||
| if (ret != RET_OK) { | |||
| MS_LOG(ERROR) << "Schedule subgraph failed, index: " << subgraph_index; | |||
| return {}; | |||
| } | |||
| if (subgraph_index != kMainSubGraphIndex) { | |||
| FindAllInoutKernels(kernels); | |||
| auto cur_sub_graph_type = mindspore::lite::Scheduler::GetKernelSubGraphType(kernels.front()); | |||
| MS_LOG(INFO) << "cur_sub_graph_type: " << cur_sub_graph_type; | |||
| auto subgraph_kernel = CreateSubGraphKernel(kernels, &in_tensors, &out_tensors, cur_sub_graph_type); | |||
| if (subgraph_kernel == nullptr) { | |||
| MS_LOG(ERROR) << "CreateSubGraphKernel failed, cur_sub_graph_type: " << cur_sub_graph_type; | |||
| return {}; | |||
| } | |||
| subgraph_index_subgraph_kernel_map_[subgraph_index] = subgraph_kernel; | |||
| kernels = {subgraph_kernel}; | |||
| } | |||
| return kernels; | |||
| } | |||
| kernel::LiteKernel *Scheduler::ScheduleNodeToKernel(const lite::Model::Node *src_node, TypeId prefer_data_type) { | |||
| std::vector<Tensor *> inputs; | |||
| std::vector<Tensor *> outputs; | |||
| @@ -679,6 +878,43 @@ kernel::LiteKernel *Scheduler::ScheduleNodeToKernel(const lite::Model::Node *src | |||
| return kernel; | |||
| } | |||
| bool Scheduler::SubGraphHasScheduled(const int &index) { | |||
| return scheduled_subgraph_index_.find(index) != scheduled_subgraph_index_.end(); | |||
| } | |||
| void Scheduler::SubGraphMarkScheduled(const int &index) { scheduled_subgraph_index_.insert(index); } | |||
| bool Scheduler::IsControlFlowPattern(const lite::Model::Node &partial_node) { | |||
| lite::Model::Node *partial_node_output = nullptr; | |||
| for (auto output_index : partial_node.output_indices_) { | |||
| for (auto &node : src_model_->all_nodes_) { | |||
| if (IsContain(node->input_indices_, output_index)) { | |||
| partial_node_output = node; | |||
| break; | |||
| } | |||
| } | |||
| } | |||
| return partial_node_output == nullptr | |||
| ? false | |||
| : (IsCallNode(partial_node_output->primitive_) || IsSwitchNode(partial_node_output->primitive_)); | |||
| } | |||
| int Scheduler::ScheduleGraphToKernels(std::vector<kernel::LiteKernel *> *dst_kernels, TypeId prefer_data_type) { | |||
| subgraphs_to_schedule_.push_back(kMainSubGraphIndex); | |||
| while (!subgraphs_to_schedule_.empty()) { | |||
| auto cur_subgraph_index = subgraphs_to_schedule_.front(); | |||
| subgraphs_to_schedule_.pop_front(); | |||
| auto kernels = ScheduleSubGraphToSubGraphKernels(cur_subgraph_index); | |||
| if (kernels.empty()) { | |||
| MS_LOG(ERROR) << "ScheduleSubGraphToSubGraphKernel failed"; | |||
| return RET_ERROR; | |||
| } | |||
| std::copy(kernels.begin(), kernels.end(), std::back_inserter(*dst_kernels)); | |||
| } | |||
| return RET_OK; | |||
| } | |||
| int Scheduler::ScheduleSubGraphToKernels(size_t subgraph_index, std::vector<kernel::LiteKernel *> *dst_kernels, | |||
| std::vector<lite::Tensor *> *in_tensors, | |||
| std::vector<lite::Tensor *> *out_tensors, TypeId prefer_data_type) { | |||
| @@ -696,9 +932,23 @@ int Scheduler::ScheduleSubGraphToKernels(size_t subgraph_index, std::vector<kern | |||
| MS_ASSERT(primitive != nullptr); | |||
| kernel::LiteKernel *kernel = nullptr; | |||
| auto prim_type = GetPrimitiveType(primitive); | |||
| if (IsPartialNode(primitive)) { // sub_graph | |||
| kernel = SchedulePartialToKernel(node); | |||
| } else { // kernel | |||
| if (IsPartialNode(primitive)) { | |||
| if (IsControlFlowPattern(*node)) { | |||
| kernel = ScheduleNodeToKernel(node, prefer_data_type); | |||
| auto partial_subgraph_index = GetPartialGraphIndex(primitive); | |||
| if (SubGraphHasScheduled(partial_subgraph_index)) { | |||
| partial_kernel_subgraph_index_map_[kernel] = partial_subgraph_index; | |||
| MS_LOG(INFO) << "subgraph has scheduled. "; | |||
| } else { | |||
| SubGraphMarkScheduled(partial_subgraph_index); | |||
| partial_kernel_subgraph_index_map_[kernel] = partial_subgraph_index; | |||
| subgraphs_to_schedule_.push_back(partial_subgraph_index); | |||
| } | |||
| } else { | |||
| kernel = SchedulePartialToKernel(node); | |||
| } | |||
| } else { | |||
| kernel = ScheduleNodeToKernel(node, prefer_data_type); | |||
| } | |||
| if (kernel == nullptr || ret != RET_OK) { | |||
| @@ -719,7 +969,7 @@ int Scheduler::ScheduleSubGraphToKernels(size_t subgraph_index, std::vector<kern | |||
| [&](const uint32_t index) { return this->src_tensors_->at(index); }); | |||
| } | |||
| return RET_OK; | |||
| } | |||
| } // namespace mindspore::lite | |||
| bool Scheduler::KernelFitCurrentSubGraph(const kernel::SubGraphType subgraph_type, const kernel::LiteKernel &kernel) { | |||
| switch (subgraph_type) { | |||
| @@ -760,11 +1010,6 @@ std::vector<kernel::LiteKernel *> Scheduler::FindAllSubGraphKernels( | |||
| for (kernel::LiteKernel *head_kernel : head_kernels) { | |||
| MS_ASSERT(head_kernel != nullptr); | |||
| MS_ASSERT(sinked_kernel_map != nullptr); | |||
| if (head_kernel->type() == schema::PrimitiveType_Switch || head_kernel->type() == schema::PrimitiveType_Merge) { | |||
| (*sinked_kernel_map)[head_kernel] = true; | |||
| sub_kernels.emplace_back(head_kernel); | |||
| return sub_kernels; | |||
| } | |||
| std::queue<kernel::LiteKernel *> kernel_queue; | |||
| kernel_queue.emplace(head_kernel); | |||
| auto cur_sub_graph_type = mindspore::lite::Scheduler::GetKernelSubGraphType(head_kernel); | |||
| @@ -775,8 +1020,7 @@ std::vector<kernel::LiteKernel *> Scheduler::FindAllSubGraphKernels( | |||
| sub_kernels.emplace_back(cur_kernel); | |||
| auto post_kernels = cur_kernel->out_kernels(); | |||
| for (auto post_kernel : post_kernels) { | |||
| if (post_kernel->subgraph_type() != kernel::kNotSubGraph || | |||
| post_kernel->type() == schema::PrimitiveType_Merge || post_kernel->type() == schema::PrimitiveType_Switch) { | |||
| if (post_kernel->subgraph_type() != kernel::kNotSubGraph) { | |||
| continue; | |||
| } | |||
| if (cur_sub_graph_type == mindspore::lite::Scheduler::GetKernelSubGraphType(post_kernel)) { | |||
| @@ -973,7 +1217,7 @@ TypeId Scheduler::GetFirstFp32Fp16OrInt8Type(const std::vector<Tensor *> &in_ten | |||
| } | |||
| if (dtype == kObjectTypeTensorType) { | |||
| auto tensor_list = reinterpret_cast<TensorList *>(tensor); | |||
| auto tensor_list_dtype = tensor_list->data_type(); | |||
| auto tensor_list_dtype = tensor_list->tensors_data_type(); | |||
| if (tensor_list_dtype == kNumberTypeFloat32 || tensor_list_dtype == kNumberTypeFloat16 || | |||
| tensor_list_dtype == kNumberTypeInt8 || tensor_list_dtype == kNumberTypeInt32 || | |||
| tensor_list_dtype == kNumberTypeBool) { | |||
| @@ -986,7 +1230,7 @@ TypeId Scheduler::GetFirstFp32Fp16OrInt8Type(const std::vector<Tensor *> &in_ten | |||
| } | |||
| } | |||
| MS_ASSERT(!in_tensors.empty()); | |||
| return in_tensors[0]->data_type(); | |||
| return in_tensors[0]->data_type() == kObjectTypeTensorType ? kNumberTypeFloat32 : in_tensors[0]->data_type(); | |||
| } | |||
| void Scheduler::SetKernelTensorDataType(kernel::LiteKernel *kernel) { | |||
| @@ -1,5 +1,5 @@ | |||
| /** | |||
| * Copyright 2020 Huawei Technologies Co., Ltd | |||
| * Copyright 2020-2021 Huawei Technologies Co., Ltd | |||
| * | |||
| * Licensed under the Apache License, Version 2.0 (the "License"); | |||
| * you may not use this file except in compliance with the License. | |||
| @@ -21,6 +21,9 @@ | |||
| #include <vector> | |||
| #include <memory> | |||
| #include <map> | |||
| #include <deque> | |||
| #include <unordered_map> | |||
| #include <set> | |||
| #include "src/sub_graph_kernel.h" | |||
| #include "src/inner_context.h" | |||
| #include "include/model.h" | |||
| @@ -39,25 +42,22 @@ class Scheduler { | |||
| is_train_session_(is_train_session), | |||
| delegate_(delegate) {} | |||
| ~Scheduler() = default; | |||
| int Schedule(std::vector<kernel::LiteKernel *> *dst_kernels); | |||
| void SetupSchedulerCb(std::unique_ptr<SchedulerCb> cb) { sched_cb_ = std::move(cb); } | |||
| private: | |||
| void FindNodeInoutTensors(const lite::Model::Node &node, std::vector<Tensor *> *inputs, | |||
| std::vector<Tensor *> *outputs); | |||
| // infer shape for a partial node | |||
| int InferPartialShape(const lite::Model::Node *node); | |||
| // infer shape for a node | |||
| int InferNodeShape(const lite::Model::Node *node); | |||
| // infer shape for a subgraph | |||
| void FindNodeInoutTensors(const Model::Node &node, std::vector<Tensor *> *inputs, std::vector<Tensor *> *outputs); | |||
| Model::Node *NodeInputIsPartial(const Model::Node *node); | |||
| int InferPartialShape(const Model::Node *node); | |||
| Model::Node *NodeInputIsSwitch(const Model::Node *node); | |||
| int InferSwitchShape(const Model::Node *node); | |||
| int InferCallShape(const Model::Node *node); | |||
| int InferNodeShape(const Model::Node *node); | |||
| int InferSubGraphShape(size_t subgraph_index); | |||
| // schedule a node to kernel according to context and kernels registered | |||
| kernel::LiteKernel *FindBackendKernel(const std::vector<Tensor *> &in_tensors, | |||
| const std::vector<Tensor *> &out_tensors, const Model::Node *node, | |||
| TypeId prefer_data_type = kTypeUnknown); | |||
| int FindCpuKernel(const std::vector<Tensor *> &in_tensors, const std::vector<Tensor *> &out_tensors, | |||
| OpParameter *op_parameter, const kernel::KernelKey &desc, TypeId kernel_data_type, | |||
| kernel::LiteKernel **kernel); | |||
| @@ -65,49 +65,47 @@ class Scheduler { | |||
| OpParameter *op_parameter, const kernel::KernelKey &desc, kernel::LiteKernel **kernel); | |||
| int FindNpuKernel(const std::vector<Tensor *> &in_tensors, const std::vector<Tensor *> &out_tensors, | |||
| OpParameter *op_parameter, const kernel::KernelKey &desc, kernel::LiteKernel **kernel); | |||
| int FindProviderKernel(const std::vector<Tensor *> &in_tensors, const std::vector<Tensor *> &out_tensors, | |||
| const Model::Node *node, TypeId data_type, kernel::LiteKernel **kernel); | |||
| int ReplaceDelegateKernels(std::vector<kernel::LiteKernel *> *dst_kernels); | |||
| int InitKernels(std::vector<kernel::LiteKernel *> dst_kernels); | |||
| // schedule a partial node to a subgraph_kernel | |||
| kernel::LiteKernel *SchedulePartialToKernel(const lite::Model::Node *src_node); | |||
| // schedule a partial node to a subgraph_kernel | |||
| std::vector<kernel::LiteKernel *> ScheduleSubGraphToSubGraphKernels(const int &subgraph_index); | |||
| // schedule a node to a kernel | |||
| kernel::LiteKernel *ScheduleNodeToKernel(const lite::Model::Node *src_node, TypeId prefer_data_type = kTypeUnknown); | |||
| kernel::LiteKernel *ScheduleNodeToKernel(const Model::Node *src_node, TypeId prefer_data_type = kTypeUnknown); | |||
| // schedule a Model::Graph into a vector of subgraph_kernel | |||
| int ScheduleGraphToKernels(std::vector<kernel::LiteKernel *> *dst_kernels, TypeId prefer_data_type = kTypeUnknown); | |||
| // schedule a Model::SubGraph into a vector of kernel and subgraph_kernel | |||
| int ScheduleSubGraphToKernels(size_t subgraph_index, std::vector<kernel::LiteKernel *> *dst_kernels, | |||
| std::vector<lite::Tensor *> *in_tensors, std::vector<lite::Tensor *> *out_tensors, | |||
| TypeId prefer_data_type = kTypeUnknown); | |||
| // find in_kernels_ and out_kernels of kernel, sub_graph and nodes_ in sub_graph | |||
| static void FindAllInoutKernels(const std::vector<kernel::LiteKernel *> &kernels); | |||
| // vector<LiteKernel/SubGraphKernel> --> vector<SubGraphKernel> | |||
| int ConstructSubGraphs(std::vector<kernel::LiteKernel *> src_kernel, std::vector<kernel::LiteKernel *> *dst_kernel, | |||
| std::map<const kernel::LiteKernel *, bool> *sinked_kernel_map); | |||
| // create subgraph_kernel from a vector of kernel | |||
| kernel::SubGraphKernel *CreateSubGraphKernel(const std::vector<kernel::LiteKernel *> &kernels, | |||
| const std::vector<lite::Tensor *> *in_tensors, | |||
| const std::vector<lite::Tensor *> *out_tensors, | |||
| kernel::SubGraphType type); | |||
| bool MergeOpIsReady(const kernel::LiteKernel *kernel, std::map<const kernel::LiteKernel *, bool> is_kernel_finish); | |||
| bool KernelFitCurrentSubGraph(const kernel::SubGraphType subgraph_type, const kernel::LiteKernel &kernel); | |||
| std::vector<kernel::LiteKernel *> FindAllSubGraphKernels( | |||
| std::vector<kernel::LiteKernel *> head_kernels, std::map<const kernel::LiteKernel *, bool> *sinked_kernel_map); | |||
| // other methods | |||
| static TypeId GetFirstFp32Fp16OrInt8Type(const std::vector<Tensor *> &in_tensors); | |||
| static void SetKernelTensorDataType(kernel::LiteKernel *kernel); | |||
| static kernel::SubGraphType GetKernelSubGraphType(const kernel::LiteKernel *kernel); | |||
| int CopyPartialShapeToSubGraph(const lite::Model::Node *partial_node); | |||
| int RestoreSubGraphInput(const lite::Model::Node *partial_node); | |||
| bool SubGraphHasScheduled(const int &index); | |||
| void SubGraphMarkScheduled(const int &index); | |||
| void SetSubgraphForPartialNode(); | |||
| bool IsControlFlowPattern(const lite::Model::Node &partial_node); | |||
| protected: | |||
| const InnerContext *context_ = nullptr; | |||
| @@ -119,6 +117,11 @@ class Scheduler { | |||
| std::unique_ptr<SchedulerCb> sched_cb_; | |||
| std::map<kernel::Kernel *, const schema::Primitive *> primitives_; | |||
| std::shared_ptr<Delegate> delegate_ = nullptr; | |||
| std::set<int> scheduled_subgraph_index_{}; | |||
| std::deque<int> subgraphs_to_schedule_{}; | |||
| std::unordered_map<kernel::LiteKernel *, size_t> partial_kernel_subgraph_index_map_{}; | |||
| std::unordered_map<size_t, kernel::LiteKernel *> subgraph_index_subgraph_kernel_map_{}; | |||
| std::set<lite::Model::Node *> partial_cnode_inferred_{}; | |||
| }; | |||
| } // namespace mindspore::lite | |||
| @@ -138,7 +138,17 @@ void SubGraphKernel::InitOutTensorInitRefCount() { | |||
| for (auto *node : nodes_) { | |||
| node->InitOutTensorInitRefCount(); | |||
| } | |||
| for (auto &input : this->in_tensors()) { | |||
| int input_init_ref_count = input->init_ref_count(); | |||
| for (auto *node : nodes_) { | |||
| if (lite::IsContain(node->in_tensors(), input)) { | |||
| input_init_ref_count++; | |||
| } | |||
| } | |||
| input->set_init_ref_count(input_init_ref_count); | |||
| } | |||
| } | |||
| void SubGraphKernel::DropNode(LiteKernel *node) { | |||
| lite::VectorErase(&nodes_, node); | |||
| lite::VectorErase(&in_nodes_, node); | |||
| @@ -202,6 +212,9 @@ int CpuSubGraph::Prepare() { | |||
| tensor->set_allocator(this->Context()->allocator); | |||
| } | |||
| } | |||
| for (auto &out : this->out_tensors()) { | |||
| out->set_allocator(this->Context()->allocator); | |||
| } | |||
| return RET_OK; | |||
| } | |||
| @@ -161,10 +161,10 @@ int TensorList::FreeTensorListData() { | |||
| if (this->tensors_.empty()) { | |||
| return RET_OK; | |||
| } | |||
| for (size_t i = 0; i < this->tensors_.size(); ++i) { | |||
| if (this->tensors_[i] != nullptr) { | |||
| delete this->tensors_[i]; | |||
| this->tensors_[i] = nullptr; | |||
| for (auto &tensor : this->tensors_) { | |||
| if (tensor != nullptr) { | |||
| delete tensor; | |||
| tensor = nullptr; | |||
| } | |||
| } | |||
| tensors_.clear(); | |||
| @@ -416,7 +416,7 @@ int TrainExport::SaveToFile() { return Storage::Save(*meta_graph_, file_name_); | |||
| int TrainExport::IsInputTensor(const schema::TensorT &t) { | |||
| int total_dims = std::accumulate(t.dims.begin(), t.dims.end(), 1, std::multiplies<int>()); | |||
| return ((t.nodeType == NodeType_ValueNode) && (t.data.size() == 0) && (total_dims != 0)); | |||
| return ((t.data.size() == 0) && (total_dims != 0)); | |||
| } | |||
| TrainExport::~TrainExport() { delete meta_graph_; } | |||
| @@ -226,8 +226,7 @@ if(MSLITE_ENABLE_CONVERTER) | |||
| ${LITE_DIR}/tools/optimizer/graph/redundant_op_remove_pass.cc | |||
| ${LITE_DIR}/tools/optimizer/graph/infershape_pass.cc | |||
| ${LITE_DIR}/tools/optimizer/graph/slice_prepose_pass.cc | |||
| ${LITE_DIR}/tools/optimizer/graph/while_pass.cc | |||
| ${LITE_DIR}/tools/optimizer/graph/if_pass.cc | |||
| ${LITE_DIR}/tools/optimizer/graph/control_flow_pass.cc | |||
| ${LITE_DIR}/tools/optimizer/graph/unify_format_pass.cc | |||
| ${LITE_DIR}/tools/optimizer/graph/node_infershape.cc | |||
| ${LITE_DIR}/tools/optimizer/graph/transpose_strategy.cc | |||
| @@ -314,7 +313,6 @@ if(MSLITE_ENABLE_CONVERTER) | |||
| set(TEST_SRC | |||
| ${TEST_SRC} | |||
| ${TEST_DIR}/st/converter_test.cc | |||
| ${TEST_DIR}/st/control_flow_test.cc | |||
| ${TEST_DIR}/st/mindrt_parallel_test.cc | |||
| ${TEST_DIR}/st/sub_graph_test.cc | |||
| ${TEST_DIR}/common/import_from_meta_graphT.cc | |||
| @@ -21,7 +21,7 @@ mtk_transformer_decoder_joint.tflite | |||
| quant_aware_bank_card_detection_inception.onnx | |||
| quant_aware_bank_card_recognition_fcny.onnx | |||
| quant_aware_identify_card_detect.onnx | |||
| tiny-yolov3-11.onnx;2;1,416,416,3:1,2 | |||
| #tiny-yolov3-11.onnx;2;1,416,416,3:1,2 to open | |||
| # cur acc for ml_video_edit_art_transfer is 2+% | |||
| ml_video_edit_art_transfer.onnx;3 | |||
| #ml_table_detection.onnx: onnx quantized model | |||
| @@ -84,7 +84,7 @@ Q_face_recognition.onnx 3.2 | |||
| ml_video_edit_enhance_update_tmp.onnx 0.5 | |||
| Q888_face_recognition.onnx 3.5 | |||
| Q888_iris_detect.onnx 0.5 | |||
| ssd_mobilenet_v1_10.onnx;1;1,383,640,3 0.5 | |||
| #ssd_mobilenet_v1_10.onnx;1;1,383,640,3 0.5 to open | |||
| # The output from a conv in the later part contains many minus values, the following leakyRelu makes them become very | |||
| # close to 0 (-e^-4). The fp16 precision lost a lot in this case and it affects the following computation. | |||
| Harmony_Voiceprint.onnx;1;1,200,40,1 21.5 # small output causes big bias | |||
| @@ -87,11 +87,11 @@ ml_video_edit_video_segment_gauss_adaptis_part2.pb;2 | |||
| #encoder_0111.pb;4;1:1,44:1:1 | |||
| encoder_201228.pb;3;1:1,22:1;;input_dependent | |||
| ml_video_edit_oneclick_adaptis.pb;3 | |||
| tacotron_encoder_stf.pb;5;1:1,62:1,62:1,62:1,62;;input_dependent | |||
| #tacotron_encoder_stf.pb;5;1:1,62:1,62:1,62:1,62;;input_dependent need open | |||
| female_model_step2_int16_noiseout.pb;66 | |||
| ml_female_model_step6_noiseout.pb;66 | |||
| ml_male_model_step6_noiseout.pb;66 | |||
| ml_tts_decoder_control_flow.pb;5 | |||
| #ml_tts_decoder_control_flow.pb;5 need update outputFile | |||
| ml_tts_decoder.pb;5 | |||
| ml_tts_encoder_control_flow.pb;4;1:1,22:1:1;;input_dependent | |||
| ml_tts_vocoder.pb;66 | |||
| @@ -65,7 +65,7 @@ siteAI_trans_nonlinear134g.pb;1;1,137 0.5 | |||
| siteAI_trans_nonlinear134g_nrz.pb;1;1,182 0.6 | |||
| ml_vision_guide_detection2.pb;1;1,320,320,1 1 | |||
| # ml_tts_encoder.pb has a round op, which will cause round-off error when the decimal of input value is near 0.5 | |||
| ml_tts_encoder.pb;4;1:1,44:1:1 9 | |||
| #ml_tts_encoder.pb;4;1:1,44:1:1 9 to open | |||
| # encoder_0111_control_flow.pb is same as ml_tts_encoder_control_flow.pb | |||
| #encoder_0111_control_flow.pb;4;1:1,44:1:1 10 | |||
| ml_video_edit_video_segment_gauss_adaptis_part2.pb;2 11 | |||
| @@ -80,9 +80,9 @@ ml_video_edit_oneclick_adaptis.pb;3 6 | |||
| #encoder_0111.pb;4;1:1,44:1:1 | |||
| ml_female_model_step6_noiseout.pb;66 2 | |||
| ml_male_model_step6_noiseout.pb;66 2.5 | |||
| ml_tts_encoder_control_flow.pb;4;1:1,22:1:1 1.5 | |||
| ml_tts_decoder_control_flow.pb;5 1 | |||
| ml_tts_decoder.pb;5 2.5 | |||
| #ml_tts_encoder_control_flow.pb;4;1:1,22:1:1 1.5 to open | |||
| #ml_tts_decoder_control_flow.pb;5 1 need update | |||
| #ml_tts_decoder.pb;5 2.5 to open | |||
| ml_tts_vocoder.pb;66 53 | |||
| hiai_transformer_encoder.pb;15 4 | |||
| decoder_step_nocumsum_v5.pb;13;1:1,512:1,1429,2:1,127:1,127:1,127:1,127,320:1,80:1,512:1,512:1,512:1,512:1,512 1.2 | |||
| @@ -1,459 +0,0 @@ | |||
| /** | |||
| * Copyright 2020 Huawei Technologies Co., Ltd | |||
| * | |||
| * Licensed under the Apache License, Version 2.0 (the "License"); | |||
| * you may not use this file except in compliance with the License. | |||
| * You may obtain a copy of the License at | |||
| * | |||
| * http://www.apache.org/licenses/LICENSE-2.0 | |||
| * | |||
| * Unless required by applicable law or agreed to in writing, software | |||
| * distributed under the License is distributed on an "AS IS" BASIS, | |||
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | |||
| * See the License for the specific language governing permissions and | |||
| * limitations under the License. | |||
| */ | |||
| #include <cmath> | |||
| #include <memory> | |||
| #include "schema/inner/model_generated.h" | |||
| #include "mindspore/lite/include/model.h" | |||
| #include "common/common_test.h" | |||
| #include "include/lite_session.h" | |||
| #include "include/context.h" | |||
| #include "include/errorcode.h" | |||
| #include "src/common/log_adapter.h" | |||
| #include "src/lite_session.h" | |||
| #include "include/version.h" | |||
| namespace mindspore { | |||
| class ControlFlowTest : public mindspore::CommonTest { | |||
| public: | |||
| ControlFlowTest() {} | |||
| }; | |||
| TEST_F(ControlFlowTest, TestMergeWhileModel) { | |||
| // make graph | |||
| auto meta_graph = std::make_shared<schema::MetaGraphT>(); | |||
| MS_LOG(DEBUG) << "make subgraph"; | |||
| meta_graph->name = "graph"; | |||
| meta_graph->version = lite::Version(); | |||
| meta_graph->inputIndex = {0}; | |||
| meta_graph->outputIndex = {9}; | |||
| // subgraph 0 : main graph | |||
| auto sub_graph_0 = std::make_unique<schema::SubGraphT>(); | |||
| sub_graph_0->name = "main_graph"; | |||
| // subgraph 1 : cond graph | |||
| auto sub_graph_1 = std::make_unique<schema::SubGraphT>(); | |||
| sub_graph_1->name = "cond_graph"; | |||
| // subgraph 2: body graph | |||
| auto sub_graph_2 = std::make_unique<schema::SubGraphT>(); | |||
| sub_graph_2->name = "body_graph"; | |||
| MS_LOG(DEBUG) << "make subgraph"; | |||
| // subgraph 0: node 0 before-add-1 | |||
| auto sub_graph_0_node_0 = std::make_unique<schema::CNodeT>(); | |||
| sub_graph_0_node_0->inputIndex = {0, 1}; | |||
| sub_graph_0_node_0->outputIndex = {2}; | |||
| sub_graph_0_node_0->primitive = std::make_unique<schema::PrimitiveT>(); | |||
| sub_graph_0_node_0->primitive->value.type = schema::PrimitiveType_AddFusion; | |||
| auto primitive_sub_graph_0_node_0 = new schema::AddFusionT; | |||
| primitive_sub_graph_0_node_0->activation_type = schema::ActivationType_NO_ACTIVATION; | |||
| sub_graph_0_node_0->primitive->value.value = primitive_sub_graph_0_node_0; | |||
| sub_graph_0_node_0->name = "before_Add_1"; | |||
| meta_graph->nodes.emplace_back(std::move(sub_graph_0_node_0)); | |||
| sub_graph_0->nodeIndices.push_back(0); | |||
| MS_LOG(DEBUG) << "node 0"; | |||
| // subgraph 0: node 1 before-add-1 | |||
| auto sub_graph_0_node_1 = std::make_unique<schema::CNodeT>(); | |||
| sub_graph_0_node_1->inputIndex = {2, 3}; | |||
| sub_graph_0_node_1->outputIndex = {4}; | |||
| sub_graph_0_node_1->primitive = std::make_unique<schema::PrimitiveT>(); | |||
| sub_graph_0_node_1->primitive->value.type = schema::PrimitiveType_AddFusion; | |||
| auto primitive_sub_graph_0_node_1 = new schema::AddFusionT; | |||
| primitive_sub_graph_0_node_1->activation_type = schema::ActivationType_NO_ACTIVATION; | |||
| sub_graph_0_node_1->primitive->value.value = primitive_sub_graph_0_node_1; | |||
| sub_graph_0_node_1->name = "before_Add_2"; | |||
| meta_graph->nodes.emplace_back(std::move(sub_graph_0_node_1)); | |||
| sub_graph_0->nodeIndices.push_back(1); | |||
| MS_LOG(DEBUG) << "node 1"; | |||
| // subgraph 0: node 2 merge | |||
| auto sub_graph_0_node_2 = std::make_unique<schema::CNodeT>(); | |||
| sub_graph_0_node_2->inputIndex = {4, 17}; | |||
| sub_graph_0_node_2->outputIndex = {16}; | |||
| sub_graph_0_node_2->primitive = std::make_unique<schema::PrimitiveT>(); | |||
| sub_graph_0_node_2->primitive->value.type = schema::PrimitiveType_Merge; | |||
| auto primitive_sub_graph_0_node_2 = new schema::MergeT; | |||
| sub_graph_0_node_2->primitive->value.value = primitive_sub_graph_0_node_2; | |||
| sub_graph_0_node_2->name = "merge"; | |||
| meta_graph->nodes.emplace_back(std::move(sub_graph_0_node_2)); | |||
| sub_graph_0->nodeIndices.push_back(2); | |||
| MS_LOG(DEBUG) << "node 2"; | |||
| // subgraph 0: node 3 partial cond subGraph | |||
| auto sub_graph_0_node_3 = std::make_unique<schema::CNodeT>(); | |||
| sub_graph_0_node_3->inputIndex = {16}; | |||
| sub_graph_0_node_3->outputIndex = {5}; // 5 : bool | |||
| sub_graph_0_node_3->primitive = std::make_unique<schema::PrimitiveT>(); | |||
| sub_graph_0_node_3->primitive->value.type = schema::PrimitiveType_PartialFusion; | |||
| auto primitive_sub_graph_0_node_3 = new schema::PartialFusionT; | |||
| primitive_sub_graph_0_node_3->sub_graph_index = 1; | |||
| sub_graph_0_node_3->primitive->value.value = primitive_sub_graph_0_node_3; | |||
| sub_graph_0_node_3->name = "Partial_cond"; | |||
| meta_graph->nodes.emplace_back(std::move(sub_graph_0_node_3)); | |||
| sub_graph_0->nodeIndices.push_back(3); | |||
| MS_LOG(DEBUG) << "node 2"; | |||
| // subgraph 0: node 4 switch | |||
| auto sub_graph_0_node_4 = std::make_unique<schema::CNodeT>(); | |||
| sub_graph_0_node_4->inputIndex = {5, 16}; // 5 : bool; 16 data | |||
| sub_graph_0_node_4->outputIndex = {6, 7}; | |||
| sub_graph_0_node_4->primitive = std::make_unique<schema::PrimitiveT>(); | |||
| sub_graph_0_node_4->primitive->value.type = schema::PrimitiveType_Switch; | |||
| auto primitive_sub_graph_0_node_4 = new schema::SwitchT; | |||
| sub_graph_0_node_4->primitive->value.value = primitive_sub_graph_0_node_4; | |||
| sub_graph_0_node_4->name = "Switch"; | |||
| meta_graph->nodes.emplace_back(std::move(sub_graph_0_node_4)); | |||
| sub_graph_0->nodeIndices.push_back(4); | |||
| MS_LOG(DEBUG) << "node 4"; | |||
| // subgraph 0: node 5 partial body subgraph | |||
| auto sub_graph_0_node_5 = std::make_unique<schema::CNodeT>(); | |||
| sub_graph_0_node_5->inputIndex = {6}; | |||
| sub_graph_0_node_5->outputIndex = {17}; | |||
| sub_graph_0_node_5->primitive = std::make_unique<schema::PrimitiveT>(); | |||
| sub_graph_0_node_5->primitive->value.type = schema::PrimitiveType_PartialFusion; | |||
| auto primitive_sub_graph_0_node_5 = new schema::PartialFusionT; | |||
| primitive_sub_graph_0_node_5->sub_graph_index = 2; | |||
| sub_graph_0_node_5->primitive->value.value = primitive_sub_graph_0_node_5; | |||
| sub_graph_0_node_5->name = "Partial_body"; | |||
| meta_graph->nodes.emplace_back(std::move(sub_graph_0_node_5)); | |||
| sub_graph_0->nodeIndices.push_back(5); | |||
| MS_LOG(DEBUG) << "node 5"; | |||
| // subgraph 0: node 6 add-after | |||
| auto sub_graph_0_node_6 = std::make_unique<schema::CNodeT>(); | |||
| sub_graph_0_node_6->inputIndex = {7, 8}; | |||
| sub_graph_0_node_6->outputIndex = {9}; | |||
| sub_graph_0_node_6->primitive = std::make_unique<schema::PrimitiveT>(); | |||
| sub_graph_0_node_6->primitive->value.type = schema::PrimitiveType_AddFusion; | |||
| auto primitive_sub_graph_0_node_6 = new schema::AddFusionT; | |||
| sub_graph_0_node_6->primitive->value.value = primitive_sub_graph_0_node_6; | |||
| sub_graph_0_node_6->name = "Add-after"; | |||
| meta_graph->nodes.emplace_back(std::move(sub_graph_0_node_6)); | |||
| sub_graph_0->nodeIndices.push_back(6); | |||
| MS_LOG(DEBUG) << "node 6"; | |||
| sub_graph_0->inputIndices = {0}; | |||
| sub_graph_0->outputIndices = {9}; | |||
| sub_graph_0->tensorIndices = {0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 16, 17}; | |||
| meta_graph->subGraph.push_back(std::move(sub_graph_0)); | |||
| // subgraph 1 ; node:0 add cond | |||
| auto sub_graph_1_node_0 = std::make_unique<schema::CNodeT>(); | |||
| sub_graph_1_node_0->inputIndex = {16, 10}; | |||
| sub_graph_1_node_0->outputIndex = {11}; | |||
| sub_graph_1_node_0->primitive = std::make_unique<schema::PrimitiveT>(); | |||
| sub_graph_1_node_0->primitive->value.type = schema::PrimitiveType_AddFusion; | |||
| auto primitive_sub_graph_1_node_0 = new schema::AddFusionT; | |||
| sub_graph_1_node_0->primitive->value.value = primitive_sub_graph_1_node_0; | |||
| sub_graph_1_node_0->name = "cond_add"; | |||
| meta_graph->nodes.emplace_back(std::move(sub_graph_1_node_0)); | |||
| sub_graph_1->nodeIndices.push_back(7); | |||
| MS_LOG(DEBUG) << "node 6"; | |||
| // subgraph 1 ; node:1 Less cond | |||
| auto sub_graph_1_node_1 = std::make_unique<schema::CNodeT>(); | |||
| sub_graph_1_node_1->inputIndex = {11, 12}; | |||
| sub_graph_1_node_1->outputIndex = {5}; | |||
| sub_graph_1_node_1->primitive = std::make_unique<schema::PrimitiveT>(); | |||
| sub_graph_1_node_1->primitive->value.type = schema::PrimitiveType_Less; | |||
| auto primitive_sub_graph_1_node_1 = new schema::LessT; | |||
| sub_graph_1_node_1->primitive->value.value = primitive_sub_graph_1_node_1; | |||
| sub_graph_1_node_1->name = "cond_Less"; | |||
| meta_graph->nodes.emplace_back(std::move(sub_graph_1_node_1)); | |||
| sub_graph_1->nodeIndices.push_back(8); | |||
| MS_LOG(DEBUG) << "node 7"; | |||
| sub_graph_1->inputIndices = {16}; | |||
| sub_graph_1->outputIndices = {5}; | |||
| sub_graph_1->tensorIndices = {16, 10, 11, 12, 5}; | |||
| meta_graph->subGraph.push_back(std::move(sub_graph_1)); | |||
| // subgraph 2 ; node:0 body add-1 | |||
| auto sub_graph_2_node_0 = std::make_unique<schema::CNodeT>(); | |||
| sub_graph_2_node_0->inputIndex = {6, 13}; | |||
| sub_graph_2_node_0->outputIndex = {14}; | |||
| sub_graph_2_node_0->primitive = std::make_unique<schema::PrimitiveT>(); | |||
| sub_graph_2_node_0->primitive->value.type = schema::PrimitiveType_AddFusion; | |||
| auto primitive_sub_graph_2_node_0 = new schema::AddFusionT; | |||
| sub_graph_2_node_0->primitive->value.value = primitive_sub_graph_2_node_0; | |||
| sub_graph_2_node_0->name = "body_add_1"; | |||
| meta_graph->nodes.emplace_back(std::move(sub_graph_2_node_0)); | |||
| sub_graph_2->nodeIndices.push_back(9); | |||
| MS_LOG(DEBUG) << "node 8"; | |||
| // subgraph 2 ; node:1 body add-2 | |||
| auto sub_graph_2_node_1 = std::make_unique<schema::CNodeT>(); | |||
| sub_graph_2_node_1->inputIndex = {14, 15}; | |||
| sub_graph_2_node_1->outputIndex = {17}; | |||
| sub_graph_2_node_1->primitive = std::make_unique<schema::PrimitiveT>(); | |||
| sub_graph_2_node_1->primitive->value.type = schema::PrimitiveType_AddFusion; | |||
| auto primitive_sub_graph_2_node_1 = new schema::AddFusionT; | |||
| sub_graph_2_node_1->primitive->value.value = primitive_sub_graph_2_node_1; | |||
| sub_graph_2_node_1->name = "body_add_2"; | |||
| meta_graph->nodes.emplace_back(std::move(sub_graph_2_node_1)); | |||
| sub_graph_2->nodeIndices.push_back(10); | |||
| MS_LOG(DEBUG) << "node 9"; | |||
| sub_graph_2->inputIndices = {6}; | |||
| sub_graph_2->outputIndices = {17}; | |||
| sub_graph_2->tensorIndices = {13, 14, 15, 6, 17}; | |||
| meta_graph->subGraph.push_back(std::move(sub_graph_2)); | |||
| // ------- tensor --------- | |||
| // tensor: 0 before-add input0 <main graph input> | |||
| auto tensor_0 = std::make_unique<schema::TensorT>(); | |||
| tensor_0->nodeType = lite::NodeType_ValueNode; | |||
| tensor_0->format = schema::Format_NHWC; | |||
| tensor_0->dataType = TypeId::kNumberTypeFloat32; | |||
| tensor_0->dims = {1}; | |||
| tensor_0->offset = -1; | |||
| meta_graph->allTensors.emplace_back(std::move(tensor_0)); | |||
| MS_LOG(DEBUG) << "tensor 0"; | |||
| // tensor: 1 before-add input1 <const> | |||
| auto tensor_1 = std::make_unique<schema::TensorT>(); | |||
| tensor_1->nodeType = lite::NodeType_ValueNode; | |||
| tensor_1->format = schema::Format_NHWC; | |||
| tensor_1->dataType = TypeId::kNumberTypeFloat32; | |||
| tensor_1->dims = {1}; | |||
| tensor_1->data.resize(sizeof(float) * 1); | |||
| float input1_data[] = {1}; | |||
| memcpy(tensor_1->data.data(), input1_data, sizeof(float) * 1); | |||
| tensor_1->offset = -1; | |||
| meta_graph->allTensors.emplace_back(std::move(tensor_1)); | |||
| MS_LOG(DEBUG) << "tensor 1"; | |||
| // tensor: 2 before-add output/partial input | |||
| auto tensor_2 = std::make_unique<schema::TensorT>(); | |||
| tensor_2->nodeType = lite::NodeType_Parameter; | |||
| tensor_2->format = schema::Format_NHWC; | |||
| tensor_2->dataType = TypeId::kNumberTypeFloat32; | |||
| tensor_2->dims = {1}; | |||
| tensor_2->offset = -1; | |||
| meta_graph->allTensors.emplace_back(std::move(tensor_2)); | |||
| MS_LOG(DEBUG) << "tensor 2"; | |||
| // tensor: 3 before-add input1 <const> | |||
| auto tensor_3 = std::make_unique<schema::TensorT>(); | |||
| tensor_3->nodeType = lite::NodeType_ValueNode; | |||
| tensor_3->format = schema::Format_NHWC; | |||
| tensor_3->dataType = TypeId::kNumberTypeFloat32; | |||
| tensor_3->dims = {1}; | |||
| tensor_3->data.resize(sizeof(float) * 1); | |||
| float tensor_3_data[] = {1}; | |||
| memcpy(tensor_3->data.data(), tensor_3_data, sizeof(float) * 1); | |||
| tensor_3->offset = -1; | |||
| meta_graph->allTensors.emplace_back(std::move(tensor_3)); | |||
| MS_LOG(DEBUG) << "tensor 3"; | |||
| auto tensor_4 = std::make_unique<schema::TensorT>(); | |||
| tensor_4->nodeType = lite::NodeType_Parameter; | |||
| tensor_4->format = schema::Format_NHWC; | |||
| tensor_4->dataType = TypeId::kNumberTypeFloat32; | |||
| tensor_4->dims = {1}; | |||
| tensor_4->offset = -1; | |||
| meta_graph->allTensors.emplace_back(std::move(tensor_4)); | |||
| MS_LOG(DEBUG) << "tensor 4"; | |||
| // tensor :5 partial output <bool> | |||
| auto tensor_5 = std::make_unique<schema::TensorT>(); | |||
| tensor_5->nodeType = lite::NodeType_Parameter; | |||
| tensor_5->format = schema::Format_NHWC; | |||
| tensor_5->dataType = TypeId::kNumberTypeBool; | |||
| tensor_5->dims = {1}; | |||
| tensor_5->offset = -1; | |||
| meta_graph->allTensors.emplace_back(std::move(tensor_5)); | |||
| MS_LOG(DEBUG) << "tensor_4"; | |||
| // tensor: 6 switch true output | |||
| auto tensor_6 = std::make_unique<schema::TensorT>(); | |||
| tensor_6->nodeType = lite::NodeType_Parameter; | |||
| tensor_6->format = schema::Format_NHWC; | |||
| tensor_6->dataType = TypeId::kNumberTypeFloat32; | |||
| tensor_6->dims = {1}; | |||
| tensor_6->offset = -1; | |||
| meta_graph->allTensors.emplace_back(std::move(tensor_6)); | |||
| MS_LOG(DEBUG) << "tensor 6"; | |||
| // tensor: 5 switch False output | |||
| auto tensor_7 = std::make_unique<schema::TensorT>(); | |||
| tensor_7->nodeType = lite::NodeType_Parameter; | |||
| tensor_7->format = schema::Format_NHWC; | |||
| tensor_7->dataType = TypeId::kNumberTypeFloat32; | |||
| tensor_7->dims = {1}; | |||
| tensor_7->offset = -1; | |||
| meta_graph->allTensors.emplace_back(std::move(tensor_7)); | |||
| MS_LOG(DEBUG) << "tensor_7"; | |||
| // tensor: 6 body-add input ,other input is switch true output | |||
| auto tensor_8 = std::make_unique<schema::TensorT>(); | |||
| tensor_8->nodeType = lite::NodeType_ValueNode; | |||
| tensor_8->format = schema::Format_NHWC; | |||
| tensor_8->dataType = TypeId::kNumberTypeFloat32; | |||
| tensor_8->dims = {1}; | |||
| tensor_8->data.resize(sizeof(float) * 1); | |||
| float tensor_8_data[] = {10}; | |||
| memcpy(tensor_8->data.data(), tensor_8_data, sizeof(float) * 1); | |||
| tensor_8->offset = -1; | |||
| meta_graph->allTensors.emplace_back(std::move(tensor_8)); | |||
| MS_LOG(DEBUG) << "tensor_8"; | |||
| auto tensor_9 = std::make_unique<schema::TensorT>(); | |||
| tensor_9->nodeType = lite::NodeType_Parameter; | |||
| tensor_9->format = schema::Format_NHWC; | |||
| tensor_9->dataType = TypeId::kNumberTypeFloat32; | |||
| tensor_9->dims = {1}; | |||
| tensor_9->offset = -1; | |||
| meta_graph->allTensors.emplace_back(std::move(tensor_9)); | |||
| MS_LOG(DEBUG) << "tensor_9"; | |||
| // tensor: 7 after-add input ,other input is switch false output | |||
| auto tensor_10 = std::make_unique<schema::TensorT>(); | |||
| tensor_10->nodeType = lite::NodeType_ValueNode; | |||
| tensor_10->format = schema::Format_NHWC; | |||
| tensor_10->dataType = TypeId::kNumberTypeFloat32; | |||
| tensor_10->dims = {1}; | |||
| tensor_10->data.resize(sizeof(float) * 1); | |||
| float tensor_10_data[] = {1}; | |||
| memcpy(tensor_10->data.data(), tensor_10_data, sizeof(float) * 1); | |||
| tensor_10->offset = -1; | |||
| meta_graph->allTensors.emplace_back(std::move(tensor_10)); | |||
| MS_LOG(DEBUG) << "tensor_10"; | |||
| // tensor: 8 main graph output | |||
| auto tensor_11 = std::make_unique<schema::TensorT>(); | |||
| tensor_11->nodeType = lite::NodeType_Parameter; | |||
| tensor_11->format = schema::Format_NHWC; | |||
| tensor_11->dataType = TypeId::kNumberTypeFloat32; | |||
| tensor_11->dims = {1}; | |||
| tensor_11->offset = -1; | |||
| meta_graph->allTensors.emplace_back(std::move(tensor_11)); | |||
| MS_LOG(DEBUG) << "tensor 11"; | |||
| // tensor: 9 cond-Less input, other input is tensor 2 | |||
| auto tensor_12 = std::make_unique<schema::TensorT>(); | |||
| tensor_12->nodeType = lite::NodeType_ValueNode; | |||
| tensor_12->format = schema::Format_NHWC; | |||
| tensor_12->dataType = TypeId::kNumberTypeFloat32; | |||
| tensor_12->dims = {1}; | |||
| tensor_12->data.resize(sizeof(float) * 1); | |||
| float tensor_12_data[] = {10}; | |||
| memcpy(tensor_12->data.data(), tensor_12_data, sizeof(float) * 1); | |||
| tensor_12->offset = -1; | |||
| meta_graph->allTensors.emplace_back(std::move(tensor_12)); | |||
| MS_LOG(DEBUG) << "tensor_12"; | |||
| auto tensor_13 = std::make_unique<schema::TensorT>(); | |||
| tensor_13->nodeType = lite::NodeType_ValueNode; | |||
| tensor_13->format = schema::Format_NHWC; | |||
| tensor_13->dataType = TypeId::kNumberTypeFloat32; | |||
| tensor_13->dims = {1}; | |||
| tensor_13->data.resize(sizeof(float) * 1); | |||
| float tensor_13_data[] = {1}; | |||
| memcpy(tensor_13->data.data(), tensor_13_data, sizeof(float) * 1); | |||
| tensor_13->offset = -1; | |||
| meta_graph->allTensors.emplace_back(std::move(tensor_13)); | |||
| MS_LOG(DEBUG) << "tensor_13"; | |||
| auto tensor_14 = std::make_unique<schema::TensorT>(); | |||
| tensor_14->nodeType = lite::NodeType_Parameter; | |||
| tensor_14->format = schema::Format_NHWC; | |||
| tensor_14->dataType = TypeId::kNumberTypeFloat32; | |||
| tensor_14->dims = {1}; | |||
| tensor_14->offset = -1; | |||
| meta_graph->allTensors.emplace_back(std::move(tensor_14)); | |||
| MS_LOG(DEBUG) << "tensor 14"; | |||
| auto tensor_15 = std::make_unique<schema::TensorT>(); | |||
| tensor_15->nodeType = lite::NodeType_ValueNode; | |||
| tensor_15->format = schema::Format_NHWC; | |||
| tensor_15->dataType = TypeId::kNumberTypeFloat32; | |||
| tensor_15->dims = {1}; | |||
| tensor_15->data.resize(sizeof(float) * 1); | |||
| float tensor_15_data[] = {1}; | |||
| memcpy(tensor_15->data.data(), tensor_15_data, sizeof(float) * 1); | |||
| tensor_15->offset = -1; | |||
| meta_graph->allTensors.emplace_back(std::move(tensor_15)); | |||
| MS_LOG(DEBUG) << "tensor_15"; | |||
| auto tensor_16 = std::make_unique<schema::TensorT>(); | |||
| tensor_16->nodeType = lite::NodeType_Parameter; | |||
| tensor_16->format = schema::Format_NHWC; | |||
| tensor_16->dataType = TypeId::kNumberTypeFloat32; | |||
| tensor_16->dims = {1}; | |||
| tensor_16->offset = -1; | |||
| meta_graph->allTensors.emplace_back(std::move(tensor_16)); | |||
| MS_LOG(DEBUG) << "tensor_16"; | |||
| auto tensor_17 = std::make_unique<schema::TensorT>(); | |||
| tensor_17->nodeType = lite::NodeType_Parameter; | |||
| tensor_17->format = schema::Format_NHWC; | |||
| tensor_17->dataType = TypeId::kNumberTypeFloat32; | |||
| tensor_17->dims = {1}; | |||
| tensor_17->offset = -1; | |||
| meta_graph->allTensors.emplace_back(std::move(tensor_17)); | |||
| MS_LOG(DEBUG) << "tensor_17"; | |||
| // ----------------------------------------------------------------------- | |||
| flatbuffers::FlatBufferBuilder builder(1024); | |||
| auto offset = schema::MetaGraph::Pack(builder, meta_graph.get()); | |||
| builder.Finish(offset); | |||
| schema::FinishMetaGraphBuffer(builder, offset); | |||
| size_t size = builder.GetSize(); | |||
| const char *content = reinterpret_cast<char *>(builder.GetBufferPointer()); | |||
| auto model = std::shared_ptr<lite::Model>(lite::Model::Import(content, size)); | |||
| ASSERT_NE(model, nullptr); | |||
| lite::Context context; | |||
| context.thread_num_ = 2; | |||
| auto &cpu_device_ctx = context.device_list_[0]; | |||
| cpu_device_ctx.device_info_.cpu_device_info_.cpu_bind_mode_ = lite::MID_CPU; | |||
| cpu_device_ctx.device_info_.cpu_device_info_.enable_float16_ = false; | |||
| auto session = std::shared_ptr<session::LiteSession>(session::LiteSession::CreateSession(&context)); | |||
| ASSERT_NE(session, nullptr); | |||
| auto ret = session->CompileGraph(model.get()); | |||
| ASSERT_EQ(ret, lite::RET_OK); | |||
| model->Free(); | |||
| auto inputs = session->GetInputs(); | |||
| ASSERT_EQ(inputs.size(), 1); | |||
| auto input = inputs.front(); | |||
| ASSERT_NE(input, nullptr); | |||
| ASSERT_EQ(input->data_type(), kNumberTypeFloat32); | |||
| ASSERT_EQ(input->shape().size(), 1); | |||
| ASSERT_EQ(input->shape().at(0), 1); | |||
| auto in_data = reinterpret_cast<float *>(input->MutableData()); | |||
| ASSERT_NE(in_data, nullptr); | |||
| in_data[0] = 1; | |||
| ret = session->RunGraph(); | |||
| ASSERT_EQ(ret, lite::RET_OK); | |||
| auto outputs = session->GetOutputs(); | |||
| ASSERT_EQ(outputs.size(), 1); | |||
| auto output = outputs.begin()->second; | |||
| ASSERT_NE(output, nullptr); | |||
| ASSERT_EQ(output->data_type(), kNumberTypeFloat32); | |||
| ASSERT_EQ(output->shape().size(), 1); | |||
| ASSERT_EQ(output->shape().at(0), 1); | |||
| auto out_data = reinterpret_cast<float *>(output->MutableData()); | |||
| ASSERT_NE(out_data, nullptr); | |||
| ASSERT_EQ(out_data[0], 19); | |||
| } | |||
| } // namespace mindspore | |||
| @@ -27,6 +27,8 @@ | |||
| #include "mindspore/core/ir/primitive.h" | |||
| #include "mindspore/core/ops/op_utils.h" | |||
| #include "ops/fusion/partial_fusion.h" | |||
| #include "ops/call.h" | |||
| #include "ops/control_depend.h" | |||
| #include "ops/depend.h" | |||
| #include "tools/converter/ops/ops_def.h" | |||
| #include "ops/quant_dtype_cast.h" | |||
| @@ -199,53 +201,62 @@ int AnfExporter::ConvertQuantParam(const std::unique_ptr<schema::MetaGraphT> &me | |||
| return RET_OK; | |||
| } | |||
| std::vector<schema::CNodeT *> AnfExporter::GetSubgraphNodes(const std::unique_ptr<schema::MetaGraphT> &meta_graphT, | |||
| const size_t &subgraph_index) { | |||
| std::vector<schema::CNodeT *> subgraph_nodes{}; | |||
| subgraph_nodes.resize(meta_graphT->subGraph.at(subgraph_index)->nodeIndices.size()); | |||
| std::transform(meta_graphT->subGraph.at(subgraph_index)->nodeIndices.begin(), | |||
| meta_graphT->subGraph.at(subgraph_index)->nodeIndices.end(), subgraph_nodes.begin(), | |||
| [&meta_graphT](const uint32_t idx) { return meta_graphT->nodes.at(idx).get(); }); | |||
| return subgraph_nodes; | |||
| int AnfExporter::CreateNewTensorForParameter(const std::unique_ptr<schema::MetaGraphT> &meta_graphT, | |||
| const AnfNodePtr &input) { | |||
| lite::DataInfo data_info; | |||
| auto param_node = input->cast<ParameterPtr>(); | |||
| if (FetchFromDefaultParam(param_node, converter::FmkType(meta_graphT->fmkType), &data_info) != RET_OK) { | |||
| MS_LOG(ERROR) << "FetchFromDefaultParam failed."; | |||
| return RET_ERROR; | |||
| } | |||
| auto schema_tensor = std::make_unique<schema::TensorT>(); | |||
| schema_tensor->format = static_cast<schema::Format>(data_info.format_); | |||
| schema_tensor->name = param_node->name(); | |||
| schema_tensor->dims = data_info.shape_; | |||
| schema_tensor->dataType = data_info.data_type_; | |||
| schema_tensor->data = data_info.data_; | |||
| schema_tensor->enableHuffmanCode = data_info.enable_huffman_code_; | |||
| schema_tensor->nodeType = NodeType_CNode; | |||
| auto key = std::make_pair(input, 0); | |||
| node_id_map_[key] = static_cast<int>(meta_graphT->allTensors.size()); | |||
| meta_graphT->allTensors.emplace_back(std::move(schema_tensor)); | |||
| return RET_OK; | |||
| } | |||
| int AnfExporter::SetGraphInputIndex(const std::unique_ptr<schema::MetaGraphT> &meta_graphT, | |||
| const size_t &subgraph_index) { | |||
| int AnfExporter::SetSubGraphInputIndex(const std::unique_ptr<schema::MetaGraphT> &meta_graphT, | |||
| const size_t &subgraph_index) { | |||
| auto &subgraph = meta_graphT->subGraph.at(subgraph_index); | |||
| auto subgraph_nodes = GetSubgraphNodes(meta_graphT, subgraph_index); | |||
| std::vector<schema::CNodeT *> subgraph_input_nodes{}; | |||
| for (auto &node : subgraph_nodes) { | |||
| if (IsContain(graph_input_nodes_, node)) { | |||
| subgraph_input_nodes.push_back(node); | |||
| } | |||
| } | |||
| std::vector<schema::TensorT *> subgraph_inputs{}; | |||
| for (auto &node : subgraph_input_nodes) { | |||
| for (auto input : node->inputIndex) { | |||
| auto tensor = meta_graphT->allTensors[input].get(); | |||
| if (tensor->nodeType != NodeType_CNode && tensor->data.empty()) { | |||
| tensor->nodeType = NodeType_ValueNode; | |||
| tensor->format = schema::Format_NHWC; | |||
| if (!IsContain(subgraph->inputIndices, input)) { | |||
| if (subgraph_index == kMainGraphIndex) { | |||
| meta_graphT->inputIndex.push_back(input); | |||
| } | |||
| subgraph->inputIndices.push_back(input); | |||
| subgraph_inputs.push_back(tensor); | |||
| } | |||
| FuncGraphPtr fg; | |||
| std::for_each(fg_subgraph_map_.begin(), fg_subgraph_map_.end(), | |||
| [&subgraph_index, &fg](const std::pair<const FuncGraphPtr, size_t> &it) { | |||
| if (it.second == subgraph_index) { | |||
| fg = it.first; | |||
| } | |||
| }); | |||
| auto inputs = fg->get_inputs(); | |||
| for (auto &input : inputs) { | |||
| auto key = std::make_pair(input, 0); | |||
| auto iter = node_id_map_.find(key); | |||
| if (iter != node_id_map_.end()) { | |||
| subgraph->inputIndices.emplace_back(iter->second); | |||
| } else { | |||
| if (CreateNewTensorForParameter(meta_graphT, input) != RET_OK) { | |||
| MS_LOG(ERROR) << "CreateNewTensorForParameter failed."; | |||
| return RET_ERROR; | |||
| } | |||
| subgraph->inputIndices.emplace_back(meta_graphT->allTensors.size() - 1); | |||
| } | |||
| } | |||
| return RET_OK; | |||
| } | |||
| int AnfExporter::SetGraphoutputIndex(const CNodePtr &cnode, const size_t subgraph_index, | |||
| const std::unique_ptr<schema::MetaGraphT> &meta_graphT, | |||
| schema::CNodeT *return_node) { | |||
| int AnfExporter::SetSubGraphOutputIndex(const CNodePtr &cnode, const size_t subgraph_index, | |||
| const std::unique_ptr<schema::MetaGraphT> &meta_graphT, | |||
| schema::CNodeT *return_node) { | |||
| MS_ASSERT(meta_graphT != nullptr); | |||
| MS_ASSERT(return_node != nullptr); | |||
| for (size_t i = 1; i < cnode->inputs().size(); i++) { | |||
| for (size_t i = kFirstDataIndex; i < cnode->inputs().size(); i++) { | |||
| auto input_node = cnode->input(i); | |||
| if (input_node == nullptr) { | |||
| MS_LOG(ERROR) << "output node is nullptr"; | |||
| @@ -257,19 +268,23 @@ int AnfExporter::SetGraphoutputIndex(const CNodePtr &cnode, const size_t subgrap | |||
| return ret; | |||
| } | |||
| } else if (input_node->isa<Parameter>()) { | |||
| MS_LOG(INFO) << "the node " << input_node->fullname_with_scope().c_str() << "is parameter node"; | |||
| continue; | |||
| auto key = std::make_pair(input_node, 0); | |||
| auto iter = node_id_map_.find(key); | |||
| if (iter != node_id_map_.end()) { | |||
| return_node->inputIndex.emplace_back(iter->second); | |||
| } else { | |||
| if (CreateNewTensorForParameter(meta_graphT, input_node) != RET_OK) { | |||
| MS_LOG(ERROR) << "CreateNewTensorForParameter failed."; | |||
| return RET_ERROR; | |||
| } | |||
| return_node->inputIndex.emplace_back(meta_graphT->allTensors.size() - 1); | |||
| } | |||
| } else { | |||
| MS_LOG(ERROR) << "the node " << input_node->fullname_with_scope().c_str() << "is not output node"; | |||
| return RET_ERROR; | |||
| } | |||
| } | |||
| for (unsigned int &i : return_node->inputIndex) { | |||
| if (subgraph_index == kMainGraphIndex) { | |||
| auto &tensor = meta_graphT->allTensors.at(i); | |||
| ConverterContext::GetInstance()->UpdateGraphOutputDType(meta_graphT->outputIndex.size(), tensor->dataType); | |||
| meta_graphT->outputIndex.push_back(i); | |||
| } | |||
| meta_graphT->subGraph.at(subgraph_index)->outputIndices.push_back(i); | |||
| } | |||
| return RET_OK; | |||
| @@ -282,39 +297,72 @@ bool AnfExporter::HasExported(const FuncGraphPtr &func_graph) { | |||
| return false; | |||
| } | |||
| int AnfExporter::ExportPartialNode(const std::unique_ptr<schema::MetaGraphT> &meta_graphT, const bool &keep_graph, | |||
| const bool ©_primitive, const CNodePtr &partial_cnode, | |||
| const std::unique_ptr<schema::CNodeT> &schema_cnode) { | |||
| auto prim = GetValueNode<std::shared_ptr<mindspore::Primitive>>(partial_cnode->input(0)); | |||
| if (prim->name() != mindspore::ops::kNamePartialFusion) { | |||
| MS_LOG(INFO) << "not is partial"; | |||
| return RET_OK; | |||
| } | |||
| auto partial_fusion_primc = schema_cnode->primitive->value.AsPartialFusion(); | |||
| auto vnode = partial_cnode->input(kFirstDataIndex)->cast<ValueNodePtr>(); | |||
| MS_ASSERT(vnode != nullptr); | |||
| auto fg = vnode->value()->cast<FuncGraphPtr>(); | |||
| if (fg == nullptr) { | |||
| MS_LOG(ERROR) << "func graph is nullptr."; | |||
| return RET_NULL_PTR; | |||
| } | |||
| if (fg_subgraph_map_.find(fg) != fg_subgraph_map_.end()) { | |||
| partial_fusion_primc->sub_graph_index = fg_subgraph_map_.at(fg); | |||
| return RET_OK; | |||
| } | |||
| partial_fusion_primc->sub_graph_index = static_cast<int>(meta_graphT->subGraph.size()); | |||
| auto ret = ExportSubgraph(fg, meta_graphT, keep_graph, copy_primitive, partial_cnode); | |||
| if (ret != RET_OK) { | |||
| MS_LOG(ERROR) << "ExportSubgraph failed"; | |||
| return ret; | |||
| } | |||
| return RET_OK; | |||
| } | |||
| std::list<CNodePtr> AnfExporter::InsertCallNode(const FuncGraphPtr &func_graph) { | |||
| auto cnodes = GetOrderedCNodes(func_graph); | |||
| for (auto it = cnodes.begin(); it != cnodes.end();) { | |||
| auto prim = GetValueNode<std::shared_ptr<mindspore::Primitive>>((*it)->input(kPrimIndex)); | |||
| if (prim == nullptr) { | |||
| auto fg = GetValueNode<FuncGraphPtr>((*it)->input(kPrimIndex)); | |||
| if (fg != nullptr) { | |||
| auto partial_cnode = CreatePartialCnode(fg, (*it)); | |||
| auto call_cnode = CreateCallCnode(fg, partial_cnode); | |||
| it++; | |||
| it = cnodes.insert(it, call_cnode); | |||
| continue; | |||
| } else { | |||
| auto call_anf_prim_vnode = GetCallAnfPrim(); | |||
| auto cnode_input = (*it)->inputs(); | |||
| cnode_input.insert(cnode_input.begin(), call_anf_prim_vnode); | |||
| (*it)->set_inputs(cnode_input); | |||
| } | |||
| } | |||
| it++; | |||
| } | |||
| return cnodes; | |||
| } | |||
| int AnfExporter::Anf2Fb(const FuncGraphPtr &func_graph, const std::unique_ptr<schema::MetaGraphT> &meta_graphT, | |||
| const size_t &subgraph_index, const bool &keep_graph, const bool ©_primitive) { | |||
| int ret = RET_OK; | |||
| auto cnodes = GetOrderedCNodes(func_graph); | |||
| auto cnodes = InsertCallNode(func_graph); | |||
| for (const auto &cnode : cnodes) { | |||
| auto prim = GetValueNode<std::shared_ptr<mindspore::Primitive>>(cnode->input(0)); | |||
| auto prim = GetValueNode<std::shared_ptr<mindspore::Primitive>>(cnode->input(kPrimIndex)); | |||
| std::unique_ptr<schema::PrimitiveT> primT; | |||
| if (prim == nullptr) { | |||
| auto fg = GetValueNode<FuncGraphPtr>(cnode->input(0)); | |||
| if (fg != nullptr) { | |||
| auto partial_cnode = CreatePartialCnode(fg, cnode); | |||
| prim = GetValueNode<std::shared_ptr<mindspore::Primitive>>(partial_cnode->input(0)); | |||
| primT = GetPrimitiveT(partial_cnode->input(0)); | |||
| MS_ASSERT(primT != nullptr); | |||
| auto pos = fg_subgraph_map_.find(fg); | |||
| if (pos != fg_subgraph_map_.end()) { | |||
| MS_ASSERT(primT->value.AsPartialFusion() != nullptr); | |||
| primT->value.AsPartialFusion()->sub_graph_index = fg_subgraph_map_.at(fg); | |||
| } else { | |||
| size_t next_subgraph_index = meta_graphT->subGraph.size(); | |||
| MS_ASSERT(primT->value.AsPartialFusion() != nullptr); | |||
| primT->value.AsPartialFusion()->sub_graph_index = next_subgraph_index; | |||
| ret = ExportSubgraph(fg, meta_graphT, keep_graph, copy_primitive, cnode); | |||
| if (ret != RET_OK) { | |||
| MS_LOG(ERROR) << "ExportSubgraph failed"; | |||
| return ret; | |||
| } | |||
| } | |||
| } else { | |||
| MS_LOG(ERROR) << "primitive_c is nullptr"; | |||
| ret = RET_MEMORY_FAILED; | |||
| break; | |||
| } | |||
| MS_LOG(ERROR) << "prim is nullptr."; | |||
| return RET_ERROR; | |||
| } | |||
| RemoveIfDepend(cnode); | |||
| @@ -326,7 +374,6 @@ int AnfExporter::Anf2Fb(const FuncGraphPtr &func_graph, const std::unique_ptr<sc | |||
| continue; | |||
| } | |||
| RemoveIfMakeTuple(cnode); | |||
| auto node = std::make_unique<schema::CNodeT>(); | |||
| if (node == nullptr) { | |||
| MS_LOG(ERROR) << "object failed to be constructed"; | |||
| @@ -335,16 +382,14 @@ int AnfExporter::Anf2Fb(const FuncGraphPtr &func_graph, const std::unique_ptr<sc | |||
| } | |||
| if (opt::CheckPrimitiveType(cnode, prim::kPrimReturn)) { | |||
| node->name = mindspore::lite::kNameReturn; | |||
| ret = SetGraphoutputIndex(cnode, subgraph_index, meta_graphT, node.get()); | |||
| ret = SetSubGraphOutputIndex(cnode, subgraph_index, meta_graphT, node.get()); | |||
| if (ret != RET_OK) { | |||
| MS_LOG(ERROR) << "SetOpOutputN failed"; | |||
| break; | |||
| } | |||
| continue; | |||
| } | |||
| if (primT == nullptr) { | |||
| primT = GetPrimitiveT(cnode->input(0)); | |||
| } | |||
| primT = GetPrimitiveT(cnode->input(kPrimIndex)); | |||
| node->name = cnode->fullname_with_scope(); | |||
| node->primitive = std::move(primT); | |||
| auto device_type_attr = cnode->GetAttr(mindspore::ops::kDeviceType); | |||
| @@ -354,6 +399,13 @@ int AnfExporter::Anf2Fb(const FuncGraphPtr &func_graph, const std::unique_ptr<sc | |||
| MS_LOG(ERROR) << "SetOpInputNode failed"; | |||
| break; | |||
| } | |||
| ret = ExportPartialNode(meta_graphT, keep_graph, copy_primitive, cnode, node); | |||
| if (ret != RET_OK) { | |||
| MS_LOG(ERROR) << "ExportPartialNode failed."; | |||
| return ret; | |||
| } | |||
| SetOpOutputNode(cnode, meta_graphT, node.get()); | |||
| ret = ConvertQuantParam(meta_graphT, prim, node); | |||
| if (ret != RET_OK) { | |||
| @@ -385,18 +437,19 @@ int AnfExporter::ExportSubgraph(const FuncGraphPtr &func_graph, const std::uniqu | |||
| fg_subgraph_map_[func_graph] = subgraph_index; | |||
| auto subgraph_name = func_graph->get_attr("graph_name"); | |||
| MS_ASSERT(subgraph_name != nullptr); | |||
| meta_graphT->subGraph.back()->name = GetValue<std::string>(subgraph_name); | |||
| meta_graphT->subGraph.back()->name = | |||
| "subgraph_" + std::to_string(meta_graphT->subGraph.size() - 1) + "_" + GetValue<std::string>(subgraph_name); | |||
| int ret = Anf2Fb(func_graph, meta_graphT, subgraph_index, keep_graph, copy_primitive); | |||
| auto ret = Anf2Fb(func_graph, meta_graphT, subgraph_index, keep_graph, copy_primitive); | |||
| if (ret != RET_OK) { | |||
| MS_LOG(ERROR) << "Anf2Fb failed"; | |||
| ReturnCode::GetSingleReturnCode()->UpdateReturnCode(ret); | |||
| return ret; | |||
| } | |||
| ret = SetGraphInputIndex(meta_graphT, subgraph_index); | |||
| ret = SetSubGraphInputIndex(meta_graphT, subgraph_index); | |||
| if (ret != RET_OK) { | |||
| MS_LOG(ERROR) << "SetGraphInputIndex failed"; | |||
| MS_LOG(ERROR) << "SetSubGraphInputIndex failed"; | |||
| ReturnCode::GetSingleReturnCode()->UpdateReturnCode(ret); | |||
| return ret; | |||
| } | |||
| @@ -411,6 +464,80 @@ int AnfExporter::ExportSubgraph(const FuncGraphPtr &func_graph, const std::uniqu | |||
| return RET_OK; | |||
| } | |||
| bool AnfExporter::IsCall(const AnfNodePtr node) { | |||
| if (!utils::isa<CNodePtr>(node)) { | |||
| return false; | |||
| } | |||
| auto cnode = node->cast<CNodePtr>(); | |||
| if (cnode->inputs().empty()) { | |||
| return false; | |||
| } | |||
| auto cnode_first_input = cnode->input(kPrimIndex); | |||
| if (utils::isa<CNodePtr>(cnode_first_input)) { | |||
| return true; | |||
| } | |||
| return false; | |||
| } | |||
| bool IsPartialFusion(const AnfNodePtr &node) { | |||
| if (node == nullptr) { | |||
| lite::ReturnCode::GetSingleReturnCode()->UpdateReturnCode(lite::RET_NULL_PTR); | |||
| return false; | |||
| } | |||
| if (node->isa<mindspore::CNode>()) { | |||
| auto cnode = node->cast<CNodePtr>(); | |||
| auto vnode_value = cnode->input(0)->cast<ValueNodePtr>()->value(); | |||
| return GetValue<NamedPtr>(vnode_value)->name() == "PartialFusion"; | |||
| } | |||
| return false; | |||
| } | |||
| FuncGraphPtr GetFinalGraph(const FuncGraphPtr &func_graph) { | |||
| // get output | |||
| CNodePtr call_cnode = nullptr; | |||
| auto fg_output = func_graph->output(); | |||
| if (opt::CheckPrimitiveType(fg_output, prim::kPrimCall)) { | |||
| call_cnode = fg_output->cast<CNodePtr>(); | |||
| } else { | |||
| return func_graph; | |||
| } | |||
| // if call input is switch, meta output is call switch false partial's fg'output! | |||
| auto cnode = call_cnode->input(kFirstDataIndex)->cast<CNodePtr>(); | |||
| if (opt::CheckPrimitiveType(cnode, prim::kPrimSwitch)) { | |||
| auto false_cnode = cnode->input(kSwitchFalseIndex)->cast<CNodePtr>(); | |||
| auto false_fg = GetValueNode<FuncGraphPtr>(false_cnode->input(kFirstDataIndex)); | |||
| return GetFinalGraph(false_fg); | |||
| } else { | |||
| auto fg = GetValueNode<FuncGraphPtr>(cnode->input(kFirstDataIndex)); | |||
| return GetFinalGraph(fg); | |||
| } | |||
| MS_LOG(ERROR) << "Can not find final graph."; | |||
| return nullptr; | |||
| } | |||
| int AnfExporter::SetMetaGraphOutput(const FuncGraphPtr &func_graph, | |||
| const std::unique_ptr<schema::MetaGraphT> &meta_graphT) { | |||
| auto final_fg = GetFinalGraph(func_graph); | |||
| if (final_fg == nullptr) { | |||
| MS_LOG(ERROR) << "GetFinalGraph failed."; | |||
| return RET_ERROR; | |||
| } | |||
| auto final_meta_graph_index = fg_subgraph_map_.at(final_fg); | |||
| auto &final_meta_graph = meta_graphT->subGraph.at(final_meta_graph_index); | |||
| meta_graphT->outputIndex.assign(final_meta_graph->outputIndices.begin(), final_meta_graph->outputIndices.end()); | |||
| for (auto &output_index : meta_graphT->outputIndex) { | |||
| auto &tensor = meta_graphT->allTensors.at(output_index); | |||
| ConverterContext::GetInstance()->UpdateGraphOutputDType(meta_graphT->outputIndex.size(), tensor->dataType); | |||
| } | |||
| return RET_OK; | |||
| } | |||
| schema::MetaGraphT *AnfExporter::Export(const FuncGraphPtr &func_graph, bool keep_graph, bool copy_primitive, | |||
| bool train_flag) { | |||
| this->train_flag_ = train_flag; | |||
| @@ -418,12 +545,18 @@ schema::MetaGraphT *AnfExporter::Export(const FuncGraphPtr &func_graph, bool kee | |||
| auto fmk = func_graph->get_attr("fmk"); | |||
| MS_ASSERT(fmk != nullptr); | |||
| meta_graphT->fmkType = GetValue<int>(fmk); | |||
| graph_inputs_ = func_graph->get_inputs(); | |||
| int ret = ExportSubgraph(func_graph, meta_graphT, keep_graph, copy_primitive); | |||
| if (ret != RET_OK) { | |||
| MS_LOG(ERROR) << "Export subgraph failed."; | |||
| ReturnCode::GetSingleReturnCode()->UpdateReturnCode(ret); | |||
| return nullptr; | |||
| } | |||
| SetMetaGraphOutput(func_graph, meta_graphT); | |||
| return meta_graphT.release(); | |||
| } | |||
| @@ -460,11 +593,21 @@ int AnfExporter::ConvertInputCNodeCommonOp(const AnfNodePtr &input_anode, schema | |||
| int AnfExporter::ConvertInputCNode(const std::shared_ptr<AnfNode> &input_anode, schema::CNodeT *output_cnode) { | |||
| auto input_cnode = utils::cast<CNodePtr>(input_anode); | |||
| auto input_value_node = input_cnode->input(0)->cast<ValueNodePtr>(); | |||
| auto input_value_node = input_cnode->input(kPrimIndex)->cast<ValueNodePtr>(); | |||
| if (input_value_node == nullptr) { | |||
| MS_LOG(ERROR) << "value node is invalid."; | |||
| return RET_ERROR; | |||
| if (!IsCall(input_cnode)) { | |||
| MS_LOG(ERROR) << "value node is invalid."; | |||
| return RET_ERROR; | |||
| } else { | |||
| auto call_anf_prim_vnode = GetCallAnfPrim(); | |||
| auto cnode_input = input_cnode->inputs(); | |||
| cnode_input.insert(cnode_input.begin(), call_anf_prim_vnode); | |||
| input_cnode->set_inputs(cnode_input); | |||
| } | |||
| } | |||
| input_value_node = input_cnode->input(kPrimIndex)->cast<ValueNodePtr>(); | |||
| if (input_value_node->value() == nullptr || !opt::CheckPrimitiveType(input_cnode, prim::kPrimTupleGetItem)) { | |||
| return ConvertInputCNodeCommonOp(input_anode, output_cnode); | |||
| } else { | |||
| @@ -525,6 +668,11 @@ int AnfExporter::ConvertInputParameter(const CNodePtr &cnode, size_t index, cons | |||
| schema_tensor->dims = data_info.shape_; | |||
| schema_tensor->dataType = data_info.data_type_; | |||
| schema_tensor->data = data_info.data_; | |||
| if (!schema_tensor->data.empty()) { | |||
| schema_tensor->nodeType = NodeType_ValueNode; | |||
| } else { | |||
| schema_tensor->nodeType = NodeType_CNode; | |||
| } | |||
| schema_tensor->enableHuffmanCode = data_info.enable_huffman_code_; | |||
| node_id_map_[key] = meta_graphT->allTensors.size(); | |||
| @@ -571,7 +719,6 @@ int AnfExporter::SetOpInputNode(const CNodePtr &cnode, const std::unique_ptr<sch | |||
| MS_LOG(ERROR) << "primitive_c is nullptr: " << cnode->fullname_with_scope(); | |||
| return RET_ERROR; | |||
| } | |||
| bool is_graph_input = false; | |||
| for (size_t i = 1; i < cnode->inputs().size(); i++) { | |||
| auto input_node = cnode->input(i); | |||
| if (input_node->isa<mindspore::CNode>()) { | |||
| @@ -586,8 +733,11 @@ int AnfExporter::SetOpInputNode(const CNodePtr &cnode, const std::unique_ptr<sch | |||
| MS_LOG(ERROR) << "ConvertInputParameter failed"; | |||
| return ret; | |||
| } | |||
| if (!input_node->cast<ParameterPtr>()->has_default()) { | |||
| is_graph_input = true; | |||
| if (IsContain(graph_inputs_, input_node->cast<AnfNodePtr>()) && | |||
| graph_inputs_has_exported_.find(input_node) == graph_inputs_has_exported_.end()) { | |||
| graph_inputs_has_exported_.insert(input_node); | |||
| meta_graphT->inputIndex.push_back(meta_graphT->allTensors.size() - 1); | |||
| meta_graphT->allTensors.back()->format = schema::Format_NHWC; | |||
| } | |||
| } else if (input_node->isa<ValueNode>()) { | |||
| auto ret = ConvertInputValueNode(cnode, i, primitive_c, meta_graphT, fb_node); | |||
| @@ -598,9 +748,6 @@ int AnfExporter::SetOpInputNode(const CNodePtr &cnode, const std::unique_ptr<sch | |||
| } | |||
| } | |||
| fb_node->name = cnode->fullname_with_scope(); | |||
| if (is_graph_input) { | |||
| graph_input_nodes_.emplace_back(fb_node); | |||
| } | |||
| return RET_OK; | |||
| } | |||
| @@ -702,10 +849,24 @@ ValueNodePtr AnfExporter::GetPartialAnfPrim() { | |||
| return partial_anf_prim; | |||
| } | |||
| CNodePtr AnfExporter::CreatePartialCnode(const FuncGraphPtr &fg, AnfNodePtr node) { | |||
| ValueNodePtr AnfExporter::GetCallAnfPrim() { | |||
| auto call_prim = std::make_shared<mindspore::ops::Call>(); | |||
| ValueNodePtr call_anf_prim = NewValueNode(call_prim); | |||
| return call_anf_prim; | |||
| } | |||
| CNodePtr AnfExporter::CreateCallCnode(const FuncGraphPtr &fg, const AnfNodePtr &node) { | |||
| auto call_anf_prim_vnode = GetCallAnfPrim(); | |||
| std::vector<AnfNodePtr> inputs{call_anf_prim_vnode, node}; | |||
| auto cnode = fg->NewCNodeInOrder(inputs); | |||
| cnode->set_func_graph(fg); | |||
| return cnode; | |||
| } | |||
| CNodePtr AnfExporter::CreatePartialCnode(const FuncGraphPtr &fg, const AnfNodePtr &node) { | |||
| if (utils::isa<CNodePtr>(node)) { | |||
| auto cnode = utils::cast<CNodePtr>(node); | |||
| auto primitive_c = GetValueNode<std::shared_ptr<PrimitiveC>>(cnode->input(0)); | |||
| auto primitive_c = GetValueNode<std::shared_ptr<PrimitiveC>>(cnode->input(kPrimIndex)); | |||
| if (primitive_c != nullptr) { | |||
| return cnode; | |||
| } | |||
| @@ -22,6 +22,8 @@ | |||
| #include <vector> | |||
| #include <memory> | |||
| #include <utility> | |||
| #include <set> | |||
| #include <list> | |||
| #include "schema/inner/model_generated.h" | |||
| #include "ops/primitive_c.h" | |||
| #include "ir/func_graph.h" | |||
| @@ -35,6 +37,10 @@ using mindspore::ops::PrimitiveC; | |||
| namespace mindspore::lite { | |||
| constexpr const int kMainGraphIndex = 0; | |||
| constexpr const int kFirstDataIndex = 1; | |||
| constexpr const int kSecondDataIndex = 2; | |||
| constexpr const int kPrimIndex = 0; | |||
| constexpr const int kSwitchFalseIndex = 3; | |||
| class AnfExporter { | |||
| public: | |||
| @@ -55,9 +61,9 @@ class AnfExporter { | |||
| const std::unique_ptr<schema::MetaGraphT> &meta_graphT, schema::CNodeT *op_node); | |||
| int ConvertInputValueNode(const CNodePtr &cnode, size_t index, const PrimitivePtr &primitive, | |||
| const std::unique_ptr<schema::MetaGraphT> &meta_graphT, schema::CNodeT *op_node); | |||
| int SetGraphInputIndex(const std::unique_ptr<schema::MetaGraphT> &meta_graphT, const size_t &subgraph_index); | |||
| int SetGraphoutputIndex(const CNodePtr &cnode, size_t subgraph_index, | |||
| const std::unique_ptr<schema::MetaGraphT> &meta_graphT, schema::CNodeT *return_node); | |||
| int SetSubGraphInputIndex(const std::unique_ptr<schema::MetaGraphT> &meta_graphT, const size_t &subgraph_index); | |||
| int SetSubGraphOutputIndex(const CNodePtr &cnode, size_t subgraph_index, | |||
| const std::unique_ptr<schema::MetaGraphT> &meta_graphT, schema::CNodeT *return_node); | |||
| static int SetPostTrainOutputTensorType(const std::unique_ptr<schema::MetaGraphT> &meta_graph, | |||
| const std::shared_ptr<mindspore::Primitive> &primitive, | |||
| const std::unique_ptr<schema::CNodeT> &dst_node); | |||
| @@ -69,17 +75,25 @@ class AnfExporter { | |||
| int ExportSubgraph(const FuncGraphPtr &func_graph, const std::unique_ptr<schema::MetaGraphT> &meta_graphT, | |||
| bool keep_graph, bool copy_primitive, const std::shared_ptr<AnfNode> &partial_anode = nullptr); | |||
| static ValueNodePtr GetPartialAnfPrim(); | |||
| static CNodePtr CreatePartialCnode(const FuncGraphPtr &fg, AnfNodePtr cnode); | |||
| static std::vector<schema::CNodeT *> GetSubgraphNodes(const std::unique_ptr<schema::MetaGraphT> &meta_graphT, | |||
| const size_t &subgraph_index); | |||
| static ValueNodePtr GetCallAnfPrim(); | |||
| static CNodePtr CreateCallCnode(const FuncGraphPtr &fg, const AnfNodePtr &cnode); | |||
| static CNodePtr CreatePartialCnode(const FuncGraphPtr &fg, const AnfNodePtr &node); | |||
| bool HasExported(const FuncGraphPtr &func_graph); | |||
| int ExportPartialNode(const std::unique_ptr<schema::MetaGraphT> &meta_graphT, const bool &keep_graph, | |||
| const bool ©_primitive, const CNodePtr &partial_cnode, | |||
| const std::unique_ptr<schema::CNodeT> &schema_cnode); | |||
| std::list<CNodePtr> InsertCallNode(const FuncGraphPtr &func_graph); | |||
| int SetMetaGraphOutput(const FuncGraphPtr &func_graph, const std::unique_ptr<schema::MetaGraphT> &meta_graphT); | |||
| bool IsCall(const AnfNodePtr node); | |||
| int CreateNewTensorForParameter(const std::unique_ptr<schema::MetaGraphT> &meta_graphT, const AnfNodePtr &input); | |||
| private: | |||
| std::map<std::pair<AnfNodePtr, int>, int> node_id_map_; | |||
| // Key is a pair of node and its output id. Value is the mapped tensor id of meta_graph. | |||
| std::vector<schema::CNodeT *> graph_input_nodes_; | |||
| std::map<std::pair<AnfNodePtr, int>, int> node_id_map_; | |||
| // The first item is FuncGraph which has been exported, the second item is the subgraph index in meta_graph | |||
| std::map<FuncGraphPtr, int> fg_subgraph_map_; | |||
| std::map<FuncGraphPtr, size_t> fg_subgraph_map_; | |||
| std::vector<AnfNodePtr> graph_inputs_; | |||
| std::set<AnfNodePtr> graph_inputs_has_exported_; | |||
| uint32_t node_idx_ = 0; | |||
| bool train_flag_ = false; | |||
| }; | |||
| @@ -645,6 +645,8 @@ std::string GetModelName(const std::string &modelFile) { | |||
| int SetSubgraphTensorIndices(schema::MetaGraphT *meta_graphT) { | |||
| for (auto &subgraph : meta_graphT->subGraph) { | |||
| std::vector<uint32_t> subgraph_indices{}; | |||
| subgraph_indices.assign(subgraph->inputIndices.begin(), subgraph->inputIndices.end()); | |||
| subgraph_indices.assign(subgraph->outputIndices.begin(), subgraph->outputIndices.end()); | |||
| for (auto &node_idx : subgraph->nodeIndices) { | |||
| auto &node = meta_graphT->nodes.at(node_idx); | |||
| for (auto &input_idx : node->inputIndex) { | |||
| @@ -98,8 +98,6 @@ file(GLOB_RECURSE CONVERTER_SRC RELATIVE ${CMAKE_CURRENT_SOURCE_DIR} | |||
| ../optimizer/graph/infershape_pass.cc | |||
| ../optimizer/graph/slice_prepose_pass.cc | |||
| ../optimizer/graph/mindir_adjust_pass.cc | |||
| ../optimizer/graph/while_pass.cc | |||
| ../optimizer/graph/if_pass.cc | |||
| ../optimizer/graph/control_flow_pass.cc | |||
| ../optimizer/graph/primitive_adjust_pass.cc | |||
| ../optimizer/graph/unify_format_pass.cc | |||
| @@ -52,8 +52,7 @@ | |||
| #include "tools/optimizer/graph/unused_cast_node_remove_pass.h" | |||
| #include "tools/optimizer/graph/infershape_pass.h" | |||
| #include "tools/optimizer/graph/slice_prepose_pass.h" | |||
| #include "tools/optimizer/graph/while_pass.h" | |||
| #include "tools/optimizer/graph/if_pass.h" | |||
| #include "tools/optimizer/graph/control_flow_pass.h" | |||
| #include "tools/optimizer/graph/reduce_same_act_pass.h" | |||
| #include "tools/optimizer/graph/split_one_pass.h" | |||
| #include "tools/optimizer/graph/unify_format_pass.h" | |||
| @@ -190,8 +189,7 @@ int AnfTransform::RunGraphPass(const FuncGraphPtr &old_graph, const converter::F | |||
| auto graph_pm = std::make_shared<opt::PassManager>("anf graph pass manager", true); | |||
| if (config->fmk == lite::converter::FmkType_TFLITE || config->fmk == lite::converter::FmkType_TF || | |||
| config->fmk == lite::converter::FmkType_ONNX) { | |||
| graph_pm->AddPass(std::make_shared<opt::WhilePass>()); | |||
| graph_pm->AddPass(std::make_shared<opt::IfPass>()); | |||
| graph_pm->AddPass(std::make_shared<opt::ControlFlowPass>()); | |||
| } | |||
| auto slice_prepose_pass = std::make_shared<opt::SlicePreposePass>(); | |||
| slice_prepose_pass->SetFmkType(config->fmk); | |||
| @@ -289,19 +287,16 @@ FuncGraphPtr AnfTransform::TransformFuncGraph(const FuncGraphPtr &old_graph, con | |||
| MS_LOG(ERROR) << "config should be specified"; | |||
| return nullptr; | |||
| } | |||
| int status; | |||
| for (auto &fg : func_graphs_) { | |||
| status = RunConstFoldPass(fg, config); | |||
| if (status != RET_OK) { | |||
| MS_LOG(ERROR) << "Run const fold pass failed."; | |||
| return nullptr; | |||
| } | |||
| int status = RunConstFoldPass(old_graph, config); | |||
| if (status != RET_OK) { | |||
| MS_LOG(ERROR) << "Run const fold pass failed."; | |||
| return nullptr; | |||
| } | |||
| status = RunConvertPass(fg, config); | |||
| if (status != RET_OK) { | |||
| MS_LOG(ERROR) << "Run convert pass failed."; | |||
| return nullptr; | |||
| } | |||
| status = RunConvertPass(old_graph, config); | |||
| if (status != RET_OK) { | |||
| MS_LOG(ERROR) << "Run convert pass failed."; | |||
| return nullptr; | |||
| } | |||
| auto format_pass = std::make_shared<opt::UnifyFormatPass>(); | |||
| @@ -318,28 +313,22 @@ FuncGraphPtr AnfTransform::TransformFuncGraph(const FuncGraphPtr &old_graph, con | |||
| } | |||
| auto reduce_act_pass = std::make_shared<opt::ReduceSameActPass>(); | |||
| for (auto &fg : func_graphs_) { | |||
| if (!reduce_act_pass->Run(fg)) { | |||
| MS_LOG(ERROR) << "Run reduce same act pass failed."; | |||
| return nullptr; | |||
| } | |||
| if (!reduce_act_pass->Run(old_graph)) { | |||
| MS_LOG(ERROR) << "Run reduce same act pass failed."; | |||
| return nullptr; | |||
| } | |||
| auto split_one_pass = std::make_shared<opt::SplitOnePass>(); | |||
| for (auto &fg : func_graphs_) { | |||
| if (!split_one_pass->Run(fg)) { | |||
| MS_LOG(ERROR) << "Run split one pass failed."; | |||
| return nullptr; | |||
| } | |||
| if (!split_one_pass->Run(old_graph)) { | |||
| MS_LOG(ERROR) << "Run split one pass failed."; | |||
| return nullptr; | |||
| } | |||
| for (auto &fg : func_graphs_) { | |||
| if (!config->disableFusion) { | |||
| status = RunFusionPass(fg, config); | |||
| if (status != RET_OK) { | |||
| MS_LOG(ERROR) << "Run fusion pass failed."; | |||
| return nullptr; | |||
| } | |||
| if (!config->disableFusion) { | |||
| status = RunFusionPass(old_graph, config); | |||
| if (status != RET_OK) { | |||
| MS_LOG(ERROR) << "Run fusion pass failed."; | |||
| return nullptr; | |||
| } | |||
| } | |||
| @@ -356,57 +345,27 @@ FuncGraphPtr AnfTransform::TransformFuncGraph(const FuncGraphPtr &old_graph, con | |||
| return nullptr; | |||
| } | |||
| for (auto &fg : func_graphs_) { | |||
| status = RunGraphPass(fg, config); | |||
| if (status != RET_OK) { | |||
| MS_LOG(ERROR) << "Run convert pass failed."; | |||
| return nullptr; | |||
| } | |||
| status = RunParallelPass(fg, config); | |||
| if (status != RET_OK) { | |||
| MS_LOG(ERROR) << "Run convert pass failed."; | |||
| return nullptr; | |||
| } | |||
| status = DoQuantize(fg, config); | |||
| if (status != RET_OK) { | |||
| MS_LOG(ERROR) << "Do Quantize failed."; | |||
| return nullptr; | |||
| } | |||
| status = RunGraphPass(old_graph, config); | |||
| if (status != RET_OK) { | |||
| MS_LOG(ERROR) << "Run convert pass failed."; | |||
| return nullptr; | |||
| } | |||
| return old_graph; | |||
| } | |||
| void AnfTransform::GetAllFuncGraph(const FuncGraphPtr &func_graph) { | |||
| if (func_graphs_.find(func_graph) == func_graphs_.end()) { | |||
| func_graphs_.insert(func_graph); | |||
| } else { | |||
| return; | |||
| status = RunParallelPass(old_graph, config); | |||
| if (status != RET_OK) { | |||
| MS_LOG(ERROR) << "Run convert pass failed."; | |||
| return nullptr; | |||
| } | |||
| auto nodes = func_graph->nodes(); | |||
| for (auto &node : nodes) { | |||
| if (IsValueNode<FuncGraph>(node)) { | |||
| auto new_fg = (node->cast<ValueNodePtr>()->value())->cast<FuncGraphPtr>(); | |||
| GetAllFuncGraph(new_fg); | |||
| } | |||
| if (utils::isa<CNodePtr>(node)) { | |||
| auto cnode = node->cast<CNodePtr>(); | |||
| for (auto &input : cnode->inputs()) { | |||
| if (input->isa<ValueNode>()) { | |||
| if (IsValueNode<FuncGraph>(input)) { | |||
| auto new_fg = (input->cast<ValueNodePtr>()->value())->cast<FuncGraphPtr>(); | |||
| GetAllFuncGraph(new_fg); | |||
| } | |||
| } | |||
| } | |||
| } | |||
| status = DoQuantize(old_graph, config); | |||
| if (status != RET_OK) { | |||
| MS_LOG(ERROR) << "Do Quantize failed."; | |||
| return nullptr; | |||
| } | |||
| return old_graph; | |||
| } | |||
| FuncGraphPtr AnfTransform::Transform(const FuncGraphPtr &main_graph, const converter::Flags *config) { | |||
| GetAllFuncGraph(main_graph); | |||
| auto new_graph = TransformFuncGraph(main_graph, config); | |||
| if (new_graph == nullptr) { | |||
| MS_LOG(ERROR) << "optimizer failed."; | |||
| @@ -54,10 +54,6 @@ class AnfTransform { | |||
| static STATUS RunPluginPass(const FuncGraphPtr &old_graph, int position); | |||
| int DoQuantize(const FuncGraphPtr &old_graph, const converter::Flags *config); | |||
| void GetAllFuncGraph(const FuncGraphPtr &func_graph); | |||
| std::set<FuncGraphPtr> func_graphs_{}; | |||
| }; | |||
| } // namespace lite | |||
| } // namespace mindspore | |||
| @@ -27,8 +27,7 @@ | |||
| #include "tools/converter/graphdef_transform.h" | |||
| #include "tools/converter/dump_graph_init.h" | |||
| #include "tools/optimizer/graph/unify_format_pass.h" | |||
| #include "tools/optimizer/graph/while_pass.h" | |||
| #include "tools/optimizer/graph/if_pass.h" | |||
| #include "tools/optimizer/graph/control_flow_pass.h" | |||
| namespace mindspore { | |||
| namespace lite { | |||
| @@ -203,8 +202,7 @@ STATUS ExportModel(const FuncGraphPtr &graph) { | |||
| auto graph_pm = std::make_shared<opt::PassManager>("anf graph pass manager", true); | |||
| if (flags->fmk == lite::converter::FmkType_TFLITE || flags->fmk == lite::converter::FmkType_TF || | |||
| flags->fmk == lite::converter::FmkType_ONNX) { | |||
| graph_pm->AddPass(std::make_shared<opt::WhilePass>()); | |||
| graph_pm->AddPass(std::make_shared<opt::IfPass>()); | |||
| graph_pm->AddPass(std::make_shared<opt::ControlFlowPass>()); | |||
| } | |||
| optimizer->AddPassManager(graph_pm); | |||
| if (optimizer->Optimize(mirror_graph) == nullptr) { | |||
| @@ -153,12 +153,10 @@ int GraphDefTransform::Transform(const converter::Flags &ctx) { | |||
| } | |||
| } | |||
| // controlflow pass | |||
| { | |||
| // init old node indices | |||
| auto old_nodes = GetGraphNodes(); | |||
| Optimizer switch_optimizer; | |||
| switch_optimizer.AddPass(new (std::nothrow) SwitchPass()); | |||
| switch_optimizer.AddPass(new (std::nothrow) IsolatedNodeRemovePass()); | |||
| switch_optimizer.AddPass(new (std::nothrow) SubgraphNodePass(old_nodes)); | |||
| switch_optimizer.AddPass(new (std::nothrow) SubgraphTensorPass()); | |||
| @@ -174,7 +172,6 @@ int GraphDefTransform::Transform(const converter::Flags &ctx) { | |||
| auto old_nodes = GetGraphNodes(); | |||
| nested_loop_optimizer.AddPass(new (std::nothrow) SubgraphNodePass(old_nodes)); | |||
| nested_loop_optimizer.AddPass(new (std::nothrow) TopologicalSortPass()); | |||
| nested_loop_optimizer.AddPass(new (std::nothrow) NestedLoopExpandPass()); | |||
| status = nested_loop_optimizer.Run(graph_defT_); | |||
| if (status != RET_OK && status != RET_NO_CHANGE) { | |||
| MS_LOG(ERROR) << "Run nested_loop_optimizer graphPasses Failed"; | |||
| @@ -108,8 +108,15 @@ STATUS DropoutNodeRemovePass::Run(schema::MetaGraphT *graph) { | |||
| for (size_t i = 0; i < graph->nodes.size(); i++) { | |||
| auto &node = graph->nodes.at(i); | |||
| if (node->primitive == nullptr) { | |||
| MS_LOG(ERROR) << "node->primitive is nullptr, node name: " << node->name; | |||
| return RET_ERROR; | |||
| MS_LOG(INFO) << "node->primitive is nullptr, node name: " << node->name; | |||
| ifChanged = true; | |||
| auto status = IsolateDropoutNode(graph, i); | |||
| if (status != RET_OK) { | |||
| MS_LOG(ERROR) << "IsolateDropoutNode failed, subGraph: " << graph->name << ", node: " << node->name | |||
| << ", error: " << status; | |||
| return status; | |||
| } | |||
| continue; | |||
| } | |||
| if (node->primitive->value.type == schema::PrimitiveType_Dropout) { | |||
| ifChanged = true; | |||
| @@ -49,6 +49,10 @@ STATUS InferQuantParamPass::Run(schema::MetaGraphT *graph) { | |||
| return RET_NULL_PTR; | |||
| } | |||
| if (!node->primitive) { | |||
| continue; | |||
| } | |||
| auto quant_helper = QuantHelperRegister::GetInstance()->GetQuantHelper(node->primitive->value.type); | |||
| quant_helper->NodeQuantPreprocess(graph, node.get()); | |||
| @@ -16,6 +16,8 @@ | |||
| #include "tools/converter/legacy_optimizer/graph/infershape_pass.h" | |||
| #include <vector> | |||
| #include <deque> | |||
| #include <set> | |||
| #include "src/common/common.h" | |||
| #include "src/common/log_adapter.h" | |||
| #include "include/errorcode.h" | |||
| @@ -34,6 +36,9 @@ namespace lite { | |||
| namespace { | |||
| constexpr int DEFAULT_DIM_VALUE = -1; | |||
| constexpr size_t kInitialSize = 1024; | |||
| constexpr int kMainGraphIndex = 0; | |||
| constexpr int kCallInputMinSize = 1; | |||
| constexpr int kSwitchInputMinSize = 3; | |||
| void FreeTensors(std::vector<Tensor *> *input_tensors, std::vector<Tensor *> *output_tensors) { | |||
| if (input_tensors == nullptr) { | |||
| @@ -63,20 +68,23 @@ void FreeTensors(std::vector<Tensor *> *input_tensors, std::vector<Tensor *> *ou | |||
| void ConvertTensorList(MetaGraphT *graph, uint32_t index, bool *convert_succ, std::vector<Tensor *> *lite_tensors) { | |||
| std::unique_ptr<Tensor> lite_tensor = nullptr; | |||
| auto &tensorT = graph->allTensors.at(index); | |||
| auto tensor_shape = tensorT->dims; | |||
| std::vector<int32_t> tensor_shape{}; | |||
| TypeId type = kTypeUnknown; | |||
| std::vector<int> element_shape; | |||
| if (!tensorT->data.empty()) { | |||
| int *data = reinterpret_cast<int *>(tensorT->data.data()); | |||
| type = TypeId(data[0]); | |||
| if (tensorT->data.size() < 8 || (data[1] != 0 && (data[1] + 2) * 4 != static_cast<int>(tensorT->data.size()))) { | |||
| MS_LOG(ERROR) << "tensorlist data length illegal"; | |||
| if (tensorT->data.size() < 8 || (data[1] != 0 && (data[1] + 3) * 4 != static_cast<int>(tensorT->data.size()))) { | |||
| MS_LOG(ERROR) << "tensorlist data length illegal, tensorT name: " << tensorT->name; | |||
| MS_LOG(ERROR) << "(data[1] + 3) * 4: " << (data[1] + 3) * 4; | |||
| MS_LOG(ERROR) << "static_cast<int>(tensorT->data.size()): " << static_cast<int>(tensorT->data.size()); | |||
| *convert_succ = false; | |||
| return; | |||
| } | |||
| for (int j = 0; j < data[1]; ++j) { | |||
| element_shape.push_back(data[j + 2]); | |||
| } | |||
| tensor_shape = {data[data[1] + 2]}; | |||
| } | |||
| lite_tensor = std::make_unique<TensorList>(tensor_shape, element_shape); | |||
| if (lite_tensor == nullptr) { | |||
| @@ -84,7 +92,22 @@ void ConvertTensorList(MetaGraphT *graph, uint32_t index, bool *convert_succ, st | |||
| *convert_succ = false; | |||
| return; | |||
| } | |||
| reinterpret_cast<TensorList *>(lite_tensor.get())->set_tensors_data_type(type); | |||
| auto lite_tensor_list = reinterpret_cast<TensorList *>(lite_tensor.get()); | |||
| std::vector<Tensor *> tensors{}; | |||
| if (!tensor_shape.empty() && tensor_shape.front() == -1) { | |||
| MS_LOG(ERROR) << "tensor_shape is -1, tensor name: " << lite_tensor->tensor_name(); | |||
| } | |||
| if (!tensor_shape.empty() && tensor_shape.front() != -1) { | |||
| for (int32_t i = 0; i < tensor_shape.front(); ++i) { | |||
| auto tensor = new (std::nothrow) Tensor(type, element_shape); | |||
| tensors.emplace_back(tensor); | |||
| } | |||
| } | |||
| lite_tensor_list->set_tensors_data_type(type); | |||
| lite_tensor_list->set_element_shape(element_shape); | |||
| lite_tensor_list->set_tensors(tensors); | |||
| lite_tensors->emplace_back(lite_tensor.release()); | |||
| } | |||
| @@ -221,7 +244,7 @@ void PrintTensorShape(const std::vector<Tensor *> &input_tensors, const std::vec | |||
| } | |||
| #endif | |||
| void SetDataType(MetaGraphT *graph, const std::vector<Tensor *> &output_tensors, std::vector<InferTensor> *tensors_, | |||
| void SetDataType(MetaGraphT *graph, const std::vector<Tensor *> &output_tensors, std::vector<InferTensor> *tensors, | |||
| uint32_t i, uint32_t infer_node_index) { | |||
| auto &node = graph->nodes.at(infer_node_index); | |||
| auto &output_tensor = graph->allTensors.at(node->outputIndex[i]); | |||
| @@ -229,26 +252,112 @@ void SetDataType(MetaGraphT *graph, const std::vector<Tensor *> &output_tensors, | |||
| output_tensor->dataType = output_tensors[i]->data_type(); | |||
| if (output_tensors[i]->data_type() == kObjectTypeTensorType) { | |||
| auto tensor_list = reinterpret_cast<TensorList *>(output_tensors[i]); | |||
| if (output_tensor->data.empty()) { | |||
| output_tensor->data.resize(8, 0); | |||
| int tensor_shape_dims = 0; | |||
| if (!tensor_list->tensors().empty()) { | |||
| tensor_shape_dims = static_cast<int>(tensor_list->tensors().front()->shape().size()); | |||
| } | |||
| auto total_size = (tensor_shape_dims + 3) * sizeof(int); | |||
| output_tensor->data.resize(total_size, 0); | |||
| auto output_tensor_data = reinterpret_cast<int *>(output_tensor->data.data()); | |||
| if (tensor_list->tensors_data_type() == kTypeUnknown) { | |||
| tensors_->at(node->outputIndex[i]).is_inferred_ = false; | |||
| return; | |||
| if (!tensor_list->tensors().empty()) { | |||
| tensor_list->set_tensors_data_type(tensor_list->tensors().front()->data_type()); | |||
| } | |||
| } | |||
| output_tensor->data.at(0) = tensor_list->tensors_data_type(); | |||
| output_tensor_data[0] = tensor_list->tensors_data_type(); | |||
| if (tensor_list->element_shape().empty() && !tensor_list->tensors().empty()) { | |||
| tensor_list->set_element_shape(tensor_list->tensors().front()->shape()); | |||
| } | |||
| output_tensor_data[1] = static_cast<int>(tensor_list->element_shape().size()); | |||
| for (size_t j = 0; j < tensor_list->element_shape().size(); ++j) { | |||
| output_tensor_data[j + 2] = tensor_list->element_shape().at(j); | |||
| } | |||
| output_tensor_data[2 + output_tensor_data[1]] = static_cast<int>(tensor_list->tensors().size()); | |||
| } else if (output_tensors[i]->data_type() == kTypeUnknown) { | |||
| tensors_->at(node->outputIndex[i]).is_inferred_ = false; | |||
| tensors->at(node->outputIndex[i]).is_inferred_ = false; | |||
| return; | |||
| } | |||
| tensors_->at(node->outputIndex[i]).is_inferred_ = true; | |||
| return; | |||
| tensors->at(node->outputIndex[i]).is_inferred_ = true; | |||
| } | |||
| int PartialGraphIndex(const CNodeT *partial_node) { | |||
| return partial_node->primitive->value.AsPartialFusion()->sub_graph_index; | |||
| } | |||
| } // namespace | |||
| STATUS InferShapePass::Run(MetaGraphT *graph) { | |||
| MS_ASSERT(graph != nullptr); | |||
| InitSearchTensor(graph); | |||
| int InferShapePass::CopyPartialShapeToSubGraph(const CNodeT *partial_node, MetaGraphT *graph) { | |||
| auto subgraph_index = PartialGraphIndex(partial_node); | |||
| auto &subgraph = graph->subGraph.at(subgraph_index); | |||
| if (subgraph->inputIndices.size() != partial_node->inputIndex.size()) { | |||
| MS_LOG(ERROR) << "partial node " << partial_node->name << " inputs size: " << partial_node->inputIndex.size() | |||
| << " vs " | |||
| << " subgraph " << subgraph_index << " input size: " << subgraph->inputIndices.size(); | |||
| return RET_PARAM_INVALID; | |||
| } | |||
| for (size_t i = 0; i < partial_node->inputIndex.size(); ++i) { | |||
| auto &subgraph_input = graph->allTensors.at(subgraph->inputIndices[i]); | |||
| auto &partial_input = graph->allTensors.at(partial_node->inputIndex[i]); | |||
| subgraph_input->dataType = partial_input->dataType; | |||
| subgraph_input->dims = partial_input->dims; | |||
| subgraph_input->format = partial_input->format; | |||
| subgraph_input->data.resize(partial_input->data.size(), 0); | |||
| memcpy(subgraph_input->data.data(), partial_input->data.data(), partial_input->data.size()); | |||
| } | |||
| return RET_OK; | |||
| } | |||
| int InferShapePass::RestoreSubGraphInput(const CNodeT *partial_node, MetaGraphT *graph) { | |||
| auto subgraph_index = PartialGraphIndex(partial_node); | |||
| auto &subgraph = graph->subGraph.at(subgraph_index); | |||
| for (size_t i = 0; i < subgraph->inputIndices.size(); ++i) { | |||
| auto &subgraph_input = graph->allTensors.at(subgraph->inputIndices[i]); | |||
| if (subgraph_input->dataType != kObjectTypeTensorType) { | |||
| subgraph_input->data = {}; | |||
| } | |||
| } | |||
| return RET_OK; | |||
| } | |||
| int InferShapePass::InferPartialNode(const CNodeT *partial_node, MetaGraphT *graph) { | |||
| int subgraph_index = PartialGraphIndex(partial_node); | |||
| int ret = CopyPartialShapeToSubGraph(partial_node, graph); | |||
| if (ret != RET_OK) { | |||
| MS_LOG(ERROR) << "CopyPartialShapeToSubGraph failed, ret: " << ret; | |||
| return ret; | |||
| } | |||
| ret = InferSubgraph(subgraph_index, graph); | |||
| if (ret != RET_OK) { | |||
| // not return ret here to infer the following part of graph | |||
| MS_LOG(WARNING) << "InferSubgraph index: " << subgraph_index << " failed, ret: " << ret; | |||
| } | |||
| ret = RestoreSubGraphInput(partial_node, graph); | |||
| if (ret != RET_OK) { | |||
| MS_LOG(ERROR) << "RestoreSubGraphInput failed, ret: " << ret; | |||
| } | |||
| return ret; | |||
| } | |||
| void InferShapePass::InitInferTensor(MetaGraphT *graph) { | |||
| tensors_.resize(graph->allTensors.size()); | |||
| for (size_t i = 0; i < graph->nodes.size(); i++) { | |||
| auto &node = graph->nodes.at(i); | |||
| auto node_input_indexes = node->inputIndex; | |||
| // init in_nodes index | |||
| for (size_t j = 0; j < node_input_indexes.size(); j++) { | |||
| tensors_[node_input_indexes[j]].next_nodes_.push_back(i); | |||
| } | |||
| auto node_output_indexes = node->outputIndex; | |||
| for (size_t j = 0; j < node_output_indexes.size(); j++) { | |||
| tensors_[node_output_indexes[j]].prev_nodes_.push_back(i); | |||
| } | |||
| } | |||
| for (auto input_idx : graph->inputIndex) { | |||
| auto input_tensor = graph->allTensors[input_idx].get(); | |||
| for (auto &dim : input_tensor->dims) { | |||
| @@ -258,18 +367,110 @@ STATUS InferShapePass::Run(MetaGraphT *graph) { | |||
| } | |||
| } | |||
| } | |||
| while (!infer_node_indexes_.empty()) { | |||
| auto infer_node_index = infer_node_indexes_.front(); | |||
| auto &node = graph->nodes.at(infer_node_index); | |||
| auto node_type = node->primitive->value.type; | |||
| if (node_type == PrimitiveType_Switch && node->outputIndex.size() != 2 * (node->inputIndex.size() - 1)) { | |||
| MS_LOG(WARNING) << "do infershape after switch pass."; | |||
| return RET_OK; | |||
| } | |||
| int InferShapePass::InferSwitchNode(const std::unique_ptr<CNodeT> &switch_node, MetaGraphT *graph) { | |||
| if (switch_node->inputIndex.size() < kSwitchInputMinSize) { | |||
| MS_LOG(ERROR) << "switch node input size: " << switch_node->inputIndex.size() << " is less than three."; | |||
| return RET_PARAM_INVALID; | |||
| } | |||
| static std::set<CNodeT *> partial_cnode_inferred{}; | |||
| std::deque<CNodeT *> to_process{}; | |||
| auto true_branch_output_index = switch_node->inputIndex.at(1); | |||
| auto false_branch_output_index = switch_node->inputIndex.at(2); | |||
| for (auto &node : graph->nodes) { | |||
| if (node->primitive->value.type != PrimitiveType_PartialFusion) { | |||
| continue; | |||
| } | |||
| infer_node_indexes_.erase(infer_node_indexes_.begin()); | |||
| if (node_type == PrimitiveType_PartialFusion) { | |||
| if (IsContain(node->outputIndex, true_branch_output_index) && | |||
| partial_cnode_inferred.find(node.get()) == partial_cnode_inferred.end()) { | |||
| to_process.push_back(node.get()); | |||
| partial_cnode_inferred.insert(node.get()); | |||
| break; | |||
| } | |||
| } | |||
| for (auto &node : graph->nodes) { | |||
| if (node->primitive->value.type != PrimitiveType_PartialFusion) { | |||
| continue; | |||
| } | |||
| if (IsContain(node->outputIndex, false_branch_output_index) && | |||
| partial_cnode_inferred.find(node.get()) == partial_cnode_inferred.end()) { | |||
| to_process.push_back(node.get()); | |||
| partial_cnode_inferred.insert(node.get()); | |||
| break; | |||
| } | |||
| } | |||
| while (!to_process.empty()) { | |||
| auto node = to_process.front(); | |||
| to_process.pop_front(); | |||
| int ret = InferPartialNode(node, graph); | |||
| if (ret != RET_OK) { | |||
| MS_LOG(WARNING) << "not support partial infer."; | |||
| return ret; | |||
| } | |||
| } | |||
| return RET_OK; | |||
| } | |||
| int InferShapePass::InferCallNode(const std::unique_ptr<CNodeT> &call_node, MetaGraphT *graph) { | |||
| if (call_node->inputIndex.size() < kCallInputMinSize) { | |||
| MS_LOG(ERROR) << "call node input size: " << call_node->inputIndex.size() << " is less than one."; | |||
| return RET_PARAM_INVALID; | |||
| } | |||
| auto call_first_input_index = call_node->inputIndex.front(); | |||
| bool find_partial = false; | |||
| bool find_switch = false; | |||
| for (auto &node : graph->nodes) { | |||
| if (IsContain(node->outputIndex, call_first_input_index) && | |||
| node->primitive->value.type == PrimitiveType_PartialFusion) { | |||
| find_partial = true; | |||
| int ret = InferPartialNode(node.get(), graph); | |||
| if (ret != RET_OK) { | |||
| MS_LOG(WARNING) << "not support partial infer."; | |||
| return ret; | |||
| } | |||
| break; | |||
| } | |||
| if (IsContain(node->outputIndex, call_first_input_index) && node->primitive->value.type == PrimitiveType_Switch) { | |||
| find_switch = true; | |||
| int ret = InferSwitchNode(node, graph); | |||
| if (ret != RET_OK) { | |||
| MS_LOG(WARNING) << "not support partial infer."; | |||
| return ret; | |||
| } | |||
| break; | |||
| } | |||
| } | |||
| if (!find_partial && !find_switch) { | |||
| MS_LOG(ERROR) << "not able to call partial or call switch."; | |||
| return RET_ERROR; | |||
| } | |||
| return RET_OK; | |||
| } | |||
| int InferShapePass::InferSubgraph(const int &subgraph_index, MetaGraphT *graph) { | |||
| auto infer_node_indexes = InitSearchTensor(subgraph_index, graph); | |||
| if (infer_node_indexes.empty()) { | |||
| MS_LOG(ERROR) << "InitSearchTensor failed."; | |||
| return RET_ERROR; | |||
| } | |||
| while (!infer_node_indexes.empty()) { | |||
| auto infer_node_index = infer_node_indexes.front(); | |||
| auto &node = graph->nodes.at(infer_node_index); | |||
| auto node_type = node->primitive->value.type; | |||
| if (node_type == PrimitiveType_Call) { | |||
| int ret = InferCallNode(node, graph); | |||
| if (ret != RET_OK) { | |||
| MS_LOG(ERROR) << "infer call node failed."; | |||
| return ret; | |||
| } | |||
| } | |||
| infer_node_indexes.erase(infer_node_indexes.begin()); | |||
| auto input_tensors = ConvertTensorToLiteTensor(graph, node->inputIndex); | |||
| auto output_tensors = ConvertTensorToLiteTensor(graph, node->outputIndex); | |||
| if (output_tensors.empty() || output_tensors.size() != node->outputIndex.size() || input_tensors.empty() || | |||
| @@ -287,8 +488,8 @@ STATUS InferShapePass::Run(MetaGraphT *graph) { | |||
| // copy output shape to tensorT | |||
| for (size_t i = 0; i < output_tensors.size(); i++) { | |||
| auto output_dims = output_tensors[i]->shape(); | |||
| auto &output_tensor = graph->allTensors.at(node->outputIndex[i]); | |||
| output_tensor->dims.swap(output_dims); | |||
| auto &output_tensorT = graph->allTensors.at(node->outputIndex[i]); | |||
| output_tensorT->dims.swap(output_dims); | |||
| SetDataType(graph, output_tensors, &tensors_, i, infer_node_index); | |||
| } | |||
| } else { | |||
| @@ -298,44 +499,50 @@ STATUS InferShapePass::Run(MetaGraphT *graph) { | |||
| return RET_INFER_ERR; | |||
| } | |||
| FreeTensors(&input_tensors, &output_tensors); | |||
| AddOutputNodes(graph, infer_node_index); | |||
| AddOutputNodes(graph, &infer_node_indexes, infer_node_index); | |||
| } | |||
| return RET_OK; | |||
| } | |||
| STATUS InferShapePass::Run(MetaGraphT *graph) { | |||
| MS_ASSERT(graph != nullptr); | |||
| InitInferTensor(graph); | |||
| int ret = InferSubgraph(kMainGraphIndex, graph); | |||
| if (ret != RET_OK) { | |||
| MS_LOG(ERROR) << "InferSubgraph index: " << kMainGraphIndex << " failed, ret: " << ret; | |||
| return ret; | |||
| } | |||
| ResetIncorrectTensorShape(graph); | |||
| return RET_OK; | |||
| } | |||
| void InferShapePass::InitSearchTensor(MetaGraphT *graph) { | |||
| std::vector<uint32_t> all_node_output_tensor_indexes = {}; | |||
| tensors_.resize(graph->allTensors.size()); | |||
| for (size_t i = 0; i < graph->nodes.size(); i++) { | |||
| auto &node = graph->nodes.at(i); | |||
| auto node_input_indexes = node->inputIndex; | |||
| // init in_nodes index | |||
| for (size_t j = 0; j < node_input_indexes.size(); j++) { | |||
| tensors_[node_input_indexes[j]].next_nodes_.push_back(i); | |||
| } | |||
| auto node_output_indexes = node->outputIndex; | |||
| for (size_t j = 0; j < node_output_indexes.size(); j++) { | |||
| tensors_[node_output_indexes[j]].prev_nodes_.push_back(i); | |||
| } | |||
| all_node_output_tensor_indexes.insert(all_node_output_tensor_indexes.end(), node_output_indexes.begin(), | |||
| node_output_indexes.end()); | |||
| std::vector<uint32_t> InferShapePass::InitSearchTensor(const int &subgraph_index, MetaGraphT *graph) { | |||
| std::vector<uint32_t> infer_node_indexes = {}; | |||
| if (static_cast<size_t>(subgraph_index) >= graph->subGraph.size()) { | |||
| MS_LOG(ERROR) << "subgraph_index: " << subgraph_index | |||
| << " is larger than graph->subGraph.size(): " << graph->subGraph.size(); | |||
| return {}; | |||
| } | |||
| auto &subgraph = graph->subGraph.at(subgraph_index); | |||
| for (uint32_t i = 0; i < tensors_.size(); i++) { | |||
| if (tensors_[i].prev_nodes_.empty() || IsContain(graph->inputIndex, i) || !graph->allTensors.at(i)->data.empty()) { | |||
| if (IsContain(subgraph->inputIndices, i) || !graph->allTensors.at(i)->data.empty()) { | |||
| tensors_[i].is_inferred_ = true; | |||
| } | |||
| } | |||
| for (size_t i = 0; i < graph->nodes.size(); i++) { | |||
| auto &node = graph->nodes.at(i); | |||
| for (size_t i = 0; i < subgraph->nodeIndices.size(); i++) { | |||
| auto &node = graph->nodes.at(subgraph->nodeIndices.at(i)); | |||
| if (std::all_of(node->inputIndex.begin(), node->inputIndex.end(), | |||
| [&](uint32_t idx) { return tensors_[idx].is_inferred_; })) { | |||
| infer_node_indexes_.push_back(i); | |||
| infer_node_indexes.push_back(subgraph->nodeIndices.at(i)); | |||
| } | |||
| } | |||
| return infer_node_indexes; | |||
| } | |||
| void InferShapePass::AddOutputNodes(MetaGraphT *graph, uint32_t infer_node_index) { | |||
| void InferShapePass::AddOutputNodes(MetaGraphT *graph, std::vector<uint32_t> *infer_node_indexes, | |||
| uint32_t infer_node_index) { | |||
| auto &node = graph->nodes.at(infer_node_index); | |||
| for (size_t i = 0; i < node->outputIndex.size(); i++) { | |||
| auto next_nodes_indexes = tensors_[node->outputIndex[i]].next_nodes_; | |||
| @@ -343,29 +550,20 @@ void InferShapePass::AddOutputNodes(MetaGraphT *graph, uint32_t infer_node_index | |||
| auto &next_node = graph->nodes.at(next_nodes_indexes[j]); | |||
| if (std::any_of(next_node->outputIndex.begin(), next_node->outputIndex.end(), | |||
| [&](uint32_t idx) { return !tensors_[idx].is_inferred_; })) { | |||
| AddNextInferShapeNode(graph, next_nodes_indexes, j); | |||
| AddNextInferShapeNode(graph, infer_node_indexes, next_nodes_indexes, j); | |||
| } | |||
| } | |||
| } | |||
| } | |||
| void InferShapePass::AddNextInferShapeNode(MetaGraphT *graph, std::vector<uint32_t> next_nodes_indexes, size_t index) { | |||
| void InferShapePass::AddNextInferShapeNode(MetaGraphT *graph, std::vector<uint32_t> *infer_node_indexes, | |||
| std::vector<uint32_t> next_nodes_indexes, size_t index) { | |||
| auto &next_node = graph->nodes.at(next_nodes_indexes[index]); | |||
| if (find(infer_node_indexes_.begin(), infer_node_indexes_.end(), next_nodes_indexes[index]) == | |||
| infer_node_indexes_.end()) { | |||
| auto next_node_type = next_node->primitive->value.type; | |||
| if (next_node_type == schema::PrimitiveType_Merge) { | |||
| if (std::all_of(next_node->inputIndex.begin(), next_node->inputIndex.begin() + next_node->inputIndex.size() / 2, | |||
| [&](uint32_t i) { return tensors_[i].is_inferred_; }) || | |||
| std::all_of(next_node->inputIndex.begin() + next_node->inputIndex.size() / 2, next_node->inputIndex.end(), | |||
| [&](uint32_t i) { return tensors_[i].is_inferred_; })) { | |||
| infer_node_indexes_.push_back(next_nodes_indexes[index]); | |||
| } | |||
| } else if (std::all_of(next_node->inputIndex.begin(), next_node->inputIndex.end(), | |||
| [&](uint32_t i) { return tensors_[i].is_inferred_; }) || | |||
| std::any_of(next_node->inputIndex.begin(), next_node->inputIndex.end(), | |||
| [&](uint32_t i) { return graph->allTensors.at(i)->dataType == kObjectTypeTensorType; })) { | |||
| infer_node_indexes_.push_back(next_nodes_indexes[index]); | |||
| if (find(infer_node_indexes->begin(), infer_node_indexes->end(), next_nodes_indexes[index]) == | |||
| infer_node_indexes->end()) { | |||
| if (std::all_of(next_node->inputIndex.begin(), next_node->inputIndex.end(), | |||
| [&](uint32_t i) { return tensors_[i].is_inferred_; })) { | |||
| infer_node_indexes->push_back(next_nodes_indexes[index]); | |||
| } | |||
| } | |||
| } | |||
| @@ -375,9 +573,13 @@ void InferShapePass::ResetIncorrectTensorShape(MetaGraphT *graph) { | |||
| for (auto &node : graph->nodes) { | |||
| auto out_tensors_index = node->outputIndex; | |||
| for (auto index : out_tensors_index) { | |||
| auto shape = graph->allTensors.at(index)->dims; | |||
| auto &tensor = graph->allTensors.at(index); | |||
| auto shape = tensor->dims; | |||
| if (shape == std::vector{-1}) { | |||
| graph->allTensors.at(index)->dims = {}; | |||
| tensor->dims = {}; | |||
| if (tensor->dataType == kObjectTypeTensorType) { | |||
| reinterpret_cast<TensorList *>(tensor.get())->set_tensors({}); | |||
| } | |||
| } | |||
| } | |||
| } | |||
| @@ -44,14 +44,21 @@ class InferShapePass : public GraphPass { | |||
| STATUS Run(MetaGraphT *graph) override; | |||
| private: | |||
| void InitSearchTensor(MetaGraphT *graph); | |||
| void AddNextInferShapeNode(MetaGraphT *graph, std::vector<uint32_t> next_nodes_indexes, size_t index); | |||
| void AddOutputNodes(MetaGraphT *graph, uint32_t infer_node_index); | |||
| std::vector<uint32_t> InitSearchTensor(const int &subgraph_index, MetaGraphT *graph); | |||
| void AddNextInferShapeNode(MetaGraphT *graph, std::vector<uint32_t> *infer_node_indexes, | |||
| std::vector<uint32_t> next_nodes_indexes, size_t index); | |||
| void AddOutputNodes(MetaGraphT *graph, std::vector<uint32_t> *infer_node_indexes, uint32_t infer_node_index); | |||
| void ResetIncorrectTensorShape(MetaGraphT *graph); | |||
| int InferPartialNode(const CNodeT *partial_node, MetaGraphT *graph); | |||
| int InferSwitchNode(const std::unique_ptr<CNodeT> &switch_node, MetaGraphT *graph); | |||
| int InferCallNode(const std::unique_ptr<CNodeT> &call_node, MetaGraphT *graph); | |||
| int CopyPartialShapeToSubGraph(const CNodeT *partial_node, MetaGraphT *graph); | |||
| int RestoreSubGraphInput(const CNodeT *partial_node, MetaGraphT *graph); | |||
| void InitInferTensor(MetaGraphT *graph); | |||
| int InferSubgraph(const int &subgraph_index, MetaGraphT *graph); | |||
| lite::converter::FmkType fmk_type_ = FmkType_TF; | |||
| std::vector<InferTensor> tensors_ = {}; | |||
| std::vector<uint32_t> infer_node_indexes_ = {}; | |||
| }; | |||
| } // namespace lite | |||
| } // namespace mindspore | |||
| @@ -29,11 +29,13 @@ STATUS TopologicalSortPass::Run(schema::MetaGraphT *graph) { | |||
| MS_ASSERT(graph != nullptr); | |||
| std::vector<std::unique_ptr<schema::CNodeT>> new_nodes; | |||
| std::vector<size_t> sinked_tensor_idxes; | |||
| for (auto &subgraph : graph->subGraph) { | |||
| std::copy(subgraph->inputIndices.begin(), subgraph->inputIndices.end(), std::back_inserter(sinked_tensor_idxes)); | |||
| } | |||
| // put all const tensor index into sinked_tensor_idxes | |||
| for (size_t i = 0; i < graph->allTensors.size(); i++) { | |||
| if (graph->allTensors.at(i)->nodeType == NodeType_ValueNode || | |||
| graph->allTensors.at(i)->nodeType == NodeType_Parameter) { | |||
| sinked_tensor_idxes.insert(sinked_tensor_idxes.end(), i); | |||
| if (graph->allTensors.at(i)->nodeType == NodeType_ValueNode) { | |||
| sinked_tensor_idxes.push_back(i); | |||
| } | |||
| } | |||
| auto &old_nodes = graph->nodes; | |||
| @@ -81,17 +83,8 @@ STATUS TopologicalSortPass::Run(schema::MetaGraphT *graph) { | |||
| bool TopologicalSortPass::IsNodeNonDepend(const std::unique_ptr<schema::CNodeT> &node, | |||
| const std::vector<size_t> &sinked_tensor_idxes) { | |||
| MS_ASSERT(node != nullptr); | |||
| if (node->primitive && node->primitive->value.type == schema::PrimitiveType_Merge) { | |||
| auto node_input_index = node->inputIndex; | |||
| MS_ASSERT(node_input_index.size() % 2 == 0); | |||
| return std::all_of(node_input_index.begin(), node_input_index.begin() + node_input_index.size() / 2, | |||
| [&](size_t input_idx) { return IsContain(sinked_tensor_idxes, input_idx); }) || | |||
| std::all_of(node_input_index.begin() + node_input_index.size() / 2, node_input_index.end(), | |||
| [&](size_t input_idx) { return IsContain(sinked_tensor_idxes, input_idx); }); | |||
| } else { | |||
| return std::all_of(node->inputIndex.begin(), node->inputIndex.end(), | |||
| [&](size_t input_idx) { return IsContain(sinked_tensor_idxes, size_t(input_idx)); }); | |||
| } | |||
| return std::all_of(node->inputIndex.begin(), node->inputIndex.end(), | |||
| [&](size_t input_idx) { return IsContain(sinked_tensor_idxes, size_t(input_idx)); }); | |||
| } | |||
| } // namespace lite | |||
| } // namespace mindspore | |||
| @@ -1,128 +0,0 @@ | |||
| /** | |||
| * Copyright 2020 Huawei Technologies Co., Ltd | |||
| * | |||
| * Licensed under the Apache License, Version 2.0 (the "License"); | |||
| * you may not use this file except in compliance with the License. | |||
| * You may obtain a copy of the License at | |||
| * | |||
| * http://www.apache.org/licenses/LICENSE-2.0 | |||
| * | |||
| * Unless required by applicable law or agreed to in writing, software | |||
| * distributed under the License is distributed on an "AS IS" BASIS, | |||
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | |||
| * See the License for the specific language governing permissions and | |||
| * limitations under the License. | |||
| */ | |||
| #include "tools/optimizer/graph/if_pass.h" | |||
| #include <vector> | |||
| #include <memory> | |||
| #include "tools/optimizer/common/gllo_utils.h" | |||
| #include "src/common/log_adapter.h" | |||
| #include "ops/switch.h" | |||
| namespace mindspore::opt { | |||
| ValueNodePtr IfPass::GetSwitchAnfPrim() { | |||
| auto switch_prim = std::make_shared<ops::Switch>(); | |||
| if (switch_prim == nullptr) { | |||
| MS_LOG(ERROR) << "new prim failed."; | |||
| return nullptr; | |||
| } | |||
| ValueNodePtr switch_anf_prim = NewValueNode(switch_prim); | |||
| return switch_anf_prim; | |||
| } | |||
| void IfPass::ReplaceInput(const std::vector<AnfNodePtr> &node_list, const AnfNodePtr &new_input_cnode, | |||
| const std::string ¶_name) { | |||
| for (auto &node : node_list) { | |||
| if (utils::isa<CNodePtr>(node)) { | |||
| auto cnode = utils::cast<CNodePtr>(node); | |||
| for (size_t k = 0; k < cnode->inputs().size(); k++) { | |||
| if (!utils::isa<ParameterPtr>(cnode->input(k))) { | |||
| continue; | |||
| } | |||
| auto para_input = utils::cast<ParameterPtr>(cnode->input(k)); | |||
| if (para_input->name() == para_name) { | |||
| cnode->set_input(k, new_input_cnode); | |||
| } | |||
| } | |||
| } | |||
| } | |||
| } | |||
| bool IfPass::Run(const FuncGraphPtr &graph) { | |||
| auto node_list = TopoSort(graph->get_return()); | |||
| for (auto &node : node_list) { | |||
| if (!utils::isa<CNodePtr>(node)) { | |||
| continue; | |||
| } | |||
| if (!CheckPrimitiveType(node, prim::kPrimIf)) { | |||
| continue; | |||
| } | |||
| auto if_cnode = node->cast<CNodePtr>(); | |||
| MS_ASSERT(if_cnode != nullptr); | |||
| if (if_cnode->inputs().size() < kIfMinInputSize) { | |||
| MS_LOG(ERROR) << "if input is not right."; | |||
| return false; | |||
| } | |||
| // the order is fixed. | |||
| auto then_vnode = if_cnode->input(kIfThenIndex); | |||
| auto else_vnode = if_cnode->input(kIfElseIndex); | |||
| auto cond_vnode = if_cnode->input(kIfCondIndex); | |||
| // else_vnode->cast<ValueNodePtr>()->set_value() | |||
| auto then_fg = GetValueNode<std::shared_ptr<FuncGraph>>(then_vnode); | |||
| auto else_fg = GetValueNode<std::shared_ptr<FuncGraph>>(else_vnode); | |||
| if (then_fg == nullptr || else_fg == nullptr) { | |||
| MS_LOG(ERROR) << "Get value as func_graph failed."; | |||
| lite::ReturnCode::GetSingleReturnCode()->UpdateReturnCode(RET_FAILED); | |||
| return false; | |||
| } | |||
| // create then partial cnode | |||
| std::vector<AnfNodePtr> then_partial_op_inputs{then_vnode}; | |||
| // create else partial cnode | |||
| std::vector<AnfNodePtr> else_partial_op_inputs{else_vnode}; | |||
| // add if op input to then_cnode and else_cnode | |||
| then_partial_op_inputs.insert(then_partial_op_inputs.end(), if_cnode->inputs().begin() + kIfMinInputSize, | |||
| if_cnode->inputs().end()); | |||
| else_partial_op_inputs.insert(else_partial_op_inputs.end(), if_cnode->inputs().begin() + kIfMinInputSize, | |||
| if_cnode->inputs().end()); | |||
| auto then_partial_node = graph->NewCNode(then_partial_op_inputs); | |||
| then_partial_node->set_fullname_with_scope(node->fullname_with_scope() + "-partial-if-then"); | |||
| then_partial_node->set_abstract(then_fg->output()->abstract()); | |||
| auto else_partial_node = graph->NewCNode(else_partial_op_inputs); | |||
| else_partial_node->set_fullname_with_scope(node->fullname_with_scope() + "-partial-if-else"); | |||
| // create switch cnode | |||
| ValueNodePtr switch_anf_primitive = GetSwitchAnfPrim(); | |||
| if (switch_anf_primitive == nullptr) { | |||
| MS_LOG(ERROR) << "GetSwitchAnfPrim failed."; | |||
| return false; | |||
| } | |||
| // insert switch node | |||
| std::vector<AnfNodePtr> switch_op_inputs = {switch_anf_primitive, then_partial_node, else_partial_node, cond_vnode}; | |||
| switch_op_inputs.insert(switch_op_inputs.end(), if_cnode->inputs().begin() + kIfMinInputSize, | |||
| if_cnode->inputs().end()); | |||
| auto switch_cnode = graph->NewCNode(switch_op_inputs); | |||
| switch_cnode->set_fullname_with_scope(node->fullname_with_scope() + "-Switch"); | |||
| switch_cnode->set_abstract(if_cnode->abstract()); | |||
| // create then partial cnode | |||
| auto manager = graph->manager(); | |||
| auto node_users = manager->node_users()[if_cnode]; | |||
| for (auto &node_user : node_users) { | |||
| manager->SetEdge(node_user.first, node_user.second, switch_cnode); | |||
| } | |||
| } | |||
| return true; | |||
| } | |||
| } // namespace mindspore::opt | |||
| @@ -1,44 +0,0 @@ | |||
| /** | |||
| * Copyright 2020 Huawei Technologies Co., Ltd | |||
| * | |||
| * Licensed under the Apache License, Version 2.0 (the "License"); | |||
| * you may not use this file except in compliance with the License. | |||
| * You may obtain a copy of the License at | |||
| * | |||
| * http://www.apache.org/licenses/LICENSE-2.0 | |||
| * | |||
| * Unless required by applicable law or agreed to in writing, software | |||
| * distributed under the License is distributed on an "AS IS" BASIS, | |||
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | |||
| * See the License for the specific language governing permissions and | |||
| * limitations under the License. | |||
| */ | |||
| #ifndef MINDSPORE_LITE_TOOLS_OPTIMIZER_GRAPH_IF_PASS_H_ | |||
| #define MINDSPORE_LITE_TOOLS_OPTIMIZER_GRAPH_IF_PASS_H_ | |||
| #include <string> | |||
| #include <vector> | |||
| #include "schema/inner/model_generated.h" | |||
| #include "tools/converter/converter_flags.h" | |||
| #include "backend/optimizer/common/pass.h" | |||
| using mindspore::lite::converter::FmkType; | |||
| namespace mindspore::opt { | |||
| class IfPass : public Pass { | |||
| public: | |||
| IfPass() : Pass("if_pass") {} | |||
| ~IfPass() override = default; | |||
| bool Run(const FuncGraphPtr &graph) override; | |||
| private: | |||
| static void ReplaceInput(const std::vector<AnfNodePtr> &node_list, const AnfNodePtr &new_input_cnode, | |||
| const std::string ¶_name); | |||
| static ValueNodePtr GetSwitchAnfPrim(); | |||
| const size_t kIfMinInputSize = 4; | |||
| const size_t kIfThenIndex = 1; | |||
| const size_t kIfElseIndex = 2; | |||
| const size_t kIfCondIndex = 3; | |||
| }; | |||
| } // namespace mindspore::opt | |||
| #endif // MINDSPORE_LITE_TOOLS_OPTIMIZER_GRAPH_IF_PASS_H_ | |||
| @@ -1,130 +0,0 @@ | |||
| /** | |||
| * Copyright 2020-2021 Huawei Technologies Co., Ltd | |||
| * | |||
| * Licensed under the Apache License, Version 2.0 (the "License"); | |||
| * you may not use this file except in compliance with the License. | |||
| * You may obtain a copy of the License at | |||
| * | |||
| * http://www.apache.org/licenses/LICENSE-2.0 | |||
| * | |||
| * Unless required by applicable law or agreed to in writing, software | |||
| * distributed under the License is distributed on an "AS IS" BASIS, | |||
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | |||
| * See the License for the specific language governing permissions and | |||
| * limitations under the License. | |||
| */ | |||
| #include "tools/optimizer/graph/while_pass.h" | |||
| #include <vector> | |||
| #include <memory> | |||
| #include "ops/switch.h" | |||
| #include "tools/optimizer/common/gllo_utils.h" | |||
| #include "src/common/log_adapter.h" | |||
| namespace mindspore::opt { | |||
| ValueNodePtr WhilePass::GetSwitchAnfPrim() { | |||
| auto switch_prim = std::make_shared<mindspore::ops::Switch>(); | |||
| ValueNodePtr partial_anf_prim = NewValueNode(switch_prim); | |||
| return partial_anf_prim; | |||
| } | |||
// Rewrites every `While` cnode in `graph` into a Switch cnode whose inputs are
// partial applications of the loop's cond and body subgraphs. The body
// subgraph's output is rewired to feed the cond subgraph so the loop state
// flows back around. Returns false (and logs) on any malformed While node.
bool WhilePass::Run(const FuncGraphPtr &graph) {
  auto node_list = TopoSort(graph->get_return());
  // Monotonic counter so each generated Switch node gets a unique scope name,
  // even across multiple invocations of the pass.
  static int count = 0;
  for (auto &node : node_list) {
    if (!utils::isa<CNodePtr>(node)) {
      continue;
    }
    if (!CheckPrimitiveType(node, prim::kPrimWhile)) {
      continue;
    }
    auto while_cnode = node->cast<CNodePtr>();
    MS_ASSERT(while_cnode != nullptr);
    if (while_cnode->inputs().size() < kWhileMinInputSize) {
      MS_LOG(ERROR) << "while input is not right.";
      return false;
    }
    // the order is fixed: input(1) = cond subgraph, input(2) = body subgraph.
    auto cond_vnode = while_cnode->input(kWhileCondIndex);
    auto body_vnode = while_cnode->input(kWhileBodyIndex);
    auto cond_fg = GetValueNode<std::shared_ptr<FuncGraph>>(cond_vnode);
    auto body_fg = GetValueNode<std::shared_ptr<FuncGraph>>(body_vnode);
    if (cond_fg == nullptr || body_fg == nullptr) {
      MS_LOG(ERROR) << "Get value as func_graph failed.";
      lite::ReturnCode::GetSingleReturnCode()->UpdateReturnCode(RET_FAILED);
      return false;
    }
    // Build partial-application input lists: the subgraph value-node first,
    // then the While node's loop-carried inputs (everything after the fixed
    // prim/cond/body triple, i.e. from index kWhileMinInputSize onward).
    std::vector<AnfNodePtr> cond_partial_op_inputs{cond_vnode};
    std::vector<AnfNodePtr> body_partial_op_inputs{body_vnode};
    cond_partial_op_inputs.insert(cond_partial_op_inputs.end(), while_cnode->inputs().begin() + kWhileMinInputSize,
                                  while_cnode->inputs().end());
    body_partial_op_inputs.insert(body_partial_op_inputs.end(), while_cnode->inputs().begin() + kWhileMinInputSize,
                                  while_cnode->inputs().end());
    // Separate counter for partial-node names (distinct from `count` above).
    static int idx = 0;
    auto cond_partial_node = graph->NewCNode(cond_partial_op_inputs);
    cond_partial_node->set_fullname_with_scope("Partial-while-cond-" + std::to_string(idx));
    cond_partial_node->set_abstract(cond_fg->output()->abstract());
    auto body_partial_node = graph->NewCNode(body_partial_op_inputs);
    body_partial_node->set_fullname_with_scope("Partial-while-body-" + std::to_string(idx));
    idx++;
    // concat body_fg output to cond_fg input
    auto body_output = body_fg->output();
    auto body_output_cnode = utils::cast<CNodePtr>(body_output);
    // Only used to validate that the body output carries a primitive.
    auto prim = GetValueNode<PrimitiveCPtr>(body_output_cnode->input(0));
    if (prim == nullptr) {
      MS_LOG(ERROR) << "Get PrimitiveC of node:" << body_output_cnode->fullname_with_scope() << " failed.";
      return false;
    }
    // concat body to cond: flatten a MakeTuple output into individual
    // arguments, otherwise pass the single output node directly.
    std::vector<AnfNodePtr> body_to_cond_inputs{cond_vnode};
    if (CheckPrimitiveType(body_output_cnode, prim::kPrimMakeTuple)) {
      for (size_t i = 1; i < body_output_cnode->inputs().size(); ++i) {
        body_to_cond_inputs.emplace_back(body_output_cnode->input(i));
      }
    } else {
      body_to_cond_inputs.emplace_back(body_output_cnode);
    }
    // concat body to cond
    auto body_to_cond_cnode = body_fg->NewCNode(body_to_cond_inputs);
    body_to_cond_cnode->set_fullname_with_scope("Partial-while-body-to-cond");
    auto body_fg_manager = body_fg->manager();
    // Replace the body graph's output with the node that feeds cond, then
    // pin it explicitly as the graph output.
    body_fg_manager->Replace(body_fg->output(), body_to_cond_cnode);
    body_fg->set_output(body_to_cond_cnode);
    // Body partial adopts the cond graph's output abstract since its result
    // now flows into cond.
    body_partial_node->set_abstract(cond_fg->output()->abstract());
    // create switch cnode
    ValueNodePtr switch_anf_primitive = GetSwitchAnfPrim();
    if (switch_anf_primitive == nullptr) {
      MS_LOG(ERROR) << "GetSwitchAnfPrim failed.";
      return false;
    }
    // insert switch node
    std::vector<AnfNodePtr> switch_op_inputs = {switch_anf_primitive, cond_partial_node, body_partial_node};
    auto switch_cnode = graph->NewCNode(switch_op_inputs);
    switch_cnode->set_fullname_with_scope("Switch-" + std::to_string(count++));
    // The switch's abstract is a tuple of the (rewired) body output's
    // operand abstracts; the primitive value-node input(0) is skipped by the
    // CNode/Parameter filter below.
    AbstractBasePtrList abstract_list;
    auto body_fg_output_cnode = utils::cast<CNodePtr>(body_fg->output());
    for (auto &cnode : body_fg_output_cnode->inputs()) {
      if (!utils::isa<CNodePtr>(cnode) && !utils::isa<ParameterPtr>(cnode)) {
        continue;
      }
      abstract_list.push_back(cnode->abstract());
    }
    switch_cnode->set_abstract(std::make_shared<abstract::AbstractTuple>(abstract_list));
    // create cond partial cnode
    auto manager = graph->manager();
    if (!manager->Replace(while_cnode, switch_cnode)) {
      MS_LOG(ERROR) << "replace node failed.";
      return false;
    }
  }
  return true;
}
| } // namespace mindspore::opt | |||
| @@ -1,41 +0,0 @@ | |||
| /** | |||
| * Copyright 2020-2021 Huawei Technologies Co., Ltd | |||
| * | |||
| * Licensed under the Apache License, Version 2.0 (the "License"); | |||
| * you may not use this file except in compliance with the License. | |||
| * You may obtain a copy of the License at | |||
| * | |||
| * http://www.apache.org/licenses/LICENSE-2.0 | |||
| * | |||
| * Unless required by applicable law or agreed to in writing, software | |||
| * distributed under the License is distributed on an "AS IS" BASIS, | |||
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | |||
| * See the License for the specific language governing permissions and | |||
| * limitations under the License. | |||
| */ | |||
| #ifndef MINDSPORE_LITE_TOOLS_OPTIMIZER_GRAPH_WHILE_PASS_H_ | |||
| #define MINDSPORE_LITE_TOOLS_OPTIMIZER_GRAPH_WHILE_PASS_H_ | |||
| #include <string> | |||
| #include <vector> | |||
| #include "schema/inner/model_generated.h" | |||
| #include "tools/converter/converter_flags.h" | |||
| #include "backend/optimizer/common/pass.h" | |||
| using mindspore::lite::converter::FmkType; | |||
| namespace mindspore::opt { | |||
// Converter pass that rewrites `While` control-flow cnodes into Switch cnodes
// fed by partial applications of the loop's cond and body subgraphs.
class WhilePass : public Pass {
 public:
  WhilePass() : Pass("while_pass") {}
  ~WhilePass() override = default;
  // Runs the pass over `graph`; returns false on malformed While nodes.
  bool Run(const FuncGraphPtr &graph) override;

 private:
  // Builds a ValueNode wrapping a freshly created Switch primitive.
  static ValueNodePtr GetSwitchAnfPrim();
  // A While cnode carries at least: primitive, cond subgraph, body subgraph;
  // any further inputs are the loop-carried values.
  const size_t kWhileMinInputSize = 3;
  const size_t kWhileCondIndex = 1;
  const size_t kWhileBodyIndex = 2;
};
| } // namespace mindspore::opt | |||
#endif  // MINDSPORE_LITE_TOOLS_OPTIMIZER_GRAPH_WHILE_PASS_H_