* Copyright (c) 2025 Huawei Technologies Co., Ltd.
* This program is free software, you can redistribute it and/or modify it under the terms and conditions of
* CANN Open Software License Agreement Version 2.0 (the "License").
* Please refer to the License for details. You may not use this file except in compliance with the License.
* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, EITHER EXPRESS OR IMPLIED,
* INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, MERCHANTABILITY, OR FITNESS FOR A PARTICULAR PURPOSE.
* See LICENSE in the root of the software repository for the full text of the License.
*/
#include "graph/passes/multi_batch/multi_batch_clone_pass.h"
#include "formats/utils/formats_trans_utils.h"
#include "common/plugin/ge_make_unique_util.h"
#include "common/context/local_context.h"
#include "graph/preprocess/multi_batch_options.h"
#include "graph/utils/node_utils.h"
#include "graph/utils/op_desc_utils.h"
#include "graph/utils/op_desc_utils_ex.h"
#include "graph/utils/tensor_utils.h"
#include "graph/utils/type_utils.h"
#include "common/omg_util/omg_util.h"
#include "graph/manager/graph_var_manager.h"
#include "graph/utils/op_type_utils.h"
#include "common/checker.h"
#include "graph/ge_context.h"
#include "base/err_msg.h"
namespace ge {
namespace {
constexpr uint8_t kDataInIndex = 0;
constexpr uint8_t kDataOutIndex = 0;
constexpr uint8_t kCaseArgIndex = 1;
const int32_t kDivisionConst = 2;
const size_t kNumOfGetnextNode = 1;
const std::string kMultiBatchCaseNode = "ascend_mbatch_shape_case";
const std::string kMultiBatchDataNode = "ascend_mbatch_shape_data";
const std::string kMultiBatchGetDynamicDimsNode = "ascend_mbatch_get_dynamic_dims_node";
const std::string kMultiBatchConstNode = "ascend_mbatch_shape_const";
const std::string kMultiBatchMapIndexNode = "ascend_mbatch_shape_mapindex";
const std::string kMultiBatchNodePostfix = "_ascend_mbatch_batch_";
const char *const kMbatchCaseName = "mbatch-switch-name";
}
inline bool IsGetNextType(const NodePtr &node) {
std::string original_type;
GE_IF_BOOL_EXEC(GetOriginalType(node, original_type) != SUCCESS,
GELOGW("Get original type failed."); return false);
return (original_type == ITERATORV2);
}
Status MultiBatchClonePass::Run(ComputeGraphPtr graph) {
GE_IF_BOOL_EXEC(graph == nullptr,
REPORT_INNER_ERR_MSG("E19999", "Param graph is nullptr, check invalid");
GELOGE(FAILED, "[Check][Param] Original graph is nullptr"); return FAILED);
if (GetLocalOmgContext().is_subgraph_multi_batch) {
GELOGI("SubgraphMultiBatch skip the MultiBatchClonePass.");
return SUCCESS;
}
if (graph->GetParentGraph() != nullptr) {
GELOGD("Subgraph %s skip the MultiBatchClonePass", graph->GetName().c_str());
return SUCCESS;
}
if (!GetLocalOmgContext().need_multi_batch) {
GELOGI("No need to process_multi for no_train graph.");
return SUCCESS;
}
std::vector<NodePtr> data_nodes;
std::vector<NodePtr> getnext_nosink_nodes;
std::vector<NodePtr> getnext_sink_nodes;
bool need_multi_batch = true;
if (multibatch::CheckSequenceOfOptions(graph, data_nodes, getnext_nosink_nodes,
getnext_sink_nodes, need_multi_batch) != SUCCESS) {
GELOGE(PARAM_INVALID, "[Train_Dynamic] [Check][SequenceOfOptions] failed, graph:%s.", graph->GetName().c_str());
return PARAM_INVALID;
}
if (!need_multi_batch) {
GELOGI("No need to process multi for graph %s.", graph->GetName().c_str());
return SUCCESS;
}
if (multibatch::UpdateNameOfInputShape(graph, data_nodes, getnext_nosink_nodes, getnext_sink_nodes) != SUCCESS) {
GELOGE(PARAM_INVALID, "[Train_Dynamic] [Update][Name] Of InputShape failed, graph:%s.", graph->GetName().c_str());
return PARAM_INVALID;
}
if (multibatch::DeleteIdentityInsertByAdapter(graph) != SUCCESS) {
GELOGE(PARAM_INVALID, "[Train_Dynamic] [Delete][IdentityInsertByAdapter] failed, graph:%s.",
graph->GetName().c_str());
return PARAM_INVALID;
}
if (multibatch::InitDynamicParams(batch_shapes_) != SUCCESS) {
GELOGE(PARAM_INVALID, "[Train_Dynamic] [Init][InitDynamicParams] failed, graph:%s.",
graph->GetName().c_str());
return PARAM_INVALID;
}
if (batch_shapes_.empty()) {
GELOGD("There is no multi-batch options, no need clone multi-batch graph");
return SUCCESS;
}
if (multibatch::CheckNegativeCountOfOptions(batch_shapes_) != SUCCESS) {
GELOGE(PARAM_INVALID, "[Train_Dynamic] [Check][Param] Input_shape and dynamic_dims should set correct params.");
return PARAM_INVALID;
}
GELOGD("Begin to run Multi-batch clone on graph: %s", graph->GetName().c_str());
GE_CHK_STATUS_RET(multibatch::CheckDynamicParams(batch_shapes_), "[Check][Params] Invalid multi-batch param");
if (CollectIoNodes(graph) != SUCCESS) {
GELOGE(INTERNAL_ERROR, "[Collect][IoNodes] failed, graph:%s", graph->GetName().c_str());
return INTERNAL_ERROR;
}
if (CheckAndParseDynamicData() != SUCCESS) {
GELOGE(PARAM_INVALID, "[CheckAndParse][DynamicData] failed");
return PARAM_INVALID;
}
GE_ASSERT_SUCCESS(multibatch::UpdateDataShapeByUserInput());
GE_ASSERT_SUCCESS(SortDynamicDimsWithIndex());
(void)AttrUtils::GetStr(graph, ATTR_NAME_SESSION_GRAPH_ID, session_graph_id_);
ComputeGraphPtr branch = MakeShared<ComputeGraph>(graph->GetName());
GE_IF_BOOL_EXEC(branch == nullptr, REPORT_INNER_ERR_MSG("E19999", "New ComputeGraph failed");
GELOGE(OUT_OF_MEMORY, "[New][ComputeGraph] failed"); return OUT_OF_MEMORY);
(void)AttrUtils::SetStr(branch, ATTR_NAME_SESSION_GRAPH_ID, session_graph_id_);
branch->SetGraphID(graph->GetGraphID());
branch->SetSessionID(session_id_);
graph->InValid();
graph->Swap(*branch);
graph->SetNeedIteration(branch->GetNeedIteration());
branch->SetNeedIteration(false);
(void)ge::AttrUtils::SetBool(graph, "_enable_dynamic_batch", true);
GELOGI("Root graph get need_iteration: %s", (graph->GetNeedIteration() ? "true" : "false"));
GE_CHK_STATUS_RET(CreateRootGraph(graph), "[Construct][RootGraph] for graph:%s failed.", graph->GetName().c_str());
GE_CHK_STATUS_RET(CreateOriGraph(branch), "[Construct][OriGraph] for graph:%s failed.", graph->GetName().c_str());
GE_CHK_STATUS_RET(CreateSubgraphs(graph, branch),
"[Construct][Subgraphs] for graph:%s failed.", graph->GetName().c_str());
GE_CHK_STATUS_RET(PruneDirectOutput(graph), "[Prune][DirectOutput] for graph:%s failed.", graph->GetName().c_str());
GE_CHK_STATUS_RET(UpdateSubgraphOutput(), "[Update][SubgraphOutput] failed, graph:%s", graph->GetName().c_str());
GELOGD("MultiBatchClonePass Leave");
return SUCCESS;
}
Status MultiBatchClonePass::CollectIoNodes(const ComputeGraphPtr &graph) {
for (const auto &node : graph->GetDirectNode()) {
if (!GetLocalOmgContext().dynamic_node_type.empty() && IsGetNextType(node)) {
all_data_nodes_.emplace_back(node);
GE_CHK_STATUS_RET(InitParamsOfGetNext(node), "[Init][Params] of %s failed.", node->GetName().c_str());
}
if (OpTypeUtils::IsDataNode(node->GetType())) {
all_data_nodes_.emplace_back(node);
} else if (node->GetType() == CONSTANT || node->GetType() == CONSTANTOP) {
all_const_nodes_.emplace_back(node);
} else if (node->GetType() == NETOUTPUT) {
all_output_nodes_.emplace_back(node);
}
}
if (all_data_nodes_.empty() || all_output_nodes_.size() != 1) {
REPORT_INNER_ERR_MSG("E19999", "Data node num is 0 or output node num != 1, graph:%s, check invalid",
graph->GetName().c_str());
GELOGE(FAILED, "[Check][Param] Data node num is 0 or output node num != 1, graph:%s", graph->GetName().c_str());
return FAILED;
}
int64_t data_index = 0;
size_t getnext_node_count = 0;
for (size_t i = 0; i < all_data_nodes_.size(); ++i) {
if (IsGetNextType(all_data_nodes_[i])) {
getnext_node_count++;
continue;
}
const auto &op_desc = all_data_nodes_[i]->GetOpDesc();
if (!AttrUtils::GetInt(op_desc, ATTR_NAME_INDEX, data_index)) {
(void)AttrUtils::SetInt(op_desc, ATTR_NAME_INDEX, i - getnext_node_count);
}
}
const auto &output = all_output_nodes_[0];
for (size_t i = 0; i < output->GetAllInDataAnchorsSize(); ++i) {
const auto in_anchor = output->GetInDataAnchor(i);
GE_CHECK_NOTNULL(in_anchor);
const auto out_anchor = in_anchor->GetPeerOutAnchor();
GE_CHECK_NOTNULL(out_anchor);
const auto data_node = out_anchor->GetOwnerNode();
if (OpTypeUtils::IsDataNode(data_node->GetType())) {
direct_output_[i] = data_node->GetName();
GE_CHK_GRAPH_STATUS_RET(GraphUtils::RemoveEdge(data_node->GetOutDataAnchor(kDataOutIndex),
output->GetInDataAnchor(i)),
"[Remove][Edge] between %s(index:%u) and %s(index:%zu) failed",
data_node->GetName().c_str(), kDataOutIndex, output->GetName().c_str(), i);
}
}
GELOGD("Data count is %zu, const count is %zu, getnext count is %zu, output count is %zu, direct out count is %zu.",
all_data_nodes_.size(), all_const_nodes_.size(), getnext_node_count, all_output_nodes_.size(),
direct_output_.size());
return SUCCESS;
}
void MultiBatchClonePass::GetDataNodes(std::vector<NodePtr> &data_nodes) const {
if (GetLocalOmgContext().dynamic_node_type == DATA) {
data_nodes = GetLocalOmgContext().data_nodes;
} else {
data_nodes = GetLocalOmgContext().getnext_nosink_nodes;
}
multibatch::SortDataNodesByIndex(data_nodes);
}
int32_t MultiBatchClonePass::FindIndexForInputDims(const std::string &node_name,
const std::vector<std::pair<std::string, std::vector<int64_t>>> &data_name_and_shape) const {
for (size_t i = 0UL; i < data_name_and_shape.size(); i++) {
if (data_name_and_shape[i].first == node_name) {
return static_cast<int32_t>(i);
}
}
return -1;
}
Status MultiBatchClonePass::SortDynamicDimsWithIndex() {
if (GetLocalOmgContext().dynamic_node_type.empty()) {
GELOGI("No need to sort dynamic dims when offline infer.");
GetLocalOmgContext().batch_shapes = batch_shapes_;
return SUCCESS;
}
std::vector<NodePtr> data_nodes;
GetDataNodes(data_nodes);
if (data_nodes.empty()) {
GetLocalOmgContext().batch_shapes = batch_shapes_;
return SUCCESS;
}
auto data_name_and_shape = GetLocalOmgContext().user_input_dims;
std::vector<std::pair<std::string, std::vector<int64_t>>> user_data_name_and_shape;
for (size_t i = 0UL; i < data_nodes.size(); i++) {
int32_t index = FindIndexForInputDims(data_nodes[i]->GetName(), data_name_and_shape);
GE_ASSERT_TRUE(index >= 0LL);
const auto data_shape = data_name_and_shape[index].second;
user_data_name_and_shape.emplace_back(std::make_pair(data_nodes[i]->GetName(), data_shape));
}
GetLocalOmgContext().user_input_dims = user_data_name_and_shape;
const size_t batch_size = batch_shapes_.size();
GE_ASSERT_TRUE(batch_size > 0UL);
batch_shapes_.clear();
batch_shapes_.resize(batch_size);
for (const auto &name_and_shape : user_data_name_and_shape) {
std::string data_name = name_and_shape.first;
const auto iter = data_to_dynamic_info_.find(data_name);
if (iter != data_to_dynamic_info_.end()) {
std::vector<std::vector<int64_t>> &dynamic_dim = iter->second;
for (size_t i = 0UL; i < batch_shapes_.size(); i++) {
GE_ASSERT_TRUE(i < dynamic_dim.size());
for (size_t j = 0UL; j < dynamic_dim[i].size(); j++) {
batch_shapes_[i].emplace_back(dynamic_dim[i][j]);
}
}
}
}
GetLocalOmgContext().batch_shapes = batch_shapes_;
return SUCCESS;
}
Status MultiBatchClonePass::CheckAndParseDynamicData() {
size_t unknown_shape_count = 0;
auto data_name_and_shape = GetLocalOmgContext().user_input_dims;
std::vector<std::string> data_name_order;
for (auto &item : data_name_and_shape) {
data_name_order.push_back(item.first);
}
if (!getnext_sink_dynamic_dims_) {
for (const auto &node : all_data_nodes_) {
auto data_desc = NodeUtils::GetOutputDesc(*node, kDataOutIndex);
auto data_shape = data_desc.GetShape();
auto data_format = data_desc.GetFormat() == Format::FORMAT_NCHW ? "NCHW" :
data_desc.GetFormat() == Format::FORMAT_NHWC ? "NHWC" : "Others";
auto data_name = node->GetName();
const auto &data_shape_dims = data_shape.GetDims();
if (std::all_of(data_shape_dims.begin(), data_shape_dims.end(), [](int64_t val) { return val >= 0; })) {
continue;
}
++unknown_shape_count;
auto iter = find(data_name_order.begin(), data_name_order.end(), data_name);
if (iter == data_name_order.end()) {
if (!GetLocalOmgContext().dynamic_batch_size.empty()) {
bool ret = multibatch::CheckDynamicBatchShape(data_shape_dims, data_name);
GE_IF_BOOL_EXEC(!ret,
GELOGE(PARAM_INVALID, "[Check][DynamicBatchShape] of %s failed.", data_name.c_str());
return PARAM_INVALID);
} else if (!GetLocalOmgContext().dynamic_image_size.empty()) {
bool ret = multibatch::CheckDynamicImageSizeShape(data_shape_dims, data_format);
GE_IF_BOOL_EXEC(!ret,
GELOGE(PARAM_INVALID, "[Check][DynamicImageSizeShape] of %s failed.", data_name.c_str());
return PARAM_INVALID);
} else if (!GetLocalOmgContext().dynamic_dims.empty()) {
REPORT_PREDEFINED_ERR_MSG(
"E10001", std::vector<const char *>({"parameter", "value", "reason"}),
std::vector<const char *>({"--dynamic_dims", data_name.c_str(),
"All dynamic nodes must be set in --input_shape."}));
GELOGE(INTERNAL_ERROR, "[Check][Param] data:%s shape:%s must be set in --input_shape",
node->GetName().c_str(), data_shape.ToString().c_str());
return INTERNAL_ERROR;
}
data_name_and_shape.emplace_back(data_name, data_shape_dims);
}
}
}
auto ret = multibatch::ParserDataToDynamicInfo(batch_shapes_, data_name_and_shape, data_to_dynamic_info_);
GE_CHK_STATUS_RET(ret, "[Parser][DataToDynamicInfo] failed.");
if ((!getnext_sink_dynamic_dims_) && (unknown_shape_count == 0) &&
(GetLocalOmgContext().dynamic_dims.empty())) {
REPORT_PREDEFINED_ERR_MSG("E10040", std::vector<const char *>({}), std::vector<const char *>({}));
GELOGE(PARAM_INVALID, "[Check][Param] Need unknown shape data "
"when user set --dynamic_batch_size, --dynamic_image_size or --dynamic_dims");
return PARAM_INVALID;
}
return SUCCESS;
}
Status MultiBatchClonePass::InitParamsOfGetNext(const NodePtr &node) {
data_count_from_getnext_ = 0;
getnext_sink_dynamic_dims_ = false;
GE_CHECK_NOTNULL(node->GetOpDesc());
data_count_from_getnext_ = node->GetOpDesc()->GetOutputsSize();
if (GetLocalOmgContext().dynamic_node_type == GETNEXT) {
data_count_from_getnext_ = data_count_from_getnext_ / kDivisionConst;
for (size_t i = 0; i < data_count_from_getnext_; ++i) {
GeTensorDesc output_desc = node->GetOpDesc()->GetOutputDesc(i);
GELOGD("The %zu data shape from getnext sink is %s.", i,
ToString(output_desc.GetShape().GetDims()).c_str());
const auto &dims = output_desc.GetShape().GetDims();
if (std::all_of(dims.begin(), dims.end(), [](int64_t val) {return val >= 0; })) {
GELOGD("The %zu data from %s is static.", i, node->GetName().c_str());
} else {
getnext_sink_dynamic_dims_ = true;
GELOGD("Dynamic dims in the pattern of getnext sink.");
}
}
}
if (node->GetOutControlAnchor() != nullptr) {
for (const auto &peer_in_control_anchor : node->GetOutControlAnchor()->GetPeerInControlAnchors()) {
NodePtr next_node = peer_in_control_anchor->GetOwnerNode();
if (next_node->GetType() == CONSTANTOP) {
out_control_nodes_.insert(next_node);
GELOGD("Control edge: %s connect with %s.", node->GetName().c_str(), next_node->GetName().c_str());
}
}
}
return SUCCESS;
}
Status MultiBatchClonePass::GetInputAndOutputNum(uint32_t &input_num, uint32_t &output_num) {
if (all_data_nodes_.size() + all_const_nodes_.size() > UINT32_MAX) {
REPORT_INNER_ERR_MSG("E19999", "Sum of data node size[%zu] and const node size[%zu] exceed UINT32_MAX.",
all_data_nodes_.size(), all_const_nodes_.size());
GELOGE(FAILED, "[Exceed][UINT32_MAX] Sum of data node size[%zu] and const node size[%zu] exceed UINT32_MAX.",
all_data_nodes_.size(), all_const_nodes_.size());
return FAILED;
}
input_num = all_data_nodes_.size() + all_const_nodes_.size();
if (data_count_from_getnext_ != 0) {
if (input_num + data_count_from_getnext_ - kNumOfGetnextNode > UINT32_MAX) {
REPORT_INNER_ERR_MSG("E19999", "Sum[%zu] exceed UINT32_MAX.",
input_num + data_count_from_getnext_ - kNumOfGetnextNode);
GELOGE(FAILED, "[Exceed][UINT32_MAX] Sum[%zu] exceed UINT32_MAX.",
input_num + data_count_from_getnext_ - kNumOfGetnextNode);
return FAILED;
}
input_num = input_num + data_count_from_getnext_ - kNumOfGetnextNode;
}
output_num = all_output_nodes_[0]->GetAllInDataAnchorsSize();
return SUCCESS;
}
Status MultiBatchClonePass::CreateRootGraph(const ComputeGraphPtr &graph) {
GELOGD("Start create root graph of %s.", graph->GetName().c_str());
uint32_t input_num = 0;
uint32_t output_num = 0;
if (GetInputAndOutputNum(input_num, output_num) != SUCCESS) {
GELOGE(FAILED, "[Get][Num] Get input and output num of graph: %s failed.", graph->GetName().c_str());
return FAILED;
}
OpDescBuilder op_builder(kMultiBatchCaseNode, CASE);
op_builder.AddInput("branch_index").AddDynamicInput("input", input_num).AddDynamicOutput("output", output_num);
const OpDescPtr op_desc = op_builder.Build();
if (op_desc == nullptr) {
REPORT_INNER_ERR_MSG("E19999", "Build op:%s(%s) failed", kMultiBatchCaseNode.c_str(), CASE);
GELOGE(OUT_OF_MEMORY, "[Build][Op] %s(%s) failed", kMultiBatchCaseNode.c_str(), CASE);
return OUT_OF_MEMORY;
}
op_desc->RegisterSubgraphIrName("branches", kDynamic);
case_node_ = graph->AddNode(op_desc);
if (case_node_ == nullptr) {
REPORT_INNER_ERR_MSG("E19999", "Add node:%s(%s) to graph:%s failed",
op_desc->GetName().c_str(), op_desc->GetType().c_str(), graph->GetName().c_str());
GELOGE(OUT_OF_MEMORY, "[Add][Node] %s(%s) to graph:%s failed",
op_desc->GetName().c_str(), op_desc->GetType().c_str(), graph->GetName().c_str());
return OUT_OF_MEMORY;
}
uint32_t batch_num = static_cast<uint32_t>(batch_shapes_.size());
if (!AttrUtils::SetInt(op_desc, ATTR_NAME_BATCH_NUM, batch_num)) {
REPORT_INNER_ERR_MSG("E19999", "Set Attr:%s to op:%s(%s) failed", ATTR_NAME_BATCH_NUM.c_str(),
op_desc->GetName().c_str(), op_desc->GetType().c_str());
GELOGE(FAILED, "[Set][Attr] %s to op:%s(%s) failed", ATTR_NAME_BATCH_NUM.c_str(),
op_desc->GetName().c_str(), op_desc->GetType().c_str());
return FAILED;
}
for (uint32_t i = 0; i < batch_num; i++) {
const std::string &attr_name = ATTR_NAME_PRED_VALUE + "_" + std::to_string(i);
if (!AttrUtils::SetListInt(op_desc, attr_name, batch_shapes_[i])) {
REPORT_INNER_ERR_MSG("E19999", "Set Attr:%s to op:%s(%s) failed", attr_name.c_str(),
op_desc->GetName().c_str(), op_desc->GetType().c_str());
GELOGE(FAILED, "[Set][Attr] %s to op:%s(%s) failed", attr_name.c_str(),
op_desc->GetName().c_str(), op_desc->GetType().c_str());
return FAILED;
}
}
std::vector<std::string> data_name_order;
for (auto &item : GetLocalOmgContext().user_input_dims) {
data_name_order.push_back(item.first);
}
if (!AttrUtils::SetListStr(op_desc, ATTR_USER_DESIGNEATE_SHAPE_ORDER, data_name_order)) {
REPORT_INNER_ERR_MSG("E19999", "Set Attr:%s to op:%s(%s) failed", ATTR_USER_DESIGNEATE_SHAPE_ORDER.c_str(),
op_desc->GetName().c_str(), op_desc->GetType().c_str());
GELOGE(FAILED, "[Set][Attr] %s to op:%s(%s) failed", ATTR_USER_DESIGNEATE_SHAPE_ORDER.c_str(),
op_desc->GetName().c_str(), op_desc->GetType().c_str());
return FAILED;
}
if (!AttrUtils::SetBool(op_desc, ATTR_INSERT_BY_MBATCH, true)) {
REPORT_INNER_ERR_MSG("E19999", "Set Attr:%s to op:%s(%s) failed", ATTR_INSERT_BY_MBATCH.c_str(),
op_desc->GetName().c_str(), op_desc->GetType().c_str());
GELOGE(INTERNAL_ERROR, "[Set][Attr] %s to op:%s(%s) failed", ATTR_INSERT_BY_MBATCH.c_str(),
op_desc->GetName().c_str(), op_desc->GetType().c_str());
return INTERNAL_ERROR;
}
GE_CHK_STATUS_RET(multibatch::StampDynamicType(op_desc),
"[Call][StampDynamicType] for op:%s(%s) failed",
op_desc->GetName().c_str(), op_desc->GetType().c_str());
GE_CHK_STATUS_RET(CreateIndexNode(graph), "[Create][IndexNode] for graph:%s failed", graph->GetName().c_str());
GE_CHK_STATUS_RET(CreateInputNode(graph), "[Create][InputNode] for graph:%s failed", graph->GetName().c_str());
GE_CHK_STATUS_RET(CreateConstNode(graph), "[Create][ConstNode] for graph:%s failed", graph->GetName().c_str());
GE_CHK_STATUS_RET(CreateOutputNode(graph), "[Create][OutputNode] for graph:%s failed", graph->GetName().c_str());
return SUCCESS;
}
Status MultiBatchClonePass::CreateIndexDataNode(const ComputeGraphPtr &graph, NodePtr &shape_node) {
const OpDescPtr data_desc = MakeShared<OpDesc>(kMultiBatchDataNode, DATA);
if (data_desc == nullptr) {
REPORT_INNER_ERR_MSG("E19999", "New OpDesc failed");
GELOGE(OUT_OF_MEMORY, "[New][OpDesc] failed");
return FAILED;
}
GeTensorDesc data_tensor(GeShape({static_cast<int64_t>(batch_shapes_[0].size())}), FORMAT_ND, DT_INT32);
data_tensor.SetOriginShape(ge::GeShape(data_tensor.GetShape().GetDims()));
if (data_desc->AddInputDesc(data_tensor) != GRAPH_SUCCESS) {
REPORT_INNER_ERR_MSG("E19999", "Add input desc to op:%s(%s) failed",
data_desc->GetName().c_str(), data_desc->GetType().c_str());
GELOGE(FAILED, "[Add][InputDesc] to op:%s(%s) failed",
data_desc->GetName().c_str(), data_desc->GetType().c_str());
return FAILED;
}
if (data_desc->AddOutputDesc(data_tensor) != GRAPH_SUCCESS) {
REPORT_INNER_ERR_MSG("E19999", "Add output desc to op:%s(%s) failed.",
data_desc->GetName().c_str(), data_desc->GetType().c_str());
GELOGE(FAILED, "[Add][OutputDesc] to op:%s(%s) failed",
data_desc->GetName().c_str(), data_desc->GetType().c_str());
return FAILED;
}
size_t data_index = all_data_nodes_.size();
data_index = data_count_from_getnext_ != 0 ? data_index - kNumOfGetnextNode : data_index;
(void)AttrUtils::SetInt(data_desc, ATTR_NAME_INDEX, data_index);
(void)AttrUtils::SetBool(data_desc, "_is_multi_batch_shape_data", true);
(void)AttrUtils::SetBool(data_desc, ATTR_INSERT_BY_MBATCH, true);
(void)AttrUtils::SetStr(data_desc, "_ge_attr_lowering_func", "multi_batch_shape_data");
(void)AttrUtils::SetBool(data_desc, ATTR_NAME_HOST_TENSOR, true);
shape_node = graph->AddNode(data_desc);
if (shape_node == nullptr) {
REPORT_INNER_ERR_MSG("E19999", "Add node:%s(%s) to graph:%s failed",
data_desc->GetName().c_str(), data_desc->GetType().c_str(), graph->GetName().c_str());
GELOGE(OUT_OF_MEMORY, "[Add][Node] %s(%s) to graph:%s failed",
data_desc->GetName().c_str(), data_desc->GetType().c_str(), graph->GetName().c_str());
return OUT_OF_MEMORY;
}
return SUCCESS;
}
Status MultiBatchClonePass::CreateIndexConstNode(const ComputeGraphPtr &graph, NodePtr &node) {
const OpDescPtr const_desc = MakeShared<OpDesc>(kMultiBatchConstNode, CONSTANT);
if (const_desc == nullptr) {
REPORT_INNER_ERR_MSG("E19999", "New OpDesc failed");
GELOGE(OUT_OF_MEMORY, "[New][OpDesc] failed");
return FAILED;
}
int64_t count = static_cast<int64_t>(batch_shapes_.size() * batch_shapes_[0].size());
std::unique_ptr<int32_t[]> addr(new (std::nothrow) int32_t[count]);
GE_CHECK_NOTNULL(addr);
size_t i = 0;
for (auto &batch_shape : batch_shapes_) {
for (int64_t dim : batch_shape) {
addr[i++] = static_cast<int32_t>(dim);
}
}
GeTensorDesc const_tensor(GeShape({count}), FORMAT_ND, DT_INT32);
const_tensor.SetOriginShape(const_tensor.GetShape());
GeTensor tensor(const_tensor);
(void)tensor.SetData(reinterpret_cast<uint8_t *>(addr.get()), count * sizeof(int32_t));
if (!AttrUtils::SetTensor(const_desc, ATTR_NAME_WEIGHTS, tensor)) {
REPORT_INNER_ERR_MSG("E19999", "Set Attr:%s to op:%s(%s) failed", ATTR_NAME_WEIGHTS.c_str(),
const_desc->GetName().c_str(), const_desc->GetType().c_str());
GELOGE(OUT_OF_MEMORY, "[Set][Attr] %s to op:%s(%s) failed", ATTR_NAME_WEIGHTS.c_str(),
const_desc->GetName().c_str(), const_desc->GetType().c_str());
return FAILED;
}
if (const_desc->AddOutputDesc(const_tensor) != GRAPH_SUCCESS) {
REPORT_INNER_ERR_MSG("E19999", "Add output desc to op:%s(%s) failed.",
const_desc->GetName().c_str(), const_desc->GetType().c_str());
GELOGE(OUT_OF_MEMORY, "[Add][OutputDesc] to op:%s(%s) failed",
const_desc->GetName().c_str(), const_desc->GetType().c_str());
return FAILED;
}
node = graph->AddNode(const_desc);
if (node == nullptr) {
REPORT_INNER_ERR_MSG("E19999", "Add node:%s(%s) to graph:%s failed",
const_desc->GetName().c_str(), const_desc->GetType().c_str(), graph->GetName().c_str());
GELOGE(OUT_OF_MEMORY, "[Add][Node] %s(%s) to graph:%s failed",
const_desc->GetName().c_str(), const_desc->GetType().c_str(), graph->GetName().c_str());
return OUT_OF_MEMORY;
}
return SUCCESS;
}
Status MultiBatchClonePass::CreateIndexNode(const ComputeGraphPtr &graph) {
if (!getnext_sink_dynamic_dims_) {
GE_CHK_STATUS_RET(CreateIndexDataNode(graph, shape_node_),
"[Create][IndexDataNode] failed, graph:%s", graph->GetName().c_str());
} else {
GE_CHK_STATUS_RET(CreateGetDynamicDimsNode(graph, shape_node_),
"[Create][GetDynamicDimsNode] failed, graph:%s", graph->GetName().c_str());
}
NodePtr const_node;
GE_CHK_STATUS_RET(CreateIndexConstNode(graph, const_node),
"[Create][ConstNode] failed, graph:%s", graph->GetName().c_str());
GELOGD("Shape node name is %s, type is %s, const node name is %s.", shape_node_->GetName().c_str(),
shape_node_->GetType().c_str(), const_node->GetName().c_str());
OpDescBuilder op_builder(kMultiBatchMapIndexNode, "MapIndex");
GE_CHECK_NOTNULL(shape_node_->GetOpDesc());
GE_CHECK_NOTNULL(const_node->GetOpDesc());
op_builder.AddInput("x", shape_node_->GetOpDesc()->GetOutputDesc(0))
.AddInput("data_seq", const_node->GetOpDesc()->GetOutputDesc(0))
.AddOutput("y", GeTensorDesc(GeShape(), FORMAT_ND, DT_INT32));
const OpDescPtr op_desc = op_builder.Build();
if (op_desc == nullptr) {
REPORT_INNER_ERR_MSG("E19999", "Build op:%s(%s) failed", kMultiBatchMapIndexNode.c_str(), "MapIndex");
GELOGE(OUT_OF_MEMORY, "[Build][Op] %s(MapIndex) failed", kMultiBatchMapIndexNode.c_str());
return FAILED;
}
NodePtr index_node = graph->AddNode(op_desc);
if (index_node == nullptr) {
REPORT_INNER_ERR_MSG("E19999", "Add node:%s(%s) to graph:%s failed",
op_desc->GetName().c_str(), op_desc->GetType().c_str(), graph->GetName().c_str());
GELOGE(OUT_OF_MEMORY, "[Add][Node] %s(%s) to graph:%s failed",
op_desc->GetName().c_str(), op_desc->GetType().c_str(), graph->GetName().c_str());
return OUT_OF_MEMORY;
}
GE_CHK_STATUS_RET(AddAttrForGetDynamicDims(shape_node_), "[Add][Attr] for %s failed.",
shape_node_->GetName().c_str());
if (GraphUtils::AddEdge(shape_node_->GetOutDataAnchor(0), index_node->GetInDataAnchor(0)) != GRAPH_SUCCESS) {
REPORT_INNER_ERR_MSG("E19999", "Add edge between op:%s(%s)(index:0) and op:%s(%s)(index:0) failed",
shape_node_->GetName().c_str(), shape_node_->GetType().c_str(),
index_node->GetName().c_str(), index_node->GetType().c_str());
GELOGE(FAILED, "[Add][Edge] between op:%s(%s)(index:0) and op:%s(%s)(index:0) failed",
shape_node_->GetName().c_str(), shape_node_->GetType().c_str(),
index_node->GetName().c_str(), index_node->GetType().c_str());
return FAILED;
}
if (GraphUtils::AddEdge(const_node->GetOutDataAnchor(0), index_node->GetInDataAnchor(1)) != GRAPH_SUCCESS) {
REPORT_INNER_ERR_MSG("E19999", "Add edge between op:%s(%s)(index:0) and op:%s(%s)(index:1) failed",
const_node->GetName().c_str(), const_node->GetType().c_str(),
index_node->GetName().c_str(), index_node->GetType().c_str());
GELOGE(FAILED, "[Add][Edge] between node:%s to MapIndex:%s", const_node->GetName().c_str(),
index_node->GetName().c_str());
return FAILED;
}
if (GraphUtils::AddEdge(index_node->GetOutDataAnchor(0), case_node_->GetInDataAnchor(0)) != GRAPH_SUCCESS) {
REPORT_INNER_ERR_MSG("E19999", "Add edge between op:%s(%s)(index:0) and op:%s(%s)(index:0) failed",
index_node->GetName().c_str(), index_node->GetType().c_str(),
case_node_->GetName().c_str(), case_node_->GetType().c_str());
GELOGE(FAILED, "[Add][Edge] between op:%s(%s)(index:0) and op:%s(%s)(index:0) failed",
index_node->GetName().c_str(), index_node->GetType().c_str(),
case_node_->GetName().c_str(), case_node_->GetType().c_str());
return FAILED;
}
return SUCCESS;
}
Status MultiBatchClonePass::CreateGetDynamicDimsNode(const ComputeGraphPtr &graph, NodePtr &shape_node) {
const OpDescPtr data_desc = MakeShared<OpDesc>(kMultiBatchGetDynamicDimsNode, GETDYNAMICDIMS);
if (data_desc == nullptr) {
REPORT_INNER_ERR_MSG("E19999", "New OpDesc failed");
GELOGE(OUT_OF_MEMORY, "[New][OpDesc] failed");
return OUT_OF_MEMORY;
}
for (size_t i = 0; i < GetLocalOmgContext().user_input_dims.size(); ++i) {
size_t input_shape_dims = GetLocalOmgContext().user_input_dims.at(i).second.size();
if (input_shape_dims == 1 && GetLocalOmgContext().user_input_dims.at(i).second.at(0) == 0) {
GeTensorDesc tensor_desc;
tensor_desc.SetFormat(FORMAT_ND);
tensor_desc.SetDataType(DT_INT32);
auto ret = data_desc->AddInputDesc(tensor_desc);
GE_IF_BOOL_EXEC(ret != GRAPH_SUCCESS,
REPORT_INNER_ERR_MSG("E19999", "Add input desc to op:%s(%s) failed",
data_desc->GetName().c_str(), data_desc->GetType().c_str());
GELOGE(INTERNAL_ERROR, "[Add][InputDesc] to op:%s(%s) failed",
data_desc->GetName().c_str(), data_desc->GetType().c_str());
return FAILED);
continue;
}
GeTensorDesc tensor_desc(GeShape({static_cast<int32_t>(input_shape_dims)}), FORMAT_ND, DT_INT32);
tensor_desc.SetOriginShape(ge::GeShape(tensor_desc.GetShape().GetDims()));
auto ret = data_desc->AddInputDesc(tensor_desc);
GE_IF_BOOL_EXEC(ret != GRAPH_SUCCESS,
REPORT_INNER_ERR_MSG("E19999", "Add input desc to op:%s(%s) failed",
data_desc->GetName().c_str(), data_desc->GetType().c_str());
GELOGE(INTERNAL_ERROR, "[Add][InputDesc] to op:%s(%s) failed",
data_desc->GetName().c_str(), data_desc->GetType().c_str());
return FAILED);
}
GeTensorDesc tensor_desc(GeShape({static_cast<int32_t>(batch_shapes_.at(0).size())}), FORMAT_ND, DT_INT32);
tensor_desc.SetOriginShape(ge::GeShape(tensor_desc.GetShape().GetDims()));
auto ret = data_desc->AddOutputDesc(tensor_desc);
GE_IF_BOOL_EXEC(ret != GRAPH_SUCCESS,
REPORT_INNER_ERR_MSG("E19999", "Add output desc to op:%s(%s) failed",
data_desc->GetName().c_str(), data_desc->GetType().c_str());
GELOGE(INTERNAL_ERROR, "[Add][OutputDesc] to op:%s(%s) failed",
data_desc->GetName().c_str(), data_desc->GetType().c_str());
return FAILED);
(void)AttrUtils::SetBool(data_desc, ATTR_INSERT_BY_MBATCH, true);
shape_node = graph->AddNode(data_desc);
if (shape_node == nullptr) {
REPORT_INNER_ERR_MSG("E19999", "Add node:%s(%s) to graph:%s failed",
data_desc->GetName().c_str(), data_desc->GetType().c_str(), graph->GetName().c_str());
GELOGE(OUT_OF_MEMORY, "[Add][Node] %s(%s) to graph:%s failed",
data_desc->GetName().c_str(), data_desc->GetType().c_str(), graph->GetName().c_str());
return OUT_OF_MEMORY;
}
return SUCCESS;
}
Status MultiBatchClonePass::AddAttrForGetDynamicDims(const NodePtr &shape_node) const {
if (!getnext_sink_dynamic_dims_) {
GELOGD("No need to add attr when not insert get dynamic dims node.");
return SUCCESS;
}
GELOGD("Add attr for %s, type is %s", shape_node->GetName().c_str(), shape_node->GetType().c_str());
if (!AttrUtils::SetInt(shape_node->GetOpDesc(), ATTR_GETNEXT_SINK_DATA_COUNT, data_count_from_getnext_)) {
REPORT_INNER_ERR_MSG("E19999", "Set Attr:%s to op:%s(%s) failed", ATTR_GETNEXT_SINK_DATA_COUNT.c_str(),
shape_node->GetName().c_str(), shape_node->GetType().c_str());
GELOGE(INTERNAL_ERROR, "[Set][Attr] %s to op:%s(%s) failed", ATTR_GETNEXT_SINK_DATA_COUNT.c_str(),
shape_node->GetName().c_str(), shape_node->GetType().c_str());
return INTERNAL_ERROR;
}
std::vector<int64_t> shape_info;
for (size_t i = 0; i < GetLocalOmgContext().user_input_dims.size(); ++i) {
if (GetLocalOmgContext().user_input_dims.at(i).second.size() == 1 &&
GetLocalOmgContext().user_input_dims.at(i).second.at(0) == 0) {
shape_info.emplace_back(0);
continue;
}
shape_info.emplace_back(GetLocalOmgContext().user_input_dims.at(i).second.size());
for (size_t j = 0; j < GetLocalOmgContext().user_input_dims.at(i).second.size(); ++j) {
shape_info.emplace_back(GetLocalOmgContext().user_input_dims.at(i).second.at(j));
}
}
if (!AttrUtils::SetListInt(shape_node->GetOpDesc(), ATTR_GETNEXT_SINK_SHAPE_INFO, shape_info)) {
REPORT_INNER_ERR_MSG("E19999", "Set Attr:%s to op:%s(%s) failed", ATTR_GETNEXT_SINK_SHAPE_INFO.c_str(),
shape_node->GetName().c_str(), shape_node->GetType().c_str());
GELOGE(INTERNAL_ERROR, "[Set][Attr] %s to op:%s(%s) failed", ATTR_GETNEXT_SINK_SHAPE_INFO.c_str(),
shape_node->GetName().c_str(), shape_node->GetType().c_str());
return INTERNAL_ERROR;
}
return SUCCESS;
}
Status MultiBatchClonePass::LinkGetNextToGetDynamicDims(const NodePtr &getnext_node, const NodePtr &shape_node) const {
GELOGD("Start relink shape anchor of %s to %s.", getnext_node->GetName().c_str(), shape_node->GetName().c_str());
size_t input_index = 0;
size_t data_count = getnext_node->GetAllOutDataAnchors().size() / kDivisionConst;
for (size_t out_index = data_count; out_index < getnext_node->GetAllOutDataAnchors().size(); ++out_index,
++input_index) {
GELOGD("Start add %s of %zu out_anchor to %s of %zu in_anchor.", getnext_node->GetName().c_str(), out_index,
shape_node->GetName().c_str(), input_index);
auto out_data_anchor = getnext_node->GetOutDataAnchor(out_index);
auto ret = GraphUtils::AddEdge(out_data_anchor, shape_node->GetInDataAnchor(input_index));
GE_IF_BOOL_EXEC(ret != GRAPH_SUCCESS,
REPORT_INNER_ERR_MSG("E19999", "Add edge between op:%s(%s)(index:%zu) and op:%s(%s)(index:%zu) failed",
getnext_node->GetName().c_str(), getnext_node->GetType().c_str(), out_index,
shape_node->GetName().c_str(), shape_node->GetType().c_str(), input_index);
GELOGE(INTERNAL_ERROR, "[Add][Edge] between op:%s(%s)(index:%zu) and op:%s(%s)(index:%zu) failed",
getnext_node->GetName().c_str(), getnext_node->GetType().c_str(), out_index,
shape_node->GetName().c_str(), shape_node->GetType().c_str(), input_index);
return INTERNAL_ERROR);
}
return SUCCESS;
}
Status MultiBatchClonePass::LinkGetDynamicDimsToNetOutput(const NodePtr &output_node) {
if (getnext_sink_dynamic_dims_) {
GELOGD("Start link %s to %s.", shape_node_->GetName().c_str(), output_node->GetName().c_str());
size_t input_index = output_node->GetAllInDataAnchors().size();
if (NodeUtils::AppendInputAnchor(output_node, input_index + 1) != GRAPH_SUCCESS) {
REPORT_INNER_ERR_MSG("E19999", "Append input anchor to op:%s(%s) failed, size:%zu",
output_node->GetName().c_str(), output_node->GetType().c_str(), input_index + 1);
GELOGE(INTERNAL_ERROR, "[Append][InputAnchor] to op:%s(%s) failed, size:%zu",
output_node->GetName().c_str(), output_node->GetType().c_str(), input_index + 1);
return INTERNAL_ERROR;
}
auto ret = GraphUtils::AddEdge(shape_node_->GetOutDataAnchor(kDataOutIndex),
output_node->GetInDataAnchor(input_index));
GE_IF_BOOL_EXEC(ret != GRAPH_SUCCESS,
REPORT_INNER_ERR_MSG("E19999", "Add edge between op:%s(%s)(index:%d) and op:%s(%s)(index:%zu) failed",
shape_node_->GetName().c_str(), shape_node_->GetType().c_str(), kDataOutIndex,
output_node->GetName().c_str(), output_node->GetType().c_str(), input_index);
GELOGE(INTERNAL_ERROR, "[Add][Edge] between op:%s(%s)(index:%d) and op:%s(%s)(index:%zu) failed",
shape_node_->GetName().c_str(), shape_node_->GetType().c_str(), kDataOutIndex,
output_node->GetName().c_str(), output_node->GetType().c_str(), input_index);
return INTERNAL_ERROR);
if (!AttrUtils::SetBool(output_node->GetOpDesc(), ATTR_GETNEXT_SINK_DYNMAIC, true)) {
REPORT_INNER_ERR_MSG("E19999", "Set Attr:%s to op:%s(%s) failed", ATTR_GETNEXT_SINK_DYNMAIC.c_str(),
output_node->GetName().c_str(), output_node->GetType().c_str());
GELOGE(INTERNAL_ERROR, "[Set][Attr] %s to op:%s(%s) failed", ATTR_GETNEXT_SINK_DYNMAIC.c_str(),
output_node->GetName().c_str(), output_node->GetType().c_str());
return INTERNAL_ERROR;
}
}
return SUCCESS;
}
Status MultiBatchClonePass::NormalizeDataType(const NodePtr &node) const {
if (OpTypeUtils::IsDataNode(node->GetType()) && (node->GetType() != DATA)) {
const auto ref_data_desc = node->GetOpDesc();
GE_ASSERT_NOTNULL(ref_data_desc);
ref_data_desc->SetType(DATA);
}
return SUCCESS;
}
Status MultiBatchClonePass::CreateInputNode(const ComputeGraphPtr &graph) {
std::vector<NodePtr> all_data_nodes;
size_t case_input_index = kCaseArgIndex;
NodePtr getnext_node = nullptr;
size_t input_index_of_getnext = 0;
GE_ASSERT_NOTNULL(shape_node_);
std::vector<int32_t> unknown_shape_data_index;
for (size_t i = 0UL; i < all_data_nodes_.size(); ++i, ++case_input_index) {
const auto &node = all_data_nodes_[i];
const OpDescPtr op_desc = OpDescUtils::CopyOpDesc(node->GetOpDesc());
if (op_desc == nullptr) {
REPORT_INNER_ERR_MSG("E19999", "Copy op_desc from op:%s(%s) failed",
node->GetName().c_str(), node->GetType().c_str());
GELOGE(OUT_OF_MEMORY, "[Copy][OpDesc] from op:%s(%s) failed",
node->GetName().c_str(), node->GetType().c_str());
return FAILED;
}
if (GraphUtils::CopyTensorAttrs(op_desc, node) != GRAPH_SUCCESS) {
REPORT_INNER_ERR_MSG("E19999", "Copy tensor attr from op:%s(%s) failed",
node->GetName().c_str(), node->GetType().c_str());
GELOGE(OUT_OF_MEMORY, "[Copy][TensorAttrs] from op:%s(%s) failed",
node->GetName().c_str(), node->GetType().c_str());
return FAILED;
}
op_desc->SetName(node->GetName());
const NodePtr &data = graph->AddNode(op_desc);
GE_CHK_BOOL_EXEC(data != nullptr,
REPORT_INNER_ERR_MSG("E19999", "Add node:%s(%s) to graph:%s failed",
op_desc->GetName().c_str(), op_desc->GetType().c_str(),
graph->GetName().c_str());
return FAILED,
"[Add][Node] %s(%s) to graph:%s failed",
op_desc->GetName().c_str(), op_desc->GetType().c_str(), graph->GetName().c_str());
if (IsGetNextType(node)) {
getnext_node = data;
input_index_of_getnext = case_input_index;
case_input_index = case_input_index + data_count_from_getnext_;
continue;
} else {
int32_t data_index = -1;
GE_ASSERT_TRUE(AttrUtils::GetInt(node->GetOpDesc(), ATTR_NAME_INDEX, data_index));
if (data_index != -1) {
index_to_case_input_.emplace(std::make_pair(data_index, static_cast<int32_t>(i + 1UL)));
}
if (GraphUtils::AddEdge(data->GetOutDataAnchor(0), case_node_->GetInDataAnchor(case_input_index)) !=
GRAPH_SUCCESS) {
REPORT_INNER_ERR_MSG("E19999", "Add edge between op:%s(%s)(index:0) and op:%s(%s)(index:%zu) failed",
data->GetName().c_str(), data->GetType().c_str(),
case_node_->GetName().c_str(), case_node_->GetType().c_str(), case_input_index);
GELOGE(FAILED, "[Add][Edge] between op:%s(%s)(index:0) and op:%s(%s)(index:%zu) failed",
data->GetName().c_str(), data->GetType().c_str(),
case_node_->GetName().c_str(), case_node_->GetType().c_str(), case_input_index);
return FAILED;
}
std::vector<int32_t> unknown_dim_index = multibatch::GetDataNodesUnknownDimIndex(data);
if (!unknown_dim_index.empty()) {
unknown_shape_data_index.emplace_back(data_index);
(void)ge::AttrUtils::SetListInt(data->GetOpDesc(), "_dynamic_batch_unknown_dim_index", unknown_dim_index);
GE_ASSERT_SUCCESS(GraphUtils::AddEdge(data->GetOutControlAnchor(),
shape_node_->GetInControlAnchor()));
}
}
if (SetMaxShape(data) != SUCCESS) {
GELOGE(FAILED, "[Set][MaxShape] of %s failed.", data->GetName().c_str());
return FAILED;
}
all_data_nodes.emplace_back(data);
GE_ASSERT_SUCCESS(NormalizeDataType(node));
}
if (getnext_node != nullptr) {
if (LinkEdgeForGetNext(getnext_node, input_index_of_getnext) != SUCCESS) {
GELOGE(FAILED, "[Link][Edge] for %s failed.", getnext_node->GetName().c_str());
return FAILED;
}
if (SetMaxShape(getnext_node) != SUCCESS) {
GELOGE(FAILED, "[Set][MaxShape] of %s failed.", getnext_node->GetName().c_str());
return FAILED;
}
all_data_nodes.emplace_back(getnext_node);
}
std::sort(unknown_shape_data_index.begin(), unknown_shape_data_index.end());
(void)ge::AttrUtils::SetListInt(shape_node_->GetOpDesc(),
"_dynamic_batch_unknown_data_index", unknown_shape_data_index);
all_data_nodes_.swap(all_data_nodes);
return SUCCESS;
}
Status MultiBatchClonePass::LinkEdgeForGetNext(const NodePtr &getnext_node, size_t &case_input_index) {
GELOGD("Start link edge for %s, which is the %zu input of %s.", getnext_node->GetName().c_str(),
case_input_index, case_node_->GetName().c_str());
for (size_t out_index = 0; out_index < data_count_from_getnext_; ++out_index, ++case_input_index) {
if (GraphUtils::AddEdge(getnext_node->GetOutDataAnchor(out_index),
case_node_->GetInDataAnchor(case_input_index)) != GRAPH_SUCCESS) {
REPORT_INNER_ERR_MSG("E19999", "Add edge between op:%s(%s)(index:%zu) and op:%s(%s)(index:%zu) failed",
getnext_node->GetName().c_str(), getnext_node->GetType().c_str(), out_index,
case_node_->GetName().c_str(), case_node_->GetType().c_str(), case_input_index);
GELOGE(FAILED, "[Add][Edge] between op:%s(%s)(index:%zu) and op:%s(%s)(index:%zu) failed",
getnext_node->GetName().c_str(), getnext_node->GetType().c_str(), out_index,
case_node_->GetName().c_str(), case_node_->GetType().c_str(), case_input_index);
return FAILED;
}
}
if (getnext_sink_dynamic_dims_) {
GE_CHK_STATUS_RET(LinkGetNextToGetDynamicDims(getnext_node, shape_node_), "[Add][Link] for %s failed.",
shape_node_->GetName().c_str());
}
return SUCCESS;
}
Status MultiBatchClonePass::CreateConstNode(const ComputeGraphPtr &graph) {
std::vector<NodePtr> all_const_nodes;
size_t arg_index = kCaseArgIndex + all_data_nodes_.size();
if (data_count_from_getnext_ != 0) {
arg_index = arg_index + data_count_from_getnext_ - kNumOfGetnextNode;
}
for (size_t i = 0; i < all_const_nodes_.size(); ++i) {
const auto &node = all_const_nodes_[i];
const OpDescPtr op_desc = OpDescUtils::CopyOpDesc(node->GetOpDesc());
if (op_desc == nullptr) {
REPORT_INNER_ERR_MSG("E19999", "Copy op_desc from op:%s(%s) failed",
node->GetName().c_str(), node->GetType().c_str());
GELOGE(OUT_OF_MEMORY, "[Copy][OpDesc] from op:%s(%s) failed", node->GetName().c_str(), node->GetType().c_str());
return FAILED;
}
op_desc->SetName(node->GetName());
if (GraphUtils::CopyTensorAttrs(op_desc, node) != GRAPH_SUCCESS) {
REPORT_INNER_ERR_MSG("E19999", "Copy tensor attr from op:%s(%s) failed",
node->GetName().c_str(), node->GetType().c_str());
GELOGE(OUT_OF_MEMORY, "[Copy][TensorAttrs] from op:%s(%s) failed",
node->GetName().c_str(), node->GetType().c_str());
return FAILED;
}
const NodePtr &data = graph->AddNode(op_desc);
GE_CHK_BOOL_EXEC(data != nullptr,
REPORT_INNER_ERR_MSG("E19999", "Add node:%s(%s) to graph:%s failed",
op_desc->GetName().c_str(), op_desc->GetType().c_str(),
graph->GetName().c_str());
return FAILED,
"[Add][Node] %s(%s) to graph:%s failed",
op_desc->GetName().c_str(), op_desc->GetType().c_str(), graph->GetName().c_str());
if (GraphUtils::AddEdge(data->GetOutDataAnchor(0), case_node_->GetInDataAnchor(arg_index + i)) != GRAPH_SUCCESS) {
REPORT_INNER_ERR_MSG("E19999", "Add edge between op:%s(%s)(index:0) and op:%s(%s)(index:%zu) failed",
data->GetName().c_str(), data->GetType().c_str(),
case_node_->GetName().c_str(), case_node_->GetType().c_str(), arg_index + i);
GELOGE(FAILED, "[Add][Edge] between op:%s(%s)(index:0) and op:%s(%s)(index:%zu) failed",
data->GetName().c_str(), data->GetType().c_str(),
case_node_->GetName().c_str(), case_node_->GetType().c_str(), arg_index + i);
return FAILED;
}
all_const_nodes.emplace_back(data);
}
ChangeConstToData();
all_const_nodes_.swap(all_const_nodes);
return SUCCESS;
}
void MultiBatchClonePass::ChangeConstToData() {
size_t data_index = all_data_nodes_.size();
if (data_count_from_getnext_ != 0) {
data_index = data_index + data_count_from_getnext_ - kNumOfGetnextNode;
}
for (size_t i = 0; i < all_const_nodes_.size(); ++i, ++data_index) {
const auto &const_node = all_const_nodes_[i];
bool need_change_type = true;
if (out_control_nodes_.find(const_node) != out_control_nodes_.end()) {
GELOGD("No need to change %s to data type.", const_node->GetName().c_str());
need_change_type = false;
break;
}
if (!need_change_type) {
continue;
}
auto op_desc = const_node->GetOpDesc();
if (op_desc == nullptr) {
continue;
}
ge::OpDescUtilsEx::SetType(op_desc, DATA);
op_desc->AddInferFunc(nullptr);
(void)op_desc->DelAttr(ATTR_NAME_WEIGHTS);
const auto &owner_graph = const_node->GetOwnerComputeGraph();
GE_CHECK_NOTNULL_JUST_RETURN(owner_graph);
(void)owner_graph->AddInputNode(const_node);
(void)op_desc->AddInputDesc(op_desc->GetOutputDesc(kDataOutIndex));
(void)AttrUtils::SetInt(op_desc, ATTR_NAME_INDEX, data_index);
index_to_case_input_.emplace(std::make_pair(static_cast<int32_t>(data_index),
static_cast<int32_t>(data_index + 1UL)));
(void)NodeUtils::AppendInputAnchor(all_const_nodes_[i], 1);
}
}
NodePtr MultiBatchClonePass::AddOutputNodeToGraph(const ComputeGraphPtr &graph) {
const auto &output = all_output_nodes_[0];
const OpDescPtr op_desc = OpDescUtils::CopyOpDesc(output->GetOpDesc());
if (op_desc == nullptr) {
REPORT_INNER_ERR_MSG("E19999", "Copy op_desc from op:%s(%s) failed",
output->GetName().c_str(), output->GetType().c_str());
GELOGE(OUT_OF_MEMORY, "[Copy][OpDesc] from op:%s(%s) failed",
output->GetName().c_str(), output->GetType().c_str());
return nullptr;
}
if (GraphUtils::CopyTensorAttrs(op_desc, output) != GRAPH_SUCCESS) {
REPORT_INNER_ERR_MSG("E19999", "Copy tensor attr from op:%s(%s) failed",
output->GetName().c_str(), output->GetType().c_str());
GELOGE(OUT_OF_MEMORY, "[Copy][TensorAttrs] from op:%s(%s) failed",
output->GetName().c_str(), output->GetType().c_str());
return nullptr;
}
op_desc->SetName(output->GetName());
const auto node = graph->AddNode(op_desc);
if (node == nullptr) {
REPORT_INNER_ERR_MSG("E19999", "Add node:%s to graph:%s failed", op_desc->GetName().c_str(), graph->GetName().c_str());
GELOGE(FAILED, "[Add][Node] Node:%s, graph:%s", op_desc->GetName().c_str(), graph->GetName().c_str());
}
return node;
}
Status MultiBatchClonePass::CreateOutputNode(const ComputeGraphPtr &graph) {
const auto &output = all_output_nodes_[0];
const NodePtr &node = AddOutputNodeToGraph(graph);
GE_CHECK_NOTNULL(node);
for (size_t i = 0; i < case_node_->GetAllOutDataAnchorsSize(); ++i) {
const auto it = direct_output_.find(i);
if (it == direct_output_.end()) {
if (GraphUtils::AddEdge(case_node_->GetOutDataAnchor(i), node->GetInDataAnchor(i)) != GRAPH_SUCCESS) {
REPORT_INNER_ERR_MSG("E19999", "Add edge between op:%s(%s)(index:%zu) and op:%s(%s)(index:%zu) failed",
case_node_->GetName().c_str(), case_node_->GetType().c_str(), i,
node->GetName().c_str(), node->GetType().c_str(), i);
GELOGE(FAILED, "[Add][Edge] between op:%s(%s)(index:%zu) and op:%s(%s)(index:%zu) failed",
case_node_->GetName().c_str(), case_node_->GetType().c_str(), i,
node->GetName().c_str(), node->GetType().c_str(), i);
return FAILED;
}
} else {
const auto data_node = graph->FindNode(it->second);
if (data_node == nullptr) {
REPORT_INNER_ERR_MSG("E19999", "Find node:%s from graph:%s failed", it->second.c_str(), graph->GetName().c_str());
GELOGE(GE_GRAPH_GRAPH_NODE_NULL, "[Check][Param] Data node:%s not found in graph:%s",
it->second.c_str(), graph->GetName().c_str());
return GE_GRAPH_GRAPH_NODE_NULL;
}
if (GraphUtils::AddEdge(data_node->GetOutDataAnchor(kDataOutIndex), node->GetInDataAnchor(i)) != GRAPH_SUCCESS) {
REPORT_INNER_ERR_MSG("E19999", "Add edge between op:%s(%s)(index:%d) and op:%s(%s)(index:%zu) failed",
data_node->GetName().c_str(), data_node->GetType().c_str(), kDataOutIndex,
node->GetName().c_str(), node->GetType().c_str(), i);
GELOGE(FAILED, "[Add][Edge] between op:%s(%s)(index:%d) and op:%s(%s)(index:%zu) failed",
data_node->GetName().c_str(), data_node->GetType().c_str(), kDataOutIndex,
node->GetName().c_str(), node->GetType().c_str(), i);
return FAILED;
}
}
}
GE_CHK_STATUS_RET(LinkGetDynamicDimsToNetOutput(node), "[Add][Edge] between %s and netoutput:%s failed.",
shape_node_->GetName().c_str(), output->GetName().c_str());
(void)GraphUtils::AddEdge(case_node_->GetOutControlAnchor(), node->GetInControlAnchor());
all_output_nodes_.clear();
all_output_nodes_.emplace_back(node);
return SUCCESS;
}
Status MultiBatchClonePass::SetMaxShape(const NodePtr &data) {
GELOGD("Start set max shape for %s.", data->GetName().c_str());
if (!IsGetNextType(data)) {
if (SetMaxShapeToData(data, kDataOutIndex) != SUCCESS) {
GELOGE(PARAM_INVALID, "[Update][MaxShape] of %s failed.", data->GetName().c_str());
return PARAM_INVALID;
}
} else {
for (size_t out_anchor_index = 0; out_anchor_index < data_count_from_getnext_; ++out_anchor_index) {
if (SetMaxShapeToData(data, out_anchor_index) != SUCCESS) {
GELOGE(PARAM_INVALID, "[Update][MaxShape] of %s failed.", data->GetName().c_str());
return PARAM_INVALID;
}
}
}
return SUCCESS;
}
Status MultiBatchClonePass::SetMaxShapeToData(const NodePtr &node, size_t out_anchor_index) {
GELOGD("Start update max shape of %s, %zu output.", node->GetName().c_str(), out_anchor_index);
auto data_shape = NodeUtils::GetOutputDesc(*node, out_anchor_index).GetShape();
std::string data_name = node->GetName();
if (IsGetNextType(node)) {
data_name.append("_").append(std::to_string(out_anchor_index));
}
GELOGD("Update max shape of %s, shape dims is %s.", data_name.c_str(),
ToString(data_shape.GetDims()).c_str());
const auto &dims = data_shape.GetDims();
if (!IsGetNextType(node)) {
if (std::all_of(dims.begin(), dims.end(), [](int64_t val) { return val >= 0; })) {
GELOGD("No need to do anything for static data.");
return SUCCESS;
}
} else {
if (std::all_of(dims.begin(), dims.end(), [](int64_t val) { return val >= 0; })) {
if (getnext_sink_dynamic_dims_) {
GE_CHK_STATUS_RET(UpdateShapeOfShapeNode(node, out_anchor_index),
"[Update][Shape] of shape node:%s failed, out_anchor_index:%zu",
node->GetName().c_str(), out_anchor_index);
}
return SUCCESS;
}
}
(void)AttrUtils::SetListInt(node->GetOpDesc(), ATTR_MBATCH_ORIGIN_INPUT_DIMS, data_shape.GetDims());
if (!AttrUtils::SetStr(node->GetOpDesc(), kMbatchCaseName, case_node_->GetName())) {
REPORT_INNER_ERR_MSG("E19999", "Set Attr:%s to node:%s(%s) failed",
kMbatchCaseName, node->GetName().c_str(), node->GetType().c_str());
GELOGE(INTERNAL_ERROR, "[Set][Attr] %s to node:%s(%s) failed",
kMbatchCaseName, node->GetName().c_str(), node->GetType().c_str());
return INTERNAL_ERROR;
}
GeTensorDesc tensor(NodeUtils::GetOutputDesc(*node, kDataOutIndex));
std::vector<std::string> input_dims_str;
for (size_t i = 0; i < batch_shapes_.size(); ++i) {
auto shape = data_shape;
auto ret = multibatch::CalcShape(data_to_dynamic_info_.at(data_name).at(i), shape);
if (ret != SUCCESS) {
GELOGE(ret, "[Calculate][Shape] for data node %s failed, the shape may not match", node->GetName().c_str());
return ret;
}
tensor.SetShape(shape);
int64_t tensor_size = 0;
(void)TensorUtils::GetTensorSizeInBytes(tensor, tensor_size);
std::string input_str = TypeUtils::FormatToSerialString(tensor.GetFormat()) + ":" +
TypeUtils::DataTypeToSerialString(tensor.GetDataType()) + ":" + node->GetName() + ":" +
std::to_string(tensor_size) + ":" + std::to_string(tensor.GetShape().GetDimNum()) + ":" +
formats::JoinToString(tensor.GetShape().GetDims());
input_dims_str.emplace_back(input_str);
}
(void)AttrUtils::SetListStr(node->GetOpDesc(), "_all_origin_gears_inputs", input_dims_str);
size_t max_shape_index = 0;
int64_t max_size = 0;
for (size_t i = 0; i < batch_shapes_.size(); ++i) {
int64_t size = 1;
for (auto dim : data_to_dynamic_info_.at(data_name).at(i)) {
if (dim == 0) {
continue;
}
if (INT64_MAX / dim < size) {
REPORT_INNER_ERR_MSG("E19999", "The shape %s size will overflow after multi",
ToString(data_to_dynamic_info_.at(data_name).at(i)).c_str());
GELOGE(PARAM_INVALID, "[Check][Param] The shape %s size overflow",
ToString(data_to_dynamic_info_.at(data_name).at(i)).c_str());
return PARAM_INVALID;
}
size *= dim;
}
if (size > max_size) {
max_size = size;
max_shape_index = i;
}
}
return SetShapeToData(data_to_dynamic_info_.at(data_name).at(max_shape_index), node, data_shape, out_anchor_index);
}
Status MultiBatchClonePass::SetShapeToData(const std::vector<int64_t> &shapes, const NodePtr &data, GeShape &data_shape,
size_t out_anchor_index) const {
GELOGD("Start set shape to %zu out of %s.", out_anchor_index, data->GetName().c_str());
if (multibatch::CalcShape(shapes, data_shape) != SUCCESS) {
GELOGE(INTERNAL_ERROR, "[Calculate][Shape] for data node %s failed, the shapes may not match",
data->GetName().c_str());
return INTERNAL_ERROR;
}
if (NodeUtils::UpdateOutputOriginalShapeAndShape(*data, out_anchor_index, data_shape) != GRAPH_SUCCESS) {
REPORT_INNER_ERR_MSG("E19999", "Update output desc shape to op:%s(%s) failed, index:%zu.",
data->GetName().c_str(), data->GetType().c_str(), out_anchor_index);
GELOGE(INTERNAL_ERROR, "[Update][OutputShape] to op:%s(%s) failed, index:%zu",
data->GetName().c_str(), data->GetType().c_str(), out_anchor_index);
return INTERNAL_ERROR;
}
if (!IsGetNextType(data)) {
if (NodeUtils::UpdateInputOriginalShapeAndShape(*data, kDataInIndex, data_shape) != GRAPH_SUCCESS) {
REPORT_INNER_ERR_MSG("E19999", "Update input desc shape to op:%s(%s) failed, index:%u",
data->GetName().c_str(), data->GetType().c_str(), kDataInIndex);
GELOGE(INTERNAL_ERROR, "[Update][InputShape] to op:%s(%s) failed, index:%u",
data->GetName().c_str(), data->GetType().c_str(), kDataInIndex);
return INTERNAL_ERROR;
}
} else {
if (getnext_sink_dynamic_dims_) {
GE_CHK_STATUS_RET(UpdateShapeOfShapeNode(data, out_anchor_index),
"[Update][ShapeOfShapeNode] for %s(%s) failed, index:%zu,",
data->GetName().c_str(), data->GetType().c_str(), out_anchor_index);
}
}
auto input_desc = data->GetOpDesc()->MutableInputDesc(kDataInIndex);
auto output_desc = data->GetOpDesc()->MutableOutputDesc(kDataOutIndex);
if (input_desc != nullptr) {
ge::TensorUtils::SetSize(*input_desc, 0);
}
GE_CHECK_NOTNULL(output_desc);
ge::TensorUtils::SetSize(*output_desc, 0);
GELOGI("Update the data %s input/output shape to the max %s", data->GetName().c_str(),
ToString(data_shape.GetDims()).c_str());
return SUCCESS;
}
Status MultiBatchClonePass::UpdateShapeOfShapeNode(const NodePtr &node, size_t out_anchor_index) const {
GELOGD("Start update output shape of shape node insert by adapter, which is the %zu out of %s.", out_anchor_index,
node->GetName().c_str());
auto data_shape = NodeUtils::GetOutputDesc(*node, out_anchor_index).GetShape();
size_t shape_index = out_anchor_index + (node->GetAllOutDataAnchors().size() / kDivisionConst);
GE_CHECK_NOTNULL(node->GetOpDesc());
GeTensorDesc output_desc = node->GetOpDesc()->GetOutputDesc(shape_index);
std::vector<int64_t> output_dims = {static_cast<int64_t>(data_shape.GetDims().size())};
GeShape output_shape(output_dims);
output_desc.SetShape(output_shape);
output_desc.SetOriginShape(output_shape);
output_desc.SetDataType(DT_INT32);
if (node->GetOpDesc()->UpdateOutputDesc(shape_index, output_desc) != SUCCESS) {
REPORT_INNER_ERR_MSG("E19999", "Update output desc to op:%s(%s) failed, index:%zu.",
node->GetName().c_str(), node->GetType().c_str(), shape_index);
GELOGE(FAILED, "[Update][OutputDesc] to op:%s(%s) failed, index:%zu",
node->GetName().c_str(), node->GetType().c_str(), shape_index);
return FAILED;
}
return SUCCESS;
}
Status MultiBatchClonePass::UpdateSubgraphData(const NodePtr &data, size_t batch_index) {
GE_CHECK_NOTNULL(data->GetOpDesc());
int32_t node_index = -1;
if (!AttrUtils::GetInt(data->GetOpDesc(), ATTR_NAME_INDEX, node_index)) {
REPORT_INNER_ERR_MSG("E19999", "Get Attr:%s from op:%s(%s) failed", ATTR_NAME_INDEX.c_str(),
data->GetName().c_str(), data->GetType().c_str());
GELOGE(FAILED, "[Get][Attr] %s from op:%s(%s) failed", ATTR_NAME_INDEX.c_str(),
data->GetName().c_str(), data->GetType().c_str());
return FAILED;
}
const auto iter = index_to_case_input_.find(node_index);
GE_ASSERT_TRUE(iter != index_to_case_input_.end());
if (!AttrUtils::SetInt(data->GetOpDesc(), ATTR_NAME_PARENT_NODE_INDEX, iter->second)) {
REPORT_INNER_ERR_MSG("E19999", "Set Attr:%s to op:%s(%s) failed", ATTR_NAME_PARENT_NODE_INDEX.c_str(),
data->GetName().c_str(), data->GetType().c_str());
GELOGE(FAILED, "[Set][Attr] %s to op:%s(%s) failed", ATTR_NAME_PARENT_NODE_INDEX.c_str(),
data->GetName().c_str(), data->GetType().c_str());
return FAILED;
}
auto data_shape = NodeUtils::GetOutputDesc(*data, kDataOutIndex).GetShape();
const auto &dims = data_shape.GetDims();
GELOGD("Start update shape of %s , batch index is %zu, dims is %s.", data->GetName().c_str(), batch_index,
ToString(dims).c_str());
if (std::all_of(dims.begin(), dims.end(), [](int64_t val) { return val >= 0; })) {
return SUCCESS;
}
auto output_desc = NodeUtils::GetOutputDesc(*data, kDataOutIndex);
TensorUtils::SetSize(output_desc, 0);
GE_CHK_STATUS_RET(data->GetOpDesc()->UpdateOutputDesc(kDataOutIndex, output_desc),
"[Update] [OutputDesc] Data:%s(%s) output desc update failed.",
data->GetName().c_str(), data->GetType().c_str());
(void)AttrUtils::SetListInt(data->GetOpDesc(), ATTR_MBATCH_ORIGIN_INPUT_DIMS, data_shape.GetDims());
auto data_name = data->GetName();
size_t pos = data_name.find(kMultiBatchNodePostfix);
if (pos == std::string::npos) {
REPORT_INNER_ERR_MSG("E19999", "Cannot find key std::string [%s] of multi-batch in name of virtual input node:%s(%s)",
kMultiBatchNodePostfix.c_str(), data->GetName().c_str(), data->GetType().c_str());
GELOGE(FAILED, "[Check][Param] Cannot find key std::string [%s] of multi-batch in name of virtual input node, "
"node name: %s.", kMultiBatchNodePostfix.c_str(), data_name.c_str());
return FAILED;
}
auto parent_name = data_name.substr(0, pos);
return SetShapeToData(data_to_dynamic_info_.at(parent_name).at(batch_index), data, data_shape, kDataOutIndex);
}
Status MultiBatchClonePass::CreateOriGraph(const ComputeGraphPtr &graph) {
if (data_count_from_getnext_ == 0) {
GELOGD("No need to change original graph without getnext node.");
return SUCCESS;
}
GELOGD("Start change original graph: %s when exit getnext node.", graph->GetName().c_str());
size_t data_index = all_data_nodes_.size() - kNumOfGetnextNode;
for (const auto &node : graph->GetDirectNode()) {
if (IsGetNextType(node)) {
for (size_t out_index = 0; out_index < data_count_from_getnext_; ++out_index, ++data_index) {
auto out_data_anchor = node->GetOutDataAnchor(out_index);
GE_IF_BOOL_EXEC(out_data_anchor == nullptr, continue);
NodePtr data_node = CreateDataNode(graph, out_data_anchor, data_index);
GE_IF_BOOL_EXEC(data_node == nullptr,
REPORT_INNER_ERR_MSG("E19999", "Create data node in graph:%s failed", graph->GetName().c_str());
GELOGE(INTERNAL_ERROR, "[Create][DataNode] in graph:%s failed", graph->GetName().c_str());
return INTERNAL_ERROR);
for (auto &in_anchor : out_data_anchor->GetPeerInDataAnchors()) {
GE_IF_BOOL_EXEC(in_anchor == nullptr, continue);
NodePtr dst_node = in_anchor->GetOwnerNode();
if (GraphUtils::RemoveEdge(out_data_anchor, in_anchor) != GRAPH_SUCCESS) {
REPORT_INNER_ERR_MSG("E19999", "Remove edge between op:%s(%s)(index:%zu) and op:%s(%s)(index:%d) failed",
node->GetName().c_str(), node->GetType().c_str(), out_index,
dst_node->GetName().c_str(), dst_node->GetType().c_str(), in_anchor->GetIdx());
GELOGE(INTERNAL_ERROR, "[Remove][Edge] between op:%s(%s)(index:%zu) and op:%s(%s)(index:%d) failed",
node->GetName().c_str(), node->GetType().c_str(), out_index,
dst_node->GetName().c_str(), dst_node->GetType().c_str(), in_anchor->GetIdx());
return INTERNAL_ERROR;
}
if (GraphUtils::AddEdge(data_node->GetOutDataAnchor(0), dst_node->GetInDataAnchor(in_anchor->GetIdx())) !=
GRAPH_SUCCESS) {
REPORT_INNER_ERR_MSG("E19999", "Add edge between op:%s(%s)(index:0) and op:%s(%s)(index:%d) failed",
data_node->GetName().c_str(), data_node->GetType().c_str(),
dst_node->GetName().c_str(), dst_node->GetType().c_str(), in_anchor->GetIdx());
GELOGE(INTERNAL_ERROR, "[Add][Edge] between op:%s(%s)(index:0) and op:%s(%s)(index:%d) failed",
data_node->GetName().c_str(), data_node->GetType().c_str(),
dst_node->GetName().c_str(), dst_node->GetType().c_str(), in_anchor->GetIdx());
return INTERNAL_ERROR;
}
}
}
if (graph->RemoveNode(node) != GRAPH_SUCCESS) {
REPORT_INNER_ERR_MSG("E19999", "Remove node:%s(%s) from graph:%s failed",
node->GetName().c_str(), node->GetType().c_str(), graph->GetName().c_str());
GELOGE(GRAPH_FAILED, "[Remove][Node] %s(%s) from graph:%s failed",
node->GetName().c_str(), node->GetType().c_str(), graph->GetName().c_str());
return GRAPH_FAILED;
}
break;
}
}
return SUCCESS;
}
NodePtr MultiBatchClonePass::CreateDataNode(const ComputeGraphPtr &graph, const OutDataAnchorPtr &out_data_anchor,
size_t data_index) {
size_t out_anchor_index = out_data_anchor->GetIdx();
std::string node_name = out_data_anchor->GetOwnerNode()->GetName() + "_" + std::to_string(out_anchor_index);
OpDescPtr op_desc = MakeShared<OpDesc>(node_name, DATA);
if (op_desc == nullptr) {
REPORT_INNER_ERR_MSG("E19999", "New OpDesc failed");
GELOGE(OUT_OF_MEMORY, "[New][OpDesc] failed.");
return nullptr;
}
(void)AttrUtils::SetInt(op_desc, ATTR_NAME_INDEX, data_index);
index_to_case_input_.emplace(std::make_pair(static_cast<int32_t>(data_index),
static_cast<int32_t>(data_index + 1UL)));
OpDescPtr getnext_op_desc = out_data_anchor->GetOwnerNode()->GetOpDesc();
if (getnext_op_desc == nullptr) {
REPORT_INNER_ERR_MSG("E19999", "Param out_data_anchor's owner node is nullptr, check invalid");
GELOGE(OUT_OF_MEMORY, "[Get][OpDesc] failed, Param out_data_anchor's owner node is nullptr.");
return nullptr;
}
if (op_desc->AddInputDesc(getnext_op_desc->GetOutputDesc(out_anchor_index)) != GRAPH_SUCCESS) {
REPORT_INNER_ERR_MSG("E19999", "Add input desc to op:%s(%s) failed",
op_desc->GetName().c_str(), op_desc->GetType().c_str());
GELOGE(INTERNAL_ERROR, "[Add][InputDesc] to op:%s(%s) failed",
op_desc->GetName().c_str(), op_desc->GetType().c_str());
return nullptr;
}
if (op_desc->AddOutputDesc(getnext_op_desc->GetOutputDesc(out_anchor_index)) != GRAPH_SUCCESS) {
REPORT_INNER_ERR_MSG("E19999", "Add output desc to op:%s(%s) failed",
getnext_op_desc->GetName().c_str(), getnext_op_desc->GetType().c_str());
GELOGE(INTERNAL_ERROR, "[Add][OutputDesc] to op:%s(%s) failed",
getnext_op_desc->GetName().c_str(), getnext_op_desc->GetType().c_str());
return nullptr;
}
NodePtr data_node = graph->AddNode(op_desc);
GE_ASSERT_NOTNULL(data_node);
GELOGD("Success create %s node.", data_node->GetName().c_str());
return data_node;
}
void MultiBatchClonePass::RenameAndAddRecursiveSubgraphs(const ComputeGraphPtr &graph,
const ComputeGraphPtr &batch_graph,
const std::string &suffix) {
GELOGI("Add subgraph[%s] to root graph[%s]", batch_graph->GetName().c_str(), graph->GetName().c_str());
batch_graph->SetParentGraph(graph);
(void)graph->AddSubgraph(batch_graph->GetName(), batch_graph);
std::unordered_set<NodePtr> visited;
for (const auto &subgraph : batch_graph->GetAllSubgraphs()) {
const auto parent_node = subgraph->GetParentNode();
if ((parent_node == nullptr) || (parent_node->GetOpDesc() == nullptr)) {
continue;
}
if (visited.insert(parent_node).second) {
const auto &subgraph_names = parent_node->GetOpDesc()->GetSubgraphInstanceNames();
const auto subgraph_num = static_cast<uint32_t>(subgraph_names.size());
for (uint32_t i = 0; i < subgraph_num; ++i) {
const auto new_inst_name = subgraph_names[i] + suffix;
(void)parent_node->GetOpDesc()->SetSubgraphInstanceName(i, new_inst_name);
GELOGI("Rename instance name[%s] for node[%s], subgraph index[%u].",
new_inst_name.c_str(), parent_node->GetName().c_str(), i);
}
}
(void)batch_graph->RemoveSubgraph(subgraph);
subgraph->SetName(subgraph->GetName() + suffix);
(void)graph->AddSubgraph(subgraph->GetName(), subgraph);
GELOGI("Add subgraph[%s] to root graph[%s], parent node[%s].",
subgraph->GetName().c_str(), graph->GetName().c_str(), parent_node->GetName().c_str());
}
}
Status MultiBatchClonePass::AddBatchSubgraph(const ComputeGraphPtr &graph,
const ComputeGraphPtr &batch_graph, const size_t batch_idx) {
GE_CHECK_NOTNULL(batch_graph);
batch_graph->SetName("Batch_" + std::to_string(batch_idx));
const std::string suffix = kMultiBatchNodePostfix + std::to_string(batch_idx);
for (const auto &node : batch_graph->GetAllNodes()) {
const auto &node_op_desc = node->GetOpDesc();
GE_CHECK_NOTNULL(node_op_desc);
const std::string new_name = node->GetName() + suffix;
if (node->GetType() == VARIABLE) {
GE_ASSERT_NOTNULL(VarManager::Instance(session_id_));
VarManager::Instance(session_id_)->SetBatchVariablesKeyName(new_name, node->GetName());
}
node_op_desc->SetName(new_name);
if ((node->GetType() == DATA) && (node->GetOwnerComputeGraph() == batch_graph)) {
const auto ret = UpdateSubgraphData(node, batch_idx);
if (ret != SUCCESS) {
GELOGE(INTERNAL_ERROR, "[Update][SubgraphData] Subgraph:%s, node:%s, batch index:%zu",
batch_graph->GetName().c_str(), node->GetName().c_str(), batch_idx);
return INTERNAL_ERROR;
}
}
}
const auto &case_op_desc = case_node_->GetOpDesc();
GE_CHECK_NOTNULL(case_op_desc);
const std::string key_name = "branches" + std::to_string(batch_idx);
(void)case_op_desc->AddSubgraphName(key_name);
(void)case_op_desc->SetSubgraphInstanceName(batch_idx, batch_graph->GetName());
batch_graph->SetParentNode(case_node_);
RenameAndAddRecursiveSubgraphs(graph, batch_graph, suffix);
all_branch_output_[batch_graph] = batch_graph->FindFirstNodeMatchType(NETOUTPUT);
return SUCCESS;
}
Status MultiBatchClonePass::CreateSubgraphs(const ComputeGraphPtr &graph, const ComputeGraphPtr &branch) {
GELOGI("Start create subgraphs for %s.", graph->GetName().c_str());
for (size_t i = 0; i < batch_shapes_.size(); ++i) {
ComputeGraphPtr batch_graph = nullptr;
if (i != (batch_shapes_.size() - 1)) {
batch_graph = MakeShared<ComputeGraph>(branch->GetName());
GE_CHECK_NOTNULL(batch_graph);
const auto graph_ret = GraphUtils::CopyComputeGraph(branch, batch_graph);
if (graph_ret != GRAPH_SUCCESS) {
GELOGE(FAILED, "[Copy][ComputeGraph] origin graph:%s, batch index:%zu", branch->GetName().c_str(), i);
return FAILED;
}
} else {
batch_graph = branch;
}
const auto ret = AddBatchSubgraph(graph, batch_graph, i);
if (ret != SUCCESS) {
GELOGE(ret, "[Add][BatchSubgraph] origin graph:%s, batch index:%zu", branch->GetName().c_str(), i);
return ret;
}
GELOGI("Add batch graph[%s] to graph[%s], batch index:%zu.",
batch_graph->GetName().c_str(), graph->GetName().c_str(), i);
}
return SUCCESS;
}
Status MultiBatchClonePass::UpdateSubgraphOutput() {
for (const auto &item : all_branch_output_) {
const auto &output_node = item.second;
const auto &op_desc = output_node->GetOpDesc();
GE_CHECK_NOTNULL(op_desc);
for (size_t index = 0; index < op_desc->GetInputsSize(); ++index) {
GeTensorDescPtr tensor = op_desc->MutableInputDesc(index);
GE_CHECK_NOTNULL(tensor);
if (!AttrUtils::SetInt(tensor, ATTR_NAME_PARENT_NODE_INDEX, index)) {
REPORT_INNER_ERR_MSG("E19999", "Set Attr:%s to input:%zu tensor of op:%s(%s) failed",
ATTR_NAME_PARENT_NODE_INDEX.c_str(), index,
op_desc->GetName().c_str(), op_desc->GetType().c_str());
GELOGE(FAILED, "[Set][Attr] %s to input:%zu tensor of op:%s(%s) failed",
ATTR_NAME_PARENT_NODE_INDEX.c_str(), index,
op_desc->GetName().c_str(), op_desc->GetType().c_str());
return FAILED;
}
}
}
return SUCCESS;
}
Status MultiBatchClonePass::PruneDirectOutput(const ComputeGraphPtr &graph) {
GELOGD("Start prune direct output.");
const auto &func_desc = case_node_->GetOpDesc();
uint32_t unused_num = 0;
uint32_t output_num = func_desc->GetOutputsSize();
for (size_t i = 0; i < output_num; ++i) {
bool is_unused_tensor = true;
for (const auto &item : all_branch_output_) {
const auto &netoutput = item.second;
GE_CHECK_NOTNULL(netoutput);
const auto in_anchor = netoutput->GetInDataAnchor(i);
GE_ASSERT_NOTNULL(in_anchor);
if (in_anchor->GetPeerOutAnchor() != nullptr) {
is_unused_tensor = false;
break;
}
}
if (is_unused_tensor) {
unused_num++;
continue;
}
GE_CHK_STATUS_RET(UpdateOutputTensor(i, unused_num),
"[Update][OutputTensor] in graph:%s failed, parent_index:%zu, unused_num:%u",
graph->GetName().c_str(), i, unused_num);
}
if (unused_num == 0) {
return SUCCESS;
}
GE_CHK_GRAPH_STATUS_RET(NodeUtils::RemoveOutputAnchor(case_node_, output_num - unused_num),
"[Remove][OutputAnchor] for node:%s failed", case_node_->GetName().c_str());
for (const auto &item : all_branch_output_) {
GE_CHK_GRAPH_STATUS_RET(NodeUtils::RemoveInputAnchor(item.second, output_num - unused_num),
"[Remove][InputAnchor] for node:%s failed", item.second->GetName().c_str());
}
return SUCCESS;
}
Status MultiBatchClonePass::UpdateOutputTensor(uint32_t parent_index, uint32_t unused_num) {
if (unused_num == 0) {
GELOGD("No need to update output tensor.");
return SUCCESS;
}
uint32_t update_index = parent_index - unused_num;
for (const auto &item : all_branch_output_) {
const auto &node = item.second;
const auto &new_anchor = node->GetInDataAnchor(update_index);
GE_ASSERT_NOTNULL(new_anchor);
const auto &old_anchor = node->GetInDataAnchor(parent_index);
GE_ASSERT_NOTNULL(old_anchor);
const auto &out_anchor = old_anchor->GetPeerOutAnchor();
GE_ASSERT_NOTNULL(out_anchor);
const auto &out_node = out_anchor->GetOwnerNode();
GE_ASSERT_NOTNULL(out_node);
const auto &op_desc = node->GetOpDesc();
(void)op_desc->UpdateInputDesc(update_index, op_desc->GetInputDesc(parent_index));
GE_CHK_GRAPH_STATUS_RET(GraphUtils::AddEdge(out_anchor, new_anchor),
"[Add][Edge] between %s(index:%d) and %s(index:%u) failed",
out_node->GetName().c_str(), out_anchor->GetIdx(),
new_anchor->GetOwnerNode()->GetName().c_str(), update_index);
GELOGI("Add edge success, func node: %s, node: %s, parent index: %u, update index: %u",
case_node_->GetName().c_str(), out_node->GetName().c_str(), parent_index, update_index);
GE_CHK_GRAPH_STATUS_RET(GraphUtils::RemoveEdge(out_anchor, old_anchor),
"[Remove][Edge] between %s(index:%d) and %s(index:%u) failed",
out_node->GetName().c_str(), out_anchor->GetIdx(),
old_anchor->GetOwnerNode()->GetName().c_str(), parent_index);
GELOGI("Remove edge success, func node: %s, node: %s", case_node_->GetName().c_str(), out_node->GetName().c_str());
}
const auto &new_anchor = case_node_->GetOutDataAnchor(update_index);
const auto &old_anchor = case_node_->GetOutDataAnchor(parent_index);
GE_ASSERT_NOTNULL(old_anchor);
for (const auto &in_anchor : old_anchor->GetPeerInDataAnchors()) {
const auto &in_node = in_anchor->GetOwnerNode();
GE_CHK_GRAPH_STATUS_RET(GraphUtils::RemoveEdge(old_anchor, in_anchor),
"[Remove][Edge] between %s(index:%u) and %s(index:%d) failed",
case_node_->GetName().c_str(), parent_index,
in_node->GetName().c_str(), in_anchor->GetIdx());
GELOGI("Remove edge success, func node: %s, node: %s", case_node_->GetName().c_str(), in_node->GetName().c_str());
GE_CHK_GRAPH_STATUS_RET(GraphUtils::AddEdge(new_anchor, in_anchor),
"[Add][Edge] between %s(index:%u) and %s(index:%d) failed",
case_node_->GetName().c_str(), update_index,
in_node->GetName().c_str(), in_anchor->GetIdx());
GELOGI("Add edge success, func node: %s, node: %s, parent index: %u, update index: %u",
case_node_->GetName().c_str(), in_node->GetName().c_str(), parent_index, update_index);
}
return SUCCESS;
}
REG_PASS_OPTION("MultiBatchClonePass").LEVELS(OoLevel::kO1);
}