diff --git a/ge/graph/manager/graph_manager.cc b/ge/graph/manager/graph_manager.cc index 030b864e..1aee79a4 100755 --- a/ge/graph/manager/graph_manager.cc +++ b/ge/graph/manager/graph_manager.cc @@ -687,7 +687,7 @@ Status GraphManager::PreRunOptimizeOriginalGraph(const GraphNodePtr &graph_node, CompilerStages &stages = GetCompilerStages(graph_node->GetGraphId()); GM_RUN_AND_DUMP_PERF("OptimizeGraphPrepare", stages.optimizer.OptimizeOriginalGraphForQuantize, compute_graph); GM_RUN_AND_DUMP_PERF("HandleSummaryOp", stages.optimizer.HandleSummaryOp, compute_graph); - GM_RUN_AND_DUMP_PERF("Prepare", stages.preparer.PrepareDynShape, graph_node->GetGraph(), inputs, compute_graph, + GM_RUN_AND_DUMP_PERF("Prepare", stages.preparer.PrepareDynShape, graph_node, inputs, compute_graph, session_id); GM_RUN_AND_DUMP_PERF("OptimizeOriginalGraph", stages.optimizer.OptimizeOriginalGraph, compute_graph); @@ -1173,7 +1173,7 @@ Status GraphManager::BuildGraphForUnregisteredOp(const GraphId &graph_id, const auto compute_graph = GraphUtils::GetComputeGraph(*graph_node->GetGraph()); GE_CHECK_NOTNULL(compute_graph); - GM_RUN_AND_DUMP_PERF("Prepare", GetCompilerStages(graph_id).preparer.PrepareDynShape, graph_node->GetGraph(), inputs, + GM_RUN_AND_DUMP_PERF("Prepare", GetCompilerStages(graph_id).preparer.PrepareDynShape, graph_node, inputs, compute_graph, session_id); for (auto &node : compute_graph->GetAllNodes()) { diff --git a/ge/graph/preprocess/graph_preprocess.cc b/ge/graph/preprocess/graph_preprocess.cc index 32f877cf..3f4c7f16 100644 --- a/ge/graph/preprocess/graph_preprocess.cc +++ b/ge/graph/preprocess/graph_preprocess.cc @@ -898,6 +898,117 @@ Status ProcessNetoutputNodeDynShape(NodePtr &node) { } return SUCCESS; } +/** + * Parser shape_range from string to vector + * shape_range from option normally is "[1~20],[3],[3~6],[-1]" + * @param shape_range + */ +void ParseDynamicInputShapeRange(const std::string &shape_range, + std::vector>> &range) { + if (shape_range.empty() || shape_range.size() < 2) { + GELOGW("Shape range %s is invalid.", shape_range); + return; + } + // different parameter sets are split by ';' + vector shape_set = ge::StringUtils::Split(shape_range, ']'); + if (shape_set.empty()) { + return; + } + for (auto shape_str : shape_set) { + if (shape_str.empty()) { + continue; + } + if (ge::StringUtils::StartWith(shape_str, "[")) { + shape_str = shape_str.substr(1, shape_str.size()); + } + if (ge::StringUtils::StartWith(shape_str, ",")) { + shape_str = shape_str.substr(2, shape_str.size()); + } + std::vector> range_of_single; + vector range_set = ge::StringUtils::Split(shape_str, ','); + for (auto range_str : range_set) { + vector pair_set = ge::StringUtils::Split(range_str, '~'); + pair range_pair; + if (pair_set.size() == 1) { + auto range_value = atoi(pair_set.at(0).c_str()); + if (range_value < 0) { + range_pair = std::make_pair(1, range_value); + } else { + range_pair = std::make_pair(range_value, range_value); + } + } else if (pair_set.size() == 2) { + auto range_left = atoi(pair_set.at(0).c_str()); + auto range_right = atoi(pair_set.at(1).c_str()); + range_pair = std::make_pair(range_left, range_right); + } + range_of_single.emplace_back(range_pair); + } + range.emplace_back(range_of_single); + } +} + +Status GetDynamicInputShapeRange(const std::vector &user_input, const std::map &graph_option, + vector>> &range_vec) { + auto mode_iter = graph_option.find(OPTION_EXEC_DYNAMIC_EXECUTE_MODE); + if (mode_iter == graph_option.end()) { + GELOGD("Graph Option: Can not find %s option in graph options.", OPTION_EXEC_DYNAMIC_EXECUTE_MODE); + return SUCCESS; + } + GELOGD("Graph Option: dynamic_input_mode value is %s.", mode_iter->second.c_str()); + if (mode_iter->second != "dynamic_execute") { + return SUCCESS; + } + auto iter = graph_option.find(OPTION_EXEC_DATA_INPUTS_SHAPE_RANGE); + if (iter == graph_option.end()) { + GELOGE(PARAM_INVALID, "Graph option %s is required when %s is dynamic_execute", OPTION_EXEC_DATA_INPUTS_SHAPE_RANGE, + OPTION_EXEC_DYNAMIC_EXECUTE_MODE); + return PARAM_INVALID; + } + GELOGD("GraphOption: dynamic_inputs_shape_range value is %s.", iter->second.c_str()); + ParseDynamicInputShapeRange(iter->second, range_vec); + if (range_vec.size() != user_input.size()) { + GELOGE(PARAM_INVALID, "Dynamic input shape range size is %zu, inputs size is %zu. Not match.", range_vec.size(), + user_input.size()); + return PARAM_INVALID; + } + return SUCCESS; +} + +Status UpdateDynamicInputShapeRange(const ge::GeAttrValue::INT index, + const ector>> &range_vec, OpDescPtr &op, + GeTensorDesc &desc) { + auto unkown_shape = desc.GetShape(); + auto shape_range = range_vec.at(index); + for (size_t i = 0; i < unkown_shape.GetDimNum(); ++i) { + if (shape_range.at(i).first == shape_range.at(i).second) { + unkown_shape.SetDim(i, shape_range.at(i).first); + } else { + unkown_shape.SetDim(i, -1); + } + } + desc.SetShape(unkown_shape); + desc.SetShapeRange(shape_range); + int64_t dynamic_shape_size = 1; + for (const auto range_pair : range_vec.at(index)) { + FMK_INT64_MULCHECK(dynamic_shape_size, range_pair.second); + dynamic_shape_size *= range_pair.second; + } + auto data_type_size = GetSizeByDataType(desc.GetDataType()); + if (data_type_size < 0) { + GELOGE(PARAM_INVALID, "Input data type is %s, is not supported.", + TypeUtils::DataTypeToSerialString(desc.GetDataType()).c_str()); + return PARAM_INVALID; + } + FMK_INT64_MULCHECK(dynamic_shape_size, data_type_size); + dynamic_shape_size *= data_type_size; + GELOGI("In dynamic_execute mode ,set input %s shape range size %ld", op->GetName().c_str(), dynamic_shape_size); + ge::TensorUtils::SetSize(desc, dynamic_shape_size); + graphStatus graph_ret = op->UpdateInputDesc(0, desc); + GE_CHK_STATUS_RET(graph_ret, "UpdateInputDesc fail, graph ret: %u", graph_ret); + graph_ret = op->UpdateOutputDesc(0, desc); + GE_CHK_STATUS_RET(graph_ret, "UpdateInputDesc fail, graph ret: %u", graph_ret); + return SUCCESS; +} } // namespace GraphPrepare::GraphPrepare() : compute_graph_(nullptr) {} @@ -1102,7 +1213,11 @@ Status GraphPrepare::AdjustDataOpOutput(const NodePtr &node) { return SUCCESS; } -Status GraphPrepare::UpdateInput(const std::vector &user_input) { +Status GraphPrepare::UpdateInput(const std::vector &user_input, const std::map &graph_option) { + // Get shape range of input in dynamic_execute mode + vector>> dynamic_shape_range_vec; + auto ret = GetDynamicInputShapeRange(user_input, graph_option, dynamic_shape_range_vec); + GE_CHK_STATUS_RET(ret, "Graph option is not right on Dynamic execute mode."); compute_graph_->SaveDataFormat(ge::TypeUtils::DomiFormatToFormat(GetLocalOmgContext().format)); for (NodePtr &input_node : compute_graph_->GetDirectNode()) { GE_CHECK_NOTNULL(input_node); @@ -1185,6 +1300,12 @@ Status GraphPrepare::UpdateInput(const std::vector &user_input) { return graph_ret; } + if (!dynamic_shape_range_vec.empty()) { + ret = UpdateDynamicInputShapeRange(index, dynamic_shape_range_vec, op, desc); + GE_CHK_STATUS_RET(ret, "Fail to update dynamic input shape range on %s.", op->GetName().c_str()); + continue; + } + if (!options_.train_graph_flag) { Status ret = AdjustDataOpOutput(input_node); GE_IF_BOOL_EXEC(ret != SUCCESS, GELOGE(ret, "AdjustDataOpOutput fail, ret:%u", ret); return ret); @@ -1358,17 +1479,17 @@ Status GraphPrepare::SaveOriginalGraphToOmModel() { GELOGI("Prepare %s on graph %s success.", name, compute_graph->GetName().c_str()); \ } while (0) -Status GraphPrepare::PrepareDynShape(ConstGraphPtr graph, const std::vector &user_input, +Status GraphPrepare::PrepareDynShape(const GraphNodePtr &graph_node, const std::vector &user_input, ge::ComputeGraphPtr &compute_graph, uint64_t session_id) { - GE_CHECK_NOTNULL(graph); + GE_CHECK_NOTNULL(graph_node->GetGraph()); GE_CHECK_NOTNULL(compute_graph); GetLocalOmgContext().type = static_cast(options_.framework_type); - const Graph &const_graph = *graph; + const Graph &const_graph = *graph_node->GetGraph(); PP_RUN("Init", Init, const_graph, session_id); PP_RUN("SetRtContext", SetRtContext, rtContext_t(), RT_CTX_GEN_MODE); - PP_RUN_AND_DUMP("CheckAndUpdateInput", CheckAndUpdateInput, user_input); + PP_RUN_AND_DUMP("CheckAndUpdateInput", CheckAndUpdateInput, user_input, graph_node->GetGraph()); PP_RUN_AND_DUMP("GraphEquivalentTransformation", GraphEquivalentTransformation); PP_RUN_AND_DUMP("ProcessOutput", ProcessNetOutput); PP_RUN_AND_DUMP("ProcessMultiBatch", multibatch::ProcessMultiBatch, compute_graph_); @@ -1831,7 +1952,7 @@ Status GraphPrepare::ProcessNetOutput() { return SUCCESS; } -Status GraphPrepare::CheckAndUpdateInput(const std::vector &user_input) { +Status GraphPrepare::CheckAndUpdateInput(const std::vector &user_input,const std::map &graph_option) { compute_graph_->SetInputSize(user_input.size()); if (user_input.empty()) { return SUCCESS; @@ -1843,7 +1964,7 @@ Status GraphPrepare::CheckAndUpdateInput(const std::vector &user_input return ret; } - ret = UpdateInput(user_input); + ret = UpdateInput(user_input, graph_option); if (ret != SUCCESS) { GELOGE(ret, "UpdateInput fail, ret:%u", ret); return ret; diff --git a/ge/graph/preprocess/graph_preprocess.h b/ge/graph/preprocess/graph_preprocess.h index a3bbf433..de755418 100755 --- a/ge/graph/preprocess/graph_preprocess.h +++ b/ge/graph/preprocess/graph_preprocess.h @@ -45,7 +45,7 @@ class GraphPrepare { virtual ~GraphPrepare(); GraphPrepare(const GraphPrepare &in) = delete; GraphPrepare &operator=(const GraphPrepare &in) = delete; - Status PrepareDynShape(ConstGraphPtr graph, + Status PrepareDynShape(const GraphNodePtr &graph_node, const std::vector &user_input, ge::ComputeGraphPtr &compute_graph, uint64_t session_id = 0); @@ -63,8 +63,8 @@ class GraphPrepare { Status CheckRefOp(); Status SetRtContext(rtContext_t rt_context, rtCtxMode_t mode); Status AdjustDataOpOutput(const NodePtr &node); - Status UpdateInput(const std::vector &user_input); - Status CheckAndUpdateInput(const std::vector &user_input); + Status UpdateInput(const std::vector &user_input, const std::map &graph_option); + Status CheckAndUpdateInput(const std::vector &user_input, const std::map &graph_option); Status CheckConstOp(); Status VerifyConstOp(const NodePtr &node); Status CheckUserInput(const std::vector &user_input); diff --git a/inc/external/ge/ge_api_types.h b/inc/external/ge/ge_api_types.h index d0f2105f..250252f9 100644 --- a/inc/external/ge/ge_api_types.h +++ b/inc/external/ge/ge_api_types.h @@ -61,6 +61,11 @@ const char *const OPTION_EXEC_HCCL_FLAG = "ge.exec.hcclFlag"; const char *const OPTION_EXEC_ATOMIC_FLAG = "ge.exec.enable_atomic"; const char *const OPTION_EXEC_DISABLE_REUSED_MEMORY = "ge.exec.disableReuseMemory"; const char *const OPTION_EXEC_ENABLE_TAILING_OPTIMIZATION = "ge.exec.isTailingOptimization"; +// Dynamic input flag. ge.exec.dynamicInput=1, means enable dynaimc input, +// ge.exec.dynamicGraphExecuteMode, dynamic_execute[default] +const char *const OPTION_EXEC_DYNAMIC_INPUT = "ge.exec.dynamicInput"; +const char *const OPTION_EXEC_DYNAMIC_EXECUTE_MODE = "ge.exec.dynamicGraphExecuteMode"; +const char *const OPTION_EXEC_DATA_INPUTS_SHAPE_RANGE = "ge.exec.dataInputsShapeRange"; // Option key: memory init const char *const GRAPH_MEMORY_MAX_SIZE = "ge.graphMemoryMaxSize";