Browse Source

Merge branch 'development' of https://gitee.com/mindspore/graphengine into review_control_passes

pull/449/head
chenyemeng 4 years ago
parent
commit
381254639c
100 changed files with 1945 additions and 1000 deletions
  1. +14
    -1
      CMakeLists.txt
  2. +20
    -17
      build.sh
  3. +60
    -0
      cmake/external_libs/gtest.cmake
  4. +9
    -9
      cmake/external_libs/json.cmake
  5. +11
    -8
      cmake/external_libs/protobuf_shared.cmake
  6. +11
    -7
      cmake/external_libs/protobuf_static.cmake
  7. +10
    -7
      cmake/external_libs/protoc.cmake
  8. +1
    -1
      ge/common/CMakeLists.txt
  9. +10
    -10
      ge/common/helper/model_helper.cc
  10. +2
    -2
      ge/common/helper/om_file_helper.cc
  11. +3
    -3
      ge/common/model_parser/base.cc
  12. +1
    -0
      ge/common/types.cc
  13. +19
    -1
      ge/generator/ge_generator.cc
  14. +3
    -1
      ge/graph/build/graph_builder.cc
  15. +1
    -1
      ge/graph/build/stream_allocator.cc
  16. +2
    -1
      ge/graph/load/new_model_manager/davinci_model.cc
  17. +4
    -4
      ge/graph/load/new_model_manager/model_manager.cc
  18. +1
    -1
      ge/graph/load/new_model_manager/task_info/hccl_task_info.cc
  19. +12
    -43
      ge/graph/manager/graph_manager.cc
  20. +0
    -2
      ge/graph/manager/graph_manager.h
  21. +2
    -2
      ge/graph/manager/util/hcom_util.cc
  22. +1
    -1
      ge/graph/optimize/mem_rw_conflict_optimize.cc
  23. +10
    -3
      ge/graph/passes/mark_agnostic_pass.cc
  24. +1
    -1
      ge/graph/passes/switch_data_edges_bypass.cc
  25. +5
    -0
      ge/graph/preprocess/multi_batch_options.cc
  26. +6
    -0
      ge/hybrid/common/npu_memory_allocator.cc
  27. +1
    -0
      ge/hybrid/common/tensor_value.cc
  28. +4
    -4
      ge/hybrid/executor/hybrid_model_async_executor.cc
  29. +26
    -20
      ge/hybrid/executor/node_state.cc
  30. +3
    -3
      ge/hybrid/executor/node_state.h
  31. +6
    -6
      ge/hybrid/executor/worker/execution_engine.cc
  32. +7
    -4
      ge/hybrid/executor/worker/shape_inference_engine.cc
  33. +2
    -2
      ge/hybrid/model/graph_item.cc
  34. +2
    -2
      ge/hybrid/model/hybrid_model.cc
  35. +54
    -47
      ge/hybrid/model/hybrid_model_builder.cc
  36. +1
    -0
      ge/hybrid/model/hybrid_model_builder.h
  37. +95
    -19
      ge/hybrid/model/node_item.cc
  38. +28
    -12
      ge/hybrid/model/node_item.h
  39. +4
    -8
      ge/hybrid/node_executor/aicore/aicore_node_executor.cc
  40. +6
    -3
      ge/hybrid/node_executor/aicpu/aicpu_ext_info.cc
  41. +39
    -40
      ge/hybrid/node_executor/aicpu/aicpu_node_executor.cc
  42. +12
    -16
      ge/hybrid/node_executor/compiledsubgraph/known_node_executor.cc
  43. +5
    -2
      ge/hybrid/node_executor/controlop/control_op_executor.cc
  44. +9
    -6
      ge/hybrid/node_executor/hccl/hccl_node_executor.cc
  45. +5
    -5
      ge/hybrid/node_executor/host_cpu/host_cpu_node_executor.cc
  46. +15
    -11
      ge/hybrid/node_executor/node_executor.cc
  47. +10
    -10
      ge/hybrid/node_executor/task_context.cc
  48. +4
    -4
      ge/hybrid/node_executor/task_context.h
  49. +6
    -1
      ge/ir_build/atc_ir_common.cc
  50. +7
    -1
      ge/ir_build/ge_ir_build.cc
  51. +4
    -4
      ge/session/omg.cc
  52. +2
    -1
      ge/single_op/task/aicpu_task_builder.cc
  53. +1
    -1
      ge/single_op/task/op_task.cc
  54. +1
    -0
      ge/single_op/task/op_task.h
  55. +0
    -3
      inc/external/ge/ge_api_error_codes.h
  56. +0
    -3
      inc/external/ge/ge_error_codes.h
  57. +1
    -0
      inc/framework/common/types.h
  58. +1
    -1
      metadef
  59. +1
    -1
      parser
  60. +1
    -0
      tests/CMakeLists.txt
  61. +67
    -43
      tests/depends/cce/CMakeLists.txt
  62. +34
    -0
      tests/depends/error_manager/CMakeLists.txt
  63. +85
    -0
      tests/depends/error_manager/src/error_manager_stub.cc
  64. +8
    -4
      tests/depends/hccl/CMakeLists.txt
  65. +9
    -9
      tests/depends/hccl/src/hccl_stub.cc
  66. +14
    -6
      tests/depends/mmpa/CMakeLists.txt
  67. +55
    -0
      tests/depends/mmpa/src/mmpa_stub.cc
  68. +31
    -17
      tests/depends/omg/CMakeLists.txt
  69. +3
    -1
      tests/depends/omg/src/omg_stub.cc
  70. +7
    -3
      tests/depends/profiler/CMakeLists.txt
  71. +8
    -3
      tests/depends/runtime/CMakeLists.txt
  72. +78
    -1
      tests/depends/runtime/src/runtime_stub.cc
  73. +6
    -3
      tests/depends/slog/CMakeLists.txt
  74. +2
    -0
      tests/depends/slog/src/slog_stub.cc
  75. +73
    -51
      tests/ut/common/graph/CMakeLists.txt
  76. +16
    -16
      tests/ut/common/graph/testcase/ge_graph/ge_format_refiner_unittest.cc
  77. +55
    -55
      tests/ut/common/graph/testcase/ge_graph/ge_model_serialize_unittest.cc
  78. +2
    -1
      tests/ut/common/graph/testcase/ge_graph/ge_node_unittest.cc
  79. +667
    -354
      tests/ut/ge/CMakeLists.txt
  80. +3
    -1
      tests/ut/ge/common/datatype_transfer_unittest.cc
  81. +4
    -3
      tests/ut/ge/common/format_transfer_5d_nchw_unittest.cc
  82. +5
    -2
      tests/ut/ge/common/format_transfer_5d_nhwc_unittest.cc
  83. +5
    -2
      tests/ut/ge/common/format_transfer_c1hwncoc0_hwcn_unittest.cc
  84. +18
    -10
      tests/ut/ge/common/format_transfer_fractal_nz_unittest.cc
  85. +6
    -2
      tests/ut/ge/common/format_transfer_fractal_zz_unittest.cc
  86. +4
    -1
      tests/ut/ge/common/format_transfer_fracz_hwcn_unittest.cc
  87. +5
    -2
      tests/ut/ge/common/format_transfer_fracz_nchw_unittest.cc
  88. +5
    -2
      tests/ut/ge/common/format_transfer_fracz_nhwc_unittest.cc
  89. +5
    -2
      tests/ut/ge/common/format_transfer_hwcn_c1hwncoc0_unittest.cc
  90. +5
    -2
      tests/ut/ge/common/format_transfer_hwcn_fractalz_unittest.cc
  91. +4
    -1
      tests/ut/ge/common/format_transfer_nchw_5d_unittest.cc
  92. +5
    -2
      tests/ut/ge/common/format_transfer_nchw_fractalz_unittest.cc
  93. +7
    -2
      tests/ut/ge/common/format_transfer_nhwc_5d_unittest.cc
  94. +5
    -2
      tests/ut/ge/common/format_transfer_nhwc_fractalz_unittest.cc
  95. +3
    -1
      tests/ut/ge/common/format_transfer_transpose_unittest.cc
  96. +6
    -2
      tests/ut/ge/common/format_transfer_unittest.cc
  97. +30
    -18
      tests/ut/ge/graph/build/logical_stream_allocator_unittest.cc
  98. +6
    -3
      tests/ut/ge/graph/build/mem_assigner_unittest.cc
  99. +2
    -0
      tests/ut/ge/graph/ge_executor_unittest.cc
  100. +10
    -7
      tests/ut/ge/graph/load/data_dumper_unittest.cc

+ 14
- 1
CMakeLists.txt View File

@@ -13,6 +13,12 @@ if(DEFINED ENV{ASCEND_CUSTOM_PATH})
else() else()
set(ASCEND_DIR /usr/local/Ascend) set(ASCEND_DIR /usr/local/Ascend)
endif() endif()

if(DEFINED ENV{D_PKG_SERVER})
set(GE_PB_PKG $ENV{D_PKG_SERVER})
message("Download packages from PKG server")
endif()

set(ASCEND_DRIVER_DIR ${ASCEND_DIR}/driver/lib64) set(ASCEND_DRIVER_DIR ${ASCEND_DIR}/driver/lib64)
set(ASCEND_DRIVER_COMMON_DIR ${ASCEND_DIR}/driver/lib64/common) set(ASCEND_DRIVER_COMMON_DIR ${ASCEND_DIR}/driver/lib64/common)
set(ASCEND_DRIVER_SHARE_DIR ${ASCEND_DIR}/driver/lib64/share) set(ASCEND_DRIVER_SHARE_DIR ${ASCEND_DIR}/driver/lib64/share)
@@ -37,6 +43,7 @@ if (ENABLE_OPEN_SRC)
include(cmake/external_libs/protobuf_static.cmake) include(cmake/external_libs/protobuf_static.cmake)
include(cmake/external_libs/protoc.cmake) include(cmake/external_libs/protoc.cmake)
include(cmake/external_libs/gflags.cmake) include(cmake/external_libs/gflags.cmake)
include(cmake/external_libs/gtest.cmake)
include(cmake/external_libs/securec.cmake) include(cmake/external_libs/securec.cmake)
include(cmake/external_libs/json.cmake) include(cmake/external_libs/json.cmake)
include(cmake/FindModule.cmake) include(cmake/FindModule.cmake)
@@ -78,6 +85,7 @@ if (ENABLE_OPEN_SRC)
else() else()
find_module(slog libslog.so ${ASCEND_ATC_DIR}) find_module(slog libslog.so ${ASCEND_ATC_DIR})
find_module(static_mmpa libmmpa.a ${ASCEND_ATC_DIR}) find_module(static_mmpa libmmpa.a ${ASCEND_ATC_DIR})
find_module(error_manager liberror_manager.so ${ASCEND_ATC_DIR})
if(PLATFORM STREQUAL "train") if(PLATFORM STREQUAL "train")
find_module(msprof libmsprof.so ${ASCEND_DRIVER_COMMON_DIR}) find_module(msprof libmsprof.so ${ASCEND_DRIVER_COMMON_DIR})
find_module(hccl libhccl.so ${ASCEND_RUNTIME_DIR}) find_module(hccl libhccl.so ${ASCEND_RUNTIME_DIR})
@@ -123,8 +131,13 @@ if (ENABLE_OPEN_SRC)
find_module(ascend_hal_stub libascend_hal.so ${ASCEND_DRIVER_DIR}/driver) find_module(ascend_hal_stub libascend_hal.so ${ASCEND_DRIVER_DIR}/driver)
#find_module(ascendcl_static libascendcl.a ${ASCEND_ACL_DIR}) #find_module(ascendcl_static libascendcl.a ${ASCEND_ACL_DIR})
else() else()
message(FATAL_ERROR "PLATFORM param is invalid, should be train or inference, build terminated")
message(STATUS "PLATFORM param is invalid, should be train or inference, you choose nothing!")
endif() endif()

if (ENABLE_GE_COV OR ENABLE_GE_UT)
add_subdirectory(tests)
endif()

endif() endif()


set(METADEF_DIR ${CMAKE_CURRENT_LIST_DIR}/metadef) set(METADEF_DIR ${CMAKE_CURRENT_LIST_DIR}/metadef)


+ 20
- 17
build.sh View File

@@ -59,7 +59,7 @@ checkopts()
ENABLE_GE_ST="off" ENABLE_GE_ST="off"
ENABLE_GE_COV="off" ENABLE_GE_COV="off"
GE_ONLY="on" GE_ONLY="on"
PLATFORM="inference"
PLATFORM=""
PRODUCT="normal" PRODUCT="normal"
ENABLE_GITEE="off" ENABLE_GITEE="off"
# Process the options # Process the options
@@ -166,6 +166,9 @@ build_graphengine()
elif [ "x${PLATFORM}" = "xinference" ] elif [ "x${PLATFORM}" = "xinference" ]
then then
TARGET="ge_compiler atc_ge_local_engine atc_ge_local_opskernel_builder atc_host_cpu_engine atc_host_cpu_opskernel_builder atc opensrc_ascendcl ${TARGET}" TARGET="ge_compiler atc_ge_local_engine atc_ge_local_opskernel_builder atc_host_cpu_engine atc_host_cpu_opskernel_builder atc opensrc_ascendcl ${TARGET}"
elif [ "X$ENABLE_GE_UT" = "Xon" ]
then
TARGET="ut_libgraph ut_libge_multiparts_utest ut_libge_others_utest ut_libge_kernel_utest ut_libge_distinct_load_utest"
elif [ "x${PLATFORM}" = "xall" ] elif [ "x${PLATFORM}" = "xall" ]
then then
# build all the target # build all the target
@@ -199,25 +202,25 @@ echo "---------------- GraphEngine output generated ----------------"
# cp ${BUILD_PATH}/graphengine/tests/st/st_resnet50_train ${OUTPUT_PATH} # cp ${BUILD_PATH}/graphengine/tests/st/st_resnet50_train ${OUTPUT_PATH}
# fi # fi


# if [[ "X$ENABLE_GE_UT" = "Xon" || "X$ENABLE_GE_COV" = "Xon" ]]; then
# cp ${BUILD_PATH}/graphengine/tests/ut/common/graph/ut_libgraph ${OUTPUT_PATH}
# cp ${BUILD_PATH}/graphengine/tests/ut/ge/ut_libge_multiparts_utest ${OUTPUT_PATH}
# cp ${BUILD_PATH}/graphengine/tests/ut/ge/ut_libge_distinct_load_utest ${OUTPUT_PATH}
# cp ${BUILD_PATH}/graphengine/tests/ut/ge/ut_libge_others_utest ${OUTPUT_PATH}
# cp ${BUILD_PATH}/graphengine/tests/ut/ge/ut_libge_kernel_utest ${OUTPUT_PATH}
if [[ "X$ENABLE_GE_UT" = "Xon" || "X$ENABLE_GE_COV" = "Xon" ]]; then
cp ${BUILD_PATH}/tests/ut/common/graph/ut_libgraph ${OUTPUT_PATH}
cp ${BUILD_PATH}/tests/ut/ge/ut_libge_multiparts_utest ${OUTPUT_PATH}
cp ${BUILD_PATH}/tests/ut/ge/ut_libge_distinct_load_utest ${OUTPUT_PATH}
cp ${BUILD_PATH}/tests/ut/ge/ut_libge_others_utest ${OUTPUT_PATH}
cp ${BUILD_PATH}/tests/ut/ge/ut_libge_kernel_utest ${OUTPUT_PATH}


# if [[ "X${ENABLE_GE_UT_ONLY_COMPILE}" != "Xon" ]]; then # if [[ "X${ENABLE_GE_UT_ONLY_COMPILE}" != "Xon" ]]; then
# export LD_LIBRARY_PATH=${D_LINK_PATH}/x86_64/:${BUILD_PATH}../third_party/prebuild/x86_64/:${BUILD_PATH}/graphengine/:/usr/local/HiAI/driver/lib64:/usr/local/HiAI/runtime/lib64:${LD_LIBRARY_PATH} # export LD_LIBRARY_PATH=${D_LINK_PATH}/x86_64/:${BUILD_PATH}../third_party/prebuild/x86_64/:${BUILD_PATH}/graphengine/:/usr/local/HiAI/driver/lib64:/usr/local/HiAI/runtime/lib64:${LD_LIBRARY_PATH}
# echo ${LD_LIBRARY_PATH} # echo ${LD_LIBRARY_PATH}
# ${OUTPUT_PATH}/ut_libgraph &&
# ${OUTPUT_PATH}/ut_libge_multiparts_utest &&
# ${OUTPUT_PATH}/ut_libge_distinct_load_utest &&
# ${OUTPUT_PATH}/ut_libge_others_utest &&
# ${OUTPUT_PATH}/ut_libge_kernel_utest
# if [[ "$?" -ne 0 ]]; then
# echo "!!! UT FAILED, PLEASE CHECK YOUR CHANGES !!!"
# exit 1;
# fi
${OUTPUT_PATH}/ut_libgraph &&
${OUTPUT_PATH}/ut_libge_multiparts_utest &&
${OUTPUT_PATH}/ut_libge_distinct_load_utest &&
${OUTPUT_PATH}/ut_libge_others_utest &&
${OUTPUT_PATH}/ut_libge_kernel_utest
if [[ "$?" -ne 0 ]]; then
echo "!!! UT FAILED, PLEASE CHECK YOUR CHANGES !!!"
exit 1;
fi
# fi # fi


# if [[ "X$ENABLE_GE_COV" = "Xon" ]]; then # if [[ "X$ENABLE_GE_COV" = "Xon" ]]; then
@@ -227,7 +230,7 @@ echo "---------------- GraphEngine output generated ----------------"
# mkdir ${BASEPATH}/cov # mkdir ${BASEPATH}/cov
# gcovr -r ./ --exclude 'third_party' --exclude 'build' --exclude 'tests' --exclude 'prebuild' --exclude 'inc' --print-summary --html --html-details -d -o cov/index.html # gcovr -r ./ --exclude 'third_party' --exclude 'build' --exclude 'tests' --exclude 'prebuild' --exclude 'inc' --print-summary --html --html-details -d -o cov/index.html
# fi # fi
# fi
fi


# generate output package in tar form, including ut/st libraries/executables # generate output package in tar form, including ut/st libraries/executables
generate_package() generate_package()


+ 60
- 0
cmake/external_libs/gtest.cmake View File

@@ -0,0 +1,60 @@
if (HAVE_GTEST)
return()
endif()

include(ExternalProject)

if ((${CMAKE_INSTALL_PREFIX} STREQUAL /usr/local) OR
(${CMAKE_INSTALL_PREFIX} STREQUAL "C:/Program Files (x86)/ascend"))
set(CMAKE_INSTALL_PREFIX ${GE_CODE_DIR}/output CACHE STRING "path for install()" FORCE)
message(STATUS "No install prefix selected, default to ${CMAKE_INSTALL_PREFIX}.")
endif()

if (ENABLE_GITEE)
set(REQ_URL "https://gitee.com/mirrors/googletest/repository/archive/release-1.8.0.tar.gz")
set(MD5 "")
else()
set(REQ_URL "https://github.com/google/googletest/archive/release-1.8.0.tar.gz")
set(MD5 "")
endif ()

set (gtest_CXXFLAGS "-D_GLIBCXX_USE_CXX11_ABI=0 -D_FORTIFY_SOURCE=2 -O2 -fstack-protector-all -Wl,-z,relro,-z,now,-z,noexecstack")
set (gtest_CFLAGS "-D_GLIBCXX_USE_CXX11_ABI=0 -D_FORTIFY_SOURCE=2 -O2 -fstack-protector-all -Wl,-z,relro,-z,now,-z,noexecstack")
ExternalProject_Add(gtest_build
URL ${REQ_URL}
CONFIGURE_COMMAND ${CMAKE_COMMAND} -DCMAKE_CXX_FLAGS=${gtest_CXXFLAGS} -DCMAKE_INSTALL_PREFIX=${CMAKE_INSTALL_PREFIX}/gtest <SOURCE_DIR>
-DBUILD_TESTING=OFF -DCMAKE_POSITION_INDEPENDENT_CODE=ON -DBUILD_SHARED_LIBS=ON -DCMAKE_MACOSX_RPATH=TRUE -Dgtest_disable_pthreads=ON
BUILD_COMMAND $(MAKE)
INSTALL_COMMAND $(MAKE) install
EXCLUDE_FROM_ALL TRUE
)

set(GTEST_PKG_DIR ${CMAKE_INSTALL_PREFIX}/gtest)

file(MAKE_DIRECTORY ${GTEST_PKG_DIR}/include)

add_library(gtest SHARED IMPORTED)

set_target_properties(gtest PROPERTIES
IMPORTED_LOCATION ${GTEST_PKG_DIR}/lib/libgtest.so
)

add_library(gtest_main SHARED IMPORTED)

set_target_properties(gtest_main PROPERTIES
IMPORTED_LOCATION ${GTEST_PKG_DIR}/lib/libgtest_main.so
)

target_include_directories(gtest INTERFACE ${GTEST_PKG_DIR}/include)
target_include_directories(gtest_main INTERFACE ${GTEST_PKG_DIR}/include)

set(INSTALL_BASE_DIR "")
set(INSTALL_LIBRARY_DIR lib)

install(FILES ${GTEST_PKG_DIR}/lib/libgtest.so ${GTEST_PKG_DIR}/lib/libgtest_main.so OPTIONAL
DESTINATION ${INSTALL_LIBRARY_DIR})

add_dependencies(gtest gtest_build)

#set(HAVE_GFLAGS TRUE CACHE BOOL "gflags build add")
set(HAVE_GTEST TRUE)

+ 9
- 9
cmake/external_libs/json.cmake View File

@@ -5,15 +5,15 @@ endif()
include(ExternalProject) include(ExternalProject)


set(JSON_SRC_DIR ${CMAKE_BINARY_DIR}/opensrc/json/include) set(JSON_SRC_DIR ${CMAKE_BINARY_DIR}/opensrc/json/include)
if (ENABLE_GITEE)
set(REQ_URL "https://gitee.com/mirrors/JSON-for-Modern-CPP/repository/archive/v3.6.1.zip")
set(MD5 "5bda78ce308e6cfcf614dcf1d5ff27a7")
set(JSON_INCLUDE_DIR "${JSON_SRC_DIR}/include")
else()
set(REQ_URL "https://github.com/nlohmann/json/releases/download/v3.6.1/include.zip")
set(MD5 "0dc903888211db3a0f170304cd9f3a89")
set(JSON_INCLUDE_DIR ${JSON_SRC_DIR})
endif ()
#if (ENABLE_GITEE)
# set(REQ_URL "https://gitee.com/mirrors/JSON-for-Modern-CPP/repository/archive/v3.6.1.zip")
# set(MD5 "5bda78ce308e6cfcf614dcf1d5ff27a7")
# set(JSON_INCLUDE_DIR "${JSON_SRC_DIR}/include")
#else()
set(REQ_URL "https://github.com/nlohmann/json/releases/download/v3.6.1/include.zip")
set(MD5 "0dc903888211db3a0f170304cd9f3a89")
set(JSON_INCLUDE_DIR ${JSON_SRC_DIR})
#endif ()
ExternalProject_Add(json_build ExternalProject_Add(json_build
URL ${REQ_URL} URL ${REQ_URL}
#URL /home/txd/workspace/cloud_code/pkg/include.zip #URL /home/txd/workspace/cloud_code/pkg/include.zip


+ 11
- 8
cmake/external_libs/protobuf_shared.cmake View File

@@ -10,19 +10,22 @@ if ((${CMAKE_INSTALL_PREFIX} STREQUAL /usr/local) OR
set(CMAKE_INSTALL_PREFIX ${GE_CODE_DIR}/output CACHE STRING "path for install()" FORCE) set(CMAKE_INSTALL_PREFIX ${GE_CODE_DIR}/output CACHE STRING "path for install()" FORCE)
message(STATUS "No install prefix selected, default to ${CMAKE_INSTALL_PREFIX}.") message(STATUS "No install prefix selected, default to ${CMAKE_INSTALL_PREFIX}.")
endif() endif()

if (ENABLE_GITEE)
set(REQ_URL "https://gitee.com/mirrors/protobuf_source/repository/archive/v3.8.0.tar.gz")
set(MD5 "eba86ae9f07ba5cfbaf8af3bc4e84236")
if (GE_PB_PKG)
set(REQ_URL "${GE_PB_PKG}/libs/protobuf/v3.8.0.tar.gz")
else() else()
set(REQ_URL "https://github.com/protocolbuffers/protobuf/archive/v3.8.0.tar.gz")
set(MD5 "3d9e32700639618a4d2d342c99d4507a")
endif ()
if (ENABLE_GITEE)
set(REQ_URL "https://gitee.com/mirrors/protobuf_source/repository/archive/v3.8.0.tar.gz")
set(MD5 "eba86ae9f07ba5cfbaf8af3bc4e84236")
else()
set(REQ_URL "https://github.com/protocolbuffers/protobuf/archive/v3.8.0.tar.gz")
set(MD5 "3d9e32700639618a4d2d342c99d4507a")
endif ()
endif()


set(protobuf_CXXFLAGS "-Wno-maybe-uninitialized -Wno-unused-parameter -fPIC -fstack-protector-all -D_FORTIFY_SOURCE=2 -D_GLIBCXX_USE_CXX11_ABI=0 -O2 -Dgoogle=ascend_private") set(protobuf_CXXFLAGS "-Wno-maybe-uninitialized -Wno-unused-parameter -fPIC -fstack-protector-all -D_FORTIFY_SOURCE=2 -D_GLIBCXX_USE_CXX11_ABI=0 -O2 -Dgoogle=ascend_private")
set(protobuf_LDFLAGS "-Wl,-z,relro,-z,now,-z,noexecstack") set(protobuf_LDFLAGS "-Wl,-z,relro,-z,now,-z,noexecstack")
ExternalProject_Add(protobuf_build ExternalProject_Add(protobuf_build
URL https://github.com/protocolbuffers/protobuf/archive/v3.8.0.tar.gz
URL ${REQ_URL}
CONFIGURE_COMMAND ${CMAKE_COMMAND} CONFIGURE_COMMAND ${CMAKE_COMMAND}
-Dprotobuf_WITH_ZLIB=OFF -Dprotobuf_WITH_ZLIB=OFF
-DCMAKE_INSTALL_LIBDIR=${CMAKE_INSTALL_LIBDIR} -DCMAKE_INSTALL_LIBDIR=${CMAKE_INSTALL_LIBDIR}


+ 11
- 7
cmake/external_libs/protobuf_static.cmake View File

@@ -8,19 +8,23 @@ if ((${CMAKE_INSTALL_PREFIX} STREQUAL /usr/local) OR
message(STATUS "No install prefix selected, default to ${CMAKE_INSTALL_PREFIX}.") message(STATUS "No install prefix selected, default to ${CMAKE_INSTALL_PREFIX}.")
endif() endif()


if (ENABLE_GITEE)
set(REQ_URL "https://gitee.com/mirrors/protobuf_source/repository/archive/v3.8.0.tar.gz")
set(MD5 "eba86ae9f07ba5cfbaf8af3bc4e84236")
if(GE_PB_PKG)
set(REQ_URL "${GE_PB_PKG}/libs/protobuf/v3.8.0.tar.gz")
else() else()
set(REQ_URL "https://github.com/protocolbuffers/protobuf/archive/v3.8.0.tar.gz")
set(MD5 "3d9e32700639618a4d2d342c99d4507a")
endif ()
if (ENABLE_GITEE)
set(REQ_URL "https://gitee.com/mirrors/protobuf_source/repository/archive/v3.8.0.tar.gz")
set(MD5 "eba86ae9f07ba5cfbaf8af3bc4e84236")
else()
set(REQ_URL "https://github.com/protocolbuffers/protobuf/archive/v3.8.0.tar.gz")
set(MD5 "3d9e32700639618a4d2d342c99d4507a")
endif ()
endif()


set(protobuf_CXXFLAGS "-Wno-maybe-uninitialized -Wno-unused-parameter -fPIC -fstack-protector-all -D_FORTIFY_SOURCE=2 -D_GLIBCXX_USE_CXX11_ABI=0 -O2 -Dgoogle=ascend_private") set(protobuf_CXXFLAGS "-Wno-maybe-uninitialized -Wno-unused-parameter -fPIC -fstack-protector-all -D_FORTIFY_SOURCE=2 -D_GLIBCXX_USE_CXX11_ABI=0 -O2 -Dgoogle=ascend_private")
set(protobuf_LDFLAGS "-Wl,-z,relro,-z,now,-z,noexecstack") set(protobuf_LDFLAGS "-Wl,-z,relro,-z,now,-z,noexecstack")
set(PROTOBUF_STATIC_PKG_DIR ${CMAKE_INSTALL_PREFIX}/protobuf_static) set(PROTOBUF_STATIC_PKG_DIR ${CMAKE_INSTALL_PREFIX}/protobuf_static)
ExternalProject_Add(protobuf_static_build ExternalProject_Add(protobuf_static_build
URL https://github.com/protocolbuffers/protobuf/archive/v3.8.0.tar.gz
URL ${REQ_URL}
#URL /home/txd/workspace/linux_cmake/pkg/protobuf-3.8.0.tar.gz #URL /home/txd/workspace/linux_cmake/pkg/protobuf-3.8.0.tar.gz
#SOURCE_DIR ${METADEF_DIR}/../../third_party/protobuf/src/protobuf-3.8.0 #SOURCE_DIR ${METADEF_DIR}/../../third_party/protobuf/src/protobuf-3.8.0
CONFIGURE_COMMAND ${CMAKE_COMMAND} CONFIGURE_COMMAND ${CMAKE_COMMAND}


+ 10
- 7
cmake/external_libs/protoc.cmake View File

@@ -12,14 +12,17 @@ if ((${CMAKE_INSTALL_PREFIX} STREQUAL /usr/local) OR
message(STATUS "No install prefix selected, default to ${CMAKE_INSTALL_PREFIX}.") message(STATUS "No install prefix selected, default to ${CMAKE_INSTALL_PREFIX}.")
endif() endif()
if (ENABLE_GITEE)
set(REQ_URL "https://gitee.com/mirrors/protobuf_source/repository/archive/v3.8.0.tar.gz")
set(MD5 "eba86ae9f07ba5cfbaf8af3bc4e84236")
if(GE_PB_PKG)
set(REQ_URL "${GE_PB_PKG}/libs/protobuf/v3.8.0.tar.gz")
else() else()
set(REQ_URL "https://github.com/protocolbuffers/protobuf/archive/v3.8.0.tar.gz")
set(MD5 "3d9e32700639618a4d2d342c99d4507a")
endif ()
if (ENABLE_GITEE)
set(REQ_URL "https://gitee.com/mirrors/protobuf_source/repository/archive/v3.8.0.tar.gz")
set(MD5 "eba86ae9f07ba5cfbaf8af3bc4e84236")
else()
set(REQ_URL "https://github.com/protocolbuffers/protobuf/archive/v3.8.0.tar.gz")
set(MD5 "3d9e32700639618a4d2d342c99d4507a")
endif ()
endif()
set(protobuf_CXXFLAGS "-Wno-maybe-uninitialized -Wno-unused-parameter -fPIC -fstack-protector-all -D_FORTIFY_SOURCE=2 -D_GLIBCXX_USE_CXX11_ABI=0 -O2") set(protobuf_CXXFLAGS "-Wno-maybe-uninitialized -Wno-unused-parameter -fPIC -fstack-protector-all -D_FORTIFY_SOURCE=2 -D_GLIBCXX_USE_CXX11_ABI=0 -O2")
set(protobuf_LDFLAGS "-Wl,-z,relro,-z,now,-z,noexecstack") set(protobuf_LDFLAGS "-Wl,-z,relro,-z,now,-z,noexecstack")


+ 1
- 1
ge/common/CMakeLists.txt View File

@@ -115,7 +115,7 @@ target_link_libraries(ge_common PRIVATE
slog slog
-Wl,--as-needed -Wl,--as-needed
json json
-lrt
$<$<NOT:$<STREQUAL:${TARGET_SYSTEM_NAME},Android>>:-lrt>
-ldl -ldl
) )




+ 10
- 10
ge/common/helper/model_helper.cc View File

@@ -140,8 +140,8 @@ FMK_FUNC_HOST_VISIBILITY FMK_FUNC_DEV_VISIBILITY Status ModelHelper::SaveToOmMod


std::shared_ptr<ModelTaskDef> model_task_def = ge_model->GetModelTaskDefPtr(); std::shared_ptr<ModelTaskDef> model_task_def = ge_model->GetModelTaskDefPtr();
if (model_task_def == nullptr) { if (model_task_def == nullptr) {
GELOGE(MEMALLOC_FAILED, "Create model task def ptr failed");
return FAILED;
GELOGE(ACL_ERROR_GE_MEMORY_ALLOCATION, "Create model task def ptr failed");
return ACL_ERROR_GE_MEMORY_ALLOCATION;
} }
size_t partition_task_size = model_task_def->ByteSizeLong(); size_t partition_task_size = model_task_def->ByteSizeLong();
GE_IF_BOOL_EXEC(partition_task_size == 0 || partition_task_size > INT_MAX, GE_IF_BOOL_EXEC(partition_task_size == 0 || partition_task_size > INT_MAX,
@@ -150,8 +150,8 @@ FMK_FUNC_HOST_VISIBILITY FMK_FUNC_DEV_VISIBILITY Status ModelHelper::SaveToOmMod


ge::Buffer task_buffer(partition_task_size); ge::Buffer task_buffer(partition_task_size);
if (task_buffer.GetSize() == 0) { if (task_buffer.GetSize() == 0) {
GELOGE(MEMALLOC_FAILED, "Alloc model task def buffer failed");
return MEMALLOC_FAILED;
GELOGE(ACL_ERROR_GE_MEMORY_ALLOCATION, "Alloc model task def buffer failed");
return ACL_ERROR_GE_MEMORY_ALLOCATION;
} }
(void)model_task_def->SerializePartialToArray(task_buffer.GetData(), static_cast<int>(partition_task_size)); (void)model_task_def->SerializePartialToArray(task_buffer.GetData(), static_cast<int>(partition_task_size));


@@ -173,8 +173,8 @@ FMK_FUNC_HOST_VISIBILITY FMK_FUNC_DEV_VISIBILITY Status ModelHelper::SaveToOmMod
err = memcpy_s(model_header.platform_version, PLATFORM_VERSION_LEN, platform_version.c_str(), err = memcpy_s(model_header.platform_version, PLATFORM_VERSION_LEN, platform_version.c_str(),
platform_version.size() + 1); platform_version.size() + 1);
if (err != EOK) { if (err != EOK) {
GELOGE(MEMALLOC_FAILED, "ModelHelper SaveModel failed while allocating memory for platform_version.");
return MEMALLOC_FAILED;
GELOGE(ACL_ERROR_GE_MEMORY_ALLOCATION, "ModelHelper SaveModel failed while allocating memory for platform_version.");
return ACL_ERROR_GE_MEMORY_ALLOCATION;
} }
string version = reinterpret_cast<char *>(model_header.platform_version); string version = reinterpret_cast<char *>(model_header.platform_version);
GELOGD("Platform version save: %s", version.c_str()); GELOGD("Platform version save: %s", version.c_str());
@@ -183,8 +183,8 @@ FMK_FUNC_HOST_VISIBILITY FMK_FUNC_DEV_VISIBILITY Status ModelHelper::SaveToOmMod
name_size = name_size > (MODEL_NAME_LENGTH - 1) ? (MODEL_NAME_LENGTH - 1) : name_size; name_size = name_size > (MODEL_NAME_LENGTH - 1) ? (MODEL_NAME_LENGTH - 1) : name_size;
err = memcpy_s(model_header.name, MODEL_NAME_LENGTH, ge_model->GetName().c_str(), name_size); err = memcpy_s(model_header.name, MODEL_NAME_LENGTH, ge_model->GetName().c_str(), name_size);
if (err != EOK) { if (err != EOK) {
GELOGE(MEMALLOC_FAILED, "ModelHelper SaveModel failed while allocating memory for name");
return MEMALLOC_FAILED;
GELOGE(ACL_ERROR_GE_MEMORY_ALLOCATION, "ModelHelper SaveModel failed while allocating memory for name");
return ACL_ERROR_GE_MEMORY_ALLOCATION;
} }
string model_name = reinterpret_cast<char *>(model_header.name); string model_name = reinterpret_cast<char *>(model_header.name);
GELOGD("Model name save:%s", model_name.c_str()); GELOGD("Model name save:%s", model_name.c_str());
@@ -299,8 +299,8 @@ FMK_FUNC_HOST_VISIBILITY FMK_FUNC_DEV_VISIBILITY Status ModelHelper::LoadModel(c
auto partition_table = reinterpret_cast<ModelPartitionTable *>(model_addr_tmp_); auto partition_table = reinterpret_cast<ModelPartitionTable *>(model_addr_tmp_);
if (partition_table->num == kOriginalOmPartitionNum) { if (partition_table->num == kOriginalOmPartitionNum) {
model_addr_tmp_ = nullptr; model_addr_tmp_ = nullptr;
GELOGE(ACL_ERROR_GE_EXEC_MODEL_PARTITION_NUM_INVALID, "om model is error,please use executable om model");
return ACL_ERROR_GE_EXEC_MODEL_PARTITION_NUM_INVALID;
GELOGE(ACL_ERROR_GE_PARAM_INVALID, "om model is error,please use executable om model");
return ACL_ERROR_GE_PARAM_INVALID;
} }
// Encrypt model need to del temp model/no encrypt model don't need to del model // Encrypt model need to del temp model/no encrypt model don't need to del model
model_addr_tmp_ = nullptr; model_addr_tmp_ = nullptr;


+ 2
- 2
ge/common/helper/om_file_helper.cc View File

@@ -119,8 +119,8 @@ Status OmFileLoadHelper::LoadModelPartitionTable(uint8_t *model_data, const uint
// Original model partition include graph-info // Original model partition include graph-info
if ((partition_table->num != PARTITION_SIZE) && (partition_table->num != (PARTITION_SIZE - 1)) && if ((partition_table->num != PARTITION_SIZE) && (partition_table->num != (PARTITION_SIZE - 1)) &&
(partition_table->num != (PARTITION_SIZE - kOptionalNum)) && (partition_table->num != 1)) { (partition_table->num != (PARTITION_SIZE - kOptionalNum)) && (partition_table->num != 1)) {
GELOGE(ACL_ERROR_GE_EXEC_MODEL_PARTITION_NUM_INVALID, "Invalid partition_table->num:%u", partition_table->num);
return ACL_ERROR_GE_EXEC_MODEL_PARTITION_NUM_INVALID;
GELOGE(ACL_ERROR_GE_PARAM_INVALID, "Invalid partition_table->num:%u", partition_table->num);
return ACL_ERROR_GE_PARAM_INVALID;
} }
size_t mem_offset = SIZE_OF_MODEL_PARTITION_TABLE(*partition_table); size_t mem_offset = SIZE_OF_MODEL_PARTITION_TABLE(*partition_table);
GELOGD("ModelPartitionTable num :%u, ModelFileHeader length :%zu, ModelPartitionTable length :%zu", GELOGD("ModelPartitionTable num :%u, ModelFileHeader length :%zu, ModelPartitionTable length :%zu",


+ 3
- 3
ge/common/model_parser/base.cc View File

@@ -101,15 +101,15 @@ FMK_FUNC_HOST_VISIBILITY FMK_FUNC_DEV_VISIBILITY Status ModelParserBase::ParseMo
// Get data address // Get data address
uint8_t *data = reinterpret_cast<uint8_t *>(model.model_data) + sizeof(ModelFileHeader); uint8_t *data = reinterpret_cast<uint8_t *>(model.model_data) + sizeof(ModelFileHeader);
if (file_header->is_encrypt == ModelEncryptType::UNENCRYPTED) { // Unencrypted model if (file_header->is_encrypt == ModelEncryptType::UNENCRYPTED) { // Unencrypted model
GE_CHK_BOOL_RET_STATUS(model.key.empty(), ACL_ERROR_GE_EXEC_MODEL_NOT_SUPPORT_ENCRYPTION,
GE_CHK_BOOL_RET_STATUS(model.key.empty(), ACL_ERROR_GE_PARAM_INVALID,
"Invalid param. model is unencrypted, but key is not empty."); "Invalid param. model is unencrypted, but key is not empty.");


model_data = data; model_data = data;
model_len = file_header->length; model_len = file_header->length;
GELOGD("Model_len is %u, model_file_head_len is %zu.", model_len, sizeof(ModelFileHeader)); GELOGD("Model_len is %u, model_file_head_len is %zu.", model_len, sizeof(ModelFileHeader));
} else { } else {
GELOGE(ACL_ERROR_GE_EXEC_MODEL_NOT_SUPPORT_ENCRYPTION, "Invalid model. ModelEncryptType not supported.");
res = ACL_ERROR_GE_EXEC_MODEL_NOT_SUPPORT_ENCRYPTION;
GELOGE(ACL_ERROR_GE_PARAM_INVALID, "Invalid model. ModelEncryptType not supported.");
res = ACL_ERROR_GE_PARAM_INVALID;
} }


return res; return res;


+ 1
- 0
ge/common/types.cc View File

@@ -382,6 +382,7 @@ REGISTER_OPTYPE_DEFINE(HCOMBROADCAST, "HcomBroadcast");
REGISTER_OPTYPE_DEFINE(HCOMALLGATHER, "HcomAllGather"); REGISTER_OPTYPE_DEFINE(HCOMALLGATHER, "HcomAllGather");
REGISTER_OPTYPE_DEFINE(HCOMALLREDUCE, "HcomAllReduce"); REGISTER_OPTYPE_DEFINE(HCOMALLREDUCE, "HcomAllReduce");
REGISTER_OPTYPE_DEFINE(HCOMREDUCESCATTER, "HcomReduceScatter"); REGISTER_OPTYPE_DEFINE(HCOMREDUCESCATTER, "HcomReduceScatter");
REGISTER_OPTYPE_DEFINE(HCOMREDUCE, "HcomReduce");
REGISTER_OPTYPE_DEFINE(HCOMSEND, "HcomSend"); REGISTER_OPTYPE_DEFINE(HCOMSEND, "HcomSend");
REGISTER_OPTYPE_DEFINE(HCOMRECEIVE, "HcomReceive"); REGISTER_OPTYPE_DEFINE(HCOMRECEIVE, "HcomReceive");
REGISTER_OPTYPE_DEFINE(HCOMREMOTEREAD, "HcomRemoteRead"); REGISTER_OPTYPE_DEFINE(HCOMREMOTEREAD, "HcomRemoteRead");


+ 19
- 1
ge/generator/ge_generator.cc View File

@@ -25,6 +25,7 @@
#include "common/util.h" #include "common/util.h"
#include "common/util/error_manager/error_manager.h" #include "common/util/error_manager/error_manager.h"
#include "framework/common/debug/ge_log.h" #include "framework/common/debug/ge_log.h"
#include "framework/common/debug/log.h"
#include "ge/ge_api.h" #include "ge/ge_api.h"
#include "graph/debug/ge_attr_define.h" #include "graph/debug/ge_attr_define.h"
#include "graph/ge_context.h" #include "graph/ge_context.h"
@@ -76,6 +77,9 @@ static Status CheckEngineTypeSupport(const OpDescPtr &op_desc, OpEngineType engi
op_engine_name = iter->second; op_engine_name = iter->second;
GELOGI("CheckEngineType: engine type: %d", static_cast<int>(engine_type)); GELOGI("CheckEngineType: engine type: %d", static_cast<int>(engine_type));
} else { } else {
ErrorManager::GetInstance().ATCReportErrMessage("E14001", {"opname", "optype", "value", "reason"},
{op_desc->GetName(), op_desc->GetType(), "engine type",
"it only support kEngineNameDefault/kAIcoreEngine/kVectorEngine"});
GELOGE(FAILED, "CheckEngineType: engine type: %d not support", static_cast<int>(engine_type)); GELOGE(FAILED, "CheckEngineType: engine type: %d not support", static_cast<int>(engine_type));
return FAILED; return FAILED;
} }
@@ -94,6 +98,8 @@ static Status CheckEngineTypeSupport(const OpDescPtr &op_desc, OpEngineType engi
OpsKernelManager &ops_kernel_manager = instance_ptr->OpsKernelManagerObj(); OpsKernelManager &ops_kernel_manager = instance_ptr->OpsKernelManagerObj();
std::vector<OpInfo> op_infos = ops_kernel_manager.GetOpsKernelInfo(op_desc->GetType()); std::vector<OpInfo> op_infos = ops_kernel_manager.GetOpsKernelInfo(op_desc->GetType());
if (op_infos.empty()) { if (op_infos.empty()) {
ErrorManager::GetInstance().ATCReportErrMessage("E14001", {"opname", "optype", "value", "reason"},
{op_desc->GetName(), op_desc->GetType(), "optype", "it can not find"});
GELOGE(FAILED, "CheckEngineType: Can not get op info by op type %s", op_desc->GetType().c_str()); GELOGE(FAILED, "CheckEngineType: Can not get op info by op type %s", op_desc->GetType().c_str());
return FAILED; return FAILED;
} }
@@ -105,7 +111,9 @@ static Status CheckEngineTypeSupport(const OpDescPtr &op_desc, OpEngineType engi
} }
} }
if (kernel_name.empty()) { if (kernel_name.empty()) {
GELOGE(FAILED, "CheckEngineType:Can not find ops kernel,engine name: %s.", op_engine_name.c_str());
ErrorManager::GetInstance().ATCReportErrMessage("E14001", {"opname", "optype", "value", "reason"},
{op_desc->GetName(), op_desc->GetType(), "engine name" + FmtToStr(op_engine_name), "it can not find"});
GELOGE(FAILED, "CheckEngineType:Can not find ops kernel, engine name: %s.", op_engine_name.c_str());
return FAILED; return FAILED;
} }
auto &kernel_map = ops_kernel_manager.GetAllOpsKernelInfoStores(); auto &kernel_map = ops_kernel_manager.GetAllOpsKernelInfoStores();
@@ -119,11 +127,15 @@ static Status CheckEngineTypeSupport(const OpDescPtr &op_desc, OpEngineType engi
op_engine_name.c_str(), op_desc->GetName().c_str()); op_engine_name.c_str(), op_desc->GetName().c_str());
return SUCCESS; return SUCCESS;
} else { } else {
ErrorManager::GetInstance().ATCReportErrMessage(
"E13002", {"optype", "opskernel", "reason"}, {op_desc->GetType(), kernel_name, unsupported_reason});
GELOGE(FAILED, "CheckEngineType: check support failed, Op type %s of ops kernel %s is unsupported, reason:%s", GELOGE(FAILED, "CheckEngineType: check support failed, Op type %s of ops kernel %s is unsupported, reason:%s",
op_desc->GetType().c_str(), kernel_name.c_str(), unsupported_reason.c_str()); op_desc->GetType().c_str(), kernel_name.c_str(), unsupported_reason.c_str());
return FAILED; return FAILED;
} }
} else { } else {
ErrorManager::GetInstance().ATCReportErrMessage(
"E13003", {"opname", "optype"}, {op_desc->GetName(), op_desc->GetType()});
GELOGE(FAILED, GELOGE(FAILED,
"CheckEngineType:Can not find any supported ops kernel info store by kernel_name %s," "CheckEngineType:Can not find any supported ops kernel info store by kernel_name %s,"
"op type is %s, op name is %s", "op type is %s, op name is %s",
@@ -536,10 +548,16 @@ Status GeGenerator::CheckForSingleOp(OpDescPtr &op_desc, const vector<GeTensor>
const vector<GeTensor> &outputs) { const vector<GeTensor> &outputs) {
GE_CHECK_NOTNULL_EXEC(op_desc, return PARAM_INVALID); GE_CHECK_NOTNULL_EXEC(op_desc, return PARAM_INVALID);
if (!inputs.empty() && (inputs.size() != op_desc->GetAllInputsSize())) { if (!inputs.empty() && (inputs.size() != op_desc->GetAllInputsSize())) {
ErrorManager::GetInstance().ATCReportErrMessage("E14001", {"opname", "optype", "value", "reason"},
{op_desc->GetName(), op_desc->GetType(), "inputs size" + FmtToStr(op_desc->GetAllInputsSize()),
"tensor size is " + FmtToStr(inputs.size())});
GELOGE(PARAM_INVALID, "Tensor size: %zu, Inputs size: %zu", inputs.size(), op_desc->GetAllInputsSize()); GELOGE(PARAM_INVALID, "Tensor size: %zu, Inputs size: %zu", inputs.size(), op_desc->GetAllInputsSize());
return PARAM_INVALID; return PARAM_INVALID;
} }
if (!outputs.empty() && (outputs.size() != op_desc->GetOutputsSize())) { if (!outputs.empty() && (outputs.size() != op_desc->GetOutputsSize())) {
ErrorManager::GetInstance().ATCReportErrMessage("E14001", {"opname", "optype", "value", "reason"},
{op_desc->GetName(), op_desc->GetType(), "outputs size" + FmtToStr(op_desc->GetOutputsSize()),
"tensor size is " + FmtToStr(outputs.size())});
GELOGE(PARAM_INVALID, "Tensor size: %zu, Outputs size: %zu", outputs.size(), op_desc->GetOutputsSize()); GELOGE(PARAM_INVALID, "Tensor size: %zu, Outputs size: %zu", outputs.size(), op_desc->GetOutputsSize());
return PARAM_INVALID; return PARAM_INVALID;
} }


+ 3
- 1
ge/graph/build/graph_builder.cc View File

@@ -377,7 +377,9 @@ Status GraphBuilder::GetTaskInfo(const ge::ModelBuilder &builder, const ModelPtr
} }


auto var_manager = VarManager::Instance(session_id); auto var_manager = VarManager::Instance(session_id);
auto *get_mem_base = reinterpret_cast<uint8_t *>(reinterpret_cast<uintptr_t>(var_manager->GetVarMemMaxSize()));
// since var_mem_logic_base_ = graph_mem_max_size_ + kGraphMemoryBuffer in graph_var_manager.cc,
// get_mem_base should not bigger than kGraphMemoryBuffer
auto *get_mem_base = reinterpret_cast<uint8_t *>(reinterpret_cast<uintptr_t>(kGraphMemoryBuffer>>1));
uint8_t *get_weight_mem_base = get_mem_base; uint8_t *get_weight_mem_base = get_mem_base;
if (weight_size > 0) { if (weight_size > 0) {
get_weight_mem_base = get_mem_base + memory_size + p2p_memory_size; get_weight_mem_base = get_mem_base + memory_size + p2p_memory_size;


+ 1
- 1
ge/graph/build/stream_allocator.cc View File

@@ -49,7 +49,7 @@ inline bool HasContinuousStreamLabel(const ge::OpDescPtr &op_desc, std::string &
} }


bool IsHcclOp(const string &op_type) { bool IsHcclOp(const string &op_type) {
const set<string> hccl_op_types({ge::HCOMBROADCAST, ge::HCOMALLGATHER, ge::HCOMALLREDUCE, ge::HCOMREDUCESCATTER});
const set<string> hccl_op_types({ge::HCOMBROADCAST, ge::HCOMALLGATHER, ge::HCOMALLREDUCE, ge::HCOMREDUCESCATTER, ge::HCOMREDUCE});
return hccl_op_types.find(op_type) != hccl_op_types.end(); return hccl_op_types.find(op_type) != hccl_op_types.end();
} }
} // namespace } // namespace


+ 2
- 1
ge/graph/load/new_model_manager/davinci_model.cc View File

@@ -411,7 +411,8 @@ void DavinciModel::CheckHasHcomOp() {
(op_desc->GetType() == HCOMALLREDUCE) || (op_desc->GetType() == HCOMSEND) || (op_desc->GetType() == HCOMALLREDUCE) || (op_desc->GetType() == HCOMSEND) ||
(op_desc->GetType() == HCOMRECEIVE) || (op_desc->GetType() == HCOMREDUCESCATTER) || (op_desc->GetType() == HCOMRECEIVE) || (op_desc->GetType() == HCOMREDUCESCATTER) ||
(op_desc->GetType() == HVDCALLBACKALLREDUCE) || (op_desc->GetType() == HVDCALLBACKALLGATHER) || (op_desc->GetType() == HVDCALLBACKALLREDUCE) || (op_desc->GetType() == HVDCALLBACKALLGATHER) ||
(op_desc->GetType() == HVDCALLBACKBROADCAST) || (op_desc->GetType() == HVDWAIT)),
(op_desc->GetType() == HVDCALLBACKBROADCAST) || (op_desc->GetType() == HVDWAIT) ||
(op_desc->GetType() == HCOMREDUCE)),
uint32_t stream_id = static_cast<uint32_t>(op_desc->GetStreamId()); uint32_t stream_id = static_cast<uint32_t>(op_desc->GetStreamId());
(void)hcom_streams_.emplace(stream_id); GELOGD("hcom stream: %u.", stream_id); continue); (void)hcom_streams_.emplace(stream_id); GELOGD("hcom stream: %u.", stream_id); continue);
} }


+ 4
- 4
ge/graph/load/new_model_manager/model_manager.cc View File

@@ -1044,7 +1044,7 @@ Status ModelManager::GenSessionId(uint64_t &session_id) {
Status ModelManager::LoadModelOffline(uint32_t &model_id, const ModelData &model, shared_ptr<ModelListener> listener, Status ModelManager::LoadModelOffline(uint32_t &model_id, const ModelData &model, shared_ptr<ModelListener> listener,
void *dev_ptr, size_t mem_size, void *weight_ptr, size_t weight_size) { void *dev_ptr, size_t mem_size, void *weight_ptr, size_t weight_size) {
GE_CHK_BOOL_RET_STATUS(model.key.empty() || mmAccess2(model.key.c_str(), M_F_OK) == EN_OK, GE_CHK_BOOL_RET_STATUS(model.key.empty() || mmAccess2(model.key.c_str(), M_F_OK) == EN_OK,
ACL_ERROR_GE_EXEC_MODEL_KEY_PATH_INVALID,
ACL_ERROR_GE_PARAM_INVALID,
"input key file path %s is invalid, %s", model.key.c_str(), strerror(errno)); "input key file path %s is invalid, %s", model.key.c_str(), strerror(errno));
GenModelId(&model_id); GenModelId(&model_id);


@@ -1130,7 +1130,7 @@ Status ModelManager::LoadModelWithQ(uint32_t &model_id, const ModelData &model_d
const std::vector<uint32_t> &input_queue_ids, const std::vector<uint32_t> &input_queue_ids,
const std::vector<uint32_t> &output_queue_ids) { const std::vector<uint32_t> &output_queue_ids) {
GE_CHK_BOOL_RET_STATUS(model_data.key.empty() || mmAccess2(model_data.key.c_str(), M_F_OK) == EN_OK, GE_CHK_BOOL_RET_STATUS(model_data.key.empty() || mmAccess2(model_data.key.c_str(), M_F_OK) == EN_OK,
ACL_ERROR_GE_EXEC_MODEL_KEY_PATH_INVALID, "input key file path %s is not valid, %s",
ACL_ERROR_GE_PARAM_INVALID, "input key file path %s is not valid, %s",
model_data.key.c_str(), strerror(errno)); model_data.key.c_str(), strerror(errno));


ModelHelper model_helper; ModelHelper model_helper;
@@ -1397,8 +1397,8 @@ Status ModelManager::GetModelMemAndWeightSize(const ModelData &model, size_t &me


auto partition_table = reinterpret_cast<ModelPartitionTable *>(model_data); auto partition_table = reinterpret_cast<ModelPartitionTable *>(model_data);
if (partition_table->num == 1) { if (partition_table->num == 1) {
GELOGE(ACL_ERROR_GE_EXEC_MODEL_PARTITION_NUM_INVALID, "om model is error,please use executable om model");
return ACL_ERROR_GE_EXEC_MODEL_PARTITION_NUM_INVALID;
GELOGE(ACL_ERROR_GE_PARAM_INVALID, "om model is error,please use executable om model");
return ACL_ERROR_GE_PARAM_INVALID;
} }
ModelPartition task_partition; ModelPartition task_partition;
if (om_file_helper.GetModelPartition(ModelPartitionType::TASK_INFO, task_partition) != SUCCESS) { if (om_file_helper.GetModelPartition(ModelPartitionType::TASK_INFO, task_partition) != SUCCESS) {


+ 1
- 1
ge/graph/load/new_model_manager/task_info/hccl_task_info.cc View File

@@ -279,7 +279,7 @@ Status HcclTaskInfo::SetAddrs(const std::shared_ptr<OpDesc> &op_desc,
output_data_addr = output_data_addrs_.empty() ? nullptr : output_data_addrs_[i]; output_data_addr = output_data_addrs_.empty() ? nullptr : output_data_addrs_[i];
} }
kernel_hccl_infos[i].inputDataAddr = input_data_addr; kernel_hccl_infos[i].inputDataAddr = input_data_addr;
if (hccl_type == HCOMALLGATHER || hccl_type == HCOMRECEIVE || hccl_type == HVDCALLBACKALLGATHER) {
if (hccl_type == HCOMALLGATHER || hccl_type == HCOMRECEIVE || hccl_type == HVDCALLBACKALLGATHER || hccl_type == HCOMREDUCE) {
kernel_hccl_infos[i].outputDataAddr = output_data_addr; kernel_hccl_infos[i].outputDataAddr = output_data_addr;
} else if (hccl_type == HCOMALLREDUCE || hccl_type == HCOMREDUCESCATTER || hccl_type == HVDCALLBACKALLREDUCE) { } else if (hccl_type == HCOMALLREDUCE || hccl_type == HCOMREDUCESCATTER || hccl_type == HVDCALLBACKALLREDUCE) {
GE_CHK_STATUS_RET(HcomOmeUtil::GetHcclOperationType(op_desc, op_type), GE_CHK_STATUS_RET(HcomOmeUtil::GetHcclOperationType(op_desc, op_type),


+ 12
- 43
ge/graph/manager/graph_manager.cc View File

@@ -131,6 +131,8 @@ const int64_t kInvalidDynaimcDimsType = -1;
const char *const kSubstrOfGetNextNosinkName = "IteratorGetNext"; const char *const kSubstrOfGetNextNosinkName = "IteratorGetNext";
const char *const kShapeDataName = "ascend_mbatch_shape_data"; const char *const kShapeDataName = "ascend_mbatch_shape_data";
const char *const kGetNextName = "IteratorV2"; const char *const kGetNextName = "IteratorV2";
const char *const kExtAttrDataNodes = "data_nodes";
const char *const kExtAttrGetNextNoSink = "getnext_no_sink";


bool IsTailingOptimization() { bool IsTailingOptimization() {
string is_tailing_optimization_option; string is_tailing_optimization_option;
@@ -2335,11 +2337,12 @@ Status GraphManager::OptimizeStage2(ge::ComputeGraphPtr &compute_graph) {
GE_CHK_STATUS_RET(pass_for_control_attr_optimize.AddPass("OptimizeStage2::AfterMergePasses::" GE_CHK_STATUS_RET(pass_for_control_attr_optimize.AddPass("OptimizeStage2::AfterMergePasses::"
"EndOfSequenceAddControlPass", "EndOfSequenceAddControlPass",
new (std::nothrow) EndOfSequenceAddControlPass)) new (std::nothrow) EndOfSequenceAddControlPass))
// SubgraphPass solves memory_assign_conflicts by insert MemcpyAsync node, which depends on multi attrs and
// graph-structure. So try not to add new pass after SubgraphPass.
// 'SubgraphPass' solves memory_assign_conflicts by insert MemcpyAsync node, which depends on multi attrs and
// graph-structure. Passes after 'SubgraphPass' MUST NOT remove MemcpyAsync/Identity nodes in subgraphs.
GE_CHK_STATUS_RET(pass_for_control_attr_optimize.AddPass("OptimizeStage2::ControlAttrOptimize::SubgraphPass", GE_CHK_STATUS_RET(pass_for_control_attr_optimize.AddPass("OptimizeStage2::ControlAttrOptimize::SubgraphPass",
new (std::nothrow) SubgraphPass)) new (std::nothrow) SubgraphPass))
// AttachStreamLabelPass modifies attr without changing structure of compute_graph
// 'AttachStreamLabelPass' modifies attr without changing structure of compute_graph
// All passes after 'AttachStreamLabelPass' MUST mark stream_label on new nodes by self.
GE_CHK_STATUS_RET(pass_for_control_attr_optimize.AddPass("OptimizeStage2::ControlAttrOptimize::AttachStreamLabelPass", GE_CHK_STATUS_RET(pass_for_control_attr_optimize.AddPass("OptimizeStage2::ControlAttrOptimize::AttachStreamLabelPass",
new (std::nothrow) AttachStreamLabelPass)) new (std::nothrow) AttachStreamLabelPass))


@@ -2483,15 +2486,15 @@ Status GraphManager::CheckAndReleaseMemory(const GeModelPtr &ge_model, const Gra
GELOGE(RT_FAILED, "[GraphManager:] rtSetDevice failed, modelId=%u, graphId=%u.", model_id, graph_id); GELOGE(RT_FAILED, "[GraphManager:] rtSetDevice failed, modelId=%u, graphId=%u.", model_id, graph_id);
continue; continue;
} }
result = GraphLoader::UnloadModel(model_id);
if (result != SUCCESS) {
GELOGW("[GraphManager:] unload model failed, modelId=%u, graphId=%u.", model_id, graph_id);
}
result = GraphLoader::DestroyAicpuKernel(session_id, model_id); result = GraphLoader::DestroyAicpuKernel(session_id, model_id);
if (result != SUCCESS) { if (result != SUCCESS) {
GELOGW("[GraphManager:] destroy aicpu kernel failed when dynamic memory, modelId=%u, graphId=%u.", model_id, GELOGW("[GraphManager:] destroy aicpu kernel failed when dynamic memory, modelId=%u, graphId=%u.", model_id,
graph_id); graph_id);
} }
result = GraphLoader::UnloadModel(model_id);
if (result != SUCCESS) {
GELOGW("[GraphManager:] unload model failed, modelId=%u, graphId=%u.", model_id, graph_id);
}
rt_ret = rtDeviceReset(GetContext().DeviceId()); rt_ret = rtDeviceReset(GetContext().DeviceId());
if (rt_ret != RT_ERROR_NONE) { if (rt_ret != RT_ERROR_NONE) {
GELOGE(RT_FAILED, "[GraphManager:] rtDeviceReset failed, modelId=%u, graphId=%u.", model_id, graph_id); GELOGE(RT_FAILED, "[GraphManager:] rtDeviceReset failed, modelId=%u, graphId=%u.", model_id, graph_id);
@@ -2730,37 +2733,6 @@ void GraphManager::PreRunThread(GraphManager *graph_manager) {
} }
} }


Status GraphManager::DistinguishGetNextAndData(ComputeGraphPtr &graph, vector<NodePtr> &data_nodes,
vector<NodePtr> &getnext_nosink_nodes,
vector<NodePtr> &getnext_sink_nodes) {
GELOGD("Start distinguish getnext and data node.");
for (NodePtr &input_node : graph->GetDirectNode()) {
GE_CHECK_NOTNULL(input_node);
OpDescPtr op_desc = input_node->GetOpDesc();
GE_CHECK_NOTNULL(op_desc);
if (op_desc->GetType() == DATA && op_desc->GetName() != kShapeDataName) {
if (op_desc->GetName().find(kSubstrOfGetNextNosinkName) == string::npos) {
data_nodes.emplace_back(input_node);
} else {
getnext_nosink_nodes.emplace_back(input_node);
}
}
std::string op_type;
auto ret = GetOriginalType(input_node, op_type);
if (ret != SUCCESS) {
GELOGE(FAILED, "Failed to get node %s original type.", input_node->GetName().c_str());
return FAILED;
}
if (op_type == kGetNextName) {
GELOGD("Name of getnext sink is %s.", op_desc->GetName().c_str());
getnext_sink_nodes.emplace_back(input_node);
}
}
GELOGI("data count is %zu, getnext nosink count is %zu, getnext sink count is %zu.", data_nodes.size(),
getnext_nosink_nodes.size(), getnext_sink_nodes.size());
return SUCCESS;
}

void GraphManager::ParseInputsDimsForData(const std::vector<InputTensorInfo> &input_tensor) { void GraphManager::ParseInputsDimsForData(const std::vector<InputTensorInfo> &input_tensor) {
GELOGD("Start parse input dims from data."); GELOGD("Start parse input dims from data.");
for (size_t i = 0; i < input_tensor.size(); ++i) { for (size_t i = 0; i < input_tensor.size(); ++i) {
@@ -2803,11 +2775,8 @@ Status GraphManager::ParseInputsDims(const std::vector<InputTensorInfo> &input_t
if (!GetLocalOmgContext().dynamic_node_type.empty()) { if (!GetLocalOmgContext().dynamic_node_type.empty()) {
vector<NodePtr> data_nodes; vector<NodePtr> data_nodes;
vector<NodePtr> getnext_nosink_nodes; vector<NodePtr> getnext_nosink_nodes;
vector<NodePtr> getnext_sink_nodes;
if (DistinguishGetNextAndData(compute_graph_, data_nodes, getnext_nosink_nodes, getnext_sink_nodes) != SUCCESS) {
GELOGE(PARAM_INVALID, "Failed to distinguish getnext and data node.");
return PARAM_INVALID;
}
data_nodes = compute_graph_->TryGetExtAttr(kExtAttrDataNodes, data_nodes);
getnext_nosink_nodes = compute_graph_->TryGetExtAttr(kExtAttrGetNextNoSink, getnext_nosink_nodes);
if (GetLocalOmgContext().dynamic_node_type == DATA) { if (GetLocalOmgContext().dynamic_node_type == DATA) {
if (getnext_nosink_nodes.empty()) { if (getnext_nosink_nodes.empty()) {
// just data or data+getnext_sink // just data or data+getnext_sink


+ 0
- 2
ge/graph/manager/graph_manager.h View File

@@ -222,8 +222,6 @@ class GraphManager {
const ComputeGraphPtr &compute_graph, uint64_t session_id, const ComputeGraphPtr &compute_graph, uint64_t session_id,
const GEThreadLocalContext &ge_context); const GEThreadLocalContext &ge_context);
Status ParseInputsDims(const std::vector<InputTensorInfo> &input_tensor); Status ParseInputsDims(const std::vector<InputTensorInfo> &input_tensor);
Status DistinguishGetNextAndData(ComputeGraphPtr &graph, vector<NodePtr> &data_nodes,
vector<NodePtr> &getnext_nosink_nodes, vector<NodePtr> &getnext_sink_nodes);
void ParseInputsDimsForData(const std::vector<InputTensorInfo> &input_tensor); void ParseInputsDimsForData(const std::vector<InputTensorInfo> &input_tensor);
Status ParseInputsDimsForGetNexNosinkAndData(const vector<NodePtr> &dynamic_nodes, Status ParseInputsDimsForGetNexNosinkAndData(const vector<NodePtr> &dynamic_nodes,
const std::vector<InputTensorInfo> &input_tensor); const std::vector<InputTensorInfo> &input_tensor);


+ 2
- 2
ge/graph/manager/util/hcom_util.cc View File

@@ -263,7 +263,7 @@ Status HcomOmeUtil::GetHcclRootId(const ge::ConstOpDescPtr &op_desc, int64_t &ro
Status HcomOmeUtil::GetAllRootId(const ge::ConstOpDescPtr &op_desc, Status HcomOmeUtil::GetAllRootId(const ge::ConstOpDescPtr &op_desc,
std::vector<GETaskKernelHcclInfo> &kernel_hccl_infos) { std::vector<GETaskKernelHcclInfo> &kernel_hccl_infos) {
GE_CHECK_NOTNULL(op_desc); GE_CHECK_NOTNULL(op_desc);
if (op_desc->GetType() == HCOMBROADCAST || op_desc->GetType() == HVDCALLBACKBROADCAST) {
if (op_desc->GetType() == HCOMBROADCAST || op_desc->GetType() == HVDCALLBACKBROADCAST || op_desc->GetType() == HCOMREDUCE) {
GELOGI("GetAllRootId Node[%s] opType[%s] get hccl rootId.", op_desc->GetName().c_str(), op_desc->GetType().c_str()); GELOGI("GetAllRootId Node[%s] opType[%s] get hccl rootId.", op_desc->GetName().c_str(), op_desc->GetType().c_str());
int64_t root_id = 0; int64_t root_id = 0;
Status dmrt = GetHcclRootId(op_desc, root_id); Status dmrt = GetHcclRootId(op_desc, root_id);
@@ -281,7 +281,7 @@ Status HcomOmeUtil::GetAllRootId(const ge::ConstOpDescPtr &op_desc,


bool HcomOmeUtil::IsHCOMOp(const string &op_type) { bool HcomOmeUtil::IsHCOMOp(const string &op_type) {
return (op_type == HCOMALLREDUCE) || (op_type == HCOMALLGATHER) || (op_type == HCOMBROADCAST) || return (op_type == HCOMALLREDUCE) || (op_type == HCOMALLGATHER) || (op_type == HCOMBROADCAST) ||
(op_type == HCOMSEND) || (op_type == HCOMRECEIVE) || (op_type == HCOMREDUCESCATTER);
(op_type == HCOMSEND) || (op_type == HCOMRECEIVE) || (op_type == HCOMREDUCESCATTER) || (op_type == HCOMREDUCE);
} }


bool HcomOmeUtil::IsHorovodOp(const string &op_type) { bool HcomOmeUtil::IsHorovodOp(const string &op_type) {


+ 1
- 1
ge/graph/optimize/mem_rw_conflict_optimize.cc View File

@@ -234,7 +234,7 @@ InputRWType GetSingleNodeInputRWTypeByIndex(const Node &node, uint32_t index) {
return InputRWType::kInvalidRWType; return InputRWType::kInvalidRWType;
} }
if (op_desc->GetType() == HCOMALLREDUCE || op_desc->GetType() == HCOMALLGATHER if (op_desc->GetType() == HCOMALLREDUCE || op_desc->GetType() == HCOMALLGATHER
|| op_desc->GetType() == HCOMREDUCESCATTER) {
|| op_desc->GetType() == HCOMREDUCESCATTER || op_desc->GetType() == HCOMREDUCE) {
return InputRWType::kScopeWriteable; return InputRWType::kScopeWriteable;
} }
// check if it is ref input // check if it is ref input


+ 10
- 3
ge/graph/passes/mark_agnostic_pass.cc View File

@@ -48,13 +48,12 @@ Status MarkAgnosticPass::Run(ComputeGraphPtr graph) {
} }
if (node_type == MERGE) { if (node_type == MERGE) {
GELOGD("Mark format agnostic and continuous for merge node %s", node->GetName().c_str()); GELOGD("Mark format agnostic and continuous for merge node %s", node->GetName().c_str());
auto in_nodes = node->GetInAllNodes();
vector<NodePtr> input_nodes(in_nodes.begin(), in_nodes.end());
const auto &input_nodes = node->GetInAllNodes();
/// Enter-----------+ /// Enter-----------+
/// +-> Merge /// +-> Merge
/// NextIteration---+ /// NextIteration---+
if (input_nodes.size() == 2) { if (input_nodes.size() == 2) {
if (input_nodes[0]->GetType() == ENTER && input_nodes[1]->GetType() == NEXTITERATION) {
if (input_nodes.at(0)->GetType() == ENTER && input_nodes.at(1)->GetType() == NEXTITERATION) {
continue; continue;
} }
} }
@@ -65,6 +64,14 @@ Status MarkAgnosticPass::Run(ComputeGraphPtr graph) {
continue; continue;
} }
AttrUtils::SetInt(op_tensor, "_format_continuous", 1); AttrUtils::SetInt(op_tensor, "_format_continuous", 1);

// Merge----------->NetOutput only set format_cofntinuous attr
const auto &output_nodes = node->GetOutAllNodes();
if (output_nodes.size() > 0) {
if (output_nodes.at(0)->GetType() == NETOUTPUT) {
continue;
}
}
AttrUtils::SetInt(node->GetOpDesc(), "_format_agnostic", 1); AttrUtils::SetInt(node->GetOpDesc(), "_format_agnostic", 1);
AttrUtils::SetListInt(node->GetOpDesc(), "_format_agnostic_except_output", std::vector<int64_t>({1})); AttrUtils::SetListInt(node->GetOpDesc(), "_format_agnostic_except_output", std::vector<int64_t>({1}));
continue; continue;


+ 1
- 1
ge/graph/passes/switch_data_edges_bypass.cc View File

@@ -181,7 +181,7 @@ Status BypassSwitchOut(const NodePtr &switch_node, int out_index) {


auto head_node = node_and_anchor.first; auto head_node = node_and_anchor.first;
auto head_node_type = NodeUtils::GetNodeType(*head_node); auto head_node_type = NodeUtils::GetNodeType(*head_node);
if (head_node_type == MERGE || head_node_type == REFMERGE) {
if (head_node_type == MEMCPYASYNC) {
// if the switch connect to the merge directly, insert memcpy before merge // if the switch connect to the merge directly, insert memcpy before merge
auto memcpy_node = AddMemcpyBeforeNode(head_node, head_anchor->GetIdx()); auto memcpy_node = AddMemcpyBeforeNode(head_node, head_anchor->GetIdx());
GE_CHECK_NOTNULL(memcpy_node); GE_CHECK_NOTNULL(memcpy_node);


+ 5
- 0
ge/graph/preprocess/multi_batch_options.cc View File

@@ -46,6 +46,8 @@ const int kDivisionConst = 2;
const char *const kSubstrOfGetNextNosinkName = "IteratorGetNext"; const char *const kSubstrOfGetNextNosinkName = "IteratorGetNext";
const char *const kShapeDataName = "ascend_mbatch_shape_data"; const char *const kShapeDataName = "ascend_mbatch_shape_data";
const char *const kGetNextName = "IteratorV2"; const char *const kGetNextName = "IteratorV2";
const char *const kExtAttrDataNodes = "data_nodes";
const char *const kExtAttrGetNextNoSink = "getnext_no_sink";


inline bool IsGetNextType(const NodePtr &node) { inline bool IsGetNextType(const NodePtr &node) {
std::string original_type; std::string original_type;
@@ -97,6 +99,9 @@ Status DistinguishGetNextAndData(ComputeGraphPtr &graph, vector<NodePtr> &data_n
} }
GELOGI("Data count is %zu, getnext nosink count is %zu, getnext sink count is %zu.", data_nodes.size(), GELOGI("Data count is %zu, getnext nosink count is %zu, getnext sink count is %zu.", data_nodes.size(),
getnext_nosink_nodes.size(), getnext_sink_nodes.size()); getnext_nosink_nodes.size(), getnext_sink_nodes.size());
GE_IF_BOOL_EXEC(!graph->SetExtAttr(kExtAttrDataNodes, data_nodes), GELOGW("Set data nodes attr failed.");)
GE_IF_BOOL_EXEC(!graph->SetExtAttr(kExtAttrGetNextNoSink, getnext_nosink_nodes),
GELOGW("Set getnext nosink nodes attr failed.");)
return SUCCESS; return SUCCESS;
} }




+ 6
- 0
ge/hybrid/common/npu_memory_allocator.cc View File

@@ -23,6 +23,8 @@


namespace ge { namespace ge {
namespace hybrid { namespace hybrid {
size_t kMaxHbmMemorySize = 1024UL * 1024UL * 1024UL * 1024UL; // 1024G

std::map<uint32_t, std::unique_ptr<NpuMemoryAllocator>> NpuMemoryAllocator::allocators_; std::map<uint32_t, std::unique_ptr<NpuMemoryAllocator>> NpuMemoryAllocator::allocators_;
std::mutex NpuMemoryAllocator::mu_; std::mutex NpuMemoryAllocator::mu_;


@@ -62,6 +64,10 @@ void *NpuMemoryAllocator::Allocate(std::size_t size, AllocationAttr *attr) {
} else if (mem_type == HOST_DDR) { } else if (mem_type == HOST_DDR) {
buffer = malloc(allocate_size); buffer = malloc(allocate_size);
} else { } else {
if (allocate_size > kMaxHbmMemorySize) {
GELOGE(PARAM_INVALID, "Invalid HBM memory size: %zu", allocate_size);
return nullptr;
}
void *try_reuse_addr = nullptr; void *try_reuse_addr = nullptr;
int padding = kDefaultPadding; int padding = kDefaultPadding;
if (attr != nullptr) { if (attr != nullptr) {


+ 1
- 0
ge/hybrid/common/tensor_value.cc View File

@@ -58,6 +58,7 @@ std::unique_ptr<TensorBuffer> TensorBuffer::Create(void *buffer, size_t size) {
TensorBuffer::~TensorBuffer() { TensorBuffer::~TensorBuffer() {
if (allocator_ != nullptr && buffer_ != nullptr) { if (allocator_ != nullptr && buffer_ != nullptr) {
allocator_->Deallocate(buffer_, mem_type_); allocator_->Deallocate(buffer_, mem_type_);
buffer_ = nullptr;
} }
} }




+ 4
- 4
ge/hybrid/executor/hybrid_model_async_executor.cc View File

@@ -52,7 +52,7 @@ Status HybridModelAsyncExecutor::EnqueueData(const shared_ptr<InputDataWrapper>
} }


Status HybridModelAsyncExecutor::Start(const std::shared_ptr<ModelListener> &listener) { Status HybridModelAsyncExecutor::Start(const std::shared_ptr<ModelListener> &listener) {
GELOGD("HybridModelExecutor::Start IN, listener = %p", listener.get());
GELOGD("HybridModelExecutor::Start IN, has listener = %d", listener != nullptr);
std::lock_guard<std::mutex> lk(mu_); std::lock_guard<std::mutex> lk(mu_);
GE_CHK_BOOL_RET_STATUS(!run_flag_, INTERNAL_ERROR, "Model already started."); GE_CHK_BOOL_RET_STATUS(!run_flag_, INTERNAL_ERROR, "Model already started.");


@@ -219,11 +219,11 @@ Status HybridModelAsyncExecutor::CopyInputData(const InputData &current_data) {
auto mem_size = static_cast<uint32_t>(data_size); auto mem_size = static_cast<uint32_t>(data_size);
GE_CHK_BOOL_RET_STATUS(mem_size >= data_buf.length, GE_CHK_BOOL_RET_STATUS(mem_size >= data_buf.length,
PARAM_INVALID, PARAM_INVALID,
"input data size(%u) does not match model required size(%u), ret failed.",
"input data size(%lu) does not match model required size(%u), ret failed.",
data_buf.length, data_buf.length,
mem_size); mem_size);


GELOGI("[IMAS]CopyPlainData memcpy graph_%u type[F] output[%u] memaddr[%p] mem_size[%u] datasize[%u]",
GELOGI("[IMAS]CopyPlainData memcpy graph_%u type[F] output[%u] memaddr[%p] mem_size[%u] datasize[%lu]",
model_->root_runtime_param_.graph_id, input_index, input_tensor.GetData(), mem_size, data_buf.length); model_->root_runtime_param_.graph_id, input_index, input_tensor.GetData(), mem_size, data_buf.length);
GE_CHK_RT_RET(rtMemcpy(input_tensor.MutableData(), GE_CHK_RT_RET(rtMemcpy(input_tensor.MutableData(),
mem_size, mem_size,
@@ -241,7 +241,7 @@ Status HybridModelAsyncExecutor::InitInputTensors() {
int input_index = 0; int input_index = 0;
for (const auto &input_node : model_->GetRootGraphItem()->GetInputNodes()) { for (const auto &input_node : model_->GetRootGraphItem()->GetInputNodes()) {
GELOGD("Init input[%u], node = %s", input_index, input_node->NodeName().c_str()); GELOGD("Init input[%u], node = %s", input_index, input_node->NodeName().c_str());
auto output_desc = input_node->op_desc->GetOutputDescPtr(kDataOutputIndex);
auto output_desc = input_node->MutableOutputDesc(kDataOutputIndex);
GE_CHECK_NOTNULL(output_desc); GE_CHECK_NOTNULL(output_desc);
int64_t tensor_size = 0; int64_t tensor_size = 0;
GE_CHK_GRAPH_STATUS_RET(TensorUtils::GetSize(*output_desc, tensor_size), GE_CHK_GRAPH_STATUS_RET(TensorUtils::GetSize(*output_desc, tensor_size),


+ 26
- 20
ge/hybrid/executor/node_state.cc View File

@@ -35,39 +35,43 @@ ShapeInferenceState::ShapeInferenceState(const NodeItem &node_item) : node_item(
this->num_pending_shapes_); this->num_pending_shapes_);
} }


void ShapeInferenceState::UpdateInputShape(uint32_t idx,
const GeShape &ori_shape,
const GeShape &shape) {
if (!node_item.is_dynamic || node_item.is_input_shape_static[idx]) {
GELOGD("[%s] Trying to update static shape, idx = %u. old shape = [%s], new shape = [%s]",
Status ShapeInferenceState::UpdateInputShape(int idx,
const GeShape &ori_shape,
const GeShape &shape) {
if (node_item.IsInputShapeStatic(idx)) {
GELOGD("[%s] Trying to update static shape, idx = %d. old shape = [%s], new shape = [%s]",
node_item.NodeName().c_str(), node_item.NodeName().c_str(),
idx, idx,
node_item.op_desc->MutableInputDesc(idx)->GetShape().ToString().c_str(),
node_item.MutableInputDesc(idx)->GetShape().ToString().c_str(),
shape.ToString().c_str()); shape.ToString().c_str());
return;
return SUCCESS;
} }


GELOGD("[%s] Update input shape [%u] with Shape: [%s] and OriginalShape: [%s]",
GELOGD("[%s] Update input shape [%d] with Shape: [%s] and OriginalShape: [%s]",
node_item.NodeName().c_str(), node_item.NodeName().c_str(),
idx, idx,
shape.ToString().c_str(), shape.ToString().c_str(),
ori_shape.ToString().c_str()); ori_shape.ToString().c_str());


std::lock_guard<std::mutex> lk(mu_); std::lock_guard<std::mutex> lk(mu_);
node_item.op_desc->MutableInputDesc(idx)->SetShape(shape);
node_item.op_desc->MutableInputDesc(idx)->SetOriginShape(ori_shape);
auto tensor_desc = node_item.MutableInputDesc(idx);
GE_CHECK_NOTNULL(tensor_desc);
tensor_desc->SetShape(shape);
tensor_desc->SetOriginShape(ori_shape);
if (--num_pending_shapes_ == 0) { if (--num_pending_shapes_ == 0) {
ready_cv_.notify_all(); ready_cv_.notify_all();
} }

return SUCCESS;
} }


void ShapeInferenceState::UpdateInputShapeFuture(uint32_t idx, ShapeFuture &&future) {
if (!node_item.is_dynamic || node_item.is_input_shape_static[idx]) {
GELOGD("[%s] Trying to update constant shape, idx = %u", node_item.NodeName().c_str(), idx);
void ShapeInferenceState::UpdateInputShapeFuture(int idx, ShapeFuture &&future) {
if (node_item.IsInputShapeStatic(idx)) {
GELOGD("[%s] Trying to update constant shape, idx = %d", node_item.NodeName().c_str(), idx);
return; return;
} }


GELOGD("[%s] Update input shape [%u] with ShapeFuture.", node_item.NodeName().c_str(), idx);
GELOGD("[%s] Update input shape [%d] with ShapeFuture.", node_item.NodeName().c_str(), idx);
std::lock_guard<std::mutex> lk(mu_); std::lock_guard<std::mutex> lk(mu_);
shape_futures.emplace_back(idx, std::move(future)); shape_futures.emplace_back(idx, std::move(future));
if (--num_pending_shapes_ == 0) { if (--num_pending_shapes_ == 0) {
@@ -120,8 +124,10 @@ Status ShapeInferenceState::AwaitShapesReady(const GraphExecutionContext &contex
idx, idx,
shape.ToString().c_str(), shape.ToString().c_str(),
ori_shape.ToString().c_str()); ori_shape.ToString().c_str());
node_item.op_desc->MutableInputDesc(idx)->SetShape(std::move(shape));
node_item.op_desc->MutableInputDesc(idx)->SetOriginShape(ori_shape);
auto input_desc = node_item.MutableInputDesc(idx);
GE_CHECK_NOTNULL(input_desc);
input_desc->SetShape(std::move(shape));
input_desc->SetOriginShape(ori_shape);
} }


return SUCCESS; return SUCCESS;
@@ -140,7 +146,7 @@ NodeState::NodeState(const NodeItem &node_item, SubgraphContext *subgraph_contex


Status NodeState::AwaitInputTensors(GraphExecutionContext &context) const { Status NodeState::AwaitInputTensors(GraphExecutionContext &context) const {
for (auto &src_node : node_item_->dependents_for_execution) { for (auto &src_node : node_item_->dependents_for_execution) {
GELOGI("[%s] Start to wait for data dependent node: [%s]",
GELOGD("[%s] Start to wait for data dependent node: [%s]",
node_item_->NodeName().c_str(), node_item_->NodeName().c_str(),
src_node->GetName().c_str()); src_node->GetName().c_str());
RECORD_EXECUTION_EVENT(&context, RECORD_EXECUTION_EVENT(&context,
@@ -156,7 +162,7 @@ Status NodeState::AwaitInputTensors(GraphExecutionContext &context) const {
node_item_->NodeName().c_str(), node_item_->NodeName().c_str(),
"[AwaitNodeDone] [%s] End", "[AwaitNodeDone] [%s] End",
src_node->GetName().c_str()); src_node->GetName().c_str());
GELOGI("[%s] Done waiting node.", src_node->GetName().c_str());
GELOGD("[%s] Done waiting node.", src_node->GetName().c_str());
} }


return SUCCESS; return SUCCESS;
@@ -173,7 +179,7 @@ Status NodeState::WaitForPrepareDone() {
} }


Status ShapeFuture::Get(GeShape &ori_shape, GeShape &shape) { Status ShapeFuture::Get(GeShape &ori_shape, GeShape &shape) {
GELOGI("Start to wait node: %s for getting shape", src_node_->GetName().c_str());
GELOGD("Start to wait node: %s for getting shape", src_node_->GetName().c_str());
if (!subgraph_context_->Await(src_node_)) { if (!subgraph_context_->Await(src_node_)) {
GELOGE(INTERNAL_ERROR, "cancelled"); GELOGE(INTERNAL_ERROR, "cancelled");
return INTERNAL_ERROR; return INTERNAL_ERROR;
@@ -181,7 +187,7 @@ Status ShapeFuture::Get(GeShape &ori_shape, GeShape &shape) {


shape = src_node_->GetOpDesc()->MutableOutputDesc(src_index_)->MutableShape(); shape = src_node_->GetOpDesc()->MutableOutputDesc(src_index_)->MutableShape();
ori_shape = src_node_->GetOpDesc()->MutableOutputDesc(src_index_)->GetOriginShape(); ori_shape = src_node_->GetOpDesc()->MutableOutputDesc(src_index_)->GetOriginShape();
GELOGI("Get shape from %s:%u. shape = [%s]", src_node_->GetName().c_str(), src_index_, shape.ToString().c_str());
GELOGD("Get shape from %s:%u. shape = [%s]", src_node_->GetName().c_str(), src_index_, shape.ToString().c_str());
return SUCCESS; return SUCCESS;
} }
} // namespace hybrid } // namespace hybrid


+ 3
- 3
ge/hybrid/executor/node_state.h View File

@@ -45,16 +45,16 @@ class ShapeFuture {
struct ShapeInferenceState { struct ShapeInferenceState {
explicit ShapeInferenceState(const NodeItem &node_item); explicit ShapeInferenceState(const NodeItem &node_item);


void UpdateInputShape(uint32_t idx, const GeShape &ori_shape, const GeShape &shape);
Status UpdateInputShape(int idx, const GeShape &ori_shape, const GeShape &shape);


void UpdateInputShapeFuture(uint32_t idx, ShapeFuture &&future);
void UpdateInputShapeFuture(int idx, ShapeFuture &&future);


Status AwaitShapesReady(const GraphExecutionContext &context); Status AwaitShapesReady(const GraphExecutionContext &context);


const NodeItem &node_item; const NodeItem &node_item;


private: private:
std::vector<std::pair<uint32_t, ShapeFuture>> shape_futures;
std::vector<std::pair<int, ShapeFuture>> shape_futures;
int num_pending_shapes_ = 0; int num_pending_shapes_ = 0;
std::condition_variable ready_cv_; std::condition_variable ready_cv_;
std::mutex mu_; std::mutex mu_;


+ 6
- 6
ge/hybrid/executor/worker/execution_engine.cc View File

@@ -36,13 +36,13 @@ Status LogInputs(const NodeItem &node_item, const TaskContext &task_context) {
for (auto i = 0; i < task_context.NumInputs(); ++i) { for (auto i = 0; i < task_context.NumInputs(); ++i) {
const auto &input_tensor = task_context.GetInput(i); const auto &input_tensor = task_context.GetInput(i);
GE_CHECK_NOTNULL(input_tensor); GE_CHECK_NOTNULL(input_tensor);
const auto &tensor_desc = node_item.op_desc->MutableInputDesc(i);
const auto &tensor_desc = task_context.GetInputDesc(i);
GE_CHECK_NOTNULL(tensor_desc); GE_CHECK_NOTNULL(tensor_desc);
GELOGD("[%s] Print task args. input[%d] = %s, shape = [%s]", GELOGD("[%s] Print task args. input[%d] = %s, shape = [%s]",
node_item.NodeName().c_str(), node_item.NodeName().c_str(),
i, i,
input_tensor->DebugString().c_str(), input_tensor->DebugString().c_str(),
tensor_desc->MutableShape().ToString().c_str());
tensor_desc->GetShape().ToString().c_str());
} }


return SUCCESS; return SUCCESS;
@@ -52,7 +52,7 @@ Status LogOutputs(const NodeItem &node_item, const TaskContext &task_context) {
for (auto i = 0; i < task_context.NumOutputs(); ++i) { for (auto i = 0; i < task_context.NumOutputs(); ++i) {
const auto &output_tensor = task_context.GetOutput(i); const auto &output_tensor = task_context.GetOutput(i);
GE_CHECK_NOTNULL(output_tensor); GE_CHECK_NOTNULL(output_tensor);
const auto &tensor_desc = node_item.op_desc->MutableOutputDesc(i);
const auto &tensor_desc = node_item.MutableOutputDesc(i);
GE_CHECK_NOTNULL(tensor_desc); GE_CHECK_NOTNULL(tensor_desc);
GELOGD("[%s] Print task args. output[%d] = %s, shape = [%s]", GELOGD("[%s] Print task args. output[%d] = %s, shape = [%s]",
node_item.NodeName().c_str(), node_item.NodeName().c_str(),
@@ -97,7 +97,7 @@ Status NodeDoneCallback::PrepareConstInputs(const NodeItem &node_item) {
GE_CHECK_NOTNULL(output_tensor); GE_CHECK_NOTNULL(output_tensor);


Tensor tensor; Tensor tensor;
auto ge_tensor_desc = node_item.op_desc->MutableOutputDesc(output_idx);
auto ge_tensor_desc = node_item.MutableOutputDesc(output_idx);
GE_CHECK_NOTNULL(ge_tensor_desc); GE_CHECK_NOTNULL(ge_tensor_desc);
tensor.SetTensorDesc(TensorAdapter::GeTensorDesc2TensorDesc(*ge_tensor_desc)); tensor.SetTensorDesc(TensorAdapter::GeTensorDesc2TensorDesc(*ge_tensor_desc));


@@ -107,7 +107,7 @@ Status NodeDoneCallback::PrepareConstInputs(const NodeItem &node_item) {


if (output_tensor->GetSize() < static_cast<size_t>(tensor_size)) { if (output_tensor->GetSize() < static_cast<size_t>(tensor_size)) {
GELOGE(INTERNAL_ERROR, GELOGE(INTERNAL_ERROR,
"[%s] Tensor size is not enough. output index = %d, required size = %zu, tensor = %s",
"[%s] Tensor size is not enough. output index = %d, required size = %ld, tensor = %s",
node_item.NodeName().c_str(), node_item.NodeName().c_str(),
output_idx, output_idx,
tensor_size, tensor_size,
@@ -453,7 +453,7 @@ Status ExecutionEngine::ValidateInputTensors(const NodeState &node_state, const
continue; continue;
} }


const auto &tensor_desc = node_state.GetOpDesc()->MutableInputDesc(i);
const auto &tensor_desc = task_context.MutableInputDesc(i);
GE_CHECK_NOTNULL(tensor_desc); GE_CHECK_NOTNULL(tensor_desc);
if (tensor_desc->GetDataType() == DT_STRING) { if (tensor_desc->GetDataType() == DT_STRING) {
GELOGD("[%s] Skipping DT_STRING input, index = %d", task_context.GetNodeName(), i); GELOGD("[%s] Skipping DT_STRING input, index = %d", task_context.GetNodeName(), i);


+ 7
- 4
ge/hybrid/executor/worker/shape_inference_engine.cc View File

@@ -142,12 +142,15 @@ Status ShapeInferenceEngine::PropagateOutputShapes(const NodeItem &node_item) {
dst_input_index_and_node.first); dst_input_index_and_node.first);


// in case type 3 and 4, shape will be valid after computing is done // in case type 3 and 4, shape will be valid after computing is done
auto &infer_state = dst_node_state->GetShapeInferenceState();
if (shape_is_future) { if (shape_is_future) {
ShapeFuture future(node_item.node, i, subgraph_context_); ShapeFuture future(node_item.node, i, subgraph_context_);
dst_node_state->GetShapeInferenceState().UpdateInputShapeFuture(dst_input_index_and_node.first,
std::move(future));
infer_state.UpdateInputShapeFuture(dst_input_index_and_node.first,
std::move(future));
} else { } else {
dst_node_state->GetShapeInferenceState().UpdateInputShape(dst_input_index_and_node.first, ori_shape, shape);
GE_CHK_STATUS_RET_NOLOG(infer_state.UpdateInputShape(dst_input_index_and_node.first,
ori_shape,
shape));
} }
} }
} }
@@ -159,7 +162,7 @@ Status ShapeInferenceEngine::PropagateOutputShapes(const NodeItem &node_item) {
Status ShapeInferenceEngine::InferShapeForSubgraph(const NodeItem &node_item, const FusedSubgraph &fused_subgraph) { Status ShapeInferenceEngine::InferShapeForSubgraph(const NodeItem &node_item, const FusedSubgraph &fused_subgraph) {
GELOGD("[%s] Start to infer shape by fused subgraph", node_item.NodeName().c_str()); GELOGD("[%s] Start to infer shape by fused subgraph", node_item.NodeName().c_str());
for (auto &it : fused_subgraph.input_mapping) { for (auto &it : fused_subgraph.input_mapping) {
auto parent_tensor_desc = node_item.op_desc->MutableInputDesc(it.first);
auto parent_tensor_desc = node_item.MutableInputDesc(it.first);
GE_CHECK_NOTNULL(parent_tensor_desc); GE_CHECK_NOTNULL(parent_tensor_desc);
GELOGD("Start to update shape by input[%u]", it.first); GELOGD("Start to update shape by input[%u]", it.first);
GELOGD("Update shape to [%s]", parent_tensor_desc->GetShape().ToString().c_str()); GELOGD("Update shape to [%s]", parent_tensor_desc->GetShape().ToString().c_str());


+ 2
- 2
ge/hybrid/model/graph_item.cc View File

@@ -40,11 +40,11 @@ Status GraphItem::GetOutputDescList(vector<ConstGeTensorDescPtr> &output_desc_li
} }


if (is_dynamic_) { if (is_dynamic_) {
for (auto &tensor_desc : output_node_->op_desc->GetAllInputsDescPtr()) {
for (auto &tensor_desc : output_node_->GetOpDesc()->GetAllInputsDescPtr()) {
output_desc_list.emplace_back(tensor_desc); output_desc_list.emplace_back(tensor_desc);
} }
} else { } else {
for (auto &tensor_desc : output_node_->op_desc->GetAllOutputsDescPtr()) {
for (auto &tensor_desc : output_node_->GetOpDesc()->GetAllOutputsDescPtr()) {
output_desc_list.emplace_back(tensor_desc); output_desc_list.emplace_back(tensor_desc);
} }
} }


+ 2
- 2
ge/hybrid/model/hybrid_model.cc View File

@@ -44,7 +44,7 @@ Status HybridModel::Init() {
TensorValue* HybridModel::GetVariable(const string &name) const { TensorValue* HybridModel::GetVariable(const string &name) const {
auto it = variable_tensors_.find(name); auto it = variable_tensors_.find(name);
if (it == variable_tensors_.end()) { if (it == variable_tensors_.end()) {
GELOGI("Failed to get variable tensor. var name = [%s]", name.c_str());
GELOGD("Failed to get variable tensor. var name = [%s]", name.c_str());
return nullptr; return nullptr;
} }


@@ -61,7 +61,7 @@ NodePtr HybridModel::GetVariableNode(const string &name) const {
if (host_find != host_variable_nodes_.end()) { if (host_find != host_variable_nodes_.end()) {
return host_find->second; return host_find->second;
} }
GELOGI("Failed to get variable node by name = [%s]", name.c_str());
GELOGD("Failed to get variable node by name = [%s]", name.c_str());
return nullptr; return nullptr;
} }




+ 54
- 47
ge/hybrid/model/hybrid_model_builder.cc View File

@@ -19,14 +19,12 @@
#include "common/math/math_util.h" #include "common/math/math_util.h"
#include "graph/ge_context.h" #include "graph/ge_context.h"
#include "graph/build/memory/var_mem_assign_util.h" #include "graph/build/memory/var_mem_assign_util.h"
#include "graph/utils/node_utils.h"
#include "graph/debug/ge_attr_define.h" #include "graph/debug/ge_attr_define.h"
#include "graph/load/new_model_manager/model_utils.h" #include "graph/load/new_model_manager/model_utils.h"
#include "graph/manager/graph_var_manager.h" #include "graph/manager/graph_var_manager.h"
#include "graph/manager/host_mem_manager.h" #include "graph/manager/host_mem_manager.h"
#include "graph/manager/trans_var_data_utils.h" #include "graph/manager/trans_var_data_utils.h"
#include "graph/utils/graph_utils.h" #include "graph/utils/graph_utils.h"
#include "graph/utils/type_utils.h"
#include "hybrid/common/npu_memory_allocator.h" #include "hybrid/common/npu_memory_allocator.h"
#include "hybrid/node_executor/node_executor.h" #include "hybrid/node_executor/node_executor.h"


@@ -39,34 +37,19 @@ const uint32_t kAlignment = 32;
const int kBytes = 8; const int kBytes = 8;
const char *const kOwnerGraphIsUnknown = "OwnerGraphIsUnknown"; const char *const kOwnerGraphIsUnknown = "OwnerGraphIsUnknown";


bool IsGraphUnknown(ComputeGraph &graph) {
for (const auto &node : graph.GetDirectNode()) {
bool is_unknown_shape = false;
(void)AttrUtils::GetBool(node->GetOpDesc(), kOwnerGraphIsUnknown, is_unknown_shape);
return is_unknown_shape;
}
return false;
}

int64_t CalcVarSizeInBytes(const GeTensorDesc &desc) { int64_t CalcVarSizeInBytes(const GeTensorDesc &desc) {
int64_t var_size = 0; int64_t var_size = 0;
auto data_type = desc.GetDataType(); auto data_type = desc.GetDataType();
if (data_type == DT_STRING) { if (data_type == DT_STRING) {
(void) TensorUtils::GetSize(desc, var_size); (void) TensorUtils::GetSize(desc, var_size);
} else {
var_size = GetSizeByDataType(data_type);
if (var_size <= 0) {
GELOGW("Failed to calc var data size from data type %s", TypeUtils::DataTypeToSerialString(data_type).c_str());
return -1;
}
auto shape = desc.GetShape();
auto dim_num = shape.GetDimNum();
for (size_t dim_index = 0; dim_index < dim_num; ++dim_index) {
var_size *= shape.GetDim(dim_index);
}
// padding up to multiple of kAlignment, and add extra kAlignment
var_size = (var_size + kAlignment * 2 - 1) / kAlignment * kAlignment;
return var_size;
} }

if (TensorUtils::GetTensorMemorySizeInBytes(desc, var_size) != GRAPH_SUCCESS) {
GELOGW("Failed to calc var data size");
return -1;
}

return var_size; return var_size;
} }


@@ -111,6 +94,7 @@ Status HybridModelBuilder::Build() {
hybrid_model_.model_name_ = ge_root_model_->GetRootGraph()->GetName(); hybrid_model_.model_name_ = ge_root_model_->GetRootGraph()->GetName();
GELOGI("[%s] Start to build hybrid model.", GetGraphName()); GELOGI("[%s] Start to build hybrid model.", GetGraphName());
GE_CHK_STATUS_RET(InitRuntimeParams(), "[%s] Failed to InitRuntimeParams", GetGraphName()); GE_CHK_STATUS_RET(InitRuntimeParams(), "[%s] Failed to InitRuntimeParams", GetGraphName());
GE_CHK_STATUS_RET(RecoverGraphUnknownFlag(), "[%s] Failed to RecoverGraphUnknownFlag", GetGraphName());
GE_CHK_STATUS_RET(IndexSpecialNodes(), "[%s] Failed to index nodes", GetGraphName()); GE_CHK_STATUS_RET(IndexSpecialNodes(), "[%s] Failed to index nodes", GetGraphName());
GE_CHK_STATUS_RET(IndexTaskDefs(), "[%s] Failed to index task defs", GetGraphName()); GE_CHK_STATUS_RET(IndexTaskDefs(), "[%s] Failed to index task defs", GetGraphName());
GE_CHK_STATUS_RET(LoadGraph(), "[%s] Failed to load graph", GetGraphName()); GE_CHK_STATUS_RET(LoadGraph(), "[%s] Failed to load graph", GetGraphName());
@@ -158,7 +142,12 @@ Status HybridModelBuilder::BuildNodeItem(const NodePtr &node, NodeItem &node_ite
GE_CHK_STATUS_RET(GetOrCreateNodeItem(dst_node, &dst_node_item), GE_CHK_STATUS_RET(GetOrCreateNodeItem(dst_node, &dst_node_item),
"[%s] Failed to get or create node item.", "[%s] Failed to get or create node item.",
dst_node->GetName().c_str()); dst_node->GetName().c_str());
node_item.outputs[i].emplace_back(dst_in_anchor->GetIdx(), dst_node_item);
int canonical_index;
GE_CHK_STATUS_RET(dst_node_item->GetCanonicalInputIndex(dst_in_anchor->GetIdx(), canonical_index),
"[%s] Failed to canonical input index",
dst_node->GetName().c_str());

node_item.outputs[i].emplace_back(canonical_index, dst_node_item);
} }
} }


@@ -179,7 +168,8 @@ Status HybridModelBuilder::ResolveRefIo(NodeItem &node_item) {
for (auto &output : outputs) { for (auto &output : outputs) {
for (auto &input : inputs) { for (auto &input : inputs) {
if (input.first == output.first) { if (input.first == output.first) {
auto input_idx = static_cast<int>(input.second);
int input_idx;
GE_CHK_STATUS_RET_NOLOG(node_item.GetCanonicalInputIndex(input.second, input_idx));
auto output_idx = static_cast<int>(output.second); auto output_idx = static_cast<int>(output.second);
node_item.reuse_inputs[output_idx] = input_idx; node_item.reuse_inputs[output_idx] = input_idx;
GELOGD("[%s] Output[%d] reuse input[%d]", node_item.NodeName().c_str(), output_idx, input_idx); GELOGD("[%s] Output[%d] reuse input[%d]", node_item.NodeName().c_str(), output_idx, input_idx);
@@ -198,10 +188,8 @@ Status HybridModelBuilder::GetOrCreateNodeItem(const NodePtr &node, NodeItem **n
return SUCCESS; return SUCCESS;
} }


auto new_node = std::unique_ptr<NodeItem>(new(std::nothrow) NodeItem(node));
GE_CHECK_NOTNULL(new_node);
GE_CHECK_NOTNULL(new_node->op_desc);
GE_CHK_STATUS_RET(new_node->Init(), "Failed to init NodeItem [%s] .", node->GetName().c_str());
std::unique_ptr<NodeItem> new_node;
GE_CHK_STATUS_RET(NodeItem::Create(node, new_node), "Failed to create node item");
GE_CHK_STATUS_RET_NOLOG(NodeExecutorManager::GetInstance().GetExecutor(*node, &new_node->node_executor)); GE_CHK_STATUS_RET_NOLOG(NodeExecutorManager::GetInstance().GetExecutor(*node, &new_node->node_executor));


// we do not need L2 Buffer // we do not need L2 Buffer
@@ -210,10 +198,6 @@ Status HybridModelBuilder::GetOrCreateNodeItem(const NodePtr &node, NodeItem **n
(void) AttrUtils::SetBool(new_node->op_desc, kIsFirstNode, false); (void) AttrUtils::SetBool(new_node->op_desc, kIsFirstNode, false);
(void) AttrUtils::SetBool(new_node->op_desc, kIsLastNode, false); (void) AttrUtils::SetBool(new_node->op_desc, kIsLastNode, false);


if (new_node->is_dynamic && (new_node->IsControlOp() || new_node->NodeType() == PARTITIONEDCALL)) {
new_node->shape_inference_type = DEPEND_COMPUTE;
}

new_node->node_id = node_index; new_node->node_id = node_index;
new_node->op_desc->SetId(node_index); new_node->op_desc->SetId(node_index);
node_index += 1; node_index += 1;
@@ -454,7 +438,6 @@ Status HybridModelBuilder::MergeInputNodes(ComputeGraph &graph) {
if (src_out_anchor == nullptr || src_out_anchor->GetOwnerNode() == nullptr) { if (src_out_anchor == nullptr || src_out_anchor->GetOwnerNode() == nullptr) {
continue; continue;
} }
auto src_node = wrapped_node_in_anchor->GetPeerOutAnchor()->GetOwnerNode();
wrapped_node_in_anchor->UnlinkAll(); wrapped_node_in_anchor->UnlinkAll();


// link src to outputs of DataNode // link src to outputs of DataNode
@@ -462,6 +445,7 @@ Status HybridModelBuilder::MergeInputNodes(ComputeGraph &graph) {
GE_CHECK_NOTNULL(out_data_anchor); GE_CHECK_NOTNULL(out_data_anchor);
for (auto &peer_in_data_anchor : out_data_anchor->GetPeerInDataAnchors()) { for (auto &peer_in_data_anchor : out_data_anchor->GetPeerInDataAnchors()) {
auto dst_node = peer_in_data_anchor->GetOwnerNode(); auto dst_node = peer_in_data_anchor->GetOwnerNode();
GE_CHECK_NOTNULL(dst_node);
root_nodes.emplace(dst_node); root_nodes.emplace(dst_node);
GE_CHK_STATUS_RET_NOLOG(DoUnlinkDataAnchors(out_data_anchor, peer_in_data_anchor)); GE_CHK_STATUS_RET_NOLOG(DoUnlinkDataAnchors(out_data_anchor, peer_in_data_anchor));
GE_CHK_STATUS_RET_NOLOG(DoLinkDataAnchors(src_out_anchor, peer_in_data_anchor)); GE_CHK_STATUS_RET_NOLOG(DoLinkDataAnchors(src_out_anchor, peer_in_data_anchor));
@@ -504,6 +488,7 @@ Status HybridModelBuilder::MergeNetOutputNode(ComputeGraph &graph) {
for (const auto &in_data_anchor : net_output_node->GetAllInDataAnchors()) { for (const auto &in_data_anchor : net_output_node->GetAllInDataAnchors()) {
auto src_out_anchor = in_data_anchor->GetPeerOutAnchor(); auto src_out_anchor = in_data_anchor->GetPeerOutAnchor();
GE_CHECK_NOTNULL(src_out_anchor); GE_CHECK_NOTNULL(src_out_anchor);
GE_CHECK_NOTNULL(src_out_anchor->GetOwnerNode());
GE_CHK_STATUS_RET_NOLOG(DoUnlinkDataAnchors(src_out_anchor, in_data_anchor)); GE_CHK_STATUS_RET_NOLOG(DoUnlinkDataAnchors(src_out_anchor, in_data_anchor));


auto index = in_data_anchor->GetIdx(); auto index = in_data_anchor->GetIdx();
@@ -527,6 +512,7 @@ Status HybridModelBuilder::MergeNetOutputNode(ComputeGraph &graph) {
continue; continue;
} }


GE_CHECK_NOTNULL(dst_in_anchor->GetOwnerNode());
GE_CHK_STATUS_RET_NOLOG(DoUnlinkDataAnchors(parent_out_anchor, dst_in_anchor)); GE_CHK_STATUS_RET_NOLOG(DoUnlinkDataAnchors(parent_out_anchor, dst_in_anchor));
GE_CHK_STATUS_RET_NOLOG(DoLinkDataAnchors(src_out_anchor, dst_in_anchor)); GE_CHK_STATUS_RET_NOLOG(DoLinkDataAnchors(src_out_anchor, dst_in_anchor));
} }
@@ -566,7 +552,7 @@ Status HybridModelBuilder::UnfoldSubgraphs(ComputeGraph &root_graph, ComputeGrap


auto subgraph = NodeUtils::GetSubgraph(*node, kSubgraphIndex); auto subgraph = NodeUtils::GetSubgraph(*node, kSubgraphIndex);
GE_CHECK_NOTNULL(subgraph); GE_CHECK_NOTNULL(subgraph);
bool is_unknown_shape = IsGraphUnknown(*subgraph);
bool is_unknown_shape = subgraph->GetGraphUnknownFlag();
if (!is_unknown_shape) { if (!is_unknown_shape) {
merged_graph->AddNode(node); merged_graph->AddNode(node);
GELOGD("[%s] Known shape partitioned call added to merged graph.", op_desc->GetName().c_str()); GELOGD("[%s] Known shape partitioned call added to merged graph.", op_desc->GetName().c_str());
@@ -613,7 +599,7 @@ Status HybridModelBuilder::UnfoldSubgraph(ComputeGraph &root_graph,
if (sub_op_type == PARTITIONEDCALL) { if (sub_op_type == PARTITIONEDCALL) {
auto sub_sub_graph = NodeUtils::GetSubgraph(*sub_node, kSubgraphIndex); auto sub_sub_graph = NodeUtils::GetSubgraph(*sub_node, kSubgraphIndex);
GE_CHECK_NOTNULL(sub_sub_graph); GE_CHECK_NOTNULL(sub_sub_graph);
if (IsGraphUnknown(*sub_sub_graph)) {
if (sub_sub_graph->GetGraphUnknownFlag()) {
GE_CHK_STATUS_RET(UnfoldSubgraph(root_graph, parent_graph, *sub_sub_graph), GE_CHK_STATUS_RET(UnfoldSubgraph(root_graph, parent_graph, *sub_sub_graph),
"[%s] Failed to merge subgraph", "[%s] Failed to merge subgraph",
sub_sub_graph->GetName().c_str()); sub_sub_graph->GetName().c_str());
@@ -636,8 +622,7 @@ Status HybridModelBuilder::UnfoldSubgraph(ComputeGraph &root_graph,
Status HybridModelBuilder::BuildOutputMapping(GraphItem &graph_item, Status HybridModelBuilder::BuildOutputMapping(GraphItem &graph_item,
const NodeItem &node_item, const NodeItem &node_item,
bool is_root_graph) { bool is_root_graph) {
auto output_size = node_item.op_desc->GetAllInputsSize();
GE_CHECK_LE(output_size, UINT32_MAX);
auto output_size = node_item.num_inputs;
graph_item.output_edges_.resize(output_size); graph_item.output_edges_.resize(output_size);


for (auto &in_data_anchor : node_item.node->GetAllInDataAnchors()) { for (auto &in_data_anchor : node_item.node->GetAllInDataAnchors()) {
@@ -648,14 +633,16 @@ Status HybridModelBuilder::BuildOutputMapping(GraphItem &graph_item,


auto src_node_item = GetNodeItem(src_node); auto src_node_item = GetNodeItem(src_node);
GE_CHECK_NOTNULL(src_node_item); GE_CHECK_NOTNULL(src_node_item);
auto output_idx = in_data_anchor->GetIdx();
auto output_offset = src_node_item->output_start + peer_out_anchor->GetIdx(); auto output_offset = src_node_item->output_start + peer_out_anchor->GetIdx();
GELOGI("Output[%d], node = %s, output_index = %d, output_offset = %d ", GELOGI("Output[%d], node = %s, output_index = %d, output_offset = %d ",
in_data_anchor->GetIdx(),
output_idx,
src_node_item->NodeName().c_str(), src_node_item->NodeName().c_str(),
peer_out_anchor->GetIdx(), peer_out_anchor->GetIdx(),
output_offset); output_offset);


graph_item.output_edges_[in_data_anchor->GetIdx()] = {src_node_item, peer_out_anchor->GetIdx()};
GE_CHECK_LE(output_idx, output_size - 1);
graph_item.output_edges_[output_idx] = {src_node_item, peer_out_anchor->GetIdx()};
} }


if (!is_root_graph) { if (!is_root_graph) {
@@ -703,7 +690,7 @@ Status HybridModelBuilder::LoadGraph() {
continue; continue;
} }


if (IsGraphUnknown(*sub_graph)) {
if (sub_graph->GetGraphUnknownFlag()) {
GE_CHK_STATUS_RET(LoadDynamicSubgraph(*sub_graph, false), GE_CHK_STATUS_RET(LoadDynamicSubgraph(*sub_graph, false),
"Failed to load subgraph: [%s]", "Failed to load subgraph: [%s]",
sub_graph->GetName().c_str()); sub_graph->GetName().c_str());
@@ -828,6 +815,10 @@ Status HybridModelBuilder::InitConstantOps() {
const NodePtr &var_node = it.second; const NodePtr &var_node = it.second;
auto op_desc = var_node->GetOpDesc(); auto op_desc = var_node->GetOpDesc();
auto v_weights = ModelUtils::GetWeights(op_desc); auto v_weights = ModelUtils::GetWeights(op_desc);
if (v_weights.empty()) {
GELOGE(INTERNAL_ERROR, "[%s] Constant no not have value", var_node->GetName().c_str());
return INTERNAL_ERROR;
}
auto *ge_tensor = const_cast<GeTensor *>(v_weights[0].get()); auto *ge_tensor = const_cast<GeTensor *>(v_weights[0].get());


std::unique_ptr<TensorValue> var_tensor; std::unique_ptr<TensorValue> var_tensor;
@@ -892,6 +883,7 @@ Status HybridModelBuilder::InitVariableTensors() {
GELOGD("Host variable [%s] malloc success.", it.first.c_str()); GELOGD("Host variable [%s] malloc success.", it.first.c_str());


std::unique_ptr<TensorValue> tensor(new (std::nothrow) TensorValue(mem_info.host_address, tensor_size)); std::unique_ptr<TensorValue> tensor(new (std::nothrow) TensorValue(mem_info.host_address, tensor_size));
GE_CHECK_NOTNULL(tensor);
hybrid_model_.variable_tensors_.emplace(it.first, std::move(tensor)); hybrid_model_.variable_tensors_.emplace(it.first, std::move(tensor));
} }


@@ -939,7 +931,7 @@ Status HybridModelBuilder::LoadGeModel(ComputeGraph &sub_graph, const GeModelPtr
GELOGD("Set ge_model for subgraph: [%s], task_size = %d", GELOGD("Set ge_model for subgraph: [%s], task_size = %d",
sub_graph.GetName().c_str(), sub_graph.GetName().c_str(),
ge_model->GetModelTaskDefPtr()->task_size()); ge_model->GetModelTaskDefPtr()->task_size());
hybrid_model_.known_shape_sub_models_.emplace(sub_graph.GetParentNode(), ge_model);
hybrid_model_.known_shape_sub_models_.emplace(parent_node, ge_model);
} }


return SUCCESS; return SUCCESS;
@@ -957,7 +949,7 @@ Status HybridModelBuilder::IndexTaskDefs() {
continue; continue;
} }


bool is_unknown_shape = IsGraphUnknown(*sub_graph);
bool is_unknown_shape = sub_graph->GetGraphUnknownFlag();
if (!is_unknown_shape) { if (!is_unknown_shape) {
GE_CHK_STATUS_RET_NOLOG(LoadGeModel(*sub_graph, ge_model)); GE_CHK_STATUS_RET_NOLOG(LoadGeModel(*sub_graph, ge_model));
continue; continue;
@@ -1106,7 +1098,7 @@ Status HybridModelBuilder::GetPeerNodeAcrossSubGraphs(const NodePtr &data_node,
GE_CHECK_NOTNULL(net_output_desc); GE_CHECK_NOTNULL(net_output_desc);


auto out_index = static_cast<uint32_t>(src_wrapped_node_out_anchor->GetIdx()); auto out_index = static_cast<uint32_t>(src_wrapped_node_out_anchor->GetIdx());
GELOGD("src graph = %s, src parent output index = %d", src_graph->GetName().c_str(), out_index);
GELOGD("src graph = %s, src parent output index = %u", src_graph->GetName().c_str(), out_index);


// link src to outputs of DataNode // link src to outputs of DataNode
auto input_size = net_output_desc->GetAllInputsSize(); auto input_size = net_output_desc->GetAllInputsSize();
@@ -1208,7 +1200,7 @@ Status HybridModelBuilder::IdentifySameInputs(NodeItem &node_item) {
in_data_anchor->GetIdx(), in_data_anchor->GetIdx(),
it->second, it->second,
src_node->GetName().c_str(), src_node->GetName().c_str(),
out_data_anchor->GetIdx());
out_data_anchor->GetIdx());
node_item.reuse_outputs.emplace(in_data_anchor->GetIdx(), it->second); node_item.reuse_outputs.emplace(in_data_anchor->GetIdx(), it->second);
} }
} }
@@ -1245,7 +1237,8 @@ Status HybridModelBuilder::IdentifyVariableOutputs(NodeItem &node_item) {
uint32_t parent_index = 0; uint32_t parent_index = 0;
GE_CHK_STATUS_RET_NOLOG(GetParentNodeOutputIndex(*net_output_desc, in_data_anchor->GetIdx(), parent_index)); GE_CHK_STATUS_RET_NOLOG(GetParentNodeOutputIndex(*net_output_desc, in_data_anchor->GetIdx(), parent_index));
GELOGD("Got parent output index = %u", parent_index); GELOGD("Got parent output index = %u", parent_index);
node_item.ref_outputs.emplace(parent_index, src_node);
GE_CHECK_LE(parent_index, INT32_MAX);
node_item.ref_outputs.emplace(static_cast<int>(parent_index), src_node);
} }


// Data nodes marked with REF_VAR_SRC_VAR_NAME // Data nodes marked with REF_VAR_SRC_VAR_NAME
@@ -1421,6 +1414,20 @@ Status HybridModelBuilder::LoadKnownShapedSubgraph(ComputeGraph &graph, NodeItem
return SUCCESS; return SUCCESS;
} }


Status HybridModelBuilder::RecoverGraphUnknownFlag() {
const auto &root_graph = ge_root_model_->GetRootGraph();
for (auto &sub_graph : root_graph->GetAllSubgraphs()) {
GE_CHECK_NOTNULL(sub_graph);
for (const auto &node : sub_graph->GetDirectNode()) {
bool is_unknown_shape = false;
(void)AttrUtils::GetBool(node->GetOpDesc(), kOwnerGraphIsUnknown, is_unknown_shape);
sub_graph->SetGraphUnknownFlag(is_unknown_shape);
break;
}
}
return SUCCESS;
}

Status HybridModelBuilder::LoadDynamicSubgraph(ComputeGraph &graph, bool is_root_graph) { Status HybridModelBuilder::LoadDynamicSubgraph(ComputeGraph &graph, bool is_root_graph) {
GELOGD("Start to load subgraph [%s]", graph.GetName().c_str()); GELOGD("Start to load subgraph [%s]", graph.GetName().c_str());
// for known partitioned call, load all nodes // for known partitioned call, load all nodes


+ 1
- 0
ge/hybrid/model/hybrid_model_builder.h View File

@@ -77,6 +77,7 @@ class HybridModelBuilder {
Status LoadDynamicSubgraph(ComputeGraph &graph, bool is_root_graph); Status LoadDynamicSubgraph(ComputeGraph &graph, bool is_root_graph);
Status ParseVarOutputs(NodeItem &node_item); Status ParseVarOutputs(NodeItem &node_item);
Status LoadKnownShapedSubgraph(ComputeGraph &graph, NodeItem *parent_node_item); Status LoadKnownShapedSubgraph(ComputeGraph &graph, NodeItem *parent_node_item);
Status RecoverGraphUnknownFlag();


const char* GetGraphName() const { const char* GetGraphName() const {
return hybrid_model_.model_name_.c_str(); return hybrid_model_.model_name_.c_str();


+ 95
- 19
ge/hybrid/model/node_item.cc View File

@@ -26,9 +26,9 @@
namespace ge { namespace ge {
namespace hybrid { namespace hybrid {
namespace { namespace {
const char * const kAttrNameOriginalFusionGraph = "_original_fusion_graph";
const char * const kNodeTypeRetVal = "_RetVal";
std::set<std::string> kControlOpTypes {
const char *const kAttrNameOriginalFusionGraph = "_original_fusion_graph";
const char *const kNodeTypeRetVal = "_RetVal";
std::set<std::string> kControlOpTypes{
IF, STATELESSIF, CASE, WHILE, STATELESSWHILE IF, STATELESSIF, CASE, WHILE, STATELESSWHILE
}; };


@@ -54,7 +54,7 @@ Status ParseInputMapping(Node &node, OpDesc &op_desc, FusedSubgraph &fused_subgr
return SUCCESS; return SUCCESS;
} }


Status ParseOutputMapping(OpDescPtr op_desc, FusedSubgraph &fused_subgraph) {
Status ParseOutputMapping(const OpDescPtr &op_desc, FusedSubgraph &fused_subgraph) {
uint32_t parent_index = 0; uint32_t parent_index = 0;
if (!AttrUtils::GetInt(op_desc, ATTR_NAME_PARENT_NODE_INDEX, parent_index)) { if (!AttrUtils::GetInt(op_desc, ATTR_NAME_PARENT_NODE_INDEX, parent_index)) {
GELOGE(FAILED, GELOGE(FAILED,
@@ -74,7 +74,7 @@ Status ParseFusedSubgraph(NodeItem &node_item) {
} }


GELOGI("[%s] Start to parse fused subgraph.", node_item.node_name.c_str()); GELOGI("[%s] Start to parse fused subgraph.", node_item.node_name.c_str());
auto fused_subgraph = std::unique_ptr<FusedSubgraph>(new (std::nothrow)FusedSubgraph());
auto fused_subgraph = std::unique_ptr<FusedSubgraph>(new(std::nothrow)FusedSubgraph());
GE_CHECK_NOTNULL(fused_subgraph); GE_CHECK_NOTNULL(fused_subgraph);


ComputeGraphPtr fused_graph; ComputeGraphPtr fused_graph;
@@ -110,19 +110,39 @@ bool IsControlOp(const std::string &op_type) {
return kControlOpTypes.count(op_type) > 0; return kControlOpTypes.count(op_type) > 0;
} }


NodeItem::NodeItem(NodePtr node): node(std::move(node)) {
NodeItem::NodeItem(NodePtr node) : node(std::move(node)) {
this->op_desc = this->node->GetOpDesc().get(); this->op_desc = this->node->GetOpDesc().get();
this->node_id = this->op_desc->GetId();
this->num_inputs = this->op_desc->GetInputsSize();
this->num_outputs = this->op_desc->GetOutputsSize();
this->node_name = this->node->GetName(); this->node_name = this->node->GetName();
this->node_type = this->node->GetType(); this->node_type = this->node->GetType();
} }


Status NodeItem::Create(const NodePtr &node, std::unique_ptr<NodeItem> &node_item) {
GE_CHECK_NOTNULL(node);
GE_CHECK_NOTNULL(node->GetOpDesc());
std::unique_ptr<NodeItem> instance(new(std::nothrow)NodeItem(node));
GE_CHECK_NOTNULL(instance);
GE_CHK_STATUS_RET(instance->Init(), "Failed to init NodeItem [%s] .", node->GetName().c_str());
node_item = std::move(instance);
return SUCCESS;
}

Status NodeItem::Init() { Status NodeItem::Init() {
int32_t unknown_shape_type_val = 0;
(void) AttrUtils::GetInt(op_desc, ::ge::ATTR_NAME_UNKNOWN_SHAPE_TYPE, unknown_shape_type_val);
shape_inference_type = static_cast<UnknowShapeOpType>(unknown_shape_type_val);
GE_CHECK_LE(op_desc->GetInputsSize(), INT32_MAX);
GE_CHECK_LE(op_desc->GetOutputsSize(), INT32_MAX);
num_inputs = static_cast<int>(op_desc->GetInputsSize());
num_outputs = static_cast<int>(op_desc->GetOutputsSize());

if (op_desc->GetAllInputsSize() != op_desc->GetInputsSize()) {
has_optional_inputs = true;
for (size_t i = 0; i < op_desc->GetAllInputsSize(); ++i) {
const auto &input_desc = op_desc->MutableInputDesc(i);
if (input_desc == nullptr) {
GELOGD("[%s] Input[%zu] is optional and invalid", NodeName().c_str(), i);
} else {
input_desc_indices_.emplace_back(static_cast<uint32_t>(i));
}
}
}


(void) AttrUtils::GetBool(op_desc, ATTR_NAME_FORCE_UNKNOWN_SHAPE, is_dynamic); (void) AttrUtils::GetBool(op_desc, ATTR_NAME_FORCE_UNKNOWN_SHAPE, is_dynamic);
GELOGD("node name = %s, is_dynamic = %d.", this->node_name.c_str(), is_dynamic); GELOGD("node name = %s, is_dynamic = %d.", this->node_name.c_str(), is_dynamic);
@@ -132,16 +152,15 @@ Status NodeItem::Init() {
node->GetName().c_str()); node->GetName().c_str());
} }


GE_CHK_STATUS_RET(ParseFusedSubgraph(*this), "[%s] Failed to parse fused subgraph", node_name.c_str());
if (is_dynamic) { if (is_dynamic) {
for (int i = 0; i < num_inputs; ++i) { for (int i = 0; i < num_inputs; ++i) {
const auto &input_desc = op_desc->MutableInputDesc(i);
const auto &input_desc = MutableInputDesc(i);
GE_CHECK_NOTNULL(input_desc); GE_CHECK_NOTNULL(input_desc);
if (input_desc->MutableShape().IsUnknownShape()) { if (input_desc->MutableShape().IsUnknownShape()) {
is_input_shape_static.push_back(false);
is_input_shape_static_.push_back(false);
} else { } else {
num_static_input_shapes++; num_static_input_shapes++;
is_input_shape_static.push_back(true);
is_input_shape_static_.push_back(true);
GELOGD("[%s] The shape of input[%d] is static. shape = [%s]", GELOGD("[%s] The shape of input[%d] is static. shape = [%s]",
NodeName().c_str(), i, input_desc->MutableShape().ToString().c_str()); NodeName().c_str(), i, input_desc->MutableShape().ToString().c_str());
} }
@@ -155,6 +174,16 @@ Status NodeItem::Init() {
break; break;
} }
} }

if (IsControlOp() || node_type == PARTITIONEDCALL) {
shape_inference_type = DEPEND_COMPUTE;
} else {
int32_t unknown_shape_type_val = 0;
(void) AttrUtils::GetInt(op_desc, ::ge::ATTR_NAME_UNKNOWN_SHAPE_TYPE, unknown_shape_type_val);
shape_inference_type = static_cast<UnknowShapeOpType>(unknown_shape_type_val);
}

GE_CHK_STATUS_RET(ParseFusedSubgraph(*this), "[%s] Failed to parse fused subgraph", node_name.c_str());
} }


return SUCCESS; return SUCCESS;
@@ -186,7 +215,7 @@ std::string NodeItem::DebugString() const {
for (auto &items : outputs) { for (auto &items : outputs) {
ss << ", output[" << index++ << "]: "; ss << ", output[" << index++ << "]: ";
for (auto &item : items) { for (auto &item : items) {
ss << "(" << item.second->NodeName() << ":" <<item.first << "), ";
ss << "(" << item.second->NodeName() << ":" << item.first << "), ";
} }
} }


@@ -196,13 +225,60 @@ std::string NodeItem::DebugString() const {
void NodeItem::SetToDynamic() { void NodeItem::SetToDynamic() {
num_static_input_shapes = 0; num_static_input_shapes = 0;
is_dynamic = true; is_dynamic = true;
for (size_t i = 0; i < is_input_shape_static.size(); ++i) {
is_input_shape_static[i] = false;
for (size_t i = 0; i < is_input_shape_static_.size(); ++i) {
is_input_shape_static_[i] = false;
} }
if (kernel_task != nullptr && !kernel_task->IsSupportDynamicShape()) { if (kernel_task != nullptr && !kernel_task->IsSupportDynamicShape()) {
GELOGD("[%s] Dynamic shape is not supported, clear node task.", node_name.c_str()); GELOGD("[%s] Dynamic shape is not supported, clear node task.", node_name.c_str());
kernel_task = nullptr; kernel_task = nullptr;
} }
} }

GeTensorDescPtr NodeItem::MutableInputDesc(int index) const {
if (!has_optional_inputs) {
return op_desc->MutableInputDesc(static_cast<uint32_t>(index));
}

if (index < 0 || index >= num_inputs) {
GELOGE(PARAM_INVALID,
"[%s] Invalid input index, num inputs = %d, index = %d",
node_name.c_str(),
num_inputs,
index);
return nullptr;
}

return op_desc->MutableInputDesc(input_desc_indices_[index]);
}

Status NodeItem::GetCanonicalInputIndex(uint32_t index, int &canonical_index) const {
if (!has_optional_inputs) {
canonical_index = index;
return SUCCESS;
}

auto iter = std::find(input_desc_indices_.begin(), input_desc_indices_.end(), index);
if (iter == input_desc_indices_.end()) {
GELOGE(INTERNAL_ERROR, "[%s] Invalid input index: %u", node_name.c_str(), index);
return INTERNAL_ERROR;
}

canonical_index = static_cast<int>(iter - input_desc_indices_.begin());
GELOGD("[%s] Canonicalize input index from [%u] to [%d]", node_name.c_str(), index, canonical_index);
return SUCCESS;
}

bool NodeItem::IsInputShapeStatic(int index) const {
if (!is_dynamic) {
return true;
}

if (static_cast<size_t>(index) >= is_input_shape_static_.size()) {
GELOGE(PARAM_INVALID, "Input index(%d) out of range: [0, %zu)", index, is_input_shape_static_.size());
return false;
}

return is_input_shape_static_[index];
}
} // namespace hybrid } // namespace hybrid
} // namespace ge } // namespace ge

+ 28
- 12
ge/hybrid/model/node_item.h View File

@@ -40,10 +40,8 @@ bool IsControlOp(const std::string &op_type);


// for caching static information across execution // for caching static information across execution
struct NodeItem { struct NodeItem {
explicit NodeItem(NodePtr node);
~NodeItem() = default; ~NodeItem() = default;

Status Init();
static Status Create(const NodePtr &node, std::unique_ptr<NodeItem> &node_item);


const std::string &NodeName() const { const std::string &NodeName() const {
return node_name; return node_name;
@@ -53,6 +51,20 @@ struct NodeItem {
return node_type; return node_type;
} }


OpDescPtr GetOpDesc() const {
return node->GetOpDesc();
}

bool IsInputShapeStatic(int index) const;

GeTensorDescPtr MutableOutputDesc(int index) const {
return op_desc->MutableOutputDesc(static_cast<uint32_t>(index));
}

GeTensorDescPtr MutableInputDesc(int index) const;

Status GetCanonicalInputIndex(uint32_t index, int &canonical_index) const;

bool IsControlOp() const; bool IsControlOp() const;


void SetToDynamic(); void SetToDynamic();
@@ -61,14 +73,15 @@ struct NodeItem {


NodePtr node; NodePtr node;
OpDesc *op_desc; OpDesc *op_desc;
int node_id;
int num_inputs;
int num_outputs;

int node_id = -1;
int num_inputs = 0;
int num_outputs = 0;
int input_start = -1; int input_start = -1;
int output_start = -1; int output_start = -1;
bool is_dynamic = false; bool is_dynamic = false;
bool has_observer = false; bool has_observer = false;
bool has_optional_inputs = false;
bool is_output_shape_static = true;
UnknowShapeOpType shape_inference_type = DEPEND_IN_SHAPE; UnknowShapeOpType shape_inference_type = DEPEND_IN_SHAPE;
std::string node_name; std::string node_name;
std::string node_type; std::string node_type;
@@ -76,9 +89,8 @@ struct NodeItem {
std::vector<ge::NodePtr> dependents_for_execution; std::vector<ge::NodePtr> dependents_for_execution;
std::set<int> to_const_output_id_list; std::set<int> to_const_output_id_list;


vector<NodeItem *> inputs;
// src_output_id, dst_anchor_id, dst_node // src_output_id, dst_anchor_id, dst_node
vector<vector<pair<uint32_t, NodeItem *>>> outputs;
vector<vector<pair<int, NodeItem *>>> outputs;


std::shared_ptr<NodeTask> kernel_task; std::shared_ptr<NodeTask> kernel_task;
std::unique_ptr<FusedSubgraph> fused_subgraph; std::unique_ptr<FusedSubgraph> fused_subgraph;
@@ -86,10 +98,14 @@ struct NodeItem {
std::map<int, ge::NodePtr> ref_outputs; std::map<int, ge::NodePtr> ref_outputs;
std::map<int, int> reuse_inputs; std::map<int, int> reuse_inputs;
std::map<int, int> reuse_outputs; std::map<int, int> reuse_outputs;

std::vector<bool> is_input_shape_static;
bool is_output_shape_static = true;
int num_static_input_shapes = 0; int num_static_input_shapes = 0;

private:
explicit NodeItem(NodePtr node);
Status Init();

std::vector<bool> is_input_shape_static_;
std::vector<uint32_t> input_desc_indices_;
}; };
} // namespace hybrid } // namespace hybrid
} // namespace ge } // namespace ge


+ 4
- 8
ge/hybrid/node_executor/aicore/aicore_node_executor.cc View File

@@ -157,9 +157,7 @@ Status AiCoreNodeTask::ExecuteAsync(TaskContext &context, std::function<void()>
return ret; return ret;
} }


auto op_desc = context.GetNodeItem().op_desc;
GE_CHECK_NOTNULL(op_desc);
GELOGI("[%s] ExecuteAsync Start.", op_desc->GetName().c_str());
GELOGI("[%s] ExecuteAsync Start.", context.GetNodeName());
for (auto it = tasks_.begin(); it != tasks_.end(); ++it) { for (auto it = tasks_.begin(); it != tasks_.end(); ++it) {
// AtomicAddrClean has 2 tasks // AtomicAddrClean has 2 tasks
if (tasks_.size() == 2 && it == tasks_.begin() && !(*(tasks_.rbegin()))->GetClearAtomic()) { if (tasks_.size() == 2 && it == tasks_.begin() && !(*(tasks_.rbegin()))->GetClearAtomic()) {
@@ -177,15 +175,13 @@ Status AiCoreNodeTask::ExecuteAsync(TaskContext &context, std::function<void()>
RECORD_EXECUTION_EVENT(context.GetExecutionContext(), context.GetNodeName(), "[AiCoreNodeRegisterCallback] End"); RECORD_EXECUTION_EVENT(context.GetExecutionContext(), context.GetNodeName(), "[AiCoreNodeRegisterCallback] End");
} }


GELOGD("[%s] ExecuteAsync End.", op_desc->GetName().c_str());
GELOGD("[%s] ExecuteAsync End.", context.GetNodeName());
RECORD_EXECUTION_EVENT(context.GetExecutionContext(), context.GetNodeName(), "[AiCoreNodeTaskExecuteAsync] End"); RECORD_EXECUTION_EVENT(context.GetExecutionContext(), context.GetNodeName(), "[AiCoreNodeTaskExecuteAsync] End");
return SUCCESS; return SUCCESS;
} }


Status AiCoreNodeTask::UpdateArgs(TaskContext &context) { Status AiCoreNodeTask::UpdateArgs(TaskContext &context) {
auto op_desc = context.GetNodeItem().op_desc;
GE_CHECK_NOTNULL(op_desc);
GELOGI("[%s] AiCoreNodeTask UpdateArgs Start.", op_desc->GetName().c_str());
GELOGI("[%s] AiCoreNodeTask UpdateArgs Start.", context.GetNodeName());
for (auto it = tasks_.rbegin(); it != tasks_.rend(); ++it) { for (auto it = tasks_.rbegin(); it != tasks_.rend(); ++it) {
GE_CHK_STATUS_RET_NOLOG((*it)->UpdateArgs(context)); GE_CHK_STATUS_RET_NOLOG((*it)->UpdateArgs(context));
// AtomicAddrClean has 2 tasks // AtomicAddrClean has 2 tasks
@@ -193,7 +189,7 @@ Status AiCoreNodeTask::UpdateArgs(TaskContext &context) {
break; break;
} }
} }
GELOGI("[%s] AiCoreNodeTask UpdateArgs End.", op_desc->GetName().c_str());
GELOGI("[%s] AiCoreNodeTask UpdateArgs End.", context.GetNodeName());
return SUCCESS; return SUCCESS;
} }




+ 6
- 3
ge/hybrid/node_executor/aicpu/aicpu_ext_info.cc View File

@@ -37,7 +37,10 @@ Status AicpuExtInfoHandler::Parse(const std::string &ext_info) {
ext_info_.reset(new(std::nothrow)uint8_t[ext_info_len_]); ext_info_.reset(new(std::nothrow)uint8_t[ext_info_len_]);
GE_CHECK_NOTNULL(ext_info_); GE_CHECK_NOTNULL(ext_info_);


(void) memcpy_s(ext_info_.get(), ext_info_len_, ext_info.c_str(), ext_info.size());
if (memcpy_s(ext_info_.get(), ext_info_len_, ext_info.c_str(), ext_info.size()) != EOK) {
GELOGE(FAILED, "[%s] Failed to coy ext info", node_name_.c_str());
return FAILED;
}


input_shape_and_type_.clear(); input_shape_and_type_.clear();
output_shape_and_type_.clear(); output_shape_and_type_.clear();
@@ -94,7 +97,7 @@ Status AicpuExtInfoHandler::ParseExtInputShape(AicpuExtInfo *aicpu_ext_info) {
auto need_len = input_num_ * sizeof(AicpuShapeAndType); auto need_len = input_num_ * sizeof(AicpuShapeAndType);
GE_CHK_BOOL_RET_STATUS(aicpu_ext_info->infoLen == need_len, PARAM_INVALID, GE_CHK_BOOL_RET_STATUS(aicpu_ext_info->infoLen == need_len, PARAM_INVALID,
"Node[%s] parse ext input shape failed as infoLen must be " "Node[%s] parse ext input shape failed as infoLen must be "
"input_num[%zu]*sizeof(ShapeAndType)[%zu] but %u.",
"input_num[%u]*sizeof(ShapeAndType)[%zu] but %u.",
node_name_.c_str(), input_num_, sizeof(AicpuShapeAndType), aicpu_ext_info->infoLen); node_name_.c_str(), input_num_, sizeof(AicpuShapeAndType), aicpu_ext_info->infoLen);


auto input = reinterpret_cast<AicpuShapeAndType *>(aicpu_ext_info->infoMsg); auto input = reinterpret_cast<AicpuShapeAndType *>(aicpu_ext_info->infoMsg);
@@ -115,7 +118,7 @@ Status AicpuExtInfoHandler::ParseExtOutputShape(AicpuExtInfo *aicpu_ext_info) {
auto need_len = output_num_ * sizeof(AicpuShapeAndType); auto need_len = output_num_ * sizeof(AicpuShapeAndType);
GE_CHK_BOOL_RET_STATUS(aicpu_ext_info->infoLen == need_len, PARAM_INVALID, GE_CHK_BOOL_RET_STATUS(aicpu_ext_info->infoLen == need_len, PARAM_INVALID,
"Node[%s] parse ext output shape failed as infoLen must be " "Node[%s] parse ext output shape failed as infoLen must be "
"output_num[%zu]*sizeof(ShapeAndType)[%zu] but %u.",
"output_num[%u]*sizeof(ShapeAndType)[%zu] but %u.",
node_name_.c_str(), output_num_, sizeof(AicpuShapeAndType), aicpu_ext_info->infoLen); node_name_.c_str(), output_num_, sizeof(AicpuShapeAndType), aicpu_ext_info->infoLen);


auto output = reinterpret_cast<AicpuShapeAndType *>(aicpu_ext_info->infoMsg); auto output = reinterpret_cast<AicpuShapeAndType *>(aicpu_ext_info->infoMsg);


+ 39
- 40
ge/hybrid/node_executor/aicpu/aicpu_node_executor.cc View File

@@ -48,7 +48,7 @@ Status AicpuNodeTaskBase::InitExtInfo(const std::string &kernel_ext_info, int64_
return PARAM_INVALID; return PARAM_INVALID;
} else { } else {
// if no ext info no need copy to device. // if no ext info no need copy to device.
GELOGI("Node[%s] kernel_ext_info is empty, no need copy to device, is_dynamic=%s.",
GELOGD("Node[%s] kernel_ext_info is empty, no need copy to device, is_dynamic=%s.",
node_name_.c_str(), node_item_->is_dynamic ? "true" : "false"); node_name_.c_str(), node_item_->is_dynamic ? "true" : "false");
return SUCCESS; return SUCCESS;
} }
@@ -76,7 +76,7 @@ Status AicpuNodeTaskBase::InitExtInfo(const std::string &kernel_ext_info, int64_


Status AicpuNodeTaskBase::UpdateOutputShapeFromExtInfo() { Status AicpuNodeTaskBase::UpdateOutputShapeFromExtInfo() {
if (node_item_->num_outputs == 0) { if (node_item_->num_outputs == 0) {
GELOGI("Task [%s] output_num is 0, no need update output shape.", node_name_.c_str());
GELOGD("Task [%s] output_num is 0, no need update output shape.", node_name_.c_str());
return SUCCESS; return SUCCESS;
} }
// copy to host buf // copy to host buf
@@ -91,7 +91,7 @@ Status AicpuNodeTaskBase::UpdateOutputShapeFromExtInfo() {
// not support update data type now, just for param // not support update data type now, just for param
DataType data_type; DataType data_type;
aicpu_ext_handle_.GetOutputShapeAndType(i, shape, data_type); aicpu_ext_handle_.GetOutputShapeAndType(i, shape, data_type);
auto output_desc = node_item_->op_desc->MutableOutputDesc(i);
auto output_desc = node_item_->MutableOutputDesc(i);
GE_CHECK_NOTNULL(output_desc); GE_CHECK_NOTNULL(output_desc);
GE_CHK_STATUS_RET(UpdateShapeToOutputDesc(shape, i, output_desc), GE_CHK_STATUS_RET(UpdateShapeToOutputDesc(shape, i, output_desc),
"Update node %s [%d]th output shape failed.", "Update node %s [%d]th output shape failed.",
@@ -104,7 +104,7 @@ Status AicpuNodeTaskBase::UpdateShapeToOutputDesc(const GeShape &shape_new,
int32_t output_index, GeTensorDescPtr &output_desc) { int32_t output_index, GeTensorDescPtr &output_desc) {
auto shape_old = output_desc->GetShape(); auto shape_old = output_desc->GetShape();
output_desc->SetShape(shape_new); output_desc->SetShape(shape_new);
GELOGI("Update node[%s] out[%d] shape from %s to %s.", node_name_.c_str(), output_index,
GELOGD("Update node[%s] out[%d] shape from %s to %s.", node_name_.c_str(), output_index,
shape_old.ToString().c_str(), shape_new.ToString().c_str()); shape_old.ToString().c_str(), shape_new.ToString().c_str());


auto origin_shape_old = output_desc->GetOriginShape(); auto origin_shape_old = output_desc->GetOriginShape();
@@ -123,7 +123,7 @@ Status AicpuNodeTaskBase::UpdateShapeToOutputDesc(const GeShape &shape_new,
node_name_.c_str(), output_index, origin_format, format, shape_new.ToString().c_str()); node_name_.c_str(), output_index, origin_format, format, shape_new.ToString().c_str());
auto origin_shape_new = GeShape(origin_dims_new); auto origin_shape_new = GeShape(origin_dims_new);
output_desc->SetOriginShape(origin_shape_new); output_desc->SetOriginShape(origin_shape_new);
GELOGI("Node[%s] out[%d] originFormat[%d] is not same as format[%d], need update from %s ro %s.",
GELOGD("Node[%s] out[%d] originFormat[%d] is not same as format[%d], need update from %s ro %s.",
node_name_.c_str(), output_index, origin_format, format, node_name_.c_str(), output_index, origin_format, format,
origin_shape_old.ToString().c_str(), origin_shape_new.ToString().c_str()); origin_shape_old.ToString().c_str(), origin_shape_new.ToString().c_str());
return SUCCESS; return SUCCESS;
@@ -132,12 +132,12 @@ Status AicpuNodeTaskBase::UpdateShapeToOutputDesc(const GeShape &shape_new,
Status AicpuNodeTaskBase::UpdateExtInfo() { Status AicpuNodeTaskBase::UpdateExtInfo() {
GELOGI("Node[%s] update ext info begin, unknown_type=%d.", node_name_.c_str(), unknown_type_); GELOGI("Node[%s] update ext info begin, unknown_type=%d.", node_name_.c_str(), unknown_type_);
if (node_item_->num_inputs == 0 && node_item_->num_outputs == 0) { if (node_item_->num_inputs == 0 && node_item_->num_outputs == 0) {
GELOGI("Node[%s] has no input and output, no need update ext info.", node_name_.c_str());
GELOGD("Node[%s] has no input and output, no need update ext info.", node_name_.c_str());
return SUCCESS; return SUCCESS;
} }


for (auto i = 0; i < node_item_->num_inputs; ++i) { for (auto i = 0; i < node_item_->num_inputs; ++i) {
auto input_desc = node_item_->op_desc->MutableInputDesc(i);
auto input_desc = node_item_->MutableInputDesc(i);
GE_CHECK_NOTNULL(input_desc); GE_CHECK_NOTNULL(input_desc);
GE_CHK_STATUS_RET(aicpu_ext_handle_.UpdateInputShapeAndType(i, *input_desc), GE_CHK_STATUS_RET(aicpu_ext_handle_.UpdateInputShapeAndType(i, *input_desc),
"Node[%s] input[%d] update input shape failed.", "Node[%s] input[%d] update input shape failed.",
@@ -146,7 +146,7 @@ Status AicpuNodeTaskBase::UpdateExtInfo() {


if (unknown_type_ != DEPEND_COMPUTE) { if (unknown_type_ != DEPEND_COMPUTE) {
for (auto j = 0; j < node_item_->num_outputs; ++j) { for (auto j = 0; j < node_item_->num_outputs; ++j) {
auto output_desc = node_item_->op_desc->MutableOutputDesc(j);
auto output_desc = node_item_->MutableOutputDesc(j);
GE_CHECK_NOTNULL(output_desc); GE_CHECK_NOTNULL(output_desc);


GE_CHK_STATUS_RET(aicpu_ext_handle_.UpdateOutputShapeAndType(j, *output_desc), GE_CHK_STATUS_RET(aicpu_ext_handle_.UpdateOutputShapeAndType(j, *output_desc),
@@ -162,15 +162,15 @@ Status AicpuNodeTaskBase::UpdateExtInfo() {
aicpu_ext_handle_.GetExtInfoLen(), aicpu_ext_handle_.GetExtInfoLen(),
RT_MEMCPY_HOST_TO_DEVICE)); RT_MEMCPY_HOST_TO_DEVICE));


GELOGI("Node[%s] update ext info end.", node_name_.c_str());
GELOGD("Node[%s] update ext info end.", node_name_.c_str());
return SUCCESS; return SUCCESS;
} }


Status AicpuNodeTaskBase::UpdateArgs(TaskContext &context) { Status AicpuNodeTaskBase::UpdateArgs(TaskContext &context) {
GELOGI("Node[%s] update args begin. is_dynamic=%s, unknown_type=%d",
GELOGD("Node[%s] update args begin. is_dynamic=%s, unknown_type=%d",
node_name_.c_str(), node_item_->is_dynamic ? "true" : "false", unknown_type_); node_name_.c_str(), node_item_->is_dynamic ? "true" : "false", unknown_type_);
if (node_item_->num_inputs == 0 && node_item_->num_outputs == 0) { if (node_item_->num_inputs == 0 && node_item_->num_outputs == 0) {
GELOGI("Node[%s] has no input and output, no need update args.", node_name_.c_str());
GELOGD("Node[%s] has no input and output, no need update args.", node_name_.c_str());
return SUCCESS; return SUCCESS;
} }


@@ -179,41 +179,41 @@ Status AicpuNodeTaskBase::UpdateArgs(TaskContext &context) {
// dynamic node need update ext info. // dynamic node need update ext info.
GE_CHK_STATUS_RET(UpdateExtInfo(), "Node[%s] update ext info failed.", node_name_.c_str()); GE_CHK_STATUS_RET(UpdateExtInfo(), "Node[%s] update ext info failed.", node_name_.c_str());
} }
GELOGI("Node[%s] update args end.", node_name_.c_str());
GELOGD("Node[%s] update args end.", node_name_.c_str());
return SUCCESS; return SUCCESS;
} }


Status AicpuNodeTaskBase::ExecuteAsync(TaskContext &context, std::function<void()> done_callback) { Status AicpuNodeTaskBase::ExecuteAsync(TaskContext &context, std::function<void()> done_callback) {
RECORD_EXECUTION_EVENT(context.GetExecutionContext(), context.GetNodeName(), "[AicpuNodeTaskBaseExecuteAsync] Start"); RECORD_EXECUTION_EVENT(context.GetExecutionContext(), context.GetNodeName(), "[AicpuNodeTaskBaseExecuteAsync] Start");
GELOGI("Node[%s] execute async start. unknown_type=%d.", node_name_.c_str(), unknown_type_);
GELOGD("Node[%s] execute async start. unknown_type=%d.", node_name_.c_str(), unknown_type_);


GE_CHK_STATUS_RET(LaunchTask(context)); GE_CHK_STATUS_RET(LaunchTask(context));


auto callback = [=, &context]() { auto callback = [=, &context]() {
GELOGI("Node[%s] callback start.", node_name_.c_str());
GELOGD("Node[%s] callback start.", node_name_.c_str());
RECORD_CALLBACK_EVENT(context.GetExecutionContext(), node_name_.c_str(), "[TaskCallback] Start"); RECORD_CALLBACK_EVENT(context.GetExecutionContext(), node_name_.c_str(), "[TaskCallback] Start");
Status callback_ret = TaskCallback(context); Status callback_ret = TaskCallback(context);
RECORD_CALLBACK_EVENT(context.GetExecutionContext(), node_name_.c_str(), "[TaskCallback] End"); RECORD_CALLBACK_EVENT(context.GetExecutionContext(), node_name_.c_str(), "[TaskCallback] End");


GELOGI("Node[%s] task callBack ret = %u.", node_name_.c_str(), callback_ret);
GELOGD("Node[%s] task callBack ret = %u.", node_name_.c_str(), callback_ret);
if (done_callback != nullptr) { if (done_callback != nullptr) {
context.SetStatus(callback_ret); context.SetStatus(callback_ret);
done_callback(); done_callback();
} }


GELOGI("Node[%s] callback end.", node_name_.c_str());
GELOGD("Node[%s] callback end.", node_name_.c_str());
}; };


GE_CHK_STATUS_RET_NOLOG(context.RegisterCallback(callback)); GE_CHK_STATUS_RET_NOLOG(context.RegisterCallback(callback));


GELOGI("Node[%s] execute async end.", node_name_.c_str());
GELOGD("Node[%s] execute async end.", node_name_.c_str());
RECORD_EXECUTION_EVENT(context.GetExecutionContext(), context.GetNodeName(), "[AicpuNodeTaskBaseExecuteAsync] End"); RECORD_EXECUTION_EVENT(context.GetExecutionContext(), context.GetNodeName(), "[AicpuNodeTaskBaseExecuteAsync] End");
return SUCCESS; return SUCCESS;
} }


Status AicpuTfNodeTask::InitForDependComputeTask() { Status AicpuTfNodeTask::InitForDependComputeTask() {
if ((unknown_type_ != DEPEND_COMPUTE) || (node_item_->num_outputs == 0)) { if ((unknown_type_ != DEPEND_COMPUTE) || (node_item_->num_outputs == 0)) {
GELOGI("Node[%s] type[%s] unknown_type is %d, output num is %d.",
GELOGD("Node[%s] type[%s] unknown_type is %d, output num is %d.",
node_name_.c_str(), node_item_->node_type.c_str(), unknown_type_, node_item_->num_outputs); node_name_.c_str(), node_item_->node_type.c_str(), unknown_type_, node_item_->num_outputs);
return SUCCESS; return SUCCESS;
} }
@@ -438,7 +438,7 @@ Status AicpuTfNodeTask::PrepareCopyInputs(const TaskContext &context,


for (auto i = 0; i < node_item_->num_outputs; ++i) { for (auto i = 0; i < node_item_->num_outputs; ++i) {
const auto &summary = output_summary_host_[i]; const auto &summary = output_summary_host_[i];
GELOGI("Node[%s] out[%d] summary, shape data=0x%lx, shape data size=%lu, raw data=0x%lx, raw data size=%lu.",
GELOGD("Node[%s] out[%d] summary, shape data=0x%lx, shape data size=%lu, raw data=0x%lx, raw data size=%lu.",
node_name_.c_str(), i, node_name_.c_str(), i,
summary.shape_data_ptr, summary.shape_data_size, summary.shape_data_ptr, summary.shape_data_size,
summary.raw_data_ptr, summary.raw_data_size); summary.raw_data_ptr, summary.raw_data_size);
@@ -499,7 +499,7 @@ Status AicpuTfNodeTask::UpdateShapeByHbmBuffer(TaskContext &context,
node_name_.c_str(), node_item_->num_outputs, out_shape_hbm.size()); node_name_.c_str(), node_item_->num_outputs, out_shape_hbm.size());
for (auto i = 0; i < node_item_->num_outputs; ++i) { for (auto i = 0; i < node_item_->num_outputs; ++i) {
const auto &result_summary = output_summary_host_[i]; const auto &result_summary = output_summary_host_[i];
auto output_desc = node_item_->op_desc->MutableOutputDesc(i);
auto output_desc = node_item_->MutableOutputDesc(i);
std::vector<int64_t> shape_dims; std::vector<int64_t> shape_dims;
if (result_summary.shape_data_size > 0) { if (result_summary.shape_data_size > 0) {
const auto &shape_hbm = out_shape_hbm[i]; const auto &shape_hbm = out_shape_hbm[i];
@@ -507,7 +507,7 @@ Status AicpuTfNodeTask::UpdateShapeByHbmBuffer(TaskContext &context,
"Node[%s] [%d]th output shape data size is %lu is not divided by int64_t.", "Node[%s] [%d]th output shape data size is %lu is not divided by int64_t.",
node_name_.c_str(), i, result_summary.shape_data_size); node_name_.c_str(), i, result_summary.shape_data_size);
uint32_t dim_num = result_summary.shape_data_size / sizeof(int64_t); uint32_t dim_num = result_summary.shape_data_size / sizeof(int64_t);
GELOGI("Node[%s] [%d]th output dim num=%u.", node_name_.c_str(), i, dim_num);
GELOGD("Node[%s] [%d]th output dim num=%u.", node_name_.c_str(), i, dim_num);
std::unique_ptr<int64_t[]> shape_addr(new(std::nothrow) int64_t[dim_num]()); std::unique_ptr<int64_t[]> shape_addr(new(std::nothrow) int64_t[dim_num]());
GE_CHECK_NOTNULL(shape_addr); GE_CHECK_NOTNULL(shape_addr);
GE_CHK_RT_RET(rtMemcpy(shape_addr.get(), result_summary.shape_data_size, GE_CHK_RT_RET(rtMemcpy(shape_addr.get(), result_summary.shape_data_size,
@@ -525,7 +525,7 @@ Status AicpuTfNodeTask::UpdateShapeByHbmBuffer(TaskContext &context,
} }


Status AicpuTfNodeTask::UpdateShapeAndDataByResultSummary(TaskContext &context) { Status AicpuTfNodeTask::UpdateShapeAndDataByResultSummary(TaskContext &context) {
GELOGI("Node[%s] update shape and data by result summary begin.", node_name_.c_str());
GELOGD("Node[%s] update shape and data by result summary begin.", node_name_.c_str());


std::vector<std::unique_ptr<TensorBuffer>> out_shape_hbm; std::vector<std::unique_ptr<TensorBuffer>> out_shape_hbm;
GE_CHK_STATUS_RET(ReadResultSummaryAndPrepareMemory(context, out_shape_hbm), GE_CHK_STATUS_RET(ReadResultSummaryAndPrepareMemory(context, out_shape_hbm),
@@ -545,7 +545,7 @@ Status AicpuTfNodeTask::UpdateShapeAndDataByResultSummary(TaskContext &context)
"Node[%s] update shape by hbm buffer failed.", "Node[%s] update shape by hbm buffer failed.",
node_name_.c_str()); node_name_.c_str());


GELOGI("Node[%s] update shape and data by result summary end.", node_name_.c_str());
GELOGD("Node[%s] update shape and data by result summary end.", node_name_.c_str());
return SUCCESS; return SUCCESS;
} }


@@ -574,7 +574,7 @@ Status AicpuTfNodeTask::UpdateIoAddr(TaskContext &context) {
} }
} else { } else {
// unknown type 4 use result summary update ioaddr. // unknown type 4 use result summary update ioaddr.
GELOGI("Node[%s] is depend compute node, use result summary as out addr.", node_name_.c_str());
GELOGD("Node[%s] is depend compute node, use result summary as out addr.", node_name_.c_str());
GE_CHK_BOOL_RET_STATUS(output_summary_.size() == static_cast<std::size_t>(node_item_->num_outputs), GE_CHK_BOOL_RET_STATUS(output_summary_.size() == static_cast<std::size_t>(node_item_->num_outputs),
INTERNAL_ERROR, INTERNAL_ERROR,
"Node[%s] has %d output but %zu output summary.", "Node[%s] has %d output but %zu output summary.",
@@ -599,17 +599,17 @@ Status AicpuTfNodeTask::UpdateIoAddr(TaskContext &context) {
} }


Status AicpuTfNodeTask::LaunchTask(TaskContext &context) { Status AicpuTfNodeTask::LaunchTask(TaskContext &context) {
GELOGI("Node[%s] launch task start, unknown_type=%d.", node_name_.c_str(), unknown_type_);
GELOGD("Node[%s] launch task start, unknown_type=%d.", node_name_.c_str(), unknown_type_);
uint32_t flag = RT_KERNEL_DEFAULT; uint32_t flag = RT_KERNEL_DEFAULT;
RECORD_EXECUTION_EVENT(context.GetExecutionContext(), node_name_.c_str(), "[AicpuTfNodertKernelLaunchEx] Start"); RECORD_EXECUTION_EVENT(context.GetExecutionContext(), node_name_.c_str(), "[AicpuTfNodertKernelLaunchEx] Start");
GE_CHK_RT_RET(rtKernelLaunchEx(kernel_buf_->GetData(), kernel_buf_->GetSize(), flag, context.GetStream())); GE_CHK_RT_RET(rtKernelLaunchEx(kernel_buf_->GetData(), kernel_buf_->GetSize(), flag, context.GetStream()));
RECORD_EXECUTION_EVENT(context.GetExecutionContext(), node_name_.c_str(), "[AicpuTfNodertKernelLaunchEx] End"); RECORD_EXECUTION_EVENT(context.GetExecutionContext(), node_name_.c_str(), "[AicpuTfNodertKernelLaunchEx] End");
GELOGI("Node[%s] launch end.", node_name_.c_str());
GELOGD("Node[%s] launch end.", node_name_.c_str());
return SUCCESS; return SUCCESS;
} }


Status AicpuTfNodeTask::TaskCallback(TaskContext &context) { Status AicpuTfNodeTask::TaskCallback(TaskContext &context) {
GELOGI("Node[%s] task callback start. is_dynamic=%s, unknown_type=%d.",
GELOGD("Node[%s] task callback start. is_dynamic=%s, unknown_type=%d.",
node_name_.c_str(), node_item_->is_dynamic ? "true" : "false", unknown_type_); node_name_.c_str(), node_item_->is_dynamic ? "true" : "false", unknown_type_);
Status callback_ret = SUCCESS; Status callback_ret = SUCCESS;
if (node_item_->is_dynamic) { if (node_item_->is_dynamic) {
@@ -621,13 +621,13 @@ Status AicpuTfNodeTask::TaskCallback(TaskContext &context) {
callback_ret = UpdateShapeAndDataByResultSummary(context); callback_ret = UpdateShapeAndDataByResultSummary(context);
} }
} }
GELOGI("Node[%s] task callback end.", node_name_.c_str());
GELOGD("Node[%s] task callback end.", node_name_.c_str());
return callback_ret; return callback_ret;
} }


Status AicpuNodeTask::Init(const HybridModel &model) { Status AicpuNodeTask::Init(const HybridModel &model) {
auto node_name = node_name_; auto node_name = node_name_;
GELOGI("Node[%s] init start.", node_name.c_str());
GELOGD("Node[%s] init start.", node_name.c_str());


GE_CHK_BOOL_RET_STATUS(unknown_type_ != DEPEND_COMPUTE, FAILED, GE_CHK_BOOL_RET_STATUS(unknown_type_ != DEPEND_COMPUTE, FAILED,
"Node[%s] unknown type[%d] is depend compute, it's not supported now.", "Node[%s] unknown type[%d] is depend compute, it's not supported now.",
@@ -640,13 +640,12 @@ Status AicpuNodeTask::Init(const HybridModel &model) {
args_size_ = kernel_def.args_size(); args_size_ = kernel_def.args_size();


const std::string &so_name = kernel_def.so_name(); const std::string &so_name = kernel_def.so_name();
const OpDescPtr op_desc = MakeShared<OpDesc>(*(node_item_->op_desc));
const OpDescPtr op_desc = node_item_->GetOpDesc();
const auto &context = kernel_def.context(); const auto &context = kernel_def.context();
auto kernel_type = static_cast<cce::ccKernelType>(context.kernel_type()); auto kernel_type = static_cast<cce::ccKernelType>(context.kernel_type());
if (kernel_type == cce::ccKernelType::CUST_AI_CPU) { if (kernel_type == cce::ccKernelType::CUST_AI_CPU) {
GE_CHK_STATUS_RET(ModelManager::GetInstance()->LoadCustAicpuSo(op_desc, so_name), "load cust aicpu so failed."); GE_CHK_STATUS_RET(ModelManager::GetInstance()->LoadCustAicpuSo(op_desc, so_name), "load cust aicpu so failed.");
GE_CHK_STATUS_RET(ModelManager::GetInstance()->LaunchCustAicpuSo(), "Launch cust aicpu so failed."); GE_CHK_STATUS_RET(ModelManager::GetInstance()->LaunchCustAicpuSo(), "Launch cust aicpu so failed.");

} }


GE_CHK_BOOL_RET_STATUS(args.size() == args_size_, FAILED, GE_CHK_BOOL_RET_STATUS(args.size() == args_size_, FAILED,
@@ -698,7 +697,7 @@ Status AicpuNodeTask::Init(const HybridModel &model) {
aicpu_param_head->extInfoAddr = reinterpret_cast<uintptr_t>(ext_info_addr_dev_->GetData()); aicpu_param_head->extInfoAddr = reinterpret_cast<uintptr_t>(ext_info_addr_dev_->GetData());
} }


GELOGI("Node[%s] init end.", node_name.c_str());
GELOGD("Node[%s] init end.", node_name.c_str());
return SUCCESS; return SUCCESS;
} }


@@ -733,14 +732,14 @@ Status AicpuNodeTask::UpdateIoAddr(TaskContext &context) {
} }


Status AicpuNodeTask::LaunchTask(TaskContext &context) { Status AicpuNodeTask::LaunchTask(TaskContext &context) {
GELOGI("Node[%s] launch task start. unknown_type=%d.", node_name_.c_str(), unknown_type_);
GELOGD("Node[%s] launch task start. unknown_type=%d.", node_name_.c_str(), unknown_type_);
const auto &so_name = task_def_.kernel().so_name(); const auto &so_name = task_def_.kernel().so_name();
const auto &kernel_name = task_def_.kernel().kernel_name(); const auto &kernel_name = task_def_.kernel().kernel_name();
const auto &kcontext = task_def_.kernel().context(); const auto &kcontext = task_def_.kernel().context();
auto kernel_type = static_cast<cce::ccKernelType>(kcontext.kernel_type()); auto kernel_type = static_cast<cce::ccKernelType>(kcontext.kernel_type());
uint32_t flag = RT_KERNEL_DEFAULT; uint32_t flag = RT_KERNEL_DEFAULT;
if (kernel_type == cce::ccKernelType::CUST_AI_CPU) { if (kernel_type == cce::ccKernelType::CUST_AI_CPU) {
flag |= RT_KERNEL_CUSTOM_AICPU;
flag |= static_cast<uint32_t>(RT_KERNEL_CUSTOM_AICPU);
} }
auto rt_ret = rtCpuKernelLaunchWithFlag(reinterpret_cast<const void *>(so_name.c_str()), auto rt_ret = rtCpuKernelLaunchWithFlag(reinterpret_cast<const void *>(so_name.c_str()),
reinterpret_cast<const void *>(kernel_name.c_str()), reinterpret_cast<const void *>(kernel_name.c_str()),
@@ -748,12 +747,12 @@ Status AicpuNodeTask::LaunchTask(TaskContext &context) {
args_.get(), args_size_, args_.get(), args_size_,
nullptr, context.GetStream(), flag); nullptr, context.GetStream(), flag);
GE_CHK_RT_RET(rt_ret); GE_CHK_RT_RET(rt_ret);
GELOGI("Node[%s] launch task end.", node_name_.c_str());
GELOGD("Node[%s] launch task end.", node_name_.c_str());
return SUCCESS; return SUCCESS;
} }


Status AicpuNodeTask::TaskCallback(TaskContext &context) { Status AicpuNodeTask::TaskCallback(TaskContext &context) {
GELOGI("Node[%s] task callback start, is_dynamic = %s, unknown_type=%d.",
GELOGD("Node[%s] task callback start, is_dynamic = %s, unknown_type=%d.",
node_name_.c_str(), node_item_->is_dynamic ? "true" : "false", unknown_type_); node_name_.c_str(), node_item_->is_dynamic ? "true" : "false", unknown_type_);
Status callback_ret = SUCCESS; Status callback_ret = SUCCESS;


@@ -762,10 +761,10 @@ Status AicpuNodeTask::TaskCallback(TaskContext &context) {
// check result // check result
callback_ret = UpdateOutputShapeFromExtInfo(); callback_ret = UpdateOutputShapeFromExtInfo();
} else { } else {
GELOGI("Node[%s] unknown shape type is %d no need update output shape.",
GELOGD("Node[%s] unknown shape type is %d no need update output shape.",
node_name_.c_str(), unknown_type_); node_name_.c_str(), unknown_type_);
} }
GELOGI("Node[%s] task callback end.", node_name_.c_str());
GELOGD("Node[%s] task callback end.", node_name_.c_str());
return callback_ret; return callback_ret;
} }


@@ -781,7 +780,7 @@ Status AiCpuNodeExecutor::LoadTask(const HybridModel &model,
const NodePtr &node, const NodePtr &node,
std::shared_ptr<NodeTask> &task) const { std::shared_ptr<NodeTask> &task) const {
GE_CHECK_NOTNULL(node); GE_CHECK_NOTNULL(node);
GELOGI("Node[%s] load task start.", node->GetName().c_str());
GELOGD("Node[%s] load task start.", node->GetName().c_str());
auto node_item = model.GetNodeItem(node); auto node_item = model.GetNodeItem(node);
GE_CHECK_NOTNULL(node_item); GE_CHECK_NOTNULL(node_item);
auto task_defs = model.GetTaskDefs(node); auto task_defs = model.GetTaskDefs(node);
@@ -815,7 +814,7 @@ Status AiCpuNodeExecutor::LoadTask(const HybridModel &model,
GE_CHK_STATUS_RET(aicpu_task->Init(model), "Node[%s] task init failed.", node->GetName().c_str()); GE_CHK_STATUS_RET(aicpu_task->Init(model), "Node[%s] task init failed.", node->GetName().c_str());


task = std::move(aicpu_task); task = std::move(aicpu_task);
GELOGI("Node[%s] load task end.", node->GetName().c_str());
GELOGD("Node[%s] load task end.", node->GetName().c_str());
return SUCCESS; return SUCCESS;
} }
} // namespace hybrid } // namespace hybrid


+ 12
- 16
ge/hybrid/node_executor/compiledsubgraph/known_node_executor.cc View File

@@ -31,14 +31,12 @@ REGISTER_NODE_EXECUTOR_BUILDER(NodeExecutorManager::ExecutorType::COMPILED_SUBGR


Status KnownNodeTask:: ExecuteAsync(TaskContext &context, std::function<void()> done_callback) { Status KnownNodeTask:: ExecuteAsync(TaskContext &context, std::function<void()> done_callback) {
RECORD_EXECUTION_EVENT(context.GetExecutionContext(), context.GetNodeName(), "[KnownNodeTaskExecuteAsync] Start"); RECORD_EXECUTION_EVENT(context.GetExecutionContext(), context.GetNodeName(), "[KnownNodeTaskExecuteAsync] Start");
GELOGI("[%s] KnownNodeTask::ExecuteAsync in.", context.GetNodeName());
if (davinci_model_->GetTaskList().size() == 0) {
GELOGW("KnownNodeExecutor::ExecuteAsync davinci moel has no taskinfo.");
GELOGD("[%s] KnownNodeTask::ExecuteAsync in.", context.GetNodeName());
if (davinci_model_->GetTaskList().empty()) {
GELOGW("KnownNodeExecutor::ExecuteAsync davinci model has no taskinfo.");


// todo if data is connected to netoutput, forward address ? copy data? // todo if data is connected to netoutput, forward address ? copy data?
if (context.NumInputs() == context.NumOutputs()){ if (context.NumInputs() == context.NumOutputs()){
GELOGW("[%s] KnownNodeExecutor::ExecuteAsync davinci moel has no taskinfo.",
context.GetNodeName());
for (int i = 0; i < context.NumInputs(); ++i) { for (int i = 0; i < context.NumInputs(); ++i) {
auto tensor = context.MutableInput(i); auto tensor = context.MutableInput(i);
GE_CHECK_NOTNULL(tensor); GE_CHECK_NOTNULL(tensor);
@@ -54,24 +52,22 @@ Status KnownNodeTask:: ExecuteAsync(TaskContext &context, std::function<void()
} }


rtError_t rt_ret; rtError_t rt_ret;
GELOGI("rtModelExecute start.");
RECORD_EXECUTION_EVENT(context.GetExecutionContext(), context.GetNodeName(), "[KnownNodertModelExecute] Start"); RECORD_EXECUTION_EVENT(context.GetExecutionContext(), context.GetNodeName(), "[KnownNodertModelExecute] Start");
rt_ret = rtModelExecute(davinci_model_->GetRtModelHandle(), context.GetStream(), 0); rt_ret = rtModelExecute(davinci_model_->GetRtModelHandle(), context.GetStream(), 0);
GE_IF_BOOL_EXEC(rt_ret != RT_ERROR_NONE, GE_IF_BOOL_EXEC(rt_ret != RT_ERROR_NONE,
GELOGE(rt_ret, "rtModelExecute error, ret: hybrid_model_executorOx%X", rt_ret); return FAILED;); GELOGE(rt_ret, "rtModelExecute error, ret: hybrid_model_executorOx%X", rt_ret); return FAILED;);
RECORD_EXECUTION_EVENT(context.GetExecutionContext(), context.GetNodeName(), "[KnownNodertModelExecute] End"); RECORD_EXECUTION_EVENT(context.GetExecutionContext(), context.GetNodeName(), "[KnownNodertModelExecute] End");
GELOGI("rtModelExecute end");


GE_CHK_STATUS_RET_NOLOG(context.RegisterCallback(done_callback)); GE_CHK_STATUS_RET_NOLOG(context.RegisterCallback(done_callback));
GELOGI("[%s] KnownNodeTask::ExecuteAsync success.", context.GetNodeName());
GELOGD("[%s] KnownNodeTask::ExecuteAsync success.", context.GetNodeName());
RECORD_EXECUTION_EVENT(context.GetExecutionContext(), context.GetNodeName(), "[KnownNodeTaskExecuteAsync] End"); RECORD_EXECUTION_EVENT(context.GetExecutionContext(), context.GetNodeName(), "[KnownNodeTaskExecuteAsync] End");
return SUCCESS; return SUCCESS;
} }


Status KnownNodeTask::UpdateArgs(TaskContext &context) { Status KnownNodeTask::UpdateArgs(TaskContext &context) {
GELOGI("[%s] KnownNodeExecutor::UpdateArgs in.", context.GetNodeName());
if (davinci_model_->GetTaskList().size() == 0) {
GELOGW("KnownNodeExecutor::UpdateArgs davinci moel has no taskinfo.");
GELOGD("[%s] KnownNodeExecutor::UpdateArgs in.", context.GetNodeName());
if (davinci_model_->GetTaskList().empty()) {
GELOGW("KnownNodeExecutor::UpdateArgs davinci model has no taskinfo.");
return SUCCESS; return SUCCESS;
} }


@@ -91,7 +87,7 @@ Status KnownNodeTask::UpdateArgs(TaskContext &context) {


GE_CHK_STATUS_RET(davinci_model_->UpdateKnownNodeArgs(inputs, outputs), GE_CHK_STATUS_RET(davinci_model_->UpdateKnownNodeArgs(inputs, outputs),
"known node task update known node args failed."); "known node task update known node args failed.");
GELOGI("[%s] KnownNodeExecutor::UpdateArgs success, task_size = %d:", context.GetNodeName(),
GELOGD("[%s] KnownNodeExecutor::UpdateArgs success, task_size = %zu", context.GetNodeName(),
davinci_model_->GetTaskList().size()); davinci_model_->GetTaskList().size());
return SUCCESS; return SUCCESS;
} }
@@ -123,7 +119,7 @@ Status KnownNodeTask::Init(TaskContext &context) {
davinci_model_->SetKnownNodeAddrNotChanged(addr_not_changed); davinci_model_->SetKnownNodeAddrNotChanged(addr_not_changed);
// update mem base // update mem base
davinci_model_->UpdateMemBase(static_cast<uint8_t *>(buffer)); davinci_model_->UpdateMemBase(static_cast<uint8_t *>(buffer));
GELOGI("KnownNodeTask::Init mem base is %p, size %u.",
GELOGI("KnownNodeTask::Init mem base is %p, size %lu.",
davinci_model_->GetRuntimeParam().mem_base, davinci_model_->GetRuntimeParam().mem_size); davinci_model_->GetRuntimeParam().mem_base, davinci_model_->GetRuntimeParam().mem_size);
} }
if (!load_flag_) { if (!load_flag_) {
@@ -138,7 +134,7 @@ Status KnownNodeTask::Init(TaskContext &context) {
} }


Status KnownNodeExecutor::PrepareTask(NodeTask &task, TaskContext &context) const { Status KnownNodeExecutor::PrepareTask(NodeTask &task, TaskContext &context) const {
GELOGI("[%s] KnownNodeExecutor::PrepareTask in.", context.GetNodeName());
GELOGD("[%s] KnownNodeExecutor::PrepareTask in.", context.GetNodeName());
RECORD_EXECUTION_EVENT(context.GetExecutionContext(), context.GetNodeName(), "[KnownNodeExecutorPrepareTask] Start"); RECORD_EXECUTION_EVENT(context.GetExecutionContext(), context.GetNodeName(), "[KnownNodeExecutorPrepareTask] Start");
RECORD_EXECUTION_EVENT(context.GetExecutionContext(), context.GetNodeName(), "[KnownNodeExecutorTaskInit] Start"); RECORD_EXECUTION_EVENT(context.GetExecutionContext(), context.GetNodeName(), "[KnownNodeExecutorTaskInit] Start");
GE_CHK_STATUS_RET(task.Init(context), "known node init davinci model failed."); GE_CHK_STATUS_RET(task.Init(context), "known node init davinci model failed.");
@@ -148,7 +144,7 @@ Status KnownNodeExecutor::PrepareTask(NodeTask &task, TaskContext &context) cons
GE_CHK_STATUS_RET(task.UpdateArgs(context), "known node task update args failed."); GE_CHK_STATUS_RET(task.UpdateArgs(context), "known node task update args failed.");
RECORD_EXECUTION_EVENT(context.GetExecutionContext(), context.GetNodeName(), "[KnownNodeExecutorUpdateArgs] End"); RECORD_EXECUTION_EVENT(context.GetExecutionContext(), context.GetNodeName(), "[KnownNodeExecutorUpdateArgs] End");
RECORD_EXECUTION_EVENT(context.GetExecutionContext(), context.GetNodeName(), "[KnownNodeExecutorPrepareTask] End"); RECORD_EXECUTION_EVENT(context.GetExecutionContext(), context.GetNodeName(), "[KnownNodeExecutorPrepareTask] End");
GELOGI("[%s] KnownNodeExecutor::PrepareTask success.", context.GetNodeName());
GELOGD("[%s] KnownNodeExecutor::PrepareTask success.", context.GetNodeName());
return SUCCESS; return SUCCESS;
} }


@@ -167,7 +163,7 @@ Status KnownNodeExecutor::LoadTask(const HybridModel &model, const NodePtr &node
davinci_model->SetKnownNode(true); davinci_model->SetKnownNode(true);
// set model id as root node's node id // set model id as root node's node id
davinci_model->SetId(node->GetOpDesc()->GetId()); davinci_model->SetId(node->GetOpDesc()->GetId());
GELOGD("KnownNodeExecutor::LoadTask node id %u.", node->GetOpDesc()->GetId());
GELOGD("KnownNodeExecutor::LoadTask node id %ld.", node->GetOpDesc()->GetId());


GE_CHK_STATUS_RET(davinci_model->Assign(ge_model), "KnownNodeExecutor::LoadTask davincimodel assign failed."); GE_CHK_STATUS_RET(davinci_model->Assign(ge_model), "KnownNodeExecutor::LoadTask davincimodel assign failed.");




+ 5
- 2
ge/hybrid/node_executor/controlop/control_op_executor.cc View File

@@ -119,6 +119,7 @@ Status IfOpNodeTask::Init(const NodePtr &node, const HybridModel &model) {


Status IfOpNodeTask::DoExecuteAsync(TaskContext &task_context, const std::function<void()> &done_callback) const { Status IfOpNodeTask::DoExecuteAsync(TaskContext &task_context, const std::function<void()> &done_callback) const {
auto cond_tensor_desc = task_context.MutableInputDesc(kIfCondIndex); auto cond_tensor_desc = task_context.MutableInputDesc(kIfCondIndex);
GE_CHECK_NOTNULL(cond_tensor_desc);
auto data_type = cond_tensor_desc->GetDataType(); auto data_type = cond_tensor_desc->GetDataType();
const auto &shape = cond_tensor_desc->MutableShape(); const auto &shape = cond_tensor_desc->MutableShape();
bool cond_val = false; bool cond_val = false;
@@ -362,14 +363,16 @@ Status WhileOpNodeTask::MoveOutputs2Inputs(TaskContext &task_context) {
*input_tensor = *output_tensor; *input_tensor = *output_tensor;
output_tensor->Destroy(); output_tensor->Destroy();


auto input_tensor_desc = task_context.MutableInputDesc(i);
GE_CHECK_NOTNULL(input_tensor_desc);
auto output_tensor_desc = task_context.MutableOutputDesc(i); auto output_tensor_desc = task_context.MutableOutputDesc(i);
GE_CHECK_NOTNULL(output_tensor_desc); GE_CHECK_NOTNULL(output_tensor_desc);
GELOGD("[%s] To update input shape[%d] by output shape. from [%s] to [%s]", GELOGD("[%s] To update input shape[%d] by output shape. from [%s] to [%s]",
task_context.GetNodeName(), task_context.GetNodeName(),
i, i,
task_context.MutableInputDesc(i)->GetShape().ToString().c_str(),
input_tensor_desc->GetShape().ToString().c_str(),
output_tensor_desc->GetShape().ToString().c_str()); output_tensor_desc->GetShape().ToString().c_str());
*task_context.MutableInputDesc(i) = *output_tensor_desc;
*input_tensor_desc = *output_tensor_desc;
} }


return SUCCESS; return SUCCESS;


+ 9
- 6
ge/hybrid/node_executor/hccl/hccl_node_executor.cc View File

@@ -67,14 +67,16 @@ Status HcclNodeTask::ExecuteAsync(TaskContext &context, std::function<void()> do
} }


const NodeItem &node_item = context.GetNodeItem(); const NodeItem &node_item = context.GetNodeItem();
const OpDescPtr op_desc = MakeShared<OpDesc>(*(node_item.op_desc));
const OpDescPtr op_desc = node_item.GetOpDesc();
GE_CHECK_NOTNULL(op_desc); GE_CHECK_NOTNULL(op_desc);


HcomOpertion op_info; HcomOpertion op_info;
op_info.hcclType = op_desc->GetType(); op_info.hcclType = op_desc->GetType();
op_info.inputPtr = inputs.empty() ? nullptr : inputs[0]; op_info.inputPtr = inputs.empty() ? nullptr : inputs[0];
op_info.outputPtr = outputs.empty() ? nullptr : outputs[0]; op_info.outputPtr = outputs.empty() ? nullptr : outputs[0];
ge::DataType src_data_type = op_desc->GetInputDescPtr(0)->GetDataType();
auto input_desc = node_item.MutableInputDesc(0);
GE_CHECK_NOTNULL(input_desc);
ge::DataType src_data_type = input_desc->GetDataType();
auto iter = kConstOpHcclDataType.find(static_cast<int64_t>(src_data_type)); auto iter = kConstOpHcclDataType.find(static_cast<int64_t>(src_data_type));
if (iter == kConstOpHcclDataType.end()) { if (iter == kConstOpHcclDataType.end()) {
GELOGE(PARAM_INVALID, "kConstOpHcclDataType find failed."); GELOGE(PARAM_INVALID, "kConstOpHcclDataType find failed.");
@@ -83,7 +85,7 @@ Status HcclNodeTask::ExecuteAsync(TaskContext &context, std::function<void()> do
op_info.dataType = iter->second; op_info.dataType = iter->second;
HcclReduceOp op_type = HCCL_REDUCE_SUM; HcclReduceOp op_type = HCCL_REDUCE_SUM;
if (op_desc->GetType() == HCOMALLREDUCE || op_desc->GetType() == HCOMREDUCESCATTER || if (op_desc->GetType() == HCOMALLREDUCE || op_desc->GetType() == HCOMREDUCESCATTER ||
op_desc->GetType() == HVDCALLBACKALLREDUCE) {
op_desc->GetType() == HVDCALLBACKALLREDUCE || op_desc->GetType() == HCOMREDUCE) {
GE_CHK_STATUS_RET(HcomOmeUtil::GetHcclOperationType(op_desc, op_type), "GetHcclOperationType failed"); GE_CHK_STATUS_RET(HcomOmeUtil::GetHcclOperationType(op_desc, op_type), "GetHcclOperationType failed");
op_info.opType = op_type; op_info.opType = op_type;
} }
@@ -128,8 +130,9 @@ Status RdmaNodeTask::UpdateArgs(TaskContext &context) { return SUCCESS; }
Status RdmaNodeTask::Init(TaskContext &context) { Status RdmaNodeTask::Init(TaskContext &context) {
GELOGI("[%s] RdmaNodeTask::Init in.", context.GetNodeName()); GELOGI("[%s] RdmaNodeTask::Init in.", context.GetNodeName());
const NodeItem &node_item = context.GetNodeItem(); const NodeItem &node_item = context.GetNodeItem();
GE_CHECK_NOTNULL(node_item.op_desc);
auto remote_idx = node_item.op_desc->GetInputIndexByName("remote");
auto op_desc = node_item.GetOpDesc();
GE_CHECK_NOTNULL(op_desc);
auto remote_idx = op_desc->GetInputIndexByName("remote");
auto in_data_anchor = node_item.node->GetInDataAnchor(remote_idx); auto in_data_anchor = node_item.node->GetInDataAnchor(remote_idx);
GE_CHECK_NOTNULL(in_data_anchor); GE_CHECK_NOTNULL(in_data_anchor);
auto out_data_anchor = in_data_anchor->GetPeerOutAnchor(); auto out_data_anchor = in_data_anchor->GetPeerOutAnchor();
@@ -141,7 +144,7 @@ Status RdmaNodeTask::Init(TaskContext &context) {
if (node_item.node->GetType() == HCOMREMOTEREAD) { if (node_item.node->GetType() == HCOMREMOTEREAD) {
local_index_ = 0; local_index_ = 0;
} else { } else {
local_index_ = node_item.op_desc->GetInputIndexByName("local");
local_index_ = op_desc->GetInputIndexByName("local");
} }
return SUCCESS; return SUCCESS;
} }


+ 5
- 5
ge/hybrid/node_executor/host_cpu/host_cpu_node_executor.cc View File

@@ -47,7 +47,9 @@ Status CpuKernelNodeTask::Execute(TaskContext &context) {


std::vector<ConstGeTensorPtr> inputs; std::vector<ConstGeTensorPtr> inputs;
for (int32_t i = 0; i < context.NumInputs(); ++i) { for (int32_t i = 0; i < context.NumInputs(); ++i) {
const auto &input_desc = op_desc->GetInputDesc(i);
auto input_desc_ptr = context.GetInputDesc(i);
GE_CHECK_NOTNULL(input_desc_ptr);
const auto &input_desc = *input_desc_ptr;
GE_CHECK_NOTNULL(context.GetInput(i)); GE_CHECK_NOTNULL(context.GetInput(i));
auto in_tensor = MakeShared<GeTensor>(input_desc, auto in_tensor = MakeShared<GeTensor>(input_desc,
reinterpret_cast<const uint8_t *>(context.GetInput(i)->GetData()), reinterpret_cast<const uint8_t *>(context.GetInput(i)->GetData()),
@@ -56,8 +58,7 @@ Status CpuKernelNodeTask::Execute(TaskContext &context) {
in_tensor->MutableTensorDesc().SetDataType(input_desc.GetDataType()); in_tensor->MutableTensorDesc().SetDataType(input_desc.GetDataType());
in_tensor->MutableTensorDesc().SetShape(input_desc.GetShape()); in_tensor->MutableTensorDesc().SetShape(input_desc.GetShape());
inputs.emplace_back(in_tensor); inputs.emplace_back(in_tensor);
GELOGI("node:%s allocate input %zu, addr=%p, size=%lld", op_desc->GetName().c_str(), i,
reinterpret_cast<const uint8_t *>(in_tensor->GetData().data()), in_tensor->GetData().size());
GELOGI("node:%s allocate input %d, size=%zu", op_desc->GetName().c_str(), i, in_tensor->GetData().size());
} }


std::vector<GeTensorPtr> outputs; std::vector<GeTensorPtr> outputs;
@@ -78,8 +79,7 @@ Status CpuKernelNodeTask::Execute(TaskContext &context) {
out_tensor->MutableTensorDesc().SetDataType(output_desc.GetDataType()); out_tensor->MutableTensorDesc().SetDataType(output_desc.GetDataType());
out_tensor->MutableTensorDesc().SetShape(output_desc.GetShape()); out_tensor->MutableTensorDesc().SetShape(output_desc.GetShape());
outputs.emplace_back(out_tensor); outputs.emplace_back(out_tensor);
GELOGI("node:%s allocate output %d, addr=%p, size=%zu", op_desc->GetName().c_str(), i,
reinterpret_cast<const uint8_t *>(out_tensor->GetData().data()), out_tensor->GetData().size());
GELOGI("node:%s allocate output %d, size=%zu", op_desc->GetName().c_str(), i, out_tensor->GetData().size());
} }


return HostCpuEngine::GetInstance().Run(node_, inputs, outputs); return HostCpuEngine::GetInstance().Run(node_, inputs, outputs);


+ 15
- 11
ge/hybrid/node_executor/node_executor.cc View File

@@ -16,6 +16,7 @@


#include "hybrid/node_executor/node_executor.h" #include "hybrid/node_executor/node_executor.h"
#include "framework/common/debug/log.h" #include "framework/common/debug/log.h"
#include "common/math/math_util.h"
#include "graph/utils/node_utils.h" #include "graph/utils/node_utils.h"
#include "init/gelib.h" #include "init/gelib.h"
#include "graph/utils/tensor_utils.h" #include "graph/utils/tensor_utils.h"
@@ -82,17 +83,15 @@ NodeExecutorManager::ExecutorType NodeExecutorManager::ResolveExecutorType(Node
auto op_type = node.GetType(); auto op_type = node.GetType();
if (op_type == PARTITIONEDCALL) { if (op_type == PARTITIONEDCALL) {
const auto &subgraph = NodeUtils::GetSubgraph(node, 0); const auto &subgraph = NodeUtils::GetSubgraph(node, 0);
if (subgraph != nullptr) {
for (const auto &node : subgraph->GetDirectNode()) {
bool is_unknown_shape = false;
(void)AttrUtils::GetBool(node->GetOpDesc(), kOwnerGraphIsUnknown, is_unknown_shape);
if (is_unknown_shape) {
return ExecutorType::DYNAMIC_SUBGRAPH;
} else {
return ExecutorType::COMPILED_SUBGRAPH;
}
}
if (subgraph != nullptr && subgraph->GetGraphUnknownFlag()) {
return ExecutorType::DYNAMIC_SUBGRAPH;
}
bool is_dynamic = false;
(void)NodeUtils::GetNodeUnknownShapeStatus(node, is_dynamic);
if (is_dynamic) {
return ExecutorType::DYNAMIC_SUBGRAPH;
} }
return ExecutorType::COMPILED_SUBGRAPH;
} }


// rts kernel store is assigned to NetOutput // rts kernel store is assigned to NetOutput
@@ -140,8 +139,9 @@ Status NodeExecutorManager::CalcOpRunningParam(Node &node) const {
GELOGD("[%s] Skipping CalcOpRunningParam for PartitionedCall.", node.GetName().c_str()); GELOGD("[%s] Skipping CalcOpRunningParam for PartitionedCall.", node.GetName().c_str());
return SUCCESS; return SUCCESS;
} }
for (size_t i = 0; i < node.GetOpDesc()->GetOutputsSize(); ++i) {
for (size_t i = 0; i < op_desc->GetOutputsSize(); ++i) {
GeTensorDescPtr output_tensor = op_desc->MutableOutputDesc(static_cast<uint32_t>(i)); GeTensorDescPtr output_tensor = op_desc->MutableOutputDesc(static_cast<uint32_t>(i));
GE_CHECK_NOTNULL(output_tensor);
TensorUtils::SetSize(*(output_tensor.get()), 0); TensorUtils::SetSize(*(output_tensor.get()), 0);
} }


@@ -157,6 +157,10 @@ Status NodeExecutorManager::CalcOpRunningParam(Node &node) const {
int64_t output_mem_size = 0; int64_t output_mem_size = 0;
GE_CHK_STATUS_RET(TensorUtils::CalcTensorMemSize(output_shape, format, data_type, output_mem_size), GE_CHK_STATUS_RET(TensorUtils::CalcTensorMemSize(output_shape, format, data_type, output_mem_size),
"hccl calc tensor mem size failed."); "hccl calc tensor mem size failed.");
GE_CHK_STATUS_RET(CheckInt64AddOverflow(output_mem_size, MEMORY_ALIGN_RATIO * MEMORY_ALIGN_SIZE - 1),
"[%s] Invalid output mem size: %ld",
node.GetName().c_str(),
output_mem_size);
output_mem_size = ((output_mem_size + output_mem_size = ((output_mem_size +
MEMORY_ALIGN_RATIO * MEMORY_ALIGN_SIZE - 1) / MEMORY_ALIGN_SIZE) * MEMORY_ALIGN_SIZE; MEMORY_ALIGN_RATIO * MEMORY_ALIGN_SIZE - 1) / MEMORY_ALIGN_SIZE) * MEMORY_ALIGN_SIZE;
TensorUtils::SetSize(output_tensor, output_mem_size); TensorUtils::SetSize(output_tensor, output_mem_size);


+ 10
- 10
ge/hybrid/node_executor/task_context.cc View File

@@ -253,7 +253,7 @@ Status TaskContext::AllocateOutput(int index,


Status TaskContext::AllocateOutputs(AllocationAttr *attr) { Status TaskContext::AllocateOutputs(AllocationAttr *attr) {
for (int i = 0; i < node_item_->num_outputs; ++i) { for (int i = 0; i < node_item_->num_outputs; ++i) {
const auto &output_desc = node_item_->op_desc->MutableOutputDesc(i);
const auto &output_desc = node_item_->MutableOutputDesc(i);
GE_CHECK_NOTNULL(output_desc); GE_CHECK_NOTNULL(output_desc);
uint32_t mem_type = 0; uint32_t mem_type = 0;
(void)AttrUtils::GetInt(output_desc, ATTR_OUTPUT_MEMORY_TYPE, mem_type); (void)AttrUtils::GetInt(output_desc, ATTR_OUTPUT_MEMORY_TYPE, mem_type);
@@ -349,7 +349,7 @@ Status TaskContext::PropagateOutputs() {
auto dst_input_idx = dst_input_index_and_node.first; auto dst_input_idx = dst_input_index_and_node.first;
auto dst_node_item = dst_input_index_and_node.second; auto dst_node_item = dst_input_index_and_node.second;
auto input_offset = dst_node_item->input_start + dst_input_idx; auto input_offset = dst_node_item->input_start + dst_input_idx;
GELOGI(
GELOGD(
"Propagate output of node %s, output index = %d, dst node = %s, " "Propagate output of node %s, output index = %d, dst node = %s, "
"dst_input_index = %d, dst_input_offset = %d.", "dst_input_index = %d, dst_input_offset = %d.",
node_item_->NodeName().c_str(), node_item_->NodeName().c_str(),
@@ -394,20 +394,20 @@ void TaskContext::ReleaseInput(int index) {
} }
} }


ConstGeTensorDescPtr TaskContext::GetOutputDesc(int index) {
return node_item_->op_desc->MutableOutputDesc(static_cast<uint32_t>(index));
ConstGeTensorDescPtr TaskContext::GetOutputDesc(int index) const {
return node_item_->MutableOutputDesc(static_cast<uint32_t>(index));
} }


ConstGeTensorDescPtr TaskContext::GetInputDesc(int index) {
return node_item_->op_desc->MutableInputDesc(static_cast<uint32_t>(index));
ConstGeTensorDescPtr TaskContext::GetInputDesc(int index) const {
return node_item_->MutableInputDesc(index);
} }


GeTensorDescPtr TaskContext::MutableInputDesc(int index) {
return node_item_->op_desc->MutableInputDesc(static_cast<uint32_t>(index));
GeTensorDescPtr TaskContext::MutableInputDesc(int index) const {
return node_item_->MutableInputDesc(index);
} }


GeTensorDescPtr TaskContext::MutableOutputDesc(int index) {
return node_item_->op_desc->MutableOutputDesc(static_cast<uint32_t>(index));
GeTensorDescPtr TaskContext::MutableOutputDesc(int index) const {
return node_item_->MutableOutputDesc(static_cast<uint32_t>(index));
} }


bool TaskContext::IsForceInferShape() const { bool TaskContext::IsForceInferShape() const {


+ 4
- 4
ge/hybrid/node_executor/task_context.h View File

@@ -46,10 +46,10 @@ class TaskContext {
const NodeItem &GetNodeItem() const; const NodeItem &GetNodeItem() const;
const char *GetNodeName() const; const char *GetNodeName() const;
TensorValue *MutableInput(int index); TensorValue *MutableInput(int index);
ConstGeTensorDescPtr GetInputDesc(int index);
ConstGeTensorDescPtr GetOutputDesc(int index);
GeTensorDescPtr MutableInputDesc(int index);
GeTensorDescPtr MutableOutputDesc(int index);
ConstGeTensorDescPtr GetInputDesc(int index) const;
ConstGeTensorDescPtr GetOutputDesc(int index) const;
GeTensorDescPtr MutableInputDesc(int index) const;
GeTensorDescPtr MutableOutputDesc(int index) const;
void ReleaseInput(int index); void ReleaseInput(int index);
const TensorValue *GetInput(int index) const; const TensorValue *GetInput(int index) const;
const TensorValue *GetOutput(int index) const; const TensorValue *GetOutput(int index) const;


+ 6
- 1
ge/ir_build/atc_ir_common.cc View File

@@ -19,6 +19,7 @@
#include "framework/common/string_util.h" #include "framework/common/string_util.h"
#include "framework/common/types.h" #include "framework/common/types.h"
#include "framework/common/util.h" #include "framework/common/util.h"
#include "graph/utils/type_utils.h"


using std::pair; using std::pair;
using std::string; using std::string;
@@ -106,6 +107,10 @@ bool CheckDynamicBatchSizeInputShapeValid(unordered_map<string, vector<int64_t>>


bool CheckDynamicImagesizeInputShapeValid(unordered_map<string, vector<int64_t>> shape_map, bool CheckDynamicImagesizeInputShapeValid(unordered_map<string, vector<int64_t>> shape_map,
const std::string input_format, std::string &dynamic_image_size) { const std::string input_format, std::string &dynamic_image_size) {
if (!input_format.empty() && !ge::TypeUtils::IsFormatValid(input_format.c_str())) {
GELOGE(ge::PARAM_INVALID, "user input format [%s] is not found!", input_format.c_str());
return false;
}
int32_t size = 0; int32_t size = 0;
for (auto iter = shape_map.begin(); iter != shape_map.end(); ++iter) { for (auto iter = shape_map.begin(); iter != shape_map.end(); ++iter) {
vector<int64_t> shape = iter->second; vector<int64_t> shape = iter->second;
@@ -413,7 +418,7 @@ Status CheckCompressWeightParamValid(const std::string enable_compress_weight, c
} }


if ((enable_compress_weight == "true") && (!compress_weight_conf.empty())) { if ((enable_compress_weight == "true") && (!compress_weight_conf.empty())) {
ErrorManager::GetInstance().ATCReportErrMessage("E10009", {"parameter0", "parameter1"},
ErrorManager::GetInstance().ATCReportErrMessage("E10047", {"parameter0", "parameter1"},
{"enable_compress_weight", "compress_weight_conf"}); {"enable_compress_weight", "compress_weight_conf"});
GELOGE(ge::PARAM_INVALID, "enable_compress_weight and compress_weight_conf can not both exist!!"); GELOGE(ge::PARAM_INVALID, "enable_compress_weight and compress_weight_conf can not both exist!!");
return ge::PARAM_INVALID; return ge::PARAM_INVALID;


+ 7
- 1
ge/ir_build/ge_ir_build.cc View File

@@ -542,7 +542,13 @@ graphStatus aclgrphInferShapeAndType(ge::Graph &graph) {
return GRAPH_PARAM_INVALID; return GRAPH_PARAM_INVALID;
} }


auto ret = compute_graph->InferOriginFormat();
auto ret = compute_graph->TopologicalSorting();
if(ret != GRAPH_SUCCESS) {
GELOGE(ret, "Acl topo logical sort failed.");
return ret;
}

ret = compute_graph->InferOriginFormat();
if (ret != GRAPH_SUCCESS) { if (ret != GRAPH_SUCCESS) {
GELOGE(ret, "Acl InferOriginFormat failed."); GELOGE(ret, "Acl InferOriginFormat failed.");
return ret; return ret;


+ 4
- 4
ge/session/omg.cc View File

@@ -95,8 +95,8 @@ static void ParseAtcParms(const std::map<std::string, std::string> &atc_params,
} }
} }


static Status CheckInputShapeNode(const ComputeGraphPtr &graph, const bool is_dynamic_input) {
if (!is_dynamic_input) {
static Status CheckInputShapeNode(const ComputeGraphPtr &graph, const bool is_dynamic_input, RunMode run_mode) {
if (!is_dynamic_input && run_mode != MODEL_TO_JSON) {
for (auto node : graph->GetDirectNode()) { for (auto node : graph->GetDirectNode()) {
if (node->GetType() == DATA) { if (node->GetType() == DATA) {
auto data_op_desc = node->GetOpDesc(); auto data_op_desc = node->GetOpDesc();
@@ -793,7 +793,7 @@ FMK_FUNC_HOST_VISIBILITY Status ParseGraph(ge::Graph &graph, const std::map<stri
compute_graph = GraphUtils::GetComputeGraph(graph); compute_graph = GraphUtils::GetComputeGraph(graph);
GE_RETURN_IF_ERROR(CheckInputFp16Nodes(compute_graph, input_fp16_nodes, is_input_adjust_hw_layout)); GE_RETURN_IF_ERROR(CheckInputFp16Nodes(compute_graph, input_fp16_nodes, is_input_adjust_hw_layout));


GE_RETURN_IF_ERROR(CheckInputShapeNode(compute_graph, is_dynamic_input));
GE_RETURN_IF_ERROR(CheckInputShapeNode(compute_graph, is_dynamic_input, run_mode));


std::string compress_weight_conf; std::string compress_weight_conf;
ParseAtcParms(atc_params, "compress_weight_conf", compress_weight_conf); ParseAtcParms(atc_params, "compress_weight_conf", compress_weight_conf);
@@ -999,7 +999,7 @@ FMK_FUNC_HOST_VISIBILITY Status ConvertFwkModelToJson(const domi::FrameworkType
ErrorManager::GetInstance().ATCReportErrMessage( ErrorManager::GetInstance().ATCReportErrMessage(
"E10001", {"parameter", "value", "reason"}, "E10001", {"parameter", "value", "reason"},
{"--framework", std::to_string(framework), "only support 0(Caffe) 3(TensorFlow) 5(Onnx)"}); {"--framework", std::to_string(framework), "only support 0(Caffe) 3(TensorFlow) 5(Onnx)"});
GELOGE(PARAM_INVALID, "Input parameter[--framework] is mandatory and it's value must be: 0(Caffe) 3(TensorFlow) "
GELOGE(PARAM_INVALID, "Input parameter[--framework] is mandatory and it's value must be: 0(Caffe) 3(TensorFlow) "
"or 5(Onnx)."); "or 5(Onnx).");
return PARAM_INVALID; return PARAM_INVALID;
} }


+ 2
- 1
ge/single_op/task/aicpu_task_builder.cc View File

@@ -150,9 +150,10 @@ namespace ge {
task.op_type_ = op_desc_->GetName(); task.op_type_ = op_desc_->GetName();
task.task_info_ = kernel_def_.task_info(); task.task_info_ = kernel_def_.task_info();
task.dynamic_flag_ = dynamic_flag; task.dynamic_flag_ = dynamic_flag;
task.kernel_id_ = kernel_id;


auto debug_info = BuildTaskUtils::GetTaskInfo(op_desc_); auto debug_info = BuildTaskUtils::GetTaskInfo(op_desc_);
GELOGI("[TASK_INFO] %s %s", task.task_info_.c_str(), debug_info.c_str());
GELOGI("[TASK_INFO] %s/%s %s", std::to_string(kernel_id).c_str(), task.op_type_.c_str(), debug_info.c_str());
return SUCCESS; return SUCCESS;
} }
} // namespace ge } // namespace ge

+ 1
- 1
ge/single_op/task/op_task.cc View File

@@ -401,7 +401,7 @@ Status AiCpuTask::LaunchKernel(rtStream_t stream) {
GELOGE(RT_FAILED, "Invoke rtKernelLaunch failed. ret = %d, task = %s", ret, this->op_type_.c_str()); GELOGE(RT_FAILED, "Invoke rtKernelLaunch failed. ret = %d, task = %s", ret, this->op_type_.c_str());
return RT_FAILED; return RT_FAILED;
} }
GELOGI("[TASK_INFO] is %s", this->task_info_.c_str());
GELOGI("[TASK_INFO] %s/%s", std::to_string(kernel_id_).c_str(), op_type_.c_str());


auto status = OpenDump(stream); auto status = OpenDump(stream);
if (status != SUCCESS) { if (status != SUCCESS) {


+ 1
- 0
ge/single_op/task/op_task.h View File

@@ -207,6 +207,7 @@ class AiCpuTask : public AiCpuBaseTask {
void *copy_input_dst_dev_; void *copy_input_dst_dev_;


vector<void *> out_shape_hbm_; vector<void *> out_shape_hbm_;
uint64_t kernel_id_ = 0;
}; };


class AiCpuCCTask : public AiCpuBaseTask { class AiCpuCCTask : public AiCpuBaseTask {


+ 0
- 3
inc/external/ge/ge_api_error_codes.h View File

@@ -97,13 +97,10 @@ GE_ERRORNO_EXTERNAL(ACL_ERROR_GE_PARAM_INVALID, "Parameter invalid.");
GE_ERRORNO_EXTERNAL(ACL_ERROR_GE_EXEC_NOT_INIT, "GE executor not initialized yet."); GE_ERRORNO_EXTERNAL(ACL_ERROR_GE_EXEC_NOT_INIT, "GE executor not initialized yet.");
GE_ERRORNO_EXTERNAL(ACL_ERROR_GE_EXEC_MODEL_PATH_INVALID, "Model file path invalid."); GE_ERRORNO_EXTERNAL(ACL_ERROR_GE_EXEC_MODEL_PATH_INVALID, "Model file path invalid.");
GE_ERRORNO_EXTERNAL(ACL_ERROR_GE_EXEC_MODEL_ID_INVALID, "Model id invalid."); GE_ERRORNO_EXTERNAL(ACL_ERROR_GE_EXEC_MODEL_ID_INVALID, "Model id invalid.");
GE_ERRORNO_EXTERNAL(ACL_ERROR_GE_EXEC_MODEL_KEY_PATH_INVALID, "Model key path invalid.");
GE_ERRORNO_EXTERNAL(ACL_ERROR_GE_EXEC_MODEL_NOT_SUPPORT_ENCRYPTION, "Model does not support encryption.");
GE_ERRORNO_EXTERNAL(ACL_ERROR_GE_EXEC_MODEL_DATA_SIZE_INVALID, "Data size of model invalid."); GE_ERRORNO_EXTERNAL(ACL_ERROR_GE_EXEC_MODEL_DATA_SIZE_INVALID, "Data size of model invalid.");
GE_ERRORNO_EXTERNAL(ACL_ERROR_GE_EXEC_MODEL_ADDR_INVALID, "Model addr invalid."); GE_ERRORNO_EXTERNAL(ACL_ERROR_GE_EXEC_MODEL_ADDR_INVALID, "Model addr invalid.");
GE_ERRORNO_EXTERNAL(ACL_ERROR_GE_EXEC_MODEL_QUEUE_ID_INVALID, "Queue id of model invalid."); GE_ERRORNO_EXTERNAL(ACL_ERROR_GE_EXEC_MODEL_QUEUE_ID_INVALID, "Queue id of model invalid.");
GE_ERRORNO_EXTERNAL(ACL_ERROR_GE_EXEC_LOAD_MODEL_REPEATED, "The model loaded repeatedly."); GE_ERRORNO_EXTERNAL(ACL_ERROR_GE_EXEC_LOAD_MODEL_REPEATED, "The model loaded repeatedly.");
GE_ERRORNO_EXTERNAL(ACL_ERROR_GE_EXEC_MODEL_PARTITION_NUM_INVALID, "Model partition num invalid.");
GE_ERRORNO_EXTERNAL(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID, "Dynamic input addr invalid."); GE_ERRORNO_EXTERNAL(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID, "Dynamic input addr invalid.");
GE_ERRORNO_EXTERNAL(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID, "Dynamic input size invalid."); GE_ERRORNO_EXTERNAL(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID, "Dynamic input size invalid.");
GE_ERRORNO_EXTERNAL(ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID, "Dynamic batch size invalid."); GE_ERRORNO_EXTERNAL(ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID, "Dynamic batch size invalid.");


+ 0
- 3
inc/external/ge/ge_error_codes.h View File

@@ -26,13 +26,10 @@ static const uint32_t ACL_ERROR_GE_PARAM_INVALID = 145000;
static const uint32_t ACL_ERROR_GE_EXEC_NOT_INIT = 145001; static const uint32_t ACL_ERROR_GE_EXEC_NOT_INIT = 145001;
static const uint32_t ACL_ERROR_GE_EXEC_MODEL_PATH_INVALID = 145002; static const uint32_t ACL_ERROR_GE_EXEC_MODEL_PATH_INVALID = 145002;
static const uint32_t ACL_ERROR_GE_EXEC_MODEL_ID_INVALID = 145003; static const uint32_t ACL_ERROR_GE_EXEC_MODEL_ID_INVALID = 145003;
static const uint32_t ACL_ERROR_GE_EXEC_MODEL_KEY_PATH_INVALID = 145004;
static const uint32_t ACL_ERROR_GE_EXEC_MODEL_NOT_SUPPORT_ENCRYPTION = 145005;
static const uint32_t ACL_ERROR_GE_EXEC_MODEL_DATA_SIZE_INVALID = 145006; static const uint32_t ACL_ERROR_GE_EXEC_MODEL_DATA_SIZE_INVALID = 145006;
static const uint32_t ACL_ERROR_GE_EXEC_MODEL_ADDR_INVALID = 145007; static const uint32_t ACL_ERROR_GE_EXEC_MODEL_ADDR_INVALID = 145007;
static const uint32_t ACL_ERROR_GE_EXEC_MODEL_QUEUE_ID_INVALID = 145008; static const uint32_t ACL_ERROR_GE_EXEC_MODEL_QUEUE_ID_INVALID = 145008;
static const uint32_t ACL_ERROR_GE_EXEC_LOAD_MODEL_REPEATED = 145009; static const uint32_t ACL_ERROR_GE_EXEC_LOAD_MODEL_REPEATED = 145009;
static const uint32_t ACL_ERROR_GE_EXEC_MODEL_PARTITION_NUM_INVALID = 145010;
static const uint32_t ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID = 145011; static const uint32_t ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID = 145011;
static const uint32_t ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID = 145012; static const uint32_t ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID = 145012;
static const uint32_t ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID = 145013; static const uint32_t ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID = 145013;


+ 1
- 0
inc/framework/common/types.h View File

@@ -431,6 +431,7 @@ REGISTER_OPTYPE_DECLARE(HCOMBROADCAST, "HcomBroadcast");
REGISTER_OPTYPE_DECLARE(HCOMALLGATHER, "HcomAllGather"); REGISTER_OPTYPE_DECLARE(HCOMALLGATHER, "HcomAllGather");
REGISTER_OPTYPE_DECLARE(HCOMALLREDUCE, "HcomAllReduce"); REGISTER_OPTYPE_DECLARE(HCOMALLREDUCE, "HcomAllReduce");
REGISTER_OPTYPE_DECLARE(HCOMREDUCESCATTER, "HcomReduceScatter"); REGISTER_OPTYPE_DECLARE(HCOMREDUCESCATTER, "HcomReduceScatter");
REGISTER_OPTYPE_DECLARE(HCOMREDUCE, "HcomReduce");
REGISTER_OPTYPE_DECLARE(HCOMSEND, "HcomSend"); REGISTER_OPTYPE_DECLARE(HCOMSEND, "HcomSend");
REGISTER_OPTYPE_DECLARE(HCOMRECEIVE, "HcomReceive"); REGISTER_OPTYPE_DECLARE(HCOMRECEIVE, "HcomReceive");
REGISTER_OPTYPE_DECLARE(HCOMREMOTEREAD, "HcomRemoteRead"); REGISTER_OPTYPE_DECLARE(HCOMREMOTEREAD, "HcomRemoteRead");


+ 1
- 1
metadef

@@ -1 +1 @@
Subproject commit 0f5ddb10ce79ea2c01b8b9cab5ec3102879610bb
Subproject commit 6995fa3682b9e1147c5173e56192126d2f91a2b7

+ 1
- 1
parser

@@ -1 +1 @@
Subproject commit cf60b0c02d1a6e844fcec4202d18a069e9502b0f
Subproject commit 742f940d8868fbd2f5de19f726d6d28142bc0a6e

+ 1
- 0
tests/CMakeLists.txt View File

@@ -22,6 +22,7 @@ add_subdirectory(depends/runtime)
add_subdirectory(depends/omg) add_subdirectory(depends/omg)
add_subdirectory(depends/hccl) add_subdirectory(depends/hccl)
add_subdirectory(depends/profiler) add_subdirectory(depends/profiler)
add_subdirectory(depends/error_manager)


if (ENABLE_GE_COV OR ENABLE_GE_UT) if (ENABLE_GE_COV OR ENABLE_GE_UT)
add_subdirectory(ut) add_subdirectory(ut)


+ 67
- 43
tests/depends/cce/CMakeLists.txt View File

@@ -13,60 +13,84 @@
# limitations under the License. # limitations under the License.
# ============================================================================ # ============================================================================


cmake_minimum_required(VERSION 2.8)
#cmake_minimum_required(VERSION 2.8)


project(STUB_CCE) project(STUB_CCE)


set(CMAKE_CXX_STANDARD 11) set(CMAKE_CXX_STANDARD 11)


include_directories(${GE_SOURCE_DIR}/inc)
include_directories(${GE_SOURCE_DIR}/inc/framework)
include_directories(${GE_SOURCE_DIR}/inc/graph)
include_directories(${GE_SOURCE_DIR}/inc/external)
include_directories(${GE_SOURCE_DIR}/inc/external/graph)
include_directories(${GE_SOURCE_DIR}/src/common)
include_directories(${GE_SOURCE_DIR}/src/common/graph)
include_directories(${GE_SOURCE_DIR}/third_party/fwkacllib/inc)
include_directories(${GE_SOURCE_DIR}/third_party/fwkacllib/inc/cce)
include_directories(${GE_SOURCE_DIR}/third_party/fwkacllib/inc/ops)
include_directories(${GE_CODE_DIR}/inc)
include_directories(${GE_CODE_DIR}/inc/framework)
include_directories(${GE_CODE_DIR}/metadef/inc/graph)
include_directories(${GE_CODE_DIR}/inc/external)
include_directories(${GE_CODE_DIR}/metadef/inc/external)
include_directories(${GE_CODE_DIR}/metadef/inc/external/graph)
include_directories(${GE_CODE_DIR}/metadef)
include_directories(${GE_CODE_DIR}/metadef/inc)
include_directories(${GE_CODE_DIR}/metadef/graph)
include_directories(${GE_CODE_DIR}/third_party/fwkacllib/inc)
include_directories(${GE_CODE_DIR}/third_party/fwkacllib/inc/cce)
include_directories(${GE_CODE_DIR}/third_party/fwkacllib/inc/ops)
include_directories(${CMAKE_BINARY_DIR}) include_directories(${CMAKE_BINARY_DIR})
include_directories(${CMAKE_BINARY_DIR}/proto/ge) include_directories(${CMAKE_BINARY_DIR}/proto/ge)
file(GLOB_RECURSE PROTO_LIST RELATIVE ${CMAKE_CURRENT_LIST_DIR}
"${GE_SOURCE_DIR}/src/proto/om.proto"
"${GE_SOURCE_DIR}/src/proto/ge_ir.proto"
"${GE_SOURCE_DIR}/src/proto/task.proto"
set(PROTO_LIST
"${GE_CODE_DIR}/metadef/proto/om.proto"
"${GE_CODE_DIR}/metadef/proto/ge_ir.proto"
"${GE_CODE_DIR}/metadef/proto/task.proto"
) )


ge_protobuf_generate(ge PROTO_SRCS PROTO_HDRS ${PROTO_LIST})
protobuf_generate(ge PROTO_SRCS PROTO_HDRS ${PROTO_LIST})


file(GLOB_RECURSE SRCS RELATIVE ${CMAKE_CURRENT_LIST_DIR}
"${GE_SOURCE_DIR}/src/common/graph/ge_attr_define.cc"
"${GE_SOURCE_DIR}/src/common/graph/anchor.cc"
"${GE_SOURCE_DIR}/src/common/graph/ge_attr_value.cc"
"${GE_SOURCE_DIR}/src/common/graph/buffer.cc"
"${GE_SOURCE_DIR}/src/common/graph/compute_graph.cc"
"${GE_SOURCE_DIR}/src/common/graph/graph.cc"
"${GE_SOURCE_DIR}/src/common/graph/model.cc"
"${GE_SOURCE_DIR}/src/common/graph/model_serialize.cc"
"${GE_SOURCE_DIR}/src/common/graph/node.cc"
"${GE_SOURCE_DIR}/src/common/graph/op_desc.cc"
"${GE_SOURCE_DIR}/src/common/graph/operator.cc"
"${GE_SOURCE_DIR}/src/common/graph/operator_factory.cc"
"${GE_SOURCE_DIR}/src/common/graph/operator_factory_impl.cc"
"${GE_SOURCE_DIR}/src/common/graph/tensor.cc"
"${GE_SOURCE_DIR}/src/common/graph/detail/attributes_holder.cc"
"${GE_SOURCE_DIR}/src/common/graph/utils/anchor_utils.cc"
"${GE_SOURCE_DIR}/src/common/graph/utils/graph_utils.cc"
"${GE_SOURCE_DIR}/src/common/graph/utils/node_utils.cc"
"${GE_SOURCE_DIR}/src/common/graph/utils/op_desc_utils.cc"
"${GE_SOURCE_DIR}/src/common/graph/utils/type_utils.cc"
"${GE_SOURCE_DIR}/src/common/graph/op_imp.cc"
"${GE_SOURCE_DIR}/src/common/graph/shape_refiner.cc"
"${GE_SOURCE_DIR}/src/common/graph/ge_tensor.cc"
"${GE_SOURCE_DIR}/src/common/graph/opsproto/opsproto_manager.cc"
set(SRCS
"${GE_CODE_DIR}/metadef/graph/ge_attr_define.cc"
"${GE_CODE_DIR}/metadef/graph/anchor.cc"
"${GE_CODE_DIR}/metadef/graph/ge_attr_value.cc"
"${GE_CODE_DIR}/metadef/graph/buffer.cc"
"${GE_CODE_DIR}/metadef/graph/compute_graph.cc"
"${GE_CODE_DIR}/metadef/graph/graph.cc"
"${GE_CODE_DIR}/metadef/graph/model.cc"
"${GE_CODE_DIR}/metadef/graph/model_serialize.cc"
"${GE_CODE_DIR}/metadef/graph/node.cc"
"${GE_CODE_DIR}/metadef/graph/op_desc.cc"
"${GE_CODE_DIR}/metadef/graph/operator.cc"
"${GE_CODE_DIR}/metadef/graph/operator_factory.cc"
"${GE_CODE_DIR}/metadef/graph/operator_factory_impl.cc"
"${GE_CODE_DIR}/metadef/graph/tensor.cc"
"${GE_CODE_DIR}/metadef/graph/detail/attributes_holder.cc"
"${GE_CODE_DIR}/metadef/graph/utils/anchor_utils.cc"
"${GE_CODE_DIR}/metadef/graph/utils/graph_utils.cc"
"${GE_CODE_DIR}/metadef/graph/utils/node_utils.cc"
"${GE_CODE_DIR}/metadef/graph/utils/op_desc_utils.cc"
"${GE_CODE_DIR}/metadef/graph/utils/type_utils.cc"
"${GE_CODE_DIR}/metadef/ops/op_imp.cpp"
"${GE_CODE_DIR}/metadef/graph/shape_refiner.cc"
"${GE_CODE_DIR}/metadef/graph/ge_tensor.cc"
"${GE_CODE_DIR}/metadef/graph/opsproto/opsproto_manager.cc"
) )
add_library(cce_ge_stub SHARED src/cce_stub.cc ${PROTO_SRCS} ${PROTO_HDRS}) add_library(cce_ge_stub SHARED src/cce_stub.cc ${PROTO_SRCS} ${PROTO_HDRS})
target_link_libraries(cce_ge_stub protobuf::protobuf)

target_compile_definitions(cce_ge_stub PRIVATE
google=ascend_private
)

target_link_libraries(cce_ge_stub
$<BUILD_INTERFACE:intf_pub>
-Wl,--no-as-needed
ascend_protobuf
-Wl,--as-needed
c_sec
)


add_library(cce_stub SHARED ${SRCS} ${PROTO_SRCS} ${PROTO_HDRS}) add_library(cce_stub SHARED ${SRCS} ${PROTO_SRCS} ${PROTO_HDRS})
target_link_libraries(cce_stub protobuf::protobuf)

target_compile_definitions(cce_stub PRIVATE
google=ascend_private
)

target_link_libraries(cce_stub PRIVATE
$<BUILD_INTERFACE:intf_pub>
-Wl,--no-as-needed
ascend_protobuf
-Wl,--as-needed
c_sec
)

+ 34
- 0
tests/depends/error_manager/CMakeLists.txt View File

@@ -0,0 +1,34 @@
# Copyright 2019-2020 Huawei Technologies Co., Ltd
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ============================================================================

#cmake_minimum_required(VERSION 2.8)

project(STUB_ERROR_MANAGER)

file(GLOB_RECURSE SRCS RELATIVE ${CMAKE_CURRENT_LIST_DIR}
"src/error_manager_stub.cc"
)

include_directories(${GE_CODE_DIR}/third_party/fwkacllib/inc)
include_directories(${GE_CODE_DIR}/inc)
include_directories(${GE_CODE_DIR}/inc/external)
include_directories(${GE_CODE_DIR}/metadef/inc)
include_directories(${GE_CODE_DIR}/inc/framework)
include_directories(${GE_CODE_DIR}/metadef/inc/external)

add_library(error_manager_stub SHARED ${SRCS})
target_link_libraries(error_manager_stub PRIVATE
$<BUILD_INTERFACE:intf_pub>
)

+ 85
- 0
tests/depends/error_manager/src/error_manager_stub.cc View File

@@ -0,0 +1,85 @@
/**
* Copyright 2019-2020 Huawei Technologies Co., Ltd
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/

#include "common/util/error_manager/error_manager.h"

ErrorManager &ErrorManager::GetInstance() {
static ErrorManager instance;
return instance;
}

///
/// @brief init
/// @param [in] path: current so path
/// @return int 0(success) -1(fail)
///
int ErrorManager::Init(std::string path) { return 0; }

///
/// @brief Report error message
/// @param [in] error_code: error code
/// @param [in] args_map: parameter map
/// @return int 0(success) -1(fail)
///
int ErrorManager::ReportErrMessage(std::string error_code, const std::map<std::string, std::string> &args_map) {
return 0;
}

///
/// @brief output error message
/// @param [in] handle: print handle
/// @return int 0(success) -1(fail)
///
int ErrorManager::OutputErrMessage(int handle) { return 0; }

///
/// @brief output message
/// @param [in] handle: print handle
/// @return int 0(success) -1(fail)
///
int ErrorManager::OutputMessage(int handle) { return 0; }

///
/// @brief Report error message
/// @param [in] key: vector parameter key
/// @param [in] value: vector parameter value
///
void ErrorManager::ATCReportErrMessage(std::string error_code, const std::vector<std::string> &key,
const std::vector<std::string> &value) {
}

///
/// @brief report graph compile failed message such as error code and op_name in mstune case
/// @param [in] msg: failed message map, key is error code, value is op_name
/// @return int 0(success) -1(fail)
///
int ErrorManager::ReportMstuneCompileFailedMsg(const std::map<std::string, std::string> &msg) { return 0; }

///
/// @brief save graph compile failed message from thread local map to global map
/// @param [in] graph_name: graph name
///
void ErrorManager::SaveMstuneCompileFailedMsg(const std::string &graph_name) {}

///
/// @brief get graph compile failed message in mstune case
/// @param [in] graph_name: graph name
/// @param [out] msg_map: failed message map, key is error code, value is op_name list
/// @return int 0(success) -1(fail)
///
int ErrorManager::GetMstuneCompileFailedMsg(const std::string &graph_name, std::map<std::string, std::vector<std::string>> &msg_map) { return 0; }



+ 8
- 4
tests/depends/hccl/CMakeLists.txt View File

@@ -13,14 +13,18 @@
# limitations under the License. # limitations under the License.
# ============================================================================ # ============================================================================


cmake_minimum_required(VERSION 2.8)
#cmake_minimum_required(VERSION 2.8)
project(hccl_stub) project(hccl_stub)


file(GLOB_RECURSE SRC_FILES RELATIVE ${CMAKE_CURRENT_SOURCE_DIR} file(GLOB_RECURSE SRC_FILES RELATIVE ${CMAKE_CURRENT_SOURCE_DIR}
"src/hccl_stub.cc" "src/hccl_stub.cc"
) )


include_directories(${GE_SOURCE_DIR}/third_party/fwkacllib/inc)
include_directories(${GE_SOURCE_DIR}/inc)
include_directories(${GE_CODE_DIR}/third_party/fwkacllib/inc)
include_directories(${GE_CODE_DIR}/inc)


add_library(hccl_stub SHARED ${SRC_FILES})
add_library(hccl_stub SHARED ${SRC_FILES})

target_link_libraries(hccl_stub PRIVATE
$<BUILD_INTERFACE:intf_pub>
)

+ 9
- 9
tests/depends/hccl/src/hccl_stub.cc View File

@@ -18,27 +18,27 @@


#include "hccl/hcom.h" #include "hccl/hcom.h"


hcclResult_t hcom_all_gather(const char *tag, void *input_count_ptr, void *output_ptr, u64 input_count,
hcclDataType_t data_type, const char *group, rtStream_t stream) {
HcclResult hcom_all_gather(const char *tag, void *input_count_ptr, void *output_ptr, u64 input_count,
HcclDataType data_type, const char *group, rtStream_t stream) {
return HCCL_SUCCESS; return HCCL_SUCCESS;
} }


hcclResult_t hcom_broadcast(const char *tag, void *ptr, u64 count, hcclDataType_t data_type, u32 root,
HcclResult hcom_broadcast(const char *tag, void *ptr, u64 count, HcclDataType data_type, u32 root,
const char *group, rtStream_t stream) { const char *group, rtStream_t stream) {
return HCCL_SUCCESS; return HCCL_SUCCESS;
} }


hcclResult_t hcom_all_reduce(const char *tag, void *input_ptr, void *output_ptr, u64 count, hcclDataType_t data_type,
hcclRedOp_t op, const char *group, rtStream_t stream) {
HcclResult hcom_all_reduce(const char *tag, void *input_ptr, void *output_ptr, u64 count, HcclDataType data_type,
HcclReduceOp op, const char *group, rtStream_t stream) {
return HCCL_SUCCESS; return HCCL_SUCCESS;
} }


hcclResult_t hcom_get_split_strategy(const char *group, const struct model_feature *feature, u32 max_segment_num,
HcclResult hcom_get_split_strategy(const char *group, const struct model_feature *feature, u32 max_segment_num,
u32 *segment_num, u32 *segment_idx) { u32 *segment_num, u32 *segment_idx) {
return HCCL_SUCCESS; return HCCL_SUCCESS;
} }


hcclResult_t hcom_reduce_scatter(const char *tag, void *input_ptr, void *output_ptr, u64 count,
hcclDataType_t data_type, hcclRedOp_t op, const char *group, rtStream_t stream) {
HcclResult hcom_reduce_scatter(const char *tag, void *input_ptr, void *output_ptr, u64 count,
HcclDataType data_type, HcclReduceOp op, const char *group, rtStream_t stream) {
return HCCL_SUCCESS; return HCCL_SUCCESS;
}
}

+ 14
- 6
tests/depends/mmpa/CMakeLists.txt View File

@@ -13,7 +13,7 @@
# limitations under the License. # limitations under the License.
# ============================================================================ # ============================================================================


cmake_minimum_required(VERSION 2.8)
#cmake_minimum_required(VERSION 2.8)


project(STUB_MMPA) project(STUB_MMPA)


@@ -21,10 +21,18 @@ file(GLOB_RECURSE SRCS RELATIVE ${CMAKE_CURRENT_LIST_DIR}
"src/mmpa_stub.cc" "src/mmpa_stub.cc"
) )


include_directories(${GE_SOURCE_DIR}/third_party/fwkacllib/inc)
include_directories(${GE_SOURCE_DIR}/inc)
include_directories(${GE_SOURCE_DIR}/inc/framework)
include_directories(${GE_SOURCE_DIR}/inc/external)
include_directories(${GE_CODE_DIR}/third_party/fwkacllib/inc)
include_directories(${GE_CODE_DIR}/inc)
include_directories(${GE_CODE_DIR}/inc/external)
include_directories(${GE_CODE_DIR}/metadef/inc)
include_directories(${GE_CODE_DIR}/inc/framework)
include_directories(${GE_CODE_DIR}/metadef/inc/external)


add_library(mmpa_stub SHARED ${SRCS}) add_library(mmpa_stub SHARED ${SRCS})
target_link_libraries(mmpa_stub protobuf::protobuf)
target_link_libraries(mmpa_stub PRIVATE
$<BUILD_INTERFACE:intf_pub>
-Wl,--no-as-needed
ascend_protobuf
-Wl,--as-needed
c_sec
)

+ 55
- 0
tests/depends/mmpa/src/mmpa_stub.cc View File

@@ -217,3 +217,58 @@ INT32 mmScandir(const CHAR *path, mmDirent ***entryList, mmFilter filterFunc, m
VOID mmScandirFree(mmDirent **entryList, INT32 count) VOID mmScandirFree(mmDirent **entryList, INT32 count)
{ {
} }

INT32 mmAccess2(const CHAR *pathName, INT32 mode)
{
return 0;
}

INT32 mmGetTimeOfDay(mmTimeval *timeVal, mmTimezone *timeZone)
{
return 0;
}

INT32 mmRealPath(const CHAR *path, CHAR *realPath, INT32 realPathLen)
{
return 0;
}

INT32 mmGetErrorCode()
{
return 0;
}

INT32 mmIsDir(const CHAR *fileName)
{
return 0;
}

INT32 mmGetEnv(const CHAR *name, CHAR *value, UINT32 len)
{
return 0;
}

INT32 mmDlclose(VOID *handle)
{
return 0;
}

CHAR *mmDlerror()
{
return "";
}

INT32 mmDladdr(VOID *addr, mmDlInfo *info)
{
return 0;
}

VOID *mmDlopen(const CHAR *fileName, INT32 mode)
{
return NULL;
}

VOID *mmDlsym(VOID *handle, const CHAR *funcName)
{
return NULL;
}

+ 31
- 17
tests/depends/omg/CMakeLists.txt View File

@@ -13,33 +13,47 @@
# limitations under the License. # limitations under the License.
# ============================================================================ # ============================================================================


cmake_minimum_required(VERSION 2.8)
#cmake_minimum_required(VERSION 2.8)


project(OMG_CCE) project(OMG_CCE)


set(CMAKE_CXX_STANDARD 11) set(CMAKE_CXX_STANDARD 11)


include_directories(${GE_SOURCE_DIR}/third_party/fwkacllib/inc)
include_directories(${GE_SOURCE_DIR}/third_party/fwkacllib/inc/cce)
include_directories(${GE_SOURCE_DIR}/inc)
include_directories(${GE_SOURCE_DIR}/inc/framework)
include_directories(${GE_SOURCE_DIR}/inc/graph)
include_directories(${GE_SOURCE_DIR}/inc/external)
include_directories(${GE_SOURCE_DIR}/inc/external/graph)
include_directories(${GE_SOURCE_DIR}/src/ge)
include_directories(${GE_CODE_DIR}/third_party/fwkacllib/inc)
include_directories(${GE_CODE_DIR}/third_party/fwkacllib/inc/cce)
include_directories(${GE_CODE_DIR}/inc)
include_directories(${GE_CODE_DIR}/metadef/inc)
include_directories(${GE_CODE_DIR}/inc/framework)
include_directories(${GE_CODE_DIR}/metadef/inc/graph)
include_directories(${GE_CODE_DIR}/inc/external)
include_directories(${GE_CODE_DIR}/metadef/inc/external)
include_directories(${GE_CODE_DIR}/metadef/inc/external/graph)
include_directories(${GE_CODE_DIR}/ge)
include_directories(${CMAKE_BINARY_DIR}) include_directories(${CMAKE_BINARY_DIR})
include_directories(${CMAKE_BINARY_DIR}/proto/ge) include_directories(${CMAKE_BINARY_DIR}/proto/ge)
file(GLOB_RECURSE PROTO_LIST RELATIVE ${CMAKE_CURRENT_LIST_DIR}
"${GE_SOURCE_DIR}/src/proto/om.proto"
"${GE_SOURCE_DIR}/src/proto/task.proto"
set(PROTO_LIST
"${GE_CODE_DIR}/metadef/proto/om.proto"
"${GE_CODE_DIR}/metadef/proto/task.proto"
) )


ge_protobuf_generate(ge PROTO_SRCS PROTO_HDRS ${PROTO_LIST})
protobuf_generate(ge PROTO_SRCS PROTO_HDRS ${PROTO_LIST})


file(GLOB_RECURSE SRCS RELATIVE ${CMAKE_CURRENT_LIST_DIR}
# "${GE_SOURCE_DIR}/src/ge/common/util.cc"
"src/omg_stub.cc"
set(SRCS
# "${GE_CODE_DIR}/src/ge/common/util.cc"
"src/omg_stub.cc"
) )


add_library(omg_stub SHARED ${SRCS} ${PROTO_SRCS} ${PROTO_HDRS}) add_library(omg_stub SHARED ${SRCS} ${PROTO_SRCS} ${PROTO_HDRS})
target_link_libraries(omg_stub protobuf::protobuf)

target_compile_definitions(omg_stub PRIVATE
google=ascend_private
)

target_link_libraries(omg_stub PRIVATE
$<BUILD_INTERFACE:intf_pub>
-Wl,--no-as-needed
ascend_protobuf
-Wl,--as-needed
c_sec
json
)

+ 3
- 1
tests/depends/omg/src/omg_stub.cc View File

@@ -643,7 +643,7 @@ Status GetInputOutputDescInfo(uint32_t model_id, vector<InputOutputDescInfo> &in
} }


Status DataInput(const InputData *input_data, OutputData *output_data) { return SUCCESS; } Status DataInput(const InputData *input_data, OutputData *output_data) { return SUCCESS; }
/*
class ModelManager { class ModelManager {
public: public:
static std::shared_ptr<ModelManager> GetInstance(); static std::shared_ptr<ModelManager> GetInstance();
@@ -741,6 +741,8 @@ Status ModelManager::ExecuteModel(uint32_t model_id, rtStream_t stream, bool asy
return SUCCESS; return SUCCESS;
} }


*/

} // namespace ge } // namespace ge


namespace ge { namespace ge {


+ 7
- 3
tests/depends/profiler/CMakeLists.txt View File

@@ -13,12 +13,16 @@
# limitations under the License. # limitations under the License.
# ============================================================================ # ============================================================================


cmake_minimum_required(VERSION 2.8)
#cmake_minimum_required(VERSION 2.8)
project(profiler_stub) project(profiler_stub)


file(GLOB_RECURSE SRC_FILES RELATIVE ${CMAKE_CURRENT_SOURCE_DIR} file(GLOB_RECURSE SRC_FILES RELATIVE ${CMAKE_CURRENT_SOURCE_DIR}
"src/profiler_stub.cc" "src/profiler_stub.cc"
) )
include_directories(${GE_SOURCE_DIR}/third_party/fwkacllib/inc)
include_directories(${GE_CODE_DIR}/third_party/fwkacllib/inc)


add_library(profiler_stub SHARED ${SRC_FILES})
add_library(profiler_stub SHARED ${SRC_FILES})

target_link_libraries(profiler_stub PRIVATE
$<BUILD_INTERFACE:intf_pub>
)

+ 8
- 3
tests/depends/runtime/CMakeLists.txt View File

@@ -13,7 +13,7 @@
# limitations under the License. # limitations under the License.
# ============================================================================ # ============================================================================


cmake_minimum_required(VERSION 2.8)
#cmake_minimum_required(VERSION 2.8)


project(STUB_MMPA) project(STUB_MMPA)


@@ -21,7 +21,12 @@ file(GLOB_RECURSE SRCS RELATIVE ${CMAKE_CURRENT_LIST_DIR}
"src/runtime_stub.cc" "src/runtime_stub.cc"
) )


include_directories(${GE_SOURCE_DIR}/third_party/fwkacllib/inc)
include_directories(${GE_SOURCE_DIR}/inc/framework)
include_directories(${GE_CODE_DIR}/third_party/fwkacllib/inc)
include_directories(${GE_CODE_DIR}/inc/framework)


add_library(runtime_stub SHARED ${SRCS}) add_library(runtime_stub SHARED ${SRCS})

target_link_libraries(runtime_stub PRIVATE
$<BUILD_INTERFACE:intf_pub>
c_sec
)

+ 78
- 1
tests/depends/runtime/src/runtime_stub.cc View File

@@ -221,8 +221,9 @@ rtError_t rtCpuKernelLaunch(const void *so_name, const void *kernel_name, uint32
return RT_ERROR_NONE; return RT_ERROR_NONE;
} }


rtError_t rtModelGetTaskId(void *handle, uint32_t *task_id) {
rtError_t rtModelGetTaskId(void *handle, uint32_t *task_id, uint32_t *stream_id) {
*task_id = 0; *task_id = 0;
*stream_id = 0;
return RT_ERROR_NONE; return RT_ERROR_NONE;
} }
rtError_t rtEndGraph(rtModel_t model, rtStream_t stream) { return RT_ERROR_NONE; } rtError_t rtEndGraph(rtModel_t model, rtStream_t stream) { return RT_ERROR_NONE; }
@@ -307,3 +308,79 @@ rtError_t rtModelBindQueue(rtModel_t model, uint32_t queueId, rtModelQueueFlag_t
{ {
return RT_ERROR_NONE; return RT_ERROR_NONE;
} }

rtError_t rtSetSocVersion(const char *version)
{
return RT_ERROR_NONE;
}

rtError_t rtGetSocVersion(char *version, const uint32_t maxLen)
{
return RT_ERROR_NONE;
}

rtError_t rtSetTaskFailCallback(rtTaskFailCallback callback)
{
return RT_ERROR_NONE;
}

rtError_t rtMallocHostSharedMemory(rtMallocHostSharedMemoryIn *in,
rtMallocHostSharedMemoryOut *out)
{
out->ptr = new uint8_t[in->size];
out->devPtr = new uint8_t[in->size];
return RT_ERROR_NONE;
}

rtError_t rtFreeHostSharedMemory(rtFreeHostSharedMemoryIn *in)
{
delete[] (uint8_t*)in->ptr;
delete[] (uint8_t*)in->devPtr;
return RT_ERROR_NONE;
}

rtError_t rtGetAicpuDeploy(rtAicpuDeployType_t *deplyType)
{
return RT_ERROR_NONE;
}

rtError_t rtDebugRegister(rtModel_t model, uint32_t flag, const void *addr, uint32_t *streamId, uint32_t *taskId)
{
return RT_ERROR_NONE;
}

rtError_t rtDebugUnRegister(rtModel_t model)
{
return RT_ERROR_NONE;
}

rtError_t rtDumpAddrSet(rtModel_t model, void *addr, uint32_t dumpSize, uint32_t flag)
{
return RT_ERROR_NONE;
}

rtError_t rtSetCtxINFMode(bool mode)
{
return RT_ERROR_NONE;
}

rtError_t rtLabelCreateEx(rtLabel_t *label, rtStream_t stream)
{
*label = new uint32_t;
return RT_ERROR_NONE;
}

rtError_t rtGetRtCapability(rtFeatureType_t featureType, int32_t featureInfo, int64_t *value)
{
return RT_ERROR_NONE;
}

rtError_t rtGetMaxStreamAndTask(uint32_t streamType, uint32_t *maxStrCount, uint32_t *maxTaskCount)
{
return RT_ERROR_NONE;
}

rtError_t rtModelExit(rtModel_t model, rtStream_t stream)
{
return RT_ERROR_NONE;
}

+ 6
- 3
tests/depends/slog/CMakeLists.txt View File

@@ -13,11 +13,14 @@
# limitations under the License. # limitations under the License.
# ============================================================================ # ============================================================================


cmake_minimum_required(VERSION 2.8)
#cmake_minimum_required(VERSION 2.8)
project(slog_stub) project(slog_stub)


file(GLOB_RECURSE SRC_FILES RELATIVE ${CMAKE_CURRENT_SOURCE_DIR} file(GLOB_RECURSE SRC_FILES RELATIVE ${CMAKE_CURRENT_SOURCE_DIR}
"src/*.cc" "src/*.cc"
) )
include_directories(${GE_SOURCE_DIR}/third_party/fwkacllib/inc)
add_library(slog_stub SHARED ${SRC_FILES})
include_directories(${GE_CODE_DIR}/third_party/fwkacllib/inc)
add_library(slog_stub SHARED ${SRC_FILES})
target_link_libraries(slog_stub PRIVATE
$<BUILD_INTERFACE:intf_pub>
)

+ 2
- 0
tests/depends/slog/src/slog_stub.cc View File

@@ -38,6 +38,8 @@ void DlogWithKVInner(int module_id, int level, KeyValue *pst_kv_array, int kv_nu
dav_log(module_id, fmt); dav_log(module_id, fmt);
} }


int dlog_setlevel(int module_id, int level, int enable_event) { return DLOG_DEBUG; }

int dlog_getlevel(int module_id, int *enable_event) { return DLOG_DEBUG; } int dlog_getlevel(int module_id, int *enable_event) { return DLOG_DEBUG; }


int CheckLogLevel(int moduleId, int logLevel) int CheckLogLevel(int moduleId, int logLevel)


+ 73
- 51
tests/ut/common/graph/CMakeLists.txt View File

@@ -17,30 +17,34 @@ project(ut_libgraph)


set(CMAKE_CXX_STANDARD 11) set(CMAKE_CXX_STANDARD 11)


file(GLOB_RECURSE PROTO_LIST RELATIVE ${CMAKE_CURRENT_LIST_DIR}
"${GE_SOURCE_DIR}/src/proto/om.proto"
"${GE_SOURCE_DIR}/src/proto/ge_ir.proto"
"${onnx_INC}/onnx/onnx.proto"
set(PROTO_LIST
"${GE_CODE_DIR}/metadef/proto/om.proto"
"${GE_CODE_DIR}/metadef/proto/ge_ir.proto"
"${GE_CODE_DIR}/metadef/proto/proto_inner/ge_onnx.proto"
) )


ge_protobuf_generate(ge PROTO_SRCS PROTO_HDRS ${PROTO_LIST})
protobuf_generate(ge PROTO_SRCS PROTO_HDRS ${PROTO_LIST})


# include directories # include directories
include_directories(${CMAKE_CURRENT_LIST_DIR}) include_directories(${CMAKE_CURRENT_LIST_DIR})
include_directories(${GE_SOURCE_DIR}/src)
include_directories(${GE_SOURCE_DIR}/src/common)
include_directories(${GE_SOURCE_DIR}/src/common/graph)
include_directories(${GE_SOURCE_DIR}/inc)
include_directories(${GE_SOURCE_DIR}/inc/external)
include_directories(${GE_SOURCE_DIR}/inc/external/graph)
include_directories(${GE_SOURCE_DIR}/inc/graph)
include_directories(${GE_SOURCE_DIR}/inc/common)
include_directories(${GE_SOURCE_DIR}/third_party/fwkacllib/inc)
include_directories(${GE_SOURCE_DIR}/third_party/fwkacllib/inc/ops)
include_directories(${GE_CODE_DIR})
include_directories(${GE_CODE_DIR}/metadef)
include_directories(${GE_CODE_DIR}/metadef/graph)
include_directories(${GE_CODE_DIR}/inc)
include_directories(${GE_CODE_DIR}/inc/external)
include_directories(${GE_CODE_DIR}/metadef/inc/external)
include_directories(${GE_CODE_DIR}/metadef/inc/external/graph)
include_directories(${GE_CODE_DIR}/metadef/inc)
include_directories(${GE_CODE_DIR}/metadef/inc/graph)
include_directories(${GE_CODE_DIR}/metadef/inc/common)
include_directories(${GE_CODE_DIR}/metadef/third_party)
include_directories(${GE_CODE_DIR}/third_party/fwkacllib/inc)
include_directories(${GE_CODE_DIR}/third_party/fwkacllib/inc/ops)
include_directories(${CMAKE_BINARY_DIR}) include_directories(${CMAKE_BINARY_DIR})
include_directories(${CMAKE_BINARY_DIR}/proto/ge) include_directories(${CMAKE_BINARY_DIR}/proto/ge)
include_directories(${CMAKE_BINARY_DIR}/proto/ge/proto)


file(GLOB_RECURSE UT_FILES RELATIVE ${CMAKE_CURRENT_SOURCE_DIR}
set(UT_FILES
"testcase/ge_graph/ge_anchor_utils_unittest.cc" "testcase/ge_graph/ge_anchor_utils_unittest.cc"
"testcase/ge_graph/ge_def_type_unittest.cc" "testcase/ge_graph/ge_def_type_unittest.cc"
"testcase/ge_graph/ge_graph_anchor_unittest.cc" "testcase/ge_graph/ge_graph_anchor_unittest.cc"
@@ -56,41 +60,59 @@ file(GLOB_RECURSE UT_FILES RELATIVE ${CMAKE_CURRENT_SOURCE_DIR}
"testcase/ge_graph/ge_model_unittest.cc" "testcase/ge_graph/ge_model_unittest.cc"
) )


file(GLOB_RECURSE SRC_FILES RELATIVE ${CMAKE_CURRENT_SOURCE_DIR}
"${GE_SOURCE_DIR}/src/common/graph/option/ge_local_context.cc"
"${GE_SOURCE_DIR}/src/common/graph/option/ge_context.cc"
"${GE_SOURCE_DIR}/src/common/graph/anchor.cc"
"${GE_SOURCE_DIR}/src/common/graph/ge_attr_value.cc"
"${GE_SOURCE_DIR}/src/common/graph/attr_value.cc"
"${GE_SOURCE_DIR}/src/common/graph/buffer.cc"
"${GE_SOURCE_DIR}/src/common/graph/compute_graph.cc"
"${GE_SOURCE_DIR}/src/common/graph/ge_attr_define.cc"
"${GE_SOURCE_DIR}/src/common/graph/graph.cc"
"${GE_SOURCE_DIR}/src/common/graph/model.cc"
"${GE_SOURCE_DIR}/src/common/graph/model_serialize.cc"
"${GE_SOURCE_DIR}/src/common/graph/node.cc"
"${GE_SOURCE_DIR}/src/common/graph/op_desc.cc"
"${GE_SOURCE_DIR}/src/common/graph/operator.cc"
"${GE_SOURCE_DIR}/src/common/graph/operator_reg.cc"
"${GE_SOURCE_DIR}/src/common/graph/operator_factory.cc"
"${GE_SOURCE_DIR}/src/common/graph/operator_factory_impl.cc"
"${GE_SOURCE_DIR}/src/common/graph/range_vistor.cc"
"${GE_SOURCE_DIR}/src/common/graph/tensor.cc"
"${GE_SOURCE_DIR}/src/common/graph/ge_tensor.cc"
"${GE_SOURCE_DIR}/src/common/graph/shape_refiner.cc"
"${GE_SOURCE_DIR}/src/common/graph/format_refiner.cc"
"${GE_SOURCE_DIR}/src/common/graph/inference_context.cc"
"${GE_SOURCE_DIR}/src/common/graph/detail/attributes_holder.cc"
"${GE_SOURCE_DIR}/src/common/graph/utils/anchor_utils.cc"
"${GE_SOURCE_DIR}/src/common/graph/utils/graph_utils.cc"
"${GE_SOURCE_DIR}/src/common/graph/utils/node_utils.cc"
"${GE_SOURCE_DIR}/src/common/graph/utils/op_desc_utils.cc"
"${GE_SOURCE_DIR}/src/common/graph/utils/type_utils.cc"
"${GE_SOURCE_DIR}/src/common/graph/utils/ge_ir_utils.cc"
"${GE_SOURCE_DIR}/src/common/graph/utils/tensor_utils.cc"
"${GE_SOURCE_DIR}/src/common/ops/op_imp.cc"
"${GE_SOURCE_DIR}/src/common/graph/opsproto/opsproto_manager.cc"
set(SRC_FILES
#"${GE_CODE_DIR}/metadef/graph/option/ge_local_context.cc"
#"${GE_CODE_DIR}/metadef/graph/option/ge_context.cc"
#"${GE_CODE_DIR}/metadef/graph/anchor.cc"
#"${GE_CODE_DIR}/metadef/graph/ge_attr_value.cc"
#"${GE_CODE_DIR}/metadef/graph/attr_value.cc"
#"${GE_CODE_DIR}/metadef/graph/buffer.cc"
#"${GE_CODE_DIR}/metadef/graph/compute_graph.cc"
#"${GE_CODE_DIR}/metadef/graph/ge_attr_define.cc"
#"${GE_CODE_DIR}/metadef/graph/graph.cc"
#"${GE_CODE_DIR}/metadef/graph/gnode.cc"
#"${GE_CODE_DIR}/metadef/graph/ascend_string.cc"
#"${GE_CODE_DIR}/metadef/graph/model.cc"
#"${GE_CODE_DIR}/metadef/graph/model_serialize.cc"
#"${GE_CODE_DIR}/metadef/graph/node.cc"
#"${GE_CODE_DIR}/metadef/graph/op_desc.cc"
#"${GE_CODE_DIR}/metadef/graph/operator.cc"
#"${GE_CODE_DIR}/metadef/graph/operator_reg.cc"
#"${GE_CODE_DIR}/metadef/graph/operator_factory.cc"
#"${GE_CODE_DIR}/metadef/graph/operator_factory_impl.cc"
#"${GE_CODE_DIR}/metadef/graph/range_vistor.cc"
#"${GE_CODE_DIR}/metadef/graph/tensor.cc"
#"${GE_CODE_DIR}/metadef/graph/ge_tensor.cc"
#"${GE_CODE_DIR}/metadef/graph/shape_refiner.cc"
#"${GE_CODE_DIR}/metadef/graph/format_refiner.cc"
#"${GE_CODE_DIR}/metadef/graph/inference_context.cc"
#"${GE_CODE_DIR}/metadef/graph/detail/attributes_holder.cc"
#"${GE_CODE_DIR}/metadef/graph/utils/anchor_utils.cc"
#"${GE_CODE_DIR}/metadef/graph/utils/graph_utils.cc"
#"${GE_CODE_DIR}/metadef/graph/utils/node_utils.cc"
#"${GE_CODE_DIR}/metadef/graph/utils/op_desc_utils.cc"
#"${GE_CODE_DIR}/metadef/graph/utils/type_utils.cc"
#"${GE_CODE_DIR}/metadef/graph/utils/ge_ir_utils.cc"
#"${GE_CODE_DIR}/metadef/graph/utils/tensor_utils.cc"
"${GE_CODE_DIR}/metadef/ops/op_imp.cpp"
#"${GE_CODE_DIR}/metadef/graph/opsproto/opsproto_manager.cc"
) )


#add_executable(ut_libgraph ${UT_FILES} ${SRC_FILES} ${PROTO_SRCS} ${PROTO_HDRS})
add_executable(ut_libgraph ${UT_FILES} ${SRC_FILES} ${PROTO_SRCS} ${PROTO_HDRS}) add_executable(ut_libgraph ${UT_FILES} ${SRC_FILES} ${PROTO_SRCS} ${PROTO_HDRS})
target_link_libraries(ut_libgraph graphengine::gtest graphengine::gtest_main slog_stub protobuf::protobuf graphengine::securec rt dl)

target_compile_definitions(ut_libgraph PRIVATE
google=ascend_private
)

target_link_libraries(ut_libgraph
$<BUILD_INTERFACE:intf_pub>
graph
gtest
gtest_main
slog_stub
ascend_protobuf
c_sec
-lrt
-ldl
)

+ 16
- 16
tests/ut/common/graph/testcase/ge_graph/ge_format_refiner_unittest.cc View File

@@ -85,7 +85,7 @@ ut::GraphBuilder BuildGraph1() {
builder.AddDataEdge(var2, 0, conv1, 1); builder.AddDataEdge(var2, 0, conv1, 1);
builder.AddDataEdge(conv1, 0, relu1, 0); builder.AddDataEdge(conv1, 0, relu1, 0);
builder.AddDataEdge(relu1, 0, netoutput1, 0); builder.AddDataEdge(relu1, 0, netoutput1, 0);
FormatRefiner::SetInferOrigineFormatFlag(true);
//FormatRefiner::SetInferOrigineFormatFlag(true);
return builder; return builder;
} }


@@ -134,7 +134,7 @@ ut::GraphBuilder BuildGraph2() {
builder.AddDataEdge(var6, 0, bn1, 4); builder.AddDataEdge(var6, 0, bn1, 4);
builder.AddDataEdge(bn1, 0, relu1, 0); builder.AddDataEdge(bn1, 0, relu1, 0);
builder.AddDataEdge(relu1, 0, netoutput1, 0); builder.AddDataEdge(relu1, 0, netoutput1, 0);
FormatRefiner::SetInferOrigineFormatFlag(true);
//FormatRefiner::SetInferOrigineFormatFlag(true);
return builder; return builder;
} }


@@ -189,7 +189,7 @@ ut::GraphBuilder BuildGraph3() {
builder.AddDataEdge(relu1, 0, conv2, 0); builder.AddDataEdge(relu1, 0, conv2, 0);
builder.AddDataEdge(var3, 0, conv2, 1); builder.AddDataEdge(var3, 0, conv2, 1);
builder.AddDataEdge(conv2, 0, netoutput1, 0); builder.AddDataEdge(conv2, 0, netoutput1, 0);
FormatRefiner::SetInferOrigineFormatFlag(true);
//FormatRefiner::SetInferOrigineFormatFlag(true);
return builder; return builder;
} }


@@ -248,7 +248,7 @@ ut::GraphBuilder BuildGraph4() {
builder.AddDataEdge(relu1, 0, conv2, 0); builder.AddDataEdge(relu1, 0, conv2, 0);
builder.AddDataEdge(var3, 0, conv2, 1); builder.AddDataEdge(var3, 0, conv2, 1);
builder.AddDataEdge(conv2, 0, netoutput1, 0); builder.AddDataEdge(conv2, 0, netoutput1, 0);
FormatRefiner::SetInferOrigineFormatFlag(true);
//FormatRefiner::SetInferOrigineFormatFlag(true);
return builder; return builder;
} }


@@ -305,7 +305,7 @@ ut::GraphBuilder BuilderGraph5() {
builder.AddDataEdge(relug1, 0, bng1, 0); builder.AddDataEdge(relug1, 0, bng1, 0);
builder.AddDataEdge(bng1, 0, apply1, 0); builder.AddDataEdge(bng1, 0, apply1, 0);
builder.AddDataEdge(apply1, 0, netoutput1, 0); builder.AddDataEdge(apply1, 0, netoutput1, 0);
FormatRefiner::SetInferOrigineFormatFlag(true);
//FormatRefiner::SetInferOrigineFormatFlag(true);
return builder; return builder;
} }


@@ -353,7 +353,7 @@ ut::GraphBuilder BuildGraph6() {
builder.AddDataEdge(constant, 0, addn, 2); builder.AddDataEdge(constant, 0, addn, 2);
builder.AddDataEdge(addn, 0, netoutput, 0); builder.AddDataEdge(addn, 0, netoutput, 0);


FormatRefiner::SetInferOrigineFormatFlag(true);
//FormatRefiner::SetInferOrigineFormatFlag(true);


return builder; return builder;
} }
@@ -397,7 +397,7 @@ ut::GraphBuilder BuildGraph7() {
builder.AddDataEdge(constant, 0, addn, 2); builder.AddDataEdge(constant, 0, addn, 2);
builder.AddDataEdge(addn, 0, netoutput, 0); builder.AddDataEdge(addn, 0, netoutput, 0);


FormatRefiner::SetInferOrigineFormatFlag(true);
//FormatRefiner::SetInferOrigineFormatFlag(true);


return builder; return builder;
} }
@@ -449,15 +449,15 @@ ut::GraphBuilder BuildGraph8() {
builder.AddDataEdge(relu, 0, reshape, 0); builder.AddDataEdge(relu, 0, reshape, 0);
builder.AddDataEdge(reshape, 0, conv, 1); builder.AddDataEdge(reshape, 0, conv, 1);
builder.AddDataEdge(conv, 0, netoutput, 0); builder.AddDataEdge(conv, 0, netoutput, 0);
FormatRefiner::SetInferOrigineFormatFlag(true);
//FormatRefiner::SetInferOrigineFormatFlag(true);
return builder; return builder;
} }
} // namespace } // namespace
/*
TEST_F(UtestFormatRefiner, data_format) { TEST_F(UtestFormatRefiner, data_format) {
auto builder = BuildGraph8(); auto builder = BuildGraph8();
auto graph = builder.GetGraph(); auto graph = builder.GetGraph();
FormatRefiner::SetInferOrigineFormatFlag(false);
//FormatRefiner::SetInferOrigineFormatFlag(false);
graph->SaveDataFormat(FORMAT_NCHW); graph->SaveDataFormat(FORMAT_NCHW);
EXPECT_EQ(FormatRefiner::InferOrigineFormat(graph), GRAPH_SUCCESS); EXPECT_EQ(FormatRefiner::InferOrigineFormat(graph), GRAPH_SUCCESS);
auto data2 = graph->FindNode("data2"); auto data2 = graph->FindNode("data2");
@@ -466,18 +466,18 @@ TEST_F(UtestFormatRefiner, data_format) {
EXPECT_EQ(data2->GetOpDesc()->GetOutputDesc(0).GetOriginFormat(), FORMAT_NCHW); EXPECT_EQ(data2->GetOpDesc()->GetOutputDesc(0).GetOriginFormat(), FORMAT_NCHW);
EXPECT_EQ(relu->GetOpDesc()->GetInputDesc(0).GetOriginFormat(), FORMAT_NCHW); EXPECT_EQ(relu->GetOpDesc()->GetInputDesc(0).GetOriginFormat(), FORMAT_NCHW);
EXPECT_EQ(relu->GetOpDesc()->GetOutputDesc(0).GetOriginFormat(), FORMAT_NCHW); EXPECT_EQ(relu->GetOpDesc()->GetOutputDesc(0).GetOriginFormat(), FORMAT_NCHW);
FormatRefiner::SetInferOrigineFormatFlag(true);
//FormatRefiner::SetInferOrigineFormatFlag(true);
} }
*/
TEST_F(UtestFormatRefiner, constant_fail) { TEST_F(UtestFormatRefiner, constant_fail) {
FormatRefiner::SetInferOrigineFormatFlag(true);
//FormatRefiner::SetInferOrigineFormatFlag(true);
auto builder = BuildGraph6(); auto builder = BuildGraph6();
auto graph = builder.GetGraph(); auto graph = builder.GetGraph();
EXPECT_EQ(FormatRefiner::InferOrigineFormat(graph), GRAPH_FAILED); EXPECT_EQ(FormatRefiner::InferOrigineFormat(graph), GRAPH_FAILED);
} }


TEST_F(UtestFormatRefiner, scalar_nodes_infer) { TEST_F(UtestFormatRefiner, scalar_nodes_infer) {
FormatRefiner::SetInferOrigineFormatFlag(true);
//FormatRefiner::SetInferOrigineFormatFlag(true);
auto builder = BuildGraph6(); auto builder = BuildGraph6();
auto graph = builder.GetGraph(); auto graph = builder.GetGraph();
auto constant = graph->FindNode("constant"); auto constant = graph->FindNode("constant");
@@ -650,7 +650,7 @@ TEST_F(UtestFormatRefiner, infer_origine_format_failed) {
} }


TEST_F(UtestFormatRefiner, save_format) { TEST_F(UtestFormatRefiner, save_format) {
FormatRefiner::SetInferOrigineFormatFlag(true);
//FormatRefiner::SetInferOrigineFormatFlag(true);
auto builder = BuildGraph6(); auto builder = BuildGraph6();
auto graph = builder.GetGraph(); auto graph = builder.GetGraph();
graph->SaveDataFormat(FORMAT_NHWC); graph->SaveDataFormat(FORMAT_NHWC);
@@ -658,4 +658,4 @@ TEST_F(UtestFormatRefiner, save_format) {
EXPECT_EQ(save_format, FORMAT_NHWC); EXPECT_EQ(save_format, FORMAT_NHWC);
graph->SaveDataFormat(FORMAT_ND); graph->SaveDataFormat(FORMAT_ND);
} }
} // namespace ge
} // namespace ge

+ 55
- 55
tests/ut/common/graph/testcase/ge_graph/ge_model_serialize_unittest.cc View File

@@ -1060,7 +1060,7 @@ TEST(UtestGeModelSerialize, test_model_serialize_imp_invalid_param) {
auto graph = std::make_shared<ComputeGraph>("test_graph"); auto graph = std::make_shared<ComputeGraph>("test_graph");
auto node = graph->AddNode(std::make_shared<OpDesc>()); auto node = graph->AddNode(std::make_shared<OpDesc>());
node->op_ = nullptr; node->op_ = nullptr;
proto::ModelDef model_def;
ge::proto::ModelDef model_def;
Model model; Model model;
model.SetGraph(GraphUtils::CreateGraphFromComputeGraph(graph)); model.SetGraph(GraphUtils::CreateGraphFromComputeGraph(graph));
EXPECT_FALSE(imp.SerializeModel(model, &model_def)); EXPECT_FALSE(imp.SerializeModel(model, &model_def));
@@ -1101,26 +1101,26 @@ TEST(UTEST_ge_model_unserialize, test_invalid_tensor) {


TEST(UTEST_ge_model_unserialize, test_invalid_TensorDesc) { TEST(UTEST_ge_model_unserialize, test_invalid_TensorDesc) {
{ // valid { // valid
proto::ModelDef mode_def;
ge::proto::ModelDef mode_def;
auto attrs = mode_def.mutable_attr(); auto attrs = mode_def.mutable_attr();


proto::AttrDef *attr_def = &(*attrs)["key1"];
ge::proto::AttrDef *attr_def = &(*attrs)["key1"];
auto tensor_desc_attr = attr_def->mutable_td(); auto tensor_desc_attr = attr_def->mutable_td();
tensor_desc_attr->set_layout("NCHW"); tensor_desc_attr->set_layout("NCHW");
tensor_desc_attr->set_dtype(proto::DataType::DT_INT8);
tensor_desc_attr->set_dtype(ge::proto::DataType::DT_INT8);


ModelSerializeImp imp; ModelSerializeImp imp;
Model model; Model model;
EXPECT_TRUE(imp.UnserializeModel(model, mode_def)); EXPECT_TRUE(imp.UnserializeModel(model, mode_def));
} }
{ // invalid layout { // invalid layout
proto::ModelDef mode_def;
ge::proto::ModelDef mode_def;
auto attrs = mode_def.mutable_attr(); auto attrs = mode_def.mutable_attr();


proto::AttrDef *attr_def = &(*attrs)["key1"];
ge::proto::AttrDef *attr_def = &(*attrs)["key1"];
auto tensor_desc_attr = attr_def->mutable_td(); auto tensor_desc_attr = attr_def->mutable_td();
tensor_desc_attr->set_layout("InvalidLayout"); tensor_desc_attr->set_layout("InvalidLayout");
tensor_desc_attr->set_dtype(proto::DataType::DT_INT8);
tensor_desc_attr->set_dtype(ge::proto::DataType::DT_INT8);


ModelSerializeImp imp; ModelSerializeImp imp;
Model model; Model model;
@@ -1131,13 +1131,13 @@ TEST(UTEST_ge_model_unserialize, test_invalid_TensorDesc) {
EXPECT_EQ(tensor_desc.GetDataType(), DT_INT8); EXPECT_EQ(tensor_desc.GetDataType(), DT_INT8);
} }
{ // invalid datatype { // invalid datatype
proto::ModelDef mode_def;
ge::proto::ModelDef mode_def;
auto attrs = mode_def.mutable_attr(); auto attrs = mode_def.mutable_attr();


proto::AttrDef *attr_def = &(*attrs)["key1"];
ge::proto::AttrDef *attr_def = &(*attrs)["key1"];
auto tensor_desc_attr = attr_def->mutable_td(); // tensor desc auto tensor_desc_attr = attr_def->mutable_td(); // tensor desc
tensor_desc_attr->set_layout("NHWC"); tensor_desc_attr->set_layout("NHWC");
tensor_desc_attr->set_dtype((proto::DataType)100);
tensor_desc_attr->set_dtype((ge::proto::DataType)100);


ModelSerializeImp imp; ModelSerializeImp imp;
Model model; Model model;
@@ -1148,13 +1148,13 @@ TEST(UTEST_ge_model_unserialize, test_invalid_TensorDesc) {
EXPECT_EQ(tensor_desc.GetDataType(), DT_UNDEFINED); EXPECT_EQ(tensor_desc.GetDataType(), DT_UNDEFINED);
} }
{ // invalid datatype { // invalid datatype
proto::ModelDef mode_def;
ge::proto::ModelDef mode_def;
auto attrs = mode_def.mutable_attr(); auto attrs = mode_def.mutable_attr();


proto::AttrDef *attr_def = &(*attrs)["key1"];
ge::proto::AttrDef *attr_def = &(*attrs)["key1"];
auto tensor_desc_attr = attr_def->mutable_t()->mutable_desc(); // tensor auto tensor_desc_attr = attr_def->mutable_t()->mutable_desc(); // tensor
tensor_desc_attr->set_layout("NHWC"); tensor_desc_attr->set_layout("NHWC");
tensor_desc_attr->set_dtype((proto::DataType)100);
tensor_desc_attr->set_dtype((ge::proto::DataType)100);


ModelSerializeImp imp; ModelSerializeImp imp;
Model model; Model model;
@@ -1167,13 +1167,13 @@ TEST(UTEST_ge_model_unserialize, test_invalid_TensorDesc) {
EXPECT_EQ(tensor_desc.GetDataType(), DT_UNDEFINED); EXPECT_EQ(tensor_desc.GetDataType(), DT_UNDEFINED);
} }
{ // invalid attrmap { // invalid attrmap
proto::ModelDef mode_def;
ge::proto::ModelDef mode_def;
auto attrs = mode_def.add_graph()->mutable_attr(); // graph attr auto attrs = mode_def.add_graph()->mutable_attr(); // graph attr


proto::AttrDef *attr_def = &(*attrs)["key1"];
ge::proto::AttrDef *attr_def = &(*attrs)["key1"];
auto tensor_desc_attr = attr_def->mutable_t()->mutable_desc(); // tensor auto tensor_desc_attr = attr_def->mutable_t()->mutable_desc(); // tensor
tensor_desc_attr->set_layout("NCHW"); tensor_desc_attr->set_layout("NCHW");
tensor_desc_attr->set_dtype(proto::DataType::DT_INT8);
tensor_desc_attr->set_dtype(ge::proto::DataType::DT_INT8);
auto attrs1 = tensor_desc_attr->mutable_attr(); auto attrs1 = tensor_desc_attr->mutable_attr();
auto attr1 = (*attrs1)["key2"]; // empty attr auto attr1 = (*attrs1)["key2"]; // empty attr


@@ -1191,13 +1191,13 @@ TEST(UTEST_ge_model_unserialize, test_invalid_TensorDesc) {
EXPECT_EQ(attr_value.GetValueType(), GeAttrValue::VT_NONE); EXPECT_EQ(attr_value.GetValueType(), GeAttrValue::VT_NONE);
} }
{ // invalid attrmap2 { // invalid attrmap2
proto::ModelDef mode_def;
ge::proto::ModelDef mode_def;
auto attrs = mode_def.add_graph()->add_op()->mutable_attr(); // node attr auto attrs = mode_def.add_graph()->add_op()->mutable_attr(); // node attr


proto::AttrDef *attr_def = &(*attrs)["key1"];
ge::proto::AttrDef *attr_def = &(*attrs)["key1"];
auto tensor_desc_attr = attr_def->mutable_t()->mutable_desc(); // tensor auto tensor_desc_attr = attr_def->mutable_t()->mutable_desc(); // tensor
tensor_desc_attr->set_layout("NCHW"); tensor_desc_attr->set_layout("NCHW");
tensor_desc_attr->set_dtype(proto::DataType::DT_INT8);
tensor_desc_attr->set_dtype(ge::proto::DataType::DT_INT8);
auto attrs1 = tensor_desc_attr->mutable_attr(); auto attrs1 = tensor_desc_attr->mutable_attr();
auto attr1 = (*attrs1)["key2"].mutable_list(); // empty list attr auto attr1 = (*attrs1)["key2"].mutable_list(); // empty list attr


@@ -1219,14 +1219,14 @@ TEST(UTEST_ge_model_unserialize, test_invalid_TensorDesc) {
} }
TEST(UTEST_ge_model_unserialize, test_invalid_attr) { TEST(UTEST_ge_model_unserialize, test_invalid_attr) {
{ // invalid graph { // invalid graph
proto::ModelDef mode_def;
ge::proto::ModelDef mode_def;
auto attrs = mode_def.add_graph()->add_op()->mutable_attr(); // node attr auto attrs = mode_def.add_graph()->add_op()->mutable_attr(); // node attr


proto::AttrDef *attr_def = &(*attrs)["key1"];
ge::proto::AttrDef *attr_def = &(*attrs)["key1"];
auto graph_attr = attr_def->mutable_g(); auto graph_attr = attr_def->mutable_g();
auto attrs_of_graph = graph_attr->mutable_attr(); auto attrs_of_graph = graph_attr->mutable_attr();
auto tensor_val = (*attrs_of_graph)["key2"].mutable_td(); auto tensor_val = (*attrs_of_graph)["key2"].mutable_td();
tensor_val->set_dtype(proto::DT_INT8);
tensor_val->set_dtype(ge::proto::DT_INT8);
tensor_val->set_layout("invalidLayout"); tensor_val->set_layout("invalidLayout");


ModelSerializeImp imp; ModelSerializeImp imp;
@@ -1245,15 +1245,15 @@ TEST(UTEST_ge_model_unserialize, test_invalid_attr) {
EXPECT_EQ(tensor_desc1.GetDataType(), DT_INT8); EXPECT_EQ(tensor_desc1.GetDataType(), DT_INT8);
} }
{ // invalid list graph { // invalid list graph
proto::ModelDef mode_def;
ge::proto::ModelDef mode_def;
auto attrs = mode_def.add_graph()->add_op()->mutable_attr(); // node attr auto attrs = mode_def.add_graph()->add_op()->mutable_attr(); // node attr


proto::AttrDef *attr_def = &(*attrs)["key1"];
ge::proto::AttrDef *attr_def = &(*attrs)["key1"];
attr_def->mutable_list()->set_val_type(ge::proto::AttrDef_ListValue_ListValueType_VT_LIST_GRAPH); attr_def->mutable_list()->set_val_type(ge::proto::AttrDef_ListValue_ListValueType_VT_LIST_GRAPH);
auto graph_attr = attr_def->mutable_list()->add_g(); auto graph_attr = attr_def->mutable_list()->add_g();
auto attrs_of_graph = graph_attr->mutable_attr(); auto attrs_of_graph = graph_attr->mutable_attr();
auto tensor_val = (*attrs_of_graph)["key2"].mutable_td(); auto tensor_val = (*attrs_of_graph)["key2"].mutable_td();
tensor_val->set_dtype(proto::DT_INT8);
tensor_val->set_dtype(ge::proto::DT_INT8);
tensor_val->set_layout("invalidLayout"); tensor_val->set_layout("invalidLayout");


ModelSerializeImp imp; ModelSerializeImp imp;
@@ -1273,14 +1273,14 @@ TEST(UTEST_ge_model_unserialize, test_invalid_attr) {
EXPECT_EQ(tensor_desc1.GetDataType(), DT_INT8); EXPECT_EQ(tensor_desc1.GetDataType(), DT_INT8);
} }
{ // invalid named_attrs { // invalid named_attrs
proto::ModelDef mode_def;
ge::proto::ModelDef mode_def;
auto attrs = mode_def.add_graph()->add_op()->mutable_attr(); // node attr auto attrs = mode_def.add_graph()->add_op()->mutable_attr(); // node attr


proto::AttrDef *attr_def = &(*attrs)["key1"];
ge::proto::AttrDef *attr_def = &(*attrs)["key1"];
auto graph_attr = attr_def->mutable_func(); auto graph_attr = attr_def->mutable_func();
auto attrs_of_graph = graph_attr->mutable_attr(); auto attrs_of_graph = graph_attr->mutable_attr();
auto tensor_val = (*attrs_of_graph)["key2"].mutable_td(); auto tensor_val = (*attrs_of_graph)["key2"].mutable_td();
tensor_val->set_dtype(proto::DT_INT8);
tensor_val->set_dtype(ge::proto::DT_INT8);
tensor_val->set_layout("invalidLayout"); tensor_val->set_layout("invalidLayout");


ModelSerializeImp imp; ModelSerializeImp imp;
@@ -1298,15 +1298,15 @@ TEST(UTEST_ge_model_unserialize, test_invalid_attr) {
EXPECT_EQ(tensor_desc1.GetDataType(), DT_INT8); EXPECT_EQ(tensor_desc1.GetDataType(), DT_INT8);
} }
{ // invalid list named_attrs { // invalid list named_attrs
proto::ModelDef mode_def;
ge::proto::ModelDef mode_def;
auto attrs = mode_def.add_graph()->add_op()->mutable_attr(); // node attr auto attrs = mode_def.add_graph()->add_op()->mutable_attr(); // node attr


proto::AttrDef *attr_def = &(*attrs)["key1"];
ge::proto::AttrDef *attr_def = &(*attrs)["key1"];
attr_def->mutable_list()->set_val_type(ge::proto::AttrDef_ListValue_ListValueType_VT_LIST_NAMED_ATTRS); attr_def->mutable_list()->set_val_type(ge::proto::AttrDef_ListValue_ListValueType_VT_LIST_NAMED_ATTRS);
auto graph_attr = attr_def->mutable_list()->add_na(); auto graph_attr = attr_def->mutable_list()->add_na();
auto attrs_of_graph = graph_attr->mutable_attr(); auto attrs_of_graph = graph_attr->mutable_attr();
auto tensor_val = (*attrs_of_graph)["key2"].mutable_td(); auto tensor_val = (*attrs_of_graph)["key2"].mutable_td();
tensor_val->set_dtype(proto::DT_INT8);
tensor_val->set_dtype(ge::proto::DT_INT8);
tensor_val->set_layout("invalidLayout"); tensor_val->set_layout("invalidLayout");


ModelSerializeImp imp; ModelSerializeImp imp;
@@ -1325,14 +1325,14 @@ TEST(UTEST_ge_model_unserialize, test_invalid_attr) {
EXPECT_EQ(tensor_desc1.GetDataType(), DT_INT8); EXPECT_EQ(tensor_desc1.GetDataType(), DT_INT8);
} }
{ // invalid tensor_desc { // invalid tensor_desc
proto::ModelDef mode_def;
ge::proto::ModelDef mode_def;
auto attrs = mode_def.add_graph()->add_op()->mutable_attr(); // node attr auto attrs = mode_def.add_graph()->add_op()->mutable_attr(); // node attr


proto::AttrDef *attr_def = &(*attrs)["key1"];
ge::proto::AttrDef *attr_def = &(*attrs)["key1"];
auto graph_attr = attr_def->mutable_td(); auto graph_attr = attr_def->mutable_td();
auto attrs_of_graph = graph_attr->mutable_attr(); auto attrs_of_graph = graph_attr->mutable_attr();
auto tensor_val = (*attrs_of_graph)["key2"].mutable_td(); auto tensor_val = (*attrs_of_graph)["key2"].mutable_td();
tensor_val->set_dtype(proto::DT_INT8);
tensor_val->set_dtype(ge::proto::DT_INT8);
tensor_val->set_layout("invalidLayout"); tensor_val->set_layout("invalidLayout");


ModelSerializeImp imp; ModelSerializeImp imp;
@@ -1350,15 +1350,15 @@ TEST(UTEST_ge_model_unserialize, test_invalid_attr) {
EXPECT_EQ(tensor_desc1.GetDataType(), DT_INT8); EXPECT_EQ(tensor_desc1.GetDataType(), DT_INT8);
} }
{ // invalid list tensor_desc { // invalid list tensor_desc
proto::ModelDef mode_def;
ge::proto::ModelDef mode_def;
auto attrs = mode_def.add_graph()->add_op()->mutable_attr(); // node attr auto attrs = mode_def.add_graph()->add_op()->mutable_attr(); // node attr


proto::AttrDef *attr_def = &(*attrs)["key1"];
ge::proto::AttrDef *attr_def = &(*attrs)["key1"];
attr_def->mutable_list()->set_val_type(ge::proto::AttrDef_ListValue_ListValueType_VT_LIST_TENSOR_DESC); attr_def->mutable_list()->set_val_type(ge::proto::AttrDef_ListValue_ListValueType_VT_LIST_TENSOR_DESC);
auto graph_attr = attr_def->mutable_list()->add_td(); auto graph_attr = attr_def->mutable_list()->add_td();
auto attrs_of_graph = graph_attr->mutable_attr(); auto attrs_of_graph = graph_attr->mutable_attr();
auto tensor_val = (*attrs_of_graph)["key2"].mutable_td(); auto tensor_val = (*attrs_of_graph)["key2"].mutable_td();
tensor_val->set_dtype(proto::DT_INT8);
tensor_val->set_dtype(ge::proto::DT_INT8);
tensor_val->set_layout("invalidLayout"); tensor_val->set_layout("invalidLayout");


ModelSerializeImp imp; ModelSerializeImp imp;
@@ -1377,14 +1377,14 @@ TEST(UTEST_ge_model_unserialize, test_invalid_attr) {
EXPECT_EQ(tensor_desc1.GetDataType(), DT_INT8); EXPECT_EQ(tensor_desc1.GetDataType(), DT_INT8);
} }
{ // invalid tensor { // invalid tensor
proto::ModelDef mode_def;
ge::proto::ModelDef mode_def;
auto attrs = mode_def.add_graph()->add_op()->mutable_attr(); // node attr auto attrs = mode_def.add_graph()->add_op()->mutable_attr(); // node attr


proto::AttrDef *attr_def = &(*attrs)["key1"];
ge::proto::AttrDef *attr_def = &(*attrs)["key1"];
auto graph_attr = attr_def->mutable_t()->mutable_desc(); auto graph_attr = attr_def->mutable_t()->mutable_desc();
auto attrs_of_graph = graph_attr->mutable_attr(); auto attrs_of_graph = graph_attr->mutable_attr();
auto tensor_val = (*attrs_of_graph)["key2"].mutable_td(); auto tensor_val = (*attrs_of_graph)["key2"].mutable_td();
tensor_val->set_dtype(proto::DT_INT8);
tensor_val->set_dtype(ge::proto::DT_INT8);
tensor_val->set_layout("invalidLayout"); tensor_val->set_layout("invalidLayout");


ModelSerializeImp imp; ModelSerializeImp imp;
@@ -1402,15 +1402,15 @@ TEST(UTEST_ge_model_unserialize, test_invalid_attr) {
EXPECT_EQ(tensor_desc1.GetDataType(), DT_INT8); EXPECT_EQ(tensor_desc1.GetDataType(), DT_INT8);
} }
{ // invalid list tensor { // invalid list tensor
proto::ModelDef mode_def;
ge::proto::ModelDef mode_def;
auto attrs = mode_def.add_graph()->add_op()->mutable_attr(); // node attr auto attrs = mode_def.add_graph()->add_op()->mutable_attr(); // node attr


proto::AttrDef *attr_def = &(*attrs)["key1"];
ge::proto::AttrDef *attr_def = &(*attrs)["key1"];
attr_def->mutable_list()->set_val_type(ge::proto::AttrDef_ListValue_ListValueType_VT_LIST_TENSOR); attr_def->mutable_list()->set_val_type(ge::proto::AttrDef_ListValue_ListValueType_VT_LIST_TENSOR);
auto graph_attr = attr_def->mutable_list()->add_t()->mutable_desc(); auto graph_attr = attr_def->mutable_list()->add_t()->mutable_desc();
auto attrs_of_graph = graph_attr->mutable_attr(); auto attrs_of_graph = graph_attr->mutable_attr();
auto tensor_val = (*attrs_of_graph)["key2"].mutable_td(); auto tensor_val = (*attrs_of_graph)["key2"].mutable_td();
tensor_val->set_dtype(proto::DT_INT8);
tensor_val->set_dtype(ge::proto::DT_INT8);
tensor_val->set_layout("invalidLayout"); tensor_val->set_layout("invalidLayout");


ModelSerializeImp imp; ModelSerializeImp imp;
@@ -1429,15 +1429,15 @@ TEST(UTEST_ge_model_unserialize, test_invalid_attr) {
EXPECT_EQ(tensor_desc1.GetDataType(), DT_INT8); EXPECT_EQ(tensor_desc1.GetDataType(), DT_INT8);
} }
{ // invalid list tensor { // invalid list tensor
proto::GraphDef graph_def;
ge::proto::GraphDef graph_def;
auto attrs = graph_def.add_op()->mutable_attr(); // node attr auto attrs = graph_def.add_op()->mutable_attr(); // node attr


proto::AttrDef *attr_def = &(*attrs)["key1"];
ge::proto::AttrDef *attr_def = &(*attrs)["key1"];
attr_def->mutable_list()->set_val_type(ge::proto::AttrDef_ListValue_ListValueType_VT_LIST_TENSOR); attr_def->mutable_list()->set_val_type(ge::proto::AttrDef_ListValue_ListValueType_VT_LIST_TENSOR);
auto graph_attr = attr_def->mutable_list()->add_t()->mutable_desc(); auto graph_attr = attr_def->mutable_list()->add_t()->mutable_desc();
auto attrs_of_graph = graph_attr->mutable_attr(); auto attrs_of_graph = graph_attr->mutable_attr();
auto tensor_val = (*attrs_of_graph)["key2"].mutable_td(); auto tensor_val = (*attrs_of_graph)["key2"].mutable_td();
tensor_val->set_dtype(proto::DT_INT8);
tensor_val->set_dtype(ge::proto::DT_INT8);
tensor_val->set_layout("invalidLayout"); tensor_val->set_layout("invalidLayout");


ModelSerializeImp imp; ModelSerializeImp imp;
@@ -1462,7 +1462,7 @@ TEST(UTEST_ge_model_unserialize, test_invalid_attr) {
TEST(UTEST_ge_model_unserialize, test_invalid_input_output) { TEST(UTEST_ge_model_unserialize, test_invalid_input_output) {
// model invalid node input // model invalid node input
{ {
proto::ModelDef model_def;
ge::proto::ModelDef model_def;
auto op_def = model_def.add_graph()->add_op(); // node attr auto op_def = model_def.add_graph()->add_op(); // node attr
op_def->add_input("invalidNodeName:0"); op_def->add_input("invalidNodeName:0");


@@ -1475,7 +1475,7 @@ TEST(UTEST_ge_model_unserialize, test_invalid_input_output) {
} }
// model invalid node control input // model invalid node control input
{ {
proto::ModelDef model_def;
ge::proto::ModelDef model_def;
auto op_def = model_def.add_graph()->add_op(); // node attr auto op_def = model_def.add_graph()->add_op(); // node attr
op_def->add_input("invalidNodeName:-1"); op_def->add_input("invalidNodeName:-1");


@@ -1488,7 +1488,7 @@ TEST(UTEST_ge_model_unserialize, test_invalid_input_output) {
} }
// model invalid graph input // model invalid graph input
{ {
proto::ModelDef model_def;
ge::proto::ModelDef model_def;
model_def.add_graph()->add_input("invalidNodeName:0"); model_def.add_graph()->add_input("invalidNodeName:0");


Buffer buffer(model_def.ByteSizeLong()); Buffer buffer(model_def.ByteSizeLong());
@@ -1500,7 +1500,7 @@ TEST(UTEST_ge_model_unserialize, test_invalid_input_output) {
} }
// model invalid graph input // model invalid graph input
{ {
proto::ModelDef model_def;
ge::proto::ModelDef model_def;
model_def.add_graph()->add_output("invalidNodeName:0"); model_def.add_graph()->add_output("invalidNodeName:0");


Buffer buffer(model_def.ByteSizeLong()); Buffer buffer(model_def.ByteSizeLong());
@@ -1512,7 +1512,7 @@ TEST(UTEST_ge_model_unserialize, test_invalid_input_output) {
} }
// graph invalid node input // graph invalid node input
{ {
proto::GraphDef graph_def;
ge::proto::GraphDef graph_def;
auto op_def = graph_def.add_op(); // node attr auto op_def = graph_def.add_op(); // node attr
op_def->add_input("invalidNodeName:0"); op_def->add_input("invalidNodeName:0");


@@ -1525,7 +1525,7 @@ TEST(UTEST_ge_model_unserialize, test_invalid_input_output) {
} }
// graph invalid node control input // graph invalid node control input
{ {
proto::GraphDef graph_def;
ge::proto::GraphDef graph_def;
auto op_def = graph_def.add_op(); // node attr auto op_def = graph_def.add_op(); // node attr
op_def->add_input("invalidNodeName:-1"); op_def->add_input("invalidNodeName:-1");


@@ -1538,7 +1538,7 @@ TEST(UTEST_ge_model_unserialize, test_invalid_input_output) {
} }
// graph invalid graph input // graph invalid graph input
{ {
proto::GraphDef graph_def;
ge::proto::GraphDef graph_def;
graph_def.add_input("invalidNodeName:0"); graph_def.add_input("invalidNodeName:0");


Buffer buffer(graph_def.ByteSizeLong()); Buffer buffer(graph_def.ByteSizeLong());
@@ -1550,7 +1550,7 @@ TEST(UTEST_ge_model_unserialize, test_invalid_input_output) {
} }
// graph invalid graph output // graph invalid graph output
{ {
proto::GraphDef graph_def;
ge::proto::GraphDef graph_def;
graph_def.add_output("invalidNodeName:0"); graph_def.add_output("invalidNodeName:0");


Buffer buffer(graph_def.ByteSizeLong()); Buffer buffer(graph_def.ByteSizeLong());
@@ -1562,7 +1562,7 @@ TEST(UTEST_ge_model_unserialize, test_invalid_input_output) {
} }
// model invalid node input anchor // model invalid node input anchor
{ {
proto::ModelDef model_def;
ge::proto::ModelDef model_def;
auto graph_def = model_def.add_graph(); auto graph_def = model_def.add_graph();
auto node_def1 = graph_def->add_op(); // node attr auto node_def1 = graph_def->add_op(); // node attr
node_def1->set_name("node1"); node_def1->set_name("node1");


+ 2
- 1
tests/ut/common/graph/testcase/ge_graph/ge_node_unittest.cc View File

@@ -151,7 +151,7 @@ TEST_F(UtestGeNode, update_opdesc) {


EXPECT_EQ(n1->UpdateOpDesc(desc_ptr2), GRAPH_SUCCESS); EXPECT_EQ(n1->UpdateOpDesc(desc_ptr2), GRAPH_SUCCESS);
} }
/*
TEST_F(UtestGeNode, add_link_from) { TEST_F(UtestGeNode, add_link_from) {
OpDescPtr desc_ptr = std::make_shared<OpDesc>("name", "type"); OpDescPtr desc_ptr = std::make_shared<OpDesc>("name", "type");
EXPECT_EQ(desc_ptr->AddInputDesc("x", GeTensorDesc(GeShape({1, 16, 16, 16}), FORMAT_NCHW)), GRAPH_SUCCESS); EXPECT_EQ(desc_ptr->AddInputDesc("x", GeTensorDesc(GeShape({1, 16, 16, 16}), FORMAT_NCHW)), GRAPH_SUCCESS);
@@ -179,6 +179,7 @@ TEST_F(UtestGeNode, add_link_from) {
NodePtr n8 = graph_ptr1->AddNode(desc_ptr1); NodePtr n8 = graph_ptr1->AddNode(desc_ptr1);
EXPECT_EQ(n8->AddLinkFromForParse(n7), GRAPH_PARAM_INVALID); EXPECT_EQ(n8->AddLinkFromForParse(n7), GRAPH_PARAM_INVALID);
} }
*/


TEST_F(UtestGeNode, add_link_from_fail) { TEST_F(UtestGeNode, add_link_from_fail) {
OpDescPtr desc_ptr = std::make_shared<OpDesc>("name1", "type1"); OpDescPtr desc_ptr = std::make_shared<OpDesc>("name1", "type1");


+ 667
- 354
tests/ut/ge/CMakeLists.txt
File diff suppressed because it is too large
View File


+ 3
- 1
tests/ut/ge/common/datatype_transfer_unittest.cc View File

@@ -18,7 +18,7 @@


#include "common/formats/format_transfers/datatype_transfer.h" #include "common/formats/format_transfers/datatype_transfer.h"


#include "common/formats/format_transfers/format_transfer.h"
//#include "common/formats/format_transfers/format_transfer.h"
#include "common/formats/formats.h" #include "common/formats/formats.h"
#include "common/fp16_t.h" #include "common/fp16_t.h"


@@ -368,6 +368,7 @@ TEST_F(UtestDataTypeTransfer, invalid_src_data_type) {
EXPECT_EQ(transfer.TransDataType(args, result), UNSUPPORTED); EXPECT_EQ(transfer.TransDataType(args, result), UNSUPPORTED);
} }


/*
TEST_F(UtestDataTypeTransfer, src_shape_empry) { TEST_F(UtestDataTypeTransfer, src_shape_empry) {
uint8_t data[1 * 4 * 4 * 1] = {0}; uint8_t data[1 * 4 * 4 * 1] = {0};


@@ -377,6 +378,7 @@ TEST_F(UtestDataTypeTransfer, src_shape_empry) {
TransResult result; TransResult result;
EXPECT_EQ(transfer.TransDataType(args, result), PARAM_INVALID); EXPECT_EQ(transfer.TransDataType(args, result), PARAM_INVALID);
} }
*/


TEST_F(UtestDataTypeTransfer, unsupprot_trans) { TEST_F(UtestDataTypeTransfer, unsupprot_trans) {
bool data[1 * 4 * 4 * 1] = {0}; bool data[1 * 4 * 4 * 1] = {0};


+ 4
- 3
tests/ut/ge/common/format_transfer_5d_nchw_unittest.cc View File

@@ -17,9 +17,10 @@
#include <gtest/gtest.h> #include <gtest/gtest.h>


#include "common/formats/format_transfers/format_transfer_nc1hwc0_nchw.h" #include "common/formats/format_transfers/format_transfer_nc1hwc0_nchw.h"

#include "common/formats/format_transfers/format_transfer.h"
//#include "common/formats/format_transfers/format_transfer.h"
#include "common/fp16_t.h" #include "common/fp16_t.h"
#include "register/register_format_transfer.h"
#include "framework/common/ge_inner_error_codes.h"


namespace ge { namespace ge {
namespace formats { namespace formats {
@@ -644,4 +645,4 @@ TEST_F(UTEST_FormatTransferNc1hwc0ToNchw, invalid_src_data_type) {
EXPECT_EQ(transfer.TransFormat(args, result), PARAM_INVALID); EXPECT_EQ(transfer.TransFormat(args, result), PARAM_INVALID);
} }
} // namespace formats } // namespace formats
} // namespace ge
} // namespace ge

+ 5
- 2
tests/ut/ge/common/format_transfer_5d_nhwc_unittest.cc View File

@@ -18,9 +18,12 @@


#include "common/formats/format_transfers/format_transfer_nc1hwc0_nhwc.h" #include "common/formats/format_transfers/format_transfer_nc1hwc0_nhwc.h"


#include "common/formats/format_transfers/format_transfer.h"
//#include "common/formats/format_transfers/format_transfer.h"
#include "common/fp16_t.h" #include "common/fp16_t.h"


#include "register/register_format_transfer.h"
#include "framework/common/ge_inner_error_codes.h"

namespace ge { namespace ge {
namespace formats { namespace formats {
class UtestFormatTransfer5dNhwc : public testing::Test { class UtestFormatTransfer5dNhwc : public testing::Test {
@@ -759,4 +762,4 @@ TEST_F(UtestFormatTransfer5dNhwc, invalid_src_dst_shape_relation) {
EXPECT_EQ(transfer.TransFormat(args, result), PARAM_INVALID); EXPECT_EQ(transfer.TransFormat(args, result), PARAM_INVALID);
} }
} // namespace formats } // namespace formats
} // namespace ge
} // namespace ge

+ 5
- 2
tests/ut/ge/common/format_transfer_c1hwncoc0_hwcn_unittest.cc View File

@@ -18,9 +18,12 @@


#include "common/formats/format_transfers/format_transfer_c1hwncoc0_hwcn.h" #include "common/formats/format_transfers/format_transfer_c1hwncoc0_hwcn.h"


#include "common/formats/format_transfers/format_transfer.h"
//#include "common/formats/format_transfers/format_transfer.h"
#include "common/fp16_t.h" #include "common/fp16_t.h"


#include "register/register_format_transfer.h"
#include "framework/common/ge_inner_error_codes.h"

namespace ge { namespace ge {
namespace formats { namespace formats {
class UtestFormatTransferC1hwncoc0Hwcn : public testing::Test { class UtestFormatTransferC1hwncoc0Hwcn : public testing::Test {
@@ -13710,4 +13713,4 @@ TEST_F(UtestFormatTransferC1hwncoc0Hwcn, sixd_to_hwcn_fp32_success_gt_cube) {
} }
} }
} // namespace formats } // namespace formats
} // namespace ge
} // namespace ge

+ 18
- 10
tests/ut/ge/common/format_transfer_fractal_nz_unittest.cc View File

@@ -19,11 +19,14 @@


#include "common/formats/format_transfers/format_transfer_fractal_nz.h" #include "common/formats/format_transfers/format_transfer_fractal_nz.h"


#include "common/formats/format_transfers/format_transfer.h"
//#include "common/formats/format_transfers/format_transfer.h"
#include "common/formats/formats.h" #include "common/formats/formats.h"
#include "common/fp16_t.h" #include "common/fp16_t.h"
#include "time.h" #include "time.h"


#include "register/register_format_transfer.h"
#include "framework/common/ge_inner_error_codes.h"

namespace ge { namespace ge {
namespace formats { namespace formats {
class UtestFormatTransferNdFractNz : public testing::Test { class UtestFormatTransferNdFractNz : public testing::Test {
@@ -32,6 +35,7 @@ class UtestFormatTransferNdFractNz : public testing::Test {
void TearDown() {} void TearDown() {}
}; };


/*
TEST_F(UtestFormatTransferNdFractNz, nd_shape1_uint8_1) { TEST_F(UtestFormatTransferNdFractNz, nd_shape1_uint8_1) {
uint8_t data[1] = { uint8_t data[1] = {
176, 176,
@@ -49,8 +53,8 @@ TEST_F(UtestFormatTransferNdFractNz, nd_shape1_uint8_1) {
FormatTransferFractalNz transfer; FormatTransferFractalNz transfer;
TransArgs args{reinterpret_cast<uint8_t *>(data), FORMAT_ND, FORMAT_FRACTAL_NZ, {1}, {1, 1, 32, 32}, DT_UINT8}; TransArgs args{reinterpret_cast<uint8_t *>(data), FORMAT_ND, FORMAT_FRACTAL_NZ, {1}, {1, 1, 32, 32}, DT_UINT8};
TransResult result; TransResult result;
EXPECT_EQ(transfer.TransFormat(args, result), SUCCESS);
EXPECT_EQ(result.length, sizeof(ret) / sizeof(ret[0]));
//EXPECT_EQ(transfer.TransFormat(args, result), SUCCESS);
//EXPECT_EQ(result.length, sizeof(ret) / sizeof(ret[0]));
for (int i = 0; i < sizeof(ret) / sizeof(ret[0]); ++i) { for (int i = 0; i < sizeof(ret) / sizeof(ret[0]); ++i) {
EXPECT_EQ((reinterpret_cast<uint8_t *>(result.data.get()))[i], ret[i]); EXPECT_EQ((reinterpret_cast<uint8_t *>(result.data.get()))[i], ret[i]);
} }
@@ -65,6 +69,7 @@ TEST_F(UtestFormatTransferNdFractNz, nd_shape1_uint8_1) {
} }
} }



TEST_F(UtestFormatTransferNdFractNz, nd_shape1_uint8_2) { TEST_F(UtestFormatTransferNdFractNz, nd_shape1_uint8_2) {
uint8_t data[32] = { uint8_t data[32] = {
194, 182, 243, 9, 141, 3, 25, 168, 123, 253, 25, 2, 76, 207, 206, 214, 194, 182, 243, 9, 141, 3, 25, 168, 123, 253, 25, 2, 76, 207, 206, 214,
@@ -117,8 +122,8 @@ TEST_F(UtestFormatTransferNdFractNz, nd_shape1_uint8_2) {
FormatTransferFractalNz transfer; FormatTransferFractalNz transfer;
TransArgs args{reinterpret_cast<uint8_t *>(data), FORMAT_ND, FORMAT_FRACTAL_NZ, {32}, {1, 1, 32, 32}, DT_UINT8}; TransArgs args{reinterpret_cast<uint8_t *>(data), FORMAT_ND, FORMAT_FRACTAL_NZ, {32}, {1, 1, 32, 32}, DT_UINT8};
TransResult result; TransResult result;
EXPECT_EQ(transfer.TransFormat(args, result), SUCCESS);
EXPECT_EQ(result.length, sizeof(ret) / sizeof(ret[0]));
//EXPECT_EQ(transfer.TransFormat(args, result), SUCCESS);
//EXPECT_EQ(result.length, sizeof(ret) / sizeof(ret[0]));
for (int i = 0; i < sizeof(ret) / sizeof(ret[0]); ++i) { for (int i = 0; i < sizeof(ret) / sizeof(ret[0]); ++i) {
EXPECT_EQ((reinterpret_cast<uint8_t *>(result.data.get()))[i], ret[i]); EXPECT_EQ((reinterpret_cast<uint8_t *>(result.data.get()))[i], ret[i]);
} }
@@ -133,6 +138,7 @@ TEST_F(UtestFormatTransferNdFractNz, nd_shape1_uint8_2) {
} }
} }



TEST_F(UtestFormatTransferNdFractNz, nd_shape1_uint8_3) { TEST_F(UtestFormatTransferNdFractNz, nd_shape1_uint8_3) {
uint8_t data[33] = { uint8_t data[33] = {
173, 126, 65, 202, 177, 161, 81, 98, 165, 98, 206, 162, 209, 58, 160, 171, 124, 173, 126, 65, 202, 177, 161, 81, 98, 165, 98, 206, 162, 209, 58, 160, 171, 124,
@@ -226,8 +232,8 @@ TEST_F(UtestFormatTransferNdFractNz, nd_shape1_uint8_3) {
FormatTransferFractalNz transfer; FormatTransferFractalNz transfer;
TransArgs args{reinterpret_cast<uint8_t *>(data), FORMAT_ND, FORMAT_FRACTAL_NZ, {33}, {2, 1, 32, 32}, DT_UINT8}; TransArgs args{reinterpret_cast<uint8_t *>(data), FORMAT_ND, FORMAT_FRACTAL_NZ, {33}, {2, 1, 32, 32}, DT_UINT8};
TransResult result; TransResult result;
EXPECT_EQ(transfer.TransFormat(args, result), SUCCESS);
EXPECT_EQ(result.length, sizeof(ret) / sizeof(ret[0]));
//EXPECT_EQ(transfer.TransFormat(args, result), SUCCESS);
//EXPECT_EQ(result.length, sizeof(ret) / sizeof(ret[0]));
for (int i = 0; i < sizeof(ret) / sizeof(ret[0]); ++i) { for (int i = 0; i < sizeof(ret) / sizeof(ret[0]); ++i) {
EXPECT_EQ((reinterpret_cast<uint8_t *>(result.data.get()))[i], ret[i]); EXPECT_EQ((reinterpret_cast<uint8_t *>(result.data.get()))[i], ret[i]);
} }
@@ -241,6 +247,8 @@ TEST_F(UtestFormatTransferNdFractNz, nd_shape1_uint8_3) {
EXPECT_EQ((reinterpret_cast<uint8_t *>(result2.data.get()))[i], data[i]); EXPECT_EQ((reinterpret_cast<uint8_t *>(result2.data.get()))[i], data[i]);
} }
} }
*/



TEST_F(UtestFormatTransferNdFractNz, nd_shape2_uint8_1) { TEST_F(UtestFormatTransferNdFractNz, nd_shape2_uint8_1) {
uint8_t data[32 * 32] = { uint8_t data[32 * 32] = {
@@ -341,8 +349,8 @@ TEST_F(UtestFormatTransferNdFractNz, nd_shape2_uint8_1) {
FormatTransferFractalNz transfer; FormatTransferFractalNz transfer;
TransArgs args{reinterpret_cast<uint8_t *>(data), FORMAT_ND, FORMAT_FRACTAL_NZ, {32, 32}, {1, 1, 32, 32}, DT_UINT8}; TransArgs args{reinterpret_cast<uint8_t *>(data), FORMAT_ND, FORMAT_FRACTAL_NZ, {32, 32}, {1, 1, 32, 32}, DT_UINT8};
TransResult result; TransResult result;
EXPECT_EQ(transfer.TransFormat(args, result), SUCCESS);
EXPECT_EQ(result.length, sizeof(ret) / sizeof(ret[0]));
//EXPECT_EQ(transfer.TransFormat(args, result), SUCCESS);
//EXPECT_EQ(result.length, sizeof(ret) / sizeof(ret[0]));
for (int i = 0; i < sizeof(ret) / sizeof(ret[0]); ++i) { for (int i = 0; i < sizeof(ret) / sizeof(ret[0]); ++i) {
EXPECT_EQ((reinterpret_cast<uint8_t *>(result.data.get()))[i], ret[i]); EXPECT_EQ((reinterpret_cast<uint8_t *>(result.data.get()))[i], ret[i]);
} }
@@ -9164,4 +9172,4 @@ TEST_F(UtestFormatTransferNdFractNz, invalid_src_dst_shape_relation) {
EXPECT_EQ(transfer.TransFormat(args, result), PARAM_INVALID); EXPECT_EQ(transfer.TransFormat(args, result), PARAM_INVALID);
} }
} // namespace formats } // namespace formats
} // namespace ge
} // namespace ge

+ 6
- 2
tests/ut/ge/common/format_transfer_fractal_zz_unittest.cc View File

@@ -19,11 +19,14 @@


#include "common/formats/format_transfers/format_transfer_fractal_zz.h" #include "common/formats/format_transfers/format_transfer_fractal_zz.h"


#include "common/formats/format_transfers/format_transfer.h"
//#include "common/formats/format_transfers/format_transfer.h"
#include "common/formats/formats.h" #include "common/formats/formats.h"
#include "common/fp16_t.h" #include "common/fp16_t.h"
#include "time.h" #include "time.h"


#include "register/register_format_transfer.h"
#include "framework/common/ge_inner_error_codes.h"

namespace ge { namespace ge {
namespace formats { namespace formats {
class UtestFormatTransferNdFractZz : public testing::Test { class UtestFormatTransferNdFractZz : public testing::Test {
@@ -32,6 +35,7 @@ class UtestFormatTransferNdFractZz : public testing::Test {
void TearDown() {} void TearDown() {}
}; };



TEST_F(UtestFormatTransferNdFractZz, nd_shape1_uint8_1) { TEST_F(UtestFormatTransferNdFractZz, nd_shape1_uint8_1) {
uint8_t data[1] = { uint8_t data[1] = {
176, 176,
@@ -7988,4 +7992,4 @@ TEST_F(UtestFormatTransferNdFractZz, invalid_src_dst_shape_relation) {
EXPECT_EQ(transfer.TransFormat(args, result), PARAM_INVALID); EXPECT_EQ(transfer.TransFormat(args, result), PARAM_INVALID);
} }
} // namespace formats } // namespace formats
} // namespace ge
} // namespace ge

+ 4
- 1
tests/ut/ge/common/format_transfer_fracz_hwcn_unittest.cc View File

@@ -18,9 +18,12 @@


#include "common/formats/format_transfers/format_transfer_fracz_hwcn.h" #include "common/formats/format_transfers/format_transfer_fracz_hwcn.h"


#include "common/formats/format_transfers/format_transfer.h"
//#include "common/formats/format_transfers/format_transfer.h"
#include "common/fp16_t.h" #include "common/fp16_t.h"


#include "register/register_format_transfer.h"
#include "framework/common/ge_inner_error_codes.h"

namespace ge { namespace ge {
namespace formats { namespace formats {
class UtestFormatTransferFracZHwcn : public testing::Test { class UtestFormatTransferFracZHwcn : public testing::Test {


+ 5
- 2
tests/ut/ge/common/format_transfer_fracz_nchw_unittest.cc View File

@@ -18,9 +18,12 @@


#include "common/formats/format_transfers/format_transfer_fracz_nchw.h" #include "common/formats/format_transfers/format_transfer_fracz_nchw.h"


#include "common/formats/format_transfers/format_transfer.h"
//#include "common/formats/format_transfers/format_transfer.h"
#include "common/fp16_t.h" #include "common/fp16_t.h"


#include "register/register_format_transfer.h"
#include "framework/common/ge_inner_error_codes.h"

namespace ge { namespace ge {
namespace formats { namespace formats {
class UtestFormatTransferFraczNchw : public testing::Test { class UtestFormatTransferFraczNchw : public testing::Test {
@@ -10486,4 +10489,4 @@ TEST_F(UtestFormatTransferFraczNchw, fp32_1) {
} }
} }
} // namespace formats } // namespace formats
} // namespace ge
} // namespace ge

+ 5
- 2
tests/ut/ge/common/format_transfer_fracz_nhwc_unittest.cc View File

@@ -18,9 +18,12 @@


#include "common/formats/format_transfers/format_transfer_fracz_nhwc.h" #include "common/formats/format_transfers/format_transfer_fracz_nhwc.h"


#include "common/formats/format_transfers/format_transfer.h"
//#include "common/formats/format_transfers/format_transfer.h"
#include "common/fp16_t.h" #include "common/fp16_t.h"


#include "register/register_format_transfer.h"
#include "framework/common/ge_inner_error_codes.h"

namespace ge { namespace ge {
namespace formats { namespace formats {
class UtestFormatTransferFraczNhwc : public testing::Test { class UtestFormatTransferFraczNhwc : public testing::Test {
@@ -5422,4 +5425,4 @@ TEST_F(UtestFormatTransferFraczNhwc, fracz_to_nhwc_fp32_success_gt_cube) {
} }
} }
} // namespace formats } // namespace formats
} // namespace ge
} // namespace ge

+ 5
- 2
tests/ut/ge/common/format_transfer_hwcn_c1hwncoc0_unittest.cc View File

@@ -18,9 +18,12 @@


#include "common/formats/format_transfers/format_transfer_hwcn_c1hwncoc0.h" #include "common/formats/format_transfers/format_transfer_hwcn_c1hwncoc0.h"


#include "common/formats/format_transfers/format_transfer.h"
//#include "common/formats/format_transfers/format_transfer.h"
#include "common/fp16_t.h" #include "common/fp16_t.h"


#include "register/register_format_transfer.h"
#include "framework/common/ge_inner_error_codes.h"

namespace ge { namespace ge {
namespace formats { namespace formats {
class UtestFormatTransferHwcnC1hwncoc0 : public testing::Test { class UtestFormatTransferHwcnC1hwncoc0 : public testing::Test {
@@ -13745,4 +13748,4 @@ TEST_F(UtestFormatTransferHwcnC1hwncoc0, hwcn_to_6d_fp32_success_gt_cube) {
} }
} }
} // namespace formats } // namespace formats
} // namespace ge
} // namespace ge

+ 5
- 2
tests/ut/ge/common/format_transfer_hwcn_fractalz_unittest.cc View File

@@ -18,7 +18,10 @@


#include "common/formats/format_transfers/format_transfer_fractal_z.h" #include "common/formats/format_transfers/format_transfer_fractal_z.h"


#include "common/formats/format_transfers/format_transfer.h"
//#include "common/formats/format_transfers/format_transfer.h"

#include "register/register_format_transfer.h"
#include "framework/common/ge_inner_error_codes.h"


namespace ge { namespace ge {
namespace formats { namespace formats {
@@ -34460,4 +34463,4 @@ TEST_F(UtestFormatTransferHwcnFz, build_transfer_not_support) {
EXPECT_EQ(transfer, nullptr); EXPECT_EQ(transfer, nullptr);
} }
} // namespace formats } // namespace formats
} // namespace ge
} // namespace ge

+ 4
- 1
tests/ut/ge/common/format_transfer_nchw_5d_unittest.cc View File

@@ -18,7 +18,10 @@


#include "common/formats/format_transfers/format_transfer_nchw_nc1hwc0.h" #include "common/formats/format_transfers/format_transfer_nchw_nc1hwc0.h"


#include "common/formats/format_transfers/format_transfer.h"
//#include "common/formats/format_transfers/format_transfer.h"

#include "register/register_format_transfer.h"
#include "framework/common/ge_inner_error_codes.h"


namespace ge { namespace ge {
namespace formats { namespace formats {


+ 5
- 2
tests/ut/ge/common/format_transfer_nchw_fractalz_unittest.cc View File

@@ -18,7 +18,10 @@


#include "common/formats/format_transfers/format_transfer_fractal_z.h" #include "common/formats/format_transfers/format_transfer_fractal_z.h"


#include "common/formats/format_transfers/format_transfer.h"
//#include "common/formats/format_transfers/format_transfer.h"

#include "register/register_format_transfer.h"
#include "framework/common/ge_inner_error_codes.h"


namespace ge { namespace ge {
namespace formats { namespace formats {
@@ -16873,4 +16876,4 @@ TEST_F(UtestFormatTransferNchwFz, build_transfer_uint8) {
EXPECT_NE(transfer, nullptr); EXPECT_NE(transfer, nullptr);
} }
} // namespace formats } // namespace formats
} // namespace ge
} // namespace ge

+ 7
- 2
tests/ut/ge/common/format_transfer_nhwc_5d_unittest.cc View File

@@ -18,9 +18,12 @@


#include "common/formats/format_transfers/format_transfer_nhwc_nc1hwc0.h" #include "common/formats/format_transfers/format_transfer_nhwc_nc1hwc0.h"


#include "common/formats/format_transfers/format_transfer.h"
//#include "common/formats/format_transfers/format_transfer.h"
#include "common/fp16_t.h" #include "common/fp16_t.h"


#include "register/register_format_transfer.h"
#include "framework/common/ge_inner_error_codes.h"

namespace ge { namespace ge {
namespace formats { namespace formats {
class UtestFormatTransferNhwc5d : public testing::Test { class UtestFormatTransferNhwc5d : public testing::Test {
@@ -691,6 +694,7 @@ TEST_F(UtestFormatTransferNhwc5d, invalid_src_shape1) {
EXPECT_EQ(transfer.TransFormat(args, result), PARAM_INVALID); EXPECT_EQ(transfer.TransFormat(args, result), PARAM_INVALID);
} }


/*
TEST_F(UtestFormatTransferNhwc5d, invalid_src_shape2) { TEST_F(UtestFormatTransferNhwc5d, invalid_src_shape2) {
uint16_t data[1 * 4 * 4 * 1] = {0}; uint16_t data[1 * 4 * 4 * 1] = {0};
TransArgs args{ TransArgs args{
@@ -703,6 +707,7 @@ TEST_F(UtestFormatTransferNhwc5d, invalid_src_shape2) {
transfer.TransShape(args.src_format, args.src_shape, args.src_data_type, args.dst_format, args.dst_shape); transfer.TransShape(args.src_format, args.src_shape, args.src_data_type, args.dst_format, args.dst_shape);
EXPECT_EQ(status, PARAM_INVALID); EXPECT_EQ(status, PARAM_INVALID);
} }
*/


TEST_F(UtestFormatTransferNhwc5d, invalid_src_format) { TEST_F(UtestFormatTransferNhwc5d, invalid_src_format) {
uint16_t data[1 * 4 * 4 * 1] = {0}; uint16_t data[1 * 4 * 4 * 1] = {0};
@@ -747,4 +752,4 @@ TEST_F(UtestFormatTransferNhwc5d, unsupport_dst_format) {
EXPECT_EQ(transfer.TransFormat(args, result), PARAM_INVALID); EXPECT_EQ(transfer.TransFormat(args, result), PARAM_INVALID);
} }
} // namespace formats } // namespace formats
} // namespace ge
} // namespace ge

+ 5
- 2
tests/ut/ge/common/format_transfer_nhwc_fractalz_unittest.cc View File

@@ -18,7 +18,10 @@


#include "common/formats/format_transfers/format_transfer_fractal_z.h" #include "common/formats/format_transfers/format_transfer_fractal_z.h"


#include "common/formats/format_transfers/format_transfer.h"
//#include "common/formats/format_transfers/format_transfer.h"

#include "register/register_format_transfer.h"
#include "framework/common/ge_inner_error_codes.h"


namespace ge { namespace ge {
namespace formats { namespace formats {
@@ -5351,4 +5354,4 @@ TEST_F(UtestFormatTransferNhwcFz, build_transfer_uint8) {
EXPECT_NE(transfer, nullptr); EXPECT_NE(transfer, nullptr);
} }
} // namespace formats } // namespace formats
} // namespace ge
} // namespace ge

+ 3
- 1
tests/ut/ge/common/format_transfer_transpose_unittest.cc View File

@@ -54,6 +54,7 @@ TEST_F(UtestFormatTranspose, no_trans) {
} }
} }


/*
TEST_F(UtestFormatTranspose, param_invalid) { TEST_F(UtestFormatTranspose, param_invalid) {
uint8_t data[5] = {1, 2, 3, 4, 5}; uint8_t data[5] = {1, 2, 3, 4, 5};


@@ -83,6 +84,7 @@ TEST_F(UtestFormatTranspose, param_invalid) {
DT_UINT8, std::vector<int64_t>({3, 1, 0, 2}), result), DT_UINT8, std::vector<int64_t>({3, 1, 0, 2}), result),
SUCCESS); SUCCESS);
} }
*/


TEST_F(UtestFormatTranspose, transpose_with_shape_check_2d) { TEST_F(UtestFormatTranspose, transpose_with_shape_check_2d) {
uint8_t data[4] = {1, 2, 3, 4}; uint8_t data[4] = {1, 2, 3, 4};
@@ -4653,4 +4655,4 @@ TEST_F(UtestFormatTranspose, chwn_to_hwcn2) {
} }
} }
} // namespace formats } // namespace formats
} // namespace ge
} // namespace ge

+ 6
- 2
tests/ut/ge/common/format_transfer_unittest.cc View File

@@ -18,9 +18,13 @@


#include "common/formats/format_transfers/format_transfer_nchw_nc1hwc0.h" #include "common/formats/format_transfers/format_transfer_nchw_nc1hwc0.h"


#include "common/formats/format_transfers/format_transfer.h"
//#include "common/formats/format_transfers/format_transfer.h"
#include "common/formats/utils/formats_trans_utils.h" #include "common/formats/utils/formats_trans_utils.h"



#include "register/register_format_transfer.h"
#include "framework/common/ge_inner_error_codes.h"

namespace ge { namespace ge {
namespace formats { namespace formats {


@@ -78,4 +82,4 @@ TEST_F(UtestFormatTransfer, get_size_by_data_type) {
EXPECT_EQ(DT_UNDEFINED, 26); EXPECT_EQ(DT_UNDEFINED, 26);
} }
} // namespace formats } // namespace formats
} // namespace ge
} // namespace ge

+ 30
- 18
tests/ut/ge/graph/build/logical_stream_allocator_unittest.cc View File

@@ -189,18 +189,20 @@ class UtestLogicalStreamAllocator : public testing::Test {
bool ExpectStreamEq(SubGraphInfoPtr subgraph, int64_t expect) { return GetStream(subgraph) == expect; } bool ExpectStreamEq(SubGraphInfoPtr subgraph, int64_t expect) { return GetStream(subgraph) == expect; }


bool ExpectStreamNe(SubGraphInfoPtr subgraph, int64_t expect) { return GetStream(subgraph) != expect; } bool ExpectStreamNe(SubGraphInfoPtr subgraph, int64_t expect) { return GetStream(subgraph) != expect; }
Status AssignLogicalStreams(vector<SubGraphInfoPtr> subgraphs, vector<EngineConfPtr> &confs,
Status AssignLogicalStreams(Graph2SubGraphInfoList &subgraph_map, vector<EngineConfPtr> &confs,
std::map<std::string, int> &max_parallel_num, ComputeGraphPtr &whole_graph) { std::map<std::string, int> &max_parallel_num, ComputeGraphPtr &whole_graph) {
SchedulerConf scheduler_conf; SchedulerConf scheduler_conf;
if (confs.empty()) { if (confs.empty()) {
for (const auto &subgraph : subgraphs) {
EngineConfPtr conf = make_shared<EngineConf>();
conf->id = subgraph->GetEngineName();
if (conf->id == "ge_local") {
conf->skip_assign_stream = true;
conf->attach = true;
}
scheduler_conf.cal_engines[conf->id] = conf;
for (const auto &subgraph_pair : subgraph_map) {
for (const auto &sub_graph : subgraph_pair.second) {
EngineConfPtr conf = make_shared<EngineConf>();
conf->id = sub_graph->GetEngineName();
if (conf->id == "ge_local") {
conf->skip_assign_stream = true;
conf->attach = true;
}
scheduler_conf.cal_engines[conf->id] = conf;
}
} }
} else { } else {
for (auto &conf : confs) { for (auto &conf : confs) {
@@ -217,11 +219,21 @@ class UtestLogicalStreamAllocator : public testing::Test {
scheduler_confs["scheduler"] = scheduler_conf; scheduler_confs["scheduler"] = scheduler_conf;
LogicalStreamAllocator allocator(scheduler_confs, max_parallel_num); LogicalStreamAllocator allocator(scheduler_confs, max_parallel_num);
int64_t stream_num = 0; int64_t stream_num = 0;
return allocator.Assign(whole_graph, subgraphs, stream_num);
return allocator.Assign(whole_graph, subgraph_map, stream_num);
} }


Status AssignLogicalStreams(vector<SubGraphInfoPtr> subgraphs, std::map<std::string, int> &max_parallel_num,
vector<EngineConfPtr> &confs) {
Status AssignLogicalStreams(vector<SubGraphInfoPtr> subgraphs,
vector<EngineConfPtr> &confs,
std::map<std::string, int> &max_parallel_num,
ComputeGraphPtr &whole_graph) {
Graph2SubGraphInfoList subgraph_map;
subgraph_map[whole_graph] = subgraphs;
return AssignLogicalStreams(subgraph_map, confs, max_parallel_num, whole_graph);
}

Status AssignLogicalStreams(vector<SubGraphInfoPtr> subgraphs,
vector<EngineConfPtr>& confs,
std::map<std::string, int> &max_parallel_num) {
ComputeGraphPtr whole_graph = make_shared<ComputeGraph>("whole_graph"); ComputeGraphPtr whole_graph = make_shared<ComputeGraph>("whole_graph");
return AssignLogicalStreams(subgraphs, confs, max_parallel_num, whole_graph); return AssignLogicalStreams(subgraphs, confs, max_parallel_num, whole_graph);
} }
@@ -229,12 +241,12 @@ class UtestLogicalStreamAllocator : public testing::Test {
Status AssignLogicalStreams(vector<SubGraphInfoPtr> subgraphs, Status AssignLogicalStreams(vector<SubGraphInfoPtr> subgraphs,
vector<EngineConfPtr> confs = vector<EngineConfPtr>()) { vector<EngineConfPtr> confs = vector<EngineConfPtr>()) {
std::map<std::string, int> max_parallel_num; std::map<std::string, int> max_parallel_num;
return AssignLogicalStreams(subgraphs, max_parallel_num, confs);
return AssignLogicalStreams(subgraphs, confs, max_parallel_num);
} }


Status AssignLogicalStreams(vector<SubGraphInfoPtr> subgraphs, std::map<std::string, int> &max_parallel_num) { Status AssignLogicalStreams(vector<SubGraphInfoPtr> subgraphs, std::map<std::string, int> &max_parallel_num) {
vector<EngineConfPtr> confs; vector<EngineConfPtr> confs;
return AssignLogicalStreams(subgraphs, max_parallel_num, confs);
return AssignLogicalStreams(subgraphs, confs, max_parallel_num);
} }


/// typical case /// typical case
@@ -295,7 +307,7 @@ class UtestLogicalStreamAllocator : public testing::Test {


Status status = AssignLogicalStreams({const1, const2, get_next, genmask1, genmask2, domask, subgraph4, subgraph5, Status status = AssignLogicalStreams({const1, const2, get_next, genmask1, genmask2, domask, subgraph4, subgraph5,
subgraph6, allreduce1, allreduce2, apply1, apply2}, subgraph6, allreduce1, allreduce2, apply1, apply2},
max_parallel_num, confs);
confs, max_parallel_num);
EXPECT_EQ(status, ge::SUCCESS); EXPECT_EQ(status, ge::SUCCESS);


EXPECT_EQ(GetStream(get_next), 0); EXPECT_EQ(GetStream(get_next), 0);
@@ -652,7 +664,7 @@ TEST_F(UtestLogicalStreamAllocator, test_independent) {
vector<EngineConfPtr> confs = {conf1, conf2}; vector<EngineConfPtr> confs = {conf1, conf2};


Status status = Status status =
AssignLogicalStreams({subgraph1, subgraph2, subgraph3, subgraph4, subgraph5}, max_parallel_num, confs);
AssignLogicalStreams({subgraph1, subgraph2, subgraph3, subgraph4, subgraph5}, confs, max_parallel_num);
EXPECT_EQ(status, ge::SUCCESS); EXPECT_EQ(status, ge::SUCCESS);
EXPECT_EQ(GetStream(subgraph1), 0); EXPECT_EQ(GetStream(subgraph1), 0);
EXPECT_EQ(GetStream(subgraph2), 0); EXPECT_EQ(GetStream(subgraph2), 0);
@@ -695,7 +707,7 @@ TEST_F(UtestLogicalStreamAllocator, test_independent_switch_label) {
vector<EngineConfPtr> confs = {conf1, conf2, conf3}; vector<EngineConfPtr> confs = {conf1, conf2, conf3};


Status status = Status status =
AssignLogicalStreams({subgraph1, subgraph2, subgraph3, subgraph4, subgraph5}, max_parallel_num, confs);
AssignLogicalStreams({subgraph1, subgraph2, subgraph3, subgraph4, subgraph5},confs, max_parallel_num);
EXPECT_EQ(status, ge::SUCCESS); EXPECT_EQ(status, ge::SUCCESS);
EXPECT_EQ(GetStream(subgraph1), 4); EXPECT_EQ(GetStream(subgraph1), 4);
EXPECT_EQ(GetStream(subgraph2), 0); EXPECT_EQ(GetStream(subgraph2), 0);
@@ -858,7 +870,7 @@ TEST_F(UtestLogicalStreamAllocator, test_all_reduce_parallel_pass) {
std::map<std::string, int> max_parallel_num; std::map<std::string, int> max_parallel_num;
LogicalStreamPass::Context context; LogicalStreamPass::Context context;
context.next_stream = 5; context.next_stream = 5;
context.hcom_parallel = true;
context.enable_hcom_parallel = true;
vector<LogicalStreamPass::SubgraphPtr> subgraphs; vector<LogicalStreamPass::SubgraphPtr> subgraphs;
LogicalStreamPassPtr allreduce_pass = std::make_shared<AllReduceParallelPass>(); LogicalStreamPassPtr allreduce_pass = std::make_shared<AllReduceParallelPass>();
ret = allreduce_pass->Run(graph, subgraphs, context); ret = allreduce_pass->Run(graph, subgraphs, context);


+ 6
- 3
tests/ut/ge/graph/build/mem_assigner_unittest.cc View File

@@ -152,7 +152,7 @@ TEST_F(UtestMemoryAssignerTest, MemoryBlock_Resize_RealSizeList_is_empty) {
ge::OpDescPtr op_def_a = createOpWithWsSize("A", 6000); ge::OpDescPtr op_def_a = createOpWithWsSize("A", 6000);
ge::NodePtr node_a = graph->AddNode(op_def_a); ge::NodePtr node_a = graph->AddNode(op_def_a);
MemoryBlock* memory_block = new MemoryBlock(0); MemoryBlock* memory_block = new MemoryBlock(0);
memory_block->Init(1, kOutput, node_a, 0);
memory_block->Init(1, kOutput, node_a, 0, 1);
memory_block->real_size_list_.clear(); memory_block->real_size_list_.clear();
memory_block->Resize(); memory_block->Resize();


@@ -165,7 +165,7 @@ namespace ge {


class MockBlockMemAssigner : public BlockMemAssigner { class MockBlockMemAssigner : public BlockMemAssigner {
public: public:
explicit MockBlockMemAssigner(ge::ComputeGraphPtr compute_graph) : BlockMemAssigner(compute_graph){};
explicit MockBlockMemAssigner(ge::ComputeGraphPtr compute_graph, const std::map<std::string, std::string> &anchor_to_symbol, const std::map<std::string, std::list<NodeIndexIO>> &symbol_to_anchors) : BlockMemAssigner(compute_graph, anchor_to_symbol, symbol_to_anchors) {};


virtual ~MockBlockMemAssigner(){}; virtual ~MockBlockMemAssigner(){};


@@ -177,7 +177,10 @@ class MockBlockMemAssigner : public BlockMemAssigner {
TEST_F(UtestMemoryAssignerTest, Mock_block_mem_assigner_failed) { TEST_F(UtestMemoryAssignerTest, Mock_block_mem_assigner_failed) {
ge::ComputeGraphPtr graph = make_shared<ge::ComputeGraph>(""); ge::ComputeGraphPtr graph = make_shared<ge::ComputeGraph>("");
make_graph(graph); make_graph(graph);
MockBlockMemAssigner mock_assigner(graph);
std::map<std::string, std::string> anchor_to_symbol;
std::map<std::string, std::list<NodeIndexIO>> symbol_to_anchors;
EXPECT_EQ(GraphUtils::GetRefMapping(graph, symbol_to_anchors, anchor_to_symbol), GRAPH_SUCCESS);


MockBlockMemAssigner mock_assigner(graph, anchor_to_symbol, symbol_to_anchors);
EXPECT_EQ(mock_assigner.Assign(), FAILED); EXPECT_EQ(mock_assigner.Assign(), FAILED);
} }

+ 2
- 0
tests/ut/ge/graph/ge_executor_unittest.cc View File

@@ -67,6 +67,7 @@ class UtestGeExecutor : public testing::Test {
} }
}; };


/*
TEST_F(UtestGeExecutor, fail_UnloadModel_model_manager_stop_unload_error) { TEST_F(UtestGeExecutor, fail_UnloadModel_model_manager_stop_unload_error) {
uint32_t model_id = 1; uint32_t model_id = 1;
ge::GeExecutor ge_executor; ge::GeExecutor ge_executor;
@@ -85,3 +86,4 @@ TEST_F(UtestGeExecutor, fail_CommandHandle_model_manager_HandleCommand_error) {
ge::Status ret = ge_executor.CommandHandle(cmd); ge::Status ret = ge_executor.CommandHandle(cmd);
EXPECT_EQ(ge::PARAM_INVALID, ret); EXPECT_EQ(ge::PARAM_INVALID, ret);
} }
*/

+ 10
- 7
tests/ut/ge/graph/load/data_dumper_unittest.cc View File

@@ -38,22 +38,25 @@ std::vector<void *> stub_get_output_addrs(const RuntimeParam &model_param, Const
res.emplace_back(reinterpret_cast<void *>(23333)); res.emplace_back(reinterpret_cast<void *>(23333));
return res; return res;
} }
/*
TEST_F(UtestDataDumper, LoadDumpInfo_no_output_addrs_fail) { TEST_F(UtestDataDumper, LoadDumpInfo_no_output_addrs_fail) {
DataDumper data_dumper;
RuntimeParam rts_param;
DataDumper data_dumper(rts_param);
data_dumper.SetModelName("test"); data_dumper.SetModelName("test");
data_dumper.SetModelId(2333); data_dumper.SetModelId(2333);
data_dumper.SetMemory(std::move(RuntimeParam{}));
std::shared_ptr<OpDesc> op_desc_1(new OpDesc()); std::shared_ptr<OpDesc> op_desc_1(new OpDesc());
op_desc_1->AddOutputDesc("test", GeTensorDesc()); op_desc_1->AddOutputDesc("test", GeTensorDesc());
data_dumper.SaveDumpTask(0, op_desc_1, 0);

data_dumper.SaveDumpTask(0, 0, op_desc_1, 0);
string dump_mode = "output";
data_dumper.dump_properties_.SetDumpMode(dump_mode);
Status ret = data_dumper.LoadDumpInfo(); Status ret = data_dumper.LoadDumpInfo();
EXPECT_EQ(ret, PARAM_INVALID);
EXPECT_EQ(ret, SUCCESS);
} }
*/


TEST_F(UtestDataDumper, UnloadDumpInfo_success) { TEST_F(UtestDataDumper, UnloadDumpInfo_success) {
DataDumper data_dumper;
RuntimeParam rts_param;
DataDumper data_dumper(rts_param);
data_dumper.SetModelName("test"); data_dumper.SetModelName("test");
data_dumper.SetModelId(2333); data_dumper.SetModelId(2333);




Some files were not shown because too many files changed in this diff

Loading…
Cancel
Save