You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

CMakeLists.txt 39 kB

4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055
  1. if (NOT ENABLE_D AND NOT ENABLE_ACL AND NOT ENABLE_MS_TESTCASES)
  2. add_subdirectory(common)
  3. add_subdirectory(plugin/engine)
  4. add_subdirectory(ge_local_engine)
  5. add_subdirectory(offline)
  6. elseif (ENABLE_D)
  7. add_subdirectory(common)
  8. add_subdirectory(ge_runtime)
  9. endif ()
  10. set(GRAPHENGINE_PROTO_LIST
  11. "${METADEF_DIR}/proto/om.proto"
  12. "${METADEF_DIR}/proto/task.proto"
  13. "${METADEF_DIR}/proto/insert_op.proto"
  14. "${METADEF_DIR}/proto/ge_ir.proto"
  15. "${METADEF_DIR}/proto/ge_api.proto"
  16. "${METADEF_DIR}/proto/fusion_model.proto"
  17. "${METADEF_DIR}/proto/optimizer_priority.proto"
  18. "${METADEF_DIR}/proto/fwk_adapter.proto"
  19. "${METADEF_DIR}/proto/op_mapping.proto"
  20. "${METADEF_DIR}/proto/dump_task.proto"
  21. "${METADEF_DIR}/proto/tensorflow/graph_library.proto"
  22. "${METADEF_DIR}/proto/tensorflow/graph.proto"
  23. "${METADEF_DIR}/proto/tensorflow/node_def.proto"
  24. "${METADEF_DIR}/proto/tensorflow/function.proto"
  25. "${METADEF_DIR}/proto/tensorflow/versions.proto"
  26. "${METADEF_DIR}/proto/tensorflow/attr_value.proto"
  27. "${METADEF_DIR}/proto/tensorflow/op_def.proto"
  28. "${METADEF_DIR}/proto/tensorflow/tensor.proto"
  29. "${METADEF_DIR}/proto/tensorflow/tensor_shape.proto"
  30. "${METADEF_DIR}/proto/tensorflow/types.proto"
  31. "${METADEF_DIR}/proto/tensorflow/resource_handle.proto"
  32. )
  33. protobuf_generate(graphengine_protos GRAPHENGINE_PROTO_SRCS GRAPHENGINE_PROTO_HDRS ${GRAPHENGINE_PROTO_LIST} TARGET)
  34. set(GE_FUSION_MODEL_PROTO_SRCS
  35. "${CMAKE_BINARY_DIR}/proto/graphengine_protos/proto/fusion_model.pb.cc"
  36. "${CMAKE_BINARY_DIR}/proto/graphengine_protos/proto/optimizer_priority.pb.cc"
  37. )
  38. add_library(ge_fusion_model_protos_obj OBJECT ${GE_FUSION_MODEL_PROTO_SRCS})
  39. add_dependencies(ge_fusion_model_protos_obj graphengine_protos)
  40. target_include_directories(ge_fusion_model_protos_obj PRIVATE
  41. #### blue zone ####
  42. ${PROTOBUF_SHARED_PKG_DIR}/include
  43. #### yellow zone ####
  44. ${ASCEND_PROTOBUF_SHARED_PKG_DIR}/include
  45. )
  46. target_compile_definitions(ge_fusion_model_protos_obj PRIVATE
  47. google=ascend_private
  48. )
  49. target_link_libraries(ge_fusion_model_protos_obj PRIVATE ascend_protobuf $<BUILD_INTERFACE:intf_pub>)
  50. target_compile_options(ge_fusion_model_protos_obj PRIVATE
  51. $<$<STREQUAL:${TARGET_SYSTEM_NAME},Linux>:-O2 -fPIC>
  52. $<$<OR:$<STREQUAL:${PRODUCT_SIDE},host>,$<STREQUAL:${ENABLE_OPEN_SRC},True>>:-fexceptions>
  53. $<$<OR:$<STREQUAL:${TARGET_SYSTEM_NAME},Linux>,$<STREQUAL:${TARGET_SYSTEM_NAME},Android>>: -Wno-deprecated-declarations -fno-common>
  54. $<$<AND:$<STREQUAL:${TARGET_SYSTEM_NAME},Windows>,$<STREQUAL:${CMAKE_CONFIGURATION_TYPES},Debug>>:/MTd>
  55. $<$<AND:$<STREQUAL:${TARGET_SYSTEM_NAME},Windows>,$<STREQUAL:${CMAKE_CONFIGURATION_TYPES},Release>>:/MT>
  56. )
  57. if (NOT ENABLE_D AND NOT ENABLE_ACL AND NOT ENABLE_MS_TESTCASES)
  58. ############ libge_proto_common.a ############
  59. add_library(ge_proto_common STATIC
  60. $<TARGET_OBJECTS:ge_fusion_model_protos_obj>
  61. )
  62. target_compile_definitions(ge_proto_common PRIVATE
  63. PROTOBUF_INLINE_NOT_IN_HEADERS=0
  64. google=ascend_private
  65. )
  66. target_compile_options(ge_proto_common PRIVATE
  67. -O2
  68. -fno-common
  69. )
  70. target_link_libraries(ge_proto_common PRIVATE
  71. $<BUILD_INTERFACE:intf_pub>
  72. ascend_protobuf
  73. )
  74. ############ libge_proto_client.a ############
  75. add_library(ge_proto_client STATIC
  76. $<TARGET_OBJECTS:ge_fusion_model_protos_obj>
  77. )
  78. target_compile_definitions(ge_proto_client PRIVATE
  79. PROTOBUF_INLINE_NOT_IN_HEADERS=0
  80. google=ascend_private
  81. )
  82. target_include_directories(ge_proto_client PRIVATE
  83. ${CMAKE_BINARY_DIR}/proto/graphengine_protos
  84. ${CMAKE_BINARY_DIR}/proto/graphengine_protos/proto
  85. )
  86. target_compile_options(ge_proto_client PRIVATE
  87. -O2
  88. -fno-common
  89. )
  90. target_link_libraries(ge_proto_client PRIVATE
  91. $<BUILD_INTERFACE:intf_pub>
  92. ascend_protobuf
  93. )
  94. endif ()
  95. ##################################################################
  96. set(EXECUTOR_SRC_LIST
  97. "analyzer/analyzer.cc"
  98. "common/dump/dump_manager.cc"
  99. "common/dump/dump_op.cc"
  100. "common/dump/dump_properties.cc"
  101. "common/dump/exception_dumper.cc"
  102. "common/dump/opdebug_register.cc"
  103. "common/formats/format_transfers/format_transfer_transpose.cc"
  104. "common/formats/utils/formats_trans_utils.cc"
  105. "common/fp16_t.cc"
  106. "common/ge/op_tiling_manager.cc"
  107. "common/ge/plugin_manager.cc"
  108. "common/profiling/ge_profiling.cc"
  109. "common/profiling/profiling_manager.cc"
  110. "engine_manager/dnnengine_manager.cc"
  111. "executor/ge_executor.cc"
  112. "ge_local_engine/engine/host_cpu_engine.cc"
  113. "graph/build/memory/var_mem_assign_util.cc"
  114. "graph/common/bcast.cc"
  115. "graph/common/local_context.cc"
  116. "graph/common/omg_util.cc"
  117. "graph/execute/graph_execute.cc"
  118. "graph/execute/model_executor.cc"
  119. "graph/load/graph_loader.cc"
  120. "graph/load/model_manager/aipp_utils.cc"
  121. "graph/load/model_manager/cpu_queue_schedule.cc"
  122. "graph/load/model_manager/data_dumper.cc"
  123. "graph/load/model_manager/data_inputer.cc"
  124. "graph/load/model_manager/davinci_model.cc"
  125. "graph/load/model_manager/model_manager.cc"
  126. "graph/load/model_manager/model_utils.cc"
  127. "graph/load/model_manager/task_info/end_graph_task_info.cc"
  128. "graph/load/model_manager/task_info/event_record_task_info.cc"
  129. "graph/load/model_manager/task_info/event_wait_task_info.cc"
  130. "graph/load/model_manager/task_info/ffts_task_info.cc"
  131. "graph/load/model_manager/task_info/fusion_start_task_info.cc"
  132. "graph/load/model_manager/task_info/fusion_stop_task_info.cc"
  133. #"graph/load/model_manager/task_info/hccl_task_info.cc" # Just for runner.
  134. "graph/load/model_manager/task_info/kernel_ex_task_info.cc"
  135. "graph/load/model_manager/task_info/kernel_task_info.cc"
  136. "graph/load/model_manager/task_info/label_goto_ex_task_info.cc"
  137. "graph/load/model_manager/task_info/label_set_task_info.cc"
  138. "graph/load/model_manager/task_info/label_switch_by_index_task_info.cc"
  139. "graph/load/model_manager/task_info/memcpy_addr_async_task_info.cc"
  140. "graph/load/model_manager/task_info/memcpy_async_task_info.cc"
  141. "graph/load/model_manager/task_info/model_exit_task_info.cc"
  142. "graph/load/model_manager/task_info/profiler_trace_task_info.cc"
  143. "graph/load/model_manager/task_info/stream_active_task_info.cc"
  144. "graph/load/model_manager/task_info/stream_switch_task_info.cc"
  145. "graph/load/model_manager/task_info/stream_switchn_task_info.cc"
  146. "graph/load/model_manager/task_info/super_kernel/super_kernel.cc"
  147. "graph/load/model_manager/task_info/super_kernel/super_kernel_factory.cc"
  148. "graph/load/model_manager/task_info/task_info.cc"
  149. "graph/load/model_manager/tbe_handle_store.cc"
  150. "graph/load/model_manager/zero_copy_offset.cc"
  151. "graph/load/model_manager/zero_copy_task.cc"
  152. "graph/manager/graph_caching_allocator.cc"
  153. "graph/manager/graph_manager_utils.cc"
  154. "graph/manager/graph_mem_allocator.cc"
  155. "graph/manager/graph_mem_manager.cc"
  156. "graph/manager/graph_var_manager.cc"
  157. "graph/manager/host_mem_allocator.cc"
  158. "graph/manager/host_mem_manager.cc"
  159. #"graph/manager/memory_api.cc" # Just for runner.
  160. "graph/manager/rdma_pool_allocator.cc"
  161. "graph/manager/session_scope_mem_allocator.cc"
  162. "graph/manager/trans_var_data_utils.cc"
  163. "graph/manager/util/debug.cc"
  164. #"graph/manager/util/hcom_util.cc" # Just for runner.
  165. "graph/passes/pass_utils.cc"
  166. "host_kernels/add_kernel.cc"
  167. "host_kernels/broadcast_args_kernel.cc"
  168. "host_kernels/broadcast_gradient_args_kernel.cc"
  169. "host_kernels/cast_kernel.cc"
  170. "host_kernels/concat_offset_kernel.cc"
  171. "host_kernels/concat_v2_kernel.cc"
  172. "host_kernels/dynamic_stitch_kernel.cc"
  173. "host_kernels/empty_kernel.cc"
  174. "host_kernels/expanddims_kernel.cc"
  175. "host_kernels/fill_kernel.cc"
  176. "host_kernels/floordiv_kernel.cc"
  177. "host_kernels/floormod_kernel.cc"
  178. "host_kernels/gather_v2_kernel.cc"
  179. "host_kernels/greater_kernel.cc"
  180. "host_kernels/identity_kernel.cc"
  181. "host_kernels/kernel_utils.cc"
  182. "host_kernels/maximum_kernel.cc"
  183. "host_kernels/mul_kernel.cc"
  184. "host_kernels/pack_kernel.cc"
  185. "host_kernels/permute_kernel.cc"
  186. "host_kernels/range_kernel.cc"
  187. "host_kernels/rank_kernel.cc"
  188. "host_kernels/reduce_prod_kernel.cc"
  189. "host_kernels/reformat_kernel.cc"
  190. "host_kernels/reshape_kernel.cc"
  191. "host_kernels/rsqrt_kernel.cc"
  192. "host_kernels/shape_kernel.cc"
  193. "host_kernels/shape_n_kernel.cc"
  194. "host_kernels/size_kernel.cc"
  195. "host_kernels/slice_d_kernel.cc"
  196. "host_kernels/slice_kernel.cc"
  197. "host_kernels/squeeze_kernel.cc"
  198. "host_kernels/ssd_prior_box_kernel.cc"
  199. "host_kernels/strided_slice_kernel.cc"
  200. "host_kernels/sub_kernel.cc"
  201. "host_kernels/transdata_kernel.cc"
  202. "host_kernels/transpose_kernel.cc"
  203. "host_kernels/unpack_kernel.cc"
  204. "host_kernels/unsqueeze_kernel.cc"
  205. "hybrid/common/npu_memory_allocator.cc"
  206. "hybrid/common/tensor_value.cc"
  207. "hybrid/executor/hybrid_execution_context.cc"
  208. "hybrid/executor/hybrid_model_async_executor.cc"
  209. "hybrid/executor/hybrid_model_executor.cc"
  210. "hybrid/executor/hybrid_model_pipeline_executor.cc"
  211. "hybrid/executor/hybrid_profiler.cc"
  212. "hybrid/executor/node_done_manager.cc"
  213. "hybrid/executor/node_state.cc"
  214. "hybrid/executor/rt_callback_manager.cc"
  215. "hybrid/executor/subgraph_context.cc"
  216. "hybrid/executor/subgraph_executor.cc"
  217. "hybrid/executor/worker/execution_engine.cc"
  218. "hybrid/executor/worker/shape_inference_engine.cc"
  219. "hybrid/executor/worker/task_compile_engine.cc"
  220. "hybrid/hybrid_davinci_model.cc"
  221. "hybrid/model/graph_item.cc"
  222. "hybrid/model/hybrid_model.cc"
  223. "hybrid/model/hybrid_model_builder.cc"
  224. "hybrid/model/node_item.cc"
  225. "hybrid/node_executor/aicore/aicore_node_executor.cc"
  226. "hybrid/node_executor/aicore/aicore_op_task.cc"
  227. "hybrid/node_executor/aicore/aicore_task_builder.cc"
  228. "hybrid/node_executor/aicore/aicore_task_compiler.cc"
  229. "hybrid/node_executor/aicpu/aicpu_ext_info.cc"
  230. "hybrid/node_executor/aicpu/aicpu_node_executor.cc"
  231. "hybrid/node_executor/compiledsubgraph/known_node_executor.cc"
  232. "hybrid/node_executor/controlop/control_op_executor.cc"
  233. "hybrid/node_executor/ge_local/ge_local_node_executor.cc"
  234. #"hybrid/node_executor/hccl/hccl_node_executor.cc" # Just for runner.
  235. "hybrid/node_executor/host_cpu/host_cpu_node_executor.cc"
  236. "hybrid/node_executor/node_executor.cc"
  237. "hybrid/node_executor/partitioned_call/partitioned_call_node_executor.cc"
  238. "hybrid/node_executor/rts/rts_node_executor.cc"
  239. "hybrid/node_executor/rts/rts_node_task.cc"
  240. "hybrid/node_executor/rts/rts_task_factory.cc"
  241. "hybrid/node_executor/task_context.cc"
  242. "init/gelib.cc"
  243. "model/ge_model.cc"
  244. "model/ge_root_model.cc"
  245. "opskernel_manager/ops_kernel_builder_manager.cc"
  246. "opskernel_manager/ops_kernel_manager.cc"
  247. "single_op/single_op.cc"
  248. "single_op/single_op_manager.cc"
  249. "single_op/single_op_model.cc"
  250. "single_op/stream_resource.cc"
  251. "single_op/task/aicpu_kernel_task_builder.cc"
  252. "single_op/task/aicpu_task_builder.cc"
  253. "single_op/task/build_task_utils.cc"
  254. "single_op/task/op_task.cc"
  255. "single_op/task/rts_kernel_task_builder.cc"
  256. "single_op/task/tbe_task_builder.cc"
  257. )
  258. ##################################################################
  259. set(COMPILER_SRC_LIST
  260. "analyzer/analyzer.cc"
  261. "common/dump/dump_manager.cc"
  262. "common/dump/dump_op.cc"
  263. "common/dump/dump_properties.cc"
  264. "common/formats/format_transfers/datatype_transfer.cc"
  265. "common/formats/format_transfers/format_transfer_c1hwncoc0_hwcn.cc"
  266. "common/formats/format_transfers/format_transfer_dhwcn_fracz3D.cc"
  267. "common/formats/format_transfers/format_transfer_dhwnc_fracz3D_transpose.cc"
  268. "common/formats/format_transfers/format_transfer_fractal_nz.cc"
  269. "common/formats/format_transfers/format_transfer_fractal_z.cc"
  270. "common/formats/format_transfers/format_transfer_fractal_zz.cc"
  271. "common/formats/format_transfers/format_transfer_fracz_hwcn.cc"
  272. "common/formats/format_transfers/format_transfer_fracz_nchw.cc"
  273. "common/formats/format_transfers/format_transfer_fracz_nhwc.cc"
  274. "common/formats/format_transfers/format_transfer_hwcn_c1hwncoc0.cc"
  275. "common/formats/format_transfers/format_transfer_nc1hwc0_nchw.cc"
  276. "common/formats/format_transfers/format_transfer_nc1hwc0_nhwc.cc"
  277. "common/formats/format_transfers/format_transfer_nchw_fz_c04.cc"
  278. "common/formats/format_transfers/format_transfer_nchw_nc1hwc0.cc"
  279. "common/formats/format_transfers/format_transfer_nhwc_nc1hwc0.cc"
  280. "common/formats/format_transfers/format_transfer_transpose.cc"
  281. "common/formats/formats.cc"
  282. "common/formats/utils/formats_trans_utils.cc"
  283. "common/fp16_t.cc"
  284. "common/ge/op_tiling_manager.cc"
  285. "common/ge/plugin_manager.cc"
  286. "common/helper/model_cache_helper.cc"
  287. "common/profiling/profiling_manager.cc"
  288. "engine_manager/dnnengine_manager.cc"
  289. "ge_local_engine/engine/host_cpu_engine.cc"
  290. "ge_opt_info/ge_opt_info.cc"
  291. "generator/ge_generator.cc"
  292. "generator/generator_api.cc"
  293. "graph/build/graph_builder.cc"
  294. "graph/build/label_allocator.cc"
  295. "graph/build/logical_stream_allocator.cc"
  296. "graph/build/memory/binary_block_mem_assigner.cc"
  297. "graph/build/memory/block_mem_assigner.cc"
  298. "graph/build/memory/buffer_pool_mem_assigner.cc"
  299. "graph/build/memory/graph_mem_assigner.cc"
  300. "graph/build/memory/hybrid_mem_assigner.cc"
  301. "graph/build/memory/max_block_mem_assigner.cc"
  302. "graph/build/memory/memory_assigner.cc"
  303. "graph/build/memory/var_mem_assign_util.cc"
  304. "graph/build/model_builder.cc"
  305. "graph/build/run_context.cc"
  306. "graph/build/stream_allocator.cc"
  307. "graph/build/stream_graph_optimizer.cc"
  308. "graph/build/task_generator.cc"
  309. "graph/common/bcast.cc"
  310. "graph/common/local_context.cc"
  311. "graph/common/omg_util.cc"
  312. "graph/common/transop_util.cc"
  313. "graph/label/case_label_maker.cc"
  314. "graph/label/if_label_maker.cc"
  315. "graph/label/label_maker.cc"
  316. "graph/label/partitioned_call_label_maker.cc"
  317. "graph/label/while_label_maker.cc"
  318. "graph/load/model_manager/model_utils.cc"
  319. "graph/manager/graph_caching_allocator.cc"
  320. "graph/manager/graph_context.cc"
  321. "graph/manager/graph_manager.cc"
  322. "graph/manager/graph_manager_utils.cc"
  323. "graph/manager/graph_mem_allocator.cc"
  324. "graph/manager/graph_mem_manager.cc"
  325. "graph/manager/graph_var_manager.cc"
  326. "graph/manager/host_mem_allocator.cc"
  327. "graph/manager/host_mem_manager.cc"
  328. "graph/manager/model_manager/event_manager.cc"
  329. "graph/manager/rdma_pool_allocator.cc"
  330. "graph/manager/session_scope_mem_allocator.cc"
  331. "graph/manager/trans_var_data_utils.cc"
  332. "graph/manager/util/debug.cc"
  333. "graph/manager/util/rt_context_util.cc"
  334. "graph/manager/util/variable_accelerate_ctrl.cc"
  335. "graph/optimize/graph_optimize.cc"
  336. "graph/optimize/mem_rw_conflict_optimize.cc"
  337. "graph/optimize/summary_optimize.cc"
  338. "graph/partition/dynamic_shape_partition.cc"
  339. "graph/partition/engine_place.cc"
  340. "graph/partition/graph_partition.cc"
  341. "graph/partition/stage_partition.cc"
  342. "graph/passes/addn_pass.cc"
  343. "graph/passes/aicpu_constant_folding_pass.cc"
  344. "graph/passes/assert_pass.cc"
  345. "graph/passes/assign_remove_pass.cc"
  346. "graph/passes/atomic_addr_clean_pass.cc"
  347. "graph/passes/attach_stream_label_pass.cc"
  348. "graph/passes/base_pass.cc"
  349. "graph/passes/bitcast_pass.cc"
  350. "graph/passes/buffer_pool_memory_pass.cc"
  351. "graph/passes/cast_remove_pass.cc"
  352. "graph/passes/cast_translate_pass.cc"
  353. "graph/passes/common_subexpression_elimination_pass.cc"
  354. "graph/passes/compile_nodes_pass.cc"
  355. "graph/passes/cond_pass.cc"
  356. "graph/passes/cond_remove_pass.cc"
  357. "graph/passes/constant_folding_pass.cc"
  358. "graph/passes/constant_fuse_same_pass.cc"
  359. "graph/passes/control_trigger_pass.cc"
  360. "graph/passes/ctrl_edge_transfer_pass.cc"
  361. "graph/passes/data_pass.cc"
  362. "graph/passes/dimension_adjust_pass.cc"
  363. "graph/passes/dimension_compute_pass.cc"
  364. "graph/passes/dropout_pass.cc"
  365. "graph/passes/end_of_sequence_add_control_pass.cc"
  366. "graph/passes/enter_pass.cc"
  367. "graph/passes/flow_ctrl_pass.cc"
  368. "graph/passes/folding_pass.cc"
  369. "graph/passes/for_pass.cc"
  370. "graph/passes/fuse_data_nodes_with_common_input_pass.cc"
  371. "graph/passes/get_original_format_pass.cc"
  372. "graph/passes/global_step_insert_pass.cc"
  373. "graph/passes/guarantee_const_pass.cc"
  374. "graph/passes/hccl_continuous_memcpy_pass.cc"
  375. "graph/passes/hccl_group_pass.cc"
  376. "graph/passes/hccl_memcpy_pass.cc"
  377. "graph/passes/hccl_tailing_optimization_pass.cc"
  378. "graph/passes/identity_pass.cc"
  379. "graph/passes/infer_base_pass.cc"
  380. "graph/passes/infer_value_range_pass.cc"
  381. "graph/passes/infershape_pass.cc"
  382. "graph/passes/inplace_support_check_pass.cc"
  383. "graph/passes/input_output_connection_identify_pass.cc"
  384. "graph/passes/iterator_op_pass.cc"
  385. "graph/passes/link_gen_mask_nodes_pass.cc"
  386. "graph/passes/mark_agnostic_pass.cc"
  387. "graph/passes/mark_force_unknown_for_cond_pass.cc"
  388. "graph/passes/mark_graph_unknown_status_pass.cc"
  389. "graph/passes/mark_node_unknown_shape_pass.cc"
  390. "graph/passes/mark_same_addr_pass.cc"
  391. "graph/passes/memcpy_addr_async_pass.cc"
  392. "graph/passes/merge_input_memcpy_pass.cc"
  393. "graph/passes/merge_pass.cc"
  394. "graph/passes/merge_to_stream_merge_pass.cc"
  395. "graph/passes/multi_batch_clone_pass.cc"
  396. "graph/passes/multi_batch_pass.cc"
  397. "graph/passes/net_output_pass.cc"
  398. "graph/passes/next_iteration_pass.cc"
  399. "graph/passes/no_use_reshape_remove_pass.cc"
  400. "graph/passes/parallel_concat_start_op_pass.cc"
  401. "graph/passes/parallel_group_pass.cc"
  402. "graph/passes/pass_manager.cc"
  403. "graph/passes/pass_utils.cc"
  404. "graph/passes/permute_pass.cc"
  405. "graph/passes/placeholder_with_default_pass.cc"
  406. "graph/passes/prevent_gradient_pass.cc"
  407. "graph/passes/print_op_pass.cc"
  408. "graph/passes/prune_pass.cc"
  409. "graph/passes/ref_identity_delete_op_pass.cc"
  410. "graph/passes/remove_same_const_pass.cc"
  411. "graph/passes/replace_transshape_pass.cc"
  412. "graph/passes/replace_with_empty_const_pass.cc"
  413. "graph/passes/reshape_recovery_pass.cc"
  414. "graph/passes/reshape_remove_pass.cc"
  415. "graph/passes/resource_pair_add_control_pass.cc"
  416. "graph/passes/resource_pair_remove_control_pass.cc"
  417. "graph/passes/same_transdata_breadth_fusion_pass.cc"
  418. "graph/passes/save_pass.cc"
  419. "graph/passes/set_input_output_offset_pass.cc"
  420. "graph/passes/shape_operate_op_remove_pass.cc"
  421. "graph/passes/snapshot_pass.cc"
  422. "graph/passes/stop_gradient_pass.cc"
  423. "graph/passes/subexpression_migration_pass.cc"
  424. "graph/passes/subgraph_const_migration_pass.cc"
  425. "graph/passes/subgraph_pass.cc"
  426. "graph/passes/switch_data_edges_bypass.cc"
  427. "graph/passes/switch_dead_branch_elimination.cc"
  428. "graph/passes/switch_logic_remove_pass.cc"
  429. "graph/passes/switch_to_stream_switch_pass.cc"
  430. "graph/passes/transop_breadth_fusion_pass.cc"
  431. "graph/passes/transop_depth_fusion_pass.cc"
  432. "graph/passes/transop_nearby_allreduce_fusion_pass.cc"
  433. "graph/passes/transop_symmetry_elimination_pass.cc"
  434. "graph/passes/transop_without_reshape_fusion_pass.cc"
  435. "graph/passes/transpose_transdata_pass.cc"
  436. "graph/passes/unused_args_clean_pass.cc"
  437. "graph/passes/unused_const_pass.cc"
  438. "graph/passes/useless_control_out_remove_pass.cc"
  439. "graph/passes/var_is_initialized_op_pass.cc"
  440. "graph/passes/variable_op_pass.cc"
  441. "graph/passes/variable_prepare_op_pass.cc"
  442. "graph/passes/variable_ref_delete_op_pass.cc"
  443. "graph/passes/variable_ref_useless_control_out_delete_pass.cc"
  444. "graph/preprocess/graph_preprocess.cc"
  445. "graph/preprocess/insert_op/ge_aipp_op.cc"
  446. "graph/preprocess/insert_op/util_insert_aipp_op.cc"
  447. "graph/preprocess/multi_batch_copy_graph.cc"
  448. "graph/preprocess/multi_batch_options.cc"
  449. "host_kernels/add_kernel.cc"
  450. "host_kernels/broadcast_args_kernel.cc"
  451. "host_kernels/broadcast_gradient_args_kernel.cc"
  452. "host_kernels/cast_kernel.cc"
  453. "host_kernels/concat_offset_kernel.cc"
  454. "host_kernels/concat_v2_kernel.cc"
  455. "host_kernels/dynamic_stitch_kernel.cc"
  456. "host_kernels/empty_kernel.cc"
  457. "host_kernels/expanddims_kernel.cc"
  458. "host_kernels/fill_kernel.cc"
  459. "host_kernels/floordiv_kernel.cc"
  460. "host_kernels/floormod_kernel.cc"
  461. "host_kernels/gather_v2_kernel.cc"
  462. "host_kernels/greater_kernel.cc"
  463. "host_kernels/identity_kernel.cc"
  464. "host_kernels/kernel_utils.cc"
  465. "host_kernels/maximum_kernel.cc"
  466. "host_kernels/mul_kernel.cc"
  467. "host_kernels/pack_kernel.cc"
  468. "host_kernels/permute_kernel.cc"
  469. "host_kernels/range_kernel.cc"
  470. "host_kernels/rank_kernel.cc"
  471. "host_kernels/reduce_prod_kernel.cc"
  472. "host_kernels/reformat_kernel.cc"
  473. "host_kernels/reshape_kernel.cc"
  474. "host_kernels/rsqrt_kernel.cc"
  475. "host_kernels/shape_kernel.cc"
  476. "host_kernels/shape_n_kernel.cc"
  477. "host_kernels/size_kernel.cc"
  478. "host_kernels/slice_d_kernel.cc"
  479. "host_kernels/slice_kernel.cc"
  480. "host_kernels/squeeze_kernel.cc"
  481. "host_kernels/ssd_prior_box_kernel.cc"
  482. "host_kernels/strided_slice_kernel.cc"
  483. "host_kernels/sub_kernel.cc"
  484. "host_kernels/transdata_kernel.cc"
  485. "host_kernels/transpose_kernel.cc"
  486. "host_kernels/unpack_kernel.cc"
  487. "host_kernels/unsqueeze_kernel.cc"
  488. "hybrid/node_executor/aicpu/aicpu_ext_info.cc"
  489. "init/gelib.cc"
  490. "ir_build/attr_options/keep_dtype_option.cc"
  491. "ir_build/attr_options/utils.cc"
  492. "ir_build/attr_options/weight_compress_option.cc"
  493. "ir_build/ge_ir_build.cc"
  494. "ir_build/option_utils.cc"
  495. "model/ge_model.cc"
  496. "model/ge_root_model.cc"
  497. "opskernel_manager/ops_kernel_builder_manager.cc"
  498. "opskernel_manager/ops_kernel_manager.cc"
  499. )
  500. set(RUNNER_SRC_LIST
  501. "client/ge_api.cc"
  502. "session/inner_session.cc"
  503. "session/session_manager.cc"
  504. "common/profiling/ge_runner_profiling.cc"
  505. "graph/manager/memory_api.cc"
  506. "graph/manager/util/hcom_util.cc"
  507. "graph/load/model_manager/task_info/hccl_task_info.cc"
  508. "hybrid/node_executor/hccl/hccl_node_executor.cc"
  509. )
  510. if (NOT ENABLE_D AND NOT ENABLE_ACL AND NOT ENABLE_MS_TESTCASES)
  511. message("CMAKE_CXX_COMPILER_VERSION = ${CMAKE_CXX_COMPILER_VERSION}")
  512. ############ libge_runner.so ############
  513. add_library(ge_runner SHARED
  514. ${EXECUTOR_SRC_LIST}
  515. ${COMPILER_SRC_LIST}
  516. ${RUNNER_SRC_LIST}
  517. $<TARGET_OBJECTS:$<IF:$<TARGET_EXISTS:msprofiler_fwk>,msprofiler_fwk,msprofiler_fwk_object>>
  518. )
  519. add_library(msprofiler_fwk_object OBJECT IMPORTED GLOBAL)
  520. if (msprofiler_fwk_ext_LIBRARY_DIR)
  521. file(MAKE_DIRECTORY ${CMAKE_CURRENT_BINARY_DIR}/msprofiler_fwk_object)
  522. execute_process(
  523. COMMAND ar x ${msprofiler_fwk_ext_LIBRARY_DIR}
  524. WORKING_DIRECTORY ${CMAKE_CURRENT_BINARY_DIR}/msprofiler_fwk_object
  525. )
  526. file(GLOB MSPROFILER_FWK_OBJECT_LIST ${CMAKE_CURRENT_BINARY_DIR}/msprofiler_fwk_object/*.o)
  527. set_property(TARGET msprofiler_fwk_object PROPERTY IMPORTED_OBJECTS ${MSPROFILER_FWK_OBJECT_LIST})
  528. endif()
  529. target_compile_definitions(ge_runner PRIVATE
  530. PROTOBUF_INLINE_NOT_IN_HEADERS=0
  531. DAVINCI_SUPPORT_PROFILING
  532. REUSE_MEMORY=1
  533. FMK_SUPPORT_DUMP
  534. DAVINCI_CLOUD
  535. google=ascend_private
  536. FUNC_VISIBILITY
  537. $<$<STREQUAL:${ENABLE_OPEN_SRC},True>:ONLY_COMPILE_OPEN_SRC>
  538. )
  539. target_compile_options(ge_runner PRIVATE
  540. -O2
  541. -fno-common
  542. -fvisibility=hidden
  543. $<$<STREQUAL:${CMAKE_CXX_COMPILER_VERSION},7.3.0>:-Werror=unused-variable>
  544. $<$<STREQUAL:${CMAKE_CXX_COMPILER_VERSION},7.3.0>:-Werror=unused-const-variable -Werror=format>
  545. )
  546. target_include_directories(ge_runner SYSTEM PRIVATE
  547. ${GE_CODE_DIR}/ge
  548. ${GE_CODE_DIR}/inc
  549. ${GE_CODE_DIR}/inc/external
  550. ${GE_CODE_DIR}/inc/framework
  551. ${METADEF_DIR}/inc
  552. ${METADEF_DIR}/inc/external
  553. ${CMAKE_BINARY_DIR}
  554. ${CMAKE_BINARY_DIR}/proto/graphengine_protos
  555. #### yellow zone ####
  556. ${GE_CODE_DIR}/../inc
  557. ${GE_CODE_DIR}/../toolchain/ide/ide-daemon/external
  558. ${GE_CODE_DIR}/../abl/adump/external
  559. ${GE_CODE_DIR}/../abl/licctrl
  560. ${GE_CODE_DIR}/../ace/comop/inc
  561. ${GE_CODE_DIR}/../ace/comop/inc/external
  562. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:${GE_DEPEND_DIR}/inc>
  563. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:$<TARGET_PROPERTY:runtime_headers,INTERFACE_INCLUDE_DIRECTORIES>>
  564. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:$<TARGET_PROPERTY:cce_headers,INTERFACE_INCLUDE_DIRECTORIES>>
  565. #### blue zone ####
  566. ${ASCEND_DIR}/driver/include
  567. ${ASCEND_DIR}/fwkacllib/include
  568. $<$<BOOL:${ENABLE_OPEN_SRC}>:${GE_CODE_DIR}/third_party/fwkacllib/inc>
  569. $<$<BOOL:${ENABLE_OPEN_SRC}>:${GE_CODE_DIR}/third_party/fwkacllib/inc/toolchain>
  570. $<$<BOOL:${ENABLE_OPEN_SRC}>:${GE_CODE_DIR}/third_party/fwkacllib/inc/opt_info>
  571. )
  572. target_link_options(ge_runner PRIVATE
  573. -Wl,-Bsymbolic
  574. )
  575. target_link_libraries(ge_runner PRIVATE
  576. $<BUILD_INTERFACE:intf_pub>
  577. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:$<BUILD_INTERFACE:slog_headers>>
  578. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:$<BUILD_INTERFACE:msprof_headers>>
  579. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:$<BUILD_INTERFACE:mmpa_headers>>
  580. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:$<BUILD_INTERFACE:runtime_headers>>
  581. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:$<BUILD_INTERFACE:cce_headers>>
  582. adump_server
  583. static_mmpa
  584. ge_proto_common
  585. ge_proto_client
  586. -Wl,--no-as-needed
  587. graph
  588. ge_common
  589. ascend_protobuf
  590. register
  591. c_sec
  592. slog
  593. runtime
  594. error_manager
  595. ascend_hal_stub
  596. opt_feature
  597. -Wl,--as-needed
  598. json
  599. -lrt
  600. -ldl
  601. )
  602. ############ libge_compiler.so ############
  603. add_library(ge_compiler SHARED
  604. ${COMPILER_SRC_LIST}
  605. )
  606. add_dependencies(ge_compiler
  607. graphengine_protos
  608. )
  609. target_compile_definitions(ge_compiler PRIVATE
  610. PROTOBUF_INLINE_NOT_IN_HEADERS=0
  611. REUSE_MEMORY=1
  612. FMK_SUPPORT_DUMP
  613. FMK_HOST_INFER
  614. COMPILE_OMG_PACKAGE
  615. google=ascend_private
  616. FUNC_VISIBILITY
  617. $<$<STREQUAL:${ENABLE_OPEN_SRC},True>:ONLY_COMPILE_OPEN_SRC>
  618. )
  619. target_compile_options(ge_compiler PRIVATE
  620. -O2
  621. -fno-common
  622. -fvisibility=hidden
  623. $<$<STREQUAL:${CMAKE_CXX_COMPILER_VERSION},7.3.0>:-Werror=unused-variable>
  624. $<$<STREQUAL:${CMAKE_CXX_COMPILER_VERSION},7.3.0>:-Werror=unused-const-variable -Werror=format>
  625. )
  626. target_include_directories(ge_compiler SYSTEM PRIVATE
  627. ${GE_CODE_DIR}/ge
  628. ${GE_CODE_DIR}/inc
  629. ${GE_CODE_DIR}/inc/external
  630. ${GE_CODE_DIR}/inc/framework
  631. ${METADEF_DIR}/inc
  632. ${METADEF_DIR}/inc/external
  633. ${CMAKE_BINARY_DIR}
  634. ${CMAKE_BINARY_DIR}/proto/graphengine_protos
  635. #### yellow zone ####
  636. ${GE_CODE_DIR}/../inc
  637. ${GE_CODE_DIR}/../toolchain/ide/ide-daemon/external
  638. ${GE_CODE_DIR}/../abl/adump/external
  639. ${GE_CODE_DIR}/../abl/licctrl
  640. ${GE_CODE_DIR}/../ace/comop/inc
  641. ${GE_CODE_DIR}/../ace/comop/inc/external
  642. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:${GE_DEPEND_DIR}/inc>
  643. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:$<TARGET_PROPERTY:runtime_headers,INTERFACE_INCLUDE_DIRECTORIES>>
  644. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:$<TARGET_PROPERTY:cce_headers,INTERFACE_INCLUDE_DIRECTORIES>>
  645. #### blue zone ####
  646. ${ASCEND_DIR}/driver/include
  647. ${ASCEND_DIR}/fwkacllib/include
  648. $<$<BOOL:${ENABLE_OPEN_SRC}>:${GE_CODE_DIR}/third_party/fwkacllib/inc>
  649. $<$<BOOL:${ENABLE_OPEN_SRC}>:${GE_CODE_DIR}/third_party/fwkacllib/inc/toolchain>
  650. $<$<BOOL:${ENABLE_OPEN_SRC}>:${GE_CODE_DIR}/third_party/fwkacllib/inc/opt_info>
  651. )
  652. target_link_options(ge_compiler PRIVATE
  653. -Wl,-Bsymbolic
  654. )
  655. target_link_libraries(ge_compiler PRIVATE
  656. $<BUILD_INTERFACE:intf_pub>
  657. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:$<BUILD_INTERFACE:slog_headers>>
  658. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:$<BUILD_INTERFACE:msprof_headers>>
  659. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:$<BUILD_INTERFACE:mmpa_headers>>
  660. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:$<BUILD_INTERFACE:runtime_headers>>
  661. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:$<BUILD_INTERFACE:cce_headers>>
  662. static_mmpa
  663. ge_proto_common
  664. -Wl,--no-as-needed
  665. graph
  666. ge_common
  667. ascend_protobuf
  668. register
  669. c_sec
  670. error_manager
  671. slog
  672. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:$<BUILD_INTERFACE:runtime>>
  673. $<$<BOOL:${ENABLE_OPEN_SRC}>:$<BUILD_INTERFACE:runtime_compile>>
  674. opt_feature
  675. -Wl,--as-needed
  676. json
  677. -lrt
  678. -ldl
  679. )
  680. ######## libge_executor.a ########
  681. add_library(ge_executor STATIC
  682. ${EXECUTOR_SRC_LIST}
  683. )
  684. add_dependencies(ge_executor
  685. graphengine_protos
  686. )
  687. target_compile_options(ge_executor PRIVATE
  688. $<$<OR:$<STREQUAL:${TARGET_SYSTEM_NAME},Linux>,$<STREQUAL:${TARGET_SYSTEM_NAME},Android>>:-fvisibility=hidden -O2 -Werror -Wno-deprecated-declarations -fno-common>
  689. $<$<AND:$<STREQUAL:${TARGET_SYSTEM_NAME},Windows>,$<STREQUAL:${CMAKE_CONFIGURATION_TYPES},Debug>>:/MTd>
  690. $<$<AND:$<STREQUAL:${TARGET_SYSTEM_NAME},Windows>,$<STREQUAL:${CMAKE_CONFIGURATION_TYPES},Release>>:/MT>
  691. $<$<STREQUAL:${CMAKE_CXX_COMPILER_VERSION},7.3.0>:-Werror=unused-variable>
  692. $<$<STREQUAL:${CMAKE_CXX_COMPILER_VERSION},7.3.0>:-Werror=unused-const-variable -Werror=format>
  693. )
  694. target_compile_definitions(ge_executor PRIVATE
  695. PROTOBUF_INLINE_NOT_IN_HEADERS=0
  696. DAVINCI_SUPPORT_PROFILING
  697. google=ascend_private
  698. $<IF:$<STREQUAL:${TARGET_SYSTEM_NAME},Windows>,OS_TYPE=WIN,OS_TYPE=0>
  699. $<$<STREQUAL:${TARGET_SYSTEM_NAME},Windows>:SECUREC_USING_STD_SECURE_LIB=0 NOMINMAX>
  700. $<$<STREQUAL:${ENABLE_OPEN_SRC},True>:ONLY_COMPILE_OPEN_SRC>
  701. LOG_CPP
  702. )
  703. target_include_directories(ge_executor SYSTEM PRIVATE
  704. ${GE_CODE_DIR}/ge
  705. ${GE_CODE_DIR}/inc
  706. ${GE_CODE_DIR}/inc/external
  707. ${GE_CODE_DIR}/inc/framework
  708. ${METADEF_DIR}/inc
  709. ${METADEF_DIR}/inc/external
  710. ${CMAKE_BINARY_DIR}
  711. ${CMAKE_BINARY_DIR}/proto/graphengine_protos
  712. #### yellow zone ####
  713. ${GE_CODE_DIR}/../ace/comop/inc
  714. ${GE_CODE_DIR}/../ace/comop/inc/external
  715. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:${GE_DEPEND_DIR}/inc>
  716. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:$<TARGET_PROPERTY:runtime_headers,INTERFACE_INCLUDE_DIRECTORIES>>
  717. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:$<TARGET_PROPERTY:cce_headers,INTERFACE_INCLUDE_DIRECTORIES>>
  718. #### blue zone ####
  719. $<$<BOOL:${ENABLE_OPEN_SRC}>:${GE_CODE_DIR}/third_party/fwkacllib/inc>
  720. $<$<BOOL:${ENABLE_OPEN_SRC}>:${GE_CODE_DIR}/third_party/fwkacllib/inc/toolchain>
  721. )
  722. target_link_libraries(ge_executor PRIVATE
  723. $<BUILD_INTERFACE:intf_pub>
  724. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:$<BUILD_INTERFACE:slog_headers>>
  725. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:$<BUILD_INTERFACE:msprof_headers>>
  726. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:$<BUILD_INTERFACE:mmpa_headers>>
  727. json
  728. ge_proto_client
  729. ascend_protobuf_static
  730. c_sec
  731. $<$<NOT:$<STREQUAL:${TARGET_SYSTEM_NAME},Android>>:-lrt>
  732. -ldl
  733. )
  734. ######## libge_executor.so ########
  735. add_library(ge_executor_shared SHARED
  736. ${EXECUTOR_SRC_LIST}
  737. )
  738. add_dependencies(ge_executor_shared
  739. graphengine_protos
  740. )
  741. target_compile_options(ge_executor_shared PRIVATE
  742. -fno-common
  743. -Werror
  744. -O2
  745. -Wno-deprecated-declarations
  746. -fvisibility=hidden
  747. )
  748. target_compile_definitions(ge_executor_shared PRIVATE
  749. PROTOBUF_INLINE_NOT_IN_HEADERS=0
  750. DAVINCI_SUPPORT_PROFILING
  751. google=ascend_private
  752. FUNC_VISIBILITY
  753. $<$<STREQUAL:${ENABLE_OPEN_SRC},True>:ONLY_COMPILE_OPEN_SRC>
  754. )
  755. target_include_directories(ge_executor_shared PRIVATE
  756. ${GE_CODE_DIR}/ge
  757. ${GE_CODE_DIR}/inc
  758. ${GE_CODE_DIR}/inc/external
  759. ${GE_CODE_DIR}/inc/framework
  760. ${METADEF_DIR}/inc
  761. ${METADEF_DIR}/inc/external
  762. ${CMAKE_BINARY_DIR}
  763. ${CMAKE_BINARY_DIR}/proto/graphengine_protos
  764. #### yellow zone ####
  765. ${GE_CODE_DIR}/../ace/comop/inc
  766. ${GE_CODE_DIR}/../ace/comop/inc/external
  767. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:${GE_DEPEND_DIR}/inc>
  768. #### blue zone ####
  769. $<$<BOOL:${ENABLE_OPEN_SRC}>:${GE_CODE_DIR}/third_party/fwkacllib/inc>
  770. )
  771. target_link_options(ge_executor_shared PRIVATE
  772. -Wl,-Bsymbolic
  773. -Wl,--exclude-libs,ALL
  774. )
  775. target_link_libraries(ge_executor_shared PRIVATE
  776. $<BUILD_INTERFACE:intf_pub>
  777. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:$<BUILD_INTERFACE:slog_headers>>
  778. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:$<BUILD_INTERFACE:msprof_headers>>
  779. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:$<BUILD_INTERFACE:mmpa_headers>>
  780. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:$<BUILD_INTERFACE:runtime_headers>>
  781. $<$<NOT:$<BOOL:${ENABLE_OPEN_SRC}>>:$<BUILD_INTERFACE:cce_headers>>
  782. -Wl,--no-as-needed
  783. ge_common
  784. ge_proto_client
  785. runtime
  786. slog
  787. graph
  788. register
  789. error_manager
  790. ascend_protobuf
  791. c_sec
  792. -Wl,--as-needed
  793. json
  794. $<$<NOT:$<STREQUAL:${TARGET_SYSTEM_NAME},Android>>:-lrt>
  795. -ldl
  796. )
  797. set_target_properties(ge_executor_shared PROPERTIES
  798. OUTPUT_NAME ge_executor
  799. )
  800. ############ libascendcl.so ############
  801. file(GENERATE OUTPUT ${CMAKE_BINARY_DIR}/dummy.c CONTENT "")
  802. #add_library(dummy_obj OBJECT ${CMAKE_BINARY_DIR}/dummy.c)
  803. #set(DUMMY_OBJ $<TARGET_OBJECTS:dummy_obj>)
  804. file(MAKE_DIRECTORY ${CMAKE_CURRENT_BINARY_DIR}/ascendcl_object)
  805. if(EXISTS ${STATIC_ACL_LIB}/libascendcl.a)
  806. execute_process(
  807. COMMAND ar x ${STATIC_ACL_LIB}/libascendcl.a
  808. WORKING_DIRECTORY ${CMAKE_CURRENT_BINARY_DIR}/ascendcl_object
  809. )
  810. file(GLOB OBJECT_LIST ${CMAKE_CURRENT_BINARY_DIR}/ascendcl_object/*.o)
  811. else()
  812. set(OBJECT_LIST ${CMAKE_BINARY_DIR}/dummy.c)
  813. endif()
  814. add_library(opensrc_ascendcl SHARED
  815. ${OBJECT_LIST}
  816. $<TARGET_OBJECTS:$<IF:$<TARGET_EXISTS:msprofiler>,msprofiler,msprofiler_object>>
  817. )
  818. add_library(msprofiler_object OBJECT IMPORTED GLOBAL)
  819. if (msprofiler_ext_LIBRARY_DIR)
  820. file(MAKE_DIRECTORY ${CMAKE_CURRENT_BINARY_DIR}/msprofiler_object)
  821. execute_process(
  822. COMMAND ar x ${msprofiler_ext_LIBRARY_DIR}
  823. WORKING_DIRECTORY ${CMAKE_CURRENT_BINARY_DIR}/msprofiler_object
  824. )
  825. file(GLOB MSPROFILER_OBJECT_LIST ${CMAKE_CURRENT_BINARY_DIR}/msprofiler_object/*.o)
  826. set_property(TARGET msprofiler_object PROPERTY IMPORTED_OBJECTS ${MSPROFILER_OBJECT_LIST})
  827. endif()
  828. target_compile_definitions(opensrc_ascendcl PRIVATE
  829. google=ascend_private
  830. )
  831. target_compile_options(opensrc_ascendcl PRIVATE
  832. -O2
  833. -fvisibility=hidden
  834. )
  835. target_link_options(opensrc_ascendcl PRIVATE
  836. -rdynamic
  837. -Wl,--allow-multiple-definition
  838. -Wl,-z,muldefs
  839. -Wl,-Bsymbolic
  840. -Wl,--exclude-libs,ALL
  841. )
  842. target_link_libraries(opensrc_ascendcl PRIVATE
  843. -Wl,--whole-archive
  844. ge_executor
  845. ge_common_static
  846. graph_static
  847. static_mmpa
  848. ascend_protobuf_static
  849. register_static
  850. error_manager_static
  851. adump_server
  852. -Wl,--no-whole-archive
  853. -Wl,--no-as-needed
  854. c_sec
  855. runtime
  856. slog
  857. ascend_hal_stub
  858. -Wl,--as-needed
  859. -lrt
  860. -ldl
  861. json
  862. )
  863. set_target_properties(opensrc_ascendcl PROPERTIES
  864. OUTPUT_NAME ascendcl
  865. )
  866. ##################################################################
  867. add_custom_command(
  868. OUTPUT ${CMAKE_CURRENT_BINARY_DIR}/stub_ge_ir_build.cc
  869. ${CMAKE_CURRENT_BINARY_DIR}/stub_ge_api.cc
  870. COMMAND echo "Generating stub files."
  871. && ${HI_PYTHON} ${CMAKE_CURRENT_LIST_DIR}/stub/gen_stubapi.py ${GE_CODE_DIR}/inc/external ${CMAKE_CURRENT_BINARY_DIR}
  872. && mv ge_ir_build.cc stub_ge_ir_build.cc
  873. && mv ge_api.cc stub_ge_api.cc
  874. && echo "Generating stub files end."
  875. #WORKING_DIRECTORY ${CMAKE_CURRENT_BINARY_DIR}
  876. #DEPENDS stub/gen_stubapi.py ${TOP_DIR}/inc/external ${CMAKE_CURRENT_BINARY_DIR}
  877. )
  878. add_custom_target(ge_stub
  879. DEPENDS ${CMAKE_CURRENT_BINARY_DIR}/stub_ge_ir_build.cc
  880. ${CMAKE_CURRENT_BINARY_DIR}/stub_ge_api.cc
  881. )
  882. ##################################################################
  883. ############ stub/libge_compiler.so ############
  884. add_library(atc_stub_ge_compiler SHARED
  885. stub_ge_ir_build.cc
  886. )
  887. add_dependencies(atc_stub_ge_compiler ge_stub)
  888. target_compile_options(atc_stub_ge_compiler PRIVATE
  889. -fno-common
  890. )
  891. target_link_libraries(atc_stub_ge_compiler PRIVATE
  892. $<BUILD_INTERFACE:intf_pub>
  893. )
  894. set_target_properties(atc_stub_ge_compiler PROPERTIES
  895. OUTPUT_NAME ge_compiler
  896. LIBRARY_OUTPUT_DIRECTORY atc_stub
  897. )
  898. target_include_directories(atc_stub_ge_compiler PRIVATE
  899. ${GE_CODE_DIR}/ge
  900. ${GE_CODE_DIR}/inc
  901. ${GE_CODE_DIR}/inc/framework
  902. ${GE_CODE_DIR}/inc/external
  903. ${METADEF_DIR}/inc/external
  904. ${METADEF_DIR}/inc
  905. #### yellow zone ####
  906. ${GE_CODE_DIR}/../inc
  907. ${GE_CODE_DIR}/../toolchain/ide/ide-daemon/external
  908. ${GE_CODE_DIR}/../abl/adump/external
  909. #### blue zone ####
  910. ${ASCEND_DIR}/driver/include
  911. ${ASCEND_DIR}/fwkacllib/include
  912. )
  913. ############ stub/libge_runner.so ############
  914. add_library(fwk_stub_ge_runner SHARED
  915. stub_ge_api.cc
  916. stub_ge_ir_build.cc
  917. )
  918. add_dependencies(fwk_stub_ge_runner ge_stub)
  919. target_compile_options(fwk_stub_ge_runner PRIVATE
  920. -fno-common
  921. )
  922. target_link_libraries(fwk_stub_ge_runner PRIVATE
  923. $<BUILD_INTERFACE:intf_pub>
  924. )
  925. set_target_properties(fwk_stub_ge_runner PROPERTIES
  926. OUTPUT_NAME ge_runner
  927. LIBRARY_OUTPUT_DIRECTORY fwk_stub
  928. )
  929. target_include_directories(fwk_stub_ge_runner PRIVATE
  930. ${GE_CODE_DIR}/ge
  931. ${GE_CODE_DIR}/inc
  932. ${GE_CODE_DIR}/inc/external
  933. ${GE_CODE_DIR}/inc/framework
  934. ${METADEF_DIR}/inc/external
  935. ${METADEF_DIR}/inc
  936. #### yellow zone ####
  937. ${GE_CODE_DIR}/../inc
  938. ${GE_CODE_DIR}/../toolchain/ide/ide-daemon/external
  939. ${GE_CODE_DIR}/../abl/adump/external
  940. #### blue zone ####
  941. ${ASCEND_DIR}/driver/include
  942. ${ASCEND_DIR}/fwkacllib/include
  943. )
  944. ###############################################################
  945. add_custom_target(
  946. engine_conf.json ALL
  947. DEPENDS ${CMAKE_CURRENT_BINARY_DIR}/engine_conf.json
  948. )
  949. add_custom_command(
  950. OUTPUT ${CMAKE_CURRENT_BINARY_DIR}/engine_conf.json
  951. COMMAND cp ${CMAKE_CURRENT_LIST_DIR}/engine_manager/engine_conf.json ${CMAKE_CURRENT_BINARY_DIR}/
  952. )
  953. ###############################################################
  954. add_custom_target(
  955. optimizer_priority.pbtxt ALL
  956. DEPENDS ${CMAKE_CURRENT_BINARY_DIR}/optimizer_priority.pbtxt
  957. )
  958. add_custom_command(
  959. OUTPUT ${CMAKE_CURRENT_BINARY_DIR}/optimizer_priority.pbtxt
  960. COMMAND cp ${CMAKE_CURRENT_LIST_DIR}/opskernel_manager/optimizer_priority.pbtxt ${CMAKE_CURRENT_BINARY_DIR}/
  961. )
  962. ###############################################################
  963. ############ install ############
  964. set(INSTALL_BASE_DIR "")
  965. set(INSTALL_LIBRARY_DIR lib)
  966. install(TARGETS ge_runner ge_compiler ge_executor_shared opensrc_ascendcl OPTIONAL
  967. LIBRARY DESTINATION ${INSTALL_LIBRARY_DIR}
  968. )
  969. install(TARGETS atc_stub_ge_compiler fwk_stub_ge_runner OPTIONAL
  970. LIBRARY DESTINATION ${INSTALL_LIBRARY_DIR}/stub
  971. )
  972. install(FILES
  973. ${CMAKE_CURRENT_BINARY_DIR}/engine_conf.json
  974. ${CMAKE_CURRENT_BINARY_DIR}/optimizer_priority.pbtxt OPTIONAL
  975. DESTINATION ${INSTALL_LIBRARY_DIR}
  976. )
  977. endif()

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用而用户并不感知。GE主要由GE API和GE Core两部分组成,详细的架构图如下所示