|
|
@@ -210,6 +210,85 @@ TEST_F(UtestAicpuNodeExecutor, aicpu_memcopy_task) { |
|
|
|
ASSERT_EQ(aicpu_node_task2.SetMemCopyTask(task_def), FAILED);
|
|
|
|
}
|
|
|
|
|
|
|
|
// Exercises AicpuNodeTask::ReadResultSummaryAndPrepareMemory and
// AicpuNodeTask::CopyDataToHbm on a dynamic FRAMEWORK_OP_TYPE node whose
// shape inference type is DEPEND_COMPUTE, and expects both to return SUCCESS.
TEST_F(UtestAicpuNodeExecutor, aicpu_copy_data_to_hbm) {
  // Input/output counts shared by the node, the graph item and the tensor setup below.
  constexpr int kInputNum = 4;
  constexpr int kOutputNum = 2;

  // Model scaffolding: a root model holding one (empty) sub model.
  ComputeGraphPtr graph = std::make_shared<ComputeGraph>("test");
  GeModelPtr ge_sub_model = std::make_shared<GeModel>();
  GeRootModelPtr ge_root_model = std::make_shared<GeRootModel>(graph);
  ge_root_model->SetModelName("test_name");
  ge_root_model->SetSubgraphInstanceNameToModel("sub", ge_sub_model);
  HybridModel hybrid_model(ge_root_model);

  // NOTE(review): the trailing arguments of CreateNode are presumably the input and
  // output counts; they match total_inputs_/total_outputs_ set below - confirm.
  NodePtr node = CreateNode(graph, "frameworkop", FRAMEWORK_OP_TYPE, kInputNum, kOutputNum);

  std::unique_ptr<NodeItem> new_node;
  ASSERT_EQ(NodeItem::Create(node, new_node), SUCCESS);
  // Keep a raw observer; ownership of the NodeItem moves into hybrid_model.
  NodeItem *node_item = new_node.get();
  hybrid_model.node_items_[node] = std::move(new_node);
  node_item->input_start = 0;
  node_item->output_start = 0;
  node_item->is_dynamic = true;
  node_item->shape_inference_type = DEPEND_COMPUTE;
  node_item->num_outputs = kOutputNum;

  GraphItem graph_item;
  graph_item.node_items_.emplace_back(node_item);
  graph_item.total_inputs_ = kInputNum;
  graph_item.total_outputs_ = kOutputNum;

  GraphExecutionContext graph_context;
  SubgraphContext subgraph_context(&graph_item, &graph_context);
  ASSERT_EQ(subgraph_context.Init(), SUCCESS);
  graph_context.callback_manager = std::unique_ptr<CallbackManager>(new CallbackManager());

  auto node_state = subgraph_context.GetOrCreateNodeState(node_item);
  ASSERT_NE(node_state, nullptr);

  // Backing storage lives at function scope so the tensors never point at a dead
  // loop-local, and every input slot (not just slot 0) receives a tensor.
  uint64_t input_values[kInputNum];
  for (int i = 0; i < kInputNum; ++i) {
    input_values[i] = 512;
    TensorValue in_tensor(&input_values[i], sizeof(input_values[i]));
    subgraph_context.SetInput(*node_item, i, in_tensor);
  }

  uint64_t value_0 = 512;
  TensorValue out_tensor0(&value_0, sizeof(value_0));
  subgraph_context.SetOutput(*node_item, 0, out_tensor0);

  uint64_t value_1 = 512;
  TensorValue out_tensor1(&value_1, sizeof(value_1));
  subgraph_context.SetOutput(*node_item, 1, out_tensor1);

  // task
  domi::TaskDef task_def;
  // Value-initialize so the bytes copied into the kernel args are deterministic.
  AicpuTaskStruct args{};
  args.head.length = sizeof(args);
  args.head.ioAddrNum = kInputNum + kOutputNum;
  task_def.set_type(RT_MODEL_TASK_ALL_KERNEL);
  domi::KernelDef *kernel_def = task_def.mutable_kernel();
  kernel_def->set_args(reinterpret_cast<const char *>(&args), args.head.length);
  kernel_def->set_args_size(args.head.length);

  // Ext info = AicpuExtInfo header followed by an int32_t payload carrying the node's
  // shape inference type. It is assembled directly inside a buffer large enough for
  // both parts, so nothing is written or read past the end of a header-sized object,
  // and the buffer is released automatically even if an ASSERT_* below returns early.
  const size_t ext_info_size = sizeof(AicpuExtInfo) + sizeof(int32_t);
  std::vector<char> ext_mem(ext_info_size, 0);
  AicpuExtInfo *aicpu_ext_info = reinterpret_cast<AicpuExtInfo *>(ext_mem.data());
  aicpu_ext_info->infoType = aicpu::FWKAdapter::FWK_ADPT_EXT_SHAPE_TYPE;
  aicpu_ext_info->infoLen = sizeof(int32_t);
  int32_t type = node_item->shape_inference_type;
  memcpy_s(aicpu_ext_info->infoMsg, sizeof(int32_t), &type, sizeof(int32_t));
  kernel_def->set_kernel_ext_info(ext_mem.data(), ext_info_size);
  kernel_def->set_kernel_ext_info_size(ext_info_size);

  // Two task defs are registered for the node.
  // NOTE(review): presumably the second one serves as the memcpy task - confirm.
  hybrid_model.task_defs_[node] = std::vector<domi::TaskDef>({task_def, task_def});

  AicpuNodeTask aicpu_node_task(node_item, task_def);
  // Owned by the test and handed to both calls under test; it must be an object,
  // since a reference cannot be declared without an initializer.
  std::vector<std::unique_ptr<TensorBuffer>> out_shape_hbm;
  ASSERT_EQ(aicpu_node_task.Init(hybrid_model), SUCCESS);

  // Seed every output summary with one byte of shape data and raw data and null
  // device pointers before asking the task to prepare memory and copy.
  for (int i = 0; i < node_item->num_outputs; i++) {
    aicpu_node_task.output_summary_[i].shape_data_size = 1;
    aicpu_node_task.output_summary_[i].raw_data_size = 1;
    aicpu_node_task.output_summary_[i].shape_data_ptr = 0;
    aicpu_node_task.output_summary_[i].raw_data_ptr = 0;
  }

  ASSERT_EQ(aicpu_node_task.ReadResultSummaryAndPrepareMemory(*node_state->GetTaskContext(), out_shape_hbm), SUCCESS);
  ASSERT_EQ(aicpu_node_task.CopyDataToHbm(*node_state->GetTaskContext(), out_shape_hbm), SUCCESS);
}
|
|
|
|
|
|
|
|
TEST_F(UtestAicpuNodeExecutor, aicpu_blocking_node_task) {
|
|
|
|
ComputeGraphPtr graph = std::make_shared<ComputeGraph>("test");
|
|
|
|
GeRootModelPtr ge_root_model = std::make_shared<GeRootModel>(graph);
|
|
|
|