| @@ -210,6 +210,85 @@ TEST_F(UtestAicpuNodeExecutor, aicpu_memcopy_task) { | |||||
| ASSERT_EQ(aicpu_node_task2.SetMemCopyTask(task_def), FAILED); | ASSERT_EQ(aicpu_node_task2.SetMemCopyTask(task_def), FAILED); | ||||
| } | } | ||||
| TEST_F(UtestAicpuNodeExecutor, aicpu_copy_data_to_hbm) { | |||||
| ComputeGraphPtr graph = std::make_shared<ComputeGraph>("test"); | |||||
| GeModelPtr ge_sub_model = std::make_shared<GeModel>(); | |||||
| GeRootModelPtr ge_root_model = std::make_shared<GeRootModel>(graph); | |||||
| ge_root_model->SetModelName("test_name"); | |||||
| ge_root_model->SetSubgraphInstanceNameToModel("sub", ge_sub_model); | |||||
| HybridModel hybrid_model(ge_root_model); | |||||
| NodePtr node = CreateNode(graph, "frameworkop", FRAMEWORK_OP_TYPE, 4, 2); | |||||
| std::unique_ptr<NodeItem> new_node; | |||||
| ASSERT_EQ(NodeItem::Create(node, new_node), SUCCESS); | |||||
| NodeItem *node_item = new_node.get(); | |||||
| hybrid_model.node_items_[node] = std::move(new_node); | |||||
| node_item->input_start = 0; | |||||
| node_item->output_start = 0; | |||||
| node_item->is_dynamic = true; | |||||
| node_item->shape_inference_type = DEPEND_COMPUTE; | |||||
| node_item->num_outputs = 2; | |||||
| GraphItem graph_item; | |||||
| graph_item.node_items_.emplace_back(node_item); | |||||
| graph_item.total_inputs_ = 4; | |||||
| graph_item.total_outputs_ = 2; | |||||
| GraphExecutionContext graph_context; | |||||
| SubgraphContext subgraph_context(&graph_item, &graph_context); | |||||
| ASSERT_EQ(subgraph_context.Init(), SUCCESS); | |||||
| graph_context.callback_manager = std::unique_ptr<CallbackManager>(new CallbackManager()); | |||||
| auto node_state = subgraph_context.GetOrCreateNodeState(node_item); | |||||
| ASSERT_NE(node_state, nullptr); | |||||
| for (int i=0; i<4; ++i) { | |||||
| uint64_t value_0 = 512; | |||||
| TensorValue in_tensor0(&value_0, sizeof(value_0)); | |||||
| subgraph_context.SetInput(*node_item, 0, in_tensor0); | |||||
| } | |||||
| uint64_t value_0 = 512; | |||||
| TensorValue out_tensor0(&value_0, sizeof(value_0)); | |||||
| subgraph_context.SetOutput(*node_item, 0, out_tensor0); | |||||
| uint64_t value_1 = 512; | |||||
| TensorValue out_tensor1(&value_1, sizeof(value_1)); | |||||
| subgraph_context.SetOutput(*node_item, 1, out_tensor1); | |||||
| // task | |||||
| domi::TaskDef task_def; | |||||
| AicpuTaskStruct args; | |||||
| args.head.length = sizeof(args); | |||||
| args.head.ioAddrNum = 6; | |||||
| task_def.set_type(RT_MODEL_TASK_ALL_KERNEL); | |||||
| domi::KernelDef *kernel_def = task_def.mutable_kernel(); | |||||
| kernel_def->set_args(reinterpret_cast<const char *>(&args), args.head.length); | |||||
| kernel_def->set_args_size(args.head.length); | |||||
| AicpuExtInfo aicpu_ext_info; | |||||
| aicpu_ext_info.infoType = aicpu::FWKAdapter::FWK_ADPT_EXT_SHAPE_TYPE; | |||||
| aicpu_ext_info.infoLen = sizeof(int32_t); | |||||
| memcpy_s(aicpu_ext_info.infoMsg, sizeof(int32_t), &type, sizeof(int32_t)); | |||||
| char *ext_mem = (char*)malloc(sizeof(AicpuExtInfo) + sizeof(int32_t)); | |||||
| memcpy_s(ext_mem, sizeof(AicpuExtInfo) + sizeof(int32_t), &aicpu_ext_info2, sizeof(AicpuExtInfo) + sizeof(int32_t)); | |||||
| kernel_def->set_kernel_ext_info(ext_mem, sizeof(AicpuExtInfo) + sizeof(int32_t)); | |||||
| kernel_def->set_kernel_ext_info_size(sizeof(AicpuExtInfo) + sizeof(int32_t)); | |||||
| hybrid_model.task_defs_[node] = std::vector<domi::TaskDef>({task_def, task_def}); | |||||
| AicpuNodeTask aicpu_node_task(node_item, task_def); | |||||
| std::vector<std::unique_ptr<TensorBuffer>> &out_shape_hbm; | |||||
| ASSERT_EQ(aicpu_node_task.Init(hybrid_model), SUCCESS); | |||||
| for (int i = 0; i < node_item->num_outputs; i++) { | |||||
| aicpu_node_task.output_summary_[i].shape_data_size = 1; | |||||
| aicpu_node_task.output_summary_[i].raw_data_size = 1; | |||||
| aicpu_node_task.output_summary_[i].shape_data_ptr = 0; | |||||
| aicpu_node_task.output_summary_[i].raw_data_ptr = 0; | |||||
| } | |||||
| ASSERT_EQ(aicpu_node_task.ReadResultSummaryAndPrepareMemory(*node_state->GetTaskContext(), out_shape_hbm), SUCCESS); | |||||
| ASSERT_EQ(aicpu_node_task.CopyDataToHbm(*node_state->GetTaskContext(), out_shape_hbm), SUCCESS); | |||||
| free(ext_mem); | |||||
| } | |||||
| TEST_F(UtestAicpuNodeExecutor, aicpu_blocking_node_task) { | TEST_F(UtestAicpuNodeExecutor, aicpu_blocking_node_task) { | ||||
| ComputeGraphPtr graph = std::make_shared<ComputeGraph>("test"); | ComputeGraphPtr graph = std::make_shared<ComputeGraph>("test"); | ||||
| GeRootModelPtr ge_root_model = std::make_shared<GeRootModel>(graph); | GeRootModelPtr ge_root_model = std::make_shared<GeRootModel>(graph); | ||||