You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

aicpu_ext_info.cc 10 kB

5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241
  1. /**
  2. * Copyright 2019-2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include "hybrid/node_executor/aicpu/aicpu_ext_info.h"
  17. #include "framework/common/util.h"
  18. #include "framework/common/fmk_error_codes.h"
  19. #include "framework/common/debug/log.h"
  20. namespace ge {
  21. namespace hybrid {
  namespace {
  // Sentinel stored right after the last valid dim when a shape has fewer than
  // kMaxShapeDims(8) dims; readers stop at the first slot holding this value.
  constexpr int64_t kDimEndFlag{INT64_MIN};
  }  // namespace
  26. Status AicpuExtInfoHandler::Parse(const std::string &ext_info) {
  27. GELOGI("Node[%s] parse ext info start.", node_name_.c_str());
  28. if (ext_info.empty()) {
  29. GELOGE(PARAM_INVALID, "Node[%s] parse ext info failed as ext info is empty.", node_name_.c_str());
  30. return PARAM_INVALID;
  31. }
  32. ext_info_len_ = ext_info.size();
  33. ext_info_.reset(new(std::nothrow)uint8_t[ext_info_len_]);
  34. GE_CHECK_NOTNULL(ext_info_);
  35. (void) memcpy_s(ext_info_.get(), ext_info_len_, ext_info.c_str(), ext_info.size());
  36. input_shape_and_type_.clear();
  37. output_shape_and_type_.clear();
  38. auto ext_info_data = ext_info_.get();
  39. size_t offset = 0;
  40. while (offset + sizeof(AicpuExtInfo) <= ext_info_len_) {
  41. auto aicpu_ext_info = reinterpret_cast<AicpuExtInfo *>(ext_info_data + offset);
  42. GELOGD("Ext infoType=%d, infoLen=%u.", aicpu_ext_info->infoType, aicpu_ext_info->infoLen);
  43. switch (aicpu_ext_info->infoType) {
  44. case aicpu::FWKAdapter::FWK_ADPT_EXT_SHAPE_TYPE:
  45. GE_CHK_STATUS_RET(ParseExtShapeType(aicpu_ext_info), "Parse ext shape type failed.");
  46. break;
  47. case aicpu::FWKAdapter::FWK_ADPT_EXT_INPUT_SHAPE:
  48. GE_CHK_STATUS_RET(ParseExtInputShape(aicpu_ext_info), "Parse ext input shape failed.");
  49. break;
  50. case aicpu::FWKAdapter::FWK_ADPT_EXT_OUTPUT_SHAPE:
  51. GE_CHK_STATUS_RET(ParseExtOutputShape(aicpu_ext_info), "Parse ext output shape failed.");
  52. break;
  53. case aicpu::FWKAdapter::FWK_ADPT_EXT_SESSION_INFO:
  54. GE_CHK_STATUS_RET(ParseExtSessionInfo(aicpu_ext_info), "Parse ext session info failed.");
  55. break;
  56. default:
  57. GELOGD("Node[%s] ignore infoType=%d, infoLen=%u.",
  58. node_name_.c_str(), aicpu_ext_info->infoType, aicpu_ext_info->infoLen);
  59. break;
  60. }
  61. offset += sizeof(AicpuExtInfo);
  62. offset += aicpu_ext_info->infoLen;
  63. }
  64. GE_CHK_BOOL_RET_STATUS(offset == ext_info_len_, PARAM_INVALID,
  65. "Node[%s] ext_info format error, parse not reach end, offset=%zu, ext_info_len=%zu.",
  66. node_name_.c_str(), offset, ext_info_len_);
  67. GELOGI("Node[%s] parse ext info end.", node_name_.c_str());
  68. return SUCCESS;
  69. }
  70. Status AicpuExtInfoHandler::ParseExtShapeType(AicpuExtInfo *aicpu_ext_info) {
  71. GE_CHK_BOOL_RET_STATUS(aicpu_ext_info->infoLen == sizeof(int32_t), PARAM_INVALID,
  72. "Node[%s] parse ext shape type failed as infoLen must be %zu but %u.",
  73. node_name_.c_str(), sizeof(int32_t), aicpu_ext_info->infoLen);
  74. auto type = reinterpret_cast<const int32_t *>(aicpu_ext_info->infoMsg);
  75. GE_CHK_BOOL_RET_STATUS(*type == unknown_type_, PARAM_INVALID,
  76. "Node[%s] parse ext shape type failed as need %d but %d.",
  77. node_name_.c_str(), unknown_type_, *type);
  78. GELOGI("Node[%s] parse ext shape type success infoLen=%u.", node_name_.c_str(), aicpu_ext_info->infoLen);
  79. return SUCCESS;
  80. }
  81. Status AicpuExtInfoHandler::ParseExtInputShape(AicpuExtInfo *aicpu_ext_info) {
  82. auto need_len = input_num_ * sizeof(AicpuShapeAndType);
  83. GE_CHK_BOOL_RET_STATUS(aicpu_ext_info->infoLen == need_len, PARAM_INVALID,
  84. "Node[%s] parse ext input shape failed as infoLen must be "
  85. "input_num[%zu]*sizeof(ShapeAndType)[%zu] but %u.",
  86. node_name_.c_str(), input_num_, sizeof(AicpuShapeAndType), aicpu_ext_info->infoLen);
  87. auto input = reinterpret_cast<AicpuShapeAndType *>(aicpu_ext_info->infoMsg);
  88. for (uint32_t index = 0; index < input_num_; ++index) {
  89. input_shape_and_type_.emplace_back(&input[index]);
  90. }
  91. GELOGI("Node[%s] parse ext input shape success infoLen=%u.", node_name_.c_str(), aicpu_ext_info->infoLen);
  92. return SUCCESS;
  93. }
  94. Status AicpuExtInfoHandler::ParseExtOutputShape(AicpuExtInfo *aicpu_ext_info) {
  95. if (unknown_type_ == DEPEND_COMPUTE) {
  96. GELOGD("Node[%s] is depend compute type no need ext output shape, ignore it, infoLen=%u.",
  97. node_name_.c_str(), aicpu_ext_info->infoLen);
  98. return SUCCESS;
  99. }
  100. auto need_len = output_num_ * sizeof(AicpuShapeAndType);
  101. GE_CHK_BOOL_RET_STATUS(aicpu_ext_info->infoLen == need_len, PARAM_INVALID,
  102. "Node[%s] parse ext output shape failed as infoLen must be "
  103. "output_num[%zu]*sizeof(ShapeAndType)[%zu] but %u.",
  104. node_name_.c_str(), output_num_, sizeof(AicpuShapeAndType), aicpu_ext_info->infoLen);
  105. auto output = reinterpret_cast<AicpuShapeAndType *>(aicpu_ext_info->infoMsg);
  106. for (uint32_t index = 0; index < output_num_; ++index) {
  107. output_shape_and_type_.emplace_back(&output[index]);
  108. }
  109. GELOGI("Node[%s] parse ext output shape success infoLen=%u.", node_name_.c_str(), aicpu_ext_info->infoLen);
  110. return SUCCESS;
  111. }
  112. Status AicpuExtInfoHandler::ParseExtSessionInfo(AicpuExtInfo *aicpu_ext_info) {
  113. GE_CHK_BOOL_RET_STATUS(aicpu_ext_info->infoLen == sizeof(AicpuSessionInfo), PARAM_INVALID,
  114. "Node[%s] parse ext session info failed as infoLen must be %zu but %u.",
  115. node_name_.c_str(), sizeof(SessionInfo), aicpu_ext_info->infoLen);
  116. session_info_ = reinterpret_cast<AicpuSessionInfo *>(aicpu_ext_info->infoMsg);
  117. GELOGI("Node[%s] parse session info success infoLen=%u.", node_name_.c_str(), aicpu_ext_info->infoLen);
  118. return SUCCESS;
  119. }
  120. Status AicpuExtInfoHandler::UpdateSessionInfo(uint64_t session_id, uint64_t kernel_id, bool sess_flag) {
  121. if (session_info_ == nullptr) {
  122. GELOGD("There is no session info in ext_info, no need update.");
  123. return SUCCESS;
  124. }
  125. session_info_->sessionId = session_id;
  126. session_info_->kernelId = kernel_id;
  127. session_info_->sessFlag = sess_flag;
  128. return SUCCESS;
  129. }
  130. Status AicpuExtInfoHandler::UpdateSessionInfoSessionId(uint64_t session_id) {
  131. if (session_info_ == nullptr) {
  132. GELOGD("There is no session info in ext_info, no need update.");
  133. return SUCCESS;
  134. }
  135. session_info_->sessionId = session_id;
  136. session_info_->sessFlag = true;
  137. return SUCCESS;
  138. }
  139. Status AicpuExtInfoHandler::UpdateInputShapeAndType(uint32_t input_index, const GeTensorDesc &input_desc) {
  140. GE_CHECK_LE(input_index, input_num_);
  141. const auto &shape = input_desc.GetShape();
  142. GE_CHK_STATUS_RET(UpdateShapeAndType(shape, input_desc.GetDataType(), input_shape_and_type_[input_index]),
  143. "Node[%s] input[%u] update input shape and type failed.",
  144. node_name_.c_str(), input_index);
  145. return SUCCESS;
  146. }
  147. Status AicpuExtInfoHandler::UpdateOutputShapeAndType(uint32_t output_index, const GeTensorDesc &output_desc) {
  148. GE_CHK_BOOL_RET_STATUS((unknown_type_ != DEPEND_COMPUTE), INTERNAL_ERROR,
  149. "Node[%s] is depend compute is no need update output shape and type by ext.",
  150. node_name_.c_str());
  151. GE_CHECK_LE(output_index, output_num_);
  152. auto shape = output_desc.GetShape();
  153. // shape range need use range update shape
  154. if (unknown_type_ == DEPEND_SHAPE_RANGE) {
  155. std::vector<std::pair<int64_t, int64_t>> range;
  156. auto range_ret = output_desc.GetShapeRange(range);
  157. GE_CHK_BOOL_RET_STATUS(range_ret == GRAPH_SUCCESS, INTERNAL_ERROR,
  158. "Node[%s] is shape range type but get GetShapeRange failed, ret=%u.",
  159. node_name_.c_str(), range_ret);
  160. for (size_t k = 0; k < range.size(); ++k) {
  161. if (shape.GetDim(k) < 0 && k < range.size()) {
  162. GELOGD("Node[%s] output[%u] update dim[%zu] from %ld to range max %ld.",
  163. node_name_.c_str(), output_index, k, shape.GetDim(k), range[k].second);
  164. shape.SetDim(k, range[k].second);
  165. }
  166. }
  167. }
  168. return UpdateShapeAndType(shape, output_desc.GetDataType(), output_shape_and_type_[output_index]);
  169. }
  170. Status AicpuExtInfoHandler::GetOutputShapeAndType(uint32_t output_index, GeShape &shape, DataType &data_type) {
  171. GE_CHK_BOOL_RET_STATUS((unknown_type_ != DEPEND_COMPUTE), INTERNAL_ERROR,
  172. "Node[%s] is depend compute type can not get output shape and type by ext.",
  173. node_name_.c_str());
  174. GetShapeAndType(output_shape_and_type_[output_index], shape, data_type);
  175. return SUCCESS;
  176. }
  177. Status AicpuExtInfoHandler::UpdateShapeAndType(const GeShape &shape, DataType data_type,
  178. AicpuShapeAndType *shape_and_type) {
  179. auto dim_num = shape.GetDimNum();
  180. if (dim_num > aicpu::FWKAdapter::kMaxShapeDims) {
  181. GELOGE(PARAM_INVALID, "Update shape and type failed, as dim_num %zu is over max shape dims %u.",
  182. dim_num, aicpu::FWKAdapter::kMaxShapeDims);
  183. return PARAM_INVALID;
  184. }
  185. size_t index = 0;
  186. for (; index < dim_num; ++index) {
  187. shape_and_type->dims[index] = shape.GetDim(index);
  188. }
  189. if (index < aicpu::FWKAdapter::kMaxShapeDims) {
  190. shape_and_type->dims[index] = kDimEndFlag;
  191. }
  192. // now only support update shape, type is not support
  193. return SUCCESS;
  194. }
  195. void AicpuExtInfoHandler::GetShapeAndType(const AicpuShapeAndType *shape_and_type,
  196. GeShape &shape,
  197. DataType &data_type) {
  198. std::vector<int64_t> dims;
  199. for (uint32_t index = 0; index < aicpu::FWKAdapter::kMaxShapeDims; ++index) {
  200. auto tmpDim = shape_and_type->dims[index];
  201. if (tmpDim == kDimEndFlag) {
  202. break;
  203. }
  204. dims.emplace_back(tmpDim);
  205. }
  206. data_type = static_cast<DataType>(shape_and_type->type);
  207. shape = GeShape(dims);
  208. }
  209. } // namespace hybrid
  210. } // namespace ge

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用而用户并不感知。GE主要由GE API和GE Core两部分组成,详细的架构图如下所示。