You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

hybrid_davinci_model.cc 7.0 kB

5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
4 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225
  1. /**
  2. * Copyright 2019-2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include <memory>
  17. #include "hybrid_davinci_model.h"
  18. #include "hybrid/model/hybrid_model.h"
  19. #include "hybrid/executor/hybrid_model_async_executor.h"
  20. #include "hybrid/node_executor/node_executor.h"
  21. namespace ge {
  22. namespace hybrid {
  23. class HybridDavinciModel::Impl {
  24. public:
  25. explicit Impl(GeRootModelPtr ge_model) : model_(std::move(ge_model)), executor_(&model_) {
  26. }
  27. ~Impl() {
  28. NodeExecutorManager::GetInstance().FinalizeExecutors();
  29. }
  30. Status Init() {
  31. GE_CHK_STATUS_RET(NodeExecutorManager::GetInstance().EnsureInitialized(), "Failed to initialize executors");
  32. GE_CHK_STATUS_RET(model_.Init(), "Failed to init model.")
  33. GE_CHK_STATUS_RET(executor_.Init(), "Failed to init model executor.")
  34. return SUCCESS;
  35. }
  36. Status Execute(const std::vector<DataBuffer> &inputs,
  37. const std::vector<GeTensorDesc> &input_desc,
  38. std::vector<DataBuffer> &outputs,
  39. std::vector<GeTensorDesc> &output_desc,
  40. rtStream_t stream) {
  41. return executor_.Execute(inputs, input_desc, outputs, output_desc);
  42. }
  43. Status Execute(const vector<GeTensor> &inputs, vector<GeTensor> &outputs) {
  44. return executor_.Execute(inputs, outputs);
  45. }
  46. Status ModelRunStart() {
  47. return executor_.Start(listener_);
  48. }
  49. Status ModelRunStop() {
  50. return executor_.Stop();
  51. }
  52. Status EnqueueData(const std::shared_ptr<InputDataWrapper> &data) {
  53. return executor_.EnqueueData(data);
  54. }
  55. void SetListener(const shared_ptr<ModelListener> &listener) {
  56. listener_ = listener;
  57. }
  58. void SetModelId(uint32_t model_id) {
  59. executor_.SetModelId(model_id);
  60. model_.SetModelId(model_id);
  61. }
  62. void SetDeviceId(uint32_t device_id) {
  63. model_.SetDeviceId(device_id);
  64. executor_.SetDeviceId(device_id);
  65. }
  66. void SetOmName(const string &model_name) {
  67. model_.SetOmName(model_name);
  68. }
  69. uint64_t GetSessionId() {
  70. return model_.GetSessionId();
  71. }
  72. Status GetDynamicBatchInfo(std::vector<std::vector<int64_t>> &batch_info, int32_t &dynamic_type) {
  73. return model_.GetDynamicBatchInfo(batch_info, dynamic_type);
  74. }
  75. void GetUserDesignateShapeOrder(std::vector<std::string> &user_input_shape_order) {
  76. model_.GetUserDesignateShapeOrder(user_input_shape_order);
  77. }
  78. void GetModelAttr(std::vector<std::string> &dynamic_output_shape_info) {
  79. model_.GetModelAttr(dynamic_output_shape_info);
  80. }
  81. Status GetInputOutputDescInfo(vector<InputOutputDescInfo> &input_desc,
  82. vector<InputOutputDescInfo> &output_desc,
  83. std::vector<uint32_t> &input_formats,
  84. std::vector<uint32_t> &output_formats) {
  85. return model_.GetInputOutputDescInfo(input_desc, output_desc, input_formats, output_formats);
  86. }
  87. void SetModelDescVersion(bool is_new_model_desc) {
  88. model_.SetModelDescVersion(is_new_model_desc);
  89. }
  90. private:
  91. std::shared_ptr<ModelListener> listener_;
  92. HybridModel model_;
  93. HybridModelAsyncExecutor executor_;
  94. };
  95. HybridDavinciModel::~HybridDavinciModel() {
  96. delete impl_;
  97. }
  98. std::unique_ptr<HybridDavinciModel> HybridDavinciModel::Create(const GeRootModelPtr &ge_root_model) {
  99. auto instance = std::unique_ptr<HybridDavinciModel>(new (std::nothrow)HybridDavinciModel());
  100. if (instance != nullptr) {
  101. instance->impl_ = new (std::nothrow) HybridDavinciModel::Impl(ge_root_model);
  102. if (instance->impl_ != nullptr) {
  103. return instance;
  104. }
  105. }
  106. return nullptr;
  107. }
  108. Status HybridDavinciModel::Init() {
  109. GE_CHECK_NOTNULL(impl_);
  110. return impl_->Init();
  111. }
  112. Status HybridDavinciModel::Execute(const std::vector<DataBuffer> &inputs,
  113. const std::vector<GeTensorDesc> &input_desc,
  114. std::vector<DataBuffer> &outputs,
  115. std::vector<GeTensorDesc> &output_desc, rtStream_t stream) {
  116. GE_CHECK_NOTNULL(impl_);
  117. return impl_->Execute(inputs, input_desc, outputs, output_desc, stream);
  118. }
  119. Status HybridDavinciModel::Execute(const vector<GeTensor> &inputs, vector<GeTensor> &outputs) {
  120. GE_CHECK_NOTNULL(impl_);
  121. return impl_->Execute(inputs, outputs);
  122. }
  123. Status HybridDavinciModel::ModelRunStart() {
  124. GE_CHECK_NOTNULL(impl_);
  125. return impl_->ModelRunStart();
  126. }
  127. Status HybridDavinciModel::ModelRunStop() {
  128. GE_CHECK_NOTNULL(impl_);
  129. return impl_->ModelRunStop();
  130. }
  131. Status HybridDavinciModel::EnqueueData(const shared_ptr<InputDataWrapper> &data) {
  132. GE_CHECK_NOTNULL(impl_);
  133. return impl_->EnqueueData(data);
  134. }
  135. void HybridDavinciModel::SetListener(const shared_ptr<ModelListener> &listener) {
  136. if (impl_ != nullptr) {
  137. impl_->SetListener(listener);
  138. }
  139. }
  140. void HybridDavinciModel::SetModelId(uint32_t model_id) {
  141. if (impl_ != nullptr) {
  142. impl_->SetModelId(model_id);
  143. }
  144. }
  145. void HybridDavinciModel::SetDeviceId(uint32_t device_id) {
  146. if (impl_ != nullptr) {
  147. impl_->SetDeviceId(device_id);
  148. }
  149. }
  150. void HybridDavinciModel::SetOmName(const string &om_name) {
  151. if (impl_ != nullptr) {
  152. impl_->SetOmName(om_name);
  153. }
  154. }
  155. Status HybridDavinciModel::GetDynamicBatchInfo(std::vector<std::vector<int64_t>> &batch_info, int32_t &dynamic_type) {
  156. GE_CHECK_NOTNULL(impl_);
  157. return impl_->GetDynamicBatchInfo(batch_info, dynamic_type);
  158. }
  159. void HybridDavinciModel::GetUserDesignateShapeOrder(std::vector<std::string> &user_input_shape_order) {
  160. if (impl_ != nullptr) {
  161. impl_->GetUserDesignateShapeOrder(user_input_shape_order);
  162. }
  163. }
  164. void HybridDavinciModel::GetModelAttr(std::vector<std::string> &dynamic_output_shape_info) {
  165. if (impl_ != nullptr) {
  166. impl_->GetModelAttr(dynamic_output_shape_info);
  167. }
  168. }
  169. Status HybridDavinciModel::GetInputOutputDescInfo(vector<InputOutputDescInfo> &input_desc,
  170. vector<InputOutputDescInfo> &output_desc,
  171. std::vector<uint32_t> &input_formats,
  172. std::vector<uint32_t> &output_formats) {
  173. GE_CHECK_NOTNULL(impl_);
  174. return impl_->GetInputOutputDescInfo(input_desc, output_desc, input_formats, output_formats);
  175. }
  176. void HybridDavinciModel::SetModelDescVersion(bool is_new_model_desc) {
  177. if (impl_ != nullptr) {
  178. impl_->SetModelDescVersion(is_new_model_desc);
  179. }
  180. }
  181. uint64_t HybridDavinciModel::GetSessionId() {
  182. GE_CHECK_NOTNULL(impl_);
  183. return impl_->GetSessionId();
  184. }
  185. } // namespace hybrid
  186. } // namespace ge

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用而用户并不感知。GE主要由GE API和GE Core两部分组成,详细的架构图如下所示