You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

hybrid_davinci_model.cc 7.1 kB

5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226
  1. /**
  2. * Copyright 2019-2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include <memory>
  17. #include "hybrid_davinci_model.h"
  18. #include "hybrid/model/hybrid_model.h"
  19. #include "hybrid/executor/hybrid_model_async_executor.h"
  20. #include "hybrid/node_executor/node_executor.h"
  21. namespace ge {
  22. namespace hybrid {
  23. class HybridDavinciModel::Impl {
  24. public:
  25. explicit Impl(GeRootModelPtr ge_model) : model_(std::move(ge_model)), executor_(&model_) {
  26. }
  27. ~Impl() {
  28. NodeExecutorManager::GetInstance().FinalizeExecutors();
  29. }
  30. Status Init() {
  31. GE_CHK_STATUS_RET(NodeExecutorManager::GetInstance().EnsureInitialized(), "Failed to initialize executors");
  32. GE_CHK_STATUS_RET(model_.Init(), "Failed to init model.")
  33. GE_CHK_STATUS_RET(executor_.Init(), "Failed to init model executor.")
  34. return SUCCESS;
  35. }
  36. Status Execute(const std::vector<DataBuffer> &inputs,
  37. const std::vector<GeTensorDesc> &input_desc,
  38. std::vector<DataBuffer> &outputs,
  39. std::vector<GeTensorDesc> &output_desc,
  40. rtStream_t stream) {
  41. return executor_.Execute(inputs, input_desc, outputs, output_desc);
  42. }
  43. Status Execute(const vector<GeTensor> &inputs, vector<GeTensor> &outputs) {
  44. return executor_.Execute(inputs, outputs);
  45. }
  46. Status ModelRunStart() {
  47. return executor_.Start(listener_);
  48. }
  49. Status ModelRunStop() {
  50. return executor_.Stop();
  51. }
  52. Status EnqueueData(const std::shared_ptr<InputDataWrapper> &data) {
  53. return executor_.EnqueueData(data);
  54. }
  55. void SetListener(const shared_ptr<ModelListener> &listener) {
  56. listener_ = listener;
  57. }
  58. void SetModelId(uint32_t model_id) {
  59. executor_.SetModelId(model_id);
  60. model_.SetModelId(model_id);
  61. }
  62. void SetDeviceId(uint32_t device_id) {
  63. model_.SetDeviceId(device_id);
  64. executor_.SetDeviceId(device_id);
  65. }
  66. void SetModelName(const string &model_name) {
  67. model_.SetModelName(model_name);
  68. executor_.SetModelName(model_name);
  69. }
  70. uint64_t GetSessionId() {
  71. return model_.GetSessionId();
  72. }
  73. Status GetDynamicBatchInfo(std::vector<std::vector<int64_t>> &batch_info, int32_t &dynamic_type) {
  74. return model_.GetDynamicBatchInfo(batch_info, dynamic_type);
  75. }
  76. void GetUserDesignateShapeOrder(std::vector<std::string> &user_input_shape_order) {
  77. model_.GetUserDesignateShapeOrder(user_input_shape_order);
  78. }
  79. void GetModelAttr(std::vector<std::string> &dynamic_output_shape_info) {
  80. model_.GetModelAttr(dynamic_output_shape_info);
  81. }
  82. Status GetInputOutputDescInfo(vector<InputOutputDescInfo> &input_desc,
  83. vector<InputOutputDescInfo> &output_desc,
  84. std::vector<uint32_t> &input_formats,
  85. std::vector<uint32_t> &output_formats) {
  86. return model_.GetInputOutputDescInfo(input_desc, output_desc, input_formats, output_formats);
  87. }
  88. void SetModelDescVersion(bool is_new_model_desc) {
  89. model_.SetModelDescVersion(is_new_model_desc);
  90. }
  91. private:
  92. std::shared_ptr<ModelListener> listener_;
  93. HybridModel model_;
  94. HybridModelAsyncExecutor executor_;
  95. };
  96. HybridDavinciModel::~HybridDavinciModel() {
  97. delete impl_;
  98. }
  99. std::unique_ptr<HybridDavinciModel> HybridDavinciModel::Create(const GeRootModelPtr &ge_root_model) {
  100. auto instance = std::unique_ptr<HybridDavinciModel>(new (std::nothrow)HybridDavinciModel());
  101. if (instance != nullptr) {
  102. instance->impl_ = new (std::nothrow) HybridDavinciModel::Impl(ge_root_model);
  103. if (instance->impl_ != nullptr) {
  104. return instance;
  105. }
  106. }
  107. return nullptr;
  108. }
  109. Status HybridDavinciModel::Init() {
  110. GE_CHECK_NOTNULL(impl_);
  111. return impl_->Init();
  112. }
  113. Status HybridDavinciModel::Execute(const std::vector<DataBuffer> &inputs,
  114. const std::vector<GeTensorDesc> &input_desc,
  115. std::vector<DataBuffer> &outputs,
  116. std::vector<GeTensorDesc> &output_desc, rtStream_t stream) {
  117. GE_CHECK_NOTNULL(impl_);
  118. return impl_->Execute(inputs, input_desc, outputs, output_desc, stream);
  119. }
  120. Status HybridDavinciModel::Execute(const vector<GeTensor> &inputs, vector<GeTensor> &outputs) {
  121. GE_CHECK_NOTNULL(impl_);
  122. return impl_->Execute(inputs, outputs);
  123. }
  124. Status HybridDavinciModel::ModelRunStart() {
  125. GE_CHECK_NOTNULL(impl_);
  126. return impl_->ModelRunStart();
  127. }
  128. Status HybridDavinciModel::ModelRunStop() {
  129. GE_CHECK_NOTNULL(impl_);
  130. return impl_->ModelRunStop();
  131. }
  132. Status HybridDavinciModel::EnqueueData(const shared_ptr<InputDataWrapper> &data) {
  133. GE_CHECK_NOTNULL(impl_);
  134. return impl_->EnqueueData(data);
  135. }
  136. void HybridDavinciModel::SetListener(const shared_ptr<ModelListener> &listener) {
  137. if (impl_ != nullptr) {
  138. impl_->SetListener(listener);
  139. }
  140. }
  141. void HybridDavinciModel::SetModelId(uint32_t model_id) {
  142. if (impl_ != nullptr) {
  143. impl_->SetModelId(model_id);
  144. }
  145. }
  146. void HybridDavinciModel::SetDeviceId(uint32_t device_id) {
  147. if (impl_ != nullptr) {
  148. impl_->SetDeviceId(device_id);
  149. }
  150. }
  151. void HybridDavinciModel::SetModelName(const string &model_name) {
  152. if (impl_ != nullptr) {
  153. impl_->SetModelName(model_name);
  154. }
  155. }
  156. Status HybridDavinciModel::GetDynamicBatchInfo(std::vector<std::vector<int64_t>> &batch_info, int32_t &dynamic_type) {
  157. GE_CHECK_NOTNULL(impl_);
  158. return impl_->GetDynamicBatchInfo(batch_info, dynamic_type);
  159. }
  160. void HybridDavinciModel::GetUserDesignateShapeOrder(std::vector<std::string> &user_input_shape_order) {
  161. if (impl_ != nullptr) {
  162. impl_->GetUserDesignateShapeOrder(user_input_shape_order);
  163. }
  164. }
  165. void HybridDavinciModel::GetModelAttr(std::vector<std::string> &dynamic_output_shape_info) {
  166. if (impl_ != nullptr) {
  167. impl_->GetModelAttr(dynamic_output_shape_info);
  168. }
  169. }
  170. Status HybridDavinciModel::GetInputOutputDescInfo(vector<InputOutputDescInfo> &input_desc,
  171. vector<InputOutputDescInfo> &output_desc,
  172. std::vector<uint32_t> &input_formats,
  173. std::vector<uint32_t> &output_formats) {
  174. GE_CHECK_NOTNULL(impl_);
  175. return impl_->GetInputOutputDescInfo(input_desc, output_desc, input_formats, output_formats);
  176. }
  177. void HybridDavinciModel::SetModelDescVersion(bool is_new_model_desc) {
  178. if (impl_ != nullptr) {
  179. impl_->SetModelDescVersion(is_new_model_desc);
  180. }
  181. }
  182. uint64_t HybridDavinciModel::GetSessionId() {
  183. GE_CHECK_NOTNULL(impl_);
  184. return impl_->GetSessionId();
  185. }
  186. } // namespace hybrid
  187. } // namespace ge

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用而用户并不感知。GE主要由GE API和GE Core两部分组成,详细的架构图如下所示