You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number; they can include dashes ('-') and can be up to 35 characters long.

hybrid_execution_context.cc 2.9 kB

4 years ago
4 years ago
4 years ago
4 years ago
12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091
  1. /**
  2. * Copyright 2019-2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include "hybrid_execution_context.h"
  17. #include <atomic>
  18. namespace ge {
  19. namespace hybrid {
  namespace {
  // Return codes of rtStreamSynchronize that Synchronize() maps to END_OF_SEQUENCE.
  // Two numeric values are accepted; the "New" suffix presumably marks a newer
  // runtime error numbering -- TODO confirm against the runtime headers.
  constexpr uint32_t kEndOfSequence = 0x0704000aU;
  constexpr uint32_t kEndOfSequenceNew = 507005U;

  // Return codes of rtStreamSynchronize that Synchronize() treats as a normal
  // model abort and therefore reports as SUCCESS.
  constexpr int32_t kModelAbortNormal = 0x0704000e;
  constexpr int32_t kModelAbortNormalNew = 507024;

  // File-local counter read and advanced by the GraphExecutionContext
  // constructor to obtain a context_id; starts at zero.
  std::atomic<unsigned long> context_id_gen{0UL};
  }  // namespace
  27. long GraphExecutionContext::profiling_level = 0;
  28. GraphExecutionContext::GraphExecutionContext() {
  29. context_id = context_id_gen++;
  30. }
  31. void GraphExecutionContext::SetErrorCode(Status error_code) {
  32. std::lock_guard<std::mutex> lk(mu);
  33. this->status = error_code;
  34. }
  35. Status GraphExecutionContext::GetStatus() const {
  36. std::lock_guard<std::mutex> lk(mu);
  37. return this->status;
  38. }
  39. Status GraphExecutionContext::Synchronize(rtStream_t rt_stream) {
  40. auto rt_ret = rtStreamSynchronize(rt_stream);
  41. if (rt_ret == RT_ERROR_NONE) {
  42. return SUCCESS;
  43. }
  44. if (rt_ret == kEndOfSequence || rt_ret == kEndOfSequenceNew) {
  45. GELOGI("Got end of sequence");
  46. is_eos_ = true;
  47. return END_OF_SEQUENCE;
  48. }
  49. if (rt_ret == kModelAbortNormal || rt_ret == kModelAbortNormalNew) {
  50. GELOGI("The model with multiple datasets aborts normally");
  51. return SUCCESS;
  52. }
  53. GELOGE(RT_FAILED, "[Invoke][rtStreamSynchronize] failed, ret = %d", rt_ret);
  54. REPORT_CALL_ERROR("E19999", "invoke rtStreamSynchronize failed, ret = %d", rt_ret);
  55. return RT_FAILED;
  56. }
  57. Status GraphExecutionContext::DumpExceptionInfo(const std::vector<rtExceptionInfo> &exception_infos) {
  58. if (exception_infos.empty()) {
  59. GELOGI("[Dump][ExceptionInfo] Exception info is null.");
  60. return SUCCESS;
  61. }
  62. GELOGI("[Dump][ExceptionInfo] Start to search dynamic op info and to dump.");
  63. if (exception_dumper.DumpExceptionInfo(exception_infos) != SUCCESS) {
  64. GELOGE(FAILED, "[Dump][Exception] Dump dynamic op exception info failed.");
  65. return FAILED;
  66. }
  67. GELOGI("[Dump][ExceptionInfo] Start to search static op info and to dump.");
  68. for (const auto &iter : davinci_model) {
  69. if (iter != nullptr) {
  70. if (iter->DumpExceptionInfo(exception_infos) != SUCCESS) {
  71. GELOGE(FAILED, "[Dump][ExceptionInfo] Dump static op exception info failed.");
  72. return FAILED;
  73. }
  74. }
  75. }
  76. return SUCCESS;
  77. }
  78. } // namespace hybrid
  79. } // namespace ge

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用而用户并不感知。GE主要由GE API和GE Core两部分组成,详细的架构图如下所示。