You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

data_dumper.h 6.3 kB

5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165
  1. /**
  2. * Copyright 2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #ifndef GE_GRAPH_LOAD_NEW_MODEL_MANAGER_DATA_DUMPER_H_
  17. #define GE_GRAPH_LOAD_NEW_MODEL_MANAGER_DATA_DUMPER_H_
  18. #include <map>
  19. #include <memory>
  20. #include <string>
  21. #include <vector>
  22. #include "framework/common/ge_inner_error_codes.h"
  23. #include "common/properties_manager.h"
  24. #include "graph/node.h"
  25. #include "graph/compute_graph.h"
  26. #include "proto/ge_ir.pb.h"
  27. #include "proto/op_mapping_info.pb.h"
  28. #include "runtime/mem.h"
  29. #include "task_info/task_info.h"
  30. #include "framework/common/ge_types.h"
  31. #include "runtime/base.h"
  32. namespace ge {
  33. class DataDumper {
  34. public:
  35. DataDumper() : runtime_param_{} {}
  36. explicit DataDumper(const RuntimeParam &rsh) : runtime_param_(rsh) {}
  37. ~DataDumper();
  38. void SetModelName(const std::string &model_name) { model_name_ = model_name; }
  39. void SetModelId(uint32_t model_id) { model_id_ = model_id; }
  40. void SetDeviceId(uint32_t device_id) { device_id_ = device_id; }
  41. void SetComputeGraph(const ComputeGraphPtr &compute_graph) { compute_graph_ = compute_graph; };
  42. void SetRefInfo(const std::map<OpDescPtr, void *> &ref_info) { ref_info_ = ref_info; };
  43. void SetL1FusionAddr(void *addr) { l1_fusion_addr_ = addr; };
  44. void SetLoopAddr(void *global_step, void *loop_per_iter, void *loop_cond);
  45. void SaveDumpInput(const std::shared_ptr<Node> &node);
  46. void SaveDumpOpInfo(const RuntimeParam &model_param, const OpDescPtr &op, uint32_t task_id, uint32_t stream_id);
  47. // args is device memory stored first output addr
  48. void SaveDumpTask(uint32_t task_id, uint32_t stream_id, const std::shared_ptr<OpDesc> &op_desc, uintptr_t args);
  49. void SaveEndGraphId(uint32_t task_id, uint32_t stream_id);
  50. void SetOmName(const std::string &om_name) { om_name_ = om_name; }
  51. void SaveOpDebugId(uint32_t task_id, uint32_t stream_id, void *op_debug_addr, bool is_op_debug);
  52. Status LoadDumpInfo();
  53. Status UnloadDumpInfo();
  54. void DumpShrink();
  55. void SetDumpProperties(const DumpProperties &dump_properties) { dump_properties_ = dump_properties; }
  56. const DumpProperties &GetDumpProperties() const { return dump_properties_; }
  57. bool GetOpDescInfo(uint32_t stream_id, uint32_t task_id, OpDescInfo &op_desc_info) const;
  58. const std::vector<OpDescInfo> &GetAllOpDescInfo() const { return op_desc_info_; }
  59. // Dump exception info
  60. Status DumpExceptionInput(const OpDescInfo &op_desc_info, const string &dump_file);
  61. Status DumpExceptionOutput(const OpDescInfo &op_desc_info, const string &dump_file);
  62. Status DumpExceptionInfo(const std::vector<rtExceptionInfo> exception_infos);
  63. private:
  64. void ReleaseDevMem(void **ptr) noexcept;
  65. void PrintCheckLog(string &dump_list_key);
  66. std::string model_name_;
  67. // for inference data dump
  68. std::string om_name_;
  69. uint32_t model_id_ = 0;
  70. const RuntimeParam &runtime_param_;
  71. void *dev_mem_load_ = nullptr;
  72. void *dev_mem_unload_ = nullptr;
  73. struct InnerDumpInfo;
  74. struct InnerInputMapping;
  75. std::vector<OpDescInfo> op_desc_info_;
  76. std::vector<InnerDumpInfo> op_list_; // release after DavinciModel::Init
  77. uint32_t end_graph_task_id_ = 0;
  78. uint32_t end_graph_stream_id_ = 0;
  79. bool is_end_graph_ = false;
  80. std::multimap<std::string, InnerInputMapping> input_map_; // release after DavinciModel::Init
  81. bool load_flag_ = false;
  82. uint32_t device_id_ = 0;
  83. uintptr_t global_step_ = 0;
  84. uintptr_t loop_per_iter_ = 0;
  85. uintptr_t loop_cond_ = 0;
  86. ComputeGraphPtr compute_graph_ = nullptr; // release after DavinciModel::Init
  87. std::map<OpDescPtr, void *> ref_info_; // release after DavinciModel::Init
  88. void *l1_fusion_addr_ = nullptr;
  89. uint32_t op_debug_task_id_ = 0;
  90. uint32_t op_debug_stream_id_ = 0;
  91. void *op_debug_addr_ = nullptr;
  92. bool is_op_debug_ = false;
  93. DumpProperties dump_properties_;
  94. // Build task info of op mapping info
  95. Status BuildTaskInfo(aicpu::dump::OpMappingInfo &op_mapping_info);
  96. Status DumpOutput(const InnerDumpInfo &inner_dump_info, aicpu::dump::Task &task);
  97. Status DumpRefOutput(const DataDumper::InnerDumpInfo &inner_dump_info, aicpu::dump::Output &output, size_t i,
  98. const std::string &node_name_index);
  99. Status DumpOutputWithTask(const InnerDumpInfo &inner_dump_info, aicpu::dump::Task &task);
  100. Status DumpInput(const InnerDumpInfo &inner_dump_info, aicpu::dump::Task &task);
  101. Status DumpRefInput(const DataDumper::InnerDumpInfo &inner_dump_info, aicpu::dump::Input &input, size_t i,
  102. const std::string &node_name_index);
  103. Status ExecuteLoadDumpInfo(aicpu::dump::OpMappingInfo &op_mapping_info);
  104. void SetEndGraphIdToAicpu(uint32_t task_id, uint32_t stream_id, aicpu::dump::OpMappingInfo &op_mapping_info);
  105. void SetOpDebugIdToAicpu(uint32_t task_id, uint32_t stream_id, void *op_debug_addr,
  106. aicpu::dump::OpMappingInfo &op_mapping_info);
  107. Status ExecuteUnLoadDumpInfo(aicpu::dump::OpMappingInfo &op_mapping_info);
  108. Status GenerateInput(aicpu::dump::Input &input, const OpDesc::Vistor<GeTensorDesc> &tensor_descs,
  109. const uintptr_t &addr, size_t index);
  110. Status GenerateOutput(aicpu::dump::Output &output, const OpDesc::Vistor<GeTensorDesc> &tensor_descs,
  111. const uintptr_t &addr, size_t index);
  112. void GenerateOpBuffer(const int64_t &size, aicpu::dump::Task &task);
  113. };
  114. struct DataDumper::InnerDumpInfo {
  115. uint32_t task_id;
  116. uint32_t stream_id;
  117. std::shared_ptr<OpDesc> op;
  118. uintptr_t args;
  119. bool is_task;
  120. int input_anchor_index;
  121. int output_anchor_index;
  122. std::vector<int64_t> dims;
  123. int64_t data_size;
  124. };
  125. struct DataDumper::InnerInputMapping {
  126. std::shared_ptr<OpDesc> data_op;
  127. int input_anchor_index;
  128. int output_anchor_index;
  129. };
  130. } // namespace ge
  131. #endif // GE_GRAPH_LOAD_NEW_MODEL_MANAGER_DATA_DUMPER_H_

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用而用户并不感知。GE主要由GE API和GE Core两部分组成,详细的架构图如下所示