You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

profiling_manager.h 5.4 kB

5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119
  1. /**
  2. * Copyright 2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #ifndef GE_COMMON_PROFILING_PROFILING_MANAGER_H_
  17. #define GE_COMMON_PROFILING_PROFILING_MANAGER_H_
  18. #include <nlohmann/json.hpp>
  19. #include <mutex>
  20. #include <map>
  21. #include <string>
  22. #include <vector>
  23. #include "framework/common/ge_inner_error_codes.h"
  24. #include "framework/common/ge_types.h"
  25. #include "external/register/register_types.h"
  26. #include "runtime/stream.h"
  27. #include "toolchain/prof_callback.h"
  28. #include "common/profiling/profiling_properties.h"
  29. using std::map;
  30. using std::string;
  31. using std::vector;
  32. using Json = nlohmann::json;
  33. namespace ge {
  34. class OpDesc;
  35. using OpDescPtr = std::shared_ptr<OpDesc>;
  // Per-device subscribe bookkeeping; used as the mapped value of
  // ProfilingManager::subs_dev_module_.
  //
  // Deliberately a plain aggregate with no default member initializers, so
  // brace initialization ({module, subscribe_count}) keeps working on every
  // language level. Members of a default-initialized automatic instance are
  // indeterminate until assigned.
  struct DeviceSubsInfo {
    // Presumably the bitmask of profiling modules enabled on the device -- confirm.
    uint64_t module;
    // Presumably the number of subscriptions currently held on the device -- confirm.
    uint32_t subscribe_count;
  };
  // Snapshot of the current subscribe request; stored in
  // ProfilingManager::subscribe_info_ and exposed through GetSubscribeInfo().
  //
  // Deliberately a plain aggregate with no default member initializers, so
  // brace initialization ({is_subscribe, prof_switch, graph_id}) keeps working
  // on every language level.
  struct ProfSubscribeInfo {
    // Whether a subscription is recorded.
    bool is_subscribe;
    // Profiling switch value associated with the subscription.
    uint64_t prof_switch;
    // NOTE(review): SetSubscribeInfo() names its id parameter `model_id` while
    // this field is `graph_id` -- confirm which id is stored here.
    uint32_t graph_id;
  };
  45. class ProfilingManager {
  46. public:
  47. ProfilingManager();
  48. virtual ~ProfilingManager();
  49. static ProfilingManager &Instance();
  50. Status ProfInit(uint64_t module);
  51. Status ProfFinalize();
  52. Status ProfStartProfiling(uint64_t module, const std::map<std::string, std::string> &config_para);
  53. Status ProfStopProfiling(uint64_t module, const std::map<std::string, std::string> &config_para);
  54. Status ProfModelSubscribe(uint64_t module, void *model);
  55. Status ProfModelUnsubscribe(void *model);
  56. // report model load profiling data flag, data contain task desc info, step info, model load fusion op info
  57. bool ProfilingModelLoadOn() const { return ProfilingProperties::Instance().IsLoadProfiling(); }
  58. // report model execute profiling data flag, data contain model execute time info
  59. bool ProfilingModelExecuteOn() const;
  60. // is_execute_profiling_ only used by ge option and env
  61. void ReportProfilingData(uint32_t model_id, const std::vector<TaskDescInfo> &task_desc_info);
  62. void ProfilingTaskDescInfo(uint32_t model_id, const std::vector<TaskDescInfo> &task_desc_info,
  63. const int32_t &device_id);
  64. void ProfilingOpInputOutInfo(const TaskDescInfo &task, Json &task_json);
  65. Status PluginInit();
  66. void PluginUnInit() const;
  67. Status CallMsprofReport(ReporterData &reporter_data) const;
  68. const MsprofReporterCallback GetMsprofReporterCallback() const { return reporter_callback_; }
  69. void SetMsprofReporterCallback(MsprofReporterCallback func) { reporter_callback_ = func; }
  70. void GetFpBpPoint(std::string &fp_point, std::string &bp_point);
  71. void GetOpInputOutputInfo(const OpDescPtr &op, TaskDescInfo &task_desc_info) const;
  72. void ReportData(const int32_t &device_id, const std::string &data, const std::string &tag_name);
  73. Status ProfileStepInfo(uint64_t index_id, uint64_t model_id, uint16_t tag_id, rtStream_t stream, int32_t device_id);
  74. void SetStepInfoIndex(uint64_t index_id) { index_id_ = index_id; }
  75. uint64_t GetStepInfoIndex() const { return index_id_; }
  76. void SetGraphIdToDeviceMap(uint32_t graph_id, uint32_t device_id) { device_id_map_[graph_id] = device_id; }
  77. Status GetDeviceIdFromGraph(uint32_t graph_id, uint32_t &device_id);
  78. void SetSubscribeInfo(uint64_t prof_switch, uint32_t model_id, bool is_subscribe);
  79. const ProfSubscribeInfo &GetSubscribeInfo() const { return subscribe_info_; }
  80. void CleanSubscribeInfo();
  81. void SetGraphIdToModelMap(uint32_t graph_id, uint32_t model_id) { model_id_map_[graph_id] = model_id; }
  82. Status GetModelIdFromGraph(uint32_t graph_id, uint32_t &model_id);
  83. const vector<int32_t> &GetDeviceID() const { return device_id_; }
  84. private:
  85. Status ProfParseParam(const std::map<std::string, std::string> &config_para, int32_t &device_num,
  86. vector<int32_t> &device_list);
  87. Status ProfParseDeviceId(const std::map<std::string, std::string> &config_para,
  88. vector<int32_t> &device_list);
  89. uint64_t GetProfilingModule();
  90. void UpdateDeviceIdModuleMap(string prof_type, uint64_t module, const vector<int32_t> &device_list);
  91. void UpdateSubscribeDeviceModuleMap(std::string prof_type, uint32_t device_id, uint64_t module);
  92. void GetOpInputInfo(const OpDescPtr &op, TaskDescInfo &task_desc_info) const;
  93. void GetOpOutputInfo(const OpDescPtr &op, TaskDescInfo &task_desc_info) const;
  94. vector<int32_t> device_id_;
  95. map<int32_t, uint64_t> device_id_module_map_; // key: device_id, value: profiling on module
  96. map<uint32_t, DeviceSubsInfo> subs_dev_module_; // key: device_id, value: profiling on module
  97. uint32_t subscribe_count_;
  98. std::mutex mutex_;
  99. std::mutex mutex_report_;
  100. std::string fp_point_;
  101. std::string bp_point_;
  102. uint32_t reporter_max_len_ = 0;
  103. uint64_t index_id_;
  104. std::map<uint32_t, uint32_t> device_id_map_; // key: graph_id, value: device_id
  105. std::map<uint32_t, uint32_t> model_id_map_; // key: graph_id, value: model_id
  106. ProfSubscribeInfo subscribe_info_;
  107. MsprofReporterCallback reporter_callback_;
  108. };
  109. } // namespace ge
  110. #endif // GE_COMMON_PROFILING_PROFILING_MANAGER_H_

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用,用户对此并无感知。GE主要由GE API和GE Core两部分组成,详细的架构图如下所示。