You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number; they can include dashes ('-') and can be up to 35 characters long.

graph_manager.h 18 kB

5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449
  1. /**
  2. * Copyright 2019-2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #ifndef GE_GRAPH_MANAGER_GRAPH_MANAGER_H_
  17. #define GE_GRAPH_MANAGER_GRAPH_MANAGER_H_
  18. #include <iostream>
  19. #include <map>
  20. #include <memory>
  21. #include <set>
  22. #include <string>
  23. #include <thread>
  24. #include <vector>
  25. #include "common/blocking_queue.h"
  26. #include "framework/common/ge_inner_error_codes.h"
  27. #include "common/helper/model_cache_helper.h"
  28. #include "external/graph/types.h"
  29. #include "external/ge/ge_api_types.h"
  30. #include "graph/build/graph_builder.h"
  31. #include "graph/ge_local_context.h"
  32. #include "graph/load/graph_loader.h"
  33. #include "graph/manager/graph_manager_utils.h"
  34. #include "graph/manager/util/variable_accelerate_ctrl.h"
  35. #include "graph/optimize/graph_optimize.h"
  36. #include "graph/partition/graph_partition.h"
  37. #include "graph/preprocess/graph_preprocess.h"
  38. #include "graph/tuning_utils.h"
  39. #include "model/ge_model.h"
  40. #include "common/executor.h"
  41. namespace ge {
  42. class GraphManager {
  43. public:
  44. GraphManager() = default;
  45. ~GraphManager() = default;
  46. ///
  47. /// @ingroup ge_graph
  48. /// @brief graph manager init
  49. /// @param [in] options user config params
  50. /// @return Status result of function
  51. ///
  52. Status Initialize(const std::map<string, string> &options, Executor *executor = nullptr);
  53. ///
  54. /// @ingroup ge_graph
  55. /// @brief graph manager finalize
  56. /// @return Status result of function
  57. ///
  58. Status Finalize();
  59. ///
  60. /// @ingroup ge_graph
  61. /// @brief add specific graph
  62. /// @param [in] graph_id graph id
  63. /// @param [out] Graph output graph
  64. /// @return Status result of function
  65. ///
  66. Status AddGraph(const GraphId &graph_id, const Graph &graph, const std::map<std::string, std::string> &options,
  67. const OmgContext &omg_context);
  68. Status InitDynamicParams(ComputeGraphPtr &compute_graph);
  69. ///
  70. /// @ingroup ge_graph
  71. /// @brief add a copy graph
  72. /// @param [in] graph_id graph id
  73. /// @param [out] Graph output graph
  74. /// @return Status result of function
  75. ///
  76. Status AddGraphWithCopy(const GraphId &graph_id, const Graph &graph,
  77. const std::map<std::string, std::string> &options, const OmgContext &omg_context);
  78. ///
  79. /// @ingroup ge_graph
  80. /// @brief remove specific graph
  81. /// @param [in] graph_id graph id
  82. /// @return Status result of function
  83. ///
  84. Status RemoveGraph(const GraphId &graph_id);
  85. ///
  86. /// @ingroup ge_graph
  87. /// @brief run specific graph
  88. /// @param [in] graph_id graph id
  89. /// @param [in] inputs input data
  90. /// @param [out] outputs output data
  91. /// @return Status result of function
  92. ///
  93. Status RunGraph(const GraphId &graph_id, const std::vector<GeTensor> &inputs, std::vector<GeTensor> &outputs,
  94. uint64_t session_id = INVALID_SESSION_ID);
  95. ///
  96. /// @ingroup ge_graph
  97. /// @brief run specific graph with specific session id and stream
  98. /// @param [in] graph_id graph id
  99. /// @param [in] stream specific stream
  100. /// @param [in] session_id session id
  101. /// @param [in] inputs input data
  102. /// @param [out] outputs output data
  103. /// @return Status result of function
  104. ///
  105. Status RunGraphWithStreamAsync(const GraphId &graph_id, rtStream_t stream, uint64_t session_id,
  106. const std::vector<GeTensor> &inputs, std::vector<GeTensor> &outputs);
  107. ///
  108. /// @ingroup ge_graph
  109. /// @brief build specific graph
  110. /// @param [in] graph_id graph id
  111. /// @param [in] inputs input data
  112. /// @param [out] models build result
  113. /// @return Status result of function
  114. ///
  115. ge::Status BuildGraph(const GraphId &graph_id, const std::vector<GeTensor> &inputs, GeRootModelPtr &models,
  116. uint64_t session_id = 0, bool async = false);
  117. Status BuildGraphForUnregisteredOp(const GraphId &graph_id, const std::vector<GeTensor> &inputs,
  118. GeRootModelPtr &ge_root_model, uint64_t session_id);
  119. ///
  120. /// @ingroup ge_graph
  121. /// @brief Save extra attribute to Model
  122. /// @param [in] model: Model attribues will save to.
  123. /// @param [in] type: type of OpDesc.
  124. /// @param [in] attrs: attributes of OpDesc
  125. /// @param [in] inputs: input tensor
  126. /// @param [in] outputs: output tensor
  127. /// @return: Status
  128. ///
  129. Status SaveParams(ge::GeModel &model, const std::string &type, const std::map<string, GeAttrValue> &attrs,
  130. const std::vector<GeTensor> &inputs, const std::vector<GeTensor> &outputs);
  131. ///
  132. /// @ingroup ge_graph
  133. /// @brief get variable value from the session with specific session id
  134. /// @param [in] sessionId session id
  135. /// @param [in] name op name
  136. /// @param [out] val out value tensor
  137. /// @return Status result of function
  138. ///
  139. Status GetVariable(const std::string &name, Tensor &val);
  140. ///
  141. /// @ingroup ge_graph
  142. /// @brief run graph async on session with specific session id
  143. /// @param [in] graph_id graph id
  144. /// @param [in] inputs input data
  145. /// @param [out] callback: callback while run graph async finish
  146. /// @return Status result of function
  147. ///
  148. Status RunGraphAsync(const GraphId &graph_id, const std::vector<ge::Tensor> &inputs,
  149. uint64_t session_id, RunAsyncCallback callback);
  150. ///
  151. /// @ingroup ge_graph
  152. /// @brief me register the callback function to get the result of summary or checkpoin
  153. /// @param [in] key: summary or checkpoint
  154. /// @param [in] callbak: The real callback object of me
  155. /// @return Status result of function
  156. ///
  157. Status RegisterCallBackFunc(
  158. const std::string &key,
  159. const std::function<Status(uint32_t, const std::map<std::string, ge::Tensor> &)> &callback);
  160. Status RegisterCallBackFunc(
  161. const std::string &key,
  162. const std::function<Status(uint32_t, const std::map<AscendString, ge::Tensor> &)> &callback);
  163. const bool GetTrainFlag() const { return options_.train_graph_flag; }
  164. bool IsGraphNeedRebuild(uint32_t graph_id);
  165. Status GenerateInfershapeGraph(GraphId &graph_id);
  166. const std::map<std::string, std::string> *GetGraphOptions(uint32_t graph_id);
  167. void SetOptionsRunGraphFlag(bool run_graph_flag);
  168. Status GenCheckPointGraph(const std::map<std::string, GeTensorDesc> &all_variables, Graph &graph);
  169. Status SaveVariables(const Graph &graph, const std::vector<std::string> &var_names,
  170. const std::vector<Tensor> &outputs, std::vector<Tensor> &var_values);
  171. Status SaveCheckPointResult(const Graph &graph, const std::vector<Tensor> &outputs, map<string, Tensor> &var_results);
  172. void RemoveGraphCount(GraphId graph_id);
  173. void IncreaseGraphCount(GraphId graph_id);
  174. void DecreaseGraphCount(GraphId graph_id);
  175. Status GetGraphCount(GraphId graph_id, uint32_t &count);
  176. void SetAddGraphCondition(GraphId graph_id, uint32_t cond);
  177. uint32_t GetAddGraphCondition(GraphId graph_id);
  178. void RemoveAddGraphCondition(GraphId graph_id);
  179. private:
  180. struct CompilerStages {
  181. GraphPrepare preparer;
  182. GraphOptimize optimizer;
  183. GraphPartitioner partitioner;
  184. GraphBuilder builder;
  185. };
  186. struct PreRunArgs {
  187. GraphId graph_id;
  188. std::vector<ge::Tensor> input_tensor;
  189. uint64_t session_id;
  190. struct error_message::Context error_context;
  191. GEThreadLocalContext context;
  192. RunAsyncCallback callback;
  193. };
  194. void AddGraphNode(GraphId graph_id, const GraphNodePtr &graph_node);
  195. void RemoveGraphNode(GraphId graph_id);
  196. bool HasGraphNode(GraphId graph_id);
  197. Status GetGraphNode(const GraphId &graph_id, GraphNodePtr &out);
  198. static Status ProcessSubGraphWithMultiThreads(GraphManager *graph_manager, GraphId root_graph_id,
  199. const SubGraphInfoPtr &sub_graph_info_ptr,
  200. const std::string &root_graph_name,
  201. uint64_t session_id,
  202. const struct error_message::Context &error_context,
  203. const GEThreadLocalContext &ge_context);
  204. Status RunCustomPass(const GraphNodePtr &graph_node);
  205. Status PreRun(const GraphNodePtr &graph_node, const std::vector<GeTensor> &inputs, GeRootModelPtr &ge_root_model,
  206. uint64_t session_id = INVALID_SESSION_ID);
  207. Status OptimizeSubgraph(const GraphNodePtr &graph_node, ComputeGraphPtr &compute_graph, uint64_t session_id);
  208. Status Build(const GraphNodePtr &graph_node, ComputeGraphPtr &compute_graph,
  209. GeRootModelPtr &ge_root_model, uint64_t session_id);
  210. Status StartForRunGraph(const GraphNodePtr &graph_node, const std::vector<GeTensor> &inputs,
  211. GeRootModelPtr &ge_root_model, uint64_t session_id = INVALID_SESSION_ID);
  212. Status InnerRunGraph(GraphNodePtr &graph_node, const GraphId &graph_id, const std::vector<GeTensor> &inputs,
  213. std::vector<GeTensor> &outputs);
  214. Status InnerRunGraphWithStream(GraphNodePtr &graph_node, const GraphId &graph_id, rtStream_t stream,
  215. const std::vector<GeTensor> &inputs, std::vector<GeTensor> &outputs);
  216. Status ParseOptions(const std::map<std::string, std::string> &options);
  217. static void ParseOption(const std::map<std::string, std::string> &options, const std::string &key,
  218. std::string &option);
  219. static Status ParseOption(const std::map<std::string, std::string> &options, const std::string &key, bool &option);
  220. static Status ParseOption(const std::map<std::string, std::string> &options, const std::string &key, int &option);
  221. static Status ParseOption(const std::map<std::string, std::string> &options, const std::string &key,
  222. std::map<std::string, int> &option);
  223. static void Trim(std::string &str);
  224. static Status CheckEngineName(const std::string &engine_name, const std::string &key,
  225. const std::map<std::string, int> &option);
  226. static Status ParseParallelNum(const std::string &parallel_num, const std::string &key, int &num);
  227. static Status ParseTrainGraphFlag(bool &train_flag);
  228. static bool IsPerfLevelInvalid(int32_t perf_level);
  229. Status SummaryHandle(const GraphId &graph_id, std::vector<GeTensor> &outputs);
  230. Status CheckpointHandle(const GraphId &graph_id, const ComputeGraphPtr &compute_graph,
  231. const std::vector<GeTensor> &outputs);
  232. // call the callback function of ME to push summary result data to ME
  233. Status PushSummaryData2ME(const GraphId &graph_id, const std::map<std::string, ge::Tensor> &summary_data);
  234. // call the callback function of ME to push save result data to ME
  235. Status PushSaveData2ME(const GraphId &graph_id, const std::map<std::string, ge::Tensor> &save_data);
  236. bool IsCheckpointGraph(ComputeGraphPtr &compute_graph);
  237. bool CheckNetOutputForCheckpointGraph(NodePtr &node);
  238. bool CheckVariableForCheckpointGraph(NodePtr &node);
  239. bool CheckTransOpForCheckpointGraph(NodePtr &node);
  240. Status MergeSubGraph(ComputeGraphPtr &compute_graph, const ge::ComputeGraphPtr &original_compute_graph,
  241. GraphId root_graph_id);
  242. Status ConvertGraphToFile(ComputeGraphPtr &compute_graph, GraphPartitioner &partitioner, std::string file_path,
  243. bool exe_flag = false);
  244. Status SetSubgraph(uint64_t session_id, ComputeGraphPtr compute_graph, GraphPartitioner &partitioner);
  245. void SetAttrForHcomBroadCastOp(ge::ComputeGraphPtr &compute_graph);
  246. bool IsBroadCastOpData(const ge::NodePtr &var_node);
  247. void AdjustBroadCastOpData(const ge::NodePtr &var_node);
  248. bool IsAssignOpData(const ge::NodePtr &var_node);
  249. void AdjustAssignOpData(const ge::NodePtr &var_node);
  250. bool ConfirmUseOpAndIndexByAnchor(const ge::InDataAnchorPtr &in_anchor, const map<string, std::set<int>> &confirm_ops,
  251. ge::NodePtr &use_node);
  252. bool ConfirmUseOpAndIndexByNode(const ge::NodePtr &var_node, const map<string, std::set<int>> &confirm_ops,
  253. ge::NodePtr &use_node);
  254. // graph context
  255. std::shared_ptr<GraphContext> GetGraphContext() const { return graph_context_; }
  256. Status RemoveIsolatedConst(ge::ComputeGraphPtr &compute_graph);
  257. Status RemoveIsolatedConstInThisGraph(ge::ComputeGraphPtr &compute_graph);
  258. Status OptimizeStage1(ComputeGraphPtr &compute_graph);
  259. Status OptimizeStage2(ComputeGraphPtr &compute_graph);
  260. Status SubexpressionMigration(ComputeGraphPtr &compute_graph);
  261. bool CheckModelLoad(const GeRootModelPtr &ge_model, bool load_flag);
  262. Status LoadGraph(const GeRootModelPtr &ge_root_model, const GraphNodePtr &graph_node);
  263. bool IsGraphNeedBuild(const GraphNodePtr &graph_node);
  264. Status LoadFromCache(const GraphNodePtr &graph_node, const ModelCacheHelperPtr &cache_helper, GeModelPtr &ge_model);
  265. Status SaveCacheBeforeBuild(uint32_t graph_id, const ModelCacheHelperPtr &cache_helper);
  266. Status SaveCacheAfterBuild(uint32_t graph_id, ComputeGraphPtr graph, GeModelPtr &ge_model);
  267. void AddModelCacheHelperToMap(const GraphId &graph_id, uint64_t session_id, ComputeGraphPtr &compute_graph);
  268. Status IncreBuild(const GraphNodePtr &graph_node, GeModelPtr &ge_model);
  269. void RemoveModelCacheHelper(const GraphId &graph_id);
  270. ModelCacheHelperPtr FindModelCacheHelper(GraphId graph_id);
  271. void SetRunContext(const GraphNodePtr &graph_node);
  272. void PushGraph(const RunArgs &args);
  273. void PreRunThread();
  274. void StopQueue();
  275. void ReturnError(RunAsyncCallback callback, Status ret, const string &log);
  276. void ChangeConstTypeWhenTraining(const ComputeGraphPtr &compute_graph);
  277. Status PreRunOptimizeOriginalGraph(const GraphNodePtr &graph_node, const std::vector<GeTensor> &inputs,
  278. ge::ComputeGraphPtr &compute_graph, uint64_t session_id);
  279. Status PreRunOptimizeSubGraph(const GraphNodePtr &graph_node,
  280. ge::ComputeGraphPtr &compute_graph,
  281. uint64_t session_id);
  282. Status PreRunAfterOptimizeSubGraph(const GraphNodePtr &graph_node,
  283. ComputeGraphPtr &compute_graph,
  284. GeRootModelPtr &ge_root_model,
  285. uint64_t session_id);
  286. Status SetFuzzCompileFlag(ComputeGraphPtr &compute_graph);
  287. Status CopySubGraphAndMarkFusion(const ComputeGraphPtr &compute_graph,
  288. Graph2SubGraphInfoList &sub_graph_map,
  289. std::unordered_map<std::string, ComputeGraphPtr> &copy_graphs);
  290. Status OptimizeSubGraphWithMultiThreads(ComputeGraphPtr compute_graph,
  291. Graph2SubGraphInfoList &sub_graph_map,
  292. uint64_t session_id);
  293. bool CheckAllFusionOptimizeSuccess(const ComputeGraphPtr &compute_graph, Graph2SubGraphInfoList &sub_graph_map);
  294. Status ReplaceSubgraphWithOriGraph(const ComputeGraphPtr &compute_graph,
  295. Graph2SubGraphInfoList &sub_graph_map,
  296. std::unordered_map<std::string, ComputeGraphPtr> &copy_graphs);
  297. Status SetRtContext(rtContext_t rt_context, rtCtxMode_t mode, uint64_t session_id, uint32_t graph_id);
  298. void AddLocalOmgContext(GraphId graph_id, const OmgContext &omg_context);
  299. void UpdateLocalOmgContext(GraphId graph_id);
  300. CompilerStages &GetCompilerStages(GraphId graph_id);
  301. void RemoveCompilerStages(GraphId graph_id);
  302. Status CheckIncreBuildAndPreRun(const PreRunArgs &args, GraphNodePtr &graph_node, GeRootModelPtr &ge_root_model);
  303. Status CheckRepeatAdd(uint32_t graph_id, bool &is_added);
  304. Status NotifyWaittingGraph(uint32_t graph_id);
  305. Status CreateGraphNode(uint32_t graph_id, const Graph &graph, const std::map<std::string, std::string> &options);
  306. Status SetStagesOptions(uint32_t graph_id, const GraphManagerOptions &options);
  307. Status UnloadModel(GeRootModelPtr ge_root_model, uint32_t graph_id);
  308. void SetSessionGraphId(ComputeGraphPtr compute_graph, uint32_t graph_id);
  309. Status ModifyDataIndex(const Graph &graph, const std::map<std::string, std::string> &graph_option);
  310. static Status CheckGraphAdded(const GraphId &graph_id, const Graph &graph);
  311. std::atomic_bool thread_run_flag_{false};
  312. BlockingQueue<PreRunArgs> prerun_args_q_{};
  313. std::thread prerun_thread_;
  314. ComputeGraphPtr compute_graph_;
  315. std::map<GraphId, GraphNodePtr> graph_map_;
  316. std::map<GraphId, ModelCacheHelperPtr> cache_helper_map_;
  317. // summary and checkpoint callback function list for ME, key is summary or checkpoint
  318. std::map<std::string, std::function<Status(uint32_t, const std::map<std::string, ge::Tensor> &)>> me_callback_map_;
  319. std::map<std::string, std::function<Status(uint32_t, const std::map<AscendString, ge::Tensor> &)>> callback_map_;
  320. bool init_flag_{false};
  321. GraphManagerOptions options_;
  322. GraphContextPtr graph_context_ = nullptr;
  323. map<GraphId, OmgContext> omg_contexts_;
  324. map<GraphId, CompilerStages> compiler_stages_;
  325. Executor *executor_{nullptr};
  326. VarAccelerateCtrl var_acc_ctrl_;
  327. std::mutex run_mutex_;
  328. std::mutex member_mutex_;
  329. std::mutex unload_model_mutex_;
  330. // avoid repeatively add same graph (owns same graph id)
  331. std::mutex add_graph_mutex_;
  332. std::mutex add_graph_cond_mutex_;
  333. std::condition_variable add_graph_cv_;
  334. std::map<GraphId, uint32_t> graph_id_to_add_graph_cond_;
  335. // use for multi-thread online-infer scenario
  336. std::set<GraphId> to_be_deleted_graphs_;
  337. std::map<GraphId, uint32_t> graph_count_;
  338. std::mutex graph_count_mutex_;
  339. };
  340. } // namespace ge
  341. #endif // GE_GRAPH_MANAGER_GRAPH_MANAGER_H_

图引擎模块（GE）是MindSpore的一个子模块，其代码由C++实现，位于前端模块ME和底层硬件之间，起到承接作用。图引擎模块以ME下发的图作为输入，然后进行一系列的深度图优化操作，最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点，做了特定的优化工作，以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时，GE会被自动调用，而用户对此并无感知。GE主要由GE API和GE Core两部分组成，详细的架构图如下所示：