You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

rt_ffts_plus.h 894 B

4 years ago
123456789101112131415161718192021222324252627282930313233
  1. /*
  2. * Copyright (c) Huawei Technologies Co., Ltd. 2021. All rights reserved.
  3. * Description: ffts plus interface
  4. */
  5. #ifndef __CCE_RUNTIME_FFTS_PLUS_H
  6. #define __CCE_RUNTIME_FFTS_PLUS_H
  7. #include "base.h"
  8. #include "rt_stars_define.h"
  9. #if defined(__cplusplus) && !defined(COMPILE_OMG_PACKAGE)
  10. extern "C" {
  11. #endif
  12. #pragma pack(push) // save the current packing alignment so it can be restored below
  13. #pragma pack (1) // 1-byte packing: no padding is inserted between the members that follow
  14. typedef struct tagFftsPlusTaskInfo { // argument type of rtFftsPlusTaskLaunch (declared below)
  15. const rtFftsPlusSqe_t *fftsPlusSqe; // read-only pointer to an rtFftsPlusSqe_t; type is not declared here — presumably in rt_stars_define.h, TODO confirm
  16. const void *descBuf; // read-only buffer that includes the total context
  17. size_t descBufLen; // length of descBuf (presumably in bytes — TODO confirm)
  18. } rtFftsPlusTaskInfo_t;
  19. #pragma pack(pop) // restore the packing alignment saved by the push above
  20. RTS_API rtError_t rtGetAddrAndPrefCntWithHandle(void *handle, const void *devFunc, void **addr, uint32_t *prefetchCnt); // NOTE(review): presumably looks up devFunc under handle and writes results to *addr and *prefetchCnt; status returned as rtError_t — confirm against the implementation
  21. RTS_API rtError_t rtFftsPlusTaskLaunch(rtFftsPlusTaskInfo_t *fftsPlusTaskInfo, rtStream_t stream); // NOTE(review): presumably launches the task described by fftsPlusTaskInfo on stream; status returned as rtError_t — confirm against the implementation
  22. #if defined(__cplusplus) && !defined(COMPILE_OMG_PACKAGE)
  23. }
  24. #endif
  25. #endif // __CCE_RUNTIME_FFTS_PLUS_H

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用而用户并不感知。GE主要由GE API和GE Core两部分组成,详细的架构图如下所示。