You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number; they can include dashes ('-') and can be up to 35 characters long.

common_sb.h 2.4 kB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677
  /*
   * Name-mapping macros for the "sh" kernel and GEMM driver symbols.
   *
   * Every macro in this header expands either to a bare identifier or,
   * when DYNAMIC_ARCH is defined, to a member access through `gotoblas`.
   * Nothing here declares or defines the underlying symbols; they must be
   * provided elsewhere.
   *
   * NOTE(review): the include guard is spelled COMMON_SH_H. It is left
   * unchanged because other headers may test for it -- confirm before
   * renaming.
   */
  #ifndef COMMON_SH_H
  #define COMMON_SH_H

  #ifndef DYNAMIC_ARCH

  /* DYNAMIC_ARCH not defined: kernel macros are the plain symbol names. */
  #define SHDOT_K          shdot_k
  #define SHSTOBF16_K      shstobf16_k
  #define SHDTOBF16_K      shdtobf16_k
  #define SBF16TOS_K       sbf16tos_k
  #define DBF16TOD_K       dbf16tod_k

  #define SHGEMM_ONCOPY    shgemm_oncopy
  #define SHGEMM_OTCOPY    shgemm_otcopy

  /*
   * When the two unroll factors compare equal, the "I" copy macros reuse
   * the "O" copy symbols instead of naming separate routines.  Identifiers
   * that are not defined as macros evaluate to 0 inside #if, so this branch
   * is also taken when neither factor has been defined before inclusion.
   */
  #if SHGEMM_DEFAULT_UNROLL_M == SHGEMM_DEFAULT_UNROLL_N
  #define SHGEMM_INCOPY    shgemm_oncopy
  #define SHGEMM_ITCOPY    shgemm_otcopy
  #else
  #define SHGEMM_INCOPY    shgemm_incopy
  #define SHGEMM_ITCOPY    shgemm_itcopy
  #endif

  #define SHGEMM_BETA      shgemm_beta
  #define SHGEMM_KERNEL    shgemm_kernel

  #else /* DYNAMIC_ARCH */

  /*
   * DYNAMIC_ARCH defined: each kernel macro becomes a member access through
   * `gotoblas`.  Unlike the branch above, INCOPY/ITCOPY always name their
   * own members here, regardless of the unroll factors.
   * NOTE(review): `gotoblas` is not declared in this header; presumably it
   * is a pointer to a per-architecture function table -- confirm.
   */
  #define SHDOT_K          gotoblas -> shdot_k
  #define SHSTOBF16_K      gotoblas -> shstobf16_k
  #define SHDTOBF16_K      gotoblas -> shdtobf16_k
  #define SBF16TOS_K       gotoblas -> sbf16tos_k
  #define DBF16TOD_K       gotoblas -> dbf16tod_k

  #define SHGEMM_ONCOPY    gotoblas -> shgemm_oncopy
  #define SHGEMM_OTCOPY    gotoblas -> shgemm_otcopy
  #define SHGEMM_INCOPY    gotoblas -> shgemm_incopy
  #define SHGEMM_ITCOPY    gotoblas -> shgemm_itcopy

  #define SHGEMM_BETA      gotoblas -> shgemm_beta
  #define SHGEMM_KERNEL    gotoblas -> shgemm_kernel

  #endif /* DYNAMIC_ARCH */

  /*
   * GEMM driver names, independent of DYNAMIC_ARCH.  All sixteen two-letter
   * suffixes resolve to just four symbols (nn, tn, nt, tt): a 'C' maps to
   * the same symbol as 'T', and an 'R' maps to the same symbol as 'N'.
   * NOTE(review): presumably N/T/C/R follow the usual BLAS operand modes
   * (none / transpose / conjugate-transpose / conjugate) -- confirm.
   */
  #define SHGEMM_NN        shgemm_nn
  #define SHGEMM_CN        shgemm_tn
  #define SHGEMM_TN        shgemm_tn
  #define SHGEMM_NC        shgemm_nt
  #define SHGEMM_NT        shgemm_nt
  #define SHGEMM_CC        shgemm_tt
  #define SHGEMM_CT        shgemm_tt
  #define SHGEMM_TC        shgemm_tt
  #define SHGEMM_TT        shgemm_tt
  #define SHGEMM_NR        shgemm_nn
  #define SHGEMM_TR        shgemm_tn
  #define SHGEMM_CR        shgemm_tn
  #define SHGEMM_RN        shgemm_nn
  #define SHGEMM_RT        shgemm_nt
  #define SHGEMM_RC        shgemm_nt
  #define SHGEMM_RR        shgemm_nn

  /* The shgemm_thread_* names use the same sixteen-to-four aliasing. */
  #define SHGEMM_THREAD_NN shgemm_thread_nn
  #define SHGEMM_THREAD_CN shgemm_thread_tn
  #define SHGEMM_THREAD_TN shgemm_thread_tn
  #define SHGEMM_THREAD_NC shgemm_thread_nt
  #define SHGEMM_THREAD_NT shgemm_thread_nt
  #define SHGEMM_THREAD_CC shgemm_thread_tt
  #define SHGEMM_THREAD_CT shgemm_thread_tt
  #define SHGEMM_THREAD_TC shgemm_thread_tt
  #define SHGEMM_THREAD_TT shgemm_thread_tt
  #define SHGEMM_THREAD_NR shgemm_thread_nn
  #define SHGEMM_THREAD_TR shgemm_thread_tn
  #define SHGEMM_THREAD_CR shgemm_thread_tn
  #define SHGEMM_THREAD_RN shgemm_thread_nn
  #define SHGEMM_THREAD_RT shgemm_thread_nt
  #define SHGEMM_THREAD_RC shgemm_thread_nt
  #define SHGEMM_THREAD_RR shgemm_thread_nn

  #endif /* COMMON_SH_H */