|
|
@@ -1,77 +1,77 @@ |
|
|
|
#ifndef COMMON_SH_H |
|
|
|
#define COMMON_SH_H |
|
|
|
#ifndef COMMON_SB_H |
|
|
|
#define COMMON_SB_H |
|
|
|
|
|
|
|
#ifndef DYNAMIC_ARCH |
|
|
|
|
|
|
|
#define SHDOT_K shdot_k |
|
|
|
#define SHSTOBF16_K shstobf16_k |
|
|
|
#define SHDTOBF16_K shdtobf16_k |
|
|
|
#define SBDOT_K sbdot_k |
|
|
|
#define SBSTOBF16_K sbstobf16_k |
|
|
|
#define SBDTOBF16_K sbdtobf16_k |
|
|
|
#define SBF16TOS_K sbf16tos_k |
|
|
|
#define DBF16TOD_K dbf16tod_k |
|
|
|
|
|
|
|
#define SHGEMM_ONCOPY shgemm_oncopy |
|
|
|
#define SHGEMM_OTCOPY shgemm_otcopy |
|
|
|
#define SBGEMM_ONCOPY sbgemm_oncopy |
|
|
|
#define SBGEMM_OTCOPY sbgemm_otcopy |
|
|
|
|
|
|
|
#if SHGEMM_DEFAULT_UNROLL_M == SHGEMM_DEFAULT_UNROLL_N |
|
|
|
#define SHGEMM_INCOPY shgemm_oncopy |
|
|
|
#define SHGEMM_ITCOPY shgemm_otcopy |
|
|
|
#if SBGEMM_DEFAULT_UNROLL_M == SBGEMM_DEFAULT_UNROLL_N |
|
|
|
#define SBGEMM_INCOPY sbgemm_oncopy |
|
|
|
#define SBGEMM_ITCOPY sbgemm_otcopy |
|
|
|
#else |
|
|
|
#define SHGEMM_INCOPY shgemm_incopy |
|
|
|
#define SHGEMM_ITCOPY shgemm_itcopy |
|
|
|
#define SBGEMM_INCOPY sbgemm_incopy |
|
|
|
#define SBGEMM_ITCOPY sbgemm_itcopy |
|
|
|
#endif |
|
|
|
#define SHGEMM_BETA shgemm_beta |
|
|
|
#define SHGEMM_KERNEL shgemm_kernel |
|
|
|
#define SBGEMM_BETA sbgemm_beta |
|
|
|
#define SBGEMM_KERNEL sbgemm_kernel |
|
|
|
|
|
|
|
#else |
|
|
|
|
|
|
|
#define SHDOT_K gotoblas -> shdot_k |
|
|
|
#define SHSTOBF16_K gotoblas -> shstobf16_k |
|
|
|
#define SHDTOBF16_K gotoblas -> shdtobf16_k |
|
|
|
#define SBDOT_K gotoblas -> sbdot_k |
|
|
|
#define SBSTOBF16_K gotoblas -> sbstobf16_k |
|
|
|
#define SBDTOBF16_K gotoblas -> sbdtobf16_k |
|
|
|
#define SBF16TOS_K gotoblas -> sbf16tos_k |
|
|
|
#define DBF16TOD_K gotoblas -> dbf16tod_k |
|
|
|
|
|
|
|
#define SHGEMM_ONCOPY gotoblas -> shgemm_oncopy |
|
|
|
#define SHGEMM_OTCOPY gotoblas -> shgemm_otcopy |
|
|
|
#define SHGEMM_INCOPY gotoblas -> shgemm_incopy |
|
|
|
#define SHGEMM_ITCOPY gotoblas -> shgemm_itcopy |
|
|
|
#define SHGEMM_BETA gotoblas -> shgemm_beta |
|
|
|
#define SHGEMM_KERNEL gotoblas -> shgemm_kernel |
|
|
|
#define SBGEMM_ONCOPY gotoblas -> sbgemm_oncopy |
|
|
|
#define SBGEMM_OTCOPY gotoblas -> sbgemm_otcopy |
|
|
|
#define SBGEMM_INCOPY gotoblas -> sbgemm_incopy |
|
|
|
#define SBGEMM_ITCOPY gotoblas -> sbgemm_itcopy |
|
|
|
#define SBGEMM_BETA gotoblas -> sbgemm_beta |
|
|
|
#define SBGEMM_KERNEL gotoblas -> sbgemm_kernel |
|
|
|
|
|
|
|
#endif |
|
|
|
|
|
|
|
#define SHGEMM_NN shgemm_nn |
|
|
|
#define SHGEMM_CN shgemm_tn |
|
|
|
#define SHGEMM_TN shgemm_tn |
|
|
|
#define SHGEMM_NC shgemm_nt |
|
|
|
#define SHGEMM_NT shgemm_nt |
|
|
|
#define SHGEMM_CC shgemm_tt |
|
|
|
#define SHGEMM_CT shgemm_tt |
|
|
|
#define SHGEMM_TC shgemm_tt |
|
|
|
#define SHGEMM_TT shgemm_tt |
|
|
|
#define SHGEMM_NR shgemm_nn |
|
|
|
#define SHGEMM_TR shgemm_tn |
|
|
|
#define SHGEMM_CR shgemm_tn |
|
|
|
#define SHGEMM_RN shgemm_nn |
|
|
|
#define SHGEMM_RT shgemm_nt |
|
|
|
#define SHGEMM_RC shgemm_nt |
|
|
|
#define SHGEMM_RR shgemm_nn |
|
|
|
#define SBGEMM_NN sbgemm_nn |
|
|
|
#define SBGEMM_CN sbgemm_tn |
|
|
|
#define SBGEMM_TN sbgemm_tn |
|
|
|
#define SBGEMM_NC sbgemm_nt |
|
|
|
#define SBGEMM_NT sbgemm_nt |
|
|
|
#define SBGEMM_CC sbgemm_tt |
|
|
|
#define SBGEMM_CT sbgemm_tt |
|
|
|
#define SBGEMM_TC sbgemm_tt |
|
|
|
#define SBGEMM_TT sbgemm_tt |
|
|
|
#define SBGEMM_NR sbgemm_nn |
|
|
|
#define SBGEMM_TR sbgemm_tn |
|
|
|
#define SBGEMM_CR sbgemm_tn |
|
|
|
#define SBGEMM_RN sbgemm_nn |
|
|
|
#define SBGEMM_RT sbgemm_nt |
|
|
|
#define SBGEMM_RC sbgemm_nt |
|
|
|
#define SBGEMM_RR sbgemm_nn |
|
|
|
|
|
|
|
#define SHGEMM_THREAD_NN shgemm_thread_nn |
|
|
|
#define SHGEMM_THREAD_CN shgemm_thread_tn |
|
|
|
#define SHGEMM_THREAD_TN shgemm_thread_tn |
|
|
|
#define SHGEMM_THREAD_NC shgemm_thread_nt |
|
|
|
#define SHGEMM_THREAD_NT shgemm_thread_nt |
|
|
|
#define SHGEMM_THREAD_CC shgemm_thread_tt |
|
|
|
#define SHGEMM_THREAD_CT shgemm_thread_tt |
|
|
|
#define SHGEMM_THREAD_TC shgemm_thread_tt |
|
|
|
#define SHGEMM_THREAD_TT shgemm_thread_tt |
|
|
|
#define SHGEMM_THREAD_NR shgemm_thread_nn |
|
|
|
#define SHGEMM_THREAD_TR shgemm_thread_tn |
|
|
|
#define SHGEMM_THREAD_CR shgemm_thread_tn |
|
|
|
#define SHGEMM_THREAD_RN shgemm_thread_nn |
|
|
|
#define SHGEMM_THREAD_RT shgemm_thread_nt |
|
|
|
#define SHGEMM_THREAD_RC shgemm_thread_nt |
|
|
|
#define SHGEMM_THREAD_RR shgemm_thread_nn |
|
|
|
#define SBGEMM_THREAD_NN sbgemm_thread_nn |
|
|
|
#define SBGEMM_THREAD_CN sbgemm_thread_tn |
|
|
|
#define SBGEMM_THREAD_TN sbgemm_thread_tn |
|
|
|
#define SBGEMM_THREAD_NC sbgemm_thread_nt |
|
|
|
#define SBGEMM_THREAD_NT sbgemm_thread_nt |
|
|
|
#define SBGEMM_THREAD_CC sbgemm_thread_tt |
|
|
|
#define SBGEMM_THREAD_CT sbgemm_thread_tt |
|
|
|
#define SBGEMM_THREAD_TC sbgemm_thread_tt |
|
|
|
#define SBGEMM_THREAD_TT sbgemm_thread_tt |
|
|
|
#define SBGEMM_THREAD_NR sbgemm_thread_nn |
|
|
|
#define SBGEMM_THREAD_TR sbgemm_thread_tn |
|
|
|
#define SBGEMM_THREAD_CR sbgemm_thread_tn |
|
|
|
#define SBGEMM_THREAD_RN sbgemm_thread_nn |
|
|
|
#define SBGEMM_THREAD_RT sbgemm_thread_nt |
|
|
|
#define SBGEMM_THREAD_RC sbgemm_thread_nt |
|
|
|
#define SBGEMM_THREAD_RR sbgemm_thread_nn |
|
|
|
|
|
|
|
#endif |
|
|
|
|