|
@@ -72,6 +72,11 @@ BLASLONG shgemm_p = DEFAULT_GEMM_P; |
|
|
#else |
|
|
#else |
|
|
BLASLONG shgemm_p = SHGEMM_P; |
|
|
BLASLONG shgemm_p = SHGEMM_P; |
|
|
#endif |
|
|
#endif |
|
|
|
|
|
#if BGEMM_P == bgemm_p |
|
|
|
|
|
BLASLONG bgemm_p = DEFAULT_GEMM_P; |
|
|
|
|
|
#else |
|
|
|
|
|
BLASLONG bgemm_p = BGEMM_P; |
|
|
|
|
|
#endif |
|
|
#if SGEMM_P == sgemm_p |
|
|
#if SGEMM_P == sgemm_p |
|
|
BLASLONG sgemm_p = DEFAULT_GEMM_P; |
|
|
BLASLONG sgemm_p = DEFAULT_GEMM_P; |
|
|
#else |
|
|
#else |
|
@@ -103,6 +108,11 @@ BLASLONG shgemm_q = DEFAULT_GEMM_Q; |
|
|
#else |
|
|
#else |
|
|
BLASLONG shgemm_q = SHGEMM_Q; |
|
|
BLASLONG shgemm_q = SHGEMM_Q; |
|
|
#endif |
|
|
#endif |
|
|
|
|
|
#if BGEMM_Q == bgemm_q |
|
|
|
|
|
BLASLONG bgemm_q = DEFAULT_GEMM_Q; |
|
|
|
|
|
#else |
|
|
|
|
|
BLASLONG bgemm_q = BGEMM_Q; |
|
|
|
|
|
#endif |
|
|
#if SGEMM_Q == sgemm_q |
|
|
#if SGEMM_Q == sgemm_q |
|
|
BLASLONG sgemm_q = DEFAULT_GEMM_Q; |
|
|
BLASLONG sgemm_q = DEFAULT_GEMM_Q; |
|
|
#else |
|
|
#else |
|
@@ -134,6 +144,11 @@ BLASLONG shgemm_r = DEFAULT_GEMM_R; |
|
|
#else |
|
|
#else |
|
|
BLASLONG shgemm_r = SHGEMM_R; |
|
|
BLASLONG shgemm_r = SHGEMM_R; |
|
|
#endif |
|
|
#endif |
|
|
|
|
|
#if BGEMM_R == bgemm_r |
|
|
|
|
|
BLASLONG bgemm_r = DEFAULT_GEMM_R; |
|
|
|
|
|
#else |
|
|
|
|
|
BLASLONG bgemm_r = BGEMM_R; |
|
|
|
|
|
#endif |
|
|
#if SGEMM_R == sgemm_r |
|
|
#if SGEMM_R == sgemm_r |
|
|
BLASLONG sgemm_r = DEFAULT_GEMM_R; |
|
|
BLASLONG sgemm_r = DEFAULT_GEMM_R; |
|
|
#else |
|
|
#else |
|
@@ -541,6 +556,7 @@ void blas_set_parameter(void){ |
|
|
|
|
|
|
|
|
#ifdef BUILD_BFLOAT16 |
|
|
#ifdef BUILD_BFLOAT16 |
|
|
sbgemm_r = (((BUFFER_SIZE - ((SBGEMM_P * SBGEMM_Q * 4 + GEMM_OFFSET_A + GEMM_ALIGN) & ~GEMM_ALIGN)) / (SBGEMM_Q * 4)) - 15) & ~15; |
|
|
sbgemm_r = (((BUFFER_SIZE - ((SBGEMM_P * SBGEMM_Q * 4 + GEMM_OFFSET_A + GEMM_ALIGN) & ~GEMM_ALIGN)) / (SBGEMM_Q * 4)) - 15) & ~15; |
|
|
|
|
|
bgemm_r = (((BUFFER_SIZE - ((BGEMM_P * BGEMM_Q * 4 + GEMM_OFFSET_A + GEMM_ALIGN) & ~GEMM_ALIGN)) / (BGEMM_Q * 4)) - 15) & ~15; |
|
|
#endif |
|
|
#endif |
|
|
#ifdef BUILD_HFLOAT16 |
|
|
#ifdef BUILD_HFLOAT16 |
|
|
shgemm_r = (((BUFFER_SIZE - ((SHGEMM_P * SHGEMM_Q * 4 + GEMM_OFFSET_A + GEMM_ALIGN) & ~GEMM_ALIGN)) / (SHGEMM_Q * 4)) - 15) & ~15; |
|
|
shgemm_r = (((BUFFER_SIZE - ((SHGEMM_P * SHGEMM_Q * 4 + GEMM_OFFSET_A + GEMM_ALIGN) & ~GEMM_ALIGN)) / (SHGEMM_Q * 4)) - 15) & ~15; |
|
@@ -653,6 +669,7 @@ void blas_set_parameter(void){ |
|
|
|
|
|
|
|
|
#ifdef BUILD_BFLOAT16 |
|
|
#ifdef BUILD_BFLOAT16 |
|
|
sbgemm_r = (((BUFFER_SIZE - ((SBGEMM_P * SBGEMM_Q * 4 + GEMM_OFFSET_A + GEMM_ALIGN) & ~GEMM_ALIGN)) / (SBGEMM_Q * 4)) - 15) & ~15; |
|
|
sbgemm_r = (((BUFFER_SIZE - ((SBGEMM_P * SBGEMM_Q * 4 + GEMM_OFFSET_A + GEMM_ALIGN) & ~GEMM_ALIGN)) / (SBGEMM_Q * 4)) - 15) & ~15; |
|
|
|
|
|
bgemm_r = (((BUFFER_SIZE - ((BGEMM_P * BGEMM_Q * 4 + GEMM_OFFSET_A + GEMM_ALIGN) & ~GEMM_ALIGN)) / (BGEMM_Q * 4)) - 15) & ~15; |
|
|
#endif |
|
|
#endif |
|
|
#ifdef BUILD_HFLOAT16 |
|
|
#ifdef BUILD_HFLOAT16 |
|
|
shgemm_r = (((BUFFER_SIZE - ((SHGEMM_P * SHGEMM_Q * 4 + GEMM_OFFSET_A + GEMM_ALIGN) & ~GEMM_ALIGN)) / (SHGEMM_Q * 4)) - 15) & ~15; |
|
|
shgemm_r = (((BUFFER_SIZE - ((SHGEMM_P * SHGEMM_Q * 4 + GEMM_OFFSET_A + GEMM_ALIGN) & ~GEMM_ALIGN)) / (SHGEMM_Q * 4)) - 15) & ~15; |
|
|