Author | SHA1 | Message | Date |
---|---|---|---|
|
92058a75e2 |
For gemm multi-threading, simply split M.
e.g. layer 1: A(1600k, 576), B(576, 64). B is very small, so we split M. |
10 years ago |
@@ -80,7 +80,7 @@ VERSION = 0.2.16.dev | |||||
# NO_LAPACKE = 1 | # NO_LAPACKE = 1 | ||||
# If you want to use legacy threaded Level 3 implementation. | # If you want to use legacy threaded Level 3 implementation. | ||||
# USE_SIMPLE_THREADED_LEVEL3 = 1 | |||||
USE_SIMPLE_THREADED_LEVEL3 = 1 | |||||
# If you want to drive whole 64bit region by BLAS. Not all Fortran | # If you want to drive whole 64bit region by BLAS. Not all Fortran | ||||
# compiler supports this. It's safe to keep comment it out if you | # compiler supports this. It's safe to keep comment it out if you | ||||
@@ -1194,6 +1194,8 @@ extern gotoblas_t *gotoblas; | |||||
#define XGEMM_DEFAULT_UNROLL_N 2 | #define XGEMM_DEFAULT_UNROLL_N 2 | ||||
#endif | #endif | ||||
#define GEMM_THREAD gemm_thread_m | |||||
#ifndef GEMM_THREAD | #ifndef GEMM_THREAD | ||||
#define GEMM_THREAD gemm_thread_n | #define GEMM_THREAD gemm_thread_n | ||||
#endif | #endif | ||||