|
|
@@ -3128,7 +3128,7 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
|
|
|
|
|
|
|
#define SYMV_P 16 |
|
|
|
|
|
|
|
#if defined(CORTEXA57) || \ |
|
|
|
#if defined(CORTEXA57) || defined(CORTEXX1) \ |
|
|
|
defined(CORTEXA72) || defined(CORTEXA73) || \ |
|
|
|
defined(FALKOR) || defined(TSV110) || defined(EMAG8180) || defined(VORTEX) || defined(FT2000) |
|
|
|
|
|
|
@@ -3147,7 +3147,7 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
|
|
|
/*FIXME: this should be using the cache size, but there is currently no easy way to |
|
|
|
query that on ARM. So if getarch counted more than 8 cores we simply assume the host |
|
|
|
is a big desktop or server with abundant cache rather than a phone or embedded device */ |
|
|
|
#if NUM_CORES > 8 || defined(TSV110) || defined(EMAG8180) || defined(VORTEX) |
|
|
|
#if NUM_CORES > 8 || defined(TSV110) || defined(EMAG8180) || defined(VORTEX)|| defined(CORTEXX1) |
|
|
|
#define SGEMM_DEFAULT_P 512 |
|
|
|
#define DGEMM_DEFAULT_P 256 |
|
|
|
#define CGEMM_DEFAULT_P 256 |
|
|
@@ -3377,7 +3377,7 @@ is a big desktop or server with abundant cache rather than a phone or embedded d |
|
|
|
#define CGEMM_DEFAULT_R 4096 |
|
|
|
#define ZGEMM_DEFAULT_R 4096 |
|
|
|
|
|
|
|
#elif defined(ARMV8SVE) || defined(A64FX) || defined(ARMV9) || defined(CORTEXA510) |
|
|
|
#elif defined(ARMV8SVE) || defined(A64FX) || defined(ARMV9) || defined(CORTEXA510)|| defined(CORTEXA710) || defined(CORTEXX2) |
|
|
|
|
|
|
|
/* When all BLAS3 routines are implemeted with SVE, SGEMM_DEFAULT_UNROLL_M should be "sve_vl". |
|
|
|
Until then, just keep it different than DGEMM_DEFAULT_UNROLL_N to keep copy routines in both directions seperated. */ |
|
|
|