Browse Source

Merge pull request #4585 from martin-frbg/issue1881

Cap the number of parallel threads for GEMM;GETRF and POTRF to ensure sensible workloads on big systems
tags/v0.3.27
Martin Kroeker GitHub 1 year ago
parent
commit
d277c6d15b
No known key found for this signature in database GPG Key ID: B5690EEEBB952194
3 changed files with 25 additions and 12 deletions
  1. +5
    -1
      interface/gemm.c
  2. +11
    -6
      interface/lapack/getrf.c
  3. +9
    -5
      interface/lapack/potrf.c

+ 5
- 1
interface/gemm.c View File

@@ -533,8 +533,12 @@ void CNAME(enum CBLAS_ORDER order, enum CBLAS_TRANSPOSE TransA, enum CBLAS_TRANS
MNK = (double) args.m * (double) args.n * (double) args.k;
if ( MNK <= (SMP_THRESHOLD_MIN * (double) GEMM_MULTITHREAD_THRESHOLD) )
args.nthreads = 1;
else
else {
args.nthreads = num_cpu_avail(3);
if (MNK/args.nthreads < SMP_THRESHOLD_MIN*(double)GEMM_MULTITHREAD_THRESHOLD)
args.nthreads = MNK/(SMP_THRESHOLD_MIN*(double)GEMM_MULTITHREAD_THRESHOLD);
}

args.common = NULL;

if (args.nthreads == 1) {


+ 11
- 6
interface/lapack/getrf.c View File

@@ -95,14 +95,19 @@ int NAME(blasint *M, blasint *N, FLOAT *a, blasint *ldA, blasint *ipiv, blasint

#ifdef SMP
args.common = NULL;

#ifndef DOUBLE
if (args.m*args.n < 40000)
#else
if (args.m*args.n < 10000)
int nmax = 40000;
#else
int nmax = 10000;
#endif
args.nthreads=1;
else
args.nthreads = num_cpu_avail(4);
if (args.m*args.n <nmax) {
args.nthreads = 1;
} else {
args.nthreads = num_cpu_avail(4);
if ((args.m*args.n)/args.nthreads <nmax)
args.nthreads = (args.m*args.n)/nmax;
}

if (args.nthreads == 1) {
#endif


+ 9
- 5
interface/lapack/potrf.c View File

@@ -113,13 +113,17 @@ int NAME(char *UPLO, blasint *N, FLOAT *a, blasint *ldA, blasint *Info){
#ifdef SMP
args.common = NULL;
#ifndef DOUBLE
if (args.n <128)
#else
if (args.n <64)
int nmax = 128;
#else
int nmax = 64;
#endif
if (args.n <nmax) {
args.nthreads = 1;
else
args.nthreads = num_cpu_avail(4);
} else {
args.nthreads = num_cpu_avail(4);
if (args.n/args.nthreads <nmax)
args.nthreads = args.n/nmax;
}

if (args.nthreads == 1) {
#endif


Loading…
Cancel
Save