|
|
@@ -13,25 +13,25 @@ extern gotoblas_t gotoblas_POWER10; |
|
|
|
extern void openblas_warning(int verbose, const char *msg); |
|
|
|
|
|
|
|
static char *corename[] = { |
|
|
|
"unknown", |
|
|
|
"POWER6", |
|
|
|
"POWER8", |
|
|
|
"POWER9", |
|
|
|
"POWER10" |
|
|
|
"unknown", |
|
|
|
"POWER6", |
|
|
|
"POWER8", |
|
|
|
"POWER9", |
|
|
|
"POWER10" |
|
|
|
}; |
|
|
|
|
|
|
|
#define NUM_CORETYPES 5 |
|
|
|
|
|
|
|
char *gotoblas_corename(void) { |
|
|
|
if (gotoblas == &gotoblas_POWER6) return corename[1]; |
|
|
|
if (gotoblas == &gotoblas_POWER8) return corename[2]; |
|
|
|
if (gotoblas == &gotoblas_POWER6) return corename[1]; |
|
|
|
if (gotoblas == &gotoblas_POWER8) return corename[2]; |
|
|
|
#if (!defined __GNUC__) || ( __GNUC__ >= 6) |
|
|
|
if (gotoblas == &gotoblas_POWER9) return corename[3]; |
|
|
|
if (gotoblas == &gotoblas_POWER9) return corename[3]; |
|
|
|
#endif |
|
|
|
#ifdef HAVE_P10_SUPPORT |
|
|
|
if (gotoblas == &gotoblas_POWER10) return corename[4]; |
|
|
|
if (gotoblas == &gotoblas_POWER10) return corename[4]; |
|
|
|
#endif |
|
|
|
return corename[0]; |
|
|
|
return corename[0]; |
|
|
|
} |
|
|
|
|
|
|
|
#ifdef _AIX |
|
|
@@ -90,13 +90,13 @@ static int __builtin_cpu_supports(char* arg) |
|
|
|
|
|
|
|
static gotoblas_t *get_coretype(void) { |
|
|
|
|
|
|
|
if (__builtin_cpu_supports("power6")) |
|
|
|
return &gotoblas_POWER6; |
|
|
|
if (__builtin_cpu_supports("power8")) |
|
|
|
return &gotoblas_POWER8; |
|
|
|
if (__builtin_cpu_supports("power6")) |
|
|
|
return &gotoblas_POWER6; |
|
|
|
if (__builtin_cpu_supports("power8")) |
|
|
|
return &gotoblas_POWER8; |
|
|
|
#if (!defined __GNUC__) || ( __GNUC__ >= 6) |
|
|
|
if (__builtin_cpu_supports("power9")) |
|
|
|
return &gotoblas_POWER9; |
|
|
|
if (__builtin_cpu_supports("power9")) |
|
|
|
return &gotoblas_POWER9; |
|
|
|
#endif |
|
|
|
#ifdef HAVE_P10_SUPPORT |
|
|
|
#ifdef _AIX |
|
|
@@ -104,84 +104,84 @@ static gotoblas_t *get_coretype(void) { |
|
|
|
#else |
|
|
|
if (__builtin_cpu_supports("arch_3_1") && __builtin_cpu_supports("mma")) |
|
|
|
#endif |
|
|
|
return &gotoblas_POWER10; |
|
|
|
return &gotoblas_POWER10; |
|
|
|
#endif |
|
|
|
/* Fall back to the POWER9 implementation if the toolchain is too old or the MMA feature is not set */ |
|
|
|
/* Fall back to the POWER9 implementation if the toolchain is too old or the MMA feature is not set */ |
|
|
|
#if (!defined __GNUC__) || ( __GNUC__ < 11) || (__GNUC__ == 10 && __GNUC_MINOR__ < 2) |
|
|
|
if (__builtin_cpu_supports("power10")) |
|
|
|
return &gotoblas_POWER9; |
|
|
|
#endif |
|
|
|
return NULL; |
|
|
|
if (__builtin_cpu_supports("power10")) |
|
|
|
return &gotoblas_POWER9; |
|
|
|
#endif |
|
|
|
return NULL; |
|
|
|
} |
|
|
|
|
|
|
|
static gotoblas_t *force_coretype(char * coretype) { |
|
|
|
|
|
|
|
int i ; |
|
|
|
int found = -1; |
|
|
|
char message[128]; |
|
|
|
|
|
|
|
for ( i = 0 ; i < NUM_CORETYPES; i++) |
|
|
|
{ |
|
|
|
if (!strncasecmp(coretype, corename[i], 20)) |
|
|
|
{ |
|
|
|
found = i; |
|
|
|
break; |
|
|
|
} |
|
|
|
} |
|
|
|
|
|
|
|
switch (found) |
|
|
|
{ |
|
|
|
case 1: return (&gotoblas_POWER6); |
|
|
|
case 2: return (&gotoblas_POWER8); |
|
|
|
int i ; |
|
|
|
int found = -1; |
|
|
|
char message[128]; |
|
|
|
|
|
|
|
for ( i = 0 ; i < NUM_CORETYPES; i++) |
|
|
|
{ |
|
|
|
if (!strncasecmp(coretype, corename[i], 20)) |
|
|
|
{ |
|
|
|
found = i; |
|
|
|
break; |
|
|
|
} |
|
|
|
} |
|
|
|
|
|
|
|
switch (found) |
|
|
|
{ |
|
|
|
case 1: return (&gotoblas_POWER6); |
|
|
|
case 2: return (&gotoblas_POWER8); |
|
|
|
#if (!defined __GNUC__) || ( __GNUC__ >= 6) |
|
|
|
case 3: return (&gotoblas_POWER9); |
|
|
|
case 3: return (&gotoblas_POWER9); |
|
|
|
#endif |
|
|
|
#ifdef HAVE_P10_SUPPORT |
|
|
|
case 4: return (&gotoblas_POWER10); |
|
|
|
case 4: return (&gotoblas_POWER10); |
|
|
|
#endif |
|
|
|
default: return NULL; |
|
|
|
} |
|
|
|
snprintf(message, 128, "Core not found: %s\n", coretype); |
|
|
|
openblas_warning(1, message); |
|
|
|
default: return NULL; |
|
|
|
} |
|
|
|
snprintf(message, 128, "Core not found: %s\n", coretype); |
|
|
|
openblas_warning(1, message); |
|
|
|
} |
|
|
|
|
|
|
|
void gotoblas_dynamic_init(void) { |
|
|
|
|
|
|
|
char coremsg[128]; |
|
|
|
char coren[22]; |
|
|
|
char *p; |
|
|
|
|
|
|
|
|
|
|
|
if (gotoblas) return; |
|
|
|
|
|
|
|
p = getenv("OPENBLAS_CORETYPE"); |
|
|
|
if ( p ) |
|
|
|
{ |
|
|
|
gotoblas = force_coretype(p); |
|
|
|
} |
|
|
|
else |
|
|
|
{ |
|
|
|
gotoblas = get_coretype(); |
|
|
|
} |
|
|
|
|
|
|
|
if (gotoblas == NULL) |
|
|
|
{ |
|
|
|
snprintf(coremsg, 128, "Falling back to POWER8 core\n"); |
|
|
|
openblas_warning(1, coremsg); |
|
|
|
gotoblas = &gotoblas_POWER8; |
|
|
|
} |
|
|
|
|
|
|
|
if (gotoblas && gotoblas -> init) { |
|
|
|
strncpy(coren,gotoblas_corename(),20); |
|
|
|
sprintf(coremsg, "Core: %s\n",coren); |
|
|
|
openblas_warning(2, coremsg); |
|
|
|
gotoblas -> init(); |
|
|
|
} else { |
|
|
|
openblas_warning(0, "OpenBLAS : Architecture Initialization failed. No initialization function found.\n"); |
|
|
|
exit(1); |
|
|
|
} |
|
|
|
char coremsg[128]; |
|
|
|
char coren[22]; |
|
|
|
char *p; |
|
|
|
|
|
|
|
|
|
|
|
if (gotoblas) return; |
|
|
|
|
|
|
|
p = getenv("OPENBLAS_CORETYPE"); |
|
|
|
if ( p ) |
|
|
|
{ |
|
|
|
gotoblas = force_coretype(p); |
|
|
|
} |
|
|
|
else |
|
|
|
{ |
|
|
|
gotoblas = get_coretype(); |
|
|
|
} |
|
|
|
|
|
|
|
if (gotoblas == NULL) |
|
|
|
{ |
|
|
|
snprintf(coremsg, 128, "Falling back to POWER8 core\n"); |
|
|
|
openblas_warning(1, coremsg); |
|
|
|
gotoblas = &gotoblas_POWER8; |
|
|
|
} |
|
|
|
|
|
|
|
if (gotoblas && gotoblas -> init) { |
|
|
|
strncpy(coren,gotoblas_corename(),20); |
|
|
|
sprintf(coremsg, "Core: %s\n",coren); |
|
|
|
openblas_warning(2, coremsg); |
|
|
|
gotoblas -> init(); |
|
|
|
} else { |
|
|
|
openblas_warning(0, "OpenBLAS : Architecture Initialization failed. No initialization function found.\n"); |
|
|
|
exit(1); |
|
|
|
} |
|
|
|
} |
|
|
|
|
|
|
|
void gotoblas_dynamic_quit(void) { |
|
|
|
gotoblas = NULL; |
|
|
|
gotoblas = NULL; |
|
|
|
} |