|
- /**************************************************************************
- Copyright (c) 2013, The OpenBLAS Project
- All rights reserved.
- Redistribution and use in source and binary forms, with or without
- modification, are permitted provided that the following conditions are
- met:
- 1. Redistributions of source code must retain the above copyright
- notice, this list of conditions and the following disclaimer.
- 2. Redistributions in binary form must reproduce the above copyright
- notice, this list of conditions and the following disclaimer in
- the documentation and/or other materials provided with the
- distribution.
- 3. Neither the name of the OpenBLAS project nor the names of
- its contributors may be used to endorse or promote products
- derived from this software without specific prior written permission.
- THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
- AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
- IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
- ARE DISCLAIMED. IN NO EVENT SHALL THE OPENBLAS PROJECT OR CONTRIBUTORS BE
- LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
- DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
- SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
- CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
- OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE
- USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- *****************************************************************************/
-
#include <stdint.h>
#include <stdio.h>
#include <string.h>
#ifdef OS_DARWIN
#include <sys/sysctl.h>
int32_t value;
size_t length=sizeof(value);
#endif
-
/*
 * Core identifiers returned by detect().  Each value is also used as the
 * index into cpuname[] and cpuname_lower[], so the numbering must stay in
 * step with the order of those tables.
 */
#define CPU_UNKNOWN        0
#define CPU_ARMV8          1   /* generic ARMv8 */
#define CPU_CORTEXA53      2   /* Arm */
#define CPU_CORTEXA57      3   /* Arm */
#define CPU_CORTEXA72      4   /* Arm */
#define CPU_CORTEXA73      5   /* Arm */
#define CPU_FALKOR         6   /* Qualcomm */
#define CPU_THUNDERX       7   /* Cavium */
#define CPU_THUNDERX2T99   8   /* Cavium */
#define CPU_TSV110         9   /* HiSilicon */
#define CPU_EMAG8180      10   /* Ampere */
#define CPU_NEOVERSEN1    11   /* Arm */
#define CPU_THUNDERX3T110 12   /* Cavium */
#define CPU_VORTEX        13   /* Apple */
-
/*
 * Upper-case core names.  The position of each string is the numeric value
 * of the corresponding CPU_* identifier.
 */
static char *cpuname[] = {
    [0]  = "UNKNOWN",
    [1]  = "ARMV8",
    [2]  = "CORTEXA53",
    [3]  = "CORTEXA57",
    [4]  = "CORTEXA72",
    [5]  = "CORTEXA73",
    [6]  = "FALKOR",
    [7]  = "THUNDERX",
    [8]  = "THUNDERX2T99",
    [9]  = "TSV110",
    [10] = "EMAG8180",
    [11] = "NEOVERSEN1",
    [12] = "THUNDERX3T110",
    [13] = "VORTEX",
};
-
/*
 * Lower-case core names, laid out in the same order as cpuname[]: the
 * position of each string is the numeric value of its CPU_* identifier.
 */
static char *cpuname_lower[] = {
    [0]  = "unknown",
    [1]  = "armv8",
    [2]  = "cortexa53",
    [3]  = "cortexa57",
    [4]  = "cortexa72",
    [5]  = "cortexa73",
    [6]  = "falkor",
    [7]  = "thunderx",
    [8]  = "thunderx2t99",
    [9]  = "tsv110",
    [10] = "emag8180",
    [11] = "neoversen1",
    [12] = "thunderx3t110",
    [13] = "vortex",
};
-
/*
 * Report whether the "Features" line of /proc/cpuinfo lists a given flag.
 *
 * search: feature token to look for; it is compared as a whole token and
 *         case-sensitively.  A NULL pointer is treated as "not found".
 *
 * Returns 1 when the token is present, 0 otherwise.  0 is also returned on
 * non-Linux builds, when /proc/cpuinfo cannot be opened, and when no
 * "Features" line exists.
 */
int get_feature(char *search)
{
    if (search == NULL)
        return 0;

#ifdef __linux
    FILE *infile;
    char buffer[2048], *p, *t;

    p = NULL;

    infile = fopen("/proc/cpuinfo", "r");
    if (infile == NULL)
        return 0;

    while (fgets(buffer, sizeof(buffer), infile))
    {
        if (!strncmp("Features", buffer, 8))
        {
            /* Tokenizing starts right after the colon; the whitespace
               that follows it is consumed as a delimiter below. */
            p = strchr(buffer, ':');
            if (p != NULL)
                p++;
            break;
        }
    }

    fclose(infile);

    if (p == NULL)
        return 0;

    /* Visit every token, including the first one.  '\n' is a delimiter so
       that the last feature on the line can match as well. */
    for (t = strtok(p, " \t\n"); t != NULL; t = strtok(NULL, " \t\n"))
    {
        if (!strcmp(t, search))
            return 1;
    }
#endif

    return 0;
}
-
-
- int detect(void)
- {
-
- #ifdef __linux
-
- FILE *infile;
- char buffer[512], *p, *cpu_part = NULL, *cpu_implementer = NULL;
- p = (char *) NULL ;
-
- infile = fopen("/proc/cpuinfo", "r");
- while (fgets(buffer, sizeof(buffer), infile)) {
- if ((cpu_part != NULL) && (cpu_implementer != NULL)) {
- break;
- }
-
- if ((cpu_part == NULL) && !strncmp("CPU part", buffer, 8)) {
- cpu_part = strchr(buffer, ':') + 2;
- cpu_part = strdup(cpu_part);
- } else if ((cpu_implementer == NULL) && !strncmp("CPU implementer", buffer, 15)) {
- cpu_implementer = strchr(buffer, ':') + 2;
- cpu_implementer = strdup(cpu_implementer);
- }
- }
-
- fclose(infile);
- if(cpu_part != NULL && cpu_implementer != NULL) {
- // Arm
- if (strstr(cpu_implementer, "0x41")) {
- if (strstr(cpu_part, "0xd03"))
- return CPU_CORTEXA53;
- else if (strstr(cpu_part, "0xd07"))
- return CPU_CORTEXA57;
- else if (strstr(cpu_part, "0xd08"))
- return CPU_CORTEXA72;
- else if (strstr(cpu_part, "0xd09"))
- return CPU_CORTEXA73;
- else if (strstr(cpu_part, "0xd0c"))
- return CPU_NEOVERSEN1;
- }
- // Qualcomm
- else if (strstr(cpu_implementer, "0x51") && strstr(cpu_part, "0xc00"))
- return CPU_FALKOR;
- // Cavium
- else if (strstr(cpu_implementer, "0x43") && strstr(cpu_part, "0x0a1"))
- return CPU_THUNDERX;
- else if (strstr(cpu_implementer, "0x43") && strstr(cpu_part, "0x0af"))
- return CPU_THUNDERX2T99;
- else if (strstr(cpu_implementer, "0x43") && strstr(cpu_part, "0x0b8"))
- return CPU_THUNDERX3T110;
- // HiSilicon
- else if (strstr(cpu_implementer, "0x48") && strstr(cpu_part, "0xd01"))
- return CPU_TSV110;
- // Ampere
- else if (strstr(cpu_implementer, "0x50") && strstr(cpu_part, "0x000"))
- return CPU_EMAG8180;
- }
-
- p = (char *) NULL ;
- infile = fopen("/proc/cpuinfo", "r");
- while (fgets(buffer, sizeof(buffer), infile))
- {
-
- if ((!strncmp("model name", buffer, 10)) || (!strncmp("Processor", buffer, 9)) ||
- (!strncmp("CPU architecture", buffer, 16)))
- {
- p = strchr(buffer, ':') + 2;
- break;
- }
- }
-
- fclose(infile);
-
- if(p != NULL)
- {
-
- if ((strstr(p, "AArch64")) || (strstr(p, "8")))
- {
- return CPU_ARMV8;
-
- }
-
-
- }
- #else
- #ifdef DARWIN
- sysctlbyname("hw.cpufamily",&value,&length,NULL,0);
- if (value ==131287967) return CPU_VORTEX;
- #endif
- return CPU_ARMV8;
- #endif
-
- return CPU_UNKNOWN;
- }
-
- char *get_corename(void)
- {
- return cpuname[detect()];
- }
-
/* Write the architecture name "ARM64" to stdout, without a newline. */
void get_architecture(void)
{
    fputs("ARM64", stdout);
}
-
- void get_subarchitecture(void)
- {
- int d = detect();
- printf("%s", cpuname[d]);
- }
-
/* Write the sub-directory name "arm64" to stdout, without a newline. */
void get_subdirname(void)
{
    fputs("arm64", stdout);
}
-
/*
 * Print a "#define NUM_CORES <n>" line to stdout.
 *
 * Linux:  <n> is the number of /proc/cpuinfo lines that start with
 *         "processor".  Nothing is printed when the file cannot be opened.
 * DARWIN: <n> is whatever the hw.physicalcpu_max sysctl stores into the
 *         file-scope `value`.
 * Builds with neither macro defined print nothing.
 */
void get_cpucount(void)
{
#ifdef __linux
    FILE *infile;
    char buffer[2048];
    int n = 0;

    infile = fopen("/proc/cpuinfo", "r");
    if (infile != NULL)
    {
        while (fgets(buffer, sizeof(buffer), infile))
        {
            if (!strncmp("processor", buffer, 9))
                n++;
        }

        fclose(infile);

        printf("#define NUM_CORES %d\n",n);
    }
#endif
#ifdef DARWIN
    /* NOTE(review): `value`/`length` are declared under OS_DARWIN at the top
       of the file, but this branch is guarded by DARWIN - confirm that the
       build defines both. */
    sysctlbyname("hw.physicalcpu_max",&value,&length,NULL,0);
    printf("#define NUM_CORES %d\n",value);
#endif
}
-
-
-
- void get_cpuconfig(void)
- {
-
- // All arches should define ARMv8
- printf("#define ARMV8\n");
- printf("#define HAVE_NEON\n"); // This shouldn't be necessary
- printf("#define HAVE_VFPV4\n"); // This shouldn't be necessary
-
- int d = detect();
- switch (d)
- {
-
- case CPU_CORTEXA53:
- printf("#define %s\n", cpuname[d]);
- // Fall-through
- case CPU_ARMV8:
- // Minimum parameters for ARMv8 (based on A53)
- printf("#define L1_DATA_SIZE 32768\n");
- printf("#define L1_DATA_LINESIZE 64\n");
- printf("#define L2_SIZE 262144\n");
- printf("#define L2_LINESIZE 64\n");
- printf("#define DTB_DEFAULT_ENTRIES 64\n");
- printf("#define DTB_SIZE 4096\n");
- printf("#define L2_ASSOCIATIVE 4\n");
- break;
-
- case CPU_CORTEXA57:
- case CPU_CORTEXA72:
- case CPU_CORTEXA73:
- // Common minimum settings for these Arm cores
- // Can change a lot, but we need to be conservative
- // TODO: detect info from /sys if possible
- printf("#define %s\n", cpuname[d]);
- printf("#define L1_CODE_SIZE 49152\n");
- printf("#define L1_CODE_LINESIZE 64\n");
- printf("#define L1_CODE_ASSOCIATIVE 3\n");
- printf("#define L1_DATA_SIZE 32768\n");
- printf("#define L1_DATA_LINESIZE 64\n");
- printf("#define L1_DATA_ASSOCIATIVE 2\n");
- printf("#define L2_SIZE 524288\n");
- printf("#define L2_LINESIZE 64\n");
- printf("#define L2_ASSOCIATIVE 16\n");
- printf("#define DTB_DEFAULT_ENTRIES 64\n");
- printf("#define DTB_SIZE 4096\n");
- break;
- case CPU_NEOVERSEN1:
- printf("#define %s\n", cpuname[d]);
- printf("#define L1_CODE_SIZE 65536\n");
- printf("#define L1_CODE_LINESIZE 64\n");
- printf("#define L1_CODE_ASSOCIATIVE 4\n");
- printf("#define L1_DATA_SIZE 65536\n");
- printf("#define L1_DATA_LINESIZE 64\n");
- printf("#define L1_DATA_ASSOCIATIVE 4\n");
- printf("#define L2_SIZE 1048576\n");
- printf("#define L2_LINESIZE 64\n");
- printf("#define L2_ASSOCIATIVE 16\n");
- printf("#define DTB_DEFAULT_ENTRIES 64\n");
- printf("#define DTB_SIZE 4096\n");
- break;
-
- case CPU_FALKOR:
- printf("#define FALKOR\n");
- printf("#define L1_CODE_SIZE 65536\n");
- printf("#define L1_CODE_LINESIZE 64\n");
- printf("#define L1_DATA_SIZE 32768\n");
- printf("#define L1_DATA_LINESIZE 128\n");
- printf("#define L2_SIZE 524288\n");
- printf("#define L2_LINESIZE 64\n");
- printf("#define DTB_DEFAULT_ENTRIES 64\n");
- printf("#define DTB_SIZE 4096\n");
- printf("#define L2_ASSOCIATIVE 16\n");
- break;
-
- case CPU_THUNDERX:
- printf("#define THUNDERX\n");
- printf("#define L1_DATA_SIZE 32768\n");
- printf("#define L1_DATA_LINESIZE 128\n");
- printf("#define L2_SIZE 16777216\n");
- printf("#define L2_LINESIZE 128\n");
- printf("#define DTB_DEFAULT_ENTRIES 64\n");
- printf("#define DTB_SIZE 4096\n");
- printf("#define L2_ASSOCIATIVE 16\n");
- break;
-
- case CPU_THUNDERX2T99:
- printf("#define THUNDERX2T99 \n");
- printf("#define L1_CODE_SIZE 32768 \n");
- printf("#define L1_CODE_LINESIZE 64 \n");
- printf("#define L1_CODE_ASSOCIATIVE 8 \n");
- printf("#define L1_DATA_SIZE 32768 \n");
- printf("#define L1_DATA_LINESIZE 64 \n");
- printf("#define L1_DATA_ASSOCIATIVE 8 \n");
- printf("#define L2_SIZE 262144 \n");
- printf("#define L2_LINESIZE 64 \n");
- printf("#define L2_ASSOCIATIVE 8 \n");
- printf("#define L3_SIZE 33554432 \n");
- printf("#define L3_LINESIZE 64 \n");
- printf("#define L3_ASSOCIATIVE 32 \n");
- printf("#define DTB_DEFAULT_ENTRIES 64 \n");
- printf("#define DTB_SIZE 4096 \n");
- break;
-
- case CPU_TSV110:
- printf("#define TSV110 \n");
- printf("#define L1_CODE_SIZE 65536 \n");
- printf("#define L1_CODE_LINESIZE 64 \n");
- printf("#define L1_CODE_ASSOCIATIVE 4 \n");
- printf("#define L1_DATA_SIZE 65536 \n");
- printf("#define L1_DATA_LINESIZE 64 \n");
- printf("#define L1_DATA_ASSOCIATIVE 4 \n");
- printf("#define L2_SIZE 524228 \n");
- printf("#define L2_LINESIZE 64 \n");
- printf("#define L2_ASSOCIATIVE 8 \n");
- printf("#define DTB_DEFAULT_ENTRIES 64 \n");
- printf("#define DTB_SIZE 4096 \n");
- break;
-
- case CPU_EMAG8180:
- // Minimum parameters for ARMv8 (based on A53)
- printf("#define EMAG8180\n");
- printf("#define L1_CODE_SIZE 32768\n");
- printf("#define L1_DATA_SIZE 32768\n");
- printf("#define L1_DATA_LINESIZE 64\n");
- printf("#define L2_SIZE 262144\n");
- printf("#define L2_LINESIZE 64\n");
- printf("#define DTB_DEFAULT_ENTRIES 64\n");
- printf("#define DTB_SIZE 4096\n");
- break;
-
- case CPU_THUNDERX3T110:
- printf("#define THUNDERX3T110 \n");
- printf("#define L1_CODE_SIZE 65536 \n");
- printf("#define L1_CODE_LINESIZE 64 \n");
- printf("#define L1_CODE_ASSOCIATIVE 8 \n");
- printf("#define L1_DATA_SIZE 32768 \n");
- printf("#define L1_DATA_LINESIZE 64 \n");
- printf("#define L1_DATA_ASSOCIATIVE 8 \n");
- printf("#define L2_SIZE 524288 \n");
- printf("#define L2_LINESIZE 64 \n");
- printf("#define L2_ASSOCIATIVE 8 \n");
- printf("#define L3_SIZE 94371840 \n");
- printf("#define L3_LINESIZE 64 \n");
- printf("#define L3_ASSOCIATIVE 32 \n");
- printf("#define DTB_DEFAULT_ENTRIES 64 \n");
- printf("#define DTB_SIZE 4096 \n");
- break;
- #ifdef DARWIN
- case CPU_VORTEX:
- printf("#define VORTEX \n");
- sysctlbyname("hw.l1icachesize",&value,&length,NULL,0);
- printf("#define L1_CODE_SIZE %d \n",value);
- sysctlbyname("hw.cachelinesize",&value,&length,NULL,0);
- printf("#define L1_CODE_LINESIZE %d \n",value);
- sysctlbyname("hw.l1dcachesize",&value,&length,NULL,0);
- printf("#define L1_DATA_SIZE %d \n",value);
- sysctlbyname("hw.l2dcachesize",&value,&length,NULL,0);
- printf("#define L2_SIZE %d \n",value);
- break;
- #endif
- }
- get_cpucount();
- }
-
-
- void get_libname(void)
- {
- int d = detect();
- printf("%s", cpuname_lower[d]);
- }
-
/*
 * Walk the tokens of the "Features" line of /proc/cpuinfo.
 *
 * No feature is currently reported: the token loop has an empty body, so the
 * function produces no output.  It returns quietly on non-Linux builds, when
 * /proc/cpuinfo cannot be opened, and when no "Features" line exists.
 */
void get_features(void)
{

#ifdef __linux
    FILE *infile;
    char buffer[2048], *p, *t;

    p = NULL;

    infile = fopen("/proc/cpuinfo", "r");
    if (infile == NULL)
        return;

    while (fgets(buffer, sizeof(buffer), infile))
    {
        if (!strncmp("Features", buffer, 8))
        {
            /* Tokenizing starts right after the colon; the whitespace
               that follows it is consumed as a delimiter below. */
            p = strchr(buffer, ':');
            if (p != NULL)
                p++;
            break;
        }
    }

    fclose(infile);

    if (p == NULL)
        return;

    /* Every token is visited, starting with the first one. */
    for (t = strtok(p, " \t\n"); t != NULL; t = strtok(NULL, " \t\n"))
    {
        /* Placeholder: emit per-feature output here when needed. */
    }

#endif
    return;
}
|