484 lines
		
	
	
		
			13 KiB
		
	
	
	
		
			C
		
	
	
	
			
		
		
	
	
			484 lines
		
	
	
		
			13 KiB
		
	
	
	
		
			C
		
	
	
	
| /**************************************************************************
 | |
|   Copyright (c) 2013, The OpenBLAS Project
 | |
|   All rights reserved.
 | |
|   Redistribution and use in source and binary forms, with or without
 | |
|   modification, are permitted provided that the following conditions are
 | |
|   met:
 | |
|   1. Redistributions of source code must retain the above copyright
 | |
|   notice, this list of conditions and the following disclaimer.
 | |
|   2. Redistributions in binary form must reproduce the above copyright
 | |
|   notice, this list of conditions and the following disclaimer in
 | |
|   the documentation and/or other materials provided with the
 | |
|   distribution.
 | |
|   3. Neither the name of the OpenBLAS project nor the names of
 | |
|   its contributors may be used to endorse or promote products
 | |
|   derived from this software without specific prior written permission.
 | |
|   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 | |
|   AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 | |
|   IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 | |
|   ARE DISCLAIMED. IN NO EVENT SHALL THE OPENBLAS PROJECT OR CONTRIBUTORS BE
 | |
|   LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 | |
|   DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
 | |
|   SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
 | |
|   CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
 | |
|   OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE
 | |
|   USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 | |
|   *****************************************************************************/
 | |
| 
 | |
| #include <string.h>
 | |
#ifdef __APPLE__
#include <sys/sysctl.h>

/*
 * Scratch storage shared by the sysctlbyname() queries in this file.
 * Each length variable is handed to sysctlbyname() together with its
 * buffer, which is why it is a writable object rather than a constant.
 */
int32_t value;                        /* receives 32-bit query results */
size_t  length   = sizeof(value);     /* size paired with `value` */
int64_t value64;                      /* receives 64-bit query results */
size_t  length64 = sizeof(value64);   /* size paired with `value64` */
#endif
 | |
| 
 | |
/*
 * Core identifiers returned by detect(). Each value is also used as the
 * index of the matching name in cpuname[] and cpuname_lower[], so the
 * numbers must stay in sync with the order of those tables.
 */
#define CPU_UNKNOWN        0
#define CPU_ARMV8          1

/* Arm */
#define CPU_CORTEXA53      2
#define CPU_CORTEXA57      3
#define CPU_CORTEXA72      4
#define CPU_CORTEXA73      5
#define CPU_NEOVERSEN1     11
#define CPU_CORTEXA55      14

/* Qualcomm */
#define CPU_FALKOR         6

/* Cavium */
#define CPU_THUNDERX       7
#define CPU_THUNDERX2T99   8
#define CPU_THUNDERX3T110  12

/* HiSilicon */
#define CPU_TSV110         9

/* Ampere */
#define CPU_EMAG8180       10

/* Apple */
#define CPU_VORTEX         13
 | |
| 
 | |
/*
 * Upper-case core names, indexed by the CPU_* identifier that detect()
 * returns. The position of every entry must equal its CPU_* value.
 */
static char *cpuname[] = {
	"UNKNOWN",        /*  0 */
	"ARMV8",          /*  1 */
	"CORTEXA53",      /*  2 */
	"CORTEXA57",      /*  3 */
	"CORTEXA72",      /*  4 */
	"CORTEXA73",      /*  5 */
	"FALKOR",         /*  6 */
	"THUNDERX",       /*  7 */
	"THUNDERX2T99",   /*  8 */
	"TSV110",         /*  9 */
	"EMAG8180",       /* 10 */
	"NEOVERSEN1",     /* 11 */
	"THUNDERX3T110",  /* 12 */
	"VORTEX",         /* 13 */
	"CORTEXA55"       /* 14 */
};
 | |
| 
 | |
/*
 * Lower-case core names, indexed by the CPU_* identifier that detect()
 * returns. The position of every entry must equal its CPU_* value.
 */
static char *cpuname_lower[] = {
	"unknown",        /*  0 */
	"armv8",          /*  1 */
	"cortexa53",      /*  2 */
	"cortexa57",      /*  3 */
	"cortexa72",      /*  4 */
	"cortexa73",      /*  5 */
	"falkor",         /*  6 */
	"thunderx",       /*  7 */
	"thunderx2t99",   /*  8 */
	"tsv110",         /*  9 */
	"emag8180",       /* 10 */
	"neoversen1",     /* 11 */
	"thunderx3t110",  /* 12 */
	"vortex",         /* 13 */
	"cortexa55"       /* 14 */
};
 | |
| 
 | |
/*
 * Report whether the CPU lists a given feature flag.
 *
 * On Linux, the first line of /proc/cpuinfo that starts with "Features" is
 * split on whitespace and every entry is compared with `search`.
 *
 * search: feature name to look for; compared with strcmp(), so the match is
 *         exact and case-sensitive.
 *
 * Returns 1 when the feature is listed, 0 otherwise. 0 is also returned when
 * /proc/cpuinfo cannot be opened, when no "Features" line exists, when
 * `search` is NULL, and on non-Linux builds.
 */
int get_feature(char *search)
{

#ifdef __linux
	FILE *infile;
	char buffer[2048], *list = NULL, *tok;

	infile = fopen("/proc/cpuinfo", "r");
	if (infile == NULL) return 0;

	while (fgets(buffer, sizeof(buffer), infile))
	{
		if (!strncmp("Features", buffer, 8))
		{
			char *colon = strchr(buffer, ':');

			/* Start right after the ':'; blanks are skipped by strtok(). */
			if (colon != NULL) list = colon + 1;
			break;
		}
	}

	fclose(infile);

	if (list == NULL || search == NULL) return 0;

	/*
	 * Compare every token, including the first one, and treat the line
	 * terminator as a delimiter so the last entry is matched as well.
	 */
	for (tok = strtok(list, " \t\n"); tok != NULL; tok = strtok(NULL, " \t\n"))
	{
		if (!strcmp(tok, search)) return 1;
	}

#endif
	return 0;
}
 | |
| 
 | |
| 
 | |
| int detect(void)
 | |
| {
 | |
| 
 | |
| #ifdef __linux
 | |
| 
 | |
| 	FILE *infile;
 | |
| 	char buffer[512], *p, *cpu_part = NULL, *cpu_implementer = NULL;
 | |
| 	p = (char *) NULL ;
 | |
| 
 | |
| 	infile = fopen("/proc/cpuinfo", "r");
 | |
| 	while (fgets(buffer, sizeof(buffer), infile)) {
 | |
| 		if ((cpu_part != NULL) && (cpu_implementer != NULL)) {
 | |
| 			break;
 | |
| 		}
 | |
| 
 | |
| 		if ((cpu_part == NULL) && !strncmp("CPU part", buffer, 8)) {
 | |
| 			cpu_part = strchr(buffer, ':') + 2;
 | |
| 			cpu_part = strdup(cpu_part);
 | |
| 		} else if ((cpu_implementer == NULL) && !strncmp("CPU implementer", buffer, 15)) {
 | |
| 			cpu_implementer = strchr(buffer, ':') + 2;
 | |
| 			cpu_implementer = strdup(cpu_implementer);
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	fclose(infile);
 | |
| 	if(cpu_part != NULL && cpu_implementer != NULL) {
 | |
|     // Arm
 | |
|     if (strstr(cpu_implementer, "0x41")) {
 | |
|       if (strstr(cpu_part, "0xd03"))
 | |
|         return CPU_CORTEXA53;
 | |
|       else if (strstr(cpu_part, "0xd07"))
 | |
|         return CPU_CORTEXA57;
 | |
|       else if (strstr(cpu_part, "0xd08"))
 | |
|         return CPU_CORTEXA72;
 | |
|       else if (strstr(cpu_part, "0xd09"))
 | |
|         return CPU_CORTEXA73;
 | |
|       else if (strstr(cpu_part, "0xd0c"))
 | |
|         return CPU_NEOVERSEN1;
 | |
|       else if (strstr(cpu_part, "0xd05"))
 | |
| 	return CPU_CORTEXA55;
 | |
|     }
 | |
|     // Qualcomm
 | |
|     else if (strstr(cpu_implementer, "0x51") && strstr(cpu_part, "0xc00"))
 | |
|       return CPU_FALKOR;
 | |
|     // Cavium
 | |
|     else if (strstr(cpu_implementer, "0x43") && strstr(cpu_part, "0x0a1"))
 | |
| 			return CPU_THUNDERX;
 | |
|     else if (strstr(cpu_implementer, "0x43") && strstr(cpu_part, "0x0af"))
 | |
| 			return CPU_THUNDERX2T99;
 | |
|     else if (strstr(cpu_implementer, "0x43") && strstr(cpu_part, "0x0b8"))
 | |
| 			return CPU_THUNDERX3T110;
 | |
|     // HiSilicon
 | |
|     else if (strstr(cpu_implementer, "0x48") && strstr(cpu_part, "0xd01"))
 | |
|                         return CPU_TSV110;
 | |
|     // Ampere
 | |
|     else if (strstr(cpu_implementer, "0x50") && strstr(cpu_part, "0x000"))
 | |
|                         return CPU_EMAG8180;
 | |
| 	}
 | |
| 
 | |
| 	p = (char *) NULL ;
 | |
| 	infile = fopen("/proc/cpuinfo", "r");
 | |
| 	while (fgets(buffer, sizeof(buffer), infile))
 | |
| 	{
 | |
| 
 | |
| 		if ((!strncmp("model name", buffer, 10)) || (!strncmp("Processor", buffer, 9)) ||
 | |
| 		    (!strncmp("CPU architecture", buffer, 16)))
 | |
| 		{
 | |
| 			p = strchr(buffer, ':') + 2;
 | |
| 			break;
 | |
|       		}
 | |
|   	}
 | |
| 
 | |
|   	fclose(infile);
 | |
| 
 | |
|   	if(p != NULL)
 | |
| 	{
 | |
| 
 | |
| 		if ((strstr(p, "AArch64")) || (strstr(p, "8")))
 | |
| 		{
 | |
| 			return CPU_ARMV8;
 | |
| 
 | |
| 		}
 | |
| 
 | |
| 
 | |
| 	}
 | |
| #else
 | |
| #ifdef __APPLE__
 | |
| 	sysctlbyname("hw.cpufamily",&value,&length,NULL,0);
 | |
| 	if (value ==131287967|| value == 458787763 ) return CPU_VORTEX;
 | |
| #endif
 | |
| 	return CPU_ARMV8;	
 | |
| #endif
 | |
| 
 | |
| 	return CPU_UNKNOWN;
 | |
| }
 | |
| 
 | |
| char *get_corename(void)
 | |
| {
 | |
| 	return cpuname[detect()];
 | |
| }
 | |
| 
 | |
/* Write the architecture name "ARM64" to stdout (no trailing newline). */
void get_architecture(void)
{
	fputs("ARM64", stdout);
}
 | |
| 
 | |
| void get_subarchitecture(void)
 | |
| {
 | |
| 	int d = detect();
 | |
| 	printf("%s", cpuname[d]);
 | |
| }
 | |
| 
 | |
/* Write the sub-directory name "arm64" to stdout (no trailing newline). */
void get_subdirname(void)
{
	fputs("arm64", stdout);
}
 | |
| 
 | |
/*
 * Print a "#define NUM_CORES <n>" line to stdout.
 *
 * Linux: <n> is the number of lines in /proc/cpuinfo that start with
 * "processor". If the file cannot be opened the count stays 0 and the
 * define is still emitted, which matches the output produced when the file
 * contains no such line.
 *
 * Apple: <n> is the value reported by the "hw.physicalcpu_max" sysctl.
 *
 * On any other platform nothing is printed.
 */
void get_cpucount(void)
{
	int n = 0;

#ifdef __linux
	FILE *infile;
	char buffer[2048];

	infile = fopen("/proc/cpuinfo", "r");
	if (infile != NULL)
	{
		while (fgets(buffer, sizeof(buffer), infile))
		{
			if (!strncmp("processor", buffer, 9))
				n++;
		}

		fclose(infile);
	}

	printf("#define NUM_CORES %d\n",n);
#endif
#ifdef __APPLE__
	(void)n; /* the count comes from sysctl on this platform */
	sysctlbyname("hw.physicalcpu_max",&value,&length,NULL,0);
	printf("#define NUM_CORES %d\n",value);
#endif
}
 | |
| 
 | |
| 
 | |
| 
 | |
| void get_cpuconfig(void)
 | |
| {
 | |
| 
 | |
|   // All arches should define ARMv8
 | |
|   printf("#define ARMV8\n");
 | |
|   printf("#define HAVE_NEON\n"); // This shouldn't be necessary
 | |
|   printf("#define HAVE_VFPV4\n"); // This shouldn't be necessary
 | |
| 
 | |
| 	int d = detect();
 | |
| 	switch (d)
 | |
| 	{
 | |
| 
 | |
|     case CPU_CORTEXA53:
 | |
|     case CPU_CORTEXA55:			
 | |
|       printf("#define %s\n", cpuname[d]);
 | |
|       // Fall-through
 | |
| 		case CPU_ARMV8:
 | |
|       // Minimum parameters for ARMv8 (based on A53)
 | |
|     	printf("#define L1_DATA_SIZE 32768\n");
 | |
|     	printf("#define L1_DATA_LINESIZE 64\n");
 | |
|     	printf("#define L2_SIZE 262144\n");
 | |
|     	printf("#define L2_LINESIZE 64\n");
 | |
|     	printf("#define DTB_DEFAULT_ENTRIES 64\n");
 | |
|     	printf("#define DTB_SIZE 4096\n");
 | |
|     	printf("#define L2_ASSOCIATIVE 4\n");
 | |
| 			break;
 | |
| 
 | |
| 		case CPU_CORTEXA57:
 | |
| 		case CPU_CORTEXA72:
 | |
| 		case CPU_CORTEXA73:
 | |
|       // Common minimum settings for these Arm cores
 | |
|       // Can change a lot, but we need to be conservative
 | |
|       // TODO: detect info from /sys if possible
 | |
|       printf("#define %s\n", cpuname[d]);
 | |
| 			printf("#define L1_CODE_SIZE 49152\n");
 | |
| 			printf("#define L1_CODE_LINESIZE 64\n");
 | |
| 			printf("#define L1_CODE_ASSOCIATIVE 3\n");
 | |
| 			printf("#define L1_DATA_SIZE 32768\n");
 | |
| 			printf("#define L1_DATA_LINESIZE 64\n");
 | |
| 			printf("#define L1_DATA_ASSOCIATIVE 2\n");
 | |
|       printf("#define L2_SIZE 524288\n");
 | |
| 			printf("#define L2_LINESIZE 64\n");
 | |
| 			printf("#define L2_ASSOCIATIVE 16\n");
 | |
| 			printf("#define DTB_DEFAULT_ENTRIES 64\n");
 | |
| 			printf("#define DTB_SIZE 4096\n");
 | |
| 			break;
 | |
| 		case CPU_NEOVERSEN1:
 | |
| 			printf("#define %s\n", cpuname[d]);
 | |
| 			printf("#define L1_CODE_SIZE 65536\n");
 | |
| 			printf("#define L1_CODE_LINESIZE 64\n");
 | |
| 			printf("#define L1_CODE_ASSOCIATIVE 4\n");
 | |
| 			printf("#define L1_DATA_SIZE 65536\n");
 | |
| 			printf("#define L1_DATA_LINESIZE 64\n");
 | |
| 			printf("#define L1_DATA_ASSOCIATIVE 4\n");
 | |
| 			printf("#define L2_SIZE 1048576\n");
 | |
| 			printf("#define L2_LINESIZE 64\n");
 | |
| 			printf("#define L2_ASSOCIATIVE 16\n");
 | |
| 			printf("#define DTB_DEFAULT_ENTRIES 64\n");
 | |
| 			printf("#define DTB_SIZE 4096\n");
 | |
| 			break;
 | |
| 
 | |
|     case CPU_FALKOR:
 | |
|       printf("#define FALKOR\n");
 | |
|       printf("#define L1_CODE_SIZE 65536\n");
 | |
|       printf("#define L1_CODE_LINESIZE 64\n");
 | |
|       printf("#define L1_DATA_SIZE 32768\n");
 | |
|       printf("#define L1_DATA_LINESIZE 128\n");
 | |
|       printf("#define L2_SIZE 524288\n");
 | |
|       printf("#define L2_LINESIZE 64\n");
 | |
|       printf("#define DTB_DEFAULT_ENTRIES 64\n");
 | |
|       printf("#define DTB_SIZE 4096\n");
 | |
|       printf("#define L2_ASSOCIATIVE 16\n");
 | |
|       break;
 | |
| 
 | |
| 		case CPU_THUNDERX:
 | |
| 			printf("#define THUNDERX\n");
 | |
| 			printf("#define L1_DATA_SIZE 32768\n");
 | |
| 			printf("#define L1_DATA_LINESIZE 128\n");
 | |
| 			printf("#define L2_SIZE 16777216\n");
 | |
| 			printf("#define L2_LINESIZE 128\n");
 | |
| 			printf("#define DTB_DEFAULT_ENTRIES 64\n");
 | |
| 			printf("#define DTB_SIZE 4096\n");
 | |
| 			printf("#define L2_ASSOCIATIVE 16\n");
 | |
| 			break;
 | |
| 
 | |
| 		case CPU_THUNDERX2T99:
 | |
| 			printf("#define THUNDERX2T99                  \n");
 | |
| 			printf("#define L1_CODE_SIZE         32768    \n");
 | |
| 			printf("#define L1_CODE_LINESIZE     64       \n");
 | |
| 			printf("#define L1_CODE_ASSOCIATIVE  8        \n");
 | |
| 			printf("#define L1_DATA_SIZE         32768    \n");
 | |
| 			printf("#define L1_DATA_LINESIZE     64       \n");
 | |
| 			printf("#define L1_DATA_ASSOCIATIVE  8        \n");
 | |
| 			printf("#define L2_SIZE              262144   \n");
 | |
| 			printf("#define L2_LINESIZE          64       \n");
 | |
| 			printf("#define L2_ASSOCIATIVE       8        \n");
 | |
| 			printf("#define L3_SIZE              33554432 \n");
 | |
| 			printf("#define L3_LINESIZE          64       \n");
 | |
| 			printf("#define L3_ASSOCIATIVE       32       \n");
 | |
| 			printf("#define DTB_DEFAULT_ENTRIES  64       \n");
 | |
| 			printf("#define DTB_SIZE             4096     \n");
 | |
| 			break;
 | |
| 			
 | |
| 		case CPU_TSV110:
 | |
| 			printf("#define TSV110                        \n");
 | |
| 			printf("#define L1_CODE_SIZE         65536    \n");
 | |
| 			printf("#define L1_CODE_LINESIZE     64       \n");
 | |
| 			printf("#define L1_CODE_ASSOCIATIVE  4        \n");
 | |
| 			printf("#define L1_DATA_SIZE         65536    \n");
 | |
| 			printf("#define L1_DATA_LINESIZE     64       \n");
 | |
| 			printf("#define L1_DATA_ASSOCIATIVE  4        \n");
 | |
| 			printf("#define L2_SIZE              524228   \n");
 | |
| 			printf("#define L2_LINESIZE          64       \n");
 | |
| 			printf("#define L2_ASSOCIATIVE       8        \n");
 | |
| 			printf("#define DTB_DEFAULT_ENTRIES  64       \n");
 | |
| 			printf("#define DTB_SIZE             4096     \n");
 | |
| 			break;	
 | |
| 
 | |
| 		case CPU_EMAG8180:
 | |
|       // Minimum parameters for ARMv8 (based on A53)
 | |
| 	printf("#define EMAG8180\n");
 | |
|     	printf("#define L1_CODE_SIZE 32768\n");
 | |
|     	printf("#define L1_DATA_SIZE 32768\n");
 | |
|     	printf("#define L1_DATA_LINESIZE 64\n");
 | |
|     	printf("#define L2_SIZE 262144\n");
 | |
|     	printf("#define L2_LINESIZE 64\n");
 | |
|     	printf("#define DTB_DEFAULT_ENTRIES 64\n");
 | |
|     	printf("#define DTB_SIZE 4096\n");
 | |
| 			break;
 | |
| 
 | |
| 		case CPU_THUNDERX3T110:
 | |
| 			printf("#define THUNDERX3T110                 \n");
 | |
| 			printf("#define L1_CODE_SIZE         65536    \n");
 | |
| 			printf("#define L1_CODE_LINESIZE     64       \n");
 | |
| 			printf("#define L1_CODE_ASSOCIATIVE  8        \n");
 | |
| 			printf("#define L1_DATA_SIZE         32768    \n");
 | |
| 			printf("#define L1_DATA_LINESIZE     64       \n");
 | |
| 			printf("#define L1_DATA_ASSOCIATIVE  8        \n");
 | |
| 			printf("#define L2_SIZE              524288   \n");
 | |
| 			printf("#define L2_LINESIZE          64       \n");
 | |
| 			printf("#define L2_ASSOCIATIVE       8        \n");
 | |
| 			printf("#define L3_SIZE              94371840 \n");
 | |
| 			printf("#define L3_LINESIZE          64       \n");
 | |
| 			printf("#define L3_ASSOCIATIVE       32       \n");
 | |
| 			printf("#define DTB_DEFAULT_ENTRIES  64       \n");
 | |
| 			printf("#define DTB_SIZE             4096     \n");
 | |
| 			break;
 | |
| #ifdef __APPLE__
 | |
| 		case CPU_VORTEX:
 | |
| 			printf("#define VORTEX			      \n");
 | |
| 			sysctlbyname("hw.l1icachesize",&value64,&length64,NULL,0);
 | |
| 			printf("#define L1_CODE_SIZE	     %lld       \n",value64);
 | |
| 			sysctlbyname("hw.cachelinesize",&value64,&length64,NULL,0);
 | |
| 			printf("#define L1_CODE_LINESIZE     %lld       \n",value64);
 | |
| 			sysctlbyname("hw.l1dcachesize",&value64,&length64,NULL,0);
 | |
| 			printf("#define L1_DATA_SIZE	     %lld       \n",value64);
 | |
| 			sysctlbyname("hw.l2cachesize",&value64,&length64,NULL,0);
 | |
| 			printf("#define L2_SIZE	     %lld       \n",value64);
 | |
| 			printf("#define DTB_DEFAULT_ENTRIES  64       \n");
 | |
| 			printf("#define DTB_SIZE             4096     \n");
 | |
| 			break;
 | |
| #endif			
 | |
| 	}
 | |
| 	get_cpucount();
 | |
| }
 | |
| 
 | |
| 
 | |
| void get_libname(void)
 | |
| {
 | |
| 	int d = detect();
 | |
| 	printf("%s", cpuname_lower[d]);
 | |
| }
 | |
| 
 | |
/*
 * Walk the feature list of the CPU.
 *
 * On Linux, the first "Features" line of /proc/cpuinfo is located and split
 * into tokens. No token is acted upon, so the function prints nothing. It
 * returns quietly when the file cannot be opened or has no such line. On
 * other platforms it does nothing.
 */
void get_features(void)
{

#ifdef __linux
	FILE *infile;
	char buffer[2048], *list = NULL, *tok;

	infile = fopen("/proc/cpuinfo", "r");
	if (infile == NULL) return;

	while (fgets(buffer, sizeof(buffer), infile))
	{
		if (!strncmp("Features", buffer, 8))
		{
			char *colon = strchr(buffer, ':');

			/* Start right after the ':'; blanks are skipped by strtok(). */
			if (colon != NULL) list = colon + 1;
			break;
		}
	}

	fclose(infile);

	if (list == NULL) return;

	for (tok = strtok(list, " \t\n"); tok != NULL; tok = strtok(NULL, " \t\n"))
	{
		/* No feature is reported for this architecture at present. */
	}

#endif
	return;
}
 |