mirror of
https://github.com/Dr-Noob/cpufetch.git
synced 2026-03-25 07:50:40 +01:00
Compare commits
37 Commits
| Author | SHA1 | Date | |
|---|---|---|---|
|
|
fd2d1fc120 | ||
|
|
add4bd0a71 | ||
|
|
1e55713ebc | ||
|
|
128062a1dc | ||
|
|
321a1ec375 | ||
|
|
48c598cf3b | ||
|
|
aa94389bbe | ||
|
|
8d10a03adc | ||
|
|
2410fd16d3 | ||
|
|
f63178b41c | ||
|
|
2788e6831e | ||
|
|
146f2a13aa | ||
|
|
90624b9aaa | ||
|
|
e42f04cca8 | ||
|
|
3aacaf5f9e | ||
|
|
50f66ec571 | ||
|
|
cb186a2f97 | ||
|
|
6164884415 | ||
|
|
260f9ec3b8 | ||
|
|
79013d0ec9 | ||
|
|
e4227388b9 | ||
|
|
8fca4cb250 | ||
|
|
7c947bdf64 | ||
|
|
1ed3a0f2bf | ||
|
|
0fe6fc3f4d | ||
|
|
96c784026b | ||
|
|
59cd2dd128 | ||
|
|
da1981b97c | ||
|
|
8506c91e00 | ||
|
|
ece28cbdee | ||
|
|
7b46c78249 | ||
|
|
e0095c303d | ||
|
|
65378aaed9 | ||
|
|
946729dd06 | ||
|
|
9212f19de1 | ||
|
|
b019256515 | ||
|
|
d4cadbd807 |
44
Makefile
44
Makefile
@@ -13,17 +13,27 @@ COMMON_HDR = $(SRC_COMMON)ascii.h $(SRC_COMMON)cpu.h $(SRC_COMMON)udev.h $(SRC_C
|
|||||||
ifneq ($(OS),Windows_NT)
|
ifneq ($(OS),Windows_NT)
|
||||||
GIT_VERSION := "$(shell git describe --abbrev=4 --dirty --always --tags)"
|
GIT_VERSION := "$(shell git describe --abbrev=4 --dirty --always --tags)"
|
||||||
arch := $(shell uname -m)
|
arch := $(shell uname -m)
|
||||||
|
os := $(shell uname -s)
|
||||||
|
|
||||||
|
ifeq ($(os), Linux)
|
||||||
|
COMMON_SRC += $(SRC_COMMON)freq.c
|
||||||
|
COMMON_HDR += $(SRC_COMMON)freq.h
|
||||||
|
endif
|
||||||
|
|
||||||
ifeq ($(arch), $(filter $(arch), x86_64 amd64 i386 i486 i586 i686))
|
ifeq ($(arch), $(filter $(arch), x86_64 amd64 i386 i486 i586 i686))
|
||||||
SRC_DIR=src/x86/
|
SRC_DIR=src/x86/
|
||||||
SOURCE += $(COMMON_SRC) $(SRC_DIR)cpuid.c $(SRC_DIR)apic.c $(SRC_DIR)cpuid_asm.c $(SRC_DIR)uarch.c
|
SOURCE += $(COMMON_SRC) $(SRC_DIR)cpuid.c $(SRC_DIR)apic.c $(SRC_DIR)cpuid_asm.c $(SRC_DIR)uarch.c
|
||||||
HEADERS += $(COMMON_HDR) $(SRC_DIR)cpuid.h $(SRC_DIR)apic.h $(SRC_DIR)cpuid_asm.h $(SRC_DIR)uarch.h $(SRC_DIR)freq/freq.h
|
HEADERS += $(COMMON_HDR) $(SRC_DIR)cpuid.h $(SRC_DIR)apic.h $(SRC_DIR)cpuid_asm.h $(SRC_DIR)uarch.h $(SRC_DIR)freq/freq.h
|
||||||
|
|
||||||
os := $(shell uname -s)
|
ifeq ($(os), Linux)
|
||||||
ifeq ($(os), Linux)
|
|
||||||
SOURCE += $(SRC_DIR)freq/freq.c freq_nov.o freq_avx.o freq_avx512.o
|
SOURCE += $(SRC_DIR)freq/freq.c freq_nov.o freq_avx.o freq_avx512.o
|
||||||
HEADERS += $(SRC_DIR)freq/freq.h
|
HEADERS += $(SRC_DIR)freq/freq.h
|
||||||
CFLAGS += -pthread
|
CFLAGS += -pthread
|
||||||
endif
|
endif
|
||||||
|
ifeq ($(os), FreeBSD)
|
||||||
|
SOURCE += $(SRC_COMMON)sysctl.c
|
||||||
|
HEADERS += $(SRC_COMMON)sysctl.h
|
||||||
|
endif
|
||||||
CFLAGS += -DARCH_X86 -std=c99 -fstack-protector-all
|
CFLAGS += -DARCH_X86 -std=c99 -fstack-protector-all
|
||||||
else ifeq ($(arch), $(filter $(arch), ppc64le ppc64 ppcle ppc))
|
else ifeq ($(arch), $(filter $(arch), ppc64le ppc64 ppcle ppc))
|
||||||
SRC_DIR=src/ppc/
|
SRC_DIR=src/ppc/
|
||||||
@@ -32,20 +42,25 @@ ifneq ($(OS),Windows_NT)
|
|||||||
CFLAGS += -DARCH_PPC -std=gnu99 -fstack-protector-all -Wno-language-extension-token
|
CFLAGS += -DARCH_PPC -std=gnu99 -fstack-protector-all -Wno-language-extension-token
|
||||||
else ifeq ($(arch), $(filter $(arch), arm aarch64_be aarch64 arm64 armv8b armv8l armv7l armv6l))
|
else ifeq ($(arch), $(filter $(arch), arm aarch64_be aarch64 arm64 armv8b armv8l armv7l armv6l))
|
||||||
SRC_DIR=src/arm/
|
SRC_DIR=src/arm/
|
||||||
SOURCE += $(COMMON_SRC) $(SRC_DIR)midr.c $(SRC_DIR)uarch.c $(SRC_COMMON)soc.c $(SRC_DIR)soc.c $(SRC_COMMON)pci.c $(SRC_DIR)udev.c
|
SOURCE += $(COMMON_SRC) $(SRC_DIR)midr.c $(SRC_DIR)uarch.c $(SRC_COMMON)soc.c $(SRC_DIR)soc.c $(SRC_COMMON)pci.c $(SRC_DIR)udev.c sve.o
|
||||||
HEADERS += $(COMMON_HDR) $(SRC_DIR)midr.h $(SRC_DIR)uarch.h $(SRC_COMMON)soc.h $(SRC_DIR)soc.h $(SRC_COMMON)pci.h $(SRC_DIR)udev.c $(SRC_DIR)socs.h
|
HEADERS += $(COMMON_HDR) $(SRC_DIR)midr.h $(SRC_DIR)uarch.h $(SRC_COMMON)soc.h $(SRC_DIR)soc.h $(SRC_COMMON)pci.h $(SRC_DIR)udev.c $(SRC_DIR)socs.h
|
||||||
CFLAGS += -DARCH_ARM -Wno-unused-parameter -std=c99 -fstack-protector-all
|
CFLAGS += -DARCH_ARM -Wno-unused-parameter -std=c99 -fstack-protector-all
|
||||||
|
|
||||||
os := $(shell uname -s)
|
# Check if the compiler supports -march=armv8-a+sve. We will use it (if supported) to compile SVE detection code later
|
||||||
ifeq ($(os), Darwin)
|
is_sve_flag_supported := $(shell $(CC) -march=armv8-a+sve -c $(SRC_DIR)sve.c -o sve_test.o 2> /dev/null && echo 'yes'; rm -f sve_test.o)
|
||||||
SOURCE += $(SRC_DIR)sysctl.c
|
ifeq ($(is_sve_flag_supported), yes)
|
||||||
HEADERS += $(SRC_DIR)sysctl.h
|
SVE_FLAGS += -march=armv8-a+sve
|
||||||
endif
|
endif
|
||||||
else ifeq ($(arch), $(filter $(arch), riscv64 riscv32))
|
|
||||||
SRC_DIR=src/riscv/
|
ifeq ($(os), Darwin)
|
||||||
SOURCE += $(COMMON_SRC) $(SRC_DIR)riscv.c $(SRC_DIR)uarch.c $(SRC_COMMON)soc.c $(SRC_DIR)soc.c $(SRC_DIR)udev.c
|
SOURCE += $(SRC_COMMON)sysctl.c
|
||||||
HEADERS += $(COMMON_HDR) $(SRC_DIR)riscv.h $(SRC_DIR)uarch.h $(SRC_COMMON)soc.h $(SRC_DIR)soc.h $(SRC_DIR)udev.h $(SRC_DIR)socs.h
|
HEADERS += $(SRC_COMMON)sysctl.h
|
||||||
CFLAGS += -DARCH_RISCV -Wno-unused-parameter -std=c99 -fstack-protector-all
|
endif
|
||||||
|
else ifeq ($(arch), $(filter $(arch), riscv64 riscv32))
|
||||||
|
SRC_DIR=src/riscv/
|
||||||
|
SOURCE += $(COMMON_SRC) $(SRC_DIR)riscv.c $(SRC_DIR)uarch.c $(SRC_COMMON)soc.c $(SRC_DIR)soc.c $(SRC_DIR)udev.c
|
||||||
|
HEADERS += $(COMMON_HDR) $(SRC_DIR)riscv.h $(SRC_DIR)uarch.h $(SRC_COMMON)soc.h $(SRC_DIR)soc.h $(SRC_DIR)udev.h $(SRC_DIR)socs.h
|
||||||
|
CFLAGS += -DARCH_RISCV -Wno-unused-parameter -std=c99 -fstack-protector-all
|
||||||
else
|
else
|
||||||
# Error lines should not be tabulated because Makefile complains about it
|
# Error lines should not be tabulated because Makefile complains about it
|
||||||
$(warning Unsupported arch detected: $(arch). See https://github.com/Dr-Noob/cpufetch#1-support)
|
$(warning Unsupported arch detected: $(arch). See https://github.com/Dr-Noob/cpufetch#1-support)
|
||||||
@@ -86,6 +101,9 @@ freq_avx.o: Makefile $(SRC_DIR)freq/freq_avx.c $(SRC_DIR)freq/freq_avx.h $(SRC_D
|
|||||||
freq_avx512.o: Makefile $(SRC_DIR)freq/freq_avx512.c $(SRC_DIR)freq/freq_avx512.h $(SRC_DIR)freq/freq.h
|
freq_avx512.o: Makefile $(SRC_DIR)freq/freq_avx512.c $(SRC_DIR)freq/freq_avx512.h $(SRC_DIR)freq/freq.h
|
||||||
$(CC) $(CFLAGS) $(SANITY_FLAGS) -c -mavx512f -pthread $(SRC_DIR)freq/freq_avx512.c -o $@
|
$(CC) $(CFLAGS) $(SANITY_FLAGS) -c -mavx512f -pthread $(SRC_DIR)freq/freq_avx512.c -o $@
|
||||||
|
|
||||||
|
sve.o: Makefile $(SRC_DIR)sve.c $(SRC_DIR)sve.h
|
||||||
|
$(CC) $(CFLAGS) $(SANITY_FLAGS) $(SVE_FLAGS) -c $(SRC_DIR)sve.c -o $@
|
||||||
|
|
||||||
$(OUTPUT): Makefile $(SOURCE) $(HEADERS)
|
$(OUTPUT): Makefile $(SOURCE) $(HEADERS)
|
||||||
ifeq ($(GIT_VERSION),"")
|
ifeq ($(GIT_VERSION),"")
|
||||||
$(CC) $(CFLAGS) $(SANITY_FLAGS) $(SOURCE) -o $(OUTPUT)
|
$(CC) $(CFLAGS) $(SANITY_FLAGS) $(SOURCE) -o $(OUTPUT)
|
||||||
|
|||||||
@@ -45,6 +45,7 @@ cpufetch is a command-line tool written in C that displays the CPU information i
|
|||||||
- [3.1 x86_64](#31-x86_64)
|
- [3.1 x86_64](#31-x86_64)
|
||||||
- [3.2 ARM](#32-arm)
|
- [3.2 ARM](#32-arm)
|
||||||
- [3.3 PowerPC](#33-powerpc)
|
- [3.3 PowerPC](#33-powerpc)
|
||||||
|
- [3.4 RISC-V](#34-risc-v)
|
||||||
- [4. Colors](#4-colors)
|
- [4. Colors](#4-colors)
|
||||||
- [4.1 Specifying a name](#41-specifying-a-name)
|
- [4.1 Specifying a name](#41-specifying-a-name)
|
||||||
- [4.2 Specifying the colors in RGB format](#42-specifying-the-colors-in-rgb-format)
|
- [4.2 Specifying the colors in RGB format](#42-specifying-the-colors-in-rgb-format)
|
||||||
@@ -120,6 +121,11 @@ make
|
|||||||
<p align="center"><img width=90% src="pictures/ibm.png"></p>
|
<p align="center"><img width=90% src="pictures/ibm.png"></p>
|
||||||
<p align="center">Talos II</p>
|
<p align="center">Talos II</p>
|
||||||
|
|
||||||
|
## 3.4 RISC-V
|
||||||
|
|
||||||
|
<p align="center"><img width=80% src="pictures/starfive.png"></p>
|
||||||
|
<p align="center">StarFive VisionFive 2</p>
|
||||||
|
|
||||||
## 4. Colors
|
## 4. Colors
|
||||||
By default, `cpufetch` will print the CPU logo with the system colorscheme. However, you can set a custom color scheme in two different ways:
|
By default, `cpufetch` will print the CPU logo with the system colorscheme. However, you can set a custom color scheme in two different ways:
|
||||||
|
|
||||||
@@ -175,6 +181,7 @@ Thanks to the fellow contributors and interested people in the project. Special
|
|||||||
- [mdoksa76](https://github.com/mdoksa76) and [exkc](https://github.com/exkc): Excellent ideas and feedback for supporting Allwinner SoCs.
|
- [mdoksa76](https://github.com/mdoksa76) and [exkc](https://github.com/exkc): Excellent ideas and feedback for supporting Allwinner SoCs.
|
||||||
- [Sakura286](https://github.com/Sakura286), [exkc](https://github.com/exkc) and [Patola](https://github.com/Patola): Helped with RISC-V port with ssh access, ideas, testing, etc.
|
- [Sakura286](https://github.com/Sakura286), [exkc](https://github.com/exkc) and [Patola](https://github.com/Patola): Helped with RISC-V port with ssh access, ideas, testing, etc.
|
||||||
- [ThomasKaiser](https://github.com/ThomasKaiser): Very valuable feedback on improving ARM SoC detection (Apple, Allwinner, Rockchip).
|
- [ThomasKaiser](https://github.com/ThomasKaiser): Very valuable feedback on improving ARM SoC detection (Apple, Allwinner, Rockchip).
|
||||||
|
- [zerkerX](https://github.com/zerkerX): Helped with feedback for supporting old (e.g., Pentium III) Intel CPUs.
|
||||||
|
|
||||||
## 8. cpufetch for GPUs (gpufetch)
|
## 8. cpufetch for GPUs (gpufetch)
|
||||||
See [gpufetch](https://github.com/Dr-Noob/gpufetch) project!
|
See [gpufetch](https://github.com/Dr-Noob/gpufetch) project!
|
||||||
|
|||||||
BIN
pictures/starfive.png
Normal file
BIN
pictures/starfive.png
Normal file
Binary file not shown.
|
After Width: | Height: | Size: 42 KiB |
@@ -8,15 +8,18 @@
|
|||||||
#ifdef __linux__
|
#ifdef __linux__
|
||||||
#include <sys/auxv.h>
|
#include <sys/auxv.h>
|
||||||
#include <asm/hwcap.h>
|
#include <asm/hwcap.h>
|
||||||
|
#include "../common/freq.h"
|
||||||
#elif defined __APPLE__ || __MACH__
|
#elif defined __APPLE__ || __MACH__
|
||||||
#include "sysctl.h"
|
#include "../common/sysctl.h"
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
#include "../common/global.h"
|
#include "../common/global.h"
|
||||||
#include "../common/soc.h"
|
#include "../common/soc.h"
|
||||||
|
#include "../common/args.h"
|
||||||
#include "udev.h"
|
#include "udev.h"
|
||||||
#include "midr.h"
|
#include "midr.h"
|
||||||
#include "uarch.h"
|
#include "uarch.h"
|
||||||
|
#include "sve.h"
|
||||||
|
|
||||||
bool cores_are_equal(int c1pos, int c2pos, uint32_t* midr_array, int32_t* freq_array) {
|
bool cores_are_equal(int c1pos, int c2pos, uint32_t* midr_array, int32_t* freq_array) {
|
||||||
return midr_array[c1pos] == midr_array[c2pos] && freq_array[c1pos] == freq_array[c2pos];
|
return midr_array[c1pos] == midr_array[c2pos] && freq_array[c1pos] == freq_array[c2pos];
|
||||||
@@ -39,8 +42,17 @@ struct cache* get_cache_info(struct cpuInfo* cpu) {
|
|||||||
struct frequency* get_frequency_info(uint32_t core) {
|
struct frequency* get_frequency_info(uint32_t core) {
|
||||||
struct frequency* freq = emalloc(sizeof(struct frequency));
|
struct frequency* freq = emalloc(sizeof(struct frequency));
|
||||||
|
|
||||||
|
freq->measured = false;
|
||||||
freq->base = UNKNOWN_DATA;
|
freq->base = UNKNOWN_DATA;
|
||||||
freq->max = get_max_freq_from_file(core);
|
freq->max = get_max_freq_from_file(core);
|
||||||
|
#ifdef __linux__
|
||||||
|
if (freq->max == UNKNOWN_DATA || measure_max_frequency_flag()) {
|
||||||
|
if (freq->max == UNKNOWN_DATA)
|
||||||
|
printWarn("Unable to find max frequency from udev, measuring CPU frequency");
|
||||||
|
freq->max = measure_max_frequency(core);
|
||||||
|
freq->measured = true;
|
||||||
|
}
|
||||||
|
#endif
|
||||||
|
|
||||||
return freq;
|
return freq;
|
||||||
}
|
}
|
||||||
@@ -157,6 +169,15 @@ struct features* get_features_info(void) {
|
|||||||
feat->SHA1 = hwcaps & HWCAP_SHA1;
|
feat->SHA1 = hwcaps & HWCAP_SHA1;
|
||||||
feat->SHA2 = hwcaps & HWCAP_SHA2;
|
feat->SHA2 = hwcaps & HWCAP_SHA2;
|
||||||
feat->NEON = hwcaps & HWCAP_ASIMD;
|
feat->NEON = hwcaps & HWCAP_ASIMD;
|
||||||
|
feat->SVE = hwcaps & HWCAP_SVE;
|
||||||
|
|
||||||
|
hwcaps = getauxval(AT_HWCAP2);
|
||||||
|
if (errno == ENOENT) {
|
||||||
|
printWarn("Unable to retrieve AT_HWCAP2 using getauxval");
|
||||||
|
}
|
||||||
|
else {
|
||||||
|
feat->SVE2 = hwcaps & HWCAP2_SVE2;
|
||||||
|
}
|
||||||
}
|
}
|
||||||
#else
|
#else
|
||||||
else {
|
else {
|
||||||
@@ -172,6 +193,8 @@ struct features* get_features_info(void) {
|
|||||||
feat->CRC32 = hwcaps & HWCAP2_CRC32;
|
feat->CRC32 = hwcaps & HWCAP2_CRC32;
|
||||||
feat->SHA1 = hwcaps & HWCAP2_SHA1;
|
feat->SHA1 = hwcaps & HWCAP2_SHA1;
|
||||||
feat->SHA2 = hwcaps & HWCAP2_SHA2;
|
feat->SHA2 = hwcaps & HWCAP2_SHA2;
|
||||||
|
feat->SVE = false;
|
||||||
|
feat->SVE2 = false;
|
||||||
}
|
}
|
||||||
#endif // ifdef __aarch64__
|
#endif // ifdef __aarch64__
|
||||||
#elif defined __APPLE__ || __MACH__
|
#elif defined __APPLE__ || __MACH__
|
||||||
@@ -181,8 +204,14 @@ struct features* get_features_info(void) {
|
|||||||
feat->SHA1 = true;
|
feat->SHA1 = true;
|
||||||
feat->SHA2 = true;
|
feat->SHA2 = true;
|
||||||
feat->NEON = true;
|
feat->NEON = true;
|
||||||
|
feat->SVE = false;
|
||||||
|
feat->SVE2 = false;
|
||||||
#endif // ifdef __linux__
|
#endif // ifdef __linux__
|
||||||
|
|
||||||
|
if (feat->SVE || feat->SVE2) {
|
||||||
|
feat->cntb = sve_cntb();
|
||||||
|
}
|
||||||
|
|
||||||
return feat;
|
return feat;
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -419,7 +448,7 @@ char* get_str_topology(struct cpuInfo* cpu, struct topology* topo, bool dual_soc
|
|||||||
|
|
||||||
char* get_str_features(struct cpuInfo* cpu) {
|
char* get_str_features(struct cpuInfo* cpu) {
|
||||||
struct features* feat = cpu->feat;
|
struct features* feat = cpu->feat;
|
||||||
uint32_t max_len = strlen("NEON,SHA1,SHA2,AES,CRC32,") + 1;
|
uint32_t max_len = strlen("NEON,SHA1,SHA2,AES,CRC32,SVE,SVE2,") + 1;
|
||||||
uint32_t len = 0;
|
uint32_t len = 0;
|
||||||
char* string = ecalloc(max_len, sizeof(char));
|
char* string = ecalloc(max_len, sizeof(char));
|
||||||
|
|
||||||
@@ -427,6 +456,14 @@ char* get_str_features(struct cpuInfo* cpu) {
|
|||||||
strcat(string, "NEON,");
|
strcat(string, "NEON,");
|
||||||
len += 5;
|
len += 5;
|
||||||
}
|
}
|
||||||
|
if(feat->SVE) {
|
||||||
|
strcat(string, "SVE,");
|
||||||
|
len += 4;
|
||||||
|
}
|
||||||
|
if(feat->SVE2) {
|
||||||
|
strcat(string, "SVE2,");
|
||||||
|
len += 5;
|
||||||
|
}
|
||||||
if(feat->SHA1) {
|
if(feat->SHA1) {
|
||||||
strcat(string, "SHA1,");
|
strcat(string, "SHA1,");
|
||||||
len += 5;
|
len += 5;
|
||||||
@@ -476,6 +513,10 @@ void print_debug(struct cpuInfo* cpu) {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
if (cpu->feat->SVE || cpu->feat->SVE2) {
|
||||||
|
printf("- cntb: %d\n", (int) cpu->feat->cntb);
|
||||||
|
}
|
||||||
|
|
||||||
#if defined(__APPLE__) || defined(__MACH__)
|
#if defined(__APPLE__) || defined(__MACH__)
|
||||||
printf("hw.cpufamily: 0x%.8X\n", get_sys_info_by_name("hw.cpufamily"));
|
printf("hw.cpufamily: 0x%.8X\n", get_sys_info_by_name("hw.cpufamily"));
|
||||||
printf("hw.cpusubfamily: 0x%.8X\n", get_sys_info_by_name("hw.cpusubfamily"));
|
printf("hw.cpusubfamily: 0x%.8X\n", get_sys_info_by_name("hw.cpusubfamily"));
|
||||||
|
|||||||
152
src/arm/soc.c
152
src/arm/soc.c
@@ -11,7 +11,7 @@
|
|||||||
#include "../common/pci.h"
|
#include "../common/pci.h"
|
||||||
|
|
||||||
#if defined(__APPLE__) || defined(__MACH__)
|
#if defined(__APPLE__) || defined(__MACH__)
|
||||||
#include "sysctl.h"
|
#include "../common/sysctl.h"
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
#define NA -1
|
#define NA -1
|
||||||
@@ -167,11 +167,13 @@ bool match_google(char* soc_name, struct system_on_chip* soc) {
|
|||||||
|
|
||||||
// https://www.techinsights.com/
|
// https://www.techinsights.com/
|
||||||
// https://datasheetspdf.com/pdf-file/1316605/HiSilicon/Hi3660/1
|
// https://datasheetspdf.com/pdf-file/1316605/HiSilicon/Hi3660/1
|
||||||
|
// https://github.com/Dr-Noob/cpufetch/issues/259
|
||||||
bool match_hisilicon(char* soc_name, struct system_on_chip* soc) {
|
bool match_hisilicon(char* soc_name, struct system_on_chip* soc) {
|
||||||
char* tmp;
|
char* tmp;
|
||||||
|
|
||||||
if((tmp = strstr(soc_name, "hi")) == NULL)
|
if((tmp = strstr(soc_name, "hi")) != NULL);
|
||||||
return false;
|
else if((tmp = strstr(soc_name, "kirin")) != NULL);
|
||||||
|
else return false;
|
||||||
|
|
||||||
soc->soc_vendor = SOC_VENDOR_KIRIN;
|
soc->soc_vendor = SOC_VENDOR_KIRIN;
|
||||||
|
|
||||||
@@ -204,6 +206,7 @@ bool match_hisilicon(char* soc_name, struct system_on_chip* soc) {
|
|||||||
SOC_EQ(tmp, "hi3680", "980", SOC_HISILICON_3680, soc, 7)
|
SOC_EQ(tmp, "hi3680", "980", SOC_HISILICON_3680, soc, 7)
|
||||||
//SOC_EQ(tmp, "?", "985", SOC_KIRIN, soc, 7)
|
//SOC_EQ(tmp, "?", "985", SOC_KIRIN, soc, 7)
|
||||||
SOC_EQ(tmp, "hi3690", "990", SOC_HISILICON_3690, soc, 7)
|
SOC_EQ(tmp, "hi3690", "990", SOC_HISILICON_3690, soc, 7)
|
||||||
|
SOC_EQ(tmp, "kirin9000s", "9000s", SOC_HISILICON_9000S,soc, 7)
|
||||||
SOC_END
|
SOC_END
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -421,6 +424,9 @@ bool match_mediatek(char* soc_name, struct system_on_chip* soc) {
|
|||||||
}
|
}
|
||||||
|
|
||||||
/*
|
/*
|
||||||
|
* Good sources:
|
||||||
|
* https://www.geektopia.es/es/products/company/qualcomm/socs/
|
||||||
|
*
|
||||||
* APQ: Application Processor Qualcomm
|
* APQ: Application Processor Qualcomm
|
||||||
* MSM: Mobile Station Modem
|
* MSM: Mobile Station Modem
|
||||||
* In a APQXXXX or MSMXXXX, the second digit represents:
|
* In a APQXXXX or MSMXXXX, the second digit represents:
|
||||||
@@ -578,6 +584,25 @@ bool match_qualcomm(char* soc_name, struct system_on_chip* soc) {
|
|||||||
SOC_EQ(tmp, "SM8250-AB", "865+", SOC_SNAPD_SM8250_AB, soc, 7)
|
SOC_EQ(tmp, "SM8250-AB", "865+", SOC_SNAPD_SM8250_AB, soc, 7)
|
||||||
SOC_EQ(tmp, "SM8350", "888", SOC_SNAPD_SM8350, soc, 5)
|
SOC_EQ(tmp, "SM8350", "888", SOC_SNAPD_SM8350, soc, 5)
|
||||||
SOC_EQ(tmp, "SM8350-AC", "888+", SOC_SNAPD_SM8350, soc, 5)
|
SOC_EQ(tmp, "SM8350-AC", "888+", SOC_SNAPD_SM8350, soc, 5)
|
||||||
|
// Snapdragon Gen 4 //
|
||||||
|
SOC_EQ(tmp, "SM4375", "4 Gen 1", SOC_SNAPD_SM4375, soc, 6)
|
||||||
|
SOC_EQ(tmp, "SM4450", "4 Gen 2", SOC_SNAPD_SM4450, soc, 4)
|
||||||
|
SOC_EQ(tmp, "SM4635", "4s Gen 2", SOC_SNAPD_SM4635, soc, 4)
|
||||||
|
// Snapdragon Gen 6 //
|
||||||
|
SOC_EQ(tmp, "SM6375-AC", "6s Gen 3", SOC_SNAPD_SM6375_AC, soc, 6)
|
||||||
|
SOC_EQ(tmp, "SM6450", "6 Gen 1", SOC_SNAPD_SM6450, soc, 4)
|
||||||
|
// Snapdragon Gen 7 //
|
||||||
|
SOC_EQ(tmp, "SM7435-AB", "7s Gen 2", SOC_SNAPD_SM7435_AB, soc, 4)
|
||||||
|
SOC_EQ(tmp, "SM7450", "7 Gen 1", SOC_SNAPD_SM7450, soc, 4)
|
||||||
|
SOC_EQ(tmp, "SM7475", "7+ Gen 2", SOC_SNAPD_SM7475, soc, 4)
|
||||||
|
SOC_EQ(tmp, "SM7550-AB", "7 Gen 3", SOC_SNAPD_SM7550_AB, soc, 4)
|
||||||
|
SOC_EQ(tmp, "SM7675-AB", "7+ Gen 3", SOC_SNAPD_SM7675_AB, soc, 4)
|
||||||
|
// Snapdragon Gen 8 //
|
||||||
|
SOC_EQ(tmp, "SM8450", "8 Gen 1", SOC_SNAPD_SM8450, soc, 4)
|
||||||
|
SOC_EQ(tmp, "SM8475", "8+ Gen 1", SOC_SNAPD_SM8475, soc, 4)
|
||||||
|
SOC_EQ(tmp, "SM8550-AB", "8 Gen 2", SOC_SNAPD_SM8550_AB, soc, 4)
|
||||||
|
SOC_EQ(tmp, "SM8635", "8s Gen 3", SOC_SNAPD_SM8635, soc, 4)
|
||||||
|
SOC_EQ(tmp, "SM8650-AB", "8 Gen 3", SOC_SNAPD_SM8650_AB, soc, 4)
|
||||||
SOC_END
|
SOC_END
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -624,12 +649,37 @@ bool match_special(char* soc_name, struct system_on_chip* soc) {
|
|||||||
return true;
|
return true;
|
||||||
}
|
}
|
||||||
|
|
||||||
// Snapdragon 8 Gen 1 reported as "taro"
|
// New Snapdragon SoCs codenames
|
||||||
|
// https://github.com/sm8450-mainline/fdt?tab=readme-ov-file#chipsets
|
||||||
|
// https://github.com/Dr-Noob/cpufetch/issues/253
|
||||||
|
if (strcmp(soc_name, "cape") == 0) {
|
||||||
|
fill_soc(soc, "8+ Gen 1", SOC_SNAPD_SM8475, 4);
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
|
||||||
if(strcmp(soc_name, "taro") == 0) {
|
if(strcmp(soc_name, "taro") == 0) {
|
||||||
fill_soc(soc, "8 Gen 1", SOC_SNAPD_SM8450, 4);
|
fill_soc(soc, "8 Gen 1", SOC_SNAPD_SM8450, 4);
|
||||||
return true;
|
return true;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
if(strcmp(soc_name, "ukee") == 0) {
|
||||||
|
fill_soc(soc, "7+ Gen 2", SOC_SNAPD_SM7475, 4);
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
|
||||||
|
if(strcmp(soc_name, "diwali") == 0) {
|
||||||
|
fill_soc(soc, "7 Gen 1", SOC_SNAPD_SM7450, 4);
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
|
||||||
|
// parrot can be either SM7435 or SM6450, we need more data
|
||||||
|
// to distingish between those two
|
||||||
|
|
||||||
|
if(strcmp(soc_name, "ravelin") == 0) {
|
||||||
|
fill_soc(soc, "4 Gen 2", SOC_SNAPD_SM4450, 4);
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
|
||||||
// Google Pixel 6
|
// Google Pixel 6
|
||||||
// https://github.com/Dr-Noob/cpufetch/issues/134
|
// https://github.com/Dr-Noob/cpufetch/issues/134
|
||||||
if(strcmp(soc_name, "oriole") == 0) {
|
if(strcmp(soc_name, "oriole") == 0) {
|
||||||
@@ -702,6 +752,16 @@ struct system_on_chip* guess_soc_from_android(struct system_on_chip* soc) {
|
|||||||
else return soc;
|
else return soc;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// https://github.com/Dr-Noob/cpufetch/issues/253
|
||||||
|
// ro.soc.model might be more reliable than ro.product.board or
|
||||||
|
// ro.board.platform, so try with it first
|
||||||
|
property_len = android_property_get("ro.soc.model", (char *) &tmp);
|
||||||
|
if(property_len > 0) {
|
||||||
|
try_parse_soc_from_string(soc, property_len, tmp);
|
||||||
|
if(soc->soc_vendor == SOC_VENDOR_UNKNOWN) printWarn("SoC detection failed using Android property ro.soc.model: %s", tmp);
|
||||||
|
else return soc;
|
||||||
|
}
|
||||||
|
|
||||||
property_len = android_property_get("ro.product.board", (char *) &tmp);
|
property_len = android_property_get("ro.product.board", (char *) &tmp);
|
||||||
if(property_len > 0) {
|
if(property_len > 0) {
|
||||||
try_parse_soc_from_string(soc, property_len, tmp);
|
try_parse_soc_from_string(soc, property_len, tmp);
|
||||||
@@ -835,6 +895,79 @@ struct system_on_chip* guess_soc_from_uarch(struct system_on_chip* soc, struct c
|
|||||||
return soc;
|
return soc;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// Return the dt string without the NULL characters.
|
||||||
|
char* get_dt_str(char* dt, int filelen) {
|
||||||
|
char* dt_without_null = (char *) malloc(sizeof(char) * filelen);
|
||||||
|
memcpy(dt_without_null, dt, filelen);
|
||||||
|
|
||||||
|
for (int i=0; i < filelen-1; i++) {
|
||||||
|
if (dt_without_null[i] == '\0')
|
||||||
|
dt_without_null[i] = ',';
|
||||||
|
}
|
||||||
|
return dt_without_null;
|
||||||
|
}
|
||||||
|
|
||||||
|
bool match_dt(struct system_on_chip* soc, char* dt, int filelen, char* expected_name, char* soc_name, SOC soc_model, int32_t process) {
|
||||||
|
// The /proc/device-tree/compatible file (passed by dt) uses NULL
|
||||||
|
// to separate the strings, so we need to make an special case here
|
||||||
|
// and iterate over the NULL characters, thus iterating over each
|
||||||
|
// individual compatible strings.
|
||||||
|
|
||||||
|
if (strstr(dt, expected_name) != NULL) {
|
||||||
|
fill_soc(soc, soc_name, soc_model, process);
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
|
||||||
|
char *compatible = dt;
|
||||||
|
char *end_of_dt = dt + filelen;
|
||||||
|
|
||||||
|
while ((compatible = strchr(compatible, '\0')) != end_of_dt) {
|
||||||
|
compatible++;
|
||||||
|
if (strstr(compatible, expected_name) != NULL) {
|
||||||
|
fill_soc(soc, soc_name, soc_model, process);
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
|
#define DT_START if (false) {}
|
||||||
|
#define DT_EQ(dt, filelen, soc, expected_name, soc_name, soc_model, process) \
|
||||||
|
else if (match_dt(soc, dt, filelen, expected_name, soc_name, soc_model, process)) return soc;
|
||||||
|
#define DT_END(dt, filelen) else { printWarn("guess_soc_from_devtree: No match found for '%s'", get_dt_str(dt, filelen)); return soc; }
|
||||||
|
|
||||||
|
// TODO: Move this to doc
|
||||||
|
// The number of fields seems non-standard, so for now it seems wiser
|
||||||
|
// to just get the entire string with all fields and just look for the
|
||||||
|
// substring.
|
||||||
|
// TODO: Implement this by going trough NULL-separated fields rather than
|
||||||
|
// using strstr.
|
||||||
|
struct system_on_chip* guess_soc_from_devtree(struct system_on_chip* soc) {
|
||||||
|
int len;
|
||||||
|
char* dt = get_devtree_compatible(&len);
|
||||||
|
if (dt == NULL) {
|
||||||
|
return soc;
|
||||||
|
}
|
||||||
|
|
||||||
|
// The following are internal codenames of Asahi Linux
|
||||||
|
// https://github.com/AsahiLinux/docs/wiki/Codenames
|
||||||
|
DT_START
|
||||||
|
DT_EQ(dt, len, soc, "apple,t8103", "M1", SOC_APPLE_M1, 5)
|
||||||
|
DT_EQ(dt, len, soc, "apple,t6000", "M1 Pro", SOC_APPLE_M1_PRO, 5)
|
||||||
|
DT_EQ(dt, len, soc, "apple,t6001", "M1 Max", SOC_APPLE_M1_MAX, 5)
|
||||||
|
DT_EQ(dt, len, soc, "apple,t6002", "M1 Ultra", SOC_APPLE_M1_ULTRA, 5)
|
||||||
|
DT_EQ(dt, len, soc, "apple,t8112", "M2", SOC_APPLE_M2, 5)
|
||||||
|
DT_EQ(dt, len, soc, "apple,t6020", "M2 Pro", SOC_APPLE_M2_PRO, 5)
|
||||||
|
DT_EQ(dt, len, soc, "apple,t6021", "M2 Max", SOC_APPLE_M2_MAX, 5)
|
||||||
|
DT_EQ(dt, len, soc, "apple,t6022", "M2 Ultra", SOC_APPLE_M2_ULTRA, 5)
|
||||||
|
DT_EQ(dt, len, soc, "apple,t8122", "M3", SOC_APPLE_M3, 3)
|
||||||
|
DT_EQ(dt, len, soc, "apple,t6030", "M3 Pro", SOC_APPLE_M3_PRO, 3)
|
||||||
|
DT_EQ(dt, len, soc, "apple,t6031", "M3 Max", SOC_APPLE_M3_MAX, 3)
|
||||||
|
DT_EQ(dt, len, soc, "apple,t6034", "M3 Max", SOC_APPLE_M3_MAX, 3)
|
||||||
|
DT_END(dt, len)
|
||||||
|
}
|
||||||
|
|
||||||
struct system_on_chip* guess_soc_from_pci(struct system_on_chip* soc, struct cpuInfo* cpu) {
|
struct system_on_chip* guess_soc_from_pci(struct system_on_chip* soc, struct cpuInfo* cpu) {
|
||||||
struct pci_devices * pci = get_pci_devices();
|
struct pci_devices * pci = get_pci_devices();
|
||||||
if (pci == NULL) {
|
if (pci == NULL) {
|
||||||
@@ -849,9 +982,10 @@ struct system_on_chip* guess_soc_from_pci(struct system_on_chip* soc, struct cpu
|
|||||||
} pciToSoC;
|
} pciToSoC;
|
||||||
|
|
||||||
pciToSoC socFromPCI[] = {
|
pciToSoC socFromPCI[] = {
|
||||||
{PCI_VENDOR_NVIDIA, PCI_DEVICE_TEGRA_X1, {SOC_TEGRA_X1, SOC_VENDOR_NVIDIA, 20, "Tegra X1", NULL} },
|
{PCI_VENDOR_NVIDIA, PCI_DEVICE_TEGRA_X1, {SOC_TEGRA_X1, SOC_VENDOR_NVIDIA, 20, "Tegra X1", NULL} },
|
||||||
// {PCI_VENDOR_NVIDIA, PCI_DEVICE_GH_200,{SOC_GH_200, SOC_VENDOR_NVIDIA, ?, "Grace Hopper", NULL} },
|
// {PCI_VENDOR_NVIDIA, PCI_DEVICE_GH_200,{SOC_GH_200, SOC_VENDOR_NVIDIA, ?, "Grace Hopper", NULL} },
|
||||||
{0x0000, 0x0000, {UNKNOWN, SOC_VENDOR_UNKNOWN, -1, "", NULL} }
|
{PCI_VENDOR_AMPERE, PCI_DEVICE_ALTRA, {SOC_AMPERE_ALTRA, SOC_VENDOR_AMPERE, 7, "Altra", NULL} }, // https://www.anandtech.com/show/15575/amperes-altra-80-core-n1-soc-for-hyperscalers-against-rome-and-xeon
|
||||||
|
{0x0000, 0x0000, {UNKNOWN, SOC_VENDOR_UNKNOWN, -1, "", NULL} }
|
||||||
};
|
};
|
||||||
|
|
||||||
int index = 0;
|
int index = 0;
|
||||||
@@ -1042,6 +1176,10 @@ struct system_on_chip* get_soc(struct cpuInfo* cpu) {
|
|||||||
printWarn("SoC detection failed using Android: Found '%s' string", soc->raw_name);
|
printWarn("SoC detection failed using Android: Found '%s' string", soc->raw_name);
|
||||||
}
|
}
|
||||||
#endif // ifdef __ANDROID__
|
#endif // ifdef __ANDROID__
|
||||||
|
// If previous steps failed, try with the device tree
|
||||||
|
if (soc->soc_vendor == SOC_VENDOR_UNKNOWN) {
|
||||||
|
soc = guess_soc_from_devtree(soc);
|
||||||
|
}
|
||||||
// If previous steps failed, try with nvmem
|
// If previous steps failed, try with nvmem
|
||||||
if(soc->soc_vendor == SOC_VENDOR_UNKNOWN) {
|
if(soc->soc_vendor == SOC_VENDOR_UNKNOWN) {
|
||||||
soc = guess_soc_from_nvmem(soc);
|
soc = guess_soc_from_nvmem(soc);
|
||||||
|
|||||||
@@ -29,6 +29,7 @@ enum {
|
|||||||
SOC_HISILICON_3670,
|
SOC_HISILICON_3670,
|
||||||
SOC_HISILICON_3680,
|
SOC_HISILICON_3680,
|
||||||
SOC_HISILICON_3690,
|
SOC_HISILICON_3690,
|
||||||
|
SOC_HISILICON_9000S,
|
||||||
// Kunpeng //
|
// Kunpeng //
|
||||||
SOC_KUNPENG_920,
|
SOC_KUNPENG_920,
|
||||||
SOC_KUNPENG_930,
|
SOC_KUNPENG_930,
|
||||||
@@ -270,11 +271,16 @@ enum {
|
|||||||
SOC_SNAPD_SDM660,
|
SOC_SNAPD_SDM660,
|
||||||
SOC_SNAPD_SM6115,
|
SOC_SNAPD_SM6115,
|
||||||
SOC_SNAPD_SM6125,
|
SOC_SNAPD_SM6125,
|
||||||
|
SOC_SNAPD_SM6375_AC,
|
||||||
|
SOC_SNAPD_SM6450,
|
||||||
SOC_SNAPD_SDM670,
|
SOC_SNAPD_SDM670,
|
||||||
SOC_SNAPD_SM6150,
|
SOC_SNAPD_SM6150,
|
||||||
SOC_SNAPD_SM6350,
|
SOC_SNAPD_SM6350,
|
||||||
SOC_SNAPD_SDM710,
|
SOC_SNAPD_SDM710,
|
||||||
SOC_SNAPD_SDM712,
|
SOC_SNAPD_SDM712,
|
||||||
|
SOC_SNAPD_SM4375,
|
||||||
|
SOC_SNAPD_SM4450,
|
||||||
|
SOC_SNAPD_SM4635,
|
||||||
SOC_SNAPD_SM7125,
|
SOC_SNAPD_SM7125,
|
||||||
SOC_SNAPD_SM7150_AA,
|
SOC_SNAPD_SM7150_AA,
|
||||||
SOC_SNAPD_SM7150_AB,
|
SOC_SNAPD_SM7150_AB,
|
||||||
@@ -283,6 +289,11 @@ enum {
|
|||||||
SOC_SNAPD_SM7250_AA,
|
SOC_SNAPD_SM7250_AA,
|
||||||
SOC_SNAPD_SM7250_AB,
|
SOC_SNAPD_SM7250_AB,
|
||||||
SOC_SNAPD_SM7250_AC,
|
SOC_SNAPD_SM7250_AC,
|
||||||
|
SOC_SNAPD_SM7435_AB,
|
||||||
|
SOC_SNAPD_SM7450,
|
||||||
|
SOC_SNAPD_SM7475,
|
||||||
|
SOC_SNAPD_SM7550_AB,
|
||||||
|
SOC_SNAPD_SM7675_AB,
|
||||||
SOC_SNAPD_MSM8974AA,
|
SOC_SNAPD_MSM8974AA,
|
||||||
SOC_SNAPD_MSM8974AB,
|
SOC_SNAPD_MSM8974AB,
|
||||||
SOC_SNAPD_MSM8974AC,
|
SOC_SNAPD_MSM8974AC,
|
||||||
@@ -303,6 +314,10 @@ enum {
|
|||||||
SOC_SNAPD_SM8250_AB,
|
SOC_SNAPD_SM8250_AB,
|
||||||
SOC_SNAPD_SM8350,
|
SOC_SNAPD_SM8350,
|
||||||
SOC_SNAPD_SM8450,
|
SOC_SNAPD_SM8450,
|
||||||
|
SOC_SNAPD_SM8475,
|
||||||
|
SOC_SNAPD_SM8550_AB,
|
||||||
|
SOC_SNAPD_SM8635,
|
||||||
|
SOC_SNAPD_SM8650_AB,
|
||||||
// APPLE
|
// APPLE
|
||||||
SOC_APPLE_M1,
|
SOC_APPLE_M1,
|
||||||
SOC_APPLE_M1_PRO,
|
SOC_APPLE_M1_PRO,
|
||||||
@@ -365,22 +380,25 @@ enum {
|
|||||||
SOC_GOOGLE_TENSOR_G3,
|
SOC_GOOGLE_TENSOR_G3,
|
||||||
// NVIDIA,
|
// NVIDIA,
|
||||||
SOC_TEGRA_X1,
|
SOC_TEGRA_X1,
|
||||||
|
// ALTRA
|
||||||
|
SOC_AMPERE_ALTRA,
|
||||||
// UNKNOWN
|
// UNKNOWN
|
||||||
SOC_MODEL_UNKNOWN
|
SOC_MODEL_UNKNOWN
|
||||||
};
|
};
|
||||||
|
|
||||||
inline static VENDOR get_soc_vendor_from_soc(SOC soc) {
|
inline static VENDOR get_soc_vendor_from_soc(SOC soc) {
|
||||||
if(soc >= SOC_BCM_2835 && soc <= SOC_BCM_2712) return SOC_VENDOR_BROADCOM;
|
if(soc >= SOC_BCM_2835 && soc <= SOC_BCM_2712) return SOC_VENDOR_BROADCOM;
|
||||||
else if(soc >= SOC_HISILICON_3620 && soc <= SOC_HISILICON_3690) return SOC_VENDOR_KIRIN;
|
else if(soc >= SOC_HISILICON_3620 && soc <= SOC_HISILICON_9000S) return SOC_VENDOR_KIRIN;
|
||||||
else if(soc >= SOC_KUNPENG_920 && soc <= SOC_KUNPENG_930) return SOC_VENDOR_KUNPENG;
|
else if(soc >= SOC_KUNPENG_920 && soc <= SOC_KUNPENG_930) return SOC_VENDOR_KUNPENG;
|
||||||
else if(soc >= SOC_EXYNOS_3475 && soc <= SOC_EXYNOS_880) return SOC_VENDOR_EXYNOS;
|
else if(soc >= SOC_EXYNOS_3475 && soc <= SOC_EXYNOS_880) return SOC_VENDOR_EXYNOS;
|
||||||
else if(soc >= SOC_MTK_MT6893 && soc <= SOC_MTK_MT8783) return SOC_VENDOR_MEDIATEK;
|
else if(soc >= SOC_MTK_MT6893 && soc <= SOC_MTK_MT8783) return SOC_VENDOR_MEDIATEK;
|
||||||
else if(soc >= SOC_SNAPD_QSD8650 && soc <= SOC_SNAPD_SM8450) return SOC_VENDOR_SNAPDRAGON;
|
else if(soc >= SOC_SNAPD_QSD8650 && soc <= SOC_SNAPD_SM8650_AB) return SOC_VENDOR_SNAPDRAGON;
|
||||||
else if(soc >= SOC_APPLE_M1 && soc <= SOC_APPLE_M3_MAX) return SOC_VENDOR_APPLE;
|
else if(soc >= SOC_APPLE_M1 && soc <= SOC_APPLE_M3_MAX) return SOC_VENDOR_APPLE;
|
||||||
else if(soc >= SOC_ALLWINNER_A10 && soc <= SOC_ALLWINNER_R328) return SOC_VENDOR_ALLWINNER;
|
else if(soc >= SOC_ALLWINNER_A10 && soc <= SOC_ALLWINNER_R328) return SOC_VENDOR_ALLWINNER;
|
||||||
else if(soc >= SOC_ROCKCHIP_3288 && soc <= SOC_ROCKCHIP_3588) return SOC_VENDOR_ROCKCHIP;
|
else if(soc >= SOC_ROCKCHIP_3288 && soc <= SOC_ROCKCHIP_3588) return SOC_VENDOR_ROCKCHIP;
|
||||||
else if(soc >= SOC_GOOGLE_TENSOR && soc <= SOC_GOOGLE_TENSOR_G3) return SOC_VENDOR_GOOGLE;
|
else if(soc >= SOC_GOOGLE_TENSOR && soc <= SOC_GOOGLE_TENSOR_G3) return SOC_VENDOR_GOOGLE;
|
||||||
else if(soc >= SOC_TEGRA_X1 && soc <= SOC_TEGRA_X1) return SOC_VENDOR_NVIDIA;
|
else if(soc >= SOC_TEGRA_X1 && soc <= SOC_TEGRA_X1) return SOC_VENDOR_NVIDIA;
|
||||||
|
else if(soc >= SOC_AMPERE_ALTRA && soc <= SOC_AMPERE_ALTRA) return SOC_VENDOR_AMPERE;
|
||||||
return SOC_VENDOR_UNKNOWN;
|
return SOC_VENDOR_UNKNOWN;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|||||||
15
src/arm/sve.c
Normal file
15
src/arm/sve.c
Normal file
@@ -0,0 +1,15 @@
|
|||||||
|
#include <stdint.h>
|
||||||
|
#include "../common/global.h"
|
||||||
|
|
||||||
|
// https://learn.arm.com/learning-paths/servers-and-cloud-computing/sve/sve_basics/#:~:text=Using%20a%20text%20editor%20of%20your%20choice%2C%20copy,svcntb%28%29%29%3B%20%7D%20This%20program%20prints%20the%20vector%20length
|
||||||
|
uint64_t sve_cntb(void) {
|
||||||
|
#ifdef __ARM_FEATURE_SVE
|
||||||
|
uint64_t x0 = 0;
|
||||||
|
__asm volatile("cntb %0"
|
||||||
|
: "=r"(x0));
|
||||||
|
return x0;
|
||||||
|
#else
|
||||||
|
printWarn("sve_cntb: Hardware supports SVE, but it was not enabled by the compiler");
|
||||||
|
return 0;
|
||||||
|
#endif
|
||||||
|
}
|
||||||
6
src/arm/sve.h
Normal file
6
src/arm/sve.h
Normal file
@@ -0,0 +1,6 @@
|
|||||||
|
#ifndef __SVE_DETECTION__
|
||||||
|
#define __SVE_DETECTION__
|
||||||
|
|
||||||
|
uint64_t sve_cntb(void);
|
||||||
|
|
||||||
|
#endif
|
||||||
@@ -75,6 +75,7 @@ static const ISA isas_uarch[] = {
|
|||||||
[UARCH_THUNDERX] = ISA_ARMv8_A,
|
[UARCH_THUNDERX] = ISA_ARMv8_A,
|
||||||
[UARCH_THUNDERX2] = ISA_ARMv8_1_A,
|
[UARCH_THUNDERX2] = ISA_ARMv8_1_A,
|
||||||
[UARCH_TAISHAN_V110] = ISA_ARMv8_2_A,
|
[UARCH_TAISHAN_V110] = ISA_ARMv8_2_A,
|
||||||
|
[UARCH_TAISHAN_V120] = ISA_ARMv8_2_A, // Not confirmed
|
||||||
[UARCH_TAISHAN_V200] = ISA_ARMv8_2_A, // Not confirmed
|
[UARCH_TAISHAN_V200] = ISA_ARMv8_2_A, // Not confirmed
|
||||||
[UARCH_DENVER] = ISA_ARMv8_A,
|
[UARCH_DENVER] = ISA_ARMv8_A,
|
||||||
[UARCH_DENVER2] = ISA_ARMv8_A,
|
[UARCH_DENVER2] = ISA_ARMv8_A,
|
||||||
@@ -202,8 +203,10 @@ struct uarch* get_uarch_from_midr(uint32_t midr, struct cpuInfo* cpu) {
|
|||||||
CHECK_UARCH(arch, cpu, 'C', 0x0AF, NA, NA, "ThunderX2 99XX", UARCH_THUNDERX2, CPU_VENDOR_CAVIUM)
|
CHECK_UARCH(arch, cpu, 'C', 0x0AF, NA, NA, "ThunderX2 99XX", UARCH_THUNDERX2, CPU_VENDOR_CAVIUM)
|
||||||
|
|
||||||
CHECK_UARCH(arch, cpu, 'H', 0xD01, NA, NA, "TaiShan v110", UARCH_TAISHAN_V110, CPU_VENDOR_HUAWEI) // Kunpeng 920 series
|
CHECK_UARCH(arch, cpu, 'H', 0xD01, NA, NA, "TaiShan v110", UARCH_TAISHAN_V110, CPU_VENDOR_HUAWEI) // Kunpeng 920 series
|
||||||
|
CHECK_UARCH(arch, cpu, 'H', 0xD02, 2, 2, "TaiShan v120", UARCH_TAISHAN_V120, CPU_VENDOR_HUAWEI) // Kiring 9000S Big cores (https://github.com/Dr-Noob/cpufetch/issues/259)
|
||||||
CHECK_UARCH(arch, cpu, 'H', 0xD02, NA, NA, "TaiShan v200", UARCH_TAISHAN_V200, CPU_VENDOR_HUAWEI) // Kunpeng 930 series (found in openeuler: https://mailweb.openeuler.org/hyperkitty/list/kernel@openeuler.org/message/XQCV7NX2UKRIUWUFKRF4PO3QENCOUFR3)
|
CHECK_UARCH(arch, cpu, 'H', 0xD02, NA, NA, "TaiShan v200", UARCH_TAISHAN_V200, CPU_VENDOR_HUAWEI) // Kunpeng 930 series (found in openeuler: https://mailweb.openeuler.org/hyperkitty/list/kernel@openeuler.org/message/XQCV7NX2UKRIUWUFKRF4PO3QENCOUFR3)
|
||||||
CHECK_UARCH(arch, cpu, 'H', 0xD40, NA, NA, "Cortex-A76", UARCH_CORTEX_A76, CPU_VENDOR_ARM) // Kirin 980 Big/Medium cores -> Cortex-A76
|
CHECK_UARCH(arch, cpu, 'H', 0xD40, NA, NA, "Cortex-A76", UARCH_CORTEX_A76, CPU_VENDOR_ARM) // Kirin 980 Big/Medium cores -> Cortex-A76
|
||||||
|
CHECK_UARCH(arch, cpu, 'H', 0xD42, NA, NA, "TaiShan v120", UARCH_TAISHAN_V120, CPU_VENDOR_HUAWEI) // Kiring 9000S Small Cores (https://github.com/Dr-Noob/cpufetch/issues/259)
|
||||||
|
|
||||||
CHECK_UARCH(arch, cpu, 'N', 0x000, NA, NA, "Denver", UARCH_DENVER, CPU_VENDOR_NVIDIA)
|
CHECK_UARCH(arch, cpu, 'N', 0x000, NA, NA, "Denver", UARCH_DENVER, CPU_VENDOR_NVIDIA)
|
||||||
CHECK_UARCH(arch, cpu, 'N', 0x003, NA, NA, "Denver2", UARCH_DENVER2, CPU_VENDOR_NVIDIA)
|
CHECK_UARCH(arch, cpu, 'N', 0x003, NA, NA, "Denver2", UARCH_DENVER2, CPU_VENDOR_NVIDIA)
|
||||||
@@ -245,6 +248,8 @@ struct uarch* get_uarch_from_midr(uint32_t midr, struct cpuInfo* cpu) {
|
|||||||
|
|
||||||
CHECK_UARCH(arch, cpu, 'a', 0x022, NA, NA, "Icestorm", UARCH_ICESTORM, CPU_VENDOR_APPLE)
|
CHECK_UARCH(arch, cpu, 'a', 0x022, NA, NA, "Icestorm", UARCH_ICESTORM, CPU_VENDOR_APPLE)
|
||||||
CHECK_UARCH(arch, cpu, 'a', 0x023, NA, NA, "Firestorm", UARCH_FIRESTORM, CPU_VENDOR_APPLE)
|
CHECK_UARCH(arch, cpu, 'a', 0x023, NA, NA, "Firestorm", UARCH_FIRESTORM, CPU_VENDOR_APPLE)
|
||||||
|
CHECK_UARCH(arch, cpu, 'a', 0x024, NA, NA, "Icestorm", UARCH_ICESTORM, CPU_VENDOR_APPLE) // https://github.com/Dr-Noob/cpufetch/issues/263
|
||||||
|
CHECK_UARCH(arch, cpu, 'a', 0x025, NA, NA, "Firestorm", UARCH_FIRESTORM, CPU_VENDOR_APPLE) // https://github.com/Dr-Noob/cpufetch/issues/263
|
||||||
CHECK_UARCH(arch, cpu, 'a', 0x030, NA, NA, "Blizzard", UARCH_BLIZZARD, CPU_VENDOR_APPLE)
|
CHECK_UARCH(arch, cpu, 'a', 0x030, NA, NA, "Blizzard", UARCH_BLIZZARD, CPU_VENDOR_APPLE)
|
||||||
CHECK_UARCH(arch, cpu, 'a', 0x031, NA, NA, "Avalanche", UARCH_AVALANCHE, CPU_VENDOR_APPLE)
|
CHECK_UARCH(arch, cpu, 'a', 0x031, NA, NA, "Avalanche", UARCH_AVALANCHE, CPU_VENDOR_APPLE)
|
||||||
CHECK_UARCH(arch, cpu, 'a', 0x048, NA, NA, "Sawtooth", UARCH_SAWTOOTH, CPU_VENDOR_APPLE)
|
CHECK_UARCH(arch, cpu, 'a', 0x048, NA, NA, "Sawtooth", UARCH_SAWTOOTH, CPU_VENDOR_APPLE)
|
||||||
@@ -291,7 +296,10 @@ int get_vpus_width(struct cpuInfo* cpu) {
|
|||||||
case UARCH_NEOVERSE_V1:
|
case UARCH_NEOVERSE_V1:
|
||||||
return 256;
|
return 256;
|
||||||
default:
|
default:
|
||||||
if(cpu->feat->NEON) {
|
if (cpu->feat->SVE && cpu->feat->cntb > 0) {
|
||||||
|
return cpu->feat->cntb * 8;
|
||||||
|
}
|
||||||
|
else if (cpu->feat->NEON) {
|
||||||
if(is_ARMv8_or_newer(cpu)) {
|
if(is_ARMv8_or_newer(cpu)) {
|
||||||
return 128;
|
return 128;
|
||||||
}
|
}
|
||||||
@@ -325,6 +333,7 @@ int get_number_of_vpus(struct cpuInfo* cpu) {
|
|||||||
case UARCH_ICESTORM: // [https://dougallj.github.io/applecpu/icestorm-simd.html]
|
case UARCH_ICESTORM: // [https://dougallj.github.io/applecpu/icestorm-simd.html]
|
||||||
case UARCH_BLIZZARD: // [https://en.wikipedia.org/wiki/Comparison_of_ARM_processors]
|
case UARCH_BLIZZARD: // [https://en.wikipedia.org/wiki/Comparison_of_ARM_processors]
|
||||||
case UARCH_TAISHAN_V110:// [https://www-file.huawei.com/-/media/corp2020/pdf/publications/huawei-research/2022/huawei-research-issue1-en.pdf]: "128-bit x 2 for single precision"
|
case UARCH_TAISHAN_V110:// [https://www-file.huawei.com/-/media/corp2020/pdf/publications/huawei-research/2022/huawei-research-issue1-en.pdf]: "128-bit x 2 for single precision"
|
||||||
|
case UARCH_TAISHAN_V120:// Not confirmed, asssuming same as v110
|
||||||
case UARCH_TAISHAN_V200:// Not confirmed, asssuming same as v110
|
case UARCH_TAISHAN_V200:// Not confirmed, asssuming same as v110
|
||||||
case UARCH_CORTEX_A57: // [https://www.anandtech.com/show/8718/the-samsung-galaxy-note-4-exynos-review/5]
|
case UARCH_CORTEX_A57: // [https://www.anandtech.com/show/8718/the-samsung-galaxy-note-4-exynos-review/5]
|
||||||
case UARCH_CORTEX_A72: // [https://www.anandtech.com/show/10347/arm-cortex-a73-artemis-unveiled/2]
|
case UARCH_CORTEX_A72: // [https://www.anandtech.com/show/10347/arm-cortex-a73-artemis-unveiled/2]
|
||||||
|
|||||||
@@ -83,7 +83,9 @@ enum {
|
|||||||
UARCH_BRAHMA_B15,
|
UARCH_BRAHMA_B15,
|
||||||
UARCH_BRAHMA_B53,
|
UARCH_BRAHMA_B53,
|
||||||
UARCH_XGENE, // Applied Micro X-Gene.
|
UARCH_XGENE, // Applied Micro X-Gene.
|
||||||
|
// HUAWEI
|
||||||
UARCH_TAISHAN_V110, // HiSilicon TaiShan v110
|
UARCH_TAISHAN_V110, // HiSilicon TaiShan v110
|
||||||
|
UARCH_TAISHAN_V120, // HiSilicon TaiShan v120
|
||||||
UARCH_TAISHAN_V200, // HiSilicon TaiShan v200
|
UARCH_TAISHAN_V200, // HiSilicon TaiShan v200
|
||||||
// PHYTIUM
|
// PHYTIUM
|
||||||
UARCH_XIAOMI, // Not to be confused with Xiaomi Inc
|
UARCH_XIAOMI, // Not to be confused with Xiaomi Inc
|
||||||
|
|||||||
@@ -28,6 +28,7 @@ struct args_struct {
|
|||||||
bool help_flag;
|
bool help_flag;
|
||||||
bool raw_flag;
|
bool raw_flag;
|
||||||
bool accurate_pp;
|
bool accurate_pp;
|
||||||
|
bool measure_max_frequency_flag;
|
||||||
bool full_cpu_name_flag;
|
bool full_cpu_name_flag;
|
||||||
bool logo_long;
|
bool logo_long;
|
||||||
bool logo_short;
|
bool logo_short;
|
||||||
@@ -40,35 +41,37 @@ struct args_struct {
|
|||||||
};
|
};
|
||||||
|
|
||||||
const char args_chr[] = {
|
const char args_chr[] = {
|
||||||
/* [ARG_STYLE] = */ 's',
|
/* [ARG_STYLE] = */ 's',
|
||||||
/* [ARG_COLOR] = */ 'c',
|
/* [ARG_COLOR] = */ 'c',
|
||||||
/* [ARG_HELP] = */ 'h',
|
/* [ARG_HELP] = */ 'h',
|
||||||
/* [ARG_RAW] = */ 'r',
|
/* [ARG_RAW] = */ 'r',
|
||||||
/* [ARG_FULLCPUNAME] = */ 'F',
|
/* [ARG_FULLCPUNAME] = */ 'F',
|
||||||
/* [ARG_LOGO_LONG] = */ 1,
|
/* [ARG_LOGO_LONG] = */ 1,
|
||||||
/* [ARG_LOGO_SHORT] = */ 2,
|
/* [ARG_LOGO_SHORT] = */ 2,
|
||||||
/* [ARG_LOGO_INTEL_NEW] = */ 3,
|
/* [ARG_LOGO_INTEL_NEW] = */ 3,
|
||||||
/* [ARG_LOGO_INTEL_OLD] = */ 4,
|
/* [ARG_LOGO_INTEL_OLD] = */ 4,
|
||||||
/* [ARG_ACCURATE_PP] = */ 5,
|
/* [ARG_ACCURATE_PP] = */ 5,
|
||||||
/* [ARG_DEBUG] = */ 'd',
|
/* [ARG_MEASURE_MAX_FREQ] = */ 6,
|
||||||
/* [ARG_VERBOSE] = */ 'v',
|
/* [ARG_DEBUG] = */ 'd',
|
||||||
/* [ARG_VERSION] = */ 'V',
|
/* [ARG_VERBOSE] = */ 'v',
|
||||||
|
/* [ARG_VERSION] = */ 'V',
|
||||||
};
|
};
|
||||||
|
|
||||||
const char *args_str[] = {
|
const char *args_str[] = {
|
||||||
/* [ARG_STYLE] = */ "style",
|
/* [ARG_STYLE] = */ "style",
|
||||||
/* [ARG_COLOR] = */ "color",
|
/* [ARG_COLOR] = */ "color",
|
||||||
/* [ARG_HELP] = */ "help",
|
/* [ARG_HELP] = */ "help",
|
||||||
/* [ARG_RAW] = */ "raw",
|
/* [ARG_RAW] = */ "raw",
|
||||||
/* [ARG_FULLCPUNAME] = */ "full-cpu-name",
|
/* [ARG_FULLCPUNAME] = */ "full-cpu-name",
|
||||||
/* [ARG_LOGO_LONG] = */ "logo-long",
|
/* [ARG_LOGO_LONG] = */ "logo-long",
|
||||||
/* [ARG_LOGO_SHORT] = */ "logo-short",
|
/* [ARG_LOGO_SHORT] = */ "logo-short",
|
||||||
/* [ARG_LOGO_INTEL_NEW] = */ "logo-intel-new",
|
/* [ARG_LOGO_INTEL_NEW] = */ "logo-intel-new",
|
||||||
/* [ARG_LOGO_INTEL_OLD] = */ "logo-intel-old",
|
/* [ARG_LOGO_INTEL_OLD] = */ "logo-intel-old",
|
||||||
/* [ARG_ACCURATE_PP] = */ "accurate-pp",
|
/* [ARG_ACCURATE_PP] = */ "accurate-pp",
|
||||||
/* [ARG_DEBUG] = */ "debug",
|
/* [ARG_MEASURE_MAX_FREQ] = */ "measure-max-freq",
|
||||||
/* [ARG_VERBOSE] = */ "verbose",
|
/* [ARG_DEBUG] = */ "debug",
|
||||||
/* [ARG_VERSION] = */ "version",
|
/* [ARG_VERBOSE] = */ "verbose",
|
||||||
|
/* [ARG_VERSION] = */ "version",
|
||||||
};
|
};
|
||||||
|
|
||||||
static struct args_struct args;
|
static struct args_struct args;
|
||||||
@@ -101,6 +104,10 @@ bool accurate_pp(void) {
|
|||||||
return args.accurate_pp;
|
return args.accurate_pp;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
bool measure_max_frequency_flag(void) {
|
||||||
|
return args.measure_max_frequency_flag;
|
||||||
|
}
|
||||||
|
|
||||||
bool show_full_cpu_name(void) {
|
bool show_full_cpu_name(void) {
|
||||||
return args.full_cpu_name_flag;
|
return args.full_cpu_name_flag;
|
||||||
}
|
}
|
||||||
@@ -222,12 +229,20 @@ char* build_short_options(void) {
|
|||||||
memset(str, 0, sizeof(char) * (len*2 + 1));
|
memset(str, 0, sizeof(char) * (len*2 + 1));
|
||||||
|
|
||||||
#ifdef ARCH_X86
|
#ifdef ARCH_X86
|
||||||
sprintf(str, "%c:%c:%c%c%c%c%c%c%c%c%c%c%c",
|
sprintf(str, "%c:%c:%c%c%c%c%c%c%c%c%c%c%c%c",
|
||||||
c[ARG_STYLE], c[ARG_COLOR], c[ARG_HELP],
|
c[ARG_STYLE], c[ARG_COLOR], c[ARG_HELP],
|
||||||
c[ARG_RAW], c[ARG_FULLCPUNAME],
|
c[ARG_RAW], c[ARG_FULLCPUNAME],
|
||||||
c[ARG_LOGO_SHORT], c[ARG_LOGO_LONG],
|
c[ARG_LOGO_SHORT], c[ARG_LOGO_LONG],
|
||||||
c[ARG_LOGO_INTEL_NEW], c[ARG_LOGO_INTEL_OLD],
|
c[ARG_LOGO_INTEL_NEW], c[ARG_LOGO_INTEL_OLD],
|
||||||
c[ARG_ACCURATE_PP], c[ARG_DEBUG], c[ARG_VERBOSE],
|
c[ARG_ACCURATE_PP], c[ARG_MEASURE_MAX_FREQ],
|
||||||
|
c[ARG_DEBUG], c[ARG_VERBOSE],
|
||||||
|
c[ARG_VERSION]);
|
||||||
|
#elif ARCH_ARM
|
||||||
|
sprintf(str, "%c:%c:%c%c%c%c%c%c%c",
|
||||||
|
c[ARG_STYLE], c[ARG_COLOR], c[ARG_HELP],
|
||||||
|
c[ARG_LOGO_SHORT], c[ARG_LOGO_LONG],
|
||||||
|
c[ARG_MEASURE_MAX_FREQ],
|
||||||
|
c[ARG_DEBUG], c[ARG_VERBOSE],
|
||||||
c[ARG_VERSION]);
|
c[ARG_VERSION]);
|
||||||
#else
|
#else
|
||||||
sprintf(str, "%c:%c:%c%c%c%c%c%c",
|
sprintf(str, "%c:%c:%c%c%c%c%c%c",
|
||||||
@@ -263,21 +278,24 @@ bool parse_args(int argc, char* argv[]) {
|
|||||||
set_log_level(true);
|
set_log_level(true);
|
||||||
|
|
||||||
const struct option long_options[] = {
|
const struct option long_options[] = {
|
||||||
{args_str[ARG_STYLE], required_argument, 0, args_chr[ARG_STYLE] },
|
{args_str[ARG_STYLE], required_argument, 0, args_chr[ARG_STYLE] },
|
||||||
{args_str[ARG_COLOR], required_argument, 0, args_chr[ARG_COLOR] },
|
{args_str[ARG_COLOR], required_argument, 0, args_chr[ARG_COLOR] },
|
||||||
{args_str[ARG_HELP], no_argument, 0, args_chr[ARG_HELP] },
|
{args_str[ARG_HELP], no_argument, 0, args_chr[ARG_HELP] },
|
||||||
#ifdef ARCH_X86
|
#ifdef ARCH_X86
|
||||||
{args_str[ARG_LOGO_INTEL_NEW], no_argument, 0, args_chr[ARG_LOGO_INTEL_NEW] },
|
{args_str[ARG_LOGO_INTEL_NEW], no_argument, 0, args_chr[ARG_LOGO_INTEL_NEW] },
|
||||||
{args_str[ARG_LOGO_INTEL_OLD], no_argument, 0, args_chr[ARG_LOGO_INTEL_OLD] },
|
{args_str[ARG_LOGO_INTEL_OLD], no_argument, 0, args_chr[ARG_LOGO_INTEL_OLD] },
|
||||||
{args_str[ARG_ACCURATE_PP], no_argument, 0, args_chr[ARG_ACCURATE_PP] },
|
{args_str[ARG_ACCURATE_PP], no_argument, 0, args_chr[ARG_ACCURATE_PP] },
|
||||||
{args_str[ARG_FULLCPUNAME], no_argument, 0, args_chr[ARG_FULLCPUNAME] },
|
{args_str[ARG_MEASURE_MAX_FREQ], no_argument, 0, args_chr[ARG_MEASURE_MAX_FREQ] },
|
||||||
{args_str[ARG_RAW], no_argument, 0, args_chr[ARG_RAW] },
|
{args_str[ARG_FULLCPUNAME], no_argument, 0, args_chr[ARG_FULLCPUNAME] },
|
||||||
|
{args_str[ARG_RAW], no_argument, 0, args_chr[ARG_RAW] },
|
||||||
|
#elif ARCH_ARM
|
||||||
|
{args_str[ARG_MEASURE_MAX_FREQ], no_argument, 0, args_chr[ARG_MEASURE_MAX_FREQ] },
|
||||||
#endif
|
#endif
|
||||||
{args_str[ARG_LOGO_SHORT], no_argument, 0, args_chr[ARG_LOGO_SHORT] },
|
{args_str[ARG_LOGO_SHORT], no_argument, 0, args_chr[ARG_LOGO_SHORT] },
|
||||||
{args_str[ARG_LOGO_LONG], no_argument, 0, args_chr[ARG_LOGO_LONG] },
|
{args_str[ARG_LOGO_LONG], no_argument, 0, args_chr[ARG_LOGO_LONG] },
|
||||||
{args_str[ARG_DEBUG], no_argument, 0, args_chr[ARG_DEBUG] },
|
{args_str[ARG_DEBUG], no_argument, 0, args_chr[ARG_DEBUG] },
|
||||||
{args_str[ARG_VERBOSE], no_argument, 0, args_chr[ARG_VERBOSE] },
|
{args_str[ARG_VERBOSE], no_argument, 0, args_chr[ARG_VERBOSE] },
|
||||||
{args_str[ARG_VERSION], no_argument, 0, args_chr[ARG_VERSION] },
|
{args_str[ARG_VERSION], no_argument, 0, args_chr[ARG_VERSION] },
|
||||||
{0, 0, 0, 0}
|
{0, 0, 0, 0}
|
||||||
};
|
};
|
||||||
|
|
||||||
@@ -313,6 +331,9 @@ bool parse_args(int argc, char* argv[]) {
|
|||||||
else if(opt == args_chr[ARG_ACCURATE_PP]) {
|
else if(opt == args_chr[ARG_ACCURATE_PP]) {
|
||||||
args.accurate_pp = true;
|
args.accurate_pp = true;
|
||||||
}
|
}
|
||||||
|
else if(opt == args_chr[ARG_MEASURE_MAX_FREQ]) {
|
||||||
|
args.measure_max_frequency_flag = true;
|
||||||
|
}
|
||||||
else if(opt == args_chr[ARG_FULLCPUNAME]) {
|
else if(opt == args_chr[ARG_FULLCPUNAME]) {
|
||||||
args.full_cpu_name_flag = true;
|
args.full_cpu_name_flag = true;
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -29,6 +29,7 @@ enum {
|
|||||||
ARG_LOGO_INTEL_NEW,
|
ARG_LOGO_INTEL_NEW,
|
||||||
ARG_LOGO_INTEL_OLD,
|
ARG_LOGO_INTEL_OLD,
|
||||||
ARG_ACCURATE_PP,
|
ARG_ACCURATE_PP,
|
||||||
|
ARG_MEASURE_MAX_FREQ,
|
||||||
ARG_DEBUG,
|
ARG_DEBUG,
|
||||||
ARG_VERBOSE,
|
ARG_VERBOSE,
|
||||||
ARG_VERSION
|
ARG_VERSION
|
||||||
@@ -43,6 +44,7 @@ int max_arg_str_length(void);
|
|||||||
bool parse_args(int argc, char* argv[]);
|
bool parse_args(int argc, char* argv[]);
|
||||||
bool show_help(void);
|
bool show_help(void);
|
||||||
bool accurate_pp(void);
|
bool accurate_pp(void);
|
||||||
|
bool measure_max_frequency_flag(void);
|
||||||
bool show_full_cpu_name(void);
|
bool show_full_cpu_name(void);
|
||||||
bool show_logo_long(void);
|
bool show_logo_long(void);
|
||||||
bool show_logo_short(void);
|
bool show_logo_short(void);
|
||||||
|
|||||||
@@ -105,6 +105,19 @@ $C1 MMM :MMM NMM dMMK dMMX MMN \
|
|||||||
$C1 MMM :MMM NMM dMMMoo OMM0....:Nx. MMN \
|
$C1 MMM :MMM NMM dMMMoo OMM0....:Nx. MMN \
|
||||||
$C1 MMM :WWW XWW lONMM 'xXMMMMNOc MMN "
|
$C1 MMM :WWW XWW lONMM 'xXMMMMNOc MMN "
|
||||||
|
|
||||||
|
#define ASCII_HYGON \
|
||||||
|
"$C1 \
|
||||||
|
$C1 \
|
||||||
|
$C1 \
|
||||||
|
$C1 ## ## ## ## ###### ###### ## # \
|
||||||
|
$C1 ##....## ## ## ## ## ## #### # \
|
||||||
|
$C1 ######## ## ## ##. ## ## # #### \
|
||||||
|
$C1 ## ## ## *######. ###### # ## \
|
||||||
|
$C1 \
|
||||||
|
$C1 \
|
||||||
|
$C1 \
|
||||||
|
$C1 "
|
||||||
|
|
||||||
#define ASCII_SNAPD \
|
#define ASCII_SNAPD \
|
||||||
" $C1@@$C2######## \
|
" $C1@@$C2######## \
|
||||||
$C1@@@@@$C2########### \
|
$C1@@@@@$C2########### \
|
||||||
@@ -381,6 +394,25 @@ $C2## ## ## ## ## ## ## ## #: :# \
|
|||||||
$C2## ## ## ## ## ## ## ## ####### \
|
$C2## ## ## ## ## ## ## ## ####### \
|
||||||
$C2## ## ### ## ###### ## ## ## "
|
$C2## ## ### ## ###### ## ## ## "
|
||||||
|
|
||||||
|
#define ASCII_AMPERE \
|
||||||
|
"$C1 \
|
||||||
|
$C1 \
|
||||||
|
$C1 ## \
|
||||||
|
$C1 #### \
|
||||||
|
$C1 ### ## \
|
||||||
|
$C1 ### ### \
|
||||||
|
$C1 ### ### \
|
||||||
|
$C1 ### ### \
|
||||||
|
$C1 ## ### \
|
||||||
|
$C1 ####### ### ### \
|
||||||
|
$C1 ###### ## ###### ### \
|
||||||
|
$C1 #### ### ######## \
|
||||||
|
$C1 #### ### #### \
|
||||||
|
$C1 ### ### #### \
|
||||||
|
$C1 ## ### ### \
|
||||||
|
$C1 \
|
||||||
|
$C1 "
|
||||||
|
|
||||||
// --------------------- LONG LOGOS ------------------------- //
|
// --------------------- LONG LOGOS ------------------------- //
|
||||||
#define ASCII_AMD_L \
|
#define ASCII_AMD_L \
|
||||||
"$C1 \
|
"$C1 \
|
||||||
@@ -538,6 +570,7 @@ typedef struct ascii_logo asciiL;
|
|||||||
asciiL logo_amd = { ASCII_AMD, 39, 15, false, {C_FG_WHITE, C_FG_GREEN}, {C_FG_WHITE, C_FG_GREEN} };
|
asciiL logo_amd = { ASCII_AMD, 39, 15, false, {C_FG_WHITE, C_FG_GREEN}, {C_FG_WHITE, C_FG_GREEN} };
|
||||||
asciiL logo_intel = { ASCII_INTEL, 48, 14, false, {C_FG_CYAN}, {C_FG_CYAN, C_FG_WHITE} };
|
asciiL logo_intel = { ASCII_INTEL, 48, 14, false, {C_FG_CYAN}, {C_FG_CYAN, C_FG_WHITE} };
|
||||||
asciiL logo_intel_new = { ASCII_INTEL_NEW, 51, 9, false, {C_FG_CYAN}, {C_FG_CYAN, C_FG_WHITE} };
|
asciiL logo_intel_new = { ASCII_INTEL_NEW, 51, 9, false, {C_FG_CYAN}, {C_FG_CYAN, C_FG_WHITE} };
|
||||||
|
asciiL logo_hygon = { ASCII_HYGON, 51, 11, false, {C_FG_RED}, {C_FG_RED, C_FG_WHITE} };
|
||||||
asciiL logo_snapd = { ASCII_SNAPD, 39, 16, false, {C_FG_RED, C_FG_WHITE}, {C_FG_RED, C_FG_WHITE} };
|
asciiL logo_snapd = { ASCII_SNAPD, 39, 16, false, {C_FG_RED, C_FG_WHITE}, {C_FG_RED, C_FG_WHITE} };
|
||||||
asciiL logo_mtk = { ASCII_MTK, 59, 5, false, {C_FG_BLUE, C_FG_YELLOW}, {C_FG_BLUE, C_FG_YELLOW} };
|
asciiL logo_mtk = { ASCII_MTK, 59, 5, false, {C_FG_BLUE, C_FG_YELLOW}, {C_FG_BLUE, C_FG_YELLOW} };
|
||||||
asciiL logo_exynos = { ASCII_EXYNOS, 22, 13, true, {C_BG_BLUE, C_FG_WHITE}, {C_FG_BLUE, C_FG_WHITE} };
|
asciiL logo_exynos = { ASCII_EXYNOS, 22, 13, true, {C_BG_BLUE, C_FG_WHITE}, {C_FG_BLUE, C_FG_WHITE} };
|
||||||
@@ -555,6 +588,7 @@ asciiL logo_sifive = { ASCII_SIFIVE, 48, 19, true, {C_BG_WHITE, C_BG_
|
|||||||
asciiL logo_starfive = { ASCII_STARFIVE, 33, 17, false, {C_FG_WHITE}, {C_FG_WHITE, C_FG_BLUE} };
|
asciiL logo_starfive = { ASCII_STARFIVE, 33, 17, false, {C_FG_WHITE}, {C_FG_WHITE, C_FG_BLUE} };
|
||||||
asciiL logo_sipeed = { ASCII_SIPEED, 41, 16, true, {C_BG_RED, C_BG_WHITE}, {C_FG_RED, C_FG_WHITE} };
|
asciiL logo_sipeed = { ASCII_SIPEED, 41, 16, true, {C_BG_RED, C_BG_WHITE}, {C_FG_RED, C_FG_WHITE} };
|
||||||
asciiL logo_nvidia = { ASCII_NVIDIA, 45, 19, false, {C_FG_GREEN, C_FG_WHITE}, {C_FG_WHITE, C_FG_GREEN} };
|
asciiL logo_nvidia = { ASCII_NVIDIA, 45, 19, false, {C_FG_GREEN, C_FG_WHITE}, {C_FG_WHITE, C_FG_GREEN} };
|
||||||
|
asciiL logo_ampere = { ASCII_AMPERE, 50, 17, false, {C_FG_RED}, {C_FG_WHITE, C_FG_RED} };
|
||||||
|
|
||||||
// Long variants | ----------------------------------------------------------------------------------------------------------------|
|
// Long variants | ----------------------------------------------------------------------------------------------------------------|
|
||||||
asciiL logo_amd_l = { ASCII_AMD_L, 62, 19, true, {C_BG_WHITE, C_BG_GREEN}, {C_FG_WHITE, C_FG_GREEN} };
|
asciiL logo_amd_l = { ASCII_AMD_L, 62, 19, true, {C_BG_WHITE, C_BG_GREEN}, {C_FG_WHITE, C_FG_GREEN} };
|
||||||
|
|||||||
@@ -145,17 +145,25 @@ char* get_str_l3(struct cache* cach) {
|
|||||||
|
|
||||||
char* get_str_freq(struct frequency* freq) {
|
char* get_str_freq(struct frequency* freq) {
|
||||||
//Max 3 digits and 3 for '(M/G)Hz' plus 1 for '\0'
|
//Max 3 digits and 3 for '(M/G)Hz' plus 1 for '\0'
|
||||||
uint32_t size = (5+1+3+1);
|
uint32_t size = (1+5+1+3+1);
|
||||||
assert(strlen(STRING_UNKNOWN)+1 <= size);
|
assert(strlen(STRING_UNKNOWN)+1 <= size);
|
||||||
char* string = emalloc(sizeof(char)*size);
|
char* string = ecalloc(size, sizeof(char));
|
||||||
memset(string, 0, sizeof(char)*size);
|
|
||||||
|
|
||||||
if(freq->max == UNKNOWN_DATA || freq->max < 0)
|
if(freq->max == UNKNOWN_DATA || freq->max < 0) {
|
||||||
snprintf(string,strlen(STRING_UNKNOWN)+1,STRING_UNKNOWN);
|
snprintf(string,strlen(STRING_UNKNOWN)+1,STRING_UNKNOWN);
|
||||||
else if(freq->max >= 1000)
|
}
|
||||||
snprintf(string,size,"%.3f "STRING_GIGAHERZ,(float)(freq->max)/1000);
|
else if(freq->max >= 1000) {
|
||||||
else
|
if (freq->measured)
|
||||||
snprintf(string,size,"%d "STRING_MEGAHERZ,freq->max);
|
snprintf(string,size,"~%.3f "STRING_GIGAHERZ,(float)(freq->max)/1000);
|
||||||
|
else
|
||||||
|
snprintf(string,size,"%.3f "STRING_GIGAHERZ,(float)(freq->max)/1000);
|
||||||
|
}
|
||||||
|
else {
|
||||||
|
if (freq->measured)
|
||||||
|
snprintf(string,size,"~%d "STRING_MEGAHERZ,freq->max);
|
||||||
|
else
|
||||||
|
snprintf(string,size,"%d "STRING_MEGAHERZ,freq->max);
|
||||||
|
}
|
||||||
|
|
||||||
return string;
|
return string;
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -8,6 +8,7 @@ enum {
|
|||||||
// ARCH_X86
|
// ARCH_X86
|
||||||
CPU_VENDOR_INTEL,
|
CPU_VENDOR_INTEL,
|
||||||
CPU_VENDOR_AMD,
|
CPU_VENDOR_AMD,
|
||||||
|
CPU_VENDOR_HYGON,
|
||||||
// ARCH_ARM
|
// ARCH_ARM
|
||||||
CPU_VENDOR_ARM,
|
CPU_VENDOR_ARM,
|
||||||
CPU_VENDOR_APPLE,
|
CPU_VENDOR_APPLE,
|
||||||
@@ -57,6 +58,8 @@ typedef int32_t VENDOR;
|
|||||||
struct frequency {
|
struct frequency {
|
||||||
int32_t base;
|
int32_t base;
|
||||||
int32_t max;
|
int32_t max;
|
||||||
|
// Indicates if max frequency was measured
|
||||||
|
bool measured;
|
||||||
};
|
};
|
||||||
|
|
||||||
struct hypervisor {
|
struct hypervisor {
|
||||||
@@ -121,6 +124,9 @@ struct features {
|
|||||||
bool SHA1;
|
bool SHA1;
|
||||||
bool SHA2;
|
bool SHA2;
|
||||||
bool CRC32;
|
bool CRC32;
|
||||||
|
bool SVE;
|
||||||
|
bool SVE2;
|
||||||
|
uint64_t cntb;
|
||||||
#endif
|
#endif
|
||||||
};
|
};
|
||||||
|
|
||||||
|
|||||||
195
src/common/freq.c
Normal file
195
src/common/freq.c
Normal file
@@ -0,0 +1,195 @@
|
|||||||
|
#ifdef __linux__
|
||||||
|
|
||||||
|
#define _GNU_SOURCE
|
||||||
|
|
||||||
|
#include <time.h>
|
||||||
|
#include <stdio.h>
|
||||||
|
#include <stdint.h>
|
||||||
|
#include <string.h>
|
||||||
|
#include <errno.h>
|
||||||
|
#include <unistd.h>
|
||||||
|
#include <asm/unistd.h>
|
||||||
|
#include <sys/ioctl.h>
|
||||||
|
#include <linux/perf_event.h>
|
||||||
|
|
||||||
|
#include "global.h"
|
||||||
|
#include "cpu.h"
|
||||||
|
|
||||||
|
static long
|
||||||
|
perf_event_open(struct perf_event_attr *hw_event, pid_t pid,
|
||||||
|
int cpu, int group_fd, unsigned long flags) {
|
||||||
|
int ret;
|
||||||
|
ret = syscall(__NR_perf_event_open, hw_event, pid, cpu,
|
||||||
|
group_fd, flags);
|
||||||
|
return ret;
|
||||||
|
}
|
||||||
|
|
||||||
|
#define INSERT_ASM_ONCE __asm volatile("nop");
|
||||||
|
#define INSERT_ASM_10_TIMES \
|
||||||
|
INSERT_ASM_ONCE \
|
||||||
|
INSERT_ASM_ONCE \
|
||||||
|
INSERT_ASM_ONCE \
|
||||||
|
INSERT_ASM_ONCE \
|
||||||
|
INSERT_ASM_ONCE \
|
||||||
|
INSERT_ASM_ONCE \
|
||||||
|
INSERT_ASM_ONCE \
|
||||||
|
INSERT_ASM_ONCE \
|
||||||
|
INSERT_ASM_ONCE \
|
||||||
|
INSERT_ASM_ONCE \
|
||||||
|
|
||||||
|
#define INSERT_ASM_100_TIMES \
|
||||||
|
INSERT_ASM_10_TIMES \
|
||||||
|
INSERT_ASM_10_TIMES \
|
||||||
|
INSERT_ASM_10_TIMES \
|
||||||
|
INSERT_ASM_10_TIMES \
|
||||||
|
INSERT_ASM_10_TIMES \
|
||||||
|
INSERT_ASM_10_TIMES \
|
||||||
|
INSERT_ASM_10_TIMES \
|
||||||
|
INSERT_ASM_10_TIMES \
|
||||||
|
INSERT_ASM_10_TIMES \
|
||||||
|
INSERT_ASM_10_TIMES
|
||||||
|
|
||||||
|
#define INSERT_ASM_1000_TIMES \
|
||||||
|
INSERT_ASM_100_TIMES \
|
||||||
|
INSERT_ASM_100_TIMES \
|
||||||
|
INSERT_ASM_100_TIMES \
|
||||||
|
INSERT_ASM_100_TIMES \
|
||||||
|
INSERT_ASM_100_TIMES \
|
||||||
|
INSERT_ASM_100_TIMES \
|
||||||
|
INSERT_ASM_100_TIMES \
|
||||||
|
INSERT_ASM_100_TIMES \
|
||||||
|
INSERT_ASM_100_TIMES \
|
||||||
|
INSERT_ASM_100_TIMES \
|
||||||
|
|
||||||
|
void nop_function(uint64_t iters) {
|
||||||
|
for (uint64_t i = 0; i < iters; i++) {
|
||||||
|
INSERT_ASM_1000_TIMES
|
||||||
|
INSERT_ASM_1000_TIMES
|
||||||
|
INSERT_ASM_1000_TIMES
|
||||||
|
INSERT_ASM_1000_TIMES
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
// Run the nop_function with the number of iterations specified and
|
||||||
|
// measure both the time and number of cycles
|
||||||
|
int measure_freq_iters(uint64_t iters, uint32_t core, double* freq) {
|
||||||
|
clockid_t clock = CLOCK_PROCESS_CPUTIME_ID;
|
||||||
|
struct timespec start, end;
|
||||||
|
struct perf_event_attr pe;
|
||||||
|
uint64_t cycles;
|
||||||
|
int fd;
|
||||||
|
int pid = 0;
|
||||||
|
memset(&pe, 0, sizeof(struct perf_event_attr));
|
||||||
|
pe.type = PERF_TYPE_HARDWARE;
|
||||||
|
pe.size = sizeof(struct perf_event_attr);
|
||||||
|
pe.config = PERF_COUNT_HW_CPU_CYCLES;
|
||||||
|
pe.disabled = 1;
|
||||||
|
pe.exclude_kernel = 1;
|
||||||
|
pe.exclude_hv = 1;
|
||||||
|
|
||||||
|
fd = perf_event_open(&pe, pid, core, -1, 0);
|
||||||
|
if (fd == -1) {
|
||||||
|
perror("perf_event_open");
|
||||||
|
if (errno == EPERM || errno == EACCES) {
|
||||||
|
printErr("You may not have permission to collect stats.\n"\
|
||||||
|
"Consider tweaking /proc/sys/kernel/perf_event_paranoid or running as root");
|
||||||
|
}
|
||||||
|
return -1;
|
||||||
|
}
|
||||||
|
|
||||||
|
if (clock_gettime(clock, &start) == -1) {
|
||||||
|
perror("clock_gettime");
|
||||||
|
return -1;
|
||||||
|
}
|
||||||
|
if(ioctl(fd, PERF_EVENT_IOC_RESET, 0) == -1) {
|
||||||
|
perror("ioctl");
|
||||||
|
return -1;
|
||||||
|
}
|
||||||
|
if(ioctl(fd, PERF_EVENT_IOC_ENABLE, 0) == -1) {
|
||||||
|
perror("ioctl");
|
||||||
|
return -1;
|
||||||
|
}
|
||||||
|
|
||||||
|
nop_function(iters);
|
||||||
|
|
||||||
|
ssize_t ret = read(fd, &cycles, sizeof(uint64_t));
|
||||||
|
if (ret == -1) {
|
||||||
|
perror("read");
|
||||||
|
return -1;
|
||||||
|
}
|
||||||
|
if (ret != sizeof(uint64_t)) {
|
||||||
|
printErr("Read returned %d, expected %d", ret, sizeof(uint64_t));
|
||||||
|
return -1;
|
||||||
|
}
|
||||||
|
if(ioctl(fd, PERF_EVENT_IOC_DISABLE, 0) == -1) {
|
||||||
|
perror("ioctl");
|
||||||
|
return -1;
|
||||||
|
}
|
||||||
|
if (clock_gettime(clock, &end) == -1) {
|
||||||
|
perror("clock_gettime");
|
||||||
|
return -1;
|
||||||
|
}
|
||||||
|
|
||||||
|
uint64_t nsecs = (end.tv_sec*1e9 + end.tv_nsec) - (start.tv_sec*1e9 + start.tv_nsec);
|
||||||
|
uint64_t usecs = nsecs/1000;
|
||||||
|
*freq = cycles/((double)usecs);
|
||||||
|
return 0;
|
||||||
|
}
|
||||||
|
|
||||||
|
// Return a good number of iterations to run the nop_function in
|
||||||
|
// order to get a precise measurement of the frequency without taking
|
||||||
|
// too much time.
|
||||||
|
uint64_t get_num_iters_from_freq(double frequency) {
|
||||||
|
// Truncate to reduce variability
|
||||||
|
uint64_t freq_trunc = ((uint64_t) frequency / 100) * 100;
|
||||||
|
uint64_t osp_per_iter = 4 * 1000;
|
||||||
|
|
||||||
|
return freq_trunc * 1e7 * 1/osp_per_iter;
|
||||||
|
}
|
||||||
|
|
||||||
|
// Differences between x86 measure_frequency and this measure_max_frequency:
|
||||||
|
// - measure_frequency employs all cores simultaneously whereas
|
||||||
|
// measure_max_frequency only employs 1.
|
||||||
|
// - measure_frequency runs the computation and checks /proc/cpuinfo whereas
|
||||||
|
// measure_max_frequency does not rely on /proc/cpuinfo and simply
|
||||||
|
// counts cpu cycles to measure frequency.
|
||||||
|
// - measure_frequency uses actual computation while measuring the frequency
|
||||||
|
// whereas measure_max_frequency uses nop instructions. This makes the former
|
||||||
|
// x86 dependant whereas the latter is architecture independant.
|
||||||
|
int64_t measure_max_frequency(uint32_t core) {
|
||||||
|
if (!bind_to_cpu(core)) {
|
||||||
|
printErr("Failed binding the process to CPU %d", core);
|
||||||
|
return UNKNOWN_DATA;
|
||||||
|
}
|
||||||
|
|
||||||
|
// First, get very rough estimation of clock cycle to
|
||||||
|
// compute a reasonable value for the iterations
|
||||||
|
double estimation_freq, frequency;
|
||||||
|
uint64_t iters = 100000;
|
||||||
|
if (measure_freq_iters(iters, core, &estimation_freq) == -1)
|
||||||
|
return UNKNOWN_DATA;
|
||||||
|
|
||||||
|
if (estimation_freq <= 0.0) {
|
||||||
|
printErr("First frequency measurement yielded an invalid value: %f", estimation_freq);
|
||||||
|
return UNKNOWN_DATA;
|
||||||
|
}
|
||||||
|
iters = get_num_iters_from_freq(estimation_freq);
|
||||||
|
printWarn("Running frequency measurement with %ld iterations on core %d...", iters, core);
|
||||||
|
|
||||||
|
// Now perform actual measurement
|
||||||
|
const char* frequency_banner = "cpufetch is measuring the max frequency...";
|
||||||
|
printf("%s", frequency_banner);
|
||||||
|
fflush(stdout);
|
||||||
|
|
||||||
|
if (measure_freq_iters(iters, core, &frequency) == -1)
|
||||||
|
return UNKNOWN_DATA;
|
||||||
|
|
||||||
|
// Clean screen once measurement is finished
|
||||||
|
printf("\r%*c\r", (int) strlen(frequency_banner), ' ');
|
||||||
|
|
||||||
|
// Discard last digit in the frequency, which should help providing
|
||||||
|
// more reliable and predictable values.
|
||||||
|
return (((int) frequency + 5)/10) * 10;
|
||||||
|
}
|
||||||
|
|
||||||
|
#endif // #ifdef __linux__
|
||||||
6
src/common/freq.h
Normal file
6
src/common/freq.h
Normal file
@@ -0,0 +1,6 @@
|
|||||||
|
#ifndef __COMMON_FREQ__
|
||||||
|
#define __COMMON_FREQ__
|
||||||
|
|
||||||
|
int64_t measure_max_frequency(uint32_t core);
|
||||||
|
|
||||||
|
#endif
|
||||||
@@ -1,3 +1,14 @@
|
|||||||
|
#ifdef _WIN32
|
||||||
|
#define NOMINMAX
|
||||||
|
#include <windows.h>
|
||||||
|
#elif defined __linux__
|
||||||
|
#define _GNU_SOURCE
|
||||||
|
#include <sched.h>
|
||||||
|
#elif defined __FreeBSD__
|
||||||
|
#include <sys/param.h>
|
||||||
|
#include <sys/cpuset.h>
|
||||||
|
#endif
|
||||||
|
|
||||||
#include <stdarg.h>
|
#include <stdarg.h>
|
||||||
#include <stdio.h>
|
#include <stdio.h>
|
||||||
#include <stdlib.h>
|
#include <stdlib.h>
|
||||||
@@ -51,7 +62,7 @@
|
|||||||
#endif
|
#endif
|
||||||
|
|
||||||
#ifndef GIT_FULL_VERSION
|
#ifndef GIT_FULL_VERSION
|
||||||
static const char* VERSION = "1.05";
|
static const char* VERSION = "1.06";
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
enum {
|
enum {
|
||||||
@@ -199,6 +210,34 @@ void* erealloc(void *ptr, size_t size) {
|
|||||||
return newptr;
|
return newptr;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
#ifndef __APPLE__
|
||||||
|
bool bind_to_cpu(int cpu_id) {
|
||||||
|
#ifdef _WIN32
|
||||||
|
HANDLE process = GetCurrentProcess();
|
||||||
|
DWORD_PTR processAffinityMask = 1 << cpu_id;
|
||||||
|
return SetProcessAffinityMask(process, processAffinityMask);
|
||||||
|
#elif defined __linux__
|
||||||
|
cpu_set_t currentCPU;
|
||||||
|
CPU_ZERO(¤tCPU);
|
||||||
|
CPU_SET(cpu_id, ¤tCPU);
|
||||||
|
if (sched_setaffinity (0, sizeof(currentCPU), ¤tCPU) == -1) {
|
||||||
|
printWarn("sched_setaffinity: %s", strerror(errno));
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
return true;
|
||||||
|
#elif defined __FreeBSD__
|
||||||
|
cpuset_t currentCPU;
|
||||||
|
CPU_ZERO(¤tCPU);
|
||||||
|
CPU_SET(cpu_id, ¤tCPU);
|
||||||
|
if(cpuset_setaffinity(CPU_LEVEL_WHICH, CPU_WHICH_TID, -1, sizeof(cpuset_t), ¤tCPU) == -1) {
|
||||||
|
printWarn("cpuset_setaffinity: %s", strerror(errno));
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
return true;
|
||||||
|
#endif
|
||||||
|
}
|
||||||
|
#endif
|
||||||
|
|
||||||
void print_version(FILE *restrict stream) {
|
void print_version(FILE *restrict stream) {
|
||||||
#ifdef GIT_FULL_VERSION
|
#ifdef GIT_FULL_VERSION
|
||||||
fprintf(stream, "cpufetch %s (%s %s)\n", GIT_FULL_VERSION, OS_STR, ARCH_STR);
|
fprintf(stream, "cpufetch %s (%s %s)\n", GIT_FULL_VERSION, OS_STR, ARCH_STR);
|
||||||
|
|||||||
@@ -19,6 +19,9 @@ char *strremove(char *str, const char *sub);
|
|||||||
void* emalloc(size_t size);
|
void* emalloc(size_t size);
|
||||||
void* ecalloc(size_t nmemb, size_t size);
|
void* ecalloc(size_t nmemb, size_t size);
|
||||||
void* erealloc(void *ptr, size_t size);
|
void* erealloc(void *ptr, size_t size);
|
||||||
|
#ifndef __APPLE__
|
||||||
|
bool bind_to_cpu(int cpu_id);
|
||||||
|
#endif
|
||||||
void print_version(FILE *restrict stream);
|
void print_version(FILE *restrict stream);
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
|||||||
@@ -30,11 +30,17 @@ void print_help(char *argv[]) {
|
|||||||
#ifdef ARCH_X86
|
#ifdef ARCH_X86
|
||||||
#ifdef __linux__
|
#ifdef __linux__
|
||||||
printf(" --%s %*s Compute the peak performance accurately (measure the CPU frequency instead of using the maximum)\n", t[ARG_ACCURATE_PP], (int) (max_len-strlen(t[ARG_ACCURATE_PP])), "");
|
printf(" --%s %*s Compute the peak performance accurately (measure the CPU frequency instead of using the maximum)\n", t[ARG_ACCURATE_PP], (int) (max_len-strlen(t[ARG_ACCURATE_PP])), "");
|
||||||
#endif
|
printf(" --%s %*s Measure the max CPU frequency instead of reading it\n", t[ARG_MEASURE_MAX_FREQ], (int) (max_len-strlen(t[ARG_MEASURE_MAX_FREQ])), "");
|
||||||
|
#endif // __linux__
|
||||||
printf(" --%s %*s Show the old Intel logo\n", t[ARG_LOGO_INTEL_OLD], (int) (max_len-strlen(t[ARG_LOGO_INTEL_OLD])), "");
|
printf(" --%s %*s Show the old Intel logo\n", t[ARG_LOGO_INTEL_OLD], (int) (max_len-strlen(t[ARG_LOGO_INTEL_OLD])), "");
|
||||||
printf(" --%s %*s Show the new Intel logo\n", t[ARG_LOGO_INTEL_NEW], (int) (max_len-strlen(t[ARG_LOGO_INTEL_NEW])), "");
|
printf(" --%s %*s Show the new Intel logo\n", t[ARG_LOGO_INTEL_NEW], (int) (max_len-strlen(t[ARG_LOGO_INTEL_NEW])), "");
|
||||||
printf(" -%c, --%s %*s Show the full CPU name (do not abbreviate it)\n", c[ARG_FULLCPUNAME], t[ARG_FULLCPUNAME], (int) (max_len-strlen(t[ARG_FULLCPUNAME])), "");
|
printf(" -%c, --%s %*s Show the full CPU name (do not abbreviate it)\n", c[ARG_FULLCPUNAME], t[ARG_FULLCPUNAME], (int) (max_len-strlen(t[ARG_FULLCPUNAME])), "");
|
||||||
printf(" -%c, --%s %*s Print raw cpuid data (debug purposes)\n", c[ARG_RAW], t[ARG_RAW], (int) (max_len-strlen(t[ARG_RAW])), "");
|
printf(" -%c, --%s %*s Print raw cpuid data (debug purposes)\n", c[ARG_RAW], t[ARG_RAW], (int) (max_len-strlen(t[ARG_RAW])), "");
|
||||||
|
#endif // ARCH_X86
|
||||||
|
#ifdef ARCH_ARM
|
||||||
|
#ifdef __linux__
|
||||||
|
printf(" --%s %*s Measure the max CPU frequency instead of reading it\n", t[ARG_MEASURE_MAX_FREQ], (int) (max_len-strlen(t[ARG_MEASURE_MAX_FREQ])), "");
|
||||||
|
#endif
|
||||||
#endif
|
#endif
|
||||||
printf(" -%c, --%s %*s Print this help and exit\n", c[ARG_HELP], t[ARG_HELP], (int) (max_len-strlen(t[ARG_HELP])), "");
|
printf(" -%c, --%s %*s Print this help and exit\n", c[ARG_HELP], t[ARG_HELP], (int) (max_len-strlen(t[ARG_HELP])), "");
|
||||||
printf(" -%c, --%s %*s Print cpufetch version and exit\n", c[ARG_VERSION], t[ARG_VERSION], (int) (max_len-strlen(t[ARG_VERSION])), "");
|
printf(" -%c, --%s %*s Print cpufetch version and exit\n", c[ARG_VERSION], t[ARG_VERSION], (int) (max_len-strlen(t[ARG_VERSION])), "");
|
||||||
@@ -45,7 +51,7 @@ void print_help(char *argv[]) {
|
|||||||
printf(" * \"amd\": Use AMD color scheme \n");
|
printf(" * \"amd\": Use AMD color scheme \n");
|
||||||
printf(" * \"ibm\", Use IBM color scheme \n");
|
printf(" * \"ibm\", Use IBM color scheme \n");
|
||||||
printf(" * \"arm\": Use ARM color scheme \n");
|
printf(" * \"arm\": Use ARM color scheme \n");
|
||||||
printf(" * \"rockchip\": Use ARM color scheme \n");
|
printf(" * \"rockchip\": Use Rockchip color scheme \n");
|
||||||
printf(" * \"sifive\": Use SiFive color scheme \n");
|
printf(" * \"sifive\": Use SiFive color scheme \n");
|
||||||
printf(" * custom: If the argument of --color does not match any of the previous strings, a custom scheme can be specified.\n");
|
printf(" * custom: If the argument of --color does not match any of the previous strings, a custom scheme can be specified.\n");
|
||||||
printf(" 5 colors must be given in RGB with the format: R,G,B:R,G,B:...\n");
|
printf(" 5 colors must be given in RGB with the format: R,G,B:R,G,B:...\n");
|
||||||
@@ -80,6 +86,11 @@ void print_help(char *argv[]) {
|
|||||||
printf(" --accurate-pp option, which will measure the AVX frequency and show a more precise estimation\n");
|
printf(" --accurate-pp option, which will measure the AVX frequency and show a more precise estimation\n");
|
||||||
printf(" (this option is only available in x86 architectures).\n");
|
printf(" (this option is only available in x86 architectures).\n");
|
||||||
printf(" To precisely measure peak performance, see: https://github.com/Dr-Noob/peakperf\n");
|
printf(" To precisely measure peak performance, see: https://github.com/Dr-Noob/peakperf\n");
|
||||||
|
printf("\n");
|
||||||
|
printf(" Both --accurate-pp and --measure-max-freq measure the actual frequency of the CPU. However,\n");
|
||||||
|
printf(" they differ slightly. The former measures the max frequency while running vectorized SSE/AVX\n");
|
||||||
|
printf(" instructions and it is thus x86 only, whereas the latter simply measures the max clock cycle\n");
|
||||||
|
printf(" and is architecture independent.\n");
|
||||||
}
|
}
|
||||||
|
|
||||||
int main(int argc, char* argv[]) {
|
int main(int argc, char* argv[]) {
|
||||||
|
|||||||
@@ -14,14 +14,6 @@
|
|||||||
#define PCI_PATH "/sys/bus/pci/devices/"
|
#define PCI_PATH "/sys/bus/pci/devices/"
|
||||||
#define MAX_LENGTH_PCI_DIR_NAME 1024
|
#define MAX_LENGTH_PCI_DIR_NAME 1024
|
||||||
|
|
||||||
/*
|
|
||||||
* doc: https://wiki.osdev.org/PCI#Class_Codes
|
|
||||||
* https://pci-ids.ucw.cz/read/PC
|
|
||||||
*/
|
|
||||||
#define PCI_VENDOR_ID_AMD 0x1002
|
|
||||||
#define CLASS_VGA_CONTROLLER 0x0300
|
|
||||||
#define CLASS_3D_CONTROLLER 0x0302
|
|
||||||
|
|
||||||
// Return a list of PCI devices containing only
|
// Return a list of PCI devices containing only
|
||||||
// the sysfs path
|
// the sysfs path
|
||||||
struct pci_devices * get_pci_paths(void) {
|
struct pci_devices * get_pci_paths(void) {
|
||||||
@@ -98,9 +90,9 @@ void populate_pci_devices(struct pci_devices * pci) {
|
|||||||
int path_size = strlen(PCI_PATH) + strlen(dev->path) + 2;
|
int path_size = strlen(PCI_PATH) + strlen(dev->path) + 2;
|
||||||
|
|
||||||
// Read vendor_id
|
// Read vendor_id
|
||||||
char *vendor_id_path = emalloc(sizeof(char) * (path_size + strlen("vendor")));
|
char *vendor_id_path = emalloc(sizeof(char) * (path_size + strlen("vendor") + 1));
|
||||||
sprintf(vendor_id_path, "%s/%s/%s", PCI_PATH, dev->path, "vendor");
|
sprintf(vendor_id_path, "%s/%s/%s", PCI_PATH, dev->path, "vendor");
|
||||||
|
|
||||||
if ((buf = read_file(vendor_id_path, &filelen)) == NULL) {
|
if ((buf = read_file(vendor_id_path, &filelen)) == NULL) {
|
||||||
printWarn("read_file: %s: %s\n", vendor_id_path, strerror(errno));
|
printWarn("read_file: %s: %s\n", vendor_id_path, strerror(errno));
|
||||||
dev->vendor_id = 0;
|
dev->vendor_id = 0;
|
||||||
@@ -110,7 +102,7 @@ void populate_pci_devices(struct pci_devices * pci) {
|
|||||||
}
|
}
|
||||||
|
|
||||||
// Read device_id
|
// Read device_id
|
||||||
char *device_id_path = emalloc(sizeof(char) * (path_size + strlen("device")));
|
char *device_id_path = emalloc(sizeof(char) * (path_size + strlen("device") + 1));
|
||||||
sprintf(device_id_path, "%s/%s/%s", PCI_PATH, dev->path, "device");
|
sprintf(device_id_path, "%s/%s/%s", PCI_PATH, dev->path, "device");
|
||||||
|
|
||||||
if ((buf = read_file(device_id_path, &filelen)) == NULL) {
|
if ((buf = read_file(device_id_path, &filelen)) == NULL) {
|
||||||
@@ -126,43 +118,6 @@ void populate_pci_devices(struct pci_devices * pci) {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
// Right now, we are interested in PCI devices which
|
|
||||||
// vendor is NVIDIA (to be extended in the future).
|
|
||||||
// Should we also restrict to VGA controllers only?
|
|
||||||
bool pci_device_is_useful(struct pci_device* dev) {
|
|
||||||
return dev->vendor_id == PCI_VENDOR_NVIDIA;
|
|
||||||
}
|
|
||||||
|
|
||||||
// Filter the input list in order to get only those PCI devices which
|
|
||||||
// we are interested in (decided by pci_device_is_useful)
|
|
||||||
// and return the filtered result.
|
|
||||||
struct pci_devices * filter_pci_devices(struct pci_devices * pci) {
|
|
||||||
int * devices_to_get = emalloc(sizeof(int) * pci->num_devices);
|
|
||||||
int dev_ptr = 0;
|
|
||||||
|
|
||||||
for (int i=0; i < pci->num_devices; i++) {
|
|
||||||
if (pci_device_is_useful(pci->devices[i])) {
|
|
||||||
devices_to_get[dev_ptr] = i;
|
|
||||||
dev_ptr++;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
struct pci_devices * pci_filtered = emalloc(sizeof(struct pci_devices));
|
|
||||||
pci_filtered->num_devices = dev_ptr;
|
|
||||||
|
|
||||||
if (pci_filtered->num_devices == 0) {
|
|
||||||
pci_filtered->devices = NULL;
|
|
||||||
}
|
|
||||||
else {
|
|
||||||
pci_filtered->devices = emalloc(sizeof(struct pci_device) * pci_filtered->num_devices);
|
|
||||||
|
|
||||||
for (int i=0; i < pci_filtered->num_devices; i++)
|
|
||||||
pci_filtered->devices[i] = pci->devices[devices_to_get[i]];
|
|
||||||
}
|
|
||||||
|
|
||||||
return pci_filtered;
|
|
||||||
}
|
|
||||||
|
|
||||||
// Return a list of PCI devices that could be used to infer the SoC.
|
// Return a list of PCI devices that could be used to infer the SoC.
|
||||||
// The criteria to determine which devices are suitable for this task
|
// The criteria to determine which devices are suitable for this task
|
||||||
// is decided in filter_pci_devices.
|
// is decided in filter_pci_devices.
|
||||||
@@ -174,5 +129,5 @@ struct pci_devices * get_pci_devices(void) {
|
|||||||
|
|
||||||
populate_pci_devices(pci);
|
populate_pci_devices(pci);
|
||||||
|
|
||||||
return filter_pci_devices(pci);
|
return pci;
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -1,8 +1,11 @@
|
|||||||
#ifndef __PCI__
|
#ifndef __PCI__
|
||||||
#define __PCI__
|
#define __PCI__
|
||||||
|
|
||||||
#define PCI_VENDOR_NVIDIA 0x10de
|
#define PCI_VENDOR_NVIDIA 0x10de
|
||||||
|
#define PCI_VENDOR_AMPERE 0x1def
|
||||||
|
|
||||||
#define PCI_DEVICE_TEGRA_X1 0x0faf
|
#define PCI_DEVICE_TEGRA_X1 0x0faf
|
||||||
|
#define PCI_DEVICE_ALTRA 0xe100
|
||||||
|
|
||||||
struct pci_device {
|
struct pci_device {
|
||||||
char * path;
|
char * path;
|
||||||
|
|||||||
@@ -61,6 +61,7 @@ enum {
|
|||||||
ATTRIBUTE_NCORES,
|
ATTRIBUTE_NCORES,
|
||||||
ATTRIBUTE_NCORES_DUAL,
|
ATTRIBUTE_NCORES_DUAL,
|
||||||
#ifdef ARCH_X86
|
#ifdef ARCH_X86
|
||||||
|
ATTRIBUTE_SSE,
|
||||||
ATTRIBUTE_AVX,
|
ATTRIBUTE_AVX,
|
||||||
ATTRIBUTE_FMA,
|
ATTRIBUTE_FMA,
|
||||||
#elif ARCH_PPC
|
#elif ARCH_PPC
|
||||||
@@ -96,6 +97,7 @@ static const char* ATTRIBUTE_FIELDS [] = {
|
|||||||
"Cores:",
|
"Cores:",
|
||||||
"Cores (Total):",
|
"Cores (Total):",
|
||||||
#ifdef ARCH_X86
|
#ifdef ARCH_X86
|
||||||
|
"SSE:",
|
||||||
"AVX:",
|
"AVX:",
|
||||||
"FMA:",
|
"FMA:",
|
||||||
#elif ARCH_PPC
|
#elif ARCH_PPC
|
||||||
@@ -131,6 +133,7 @@ static const char* ATTRIBUTE_FIELDS_SHORT [] = {
|
|||||||
"Cores:",
|
"Cores:",
|
||||||
"Cores (Total):",
|
"Cores (Total):",
|
||||||
#ifdef ARCH_X86
|
#ifdef ARCH_X86
|
||||||
|
"SSE:",
|
||||||
"AVX:",
|
"AVX:",
|
||||||
"FMA:",
|
"FMA:",
|
||||||
#elif ARCH_PPC
|
#elif ARCH_PPC
|
||||||
@@ -357,6 +360,9 @@ void choose_ascii_art(struct ascii* art, struct color** cs, struct terminal* ter
|
|||||||
else if(art->vendor == CPU_VENDOR_AMD) {
|
else if(art->vendor == CPU_VENDOR_AMD) {
|
||||||
art->art = choose_ascii_art_aux(&logo_amd_l, &logo_amd, term, lf);
|
art->art = choose_ascii_art_aux(&logo_amd_l, &logo_amd, term, lf);
|
||||||
}
|
}
|
||||||
|
else if(art->vendor == CPU_VENDOR_HYGON) {
|
||||||
|
art->art = &logo_hygon;
|
||||||
|
}
|
||||||
else {
|
else {
|
||||||
art->art = &logo_unknown;
|
art->art = &logo_unknown;
|
||||||
}
|
}
|
||||||
@@ -383,6 +389,8 @@ void choose_ascii_art(struct ascii* art, struct color** cs, struct terminal* ter
|
|||||||
art->art = &logo_allwinner;
|
art->art = &logo_allwinner;
|
||||||
else if(art->vendor == SOC_VENDOR_ROCKCHIP)
|
else if(art->vendor == SOC_VENDOR_ROCKCHIP)
|
||||||
art->art = &logo_rockchip;
|
art->art = &logo_rockchip;
|
||||||
|
else if(art->vendor == SOC_VENDOR_AMPERE)
|
||||||
|
art->art = &logo_ampere;
|
||||||
else if(art->vendor == SOC_VENDOR_NVIDIA)
|
else if(art->vendor == SOC_VENDOR_NVIDIA)
|
||||||
art->art = choose_ascii_art_aux(&logo_nvidia_l, &logo_nvidia, term, lf);
|
art->art = choose_ascii_art_aux(&logo_nvidia_l, &logo_nvidia, term, lf);
|
||||||
else {
|
else {
|
||||||
@@ -591,6 +599,7 @@ bool print_cpufetch_x86(struct cpuInfo* cpu, STYLE s, struct color** cs, struct
|
|||||||
for(int i = 0; i < cpu->num_cpus; ptr = ptr->next_cpu, i++) {
|
for(int i = 0; i < cpu->num_cpus; ptr = ptr->next_cpu, i++) {
|
||||||
char* max_frequency = get_str_freq(ptr->freq);
|
char* max_frequency = get_str_freq(ptr->freq);
|
||||||
char* avx = get_str_avx(ptr);
|
char* avx = get_str_avx(ptr);
|
||||||
|
char* sse = get_str_sse(ptr);
|
||||||
char* fma = get_str_fma(ptr);
|
char* fma = get_str_fma(ptr);
|
||||||
char* cpu_num = emalloc(sizeof(char) * 9);
|
char* cpu_num = emalloc(sizeof(char) * 9);
|
||||||
|
|
||||||
@@ -625,8 +634,18 @@ bool print_cpufetch_x86(struct cpuInfo* cpu, STYLE s, struct color** cs, struct
|
|||||||
setAttribute(art, ATTRIBUTE_NCORES, n_cores);
|
setAttribute(art, ATTRIBUTE_NCORES, n_cores);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
setAttribute(art, ATTRIBUTE_AVX, avx);
|
|
||||||
setAttribute(art, ATTRIBUTE_FMA, fma);
|
// Show the most modern vector instructions.
|
||||||
|
if (strcmp(avx, "No") == 0) {
|
||||||
|
if (strcmp(sse, "No") != 0) {
|
||||||
|
setAttribute(art, ATTRIBUTE_SSE, sse);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
else {
|
||||||
|
setAttribute(art, ATTRIBUTE_AVX, avx);
|
||||||
|
setAttribute(art, ATTRIBUTE_FMA, fma);
|
||||||
|
}
|
||||||
|
|
||||||
if(l1i != NULL) setAttribute(art, ATTRIBUTE_L1i, l1i);
|
if(l1i != NULL) setAttribute(art, ATTRIBUTE_L1i, l1i);
|
||||||
if(l1d != NULL) setAttribute(art, ATTRIBUTE_L1d, l1d);
|
if(l1d != NULL) setAttribute(art, ATTRIBUTE_L1d, l1d);
|
||||||
if(l2 != NULL) setAttribute(art, ATTRIBUTE_L2, l2);
|
if(l2 != NULL) setAttribute(art, ATTRIBUTE_L2, l2);
|
||||||
|
|||||||
@@ -21,6 +21,7 @@ static char* soc_trademark_string[] = {
|
|||||||
[SOC_VENDOR_ROCKCHIP] = "Rockchip ",
|
[SOC_VENDOR_ROCKCHIP] = "Rockchip ",
|
||||||
[SOC_VENDOR_GOOGLE] = "Google ",
|
[SOC_VENDOR_GOOGLE] = "Google ",
|
||||||
[SOC_VENDOR_NVIDIA] = "NVIDIA ",
|
[SOC_VENDOR_NVIDIA] = "NVIDIA ",
|
||||||
|
[SOC_VENDOR_AMPERE] = "Ampere ",
|
||||||
// RISC-V
|
// RISC-V
|
||||||
[SOC_VENDOR_SIFIVE] = "SiFive ",
|
[SOC_VENDOR_SIFIVE] = "SiFive ",
|
||||||
[SOC_VENDOR_STARFIVE] = "StarFive ",
|
[SOC_VENDOR_STARFIVE] = "StarFive ",
|
||||||
|
|||||||
@@ -25,6 +25,7 @@ enum {
|
|||||||
SOC_VENDOR_ROCKCHIP,
|
SOC_VENDOR_ROCKCHIP,
|
||||||
SOC_VENDOR_GOOGLE,
|
SOC_VENDOR_GOOGLE,
|
||||||
SOC_VENDOR_NVIDIA,
|
SOC_VENDOR_NVIDIA,
|
||||||
|
SOC_VENDOR_AMPERE,
|
||||||
// RISC-V
|
// RISC-V
|
||||||
SOC_VENDOR_SIFIVE,
|
SOC_VENDOR_SIFIVE,
|
||||||
SOC_VENDOR_STARFIVE,
|
SOC_VENDOR_STARFIVE,
|
||||||
|
|||||||
@@ -4,8 +4,8 @@
|
|||||||
#include <string.h>
|
#include <string.h>
|
||||||
#include <errno.h>
|
#include <errno.h>
|
||||||
|
|
||||||
#include "../common/global.h"
|
#include "global.h"
|
||||||
#include "../common/cpu.h"
|
#include "cpu.h"
|
||||||
|
|
||||||
uint32_t get_sys_info_by_name(char* name) {
|
uint32_t get_sys_info_by_name(char* name) {
|
||||||
size_t size = 0;
|
size_t size = 0;
|
||||||
@@ -40,6 +40,14 @@
|
|||||||
#define CPUSUBFAMILY_ARM_HC_HD 5
|
#define CPUSUBFAMILY_ARM_HC_HD 5
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
|
// For alternative way to get CPU frequency on macOS and *BSD
|
||||||
|
#ifdef __APPLE__
|
||||||
|
#define CPUFREQUENCY_SYSCTL "hw.cpufrequency_max"
|
||||||
|
#else
|
||||||
|
// For FreeBSD, not sure about other *BSD
|
||||||
|
#define CPUFREQUENCY_SYSCTL "dev.cpu.0.freq"
|
||||||
|
#endif
|
||||||
|
|
||||||
uint32_t get_sys_info_by_name(char* name);
|
uint32_t get_sys_info_by_name(char* name);
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
@@ -1,7 +1,10 @@
|
|||||||
|
#include "../common/global.h"
|
||||||
#include "udev.h"
|
#include "udev.h"
|
||||||
#include "global.h"
|
#include "global.h"
|
||||||
#include "cpu.h"
|
#include "cpu.h"
|
||||||
|
|
||||||
|
#define _PATH_DEVTREE "/proc/device-tree/compatible"
|
||||||
|
|
||||||
// https://www.kernel.org/doc/html/latest/core-api/cpu_hotplug.html
|
// https://www.kernel.org/doc/html/latest/core-api/cpu_hotplug.html
|
||||||
int get_ncores_from_cpuinfo(void) {
|
int get_ncores_from_cpuinfo(void) {
|
||||||
// Examples:
|
// Examples:
|
||||||
@@ -349,3 +352,13 @@ bool is_devtree_compatible(char* str) {
|
|||||||
}
|
}
|
||||||
return true;
|
return true;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
char* get_devtree_compatible(int *filelen) {
|
||||||
|
char* buf;
|
||||||
|
|
||||||
|
if ((buf = read_file(_PATH_DEVTREE, filelen)) == NULL) {
|
||||||
|
printWarn("read_file: %s: %s", _PATH_DEVTREE, strerror(errno));
|
||||||
|
}
|
||||||
|
|
||||||
|
return buf;
|
||||||
|
}
|
||||||
|
|||||||
@@ -43,5 +43,6 @@ int get_num_sockets_package_cpus(struct topology* topo);
|
|||||||
int get_ncores_from_cpuinfo(void);
|
int get_ncores_from_cpuinfo(void);
|
||||||
char* get_field_from_cpuinfo(char* CPUINFO_FIELD);
|
char* get_field_from_cpuinfo(char* CPUINFO_FIELD);
|
||||||
bool is_devtree_compatible(char* str);
|
bool is_devtree_compatible(char* str);
|
||||||
|
char* get_devtree_compatible(int *filelen);
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
|||||||
@@ -146,6 +146,7 @@ struct uarch* get_cpu_uarch(struct cpuInfo* cpu) {
|
|||||||
struct frequency* get_frequency_info(void) {
|
struct frequency* get_frequency_info(void) {
|
||||||
struct frequency* freq = emalloc(sizeof(struct frequency));
|
struct frequency* freq = emalloc(sizeof(struct frequency));
|
||||||
|
|
||||||
|
freq->measured = false;
|
||||||
freq->max = get_max_freq_from_file(0);
|
freq->max = get_max_freq_from_file(0);
|
||||||
freq->base = get_min_freq_from_file(0);
|
freq->base = get_min_freq_from_file(0);
|
||||||
|
|
||||||
|
|||||||
@@ -19,6 +19,7 @@
|
|||||||
struct frequency* get_frequency_info(uint32_t core) {
|
struct frequency* get_frequency_info(uint32_t core) {
|
||||||
struct frequency* freq = emalloc(sizeof(struct frequency));
|
struct frequency* freq = emalloc(sizeof(struct frequency));
|
||||||
|
|
||||||
|
freq->measured = false;
|
||||||
freq->base = UNKNOWN_DATA;
|
freq->base = UNKNOWN_DATA;
|
||||||
freq->max = get_max_freq_from_file(core);
|
freq->max = get_max_freq_from_file(core);
|
||||||
|
|
||||||
|
|||||||
@@ -72,34 +72,6 @@ uint32_t get_apic_id(bool x2apic_id) {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
#ifndef __APPLE__
|
|
||||||
bool bind_to_cpu(int cpu_id) {
|
|
||||||
#ifdef _WIN32
|
|
||||||
HANDLE process = GetCurrentProcess();
|
|
||||||
DWORD_PTR processAffinityMask = 1 << cpu_id;
|
|
||||||
return SetProcessAffinityMask(process, processAffinityMask);
|
|
||||||
#elif defined __linux__
|
|
||||||
cpu_set_t currentCPU;
|
|
||||||
CPU_ZERO(¤tCPU);
|
|
||||||
CPU_SET(cpu_id, ¤tCPU);
|
|
||||||
if (sched_setaffinity (0, sizeof(currentCPU), ¤tCPU) == -1) {
|
|
||||||
printWarn("sched_setaffinity: %s", strerror(errno));
|
|
||||||
return false;
|
|
||||||
}
|
|
||||||
return true;
|
|
||||||
#elif defined __FreeBSD__
|
|
||||||
cpuset_t currentCPU;
|
|
||||||
CPU_ZERO(¤tCPU);
|
|
||||||
CPU_SET(cpu_id, ¤tCPU);
|
|
||||||
if(cpuset_setaffinity(CPU_LEVEL_WHICH, CPU_WHICH_TID, -1, sizeof(cpuset_t), ¤tCPU) == -1) {
|
|
||||||
printWarn("cpuset_setaffinity: %s", strerror(errno));
|
|
||||||
return false;
|
|
||||||
}
|
|
||||||
return true;
|
|
||||||
#endif
|
|
||||||
}
|
|
||||||
#endif
|
|
||||||
|
|
||||||
#ifdef __linux__
|
#ifdef __linux__
|
||||||
int get_total_cores_module(int total_cores, int module) {
|
int get_total_cores_module(int total_cores, int module) {
|
||||||
int total_modules = 2;
|
int total_modules = 2;
|
||||||
@@ -397,6 +369,11 @@ bool fill_apic_ids(uint32_t* apic_ids, int first_core, int n, bool x2apic_id) {
|
|||||||
}
|
}
|
||||||
|
|
||||||
bool get_topology_from_apic(struct cpuInfo* cpu, struct topology* topo) {
|
bool get_topology_from_apic(struct cpuInfo* cpu, struct topology* topo) {
|
||||||
|
if (topo->cach == NULL) {
|
||||||
|
printWarn("get_topology_from_apic: cach is NULL");
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
uint32_t apic_id;
|
uint32_t apic_id;
|
||||||
uint32_t* apic_ids = emalloc(sizeof(uint32_t) * topo->total_cores_module);
|
uint32_t* apic_ids = emalloc(sizeof(uint32_t) * topo->total_cores_module);
|
||||||
uint32_t* apic_pkg = emalloc(sizeof(uint32_t) * topo->total_cores_module);
|
uint32_t* apic_pkg = emalloc(sizeof(uint32_t) * topo->total_cores_module);
|
||||||
|
|||||||
@@ -17,10 +17,6 @@ struct apic {
|
|||||||
bool get_topology_from_apic(struct cpuInfo* cpu, struct topology* topo);
|
bool get_topology_from_apic(struct cpuInfo* cpu, struct topology* topo);
|
||||||
uint32_t is_smt_enabled_amd(struct topology* topo);
|
uint32_t is_smt_enabled_amd(struct topology* topo);
|
||||||
|
|
||||||
#ifndef __APPLE__
|
|
||||||
bool bind_to_cpu(int cpu_id);
|
|
||||||
#endif
|
|
||||||
|
|
||||||
#ifdef __linux__
|
#ifdef __linux__
|
||||||
int get_total_cores_module(int total_cores, int module);
|
int get_total_cores_module(int total_cores, int module);
|
||||||
#endif
|
#endif
|
||||||
|
|||||||
175
src/x86/cpuid.c
175
src/x86/cpuid.c
@@ -5,6 +5,13 @@
|
|||||||
#include "../common/udev.h"
|
#include "../common/udev.h"
|
||||||
#include <unistd.h>
|
#include <unistd.h>
|
||||||
#endif
|
#endif
|
||||||
|
#if defined (__FreeBSD__) || defined (__APPLE__)
|
||||||
|
#include "../common/sysctl.h"
|
||||||
|
#endif
|
||||||
|
|
||||||
|
#ifdef __linux__
|
||||||
|
#include "../common/freq.h"
|
||||||
|
#endif
|
||||||
|
|
||||||
#include <stdio.h>
|
#include <stdio.h>
|
||||||
#include <stdlib.h>
|
#include <stdlib.h>
|
||||||
@@ -22,6 +29,7 @@
|
|||||||
|
|
||||||
#define CPU_VENDOR_INTEL_STRING "GenuineIntel"
|
#define CPU_VENDOR_INTEL_STRING "GenuineIntel"
|
||||||
#define CPU_VENDOR_AMD_STRING "AuthenticAMD"
|
#define CPU_VENDOR_AMD_STRING "AuthenticAMD"
|
||||||
|
#define CPU_VENDOR_HYGON_STRING "HygonGenuine"
|
||||||
|
|
||||||
static const char *hv_vendors_string[] = {
|
static const char *hv_vendors_string[] = {
|
||||||
[HV_VENDOR_KVM] = "KVMKVMKVM",
|
[HV_VENDOR_KVM] = "KVMKVMKVM",
|
||||||
@@ -218,7 +226,7 @@ int64_t get_peak_performance(struct cpuInfo* cpu, bool accurate_pp) {
|
|||||||
#endif
|
#endif
|
||||||
|
|
||||||
//First, check we have consistent data
|
//First, check we have consistent data
|
||||||
if(freq == UNKNOWN_DATA || topo->logical_cores == UNKNOWN_DATA) {
|
if(freq == UNKNOWN_DATA || topo == NULL || topo->logical_cores == UNKNOWN_DATA) {
|
||||||
return -1;
|
return -1;
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -451,7 +459,7 @@ struct cpuInfo* get_cpu_info(void) {
|
|||||||
cpu->cach = NULL;
|
cpu->cach = NULL;
|
||||||
cpu->feat = NULL;
|
cpu->feat = NULL;
|
||||||
|
|
||||||
uint32_t modules = 1;
|
cpu->num_cpus = 1;
|
||||||
uint32_t eax = 0;
|
uint32_t eax = 0;
|
||||||
uint32_t ebx = 0;
|
uint32_t ebx = 0;
|
||||||
uint32_t ecx = 0;
|
uint32_t ecx = 0;
|
||||||
@@ -470,6 +478,8 @@ struct cpuInfo* get_cpu_info(void) {
|
|||||||
cpu->cpu_vendor = CPU_VENDOR_INTEL;
|
cpu->cpu_vendor = CPU_VENDOR_INTEL;
|
||||||
else if (strcmp(CPU_VENDOR_AMD_STRING,name) == 0)
|
else if (strcmp(CPU_VENDOR_AMD_STRING,name) == 0)
|
||||||
cpu->cpu_vendor = CPU_VENDOR_AMD;
|
cpu->cpu_vendor = CPU_VENDOR_AMD;
|
||||||
|
else if (strcmp(CPU_VENDOR_HYGON_STRING,name) == 0)
|
||||||
|
cpu->cpu_vendor = CPU_VENDOR_HYGON;
|
||||||
else {
|
else {
|
||||||
cpu->cpu_vendor = CPU_VENDOR_INVALID;
|
cpu->cpu_vendor = CPU_VENDOR_INVALID;
|
||||||
printErr("Unknown CPU vendor: %s", name);
|
printErr("Unknown CPU vendor: %s", name);
|
||||||
@@ -507,12 +517,12 @@ struct cpuInfo* get_cpu_info(void) {
|
|||||||
cpu->hybrid_flag = (edx >> 15) & 0x1;
|
cpu->hybrid_flag = (edx >> 15) & 0x1;
|
||||||
}
|
}
|
||||||
|
|
||||||
if(cpu->hybrid_flag) modules = 2;
|
if(cpu->hybrid_flag) cpu->num_cpus = 2;
|
||||||
|
|
||||||
struct cpuInfo* ptr = cpu;
|
struct cpuInfo* ptr = cpu;
|
||||||
for(uint32_t i=0; i < modules; i++) {
|
for(uint32_t i=0; i < cpu->num_cpus; i++) {
|
||||||
int32_t first_core;
|
int32_t first_core;
|
||||||
set_cpu_module(i, modules, &first_core);
|
set_cpu_module(i, cpu->num_cpus, &first_core);
|
||||||
|
|
||||||
if(i > 0) {
|
if(i > 0) {
|
||||||
ptr->next_cpu = emalloc(sizeof(struct cpuInfo));
|
ptr->next_cpu = emalloc(sizeof(struct cpuInfo));
|
||||||
@@ -547,11 +557,7 @@ struct cpuInfo* get_cpu_info(void) {
|
|||||||
cpu->cpu_name = infer_cpu_name_from_uarch(cpu->arch);
|
cpu->cpu_name = infer_cpu_name_from_uarch(cpu->arch);
|
||||||
}
|
}
|
||||||
|
|
||||||
// If any field of the struct is NULL,
|
|
||||||
// return early, as next functions
|
|
||||||
// require non NULL fields in cach and topo
|
|
||||||
ptr->cach = get_cache_info(ptr);
|
ptr->cach = get_cache_info(ptr);
|
||||||
if(ptr->cach == NULL) return cpu;
|
|
||||||
|
|
||||||
if(cpu->hybrid_flag) {
|
if(cpu->hybrid_flag) {
|
||||||
ptr->topo = get_topology_info(ptr, ptr->cach, i);
|
ptr->topo = get_topology_info(ptr, ptr->cach, i);
|
||||||
@@ -559,16 +565,23 @@ struct cpuInfo* get_cpu_info(void) {
|
|||||||
else {
|
else {
|
||||||
ptr->topo = get_topology_info(ptr, ptr->cach, -1);
|
ptr->topo = get_topology_info(ptr, ptr->cach, -1);
|
||||||
}
|
}
|
||||||
if(cpu->topo == NULL) return cpu;
|
|
||||||
|
// If topo is NULL, return early, as get_peak_performance
|
||||||
|
// requries non-NULL topology.
|
||||||
|
if(ptr->topo == NULL) return cpu;
|
||||||
}
|
}
|
||||||
|
|
||||||
cpu->num_cpus = modules;
|
|
||||||
cpu->peak_performance = get_peak_performance(cpu, accurate_pp());
|
cpu->peak_performance = get_peak_performance(cpu, accurate_pp());
|
||||||
|
|
||||||
return cpu;
|
return cpu;
|
||||||
}
|
}
|
||||||
|
|
||||||
bool get_cache_topology_amd(struct cpuInfo* cpu, struct topology* topo) {
|
bool get_cache_topology_amd(struct cpuInfo* cpu, struct topology* topo) {
|
||||||
|
if (topo->cach == NULL) {
|
||||||
|
printWarn("get_cache_topology_amd: cach is NULL");
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
if(cpu->maxExtendedLevels >= 0x8000001D && cpu->topology_extensions) {
|
if(cpu->maxExtendedLevels >= 0x8000001D && cpu->topology_extensions) {
|
||||||
uint32_t i, eax, ebx, ecx, edx, num_sharing_cache, cache_type, cache_level;
|
uint32_t i, eax, ebx, ecx, edx, num_sharing_cache, cache_type, cache_level;
|
||||||
|
|
||||||
@@ -644,10 +657,17 @@ bool get_cache_topology_amd(struct cpuInfo* cpu, struct topology* topo) {
|
|||||||
|
|
||||||
#ifdef __linux__
|
#ifdef __linux__
|
||||||
void get_topology_from_udev(struct topology* topo) {
|
void get_topology_from_udev(struct topology* topo) {
|
||||||
// TODO: To be improved in the future
|
|
||||||
topo->total_cores = get_ncores_from_cpuinfo();
|
topo->total_cores = get_ncores_from_cpuinfo();
|
||||||
topo->logical_cores = topo->total_cores;
|
// TODO: To be improved in the future
|
||||||
topo->physical_cores = topo->total_cores;
|
if (topo->total_cores == 1) {
|
||||||
|
// We can assume it's a single core CPU
|
||||||
|
topo->logical_cores = topo->total_cores;
|
||||||
|
topo->physical_cores = topo->total_cores;
|
||||||
|
}
|
||||||
|
else {
|
||||||
|
topo->logical_cores = UNKNOWN_DATA;
|
||||||
|
topo->physical_cores = UNKNOWN_DATA;
|
||||||
|
}
|
||||||
topo->smt_available = 1;
|
topo->smt_available = 1;
|
||||||
topo->smt_supported = 1;
|
topo->smt_supported = 1;
|
||||||
topo->sockets = 1;
|
topo->sockets = 1;
|
||||||
@@ -692,32 +712,31 @@ struct topology* get_topology_info(struct cpuInfo* cpu, struct cache* cach, int
|
|||||||
topo->total_cores_module = topo->total_cores;
|
topo->total_cores_module = topo->total_cores;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
bool toporet = false;
|
||||||
switch(cpu->cpu_vendor) {
|
switch(cpu->cpu_vendor) {
|
||||||
case CPU_VENDOR_INTEL:
|
case CPU_VENDOR_INTEL:
|
||||||
if (cpu->maxLevels >= 0x00000004) {
|
if (cpu->maxLevels >= 0x00000004) {
|
||||||
bool toporet = get_topology_from_apic(cpu, topo);
|
toporet = get_topology_from_apic(cpu, topo);
|
||||||
if(!toporet) {
|
|
||||||
#ifdef __linux__
|
|
||||||
printWarn("Failed to retrieve topology from APIC, using udev...\n");
|
|
||||||
get_topology_from_udev(topo);
|
|
||||||
#else
|
|
||||||
printErr("Failed to retrieve topology from APIC, assumming default values...\n");
|
|
||||||
topo->logical_cores = UNKNOWN_DATA;
|
|
||||||
topo->physical_cores = UNKNOWN_DATA;
|
|
||||||
topo->smt_available = 1;
|
|
||||||
topo->smt_supported = 1;
|
|
||||||
#endif
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
else {
|
else {
|
||||||
printWarn("Can't read topology information from cpuid (needed level is 0x%.8X, max is 0x%.8X)", 0x00000001, cpu->maxLevels);
|
printWarn("Can't read topology information from cpuid (needed level is 0x%.8X, max is 0x%.8X)", 0x00000004, cpu->maxLevels);
|
||||||
topo->physical_cores = 1;
|
}
|
||||||
topo->logical_cores = 1;
|
if(!toporet) {
|
||||||
topo->smt_available = 1;
|
#ifdef __linux__
|
||||||
topo->smt_supported = 1;
|
printWarn("Failed to retrieve topology from APIC, using udev...");
|
||||||
|
get_topology_from_udev(topo);
|
||||||
|
#else
|
||||||
|
if (cpu->maxLevels >= 0x00000004)
|
||||||
|
printErr("Failed to retrieve topology from APIC, assumming default values...");
|
||||||
|
topo->logical_cores = UNKNOWN_DATA;
|
||||||
|
topo->physical_cores = UNKNOWN_DATA;
|
||||||
|
topo->smt_available = 1;
|
||||||
|
topo->smt_supported = 1;
|
||||||
|
#endif
|
||||||
}
|
}
|
||||||
break;
|
break;
|
||||||
case CPU_VENDOR_AMD:
|
case CPU_VENDOR_AMD:
|
||||||
|
case CPU_VENDOR_HYGON:
|
||||||
if (cpu->maxExtendedLevels >= 0x80000008) {
|
if (cpu->maxExtendedLevels >= 0x80000008) {
|
||||||
eax = 0x80000008;
|
eax = 0x80000008;
|
||||||
cpuid(&eax, &ebx, &ecx, &edx);
|
cpuid(&eax, &ebx, &ecx, &edx);
|
||||||
@@ -734,10 +753,15 @@ struct topology* get_topology_info(struct cpuInfo* cpu, struct cache* cach, int
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
else {
|
else {
|
||||||
printWarn("Can't read topology information from cpuid (needed extended level is 0x%.8X, max is 0x%.8X)", 0x80000008, cpu->maxExtendedLevels);
|
#ifdef __linux__
|
||||||
topo->physical_cores = 1;
|
printWarn("Can't read topology information from cpuid (needed extended level is 0x%.8X, max is 0x%.8X), using udev...", 0x80000008, cpu->maxExtendedLevels);
|
||||||
topo->logical_cores = 1;
|
get_topology_from_udev(topo);
|
||||||
topo->smt_supported = 1;
|
#else
|
||||||
|
printWarn("Can't read topology information from cpuid (needed extended level is 0x%.8X, max is 0x%.8X)", 0x80000008, cpu->maxExtendedLevels);
|
||||||
|
topo->physical_cores = 1;
|
||||||
|
topo->logical_cores = 1;
|
||||||
|
topo->smt_supported = 1;
|
||||||
|
#endif
|
||||||
}
|
}
|
||||||
|
|
||||||
if (cpu->maxLevels >= 0x00000001) {
|
if (cpu->maxLevels >= 0x00000001) {
|
||||||
@@ -914,16 +938,27 @@ struct cache* get_cache_info(struct cpuInfo* cpu) {
|
|||||||
|
|
||||||
struct frequency* get_frequency_info(struct cpuInfo* cpu) {
|
struct frequency* get_frequency_info(struct cpuInfo* cpu) {
|
||||||
struct frequency* freq = emalloc(sizeof(struct frequency));
|
struct frequency* freq = emalloc(sizeof(struct frequency));
|
||||||
|
freq->measured = false;
|
||||||
|
|
||||||
if(cpu->maxLevels < 0x00000016) {
|
if(cpu->maxLevels < 0x00000016) {
|
||||||
#if defined (_WIN32) || defined (__APPLE__)
|
#if defined (_WIN32)
|
||||||
printWarn("Can't read frequency information from cpuid (needed level is 0x%.8X, max is 0x%.8X)", 0x00000016, cpu->maxLevels);
|
printWarn("Can't read frequency information from cpuid (needed level is 0x%.8X, max is 0x%.8X)", 0x00000016, cpu->maxLevels);
|
||||||
freq->base = UNKNOWN_DATA;
|
freq->base = UNKNOWN_DATA;
|
||||||
freq->max = UNKNOWN_DATA;
|
freq->max = UNKNOWN_DATA;
|
||||||
|
#elif defined (__FreeBSD__) || defined (__APPLE__)
|
||||||
|
printWarn("Can't read frequency information from cpuid (needed level is 0x%.8X, max is 0x%.8X). Using sysctl", 0x00000016, cpu->maxLevels);
|
||||||
|
uint32_t freq_hz = get_sys_info_by_name(CPUFREQUENCY_SYSCTL);
|
||||||
|
if (freq_hz == 0) {
|
||||||
|
printWarn("Read max CPU frequency from sysctl and got 0 MHz");
|
||||||
|
freq->max = UNKNOWN_DATA;
|
||||||
|
}
|
||||||
|
|
||||||
|
freq->base = UNKNOWN_DATA;
|
||||||
|
freq->max = freq_hz;
|
||||||
#else
|
#else
|
||||||
printWarn("Can't read frequency information from cpuid (needed level is 0x%.8X, max is 0x%.8X). Using udev", 0x00000016, cpu->maxLevels);
|
printWarn("Can't read frequency information from cpuid (needed level is 0x%.8X, max is 0x%.8X). Using udev", 0x00000016, cpu->maxLevels);
|
||||||
freq->base = UNKNOWN_DATA;
|
freq->base = UNKNOWN_DATA;
|
||||||
freq->max = get_max_freq_from_file(0);
|
freq->max = get_max_freq_from_file(cpu->first_core_id);
|
||||||
|
|
||||||
if(freq->max == 0) {
|
if(freq->max == 0) {
|
||||||
printWarn("Read max CPU frequency from udev and got 0 MHz");
|
printWarn("Read max CPU frequency from udev and got 0 MHz");
|
||||||
@@ -950,7 +985,7 @@ struct frequency* get_frequency_info(struct cpuInfo* cpu) {
|
|||||||
printWarn("Read max CPU frequency from CPUID and got 0 MHz");
|
printWarn("Read max CPU frequency from CPUID and got 0 MHz");
|
||||||
#ifdef __linux__
|
#ifdef __linux__
|
||||||
printWarn("Using udev to detect frequency");
|
printWarn("Using udev to detect frequency");
|
||||||
freq->max = get_max_freq_from_file(0);
|
freq->max = get_max_freq_from_file(cpu->first_core_id);
|
||||||
|
|
||||||
if(freq->max == 0) {
|
if(freq->max == 0) {
|
||||||
printWarn("Read max CPU frequency from udev and got 0 MHz");
|
printWarn("Read max CPU frequency from udev and got 0 MHz");
|
||||||
@@ -962,6 +997,15 @@ struct frequency* get_frequency_info(struct cpuInfo* cpu) {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
#ifdef __linux__
|
||||||
|
if (freq->max == UNKNOWN_DATA || measure_max_frequency_flag()) {
|
||||||
|
if (freq->max == UNKNOWN_DATA)
|
||||||
|
printWarn("All previous methods failed, measuring CPU frequency");
|
||||||
|
freq->max = measure_max_frequency(cpu->first_core_id);
|
||||||
|
freq->measured = true;
|
||||||
|
}
|
||||||
|
#endif
|
||||||
|
|
||||||
return freq;
|
return freq;
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -983,24 +1027,33 @@ char* get_str_topology(struct cpuInfo* cpu, struct topology* topo, bool dual_soc
|
|||||||
string = emalloc(sizeof(char) * (strlen(STRING_UNKNOWN) + 1));
|
string = emalloc(sizeof(char) * (strlen(STRING_UNKNOWN) + 1));
|
||||||
strcpy(string, STRING_UNKNOWN);
|
strcpy(string, STRING_UNKNOWN);
|
||||||
}
|
}
|
||||||
else if(topo->smt_supported > 1) {
|
|
||||||
// 4 for digits, 21 for ' cores (SMT disabled)' which is the longest possible output
|
|
||||||
uint32_t max_size = 4+21+1;
|
|
||||||
string = emalloc(sizeof(char) * max_size);
|
|
||||||
|
|
||||||
if(topo->smt_available > 1)
|
|
||||||
snprintf(string, max_size, "%d cores (%d threads)", topo->physical_cores * topo_sockets, topo->logical_cores * topo_sockets);
|
|
||||||
else {
|
|
||||||
if(cpu->cpu_vendor == CPU_VENDOR_AMD)
|
|
||||||
snprintf(string, max_size, "%d cores (SMT disabled)", topo->physical_cores * topo_sockets);
|
|
||||||
else
|
|
||||||
snprintf(string, max_size, "%d cores (HT disabled)", topo->physical_cores * topo_sockets);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
else {
|
else {
|
||||||
uint32_t max_size = 4+7+1;
|
char cores_str[6];
|
||||||
string = emalloc(sizeof(char) * max_size);
|
memset(cores_str, 0, sizeof(char) * 6);
|
||||||
snprintf(string, max_size, "%d cores",topo->physical_cores * topo_sockets);
|
if (topo->physical_cores * topo_sockets > 1)
|
||||||
|
strcpy(cores_str, "cores");
|
||||||
|
else
|
||||||
|
strcpy(cores_str, "core");
|
||||||
|
|
||||||
|
if(topo->smt_supported > 1) {
|
||||||
|
// 4 for digits, 21 for ' cores (SMT disabled)' which is the longest possible output
|
||||||
|
uint32_t max_size = 4+21+1;
|
||||||
|
string = emalloc(sizeof(char) * max_size);
|
||||||
|
|
||||||
|
if(topo->smt_available > 1)
|
||||||
|
snprintf(string, max_size, "%d %s (%d threads)", topo->physical_cores * topo_sockets, cores_str, topo->logical_cores * topo_sockets);
|
||||||
|
else {
|
||||||
|
if(cpu->cpu_vendor == CPU_VENDOR_AMD)
|
||||||
|
snprintf(string, max_size, "%d %s (SMT disabled)", topo->physical_cores * topo_sockets, cores_str);
|
||||||
|
else
|
||||||
|
snprintf(string, max_size, "%d %s (HT disabled)", topo->physical_cores * topo_sockets, cores_str);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
else {
|
||||||
|
uint32_t max_size = 4+7+1;
|
||||||
|
string = emalloc(sizeof(char) * max_size);
|
||||||
|
snprintf(string, max_size, "%d %s",topo->physical_cores * topo_sockets, cores_str);
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
return string;
|
return string;
|
||||||
@@ -1061,8 +1114,14 @@ char* get_str_sse(struct cpuInfo* cpu) {
|
|||||||
last+=SSE4_2_sl;
|
last+=SSE4_2_sl;
|
||||||
}
|
}
|
||||||
|
|
||||||
//Purge last comma
|
if (last == 0) {
|
||||||
string[last-1] = '\0';
|
snprintf(string, 2+1, "No");
|
||||||
|
}
|
||||||
|
else {
|
||||||
|
//Purge last comma
|
||||||
|
string[last-1] = '\0';
|
||||||
|
}
|
||||||
|
|
||||||
return string;
|
return string;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|||||||
118
src/x86/uarch.c
118
src/x86/uarch.c
@@ -47,8 +47,10 @@ typedef uint32_t MICROARCH;
|
|||||||
enum {
|
enum {
|
||||||
UARCH_UNKNOWN,
|
UARCH_UNKNOWN,
|
||||||
// INTEL //
|
// INTEL //
|
||||||
|
UARCH_I486,
|
||||||
UARCH_P5,
|
UARCH_P5,
|
||||||
UARCH_P5_MMX,
|
UARCH_P5_MMX,
|
||||||
|
UARCH_P6_PRO,
|
||||||
UARCH_P6_PENTIUM_II,
|
UARCH_P6_PENTIUM_II,
|
||||||
UARCH_P6_PENTIUM_III,
|
UARCH_P6_PENTIUM_III,
|
||||||
UARCH_DOTHAN,
|
UARCH_DOTHAN,
|
||||||
@@ -97,6 +99,8 @@ enum {
|
|||||||
// AMD //
|
// AMD //
|
||||||
UARCH_AM486,
|
UARCH_AM486,
|
||||||
UARCH_AM5X86,
|
UARCH_AM5X86,
|
||||||
|
UARCH_SSA5,
|
||||||
|
UARCH_K5,
|
||||||
UARCH_K6,
|
UARCH_K6,
|
||||||
UARCH_K7,
|
UARCH_K7,
|
||||||
UARCH_K8,
|
UARCH_K8,
|
||||||
@@ -149,16 +153,30 @@ struct uarch* get_uarch_from_cpuid_intel(uint32_t ef, uint32_t f, uint32_t em, u
|
|||||||
// ------------------------------------------------------------------------------- //
|
// ------------------------------------------------------------------------------- //
|
||||||
// EF F EM M S //
|
// EF F EM M S //
|
||||||
UARCH_START
|
UARCH_START
|
||||||
|
CHECK_UARCH(arch, 0, 4, 0, 0, NA, "i80486DX", UARCH_I486, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||||
|
CHECK_UARCH(arch, 0, 4, 0, 1, NA, "i80486DX-50", UARCH_I486, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||||
|
CHECK_UARCH(arch, 0, 4, 0, 2, NA, "i80486SX", UARCH_I486, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||||
|
CHECK_UARCH(arch, 0, 4, 0, 3, NA, "i80486DX2", UARCH_I486, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||||
|
CHECK_UARCH(arch, 0, 4, 0, 4, NA, "i80486SL", UARCH_I486, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||||
|
CHECK_UARCH(arch, 0, 4, 0, 5, NA, "i80486SX2", UARCH_I486, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||||
|
CHECK_UARCH(arch, 0, 4, 0, 7, NA, "i80486DX2WB", UARCH_I486, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||||
|
CHECK_UARCH(arch, 0, 4, 0, 8, NA, "i80486DX4", UARCH_I486, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||||
|
CHECK_UARCH(arch, 0, 4, 0, 9, NA, "i80486DX4WB", UARCH_I486, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||||
CHECK_UARCH(arch, 0, 5, 0, 0, NA, "P5", UARCH_P5, 800)
|
CHECK_UARCH(arch, 0, 5, 0, 0, NA, "P5", UARCH_P5, 800)
|
||||||
CHECK_UARCH(arch, 0, 5, 0, 1, NA, "P5", UARCH_P5, 800)
|
CHECK_UARCH(arch, 0, 5, 0, 1, NA, "P5", UARCH_P5, 800)
|
||||||
CHECK_UARCH(arch, 0, 5, 0, 2, NA, "P5", UARCH_P5, UNK)
|
CHECK_UARCH(arch, 0, 5, 0, 2, NA, "P54C", UARCH_P5, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||||
CHECK_UARCH(arch, 0, 5, 0, 3, NA, "P5", UARCH_P5, 600)
|
CHECK_UARCH(arch, 0, 5, 0, 3, NA, "P24T (Overdrive)", UARCH_P5, 600) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||||
CHECK_UARCH(arch, 0, 5, 0, 4, NA, "P5 (MMX)", UARCH_P5_MMX, UNK)
|
CHECK_UARCH(arch, 0, 5, 0, 4, NA, "P55C (MMX)", UARCH_P5_MMX, 350) // https://www.cpu-world.com/CPUs/Pentium/TYPE-Pentium%20MMX.html
|
||||||
CHECK_UARCH(arch, 0, 5, 0, 7, NA, "P5 (MMX)", UARCH_P5_MMX, UNK)
|
CHECK_UARCH(arch, 0, 5, 0, 7, NA, "P54C", UARCH_P5, 350) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||||
CHECK_UARCH(arch, 0, 5, 0, 8, NA, "P5 (MMX)", UARCH_P5_MMX, 250)
|
CHECK_UARCH(arch, 0, 5, 0, 8, NA, "Tillamook", UARCH_P5_MMX, 250) // http://instlatx64.atw.hu./
|
||||||
CHECK_UARCH(arch, 0, 5, 0, 9, 0, "Lakemont", UARCH_LAKEMONT, 32)
|
CHECK_UARCH(arch, 0, 5, 0, 9, 0, "Lakemont", UARCH_LAKEMONT, 32)
|
||||||
CHECK_UARCH(arch, 0, 5, 0, 9, NA, "P5 (MMX)", UARCH_P5_MMX, UNK)
|
CHECK_UARCH(arch, 0, 5, 0, 9, NA, "P5 (MMX)", UARCH_P5_MMX, UNK)
|
||||||
CHECK_UARCH(arch, 0, 5, 0, 10, 0, "Lakemont", UARCH_LAKEMONT, 32)
|
CHECK_UARCH(arch, 0, 5, 0, 10, 0, "Lakemont", UARCH_LAKEMONT, 32)
|
||||||
|
CHECK_UARCH(arch, 0, 6, 0, 1, 1, "P6", UARCH_P6_PRO, UNK)
|
||||||
|
CHECK_UARCH(arch, 0, 6, 0, 1, 2, "P6", UARCH_P6_PRO, UNK)
|
||||||
|
CHECK_UARCH(arch, 0, 6, 0, 1, 6, "P6", UARCH_P6_PRO, 350)
|
||||||
|
CHECK_UARCH(arch, 0, 6, 0, 1, 7, "P6", UARCH_P6_PRO, 350)
|
||||||
|
CHECK_UARCH(arch, 0, 6, 0, 1, 9, "P6", UARCH_P6_PRO, 350)
|
||||||
CHECK_UARCH(arch, 0, 6, 0, 0, NA, "P6 (Pentium II)", UARCH_P6_PENTIUM_II, UNK)
|
CHECK_UARCH(arch, 0, 6, 0, 0, NA, "P6 (Pentium II)", UARCH_P6_PENTIUM_II, UNK)
|
||||||
CHECK_UARCH(arch, 0, 6, 0, 1, NA, "P6 (Pentium II)", UARCH_P6_PENTIUM_II, UNK) // process depends on core
|
CHECK_UARCH(arch, 0, 6, 0, 1, NA, "P6 (Pentium II)", UARCH_P6_PENTIUM_II, UNK) // process depends on core
|
||||||
CHECK_UARCH(arch, 0, 6, 0, 2, NA, "P6 (Pentium II)", UARCH_P6_PENTIUM_II, UNK)
|
CHECK_UARCH(arch, 0, 6, 0, 2, NA, "P6 (Pentium II)", UARCH_P6_PENTIUM_II, UNK)
|
||||||
@@ -279,11 +297,16 @@ struct uarch* get_uarch_from_cpuid_amd(uint32_t ef, uint32_t f, uint32_t em, uin
|
|||||||
// ----------------------------------------------------------------------------- //
|
// ----------------------------------------------------------------------------- //
|
||||||
// EF F EM M S //
|
// EF F EM M S //
|
||||||
UARCH_START
|
UARCH_START
|
||||||
CHECK_UARCH(arch, 0, 4, 0, 3, NA, "Am486", UARCH_AM486, UNK)
|
CHECK_UARCH(arch, 0, 4, 0, 3, NA, "Am486DX2", UARCH_AM486, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||||
CHECK_UARCH(arch, 0, 4, 0, 7, NA, "Am486", UARCH_AM486, UNK)
|
CHECK_UARCH(arch, 0, 4, 0, 7, NA, "Am486DX2WB", UARCH_AM486, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||||
CHECK_UARCH(arch, 0, 4, 0, 8, NA, "Am486", UARCH_AM486, UNK)
|
CHECK_UARCH(arch, 0, 4, 0, 8, NA, "Am486DX4", UARCH_AM486, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||||
CHECK_UARCH(arch, 0, 4, 0, 9, NA, "Am486", UARCH_AM486, UNK)
|
CHECK_UARCH(arch, 0, 4, 0, 9, NA, "Am486DX4WB", UARCH_AM486, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||||
CHECK_UARCH(arch, 0, 4, NA, NA, NA, "Am5x86", UARCH_AM5X86, UNK)
|
CHECK_UARCH(arch, 0, 4, 0, 14, NA, "Am5x86", UARCH_AM5X86, 350) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||||
|
CHECK_UARCH(arch, 0, 4, 0, 15, NA, "Am5x86WB", UARCH_AM5X86, 350) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||||
|
CHECK_UARCH(arch, 0, 5, 0, 0, NA, "SSA5 (K5)", UARCH_SSA5, 350) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||||
|
CHECK_UARCH(arch, 0, 5, 0, 1, NA, "K5", UARCH_K5, 350) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||||
|
CHECK_UARCH(arch, 0, 5, 0, 2, NA, "K5", UARCH_K5, 350) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||||
|
CHECK_UARCH(arch, 0, 5, 0, 3, NA, "K5", UARCH_K5, 350) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||||
CHECK_UARCH(arch, 0, 5, 0, 6, NA, "K6", UARCH_K6, 300)
|
CHECK_UARCH(arch, 0, 5, 0, 6, NA, "K6", UARCH_K6, 300)
|
||||||
CHECK_UARCH(arch, 0, 5, 0, 7, NA, "K6", UARCH_K6, 250) // *p from sandpile.org
|
CHECK_UARCH(arch, 0, 5, 0, 7, NA, "K6", UARCH_K6, 250) // *p from sandpile.org
|
||||||
CHECK_UARCH(arch, 0, 5, 0, 10, NA, "K7", UARCH_K7, 130) // Geode NX
|
CHECK_UARCH(arch, 0, 5, 0, 10, NA, "K7", UARCH_K7, 130) // Geode NX
|
||||||
@@ -392,6 +415,25 @@ struct uarch* get_uarch_from_cpuid_amd(uint32_t ef, uint32_t f, uint32_t em, uin
|
|||||||
return arch;
|
return arch;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
struct uarch* get_uarch_from_cpuid_hygon(uint32_t ef, uint32_t f, uint32_t em, uint32_t m, int s) {
|
||||||
|
struct uarch* arch = emalloc(sizeof(struct uarch));
|
||||||
|
|
||||||
|
// EF: Extended Family //
|
||||||
|
// F: Family //
|
||||||
|
// EM: Extended Model //
|
||||||
|
// M: Model //
|
||||||
|
// S: Stepping //
|
||||||
|
// ----------------------------------------------------------------------------- //
|
||||||
|
// EF F EM M S //
|
||||||
|
UARCH_START
|
||||||
|
// https://www.phoronix.com/news/Hygon-Dhyana-AMD-China-CPUs
|
||||||
|
CHECK_UARCH(arch, 9, 15, 0, 1, NA, "Zen", UARCH_ZEN, UNK) // https://github.com/Dr-Noob/cpufetch/issues/244
|
||||||
|
// CHECK_UARCH(arch, 9, 15, 0, 2, NA, "???", ?????????, UNK) // http://instlatx64.atw.hu/
|
||||||
|
UARCH_END
|
||||||
|
|
||||||
|
return arch;
|
||||||
|
}
|
||||||
|
|
||||||
struct uarch* get_uarch_from_cpuid(struct cpuInfo* cpu, uint32_t dump, uint32_t ef, uint32_t f, uint32_t em, uint32_t m, int s) {
|
struct uarch* get_uarch_from_cpuid(struct cpuInfo* cpu, uint32_t dump, uint32_t ef, uint32_t f, uint32_t em, uint32_t m, int s) {
|
||||||
if(cpu->cpu_vendor == CPU_VENDOR_INTEL) {
|
if(cpu->cpu_vendor == CPU_VENDOR_INTEL) {
|
||||||
struct uarch* arch = emalloc(sizeof(struct uarch));
|
struct uarch* arch = emalloc(sizeof(struct uarch));
|
||||||
@@ -436,8 +478,16 @@ struct uarch* get_uarch_from_cpuid(struct cpuInfo* cpu, uint32_t dump, uint32_t
|
|||||||
}
|
}
|
||||||
return get_uarch_from_cpuid_intel(ef, f, em, m, s);
|
return get_uarch_from_cpuid_intel(ef, f, em, m, s);
|
||||||
}
|
}
|
||||||
else
|
else if(cpu->cpu_vendor == CPU_VENDOR_AMD) {
|
||||||
return get_uarch_from_cpuid_amd(ef, f, em, m, s);
|
return get_uarch_from_cpuid_amd(ef, f, em, m, s);
|
||||||
|
}
|
||||||
|
else if(cpu->cpu_vendor == CPU_VENDOR_HYGON) {
|
||||||
|
return get_uarch_from_cpuid_hygon(ef, f, em, m, s);
|
||||||
|
}
|
||||||
|
else {
|
||||||
|
printBug("Invalid CPU vendor: %d", cpu->cpu_vendor);
|
||||||
|
return NULL;
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
// If we cannot get the CPU name from CPUID, try to infer it from uarch
|
// If we cannot get the CPU name from CPUID, try to infer it from uarch
|
||||||
@@ -452,16 +502,42 @@ char* infer_cpu_name_from_uarch(struct uarch* arch) {
|
|||||||
|
|
||||||
char *str = NULL;
|
char *str = NULL;
|
||||||
|
|
||||||
if (arch->uarch == UARCH_P5)
|
switch (arch->uarch) {
|
||||||
str = "Intel Pentium";
|
// Intel
|
||||||
else if (arch->uarch == UARCH_P5_MMX)
|
case UARCH_I486:
|
||||||
str = "Intel Pentium MMX";
|
str = "Intel 486";
|
||||||
else if (arch->uarch == UARCH_P6_PENTIUM_II)
|
break;
|
||||||
str = "Intel Pentium II";
|
case UARCH_P5:
|
||||||
else if (arch->uarch == UARCH_P6_PENTIUM_III)
|
str = "Intel Pentium";
|
||||||
str = "Intel Pentium III";
|
break;
|
||||||
else
|
case UARCH_P5_MMX:
|
||||||
printErr("Unable to find name from uarch: %d", arch->uarch);
|
str = "Intel Pentium MMX";
|
||||||
|
break;
|
||||||
|
case UARCH_P6_PRO:
|
||||||
|
str = "Intel Pentium Pro";
|
||||||
|
break;
|
||||||
|
case UARCH_P6_PENTIUM_II:
|
||||||
|
str = "Intel Pentium II";
|
||||||
|
break;
|
||||||
|
case UARCH_P6_PENTIUM_III:
|
||||||
|
str = "Intel Pentium III";
|
||||||
|
break;
|
||||||
|
|
||||||
|
// AMD
|
||||||
|
case UARCH_AM486:
|
||||||
|
str = "AMD 486";
|
||||||
|
break;
|
||||||
|
case UARCH_AM5X86:
|
||||||
|
str = "AMD 5x86";
|
||||||
|
break;
|
||||||
|
case UARCH_SSA5:
|
||||||
|
str = "AMD 5k86";
|
||||||
|
break;
|
||||||
|
|
||||||
|
default:
|
||||||
|
printErr("Unable to find name from uarch: %d", arch->uarch);
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
|
||||||
if (str == NULL) {
|
if (str == NULL) {
|
||||||
cpu_name = ecalloc(strlen(STRING_UNKNOWN) + 1, sizeof(char));
|
cpu_name = ecalloc(strlen(STRING_UNKNOWN) + 1, sizeof(char));
|
||||||
|
|||||||
Reference in New Issue
Block a user