mirror of
https://github.com/Dr-Noob/cpufetch.git
synced 2026-03-25 07:50:40 +01:00
Compare commits
37 Commits
| Author | SHA1 | Date | |
|---|---|---|---|
|
|
e5e317ea92 | ||
|
|
41a194948d | ||
|
|
5dc2234e97 | ||
|
|
21dddc63ff | ||
|
|
8fca4cb250 | ||
|
|
7c947bdf64 | ||
|
|
1ed3a0f2bf | ||
|
|
0fe6fc3f4d | ||
|
|
96c784026b | ||
|
|
59cd2dd128 | ||
|
|
da1981b97c | ||
|
|
8506c91e00 | ||
|
|
ece28cbdee | ||
|
|
7b46c78249 | ||
|
|
e0095c303d | ||
|
|
65378aaed9 | ||
|
|
946729dd06 | ||
|
|
9212f19de1 | ||
|
|
b019256515 | ||
|
|
d4cadbd807 | ||
|
|
4f081ef1a2 | ||
|
|
1b746bc67d | ||
|
|
dfa2b773d1 | ||
|
|
59efbf4e08 | ||
|
|
29768e841d | ||
|
|
cc16bc56ef | ||
|
|
1504c5d0ef | ||
|
|
08919916dc | ||
|
|
4a8a7567f0 | ||
|
|
c01f60fa6c | ||
|
|
b610dc8c7d | ||
|
|
0967e3597b | ||
|
|
14df701707 | ||
|
|
cbcce9c2ed | ||
|
|
b072e5c331 | ||
|
|
4b42d2c89d | ||
|
|
d221f578b7 |
17
Makefile
17
Makefile
@@ -13,12 +13,18 @@ COMMON_HDR = $(SRC_COMMON)ascii.h $(SRC_COMMON)cpu.h $(SRC_COMMON)udev.h $(SRC_C
|
||||
ifneq ($(OS),Windows_NT)
|
||||
GIT_VERSION := "$(shell git describe --abbrev=4 --dirty --always --tags)"
|
||||
arch := $(shell uname -m)
|
||||
os := $(shell uname -s)
|
||||
|
||||
ifeq ($(os), Linux)
|
||||
COMMON_SRC += $(SRC_COMMON)freq.c
|
||||
COMMON_HDR += $(SRC_COMMON)freq.h
|
||||
endif
|
||||
|
||||
ifeq ($(arch), $(filter $(arch), x86_64 amd64 i386 i486 i586 i686))
|
||||
SRC_DIR=src/x86/
|
||||
SOURCE += $(COMMON_SRC) $(SRC_DIR)cpuid.c $(SRC_DIR)apic.c $(SRC_DIR)cpuid_asm.c $(SRC_DIR)uarch.c
|
||||
HEADERS += $(COMMON_HDR) $(SRC_DIR)cpuid.h $(SRC_DIR)apic.h $(SRC_DIR)cpuid_asm.h $(SRC_DIR)uarch.h $(SRC_DIR)freq/freq.h
|
||||
|
||||
os := $(shell uname -s)
|
||||
ifeq ($(os), Linux)
|
||||
SOURCE += $(SRC_DIR)freq/freq.c freq_nov.o freq_avx.o freq_avx512.o
|
||||
HEADERS += $(SRC_DIR)freq/freq.h
|
||||
@@ -32,14 +38,13 @@ ifneq ($(OS),Windows_NT)
|
||||
CFLAGS += -DARCH_PPC -std=gnu99 -fstack-protector-all -Wno-language-extension-token
|
||||
else ifeq ($(arch), $(filter $(arch), arm aarch64_be aarch64 arm64 armv8b armv8l armv7l armv6l))
|
||||
SRC_DIR=src/arm/
|
||||
SOURCE += $(COMMON_SRC) $(SRC_DIR)midr.c $(SRC_DIR)uarch.c $(SRC_COMMON)soc.c $(SRC_DIR)soc.c $(SRC_DIR)udev.c
|
||||
HEADERS += $(COMMON_HDR) $(SRC_DIR)midr.h $(SRC_DIR)uarch.h $(SRC_COMMON)soc.h $(SRC_DIR)soc.h $(SRC_DIR)udev.c $(SRC_DIR)socs.h
|
||||
SOURCE += $(COMMON_SRC) $(SRC_DIR)midr.c $(SRC_DIR)uarch.c $(SRC_COMMON)soc.c $(SRC_DIR)soc.c $(SRC_COMMON)pci.c $(SRC_DIR)udev.c
|
||||
HEADERS += $(COMMON_HDR) $(SRC_DIR)midr.h $(SRC_DIR)uarch.h $(SRC_COMMON)soc.h $(SRC_DIR)soc.h $(SRC_COMMON)pci.h $(SRC_DIR)udev.c $(SRC_DIR)socs.h
|
||||
CFLAGS += -DARCH_ARM -Wno-unused-parameter -std=c99 -fstack-protector-all
|
||||
|
||||
os := $(shell uname -s)
|
||||
ifeq ($(os), Darwin)
|
||||
SOURCE += $(SRC_DIR)sysctl.c
|
||||
HEADERS += $(SRC_DIR)sysctl.h
|
||||
SOURCE += $(SRC_COMMON)sysctl.c
|
||||
HEADERS += $(SRC_COMMON)sysctl.h
|
||||
endif
|
||||
else ifeq ($(arch), $(filter $(arch), riscv64 riscv32))
|
||||
SRC_DIR=src/riscv/
|
||||
|
||||
@@ -174,6 +174,7 @@ Thanks to the fellow contributors and interested people in the project. Special
|
||||
- [bbonev](https://github.com/bbonev) and [stephan-cr](https://github.com/stephan-cr): Reviewed the source code.
|
||||
- [mdoksa76](https://github.com/mdoksa76) and [exkc](https://github.com/exkc): Excellent ideas and feedback for supporting Allwinner SoCs.
|
||||
- [Sakura286](https://github.com/Sakura286), [exkc](https://github.com/exkc) and [Patola](https://github.com/Patola): Helped with RISC-V port with ssh access, ideas, testing, etc.
|
||||
- [ThomasKaiser](https://github.com/ThomasKaiser): Very valuable feedback on improving ARM SoC detection (Apple, Allwinner, Rockchip).
|
||||
|
||||
## 8. cpufetch for GPUs (gpufetch)
|
||||
See [gpufetch](https://github.com/Dr-Noob/gpufetch) project!
|
||||
|
||||
122
src/arm/midr.c
122
src/arm/midr.c
@@ -8,12 +8,14 @@
|
||||
#ifdef __linux__
|
||||
#include <sys/auxv.h>
|
||||
#include <asm/hwcap.h>
|
||||
#include "../common/freq.h"
|
||||
#elif defined __APPLE__ || __MACH__
|
||||
#include "sysctl.h"
|
||||
#include "../common/sysctl.h"
|
||||
#endif
|
||||
|
||||
#include "../common/global.h"
|
||||
#include "../common/soc.h"
|
||||
#include "../common/args.h"
|
||||
#include "udev.h"
|
||||
#include "midr.h"
|
||||
#include "uarch.h"
|
||||
@@ -39,8 +41,17 @@ struct cache* get_cache_info(struct cpuInfo* cpu) {
|
||||
struct frequency* get_frequency_info(uint32_t core) {
|
||||
struct frequency* freq = emalloc(sizeof(struct frequency));
|
||||
|
||||
freq->measured = false;
|
||||
freq->base = UNKNOWN_DATA;
|
||||
freq->max = get_max_freq_from_file(core);
|
||||
#ifdef __linux__
|
||||
if (freq->max == UNKNOWN_DATA || measure_max_frequency_flag()) {
|
||||
if (freq->max == UNKNOWN_DATA)
|
||||
printWarn("Unable to find max frequency from udev, measuring CPU frequency");
|
||||
freq->max = measure_max_frequency(core);
|
||||
freq->measured = true;
|
||||
}
|
||||
#endif
|
||||
|
||||
return freq;
|
||||
}
|
||||
@@ -237,7 +248,7 @@ struct cpuInfo* get_cpu_info_linux(struct cpuInfo* cpu) {
|
||||
cpu->num_cpus = sockets;
|
||||
cpu->hv = emalloc(sizeof(struct hypervisor));
|
||||
cpu->hv->present = false;
|
||||
cpu->soc = get_soc();
|
||||
cpu->soc = get_soc(cpu);
|
||||
cpu->peak_performance = get_peak_performance(cpu);
|
||||
|
||||
return cpu;
|
||||
@@ -350,97 +361,47 @@ void fill_cpu_info_everest_sawtooth(struct cpuInfo* cpu, uint32_t pcores, uint32
|
||||
}
|
||||
|
||||
struct cpuInfo* get_cpu_info_mach(struct cpuInfo* cpu) {
|
||||
uint32_t cpu_family = get_sys_info_by_name("hw.cpufamily");
|
||||
// https://developer.apple.com/documentation/kernel/1387446-sysctlbyname/determining_system_capabilities
|
||||
uint32_t nperflevels = get_sys_info_by_name("hw.nperflevels");
|
||||
|
||||
if((cpu->num_cpus = nperflevels) != 2) {
|
||||
printBug("Expected to find SoC with 2 perf levels, found: %d", cpu->num_cpus);
|
||||
return NULL;
|
||||
}
|
||||
|
||||
uint32_t pcores = get_sys_info_by_name("hw.perflevel0.physicalcpu");
|
||||
uint32_t ecores = get_sys_info_by_name("hw.perflevel1.physicalcpu");
|
||||
if(ecores <= 0) {
|
||||
printBug("Expected to find a numer of ecores > 0, found: %d", ecores);
|
||||
return NULL;
|
||||
}
|
||||
if(pcores <= 0) {
|
||||
printBug("Expected to find a numer of pcores > 0, found: %d", pcores);
|
||||
return NULL;
|
||||
}
|
||||
|
||||
uint32_t cpu_family = get_sys_info_by_name("hw.cpufamily");
|
||||
// Manually fill the cpuInfo assuming that
|
||||
// the CPU is an Apple M1/M2
|
||||
// the CPU is an Apple SoC
|
||||
if(cpu_family == CPUFAMILY_ARM_FIRESTORM_ICESTORM) {
|
||||
cpu->num_cpus = 2;
|
||||
// Now detect the M1 version
|
||||
uint32_t cpu_subfamily = get_sys_info_by_name("hw.cpusubfamily");
|
||||
if(cpu_subfamily == CPUSUBFAMILY_ARM_HG) {
|
||||
// Apple M1
|
||||
fill_cpu_info_firestorm_icestorm(cpu, 4, 4);
|
||||
}
|
||||
else if(cpu_subfamily == CPUSUBFAMILY_ARM_HS || cpu_subfamily == CPUSUBFAMILY_ARM_HC_HD) {
|
||||
// Apple M1 Pro/Max/Ultra. Detect number of cores
|
||||
uint32_t physicalcpu = get_sys_info_by_name("hw.physicalcpu");
|
||||
if(physicalcpu == 20) {
|
||||
// M1 Ultra
|
||||
fill_cpu_info_firestorm_icestorm(cpu, 16, 4);
|
||||
}
|
||||
else if(physicalcpu == 8 || physicalcpu == 10) {
|
||||
// M1 Pro/Max
|
||||
fill_cpu_info_firestorm_icestorm(cpu, physicalcpu-2, 2);
|
||||
}
|
||||
else {
|
||||
printBug("Found invalid physical cpu number: %d", physicalcpu);
|
||||
return NULL;
|
||||
}
|
||||
}
|
||||
else {
|
||||
printBug("Found invalid cpu_subfamily: 0x%.8X", cpu_subfamily);
|
||||
return NULL;
|
||||
}
|
||||
cpu->soc = get_soc();
|
||||
fill_cpu_info_firestorm_icestorm(cpu, pcores, ecores);
|
||||
cpu->soc = get_soc(cpu);
|
||||
cpu->peak_performance = get_peak_performance(cpu);
|
||||
}
|
||||
else if(cpu_family == CPUFAMILY_ARM_AVALANCHE_BLIZZARD) {
|
||||
cpu->num_cpus = 2;
|
||||
// Now detect the M2 version
|
||||
uint32_t cpu_subfamily = get_sys_info_by_name("hw.cpusubfamily");
|
||||
if(cpu_subfamily == CPUSUBFAMILY_ARM_HG) {
|
||||
// Apple M2
|
||||
fill_cpu_info_avalanche_blizzard(cpu, 4, 4);
|
||||
}
|
||||
else if(cpu_subfamily == CPUSUBFAMILY_ARM_HS) {
|
||||
// Apple M2 Pro/Max/Ultra. Detect number of cores
|
||||
uint32_t physicalcpu = get_sys_info_by_name("hw.physicalcpu");
|
||||
if(physicalcpu == 24) {
|
||||
// M2 Ultra
|
||||
fill_cpu_info_avalanche_blizzard(cpu, 16, 8);
|
||||
}
|
||||
else if(physicalcpu == 10 || physicalcpu == 12) {
|
||||
// M2 Pro/Max
|
||||
fill_cpu_info_avalanche_blizzard(cpu, physicalcpu-4, 4);
|
||||
}
|
||||
else {
|
||||
printBug("Found invalid physical cpu number: %d", physicalcpu);
|
||||
return NULL;
|
||||
}
|
||||
}
|
||||
else {
|
||||
printBug("Found invalid cpu_subfamily: 0x%.8X", cpu_subfamily);
|
||||
return NULL;
|
||||
}
|
||||
cpu->soc = get_soc();
|
||||
fill_cpu_info_avalanche_blizzard(cpu, pcores, ecores);
|
||||
cpu->soc = get_soc(cpu);
|
||||
cpu->peak_performance = get_peak_performance(cpu);
|
||||
}
|
||||
else if(cpu_family == CPUFAMILY_ARM_EVEREST_SAWTOOTH ||
|
||||
cpu_family == CPUFAMILY_ARM_EVEREST_SAWTOOTH_PRO ||
|
||||
cpu_family == CPUFAMILY_ARM_EVEREST_SAWTOOTH_MAX) {
|
||||
cpu->num_cpus = 2;
|
||||
// Now detect the M3 version
|
||||
if(cpu_family == CPUFAMILY_ARM_EVEREST_SAWTOOTH) {
|
||||
fill_cpu_info_everest_sawtooth(cpu, 4, 4);
|
||||
}
|
||||
else if(cpu_family == CPUFAMILY_ARM_EVEREST_SAWTOOTH_PRO) {
|
||||
uint32_t physicalcpu = get_sys_info_by_name("hw.physicalcpu");
|
||||
fill_cpu_info_everest_sawtooth(cpu, physicalcpu-6, 6);
|
||||
}
|
||||
else if(cpu_family == CPUFAMILY_ARM_EVEREST_SAWTOOTH_MAX) {
|
||||
uint32_t physicalcpu = get_sys_info_by_name("hw.physicalcpu");
|
||||
fill_cpu_info_everest_sawtooth(cpu, physicalcpu-4, 4);
|
||||
}
|
||||
else {
|
||||
printBug("Found invalid cpu_family: 0x%.8X", cpu_family);
|
||||
return NULL;
|
||||
}
|
||||
cpu->soc = get_soc();
|
||||
fill_cpu_info_everest_sawtooth(cpu, pcores, ecores);
|
||||
cpu->soc = get_soc(cpu);
|
||||
cpu->peak_performance = get_peak_performance(cpu);
|
||||
}
|
||||
else {
|
||||
printBug("Found invalid cpu_family: 0x%.8X", cpu_family);
|
||||
printBugCheckRelease("Found invalid cpu_family: 0x%.8X", cpu_family);
|
||||
return NULL;
|
||||
}
|
||||
|
||||
@@ -529,7 +490,10 @@ void print_debug(struct cpuInfo* cpu) {
|
||||
#if defined(__APPLE__) || defined(__MACH__)
|
||||
printf("hw.cpufamily: 0x%.8X\n", get_sys_info_by_name("hw.cpufamily"));
|
||||
printf("hw.cpusubfamily: 0x%.8X\n", get_sys_info_by_name("hw.cpusubfamily"));
|
||||
printf("hw.nperflevels: %d\n", get_sys_info_by_name("hw.nperflevels"));
|
||||
printf("hw.physicalcpu: %d\n", get_sys_info_by_name("hw.physicalcpu"));
|
||||
printf("hw.perflevel0.physicalcpu: %d\n", get_sys_info_by_name("hw.perflevel0.physicalcpu"));
|
||||
printf("hw.perflevel1.physicalcpu: %d\n", get_sys_info_by_name("hw.perflevel1.physicalcpu"));
|
||||
#endif
|
||||
}
|
||||
|
||||
|
||||
117
src/arm/soc.c
117
src/arm/soc.c
@@ -6,10 +6,12 @@
|
||||
#include "soc.h"
|
||||
#include "socs.h"
|
||||
#include "udev.h"
|
||||
#include "uarch.h"
|
||||
#include "../common/global.h"
|
||||
#include "../common/pci.h"
|
||||
|
||||
#if defined(__APPLE__) || defined(__MACH__)
|
||||
#include "sysctl.h"
|
||||
#include "../common/sysctl.h"
|
||||
#endif
|
||||
|
||||
#define NA -1
|
||||
@@ -50,6 +52,8 @@ uint32_t get_sid_from_nvmem(char* buf) {
|
||||
// SIDs list:
|
||||
// - https://linux-sunxi.org/SID_Register_Guide#Currently_known_SID.27s
|
||||
// - https://github.com/Dr-Noob/cpufetch/issues/173
|
||||
// - https://github.com/ThomasKaiser/sbc-bench/blob/master/sbc-bench.sh
|
||||
// - https://linux-sunxi.org/*CHIP_NAME*
|
||||
bool get_sunxisoc_from_sid(struct system_on_chip* soc, char* raw_name, uint32_t sid) {
|
||||
typedef struct {
|
||||
uint32_t sid;
|
||||
@@ -58,21 +62,39 @@ bool get_sunxisoc_from_sid(struct system_on_chip* soc, char* raw_name, uint32_t
|
||||
|
||||
sidToSoC socFromSid[] = {
|
||||
// --- sun8i Family ---
|
||||
// A33
|
||||
{0x0461872a, {SOC_ALLWINNER_A33, SOC_VENDOR_ALLWINNER, 40, "A33", raw_name} },
|
||||
// A83T
|
||||
{0x32c00401, {SOC_ALLWINNER_A83T, SOC_VENDOR_ALLWINNER, 28, "A83T", raw_name} },
|
||||
{0x32c00403, {SOC_ALLWINNER_A83T, SOC_VENDOR_ALLWINNER, 28, "A83T", raw_name} },
|
||||
// S3
|
||||
{0x12c00001, {SOC_ALLWINNER_S3, SOC_VENDOR_ALLWINNER, 40, "S3", raw_name} },
|
||||
// H2+
|
||||
{0x02c00042, {SOC_ALLWINNER_H2PLUS, SOC_VENDOR_ALLWINNER, 40, "H2+", raw_name} },
|
||||
{0x02c00142, {SOC_ALLWINNER_H2PLUS, SOC_VENDOR_ALLWINNER, 40, "H2+", raw_name} },
|
||||
{0x02c00242, {SOC_ALLWINNER_H2PLUS, SOC_VENDOR_ALLWINNER, 40, "H2+", raw_name} },
|
||||
// H3
|
||||
{0x02c00181, {SOC_ALLWINNER_H3, SOC_VENDOR_ALLWINNER, 40, "H3", raw_name} },
|
||||
{0x02c00081, {SOC_ALLWINNER_H3, SOC_VENDOR_ALLWINNER, 40, "H3", raw_name} },
|
||||
// Others
|
||||
// R40
|
||||
{0x12c00017, {SOC_ALLWINNER_R40, SOC_VENDOR_ALLWINNER, 40, "R40", raw_name} },
|
||||
// V3S
|
||||
{0x12c00000, {SOC_ALLWINNER_V3S, SOC_VENDOR_ALLWINNER, 40, "V3s", raw_name} }, // 40nm is only my guess, no source
|
||||
// --- sun50i Family ---
|
||||
// H5
|
||||
{0x82800001, {SOC_ALLWINNER_H5, SOC_VENDOR_ALLWINNER, 40, "H5", raw_name} },
|
||||
// H6
|
||||
{0x82c00001, {SOC_ALLWINNER_H6, SOC_VENDOR_ALLWINNER, 28, "H6", raw_name} },
|
||||
{0x82c00007, {SOC_ALLWINNER_H6, SOC_VENDOR_ALLWINNER, 28, "H6", raw_name} },
|
||||
{0x92c000bb, {SOC_ALLWINNER_H64, SOC_VENDOR_ALLWINNER, 40, "H64", raw_name} }, // Same as A64
|
||||
// H64
|
||||
{0x92c000bb, {SOC_ALLWINNER_H64, SOC_VENDOR_ALLWINNER, 40, "H64", raw_name} }, // Same manufacturing process as A64
|
||||
// H616
|
||||
{0x32c05000, {SOC_ALLWINNER_H616, SOC_VENDOR_ALLWINNER, 28, "H616", raw_name} },
|
||||
// H618
|
||||
{0x33802000, {SOC_ALLWINNER_H618, SOC_VENDOR_ALLWINNER, 28, "H618", raw_name} },
|
||||
// A64
|
||||
{0x92c000ba, {SOC_ALLWINNER_A64, SOC_VENDOR_ALLWINNER, 40, "A64", raw_name} },
|
||||
{0x92c001ba, {SOC_ALLWINNER_A64, SOC_VENDOR_ALLWINNER, 40, "A64", raw_name} },
|
||||
// Unknown
|
||||
{0x00000000, {UNKNOWN, SOC_VENDOR_UNKNOWN, -1, "", raw_name} }
|
||||
};
|
||||
@@ -781,6 +803,75 @@ struct system_on_chip* guess_soc_from_nvmem(struct system_on_chip* soc) {
|
||||
return soc;
|
||||
}
|
||||
|
||||
struct system_on_chip* guess_soc_from_uarch(struct system_on_chip* soc, struct cpuInfo* cpu) {
|
||||
// Currently we only support CPUs with only one uarch (in other words, one socket)
|
||||
struct uarch* arch = cpu->arch;
|
||||
if (arch == NULL) {
|
||||
printWarn("guess_soc_from_uarch: uarch is NULL");
|
||||
return soc;
|
||||
}
|
||||
|
||||
typedef struct {
|
||||
MICROARCH u;
|
||||
struct system_on_chip soc;
|
||||
} uarchToSoC;
|
||||
|
||||
uarchToSoC socFromUarch[] = {
|
||||
{UARCH_TAISHAN_V110, {SOC_KUNPENG_920, SOC_VENDOR_KUNPENG, 7, "920", NULL} },
|
||||
{UARCH_TAISHAN_V200, {SOC_KUNPENG_930, SOC_VENDOR_KUNPENG, 7, "930", NULL} }, // manufacturing process is not well-known
|
||||
{UARCH_UNKNOWN, {UNKNOWN, SOC_VENDOR_UNKNOWN, -1, "", NULL} }
|
||||
};
|
||||
|
||||
int index = 0;
|
||||
while(socFromUarch[index].u != UARCH_UNKNOWN) {
|
||||
if(socFromUarch[index].u == get_uarch(arch)) {
|
||||
fill_soc(soc, socFromUarch[index].soc.soc_name, socFromUarch[index].soc.soc_model, socFromUarch[index].soc.process);
|
||||
return soc;
|
||||
}
|
||||
index++;
|
||||
}
|
||||
|
||||
printWarn("guess_soc_from_uarch: No uarch matched the list");
|
||||
return soc;
|
||||
}
|
||||
|
||||
struct system_on_chip* guess_soc_from_pci(struct system_on_chip* soc, struct cpuInfo* cpu) {
|
||||
struct pci_devices * pci = get_pci_devices();
|
||||
if (pci == NULL) {
|
||||
printWarn("guess_soc_from_pci: Unable to find suitable PCI devices");
|
||||
return soc;
|
||||
}
|
||||
|
||||
typedef struct {
|
||||
uint16_t vendor_id;
|
||||
uint16_t device_id;
|
||||
struct system_on_chip soc;
|
||||
} pciToSoC;
|
||||
|
||||
pciToSoC socFromPCI[] = {
|
||||
{PCI_VENDOR_NVIDIA, PCI_DEVICE_TEGRA_X1, {SOC_TEGRA_X1, SOC_VENDOR_NVIDIA, 20, "Tegra X1", NULL} },
|
||||
// {PCI_VENDOR_NVIDIA, PCI_DEVICE_GH_200,{SOC_GH_200, SOC_VENDOR_NVIDIA, ?, "Grace Hopper", NULL} },
|
||||
{0x0000, 0x0000, {UNKNOWN, SOC_VENDOR_UNKNOWN, -1, "", NULL} }
|
||||
};
|
||||
|
||||
int index = 0;
|
||||
while (socFromPCI[index].vendor_id != 0x0) {
|
||||
for (int i=0; i < pci->num_devices; i++) {
|
||||
struct pci_device * dev = pci->devices[i];
|
||||
|
||||
if (socFromPCI[index].vendor_id == dev->vendor_id &&
|
||||
socFromPCI[index].device_id == dev->device_id) {
|
||||
fill_soc(soc, socFromPCI[index].soc.soc_name, socFromPCI[index].soc.soc_model, socFromPCI[index].soc.process);
|
||||
return soc;
|
||||
}
|
||||
}
|
||||
index++;
|
||||
}
|
||||
|
||||
printWarn("guess_soc_from_pci: No PCI device matched the list");
|
||||
return soc;
|
||||
}
|
||||
|
||||
int hex2int(char c) {
|
||||
if (c >= '0' && c <= '9')
|
||||
return c - '0';
|
||||
@@ -858,7 +949,7 @@ struct system_on_chip* guess_soc_apple(struct system_on_chip* soc) {
|
||||
}
|
||||
}
|
||||
else {
|
||||
printBug("Found invalid cpu_subfamily: 0x%.8X", cpu_subfamily);
|
||||
printBugCheckRelease("Found invalid cpu_subfamily: 0x%.8X", cpu_subfamily);
|
||||
soc->soc_vendor = SOC_VENDOR_UNKNOWN;
|
||||
}
|
||||
}
|
||||
@@ -885,7 +976,7 @@ struct system_on_chip* guess_soc_apple(struct system_on_chip* soc) {
|
||||
}
|
||||
}
|
||||
else {
|
||||
printBug("Found invalid cpu_subfamily: 0x%.8X", cpu_subfamily);
|
||||
printBugCheckRelease("Found invalid cpu_subfamily: 0x%.8X", cpu_subfamily);
|
||||
soc->soc_vendor = SOC_VENDOR_UNKNOWN;
|
||||
}
|
||||
}
|
||||
@@ -903,19 +994,19 @@ struct system_on_chip* guess_soc_apple(struct system_on_chip* soc) {
|
||||
fill_soc(soc, "M3 Max", SOC_APPLE_M3_MAX, 3);
|
||||
}
|
||||
else {
|
||||
printBug("Found invalid cpu_family: 0x%.8X", cpu_family);
|
||||
printBugCheckRelease("Found invalid cpu_family: 0x%.8X", cpu_family);
|
||||
soc->soc_vendor = SOC_VENDOR_UNKNOWN;
|
||||
}
|
||||
}
|
||||
else {
|
||||
printBug("Found invalid cpu_family: 0x%.8X", cpu_family);
|
||||
printBugCheckRelease("Found invalid cpu_family: 0x%.8X", cpu_family);
|
||||
soc->soc_vendor = SOC_VENDOR_UNKNOWN;
|
||||
}
|
||||
return soc;
|
||||
}
|
||||
#endif
|
||||
|
||||
struct system_on_chip* get_soc(void) {
|
||||
struct system_on_chip* get_soc(struct cpuInfo* cpu) {
|
||||
struct system_on_chip* soc = emalloc(sizeof(struct system_on_chip));
|
||||
soc->raw_name = NULL;
|
||||
soc->soc_vendor = SOC_VENDOR_UNKNOWN;
|
||||
@@ -951,10 +1042,18 @@ struct system_on_chip* get_soc(void) {
|
||||
printWarn("SoC detection failed using Android: Found '%s' string", soc->raw_name);
|
||||
}
|
||||
#endif // ifdef __ANDROID__
|
||||
// If cpufinfo/Android (if available) detection fails, try with nvmem
|
||||
// If previous steps failed, try with nvmem
|
||||
if(soc->soc_vendor == SOC_VENDOR_UNKNOWN) {
|
||||
soc = guess_soc_from_nvmem(soc);
|
||||
}
|
||||
// If previous steps failed, try inferring it from the microarchitecture
|
||||
if(soc->soc_vendor == SOC_VENDOR_UNKNOWN) {
|
||||
soc = guess_soc_from_uarch(soc, cpu);
|
||||
}
|
||||
// If previous steps failed, try inferring it from the PCI device ID
|
||||
if(soc->soc_vendor == SOC_VENDOR_UNKNOWN) {
|
||||
soc = guess_soc_from_pci(soc, cpu);
|
||||
}
|
||||
}
|
||||
#elif defined __APPLE__ || __MACH__
|
||||
soc = guess_soc_apple(soc);
|
||||
|
||||
@@ -5,6 +5,6 @@
|
||||
#include "../common/soc.h"
|
||||
#include <stdint.h>
|
||||
|
||||
struct system_on_chip* get_soc(void);
|
||||
struct system_on_chip* get_soc(struct cpuInfo* cpu);
|
||||
|
||||
#endif
|
||||
|
||||
@@ -29,6 +29,9 @@ enum {
|
||||
SOC_HISILICON_3670,
|
||||
SOC_HISILICON_3680,
|
||||
SOC_HISILICON_3690,
|
||||
// Kunpeng //
|
||||
SOC_KUNPENG_920,
|
||||
SOC_KUNPENG_930,
|
||||
// Exynos //
|
||||
SOC_EXYNOS_3475,
|
||||
SOC_EXYNOS_4210,
|
||||
@@ -329,12 +332,14 @@ enum {
|
||||
SOC_ALLWINNER_V3S,
|
||||
SOC_ALLWINNER_HZP,
|
||||
SOC_ALLWINNER_H2PLUS,
|
||||
SOC_ALLWINNER_S3,
|
||||
SOC_ALLWINNER_H3,
|
||||
SOC_ALLWINNER_H8,
|
||||
SOC_ALLWINNER_H5,
|
||||
SOC_ALLWINNER_H6,
|
||||
SOC_ALLWINNER_H64,
|
||||
SOC_ALLWINNER_H616,
|
||||
SOC_ALLWINNER_H618,
|
||||
SOC_ALLWINNER_R8,
|
||||
SOC_ALLWINNER_R16,
|
||||
SOC_ALLWINNER_R40,
|
||||
@@ -358,6 +363,8 @@ enum {
|
||||
SOC_GOOGLE_TENSOR,
|
||||
SOC_GOOGLE_TENSOR_G2,
|
||||
SOC_GOOGLE_TENSOR_G3,
|
||||
// NVIDIA,
|
||||
SOC_TEGRA_X1,
|
||||
// UNKNOWN
|
||||
SOC_MODEL_UNKNOWN
|
||||
};
|
||||
@@ -365,6 +372,7 @@ enum {
|
||||
inline static VENDOR get_soc_vendor_from_soc(SOC soc) {
|
||||
if(soc >= SOC_BCM_2835 && soc <= SOC_BCM_2712) return SOC_VENDOR_BROADCOM;
|
||||
else if(soc >= SOC_HISILICON_3620 && soc <= SOC_HISILICON_3690) return SOC_VENDOR_KIRIN;
|
||||
else if(soc >= SOC_KUNPENG_920 && soc <= SOC_KUNPENG_930) return SOC_VENDOR_KUNPENG;
|
||||
else if(soc >= SOC_EXYNOS_3475 && soc <= SOC_EXYNOS_880) return SOC_VENDOR_EXYNOS;
|
||||
else if(soc >= SOC_MTK_MT6893 && soc <= SOC_MTK_MT8783) return SOC_VENDOR_MEDIATEK;
|
||||
else if(soc >= SOC_SNAPD_QSD8650 && soc <= SOC_SNAPD_SM8450) return SOC_VENDOR_SNAPDRAGON;
|
||||
@@ -372,6 +380,7 @@ inline static VENDOR get_soc_vendor_from_soc(SOC soc) {
|
||||
else if(soc >= SOC_ALLWINNER_A10 && soc <= SOC_ALLWINNER_R328) return SOC_VENDOR_ALLWINNER;
|
||||
else if(soc >= SOC_ROCKCHIP_3288 && soc <= SOC_ROCKCHIP_3588) return SOC_VENDOR_ROCKCHIP;
|
||||
else if(soc >= SOC_GOOGLE_TENSOR && soc <= SOC_GOOGLE_TENSOR_G3) return SOC_VENDOR_GOOGLE;
|
||||
else if(soc >= SOC_TEGRA_X1 && soc <= SOC_TEGRA_X1) return SOC_VENDOR_NVIDIA;
|
||||
return SOC_VENDOR_UNKNOWN;
|
||||
}
|
||||
|
||||
|
||||
@@ -10,7 +10,6 @@
|
||||
// Data not available
|
||||
#define NA -1
|
||||
|
||||
typedef uint32_t MICROARCH;
|
||||
typedef uint32_t ISA;
|
||||
|
||||
struct uarch {
|
||||
@@ -37,89 +36,6 @@ enum {
|
||||
ISA_ARMv9_A
|
||||
};
|
||||
|
||||
enum {
|
||||
UARCH_UNKNOWN,
|
||||
// ARM
|
||||
UARCH_ARM7,
|
||||
UARCH_ARM9,
|
||||
UARCH_ARM1136,
|
||||
UARCH_ARM1156,
|
||||
UARCH_ARM1176,
|
||||
UARCH_ARM11MPCORE,
|
||||
UARCH_CORTEX_A5,
|
||||
UARCH_CORTEX_A7,
|
||||
UARCH_CORTEX_A8,
|
||||
UARCH_CORTEX_A9,
|
||||
UARCH_CORTEX_A12,
|
||||
UARCH_CORTEX_A15,
|
||||
UARCH_CORTEX_A17,
|
||||
UARCH_CORTEX_A32,
|
||||
UARCH_CORTEX_A35,
|
||||
UARCH_CORTEX_A53,
|
||||
UARCH_CORTEX_A55r0, // ARM Cortex-A55 revision 0 (restricted dual-issue capabilities compared to revision 1+).
|
||||
UARCH_CORTEX_A55,
|
||||
UARCH_CORTEX_A57,
|
||||
UARCH_CORTEX_A65,
|
||||
UARCH_CORTEX_A72,
|
||||
UARCH_CORTEX_A73,
|
||||
UARCH_CORTEX_A75,
|
||||
UARCH_CORTEX_A76,
|
||||
UARCH_CORTEX_A77,
|
||||
UARCH_CORTEX_A78,
|
||||
UARCH_CORTEX_A510,
|
||||
UARCH_CORTEX_A710,
|
||||
UARCH_CORTEX_A715,
|
||||
UARCH_CORTEX_X1,
|
||||
UARCH_CORTEX_X2,
|
||||
UARCH_CORTEX_X3,
|
||||
UARCH_NEOVERSE_N1,
|
||||
UARCH_NEOVERSE_E1,
|
||||
UARCH_NEOVERSE_V1,
|
||||
UARCH_SCORPION,
|
||||
UARCH_KRAIT,
|
||||
UARCH_KYRO,
|
||||
UARCH_FALKOR,
|
||||
UARCH_SAPHIRA,
|
||||
UARCH_DENVER,
|
||||
UARCH_DENVER2,
|
||||
UARCH_CARMEL,
|
||||
// SAMSUNG
|
||||
UARCH_EXYNOS_M1, // Samsung Exynos M1 (Exynos 8890 big cores)
|
||||
UARCH_EXYNOS_M2, // Samsung Exynos M2 (Exynos 8895 big cores)
|
||||
UARCH_EXYNOS_M3, // Samsung Exynos M3 (Exynos 9810 big cores)
|
||||
UARCH_EXYNOS_M4, // Samsung Exynos M4 (Exynos 9820 big cores)
|
||||
UARCH_EXYNOS_M5, // Samsung Exynos M5 (Exynos 9830 big cores)
|
||||
// APPLE
|
||||
UARCH_SWIFT, // Apple A6 and A6X processors.
|
||||
UARCH_CYCLONE, // Apple A7 processor.
|
||||
UARCH_TYPHOON, // Apple A8 and A8X processor
|
||||
UARCH_TWISTER, // Apple A9 and A9X processor.
|
||||
UARCH_HURRICANE, // Apple A10 and A10X processor.
|
||||
UARCH_MONSOON, // Apple A11 processor (big cores).
|
||||
UARCH_MISTRAL, // Apple A11 processor (little cores).
|
||||
UARCH_VORTEX, // Apple A12 processor (big cores).
|
||||
UARCH_TEMPEST, // Apple A12 processor (big cores).
|
||||
UARCH_LIGHTNING, // Apple A13 processor (big cores).
|
||||
UARCH_THUNDER, // Apple A13 processor (little cores).
|
||||
UARCH_ICESTORM, // Apple M1 processor (little cores).
|
||||
UARCH_FIRESTORM, // Apple M1 processor (big cores).
|
||||
UARCH_BLIZZARD, // Apple M2 processor (little cores).
|
||||
UARCH_AVALANCHE, // Apple M2 processor (big cores).
|
||||
UARCH_SAWTOOTH, // Apple M3 processor (little cores).
|
||||
UARCH_EVEREST, // Apple M3 processor (big cores).
|
||||
// CAVIUM
|
||||
UARCH_THUNDERX, // Cavium ThunderX
|
||||
UARCH_THUNDERX2, // Cavium ThunderX2 (originally Broadcom Vulkan).
|
||||
// MARVELL
|
||||
UARCH_PJ4,
|
||||
UARCH_BRAHMA_B15,
|
||||
UARCH_BRAHMA_B53,
|
||||
UARCH_XGENE, // Applied Micro X-Gene.
|
||||
UARCH_TAISHAN_V110, // HiSilicon TaiShan v110 (Huawei Kunpeng 920 series processors).
|
||||
// PHYTIUM
|
||||
UARCH_XIAOMI, // Not to be confused with Xiaomi Inc
|
||||
};
|
||||
|
||||
static const ISA isas_uarch[] = {
|
||||
[UARCH_ARM1136] = ISA_ARMv6,
|
||||
[UARCH_ARM1156] = ISA_ARMv6_T2,
|
||||
@@ -159,6 +75,7 @@ static const ISA isas_uarch[] = {
|
||||
[UARCH_THUNDERX] = ISA_ARMv8_A,
|
||||
[UARCH_THUNDERX2] = ISA_ARMv8_1_A,
|
||||
[UARCH_TAISHAN_V110] = ISA_ARMv8_2_A,
|
||||
[UARCH_TAISHAN_V200] = ISA_ARMv8_2_A, // Not confirmed
|
||||
[UARCH_DENVER] = ISA_ARMv8_A,
|
||||
[UARCH_DENVER2] = ISA_ARMv8_A,
|
||||
[UARCH_CARMEL] = ISA_ARMv8_A,
|
||||
@@ -200,8 +117,7 @@ static char* isas_string[] = {
|
||||
#define UARCH_START if (false) {}
|
||||
#define CHECK_UARCH(arch, cpu, im_, p_, v_, r_, str, uarch, vendor) \
|
||||
else if (im_ == im && p_ == p && (v_ == NA || v_ == v) && (r_ == NA || r_ == r)) fill_uarch(arch, cpu, str, uarch, vendor);
|
||||
#define UARCH_END else { printErr("Unknown microarchitecture detected: IM=0x%X P=0x%X V=0x%X R=0x%X", im, p, v, r); \
|
||||
fprintf(stderr, "Please see https://github.com/Dr-Noob/cpufetch#61-unknown-microarchitecture-error to know how to report this error\n"); \
|
||||
#define UARCH_END else { printBugCheckRelease("Unknown microarchitecture detected: IM=0x%X P=0x%X V=0x%X R=0x%X", im, p, v, r); \
|
||||
fill_uarch(arch, cpu, "Unknown", UARCH_UNKNOWN, CPU_VENDOR_UNKNOWN); }
|
||||
|
||||
void fill_uarch(struct uarch* arch, struct cpuInfo* cpu, char* str, MICROARCH u, VENDOR vendor) {
|
||||
@@ -285,7 +201,8 @@ struct uarch* get_uarch_from_midr(uint32_t midr, struct cpuInfo* cpu) {
|
||||
CHECK_UARCH(arch, cpu, 'C', 0x0A3, NA, NA, "ThunderX 81XX", UARCH_THUNDERX, CPU_VENDOR_CAVIUM)
|
||||
CHECK_UARCH(arch, cpu, 'C', 0x0AF, NA, NA, "ThunderX2 99XX", UARCH_THUNDERX2, CPU_VENDOR_CAVIUM)
|
||||
|
||||
CHECK_UARCH(arch, cpu, 'H', 0xD01, NA, NA, "TaiShan v110", UARCH_TAISHAN_V110, CPU_VENDOR_HUAWUEI) // Kunpeng 920 series
|
||||
CHECK_UARCH(arch, cpu, 'H', 0xD01, NA, NA, "TaiShan v110", UARCH_TAISHAN_V110, CPU_VENDOR_HUAWEI) // Kunpeng 920 series
|
||||
CHECK_UARCH(arch, cpu, 'H', 0xD02, NA, NA, "TaiShan v200", UARCH_TAISHAN_V200, CPU_VENDOR_HUAWEI) // Kunpeng 930 series (found in openeuler: https://mailweb.openeuler.org/hyperkitty/list/kernel@openeuler.org/message/XQCV7NX2UKRIUWUFKRF4PO3QENCOUFR3)
|
||||
CHECK_UARCH(arch, cpu, 'H', 0xD40, NA, NA, "Cortex-A76", UARCH_CORTEX_A76, CPU_VENDOR_ARM) // Kirin 980 Big/Medium cores -> Cortex-A76
|
||||
|
||||
CHECK_UARCH(arch, cpu, 'N', 0x000, NA, NA, "Denver", UARCH_DENVER, CPU_VENDOR_NVIDIA)
|
||||
@@ -407,6 +324,8 @@ int get_number_of_vpus(struct cpuInfo* cpu) {
|
||||
return 3;
|
||||
case UARCH_ICESTORM: // [https://dougallj.github.io/applecpu/icestorm-simd.html]
|
||||
case UARCH_BLIZZARD: // [https://en.wikipedia.org/wiki/Comparison_of_ARM_processors]
|
||||
case UARCH_TAISHAN_V110:// [https://www-file.huawei.com/-/media/corp2020/pdf/publications/huawei-research/2022/huawei-research-issue1-en.pdf]: "128-bit x 2 for single precision"
|
||||
case UARCH_TAISHAN_V200:// Not confirmed, asssuming same as v110
|
||||
case UARCH_CORTEX_A57: // [https://www.anandtech.com/show/8718/the-samsung-galaxy-note-4-exynos-review/5]
|
||||
case UARCH_CORTEX_A72: // [https://www.anandtech.com/show/10347/arm-cortex-a73-artemis-unveiled/2]
|
||||
case UARCH_CORTEX_A73: // [https://www.anandtech.com/show/10347/arm-cortex-a73-artemis-unveiled/2]
|
||||
@@ -438,6 +357,10 @@ char* get_str_uarch(struct cpuInfo* cpu) {
|
||||
return cpu->arch->uarch_str;
|
||||
}
|
||||
|
||||
MICROARCH get_uarch(struct uarch* arch) {
|
||||
return arch->uarch;
|
||||
}
|
||||
|
||||
void free_uarch_struct(struct uarch* arch) {
|
||||
free(arch->uarch_str);
|
||||
free(arch);
|
||||
|
||||
@@ -5,11 +5,98 @@
|
||||
|
||||
#include "midr.h"
|
||||
|
||||
// Identifiers of the microarchitectures known to the ARM backend.
// UARCH_UNKNOWN is the first enumerator (value 0). These values are also
// used as indexes of lookup tables such as isas_uarch[].
enum {
|
||||
UARCH_UNKNOWN,
|
||||
// ARM
|
||||
UARCH_ARM7,
|
||||
UARCH_ARM9,
|
||||
UARCH_ARM1136,
|
||||
UARCH_ARM1156,
|
||||
UARCH_ARM1176,
|
||||
UARCH_ARM11MPCORE,
|
||||
UARCH_CORTEX_A5,
|
||||
UARCH_CORTEX_A7,
|
||||
UARCH_CORTEX_A8,
|
||||
UARCH_CORTEX_A9,
|
||||
UARCH_CORTEX_A12,
|
||||
UARCH_CORTEX_A15,
|
||||
UARCH_CORTEX_A17,
|
||||
UARCH_CORTEX_A32,
|
||||
UARCH_CORTEX_A35,
|
||||
UARCH_CORTEX_A53,
|
||||
UARCH_CORTEX_A55r0, // ARM Cortex-A55 revision 0 (restricted dual-issue capabilities compared to revision 1+).
|
||||
UARCH_CORTEX_A55,
|
||||
UARCH_CORTEX_A57,
|
||||
UARCH_CORTEX_A65,
|
||||
UARCH_CORTEX_A72,
|
||||
UARCH_CORTEX_A73,
|
||||
UARCH_CORTEX_A75,
|
||||
UARCH_CORTEX_A76,
|
||||
UARCH_CORTEX_A77,
|
||||
UARCH_CORTEX_A78,
|
||||
UARCH_CORTEX_A510,
|
||||
UARCH_CORTEX_A710,
|
||||
UARCH_CORTEX_A715,
|
||||
UARCH_CORTEX_X1,
|
||||
UARCH_CORTEX_X2,
|
||||
UARCH_CORTEX_X3,
|
||||
UARCH_NEOVERSE_N1,
|
||||
UARCH_NEOVERSE_E1,
|
||||
UARCH_NEOVERSE_V1,
|
||||
UARCH_SCORPION,
|
||||
UARCH_KRAIT,
|
||||
UARCH_KYRO, // Qualcomm Kryo (the enumerator name is misspelled; kept as-is because other code refers to it).
|
||||
UARCH_FALKOR,
|
||||
UARCH_SAPHIRA,
|
||||
UARCH_DENVER,
|
||||
UARCH_DENVER2,
|
||||
UARCH_CARMEL,
|
||||
// SAMSUNG
|
||||
UARCH_EXYNOS_M1, // Samsung Exynos M1 (Exynos 8890 big cores)
|
||||
UARCH_EXYNOS_M2, // Samsung Exynos M2 (Exynos 8895 big cores)
|
||||
UARCH_EXYNOS_M3, // Samsung Exynos M3 (Exynos 9810 big cores)
|
||||
UARCH_EXYNOS_M4, // Samsung Exynos M4 (Exynos 9820 big cores)
|
||||
UARCH_EXYNOS_M5, // Samsung Exynos M5 (Exynos 9830 big cores)
|
||||
// APPLE
|
||||
UARCH_SWIFT, // Apple A6 and A6X processors.
|
||||
UARCH_CYCLONE, // Apple A7 processor.
|
||||
UARCH_TYPHOON, // Apple A8 and A8X processor
|
||||
UARCH_TWISTER, // Apple A9 and A9X processor.
|
||||
UARCH_HURRICANE, // Apple A10 and A10X processor.
|
||||
UARCH_MONSOON, // Apple A11 processor (big cores).
|
||||
UARCH_MISTRAL, // Apple A11 processor (little cores).
|
||||
UARCH_VORTEX, // Apple A12 processor (big cores).
|
||||
UARCH_TEMPEST, // Apple A12 processor (little cores).
|
||||
UARCH_LIGHTNING, // Apple A13 processor (big cores).
|
||||
UARCH_THUNDER, // Apple A13 processor (little cores).
|
||||
UARCH_ICESTORM, // Apple M1 processor (little cores).
|
||||
UARCH_FIRESTORM, // Apple M1 processor (big cores).
|
||||
UARCH_BLIZZARD, // Apple M2 processor (little cores).
|
||||
UARCH_AVALANCHE, // Apple M2 processor (big cores).
|
||||
UARCH_SAWTOOTH, // Apple M3 processor (little cores).
|
||||
UARCH_EVEREST, // Apple M3 processor (big cores).
|
||||
// CAVIUM
|
||||
UARCH_THUNDERX, // Cavium ThunderX
|
||||
UARCH_THUNDERX2, // Cavium ThunderX2 (originally Broadcom Vulcan).
|
||||
// MARVELL, BROADCOM, APPLIED MICRO, HISILICON
|
||||
UARCH_PJ4, // Marvell PJ4.
|
||||
UARCH_BRAHMA_B15, // Broadcom Brahma-B15.
|
||||
UARCH_BRAHMA_B53, // Broadcom Brahma-B53.
|
||||
UARCH_XGENE, // Applied Micro X-Gene.
|
||||
UARCH_TAISHAN_V110, // HiSilicon TaiShan v110
|
||||
UARCH_TAISHAN_V200, // HiSilicon TaiShan v200
|
||||
// PHYTIUM
|
||||
UARCH_XIAOMI, // Not to be confused with Xiaomi Inc
|
||||
};
|
||||
|
||||
typedef uint32_t MICROARCH;
|
||||
|
||||
struct uarch* get_uarch_from_midr(uint32_t midr, struct cpuInfo* cpu);
|
||||
int get_number_of_vpus(struct cpuInfo* cpu);
|
||||
int get_vpus_width(struct cpuInfo* cpu);
|
||||
bool has_fma_support(struct cpuInfo* cpu);
|
||||
char* get_str_uarch(struct cpuInfo* cpu);
|
||||
void free_uarch_struct(struct uarch* arch);
|
||||
MICROARCH get_uarch(struct uarch* arch);
|
||||
|
||||
#endif
|
||||
|
||||
@@ -28,6 +28,7 @@ struct args_struct {
|
||||
bool help_flag;
|
||||
bool raw_flag;
|
||||
bool accurate_pp;
|
||||
bool measure_max_frequency_flag;
|
||||
bool full_cpu_name_flag;
|
||||
bool logo_long;
|
||||
bool logo_short;
|
||||
@@ -50,6 +51,7 @@ const char args_chr[] = {
|
||||
/* [ARG_LOGO_INTEL_NEW] = */ 3,
|
||||
/* [ARG_LOGO_INTEL_OLD] = */ 4,
|
||||
/* [ARG_ACCURATE_PP] = */ 5,
|
||||
/* [ARG_MEASURE_MAX_FREQ] = */ 6,
|
||||
/* [ARG_DEBUG] = */ 'd',
|
||||
/* [ARG_VERBOSE] = */ 'v',
|
||||
/* [ARG_VERSION] = */ 'V',
|
||||
@@ -66,6 +68,7 @@ const char *args_str[] = {
|
||||
/* [ARG_LOGO_INTEL_NEW] = */ "logo-intel-new",
|
||||
/* [ARG_LOGO_INTEL_OLD] = */ "logo-intel-old",
|
||||
/* [ARG_ACCURATE_PP] = */ "accurate-pp",
|
||||
/* [ARG_MEASURE_MAX_FREQ] = */ "measure-max-freq",
|
||||
/* [ARG_DEBUG] = */ "debug",
|
||||
/* [ARG_VERBOSE] = */ "verbose",
|
||||
/* [ARG_VERSION] = */ "version",
|
||||
@@ -101,6 +104,10 @@ bool accurate_pp(void) {
|
||||
return args.accurate_pp;
|
||||
}
|
||||
|
||||
// Returns the measure_max_frequency_flag field of the global args struct,
// which parse_args sets to true when the ARG_MEASURE_MAX_FREQ option is found.
bool measure_max_frequency_flag(void) {
|
||||
return args.measure_max_frequency_flag;
|
||||
}
|
||||
|
||||
// Returns the full_cpu_name_flag field of the global args struct,
// which parse_args sets to true when the ARG_FULLCPUNAME option is found.
bool show_full_cpu_name(void) {
|
||||
return args.full_cpu_name_flag;
|
||||
}
|
||||
@@ -222,12 +229,20 @@ char* build_short_options(void) {
|
||||
memset(str, 0, sizeof(char) * (len*2 + 1));
|
||||
|
||||
#ifdef ARCH_X86
|
||||
sprintf(str, "%c:%c:%c%c%c%c%c%c%c%c%c%c%c",
|
||||
sprintf(str, "%c:%c:%c%c%c%c%c%c%c%c%c%c%c%c",
|
||||
c[ARG_STYLE], c[ARG_COLOR], c[ARG_HELP],
|
||||
c[ARG_RAW], c[ARG_FULLCPUNAME],
|
||||
c[ARG_LOGO_SHORT], c[ARG_LOGO_LONG],
|
||||
c[ARG_LOGO_INTEL_NEW], c[ARG_LOGO_INTEL_OLD],
|
||||
c[ARG_ACCURATE_PP], c[ARG_DEBUG], c[ARG_VERBOSE],
|
||||
c[ARG_ACCURATE_PP], c[ARG_MEASURE_MAX_FREQ],
|
||||
c[ARG_DEBUG], c[ARG_VERBOSE],
|
||||
c[ARG_VERSION]);
|
||||
#elif ARCH_ARM
|
||||
sprintf(str, "%c:%c:%c%c%c%c%c%c%c",
|
||||
c[ARG_STYLE], c[ARG_COLOR], c[ARG_HELP],
|
||||
c[ARG_LOGO_SHORT], c[ARG_LOGO_LONG],
|
||||
c[ARG_MEASURE_MAX_FREQ],
|
||||
c[ARG_DEBUG], c[ARG_VERBOSE],
|
||||
c[ARG_VERSION]);
|
||||
#else
|
||||
sprintf(str, "%c:%c:%c%c%c%c%c%c",
|
||||
@@ -270,8 +285,11 @@ bool parse_args(int argc, char* argv[]) {
|
||||
{args_str[ARG_LOGO_INTEL_NEW], no_argument, 0, args_chr[ARG_LOGO_INTEL_NEW] },
|
||||
{args_str[ARG_LOGO_INTEL_OLD], no_argument, 0, args_chr[ARG_LOGO_INTEL_OLD] },
|
||||
{args_str[ARG_ACCURATE_PP], no_argument, 0, args_chr[ARG_ACCURATE_PP] },
|
||||
{args_str[ARG_MEASURE_MAX_FREQ], no_argument, 0, args_chr[ARG_MEASURE_MAX_FREQ] },
|
||||
{args_str[ARG_FULLCPUNAME], no_argument, 0, args_chr[ARG_FULLCPUNAME] },
|
||||
{args_str[ARG_RAW], no_argument, 0, args_chr[ARG_RAW] },
|
||||
#elif ARCH_ARM
|
||||
{args_str[ARG_MEASURE_MAX_FREQ], no_argument, 0, args_chr[ARG_MEASURE_MAX_FREQ] },
|
||||
#endif
|
||||
{args_str[ARG_LOGO_SHORT], no_argument, 0, args_chr[ARG_LOGO_SHORT] },
|
||||
{args_str[ARG_LOGO_LONG], no_argument, 0, args_chr[ARG_LOGO_LONG] },
|
||||
@@ -313,6 +331,9 @@ bool parse_args(int argc, char* argv[]) {
|
||||
else if(opt == args_chr[ARG_ACCURATE_PP]) {
|
||||
args.accurate_pp = true;
|
||||
}
|
||||
else if(opt == args_chr[ARG_MEASURE_MAX_FREQ]) {
|
||||
args.measure_max_frequency_flag = true;
|
||||
}
|
||||
else if(opt == args_chr[ARG_FULLCPUNAME]) {
|
||||
args.full_cpu_name_flag = true;
|
||||
}
|
||||
|
||||
@@ -29,6 +29,7 @@ enum {
|
||||
ARG_LOGO_INTEL_NEW,
|
||||
ARG_LOGO_INTEL_OLD,
|
||||
ARG_ACCURATE_PP,
|
||||
ARG_MEASURE_MAX_FREQ,
|
||||
ARG_DEBUG,
|
||||
ARG_VERBOSE,
|
||||
ARG_VERSION
|
||||
@@ -43,6 +44,7 @@ int max_arg_str_length(void);
|
||||
bool parse_args(int argc, char* argv[]);
|
||||
bool show_help(void);
|
||||
bool accurate_pp(void);
|
||||
bool measure_max_frequency_flag(void);
|
||||
bool show_full_cpu_name(void);
|
||||
bool show_logo_long(void);
|
||||
bool show_logo_short(void);
|
||||
|
||||
@@ -105,6 +105,19 @@ $C1 MMM :MMM NMM dMMK dMMX MMN \
|
||||
$C1 MMM :MMM NMM dMMMoo OMM0....:Nx. MMN \
|
||||
$C1 MMM :WWW XWW lONMM 'xXMMMMNOc MMN "
|
||||
|
||||
#define ASCII_HYGON \
|
||||
"$C1 \
|
||||
$C1 \
|
||||
$C1 \
|
||||
$C1 ## ## ## ## ###### ###### ## # \
|
||||
$C1 ##....## ## ## ## ## ## #### # \
|
||||
$C1 ######## ## ## ##. ## ## # #### \
|
||||
$C1 ## ## ## *######. ###### # ## \
|
||||
$C1 \
|
||||
$C1 \
|
||||
$C1 \
|
||||
$C1 "
|
||||
|
||||
#define ASCII_SNAPD \
|
||||
" $C1@@$C2######## \
|
||||
$C1@@@@@$C2########### \
|
||||
@@ -145,6 +158,25 @@ $C2 Exynos \
|
||||
$C2 \
|
||||
$C2 "
|
||||
|
||||
#define ASCII_KUNPENG \
|
||||
"$C2 . \
|
||||
$C2 .. \
|
||||
$C2 .## \
|
||||
$C1 .$CR $C2.###. \
|
||||
$C1 ..$CR $C2#####. \
|
||||
$C1 .#.$CR $C2.#######. \
|
||||
$C1 .####.$CR $C2.#######. \
|
||||
$C1 ..######*$CR $C2.#######. . \
|
||||
$C1 .#########*$CR $C2.#######* . \
|
||||
$C1 ######*$CR $C2.#######. .#. \
|
||||
$C1*#######*$CR $C2.#######. *##. \
|
||||
$C1 ##*$CR $C2.#######. ####### \
|
||||
$C2 ###.$CR $C1#####$C2 *### \
|
||||
$C1 *########## \
|
||||
$C1 *######## \
|
||||
$C1 #####. \
|
||||
$C1 *###. "
|
||||
|
||||
#define ASCII_KIRIN \
|
||||
"$C1 ####### \
|
||||
$C1 ##### #################### \
|
||||
@@ -341,6 +373,27 @@ $C1##########@@@@@@@@@@@@@@@@############## \
|
||||
$C1######################################## \
|
||||
$C1 #################################### "
|
||||
|
||||
#define ASCII_NVIDIA \
|
||||
"$C1 'cccccccccccccccccccccccccc \
|
||||
$C1 ;oooooooooooooooooooooooool \
|
||||
$C1 .:::. .oooooooooooooooooool \
|
||||
$C1 .:cll; ,c:::. cooooooooooooool \
|
||||
$C1 ,clo' ;. oolc: ooooooooooool \
|
||||
$C1.cloo ;cclo . .olc. coooooooool \
|
||||
$C1oooo :lo, ;ll; looc :oooooooool \
|
||||
$C1 oooc ool. ;oooc;clol :looooooooool \
|
||||
$C1 :ooc ,ol; ;oooooo. .cloo; loool \
|
||||
$C1 ool; .olc. ,:lool .lool \
|
||||
$C1 ool:. ,::::ccloo. :clooool \
|
||||
$C1 oolc::. ':cclooooooool \
|
||||
$C1 ;oooooooooooooooooooooooool \
|
||||
$C1 \
|
||||
$C1 \
|
||||
$C2######. ## ## ## ###### ## ### \
|
||||
$C2## ## ## ## ## ## ## ## #: :# \
|
||||
$C2## ## ## ## ## ## ## ## ####### \
|
||||
$C2## ## ### ## ###### ## ## ## "
|
||||
|
||||
// --------------------- LONG LOGOS ------------------------- //
|
||||
#define ASCII_AMD_L \
|
||||
"$C1 \
|
||||
@@ -473,6 +526,23 @@ $C1 ###########. ############ \
|
||||
$C1 ################ \
|
||||
$C1 ####### "
|
||||
|
||||
#define ASCII_NVIDIA_L \
|
||||
"$C1 MMMMMMMMMMMMMMMMMMMMMMMMMMMMMM \
|
||||
$C1 MMMMMMMMMMMMMMMMMMMMMMMMMMMMMM \
|
||||
$C1 .:: 'MMMMMMMMMMMMMMMMMMMMMMMMM \
|
||||
$C1 ccllooo;:;. ;MMMMMMMMMMMMMMMMMM \
|
||||
$C1 cloc :ooollcc: :MMMMMMMMMMMMMMM \
|
||||
$C1 cloc :ccl; lolc, ;MMMMMMMMMMMM \
|
||||
$C1.cloo: :clo ;c: .ool; MMMMMMMMMMM \
|
||||
$C1 ooo: ooo :ool, .cloo. ;lMMMMMMMMMMM \
|
||||
$C1 ooo: ooc :ooooccooo. :MMMM lMMMMMMM \
|
||||
$C1 ooc. ool: :oooooo' ,cloo. MMMM \
|
||||
$C1 ool:. olc: .:cloo. :MMMM \
|
||||
$C1 olc, ;:::cccloo. :MMMMMMMM \
|
||||
$C1 olcc::; ,:ccloMMMMMMMMM \
|
||||
$C1 :......oMMMMMMMMMMMMMMMMMMMMMM \
|
||||
$C1 :lllMMMMMMMMMMMMMMMMMMMMMMMMMM "
|
||||
|
||||
typedef struct ascii_logo asciiL;
|
||||
|
||||
// +-----------------------------------------------------------------------------------------------------------------+
|
||||
@@ -481,10 +551,12 @@ typedef struct ascii_logo asciiL;
|
||||
asciiL logo_amd = { ASCII_AMD, 39, 15, false, {C_FG_WHITE, C_FG_GREEN}, {C_FG_WHITE, C_FG_GREEN} };
|
||||
asciiL logo_intel = { ASCII_INTEL, 48, 14, false, {C_FG_CYAN}, {C_FG_CYAN, C_FG_WHITE} };
|
||||
asciiL logo_intel_new = { ASCII_INTEL_NEW, 51, 9, false, {C_FG_CYAN}, {C_FG_CYAN, C_FG_WHITE} };
|
||||
asciiL logo_hygon = { ASCII_HYGON, 51, 11, false, {C_FG_RED}, {C_FG_RED, C_FG_WHITE} };
|
||||
asciiL logo_snapd = { ASCII_SNAPD, 39, 16, false, {C_FG_RED, C_FG_WHITE}, {C_FG_RED, C_FG_WHITE} };
|
||||
asciiL logo_mtk = { ASCII_MTK, 59, 5, false, {C_FG_BLUE, C_FG_YELLOW}, {C_FG_BLUE, C_FG_YELLOW} };
|
||||
asciiL logo_exynos = { ASCII_EXYNOS, 22, 13, true, {C_BG_BLUE, C_FG_WHITE}, {C_FG_BLUE, C_FG_WHITE} };
|
||||
asciiL logo_kirin = { ASCII_KIRIN, 53, 12, false, {C_FG_RED}, {C_FG_WHITE, C_FG_RED} };
|
||||
asciiL logo_kunpeng = { ASCII_KUNPENG, 48, 17, false, {C_FG_RED, C_FG_WHITE}, {C_FG_WHITE, C_FG_RED} };
|
||||
asciiL logo_broadcom = { ASCII_BROADCOM, 44, 19, false, {C_FG_WHITE, C_FG_RED}, {C_FG_WHITE, C_FG_RED} };
|
||||
asciiL logo_arm = { ASCII_ARM, 42, 5, false, {C_FG_CYAN}, {C_FG_WHITE, C_FG_CYAN} };
|
||||
asciiL logo_ibm = { ASCII_IBM, 42, 9, false, {C_FG_CYAN, C_FG_WHITE}, {C_FG_CYAN, C_FG_WHITE} };
|
||||
@@ -496,6 +568,7 @@ asciiL logo_riscv = { ASCII_RISCV, 63, 18, false, {C_FG_CYAN, C_FG_Y
|
||||
asciiL logo_sifive = { ASCII_SIFIVE, 48, 19, true, {C_BG_WHITE, C_BG_BLACK}, {C_FG_WHITE, C_FG_BLUE} };
|
||||
asciiL logo_starfive = { ASCII_STARFIVE, 33, 17, false, {C_FG_WHITE}, {C_FG_WHITE, C_FG_BLUE} };
|
||||
asciiL logo_sipeed = { ASCII_SIPEED, 41, 16, true, {C_BG_RED, C_BG_WHITE}, {C_FG_RED, C_FG_WHITE} };
|
||||
asciiL logo_nvidia = { ASCII_NVIDIA, 45, 19, false, {C_FG_GREEN, C_FG_WHITE}, {C_FG_WHITE, C_FG_GREEN} };
|
||||
|
||||
// Long variants | ----------------------------------------------------------------------------------------------------------------|
|
||||
asciiL logo_amd_l = { ASCII_AMD_L, 62, 19, true, {C_BG_WHITE, C_BG_GREEN}, {C_FG_WHITE, C_FG_GREEN} };
|
||||
@@ -505,6 +578,7 @@ asciiL logo_arm_l = { ASCII_ARM_L, 60, 8, true, {C_BG_CYAN},
|
||||
asciiL logo_ibm_l = { ASCII_IBM_L, 62, 13, true, {C_BG_CYAN, C_FG_WHITE}, {C_FG_CYAN, C_FG_WHITE} };
|
||||
asciiL logo_starfive_l = { ASCII_STARFIVE_L, 50, 22, false, {C_FG_WHITE}, {C_FG_WHITE, C_FG_BLUE} };
|
||||
asciiL logo_sifive_l = { ASCII_SIFIVE_L, 53, 21, true, {C_BG_WHITE, C_BG_BLACK}, {C_FG_WHITE, C_FG_CYAN} };
|
||||
asciiL logo_nvidia_l = { ASCII_NVIDIA_L, 50, 15, false, {C_FG_GREEN, C_FG_WHITE}, {C_FG_WHITE, C_FG_GREEN} };
|
||||
asciiL logo_unknown = { NULL, 0, 0, false, {COLOR_NONE}, {COLOR_NONE, COLOR_NONE} };
|
||||
|
||||
#endif
|
||||
|
||||
@@ -145,17 +145,25 @@ char* get_str_l3(struct cache* cach) {
|
||||
|
||||
char* get_str_freq(struct frequency* freq) {
|
||||
// 1 for the optional '~', up to 5 for the number (e.g. "3.500"), 1 for the space, 3 for '(M/G)Hz' plus 1 for '\0'
|
||||
uint32_t size = (5+1+3+1);
|
||||
uint32_t size = (1+5+1+3+1);
|
||||
assert(strlen(STRING_UNKNOWN)+1 <= size);
|
||||
char* string = emalloc(sizeof(char)*size);
|
||||
memset(string, 0, sizeof(char)*size);
|
||||
char* string = ecalloc(size, sizeof(char));
|
||||
|
||||
if(freq->max == UNKNOWN_DATA || freq->max < 0)
|
||||
if(freq->max == UNKNOWN_DATA || freq->max < 0) {
|
||||
snprintf(string,strlen(STRING_UNKNOWN)+1,STRING_UNKNOWN);
|
||||
else if(freq->max >= 1000)
|
||||
}
|
||||
else if(freq->max >= 1000) {
|
||||
if (freq->measured)
|
||||
snprintf(string,size,"~%.3f "STRING_GIGAHERZ,(float)(freq->max)/1000);
|
||||
else
|
||||
snprintf(string,size,"%.3f "STRING_GIGAHERZ,(float)(freq->max)/1000);
|
||||
}
|
||||
else {
|
||||
if (freq->measured)
|
||||
snprintf(string,size,"~%d "STRING_MEGAHERZ,freq->max);
|
||||
else
|
||||
snprintf(string,size,"%d "STRING_MEGAHERZ,freq->max);
|
||||
}
|
||||
|
||||
return string;
|
||||
}
|
||||
|
||||
@@ -8,6 +8,7 @@ enum {
|
||||
// ARCH_X86
|
||||
CPU_VENDOR_INTEL,
|
||||
CPU_VENDOR_AMD,
|
||||
CPU_VENDOR_HYGON,
|
||||
// ARCH_ARM
|
||||
CPU_VENDOR_ARM,
|
||||
CPU_VENDOR_APPLE,
|
||||
@@ -16,7 +17,7 @@ enum {
|
||||
CPU_VENDOR_NVIDIA,
|
||||
CPU_VENDOR_APM,
|
||||
CPU_VENDOR_QUALCOMM,
|
||||
CPU_VENDOR_HUAWUEI,
|
||||
CPU_VENDOR_HUAWEI,
|
||||
CPU_VENDOR_SAMSUNG,
|
||||
CPU_VENDOR_MARVELL,
|
||||
CPU_VENDOR_PHYTIUM,
|
||||
@@ -32,6 +33,7 @@ enum {
|
||||
enum {
|
||||
HV_VENDOR_KVM,
|
||||
HV_VENDOR_QEMU,
|
||||
HV_VENDOR_VBOX,
|
||||
HV_VENDOR_HYPERV,
|
||||
HV_VENDOR_VMWARE,
|
||||
HV_VENDOR_XEN,
|
||||
@@ -56,6 +58,8 @@ typedef int32_t VENDOR;
|
||||
// Frequency information of a CPU.
struct frequency {
|
||||
// NOTE(review): presumably the base frequency, in the same unit as max - confirm
int32_t base;
|
||||
// Max frequency. get_str_freq prints it as MHz (or divided by 1000, as GHz)
// and treats UNKNOWN_DATA or a negative value as unknown.
int32_t max;
|
||||
// Indicates if max frequency was measured
|
||||
bool measured;
|
||||
};
|
||||
|
||||
struct hypervisor {
|
||||
|
||||
195
src/common/freq.c
Normal file
195
src/common/freq.c
Normal file
@@ -0,0 +1,195 @@
|
||||
#ifdef __linux__
|
||||
|
||||
#define _GNU_SOURCE
|
||||
|
||||
#include <time.h>
|
||||
#include <stdio.h>
|
||||
#include <stdint.h>
|
||||
#include <string.h>
|
||||
#include <errno.h>
|
||||
#include <unistd.h>
|
||||
#include <asm/unistd.h>
|
||||
#include <sys/ioctl.h>
|
||||
#include <linux/perf_event.h>
|
||||
|
||||
#include "global.h"
|
||||
#include "cpu.h"
|
||||
|
||||
// Thin wrapper that issues the perf_event_open system call through
// syscall(), forwarding every argument untouched. The value reported by
// syscall() is narrowed to int before being returned.
static long
perf_event_open(struct perf_event_attr *hw_event, pid_t pid,
                int cpu, int group_fd, unsigned long flags) {
  const int result = syscall(__NR_perf_event_open, hw_event, pid, cpu,
                             group_fd, flags);
  return result;
}
|
||||
|
||||
// Emits one "nop" instruction as a volatile asm statement.
#define INSERT_ASM_ONCE __asm volatile("nop");

// Each of the following macros repeats the previous one 10 times.
// The last line of every macro carries no trailing backslash, so the
// definition does not depend on the following line being empty.
#define INSERT_ASM_10_TIMES \
  INSERT_ASM_ONCE           \
  INSERT_ASM_ONCE           \
  INSERT_ASM_ONCE           \
  INSERT_ASM_ONCE           \
  INSERT_ASM_ONCE           \
  INSERT_ASM_ONCE           \
  INSERT_ASM_ONCE           \
  INSERT_ASM_ONCE           \
  INSERT_ASM_ONCE           \
  INSERT_ASM_ONCE

#define INSERT_ASM_100_TIMES \
  INSERT_ASM_10_TIMES        \
  INSERT_ASM_10_TIMES        \
  INSERT_ASM_10_TIMES        \
  INSERT_ASM_10_TIMES        \
  INSERT_ASM_10_TIMES        \
  INSERT_ASM_10_TIMES        \
  INSERT_ASM_10_TIMES        \
  INSERT_ASM_10_TIMES        \
  INSERT_ASM_10_TIMES        \
  INSERT_ASM_10_TIMES

#define INSERT_ASM_1000_TIMES \
  INSERT_ASM_100_TIMES        \
  INSERT_ASM_100_TIMES        \
  INSERT_ASM_100_TIMES        \
  INSERT_ASM_100_TIMES        \
  INSERT_ASM_100_TIMES        \
  INSERT_ASM_100_TIMES        \
  INSERT_ASM_100_TIMES        \
  INSERT_ASM_100_TIMES        \
  INSERT_ASM_100_TIMES        \
  INSERT_ASM_100_TIMES

// Executes `iters` loop iterations, each one made of 4000 nop
// instructions (4 x INSERT_ASM_1000_TIMES). It produces no result: it
// only exists to keep the core busy while cycles are being counted.
void nop_function(uint64_t iters) {
  for (uint64_t i = 0; i < iters; i++) {
    INSERT_ASM_1000_TIMES
    INSERT_ASM_1000_TIMES
    INSERT_ASM_1000_TIMES
    INSERT_ASM_1000_TIMES
  }
}
|
||||
|
||||
// Run the nop_function with the number of iterations specified and
|
||||
// measure both the time and number of cycles
|
||||
int measure_freq_iters(uint64_t iters, uint32_t core, double* freq) {
|
||||
clockid_t clock = CLOCK_PROCESS_CPUTIME_ID;
|
||||
struct timespec start, end;
|
||||
struct perf_event_attr pe;
|
||||
uint64_t cycles;
|
||||
int fd;
|
||||
int pid = 0;
|
||||
memset(&pe, 0, sizeof(struct perf_event_attr));
|
||||
pe.type = PERF_TYPE_HARDWARE;
|
||||
pe.size = sizeof(struct perf_event_attr);
|
||||
pe.config = PERF_COUNT_HW_CPU_CYCLES;
|
||||
pe.disabled = 1;
|
||||
pe.exclude_kernel = 1;
|
||||
pe.exclude_hv = 1;
|
||||
|
||||
fd = perf_event_open(&pe, pid, core, -1, 0);
|
||||
if (fd == -1) {
|
||||
perror("perf_event_open");
|
||||
if (errno == EPERM || errno == EACCES) {
|
||||
printErr("You may not have permission to collect stats.\n"\
|
||||
"Consider tweaking /proc/sys/kernel/perf_event_paranoid or running as root");
|
||||
}
|
||||
return -1;
|
||||
}
|
||||
|
||||
if (clock_gettime(clock, &start) == -1) {
|
||||
perror("clock_gettime");
|
||||
return -1;
|
||||
}
|
||||
if(ioctl(fd, PERF_EVENT_IOC_RESET, 0) == -1) {
|
||||
perror("ioctl");
|
||||
return -1;
|
||||
}
|
||||
if(ioctl(fd, PERF_EVENT_IOC_ENABLE, 0) == -1) {
|
||||
perror("ioctl");
|
||||
return -1;
|
||||
}
|
||||
|
||||
nop_function(iters);
|
||||
|
||||
ssize_t ret = read(fd, &cycles, sizeof(uint64_t));
|
||||
if (ret == -1) {
|
||||
perror("read");
|
||||
return -1;
|
||||
}
|
||||
if (ret != sizeof(uint64_t)) {
|
||||
printErr("Read returned %d, expected %d", ret, sizeof(uint64_t));
|
||||
return -1;
|
||||
}
|
||||
if(ioctl(fd, PERF_EVENT_IOC_DISABLE, 0) == -1) {
|
||||
perror("ioctl");
|
||||
return -1;
|
||||
}
|
||||
if (clock_gettime(clock, &end) == -1) {
|
||||
perror("clock_gettime");
|
||||
return -1;
|
||||
}
|
||||
|
||||
uint64_t nsecs = (end.tv_sec*1e9 + end.tv_nsec) - (start.tv_sec*1e9 + start.tv_nsec);
|
||||
uint64_t usecs = nsecs/1000;
|
||||
*freq = cycles/((double)usecs);
|
||||
return 0;
|
||||
}
|
||||
|
||||
// Return a good number of iterations to run the nop_function in
// order to get a precise measurement of the frequency without taking
// too much time.
//
// frequency: rough frequency estimation (same unit as produced by
//            measure_freq_iters).
//
// The estimation is truncated to a multiple of 100 to reduce variability.
// Estimations below 100 (including negative values and NaN) are treated
// as 100, so the function never returns 0 iterations.
uint64_t get_num_iters_from_freq(double frequency) {
  const uint64_t min_freq = 100;
  // Each iteration of nop_function executes 4 * 1000 instructions
  const uint64_t ops_per_iter = 4 * 1000;
  const uint64_t scale = 10000000;

  uint64_t freq_trunc = min_freq;
  if (frequency >= (double) min_freq) {
    // Truncate to reduce variability
    freq_trunc = ((uint64_t) frequency / 100) * 100;
  }

  // scale is an exact multiple of ops_per_iter, so integer math is exact
  return freq_trunc * (scale / ops_per_iter);
}
|
||||
|
||||
// Differences between x86 measure_frequency and this measure_max_frequency:
|
||||
// - measure_frequency employs all cores simultaneously whereas
|
||||
// measure_max_frequency only employs 1.
|
||||
// - measure_frequency runs the computation and checks /proc/cpuinfo whereas
|
||||
// measure_max_frequency does not rely on /proc/cpuinfo and simply
|
||||
// counts cpu cycles to measure frequency.
|
||||
// - measure_frequency uses actual computation while measuring the frequency
|
||||
// whereas measure_max_frequency uses nop instructions. This makes the former
|
||||
// x86 dependant whereas the latter is architecture independant.
|
||||
int64_t measure_max_frequency(uint32_t core) {
|
||||
if (!bind_to_cpu(core)) {
|
||||
printErr("Failed binding the process to CPU %d", core);
|
||||
return UNKNOWN_DATA;
|
||||
}
|
||||
|
||||
// First, get very rough estimation of clock cycle to
|
||||
// compute a reasonable value for the iterations
|
||||
double estimation_freq, frequency;
|
||||
uint64_t iters = 100000;
|
||||
if (measure_freq_iters(iters, core, &estimation_freq) == -1)
|
||||
return UNKNOWN_DATA;
|
||||
|
||||
if (estimation_freq <= 0.0) {
|
||||
printErr("First frequency measurement yielded an invalid value: %f", estimation_freq);
|
||||
return UNKNOWN_DATA;
|
||||
}
|
||||
iters = get_num_iters_from_freq(estimation_freq);
|
||||
printWarn("Running frequency measurement with %ld iterations on core %d...", iters, core);
|
||||
|
||||
// Now perform actual measurement
|
||||
const char* frequency_banner = "cpufetch is measuring the max frequency...";
|
||||
printf("%s", frequency_banner);
|
||||
fflush(stdout);
|
||||
|
||||
if (measure_freq_iters(iters, core, &frequency) == -1)
|
||||
return UNKNOWN_DATA;
|
||||
|
||||
// Clean screen once measurement is finished
|
||||
printf("\r%*c\r", (int) strlen(frequency_banner), ' ');
|
||||
|
||||
// Discard last digit in the frequency, which should help providing
|
||||
// more reliable and predictable values.
|
||||
return (((int) frequency + 5)/10) * 10;
|
||||
}
|
||||
|
||||
#endif // #ifdef __linux__
|
||||
6
src/common/freq.h
Normal file
6
src/common/freq.h
Normal file
@@ -0,0 +1,6 @@
|
||||
#ifndef __COMMON_FREQ__
#define __COMMON_FREQ__

// Needed for int64_t / uint32_t, so that this header is self-contained
#include <stdint.h>

// Measures the max frequency of the given core by counting CPU cycles
// while running nop instructions. Returns UNKNOWN_DATA on failure.
int64_t measure_max_frequency(uint32_t core);

#endif
|
||||
@@ -1,3 +1,14 @@
|
||||
#ifdef _WIN32
|
||||
#define NOMINMAX
|
||||
#include <windows.h>
|
||||
#elif defined __linux__
|
||||
#define _GNU_SOURCE
|
||||
#include <sched.h>
|
||||
#elif defined __FreeBSD__
|
||||
#include <sys/param.h>
|
||||
#include <sys/cpuset.h>
|
||||
#endif
|
||||
|
||||
#include <stdarg.h>
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
@@ -21,7 +32,7 @@
|
||||
#endif
|
||||
|
||||
#ifdef ARCH_X86
|
||||
static const char* ARCH_STR = "x86_64 build";
|
||||
static const char* ARCH_STR = "x86 / x86_64 build";
|
||||
#include "../x86/cpuid.h"
|
||||
#elif ARCH_PPC
|
||||
static const char* ARCH_STR = "PowerPC build";
|
||||
@@ -51,7 +62,7 @@
|
||||
#endif
|
||||
|
||||
#ifndef GIT_FULL_VERSION
|
||||
static const char* VERSION = "1.04";
|
||||
static const char* VERSION = "1.05";
|
||||
#endif
|
||||
|
||||
enum {
|
||||
@@ -61,6 +72,14 @@ enum {
|
||||
|
||||
int LOG_LEVEL;
|
||||
|
||||
// Writes to `stream` the instructions to report a bug in the project
// issue tracker. The text depends on the architecture the binary was
// built for; nothing is written when none of the branches applies.
void printBugMessage(FILE *restrict stream) {
#if defined(ARCH_X86) || defined(ARCH_PPC)
  fputs("Please, create a new issue with this error message, the output of 'cpufetch' and 'cpufetch --debug' on https://github.com/Dr-Noob/cpufetch/issues\n", stream);
#elif ARCH_ARM
  fputs("Please, create a new issue with this error message, your smartphone/computer model, the output of 'cpufetch --verbose' and 'cpufetch --debug' on https://github.com/Dr-Noob/cpufetch/issues\n", stream);
#endif
}
|
||||
|
||||
void printWarn(const char *fmt, ...) {
|
||||
if(LOG_LEVEL == LOG_LEVEL_VERBOSE) {
|
||||
int buffer_size = 4096;
|
||||
@@ -95,10 +114,40 @@ void printBug(const char *fmt, ...) {
|
||||
fprintf(stderr,RED "[ERROR]: "RESET "%s\n",buffer);
|
||||
fprintf(stderr,"[VERSION]: ");
|
||||
print_version(stderr);
|
||||
#if defined(ARCH_X86) || defined(ARCH_PPC)
|
||||
fprintf(stderr, "Please, create a new issue with this error message, the output of 'cpufetch' and 'cpufetch --debug' on https://github.com/Dr-Noob/cpufetch/issues\n");
|
||||
#elif ARCH_ARM
|
||||
fprintf(stderr, "Please, create a new issue with this error message, your smartphone/computer model, the output of 'cpufetch --verbose' and 'cpufetch --debug' on https://github.com/Dr-Noob/cpufetch/issues\n");
|
||||
printBugMessage(stderr);
|
||||
}
|
||||
|
||||
// Tells whether the given version string belongs to a release build,
// i.e. whether it contains no '-' character at all.
bool isReleaseVersion(char *git_full_version) {
  const char *dash = strchr(git_full_version, '-');
  return dash == NULL;
}
|
||||
|
||||
/// The unknown uarch errors are by far the most common error a user will encounter.
|
||||
/// Rather than using the generic printBug function, which asks the user to report
|
||||
/// the problem on the issues webpage, this function will check if the program is
|
||||
/// the release version. In such case, support for this feature is most likely already
|
||||
/// in the last version, so just tell the user to compile that one and not report this
|
||||
/// in github.
|
||||
void printBugCheckRelease(const char *fmt, ...) {
|
||||
int buffer_size = 4096;
|
||||
char buffer[buffer_size];
|
||||
va_list args;
|
||||
va_start(args, fmt);
|
||||
vsnprintf(buffer,buffer_size, fmt, args);
|
||||
va_end(args);
|
||||
|
||||
fprintf(stderr, RED "[ERROR]: "RESET "%s\n", buffer);
|
||||
fprintf(stderr, "[VERSION]: ");
|
||||
print_version(stderr);
|
||||
|
||||
#ifdef GIT_FULL_VERSION
|
||||
if (isReleaseVersion(GIT_FULL_VERSION)) {
|
||||
fprintf(stderr, RED "[ERROR]: "RESET "You are using an outdated version of cpufetch. Please compile cpufetch from source (see https://github.com/Dr-Noob/cpufetch?tab=readme-ov-file#22-building-from-source)");
|
||||
}
|
||||
else {
|
||||
printBugMessage(stderr);
|
||||
}
|
||||
#else
|
||||
printBugMessage(stderr);
|
||||
#endif
|
||||
}
|
||||
|
||||
@@ -161,6 +210,34 @@ void* erealloc(void *ptr, size_t size) {
|
||||
return newptr;
|
||||
}
|
||||
|
||||
#ifndef __APPLE__
// Restricts execution to the CPU with index cpu_id.
//  - Windows: sets the affinity mask of the current process.
//  - Linux:   sets the affinity with sched_setaffinity (pid 0).
//  - FreeBSD: sets the affinity with cpuset_setaffinity (CPU_WHICH_TID, id -1).
// Returns true on success. Returns false if cpu_id is out of range, if the
// underlying call fails or if the platform is not one of the above.
bool bind_to_cpu(int cpu_id) {
  if (cpu_id < 0)
    return false;

  #ifdef _WIN32
    // The mask only has as many bits as DWORD_PTR
    if ((size_t) cpu_id >= sizeof(DWORD_PTR) * 8)
      return false;

    HANDLE process = GetCurrentProcess();
    // Shift in DWORD_PTR width: '1 << cpu_id' is an int shift
    DWORD_PTR processAffinityMask = ((DWORD_PTR) 1) << cpu_id;
    return SetProcessAffinityMask(process, processAffinityMask) != 0;
  #elif defined __linux__
    cpu_set_t currentCPU;
    CPU_ZERO(&currentCPU);
    CPU_SET(cpu_id, &currentCPU);
    if (sched_setaffinity (0, sizeof(currentCPU), &currentCPU) == -1) {
      printWarn("sched_setaffinity: %s", strerror(errno));
      return false;
    }
    return true;
  #elif defined __FreeBSD__
    cpuset_t currentCPU;
    CPU_ZERO(&currentCPU);
    CPU_SET(cpu_id, &currentCPU);
    if(cpuset_setaffinity(CPU_LEVEL_WHICH, CPU_WHICH_TID, -1, sizeof(cpuset_t), &currentCPU) == -1) {
      printWarn("cpuset_setaffinity: %s", strerror(errno));
      return false;
    }
    return true;
  #else
    // No known way to bind on this platform
    return false;
  #endif
}
#endif
|
||||
|
||||
void print_version(FILE *restrict stream) {
|
||||
#ifdef GIT_FULL_VERSION
|
||||
fprintf(stream, "cpufetch %s (%s %s)\n", GIT_FULL_VERSION, OS_STR, ARCH_STR);
|
||||
|
||||
@@ -12,12 +12,16 @@ void set_log_level(bool verbose);
|
||||
void printWarn(const char *fmt, ...);
|
||||
void printErr(const char *fmt, ...);
|
||||
void printBug(const char *fmt, ...);
|
||||
void printBugCheckRelease(const char *fmt, ...);
|
||||
int min(int a, int b);
|
||||
int max(int a, int b);
|
||||
char *strremove(char *str, const char *sub);
|
||||
void* emalloc(size_t size);
|
||||
void* ecalloc(size_t nmemb, size_t size);
|
||||
void* erealloc(void *ptr, size_t size);
|
||||
#ifndef __APPLE__
|
||||
bool bind_to_cpu(int cpu_id);
|
||||
#endif
|
||||
void print_version(FILE *restrict stream);
|
||||
|
||||
#endif
|
||||
|
||||
@@ -30,11 +30,17 @@ void print_help(char *argv[]) {
|
||||
#ifdef ARCH_X86
|
||||
#ifdef __linux__
|
||||
printf(" --%s %*s Compute the peak performance accurately (measure the CPU frequency instead of using the maximum)\n", t[ARG_ACCURATE_PP], (int) (max_len-strlen(t[ARG_ACCURATE_PP])), "");
|
||||
#endif
|
||||
printf(" --%s %*s Measure the max CPU frequency instead of reading it\n", t[ARG_MEASURE_MAX_FREQ], (int) (max_len-strlen(t[ARG_MEASURE_MAX_FREQ])), "");
|
||||
#endif // __linux__
|
||||
printf(" --%s %*s Show the old Intel logo\n", t[ARG_LOGO_INTEL_OLD], (int) (max_len-strlen(t[ARG_LOGO_INTEL_OLD])), "");
|
||||
printf(" --%s %*s Show the new Intel logo\n", t[ARG_LOGO_INTEL_NEW], (int) (max_len-strlen(t[ARG_LOGO_INTEL_NEW])), "");
|
||||
printf(" -%c, --%s %*s Show the full CPU name (do not abbreviate it)\n", c[ARG_FULLCPUNAME], t[ARG_FULLCPUNAME], (int) (max_len-strlen(t[ARG_FULLCPUNAME])), "");
|
||||
printf(" -%c, --%s %*s Print raw cpuid data (debug purposes)\n", c[ARG_RAW], t[ARG_RAW], (int) (max_len-strlen(t[ARG_RAW])), "");
|
||||
#endif // ARCH_X86
|
||||
#ifdef ARCH_ARM
|
||||
#ifdef __linux__
|
||||
printf(" --%s %*s Measure the max CPU frequency instead of reading it\n", t[ARG_MEASURE_MAX_FREQ], (int) (max_len-strlen(t[ARG_MEASURE_MAX_FREQ])), "");
|
||||
#endif
|
||||
#endif
|
||||
printf(" -%c, --%s %*s Print this help and exit\n", c[ARG_HELP], t[ARG_HELP], (int) (max_len-strlen(t[ARG_HELP])), "");
|
||||
printf(" -%c, --%s %*s Print cpufetch version and exit\n", c[ARG_VERSION], t[ARG_VERSION], (int) (max_len-strlen(t[ARG_VERSION])), "");
|
||||
@@ -45,7 +51,7 @@ void print_help(char *argv[]) {
|
||||
printf(" * \"amd\": Use AMD color scheme \n");
|
||||
printf(" * \"ibm\", Use IBM color scheme \n");
|
||||
printf(" * \"arm\": Use ARM color scheme \n");
|
||||
printf(" * \"rockchip\": Use ARM color scheme \n");
|
||||
printf(" * \"rockchip\": Use Rockchip color scheme \n");
|
||||
printf(" * \"sifive\": Use SiFive color scheme \n");
|
||||
printf(" * custom: If the argument of --color does not match any of the previous strings, a custom scheme can be specified.\n");
|
||||
printf(" 5 colors must be given in RGB with the format: R,G,B:R,G,B:...\n");
|
||||
@@ -80,6 +86,11 @@ void print_help(char *argv[]) {
|
||||
printf(" --accurate-pp option, which will measure the AVX frequency and show a more precise estimation\n");
|
||||
printf(" (this option is only available in x86 architectures).\n");
|
||||
printf(" To precisely measure peak performance, see: https://github.com/Dr-Noob/peakperf\n");
|
||||
printf("\n");
|
||||
printf(" Both --accurate-pp and --measure-max-freq measure the actual frequency of the CPU. However,\n");
|
||||
printf(" they differ slightly. The former measures the max frequency while running vectorized SSE/AVX\n");
|
||||
printf(" instructions and it is thus x86 only, whereas the latter simply measures the max clock cycle\n");
|
||||
printf(" and is architecture independent.\n");
|
||||
}
|
||||
|
||||
int main(int argc, char* argv[]) {
|
||||
|
||||
178
src/common/pci.c
Normal file
178
src/common/pci.c
Normal file
@@ -0,0 +1,178 @@
|
||||
#define _GNU_SOURCE
|
||||
|
||||
#include <sys/stat.h>
|
||||
#include <dirent.h>
|
||||
|
||||
#include "udev.h"
|
||||
#include "global.h"
|
||||
#include "pci.h"
|
||||
|
||||
#ifndef PATH_MAX
|
||||
#define PATH_MAX 1024
|
||||
#endif
|
||||
|
||||
#define PCI_PATH "/sys/bus/pci/devices/"
|
||||
#define MAX_LENGTH_PCI_DIR_NAME 1024
|
||||
|
||||
/*
|
||||
* doc: https://wiki.osdev.org/PCI#Class_Codes
|
||||
* https://pci-ids.ucw.cz/read/PC
|
||||
*/
|
||||
#define PCI_VENDOR_ID_AMD 0x1002
|
||||
#define CLASS_VGA_CONTROLLER 0x0300
|
||||
#define CLASS_3D_CONTROLLER 0x0302
|
||||
|
||||
// Return a list of PCI devices containing only
|
||||
// the sysfs path
|
||||
struct pci_devices * get_pci_paths(void) {
|
||||
DIR *dirp;
|
||||
|
||||
if ((dirp = opendir(PCI_PATH)) == NULL) {
|
||||
perror("opendir");
|
||||
return NULL;
|
||||
}
|
||||
|
||||
struct dirent *dp;
|
||||
int numDirs = 0;
|
||||
errno = 0;
|
||||
|
||||
while ((dp = readdir(dirp)) != NULL) {
|
||||
if (strcmp(dp->d_name, ".") != 0 && strcmp(dp->d_name, "..") != 0)
|
||||
numDirs++;
|
||||
}
|
||||
if (errno != 0) {
|
||||
perror("readdir");
|
||||
return NULL;
|
||||
}
|
||||
|
||||
rewinddir(dirp);
|
||||
|
||||
struct pci_devices * pci = emalloc(sizeof(struct pci_devices));
|
||||
pci->num_devices = numDirs;
|
||||
pci->devices = emalloc(sizeof(struct pci_device) * pci->num_devices);
|
||||
char * full_path = emalloc(PATH_MAX * sizeof(char));
|
||||
struct stat stbuf;
|
||||
int i = 0;
|
||||
|
||||
while ((dp = readdir(dirp)) != NULL) {
|
||||
if (strcmp(dp->d_name, ".") == 0 || strcmp(dp->d_name, "..") == 0)
|
||||
continue;
|
||||
|
||||
if (strlen(dp->d_name) > MAX_LENGTH_PCI_DIR_NAME) {
|
||||
printErr("Directory name is too long: %s", dp->d_name);
|
||||
return NULL;
|
||||
}
|
||||
|
||||
memset(full_path, 0, PATH_MAX * sizeof(char));
|
||||
snprintf(full_path, min(strlen(PCI_PATH) + strlen(dp->d_name) + 1, PATH_MAX), "%s%s", PCI_PATH, dp->d_name);
|
||||
|
||||
if (stat(full_path, &stbuf) == -1) {
|
||||
perror("stat");
|
||||
return NULL;
|
||||
}
|
||||
|
||||
if ((stbuf.st_mode & S_IFMT) == S_IFDIR) {
|
||||
int strLen = min(MAX_LENGTH_PCI_DIR_NAME, strlen(dp->d_name)) + 1;
|
||||
pci->devices[i] = emalloc(sizeof(struct pci_device));
|
||||
pci->devices[i]->path = ecalloc(sizeof(char), strLen);
|
||||
strncpy(pci->devices[i]->path, dp->d_name, strLen);
|
||||
i++;
|
||||
}
|
||||
}
|
||||
if (errno != 0) {
|
||||
perror("readdir");
|
||||
return NULL;
|
||||
}
|
||||
|
||||
return pci;
|
||||
}
|
||||
|
||||
// For each PCI device in the list pci, fetch its vendor and
|
||||
// device id using sysfs (e.g., /sys/bus/pci/devices/XXX/{vendor/device})
|
||||
void populate_pci_devices(struct pci_devices * pci) {
|
||||
int filelen;
|
||||
char* buf;
|
||||
|
||||
for (int i=0; i < pci->num_devices; i++) {
|
||||
struct pci_device* dev = pci->devices[i];
|
||||
int path_size = strlen(PCI_PATH) + strlen(dev->path) + 2;
|
||||
|
||||
// Read vendor_id
|
||||
char *vendor_id_path = emalloc(sizeof(char) * (path_size + strlen("vendor")));
|
||||
sprintf(vendor_id_path, "%s/%s/%s", PCI_PATH, dev->path, "vendor");
|
||||
|
||||
if ((buf = read_file(vendor_id_path, &filelen)) == NULL) {
|
||||
printWarn("read_file: %s: %s\n", vendor_id_path, strerror(errno));
|
||||
dev->vendor_id = 0;
|
||||
}
|
||||
else {
|
||||
dev->vendor_id = strtol(buf, NULL, 16);
|
||||
}
|
||||
|
||||
// Read device_id
|
||||
char *device_id_path = emalloc(sizeof(char) * (path_size + strlen("device")));
|
||||
sprintf(device_id_path, "%s/%s/%s", PCI_PATH, dev->path, "device");
|
||||
|
||||
if ((buf = read_file(device_id_path, &filelen)) == NULL) {
|
||||
printWarn("read_file: %s: %s\n", device_id_path, strerror(errno));
|
||||
dev->device_id = 0;
|
||||
}
|
||||
else {
|
||||
dev->device_id = strtol(buf, NULL, 16);
|
||||
}
|
||||
|
||||
free(vendor_id_path);
|
||||
free(device_id_path);
|
||||
}
|
||||
}
|
||||
|
||||
// Right now, we are interested in PCI devices which
|
||||
// vendor is NVIDIA (to be extended in the future).
|
||||
// Should we also restrict to VGA controllers only?
|
||||
bool pci_device_is_useful(struct pci_device* dev) {
|
||||
return dev->vendor_id == PCI_VENDOR_NVIDIA;
|
||||
}
|
||||
|
||||
// Filter the input list in order to get only those PCI devices which
|
||||
// we are interested in (decided by pci_device_is_useful)
|
||||
// and return the filtered result.
|
||||
struct pci_devices * filter_pci_devices(struct pci_devices * pci) {
|
||||
int * devices_to_get = emalloc(sizeof(int) * pci->num_devices);
|
||||
int dev_ptr = 0;
|
||||
|
||||
for (int i=0; i < pci->num_devices; i++) {
|
||||
if (pci_device_is_useful(pci->devices[i])) {
|
||||
devices_to_get[dev_ptr] = i;
|
||||
dev_ptr++;
|
||||
}
|
||||
}
|
||||
|
||||
struct pci_devices * pci_filtered = emalloc(sizeof(struct pci_devices));
|
||||
pci_filtered->num_devices = dev_ptr;
|
||||
|
||||
if (pci_filtered->num_devices == 0) {
|
||||
pci_filtered->devices = NULL;
|
||||
}
|
||||
else {
|
||||
pci_filtered->devices = emalloc(sizeof(struct pci_device) * pci_filtered->num_devices);
|
||||
|
||||
for (int i=0; i < pci_filtered->num_devices; i++)
|
||||
pci_filtered->devices[i] = pci->devices[devices_to_get[i]];
|
||||
}
|
||||
|
||||
return pci_filtered;
|
||||
}
|
||||
|
||||
// Build the list of PCI devices that can help to infer the SoC:
// enumerate the devices, read their vendor/device ids and keep only
// those accepted by filter_pci_devices.
// Returns NULL if the devices could not be enumerated.
// NOTE(review): the unfiltered list returned by get_pci_paths is not
// released here - confirm who is expected to own it.
struct pci_devices * get_pci_devices(void) {
  struct pci_devices * all_devices = get_pci_paths();

  if (all_devices != NULL) {
    populate_pci_devices(all_devices);
    return filter_pci_devices(all_devices);
  }

  return NULL;
}
|
||||
20
src/common/pci.h
Normal file
20
src/common/pci.h
Normal file
@@ -0,0 +1,20 @@
|
||||
#ifndef __PCI__
#define __PCI__

// Needed for uint16_t, so that this header can be included on its own
#include <stdint.h>

// PCI vendor / device ids that the PCI code compares against
#define PCI_VENDOR_NVIDIA 0x10de
#define PCI_DEVICE_TEGRA_X1 0x0faf

// A single PCI device
struct pci_device {
  char * path;         // Name of the device directory inside the sysfs PCI devices path
  uint16_t vendor_id;  // Parsed (hex) from the sysfs 'vendor' file, 0 if it could not be read
  uint16_t device_id;  // Parsed (hex) from the sysfs 'device' file, 0 if it could not be read
};

// A list of PCI devices
struct pci_devices {
  struct pci_device ** devices;  // Array of num_devices pointers (NULL when the list is empty)
  int num_devices;
};

// Return the list of PCI devices that could be used to infer the SoC,
// or NULL if the devices could not be enumerated.
struct pci_devices * get_pci_devices(void);

#endif
|
||||
@@ -61,6 +61,7 @@ enum {
|
||||
ATTRIBUTE_NCORES,
|
||||
ATTRIBUTE_NCORES_DUAL,
|
||||
#ifdef ARCH_X86
|
||||
ATTRIBUTE_SSE,
|
||||
ATTRIBUTE_AVX,
|
||||
ATTRIBUTE_FMA,
|
||||
#elif ARCH_PPC
|
||||
@@ -96,6 +97,7 @@ static const char* ATTRIBUTE_FIELDS [] = {
|
||||
"Cores:",
|
||||
"Cores (Total):",
|
||||
#ifdef ARCH_X86
|
||||
"SSE:",
|
||||
"AVX:",
|
||||
"FMA:",
|
||||
#elif ARCH_PPC
|
||||
@@ -131,6 +133,7 @@ static const char* ATTRIBUTE_FIELDS_SHORT [] = {
|
||||
"Cores:",
|
||||
"Cores (Total):",
|
||||
#ifdef ARCH_X86
|
||||
"SSE:",
|
||||
"AVX:",
|
||||
"FMA:",
|
||||
#elif ARCH_PPC
|
||||
@@ -336,6 +339,13 @@ struct ascii_logo* choose_ascii_art_aux(struct ascii_logo* logo_long, struct asc
|
||||
}
|
||||
}
|
||||
|
||||
// Honor the NO_COLOR convention (https://no-color.org/): colors are
// disabled when the NO_COLOR environment variable is set to a
// non-empty value, and enabled otherwise.
bool is_color_enabled(void) {
  const char *no_color = getenv("NO_COLOR");

  if (no_color != NULL && no_color[0] != '\0')
    return false;

  return true;
}
|
||||
|
||||
void choose_ascii_art(struct ascii* art, struct color** cs, struct terminal* term, int lf) {
|
||||
// 1. Choose logo
|
||||
#ifdef ARCH_X86
|
||||
@@ -350,6 +360,9 @@ void choose_ascii_art(struct ascii* art, struct color** cs, struct terminal* ter
|
||||
else if(art->vendor == CPU_VENDOR_AMD) {
|
||||
art->art = choose_ascii_art_aux(&logo_amd_l, &logo_amd, term, lf);
|
||||
}
|
||||
else if(art->vendor == CPU_VENDOR_HYGON) {
|
||||
art->art = &logo_hygon;
|
||||
}
|
||||
else {
|
||||
art->art = &logo_unknown;
|
||||
}
|
||||
@@ -364,6 +377,8 @@ void choose_ascii_art(struct ascii* art, struct color** cs, struct terminal* ter
|
||||
art->art = &logo_exynos;
|
||||
else if(art->vendor == SOC_VENDOR_KIRIN)
|
||||
art->art = &logo_kirin;
|
||||
else if(art->vendor == SOC_VENDOR_KUNPENG)
|
||||
art->art = &logo_kunpeng;
|
||||
else if(art->vendor == SOC_VENDOR_BROADCOM)
|
||||
art->art = &logo_broadcom;
|
||||
else if(art->vendor == SOC_VENDOR_APPLE)
|
||||
@@ -374,6 +389,8 @@ void choose_ascii_art(struct ascii* art, struct color** cs, struct terminal* ter
|
||||
art->art = &logo_allwinner;
|
||||
else if(art->vendor == SOC_VENDOR_ROCKCHIP)
|
||||
art->art = &logo_rockchip;
|
||||
else if(art->vendor == SOC_VENDOR_NVIDIA)
|
||||
art->art = choose_ascii_art_aux(&logo_nvidia_l, &logo_nvidia, term, lf);
|
||||
else {
|
||||
art->art = choose_ascii_art_aux(&logo_arm_l, &logo_arm, term, lf);
|
||||
}
|
||||
@@ -392,6 +409,9 @@ void choose_ascii_art(struct ascii* art, struct color** cs, struct terminal* ter
|
||||
|
||||
// 2. Choose colors
|
||||
struct ascii_logo* logo = art->art;
|
||||
bool color = is_color_enabled();
|
||||
if (!color)
|
||||
art->style = STYLE_LEGACY;
|
||||
|
||||
switch(art->style) {
|
||||
case STYLE_LEGACY:
|
||||
@@ -577,6 +597,7 @@ bool print_cpufetch_x86(struct cpuInfo* cpu, STYLE s, struct color** cs, struct
|
||||
for(int i = 0; i < cpu->num_cpus; ptr = ptr->next_cpu, i++) {
|
||||
char* max_frequency = get_str_freq(ptr->freq);
|
||||
char* avx = get_str_avx(ptr);
|
||||
char* sse = get_str_sse(ptr);
|
||||
char* fma = get_str_fma(ptr);
|
||||
char* cpu_num = emalloc(sizeof(char) * 9);
|
||||
|
||||
@@ -611,8 +632,17 @@ bool print_cpufetch_x86(struct cpuInfo* cpu, STYLE s, struct color** cs, struct
|
||||
setAttribute(art, ATTRIBUTE_NCORES, n_cores);
|
||||
}
|
||||
}
|
||||
|
||||
// Show the most modern vector instructions.
|
||||
// If AVX is supported show it, otherwise show SSE
|
||||
if (strcmp(avx, "No") == 0) {
|
||||
setAttribute(art, ATTRIBUTE_SSE, sse);
|
||||
}
|
||||
else {
|
||||
setAttribute(art, ATTRIBUTE_AVX, avx);
|
||||
setAttribute(art, ATTRIBUTE_FMA, fma);
|
||||
}
|
||||
|
||||
if(l1i != NULL) setAttribute(art, ATTRIBUTE_L1i, l1i);
|
||||
if(l1d != NULL) setAttribute(art, ATTRIBUTE_L1d, l1d);
|
||||
if(l2 != NULL) setAttribute(art, ATTRIBUTE_L2, l2);
|
||||
|
||||
@@ -15,10 +15,12 @@ static char* soc_trademark_string[] = {
|
||||
[SOC_VENDOR_MEDIATEK] = "MediaTek ",
|
||||
[SOC_VENDOR_EXYNOS] = "Exynos ",
|
||||
[SOC_VENDOR_KIRIN] = "Kirin ",
|
||||
[SOC_VENDOR_KUNPENG] = "Kunpeng ",
|
||||
[SOC_VENDOR_BROADCOM] = "Broadcom BCM",
|
||||
[SOC_VENDOR_APPLE] = "Apple ",
|
||||
[SOC_VENDOR_ROCKCHIP] = "Rockchip ",
|
||||
[SOC_VENDOR_GOOGLE] = "Google ",
|
||||
[SOC_VENDOR_NVIDIA] = "NVIDIA ",
|
||||
// RISC-V
|
||||
[SOC_VENDOR_SIFIVE] = "SiFive ",
|
||||
[SOC_VENDOR_STARFIVE] = "StarFive ",
|
||||
|
||||
@@ -19,10 +19,12 @@ enum {
|
||||
SOC_VENDOR_MEDIATEK,
|
||||
SOC_VENDOR_EXYNOS,
|
||||
SOC_VENDOR_KIRIN,
|
||||
SOC_VENDOR_KUNPENG,
|
||||
SOC_VENDOR_BROADCOM,
|
||||
SOC_VENDOR_APPLE,
|
||||
SOC_VENDOR_ROCKCHIP,
|
||||
SOC_VENDOR_GOOGLE,
|
||||
SOC_VENDOR_NVIDIA,
|
||||
// RISC-V
|
||||
SOC_VENDOR_SIFIVE,
|
||||
SOC_VENDOR_STARFIVE,
|
||||
@@ -39,7 +41,7 @@ struct system_on_chip {
|
||||
char* raw_name;
|
||||
};
|
||||
|
||||
struct system_on_chip* get_soc(void);
|
||||
struct system_on_chip* get_soc(struct cpuInfo* cpu);
|
||||
char* get_soc_name(struct system_on_chip* soc);
|
||||
VENDOR get_soc_vendor(struct system_on_chip* soc);
|
||||
bool match_soc(struct system_on_chip* soc, char* raw_name, char* expected_name, char* soc_name, SOC soc_model, int32_t process);
|
||||
|
||||
@@ -4,8 +4,8 @@
|
||||
#include <string.h>
|
||||
#include <errno.h>
|
||||
|
||||
#include "../common/global.h"
|
||||
#include "../common/cpu.h"
|
||||
#include "global.h"
|
||||
#include "cpu.h"
|
||||
|
||||
uint32_t get_sys_info_by_name(char* name) {
|
||||
size_t size = 0;
|
||||
@@ -14,6 +14,7 @@
|
||||
static char *hv_vendors_name[] = {
|
||||
[HV_VENDOR_KVM] = "KVM",
|
||||
[HV_VENDOR_QEMU] = "QEMU",
|
||||
[HV_VENDOR_VBOX] = "VirtualBox",
|
||||
[HV_VENDOR_HYPERV] = "Microsoft Hyper-V",
|
||||
[HV_VENDOR_VMWARE] = "VMware",
|
||||
[HV_VENDOR_XEN] = "Xen",
|
||||
@@ -145,6 +146,7 @@ struct uarch* get_cpu_uarch(struct cpuInfo* cpu) {
|
||||
struct frequency* get_frequency_info(void) {
|
||||
struct frequency* freq = emalloc(sizeof(struct frequency));
|
||||
|
||||
freq->measured = false;
|
||||
freq->max = get_max_freq_from_file(0);
|
||||
freq->base = get_min_freq_from_file(0);
|
||||
|
||||
|
||||
@@ -280,9 +280,6 @@ char* get_str_process(struct cpuInfo* cpu) {
|
||||
if(process == UNK) {
|
||||
snprintf(str, strlen(STRING_UNKNOWN)+1, STRING_UNKNOWN);
|
||||
}
|
||||
else if(process > 100) {
|
||||
sprintf(str, "%.2fum", (double)process/100);
|
||||
}
|
||||
else if(process > 0){
|
||||
sprintf(str, "%dnm", process);
|
||||
}
|
||||
|
||||
@@ -19,6 +19,7 @@
|
||||
struct frequency* get_frequency_info(uint32_t core) {
|
||||
struct frequency* freq = emalloc(sizeof(struct frequency));
|
||||
|
||||
freq->measured = false;
|
||||
freq->base = UNKNOWN_DATA;
|
||||
freq->max = get_max_freq_from_file(core);
|
||||
|
||||
@@ -163,7 +164,7 @@ struct cpuInfo* get_cpu_info(void) {
|
||||
cpu->ext = get_extensions_from_str(ext_str);
|
||||
if(cpu->ext->str != NULL && cpu->ext->mask == 0) return NULL;
|
||||
cpu->arch = get_uarch_from_cpuinfo_str(cpuinfo_str, cpu);
|
||||
cpu->soc = get_soc();
|
||||
cpu->soc = get_soc(cpu);
|
||||
cpu->freq = get_frequency_info(0);
|
||||
cpu->peak_performance = get_peak_performance(cpu);
|
||||
|
||||
|
||||
@@ -65,7 +65,7 @@ struct system_on_chip* guess_soc_from_devtree(struct system_on_chip* soc) {
|
||||
return soc;
|
||||
}
|
||||
|
||||
struct system_on_chip* get_soc(void) {
|
||||
struct system_on_chip* get_soc(struct cpuInfo* cpu) {
|
||||
struct system_on_chip* soc = emalloc(sizeof(struct system_on_chip));
|
||||
soc->raw_name = NULL;
|
||||
soc->soc_vendor = SOC_VENDOR_UNKNOWN;
|
||||
|
||||
@@ -5,6 +5,6 @@
|
||||
#include "../common/cpu.h"
|
||||
#include <stdint.h>
|
||||
|
||||
struct system_on_chip* get_soc(void);
|
||||
struct system_on_chip* get_soc(struct cpuInfo* cpu);
|
||||
|
||||
#endif
|
||||
|
||||
@@ -72,34 +72,6 @@ uint32_t get_apic_id(bool x2apic_id) {
|
||||
}
|
||||
}
|
||||
|
||||
#ifndef __APPLE__
// Pin the execution to the CPU whose index is cpu_id, using the affinity
// API of the running platform (Windows, Linux or FreeBSD).
// Returns true on success and false (after printing a warning on
// Linux/FreeBSD) if the affinity could not be changed.
bool bind_to_cpu(int cpu_id) {
  #ifdef _WIN32
    HANDLE process = GetCurrentProcess();
    // Widen before shifting: shifting a plain int overflows for cpu_id >= 31
    DWORD_PTR processAffinityMask = (DWORD_PTR) 1 << cpu_id;
    return SetProcessAffinityMask(process, processAffinityMask) != 0;
  #elif defined __linux__
    cpu_set_t currentCPU;
    CPU_ZERO(&currentCPU);
    CPU_SET(cpu_id, &currentCPU);
    if (sched_setaffinity (0, sizeof(currentCPU), &currentCPU) == -1) {
      printWarn("sched_setaffinity: %s", strerror(errno));
      return false;
    }
    return true;
  #elif defined __FreeBSD__
    cpuset_t currentCPU;
    CPU_ZERO(&currentCPU);
    CPU_SET(cpu_id, &currentCPU);
    if(cpuset_setaffinity(CPU_LEVEL_WHICH, CPU_WHICH_TID, -1, sizeof(cpuset_t), &currentCPU) == -1) {
      printWarn("cpuset_setaffinity: %s", strerror(errno));
      return false;
    }
    return true;
  #else
    // No affinity API known for this platform: report failure instead of
    // falling off the end of a non-void function.
    (void) cpu_id;
    return false;
  #endif
}
#endif
|
||||
|
||||
#ifdef __linux__
|
||||
int get_total_cores_module(int total_cores, int module) {
|
||||
int total_modules = 2;
|
||||
@@ -397,6 +369,11 @@ bool fill_apic_ids(uint32_t* apic_ids, int first_core, int n, bool x2apic_id) {
|
||||
}
|
||||
|
||||
bool get_topology_from_apic(struct cpuInfo* cpu, struct topology* topo) {
|
||||
if (topo->cach == NULL) {
|
||||
printWarn("get_topology_from_apic: cach is NULL");
|
||||
return false;
|
||||
}
|
||||
|
||||
uint32_t apic_id;
|
||||
uint32_t* apic_ids = emalloc(sizeof(uint32_t) * topo->total_cores_module);
|
||||
uint32_t* apic_pkg = emalloc(sizeof(uint32_t) * topo->total_cores_module);
|
||||
|
||||
@@ -17,10 +17,6 @@ struct apic {
|
||||
bool get_topology_from_apic(struct cpuInfo* cpu, struct topology* topo);
|
||||
uint32_t is_smt_enabled_amd(struct topology* topo);
|
||||
|
||||
#ifndef __APPLE__
|
||||
bool bind_to_cpu(int cpu_id);
|
||||
#endif
|
||||
|
||||
#ifdef __linux__
|
||||
int get_total_cores_module(int total_cores, int module);
|
||||
#endif
|
||||
|
||||
107
src/x86/cpuid.c
107
src/x86/cpuid.c
@@ -6,6 +6,10 @@
|
||||
#include <unistd.h>
|
||||
#endif
|
||||
|
||||
#ifdef __linux__
|
||||
#include "../common/freq.h"
|
||||
#endif
|
||||
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
#include <string.h>
|
||||
@@ -22,10 +26,12 @@
|
||||
|
||||
#define CPU_VENDOR_INTEL_STRING "GenuineIntel"
|
||||
#define CPU_VENDOR_AMD_STRING "AuthenticAMD"
|
||||
#define CPU_VENDOR_HYGON_STRING "HygonGenuine"
|
||||
|
||||
static const char *hv_vendors_string[] = {
|
||||
[HV_VENDOR_KVM] = "KVMKVMKVM",
|
||||
[HV_VENDOR_QEMU] = "TCGTCGTCGTCG",
|
||||
[HV_VENDOR_VBOX] = "VBoxVBoxVBox",
|
||||
[HV_VENDOR_HYPERV] = "Microsoft Hv",
|
||||
[HV_VENDOR_VMWARE] = "VMwareVMware",
|
||||
[HV_VENDOR_XEN] = "XenVMMXenVMM",
|
||||
@@ -38,6 +44,7 @@ static const char *hv_vendors_string[] = {
|
||||
static char *hv_vendors_name[] = {
|
||||
[HV_VENDOR_KVM] = "KVM",
|
||||
[HV_VENDOR_QEMU] = "QEMU",
|
||||
[HV_VENDOR_VBOX] = "VirtualBox",
|
||||
[HV_VENDOR_HYPERV] = "Microsoft Hyper-V",
|
||||
[HV_VENDOR_VMWARE] = "VMware",
|
||||
[HV_VENDOR_XEN] = "Xen",
|
||||
@@ -216,7 +223,7 @@ int64_t get_peak_performance(struct cpuInfo* cpu, bool accurate_pp) {
|
||||
#endif
|
||||
|
||||
//First, check we have consistent data
|
||||
if(freq == UNKNOWN_DATA || topo->logical_cores == UNKNOWN_DATA) {
|
||||
if(freq == UNKNOWN_DATA || topo == NULL || topo->logical_cores == UNKNOWN_DATA) {
|
||||
return -1;
|
||||
}
|
||||
|
||||
@@ -449,7 +456,7 @@ struct cpuInfo* get_cpu_info(void) {
|
||||
cpu->cach = NULL;
|
||||
cpu->feat = NULL;
|
||||
|
||||
uint32_t modules = 1;
|
||||
cpu->num_cpus = 1;
|
||||
uint32_t eax = 0;
|
||||
uint32_t ebx = 0;
|
||||
uint32_t ecx = 0;
|
||||
@@ -468,6 +475,8 @@ struct cpuInfo* get_cpu_info(void) {
|
||||
cpu->cpu_vendor = CPU_VENDOR_INTEL;
|
||||
else if (strcmp(CPU_VENDOR_AMD_STRING,name) == 0)
|
||||
cpu->cpu_vendor = CPU_VENDOR_AMD;
|
||||
else if (strcmp(CPU_VENDOR_HYGON_STRING,name) == 0)
|
||||
cpu->cpu_vendor = CPU_VENDOR_HYGON;
|
||||
else {
|
||||
cpu->cpu_vendor = CPU_VENDOR_INVALID;
|
||||
printErr("Unknown CPU vendor: %s", name);
|
||||
@@ -486,9 +495,8 @@ struct cpuInfo* get_cpu_info(void) {
|
||||
cpu->cpu_name = get_str_cpu_name_internal();
|
||||
}
|
||||
else {
|
||||
cpu->cpu_name = emalloc(sizeof(char) * (strlen(STRING_UNKNOWN) + 1));
|
||||
strcpy(cpu->cpu_name, STRING_UNKNOWN);
|
||||
printWarn("Can't read cpu name from cpuid (needed extended level is 0x%.8X, max is 0x%.8X)", 0x80000004, cpu->maxExtendedLevels);
|
||||
cpu->cpu_name = NULL;
|
||||
printWarn("Can't read CPU name from cpuid (needed extended level is 0x%.8X, max is 0x%.8X)", 0x80000004, cpu->maxExtendedLevels);
|
||||
}
|
||||
|
||||
cpu->topology_extensions = false;
|
||||
@@ -506,12 +514,12 @@ struct cpuInfo* get_cpu_info(void) {
|
||||
cpu->hybrid_flag = (edx >> 15) & 0x1;
|
||||
}
|
||||
|
||||
if(cpu->hybrid_flag) modules = 2;
|
||||
if(cpu->hybrid_flag) cpu->num_cpus = 2;
|
||||
|
||||
struct cpuInfo* ptr = cpu;
|
||||
for(uint32_t i=0; i < modules; i++) {
|
||||
for(uint32_t i=0; i < cpu->num_cpus; i++) {
|
||||
int32_t first_core;
|
||||
set_cpu_module(i, modules, &first_core);
|
||||
set_cpu_module(i, cpu->num_cpus, &first_core);
|
||||
|
||||
if(i > 0) {
|
||||
ptr->next_cpu = emalloc(sizeof(struct cpuInfo));
|
||||
@@ -538,14 +546,15 @@ struct cpuInfo* get_cpu_info(void) {
|
||||
ptr->first_core_id = first_core;
|
||||
ptr->feat = get_features_info(ptr);
|
||||
|
||||
// If any field of the struct is NULL,
|
||||
// return immediately, as further functions
|
||||
// require valid fields (cach, topo, etc)
|
||||
ptr->arch = get_cpu_uarch(ptr);
|
||||
ptr->freq = get_frequency_info(ptr);
|
||||
|
||||
if (cpu->cpu_name == NULL && ptr == cpu) {
|
||||
// If we couldn't read the CPU name from cpuid, infer it now
|
||||
cpu->cpu_name = infer_cpu_name_from_uarch(cpu->arch);
|
||||
}
|
||||
|
||||
ptr->cach = get_cache_info(ptr);
|
||||
if(ptr->cach == NULL) return cpu;
|
||||
|
||||
if(cpu->hybrid_flag) {
|
||||
ptr->topo = get_topology_info(ptr, ptr->cach, i);
|
||||
@@ -553,16 +562,23 @@ struct cpuInfo* get_cpu_info(void) {
|
||||
else {
|
||||
ptr->topo = get_topology_info(ptr, ptr->cach, -1);
|
||||
}
|
||||
if(cpu->topo == NULL) return cpu;
|
||||
|
||||
// If topo is NULL, return early, as get_peak_performance
|
||||
// requires non-NULL topology.
|
||||
if(ptr->topo == NULL) return cpu;
|
||||
}
|
||||
|
||||
cpu->num_cpus = modules;
|
||||
cpu->peak_performance = get_peak_performance(cpu, accurate_pp());
|
||||
|
||||
return cpu;
|
||||
}
|
||||
|
||||
bool get_cache_topology_amd(struct cpuInfo* cpu, struct topology* topo) {
|
||||
if (topo->cach == NULL) {
|
||||
printWarn("get_cache_topology_amd: cach is NULL");
|
||||
return false;
|
||||
}
|
||||
|
||||
if(cpu->maxExtendedLevels >= 0x8000001D && cpu->topology_extensions) {
|
||||
uint32_t i, eax, ebx, ecx, edx, num_sharing_cache, cache_type, cache_level;
|
||||
|
||||
@@ -638,10 +654,17 @@ bool get_cache_topology_amd(struct cpuInfo* cpu, struct topology* topo) {
|
||||
|
||||
#ifdef __linux__
|
||||
void get_topology_from_udev(struct topology* topo) {
|
||||
// TODO: To be improved in the future
|
||||
topo->total_cores = get_ncores_from_cpuinfo();
|
||||
// TODO: To be improved in the future
|
||||
if (topo->total_cores == 1) {
|
||||
// We can assume it's a single core CPU
|
||||
topo->logical_cores = topo->total_cores;
|
||||
topo->physical_cores = topo->total_cores;
|
||||
}
|
||||
else {
|
||||
topo->logical_cores = UNKNOWN_DATA;
|
||||
topo->physical_cores = UNKNOWN_DATA;
|
||||
}
|
||||
topo->smt_available = 1;
|
||||
topo->smt_supported = 1;
|
||||
topo->sockets = 1;
|
||||
@@ -688,30 +711,29 @@ struct topology* get_topology_info(struct cpuInfo* cpu, struct cache* cach, int
|
||||
|
||||
switch(cpu->cpu_vendor) {
|
||||
case CPU_VENDOR_INTEL:
|
||||
bool toporet = false;
|
||||
if (cpu->maxLevels >= 0x00000004) {
|
||||
bool toporet = get_topology_from_apic(cpu, topo);
|
||||
toporet = get_topology_from_apic(cpu, topo);
|
||||
}
|
||||
else {
|
||||
printWarn("Can't read topology information from cpuid (needed level is 0x%.8X, max is 0x%.8X)", 0x00000004, cpu->maxLevels);
|
||||
}
|
||||
if(!toporet) {
|
||||
#ifdef __linux__
|
||||
printWarn("Failed to retrieve topology from APIC, using udev...\n");
|
||||
printWarn("Failed to retrieve topology from APIC, using udev...");
|
||||
get_topology_from_udev(topo);
|
||||
#else
|
||||
printErr("Failed to retrieve topology from APIC, assumming default values...\n");
|
||||
if (cpu->maxLevels >= 0x00000004)
|
||||
printErr("Failed to retrieve topology from APIC, assumming default values...");
|
||||
topo->logical_cores = UNKNOWN_DATA;
|
||||
topo->physical_cores = UNKNOWN_DATA;
|
||||
topo->smt_available = 1;
|
||||
topo->smt_supported = 1;
|
||||
#endif
|
||||
}
|
||||
}
|
||||
else {
|
||||
printWarn("Can't read topology information from cpuid (needed level is 0x%.8X, max is 0x%.8X)", 0x00000001, cpu->maxLevels);
|
||||
topo->physical_cores = 1;
|
||||
topo->logical_cores = 1;
|
||||
topo->smt_available = 1;
|
||||
topo->smt_supported = 1;
|
||||
}
|
||||
break;
|
||||
case CPU_VENDOR_AMD:
|
||||
case CPU_VENDOR_HYGON:
|
||||
if (cpu->maxExtendedLevels >= 0x80000008) {
|
||||
eax = 0x80000008;
|
||||
cpuid(&eax, &ebx, &ecx, &edx);
|
||||
@@ -908,6 +930,7 @@ struct cache* get_cache_info(struct cpuInfo* cpu) {
|
||||
|
||||
struct frequency* get_frequency_info(struct cpuInfo* cpu) {
|
||||
struct frequency* freq = emalloc(sizeof(struct frequency));
|
||||
freq->measured = false;
|
||||
|
||||
if(cpu->maxLevels < 0x00000016) {
|
||||
#if defined (_WIN32) || defined (__APPLE__)
|
||||
@@ -917,7 +940,7 @@ struct frequency* get_frequency_info(struct cpuInfo* cpu) {
|
||||
#else
|
||||
printWarn("Can't read frequency information from cpuid (needed level is 0x%.8X, max is 0x%.8X). Using udev", 0x00000016, cpu->maxLevels);
|
||||
freq->base = UNKNOWN_DATA;
|
||||
freq->max = get_max_freq_from_file(0);
|
||||
freq->max = get_max_freq_from_file(cpu->first_core_id);
|
||||
|
||||
if(freq->max == 0) {
|
||||
printWarn("Read max CPU frequency from udev and got 0 MHz");
|
||||
@@ -944,7 +967,7 @@ struct frequency* get_frequency_info(struct cpuInfo* cpu) {
|
||||
printWarn("Read max CPU frequency from CPUID and got 0 MHz");
|
||||
#ifdef __linux__
|
||||
printWarn("Using udev to detect frequency");
|
||||
freq->max = get_max_freq_from_file(0);
|
||||
freq->max = get_max_freq_from_file(cpu->first_core_id);
|
||||
|
||||
if(freq->max == 0) {
|
||||
printWarn("Read max CPU frequency from udev and got 0 MHz");
|
||||
@@ -956,6 +979,15 @@ struct frequency* get_frequency_info(struct cpuInfo* cpu) {
|
||||
}
|
||||
}
|
||||
|
||||
#ifdef __linux__
|
||||
if (freq->max == UNKNOWN_DATA || measure_max_frequency_flag()) {
|
||||
if (freq->max == UNKNOWN_DATA)
|
||||
printWarn("All previous methods failed, measuring CPU frequency");
|
||||
freq->max = measure_max_frequency(cpu->first_core_id);
|
||||
freq->measured = true;
|
||||
}
|
||||
#endif
|
||||
|
||||
return freq;
|
||||
}
|
||||
|
||||
@@ -977,24 +1009,33 @@ char* get_str_topology(struct cpuInfo* cpu, struct topology* topo, bool dual_soc
|
||||
string = emalloc(sizeof(char) * (strlen(STRING_UNKNOWN) + 1));
|
||||
strcpy(string, STRING_UNKNOWN);
|
||||
}
|
||||
else if(topo->smt_supported > 1) {
|
||||
else {
|
||||
char cores_str[6];
|
||||
memset(cores_str, 0, sizeof(char) * 6);
|
||||
if (topo->physical_cores * topo_sockets > 1)
|
||||
strcpy(cores_str, "cores");
|
||||
else
|
||||
strcpy(cores_str, "core");
|
||||
|
||||
if(topo->smt_supported > 1) {
|
||||
// 4 for digits, 21 for ' cores (SMT disabled)' which is the longest possible output
|
||||
uint32_t max_size = 4+21+1;
|
||||
string = emalloc(sizeof(char) * max_size);
|
||||
|
||||
if(topo->smt_available > 1)
|
||||
snprintf(string, max_size, "%d cores (%d threads)", topo->physical_cores * topo_sockets, topo->logical_cores * topo_sockets);
|
||||
snprintf(string, max_size, "%d %s (%d threads)", topo->physical_cores * topo_sockets, cores_str, topo->logical_cores * topo_sockets);
|
||||
else {
|
||||
if(cpu->cpu_vendor == CPU_VENDOR_AMD)
|
||||
snprintf(string, max_size, "%d cores (SMT disabled)", topo->physical_cores * topo_sockets);
|
||||
snprintf(string, max_size, "%d %s (SMT disabled)", topo->physical_cores * topo_sockets, cores_str);
|
||||
else
|
||||
snprintf(string, max_size, "%d cores (HT disabled)", topo->physical_cores * topo_sockets);
|
||||
snprintf(string, max_size, "%d %s (HT disabled)", topo->physical_cores * topo_sockets, cores_str);
|
||||
}
|
||||
}
|
||||
else {
|
||||
uint32_t max_size = 4+7+1;
|
||||
string = emalloc(sizeof(char) * max_size);
|
||||
snprintf(string, max_size, "%d cores",topo->physical_cores * topo_sockets);
|
||||
snprintf(string, max_size, "%d %s",topo->physical_cores * topo_sockets, cores_str);
|
||||
}
|
||||
}
|
||||
|
||||
return string;
|
||||
|
||||
132
src/x86/uarch.c
132
src/x86/uarch.c
@@ -48,7 +48,9 @@ enum {
|
||||
UARCH_UNKNOWN,
|
||||
// INTEL //
|
||||
UARCH_P5,
|
||||
UARCH_P6,
|
||||
UARCH_P5_MMX,
|
||||
UARCH_P6_PENTIUM_II,
|
||||
UARCH_P6_PENTIUM_III,
|
||||
UARCH_DOTHAN,
|
||||
UARCH_YONAH,
|
||||
UARCH_MEROM,
|
||||
@@ -125,8 +127,7 @@ struct uarch {
|
||||
#define UARCH_START if (false) {}
|
||||
#define CHECK_UARCH(arch, ef_, f_, em_, m_, s_, str, uarch, process) \
|
||||
else if (ef_ == ef && f_ == f && (em_ == NA || em_ == em) && (m_ == NA || m_ == m) && (s_ == NA || s_ == s)) fill_uarch(arch, str, uarch, process);
|
||||
#define UARCH_END else { printErr("Unknown microarchitecture detected: M=0x%X EM=0x%X F=0x%X EF=0x%X S=0x%X", m, em, f, ef, s); \
|
||||
fprintf(stderr, "Please see https://github.com/Dr-Noob/cpufetch#61-unknown-microarchitecture-error to know how to report this error\n"); \
|
||||
#define UARCH_END else { printBugCheckRelease("Unknown microarchitecture detected: M=0x%X EM=0x%X F=0x%X EF=0x%X S=0x%X", m, em, f, ef, s); \
|
||||
fill_uarch(arch, STRING_UNKNOWN, UARCH_UNKNOWN, UNK); }
|
||||
|
||||
void fill_uarch(struct uarch* arch, char* str, MICROARCH u, uint32_t process) {
|
||||
@@ -145,31 +146,31 @@ struct uarch* get_uarch_from_cpuid_intel(uint32_t ef, uint32_t f, uint32_t em, u
|
||||
// EM: Extended Model //
|
||||
// M: Model //
|
||||
// S: Stepping //
|
||||
// ----------------------------------------------------------------------------- //
|
||||
// ------------------------------------------------------------------------------- //
|
||||
// EF F EM M S //
|
||||
UARCH_START
|
||||
CHECK_UARCH(arch, 0, 5, 0, 0, NA, "P5", UARCH_P5, 800)
|
||||
CHECK_UARCH(arch, 0, 5, 0, 1, NA, "P5", UARCH_P5, 800)
|
||||
CHECK_UARCH(arch, 0, 5, 0, 2, NA, "P5", UARCH_P5, UNK)
|
||||
CHECK_UARCH(arch, 0, 5, 0, 3, NA, "P5", UARCH_P5, 600)
|
||||
CHECK_UARCH(arch, 0, 5, 0, 4, NA, "P5 MMX", UARCH_P5, UNK)
|
||||
CHECK_UARCH(arch, 0, 5, 0, 7, NA, "P5 MMX", UARCH_P5, UNK)
|
||||
CHECK_UARCH(arch, 0, 5, 0, 8, NA, "P5 MMX", UARCH_P5, 250)
|
||||
CHECK_UARCH(arch, 0, 5, 0, 4, NA, "P5 (MMX)", UARCH_P5_MMX, UNK)
|
||||
CHECK_UARCH(arch, 0, 5, 0, 7, NA, "P5 (MMX)", UARCH_P5_MMX, UNK)
|
||||
CHECK_UARCH(arch, 0, 5, 0, 8, NA, "P5 (MMX)", UARCH_P5_MMX, 250)
|
||||
CHECK_UARCH(arch, 0, 5, 0, 9, 0, "Lakemont", UARCH_LAKEMONT, 32)
|
||||
CHECK_UARCH(arch, 0, 5, 0, 9, NA, "P5 MMX", UARCH_P5, UNK)
|
||||
CHECK_UARCH(arch, 0, 5, 0, 9, NA, "P5 (MMX)", UARCH_P5_MMX, UNK)
|
||||
CHECK_UARCH(arch, 0, 5, 0, 10, 0, "Lakemont", UARCH_LAKEMONT, 32)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 0, NA, "P6 Pentium II", UARCH_P6, UNK)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 1, NA, "P6 Pentium II", UARCH_P6, UNK) // process depends on core
|
||||
CHECK_UARCH(arch, 0, 6, 0, 2, NA, "P6 Pentium II", UARCH_P6, UNK)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 3, NA, "P6 Pentium II", UARCH_P6, 350)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 4, NA, "P6 Pentium II", UARCH_P6, UNK)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 5, NA, "P6 Pentium II", UARCH_P6, 250)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 6, NA, "P6 Pentium II", UARCH_P6, UNK)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 7, NA, "P6 Pentium III", UARCH_P6, 250)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 8, NA, "P6 Pentium III", UARCH_P6, 180)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 9, NA, "P6 Pentium M", UARCH_P6, 130)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 10, NA, "P6 Pentium III", UARCH_P6, 180)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 11, NA, "P6 Pentium III", UARCH_P6, 130)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 0, NA, "P6 (Pentium II)", UARCH_P6_PENTIUM_II, UNK)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 1, NA, "P6 (Pentium II)", UARCH_P6_PENTIUM_II, UNK) // process depends on core
|
||||
CHECK_UARCH(arch, 0, 6, 0, 2, NA, "P6 (Pentium II)", UARCH_P6_PENTIUM_II, UNK)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 3, NA, "P6 (Klamath)", UARCH_P6_PENTIUM_II, 350) // http://instlatx64.atw.hu.
|
||||
CHECK_UARCH(arch, 0, 6, 0, 4, NA, "P6 (Pentium II)", UARCH_P6_PENTIUM_II, UNK)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 5, NA, "P6 (Deschutes)", UARCH_P6_PENTIUM_II, 250) // http://instlatx64.atw.hu.
|
||||
CHECK_UARCH(arch, 0, 6, 0, 6, NA, "P6 (Dixon)", UARCH_P6_PENTIUM_II, UNK) // http://instlatx64.atw.hu.
|
||||
CHECK_UARCH(arch, 0, 6, 0, 7, NA, "P6 (Katmai)", UARCH_P6_PENTIUM_III, 250) // Core names from: https://en.wikichip.org/wiki/intel/cpuid. NOTE: Xeon core names are different! https://www.techpowerup.com/cpu-specs/?generation=Intel+Pentium+III+Xeon
|
||||
CHECK_UARCH(arch, 0, 6, 0, 8, NA, "P6 (Coppermine)", UARCH_P6_PENTIUM_III, 180) // Also: https://en.wikipedia.org/wiki/Pentium_III
|
||||
CHECK_UARCH(arch, 0, 6, 0, 9, NA, "P6 (Pentium M)", UARCH_P6_PENTIUM_III, 130)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 10, NA, "P6 (Coppermine T)", UARCH_P6_PENTIUM_III, 180)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 11, NA, "P6 (Tualatin)", UARCH_P6_PENTIUM_III, 130)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 13, NA, "Dothan", UARCH_DOTHAN, UNK) // process depends on core
|
||||
CHECK_UARCH(arch, 0, 6, 0, 14, NA, "Yonah", UARCH_YONAH, 65)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 15, NA, "Merom", UARCH_MEROM, 65)
|
||||
@@ -381,6 +382,7 @@ struct uarch* get_uarch_from_cpuid_amd(uint32_t ef, uint32_t f, uint32_t em, uin
|
||||
CHECK_UARCH(arch, 10, 15, 5, 0, NA, "Zen 3", UARCH_ZEN3, 7) // instlatx64
|
||||
CHECK_UARCH(arch, 10, 15, 6, 1, 2, "Zen 4", UARCH_ZEN4, 5) // instlatx64
|
||||
CHECK_UARCH(arch, 10, 15, 7, 4, 1, "Zen 4", UARCH_ZEN4, 4) // instlatx64
|
||||
CHECK_UARCH(arch, 10, 15, 7, 5, 2, "Zen 4", UARCH_ZEN4, 4) // instlatx64
|
||||
CHECK_UARCH(arch, 10, 15, 7, 8, 0, "Zen 4", UARCH_ZEN4, 4) // instlatx64
|
||||
CHECK_UARCH(arch, 10, 15, 8, NA, NA, "Zen 4", UARCH_ZEN4, 5) // instlatx64 (AMD MI300C)
|
||||
CHECK_UARCH(arch, 10, 15, 9, NA, NA, "Zen 4", UARCH_ZEN4, 5) // instlatx64 (AMD MI300A)
|
||||
@@ -390,13 +392,37 @@ struct uarch* get_uarch_from_cpuid_amd(uint32_t ef, uint32_t f, uint32_t em, uin
|
||||
return arch;
|
||||
}
|
||||
|
||||
struct uarch* get_uarch_from_cpuid(struct cpuInfo* cpu, uint32_t dump, uint32_t ef, uint32_t f, uint32_t em, uint32_t m, int s) {
|
||||
if(cpu->cpu_vendor == CPU_VENDOR_INTEL) {
|
||||
if(dump == 0x000806E9) {
|
||||
// It is not possible to determine uarch only from CPUID dump (can be Kaby Lake or Amber Lake)
|
||||
// See issue https://github.com/Dr-Noob/cpufetch/issues/122
|
||||
struct uarch* get_uarch_from_cpuid_hygon(uint32_t ef, uint32_t f, uint32_t em, uint32_t m, int s) {
|
||||
struct uarch* arch = emalloc(sizeof(struct uarch));
|
||||
|
||||
// EF: Extended Family //
|
||||
// F: Family //
|
||||
// EM: Extended Model //
|
||||
// M: Model //
|
||||
// S: Stepping //
|
||||
// ----------------------------------------------------------------------------- //
|
||||
// EF F EM M S //
|
||||
UARCH_START
|
||||
// https://www.phoronix.com/news/Hygon-Dhyana-AMD-China-CPUs
|
||||
CHECK_UARCH(arch, 9, 15, 0, 1, NA, "Zen", UARCH_ZEN, UNK) // https://github.com/Dr-Noob/cpufetch/issues/244
|
||||
// CHECK_UARCH(arch, 9, 15, 0, 2, NA, "???", ?????????, UNK) // http://instlatx64.atw.hu/
|
||||
UARCH_END
|
||||
|
||||
return arch;
|
||||
}
|
||||
|
||||
struct uarch* get_uarch_from_cpuid(struct cpuInfo* cpu, uint32_t dump, uint32_t ef, uint32_t f, uint32_t em, uint32_t m, int s) {
|
||||
if(cpu->cpu_vendor == CPU_VENDOR_INTEL) {
|
||||
struct uarch* arch = emalloc(sizeof(struct uarch));
|
||||
if(dump == 0x000806E9) {
|
||||
if (cpu->cpu_name == NULL) {
|
||||
printErr("Unable to find uarch without CPU name");
|
||||
fill_uarch(arch, STRING_UNKNOWN, UARCH_UNKNOWN, UNK);
|
||||
return arch;
|
||||
}
|
||||
|
||||
// It is not possible to determine uarch only from CPUID dump (can be Kaby Lake or Amber Lake)
|
||||
// See issue https://github.com/Dr-Noob/cpufetch/issues/122
|
||||
if(strstr(cpu->cpu_name, "Y") != NULL) {
|
||||
fill_uarch(arch, "Amber Lake", UARCH_AMBER_LAKE, 14);
|
||||
}
|
||||
@@ -407,10 +433,14 @@ struct uarch* get_uarch_from_cpuid(struct cpuInfo* cpu, uint32_t dump, uint32_t
|
||||
return arch;
|
||||
}
|
||||
else if (dump == 0x000806EA) {
|
||||
if (cpu->cpu_name == NULL) {
|
||||
printErr("Unable to find uarch without CPU name");
|
||||
fill_uarch(arch, STRING_UNKNOWN, UARCH_UNKNOWN, UNK);
|
||||
return arch;
|
||||
}
|
||||
|
||||
// It is not possible to determine uarch only from CPUID dump (can be Kaby Lake R or Coffee Lake U)
|
||||
// See issue https://github.com/Dr-Noob/cpufetch/issues/149
|
||||
struct uarch* arch = emalloc(sizeof(struct uarch));
|
||||
|
||||
if(strstr(cpu->cpu_name, "i5-8250U") != NULL ||
|
||||
strstr(cpu->cpu_name, "i5-8350U") != NULL ||
|
||||
strstr(cpu->cpu_name, "i7-8550U") != NULL ||
|
||||
@@ -425,8 +455,51 @@ struct uarch* get_uarch_from_cpuid(struct cpuInfo* cpu, uint32_t dump, uint32_t
|
||||
}
|
||||
return get_uarch_from_cpuid_intel(ef, f, em, m, s);
|
||||
}
|
||||
else
|
||||
else if(cpu->cpu_vendor == CPU_VENDOR_AMD) {
|
||||
return get_uarch_from_cpuid_amd(ef, f, em, m, s);
|
||||
}
|
||||
else if(cpu->cpu_vendor == CPU_VENDOR_HYGON) {
|
||||
return get_uarch_from_cpuid_hygon(ef, f, em, m, s);
|
||||
}
|
||||
else {
|
||||
printBug("Invalid CPU vendor: %d", cpu->cpu_vendor);
|
||||
return NULL;
|
||||
}
|
||||
}
|
||||
|
||||
// If we cannot get the CPU name from CPUID, try to infer it from uarch
|
||||
char* infer_cpu_name_from_uarch(struct uarch* arch) {
|
||||
char* cpu_name = NULL;
|
||||
if (arch == NULL) {
|
||||
printErr("infer_cpu_name_from_uarch: Unable to find CPU name");
|
||||
cpu_name = ecalloc(strlen(STRING_UNKNOWN) + 1, sizeof(char));
|
||||
strcpy(cpu_name, STRING_UNKNOWN);
|
||||
return cpu_name;
|
||||
}
|
||||
|
||||
char *str = NULL;
|
||||
|
||||
if (arch->uarch == UARCH_P5)
|
||||
str = "Intel Pentium";
|
||||
else if (arch->uarch == UARCH_P5_MMX)
|
||||
str = "Intel Pentium MMX";
|
||||
else if (arch->uarch == UARCH_P6_PENTIUM_II)
|
||||
str = "Intel Pentium II";
|
||||
else if (arch->uarch == UARCH_P6_PENTIUM_III)
|
||||
str = "Intel Pentium III";
|
||||
else
|
||||
printErr("Unable to find name from uarch: %d", arch->uarch);
|
||||
|
||||
if (str == NULL) {
|
||||
cpu_name = ecalloc(strlen(STRING_UNKNOWN) + 1, sizeof(char));
|
||||
strcpy(cpu_name, STRING_UNKNOWN);
|
||||
}
|
||||
else {
|
||||
cpu_name = ecalloc(strlen(str) + 1, sizeof(char));
|
||||
strcpy(cpu_name, str);
|
||||
}
|
||||
|
||||
return cpu_name;
|
||||
}
|
||||
|
||||
bool vpus_are_AVX512(struct cpuInfo* cpu) {
|
||||
@@ -499,9 +572,6 @@ char* get_str_process(struct cpuInfo* cpu) {
|
||||
if(process == UNK) {
|
||||
snprintf(str, strlen(STRING_UNKNOWN)+1, STRING_UNKNOWN);
|
||||
}
|
||||
else if(process > 100) {
|
||||
sprintf(str, "%.2fum", (double)process/100);
|
||||
}
|
||||
else if(process > 0){
|
||||
sprintf(str, "%dnm", process);
|
||||
}
|
||||
|
||||
@@ -8,6 +8,7 @@
|
||||
struct uarch;
|
||||
|
||||
struct uarch* get_uarch_from_cpuid(struct cpuInfo* cpu, uint32_t dump, uint32_t ef, uint32_t f, uint32_t em, uint32_t m, int s);
|
||||
char* infer_cpu_name_from_uarch(struct uarch* arch);
|
||||
bool vpus_are_AVX512(struct cpuInfo* cpu);
|
||||
bool is_knights_landing(struct cpuInfo* cpu);
|
||||
int get_number_of_vpus(struct cpuInfo* cpu);
|
||||
|
||||
Reference in New Issue
Block a user