mirror of
https://github.com/Dr-Noob/cpufetch.git
synced 2026-03-25 07:50:40 +01:00
Compare commits
142 Commits
| Author | SHA1 | Date | |
|---|---|---|---|
|
|
0133edfa7f | ||
|
|
9106579bea | ||
|
|
1dd8016487 | ||
|
|
7689355a72 | ||
|
|
321a1ec375 | ||
|
|
48c598cf3b | ||
|
|
aa94389bbe | ||
|
|
8d10a03adc | ||
|
|
2410fd16d3 | ||
|
|
f63178b41c | ||
|
|
2788e6831e | ||
|
|
146f2a13aa | ||
|
|
90624b9aaa | ||
|
|
e42f04cca8 | ||
|
|
3aacaf5f9e | ||
|
|
50f66ec571 | ||
|
|
cb186a2f97 | ||
|
|
6164884415 | ||
|
|
260f9ec3b8 | ||
|
|
79013d0ec9 | ||
|
|
e4227388b9 | ||
|
|
8fca4cb250 | ||
|
|
7c947bdf64 | ||
|
|
1ed3a0f2bf | ||
|
|
0fe6fc3f4d | ||
|
|
96c784026b | ||
|
|
59cd2dd128 | ||
|
|
da1981b97c | ||
|
|
8506c91e00 | ||
|
|
ece28cbdee | ||
|
|
7b46c78249 | ||
|
|
e0095c303d | ||
|
|
65378aaed9 | ||
|
|
946729dd06 | ||
|
|
9212f19de1 | ||
|
|
b019256515 | ||
|
|
d4cadbd807 | ||
|
|
4f081ef1a2 | ||
|
|
1b746bc67d | ||
|
|
dfa2b773d1 | ||
|
|
59efbf4e08 | ||
|
|
29768e841d | ||
|
|
cc16bc56ef | ||
|
|
1504c5d0ef | ||
|
|
08919916dc | ||
|
|
4a8a7567f0 | ||
|
|
c01f60fa6c | ||
|
|
b610dc8c7d | ||
|
|
0967e3597b | ||
|
|
14df701707 | ||
|
|
cbcce9c2ed | ||
|
|
b072e5c331 | ||
|
|
4b42d2c89d | ||
|
|
d221f578b7 | ||
|
|
7b4b94bb93 | ||
|
|
5e00d554aa | ||
|
|
5ffac60622 | ||
|
|
6566ac3ccf | ||
|
|
0a048717bf | ||
|
|
ce6e6f9cd8 | ||
|
|
2feee25659 | ||
|
|
8335bd004d | ||
|
|
a172b4b281 | ||
|
|
d88a6bf763 | ||
|
|
8870a0ca0c | ||
|
|
a43b700540 | ||
|
|
9a578d3670 | ||
|
|
bf890965a3 | ||
|
|
530207aee0 | ||
|
|
f64ff0d4cf | ||
|
|
4b7600d49e | ||
|
|
d8ce2de287 | ||
|
|
bc9b9c1e99 | ||
|
|
b17df01958 | ||
|
|
44e5e1b6dc | ||
|
|
fe4bcde898 | ||
|
|
45854a00d6 | ||
|
|
6c69ab0a00 | ||
|
|
bd3c66395d | ||
|
|
a12defaf4b | ||
|
|
4fa3dc2076 | ||
|
|
bcf8b8171d | ||
|
|
7d81d895b0 | ||
|
|
6a5b4c3da4 | ||
|
|
5f5561f177 | ||
|
|
9a46e310e4 | ||
|
|
36071b8eb8 | ||
|
|
6349f4435e | ||
|
|
bddf6cfe31 | ||
|
|
53e5dd19f7 | ||
|
|
b3719dc216 | ||
|
|
7a3fd539c3 | ||
|
|
f6bf00e33d | ||
|
|
985bd6f25f | ||
|
|
f599613f5e | ||
|
|
8a8b1dffa8 | ||
|
|
8e95828fb1 | ||
|
|
93f733cb12 | ||
|
|
0397db2fd8 | ||
|
|
ebe7312c9d | ||
|
|
8c72295f47 | ||
|
|
bec47a44a7 | ||
|
|
de638aba50 | ||
|
|
5be6f8bba0 | ||
|
|
10d4f67cdb | ||
|
|
5dd6ab60cb | ||
|
|
99fd108d0f | ||
|
|
f28f3ef70d | ||
|
|
89aadeead8 | ||
|
|
f58d76ccac | ||
|
|
889fbf2d67 | ||
|
|
91cc04c653 | ||
|
|
05744f4e40 | ||
|
|
4405a262ca | ||
|
|
9e9828d210 | ||
|
|
65bad8721e | ||
|
|
13e86d7f14 | ||
|
|
69dd47bab0 | ||
|
|
0ef08ef53e | ||
|
|
2b4e675800 | ||
|
|
30a2493ad9 | ||
|
|
a496f694a6 | ||
|
|
14819c350e | ||
|
|
9a69a7f58d | ||
|
|
1f450b23a1 | ||
|
|
cf77360d1b | ||
|
|
dfa321d4f4 | ||
|
|
522a1c6ddd | ||
|
|
994dc0334d | ||
|
|
ec9b88cc7c | ||
|
|
c3b5dd0eb0 | ||
|
|
eaee997945 | ||
|
|
5dced25745 | ||
|
|
dc69a9f8a6 | ||
|
|
3b54f62d62 | ||
|
|
3296dc960e | ||
|
|
be600728d7 | ||
|
|
6eb2357485 | ||
|
|
b0354e28ff | ||
|
|
687459961d | ||
|
|
07e920896b | ||
|
|
57f11f3eab |
49
Makefile
49
Makefile
@@ -1,7 +1,7 @@
|
||||
CC ?= gcc
|
||||
|
||||
CFLAGS+=-Wall -Wextra -pedantic
|
||||
SANITY_FLAGS=-Wfloat-equal -Wshadow -Wpointer-arith
|
||||
SANITY_FLAGS=-Wfloat-equal -Wshadow -Wpointer-arith -Wstrict-prototypes
|
||||
|
||||
PREFIX ?= /usr
|
||||
|
||||
@@ -11,18 +11,29 @@ COMMON_SRC = $(SRC_COMMON)main.c $(SRC_COMMON)cpu.c $(SRC_COMMON)udev.c $(SRC_CO
|
||||
COMMON_HDR = $(SRC_COMMON)ascii.h $(SRC_COMMON)cpu.h $(SRC_COMMON)udev.h $(SRC_COMMON)printer.h $(SRC_COMMON)args.h $(SRC_COMMON)global.h
|
||||
|
||||
ifneq ($(OS),Windows_NT)
|
||||
GIT_VERSION := "$(shell git describe --abbrev=4 --dirty --always --tags)"
|
||||
arch := $(shell uname -m)
|
||||
os := $(shell uname -s)
|
||||
|
||||
ifeq ($(os), Linux)
|
||||
COMMON_SRC += $(SRC_COMMON)freq.c
|
||||
COMMON_HDR += $(SRC_COMMON)freq.h
|
||||
endif
|
||||
|
||||
ifeq ($(arch), $(filter $(arch), x86_64 amd64 i386 i486 i586 i686))
|
||||
SRC_DIR=src/x86/
|
||||
SOURCE += $(COMMON_SRC) $(SRC_DIR)cpuid.c $(SRC_DIR)apic.c $(SRC_DIR)cpuid_asm.c $(SRC_DIR)uarch.c
|
||||
HEADERS += $(COMMON_HDR) $(SRC_DIR)cpuid.h $(SRC_DIR)apic.h $(SRC_DIR)cpuid_asm.h $(SRC_DIR)uarch.h $(SRC_DIR)freq/freq.h
|
||||
|
||||
os := $(shell uname -s)
|
||||
ifeq ($(os), Linux)
|
||||
ifeq ($(os), Linux)
|
||||
SOURCE += $(SRC_DIR)freq/freq.c freq_nov.o freq_avx.o freq_avx512.o
|
||||
HEADERS += $(SRC_DIR)freq/freq.h
|
||||
CFLAGS += -pthread
|
||||
endif
|
||||
endif
|
||||
ifeq ($(os), FreeBSD)
|
||||
SOURCE += $(SRC_COMMON)sysctl.c
|
||||
HEADERS += $(SRC_COMMON)sysctl.h
|
||||
endif
|
||||
CFLAGS += -DARCH_X86 -std=c99 -fstack-protector-all
|
||||
else ifeq ($(arch), $(filter $(arch), ppc64le ppc64 ppcle ppc))
|
||||
SRC_DIR=src/ppc/
|
||||
@@ -31,15 +42,25 @@ ifneq ($(OS),Windows_NT)
|
||||
CFLAGS += -DARCH_PPC -std=gnu99 -fstack-protector-all -Wno-language-extension-token
|
||||
else ifeq ($(arch), $(filter $(arch), arm aarch64_be aarch64 arm64 armv8b armv8l armv7l armv6l))
|
||||
SRC_DIR=src/arm/
|
||||
SOURCE += $(COMMON_SRC) $(SRC_DIR)midr.c $(SRC_DIR)uarch.c $(SRC_DIR)soc.c $(SRC_DIR)udev.c
|
||||
HEADERS += $(COMMON_HDR) $(SRC_DIR)midr.h $(SRC_DIR)uarch.h $(SRC_DIR)soc.h $(SRC_DIR)udev.c $(SRC_DIR)socs.h
|
||||
SOURCE += $(COMMON_SRC) $(SRC_DIR)midr.c $(SRC_DIR)uarch.c $(SRC_COMMON)soc.c $(SRC_DIR)soc.c $(SRC_COMMON)pci.c $(SRC_DIR)udev.c sve.o
|
||||
HEADERS += $(COMMON_HDR) $(SRC_DIR)midr.h $(SRC_DIR)uarch.h $(SRC_COMMON)soc.h $(SRC_DIR)soc.h $(SRC_COMMON)pci.h $(SRC_DIR)udev.c $(SRC_DIR)socs.h
|
||||
CFLAGS += -DARCH_ARM -Wno-unused-parameter -std=c99 -fstack-protector-all
|
||||
|
||||
os := $(shell uname -s)
|
||||
ifeq ($(os), Darwin)
|
||||
SOURCE += $(SRC_DIR)sysctl.c
|
||||
HEADERS += $(SRC_DIR)sysctl.h
|
||||
# Check if the compiler supports -march=armv8-a+sve. We will use it (if supported) to compile SVE detection code later
|
||||
is_sve_flag_supported := $(shell $(CC) -march=armv8-a+sve -c $(SRC_DIR)sve.c -o sve_test.o 2> /dev/null && echo 'yes'; rm -f sve_test.o)
|
||||
ifeq ($(is_sve_flag_supported), yes)
|
||||
SVE_FLAGS += -march=armv8-a+sve
|
||||
endif
|
||||
|
||||
ifeq ($(os), Darwin)
|
||||
SOURCE += $(SRC_COMMON)sysctl.c
|
||||
HEADERS += $(SRC_COMMON)sysctl.h
|
||||
endif
|
||||
else ifeq ($(arch), $(filter $(arch), riscv64 riscv32))
|
||||
SRC_DIR=src/riscv/
|
||||
SOURCE += $(COMMON_SRC) $(SRC_DIR)riscv.c $(SRC_DIR)uarch.c $(SRC_COMMON)soc.c $(SRC_DIR)soc.c $(SRC_DIR)udev.c
|
||||
HEADERS += $(COMMON_HDR) $(SRC_DIR)riscv.h $(SRC_DIR)uarch.h $(SRC_COMMON)soc.h $(SRC_DIR)soc.h $(SRC_DIR)udev.h $(SRC_DIR)socs.h
|
||||
CFLAGS += -DARCH_RISCV -Wno-unused-parameter -std=c99 -fstack-protector-all
|
||||
else
|
||||
# Error lines should not be tabulated because Makefile complains about it
|
||||
$(warning Unsupported arch detected: $(arch). See https://github.com/Dr-Noob/cpufetch#1-support)
|
||||
@@ -50,6 +71,7 @@ $(error Aborting compilation)
|
||||
OUTPUT=cpufetch
|
||||
else
|
||||
# Assume x86_64
|
||||
GIT_VERSION := ""
|
||||
SRC_DIR=src/x86/
|
||||
SOURCE += $(COMMON_SRC) $(SRC_DIR)cpuid.c $(SRC_DIR)apic.c $(SRC_DIR)cpuid_asm.c $(SRC_DIR)uarch.c
|
||||
HEADERS += $(COMMON_HDR) $(SRC_DIR)cpuid.h $(SRC_DIR)apic.h $(SRC_DIR)cpuid_asm.h $(SRC_DIR)uarch.h
|
||||
@@ -79,8 +101,15 @@ freq_avx.o: Makefile $(SRC_DIR)freq/freq_avx.c $(SRC_DIR)freq/freq_avx.h $(SRC_D
|
||||
freq_avx512.o: Makefile $(SRC_DIR)freq/freq_avx512.c $(SRC_DIR)freq/freq_avx512.h $(SRC_DIR)freq/freq.h
|
||||
$(CC) $(CFLAGS) $(SANITY_FLAGS) -c -mavx512f -pthread $(SRC_DIR)freq/freq_avx512.c -o $@
|
||||
|
||||
sve.o: Makefile $(SRC_DIR)sve.c $(SRC_DIR)sve.h
|
||||
$(CC) $(CFLAGS) $(SANITY_FLAGS) $(SVE_FLAGS) -c $(SRC_DIR)sve.c -o $@
|
||||
|
||||
$(OUTPUT): Makefile $(SOURCE) $(HEADERS)
|
||||
ifeq ($(GIT_VERSION),"")
|
||||
$(CC) $(CFLAGS) $(SANITY_FLAGS) $(SOURCE) -o $(OUTPUT)
|
||||
else
|
||||
$(CC) $(CFLAGS) $(SANITY_FLAGS) -DGIT_FULL_VERSION=\"$(GIT_VERSION)\" $(SOURCE) -o $(OUTPUT)
|
||||
endif
|
||||
|
||||
run: $(OUTPUT)
|
||||
./$(OUTPUT)
|
||||
|
||||
49
README.md
49
README.md
@@ -45,11 +45,14 @@ cpufetch is a command-line tool written in C that displays the CPU information i
|
||||
- [3.1 x86_64](#31-x86_64)
|
||||
- [3.2 ARM](#32-arm)
|
||||
- [3.3 PowerPC](#33-powerpc)
|
||||
- [3.4 RISC-V](#34-risc-v)
|
||||
- [4. Colors](#4-colors)
|
||||
- [4.1 Specifying a name](#41-specifying-a-name)
|
||||
- [4.2 Specifying the colors in RGB format](#42-specifying-the-colors-in-rgb-format)
|
||||
- [5. Implementation](#5-implementation)
|
||||
- [6. Bugs or improvements](#6-bugs-or-improvements)
|
||||
- [6.1 Unknown microarchitecture error](#61-unknown-microarchitecture-error)
|
||||
- [6.2 Other situations](#62-other-situations)
|
||||
- [7. Acknowledgements](#7-acknowledgements)
|
||||
- [8. cpufetch for GPUs (gpufetch)](#8-cpufetch-for-gpus-gpufetch)
|
||||
|
||||
@@ -57,17 +60,17 @@ cpufetch is a command-line tool written in C that displays the CPU information i
|
||||
|
||||
## 1. Support
|
||||
|
||||
| OS | x86_64 / x86 | ARM | PowerPC |
|
||||
|:-----------:|:------------------:|:------------------:|:------------------:|
|
||||
| GNU / Linux | :heavy_check_mark: | :heavy_check_mark: | :heavy_check_mark: |
|
||||
| Windows | :heavy_check_mark: | :x: | :x: |
|
||||
| Android | :heavy_check_mark: | :heavy_check_mark: | :x: |
|
||||
| macOS | :heavy_check_mark: | :heavy_check_mark: | :x: |
|
||||
| FreeBSD | :heavy_check_mark: | :x: | :x: |
|
||||
| OS | x86_64 / x86 | ARM | RISC-V | PowerPC |
|
||||
|:-----------:|:------------------:|:------------------:|:------------------:|:------------------:|
|
||||
| GNU / Linux | :heavy_check_mark: | :heavy_check_mark: | :heavy_check_mark: | :heavy_check_mark: |
|
||||
| Windows | :heavy_check_mark: | :x: | :x: | :x: |
|
||||
| Android | :heavy_check_mark: | :heavy_check_mark: | :x: | :x: |
|
||||
| macOS | :heavy_check_mark: | :heavy_check_mark: | :x: | :heavy_check_mark: |
|
||||
| FreeBSD | :heavy_check_mark: | :x: | :x: | :x: |
|
||||
|
||||
**NOTES:**
|
||||
- Colors will be used in Windows only if the terminal supports it.
|
||||
- Support in macOS ARM is limited to Apple M1 only
|
||||
- Support in macOS ARM is limited to Apple chips only
|
||||
|
||||
## 2. Installation
|
||||
### 2.1 Installing from a package
|
||||
@@ -118,6 +121,11 @@ make
|
||||
<p align="center"><img width=90% src="pictures/ibm.png"></p>
|
||||
<p align="center">Talos II</p>
|
||||
|
||||
## 3.4 RISC-V
|
||||
|
||||
<p align="center"><img width=80% src="pictures/starfive.png"></p>
|
||||
<p align="center">StarFive VisionFive 2</p>
|
||||
|
||||
## 4. Colors
|
||||
By default, `cpufetch` will print the CPU logo with the system colorscheme. However, you can set a custom color scheme in two different ways:
|
||||
|
||||
@@ -147,14 +155,33 @@ By default, `cpufetch` will print the CPU logo with the system colorscheme. Howe
|
||||
See [cpufetch programming documentation](https://github.com/Dr-Noob/cpufetch/tree/master/doc).
|
||||
|
||||
## 6. Bugs or improvements
|
||||
### 6.1 Unknown microarchitecture error
|
||||
If you get the `Unknown microarchitecture detected` error when running cpufetch, it might be caused by two possible reasons:
|
||||
|
||||
1. You are running an old release of cpufetch (most likely)
|
||||
2. Your microarchitecture is not yet supported
|
||||
|
||||
Download and compile the latest version (see https://github.com/Dr-Noob/cpufetch#22-building-from-source for instructions)
|
||||
and verify if the error persists.
|
||||
|
||||
* __If the error dissapears__: It means that this is the first situation. In this case, just use the
|
||||
latest version of cpufetch which already has support for your hardware.
|
||||
* __If the error does not dissapear__: It means that this is the
|
||||
second situation. In this case, please create a new issue with the error message and the output of 'cpufetch --debug' on https://github.com/Dr-Noob/cpufetch/issues
|
||||
|
||||
### 6.2 Other situations
|
||||
See [cpufetch contributing guidelines](https://github.com/Dr-Noob/cpufetch/blob/master/CONTRIBUTING.md).
|
||||
|
||||
## 7. Acknowledgements
|
||||
Thanks to the fellow contributors and interested people in the project. Special thanks to:
|
||||
- [Gonzalocl](https://github.com/Gonzalocl), [OdnetninI](https://github.com/OdnetninI): Tested cpufetch in the earlier versions of the project in many different CPUs.
|
||||
- [Gonzalocl](https://github.com/Gonzalocl) and [OdnetninI](https://github.com/OdnetninI): Tested cpufetch in the earlier versions of the project in many different CPUs.
|
||||
- [Kyngo](https://github.com/Kyngo): Tested cpufetch in the Apple M1 CPU.
|
||||
- [avollmerhaus](https://github.com/avollmerhaus): Gave me ssh acess to a PowerPC machine, allowing me to develop the PowerPC port.
|
||||
- [bbonev](https://github.com/bbonev), [stephan-cr](https://github.com/stephan-cr): Reviewed the source code.
|
||||
- [avollmerhaus](https://github.com/avollmerhaus): Helped with PowerPC port giving ssh access to a PowerPC machine.
|
||||
- [bbonev](https://github.com/bbonev) and [stephan-cr](https://github.com/stephan-cr): Reviewed the source code.
|
||||
- [mdoksa76](https://github.com/mdoksa76) and [exkc](https://github.com/exkc): Excellent ideas and feedback for supporting Allwinner SoCs.
|
||||
- [Sakura286](https://github.com/Sakura286), [exkc](https://github.com/exkc) and [Patola](https://github.com/Patola): Helped with RISC-V port with ssh access, ideas, testing, etc.
|
||||
- [ThomasKaiser](https://github.com/ThomasKaiser): Very valuable feedback on improving ARM SoC detection (Apple, Allwinner, Rockchip).
|
||||
- [zerkerX](https://github.com/zerkerX): Helped with feedback for supporting old (e.g., Pentium III) Intel CPUs.
|
||||
|
||||
## 8. cpufetch for GPUs (gpufetch)
|
||||
See [gpufetch](https://github.com/Dr-Noob/gpufetch) project!
|
||||
|
||||
BIN
pictures/starfive.png
Normal file
BIN
pictures/starfive.png
Normal file
Binary file not shown.
|
After Width: | Height: | Size: 42 KiB |
196
src/arm/midr.c
196
src/arm/midr.c
@@ -8,15 +8,18 @@
|
||||
#ifdef __linux__
|
||||
#include <sys/auxv.h>
|
||||
#include <asm/hwcap.h>
|
||||
#include "../common/freq.h"
|
||||
#elif defined __APPLE__ || __MACH__
|
||||
#include "sysctl.h"
|
||||
#include "../common/sysctl.h"
|
||||
#endif
|
||||
|
||||
#include "../common/global.h"
|
||||
#include "../common/soc.h"
|
||||
#include "../common/args.h"
|
||||
#include "udev.h"
|
||||
#include "midr.h"
|
||||
#include "uarch.h"
|
||||
#include "soc.h"
|
||||
#include "sve.h"
|
||||
|
||||
bool cores_are_equal(int c1pos, int c2pos, uint32_t* midr_array, int32_t* freq_array) {
|
||||
return midr_array[c1pos] == midr_array[c2pos] && freq_array[c1pos] == freq_array[c2pos];
|
||||
@@ -39,8 +42,17 @@ struct cache* get_cache_info(struct cpuInfo* cpu) {
|
||||
struct frequency* get_frequency_info(uint32_t core) {
|
||||
struct frequency* freq = emalloc(sizeof(struct frequency));
|
||||
|
||||
freq->measured = false;
|
||||
freq->base = UNKNOWN_DATA;
|
||||
freq->max = get_max_freq_from_file(core);
|
||||
#ifdef __linux__
|
||||
if (freq->max == UNKNOWN_DATA || measure_max_frequency_flag()) {
|
||||
if (freq->max == UNKNOWN_DATA)
|
||||
printWarn("Unable to find max frequency from udev, measuring CPU frequency");
|
||||
freq->max = measure_max_frequency(core);
|
||||
freq->measured = true;
|
||||
}
|
||||
#endif
|
||||
|
||||
return freq;
|
||||
}
|
||||
@@ -80,26 +92,21 @@ int64_t get_peak_performance(struct cpuInfo* cpu) {
|
||||
}
|
||||
}
|
||||
|
||||
int64_t flops = 0;
|
||||
int64_t total_flops = 0;
|
||||
ptr = cpu;
|
||||
|
||||
if(cpu->soc->soc_vendor == SOC_VENDOR_APPLE) {
|
||||
// Special case for M1/M2
|
||||
// First we find the E cores, then the P
|
||||
// M1 have 2 (E cores) or 4 (P cores) FMA units
|
||||
// Source: https://dougallj.github.io/applecpu/firestorm-simd.html
|
||||
flops += ptr->topo->total_cores * (get_freq(ptr->freq) * 1000000) * 2 * 4 * 2;
|
||||
ptr = ptr->next_cpu;
|
||||
flops += ptr->topo->total_cores * (get_freq(ptr->freq) * 1000000) * 2 * 4 * 4;
|
||||
}
|
||||
else {
|
||||
for(int i=0; i < cpu->num_cpus; ptr = ptr->next_cpu, i++) {
|
||||
flops += ptr->topo->total_cores * (get_freq(ptr->freq) * 1000000);
|
||||
}
|
||||
if(cpu->feat->NEON) flops = flops * 4;
|
||||
for(int i=0; i < cpu->num_cpus; ptr = ptr->next_cpu, i++) {
|
||||
int vpus = get_number_of_vpus(ptr);
|
||||
int vpus_width = get_vpus_width(ptr);
|
||||
bool has_fma = has_fma_support(ptr);
|
||||
|
||||
int64_t flops = ptr->topo->total_cores * get_freq(ptr->freq) * 1000000 * vpus * (vpus_width/32);
|
||||
if(has_fma) flops = flops * 2;
|
||||
|
||||
total_flops += flops;
|
||||
}
|
||||
|
||||
return flops;
|
||||
return total_flops;
|
||||
}
|
||||
|
||||
uint32_t fill_ids_from_midr(uint32_t* midr_array, int32_t* freq_array, uint32_t* ids_array, int len) {
|
||||
@@ -141,7 +148,7 @@ void init_cpu_info(struct cpuInfo* cpu) {
|
||||
// true...
|
||||
// ARM32 https://elixir.bootlin.com/linux/latest/source/arch/arm/include/uapi/asm/hwcap.h
|
||||
// ARM64 https://elixir.bootlin.com/linux/latest/source/arch/arm64/include/uapi/asm/hwcap.h
|
||||
struct features* get_features_info() {
|
||||
struct features* get_features_info(void) {
|
||||
struct features* feat = emalloc(sizeof(struct features));
|
||||
bool *ptr = &(feat->AES);
|
||||
for(uint32_t i = 0; i < sizeof(struct features)/sizeof(bool); i++, ptr++) {
|
||||
@@ -162,6 +169,15 @@ struct features* get_features_info() {
|
||||
feat->SHA1 = hwcaps & HWCAP_SHA1;
|
||||
feat->SHA2 = hwcaps & HWCAP_SHA2;
|
||||
feat->NEON = hwcaps & HWCAP_ASIMD;
|
||||
feat->SVE = hwcaps & HWCAP_SVE;
|
||||
|
||||
hwcaps = getauxval(AT_HWCAP2);
|
||||
if (errno == ENOENT) {
|
||||
printWarn("Unable to retrieve AT_HWCAP2 using getauxval");
|
||||
}
|
||||
else {
|
||||
feat->SVE2 = hwcaps & HWCAP2_SVE2;
|
||||
}
|
||||
}
|
||||
#else
|
||||
else {
|
||||
@@ -177,6 +193,8 @@ struct features* get_features_info() {
|
||||
feat->CRC32 = hwcaps & HWCAP2_CRC32;
|
||||
feat->SHA1 = hwcaps & HWCAP2_SHA1;
|
||||
feat->SHA2 = hwcaps & HWCAP2_SHA2;
|
||||
feat->SVE = false;
|
||||
feat->SVE2 = false;
|
||||
}
|
||||
#endif // ifdef __aarch64__
|
||||
#elif defined __APPLE__ || __MACH__
|
||||
@@ -186,8 +204,14 @@ struct features* get_features_info() {
|
||||
feat->SHA1 = true;
|
||||
feat->SHA2 = true;
|
||||
feat->NEON = true;
|
||||
feat->SVE = false;
|
||||
feat->SVE2 = false;
|
||||
#endif // ifdef __linux__
|
||||
|
||||
if (feat->SVE || feat->SVE2) {
|
||||
feat->cntb = sve_cntb();
|
||||
}
|
||||
|
||||
return feat;
|
||||
}
|
||||
|
||||
@@ -294,7 +318,7 @@ void fill_cpu_info_avalanche_blizzard(struct cpuInfo* cpu, uint32_t pcores, uint
|
||||
bli->feat = get_features_info();
|
||||
bli->topo = malloc(sizeof(struct topology));
|
||||
bli->topo->cach = bli->cach;
|
||||
bli->topo->total_cores = pcores;
|
||||
bli->topo->total_cores = ecores;
|
||||
bli->freq = malloc(sizeof(struct frequency));
|
||||
bli->freq->base = UNKNOWN_DATA;
|
||||
bli->freq->max = 2800;
|
||||
@@ -310,7 +334,7 @@ void fill_cpu_info_avalanche_blizzard(struct cpuInfo* cpu, uint32_t pcores, uint
|
||||
ava->feat = get_features_info();
|
||||
ava->topo = malloc(sizeof(struct topology));
|
||||
ava->topo->cach = ava->cach;
|
||||
ava->topo->total_cores = ecores;
|
||||
ava->topo->total_cores = pcores;
|
||||
ava->freq = malloc(sizeof(struct frequency));
|
||||
ava->freq->base = UNKNOWN_DATA;
|
||||
ava->freq->max = 3500;
|
||||
@@ -319,51 +343,84 @@ void fill_cpu_info_avalanche_blizzard(struct cpuInfo* cpu, uint32_t pcores, uint
|
||||
ava->next_cpu = NULL;
|
||||
}
|
||||
|
||||
struct cpuInfo* get_cpu_info_mach(struct cpuInfo* cpu) {
|
||||
uint32_t cpu_family = get_sys_info_by_name("hw.cpufamily");
|
||||
void fill_cpu_info_everest_sawtooth(struct cpuInfo* cpu, uint32_t pcores, uint32_t ecores) {
|
||||
// 1. Fill SAWTOOTH
|
||||
struct cpuInfo* saw = cpu;
|
||||
|
||||
saw->midr = MIDR_APPLE_M3_SAWTOOTH;
|
||||
saw->arch = get_uarch_from_midr(saw->midr, saw);
|
||||
saw->cach = get_cache_info(saw);
|
||||
saw->feat = get_features_info();
|
||||
saw->topo = malloc(sizeof(struct topology));
|
||||
saw->topo->cach = saw->cach;
|
||||
saw->topo->total_cores = ecores;
|
||||
saw->freq = malloc(sizeof(struct frequency));
|
||||
saw->freq->base = UNKNOWN_DATA;
|
||||
saw->freq->max = 2750;
|
||||
saw->hv = malloc(sizeof(struct hypervisor));
|
||||
saw->hv->present = false;
|
||||
saw->next_cpu = malloc(sizeof(struct cpuInfo));
|
||||
|
||||
// 2. Fill EVEREST
|
||||
struct cpuInfo* eve = saw->next_cpu;
|
||||
eve->midr = MIDR_APPLE_M3_EVEREST;
|
||||
eve->arch = get_uarch_from_midr(eve->midr, eve);
|
||||
eve->cach = get_cache_info(eve);
|
||||
eve->feat = get_features_info();
|
||||
eve->topo = malloc(sizeof(struct topology));
|
||||
eve->topo->cach = eve->cach;
|
||||
eve->topo->total_cores = pcores;
|
||||
eve->freq = malloc(sizeof(struct frequency));
|
||||
eve->freq->base = UNKNOWN_DATA;
|
||||
eve->freq->max = 4050;
|
||||
eve->hv = malloc(sizeof(struct hypervisor));
|
||||
eve->hv->present = false;
|
||||
eve->next_cpu = NULL;
|
||||
}
|
||||
|
||||
struct cpuInfo* get_cpu_info_mach(struct cpuInfo* cpu) {
|
||||
// https://developer.apple.com/documentation/kernel/1387446-sysctlbyname/determining_system_capabilities
|
||||
uint32_t nperflevels = get_sys_info_by_name("hw.nperflevels");
|
||||
|
||||
if((cpu->num_cpus = nperflevels) != 2) {
|
||||
printBug("Expected to find SoC with 2 perf levels, found: %d", cpu->num_cpus);
|
||||
return NULL;
|
||||
}
|
||||
|
||||
uint32_t pcores = get_sys_info_by_name("hw.perflevel0.physicalcpu");
|
||||
uint32_t ecores = get_sys_info_by_name("hw.perflevel1.physicalcpu");
|
||||
if(ecores <= 0) {
|
||||
printBug("Expected to find a numer of ecores > 0, found: %d", ecores);
|
||||
return NULL;
|
||||
}
|
||||
if(pcores <= 0) {
|
||||
printBug("Expected to find a numer of pcores > 0, found: %d", pcores);
|
||||
return NULL;
|
||||
}
|
||||
|
||||
uint32_t cpu_family = get_sys_info_by_name("hw.cpufamily");
|
||||
// Manually fill the cpuInfo assuming that
|
||||
// the CPU is an Apple M1/M2
|
||||
// the CPU is an Apple SoC
|
||||
if(cpu_family == CPUFAMILY_ARM_FIRESTORM_ICESTORM) {
|
||||
cpu->num_cpus = 2;
|
||||
// Now detect the M1 version
|
||||
uint32_t cpu_subfamily = get_sys_info_by_name("hw.cpusubfamily");
|
||||
if(cpu_subfamily == CPUSUBFAMILY_ARM_HG) {
|
||||
// Apple M1
|
||||
fill_cpu_info_firestorm_icestorm(cpu, 4, 4);
|
||||
}
|
||||
else if(cpu_subfamily == CPUSUBFAMILY_ARM_HS || cpu_subfamily == CPUSUBFAMILY_ARM_HC_HD) {
|
||||
// Apple M1 Pro/Max/Ultra. Detect number of cores
|
||||
uint32_t physicalcpu = get_sys_info_by_name("hw.physicalcpu");
|
||||
if(physicalcpu == 20) {
|
||||
// M1 Ultra
|
||||
fill_cpu_info_firestorm_icestorm(cpu, 16, 4);
|
||||
}
|
||||
else if(physicalcpu == 8 || physicalcpu == 10) {
|
||||
// M1 Pro/Max
|
||||
fill_cpu_info_firestorm_icestorm(cpu, physicalcpu-2, 2);
|
||||
}
|
||||
else {
|
||||
printBug("Found invalid physical cpu number: %d", physicalcpu);
|
||||
return NULL;
|
||||
}
|
||||
}
|
||||
else {
|
||||
printBug("Found invalid cpu_subfamily: 0x%.8X", cpu_subfamily);
|
||||
return NULL;
|
||||
}
|
||||
cpu->soc = get_soc();
|
||||
fill_cpu_info_firestorm_icestorm(cpu, pcores, ecores);
|
||||
cpu->soc = get_soc(cpu);
|
||||
cpu->peak_performance = get_peak_performance(cpu);
|
||||
}
|
||||
else if(cpu_family == CPUFAMILY_ARM_AVALANCHE_BLIZZARD) {
|
||||
// Just the "normal" M2 exists for now
|
||||
cpu->num_cpus = 2;
|
||||
fill_cpu_info_avalanche_blizzard(cpu, 4, 4);
|
||||
cpu->soc = get_soc();
|
||||
fill_cpu_info_avalanche_blizzard(cpu, pcores, ecores);
|
||||
cpu->soc = get_soc(cpu);
|
||||
cpu->peak_performance = get_peak_performance(cpu);
|
||||
}
|
||||
else if(cpu_family == CPUFAMILY_ARM_EVEREST_SAWTOOTH ||
|
||||
cpu_family == CPUFAMILY_ARM_EVEREST_SAWTOOTH_2 ||
|
||||
cpu_family == CPUFAMILY_ARM_EVEREST_SAWTOOTH_PRO ||
|
||||
cpu_family == CPUFAMILY_ARM_EVEREST_SAWTOOTH_MAX) {
|
||||
fill_cpu_info_everest_sawtooth(cpu, pcores, ecores);
|
||||
cpu->soc = get_soc(cpu);
|
||||
cpu->peak_performance = get_peak_performance(cpu);
|
||||
}
|
||||
else {
|
||||
printBug("Found invalid cpu_family: 0x%.8X", cpu_family);
|
||||
printBugCheckRelease("Found invalid cpu_family: 0x%.8X", cpu_family);
|
||||
return NULL;
|
||||
}
|
||||
|
||||
@@ -371,7 +428,7 @@ struct cpuInfo* get_cpu_info_mach(struct cpuInfo* cpu) {
|
||||
}
|
||||
#endif
|
||||
|
||||
struct cpuInfo* get_cpu_info() {
|
||||
struct cpuInfo* get_cpu_info(void) {
|
||||
struct cpuInfo* cpu = malloc(sizeof(struct cpuInfo));
|
||||
init_cpu_info(cpu);
|
||||
|
||||
@@ -392,7 +449,7 @@ char* get_str_topology(struct cpuInfo* cpu, struct topology* topo, bool dual_soc
|
||||
|
||||
char* get_str_features(struct cpuInfo* cpu) {
|
||||
struct features* feat = cpu->feat;
|
||||
uint32_t max_len = strlen("NEON,SHA1,SHA2,AES,CRC32,") + 1;
|
||||
uint32_t max_len = strlen("NEON,SHA1,SHA2,AES,CRC32,SVE,SVE2,") + 1;
|
||||
uint32_t len = 0;
|
||||
char* string = ecalloc(max_len, sizeof(char));
|
||||
|
||||
@@ -400,6 +457,14 @@ char* get_str_features(struct cpuInfo* cpu) {
|
||||
strcat(string, "NEON,");
|
||||
len += 5;
|
||||
}
|
||||
if(feat->SVE) {
|
||||
strcat(string, "SVE,");
|
||||
len += 4;
|
||||
}
|
||||
if(feat->SVE2) {
|
||||
strcat(string, "SVE2,");
|
||||
len += 5;
|
||||
}
|
||||
if(feat->SHA1) {
|
||||
strcat(string, "SHA1,");
|
||||
len += 5;
|
||||
@@ -448,6 +513,19 @@ void print_debug(struct cpuInfo* cpu) {
|
||||
printf("%ld MHz\n", freq);
|
||||
}
|
||||
}
|
||||
|
||||
if (cpu->feat->SVE || cpu->feat->SVE2) {
|
||||
printf("- cntb: %d\n", (int) cpu->feat->cntb);
|
||||
}
|
||||
|
||||
#if defined(__APPLE__) || defined(__MACH__)
|
||||
printf("hw.cpufamily: 0x%.8X\n", get_sys_info_by_name("hw.cpufamily"));
|
||||
printf("hw.cpusubfamily: 0x%.8X\n", get_sys_info_by_name("hw.cpusubfamily"));
|
||||
printf("hw.nperflevels: %d\n", get_sys_info_by_name("hw.nperflevels"));
|
||||
printf("hw.physicalcpu: %d\n", get_sys_info_by_name("hw.physicalcpu"));
|
||||
printf("hw.perflevel0.physicalcpu: %d\n", get_sys_info_by_name("hw.perflevel0.physicalcpu"));
|
||||
printf("hw.perflevel1.physicalcpu: %d\n", get_sys_info_by_name("hw.perflevel1.physicalcpu"));
|
||||
#endif
|
||||
}
|
||||
|
||||
void free_topo_struct(struct topology* topo) {
|
||||
|
||||
@@ -3,7 +3,7 @@
|
||||
|
||||
#include "../common/cpu.h"
|
||||
|
||||
struct cpuInfo* get_cpu_info();
|
||||
struct cpuInfo* get_cpu_info(void);
|
||||
|
||||
uint32_t get_nsockets(struct topology* topo);
|
||||
char* get_str_topology(struct cpuInfo* cpu, struct topology* topo, bool dual_socket);
|
||||
|
||||
740
src/arm/soc.c
740
src/arm/soc.c
File diff suppressed because it is too large
Load Diff
@@ -1,33 +1,10 @@
|
||||
#ifndef __SOC__
|
||||
#define __SOC__
|
||||
#ifndef __SOC_ARM__
|
||||
#define __SOC_ARM__
|
||||
|
||||
#include "../common/cpu.h"
|
||||
#include "../common/soc.h"
|
||||
#include <stdint.h>
|
||||
|
||||
typedef int32_t SOC;
|
||||
|
||||
enum {
|
||||
SOC_VENDOR_UNKNOWN,
|
||||
SOC_VENDOR_SNAPDRAGON,
|
||||
SOC_VENDOR_MEDIATEK,
|
||||
SOC_VENDOR_EXYNOS,
|
||||
SOC_VENDOR_KIRIN,
|
||||
SOC_VENDOR_BROADCOM,
|
||||
SOC_VENDOR_APPLE,
|
||||
SOC_VENDOR_ALLWINNER
|
||||
};
|
||||
|
||||
struct system_on_chip {
|
||||
SOC soc_model;
|
||||
VENDOR soc_vendor;
|
||||
int32_t process;
|
||||
char* soc_name;
|
||||
char* raw_name;
|
||||
};
|
||||
|
||||
struct system_on_chip* get_soc(struct cpuInfo* cpu);
|
||||
char* get_soc_name(struct system_on_chip* soc);
|
||||
VENDOR get_soc_vendor(struct system_on_chip* soc);
|
||||
char* get_str_process(struct system_on_chip* soc);
|
||||
|
||||
#endif
|
||||
|
||||
183
src/arm/socs.h
183
src/arm/socs.h
@@ -10,7 +10,6 @@ enum {
|
||||
SOC_BCM_2836,
|
||||
SOC_BCM_2837,
|
||||
SOC_BCM_2837B0,
|
||||
SOC_BCM_2711,
|
||||
SOC_BCM_21553,
|
||||
SOC_BCM_21553T,
|
||||
SOC_BCM_21663,
|
||||
@@ -20,6 +19,8 @@ enum {
|
||||
SOC_BCM_28145,
|
||||
SOC_BCM_2157,
|
||||
SOC_BCM_21654,
|
||||
SOC_BCM_2711,
|
||||
SOC_BCM_2712,
|
||||
// Hisilicon //
|
||||
SOC_HISILICON_3620,
|
||||
SOC_HISILICON_3630,
|
||||
@@ -28,6 +29,10 @@ enum {
|
||||
SOC_HISILICON_3670,
|
||||
SOC_HISILICON_3680,
|
||||
SOC_HISILICON_3690,
|
||||
SOC_HISILICON_9000S,
|
||||
// Kunpeng //
|
||||
SOC_KUNPENG_920,
|
||||
SOC_KUNPENG_930,
|
||||
// Exynos //
|
||||
SOC_EXYNOS_3475,
|
||||
SOC_EXYNOS_4210,
|
||||
@@ -63,39 +68,23 @@ enum {
|
||||
SOC_EXYNOS_980,
|
||||
SOC_EXYNOS_880,
|
||||
// Mediatek //
|
||||
SOC_MTK_MT6893,
|
||||
SOC_MTK_MT6891,
|
||||
SOC_MTK_MT6889,
|
||||
SOC_MTK_MT6885Z,
|
||||
SOC_MTK_MT6853,
|
||||
SOC_MTK_MT6873,
|
||||
SOC_MTK_MT6875,
|
||||
SOC_MTK_MT6761D,
|
||||
SOC_MTK_MT6761,
|
||||
SOC_MTK_MT6762D,
|
||||
SOC_MTK_MT6755,
|
||||
SOC_MTK_MT6755M,
|
||||
SOC_MTK_MT6755T,
|
||||
SOC_MTK_MT6757,
|
||||
SOC_MTK_MT6762,
|
||||
SOC_MTK_MT6763V,
|
||||
SOC_MTK_MT6763T,
|
||||
SOC_MTK_MT6757CD,
|
||||
SOC_MTK_MT6758,
|
||||
SOC_MTK_MT6765,
|
||||
SOC_MTK_MT6771,
|
||||
SOC_MTK_MT6768,
|
||||
SOC_MTK_MT6771T,
|
||||
SOC_MTK_MT6771V,
|
||||
SOC_MTK_MT6779,
|
||||
SOC_MTK_MT6795,
|
||||
SOC_MTK_MT6795T,
|
||||
SOC_MTK_MT6797,
|
||||
SOC_MTK_MT6797M,
|
||||
SOC_MTK_MT6797D,
|
||||
SOC_MTK_MT6797T,
|
||||
SOC_MTK_MT6797X,
|
||||
SOC_MTK_MT6799,
|
||||
SOC_MTK_MT5327,
|
||||
SOC_MTK_MT5329,
|
||||
SOC_MTK_MT5366,
|
||||
SOC_MTK_MT5389,
|
||||
SOC_MTK_MT5395,
|
||||
SOC_MTK_MT5396,
|
||||
SOC_MTK_MT5398,
|
||||
SOC_MTK_MT5505,
|
||||
SOC_MTK_MT5561,
|
||||
SOC_MTK_MT5580,
|
||||
SOC_MTK_MT5582,
|
||||
SOC_MTK_MT5592,
|
||||
SOC_MTK_MT5595,
|
||||
SOC_MTK_MT5596,
|
||||
SOC_MTK_MT5597,
|
||||
SOC_MTK_MT5889,
|
||||
SOC_MTK_MT5895,
|
||||
SOC_MTK_MT6515,
|
||||
SOC_MTK_MT6516,
|
||||
SOC_MTK_MT6517,
|
||||
@@ -125,7 +114,51 @@ enum {
|
||||
SOC_MTK_MT6750T,
|
||||
SOC_MTK_MT6752,
|
||||
SOC_MTK_MT6753,
|
||||
SOC_MTK_MT6755M,
|
||||
SOC_MTK_MT6755T,
|
||||
SOC_MTK_MT6757,
|
||||
SOC_MTK_MT6757CD,
|
||||
SOC_MTK_MT6758,
|
||||
SOC_MTK_MT6761,
|
||||
SOC_MTK_MT6761D,
|
||||
SOC_MTK_MT6762,
|
||||
SOC_MTK_MT6762D,
|
||||
SOC_MTK_MT6762G,
|
||||
SOC_MTK_MT6763T,
|
||||
SOC_MTK_MT6763V,
|
||||
SOC_MTK_MT6765,
|
||||
SOC_MTK_MT6765G,
|
||||
SOC_MTK_MT6765H,
|
||||
SOC_MTK_MT6768,
|
||||
SOC_MTK_MT6769H,
|
||||
SOC_MTK_MT6769T,
|
||||
SOC_MTK_MT6769V,
|
||||
SOC_MTK_MT6769Z,
|
||||
SOC_MTK_MT6771,
|
||||
SOC_MTK_MT6779V_CU,
|
||||
SOC_MTK_MT6779V_CV,
|
||||
SOC_MTK_MT6785V_CC,
|
||||
SOC_MTK_MT6785V_CD,
|
||||
SOC_MTK_MT6789,
|
||||
SOC_MTK_MT6795,
|
||||
SOC_MTK_MT6797,
|
||||
SOC_MTK_MT6797T,
|
||||
SOC_MTK_MT6797X,
|
||||
SOC_MTK_MT6799,
|
||||
SOC_MTK_MT6833,
|
||||
SOC_MTK_MT6850,
|
||||
SOC_MTK_MT6853,
|
||||
SOC_MTK_MT6853V,
|
||||
SOC_MTK_MT6873,
|
||||
SOC_MTK_MT6875,
|
||||
SOC_MTK_MT6879,
|
||||
SOC_MTK_MT6883Z,
|
||||
SOC_MTK_MT6885Z,
|
||||
SOC_MTK_MT6889,
|
||||
SOC_MTK_MT6889Z,
|
||||
SOC_MTK_MT6891,
|
||||
SOC_MTK_MT6893,
|
||||
SOC_MTK_MT6893Z,
|
||||
SOC_MTK_MT8121,
|
||||
SOC_MTK_MT8125,
|
||||
SOC_MTK_MT8127,
|
||||
@@ -140,7 +173,25 @@ enum {
|
||||
SOC_MTK_MT8581,
|
||||
SOC_MTK_MT8735,
|
||||
SOC_MTK_MT8765B,
|
||||
SOC_MTK_MT8781V,
|
||||
SOC_MTK_MT8783,
|
||||
SOC_MTK_MT9602,
|
||||
SOC_MTK_MT9612,
|
||||
SOC_MTK_MT9613,
|
||||
SOC_MTK_MT9615,
|
||||
SOC_MTK_MT9618,
|
||||
SOC_MTK_MT9632,
|
||||
SOC_MTK_MT9638,
|
||||
SOC_MTK_MT9652,
|
||||
SOC_MTK_MT9653,
|
||||
SOC_MTK_MT9675,
|
||||
SOC_MTK_MT9685,
|
||||
SOC_MTK_MT9686,
|
||||
SOC_MTK_MT9689,
|
||||
SOC_MTK_MT9902,
|
||||
SOC_MTK_MT9950,
|
||||
SOC_MTK_MT9972,
|
||||
SOC_MTK_MT9982,
|
||||
// Snapdragon //
|
||||
SOC_SNAPD_QSD8650,
|
||||
SOC_SNAPD_QSD8250,
|
||||
@@ -220,11 +271,16 @@ enum {
|
||||
SOC_SNAPD_SDM660,
|
||||
SOC_SNAPD_SM6115,
|
||||
SOC_SNAPD_SM6125,
|
||||
SOC_SNAPD_SM6375_AC,
|
||||
SOC_SNAPD_SM6450,
|
||||
SOC_SNAPD_SDM670,
|
||||
SOC_SNAPD_SM6150,
|
||||
SOC_SNAPD_SM6350,
|
||||
SOC_SNAPD_SDM710,
|
||||
SOC_SNAPD_SDM712,
|
||||
SOC_SNAPD_SM4375,
|
||||
SOC_SNAPD_SM4450,
|
||||
SOC_SNAPD_SM4635,
|
||||
SOC_SNAPD_SM7125,
|
||||
SOC_SNAPD_SM7150_AA,
|
||||
SOC_SNAPD_SM7150_AB,
|
||||
@@ -233,6 +289,11 @@ enum {
|
||||
SOC_SNAPD_SM7250_AA,
|
||||
SOC_SNAPD_SM7250_AB,
|
||||
SOC_SNAPD_SM7250_AC,
|
||||
SOC_SNAPD_SM7435_AB,
|
||||
SOC_SNAPD_SM7450,
|
||||
SOC_SNAPD_SM7475,
|
||||
SOC_SNAPD_SM7550_AB,
|
||||
SOC_SNAPD_SM7675_AB,
|
||||
SOC_SNAPD_MSM8974AA,
|
||||
SOC_SNAPD_MSM8974AB,
|
||||
SOC_SNAPD_MSM8974AC,
|
||||
@@ -254,12 +315,21 @@ enum {
|
||||
SOC_SNAPD_SM8350,
|
||||
SOC_SNAPD_SM8450,
|
||||
SOC_SNAPD_SM8475,
|
||||
SOC_SNAPD_SM8550_AB,
|
||||
SOC_SNAPD_SM8635,
|
||||
SOC_SNAPD_SM8650_AB,
|
||||
// APPLE
|
||||
SOC_APPLE_M1,
|
||||
SOC_APPLE_M1_PRO,
|
||||
SOC_APPLE_M1_MAX,
|
||||
SOC_APPLE_M1_ULTRA,
|
||||
SOC_APPLE_M2,
|
||||
SOC_APPLE_M2_PRO,
|
||||
SOC_APPLE_M2_MAX,
|
||||
SOC_APPLE_M2_ULTRA,
|
||||
SOC_APPLE_M3,
|
||||
SOC_APPLE_M3_PRO,
|
||||
SOC_APPLE_M3_MAX,
|
||||
// ALLWINNER
|
||||
SOC_ALLWINNER_A10,
|
||||
SOC_ALLWINNER_A13,
|
||||
@@ -271,29 +341,64 @@ enum {
|
||||
SOC_ALLWINNER_A33,
|
||||
SOC_ALLWINNER_A40,
|
||||
SOC_ALLWINNER_A50,
|
||||
SOC_ALLWINNER_A64,
|
||||
SOC_ALLWINNER_A80,
|
||||
SOC_ALLWINNER_A83T,
|
||||
SOC_ALLWINNER_V3S,
|
||||
SOC_ALLWINNER_HZP,
|
||||
SOC_ALLWINNER_H2PLUS,
|
||||
SOC_ALLWINNER_S3,
|
||||
SOC_ALLWINNER_H3,
|
||||
SOC_ALLWINNER_H8,
|
||||
SOC_ALLWINNER_H5,
|
||||
SOC_ALLWINNER_H6,
|
||||
SOC_ALLWINNER_H64,
|
||||
SOC_ALLWINNER_H616,
|
||||
SOC_ALLWINNER_H618,
|
||||
SOC_ALLWINNER_R8,
|
||||
SOC_ALLWINNER_R16,
|
||||
SOC_ALLWINNER_R40,
|
||||
SOC_ALLWINNER_R58,
|
||||
SOC_ALLWINNER_R328
|
||||
SOC_ALLWINNER_R328,
|
||||
// ROCKCHIP
|
||||
SOC_ROCKCHIP_3288,
|
||||
SOC_ROCKCHIP_3229,
|
||||
SOC_ROCKCHIP_3308,
|
||||
SOC_ROCKCHIP_3318,
|
||||
SOC_ROCKCHIP_3326,
|
||||
SOC_ROCKCHIP_3328,
|
||||
SOC_ROCKCHIP_3368,
|
||||
SOC_ROCKCHIP_3399,
|
||||
SOC_ROCKCHIP_3528,
|
||||
SOC_ROCKCHIP_3562,
|
||||
SOC_ROCKCHIP_3566,
|
||||
SOC_ROCKCHIP_3568,
|
||||
SOC_ROCKCHIP_3588,
|
||||
// GOOGLE
|
||||
SOC_GOOGLE_TENSOR,
|
||||
SOC_GOOGLE_TENSOR_G2,
|
||||
SOC_GOOGLE_TENSOR_G3,
|
||||
// NVIDIA,
|
||||
SOC_TEGRA_X1,
|
||||
// ALTRA
|
||||
SOC_AMPERE_ALTRA,
|
||||
// UNKNOWN
|
||||
SOC_MODEL_UNKNOWN
|
||||
};
|
||||
|
||||
inline static VENDOR get_soc_vendor_from_soc(SOC soc) {
|
||||
if(soc >= SOC_BCM_2835 && soc <= SOC_BCM_21654) return SOC_VENDOR_BROADCOM;
|
||||
else if(soc >= SOC_HISILICON_3620 && soc <= SOC_HISILICON_3690) return SOC_VENDOR_KIRIN;
|
||||
if(soc >= SOC_BCM_2835 && soc <= SOC_BCM_2712) return SOC_VENDOR_BROADCOM;
|
||||
else if(soc >= SOC_HISILICON_3620 && soc <= SOC_HISILICON_9000S) return SOC_VENDOR_KIRIN;
|
||||
else if(soc >= SOC_KUNPENG_920 && soc <= SOC_KUNPENG_930) return SOC_VENDOR_KUNPENG;
|
||||
else if(soc >= SOC_EXYNOS_3475 && soc <= SOC_EXYNOS_880) return SOC_VENDOR_EXYNOS;
|
||||
else if(soc >= SOC_MTK_MT6893 && soc <= SOC_MTK_MT8783) return SOC_VENDOR_MEDIATEK;
|
||||
else if(soc >= SOC_SNAPD_QSD8650 && soc <= SOC_SNAPD_SM8475) return SOC_VENDOR_SNAPDRAGON;
|
||||
else if(soc >= SOC_APPLE_M1 && soc <= SOC_APPLE_M2) return SOC_VENDOR_APPLE;
|
||||
else if(soc >= SOC_SNAPD_QSD8650 && soc <= SOC_SNAPD_SM8650_AB) return SOC_VENDOR_SNAPDRAGON;
|
||||
else if(soc >= SOC_APPLE_M1 && soc <= SOC_APPLE_M3_MAX) return SOC_VENDOR_APPLE;
|
||||
else if(soc >= SOC_ALLWINNER_A10 && soc <= SOC_ALLWINNER_R328) return SOC_VENDOR_ALLWINNER;
|
||||
else if(soc >= SOC_ROCKCHIP_3288 && soc <= SOC_ROCKCHIP_3588) return SOC_VENDOR_ROCKCHIP;
|
||||
else if(soc >= SOC_GOOGLE_TENSOR && soc <= SOC_GOOGLE_TENSOR_G3) return SOC_VENDOR_GOOGLE;
|
||||
else if(soc >= SOC_TEGRA_X1 && soc <= SOC_TEGRA_X1) return SOC_VENDOR_NVIDIA;
|
||||
else if(soc >= SOC_AMPERE_ALTRA && soc <= SOC_AMPERE_ALTRA) return SOC_VENDOR_AMPERE;
|
||||
return SOC_VENDOR_UNKNOWN;
|
||||
}
|
||||
|
||||
|
||||
15
src/arm/sve.c
Normal file
15
src/arm/sve.c
Normal file
@@ -0,0 +1,15 @@
|
||||
#include <stdint.h>
|
||||
#include "../common/global.h"
|
||||
|
||||
// https://learn.arm.com/learning-paths/servers-and-cloud-computing/sve/sve_basics/#:~:text=Using%20a%20text%20editor%20of%20your%20choice%2C%20copy,svcntb%28%29%29%3B%20%7D%20This%20program%20prints%20the%20vector%20length
|
||||
uint64_t sve_cntb(void) {
|
||||
#ifdef __ARM_FEATURE_SVE
|
||||
uint64_t x0 = 0;
|
||||
__asm volatile("cntb %0"
|
||||
: "=r"(x0));
|
||||
return x0;
|
||||
#else
|
||||
printWarn("sve_cntb: Hardware supports SVE, but it was not enabled by the compiler");
|
||||
return 0;
|
||||
#endif
|
||||
}
|
||||
6
src/arm/sve.h
Normal file
6
src/arm/sve.h
Normal file
@@ -0,0 +1,6 @@
|
||||
#ifndef __SVE_DETECTION__
|
||||
#define __SVE_DETECTION__
|
||||
|
||||
uint64_t sve_cntb(void);
|
||||
|
||||
#endif
|
||||
220
src/arm/uarch.c
220
src/arm/uarch.c
@@ -10,7 +10,6 @@
|
||||
// Data not available
|
||||
#define NA -1
|
||||
|
||||
typedef uint32_t MICROARCH;
|
||||
typedef uint32_t ISA;
|
||||
|
||||
struct uarch {
|
||||
@@ -34,87 +33,10 @@ enum {
|
||||
ISA_ARMv8_3_A,
|
||||
ISA_ARMv8_4_A,
|
||||
ISA_ARMv8_5_A,
|
||||
ISA_ARMv8_6_A,
|
||||
ISA_ARMv9_A
|
||||
};
|
||||
|
||||
enum {
|
||||
UARCH_UNKNOWN,
|
||||
// ARM
|
||||
UARCH_ARM7,
|
||||
UARCH_ARM9,
|
||||
UARCH_ARM1136,
|
||||
UARCH_ARM1156,
|
||||
UARCH_ARM1176,
|
||||
UARCH_ARM11MPCORE,
|
||||
UARCH_CORTEX_A5,
|
||||
UARCH_CORTEX_A7,
|
||||
UARCH_CORTEX_A8,
|
||||
UARCH_CORTEX_A9,
|
||||
UARCH_CORTEX_A12,
|
||||
UARCH_CORTEX_A15,
|
||||
UARCH_CORTEX_A17,
|
||||
UARCH_CORTEX_A32,
|
||||
UARCH_CORTEX_A35,
|
||||
UARCH_CORTEX_A53,
|
||||
UARCH_CORTEX_A55r0, // ARM Cortex-A55 revision 0 (restricted dual-issue capabilities compared to revision 1+).
|
||||
UARCH_CORTEX_A55,
|
||||
UARCH_CORTEX_A57,
|
||||
UARCH_CORTEX_A65,
|
||||
UARCH_CORTEX_A72,
|
||||
UARCH_CORTEX_A73,
|
||||
UARCH_CORTEX_A75,
|
||||
UARCH_CORTEX_A76,
|
||||
UARCH_CORTEX_A77,
|
||||
UARCH_CORTEX_A78,
|
||||
UARCH_CORTEX_A510,
|
||||
UARCH_CORTEX_A710,
|
||||
UARCH_CORTEX_X1,
|
||||
UARCH_CORTEX_X2,
|
||||
UARCH_NEOVERSE_N1,
|
||||
UARCH_NEOVERSE_E1,
|
||||
UARCH_SCORPION,
|
||||
UARCH_KRAIT,
|
||||
UARCH_KYRO,
|
||||
UARCH_FALKOR,
|
||||
UARCH_SAPHIRA,
|
||||
UARCH_DENVER,
|
||||
UARCH_DENVER2,
|
||||
UARCH_CARMEL,
|
||||
// SAMSUNG
|
||||
UARCH_EXYNOS_M1, // Samsung Exynos M1 (Exynos 8890 big cores)
|
||||
UARCH_EXYNOS_M2, // Samsung Exynos M2 (Exynos 8895 big cores)
|
||||
UARCH_EXYNOS_M3, // Samsung Exynos M3 (Exynos 9810 big cores)
|
||||
UARCH_EXYNOS_M4, // Samsung Exynos M4 (Exynos 9820 big cores)
|
||||
UARCH_EXYNOS_M5, // Samsung Exynos M5 (Exynos 9830 big cores)
|
||||
// APPLE
|
||||
UARCH_SWIFT, // Apple A6 and A6X processors.
|
||||
UARCH_CYCLONE, // Apple A7 processor.
|
||||
UARCH_TYPHOON, // Apple A8 and A8X processor
|
||||
UARCH_TWISTER, // Apple A9 and A9X processor.
|
||||
UARCH_HURRICANE, // Apple A10 and A10X processor.
|
||||
UARCH_MONSOON, // Apple A11 processor (big cores).
|
||||
UARCH_MISTRAL, // Apple A11 processor (little cores).
|
||||
UARCH_VORTEX, // Apple A12 processor (big cores).
|
||||
UARCH_TEMPEST, // Apple A12 processor (big cores).
|
||||
UARCH_LIGHTNING, // Apple A13 processor (big cores).
|
||||
UARCH_THUNDER, // Apple A13 processor (little cores).
|
||||
UARCH_ICESTORM, // Apple M1 processor (little cores).
|
||||
UARCH_FIRESTORM, // Apple M1 processor (big cores).
|
||||
UARCH_BLIZZARD, // Apple M2 processor (little cores).
|
||||
UARCH_AVALANCHE, // Apple M2 processor (big cores).
|
||||
// CAVIUM
|
||||
UARCH_THUNDERX, // Cavium ThunderX
|
||||
UARCH_THUNDERX2, // Cavium ThunderX2 (originally Broadcom Vulkan).
|
||||
// MARVELL
|
||||
UARCH_PJ4,
|
||||
UARCH_BRAHMA_B15,
|
||||
UARCH_BRAHMA_B53,
|
||||
UARCH_XGENE, // Applied Micro X-Gene.
|
||||
UARCH_TAISHAN_V110, // HiSilicon TaiShan v110 (Huawei Kunpeng 920 series processors).
|
||||
// PHYTIUM
|
||||
UARCH_XIAOMI, // Not to be confused with Xiaomi Inc
|
||||
};
|
||||
|
||||
static const ISA isas_uarch[] = {
|
||||
[UARCH_ARM1136] = ISA_ARMv6,
|
||||
[UARCH_ARM1156] = ISA_ARMv6_T2,
|
||||
@@ -142,15 +64,20 @@ static const ISA isas_uarch[] = {
|
||||
[UARCH_CORTEX_A78] = ISA_ARMv8_2_A,
|
||||
[UARCH_CORTEX_A510] = ISA_ARMv9_A,
|
||||
[UARCH_CORTEX_A710] = ISA_ARMv9_A,
|
||||
[UARCH_CORTEX_A715] = ISA_ARMv9_A,
|
||||
[UARCH_CORTEX_X1] = ISA_ARMv8_2_A,
|
||||
[UARCH_CORTEX_X2] = ISA_ARMv9_A,
|
||||
[UARCH_CORTEX_X3] = ISA_ARMv9_A,
|
||||
[UARCH_NEOVERSE_N1] = ISA_ARMv8_2_A,
|
||||
[UARCH_NEOVERSE_E1] = ISA_ARMv8_2_A,
|
||||
[UARCH_NEOVERSE_V1] = ISA_ARMv8_4_A,
|
||||
[UARCH_BRAHMA_B15] = ISA_ARMv7_A, // Same as Cortex-A15
|
||||
[UARCH_BRAHMA_B53] = ISA_ARMv8_A, // Same as Cortex-A53
|
||||
[UARCH_THUNDERX] = ISA_ARMv8_A,
|
||||
[UARCH_THUNDERX2] = ISA_ARMv8_1_A,
|
||||
[UARCH_TAISHAN_V110] = ISA_ARMv8_2_A,
|
||||
[UARCH_TAISHAN_V120] = ISA_ARMv8_2_A, // Not confirmed
|
||||
[UARCH_TAISHAN_V200] = ISA_ARMv8_2_A, // Not confirmed
|
||||
[UARCH_DENVER] = ISA_ARMv8_A,
|
||||
[UARCH_DENVER2] = ISA_ARMv8_A,
|
||||
[UARCH_CARMEL] = ISA_ARMv8_A,
|
||||
@@ -167,8 +94,10 @@ static const ISA isas_uarch[] = {
|
||||
[UARCH_EXYNOS_M5] = ISA_ARMv8_2_A,
|
||||
[UARCH_ICESTORM] = ISA_ARMv8_5_A, // https://github.com/llvm/llvm-project/blob/main/llvm/include/llvm/Support/AArch64TargetParser.def
|
||||
[UARCH_FIRESTORM] = ISA_ARMv8_5_A,
|
||||
[UARCH_BLIZZARD] = ISA_ARMv8_5_A, // Not confirmed
|
||||
[UARCH_AVALANCHE] = ISA_ARMv8_5_A,
|
||||
[UARCH_BLIZZARD] = ISA_ARMv8_6_A, // https://github.com/llvm/llvm-project/blob/main/llvm/unittests/TargetParser/TargetParserTest.cpp
|
||||
[UARCH_AVALANCHE] = ISA_ARMv8_6_A, // https://github.com/llvm/llvm-project/blob/main/llvm/unittests/TargetParser/TargetParserTest.cpp
|
||||
[UARCH_SAWTOOTH] = ISA_ARMv8_6_A, // https://github.com/llvm/llvm-project/blob/main/llvm/unittests/TargetParser/TargetParserTest.cpp
|
||||
[UARCH_EVEREST] = ISA_ARMv8_6_A, // https://github.com/llvm/llvm-project/blob/main/llvm/unittests/TargetParser/TargetParserTest.cpp
|
||||
[UARCH_PJ4] = ISA_ARMv7_A,
|
||||
[UARCH_XIAOMI] = ISA_ARMv8_A,
|
||||
};
|
||||
@@ -186,13 +115,15 @@ static char* isas_string[] = {
|
||||
[ISA_ARMv8_3_A] = "ARMv8.3",
|
||||
[ISA_ARMv8_4_A] = "ARMv8.4",
|
||||
[ISA_ARMv8_5_A] = "ARMv8.5",
|
||||
[ISA_ARMv8_6_A] = "ARMv8.6",
|
||||
[ISA_ARMv9_A] = "ARMv9"
|
||||
};
|
||||
|
||||
#define UARCH_START if (false) {}
|
||||
#define CHECK_UARCH(arch, cpu, im_, p_, v_, r_, str, uarch, vendor) \
|
||||
else if (im_ == im && p_ == p && (v_ == NA || v_ == v) && (r_ == NA || r_ == r)) fill_uarch(arch, cpu, str, uarch, vendor);
|
||||
#define UARCH_END else { printBug("Unknown microarchitecture detected: IM=0x%.8X P=0x%.8X V=0x%.8X R=0x%.8X", im, p, v, r); fill_uarch(arch, cpu, "Unknown", UARCH_UNKNOWN, CPU_VENDOR_UNKNOWN); }
|
||||
#define UARCH_END else { printBugCheckRelease("Unknown microarchitecture detected: IM=0x%X P=0x%X V=0x%X R=0x%X", im, p, v, r); \
|
||||
fill_uarch(arch, cpu, "Unknown", UARCH_UNKNOWN, CPU_VENDOR_UNKNOWN); }
|
||||
|
||||
void fill_uarch(struct uarch* arch, struct cpuInfo* cpu, char* str, MICROARCH u, VENDOR vendor) {
|
||||
arch->uarch = u;
|
||||
@@ -208,10 +139,11 @@ void fill_uarch(struct uarch* arch, struct cpuInfo* cpu, char* str, MICROARCH u,
|
||||
|
||||
/*
|
||||
* Codes are based on pytorch/cpuinfo, more precisely:
|
||||
* - https://github.com/pytorch/cpuinfo/blob/master/src/arm/uarch.c
|
||||
* - https://github.com/pytorch/cpuinfo/blob/main/src/arm/uarch.c
|
||||
* Other sources:
|
||||
* - https://elixir.bootlin.com/linux/latest/source/arch/arm64/include/asm/cputype.h
|
||||
* - https://elixir.bootlin.com/linux/latest/source/arch/arm/include/asm/cputype.h
|
||||
* - https://github.com/AsahiLinux/m1n1/blob/main/src/chickens.c
|
||||
*/
|
||||
struct uarch* get_uarch_from_midr(uint32_t midr, struct cpuInfo* cpu) {
|
||||
struct uarch* arch = emalloc(sizeof(struct uarch));
|
||||
@@ -254,12 +186,15 @@ struct uarch* get_uarch_from_midr(uint32_t midr, struct cpuInfo* cpu) {
|
||||
CHECK_UARCH(arch, cpu, 'A', 0xD0C, NA, NA, "Neoverse N1", UARCH_NEOVERSE_N1, CPU_VENDOR_ARM)
|
||||
CHECK_UARCH(arch, cpu, 'A', 0xD0D, NA, NA, "Cortex-A77", UARCH_CORTEX_A77, CPU_VENDOR_ARM)
|
||||
CHECK_UARCH(arch, cpu, 'A', 0xD0E, NA, NA, "Cortex-A76", UARCH_CORTEX_A76, CPU_VENDOR_ARM)
|
||||
CHECK_UARCH(arch, cpu, 'A', 0xD40, NA, NA, "Neoverse V1", UARCH_NEOVERSE_V1, CPU_VENDOR_ARM)
|
||||
CHECK_UARCH(arch, cpu, 'A', 0xD41, NA, NA, "Cortex-A78", UARCH_CORTEX_A78, CPU_VENDOR_ARM)
|
||||
CHECK_UARCH(arch, cpu, 'A', 0xD44, NA, NA, "Cortex-X1", UARCH_CORTEX_X1, CPU_VENDOR_ARM)
|
||||
CHECK_UARCH(arch, cpu, 'A', 0xD46, NA, NA, "Cortex‑A510", UARCH_CORTEX_A510, CPU_VENDOR_ARM)
|
||||
CHECK_UARCH(arch, cpu, 'A', 0xD47, NA, NA, "Cortex‑A710", UARCH_CORTEX_A710, CPU_VENDOR_ARM)
|
||||
CHECK_UARCH(arch, cpu, 'A', 0xD48, NA, NA, "Cortex-X2", UARCH_CORTEX_X2, CPU_VENDOR_ARM)
|
||||
CHECK_UARCH(arch, cpu, 'A', 0xD4A, NA, NA, "Neoverse E1", UARCH_NEOVERSE_E1, CPU_VENDOR_ARM)
|
||||
CHECK_UARCH(arch, cpu, 'A', 0xD4D, NA, NA, "Cortex-A715", UARCH_CORTEX_A715, CPU_VENDOR_ARM)
|
||||
CHECK_UARCH(arch, cpu, 'A', 0xD4E, NA, NA, "Cortex-X3", UARCH_CORTEX_X3, CPU_VENDOR_ARM)
|
||||
|
||||
CHECK_UARCH(arch, cpu, 'B', 0x00F, NA, NA, "Brahma B15", UARCH_BRAHMA_B15, CPU_VENDOR_BROADCOM)
|
||||
CHECK_UARCH(arch, cpu, 'B', 0x100, NA, NA, "Brahma B53", UARCH_BRAHMA_B53, CPU_VENDOR_BROADCOM)
|
||||
@@ -271,8 +206,11 @@ struct uarch* get_uarch_from_midr(uint32_t midr, struct cpuInfo* cpu) {
|
||||
CHECK_UARCH(arch, cpu, 'C', 0x0A3, NA, NA, "ThunderX 81XX", UARCH_THUNDERX, CPU_VENDOR_CAVIUM)
|
||||
CHECK_UARCH(arch, cpu, 'C', 0x0AF, NA, NA, "ThunderX2 99XX", UARCH_THUNDERX2, CPU_VENDOR_CAVIUM)
|
||||
|
||||
CHECK_UARCH(arch, cpu, 'H', 0xD01, NA, NA, "TaiShan v110", UARCH_TAISHAN_V110, CPU_VENDOR_HUAWUEI) // Kunpeng 920 series
|
||||
CHECK_UARCH(arch, cpu, 'H', 0xD40, NA, NA, "Cortex-A76", UARCH_CORTEX_A76, CPU_VENDOR_ARM) // Kirin 980 Big/Medium cores -> Cortex-A76
|
||||
CHECK_UARCH(arch, cpu, 'H', 0xD01, NA, NA, "TaiShan v110", UARCH_TAISHAN_V110, CPU_VENDOR_HUAWEI) // Kunpeng 920 series
|
||||
CHECK_UARCH(arch, cpu, 'H', 0xD02, 2, 2, "TaiShan v120", UARCH_TAISHAN_V120, CPU_VENDOR_HUAWEI) // Kiring 9000S Big cores (https://github.com/Dr-Noob/cpufetch/issues/259)
|
||||
CHECK_UARCH(arch, cpu, 'H', 0xD02, NA, NA, "TaiShan v200", UARCH_TAISHAN_V200, CPU_VENDOR_HUAWEI) // Kunpeng 930 series (found in openeuler: https://mailweb.openeuler.org/hyperkitty/list/kernel@openeuler.org/message/XQCV7NX2UKRIUWUFKRF4PO3QENCOUFR3)
|
||||
CHECK_UARCH(arch, cpu, 'H', 0xD40, NA, NA, "Cortex-A76", UARCH_CORTEX_A76, CPU_VENDOR_ARM) // Kirin 980 Big/Medium cores -> Cortex-A76
|
||||
CHECK_UARCH(arch, cpu, 'H', 0xD42, NA, NA, "TaiShan v120", UARCH_TAISHAN_V120, CPU_VENDOR_HUAWEI) // Kiring 9000S Small Cores (https://github.com/Dr-Noob/cpufetch/issues/259)
|
||||
|
||||
CHECK_UARCH(arch, cpu, 'N', 0x000, NA, NA, "Denver", UARCH_DENVER, CPU_VENDOR_NVIDIA)
|
||||
CHECK_UARCH(arch, cpu, 'N', 0x003, NA, NA, "Denver2", UARCH_DENVER2, CPU_VENDOR_NVIDIA)
|
||||
@@ -314,8 +252,12 @@ struct uarch* get_uarch_from_midr(uint32_t midr, struct cpuInfo* cpu) {
|
||||
|
||||
CHECK_UARCH(arch, cpu, 'a', 0x022, NA, NA, "Icestorm", UARCH_ICESTORM, CPU_VENDOR_APPLE)
|
||||
CHECK_UARCH(arch, cpu, 'a', 0x023, NA, NA, "Firestorm", UARCH_FIRESTORM, CPU_VENDOR_APPLE)
|
||||
CHECK_UARCH(arch, cpu, 'a', 0x024, NA, NA, "Icestorm", UARCH_ICESTORM, CPU_VENDOR_APPLE) // https://github.com/Dr-Noob/cpufetch/issues/263
|
||||
CHECK_UARCH(arch, cpu, 'a', 0x025, NA, NA, "Firestorm", UARCH_FIRESTORM, CPU_VENDOR_APPLE) // https://github.com/Dr-Noob/cpufetch/issues/263
|
||||
CHECK_UARCH(arch, cpu, 'a', 0x030, NA, NA, "Blizzard", UARCH_BLIZZARD, CPU_VENDOR_APPLE)
|
||||
CHECK_UARCH(arch, cpu, 'a', 0x031, NA, NA, "Avalanche", UARCH_AVALANCHE, CPU_VENDOR_APPLE)
|
||||
CHECK_UARCH(arch, cpu, 'a', 0x048, NA, NA, "Sawtooth", UARCH_SAWTOOTH, CPU_VENDOR_APPLE)
|
||||
CHECK_UARCH(arch, cpu, 'a', 0x049, NA, NA, "Everest", UARCH_EVEREST, CPU_VENDOR_APPLE)
|
||||
|
||||
CHECK_UARCH(arch, cpu, 'V', 0x581, NA, NA, "PJ4", UARCH_PJ4, CPU_VENDOR_MARVELL)
|
||||
CHECK_UARCH(arch, cpu, 'V', 0x584, NA, NA, "PJ4B-MP", UARCH_PJ4, CPU_VENDOR_MARVELL)
|
||||
@@ -325,15 +267,115 @@ struct uarch* get_uarch_from_midr(uint32_t midr, struct cpuInfo* cpu) {
|
||||
return arch;
|
||||
}
|
||||
|
||||
bool is_ARMv8_or_newer(struct cpuInfo* cpu) {
|
||||
return cpu->arch->isa == ISA_ARMv8_A ||
|
||||
cpu->arch->isa == ISA_ARMv8_A_AArch32 ||
|
||||
cpu->arch->isa == ISA_ARMv8_1_A ||
|
||||
cpu->arch->isa == ISA_ARMv8_2_A ||
|
||||
cpu->arch->isa == ISA_ARMv8_3_A ||
|
||||
cpu->arch->isa == ISA_ARMv8_4_A ||
|
||||
cpu->arch->isa == ISA_ARMv8_5_A ||
|
||||
cpu->arch->isa == ISA_ARMv8_6_A ||
|
||||
cpu->arch->isa == ISA_ARMv9_A;
|
||||
}
|
||||
|
||||
bool has_fma_support(struct cpuInfo* cpu) {
|
||||
// Arm A64 Instruction Set Architecture
|
||||
// https://developer.arm.com/documentation/ddi0596/2021-12/SIMD-FP-Instructions
|
||||
return is_ARMv8_or_newer(cpu);
|
||||
}
|
||||
|
||||
int get_vpus_width(struct cpuInfo* cpu) {
|
||||
// If the CPU has NEON, width can be 64 or 128 [1].
|
||||
// In >= ARMv8, NEON are 128 bits width [2]
|
||||
// If the CPU has SVE/SVE2, width can be between 128-2048 [3],
|
||||
// so we must check the exact width depending on
|
||||
// the exact chip (Neoverse V1 uses 256b implementations.)
|
||||
//
|
||||
// [1] https://en.wikipedia.org/wiki/ARM_architecture_family#Advanced_SIMD_(Neon)
|
||||
// [2] https://developer.arm.com/documentation/102474/0100/Fundamentals-of-Armv8-Neon-technology
|
||||
// [3] https://www.anandtech.com/show/16640/arm-announces-neoverse-v1-n2-platforms-cpus-cmn700-mesh/5
|
||||
|
||||
MICROARCH ua = cpu->arch->uarch;
|
||||
switch(ua) {
|
||||
case UARCH_NEOVERSE_V1:
|
||||
return 256;
|
||||
default:
|
||||
if (cpu->feat->SVE && cpu->feat->cntb > 0) {
|
||||
return cpu->feat->cntb * 8;
|
||||
}
|
||||
else if (cpu->feat->NEON) {
|
||||
if(is_ARMv8_or_newer(cpu)) {
|
||||
return 128;
|
||||
}
|
||||
else {
|
||||
return 64;
|
||||
}
|
||||
}
|
||||
else {
|
||||
return 32;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
int get_number_of_vpus(struct cpuInfo* cpu) {
|
||||
MICROARCH ua = cpu->arch->uarch;
|
||||
|
||||
switch(ua) {
|
||||
case UARCH_EVEREST: // Just a guess, needs confirmation.
|
||||
case UARCH_FIRESTORM: // [https://dougallj.github.io/applecpu/firestorm-simd.html]
|
||||
case UARCH_AVALANCHE: // [https://en.wikipedia.org/wiki/Comparison_of_ARM_processors]
|
||||
case UARCH_CORTEX_X1: // [https://www.anandtech.com/show/15813/arm-cortex-a78-cortex-x1-cpu-ip-diverging/3]
|
||||
case UARCH_CORTEX_X2: // [https://www.anandtech.com/show/16693/arm-announces-mobile-armv9-cpu-microarchitectures-cortexx2-cortexa710-cortexa510/2]
|
||||
case UARCH_CORTEX_X3: // [https://www.hwcooling.net/en/cortex-x3-the-new-fastest-arm-core-architecture-analysis: "The FPU and SIMD unit of the core still has four pipelines"]
|
||||
case UARCH_NEOVERSE_V1: // [https://en.wikichip.org/wiki/arm_holdings/microarchitectures/neoverse_v1]
|
||||
return 4;
|
||||
case UARCH_SAWTOOTH: // Needs confirmation, rn this is the best we know: https://mastodon.social/@dougall/111118317031041336
|
||||
case UARCH_EXYNOS_M3: // [https://www.anandtech.com/show/12361/samsung-exynos-m3-architecture]
|
||||
case UARCH_EXYNOS_M4: // [https://en.wikichip.org/wiki/samsung/microarchitectures/m4#Block_Diagram]
|
||||
case UARCH_EXYNOS_M5: // [https://en.wikichip.org/wiki/samsung/microarchitectures/m5]
|
||||
return 3;
|
||||
case UARCH_ICESTORM: // [https://dougallj.github.io/applecpu/icestorm-simd.html]
|
||||
case UARCH_BLIZZARD: // [https://en.wikipedia.org/wiki/Comparison_of_ARM_processors]
|
||||
case UARCH_TAISHAN_V110:// [https://www-file.huawei.com/-/media/corp2020/pdf/publications/huawei-research/2022/huawei-research-issue1-en.pdf]: "128-bit x 2 for single precision"
|
||||
case UARCH_TAISHAN_V120:// Not confirmed, asssuming same as v110
|
||||
case UARCH_TAISHAN_V200:// Not confirmed, asssuming same as v110
|
||||
case UARCH_CORTEX_A57: // [https://www.anandtech.com/show/8718/the-samsung-galaxy-note-4-exynos-review/5]
|
||||
case UARCH_CORTEX_A72: // [https://www.anandtech.com/show/10347/arm-cortex-a73-artemis-unveiled/2]
|
||||
case UARCH_CORTEX_A73: // [https://www.anandtech.com/show/10347/arm-cortex-a73-artemis-unveiled/2]
|
||||
case UARCH_CORTEX_A75: // [https://www.anandtech.com/show/11441/dynamiq-and-arms-new-cpus-cortex-a75-a55/3]
|
||||
case UARCH_CORTEX_A76: // [https://www.anandtech.com/show/12785/arm-cortex-a76-cpu-unveiled-7nm-powerhouse/3]
|
||||
case UARCH_CORTEX_A77: // [https://fuse.wikichip.org/news/2339/arm-unveils-cortex-a77-emphasizes-single-thread-performance]
|
||||
case UARCH_CORTEX_A78: // [https://fuse.wikichip.org/news/3536/arm-unveils-the-cortex-a78-when-less-is-more]
|
||||
case UARCH_EXYNOS_M1: // [https://www.anandtech.com/show/12361/samsung-exynos-m3-architecture]
|
||||
case UARCH_EXYNOS_M2: // [https://www.anandtech.com/show/12361/samsung-exynos-m3-architecture]
|
||||
case UARCH_NEOVERSE_N1: // [https://en.wikichip.org/wiki/arm_holdings/microarchitectures/neoverse_n1#Individual_Core]
|
||||
case UARCH_CORTEX_A710: // [https://chipsandcheese.com/2023/08/11/arms-cortex-a710-winning-by-default/]: Fig in Core Overview. Table in Instruction Scheduling and Execution
|
||||
case UARCH_CORTEX_A715: // [https://www.hwcooling.net/en/arm-introduces-new-cortex-a715-core-architecture-analysis/]: "the numbers of ALU and FPU execution units themselves >
|
||||
return 2;
|
||||
case UARCH_NEOVERSE_E1: // [https://www.anandtech.com/show/13959/arm-announces-neoverse-n1-platform/5]
|
||||
// A510 is integrated as part of a Complex. Normally, each complex would incorporate two Cortex-A510 cores.
|
||||
// Each complex incorporates a single VPU with 2 ports, so for each A510 there is theoretically 1 port.
|
||||
case UARCH_CORTEX_A510: // [https://en.wikichip.org/wiki/arm_holdings/microarchitectures/cortex-a510#Vector_Processing_Unit_.28VPU.29]
|
||||
return 1;
|
||||
default:
|
||||
// ARMv6
|
||||
// ARMv7
|
||||
// Remaining UARCH_CORTEX_AXX
|
||||
// Old Snapdragon (e.g., Scorpion, Krait, etc)
|
||||
return 1;
|
||||
}
|
||||
}
|
||||
|
||||
char* get_str_uarch(struct cpuInfo* cpu) {
|
||||
return cpu->arch->uarch_str;
|
||||
}
|
||||
|
||||
MICROARCH get_uarch(struct uarch* arch) {
|
||||
return arch->uarch;
|
||||
}
|
||||
|
||||
void free_uarch_struct(struct uarch* arch) {
|
||||
free(arch->uarch_str);
|
||||
free(arch);
|
||||
}
|
||||
|
||||
bool is_cortex_x2(struct uarch* arch) {
|
||||
return arch->uarch == UARCH_CORTEX_X2;
|
||||
}
|
||||
|
||||
@@ -5,9 +5,100 @@
|
||||
|
||||
#include "midr.h"
|
||||
|
||||
enum {
|
||||
UARCH_UNKNOWN,
|
||||
// ARM
|
||||
UARCH_ARM7,
|
||||
UARCH_ARM9,
|
||||
UARCH_ARM1136,
|
||||
UARCH_ARM1156,
|
||||
UARCH_ARM1176,
|
||||
UARCH_ARM11MPCORE,
|
||||
UARCH_CORTEX_A5,
|
||||
UARCH_CORTEX_A7,
|
||||
UARCH_CORTEX_A8,
|
||||
UARCH_CORTEX_A9,
|
||||
UARCH_CORTEX_A12,
|
||||
UARCH_CORTEX_A15,
|
||||
UARCH_CORTEX_A17,
|
||||
UARCH_CORTEX_A32,
|
||||
UARCH_CORTEX_A35,
|
||||
UARCH_CORTEX_A53,
|
||||
UARCH_CORTEX_A55r0, // ARM Cortex-A55 revision 0 (restricted dual-issue capabilities compared to revision 1+).
|
||||
UARCH_CORTEX_A55,
|
||||
UARCH_CORTEX_A57,
|
||||
UARCH_CORTEX_A65,
|
||||
UARCH_CORTEX_A72,
|
||||
UARCH_CORTEX_A73,
|
||||
UARCH_CORTEX_A75,
|
||||
UARCH_CORTEX_A76,
|
||||
UARCH_CORTEX_A77,
|
||||
UARCH_CORTEX_A78,
|
||||
UARCH_CORTEX_A510,
|
||||
UARCH_CORTEX_A710,
|
||||
UARCH_CORTEX_A715,
|
||||
UARCH_CORTEX_X1,
|
||||
UARCH_CORTEX_X2,
|
||||
UARCH_CORTEX_X3,
|
||||
UARCH_NEOVERSE_N1,
|
||||
UARCH_NEOVERSE_E1,
|
||||
UARCH_NEOVERSE_V1,
|
||||
UARCH_SCORPION,
|
||||
UARCH_KRAIT,
|
||||
UARCH_KYRO,
|
||||
UARCH_FALKOR,
|
||||
UARCH_SAPHIRA,
|
||||
UARCH_DENVER,
|
||||
UARCH_DENVER2,
|
||||
UARCH_CARMEL,
|
||||
// SAMSUNG
|
||||
UARCH_EXYNOS_M1, // Samsung Exynos M1 (Exynos 8890 big cores)
|
||||
UARCH_EXYNOS_M2, // Samsung Exynos M2 (Exynos 8895 big cores)
|
||||
UARCH_EXYNOS_M3, // Samsung Exynos M3 (Exynos 9810 big cores)
|
||||
UARCH_EXYNOS_M4, // Samsung Exynos M4 (Exynos 9820 big cores)
|
||||
UARCH_EXYNOS_M5, // Samsung Exynos M5 (Exynos 9830 big cores)
|
||||
// APPLE
|
||||
UARCH_SWIFT, // Apple A6 and A6X processors.
|
||||
UARCH_CYCLONE, // Apple A7 processor.
|
||||
UARCH_TYPHOON, // Apple A8 and A8X processor
|
||||
UARCH_TWISTER, // Apple A9 and A9X processor.
|
||||
UARCH_HURRICANE, // Apple A10 and A10X processor.
|
||||
UARCH_MONSOON, // Apple A11 processor (big cores).
|
||||
UARCH_MISTRAL, // Apple A11 processor (little cores).
|
||||
UARCH_VORTEX, // Apple A12 processor (big cores).
|
||||
UARCH_TEMPEST, // Apple A12 processor (big cores).
|
||||
UARCH_LIGHTNING, // Apple A13 processor (big cores).
|
||||
UARCH_THUNDER, // Apple A13 processor (little cores).
|
||||
UARCH_ICESTORM, // Apple M1 processor (little cores).
|
||||
UARCH_FIRESTORM, // Apple M1 processor (big cores).
|
||||
UARCH_BLIZZARD, // Apple M2 processor (little cores).
|
||||
UARCH_AVALANCHE, // Apple M2 processor (big cores).
|
||||
UARCH_SAWTOOTH, // Apple M3 processor (little cores).
|
||||
UARCH_EVEREST, // Apple M3 processor (big cores).
|
||||
// CAVIUM
|
||||
UARCH_THUNDERX, // Cavium ThunderX
|
||||
UARCH_THUNDERX2, // Cavium ThunderX2 (originally Broadcom Vulkan).
|
||||
// MARVELL
|
||||
UARCH_PJ4,
|
||||
UARCH_BRAHMA_B15,
|
||||
UARCH_BRAHMA_B53,
|
||||
UARCH_XGENE, // Applied Micro X-Gene.
|
||||
// HUAWEI
|
||||
UARCH_TAISHAN_V110, // HiSilicon TaiShan v110
|
||||
UARCH_TAISHAN_V120, // HiSilicon TaiShan v120
|
||||
UARCH_TAISHAN_V200, // HiSilicon TaiShan v200
|
||||
// PHYTIUM
|
||||
UARCH_XIAOMI, // Not to be confused with Xiaomi Inc
|
||||
};
|
||||
|
||||
typedef uint32_t MICROARCH;
|
||||
|
||||
struct uarch* get_uarch_from_midr(uint32_t midr, struct cpuInfo* cpu);
|
||||
int get_number_of_vpus(struct cpuInfo* cpu);
|
||||
int get_vpus_width(struct cpuInfo* cpu);
|
||||
bool has_fma_support(struct cpuInfo* cpu);
|
||||
char* get_str_uarch(struct cpuInfo* cpu);
|
||||
void free_uarch_struct(struct uarch* arch);
|
||||
bool is_cortex_x2(struct uarch* arch);
|
||||
MICROARCH get_uarch(struct uarch* arch);
|
||||
|
||||
#endif
|
||||
|
||||
@@ -3,8 +3,6 @@
|
||||
#include "midr.h"
|
||||
|
||||
#define _PATH_DEVICETREE_MODEL "/sys/firmware/devicetree/base/model"
|
||||
#define _PATH_CPUINFO "/proc/cpuinfo"
|
||||
//#define _PATH_CPUINFO "cpuinfo_debug"
|
||||
|
||||
#define CPUINFO_CPU_IMPLEMENTER_STR "CPU implementer\t: "
|
||||
#define CPUINFO_CPU_ARCHITECTURE_STR "CPU architecture: "
|
||||
@@ -108,36 +106,15 @@ uint32_t get_midr_from_cpuinfo(uint32_t core, bool* success) {
|
||||
return midr;
|
||||
}
|
||||
|
||||
char* get_field_from_cpuinfo(char* CPUINFO_FIELD) {
|
||||
int filelen;
|
||||
char* buf;
|
||||
if((buf = read_file(_PATH_CPUINFO, &filelen)) == NULL) {
|
||||
printWarn("read_file: %s: %s:\n", _PATH_CPUINFO, strerror(errno));
|
||||
return NULL;
|
||||
}
|
||||
|
||||
char* tmp1 = strstr(buf, CPUINFO_FIELD);
|
||||
if(tmp1 == NULL) return NULL;
|
||||
tmp1 = tmp1 + strlen(CPUINFO_FIELD);
|
||||
char* tmp2 = strstr(tmp1, "\n");
|
||||
|
||||
int strlen = (1 + (tmp2-tmp1));
|
||||
char* hardware = emalloc(sizeof(char) * strlen);
|
||||
memset(hardware, 0, sizeof(char) * strlen);
|
||||
strncpy(hardware, tmp1, tmp2-tmp1);
|
||||
|
||||
return hardware;
|
||||
}
|
||||
|
||||
char* get_hardware_from_cpuinfo() {
|
||||
char* get_hardware_from_cpuinfo(void) {
|
||||
return get_field_from_cpuinfo(CPUINFO_HARDWARE_STR);
|
||||
}
|
||||
|
||||
char* get_revision_from_cpuinfo() {
|
||||
char* get_revision_from_cpuinfo(void) {
|
||||
return get_field_from_cpuinfo(CPUINFO_REVISION_STR);
|
||||
}
|
||||
|
||||
bool is_raspberry_pi() {
|
||||
bool is_raspberry_pi(void) {
|
||||
int filelen;
|
||||
char* buf;
|
||||
if((buf = read_file(_PATH_DEVICETREE_MODEL, &filelen)) == NULL) {
|
||||
|
||||
@@ -3,12 +3,16 @@
|
||||
|
||||
#include "../common/udev.h"
|
||||
|
||||
#define _PATH_SUNXI_NVMEM "/sys/bus/nvmem/devices/sunxi-sid0/nvmem"
|
||||
#define _PATH_RK_EFUSE0 "/sys/bus/nvmem/devices/rockchip-efuse0/nvmem"
|
||||
#define _PATH_RK_OTP0 "/sys/bus/nvmem/devices/rockchip-otp0/nvmem"
|
||||
|
||||
#define UNKNOWN -1
|
||||
int get_ncores_from_cpuinfo();
|
||||
int get_ncores_from_cpuinfo(void);
|
||||
uint32_t get_midr_from_cpuinfo(uint32_t core, bool* success);
|
||||
char* get_hardware_from_cpuinfo();
|
||||
char* get_revision_from_cpuinfo();
|
||||
bool is_raspberry_pi();
|
||||
char* get_hardware_from_cpuinfo(void);
|
||||
char* get_revision_from_cpuinfo(void);
|
||||
bool is_raspberry_pi(void);
|
||||
|
||||
#endif
|
||||
|
||||
|
||||
@@ -12,6 +12,8 @@
|
||||
#define COLOR_STR_AMD "amd"
|
||||
#define COLOR_STR_IBM "ibm"
|
||||
#define COLOR_STR_ARM "arm"
|
||||
#define COLOR_STR_ROCKCHIP "rockchip"
|
||||
#define COLOR_STR_SIFIVE "sifive"
|
||||
|
||||
static const char *SYTLES_STR_LIST[] = {
|
||||
[STYLE_EMPTY] = NULL,
|
||||
@@ -26,6 +28,7 @@ struct args_struct {
|
||||
bool help_flag;
|
||||
bool raw_flag;
|
||||
bool accurate_pp;
|
||||
bool measure_max_frequency_flag;
|
||||
bool full_cpu_name_flag;
|
||||
bool logo_long;
|
||||
bool logo_short;
|
||||
@@ -38,92 +41,98 @@ struct args_struct {
|
||||
};
|
||||
|
||||
const char args_chr[] = {
|
||||
/* [ARG_STYLE] = */ 's',
|
||||
/* [ARG_COLOR] = */ 'c',
|
||||
/* [ARG_HELP] = */ 'h',
|
||||
/* [ARG_RAW] = */ 'r',
|
||||
/* [ARG_FULLCPUNAME] = */ 'F',
|
||||
/* [ARG_LOGO_LONG] = */ 1,
|
||||
/* [ARG_LOGO_SHORT] = */ 2,
|
||||
/* [ARG_LOGO_INTEL_NEW] = */ 3,
|
||||
/* [ARG_LOGO_INTEL_OLD] = */ 4,
|
||||
/* [ARG_ACCURATE_PP] = */ 5,
|
||||
/* [ARG_DEBUG] = */ 'd',
|
||||
/* [ARG_VERBOSE] = */ 'v',
|
||||
/* [ARG_VERSION] = */ 'V',
|
||||
/* [ARG_STYLE] = */ 's',
|
||||
/* [ARG_COLOR] = */ 'c',
|
||||
/* [ARG_HELP] = */ 'h',
|
||||
/* [ARG_RAW] = */ 'r',
|
||||
/* [ARG_FULLCPUNAME] = */ 'F',
|
||||
/* [ARG_LOGO_LONG] = */ 1,
|
||||
/* [ARG_LOGO_SHORT] = */ 2,
|
||||
/* [ARG_LOGO_INTEL_NEW] = */ 3,
|
||||
/* [ARG_LOGO_INTEL_OLD] = */ 4,
|
||||
/* [ARG_ACCURATE_PP] = */ 5,
|
||||
/* [ARG_MEASURE_MAX_FREQ] = */ 6,
|
||||
/* [ARG_DEBUG] = */ 'd',
|
||||
/* [ARG_VERBOSE] = */ 'v',
|
||||
/* [ARG_VERSION] = */ 'V',
|
||||
};
|
||||
|
||||
const char *args_str[] = {
|
||||
/* [ARG_STYLE] = */ "style",
|
||||
/* [ARG_COLOR] = */ "color",
|
||||
/* [ARG_HELP] = */ "help",
|
||||
/* [ARG_RAW] = */ "raw",
|
||||
/* [ARG_FULLCPUNAME] = */ "full-cpu-name",
|
||||
/* [ARG_LOGO_LONG] = */ "logo-long",
|
||||
/* [ARG_LOGO_SHORT] = */ "logo-short",
|
||||
/* [ARG_LOGO_INTEL_NEW] = */ "logo-intel-new",
|
||||
/* [ARG_LOGO_INTEL_OLD] = */ "logo-intel-old",
|
||||
/* [ARG_ACCURATE_PP] = */ "accurate-pp",
|
||||
/* [ARG_DEBUG] = */ "debug",
|
||||
/* [ARG_VERBOSE] = */ "verbose",
|
||||
/* [ARG_VERSION] = */ "version",
|
||||
/* [ARG_STYLE] = */ "style",
|
||||
/* [ARG_COLOR] = */ "color",
|
||||
/* [ARG_HELP] = */ "help",
|
||||
/* [ARG_RAW] = */ "raw",
|
||||
/* [ARG_FULLCPUNAME] = */ "full-cpu-name",
|
||||
/* [ARG_LOGO_LONG] = */ "logo-long",
|
||||
/* [ARG_LOGO_SHORT] = */ "logo-short",
|
||||
/* [ARG_LOGO_INTEL_NEW] = */ "logo-intel-new",
|
||||
/* [ARG_LOGO_INTEL_OLD] = */ "logo-intel-old",
|
||||
/* [ARG_ACCURATE_PP] = */ "accurate-pp",
|
||||
/* [ARG_MEASURE_MAX_FREQ] = */ "measure-max-freq",
|
||||
/* [ARG_DEBUG] = */ "debug",
|
||||
/* [ARG_VERBOSE] = */ "verbose",
|
||||
/* [ARG_VERSION] = */ "version",
|
||||
};
|
||||
|
||||
static struct args_struct args;
|
||||
|
||||
STYLE get_style() {
|
||||
STYLE get_style(void) {
|
||||
return args.style;
|
||||
}
|
||||
|
||||
struct color** get_colors() {
|
||||
struct color** get_colors(void) {
|
||||
return args.colors;
|
||||
}
|
||||
|
||||
bool show_help() {
|
||||
bool show_help(void) {
|
||||
return args.help_flag;
|
||||
}
|
||||
|
||||
bool show_version() {
|
||||
bool show_version(void) {
|
||||
return args.version_flag;
|
||||
}
|
||||
|
||||
bool show_debug() {
|
||||
bool show_debug(void) {
|
||||
return args.debug_flag;
|
||||
}
|
||||
|
||||
bool show_raw() {
|
||||
bool show_raw(void) {
|
||||
return args.raw_flag;
|
||||
}
|
||||
|
||||
bool accurate_pp() {
|
||||
bool accurate_pp(void) {
|
||||
return args.accurate_pp;
|
||||
}
|
||||
|
||||
bool show_full_cpu_name() {
|
||||
bool measure_max_frequency_flag(void) {
|
||||
return args.measure_max_frequency_flag;
|
||||
}
|
||||
|
||||
bool show_full_cpu_name(void) {
|
||||
return args.full_cpu_name_flag;
|
||||
}
|
||||
|
||||
bool show_logo_long() {
|
||||
bool show_logo_long(void) {
|
||||
return args.logo_long;
|
||||
}
|
||||
|
||||
bool show_logo_short() {
|
||||
bool show_logo_short(void) {
|
||||
return args.logo_short;
|
||||
}
|
||||
|
||||
bool show_logo_intel_new() {
|
||||
bool show_logo_intel_new(void) {
|
||||
return args.logo_intel_new;
|
||||
}
|
||||
|
||||
bool show_logo_intel_old() {
|
||||
bool show_logo_intel_old(void) {
|
||||
return args.logo_intel_old;
|
||||
}
|
||||
|
||||
bool verbose_enabled() {
|
||||
bool verbose_enabled(void) {
|
||||
return args.verbose_flag;
|
||||
}
|
||||
|
||||
int max_arg_str_length() {
|
||||
int max_arg_str_length(void) {
|
||||
int max_len = -1;
|
||||
int len = sizeof(args_str) / sizeof(args_str[0]);
|
||||
for(int i=0; i < len; i++) {
|
||||
@@ -168,6 +177,8 @@ bool parse_color(char* optarg_str, struct color*** cs) {
|
||||
else if(strcmp(optarg_str, COLOR_STR_AMD) == 0) color_to_copy = COLOR_DEFAULT_AMD;
|
||||
else if(strcmp(optarg_str, COLOR_STR_IBM) == 0) color_to_copy = COLOR_DEFAULT_IBM;
|
||||
else if(strcmp(optarg_str, COLOR_STR_ARM) == 0) color_to_copy = COLOR_DEFAULT_ARM;
|
||||
else if(strcmp(optarg_str, COLOR_STR_ROCKCHIP) == 0) color_to_copy = COLOR_DEFAULT_ROCKCHIP;
|
||||
else if(strcmp(optarg_str, COLOR_STR_SIFIVE) == 0) color_to_copy = COLOR_DEFAULT_SIFIVE;
|
||||
else {
|
||||
str_to_parse = optarg_str;
|
||||
free_ptr = false;
|
||||
@@ -211,19 +222,27 @@ bool parse_color(char* optarg_str, struct color*** cs) {
|
||||
return true;
|
||||
}
|
||||
|
||||
char* build_short_options() {
|
||||
char* build_short_options(void) {
|
||||
const char *c = args_chr;
|
||||
int len = sizeof(args_chr) / sizeof(args_chr[0]);
|
||||
char* str = (char *) emalloc(sizeof(char) * (len*2 + 1));
|
||||
memset(str, 0, sizeof(char) * (len*2 + 1));
|
||||
|
||||
#ifdef ARCH_X86
|
||||
sprintf(str, "%c:%c:%c%c%c%c%c%c%c%c%c%c%c",
|
||||
sprintf(str, "%c:%c:%c%c%c%c%c%c%c%c%c%c%c%c",
|
||||
c[ARG_STYLE], c[ARG_COLOR], c[ARG_HELP],
|
||||
c[ARG_RAW], c[ARG_FULLCPUNAME],
|
||||
c[ARG_LOGO_SHORT], c[ARG_LOGO_LONG],
|
||||
c[ARG_LOGO_INTEL_NEW], c[ARG_LOGO_INTEL_OLD],
|
||||
c[ARG_ACCURATE_PP], c[ARG_DEBUG], c[ARG_VERBOSE],
|
||||
c[ARG_ACCURATE_PP], c[ARG_MEASURE_MAX_FREQ],
|
||||
c[ARG_DEBUG], c[ARG_VERBOSE],
|
||||
c[ARG_VERSION]);
|
||||
#elif ARCH_ARM
|
||||
sprintf(str, "%c:%c:%c%c%c%c%c%c%c",
|
||||
c[ARG_STYLE], c[ARG_COLOR], c[ARG_HELP],
|
||||
c[ARG_LOGO_SHORT], c[ARG_LOGO_LONG],
|
||||
c[ARG_MEASURE_MAX_FREQ],
|
||||
c[ARG_DEBUG], c[ARG_VERBOSE],
|
||||
c[ARG_VERSION]);
|
||||
#else
|
||||
sprintf(str, "%c:%c:%c%c%c%c%c%c",
|
||||
@@ -259,21 +278,24 @@ bool parse_args(int argc, char* argv[]) {
|
||||
set_log_level(true);
|
||||
|
||||
const struct option long_options[] = {
|
||||
{args_str[ARG_STYLE], required_argument, 0, args_chr[ARG_STYLE] },
|
||||
{args_str[ARG_COLOR], required_argument, 0, args_chr[ARG_COLOR] },
|
||||
{args_str[ARG_HELP], no_argument, 0, args_chr[ARG_HELP] },
|
||||
{args_str[ARG_STYLE], required_argument, 0, args_chr[ARG_STYLE] },
|
||||
{args_str[ARG_COLOR], required_argument, 0, args_chr[ARG_COLOR] },
|
||||
{args_str[ARG_HELP], no_argument, 0, args_chr[ARG_HELP] },
|
||||
#ifdef ARCH_X86
|
||||
{args_str[ARG_LOGO_INTEL_NEW], no_argument, 0, args_chr[ARG_LOGO_INTEL_NEW] },
|
||||
{args_str[ARG_LOGO_INTEL_OLD], no_argument, 0, args_chr[ARG_LOGO_INTEL_OLD] },
|
||||
{args_str[ARG_ACCURATE_PP], no_argument, 0, args_chr[ARG_ACCURATE_PP] },
|
||||
{args_str[ARG_FULLCPUNAME], no_argument, 0, args_chr[ARG_FULLCPUNAME] },
|
||||
{args_str[ARG_RAW], no_argument, 0, args_chr[ARG_RAW] },
|
||||
{args_str[ARG_LOGO_INTEL_NEW], no_argument, 0, args_chr[ARG_LOGO_INTEL_NEW] },
|
||||
{args_str[ARG_LOGO_INTEL_OLD], no_argument, 0, args_chr[ARG_LOGO_INTEL_OLD] },
|
||||
{args_str[ARG_ACCURATE_PP], no_argument, 0, args_chr[ARG_ACCURATE_PP] },
|
||||
{args_str[ARG_MEASURE_MAX_FREQ], no_argument, 0, args_chr[ARG_MEASURE_MAX_FREQ] },
|
||||
{args_str[ARG_FULLCPUNAME], no_argument, 0, args_chr[ARG_FULLCPUNAME] },
|
||||
{args_str[ARG_RAW], no_argument, 0, args_chr[ARG_RAW] },
|
||||
#elif ARCH_ARM
|
||||
{args_str[ARG_MEASURE_MAX_FREQ], no_argument, 0, args_chr[ARG_MEASURE_MAX_FREQ] },
|
||||
#endif
|
||||
{args_str[ARG_LOGO_SHORT], no_argument, 0, args_chr[ARG_LOGO_SHORT] },
|
||||
{args_str[ARG_LOGO_LONG], no_argument, 0, args_chr[ARG_LOGO_LONG] },
|
||||
{args_str[ARG_DEBUG], no_argument, 0, args_chr[ARG_DEBUG] },
|
||||
{args_str[ARG_VERBOSE], no_argument, 0, args_chr[ARG_VERBOSE] },
|
||||
{args_str[ARG_VERSION], no_argument, 0, args_chr[ARG_VERSION] },
|
||||
{args_str[ARG_LOGO_SHORT], no_argument, 0, args_chr[ARG_LOGO_SHORT] },
|
||||
{args_str[ARG_LOGO_LONG], no_argument, 0, args_chr[ARG_LOGO_LONG] },
|
||||
{args_str[ARG_DEBUG], no_argument, 0, args_chr[ARG_DEBUG] },
|
||||
{args_str[ARG_VERBOSE], no_argument, 0, args_chr[ARG_VERBOSE] },
|
||||
{args_str[ARG_VERSION], no_argument, 0, args_chr[ARG_VERSION] },
|
||||
{0, 0, 0, 0}
|
||||
};
|
||||
|
||||
@@ -309,6 +331,9 @@ bool parse_args(int argc, char* argv[]) {
|
||||
else if(opt == args_chr[ARG_ACCURATE_PP]) {
|
||||
args.accurate_pp = true;
|
||||
}
|
||||
else if(opt == args_chr[ARG_MEASURE_MAX_FREQ]) {
|
||||
args.measure_max_frequency_flag = true;
|
||||
}
|
||||
else if(opt == args_chr[ARG_FULLCPUNAME]) {
|
||||
args.full_cpu_name_flag = true;
|
||||
}
|
||||
|
||||
@@ -29,6 +29,7 @@ enum {
|
||||
ARG_LOGO_INTEL_NEW,
|
||||
ARG_LOGO_INTEL_OLD,
|
||||
ARG_ACCURATE_PP,
|
||||
ARG_MEASURE_MAX_FREQ,
|
||||
ARG_DEBUG,
|
||||
ARG_VERBOSE,
|
||||
ARG_VERSION
|
||||
@@ -39,21 +40,22 @@ extern const char *args_str[];
|
||||
|
||||
#include "printer.h"
|
||||
|
||||
int max_arg_str_length();
|
||||
int max_arg_str_length(void);
|
||||
bool parse_args(int argc, char* argv[]);
|
||||
bool show_help();
|
||||
bool accurate_pp();
|
||||
bool show_full_cpu_name();
|
||||
bool show_logo_long();
|
||||
bool show_logo_short();
|
||||
bool show_logo_intel_new();
|
||||
bool show_logo_intel_old();
|
||||
bool show_raw();
|
||||
bool show_debug();
|
||||
bool show_version();
|
||||
bool verbose_enabled();
|
||||
bool show_help(void);
|
||||
bool accurate_pp(void);
|
||||
bool measure_max_frequency_flag(void);
|
||||
bool show_full_cpu_name(void);
|
||||
bool show_logo_long(void);
|
||||
bool show_logo_short(void);
|
||||
bool show_logo_intel_new(void);
|
||||
bool show_logo_intel_old(void);
|
||||
bool show_raw(void);
|
||||
bool show_debug(void);
|
||||
bool show_version(void);
|
||||
bool verbose_enabled(void);
|
||||
void free_colors_struct(struct color** cs);
|
||||
struct color** get_colors();
|
||||
STYLE get_style();
|
||||
struct color** get_colors(void);
|
||||
STYLE get_style(void);
|
||||
|
||||
#endif
|
||||
|
||||
@@ -33,7 +33,7 @@ struct ascii_logo {
|
||||
uint32_t width;
|
||||
uint32_t height;
|
||||
bool replace_blocks;
|
||||
char color_ascii[3][100];
|
||||
char color_ascii[4][100];
|
||||
char color_text[2][100];
|
||||
};
|
||||
|
||||
@@ -105,6 +105,19 @@ $C1 MMM :MMM NMM dMMK dMMX MMN \
|
||||
$C1 MMM :MMM NMM dMMMoo OMM0....:Nx. MMN \
|
||||
$C1 MMM :WWW XWW lONMM 'xXMMMMNOc MMN "
|
||||
|
||||
#define ASCII_HYGON \
|
||||
"$C1 \
|
||||
$C1 \
|
||||
$C1 \
|
||||
$C1 ## ## ## ## ###### ###### ## # \
|
||||
$C1 ##....## ## ## ## ## ## #### # \
|
||||
$C1 ######## ## ## ##. ## ## # #### \
|
||||
$C1 ## ## ## *######. ###### # ## \
|
||||
$C1 \
|
||||
$C1 \
|
||||
$C1 \
|
||||
$C1 "
|
||||
|
||||
#define ASCII_SNAPD \
|
||||
" $C1@@$C2######## \
|
||||
$C1@@@@@$C2########### \
|
||||
@@ -145,6 +158,25 @@ $C2 Exynos \
|
||||
$C2 \
|
||||
$C2 "
|
||||
|
||||
#define ASCII_KUNPENG \
|
||||
"$C2 . \
|
||||
$C2 .. \
|
||||
$C2 .## \
|
||||
$C1 .$CR $C2.###. \
|
||||
$C1 ..$CR $C2#####. \
|
||||
$C1 .#.$CR $C2.#######. \
|
||||
$C1 .####.$CR $C2.#######. \
|
||||
$C1 ..######*$CR $C2.#######. . \
|
||||
$C1 .#########*$CR $C2.#######* . \
|
||||
$C1 ######*$CR $C2.#######. .#. \
|
||||
$C1*#######*$CR $C2.#######. *##. \
|
||||
$C1 ##*$CR $C2.#######. ####### \
|
||||
$C2 ###.$CR $C1#####$C2 *### \
|
||||
$C1 *########## \
|
||||
$C1 *######## \
|
||||
$C1 #####. \
|
||||
$C1 *###. "
|
||||
|
||||
#define ASCII_KIRIN \
|
||||
"$C1 ####### \
|
||||
$C1 ##### #################### \
|
||||
@@ -218,6 +250,23 @@ $C1 kMMMMMMMMMMMMMMMMMMMMMMd \
|
||||
$C1 'KMMMMMMMWXXWMMMMMMMk. \
|
||||
$C1 \"cooc\"* \"*coo'\" "
|
||||
|
||||
#define ASCII_GOOGLE \
|
||||
"$C1 aaaaaaaa \
|
||||
$C1 .MMMMMMMMMMMMMMMM. \
|
||||
$C1 .MMMMMMMMMMMMMMMMMMMMM* \
|
||||
$C1 .MMMMMMMM** *MM* \
|
||||
$C2 MM$C1MMMMM. \
|
||||
$C2 *MMM$C1MM. \
|
||||
$C2*MMMMMM $C4lMMMMMMMMMMMMMMM* \
|
||||
$C2MMMMMMM $C4lMMMMMMMMMMMMMMMM \
|
||||
$C2*MMMMMM $C4lMMMMMMMMMMMMMMMd \
|
||||
$C2 MMMM$C3MMM. $C4*MMMMM. \
|
||||
$C2 MM$C3MMMMMM. $C4.MMMMMM. \
|
||||
$C3 *MMMMMMMMM*.......MMM$C4MMMMMM* \
|
||||
$C3 *MMMMMMMMMMMMMMMMMMMM$C4MM* \
|
||||
$C3 *MMMMMMMMMMMMMM* \
|
||||
$C3 ****** "
|
||||
|
||||
#define ASCII_ALLWINNER \
|
||||
"$C1 \
|
||||
$C1 ################# \
|
||||
@@ -236,6 +285,134 @@ $C1 ##### ##. \
|
||||
$C1 ###########. \
|
||||
$C1 "
|
||||
|
||||
#define ASCII_ROCKCHIP \
|
||||
"$C1 \
|
||||
$C1 $C2## \
|
||||
$C1 ###### ## ## \
|
||||
$C1 ##. ### ##### ##### ## .## ##### ######. ## ##### \
|
||||
$C1 #######. ##. # #. ##### ##. ### ### # .## \
|
||||
$C1##. ###. ####. #### ### .## #### ### ### #.##### \
|
||||
$C1 ## \
|
||||
$C1 "
|
||||
|
||||
#define ASCII_RISCV \
|
||||
"$C1 \
|
||||
$C1 ************ \
|
||||
$C1 %%%%%%%%% *********** \
|
||||
$C1 %%%%%%%%%% ********** \
|
||||
$C1 %%%%%%%%% ********* \
|
||||
$C1 % ******** \
|
||||
$C1 %% .********* % \
|
||||
$C1 %%%% ******* %%% \
|
||||
$C1 %%%%%%. **** %%%%% \
|
||||
$C1 %%%%%%%%. %%%%%%% \
|
||||
$C1 \
|
||||
$C1 \
|
||||
$C1 ########### ## .######### ######### .## ## \
|
||||
$C1 ## ## ## ## ## ### ### \
|
||||
$C1 ########### ## ##########. ## #### .## ## \
|
||||
$C1 ## ### ## ##. ## ### ### \
|
||||
$C1 ## ### ## ##########. ########## ### \
|
||||
$C1 "
|
||||
|
||||
#define ASCII_SIFIVE \
|
||||
"$C1 ############################################## \
|
||||
$C1 ###########@@@@@@@@@@@@@@@@@@@@@@@@########### \
|
||||
$C1 #########@@@@@@@@@@@@@@@@@@@@@@@@@@@@######### \
|
||||
$C1 ########@@@@######################@@@@######## \
|
||||
$C1 #######@@@@########################@@@@####### \
|
||||
$C1 ######@@@@##########################@@@@###### \
|
||||
$C1 #####@@@@#######@@@@@@@@@@@@@@@@@@@@@@@@@##### \
|
||||
$C1 ####@@@@#######@@@@@@@@@@@@@@@@@@@@@@@@@@@#### \
|
||||
$C1 ###@@@@################################@@@@### \
|
||||
$C1 ##@@@@##################################@@@@## \
|
||||
$C1 #@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@#########@@@@# \
|
||||
$C1 #@@@@@@@@@@@@@@@@@@@@@@@@@@@@@###########@@@@# \
|
||||
$C1 ##@@@@@@############@@@@@@############@@@@@@## \
|
||||
$C1 ######@@@@@###########@@###########@@@@@###### \
|
||||
$C1 #########@@@@@@################@@@@@@######### \
|
||||
$C1 #############@@@@@##########@@@@@############# \
|
||||
$C1 ################@@@@@@##@@@@@@################ \
|
||||
$C1 ####################@@@@@@#################### \
|
||||
$C1 ############################################## "
|
||||
|
||||
#define ASCII_STARFIVE \
|
||||
"$C1 # \
|
||||
$C1 ########## \
|
||||
$C1 ######## ######## \
|
||||
$C1 ######## #### \
|
||||
$C1 ####### #### \
|
||||
$C1 #### ####### \
|
||||
$C1 #### ##### ####### \
|
||||
$C1 ####### ######## .## \
|
||||
$C1 ######## ######## \
|
||||
$C1 ### ########. ####### \
|
||||
$C1 ####### ##### #### \
|
||||
$C1 ######## #. #### \
|
||||
$C1 # #### ####### \
|
||||
$C1 ##### ####### \
|
||||
$C1 ######## ######## \
|
||||
$C1 ######### \
|
||||
$C1 # "
|
||||
|
||||
#define ASCII_SIPEED \
|
||||
"$C1 #################################### \
|
||||
$C1######@@################################ \
|
||||
$C1####@@##@@####@@@@@@@@@@@@@@@@########## \
|
||||
$C1######@@####@@@@@@@@@@@@@@@@@@########## \
|
||||
$C1#########@@@@########################### \
|
||||
$C1#######@@@@@@########################### \
|
||||
$C1#########@@@@########################### \
|
||||
$C1###########@@@@@@@@@@@@@@@############## \
|
||||
$C1##############@@@@@@@@@@@@@@@########### \
|
||||
$C1###########################@@@@@######## \
|
||||
$C1###########################@@@@@@####### \
|
||||
$C1###########################@@@@@######## \
|
||||
$C1##########@@@@@@@@@@@@@@@@@@@########### \
|
||||
$C1##########@@@@@@@@@@@@@@@@############## \
|
||||
$C1######################################## \
|
||||
$C1 #################################### "
|
||||
|
||||
#define ASCII_NVIDIA \
|
||||
"$C1 'cccccccccccccccccccccccccc \
|
||||
$C1 ;oooooooooooooooooooooooool \
|
||||
$C1 .:::. .oooooooooooooooooool \
|
||||
$C1 .:cll; ,c:::. cooooooooooooool \
|
||||
$C1 ,clo' ;. oolc: ooooooooooool \
|
||||
$C1.cloo ;cclo . .olc. coooooooool \
|
||||
$C1oooo :lo, ;ll; looc :oooooooool \
|
||||
$C1 oooc ool. ;oooc;clol :looooooooool \
|
||||
$C1 :ooc ,ol; ;oooooo. .cloo; loool \
|
||||
$C1 ool; .olc. ,:lool .lool \
|
||||
$C1 ool:. ,::::ccloo. :clooool \
|
||||
$C1 oolc::. ':cclooooooool \
|
||||
$C1 ;oooooooooooooooooooooooool \
|
||||
$C1 \
|
||||
$C1 \
|
||||
$C2######. ## ## ## ###### ## ### \
|
||||
$C2## ## ## ## ## ## ## ## #: :# \
|
||||
$C2## ## ## ## ## ## ## ## ####### \
|
||||
$C2## ## ### ## ###### ## ## ## "
|
||||
|
||||
#define ASCII_AMPERE \
|
||||
"$C1 \
|
||||
$C1 \
|
||||
$C1 ## \
|
||||
$C1 #### \
|
||||
$C1 ### ## \
|
||||
$C1 ### ### \
|
||||
$C1 ### ### \
|
||||
$C1 ### ### \
|
||||
$C1 ## ### \
|
||||
$C1 ####### ### ### \
|
||||
$C1 ###### ## ###### ### \
|
||||
$C1 #### ### ######## \
|
||||
$C1 #### ### #### \
|
||||
$C1 ### ### #### \
|
||||
$C1 ## ### ### \
|
||||
$C1 \
|
||||
$C1 "
|
||||
|
||||
// --------------------- LONG LOGOS ------------------------- //
|
||||
#define ASCII_AMD_L \
|
||||
"$C1 \
|
||||
@@ -320,30 +497,108 @@ $C1 ############ ################## ######### #### ######### \
|
||||
$C1 \
|
||||
$C1 ############ ################ ######### ## ######### "
|
||||
|
||||
#define ASCII_SIFIVE_L \
|
||||
"$C1 ################################################### \
|
||||
$C1 ###########@@@@@@@@@@@@@@@@@@@@@@@@@@@@############ \
|
||||
$C1 ##########@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@########### \
|
||||
$C1 #########@@@@@#######################@@@@########## \
|
||||
$C1 ########@@@@@#########################@@@@######### \
|
||||
$C1 #######@@@@@###########################@@@@######## \
|
||||
$C1 ######@@@@@########@@@@@@@@@@@@@@@@@@@@@@@@@####### \
|
||||
$C1 #####@@@@@########@@@@@@@@@@@@@@@@@@@@@@@@@@@###### \
|
||||
$C1 ####@@@@@################################@@@@@##### \
|
||||
$C1 ###@@@@@##################################@@@@@#### \
|
||||
$C1 ##@@@@@####################################@@@@@### \
|
||||
$C1 ##@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@#########@@@@### \
|
||||
$C1 ##@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@############@@@@### \
|
||||
$C1 ####@@@@@#############@@@@@@@############@@@@@##### \
|
||||
$C1 #######@@@@@@############@############@@@@@@####### \
|
||||
$C1 ##########@@@@@@###################@@@@@@########## \
|
||||
$C1 ##############@@@@@@###########@@@@@@############## \
|
||||
$C1 #################@@@@@@#####@@@@@@################# \
|
||||
$C1 ####################@@@@@@@@@@@#################### \
|
||||
$C1 ########################@@@######################## \
|
||||
$C1 ################################################### "
|
||||
|
||||
#define ASCII_STARFIVE_L \
|
||||
"$C1 ####### \
|
||||
$C1 ################. \
|
||||
$C1 ############ ########### \
|
||||
$C1 ############ ##########. \
|
||||
$C1 ############ # ###### \
|
||||
$C1 ########### ##### ## \
|
||||
$C1 #######. ########## \
|
||||
$C1 ###### ### *########### \
|
||||
$C1 ###### #######. ########## \
|
||||
$C1 ######### ############ ###### \
|
||||
$C1 ###########. ###########* # \
|
||||
$C1 ############ ############ \
|
||||
$C1 # ############. .########### \
|
||||
$C1 ###### ########### ######### \
|
||||
$C1 ########## .######, ##### \
|
||||
$C1 ############ ##. #####. \
|
||||
$C1 ######### ######## \
|
||||
$C1 ## ##### ##########. \
|
||||
$C1 ####### # ############ \
|
||||
$C1 ########### ###########. \
|
||||
$C1 ###########. ############ \
|
||||
$C1 ################ \
|
||||
$C1 ####### "
|
||||
|
||||
#define ASCII_NVIDIA_L \
|
||||
"$C1 MMMMMMMMMMMMMMMMMMMMMMMMMMMMMM \
|
||||
$C1 MMMMMMMMMMMMMMMMMMMMMMMMMMMMMM \
|
||||
$C1 .:: 'MMMMMMMMMMMMMMMMMMMMMMMMM \
|
||||
$C1 ccllooo;:;. ;MMMMMMMMMMMMMMMMMM \
|
||||
$C1 cloc :ooollcc: :MMMMMMMMMMMMMMM \
|
||||
$C1 cloc :ccl; lolc, ;MMMMMMMMMMMM \
|
||||
$C1.cloo: :clo ;c: .ool; MMMMMMMMMMM \
|
||||
$C1 ooo: ooo :ool, .cloo. ;lMMMMMMMMMMM \
|
||||
$C1 ooo: ooc :ooooccooo. :MMMM lMMMMMMM \
|
||||
$C1 ooc. ool: :oooooo' ,cloo. MMMM \
|
||||
$C1 ool:. olc: .:cloo. :MMMM \
|
||||
$C1 olc, ;:::cccloo. :MMMMMMMM \
|
||||
$C1 olcc::; ,:ccloMMMMMMMMM \
|
||||
$C1 :......oMMMMMMMMMMMMMMMMMMMMMM \
|
||||
$C1 :lllMMMMMMMMMMMMMMMMMMMMMMMMMM "
|
||||
|
||||
typedef struct ascii_logo asciiL;
|
||||
|
||||
// ------------------------------------------------------------------------------------------------------+
|
||||
// | LOGO | W | H | REPLACE | COLORS LOGO (>0 && <10) | COLORS TEXT (=2) |
|
||||
// ------------------------------------------------------------------------------------------------------+
|
||||
asciiL logo_amd = { ASCII_AMD, 39, 15, false, {C_FG_WHITE, C_FG_GREEN}, {C_FG_WHITE, C_FG_GREEN} };
|
||||
asciiL logo_intel = { ASCII_INTEL, 48, 14, false, {C_FG_CYAN}, {C_FG_CYAN, C_FG_WHITE} };
|
||||
asciiL logo_intel_new = { ASCII_INTEL_NEW, 51, 9, false, {C_FG_CYAN}, {C_FG_CYAN, C_FG_WHITE} };
|
||||
asciiL logo_snapd = { ASCII_SNAPD, 39, 16, false, {C_FG_RED, C_FG_WHITE}, {C_FG_RED, C_FG_WHITE} };
|
||||
asciiL logo_mtk = { ASCII_MTK, 59, 5, false, {C_FG_BLUE, C_FG_YELLOW}, {C_FG_BLUE, C_FG_YELLOW} };
|
||||
asciiL logo_exynos = { ASCII_EXYNOS, 22, 13, true, {C_BG_BLUE, C_FG_WHITE}, {C_FG_BLUE, C_FG_WHITE} };
|
||||
asciiL logo_kirin = { ASCII_KIRIN, 53, 12, false, {C_FG_RED}, {C_FG_WHITE, C_FG_RED} };
|
||||
asciiL logo_broadcom = { ASCII_BROADCOM, 44, 19, false, {C_FG_WHITE, C_FG_RED}, {C_FG_WHITE, C_FG_RED} };
|
||||
asciiL logo_arm = { ASCII_ARM, 42, 5, false, {C_FG_CYAN}, {C_FG_WHITE, C_FG_CYAN} };
|
||||
asciiL logo_ibm = { ASCII_IBM, 42, 9, false, {C_FG_CYAN, C_FG_WHITE}, {C_FG_CYAN, C_FG_WHITE} };
|
||||
asciiL logo_apple = { ASCII_APPLE, 32, 17, false, {C_FG_WHITE}, {C_FG_CYAN, C_FG_B_WHITE} };
|
||||
asciiL logo_allwinner = { ASCII_ALLWINNER, 47, 16, false, {C_FG_CYAN}, {C_FG_B_BLACK, C_FG_B_CYAN } };
|
||||
// +-----------------------------------------------------------------------------------------------------------------+
|
||||
// | LOGO | W | H | REPLACE | COLORS LOGO (>0 && <10) | COLORS TEXT (=2) |
|
||||
// +-----------------------------------------------------------------------------------------------------------------+
|
||||
asciiL logo_amd = { ASCII_AMD, 39, 15, false, {C_FG_WHITE, C_FG_GREEN}, {C_FG_WHITE, C_FG_GREEN} };
|
||||
asciiL logo_intel = { ASCII_INTEL, 48, 14, false, {C_FG_CYAN}, {C_FG_CYAN, C_FG_WHITE} };
|
||||
asciiL logo_intel_new = { ASCII_INTEL_NEW, 51, 9, false, {C_FG_CYAN}, {C_FG_CYAN, C_FG_WHITE} };
|
||||
asciiL logo_hygon = { ASCII_HYGON, 51, 11, false, {C_FG_RED}, {C_FG_RED, C_FG_WHITE} };
|
||||
asciiL logo_snapd = { ASCII_SNAPD, 39, 16, false, {C_FG_RED, C_FG_WHITE}, {C_FG_RED, C_FG_WHITE} };
|
||||
asciiL logo_mtk = { ASCII_MTK, 59, 5, false, {C_FG_BLUE, C_FG_YELLOW}, {C_FG_BLUE, C_FG_YELLOW} };
|
||||
asciiL logo_exynos = { ASCII_EXYNOS, 22, 13, true, {C_BG_BLUE, C_FG_WHITE}, {C_FG_BLUE, C_FG_WHITE} };
|
||||
asciiL logo_kirin = { ASCII_KIRIN, 53, 12, false, {C_FG_RED}, {C_FG_WHITE, C_FG_RED} };
|
||||
asciiL logo_kunpeng = { ASCII_KUNPENG, 48, 17, false, {C_FG_RED, C_FG_WHITE}, {C_FG_WHITE, C_FG_RED} };
|
||||
asciiL logo_broadcom = { ASCII_BROADCOM, 44, 19, false, {C_FG_WHITE, C_FG_RED}, {C_FG_WHITE, C_FG_RED} };
|
||||
asciiL logo_arm = { ASCII_ARM, 42, 5, false, {C_FG_CYAN}, {C_FG_WHITE, C_FG_CYAN} };
|
||||
asciiL logo_ibm = { ASCII_IBM, 42, 9, false, {C_FG_CYAN, C_FG_WHITE}, {C_FG_CYAN, C_FG_WHITE} };
|
||||
asciiL logo_apple = { ASCII_APPLE, 32, 17, false, {C_FG_WHITE}, {C_FG_CYAN, C_FG_B_WHITE} };
|
||||
asciiL logo_google = { ASCII_GOOGLE, 35, 15, false, {C_FG_RED, C_FG_YELLOW, C_FG_GREEN, C_FG_BLUE}, {C_FG_BLUE, C_FG_B_WHITE} };
|
||||
asciiL logo_allwinner = { ASCII_ALLWINNER, 47, 16, false, {C_FG_CYAN}, {C_FG_B_BLACK, C_FG_B_CYAN } };
|
||||
asciiL logo_rockchip = { ASCII_ROCKCHIP, 58, 8, false, {C_FG_CYAN, C_FG_YELLOW}, {C_FG_CYAN, C_FG_YELLOW} };
|
||||
asciiL logo_riscv = { ASCII_RISCV, 63, 18, false, {C_FG_CYAN, C_FG_YELLOW}, {C_FG_CYAN, C_FG_YELLOW} };
|
||||
asciiL logo_sifive = { ASCII_SIFIVE, 48, 19, true, {C_BG_WHITE, C_BG_BLACK}, {C_FG_WHITE, C_FG_BLUE} };
|
||||
asciiL logo_starfive = { ASCII_STARFIVE, 33, 17, false, {C_FG_WHITE}, {C_FG_WHITE, C_FG_BLUE} };
|
||||
asciiL logo_sipeed = { ASCII_SIPEED, 41, 16, true, {C_BG_RED, C_BG_WHITE}, {C_FG_RED, C_FG_WHITE} };
|
||||
asciiL logo_nvidia = { ASCII_NVIDIA, 45, 19, false, {C_FG_GREEN, C_FG_WHITE}, {C_FG_WHITE, C_FG_GREEN} };
|
||||
asciiL logo_ampere = { ASCII_AMPERE, 50, 17, false, {C_FG_RED}, {C_FG_WHITE, C_FG_RED} };
|
||||
|
||||
// Long variants | ----------------------------------------------------------------------------------------------------|
|
||||
asciiL logo_amd_l = { ASCII_AMD_L, 62, 19, true, {C_BG_WHITE, C_BG_GREEN}, {C_FG_WHITE, C_FG_GREEN} };
|
||||
asciiL logo_intel_l = { ASCII_INTEL_L, 62, 19, true, {C_BG_CYAN, C_BG_WHITE}, {C_FG_CYAN, C_FG_WHITE} };
|
||||
asciiL logo_intel_l_new = { ASCII_INTEL_L_NEW, 57, 14, true, {C_BG_CYAN, C_BG_WHITE, C_BG_BLUE}, {C_FG_CYAN, C_FG_WHITE} };
|
||||
asciiL logo_arm_l = { ASCII_ARM_L, 60, 8, true, {C_BG_CYAN}, {C_FG_WHITE, C_FG_CYAN} };
|
||||
asciiL logo_ibm_l = { ASCII_IBM_L, 62, 13, true, {C_BG_CYAN, C_FG_WHITE}, {C_FG_CYAN, C_FG_WHITE} };
|
||||
asciiL logo_unknown = { NULL, 0, 0, false, {COLOR_NONE}, {COLOR_NONE, COLOR_NONE} };
|
||||
// Long variants | ----------------------------------------------------------------------------------------------------------------|
|
||||
asciiL logo_amd_l = { ASCII_AMD_L, 62, 19, true, {C_BG_WHITE, C_BG_GREEN}, {C_FG_WHITE, C_FG_GREEN} };
|
||||
asciiL logo_intel_l = { ASCII_INTEL_L, 62, 19, true, {C_BG_CYAN, C_BG_WHITE}, {C_FG_CYAN, C_FG_WHITE} };
|
||||
asciiL logo_intel_l_new = { ASCII_INTEL_L_NEW, 57, 14, true, {C_BG_CYAN, C_BG_WHITE, C_BG_BLUE}, {C_FG_CYAN, C_FG_WHITE} };
|
||||
asciiL logo_arm_l = { ASCII_ARM_L, 60, 8, true, {C_BG_CYAN}, {C_FG_WHITE, C_FG_CYAN} };
|
||||
asciiL logo_ibm_l = { ASCII_IBM_L, 62, 13, true, {C_BG_CYAN, C_FG_WHITE}, {C_FG_CYAN, C_FG_WHITE} };
|
||||
asciiL logo_starfive_l = { ASCII_STARFIVE_L, 50, 22, false, {C_FG_WHITE}, {C_FG_WHITE, C_FG_BLUE} };
|
||||
asciiL logo_sifive_l = { ASCII_SIFIVE_L, 53, 21, true, {C_BG_WHITE, C_BG_BLACK}, {C_FG_WHITE, C_FG_CYAN} };
|
||||
asciiL logo_nvidia_l = { ASCII_NVIDIA_L, 50, 15, false, {C_FG_GREEN, C_FG_WHITE}, {C_FG_WHITE, C_FG_GREEN} };
|
||||
asciiL logo_unknown = { NULL, 0, 0, false, {COLOR_NONE}, {COLOR_NONE, COLOR_NONE} };
|
||||
|
||||
#endif
|
||||
|
||||
@@ -14,6 +14,8 @@
|
||||
#include "../ppc/uarch.h"
|
||||
#elif ARCH_ARM
|
||||
#include "../arm/uarch.h"
|
||||
#elif ARCH_RISCV
|
||||
#include "../riscv/uarch.h"
|
||||
#endif
|
||||
|
||||
#define STRING_YES "Yes"
|
||||
@@ -143,17 +145,25 @@ char* get_str_l3(struct cache* cach) {
|
||||
|
||||
char* get_str_freq(struct frequency* freq) {
|
||||
//Max 3 digits and 3 for '(M/G)Hz' plus 1 for '\0'
|
||||
uint32_t size = (5+1+3+1);
|
||||
uint32_t size = (1+5+1+3+1);
|
||||
assert(strlen(STRING_UNKNOWN)+1 <= size);
|
||||
char* string = emalloc(sizeof(char)*size);
|
||||
memset(string, 0, sizeof(char)*size);
|
||||
char* string = ecalloc(size, sizeof(char));
|
||||
|
||||
if(freq->max == UNKNOWN_DATA || freq->max < 0)
|
||||
if(freq->max == UNKNOWN_DATA || freq->max < 0) {
|
||||
snprintf(string,strlen(STRING_UNKNOWN)+1,STRING_UNKNOWN);
|
||||
else if(freq->max >= 1000)
|
||||
snprintf(string,size,"%.3f "STRING_GIGAHERZ,(float)(freq->max)/1000);
|
||||
else
|
||||
snprintf(string,size,"%d "STRING_MEGAHERZ,freq->max);
|
||||
}
|
||||
else if(freq->max >= 1000) {
|
||||
if (freq->measured)
|
||||
snprintf(string,size,"~%.3f "STRING_GIGAHERZ,(float)(freq->max)/1000);
|
||||
else
|
||||
snprintf(string,size,"%.3f "STRING_GIGAHERZ,(float)(freq->max)/1000);
|
||||
}
|
||||
else {
|
||||
if (freq->measured)
|
||||
snprintf(string,size,"~%d "STRING_MEGAHERZ,freq->max);
|
||||
else
|
||||
snprintf(string,size,"%d "STRING_MEGAHERZ,freq->max);
|
||||
}
|
||||
|
||||
return string;
|
||||
}
|
||||
@@ -192,7 +202,7 @@ void init_topology_struct(struct topology* topo, struct cache* cach) {
|
||||
topo->sockets = 0;
|
||||
#ifdef ARCH_X86
|
||||
topo->smt_available = 0;
|
||||
topo->apic = emalloc(sizeof(struct apic));
|
||||
topo->apic = ecalloc(1, sizeof(struct apic));
|
||||
#endif
|
||||
#endif
|
||||
}
|
||||
|
||||
@@ -8,6 +8,7 @@ enum {
|
||||
// ARCH_X86
|
||||
CPU_VENDOR_INTEL,
|
||||
CPU_VENDOR_AMD,
|
||||
CPU_VENDOR_HYGON,
|
||||
// ARCH_ARM
|
||||
CPU_VENDOR_ARM,
|
||||
CPU_VENDOR_APPLE,
|
||||
@@ -16,10 +17,14 @@ enum {
|
||||
CPU_VENDOR_NVIDIA,
|
||||
CPU_VENDOR_APM,
|
||||
CPU_VENDOR_QUALCOMM,
|
||||
CPU_VENDOR_HUAWUEI,
|
||||
CPU_VENDOR_HUAWEI,
|
||||
CPU_VENDOR_SAMSUNG,
|
||||
CPU_VENDOR_MARVELL,
|
||||
CPU_VENDOR_PHYTIUM,
|
||||
// ARCH_RISCV
|
||||
CPU_VENDOR_RISCV,
|
||||
CPU_VENDOR_SIFIVE,
|
||||
CPU_VENDOR_THEAD,
|
||||
// OTHERS
|
||||
CPU_VENDOR_UNKNOWN,
|
||||
CPU_VENDOR_INVALID
|
||||
@@ -28,10 +33,14 @@ enum {
|
||||
enum {
|
||||
HV_VENDOR_KVM,
|
||||
HV_VENDOR_QEMU,
|
||||
HV_VENDOR_VBOX,
|
||||
HV_VENDOR_HYPERV,
|
||||
HV_VENDOR_VMWARE,
|
||||
HV_VENDOR_XEN,
|
||||
HV_VENDOR_PARALLELS,
|
||||
HV_VENDOR_PHYP,
|
||||
HV_VENDOR_BHYVE,
|
||||
HV_VENDOR_APPLEVZ,
|
||||
HV_VENDOR_INVALID
|
||||
};
|
||||
|
||||
@@ -49,6 +58,8 @@ typedef int32_t VENDOR;
|
||||
struct frequency {
|
||||
int32_t base;
|
||||
int32_t max;
|
||||
// Indicates if max frequency was measured
|
||||
bool measured;
|
||||
};
|
||||
|
||||
struct hypervisor {
|
||||
@@ -113,19 +124,34 @@ struct features {
|
||||
bool SHA1;
|
||||
bool SHA2;
|
||||
bool CRC32;
|
||||
bool SVE;
|
||||
bool SVE2;
|
||||
uint64_t cntb;
|
||||
#endif
|
||||
};
|
||||
|
||||
struct extensions {
|
||||
char* str;
|
||||
uint64_t mask;
|
||||
};
|
||||
|
||||
struct cpuInfo {
|
||||
VENDOR cpu_vendor;
|
||||
VENDOR cpu_vendor;
|
||||
struct uarch* arch;
|
||||
struct hypervisor* hv;
|
||||
struct frequency* freq;
|
||||
struct cache* cach;
|
||||
struct topology* topo;
|
||||
struct features* feat;
|
||||
int64_t peak_performance;
|
||||
|
||||
// Similar but not exactly equal
|
||||
// to struct features
|
||||
#ifdef ARCH_RISCV
|
||||
struct extensions* ext;
|
||||
#else
|
||||
struct features* feat;
|
||||
#endif
|
||||
|
||||
#if defined(ARCH_X86) || defined(ARCH_PPC)
|
||||
// CPU name from model
|
||||
char* cpu_name;
|
||||
@@ -149,7 +175,7 @@ struct cpuInfo {
|
||||
uint32_t midr;
|
||||
#endif
|
||||
|
||||
#ifdef ARCH_ARM
|
||||
#if defined(ARCH_ARM) || defined(ARCH_RISCV)
|
||||
struct system_on_chip* soc;
|
||||
#endif
|
||||
|
||||
|
||||
195
src/common/freq.c
Normal file
195
src/common/freq.c
Normal file
@@ -0,0 +1,195 @@
|
||||
#ifdef __linux__
|
||||
|
||||
#define _GNU_SOURCE
|
||||
|
||||
#include <time.h>
|
||||
#include <stdio.h>
|
||||
#include <stdint.h>
|
||||
#include <string.h>
|
||||
#include <errno.h>
|
||||
#include <unistd.h>
|
||||
#include <asm/unistd.h>
|
||||
#include <sys/ioctl.h>
|
||||
#include <linux/perf_event.h>
|
||||
|
||||
#include "global.h"
|
||||
#include "cpu.h"
|
||||
|
||||
static long
|
||||
perf_event_open(struct perf_event_attr *hw_event, pid_t pid,
|
||||
int cpu, int group_fd, unsigned long flags) {
|
||||
int ret;
|
||||
ret = syscall(__NR_perf_event_open, hw_event, pid, cpu,
|
||||
group_fd, flags);
|
||||
return ret;
|
||||
}
|
||||
|
||||
#define INSERT_ASM_ONCE __asm volatile("nop");
|
||||
#define INSERT_ASM_10_TIMES \
|
||||
INSERT_ASM_ONCE \
|
||||
INSERT_ASM_ONCE \
|
||||
INSERT_ASM_ONCE \
|
||||
INSERT_ASM_ONCE \
|
||||
INSERT_ASM_ONCE \
|
||||
INSERT_ASM_ONCE \
|
||||
INSERT_ASM_ONCE \
|
||||
INSERT_ASM_ONCE \
|
||||
INSERT_ASM_ONCE \
|
||||
INSERT_ASM_ONCE \
|
||||
|
||||
#define INSERT_ASM_100_TIMES \
|
||||
INSERT_ASM_10_TIMES \
|
||||
INSERT_ASM_10_TIMES \
|
||||
INSERT_ASM_10_TIMES \
|
||||
INSERT_ASM_10_TIMES \
|
||||
INSERT_ASM_10_TIMES \
|
||||
INSERT_ASM_10_TIMES \
|
||||
INSERT_ASM_10_TIMES \
|
||||
INSERT_ASM_10_TIMES \
|
||||
INSERT_ASM_10_TIMES \
|
||||
INSERT_ASM_10_TIMES
|
||||
|
||||
#define INSERT_ASM_1000_TIMES \
|
||||
INSERT_ASM_100_TIMES \
|
||||
INSERT_ASM_100_TIMES \
|
||||
INSERT_ASM_100_TIMES \
|
||||
INSERT_ASM_100_TIMES \
|
||||
INSERT_ASM_100_TIMES \
|
||||
INSERT_ASM_100_TIMES \
|
||||
INSERT_ASM_100_TIMES \
|
||||
INSERT_ASM_100_TIMES \
|
||||
INSERT_ASM_100_TIMES \
|
||||
INSERT_ASM_100_TIMES \
|
||||
|
||||
void nop_function(uint64_t iters) {
|
||||
for (uint64_t i = 0; i < iters; i++) {
|
||||
INSERT_ASM_1000_TIMES
|
||||
INSERT_ASM_1000_TIMES
|
||||
INSERT_ASM_1000_TIMES
|
||||
INSERT_ASM_1000_TIMES
|
||||
}
|
||||
}
|
||||
|
||||
// Run the nop_function with the number of iterations specified and
|
||||
// measure both the time and number of cycles
|
||||
int measure_freq_iters(uint64_t iters, uint32_t core, double* freq) {
|
||||
clockid_t clock = CLOCK_PROCESS_CPUTIME_ID;
|
||||
struct timespec start, end;
|
||||
struct perf_event_attr pe;
|
||||
uint64_t cycles;
|
||||
int fd;
|
||||
int pid = 0;
|
||||
memset(&pe, 0, sizeof(struct perf_event_attr));
|
||||
pe.type = PERF_TYPE_HARDWARE;
|
||||
pe.size = sizeof(struct perf_event_attr);
|
||||
pe.config = PERF_COUNT_HW_CPU_CYCLES;
|
||||
pe.disabled = 1;
|
||||
pe.exclude_kernel = 1;
|
||||
pe.exclude_hv = 1;
|
||||
|
||||
fd = perf_event_open(&pe, pid, core, -1, 0);
|
||||
if (fd == -1) {
|
||||
perror("perf_event_open");
|
||||
if (errno == EPERM || errno == EACCES) {
|
||||
printErr("You may not have permission to collect stats.\n"\
|
||||
"Consider tweaking /proc/sys/kernel/perf_event_paranoid or running as root");
|
||||
}
|
||||
return -1;
|
||||
}
|
||||
|
||||
if (clock_gettime(clock, &start) == -1) {
|
||||
perror("clock_gettime");
|
||||
return -1;
|
||||
}
|
||||
if(ioctl(fd, PERF_EVENT_IOC_RESET, 0) == -1) {
|
||||
perror("ioctl");
|
||||
return -1;
|
||||
}
|
||||
if(ioctl(fd, PERF_EVENT_IOC_ENABLE, 0) == -1) {
|
||||
perror("ioctl");
|
||||
return -1;
|
||||
}
|
||||
|
||||
nop_function(iters);
|
||||
|
||||
ssize_t ret = read(fd, &cycles, sizeof(uint64_t));
|
||||
if (ret == -1) {
|
||||
perror("read");
|
||||
return -1;
|
||||
}
|
||||
if (ret != sizeof(uint64_t)) {
|
||||
printErr("Read returned %d, expected %d", ret, sizeof(uint64_t));
|
||||
return -1;
|
||||
}
|
||||
if(ioctl(fd, PERF_EVENT_IOC_DISABLE, 0) == -1) {
|
||||
perror("ioctl");
|
||||
return -1;
|
||||
}
|
||||
if (clock_gettime(clock, &end) == -1) {
|
||||
perror("clock_gettime");
|
||||
return -1;
|
||||
}
|
||||
|
||||
uint64_t nsecs = (end.tv_sec*1e9 + end.tv_nsec) - (start.tv_sec*1e9 + start.tv_nsec);
|
||||
uint64_t usecs = nsecs/1000;
|
||||
*freq = cycles/((double)usecs);
|
||||
return 0;
|
||||
}
|
||||
|
||||
// Return a good number of iterations to run the nop_function in
|
||||
// order to get a precise measurement of the frequency without taking
|
||||
// too much time.
|
||||
uint64_t get_num_iters_from_freq(double frequency) {
|
||||
// Truncate to reduce variability
|
||||
uint64_t freq_trunc = ((uint64_t) frequency / 100) * 100;
|
||||
uint64_t osp_per_iter = 4 * 1000;
|
||||
|
||||
return freq_trunc * 1e7 * 1/osp_per_iter;
|
||||
}
|
||||
|
||||
// Differences between x86 measure_frequency and this measure_max_frequency:
|
||||
// - measure_frequency employs all cores simultaneously whereas
|
||||
// measure_max_frequency only employs 1.
|
||||
// - measure_frequency runs the computation and checks /proc/cpuinfo whereas
|
||||
// measure_max_frequency does not rely on /proc/cpuinfo and simply
|
||||
// counts cpu cycles to measure frequency.
|
||||
// - measure_frequency uses actual computation while measuring the frequency
|
||||
// whereas measure_max_frequency uses nop instructions. This makes the former
|
||||
// x86 dependant whereas the latter is architecture independant.
|
||||
int64_t measure_max_frequency(uint32_t core) {
|
||||
if (!bind_to_cpu(core)) {
|
||||
printErr("Failed binding the process to CPU %d", core);
|
||||
return UNKNOWN_DATA;
|
||||
}
|
||||
|
||||
// First, get very rough estimation of clock cycle to
|
||||
// compute a reasonable value for the iterations
|
||||
double estimation_freq, frequency;
|
||||
uint64_t iters = 100000;
|
||||
if (measure_freq_iters(iters, core, &estimation_freq) == -1)
|
||||
return UNKNOWN_DATA;
|
||||
|
||||
if (estimation_freq <= 0.0) {
|
||||
printErr("First frequency measurement yielded an invalid value: %f", estimation_freq);
|
||||
return UNKNOWN_DATA;
|
||||
}
|
||||
iters = get_num_iters_from_freq(estimation_freq);
|
||||
printWarn("Running frequency measurement with %ld iterations on core %d...", iters, core);
|
||||
|
||||
// Now perform actual measurement
|
||||
const char* frequency_banner = "cpufetch is measuring the max frequency...";
|
||||
printf("%s", frequency_banner);
|
||||
fflush(stdout);
|
||||
|
||||
if (measure_freq_iters(iters, core, &frequency) == -1)
|
||||
return UNKNOWN_DATA;
|
||||
|
||||
// Clean screen once measurement is finished
|
||||
printf("\r%*c\r", (int) strlen(frequency_banner), ' ');
|
||||
|
||||
// Discard last digit in the frequency, which should help providing
|
||||
// more reliable and predictable values.
|
||||
return (((int) frequency + 5)/10) * 10;
|
||||
}
|
||||
|
||||
#endif // #ifdef __linux__
|
||||
6
src/common/freq.h
Normal file
6
src/common/freq.h
Normal file
@@ -0,0 +1,6 @@
|
||||
#ifndef __COMMON_FREQ__
|
||||
#define __COMMON_FREQ__
|
||||
|
||||
int64_t measure_max_frequency(uint32_t core);
|
||||
|
||||
#endif
|
||||
@@ -1,3 +1,14 @@
|
||||
#ifdef _WIN32
|
||||
#define NOMINMAX
|
||||
#include <windows.h>
|
||||
#elif defined __linux__
|
||||
#define _GNU_SOURCE
|
||||
#include <sched.h>
|
||||
#elif defined __FreeBSD__
|
||||
#include <sys/param.h>
|
||||
#include <sys/cpuset.h>
|
||||
#endif
|
||||
|
||||
#include <stdarg.h>
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
@@ -20,6 +31,40 @@
|
||||
|
||||
#endif
|
||||
|
||||
#ifdef ARCH_X86
|
||||
static const char* ARCH_STR = "x86 / x86_64 build";
|
||||
#include "../x86/cpuid.h"
|
||||
#elif ARCH_PPC
|
||||
static const char* ARCH_STR = "PowerPC build";
|
||||
#include "../ppc/ppc.h"
|
||||
#elif ARCH_ARM
|
||||
static const char* ARCH_STR = "ARM build";
|
||||
#include "../arm/midr.h"
|
||||
#elif ARCH_RISCV
|
||||
static const char* ARCH_STR = "RISC-V build";
|
||||
#include "../riscv/riscv.h"
|
||||
#endif
|
||||
|
||||
#ifdef __linux__
|
||||
#ifdef __ANDROID__
|
||||
static const char* OS_STR = "Android";
|
||||
#else
|
||||
static const char* OS_STR = "Linux";
|
||||
#endif
|
||||
#elif __FreeBSD__
|
||||
static const char* OS_STR = "FreeBSD";
|
||||
#elif _WIN32
|
||||
static const char* OS_STR = "Windows";
|
||||
#elif defined __APPLE__ || __MACH__
|
||||
static const char* OS_STR = "macOS";
|
||||
#else
|
||||
static const char* OS_STR = "Unknown OS";
|
||||
#endif
|
||||
|
||||
#ifndef GIT_FULL_VERSION
|
||||
static const char* VERSION = "1.06";
|
||||
#endif
|
||||
|
||||
enum {
|
||||
LOG_LEVEL_NORMAL,
|
||||
LOG_LEVEL_VERBOSE
|
||||
@@ -27,6 +72,14 @@ enum {
|
||||
|
||||
int LOG_LEVEL;
|
||||
|
||||
void printBugMessage(FILE *restrict stream) {
|
||||
#if defined(ARCH_X86) || defined(ARCH_PPC)
|
||||
fprintf(stream, "Please, create a new issue with this error message, the output of 'cpufetch' and 'cpufetch --debug' on https://github.com/Dr-Noob/cpufetch/issues\n");
|
||||
#elif ARCH_ARM
|
||||
fprintf(stream, "Please, create a new issue with this error message, your smartphone/computer model, the output of 'cpufetch --verbose' and 'cpufetch --debug' on https://github.com/Dr-Noob/cpufetch/issues\n");
|
||||
#endif
|
||||
}
|
||||
|
||||
void printWarn(const char *fmt, ...) {
|
||||
if(LOG_LEVEL == LOG_LEVEL_VERBOSE) {
|
||||
int buffer_size = 4096;
|
||||
@@ -47,6 +100,8 @@ void printErr(const char *fmt, ...) {
|
||||
vsnprintf(buffer,buffer_size, fmt, args);
|
||||
va_end(args);
|
||||
fprintf(stderr,RED "[ERROR]: "RESET "%s\n",buffer);
|
||||
fprintf(stderr,"[VERSION]: ");
|
||||
print_version(stderr);
|
||||
}
|
||||
|
||||
void printBug(const char *fmt, ...) {
|
||||
@@ -57,10 +112,42 @@ void printBug(const char *fmt, ...) {
|
||||
vsnprintf(buffer,buffer_size, fmt, args);
|
||||
va_end(args);
|
||||
fprintf(stderr,RED "[ERROR]: "RESET "%s\n",buffer);
|
||||
#if defined(ARCH_X86) || defined(ARCH_PPC)
|
||||
fprintf(stderr, "Please, create a new issue with this error message, the output of 'cpufetch' and 'cpufetch --debug' on https://github.com/Dr-Noob/cpufetch/issues\n");
|
||||
#elif ARCH_ARM
|
||||
fprintf(stderr, "Please, create a new issue with this error message, your smartphone/computer model, the output of 'cpufetch --verbose' and 'cpufetch --debug' on https://github.com/Dr-Noob/cpufetch/issues\n");
|
||||
fprintf(stderr,"[VERSION]: ");
|
||||
print_version(stderr);
|
||||
printBugMessage(stderr);
|
||||
}
|
||||
|
||||
bool isReleaseVersion(char *git_full_version) {
|
||||
return strstr(git_full_version, "-") == NULL;
|
||||
}
|
||||
|
||||
/// The unknown uarch errors are by far the most common error a user will encounter.
|
||||
/// Rather than using the generic printBug function, which asks the user to report
|
||||
/// the problem on the issues webpage, this function will check if the program is
|
||||
/// the release version. In such case, support for this feature is most likely already
|
||||
/// in the last version, so just tell the user to compile that one and not report this
|
||||
/// in github.
|
||||
void printBugCheckRelease(const char *fmt, ...) {
|
||||
int buffer_size = 4096;
|
||||
char buffer[buffer_size];
|
||||
va_list args;
|
||||
va_start(args, fmt);
|
||||
vsnprintf(buffer,buffer_size, fmt, args);
|
||||
va_end(args);
|
||||
|
||||
fprintf(stderr, RED "[ERROR]: "RESET "%s\n", buffer);
|
||||
fprintf(stderr, "[VERSION]: ");
|
||||
print_version(stderr);
|
||||
|
||||
#ifdef GIT_FULL_VERSION
|
||||
if (isReleaseVersion(GIT_FULL_VERSION)) {
|
||||
fprintf(stderr, RED "[ERROR]: "RESET "You are using an outdated version of cpufetch. Please compile cpufetch from source (see https://github.com/Dr-Noob/cpufetch?tab=readme-ov-file#22-building-from-source)");
|
||||
}
|
||||
else {
|
||||
printBugMessage(stderr);
|
||||
}
|
||||
#else
|
||||
printBugMessage(stderr);
|
||||
#endif
|
||||
}
|
||||
|
||||
@@ -123,3 +210,38 @@ void* erealloc(void *ptr, size_t size) {
|
||||
return newptr;
|
||||
}
|
||||
|
||||
#ifndef __APPLE__
|
||||
bool bind_to_cpu(int cpu_id) {
|
||||
#ifdef _WIN32
|
||||
HANDLE process = GetCurrentProcess();
|
||||
DWORD_PTR processAffinityMask = 1 << cpu_id;
|
||||
return SetProcessAffinityMask(process, processAffinityMask);
|
||||
#elif defined __linux__
|
||||
cpu_set_t currentCPU;
|
||||
CPU_ZERO(¤tCPU);
|
||||
CPU_SET(cpu_id, ¤tCPU);
|
||||
if (sched_setaffinity (0, sizeof(currentCPU), ¤tCPU) == -1) {
|
||||
printWarn("sched_setaffinity: %s", strerror(errno));
|
||||
return false;
|
||||
}
|
||||
return true;
|
||||
#elif defined __FreeBSD__
|
||||
cpuset_t currentCPU;
|
||||
CPU_ZERO(¤tCPU);
|
||||
CPU_SET(cpu_id, ¤tCPU);
|
||||
if(cpuset_setaffinity(CPU_LEVEL_WHICH, CPU_WHICH_TID, -1, sizeof(cpuset_t), ¤tCPU) == -1) {
|
||||
printWarn("cpuset_setaffinity: %s", strerror(errno));
|
||||
return false;
|
||||
}
|
||||
return true;
|
||||
#endif
|
||||
}
|
||||
#endif
|
||||
|
||||
void print_version(FILE *restrict stream) {
|
||||
#ifdef GIT_FULL_VERSION
|
||||
fprintf(stream, "cpufetch %s (%s %s)\n", GIT_FULL_VERSION, OS_STR, ARCH_STR);
|
||||
#else
|
||||
fprintf(stream, "cpufetch v%s (%s %s)\n", VERSION, OS_STR, ARCH_STR);
|
||||
#endif
|
||||
}
|
||||
|
||||
@@ -1,6 +1,7 @@
|
||||
#ifndef __GLOBAL__
|
||||
#define __GLOBAL__
|
||||
|
||||
#include <stdio.h>
|
||||
#include <stdbool.h>
|
||||
#include <stddef.h>
|
||||
|
||||
@@ -11,11 +12,16 @@ void set_log_level(bool verbose);
|
||||
void printWarn(const char *fmt, ...);
|
||||
void printErr(const char *fmt, ...);
|
||||
void printBug(const char *fmt, ...);
|
||||
void printBugCheckRelease(const char *fmt, ...);
|
||||
int min(int a, int b);
|
||||
int max(int a, int b);
|
||||
char *strremove(char *str, const char *sub);
|
||||
void* emalloc(size_t size);
|
||||
void* ecalloc(size_t nmemb, size_t size);
|
||||
void* erealloc(void *ptr, size_t size);
|
||||
#ifndef __APPLE__
|
||||
bool bind_to_cpu(int cpu_id);
|
||||
#endif
|
||||
void print_version(FILE *restrict stream);
|
||||
|
||||
#endif
|
||||
|
||||
@@ -6,35 +6,6 @@
|
||||
#include "printer.h"
|
||||
#include "global.h"
|
||||
|
||||
#ifdef ARCH_X86
|
||||
static const char* ARCH_STR = "x86_64 build";
|
||||
#include "../x86/cpuid.h"
|
||||
#elif ARCH_PPC
|
||||
static const char* ARCH_STR = "PowerPC build";
|
||||
#include "../ppc/ppc.h"
|
||||
#elif ARCH_ARM
|
||||
static const char* ARCH_STR = "ARM build";
|
||||
#include "../arm/midr.h"
|
||||
#endif
|
||||
|
||||
#ifdef __linux__
|
||||
#ifdef __ANDROID__
|
||||
static const char* OS_STR = "Android";
|
||||
#else
|
||||
static const char* OS_STR = "Linux";
|
||||
#endif
|
||||
#elif __FreeBSD__
|
||||
static const char* OS_STR = "FreeBSD";
|
||||
#elif _WIN32
|
||||
static const char* OS_STR = "Windows";
|
||||
#elif defined __APPLE__ || __MACH__
|
||||
static const char* OS_STR = "macOS";
|
||||
#else
|
||||
static const char* OS_STR = "Unknown OS";
|
||||
#endif
|
||||
|
||||
static const char* VERSION = "1.03";
|
||||
|
||||
void print_help(char *argv[]) {
|
||||
const char **t = args_str;
|
||||
const char *c = args_chr;
|
||||
@@ -59,20 +30,29 @@ void print_help(char *argv[]) {
|
||||
#ifdef ARCH_X86
|
||||
#ifdef __linux__
|
||||
printf(" --%s %*s Compute the peak performance accurately (measure the CPU frequency instead of using the maximum)\n", t[ARG_ACCURATE_PP], (int) (max_len-strlen(t[ARG_ACCURATE_PP])), "");
|
||||
#endif
|
||||
printf(" --%s %*s Measure the max CPU frequency instead of reading it\n", t[ARG_MEASURE_MAX_FREQ], (int) (max_len-strlen(t[ARG_MEASURE_MAX_FREQ])), "");
|
||||
#endif // __linux__
|
||||
printf(" --%s %*s Show the old Intel logo\n", t[ARG_LOGO_INTEL_OLD], (int) (max_len-strlen(t[ARG_LOGO_INTEL_OLD])), "");
|
||||
printf(" --%s %*s Show the new Intel logo\n", t[ARG_LOGO_INTEL_NEW], (int) (max_len-strlen(t[ARG_LOGO_INTEL_NEW])), "");
|
||||
printf(" -%c, --%s %*s Show the full CPU name (do not abbreviate it)\n", c[ARG_FULLCPUNAME], t[ARG_FULLCPUNAME], (int) (max_len-strlen(t[ARG_FULLCPUNAME])), "");
|
||||
printf(" -%c, --%s %*s Print raw cpuid data (debug purposes)\n", c[ARG_RAW], t[ARG_RAW], (int) (max_len-strlen(t[ARG_RAW])), "");
|
||||
#endif // ARCH_X86
|
||||
#ifdef ARCH_ARM
|
||||
#ifdef __linux__
|
||||
printf(" --%s %*s Measure the max CPU frequency instead of reading it\n", t[ARG_MEASURE_MAX_FREQ], (int) (max_len-strlen(t[ARG_MEASURE_MAX_FREQ])), "");
|
||||
#endif
|
||||
#endif
|
||||
printf(" -%c, --%s %*s Print this help and exit\n", c[ARG_HELP], t[ARG_HELP], (int) (max_len-strlen(t[ARG_HELP])), "");
|
||||
printf(" -%c, --%s %*s Print cpufetch version and exit\n", c[ARG_VERSION], t[ARG_VERSION], (int) (max_len-strlen(t[ARG_VERSION])), "");
|
||||
|
||||
printf("\nCOLORS: \n");
|
||||
printf(" * \"intel\": Use Intel default color scheme \n");
|
||||
printf(" * \"amd\": Use AMD default color scheme \n");
|
||||
printf(" * \"ibm\", Use IBM default color scheme \n");
|
||||
printf(" * \"arm\": Use ARM default color scheme \n");
|
||||
printf(" * \"intel\": Use Intel color scheme \n");
|
||||
printf(" * \"intel-new\": Use Intel (new logo) color scheme \n");
|
||||
printf(" * \"amd\": Use AMD color scheme \n");
|
||||
printf(" * \"ibm\", Use IBM color scheme \n");
|
||||
printf(" * \"arm\": Use ARM color scheme \n");
|
||||
printf(" * \"rockchip\": Use Rockchip color scheme \n");
|
||||
printf(" * \"sifive\": Use SiFive color scheme \n");
|
||||
printf(" * custom: If the argument of --color does not match any of the previous strings, a custom scheme can be specified.\n");
|
||||
printf(" 5 colors must be given in RGB with the format: R,G,B:R,G,B:...\n");
|
||||
printf(" The first 3 colors are the CPU art color and the next 2 colors are the text colors\n");
|
||||
@@ -102,12 +82,15 @@ void print_help(char *argv[]) {
|
||||
printf("\nNOTE: \n");
|
||||
printf(" Peak performance information is NOT accurate. cpufetch computes peak performance using the max\n");
|
||||
printf(" frequency of the CPU. However, to compute the peak performance, you need to know the frequency of the\n");
|
||||
printf(" CPU running AVX code. This value is not be fetched by cpufetch since it depends on each specific CPU.\n");
|
||||
printf(" To correctly measure peak performance, see: https://github.com/Dr-Noob/peakperf\n");
|
||||
}
|
||||
|
||||
void print_version() {
|
||||
printf("cpufetch v%s (%s %s)\n",VERSION, OS_STR, ARCH_STR);
|
||||
printf(" CPU running AVX code. By default, this value is not fetched by cpufetch, but you can use the\n");
|
||||
printf(" --accurate-pp option, which will measure the AVX frequency and show a more precise estimation\n");
|
||||
printf(" (this option is only available in x86 architectures).\n");
|
||||
printf(" To precisely measure peak performance, see: https://github.com/Dr-Noob/peakperf\n");
|
||||
printf("\n");
|
||||
printf(" Both --accurate-pp and --measure-max-freq measure the actual frequency of the CPU. However,\n");
|
||||
printf(" they differ slightly. The former measures the max frequency while running vectorized SSE/AVX\n");
|
||||
printf(" instructions and it is thus x86 only, whereas the latter simply measures the max clock cycle\n");
|
||||
printf(" and is architecture independent.\n");
|
||||
}
|
||||
|
||||
int main(int argc, char* argv[]) {
|
||||
@@ -120,7 +103,7 @@ int main(int argc, char* argv[]) {
|
||||
}
|
||||
|
||||
if(show_version()) {
|
||||
print_version();
|
||||
print_version(stdout);
|
||||
return EXIT_SUCCESS;
|
||||
}
|
||||
|
||||
@@ -131,7 +114,7 @@ int main(int argc, char* argv[]) {
|
||||
return EXIT_FAILURE;
|
||||
|
||||
if(show_debug()) {
|
||||
print_version();
|
||||
print_version(stdout);
|
||||
print_debug(cpu);
|
||||
return EXIT_SUCCESS;
|
||||
}
|
||||
@@ -139,7 +122,7 @@ int main(int argc, char* argv[]) {
|
||||
// TODO: This should be moved to the end of args.c
|
||||
if(show_raw()) {
|
||||
#ifdef ARCH_X86
|
||||
print_version();
|
||||
print_version(stdout);
|
||||
print_raw(cpu);
|
||||
return EXIT_SUCCESS;
|
||||
#else
|
||||
@@ -148,8 +131,10 @@ int main(int argc, char* argv[]) {
|
||||
#endif
|
||||
}
|
||||
|
||||
if(print_cpufetch(cpu, get_style(), get_colors(), show_full_cpu_name()))
|
||||
if(print_cpufetch(cpu, get_style(), get_colors(), show_full_cpu_name())) {
|
||||
return EXIT_SUCCESS;
|
||||
else
|
||||
}
|
||||
else {
|
||||
return EXIT_FAILURE;
|
||||
}
|
||||
}
|
||||
|
||||
133
src/common/pci.c
Normal file
133
src/common/pci.c
Normal file
@@ -0,0 +1,133 @@
|
||||
#define _GNU_SOURCE
|
||||
|
||||
#include <sys/stat.h>
|
||||
#include <dirent.h>
|
||||
|
||||
#include "udev.h"
|
||||
#include "global.h"
|
||||
#include "pci.h"
|
||||
|
||||
#ifndef PATH_MAX
|
||||
#define PATH_MAX 1024
|
||||
#endif
|
||||
|
||||
#define PCI_PATH "/sys/bus/pci/devices/"
|
||||
#define MAX_LENGTH_PCI_DIR_NAME 1024
|
||||
|
||||
// Return a list of PCI devices containing only
|
||||
// the sysfs path
|
||||
struct pci_devices * get_pci_paths(void) {
|
||||
DIR *dirp;
|
||||
|
||||
if ((dirp = opendir(PCI_PATH)) == NULL) {
|
||||
perror("opendir");
|
||||
return NULL;
|
||||
}
|
||||
|
||||
struct dirent *dp;
|
||||
int numDirs = 0;
|
||||
errno = 0;
|
||||
|
||||
while ((dp = readdir(dirp)) != NULL) {
|
||||
if (strcmp(dp->d_name, ".") != 0 && strcmp(dp->d_name, "..") != 0)
|
||||
numDirs++;
|
||||
}
|
||||
if (errno != 0) {
|
||||
perror("readdir");
|
||||
return NULL;
|
||||
}
|
||||
|
||||
rewinddir(dirp);
|
||||
|
||||
struct pci_devices * pci = emalloc(sizeof(struct pci_devices));
|
||||
pci->num_devices = numDirs;
|
||||
pci->devices = emalloc(sizeof(struct pci_device) * pci->num_devices);
|
||||
char * full_path = emalloc(PATH_MAX * sizeof(char));
|
||||
struct stat stbuf;
|
||||
int i = 0;
|
||||
|
||||
while ((dp = readdir(dirp)) != NULL) {
|
||||
if (strcmp(dp->d_name, ".") == 0 || strcmp(dp->d_name, "..") == 0)
|
||||
continue;
|
||||
|
||||
if (strlen(dp->d_name) > MAX_LENGTH_PCI_DIR_NAME) {
|
||||
printErr("Directory name is too long: %s", dp->d_name);
|
||||
return NULL;
|
||||
}
|
||||
|
||||
memset(full_path, 0, PATH_MAX * sizeof(char));
|
||||
snprintf(full_path, min(strlen(PCI_PATH) + strlen(dp->d_name) + 1, PATH_MAX), "%s%s", PCI_PATH, dp->d_name);
|
||||
|
||||
if (stat(full_path, &stbuf) == -1) {
|
||||
perror("stat");
|
||||
return NULL;
|
||||
}
|
||||
|
||||
if ((stbuf.st_mode & S_IFMT) == S_IFDIR) {
|
||||
int strLen = min(MAX_LENGTH_PCI_DIR_NAME, strlen(dp->d_name)) + 1;
|
||||
pci->devices[i] = emalloc(sizeof(struct pci_device));
|
||||
pci->devices[i]->path = ecalloc(sizeof(char), strLen);
|
||||
strncpy(pci->devices[i]->path, dp->d_name, strLen);
|
||||
i++;
|
||||
}
|
||||
}
|
||||
if (errno != 0) {
|
||||
perror("readdir");
|
||||
return NULL;
|
||||
}
|
||||
|
||||
return pci;
|
||||
}
|
||||
|
||||
// For each PCI device in the list pci, fetch its vendor and
|
||||
// device id using sysfs (e.g., /sys/bus/pci/devices/XXX/{vendor/device})
|
||||
void populate_pci_devices(struct pci_devices * pci) {
|
||||
int filelen;
|
||||
char* buf;
|
||||
|
||||
for (int i=0; i < pci->num_devices; i++) {
|
||||
struct pci_device* dev = pci->devices[i];
|
||||
int path_size = strlen(PCI_PATH) + strlen(dev->path) + 2;
|
||||
|
||||
// Read vendor_id
|
||||
char *vendor_id_path = emalloc(sizeof(char) * (path_size + strlen("vendor") + 1));
|
||||
sprintf(vendor_id_path, "%s/%s/%s", PCI_PATH, dev->path, "vendor");
|
||||
|
||||
if ((buf = read_file(vendor_id_path, &filelen)) == NULL) {
|
||||
printWarn("read_file: %s: %s\n", vendor_id_path, strerror(errno));
|
||||
dev->vendor_id = 0;
|
||||
}
|
||||
else {
|
||||
dev->vendor_id = strtol(buf, NULL, 16);
|
||||
}
|
||||
|
||||
// Read device_id
|
||||
char *device_id_path = emalloc(sizeof(char) * (path_size + strlen("device") + 1));
|
||||
sprintf(device_id_path, "%s/%s/%s", PCI_PATH, dev->path, "device");
|
||||
|
||||
if ((buf = read_file(device_id_path, &filelen)) == NULL) {
|
||||
printWarn("read_file: %s: %s\n", device_id_path, strerror(errno));
|
||||
dev->device_id = 0;
|
||||
}
|
||||
else {
|
||||
dev->device_id = strtol(buf, NULL, 16);
|
||||
}
|
||||
|
||||
free(vendor_id_path);
|
||||
free(device_id_path);
|
||||
}
|
||||
}
|
||||
|
||||
// Return a list of PCI devices that could be used to infer the SoC.
|
||||
// The criteria to determine which devices are suitable for this task
|
||||
// is decided in filter_pci_devices.
|
||||
struct pci_devices * get_pci_devices(void) {
|
||||
struct pci_devices * pci = get_pci_paths();
|
||||
|
||||
if (pci == NULL)
|
||||
return NULL;
|
||||
|
||||
populate_pci_devices(pci);
|
||||
|
||||
return pci;
|
||||
}
|
||||
23
src/common/pci.h
Normal file
23
src/common/pci.h
Normal file
@@ -0,0 +1,23 @@
|
||||
#ifndef __PCI__
|
||||
#define __PCI__
|
||||
|
||||
#define PCI_VENDOR_NVIDIA 0x10de
|
||||
#define PCI_VENDOR_AMPERE 0x1def
|
||||
|
||||
#define PCI_DEVICE_TEGRA_X1 0x0faf
|
||||
#define PCI_DEVICE_ALTRA 0xe100
|
||||
|
||||
struct pci_device {
|
||||
char * path;
|
||||
uint16_t vendor_id;
|
||||
uint16_t device_id;
|
||||
};
|
||||
|
||||
struct pci_devices {
|
||||
struct pci_device ** devices;
|
||||
int num_devices;
|
||||
};
|
||||
|
||||
struct pci_devices * get_pci_devices(void);
|
||||
|
||||
#endif
|
||||
@@ -16,10 +16,15 @@
|
||||
#elif ARCH_PPC
|
||||
#include "../ppc/uarch.h"
|
||||
#include "../ppc/ppc.h"
|
||||
#else
|
||||
#elif ARCH_ARM
|
||||
#include "../arm/uarch.h"
|
||||
#include "../arm/midr.h"
|
||||
#include "../arm/soc.h"
|
||||
#include "../common/soc.h"
|
||||
#elif ARCH_RISCV
|
||||
#include "../riscv/riscv.h"
|
||||
#include "../riscv/uarch.h"
|
||||
#include "../riscv/soc.h"
|
||||
#endif
|
||||
|
||||
#ifdef _WIN32
|
||||
@@ -42,7 +47,7 @@
|
||||
enum {
|
||||
#if defined(ARCH_X86) || defined(ARCH_PPC)
|
||||
ATTRIBUTE_NAME,
|
||||
#elif ARCH_ARM
|
||||
#elif defined(ARCH_ARM) || defined(ARCH_RISCV)
|
||||
ATTRIBUTE_SOC,
|
||||
#endif
|
||||
#if defined(ARCH_X86) || defined(ARCH_ARM)
|
||||
@@ -56,12 +61,15 @@ enum {
|
||||
ATTRIBUTE_NCORES,
|
||||
ATTRIBUTE_NCORES_DUAL,
|
||||
#ifdef ARCH_X86
|
||||
ATTRIBUTE_SSE,
|
||||
ATTRIBUTE_AVX,
|
||||
ATTRIBUTE_FMA,
|
||||
#elif ARCH_PPC
|
||||
ATTRIBUTE_ALTIVEC,
|
||||
#elif ARCH_ARM
|
||||
ATTRIBUTE_FEATURES,
|
||||
#elif ARCH_RISCV
|
||||
ATTRIBUTE_EXTENSIONS,
|
||||
#endif
|
||||
ATTRIBUTE_L1i,
|
||||
ATTRIBUTE_L1d,
|
||||
@@ -75,7 +83,7 @@ static const char* ATTRIBUTE_FIELDS [] = {
|
||||
"Name:",
|
||||
#elif ARCH_PPC
|
||||
"Part Number:",
|
||||
#elif ARCH_ARM
|
||||
#elif defined(ARCH_ARM) || defined(ARCH_RISCV)
|
||||
"SoC:",
|
||||
#endif
|
||||
#if defined(ARCH_X86) || defined(ARCH_ARM)
|
||||
@@ -89,12 +97,15 @@ static const char* ATTRIBUTE_FIELDS [] = {
|
||||
"Cores:",
|
||||
"Cores (Total):",
|
||||
#ifdef ARCH_X86
|
||||
"SSE:",
|
||||
"AVX:",
|
||||
"FMA:",
|
||||
#elif ARCH_PPC
|
||||
"Altivec: ",
|
||||
#elif defined(ARCH_ARM)
|
||||
"Features: ",
|
||||
#elif defined(ARCH_RISCV)
|
||||
"Extensions: ",
|
||||
#endif
|
||||
"L1i Size:",
|
||||
"L1d Size:",
|
||||
@@ -122,12 +133,15 @@ static const char* ATTRIBUTE_FIELDS_SHORT [] = {
|
||||
"Cores:",
|
||||
"Cores (Total):",
|
||||
#ifdef ARCH_X86
|
||||
"SSE:",
|
||||
"AVX:",
|
||||
"FMA:",
|
||||
#elif ARCH_PPC
|
||||
"Altivec: ",
|
||||
#elif defined(ARCH_ARM)
|
||||
"Features: ",
|
||||
#elif defined(ARCH_RISCV)
|
||||
"Extensions: ",
|
||||
#endif
|
||||
"L1i Size:",
|
||||
"L1d Size:",
|
||||
@@ -325,6 +339,13 @@ struct ascii_logo* choose_ascii_art_aux(struct ascii_logo* logo_long, struct asc
|
||||
}
|
||||
}
|
||||
|
||||
// https://no-color.org/
|
||||
bool is_color_enabled(void) {
|
||||
const char *var_name = "NO_COLOR";
|
||||
char *no_color = getenv(var_name);
|
||||
return no_color == NULL || no_color[0] == '\0';
|
||||
}
|
||||
|
||||
void choose_ascii_art(struct ascii* art, struct color** cs, struct terminal* term, int lf) {
|
||||
// 1. Choose logo
|
||||
#ifdef ARCH_X86
|
||||
@@ -339,6 +360,9 @@ void choose_ascii_art(struct ascii* art, struct color** cs, struct terminal* ter
|
||||
else if(art->vendor == CPU_VENDOR_AMD) {
|
||||
art->art = choose_ascii_art_aux(&logo_amd_l, &logo_amd, term, lf);
|
||||
}
|
||||
else if(art->vendor == CPU_VENDOR_HYGON) {
|
||||
art->art = &logo_hygon;
|
||||
}
|
||||
else {
|
||||
art->art = &logo_unknown;
|
||||
}
|
||||
@@ -353,19 +377,43 @@ void choose_ascii_art(struct ascii* art, struct color** cs, struct terminal* ter
|
||||
art->art = &logo_exynos;
|
||||
else if(art->vendor == SOC_VENDOR_KIRIN)
|
||||
art->art = &logo_kirin;
|
||||
else if(art->vendor == SOC_VENDOR_KUNPENG)
|
||||
art->art = &logo_kunpeng;
|
||||
else if(art->vendor == SOC_VENDOR_BROADCOM)
|
||||
art->art = &logo_broadcom;
|
||||
else if(art->vendor == SOC_VENDOR_APPLE)
|
||||
art->art = &logo_apple;
|
||||
else if(art->vendor == SOC_VENDOR_GOOGLE)
|
||||
art->art = &logo_google;
|
||||
else if(art->vendor == SOC_VENDOR_ALLWINNER)
|
||||
art->art = &logo_allwinner;
|
||||
else if(art->vendor == SOC_VENDOR_ROCKCHIP)
|
||||
art->art = &logo_rockchip;
|
||||
else if(art->vendor == SOC_VENDOR_AMPERE)
|
||||
art->art = &logo_ampere;
|
||||
else if(art->vendor == SOC_VENDOR_NVIDIA)
|
||||
art->art = choose_ascii_art_aux(&logo_nvidia_l, &logo_nvidia, term, lf);
|
||||
else {
|
||||
art->art = choose_ascii_art_aux(&logo_arm_l, &logo_arm, term, lf);
|
||||
}
|
||||
#elif ARCH_RISCV
|
||||
if(art->vendor == SOC_VENDOR_SIFIVE)
|
||||
art->art = choose_ascii_art_aux(&logo_sifive_l, &logo_sifive, term, lf);
|
||||
else if(art->vendor == SOC_VENDOR_STARFIVE)
|
||||
art->art = choose_ascii_art_aux(&logo_starfive_l, &logo_starfive, term, lf);
|
||||
else if(art->vendor == SOC_VENDOR_ALLWINNER)
|
||||
art->art = &logo_allwinner;
|
||||
else if(art->vendor == SOC_VENDOR_SIPEED)
|
||||
art->art = &logo_sipeed;
|
||||
else
|
||||
art->art = &logo_riscv;
|
||||
#endif
|
||||
|
||||
// 2. Choose colors
|
||||
struct ascii_logo* logo = art->art;
|
||||
bool color = is_color_enabled();
|
||||
if (!color)
|
||||
art->style = STYLE_LEGACY;
|
||||
|
||||
switch(art->style) {
|
||||
case STYLE_LEGACY:
|
||||
@@ -551,6 +599,7 @@ bool print_cpufetch_x86(struct cpuInfo* cpu, STYLE s, struct color** cs, struct
|
||||
for(int i = 0; i < cpu->num_cpus; ptr = ptr->next_cpu, i++) {
|
||||
char* max_frequency = get_str_freq(ptr->freq);
|
||||
char* avx = get_str_avx(ptr);
|
||||
char* sse = get_str_sse(ptr);
|
||||
char* fma = get_str_fma(ptr);
|
||||
char* cpu_num = emalloc(sizeof(char) * 9);
|
||||
|
||||
@@ -585,8 +634,18 @@ bool print_cpufetch_x86(struct cpuInfo* cpu, STYLE s, struct color** cs, struct
|
||||
setAttribute(art, ATTRIBUTE_NCORES, n_cores);
|
||||
}
|
||||
}
|
||||
setAttribute(art, ATTRIBUTE_AVX, avx);
|
||||
setAttribute(art, ATTRIBUTE_FMA, fma);
|
||||
|
||||
// Show the most modern vector instructions.
|
||||
if (strcmp(avx, "No") == 0) {
|
||||
if (strcmp(sse, "No") != 0) {
|
||||
setAttribute(art, ATTRIBUTE_SSE, sse);
|
||||
}
|
||||
}
|
||||
else {
|
||||
setAttribute(art, ATTRIBUTE_AVX, avx);
|
||||
setAttribute(art, ATTRIBUTE_FMA, fma);
|
||||
}
|
||||
|
||||
if(l1i != NULL) setAttribute(art, ATTRIBUTE_L1i, l1i);
|
||||
if(l1d != NULL) setAttribute(art, ATTRIBUTE_L1d, l1d);
|
||||
if(l2 != NULL) setAttribute(art, ATTRIBUTE_L2, l2);
|
||||
@@ -656,11 +715,14 @@ bool print_cpufetch_ppc(struct cpuInfo* cpu, STYLE s, struct color** cs, struct
|
||||
|
||||
// Step 2. Set attributes
|
||||
if(cpu_name != NULL) {
|
||||
setAttribute(art,ATTRIBUTE_NAME,cpu_name);
|
||||
setAttribute(art, ATTRIBUTE_NAME, cpu_name);
|
||||
}
|
||||
setAttribute(art,ATTRIBUTE_UARCH,uarch);
|
||||
setAttribute(art,ATTRIBUTE_TECHNOLOGY,manufacturing_process);
|
||||
setAttribute(art,ATTRIBUTE_FREQUENCY,max_frequency);
|
||||
setAttribute(art, ATTRIBUTE_UARCH, uarch);
|
||||
if(cpu->hv->present) {
|
||||
setAttribute(art, ATTRIBUTE_HYPERVISOR, cpu->hv->hv_name);
|
||||
}
|
||||
setAttribute(art, ATTRIBUTE_TECHNOLOGY, manufacturing_process);
|
||||
setAttribute(art, ATTRIBUTE_FREQUENCY, max_frequency);
|
||||
uint32_t socket_num = get_nsockets(cpu->topo);
|
||||
if (socket_num > 1) {
|
||||
setAttribute(art, ATTRIBUTE_SOCKETS, sockets);
|
||||
@@ -668,16 +730,16 @@ bool print_cpufetch_ppc(struct cpuInfo* cpu, STYLE s, struct color** cs, struct
|
||||
setAttribute(art, ATTRIBUTE_NCORES_DUAL, n_cores_dual);
|
||||
}
|
||||
else {
|
||||
setAttribute(art,ATTRIBUTE_NCORES, n_cores);
|
||||
setAttribute(art, ATTRIBUTE_NCORES, n_cores);
|
||||
}
|
||||
setAttribute(art,ATTRIBUTE_ALTIVEC, altivec);
|
||||
setAttribute(art,ATTRIBUTE_L1i,l1i);
|
||||
setAttribute(art,ATTRIBUTE_L1d,l1d);
|
||||
setAttribute(art,ATTRIBUTE_L2,l2);
|
||||
setAttribute(art, ATTRIBUTE_ALTIVEC, altivec);
|
||||
setAttribute(art, ATTRIBUTE_L1i, l1i);
|
||||
setAttribute(art, ATTRIBUTE_L1d, l1d);
|
||||
setAttribute(art, ATTRIBUTE_L2, l2);
|
||||
if(l3 != NULL) {
|
||||
setAttribute(art,ATTRIBUTE_L3,l3);
|
||||
setAttribute(art, ATTRIBUTE_L3, l3);
|
||||
}
|
||||
setAttribute(art,ATTRIBUTE_PEAK,pp);
|
||||
setAttribute(art, ATTRIBUTE_PEAK, pp);
|
||||
|
||||
// Step 3. Print output
|
||||
const char** attribute_fields = ATTRIBUTE_FIELDS;
|
||||
@@ -818,26 +880,17 @@ bool print_cpufetch_arm(struct cpuInfo* cpu, STYLE s, struct color** cs, struct
|
||||
char* manufacturing_process = get_str_process(cpu->soc);
|
||||
char* soc_name = get_soc_name(cpu->soc);
|
||||
char* features = get_str_features(cpu);
|
||||
setAttribute(art,ATTRIBUTE_SOC,soc_name);
|
||||
setAttribute(art,ATTRIBUTE_TECHNOLOGY,manufacturing_process);
|
||||
setAttribute(art, ATTRIBUTE_SOC, soc_name);
|
||||
setAttribute(art, ATTRIBUTE_TECHNOLOGY, manufacturing_process);
|
||||
|
||||
if(cpu->num_cpus == 1) {
|
||||
char* uarch = get_str_uarch(cpu);
|
||||
char* max_frequency = get_str_freq(cpu->freq);
|
||||
char* n_cores = get_str_topology(cpu, cpu->topo, false);
|
||||
/*
|
||||
* char* l1i = get_str_l1i(cpu->cach);
|
||||
* char* l1d = get_str_l1d(cpu->cach);
|
||||
* char* l2 = get_str_l2(cpu->cach);
|
||||
* char* l3 = get_str_l3(cpu->cach);
|
||||
* Do not setAttribute for caches.
|
||||
* Cache functionality may be implemented
|
||||
* in the future
|
||||
*/
|
||||
|
||||
setAttribute(art,ATTRIBUTE_UARCH,uarch);
|
||||
setAttribute(art,ATTRIBUTE_FREQUENCY,max_frequency);
|
||||
setAttribute(art,ATTRIBUTE_NCORES,n_cores);
|
||||
setAttribute(art, ATTRIBUTE_UARCH, uarch);
|
||||
setAttribute(art, ATTRIBUTE_FREQUENCY, max_frequency);
|
||||
setAttribute(art, ATTRIBUTE_NCORES, n_cores);
|
||||
if(features != NULL) {
|
||||
setAttribute(art, ATTRIBUTE_FEATURES, features);
|
||||
}
|
||||
@@ -848,17 +901,8 @@ bool print_cpufetch_arm(struct cpuInfo* cpu, STYLE s, struct color** cs, struct
|
||||
char* uarch = get_str_uarch(ptr);
|
||||
char* max_frequency = get_str_freq(ptr->freq);
|
||||
char* n_cores = get_str_topology(ptr, ptr->topo, false);
|
||||
/*
|
||||
* char* l1i = get_str_l1i(cpu->cach);
|
||||
* char* l1d = get_str_l1d(cpu->cach);
|
||||
* char* l2 = get_str_l2(cpu->cach);
|
||||
* char* l3 = get_str_l3(cpu->cach);
|
||||
* Do not setAttribute for caches.
|
||||
* Cache functionality may be implemented
|
||||
* in the future
|
||||
*/
|
||||
|
||||
char* cpu_num = emalloc(sizeof(char) * 9);
|
||||
|
||||
sprintf(cpu_num, "CPU %d:", i+1);
|
||||
setAttribute(art, ATTRIBUTE_CPU_NUM, cpu_num);
|
||||
setAttribute(art, ATTRIBUTE_UARCH, uarch);
|
||||
@@ -870,7 +914,7 @@ bool print_cpufetch_arm(struct cpuInfo* cpu, STYLE s, struct color** cs, struct
|
||||
}
|
||||
}
|
||||
char* pp = get_str_peak_performance(cpu->peak_performance);
|
||||
setAttribute(art,ATTRIBUTE_PEAK,pp);
|
||||
setAttribute(art, ATTRIBUTE_PEAK, pp);
|
||||
if(cpu->hv->present) {
|
||||
setAttribute(art, ATTRIBUTE_HYPERVISOR, cpu->hv->hv_name);
|
||||
}
|
||||
@@ -909,7 +953,142 @@ bool print_cpufetch_arm(struct cpuInfo* cpu, STYLE s, struct color** cs, struct
|
||||
}
|
||||
#endif
|
||||
|
||||
struct terminal* get_terminal_size() {
|
||||
#ifdef ARCH_RISCV
|
||||
// https://stackoverflow.com/a/2709523
|
||||
uint64_t number_of_bits(uint64_t i) {
|
||||
i = i - ((i >> 1) & 0x5555555555555555);
|
||||
i = (i & 0x3333333333333333) + ((i >> 2) & 0x3333333333333333);
|
||||
return (((i + (i >> 4)) & 0xF0F0F0F0F0F0F0F) * 0x101010101010101) >> 56;
|
||||
}
|
||||
|
||||
void print_ascii_riscv(struct ascii* art, uint32_t la, int32_t termw, const char** attribute_fields, uint64_t extensions_mask) {
|
||||
struct ascii_logo* logo = art->art;
|
||||
int attr_to_print = 0;
|
||||
int attr_type;
|
||||
char* attr_value;
|
||||
int32_t beg_space;
|
||||
int32_t space_right;
|
||||
int32_t ext_list_size = sizeof(extension_list)/sizeof(extension_list[0]);
|
||||
int32_t ext_num = 0;
|
||||
int32_t ext_to_print = 0;
|
||||
int32_t num_extensions = number_of_bits(extensions_mask);
|
||||
int32_t space_up = ((int)logo->height - (int)(art->n_attributes_set + num_extensions))/2;
|
||||
int32_t space_down = (int)logo->height - (int)(art->n_attributes_set + num_extensions) - (int)space_up;
|
||||
uint32_t logo_pos = 0;
|
||||
int32_t iters = max(logo->height, art->n_attributes_set + num_extensions);
|
||||
|
||||
struct line_buffer* lbuf = emalloc(sizeof(struct line_buffer));
|
||||
lbuf->buf = emalloc(sizeof(char) * LINE_BUFFER_SIZE);
|
||||
lbuf->pos = 0;
|
||||
lbuf->chars = 0;
|
||||
|
||||
printf("\n");
|
||||
for(int32_t n=0; n < iters; n++) {
|
||||
// 1. Print logo
|
||||
if(space_up > 0 || (space_up + n >= 0 && space_up + n < (int)logo->height)) {
|
||||
for(uint32_t i=0; i < logo->width; i++) {
|
||||
if(logo->art[logo_pos] == '$') {
|
||||
if(logo->replace_blocks) logo_pos += 3;
|
||||
else parse_print_color(art, lbuf, &logo_pos);
|
||||
}
|
||||
if(logo->replace_blocks && logo->art[logo_pos] != ' ') {
|
||||
if(logo->art[logo_pos] == '#') printOut(lbuf, 1, "%s%c%s", logo->color_ascii[0], ' ', art->reset);
|
||||
else if(logo->art[logo_pos] == '@') printOut(lbuf, 1, "%s%c%s", logo->color_ascii[1], ' ', art->reset);
|
||||
else if(logo->art[logo_pos] == '%') printOut(lbuf, 1, "%s%c%s", logo->color_ascii[2], ' ', art->reset);
|
||||
else printOut(lbuf, 1, "%c", logo->art[logo_pos]);
|
||||
}
|
||||
else
|
||||
printOut(lbuf, 1, "%c", logo->art[logo_pos]);
|
||||
|
||||
logo_pos++;
|
||||
}
|
||||
printOut(lbuf, 0, "%s", art->reset);
|
||||
}
|
||||
else {
|
||||
// If logo should not be printed, fill with spaces
|
||||
printOut(lbuf, logo->width, "%*c", logo->width, ' ');
|
||||
}
|
||||
|
||||
// 2. Print text
|
||||
if(space_up < 0 || (n > space_up-1 && n < (int)logo->height - space_down)) {
|
||||
attr_type = art->attributes[attr_to_print]->type;
|
||||
attr_value = art->attributes[attr_to_print]->value;
|
||||
|
||||
// Print extension
|
||||
if(attr_to_print > 0 && art->attributes[attr_to_print-1]->type == ATTRIBUTE_EXTENSIONS && ext_num != num_extensions) {
|
||||
// Search for the extension to print
|
||||
while(ext_to_print < ext_list_size && !((extensions_mask >> extension_list[ext_to_print].id) & 1U)) ext_to_print++;
|
||||
if(ext_to_print == ext_list_size) {
|
||||
printBug("print_ascii_riscv: Unable to find the extension to print");
|
||||
}
|
||||
|
||||
printOut(lbuf, 3 + strlen(extension_list[ext_to_print].str), "%s - %s%s", logo->color_text[0], extension_list[ext_to_print].str, art->reset);
|
||||
ext_num++;
|
||||
ext_to_print++;
|
||||
}
|
||||
else {
|
||||
attr_to_print++;
|
||||
beg_space = 0;
|
||||
space_right = 2 + 1 + (la - strlen(attribute_fields[attr_type]));
|
||||
|
||||
printOut(lbuf, beg_space + strlen(attribute_fields[attr_type]) + space_right + strlen(attr_value),
|
||||
"%*s%s%s%s%*s%s%s%s", beg_space, "", logo->color_text[0], attribute_fields[attr_type], art->reset, space_right, "", logo->color_text[1], attr_value, art->reset);
|
||||
}
|
||||
}
|
||||
printOutLine(lbuf, art, termw);
|
||||
printf("\n");
|
||||
}
|
||||
printf("\n");
|
||||
|
||||
free(lbuf->buf);
|
||||
free(lbuf);
|
||||
}
|
||||
|
||||
bool print_cpufetch_riscv(struct cpuInfo* cpu, STYLE s, struct color** cs, struct terminal* term) {
|
||||
struct ascii* art = set_ascii(get_soc_vendor(cpu->soc), s);
|
||||
if(art == NULL)
|
||||
return false;
|
||||
|
||||
// Step 1. Retrieve attributes
|
||||
char* uarch = get_str_uarch(cpu);
|
||||
char* manufacturing_process = get_str_process(cpu->soc);
|
||||
char* soc_name = get_soc_name(cpu->soc);
|
||||
char* extensions = get_str_extensions(cpu);
|
||||
char* max_frequency = get_str_freq(cpu->freq);
|
||||
char* n_cores = get_str_topology(cpu, cpu->topo);
|
||||
char* pp = get_str_peak_performance(cpu->peak_performance);
|
||||
|
||||
// Step 2. Set attributes
|
||||
setAttribute(art, ATTRIBUTE_SOC, soc_name);
|
||||
setAttribute(art, ATTRIBUTE_TECHNOLOGY, manufacturing_process);
|
||||
setAttribute(art, ATTRIBUTE_UARCH, uarch);
|
||||
setAttribute(art, ATTRIBUTE_NCORES, n_cores);
|
||||
setAttribute(art, ATTRIBUTE_FREQUENCY, max_frequency);
|
||||
if(extensions != NULL) {
|
||||
setAttribute(art, ATTRIBUTE_EXTENSIONS, extensions);
|
||||
}
|
||||
setAttribute(art, ATTRIBUTE_PEAK, pp);
|
||||
|
||||
// Step 3. Print output
|
||||
const char** attribute_fields = ATTRIBUTE_FIELDS;
|
||||
uint32_t longest_attribute = longest_attribute_length(art, attribute_fields);
|
||||
uint32_t longest_field = longest_field_length(art, longest_attribute);
|
||||
choose_ascii_art(art, cs, term, longest_field);
|
||||
|
||||
if(!ascii_fits_screen(term->w, *art->art, longest_field)) {
|
||||
// Despite of choosing the smallest logo, the output does not fit
|
||||
// Choose the shorter field names and recalculate the longest attr
|
||||
attribute_fields = ATTRIBUTE_FIELDS_SHORT;
|
||||
longest_attribute = longest_attribute_length(art, attribute_fields);
|
||||
}
|
||||
|
||||
print_ascii_riscv(art, longest_attribute, term->w, attribute_fields, cpu->ext->mask);
|
||||
|
||||
return true;
|
||||
}
|
||||
#endif
|
||||
|
||||
struct terminal* get_terminal_size(void) {
|
||||
struct terminal* term = emalloc(sizeof(struct terminal));
|
||||
|
||||
#ifdef _WIN32
|
||||
@@ -946,5 +1125,7 @@ bool print_cpufetch(struct cpuInfo* cpu, STYLE s, struct color** cs, bool show_f
|
||||
return print_cpufetch_ppc(cpu, s, cs, term, show_full_cpu_name);
|
||||
#elif ARCH_ARM
|
||||
return print_cpufetch_arm(cpu, s, cs, term);
|
||||
#elif ARCH_RISCV
|
||||
return print_cpufetch_riscv(cpu, s, cs, term);
|
||||
#endif
|
||||
}
|
||||
|
||||
@@ -11,6 +11,8 @@ typedef int STYLE;
|
||||
#include "../ppc/ppc.h"
|
||||
#elif ARCH_ARM
|
||||
#include "../arm/midr.h"
|
||||
#elif ARCH_RISCV
|
||||
#include "../riscv/riscv.h"
|
||||
#endif
|
||||
|
||||
// +-----------------------------------+-----------------------+
|
||||
@@ -21,6 +23,8 @@ typedef int STYLE;
|
||||
#define COLOR_DEFAULT_AMD "250,250,250:000,154,102:000,000,000:250,250,250:000,154,102"
|
||||
#define COLOR_DEFAULT_IBM "092,119,172:092,119,172:000,000,000:240,240,240:092,119,172"
|
||||
#define COLOR_DEFAULT_ARM "000,145,189:000,145,189:000,000,000:240,240,240:000,145,189"
|
||||
#define COLOR_DEFAULT_ROCKCHIP "114,159,207:229,195,000:000,000,000:240,240,240:114,159,207"
|
||||
#define COLOR_DEFAULT_SIFIVE "255,255,255:000,000,000:000,000,000:255,255,255:000,000,000"
|
||||
|
||||
#ifdef ARCH_X86
|
||||
void print_levels(struct cpuInfo* cpu);
|
||||
|
||||
93
src/common/soc.c
Normal file
93
src/common/soc.c
Normal file
@@ -0,0 +1,93 @@
|
||||
#include "soc.h"
|
||||
#ifdef ARCH_ARM
|
||||
#include "../arm/socs.h"
|
||||
#elif ARCH_RISCV
|
||||
#include "../riscv/socs.h"
|
||||
#endif
|
||||
#include "udev.h"
|
||||
#include "../common/global.h"
|
||||
|
||||
#include <string.h>
|
||||
|
||||
static char* soc_trademark_string[] = {
|
||||
// ARM
|
||||
[SOC_VENDOR_SNAPDRAGON] = "Snapdragon ",
|
||||
[SOC_VENDOR_MEDIATEK] = "MediaTek ",
|
||||
[SOC_VENDOR_EXYNOS] = "Exynos ",
|
||||
[SOC_VENDOR_KIRIN] = "Kirin ",
|
||||
[SOC_VENDOR_KUNPENG] = "Kunpeng ",
|
||||
[SOC_VENDOR_BROADCOM] = "Broadcom BCM",
|
||||
[SOC_VENDOR_APPLE] = "Apple ",
|
||||
[SOC_VENDOR_ROCKCHIP] = "Rockchip ",
|
||||
[SOC_VENDOR_GOOGLE] = "Google ",
|
||||
[SOC_VENDOR_NVIDIA] = "NVIDIA ",
|
||||
[SOC_VENDOR_AMPERE] = "Ampere ",
|
||||
// RISC-V
|
||||
[SOC_VENDOR_SIFIVE] = "SiFive ",
|
||||
[SOC_VENDOR_STARFIVE] = "StarFive ",
|
||||
[SOC_VENDOR_SIPEED] = "Sipeed ",
|
||||
// ARM & RISC-V
|
||||
[SOC_VENDOR_ALLWINNER] = "Allwinner "
|
||||
};
|
||||
|
||||
VENDOR get_soc_vendor(struct system_on_chip* soc) {
|
||||
return soc->soc_vendor;
|
||||
}
|
||||
|
||||
char* get_str_process(struct system_on_chip* soc) {
|
||||
char* str;
|
||||
|
||||
if(soc->process == UNKNOWN) {
|
||||
str = emalloc(sizeof(char) * (strlen(STRING_UNKNOWN)+1));
|
||||
snprintf(str, strlen(STRING_UNKNOWN)+1, STRING_UNKNOWN);
|
||||
}
|
||||
else {
|
||||
str = emalloc(sizeof(char) * 5);
|
||||
memset(str, 0, sizeof(char) * 5);
|
||||
snprintf(str, 5, "%dnm", soc->process);
|
||||
}
|
||||
return str;
|
||||
}
|
||||
|
||||
char* get_soc_name(struct system_on_chip* soc) {
|
||||
if(soc->soc_model == SOC_MODEL_UNKNOWN)
|
||||
return soc->raw_name;
|
||||
return soc->soc_name;
|
||||
}
|
||||
|
||||
void fill_soc(struct system_on_chip* soc, char* soc_name, SOC soc_model, int32_t process) {
|
||||
soc->soc_model = soc_model;
|
||||
soc->soc_vendor = get_soc_vendor_from_soc(soc_model);
|
||||
soc->process = process;
|
||||
if(soc->soc_vendor == SOC_VENDOR_UNKNOWN) {
|
||||
printBug("fill_soc: soc->soc_vendor == SOC_VENDOR_UNKOWN");
|
||||
// If we fall here there is a bug in socs.h
|
||||
// Reset everything to avoid segfault
|
||||
soc->soc_vendor = SOC_VENDOR_UNKNOWN;
|
||||
soc->soc_model = SOC_MODEL_UNKNOWN;
|
||||
soc->process = UNKNOWN;
|
||||
soc->raw_name = emalloc(sizeof(char) * (strlen(STRING_UNKNOWN)+1));
|
||||
snprintf(soc->raw_name, strlen(STRING_UNKNOWN)+1, STRING_UNKNOWN);
|
||||
}
|
||||
else {
|
||||
soc->process = process;
|
||||
int len = strlen(soc_name) + strlen(soc_trademark_string[soc->soc_vendor]) + 1;
|
||||
soc->soc_name = emalloc(sizeof(char) * len);
|
||||
memset(soc->soc_name, 0, sizeof(char) * len);
|
||||
sprintf(soc->soc_name, "%s%s", soc_trademark_string[soc->soc_vendor], soc_name);
|
||||
}
|
||||
}
|
||||
|
||||
bool match_soc(struct system_on_chip* soc, char* raw_name, char* expected_name, char* soc_name, SOC soc_model, int32_t process) {
|
||||
int len1 = strlen(raw_name);
|
||||
int len2 = strlen(expected_name);
|
||||
int len = min(len1, len2);
|
||||
|
||||
if(strncmp(raw_name, expected_name, len) != 0) {
|
||||
return false;
|
||||
}
|
||||
else {
|
||||
fill_soc(soc, soc_name, soc_model, process);
|
||||
return true;
|
||||
}
|
||||
}
|
||||
57
src/common/soc.h
Normal file
57
src/common/soc.h
Normal file
@@ -0,0 +1,57 @@
|
||||
#ifndef __SOC__
|
||||
#define __SOC__
|
||||
|
||||
// NOTE:
|
||||
// soc.c/soc.h are used by
|
||||
// ARM and RISC-V backends
|
||||
|
||||
#include "../common/cpu.h"
|
||||
#include <stdint.h>
|
||||
|
||||
#define UNKNOWN -1
|
||||
|
||||
typedef int32_t SOC;
|
||||
|
||||
enum {
|
||||
SOC_VENDOR_UNKNOWN,
|
||||
// ARM
|
||||
SOC_VENDOR_SNAPDRAGON,
|
||||
SOC_VENDOR_MEDIATEK,
|
||||
SOC_VENDOR_EXYNOS,
|
||||
SOC_VENDOR_KIRIN,
|
||||
SOC_VENDOR_KUNPENG,
|
||||
SOC_VENDOR_BROADCOM,
|
||||
SOC_VENDOR_APPLE,
|
||||
SOC_VENDOR_ROCKCHIP,
|
||||
SOC_VENDOR_GOOGLE,
|
||||
SOC_VENDOR_NVIDIA,
|
||||
SOC_VENDOR_AMPERE,
|
||||
// RISC-V
|
||||
SOC_VENDOR_SIFIVE,
|
||||
SOC_VENDOR_STARFIVE,
|
||||
SOC_VENDOR_SIPEED,
|
||||
// ARM & RISC-V
|
||||
SOC_VENDOR_ALLWINNER
|
||||
};
|
||||
|
||||
struct system_on_chip {
|
||||
SOC soc_model;
|
||||
VENDOR soc_vendor;
|
||||
int32_t process;
|
||||
char* soc_name;
|
||||
char* raw_name;
|
||||
};
|
||||
|
||||
struct system_on_chip* get_soc(struct cpuInfo* cpu);
|
||||
char* get_soc_name(struct system_on_chip* soc);
|
||||
VENDOR get_soc_vendor(struct system_on_chip* soc);
|
||||
bool match_soc(struct system_on_chip* soc, char* raw_name, char* expected_name, char* soc_name, SOC soc_model, int32_t process);
|
||||
char* get_str_process(struct system_on_chip* soc);
|
||||
void fill_soc(struct system_on_chip* soc, char* soc_name, SOC soc_model, int32_t process);
|
||||
|
||||
#define SOC_START if (false) {}
|
||||
#define SOC_EQ(raw_name, expected_name, soc_name, soc_model, soc, process) \
|
||||
else if (match_soc(soc, raw_name, expected_name, soc_name, soc_model, process)) return true;
|
||||
#define SOC_END else { return false; }
|
||||
|
||||
#endif
|
||||
@@ -4,8 +4,8 @@
|
||||
#include <string.h>
|
||||
#include <errno.h>
|
||||
|
||||
#include "../common/global.h"
|
||||
#include "../common/cpu.h"
|
||||
#include "global.h"
|
||||
#include "cpu.h"
|
||||
|
||||
uint32_t get_sys_info_by_name(char* name) {
|
||||
size_t size = 0;
|
||||
@@ -8,6 +8,9 @@
|
||||
// APPLE_CPU_PART_M2_BLIZZARD=0x30,M2_AVALANCHE=0x31
|
||||
#define MIDR_APPLE_M2_BLIZZARD 0x610F0300
|
||||
#define MIDR_APPLE_M2_AVALANCHE 0x610F0310
|
||||
// https://github.com/AsahiLinux/m1n1/blob/main/src/chickens.c
|
||||
#define MIDR_APPLE_M3_SAWTOOTH 0x610F0480
|
||||
#define MIDR_APPLE_M3_EVEREST 0x610F0490
|
||||
|
||||
// M1 / A14
|
||||
#ifndef CPUFAMILY_ARM_FIRESTORM_ICESTORM
|
||||
@@ -17,6 +20,15 @@
|
||||
#ifndef CPUFAMILY_ARM_AVALANCHE_BLIZZARD
|
||||
#define CPUFAMILY_ARM_AVALANCHE_BLIZZARD 0xDA33D83D
|
||||
#endif
|
||||
// M3 / A16 / A17
|
||||
// M3: https://ratfactor.com/zig/stdlib-browseable2/c/darwin.zig.html
|
||||
// M3_2: https://github.com/Dr-Noob/cpufetch/issues/230
|
||||
// PRO: https://github.com/Dr-Noob/cpufetch/issues/225
|
||||
// MAX: https://github.com/Dr-Noob/cpufetch/issues/210
|
||||
#define CPUFAMILY_ARM_EVEREST_SAWTOOTH 0x8765EDEA
|
||||
#define CPUFAMILY_ARM_EVEREST_SAWTOOTH_2 0xFA33415E
|
||||
#define CPUFAMILY_ARM_EVEREST_SAWTOOTH_PRO 0x5F4DEA93
|
||||
#define CPUFAMILY_ARM_EVEREST_SAWTOOTH_MAX 0x72015832
|
||||
|
||||
// For detecting different M1 types
|
||||
// NOTE: Could also be achieved detecting different
|
||||
@@ -31,6 +43,14 @@
|
||||
#define CPUSUBFAMILY_ARM_HC_HD 5
|
||||
#endif
|
||||
|
||||
// For alternative way to get CPU frequency on macOS and *BSD
|
||||
#ifdef __APPLE__
|
||||
#define CPUFREQUENCY_SYSCTL "hw.cpufrequency_max"
|
||||
#else
|
||||
// For FreeBSD, not sure about other *BSD
|
||||
#define CPUFREQUENCY_SYSCTL "dev.cpu.0.freq"
|
||||
#endif
|
||||
|
||||
uint32_t get_sys_info_by_name(char* name);
|
||||
|
||||
#endif
|
||||
@@ -1,9 +1,12 @@
|
||||
#include "../common/global.h"
|
||||
#include "udev.h"
|
||||
#include "global.h"
|
||||
#include "cpu.h"
|
||||
|
||||
#define _PATH_DEVTREE "/proc/device-tree/compatible"
|
||||
|
||||
// https://www.kernel.org/doc/html/latest/core-api/cpu_hotplug.html
|
||||
int get_ncores_from_cpuinfo() {
|
||||
int get_ncores_from_cpuinfo(void) {
|
||||
// Examples:
|
||||
// 0-271
|
||||
// 0-7
|
||||
@@ -129,6 +132,27 @@ long get_cache_size_from_file(char* path) {
|
||||
return ret * 1024;
|
||||
}
|
||||
|
||||
char* get_field_from_cpuinfo(char* CPUINFO_FIELD) {
|
||||
int filelen;
|
||||
char* buf;
|
||||
if((buf = read_file(_PATH_CPUINFO, &filelen)) == NULL) {
|
||||
printWarn("read_file: %s: %s:\n", _PATH_CPUINFO, strerror(errno));
|
||||
return NULL;
|
||||
}
|
||||
|
||||
char* tmp1 = strstr(buf, CPUINFO_FIELD);
|
||||
if(tmp1 == NULL) return NULL;
|
||||
tmp1 = tmp1 + strlen(CPUINFO_FIELD);
|
||||
char* tmp2 = strstr(tmp1, "\n");
|
||||
|
||||
int strlen = (1 + (tmp2-tmp1));
|
||||
char* hardware = emalloc(sizeof(char) * strlen);
|
||||
memset(hardware, 0, sizeof(char) * strlen);
|
||||
strncpy(hardware, tmp1, tmp2-tmp1);
|
||||
|
||||
return hardware;
|
||||
}
|
||||
|
||||
long get_max_freq_from_file(uint32_t core) {
|
||||
char path[_PATH_FREQUENCY_MAX_LEN];
|
||||
sprintf(path, "%s%s/cpu%d%s%s", _PATH_SYS_SYSTEM, _PATH_SYS_CPU, core, _PATH_FREQUENCY, _PATH_FREQUENCY_MAX);
|
||||
@@ -178,7 +202,13 @@ bool maps_equal(uint32_t* map1, uint32_t* map2, int n) {
|
||||
return true;
|
||||
}
|
||||
|
||||
int get_num_caches_from_files(char** paths, int num_paths) {
|
||||
// Generic function to count the number of distinct
|
||||
// elements in the list of files passed in char** paths.
|
||||
// An element can be potentially anything.
|
||||
// We use this function to count:
|
||||
// - The number of caches
|
||||
// - The number of sockets
|
||||
int get_num_elements_from_files(char** paths, int num_paths) {
|
||||
int filelen;
|
||||
char* buf;
|
||||
char* tmpbuf;
|
||||
@@ -193,10 +223,10 @@ int get_num_caches_from_files(char** paths, int num_paths) {
|
||||
num_bitmasks += (buf[i] == ',');
|
||||
}
|
||||
|
||||
// 2. Read cpu_shared_map from every core
|
||||
uint32_t** shared_maps = emalloc(sizeof(uint32_t *) * num_paths);
|
||||
// 2. Read map from every core
|
||||
uint32_t** maps = emalloc(sizeof(uint32_t *) * num_paths);
|
||||
for(int i=0; i < num_paths; i++) {
|
||||
shared_maps[i] = emalloc(sizeof(uint32_t) * num_bitmasks);
|
||||
maps[i] = emalloc(sizeof(uint32_t) * num_bitmasks);
|
||||
|
||||
if((buf = read_file(paths[i], &filelen)) == NULL) {
|
||||
printWarn("Could not open '%s'", paths[i]);
|
||||
@@ -206,6 +236,7 @@ int get_num_caches_from_files(char** paths, int num_paths) {
|
||||
for(int j=0; j < num_bitmasks; j++) {
|
||||
char* end;
|
||||
tmpbuf = emalloc(sizeof(char) * (strlen(buf) + 1));
|
||||
memset(tmpbuf, 0, sizeof(char) * (strlen(buf) + 1));
|
||||
char* commaend = strstr(buf, ",");
|
||||
if(commaend == NULL) {
|
||||
strcpy(tmpbuf, buf);
|
||||
@@ -221,35 +252,43 @@ int get_num_caches_from_files(char** paths, int num_paths) {
|
||||
return -1;
|
||||
}
|
||||
|
||||
shared_maps[i][j] = (uint32_t) ret;
|
||||
maps[i][j] = (uint32_t) ret;
|
||||
buf = commaend + 1;
|
||||
free(tmpbuf);
|
||||
}
|
||||
}
|
||||
|
||||
// 2. Count number of different masks; this is the number of caches
|
||||
int num_caches = 0;
|
||||
// 2. Count number of different masks; this is the number of elements
|
||||
int num_elements = 0;
|
||||
bool found = false;
|
||||
uint32_t** unique_shared_maps = emalloc(sizeof(uint32_t *) * num_paths);
|
||||
uint32_t** unique_maps = emalloc(sizeof(uint32_t *) * num_paths);
|
||||
for(int i=0; i < num_paths; i++) {
|
||||
unique_shared_maps[i] = emalloc(sizeof(uint32_t) * num_bitmasks);
|
||||
unique_maps[i] = emalloc(sizeof(uint32_t) * num_bitmasks);
|
||||
for(int j=0; j < num_bitmasks; j++) {
|
||||
unique_shared_maps[i][j] = 0;
|
||||
unique_maps[i][j] = 0;
|
||||
}
|
||||
}
|
||||
|
||||
for(int i=0; i < num_paths; i++) {
|
||||
for(int j=0; j < num_paths && !found; j++) {
|
||||
if(maps_equal(shared_maps[i], unique_shared_maps[j], num_bitmasks)) found = true;
|
||||
if(maps_equal(maps[i], unique_maps[j], num_bitmasks)) found = true;
|
||||
}
|
||||
if(!found) {
|
||||
add_shared_map(shared_maps, i, unique_shared_maps, num_caches, num_bitmasks);
|
||||
num_caches++;
|
||||
add_shared_map(maps, i, unique_maps, num_elements, num_bitmasks);
|
||||
num_elements++;
|
||||
}
|
||||
found = false;
|
||||
}
|
||||
|
||||
return num_caches;
|
||||
return num_elements;
|
||||
}
|
||||
|
||||
int get_num_caches_from_files(char** paths, int num_paths) {
|
||||
return get_num_elements_from_files(paths, num_paths);
|
||||
}
|
||||
|
||||
int get_num_sockets_from_files(char** paths, int num_paths) {
|
||||
return get_num_elements_from_files(paths, num_paths);
|
||||
}
|
||||
|
||||
int get_num_caches_by_level(struct cpuInfo* cpu, uint32_t level) {
|
||||
@@ -278,3 +317,48 @@ int get_num_caches_by_level(struct cpuInfo* cpu, uint32_t level) {
|
||||
|
||||
return ret;
|
||||
}
|
||||
|
||||
int get_num_sockets_package_cpus(struct topology* topo) {
|
||||
// Get number of sockets using
|
||||
// /sys/devices/system/cpu/cpu*/topology/package_cpus
|
||||
|
||||
char** paths = emalloc(sizeof(char *) * topo->total_cores);
|
||||
|
||||
for(int i=0; i < topo->total_cores; i++) {
|
||||
paths[i] = emalloc(sizeof(char) * _PATH_PACKAGE_MAX_LEN);
|
||||
sprintf(paths[i], "%s%s/cpu%d%s", _PATH_SYS_SYSTEM, _PATH_SYS_CPU, i, _PATH_TOPO_PACKAGE_CPUS);
|
||||
}
|
||||
|
||||
int ret = get_num_sockets_from_files(paths, topo->total_cores);
|
||||
|
||||
for(int i=0; i < topo->total_cores; i++)
|
||||
free(paths[i]);
|
||||
free(paths);
|
||||
|
||||
return ret;
|
||||
}
|
||||
|
||||
// Inspired in is_devtree_compatible from lscpu
|
||||
bool is_devtree_compatible(char* str) {
|
||||
int filelen;
|
||||
char* buf;
|
||||
if((buf = read_file("/proc/device-tree/compatible", &filelen)) == NULL) {
|
||||
return false;
|
||||
}
|
||||
|
||||
char* tmp;
|
||||
if((tmp = strstr(buf, str)) == NULL) {
|
||||
return false;
|
||||
}
|
||||
return true;
|
||||
}
|
||||
|
||||
char* get_devtree_compatible(int *filelen) {
|
||||
char* buf;
|
||||
|
||||
if ((buf = read_file(_PATH_DEVTREE, filelen)) == NULL) {
|
||||
printWarn("read_file: %s: %s", _PATH_DEVTREE, strerror(errno));
|
||||
}
|
||||
|
||||
return buf;
|
||||
}
|
||||
|
||||
@@ -12,6 +12,7 @@
|
||||
|
||||
#include "cpu.h"
|
||||
|
||||
#define _PATH_CPUINFO "/proc/cpuinfo"
|
||||
#define _PATH_SYS_SYSTEM "/sys/devices/system"
|
||||
#define _PATH_SYS_CPU "/cpu"
|
||||
#define _PATH_FREQUENCY "/cpufreq"
|
||||
@@ -23,10 +24,12 @@
|
||||
#define _PATH_CACHE_L3 "/cache/index3"
|
||||
#define _PATH_CACHE_SIZE "/size"
|
||||
#define _PATH_CACHE_SHARED_MAP "/shared_cpu_map"
|
||||
#define _PATH_CPUS_PRESENT _PATH_SYS_SYSTEM _PATH_SYS_CPU "/present"
|
||||
#define _PATH_CPUS_PRESENT _PATH_SYS_SYSTEM _PATH_SYS_CPU "/present"
|
||||
#define _PATH_TOPO_PACKAGE_CPUS "/topology/package_cpus"
|
||||
|
||||
#define _PATH_FREQUENCY_MAX_LEN 100
|
||||
#define _PATH_CACHE_MAX_LEN 200
|
||||
#define _PATH_PACKAGE_MAX_LEN 200
|
||||
|
||||
char* read_file(char* path, int* len);
|
||||
long get_max_freq_from_file(uint32_t core);
|
||||
@@ -36,6 +39,10 @@ long get_l1d_cache_size(uint32_t core);
|
||||
long get_l2_cache_size(uint32_t core);
|
||||
long get_l3_cache_size(uint32_t core);
|
||||
int get_num_caches_by_level(struct cpuInfo* cpu, uint32_t level);
|
||||
int get_ncores_from_cpuinfo();
|
||||
int get_num_sockets_package_cpus(struct topology* topo);
|
||||
int get_ncores_from_cpuinfo(void);
|
||||
char* get_field_from_cpuinfo(char* CPUINFO_FIELD);
|
||||
bool is_devtree_compatible(char* str);
|
||||
char* get_devtree_compatible(int *filelen);
|
||||
|
||||
#endif
|
||||
|
||||
@@ -11,6 +11,20 @@
|
||||
#include "../common/udev.h"
|
||||
#include "../common/global.h"
|
||||
|
||||
static char *hv_vendors_name[] = {
|
||||
[HV_VENDOR_KVM] = "KVM",
|
||||
[HV_VENDOR_QEMU] = "QEMU",
|
||||
[HV_VENDOR_VBOX] = "VirtualBox",
|
||||
[HV_VENDOR_HYPERV] = "Microsoft Hyper-V",
|
||||
[HV_VENDOR_VMWARE] = "VMware",
|
||||
[HV_VENDOR_XEN] = "Xen",
|
||||
[HV_VENDOR_PARALLELS] = "Parallels",
|
||||
[HV_VENDOR_PHYP] = "pHyp",
|
||||
[HV_VENDOR_BHYVE] = "bhyve",
|
||||
[HV_VENDOR_APPLEVZ] = "Apple VZ",
|
||||
[HV_VENDOR_INVALID] = STRING_UNKNOWN
|
||||
};
|
||||
|
||||
struct cache* get_cache_info(struct cpuInfo* cpu) {
|
||||
struct cache* cach = emalloc(sizeof(struct cache));
|
||||
init_cache_struct(cach);
|
||||
@@ -63,23 +77,30 @@ struct topology* get_topology_info(struct cache* cach) {
|
||||
printWarn("fill_core_ids_from_sys failed, output may be incomplete/invalid");
|
||||
for(int i=0; i < topo->total_cores; i++) core_ids[i] = 0;
|
||||
}
|
||||
|
||||
if(!fill_package_ids_from_sys(package_ids, topo->total_cores)) {
|
||||
printWarn("fill_package_ids_from_sys failed, output may be incomplete/invalid");
|
||||
for(int i=0; i < topo->total_cores; i++) package_ids[i] = 0;
|
||||
// fill_package_ids_from_sys failed, use a
|
||||
// more sophisticated wat to find the number of sockets
|
||||
topo->sockets = get_num_sockets_package_cpus(topo);
|
||||
}
|
||||
|
||||
// 2. Socket detection
|
||||
int *package_ids_count = emalloc(sizeof(int) * topo->total_cores);
|
||||
for(int i=0; i < topo->total_cores; i++) {
|
||||
package_ids_count[i] = 0;
|
||||
}
|
||||
for(int i=0; i < topo->total_cores; i++) {
|
||||
package_ids_count[package_ids[i]]++;
|
||||
}
|
||||
for(int i=0; i < topo->total_cores; i++) {
|
||||
if(package_ids_count[i] != 0) {
|
||||
topo->sockets++;
|
||||
else {
|
||||
// fill_package_ids_from_sys succeeded, use the
|
||||
// traditional socket detection algorithm
|
||||
int *package_ids_count = emalloc(sizeof(int) * topo->total_cores);
|
||||
for(int i=0; i < topo->total_cores; i++) {
|
||||
package_ids_count[i] = 0;
|
||||
}
|
||||
for(int i=0; i < topo->total_cores; i++) {
|
||||
package_ids_count[package_ids[i]]++;
|
||||
}
|
||||
for(int i=0; i < topo->total_cores; i++) {
|
||||
if(package_ids_count[i] != 0) {
|
||||
topo->sockets++;
|
||||
}
|
||||
}
|
||||
free(package_ids_count);
|
||||
}
|
||||
|
||||
// 3. Physical cores detection
|
||||
@@ -105,13 +126,12 @@ struct topology* get_topology_info(struct cache* cach) {
|
||||
|
||||
free(core_ids);
|
||||
free(package_ids);
|
||||
free(package_ids_count);
|
||||
free(core_ids_unified);
|
||||
|
||||
return topo;
|
||||
}
|
||||
|
||||
static inline uint32_t mfpvr() {
|
||||
static inline uint32_t mfpvr(void) {
|
||||
uint32_t pvr;
|
||||
|
||||
asm ("mfpvr %0"
|
||||
@@ -123,12 +143,19 @@ struct uarch* get_cpu_uarch(struct cpuInfo* cpu) {
|
||||
return get_uarch_from_pvr(cpu->pvr);
|
||||
}
|
||||
|
||||
struct frequency* get_frequency_info() {
|
||||
struct frequency* get_frequency_info(void) {
|
||||
struct frequency* freq = emalloc(sizeof(struct frequency));
|
||||
|
||||
freq->measured = false;
|
||||
freq->max = get_max_freq_from_file(0);
|
||||
freq->base = get_min_freq_from_file(0);
|
||||
|
||||
if(freq->max == UNKNOWN_DATA) {
|
||||
// If we are unable to find it in the
|
||||
// standard path, try /proc/cpuinfo
|
||||
freq->max = get_frequency_from_cpuinfo();
|
||||
}
|
||||
|
||||
return freq;
|
||||
}
|
||||
|
||||
@@ -158,7 +185,29 @@ int64_t get_peak_performance(struct cpuInfo* cpu, struct topology* topo, int64_t
|
||||
return flops;
|
||||
}
|
||||
|
||||
struct cpuInfo* get_cpu_info() {
|
||||
struct hypervisor* get_hp_info(void) {
|
||||
struct hypervisor* hv = emalloc(sizeof(struct hypervisor));
|
||||
hv->present = false;
|
||||
|
||||
// Weird heuristic found in lscpu:
|
||||
// https://github.com/util-linux/util-linux/blob/master/sys-utils/lscpu-virt.c
|
||||
if(access("/proc" _PATH_DT_IBM_PARTIT_NAME, F_OK) == 0 &&
|
||||
access("/proc" _PATH_DT_HMC_MANAGED, F_OK) == 0 &&
|
||||
access("/proc" _PATH_DT_QEMU_WIDTH, F_OK) != 0) {
|
||||
hv->present = true;
|
||||
hv->hv_vendor = HV_VENDOR_PHYP;
|
||||
}
|
||||
else if(is_devtree_compatible("qemu,pseries")) {
|
||||
hv->present = true;
|
||||
hv->hv_vendor = HV_VENDOR_QEMU;
|
||||
}
|
||||
|
||||
hv->hv_name = hv_vendors_name[hv->hv_vendor];
|
||||
|
||||
return hv;
|
||||
}
|
||||
|
||||
struct cpuInfo* get_cpu_info(void) {
|
||||
struct cpuInfo* cpu = emalloc(sizeof(struct cpuInfo));
|
||||
struct features* feat = emalloc(sizeof(struct features));
|
||||
cpu->feat = feat;
|
||||
@@ -172,8 +221,11 @@ struct cpuInfo* get_cpu_info() {
|
||||
char* path = emalloc(sizeof(char) * (strlen(_PATH_DT) + strlen(_PATH_DT_PART) + 1));
|
||||
sprintf(path, "%s%s", _PATH_DT, _PATH_DT_PART);
|
||||
|
||||
cpu->cpu_name = read_file(path, &len);
|
||||
if((cpu->cpu_name = read_file(path, &len)) == NULL) {
|
||||
printWarn("Could not open '%s'", path);
|
||||
}
|
||||
cpu->pvr = mfpvr();
|
||||
cpu->hv = get_hp_info();
|
||||
cpu->arch = get_cpu_uarch(cpu);
|
||||
cpu->freq = get_frequency_info();
|
||||
cpu->topo = get_topology_info(cpu->cach);
|
||||
|
||||
@@ -3,7 +3,7 @@
|
||||
|
||||
#include "../common/cpu.h"
|
||||
|
||||
struct cpuInfo* get_cpu_info();
|
||||
struct cpuInfo* get_cpu_info(void);
|
||||
char* get_str_altivec(struct cpuInfo* cpu);
|
||||
char* get_str_topology(struct topology* topo, bool dual_socket);
|
||||
void print_debug(struct cpuInfo* cpu);
|
||||
|
||||
@@ -35,6 +35,7 @@ enum {
|
||||
UARCH_POWER7,
|
||||
UARCH_POWER7PLUS,
|
||||
UARCH_POWER8,
|
||||
UARCH_POWER8_DD21,
|
||||
UARCH_POWER9,
|
||||
UARCH_POWER9_DD20,
|
||||
UARCH_POWER9_DD21,
|
||||
@@ -84,6 +85,7 @@ void fill_uarch(struct uarch* arch, MICROARCH u) {
|
||||
FILL_UARCH(arch->uarch, UARCH_POWER7, "POWER7", 45)
|
||||
FILL_UARCH(arch->uarch, UARCH_POWER7PLUS, "POWER7+", 32)
|
||||
FILL_UARCH(arch->uarch, UARCH_POWER8, "POWER8", 22)
|
||||
FILL_UARCH(arch->uarch, UARCH_POWER8_DD21, "POWER8 (DD2.1)", 22)
|
||||
FILL_UARCH(arch->uarch, UARCH_POWER9, "POWER9", 14)
|
||||
FILL_UARCH(arch->uarch, UARCH_POWER9_DD20, "POWER9 (DD2.0)", 14)
|
||||
FILL_UARCH(arch->uarch, UARCH_POWER9_DD21, "POWER9 (DD2.1)", 14)
|
||||
@@ -100,7 +102,19 @@ void fill_uarch(struct uarch* arch, MICROARCH u) {
|
||||
}
|
||||
|
||||
/*
|
||||
* PVR masks/values from arch/powerpc/kernel/cputable.c (Linux kernel)
|
||||
* PVR masks/values from Linux kernel:
|
||||
* - arch/powerpc/kernel/cputable.c (kernel <= 6.0)
|
||||
* - arch/powerpc/kernel/cpu_specs_book3s_64.h (kernel >= 6.1)
|
||||
*
|
||||
* In the kernel, there is a POWER8E identifier. In
|
||||
* https://wiki.raptorcs.com/wiki/POWER8E it says it is
|
||||
* actually DD2.1, while other POWER8 should be DD2.0.
|
||||
* The last assumption does not seem to be correct according
|
||||
* to https://openbenchmarking.org/s/POWER8NVL, which shows a
|
||||
* POWER8NVL where kernel says it is DD1.0. We implement this
|
||||
* to show only the uarch, not the revision, since it seems a bit
|
||||
* redundant?
|
||||
*
|
||||
* This list may be incorrect, incomplete or overly simplified,
|
||||
* specially in the case of 32 bit entries
|
||||
*/
|
||||
@@ -125,7 +139,7 @@ struct uarch* get_uarch_from_pvr(uint32_t pvr) {
|
||||
CHECK_UARCH(arch, pvr, 0xffffffff, 0x0f000006, UARCH_POWER10)
|
||||
CHECK_UARCH(arch, pvr, 0xffff0000, 0x003f0000, UARCH_POWER7)
|
||||
CHECK_UARCH(arch, pvr, 0xffff0000, 0x004A0000, UARCH_POWER7PLUS)
|
||||
CHECK_UARCH(arch, pvr, 0xffff0000, 0x004b0000, UARCH_POWER8)
|
||||
CHECK_UARCH(arch, pvr, 0xffff0000, 0x004b0000, UARCH_POWER8_DD21)
|
||||
CHECK_UARCH(arch, pvr, 0xffff0000, 0x004c0000, UARCH_POWER8)
|
||||
CHECK_UARCH(arch, pvr, 0xffff0000, 0x004d0000, UARCH_POWER8)
|
||||
CHECK_UARCH(arch, pvr, 0xffffefff, 0x004e0200, UARCH_POWER9_DD20)
|
||||
@@ -234,6 +248,7 @@ bool has_altivec(struct uarch* arch) {
|
||||
case UARCH_POWER7:
|
||||
case UARCH_POWER7PLUS:
|
||||
case UARCH_POWER8:
|
||||
case UARCH_POWER8_DD21:
|
||||
case UARCH_POWER9:
|
||||
case UARCH_POWER9_DD20:
|
||||
case UARCH_POWER9_DD21:
|
||||
@@ -265,9 +280,6 @@ char* get_str_process(struct cpuInfo* cpu) {
|
||||
if(process == UNK) {
|
||||
snprintf(str, strlen(STRING_UNKNOWN)+1, STRING_UNKNOWN);
|
||||
}
|
||||
else if(process > 100) {
|
||||
sprintf(str, "%.2fum", (double)process/100);
|
||||
}
|
||||
else if(process > 0){
|
||||
sprintf(str, "%dnm", process);
|
||||
}
|
||||
|
||||
@@ -1,16 +1,19 @@
|
||||
#include <errno.h>
|
||||
|
||||
#include "../common/udev.h"
|
||||
#include "../common/global.h"
|
||||
#include "udev.h"
|
||||
|
||||
#define _PATH_TOPO_CORE_ID "topology/core_id"
|
||||
#define _PATH_TOPO_PACKAGE_ID "topology/physical_package_id"
|
||||
#define _PATH_TOPO_CORE_ID "topology/core_id"
|
||||
#define _PATH_TOPO_PACKAGE_ID "topology/physical_package_id"
|
||||
#define CPUINFO_FREQUENCY_STR "clock\t\t: "
|
||||
|
||||
bool fill_array_from_sys(int *core_ids, int total_cores, char* SYS_PATH) {
|
||||
int filelen;
|
||||
char* buf;
|
||||
char* end;
|
||||
char path[128];
|
||||
memset(path, 0, 128);
|
||||
|
||||
for(int i=0; i < total_cores; i++) {
|
||||
sprintf(path, "%s%s/cpu%d/%s", _PATH_SYS_SYSTEM, _PATH_SYS_CPU, i, SYS_PATH);
|
||||
@@ -36,5 +39,52 @@ bool fill_core_ids_from_sys(int *core_ids, int total_cores) {
|
||||
}
|
||||
|
||||
bool fill_package_ids_from_sys(int* package_ids, int total_cores) {
|
||||
return fill_array_from_sys(package_ids, total_cores, _PATH_TOPO_PACKAGE_ID);
|
||||
bool status = fill_array_from_sys(package_ids, total_cores, _PATH_TOPO_PACKAGE_ID);
|
||||
if(status) {
|
||||
// fill_array_from_sys completed successfully, but we
|
||||
// must to check the integrity of the package_ids array
|
||||
for(int i=0; i < total_cores; i++) {
|
||||
if(package_ids[i] == -1) {
|
||||
printWarn("fill_package_ids_from_sys: package_ids[%d] = -1", i);
|
||||
return false;
|
||||
}
|
||||
else if(package_ids[i] >= total_cores || package_ids[i] < 0) {
|
||||
printBug("fill_package_ids_from_sys: package_ids[%d] = %d", i, package_ids[i]);
|
||||
return false;
|
||||
}
|
||||
}
|
||||
|
||||
return true;
|
||||
}
|
||||
return false;
|
||||
}
|
||||
|
||||
long get_frequency_from_cpuinfo(void) {
|
||||
char* freq_str = get_field_from_cpuinfo(CPUINFO_FREQUENCY_STR);
|
||||
if(freq_str == NULL) {
|
||||
return UNKNOWN_DATA;
|
||||
}
|
||||
else {
|
||||
// freq_str should be in the form XXXX.YYYYYYMHz
|
||||
char* dot = strstr(freq_str, ".");
|
||||
freq_str[dot-freq_str] = '\0';
|
||||
|
||||
char* end;
|
||||
errno = 0;
|
||||
long ret = strtol(freq_str, &end, 10);
|
||||
if(errno != 0) {
|
||||
printBug("strtol: %s", strerror(errno));
|
||||
free(freq_str);
|
||||
return UNKNOWN_DATA;
|
||||
}
|
||||
|
||||
// We consider it an error if frequency is
|
||||
// greater than 10 GHz or less than 100 MHz
|
||||
if(ret > 10000 || ret < 100) {
|
||||
printBug("Invalid data was read from file '%s': %ld\n", CPUINFO_FREQUENCY_STR, ret);
|
||||
return UNKNOWN_DATA;
|
||||
}
|
||||
|
||||
return ret;
|
||||
}
|
||||
}
|
||||
|
||||
@@ -2,10 +2,15 @@
|
||||
#define __UDEV_PPC__
|
||||
|
||||
#include "../common/udev.h"
|
||||
#define _PATH_DT "/proc/device-tree/vpd/root-node-vpd@a000/enclosure@1e00/backplane@800/processor@1000"
|
||||
#define _PATH_DT_PART "/part-number"
|
||||
#define _PATH_DT "/proc/device-tree/vpd/root-node-vpd@a000/enclosure@1e00/backplane@800/processor@1000"
|
||||
#define _PATH_DT_PART "/part-number"
|
||||
#define _PATH_DT_IBM_PARTIT_NAME "/device-tree/ibm,partition-name"
|
||||
#define _PATH_DT_HMC_MANAGED "/device-tree/hmc-managed?"
|
||||
#define _PATH_DT_QEMU_WIDTH "/device-tree/chosen/qemu,graphic-width"
|
||||
|
||||
bool fill_core_ids_from_sys(int *core_ids, int total_cores);
|
||||
bool fill_package_ids_from_sys(int* package_ids, int total_cores);
|
||||
int get_num_sockets_package_cpus(struct topology* topo);
|
||||
long get_frequency_from_cpuinfo(void);
|
||||
|
||||
#endif
|
||||
|
||||
207
src/riscv/riscv.c
Normal file
207
src/riscv/riscv.c
Normal file
@@ -0,0 +1,207 @@
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
#include <string.h>
|
||||
#include <ctype.h>
|
||||
|
||||
#include "../common/global.h"
|
||||
#include "../common/udev.h"
|
||||
#include "udev.h"
|
||||
#include "uarch.h"
|
||||
#include "soc.h"
|
||||
|
||||
#define SET_ISA_EXT_MAP(name, bit) \
|
||||
if(strncmp(multi_letter_extension, name, \
|
||||
multi_letter_extension_len) == 0) { \
|
||||
ext->mask |= 1UL << bit; \
|
||||
maskset = true; \
|
||||
} \
|
||||
|
||||
struct frequency* get_frequency_info(uint32_t core) {
|
||||
struct frequency* freq = emalloc(sizeof(struct frequency));
|
||||
|
||||
freq->measured = false;
|
||||
freq->base = UNKNOWN_DATA;
|
||||
freq->max = get_max_freq_from_file(core);
|
||||
|
||||
return freq;
|
||||
}
|
||||
|
||||
int64_t get_peak_performance(struct cpuInfo* cpu) {
|
||||
//First check we have consistent data
|
||||
if(get_freq(cpu->freq) == UNKNOWN_DATA) {
|
||||
return -1;
|
||||
}
|
||||
|
||||
int64_t flops = cpu->topo->total_cores * (get_freq(cpu->freq) * 1000000);
|
||||
return flops;
|
||||
}
|
||||
|
||||
// Returns the length of the multi-letter
|
||||
// extension, or -1 if an error occurs
|
||||
int parse_multi_letter_extension(struct extensions* ext, char* e) {
|
||||
if(*e != '_') return -1;
|
||||
char* multi_letter_extension_end = strstr(e+1, "_");
|
||||
if(multi_letter_extension_end == NULL) {
|
||||
// This is the last extension, find the end
|
||||
// of the string
|
||||
multi_letter_extension_end = e + strlen(e);
|
||||
}
|
||||
|
||||
int multi_letter_extension_len = multi_letter_extension_end-(e+1);
|
||||
bool maskset = false;
|
||||
char* multi_letter_extension = emalloc(multi_letter_extension_len);
|
||||
strncpy(multi_letter_extension, e+1, multi_letter_extension_len);
|
||||
// This should be up-to-date with
|
||||
// https://elixir.bootlin.com/linux/latest/source/arch/riscv/kernel/cpufeature.c
|
||||
// which should represent the list of extensions available in real chips
|
||||
SET_ISA_EXT_MAP("sscofpmf", RISCV_ISA_EXT_SSCOFPMF)
|
||||
SET_ISA_EXT_MAP("sstc", RISCV_ISA_EXT_SSTC)
|
||||
SET_ISA_EXT_MAP("svinval", RISCV_ISA_EXT_SVINVAL)
|
||||
SET_ISA_EXT_MAP("svpbmt", RISCV_ISA_EXT_SVPBMT)
|
||||
SET_ISA_EXT_MAP("zbb", RISCV_ISA_EXT_ZBB)
|
||||
SET_ISA_EXT_MAP("zicbom", RISCV_ISA_EXT_ZICBOM)
|
||||
SET_ISA_EXT_MAP("zihintpause", RISCV_ISA_EXT_ZIHINTPAUSE)
|
||||
SET_ISA_EXT_MAP("svnapot", RISCV_ISA_EXT_SVNAPOT)
|
||||
SET_ISA_EXT_MAP("zicboz", RISCV_ISA_EXT_ZICBOZ)
|
||||
SET_ISA_EXT_MAP("smaia", RISCV_ISA_EXT_SMAIA)
|
||||
SET_ISA_EXT_MAP("ssaia", RISCV_ISA_EXT_SSAIA)
|
||||
SET_ISA_EXT_MAP("zba", RISCV_ISA_EXT_ZBA)
|
||||
SET_ISA_EXT_MAP("zbs", RISCV_ISA_EXT_ZBS)
|
||||
SET_ISA_EXT_MAP("zicntr", RISCV_ISA_EXT_ZICNTR)
|
||||
SET_ISA_EXT_MAP("zicsr", RISCV_ISA_EXT_ZICSR)
|
||||
SET_ISA_EXT_MAP("zifencei", RISCV_ISA_EXT_ZIFENCEI)
|
||||
SET_ISA_EXT_MAP("zihpm", RISCV_ISA_EXT_ZIHPM)
|
||||
if(!maskset) {
|
||||
printBug("parse_multi_letter_extension: Unknown multi-letter extension: %s", multi_letter_extension);
|
||||
return -1;
|
||||
}
|
||||
|
||||
return multi_letter_extension_len;
|
||||
}
|
||||
|
||||
bool valid_extension(char ext) {
|
||||
bool found = false;
|
||||
uint64_t idx = 0;
|
||||
|
||||
while(idx < sizeof(extension_list)/sizeof(extension_list[0]) && !found) {
|
||||
found = (extension_list[idx].id == (ext - 'a'));
|
||||
if(!found) idx++;
|
||||
}
|
||||
|
||||
return found;
|
||||
}
|
||||
|
||||
struct extensions* get_extensions_from_str(char* str) {
|
||||
struct extensions* ext = emalloc(sizeof(struct extensions));
|
||||
ext->mask = 0;
|
||||
ext->str = NULL;
|
||||
|
||||
if(str == NULL) {
|
||||
return ext;
|
||||
}
|
||||
|
||||
int len = sizeof(char) * (strlen(str)+1);
|
||||
ext->str = emalloc(sizeof(char) * len);
|
||||
memset(ext->str, 0, len);
|
||||
strncpy(ext->str, str, sizeof(char) * len);
|
||||
|
||||
// Code inspired in Linux kernel (riscv_fill_hwcap):
|
||||
// https://elixir.bootlin.com/linux/v6.2.10/source/arch/riscv/kernel/cpufeature.c
|
||||
char* isa = str;
|
||||
if (!strncmp(isa, "rv32", 4))
|
||||
isa += 4;
|
||||
else if (!strncmp(isa, "rv64", 4))
|
||||
isa += 4;
|
||||
else {
|
||||
printBug("get_extensions_from_str: ISA string must start with rv64 or rv32");
|
||||
return ext;
|
||||
}
|
||||
|
||||
for(char* e = isa; *e != '\0'; e++) {
|
||||
if(*e == '_') {
|
||||
// Multi-letter extension
|
||||
int multi_letter_extension_len = parse_multi_letter_extension(ext, e);
|
||||
if(multi_letter_extension_len == -1) {
|
||||
return ext;
|
||||
}
|
||||
e += multi_letter_extension_len;
|
||||
}
|
||||
else {
|
||||
// Single-letter extensions 's' and 'u' are invalid
|
||||
// according to Linux kernel (arch/riscv/kernel/cpufeature.c:
|
||||
// riscv_fill_hwcap). Optionally, we could opt for using
|
||||
// hwcap instead of cpuinfo to avoid this
|
||||
if (*e == 's' || *e == 'u') {
|
||||
continue;
|
||||
}
|
||||
// Make sure that the extension is valid before
|
||||
// adding it to the mask
|
||||
if(valid_extension(*e)) {
|
||||
int n = *e - 'a';
|
||||
ext->mask |= 1UL << n;
|
||||
}
|
||||
else {
|
||||
printBug("get_extensions_from_str: Invalid extension: '%c'", *e);
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
return ext;
|
||||
}
|
||||
|
||||
struct cpuInfo* get_cpu_info(void) {
|
||||
struct cpuInfo* cpu = malloc(sizeof(struct cpuInfo));
|
||||
//init_cpu_info(cpu);
|
||||
struct topology* topo = emalloc(sizeof(struct topology));
|
||||
topo->total_cores = get_ncores_from_cpuinfo();
|
||||
topo->cach = NULL;
|
||||
cpu->topo = topo;
|
||||
|
||||
char* cpuinfo_str = get_uarch_from_cpuinfo();
|
||||
char* ext_str = get_extensions_from_cpuinfo();
|
||||
cpu->hv = emalloc(sizeof(struct hypervisor));
|
||||
cpu->hv->present = false;
|
||||
cpu->ext = get_extensions_from_str(ext_str);
|
||||
if(cpu->ext->str != NULL && cpu->ext->mask == 0) return NULL;
|
||||
cpu->arch = get_uarch_from_cpuinfo_str(cpuinfo_str, cpu);
|
||||
cpu->soc = get_soc(cpu);
|
||||
cpu->freq = get_frequency_info(0);
|
||||
cpu->peak_performance = get_peak_performance(cpu);
|
||||
|
||||
return cpu;
|
||||
}
|
||||
|
||||
//TODO: Might be worth refactoring with other archs
|
||||
char* get_str_topology(struct cpuInfo* cpu, struct topology* topo) {
|
||||
uint32_t size = 3+7+1;
|
||||
char* string = emalloc(sizeof(char)*size);
|
||||
snprintf(string, size, "%d cores", topo->total_cores);
|
||||
|
||||
return string;
|
||||
}
|
||||
|
||||
char* get_str_extensions(struct cpuInfo* cpu) {
|
||||
if(cpu->ext != NULL) {
|
||||
return cpu->ext->str;
|
||||
}
|
||||
return NULL;
|
||||
}
|
||||
|
||||
void print_debug(struct cpuInfo* cpu) {
|
||||
printf("- soc: ");
|
||||
if(cpu->soc->raw_name == NULL) {
|
||||
printf("NULL\n");
|
||||
}
|
||||
else {
|
||||
printf("'%s'\n", cpu->soc->raw_name);
|
||||
}
|
||||
|
||||
printf("- uarch: ");
|
||||
char* arch_cpuinfo_str = get_arch_cpuinfo_str(cpu);
|
||||
if(arch_cpuinfo_str == NULL) {
|
||||
printf("NULL\n");
|
||||
}
|
||||
else {
|
||||
printf("'%s'\n", arch_cpuinfo_str);
|
||||
}
|
||||
}
|
||||
82
src/riscv/riscv.h
Normal file
82
src/riscv/riscv.h
Normal file
@@ -0,0 +1,82 @@
|
||||
#ifndef __RISCV__
|
||||
#define __RISCV__
|
||||
|
||||
#include "../common/cpu.h"
|
||||
|
||||
struct extension {
|
||||
int id;
|
||||
char* str;
|
||||
};
|
||||
|
||||
#define RISCV_ISA_EXT_NAME_LEN_MAX 32
|
||||
#define RISCV_ISA_EXT_BASE 26
|
||||
|
||||
// https://elixir.bootlin.com/linux/latest/source/arch/riscv/include/asm/hwcap.h
|
||||
// This enum represent the logical ID for multi-letter RISC-V ISA extensions.
|
||||
// The logical ID should start from RISCV_ISA_EXT_BASE
|
||||
enum riscv_isa_ext_id {
|
||||
RISCV_ISA_EXT_SSCOFPMF = RISCV_ISA_EXT_BASE,
|
||||
RISCV_ISA_EXT_SSTC,
|
||||
RISCV_ISA_EXT_SVINVAL,
|
||||
RISCV_ISA_EXT_SVPBMT,
|
||||
RISCV_ISA_EXT_ZBB,
|
||||
RISCV_ISA_EXT_ZICBOM,
|
||||
RISCV_ISA_EXT_ZIHINTPAUSE,
|
||||
RISCV_ISA_EXT_SVNAPOT,
|
||||
RISCV_ISA_EXT_ZICBOZ,
|
||||
RISCV_ISA_EXT_SMAIA,
|
||||
RISCV_ISA_EXT_SSAIA,
|
||||
RISCV_ISA_EXT_ZBA,
|
||||
RISCV_ISA_EXT_ZBS,
|
||||
RISCV_ISA_EXT_ZICNTR,
|
||||
RISCV_ISA_EXT_ZICSR,
|
||||
RISCV_ISA_EXT_ZIFENCEI,
|
||||
RISCV_ISA_EXT_ZIHPM,
|
||||
RISCV_ISA_EXT_ID_MAX
|
||||
};
|
||||
|
||||
// https://five-embeddev.com/riscv-isa-manual/latest/preface.html#preface
|
||||
// https://en.wikichip.org/wiki/risc-v/standard_extensions
|
||||
// Included all except for G
|
||||
static const struct extension extension_list[] = {
|
||||
{ 'i' - 'a', "(I) Integer Instruction Set" },
|
||||
{ 'm' - 'a', "(M) Integer Multiplication and Division" },
|
||||
{ 'a' - 'a', "(A) Atomic Instructions" },
|
||||
{ 'f' - 'a', "(F) Single-Precision Floating-Point" },
|
||||
{ 'd' - 'a', "(D) Double-Precision Floating-Point" },
|
||||
{ 'q' - 'a', "(Q) Quad-Precision Floating-Point" },
|
||||
{ 'l' - 'a', "(L) Decimal Floating-Point" },
|
||||
{ 'c' - 'a', "(C) Compressed Instructions" },
|
||||
{ 'b' - 'a', "(B) Double-Precision Floating-Point" },
|
||||
{ 'j' - 'a', "(J) Dynamically Translated Languages" },
|
||||
{ 't' - 'a', "(T) Transactional Memory" },
|
||||
{ 'p' - 'a', "(P) Packed-SIMD Instructions" },
|
||||
{ 'v' - 'a', "(V) Vector Operations" },
|
||||
{ 'n' - 'a', "(N) User-Level Interrupts" },
|
||||
{ 'h' - 'a', "(H) Hypervisor" },
|
||||
// multi-letter extensions
|
||||
{ RISCV_ISA_EXT_SSCOFPMF, "(Sscofpmf) Count OverFlow and Privilege Mode Filtering" },
|
||||
{ RISCV_ISA_EXT_SSTC, "(Sstc) S and VS level Time Compare" },
|
||||
{ RISCV_ISA_EXT_SVINVAL, "(Svinval) Fast TLB Invalidation" },
|
||||
{ RISCV_ISA_EXT_SVPBMT, "(Svpbmt) Page-based Memory Types" },
|
||||
{ RISCV_ISA_EXT_ZBB, "(Zbb) Basic bit-manipulation" },
|
||||
{ RISCV_ISA_EXT_ZICBOM, "(Zicbom) Cache Block Management Operations" },
|
||||
{ RISCV_ISA_EXT_ZIHINTPAUSE, "(Zihintpause) Pause Hint" },
|
||||
{ RISCV_ISA_EXT_SVNAPOT, "(Svnapot) Naturally Aligned Power of Two Pages" },
|
||||
{ RISCV_ISA_EXT_ZICBOZ, "(Zicboz) Cache Block Zero Operations" },
|
||||
{ RISCV_ISA_EXT_SMAIA, "(Smaia) Advanced Interrupt Architecture" },
|
||||
{ RISCV_ISA_EXT_SSAIA, "(Ssaia) Advanced Interrupt Architecture" },
|
||||
{ RISCV_ISA_EXT_ZBA, "(Zba) Address Generation" },
|
||||
{ RISCV_ISA_EXT_ZBS, "(Zbs) Single-bit Instructions" },
|
||||
{ RISCV_ISA_EXT_ZICNTR, "(Zicntr) Base Counters and Timers" },
|
||||
{ RISCV_ISA_EXT_ZICSR, "(Zicsr) Control and Status Register" },
|
||||
{ RISCV_ISA_EXT_ZIFENCEI, "(Zifencei) Instruction-Fetch Fence" },
|
||||
{ RISCV_ISA_EXT_ZIHPM, "(Zihpm) Hardware Performance Counters" }
|
||||
};
|
||||
|
||||
struct cpuInfo* get_cpu_info(void);
|
||||
char* get_str_topology(struct cpuInfo* cpu, struct topology* topo);
|
||||
char* get_str_extensions(struct cpuInfo* cpu);
|
||||
void print_debug(struct cpuInfo* cpu);
|
||||
|
||||
#endif
|
||||
93
src/riscv/soc.c
Normal file
93
src/riscv/soc.c
Normal file
@@ -0,0 +1,93 @@
|
||||
#include "soc.h"
|
||||
#include "socs.h"
|
||||
#include "udev.h"
|
||||
#include "../common/global.h"
|
||||
|
||||
#include <string.h>
|
||||
|
||||
bool match_sifive(char* soc_name, struct system_on_chip* soc) {
|
||||
char* tmp = soc_name;
|
||||
|
||||
// Dont know if it makes sense in RISC-V
|
||||
/*if((tmp = strstr(soc_name, "???")) == NULL)
|
||||
return false;*/
|
||||
|
||||
//soc->soc_vendor = ???
|
||||
|
||||
SOC_START
|
||||
SOC_EQ(tmp, "fu740", "Freedom U740", SOC_SIFIVE_U740, soc, 40)
|
||||
SOC_END
|
||||
}
|
||||
|
||||
bool match_starfive(char* soc_name, struct system_on_chip* soc) {
|
||||
SOC_START
|
||||
SOC_EQ(soc_name, "jh7110#", "VisionFive 2", SOC_STARFIVE_VF2, soc, 28) // https://blog.bitsofnetworks.org/benchmarking-risc-v-visionfive-2-vs-the-world.html
|
||||
SOC_EQ(soc_name, "jh7110", "VisionFive 2", SOC_STARFIVE_VF2, soc, 28)
|
||||
SOC_END
|
||||
}
|
||||
|
||||
bool match_allwinner(char* soc_name, struct system_on_chip* soc) {
|
||||
SOC_START
|
||||
SOC_EQ(soc_name, "sun20i-d1", "D1-H", SOC_ALLWINNER_D1H, soc, 22)
|
||||
SOC_END
|
||||
}
|
||||
|
||||
bool match_sipeed(char* soc_name, struct system_on_chip* soc) {
|
||||
SOC_START
|
||||
SOC_EQ(soc_name, "light", "Lichee Pi 4A", SOC_SIPEED_LICHEEPI4A, soc, 12) // https://github.com/Dr-Noob/cpufetch/issues/200, https://sipeed.com/licheepi4a
|
||||
SOC_END
|
||||
}
|
||||
|
||||
struct system_on_chip* parse_soc_from_string(struct system_on_chip* soc) {
|
||||
char* raw_name = soc->raw_name;
|
||||
|
||||
if(match_starfive(raw_name, soc))
|
||||
return soc;
|
||||
|
||||
if(match_allwinner(raw_name, soc))
|
||||
return soc;
|
||||
|
||||
if(match_sifive(raw_name, soc))
|
||||
return soc;
|
||||
|
||||
match_sipeed(raw_name, soc);
|
||||
return soc;
|
||||
}
|
||||
|
||||
struct system_on_chip* guess_soc_from_devtree(struct system_on_chip* soc) {
|
||||
char* tmp = get_hardware_from_devtree();
|
||||
|
||||
if(tmp != NULL) {
|
||||
soc->raw_name = tmp;
|
||||
return parse_soc_from_string(soc);
|
||||
}
|
||||
|
||||
return soc;
|
||||
}
|
||||
|
||||
struct system_on_chip* get_soc(struct cpuInfo* cpu) {
|
||||
struct system_on_chip* soc = emalloc(sizeof(struct system_on_chip));
|
||||
soc->raw_name = NULL;
|
||||
soc->soc_vendor = SOC_VENDOR_UNKNOWN;
|
||||
soc->soc_model = SOC_MODEL_UNKNOWN;
|
||||
soc->process = UNKNOWN;
|
||||
|
||||
soc = guess_soc_from_devtree(soc);
|
||||
if(soc->soc_vendor == SOC_VENDOR_UNKNOWN) {
|
||||
if(soc->raw_name != NULL) {
|
||||
printWarn("SoC detection failed using device tree: Found '%s' string", soc->raw_name);
|
||||
}
|
||||
else {
|
||||
printWarn("SoC detection failed using device tree");
|
||||
}
|
||||
}
|
||||
|
||||
if(soc->soc_model == SOC_MODEL_UNKNOWN) {
|
||||
// raw_name might not be NULL, but if we were unable to find
|
||||
// the exact SoC, just print "Unkwnown"
|
||||
soc->raw_name = emalloc(sizeof(char) * (strlen(STRING_UNKNOWN)+1));
|
||||
snprintf(soc->raw_name, strlen(STRING_UNKNOWN)+1, STRING_UNKNOWN);
|
||||
}
|
||||
|
||||
return soc;
|
||||
}
|
||||
10
src/riscv/soc.h
Normal file
10
src/riscv/soc.h
Normal file
@@ -0,0 +1,10 @@
|
||||
#ifndef __SOC_RISCV__
|
||||
#define __SOC_RISCV__
|
||||
|
||||
#include "../common/soc.h"
|
||||
#include "../common/cpu.h"
|
||||
#include <stdint.h>
|
||||
|
||||
struct system_on_chip* get_soc(struct cpuInfo* cpu);
|
||||
|
||||
#endif
|
||||
28
src/riscv/socs.h
Normal file
28
src/riscv/socs.h
Normal file
@@ -0,0 +1,28 @@
|
||||
#ifndef __SOCS__
|
||||
#define __SOCS__
|
||||
|
||||
#include "soc.h"
|
||||
|
||||
// List of supported SOCs
|
||||
enum {
|
||||
// SIFIVE
|
||||
SOC_SIFIVE_U740,
|
||||
// STARFIVE
|
||||
SOC_STARFIVE_VF2,
|
||||
// ALLWINNER
|
||||
SOC_ALLWINNER_D1H,
|
||||
// SIPEED
|
||||
SOC_SIPEED_LICHEEPI4A,
|
||||
// UNKNOWN
|
||||
SOC_MODEL_UNKNOWN
|
||||
};
|
||||
|
||||
inline static VENDOR get_soc_vendor_from_soc(SOC soc) {
|
||||
if(soc >= SOC_SIFIVE_U740 && soc <= SOC_SIFIVE_U740) return SOC_VENDOR_SIFIVE;
|
||||
if(soc >= SOC_STARFIVE_VF2 && soc <= SOC_STARFIVE_VF2) return SOC_VENDOR_STARFIVE;
|
||||
if(soc >= SOC_ALLWINNER_D1H && soc <= SOC_ALLWINNER_D1H) return SOC_VENDOR_ALLWINNER;
|
||||
if(soc >= SOC_SIPEED_LICHEEPI4A && soc <= SOC_SIPEED_LICHEEPI4A) return SOC_VENDOR_SIPEED;
|
||||
return SOC_VENDOR_UNKNOWN;
|
||||
}
|
||||
|
||||
#endif
|
||||
84
src/riscv/uarch.c
Normal file
84
src/riscv/uarch.c
Normal file
@@ -0,0 +1,84 @@
|
||||
#include <stdbool.h>
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
#include <string.h>
|
||||
|
||||
#include "uarch.h"
|
||||
#include "../common/global.h"
|
||||
|
||||
typedef uint32_t MICROARCH;
|
||||
|
||||
struct uarch {
|
||||
MICROARCH uarch;
|
||||
char* uarch_str;
|
||||
char* cpuinfo_str;
|
||||
};
|
||||
|
||||
enum {
|
||||
UARCH_UNKNOWN,
|
||||
// SIFIVE
|
||||
UARCH_U54,
|
||||
UARCH_U74,
|
||||
// THEAD
|
||||
UARCH_C906,
|
||||
UARCH_C910
|
||||
};
|
||||
|
||||
#define UARCH_START if (false) {}
|
||||
#define CHECK_UARCH(arch, cpu, cpuinfo_str, uarch_str, str, uarch, vendor) \
|
||||
else if (strcmp(cpuinfo_str, uarch_str) == 0) fill_uarch(arch, cpu, str, uarch, vendor);
|
||||
#define UARCH_END else { printBug("Unknown microarchitecture detected: uarch='%s'", cpuinfo_str); fill_uarch(arch, cpu, "Unknown", UARCH_UNKNOWN, CPU_VENDOR_UNKNOWN); }
|
||||
|
||||
void fill_uarch(struct uarch* arch, struct cpuInfo* cpu, char* str, MICROARCH u, VENDOR vendor) {
|
||||
arch->uarch = u;
|
||||
cpu->cpu_vendor = vendor;
|
||||
arch->uarch_str = emalloc(sizeof(char) * (strlen(str)+1));
|
||||
strcpy(arch->uarch_str, str);
|
||||
}
|
||||
|
||||
// https://elixir.bootlin.com/linux/latest/source/Documentation/devicetree/bindings/riscv/cpus.yaml
|
||||
// SiFive: https://www.sifive.com/risc-v-core-ip
|
||||
// T-Head: https://www.t-head.cn/product/c906
|
||||
struct uarch* get_uarch_from_cpuinfo_str(char* cpuinfo_str, struct cpuInfo* cpu) {
|
||||
struct uarch* arch = emalloc(sizeof(struct uarch));
|
||||
arch->cpuinfo_str = cpuinfo_str;
|
||||
if(cpuinfo_str == NULL) {
|
||||
printWarn("get_uarch_from_cpuinfo: Unable to detect microarchitecture, cpuinfo_str is NULL");
|
||||
fill_uarch(arch, cpu, "Unknown", UARCH_UNKNOWN, CPU_VENDOR_UNKNOWN);
|
||||
return arch;
|
||||
}
|
||||
|
||||
// U74/U74-MC:
|
||||
// SiFive says that U74-MC is "Multicore: four U74 cores and one S76 core" while
|
||||
// U74 is "High performance Linux-capable processor". It's like U74-MC is somehow a small SoC containing
|
||||
// the U74 and the S76? Then U74-MC is not a microarchitecture per se...
|
||||
UARCH_START
|
||||
CHECK_UARCH(arch, cpu, cpuinfo_str, "sifive,bullet0", "U74", UARCH_U74, CPU_VENDOR_SIFIVE) // bullet0 is present in U740, which has U74
|
||||
// CHECK_UARCH(arch, cpu, cpuinfo_str, "sifive,e5", "XXXXXX", UARCH_U74, CPU_VENDOR_SIFIVE)
|
||||
// CHECK_UARCH(arch, cpu, cpuinfo_str, "sifive,e7", "XXXXXX", UARCH_U74, CPU_VENDOR_SIFIVE)
|
||||
// CHECK_UARCH(arch, cpu, cpuinfo_str, "sifive,e71", "XXXXXX", UARCH_U74, CPU_VENDOR_SIFIVE)
|
||||
// CHECK_UARCH(arch, cpu, cpuinfo_str, "sifive,rocket0", "XXXXXX", UARCH_U74, CPU_VENDOR_SIFIVE)
|
||||
// CHECK_UARCH(arch, cpu, cpuinfo_str, "sifive,u5", "XXXXXX", UARCH_U74, CPU_VENDOR_SIFIVE)
|
||||
CHECK_UARCH(arch, cpu, cpuinfo_str, "sifive,u54", "U54", UARCH_U54, CPU_VENDOR_SIFIVE)
|
||||
// CHECK_UARCH(arch, cpu, cpuinfo_str, "sifive,u7", "XXXXXX", UARCH_U74, CPU_VENDOR_SIFIVE)
|
||||
CHECK_UARCH(arch, cpu, cpuinfo_str, "sifive,u74", "U74", UARCH_U74, CPU_VENDOR_SIFIVE)
|
||||
CHECK_UARCH(arch, cpu, cpuinfo_str, "sifive,u74-mc", "U74", UARCH_U74, CPU_VENDOR_SIFIVE)
|
||||
CHECK_UARCH(arch, cpu, cpuinfo_str, "thead,c906", "T-Head C906", UARCH_C906, CPU_VENDOR_THEAD)
|
||||
CHECK_UARCH(arch, cpu, cpuinfo_str, "thead,c910", "T-Head C910", UARCH_C910, CPU_VENDOR_THEAD)
|
||||
UARCH_END
|
||||
|
||||
return arch;
|
||||
}
|
||||
|
||||
char* get_str_uarch(struct cpuInfo* cpu) {
|
||||
return cpu->arch->uarch_str;
|
||||
}
|
||||
|
||||
char* get_arch_cpuinfo_str(struct cpuInfo* cpu) {
|
||||
return cpu->arch->cpuinfo_str;
|
||||
}
|
||||
|
||||
void free_uarch_struct(struct uarch* arch) {
|
||||
free(arch->uarch_str);
|
||||
free(arch);
|
||||
}
|
||||
14
src/riscv/uarch.h
Normal file
14
src/riscv/uarch.h
Normal file
@@ -0,0 +1,14 @@
|
||||
#ifndef __UARCH__
|
||||
#define __UARCH__
|
||||
|
||||
#include <stdint.h>
|
||||
#include "riscv.h"
|
||||
|
||||
struct uarch;
|
||||
|
||||
char* get_arch_cpuinfo_str(struct cpuInfo* cpu);
|
||||
char* get_str_uarch(struct cpuInfo* cpu);
|
||||
void free_uarch_struct(struct uarch* arch);
|
||||
struct uarch* get_uarch_from_cpuinfo_str(char* cpuinfo_str, struct cpuInfo* cpu);
|
||||
|
||||
#endif
|
||||
91
src/riscv/udev.c
Normal file
91
src/riscv/udev.c
Normal file
@@ -0,0 +1,91 @@
|
||||
#include <errno.h>
|
||||
#include <string.h>
|
||||
|
||||
#include "../common/global.h"
|
||||
#include "udev.h"
|
||||
|
||||
#define _PATH_DEVTREE "/proc/device-tree/compatible"
|
||||
#define CPUINFO_UARCH_STR "uarch\t\t: "
|
||||
#define CPUINFO_EXTENSIONS_STR "isa\t\t: "
|
||||
#define DEVTREE_HARDWARE_FIELD 0
|
||||
|
||||
char* get_field_from_devtree(int DEVTREE_FIELD) {
|
||||
int filelen;
|
||||
char* buf;
|
||||
if((buf = read_file(_PATH_DEVTREE, &filelen)) == NULL) {
|
||||
printWarn("read_file: %s: %s", _PATH_DEVTREE, strerror(errno));
|
||||
return NULL;
|
||||
}
|
||||
|
||||
// Here we would use strstr to find the comma.
|
||||
// However, the device-tree file may contain NULL
|
||||
// bytes in the middle of the string, which would
|
||||
// cause strstr to return NULL even when there might
|
||||
// be an occurence after the NULL byte
|
||||
//
|
||||
// We iterate the string backwards to find the field
|
||||
// in position n-DEVTREE_HARDWARE_FIELD where n
|
||||
// is the number of fields.
|
||||
int i=0;
|
||||
char* tmp1 = buf+filelen-1;
|
||||
do {
|
||||
tmp1--;
|
||||
if(*tmp1 == ',') i++;
|
||||
} while(tmp1 != buf && i <= DEVTREE_FIELD);
|
||||
|
||||
if(tmp1 == buf) {
|
||||
printWarn("get_field_from_devtree: Unable to find field %d", DEVTREE_FIELD);
|
||||
return NULL;
|
||||
}
|
||||
|
||||
tmp1++;
|
||||
int strlen = filelen-(tmp1-buf);
|
||||
char* hardware = emalloc(sizeof(char) * strlen);
|
||||
memset(hardware, 0, sizeof(char) * strlen);
|
||||
strncpy(hardware, tmp1, strlen-1);
|
||||
|
||||
return hardware;
|
||||
}
|
||||
|
||||
char* parse_cpuinfo_field(char* field_str) {
|
||||
int filelen;
|
||||
char* buf;
|
||||
if((buf = read_file(_PATH_CPUINFO, &filelen)) == NULL) {
|
||||
printWarn("read_file: %s: %s", _PATH_CPUINFO, strerror(errno));
|
||||
return NULL;
|
||||
}
|
||||
|
||||
char* tmp = strstr(buf, field_str);
|
||||
if(tmp == NULL) {
|
||||
printWarn("parse_cpuinfo_field: Unable to find field %s", field_str);
|
||||
return NULL;
|
||||
}
|
||||
|
||||
tmp += strlen(field_str);
|
||||
char* end = strstr(tmp, "\n");
|
||||
|
||||
if(end == NULL) {
|
||||
printWarn("parse_cpuinfo_field: Unable to find newline after field %s", field_str);
|
||||
return NULL;
|
||||
}
|
||||
|
||||
int ret_strlen = (end-tmp);
|
||||
char* ret = emalloc(sizeof(char) * (ret_strlen+1));
|
||||
memset(ret, 0, sizeof(char) * (ret_strlen+1));
|
||||
strncpy(ret, tmp, ret_strlen);
|
||||
|
||||
return ret;
|
||||
}
|
||||
|
||||
char* get_hardware_from_devtree(void) {
|
||||
return get_field_from_devtree(DEVTREE_HARDWARE_FIELD);
|
||||
}
|
||||
|
||||
char* get_uarch_from_cpuinfo(void) {
|
||||
return parse_cpuinfo_field(CPUINFO_UARCH_STR);
|
||||
}
|
||||
|
||||
char* get_extensions_from_cpuinfo(void) {
|
||||
return parse_cpuinfo_field(CPUINFO_EXTENSIONS_STR);
|
||||
}
|
||||
|
||||
12
src/riscv/udev.h
Normal file
12
src/riscv/udev.h
Normal file
@@ -0,0 +1,12 @@
|
||||
#ifndef __UDEV_RISCV__
|
||||
#define __UDEV_RISCV__
|
||||
|
||||
#include "../common/udev.h"
|
||||
|
||||
#define UNKNOWN -1
|
||||
|
||||
char* get_hardware_from_devtree(void);
|
||||
char* get_uarch_from_cpuinfo(void);
|
||||
char* get_extensions_from_cpuinfo(void);
|
||||
|
||||
#endif
|
||||
@@ -72,34 +72,6 @@ uint32_t get_apic_id(bool x2apic_id) {
|
||||
}
|
||||
}
|
||||
|
||||
#ifndef __APPLE__
|
||||
bool bind_to_cpu(int cpu_id) {
|
||||
#ifdef _WIN32
|
||||
HANDLE process = GetCurrentProcess();
|
||||
DWORD_PTR processAffinityMask = 1 << cpu_id;
|
||||
return SetProcessAffinityMask(process, processAffinityMask);
|
||||
#elif defined __linux__
|
||||
cpu_set_t currentCPU;
|
||||
CPU_ZERO(¤tCPU);
|
||||
CPU_SET(cpu_id, ¤tCPU);
|
||||
if (sched_setaffinity (0, sizeof(currentCPU), ¤tCPU) == -1) {
|
||||
printWarn("sched_setaffinity: %s", strerror(errno));
|
||||
return false;
|
||||
}
|
||||
return true;
|
||||
#elif defined __FreeBSD__
|
||||
cpuset_t currentCPU;
|
||||
CPU_ZERO(¤tCPU);
|
||||
CPU_SET(cpu_id, ¤tCPU);
|
||||
if(cpuset_setaffinity(CPU_LEVEL_WHICH, CPU_WHICH_TID, -1, sizeof(cpuset_t), ¤tCPU) == -1) {
|
||||
printWarn("cpuset_setaffinity: %s", strerror(errno));
|
||||
return false;
|
||||
}
|
||||
return true;
|
||||
#endif
|
||||
}
|
||||
#endif
|
||||
|
||||
#ifdef __linux__
|
||||
int get_total_cores_module(int total_cores, int module) {
|
||||
int total_modules = 2;
|
||||
@@ -397,6 +369,11 @@ bool fill_apic_ids(uint32_t* apic_ids, int first_core, int n, bool x2apic_id) {
|
||||
}
|
||||
|
||||
bool get_topology_from_apic(struct cpuInfo* cpu, struct topology* topo) {
|
||||
if (topo->cach == NULL) {
|
||||
printWarn("get_topology_from_apic: cach is NULL");
|
||||
return false;
|
||||
}
|
||||
|
||||
uint32_t apic_id;
|
||||
uint32_t* apic_ids = emalloc(sizeof(uint32_t) * topo->total_cores_module);
|
||||
uint32_t* apic_pkg = emalloc(sizeof(uint32_t) * topo->total_cores_module);
|
||||
|
||||
@@ -17,10 +17,6 @@ struct apic {
|
||||
bool get_topology_from_apic(struct cpuInfo* cpu, struct topology* topo);
|
||||
uint32_t is_smt_enabled_amd(struct topology* topo);
|
||||
|
||||
#ifndef __APPLE__
|
||||
bool bind_to_cpu(int cpu_id);
|
||||
#endif
|
||||
|
||||
#ifdef __linux__
|
||||
int get_total_cores_module(int total_cores, int module);
|
||||
#endif
|
||||
|
||||
329
src/x86/cpuid.c
329
src/x86/cpuid.c
@@ -5,6 +5,13 @@
|
||||
#include "../common/udev.h"
|
||||
#include <unistd.h>
|
||||
#endif
|
||||
#if defined (__FreeBSD__) || defined (__APPLE__)
|
||||
#include "../common/sysctl.h"
|
||||
#endif
|
||||
|
||||
#ifdef __linux__
|
||||
#include "../common/freq.h"
|
||||
#endif
|
||||
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
@@ -22,28 +29,35 @@
|
||||
|
||||
#define CPU_VENDOR_INTEL_STRING "GenuineIntel"
|
||||
#define CPU_VENDOR_AMD_STRING "AuthenticAMD"
|
||||
#define CPU_VENDOR_HYGON_STRING "HygonGenuine"
|
||||
|
||||
static const char *hv_vendors_string[] = {
|
||||
[HV_VENDOR_KVM] = "KVMKVMKVM",
|
||||
[HV_VENDOR_QEMU] = "TCGTCGTCGTCG",
|
||||
[HV_VENDOR_VBOX] = "VBoxVBoxVBox",
|
||||
[HV_VENDOR_HYPERV] = "Microsoft Hv",
|
||||
[HV_VENDOR_VMWARE] = "VMwareVMware",
|
||||
[HV_VENDOR_XEN] = "XenVMMXenVMM",
|
||||
[HV_VENDOR_PARALLELS] = "lrpepyh vr",
|
||||
[HV_VENDOR_PHYP] = NULL,
|
||||
[HV_VENDOR_BHYVE] = "bhyve bhyve ",
|
||||
[HV_VENDOR_APPLEVZ] = "Apple VZ"
|
||||
};
|
||||
|
||||
static char *hv_vendors_name[] = {
|
||||
[HV_VENDOR_KVM] = "KVM",
|
||||
[HV_VENDOR_QEMU] = "QEMU",
|
||||
[HV_VENDOR_VBOX] = "VirtualBox",
|
||||
[HV_VENDOR_HYPERV] = "Microsoft Hyper-V",
|
||||
[HV_VENDOR_VMWARE] = "VMware",
|
||||
[HV_VENDOR_XEN] = "Xen",
|
||||
[HV_VENDOR_PARALLELS] = "Parallels",
|
||||
[HV_VENDOR_PHYP] = "pHyp",
|
||||
[HV_VENDOR_BHYVE] = "bhyve",
|
||||
[HV_VENDOR_APPLEVZ] = "Apple VZ",
|
||||
[HV_VENDOR_INVALID] = STRING_UNKNOWN
|
||||
};
|
||||
|
||||
#define HYPERVISOR_NAME_MAX_LENGTH 17
|
||||
|
||||
#define MASK 0xFF
|
||||
|
||||
/*
|
||||
@@ -70,7 +84,7 @@ void get_name_cpuid(char* name, uint32_t reg1, uint32_t reg2, uint32_t reg3) {
|
||||
name[c++] = (reg3>>24) & MASK;
|
||||
}
|
||||
|
||||
char* get_str_cpu_name_internal() {
|
||||
char* get_str_cpu_name_internal(void) {
|
||||
uint32_t eax = 0;
|
||||
uint32_t ebx = 0;
|
||||
uint32_t ecx = 0;
|
||||
@@ -212,7 +226,7 @@ int64_t get_peak_performance(struct cpuInfo* cpu, bool accurate_pp) {
|
||||
#endif
|
||||
|
||||
//First, check we have consistent data
|
||||
if(freq == UNKNOWN_DATA || topo->logical_cores == UNKNOWN_DATA) {
|
||||
if(freq == UNKNOWN_DATA || topo == NULL || topo->logical_cores == UNKNOWN_DATA) {
|
||||
return -1;
|
||||
}
|
||||
|
||||
@@ -223,9 +237,10 @@ int64_t get_peak_performance(struct cpuInfo* cpu, bool accurate_pp) {
|
||||
if(feat->FMA3 || feat->FMA4)
|
||||
flops = flops*2;
|
||||
|
||||
// Ice Lake has AVX512, but it has 1 VPU for AVX512, while
|
||||
// it has 2 for AVX2. If this is a Ice Lake CPU, we are computing
|
||||
// the peak performance supposing AVX2, not AVX512
|
||||
// NOTE:
|
||||
// Some CPUs (Ice Lake, Zen 4) have AVX512, but they have only
|
||||
// 1 VPU for AVX512, while they have 2 for AVX2. In such cases,
|
||||
// we are computing the peak performance supposing AVX2, not AVX512
|
||||
if(feat->AVX512 && vpus_are_AVX512(ptr))
|
||||
flops = flops*16;
|
||||
else if(feat->AVX || feat->AVX2)
|
||||
@@ -260,23 +275,29 @@ struct hypervisor* get_hp_info(bool hv_present) {
|
||||
|
||||
cpuid(&eax, &ebx, &ecx, &edx);
|
||||
|
||||
char name[13];
|
||||
memset(name, 0, 13);
|
||||
get_name_cpuid(name, ebx, ecx, edx);
|
||||
|
||||
bool found = false;
|
||||
uint8_t len = sizeof(hv_vendors_string) / sizeof(hv_vendors_string[0]);
|
||||
|
||||
for(uint8_t v=0; v < len && !found; v++) {
|
||||
if(strcmp(hv_vendors_string[v], name) == 0) {
|
||||
hv->hv_vendor = v;
|
||||
found = true;
|
||||
}
|
||||
}
|
||||
|
||||
if(!found) {
|
||||
if(ebx == 0x0 && ecx == 0x0 && edx == 0x0) {
|
||||
hv->hv_vendor = HV_VENDOR_INVALID;
|
||||
printWarn("Unknown hypervisor vendor: %s", name);
|
||||
printWarn("Hypervisor vendor is empty");
|
||||
}
|
||||
else {
|
||||
char name[13];
|
||||
memset(name, 0, 13);
|
||||
get_name_cpuid(name, ebx, ecx, edx);
|
||||
|
||||
bool found = false;
|
||||
uint8_t len = sizeof(hv_vendors_string) / sizeof(hv_vendors_string[0]);
|
||||
|
||||
for(uint8_t v=0; v < len && !found; v++) {
|
||||
if(hv_vendors_string[v] != NULL && strcmp(hv_vendors_string[v], name) == 0) {
|
||||
hv->hv_vendor = v;
|
||||
found = true;
|
||||
}
|
||||
}
|
||||
|
||||
if(!found) {
|
||||
hv->hv_vendor = HV_VENDOR_INVALID;
|
||||
printBug("Unknown hypervisor vendor: '%s'", name);
|
||||
}
|
||||
}
|
||||
|
||||
hv->hv_name = hv_vendors_name[hv->hv_vendor];
|
||||
@@ -412,7 +433,7 @@ bool set_cpu_module(int m, int total_modules, int32_t* first_core) {
|
||||
return true;
|
||||
}
|
||||
|
||||
int32_t get_core_type() {
|
||||
int32_t get_core_type(void) {
|
||||
uint32_t eax = 0x0000001A;
|
||||
uint32_t ebx = 0;
|
||||
uint32_t ecx = 0;
|
||||
@@ -430,7 +451,7 @@ int32_t get_core_type() {
|
||||
}
|
||||
}
|
||||
|
||||
struct cpuInfo* get_cpu_info() {
|
||||
struct cpuInfo* get_cpu_info(void) {
|
||||
struct cpuInfo* cpu = emalloc(sizeof(struct cpuInfo));
|
||||
cpu->peak_performance = -1;
|
||||
cpu->next_cpu = NULL;
|
||||
@@ -438,7 +459,7 @@ struct cpuInfo* get_cpu_info() {
|
||||
cpu->cach = NULL;
|
||||
cpu->feat = NULL;
|
||||
|
||||
uint32_t modules = 1;
|
||||
cpu->num_cpus = 1;
|
||||
uint32_t eax = 0;
|
||||
uint32_t ebx = 0;
|
||||
uint32_t ecx = 0;
|
||||
@@ -457,6 +478,8 @@ struct cpuInfo* get_cpu_info() {
|
||||
cpu->cpu_vendor = CPU_VENDOR_INTEL;
|
||||
else if (strcmp(CPU_VENDOR_AMD_STRING,name) == 0)
|
||||
cpu->cpu_vendor = CPU_VENDOR_AMD;
|
||||
else if (strcmp(CPU_VENDOR_HYGON_STRING,name) == 0)
|
||||
cpu->cpu_vendor = CPU_VENDOR_HYGON;
|
||||
else {
|
||||
cpu->cpu_vendor = CPU_VENDOR_INVALID;
|
||||
printErr("Unknown CPU vendor: %s", name);
|
||||
@@ -475,9 +498,8 @@ struct cpuInfo* get_cpu_info() {
|
||||
cpu->cpu_name = get_str_cpu_name_internal();
|
||||
}
|
||||
else {
|
||||
cpu->cpu_name = emalloc(sizeof(char) * (strlen(STRING_UNKNOWN) + 1));
|
||||
strcpy(cpu->cpu_name, STRING_UNKNOWN);
|
||||
printWarn("Can't read cpu name from cpuid (needed extended level is 0x%.8X, max is 0x%.8X)", 0x80000004, cpu->maxExtendedLevels);
|
||||
cpu->cpu_name = NULL;
|
||||
printWarn("Can't read CPU name from cpuid (needed extended level is 0x%.8X, max is 0x%.8X)", 0x80000004, cpu->maxExtendedLevels);
|
||||
}
|
||||
|
||||
cpu->topology_extensions = false;
|
||||
@@ -495,12 +517,12 @@ struct cpuInfo* get_cpu_info() {
|
||||
cpu->hybrid_flag = (edx >> 15) & 0x1;
|
||||
}
|
||||
|
||||
if(cpu->hybrid_flag) modules = 2;
|
||||
if(cpu->hybrid_flag) cpu->num_cpus = 2;
|
||||
|
||||
struct cpuInfo* ptr = cpu;
|
||||
for(uint32_t i=0; i < modules; i++) {
|
||||
for(uint32_t i=0; i < cpu->num_cpus; i++) {
|
||||
int32_t first_core;
|
||||
set_cpu_module(i, modules, &first_core);
|
||||
set_cpu_module(i, cpu->num_cpus, &first_core);
|
||||
|
||||
if(i > 0) {
|
||||
ptr->next_cpu = emalloc(sizeof(struct cpuInfo));
|
||||
@@ -527,14 +549,15 @@ struct cpuInfo* get_cpu_info() {
|
||||
ptr->first_core_id = first_core;
|
||||
ptr->feat = get_features_info(ptr);
|
||||
|
||||
// If any field of the struct is NULL,
|
||||
// return inmideately, as further functions
|
||||
// require valid fields (cach, topo, etc)
|
||||
ptr->arch = get_cpu_uarch(ptr);
|
||||
ptr->freq = get_frequency_info(ptr);
|
||||
|
||||
if (cpu->cpu_name == NULL && ptr == cpu) {
|
||||
// If we couldnt read CPU name from cpuid, infer it now
|
||||
cpu->cpu_name = infer_cpu_name_from_uarch(cpu->arch);
|
||||
}
|
||||
|
||||
ptr->cach = get_cache_info(ptr);
|
||||
if(ptr->cach == NULL) return cpu;
|
||||
|
||||
if(cpu->hybrid_flag) {
|
||||
ptr->topo = get_topology_info(ptr, ptr->cach, i);
|
||||
@@ -542,16 +565,23 @@ struct cpuInfo* get_cpu_info() {
|
||||
else {
|
||||
ptr->topo = get_topology_info(ptr, ptr->cach, -1);
|
||||
}
|
||||
if(cpu->topo == NULL) return cpu;
|
||||
|
||||
// If topo is NULL, return early, as get_peak_performance
|
||||
// requries non-NULL topology.
|
||||
if(ptr->topo == NULL) return cpu;
|
||||
}
|
||||
|
||||
cpu->num_cpus = modules;
|
||||
cpu->peak_performance = get_peak_performance(cpu, accurate_pp());
|
||||
|
||||
return cpu;
|
||||
}
|
||||
|
||||
bool get_cache_topology_amd(struct cpuInfo* cpu, struct topology* topo) {
|
||||
if (topo->cach == NULL) {
|
||||
printWarn("get_cache_topology_amd: cach is NULL");
|
||||
return false;
|
||||
}
|
||||
|
||||
if(cpu->maxExtendedLevels >= 0x8000001D && cpu->topology_extensions) {
|
||||
uint32_t i, eax, ebx, ecx, edx, num_sharing_cache, cache_type, cache_level;
|
||||
|
||||
@@ -625,15 +655,24 @@ bool get_cache_topology_amd(struct cpuInfo* cpu, struct topology* topo) {
|
||||
return true;
|
||||
}
|
||||
|
||||
#ifdef __linux__
|
||||
void get_topology_from_udev(struct topology* topo) {
|
||||
// TODO: To be improved in the future
|
||||
topo->total_cores = get_ncores_from_cpuinfo();
|
||||
topo->logical_cores = topo->total_cores;
|
||||
topo->physical_cores = topo->total_cores;
|
||||
// TODO: To be improved in the future
|
||||
if (topo->total_cores == 1) {
|
||||
// We can assume it's a single core CPU
|
||||
topo->logical_cores = topo->total_cores;
|
||||
topo->physical_cores = topo->total_cores;
|
||||
}
|
||||
else {
|
||||
topo->logical_cores = UNKNOWN_DATA;
|
||||
topo->physical_cores = UNKNOWN_DATA;
|
||||
}
|
||||
topo->smt_available = 1;
|
||||
topo->smt_supported = 1;
|
||||
topo->sockets = 1;
|
||||
}
|
||||
#endif
|
||||
|
||||
// Main reference: https://software.intel.com/content/www/us/en/develop/articles/intel-64-architecture-processor-topology-enumeration.html
|
||||
// Very interesting resource: https://wiki.osdev.org/Detecting_CPU_Topology_(80x86)
|
||||
@@ -673,32 +712,31 @@ struct topology* get_topology_info(struct cpuInfo* cpu, struct cache* cach, int
|
||||
topo->total_cores_module = topo->total_cores;
|
||||
}
|
||||
|
||||
bool toporet = false;
|
||||
switch(cpu->cpu_vendor) {
|
||||
case CPU_VENDOR_INTEL:
|
||||
if (cpu->maxLevels >= 0x00000004) {
|
||||
bool toporet = get_topology_from_apic(cpu, topo);
|
||||
if(!toporet) {
|
||||
#ifdef __linux__
|
||||
printWarn("Failed to retrieve topology from APIC, using udev...\n");
|
||||
get_topology_from_udev(topo);
|
||||
#else
|
||||
printErr("Failed to retrieve topology from APIC, assumming default values...\n");
|
||||
topo->logical_cores = UNKNOWN_DATA;
|
||||
topo->physical_cores = UNKNOWN_DATA;
|
||||
topo->smt_available = 1;
|
||||
topo->smt_supported = 1;
|
||||
#endif
|
||||
}
|
||||
toporet = get_topology_from_apic(cpu, topo);
|
||||
}
|
||||
else {
|
||||
printWarn("Can't read topology information from cpuid (needed level is 0x%.8X, max is 0x%.8X)", 0x00000001, cpu->maxLevels);
|
||||
topo->physical_cores = 1;
|
||||
topo->logical_cores = 1;
|
||||
topo->smt_available = 1;
|
||||
topo->smt_supported = 1;
|
||||
printWarn("Can't read topology information from cpuid (needed level is 0x%.8X, max is 0x%.8X)", 0x00000004, cpu->maxLevels);
|
||||
}
|
||||
if(!toporet) {
|
||||
#ifdef __linux__
|
||||
printWarn("Failed to retrieve topology from APIC, using udev...");
|
||||
get_topology_from_udev(topo);
|
||||
#else
|
||||
if (cpu->maxLevels >= 0x00000004)
|
||||
printErr("Failed to retrieve topology from APIC, assumming default values...");
|
||||
topo->logical_cores = UNKNOWN_DATA;
|
||||
topo->physical_cores = UNKNOWN_DATA;
|
||||
topo->smt_available = 1;
|
||||
topo->smt_supported = 1;
|
||||
#endif
|
||||
}
|
||||
break;
|
||||
case CPU_VENDOR_AMD:
|
||||
case CPU_VENDOR_HYGON:
|
||||
if (cpu->maxExtendedLevels >= 0x80000008) {
|
||||
eax = 0x80000008;
|
||||
cpuid(&eax, &ebx, &ecx, &edx);
|
||||
@@ -715,10 +753,15 @@ struct topology* get_topology_info(struct cpuInfo* cpu, struct cache* cach, int
|
||||
}
|
||||
}
|
||||
else {
|
||||
printWarn("Can't read topology information from cpuid (needed extended level is 0x%.8X, max is 0x%.8X)", 0x80000008, cpu->maxExtendedLevels);
|
||||
topo->physical_cores = 1;
|
||||
topo->logical_cores = 1;
|
||||
topo->smt_supported = 1;
|
||||
#ifdef __linux__
|
||||
printWarn("Can't read topology information from cpuid (needed extended level is 0x%.8X, max is 0x%.8X), using udev...", 0x80000008, cpu->maxExtendedLevels);
|
||||
get_topology_from_udev(topo);
|
||||
#else
|
||||
printWarn("Can't read topology information from cpuid (needed extended level is 0x%.8X, max is 0x%.8X)", 0x80000008, cpu->maxExtendedLevels);
|
||||
topo->physical_cores = 1;
|
||||
topo->logical_cores = 1;
|
||||
topo->smt_supported = 1;
|
||||
#endif
|
||||
}
|
||||
|
||||
if (cpu->maxLevels >= 0x00000001) {
|
||||
@@ -895,16 +938,27 @@ struct cache* get_cache_info(struct cpuInfo* cpu) {
|
||||
|
||||
struct frequency* get_frequency_info(struct cpuInfo* cpu) {
|
||||
struct frequency* freq = emalloc(sizeof(struct frequency));
|
||||
freq->measured = false;
|
||||
|
||||
if(cpu->maxLevels < 0x00000016) {
|
||||
#if defined (_WIN32) || defined (__APPLE__)
|
||||
#if defined (_WIN32)
|
||||
printWarn("Can't read frequency information from cpuid (needed level is 0x%.8X, max is 0x%.8X)", 0x00000016, cpu->maxLevels);
|
||||
freq->base = UNKNOWN_DATA;
|
||||
freq->max = UNKNOWN_DATA;
|
||||
#elif defined (__FreeBSD__) || defined (__APPLE__)
|
||||
printWarn("Can't read frequency information from cpuid (needed level is 0x%.8X, max is 0x%.8X). Using sysctl", 0x00000016, cpu->maxLevels);
|
||||
uint32_t freq_hz = get_sys_info_by_name(CPUFREQUENCY_SYSCTL);
|
||||
if (freq_hz == 0) {
|
||||
printWarn("Read max CPU frequency from sysctl and got 0 MHz");
|
||||
freq->max = UNKNOWN_DATA;
|
||||
}
|
||||
|
||||
freq->base = UNKNOWN_DATA;
|
||||
freq->max = freq_hz;
|
||||
#else
|
||||
printWarn("Can't read frequency information from cpuid (needed level is 0x%.8X, max is 0x%.8X). Using udev", 0x00000016, cpu->maxLevels);
|
||||
freq->base = UNKNOWN_DATA;
|
||||
freq->max = get_max_freq_from_file(0);
|
||||
freq->max = get_max_freq_from_file(cpu->first_core_id);
|
||||
|
||||
if(freq->max == 0) {
|
||||
printWarn("Read max CPU frequency from udev and got 0 MHz");
|
||||
@@ -931,7 +985,7 @@ struct frequency* get_frequency_info(struct cpuInfo* cpu) {
|
||||
printWarn("Read max CPU frequency from CPUID and got 0 MHz");
|
||||
#ifdef __linux__
|
||||
printWarn("Using udev to detect frequency");
|
||||
freq->max = get_max_freq_from_file(0);
|
||||
freq->max = get_max_freq_from_file(cpu->first_core_id);
|
||||
|
||||
if(freq->max == 0) {
|
||||
printWarn("Read max CPU frequency from udev and got 0 MHz");
|
||||
@@ -943,6 +997,15 @@ struct frequency* get_frequency_info(struct cpuInfo* cpu) {
|
||||
}
|
||||
}
|
||||
|
||||
#ifdef __linux__
|
||||
if (freq->max == UNKNOWN_DATA || measure_max_frequency_flag()) {
|
||||
if (freq->max == UNKNOWN_DATA)
|
||||
printWarn("All previous methods failed, measuring CPU frequency");
|
||||
freq->max = measure_max_frequency(cpu->first_core_id);
|
||||
freq->measured = true;
|
||||
}
|
||||
#endif
|
||||
|
||||
return freq;
|
||||
}
|
||||
|
||||
@@ -964,24 +1027,33 @@ char* get_str_topology(struct cpuInfo* cpu, struct topology* topo, bool dual_soc
|
||||
string = emalloc(sizeof(char) * (strlen(STRING_UNKNOWN) + 1));
|
||||
strcpy(string, STRING_UNKNOWN);
|
||||
}
|
||||
else if(topo->smt_supported > 1) {
|
||||
// 4 for digits, 21 for ' cores (SMT disabled)' which is the longest possible output
|
||||
uint32_t max_size = 4+21+1;
|
||||
string = emalloc(sizeof(char) * max_size);
|
||||
|
||||
if(topo->smt_available > 1)
|
||||
snprintf(string, max_size, "%d cores (%d threads)", topo->physical_cores * topo_sockets, topo->logical_cores * topo_sockets);
|
||||
else {
|
||||
if(cpu->cpu_vendor == CPU_VENDOR_AMD)
|
||||
snprintf(string, max_size, "%d cores (SMT disabled)", topo->physical_cores * topo_sockets);
|
||||
else
|
||||
snprintf(string, max_size, "%d cores (HT disabled)", topo->physical_cores * topo_sockets);
|
||||
}
|
||||
}
|
||||
else {
|
||||
uint32_t max_size = 4+7+1;
|
||||
string = emalloc(sizeof(char) * max_size);
|
||||
snprintf(string, max_size, "%d cores",topo->physical_cores * topo_sockets);
|
||||
char cores_str[6];
|
||||
memset(cores_str, 0, sizeof(char) * 6);
|
||||
if (topo->physical_cores * topo_sockets > 1)
|
||||
strcpy(cores_str, "cores");
|
||||
else
|
||||
strcpy(cores_str, "core");
|
||||
|
||||
if(topo->smt_supported > 1) {
|
||||
// 4 for digits, 21 for ' cores (SMT disabled)' which is the longest possible output
|
||||
uint32_t max_size = 4+21+1;
|
||||
string = emalloc(sizeof(char) * max_size);
|
||||
|
||||
if(topo->smt_available > 1)
|
||||
snprintf(string, max_size, "%d %s (%d threads)", topo->physical_cores * topo_sockets, cores_str, topo->logical_cores * topo_sockets);
|
||||
else {
|
||||
if(cpu->cpu_vendor == CPU_VENDOR_AMD)
|
||||
snprintf(string, max_size, "%d %s (SMT disabled)", topo->physical_cores * topo_sockets, cores_str);
|
||||
else
|
||||
snprintf(string, max_size, "%d %s (HT disabled)", topo->physical_cores * topo_sockets, cores_str);
|
||||
}
|
||||
}
|
||||
else {
|
||||
uint32_t max_size = 4+7+1;
|
||||
string = emalloc(sizeof(char) * max_size);
|
||||
snprintf(string, max_size, "%d %s",topo->physical_cores * topo_sockets, cores_str);
|
||||
}
|
||||
}
|
||||
|
||||
return string;
|
||||
@@ -1042,8 +1114,14 @@ char* get_str_sse(struct cpuInfo* cpu) {
|
||||
last+=SSE4_2_sl;
|
||||
}
|
||||
|
||||
//Purge last comma
|
||||
string[last-1] = '\0';
|
||||
if (last == 0) {
|
||||
snprintf(string, 2+1, "No");
|
||||
}
|
||||
else {
|
||||
//Purge last comma
|
||||
string[last-1] = '\0';
|
||||
}
|
||||
|
||||
return string;
|
||||
}
|
||||
|
||||
@@ -1084,12 +1162,29 @@ void print_debug(struct cpuInfo* cpu) {
|
||||
free_cpuinfo_struct(cpu);
|
||||
}
|
||||
|
||||
// TODO: Query HV and Xeon Phi levels
|
||||
void print_raw_level(uint32_t reg) {
|
||||
uint32_t eax = reg;
|
||||
uint32_t ebx = 0;
|
||||
uint32_t ecx = 0;
|
||||
uint32_t edx = 0;
|
||||
|
||||
cpuid(&eax, &ebx, &ecx, &edx);
|
||||
|
||||
printf(" 0x%.8X 0x%.2X: 0x%.8X 0x%.8X 0x%.8X 0x%.8X\n", reg, 0x00, eax, ebx, ecx, edx);
|
||||
}
|
||||
|
||||
void print_raw_sublevel(uint32_t reg, uint32_t reg2) {
|
||||
uint32_t eax = reg;
|
||||
uint32_t ebx = 0;
|
||||
uint32_t ecx = reg2;
|
||||
uint32_t edx = 0;
|
||||
|
||||
cpuid(&eax, &ebx, &ecx, &edx);
|
||||
|
||||
printf(" 0x%.8X 0x%.2X: 0x%.8X 0x%.8X 0x%.8X 0x%.8X\n", reg, reg2, eax, ebx, ecx, edx);
|
||||
}
|
||||
|
||||
void print_raw(struct cpuInfo* cpu) {
|
||||
uint32_t eax;
|
||||
uint32_t ebx;
|
||||
uint32_t ecx;
|
||||
uint32_t edx;
|
||||
printf("%s\n\n", cpu->cpu_name);
|
||||
printf(" CPUID leaf sub EAX EBX ECX EDX \n");
|
||||
printf("--------------------------------------------------------------\n");
|
||||
@@ -1104,66 +1199,40 @@ void print_raw(struct cpuInfo* cpu) {
|
||||
|
||||
printf("CPU %d:\n", c);
|
||||
|
||||
// Standard levels
|
||||
for(uint32_t reg=0x00000000; reg <= cpu->maxLevels; reg++) {
|
||||
if(reg == 0x00000004) {
|
||||
for(uint32_t reg2=0x00000000; reg2 < cpu->cach->max_cache_level; reg2++) {
|
||||
eax = reg;
|
||||
ebx = 0;
|
||||
ecx = reg2;
|
||||
edx = 0;
|
||||
|
||||
cpuid(&eax, &ebx, &ecx, &edx);
|
||||
|
||||
printf(" 0x%.8X 0x%.2X: 0x%.8X 0x%.8X 0x%.8X 0x%.8X\n", reg, reg2, eax, ebx, ecx, edx);
|
||||
print_raw_sublevel(reg, reg2);
|
||||
}
|
||||
}
|
||||
else if(reg == 0x0000000B) {
|
||||
for(uint32_t reg2=0x00000000; reg2 < cpu->topo->smt_supported; reg2++) {
|
||||
eax = reg;
|
||||
ebx = 0;
|
||||
ecx = reg2;
|
||||
edx = 0;
|
||||
|
||||
cpuid(&eax, &ebx, &ecx, &edx);
|
||||
|
||||
printf(" 0x%.8X 0x%.2X: 0x%.8X 0x%.8X 0x%.8X 0x%.8X\n", reg, reg2, eax, ebx, ecx, edx);
|
||||
print_raw_sublevel(reg, reg2);
|
||||
}
|
||||
}
|
||||
else {
|
||||
eax = reg;
|
||||
ebx = 0;
|
||||
ecx = 0;
|
||||
edx = 0;
|
||||
|
||||
cpuid(&eax, &ebx, &ecx, &edx);
|
||||
|
||||
printf(" 0x%.8X 0x%.2X: 0x%.8X 0x%.8X 0x%.8X 0x%.8X\n", reg, 0x00, eax, ebx, ecx, edx);
|
||||
print_raw_level(reg);
|
||||
}
|
||||
}
|
||||
|
||||
// Hypervisor levels
|
||||
for(uint32_t reg=0x40000000; reg <= 0x40000006; reg++) {
|
||||
print_raw_level(reg);
|
||||
}
|
||||
|
||||
// Extended levels
|
||||
for(uint32_t reg=0x80000000; reg <= cpu->maxExtendedLevels; reg++) {
|
||||
if(reg == 0x8000001D) {
|
||||
for(uint32_t reg2=0x00000000; reg2 < cpu->cach->max_cache_level; reg2++) {
|
||||
eax = reg;
|
||||
ebx = 0;
|
||||
ecx = reg2;
|
||||
edx = 0;
|
||||
|
||||
cpuid(&eax, &ebx, &ecx, &edx);
|
||||
|
||||
printf(" 0x%.8X 0x%.2X: 0x%.8X 0x%.8X 0x%.8X 0x%.8X\n", reg, reg2, eax, ebx, ecx, edx);
|
||||
print_raw_sublevel(reg, reg2);
|
||||
}
|
||||
}
|
||||
else {
|
||||
eax = reg;
|
||||
ebx = 0;
|
||||
ecx = 0;
|
||||
edx = 0;
|
||||
|
||||
cpuid(&eax, &ebx, &ecx, &edx);
|
||||
|
||||
printf(" 0x%.8X 0x%.2X: 0x%.8X 0x%.8X 0x%.8X 0x%.8X\n", reg, 0x00, eax, ebx, ecx, edx);
|
||||
print_raw_level(reg);
|
||||
}
|
||||
}
|
||||
|
||||
}
|
||||
}
|
||||
|
||||
|
||||
@@ -3,7 +3,7 @@
|
||||
|
||||
#include "../common/cpu.h"
|
||||
|
||||
struct cpuInfo* get_cpu_info();
|
||||
struct cpuInfo* get_cpu_info(void);
|
||||
struct cache* get_cache_info(struct cpuInfo* cpu);
|
||||
struct frequency* get_frequency_info(struct cpuInfo* cpu);
|
||||
struct topology* get_topology_info(struct cpuInfo* cpu, struct cache* cach, int module);
|
||||
|
||||
@@ -3,6 +3,7 @@
|
||||
|
||||
#include <stdint.h>
|
||||
#include "../../common/cpu.h"
|
||||
#include "../../common/global.h"
|
||||
|
||||
#define MEASURE_TIME_SECONDS 5
|
||||
#define LOOP_ITERS 100000000
|
||||
|
||||
@@ -10,7 +10,8 @@
|
||||
#include <stdint.h>
|
||||
#include "freq.h"
|
||||
|
||||
void* compute_avx() {
|
||||
void* compute_avx(void * pthread_arg) {
|
||||
UNUSED(pthread_arg);
|
||||
bool end = false;
|
||||
|
||||
struct timeval begin, now;
|
||||
|
||||
@@ -1,6 +1,6 @@
|
||||
#ifndef __FREQ_AVX__
|
||||
#define __FREQ_AVX__
|
||||
|
||||
void* compute_avx();
|
||||
void* compute_avx(void * pthread_arg);
|
||||
|
||||
#endif
|
||||
|
||||
@@ -10,7 +10,8 @@
|
||||
#include <stdint.h>
|
||||
#include "freq.h"
|
||||
|
||||
void* compute_avx512() {
|
||||
void* compute_avx512(void * pthread_arg) {
|
||||
UNUSED(pthread_arg);
|
||||
bool end = false;
|
||||
|
||||
struct timeval begin, now;
|
||||
|
||||
@@ -1,6 +1,6 @@
|
||||
#ifndef __FREQ_AVX512__
|
||||
#define __FREQ_AVX512__
|
||||
|
||||
void* compute_avx512();
|
||||
void* compute_avx512(void * pthread_arg);
|
||||
|
||||
#endif
|
||||
|
||||
@@ -10,7 +10,8 @@
|
||||
#include <stdint.h>
|
||||
#include "freq.h"
|
||||
|
||||
void* compute_nov() {
|
||||
void* compute_nov(void * pthread_arg) {
|
||||
UNUSED(pthread_arg);
|
||||
bool end = false;
|
||||
|
||||
struct timeval begin, now;
|
||||
|
||||
@@ -1,6 +1,6 @@
|
||||
#ifndef __FREQ_NO_VECTOR__
|
||||
#define __FREQ_NO_VECTOR__
|
||||
|
||||
void* compute_nov();
|
||||
void* compute_nov(void * pthread_arg);
|
||||
|
||||
#endif
|
||||
|
||||
424
src/x86/uarch.c
424
src/x86/uarch.c
@@ -47,8 +47,12 @@ typedef uint32_t MICROARCH;
|
||||
enum {
|
||||
UARCH_UNKNOWN,
|
||||
// INTEL //
|
||||
UARCH_I486,
|
||||
UARCH_P5,
|
||||
UARCH_P6,
|
||||
UARCH_P5_MMX,
|
||||
UARCH_P6_PRO,
|
||||
UARCH_P6_PENTIUM_II,
|
||||
UARCH_P6_PENTIUM_III,
|
||||
UARCH_DOTHAN,
|
||||
UARCH_YONAH,
|
||||
UARCH_MEROM,
|
||||
@@ -95,6 +99,8 @@ enum {
|
||||
// AMD //
|
||||
UARCH_AM486,
|
||||
UARCH_AM5X86,
|
||||
UARCH_SSA5,
|
||||
UARCH_K5,
|
||||
UARCH_K6,
|
||||
UARCH_K7,
|
||||
UARCH_K8,
|
||||
@@ -112,7 +118,8 @@ enum {
|
||||
UARCH_ZEN2,
|
||||
UARCH_ZEN3,
|
||||
UARCH_ZEN3_PLUS,
|
||||
UARCH_ZEN4
|
||||
UARCH_ZEN4,
|
||||
UARCH_ZEN4C
|
||||
};
|
||||
|
||||
struct uarch {
|
||||
@@ -124,7 +131,8 @@ struct uarch {
|
||||
#define UARCH_START if (false) {}
|
||||
#define CHECK_UARCH(arch, ef_, f_, em_, m_, s_, str, uarch, process) \
|
||||
else if (ef_ == ef && f_ == f && (em_ == NA || em_ == em) && (m_ == NA || m_ == m) && (s_ == NA || s_ == s)) fill_uarch(arch, str, uarch, process);
|
||||
#define UARCH_END else { printBug("Unknown microarchitecture detected: M=0x%.8X EM=0x%.8X F=0x%.8X EF=0x%.8X S=0x%.8X", m, em, f, ef, s); fill_uarch(arch, STRING_UNKNOWN, UARCH_UNKNOWN, 0); }
|
||||
#define UARCH_END else { printBugCheckRelease("Unknown microarchitecture detected: M=0x%X EM=0x%X F=0x%X EF=0x%X S=0x%X", m, em, f, ef, s); \
|
||||
fill_uarch(arch, STRING_UNKNOWN, UARCH_UNKNOWN, UNK); }
|
||||
|
||||
void fill_uarch(struct uarch* arch, char* str, MICROARCH u, uint32_t process) {
|
||||
arch->uarch_str = emalloc(sizeof(char) * (strlen(str)+1));
|
||||
@@ -137,127 +145,143 @@ void fill_uarch(struct uarch* arch, char* str, MICROARCH u, uint32_t process) {
|
||||
struct uarch* get_uarch_from_cpuid_intel(uint32_t ef, uint32_t f, uint32_t em, uint32_t m, int s) {
|
||||
struct uarch* arch = emalloc(sizeof(struct uarch));
|
||||
|
||||
// EF: Extended Family //
|
||||
// F: Family //
|
||||
// EM: Extended Model //
|
||||
// M: Model //
|
||||
// S: Stepping //
|
||||
// ----------------------------------------------------------------------------- //
|
||||
// EF F EM M S //
|
||||
// EF: Extended Family //
|
||||
// F: Family //
|
||||
// EM: Extended Model //
|
||||
// M: Model //
|
||||
// S: Stepping //
|
||||
// ------------------------------------------------------------------------------- //
|
||||
// EF F EM M S //
|
||||
UARCH_START
|
||||
CHECK_UARCH(arch, 0, 5, 0, 0, NA, "P5", UARCH_P5, 800)
|
||||
CHECK_UARCH(arch, 0, 5, 0, 1, NA, "P5", UARCH_P5, 800)
|
||||
CHECK_UARCH(arch, 0, 5, 0, 2, NA, "P5", UARCH_P5, UNK)
|
||||
CHECK_UARCH(arch, 0, 5, 0, 3, NA, "P5", UARCH_P5, 600)
|
||||
CHECK_UARCH(arch, 0, 5, 0, 4, NA, "P5 MMX", UARCH_P5, UNK)
|
||||
CHECK_UARCH(arch, 0, 5, 0, 7, NA, "P5 MMX", UARCH_P5, UNK)
|
||||
CHECK_UARCH(arch, 0, 5, 0, 8, NA, "P5 MMX", UARCH_P5, 250)
|
||||
CHECK_UARCH(arch, 0, 5, 0, 9, 0, "Lakemont", UARCH_LAKEMONT, 32)
|
||||
CHECK_UARCH(arch, 0, 5, 0, 9, NA, "P5 MMX", UARCH_P5, UNK)
|
||||
CHECK_UARCH(arch, 0, 5, 0, 10, 0, "Lakemont", UARCH_LAKEMONT, 32)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 0, NA, "P6 Pentium II", UARCH_P6, UNK)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 1, NA, "P6 Pentium II", UARCH_P6, UNK) // process depends on core
|
||||
CHECK_UARCH(arch, 0, 6, 0, 2, NA, "P6 Pentium II", UARCH_P6, UNK)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 3, NA, "P6 Pentium II", UARCH_P6, 350)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 4, NA, "P6 Pentium II", UARCH_P6, UNK)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 5, NA, "P6 Pentium II", UARCH_P6, 250)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 6, NA, "P6 Pentium II", UARCH_P6, UNK)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 7, NA, "P6 Pentium III", UARCH_P6, 250)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 8, NA, "P6 Pentium III", UARCH_P6, 180)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 9, NA, "P6 Pentium M", UARCH_P6, 130)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 10, NA, "P6 Pentium III", UARCH_P6, 180)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 11, NA, "P6 Pentium III", UARCH_P6, 130)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 13, NA, "Dothan", UARCH_DOTHAN, UNK) // process depends on core
|
||||
CHECK_UARCH(arch, 0, 6, 0, 14, NA, "Yonah", UARCH_YONAH, 65)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 15, NA, "Merom", UARCH_MEROM, 65)
|
||||
CHECK_UARCH(arch, 0, 6, 1, 5, NA, "Dothan", UARCH_DOTHAN, 90)
|
||||
CHECK_UARCH(arch, 0, 6, 1, 6, NA, "Merom", UARCH_MEROM, 65)
|
||||
CHECK_UARCH(arch, 0, 6, 1, 7, NA, "Penryn", UARCH_PENYR, 45)
|
||||
CHECK_UARCH(arch, 0, 6, 1, 10, NA, "Nehalem", UARCH_NEHALEM, 45)
|
||||
CHECK_UARCH(arch, 0, 6, 1, 12, NA, "Bonnell", UARCH_BONNELL, 45)
|
||||
CHECK_UARCH(arch, 0, 6, 1, 13, NA, "Penryn", UARCH_PENYR, 45)
|
||||
CHECK_UARCH(arch, 0, 6, 1, 14, NA, "Nehalem", UARCH_NEHALEM, 45)
|
||||
CHECK_UARCH(arch, 0, 6, 1, 15, NA, "Nehalem", UARCH_NEHALEM, 45)
|
||||
CHECK_UARCH(arch, 0, 6, 2, 5, NA, "Westmere", UARCH_WESTMERE, 32)
|
||||
CHECK_UARCH(arch, 0, 6, 2 , 6, NA, "Bonnell", UARCH_BONNELL, 45)
|
||||
CHECK_UARCH(arch, 0, 6, 2, 7, NA, "Saltwell", UARCH_SALTWELL, 32)
|
||||
CHECK_UARCH(arch, 0, 6, 2, 10, NA, "Sandy Bridge", UARCH_SANDY_BRIDGE, 32)
|
||||
CHECK_UARCH(arch, 0, 6, 2, 12, NA, "Westmere", UARCH_WESTMERE, 32)
|
||||
CHECK_UARCH(arch, 0, 6, 2, 13, NA, "Sandy Bridge", UARCH_SANDY_BRIDGE, 32)
|
||||
CHECK_UARCH(arch, 0, 6, 2, 14, NA, "Nehalem", UARCH_NEHALEM, 45)
|
||||
CHECK_UARCH(arch, 0, 6, 2, 15, NA, "Westmere", UARCH_WESTMERE, 32)
|
||||
CHECK_UARCH(arch, 0, 6, 3, 5, NA, "Saltwell", UARCH_SALTWELL, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 3, 6, NA, "Saltwell", UARCH_SALTWELL, 32)
|
||||
CHECK_UARCH(arch, 0, 6, 3, 7, NA, "Silvermont", UARCH_SILVERMONT, 22)
|
||||
CHECK_UARCH(arch, 0, 6, 3, 10, NA, "Ivy Bridge", UARCH_IVY_BRIDGE, 22)
|
||||
CHECK_UARCH(arch, 0, 6, 3, 12, NA, "Haswell", UARCH_HASWELL, 22)
|
||||
CHECK_UARCH(arch, 0, 6, 3, 13, NA, "Broadwell", UARCH_BROADWELL, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 3, 14, NA, "Ivy Bridge", UARCH_IVY_BRIDGE, 22)
|
||||
CHECK_UARCH(arch, 0, 6, 3, 15, NA, "Haswell", UARCH_HASWELL, 22)
|
||||
CHECK_UARCH(arch, 0, 6, 4, 5, NA, "Haswell", UARCH_HASWELL, 22)
|
||||
CHECK_UARCH(arch, 0, 6, 4, 6, NA, "Haswell", UARCH_HASWELL, 22)
|
||||
CHECK_UARCH(arch, 0, 6, 4, 7, NA, "Broadwell", UARCH_BROADWELL, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 4, 10, NA, "Silvermont", UARCH_SILVERMONT, 22) // no docs, but /proc/cpuinfo seen in wild
|
||||
CHECK_UARCH(arch, 0, 6, 4, 12, NA, "Airmont", UARCH_AIRMONT, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 4, 13, NA, "Silvermont", UARCH_SILVERMONT, 22)
|
||||
CHECK_UARCH(arch, 0, 6, 4, 14, 8, "Kaby Lake", UARCH_KABY_LAKE, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 4, 14, NA, "Skylake", UARCH_SKYLAKE, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 4, 15, NA, "Broadwell", UARCH_BROADWELL, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 5, 5, 6, "Cascade Lake", UARCH_CASCADE_LAKE, 14) // no docs, but example from Greg Stewart
|
||||
CHECK_UARCH(arch, 0, 6, 5, 5, 7, "Cascade Lake", UARCH_CASCADE_LAKE, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 5, 5, 10, "Cooper Lake", UARCH_COOPER_LAKE, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 5, 5, NA, "Skylake", UARCH_SKYLAKE, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 5, 6, NA, "Broadwell", UARCH_BROADWELL, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 5, 7, NA, "Knights Landing", UARCH_KNIGHTS_LANDING, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 5, 10, NA, "Silvermont", UARCH_SILVERMONT, 22) // no spec update; only MSR_CPUID_table* so far
|
||||
CHECK_UARCH(arch, 0, 6, 5, 12, NA, "Goldmont", UARCH_GOLDMONT, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 5, 13, NA, "Silvermont", UARCH_SILVERMONT, 22) // no spec update; only MSR_CPUID_table* so far
|
||||
CHECK_UARCH(arch, 0, 6, 5, 14, 8, "Kaby Lake", UARCH_KABY_LAKE, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 5, 14, NA, "Skylake", UARCH_SKYLAKE, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 5, 15, NA, "Goldmont", UARCH_GOLDMONT, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 6, 6, NA, "Palm Cove", UARCH_PALM_COVE, 10) // no spec update; only MSR_CPUID_table* so far
|
||||
CHECK_UARCH(arch, 0, 6, 6, 10, NA, "Sunny Cove", UARCH_SUNNY_COVE, 10) // no spec update; only MSR_CPUID_table* so far
|
||||
CHECK_UARCH(arch, 0, 6, 6, 12, NA, "Sunny Cove", UARCH_SUNNY_COVE, 10) // no spec update; only MSR_CPUID_table* so far
|
||||
CHECK_UARCH(arch, 0, 6, 7, 5, NA, "Airmont", UARCH_AIRMONT, 14) // no spec update; whispers & rumors
|
||||
CHECK_UARCH(arch, 0, 6, 7, 10, NA, "Goldmont Plus", UARCH_GOLDMONT_PLUS, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 7, 13, NA, "Sunny Cove", UARCH_SUNNY_COVE, 10) // no spec update; only MSR_CPUID_table* so far
|
||||
CHECK_UARCH(arch, 0, 6, 7, 14, NA, "Ice Lake", UARCH_ICE_LAKE, 10)
|
||||
CHECK_UARCH(arch, 0, 6, 8, 5, NA, "Knights Mill", UARCH_KNIGHTS_MILL, 14) // no spec update; only MSR_CPUID_table* so far
|
||||
CHECK_UARCH(arch, 0, 6, 8, 6, NA, "Tremont", UARCH_TREMONT, 10) // LX*
|
||||
CHECK_UARCH(arch, 0, 6, 8, 10, NA, "Tremont", UARCH_TREMONT, 10) // no spec update; only geekbench.com example
|
||||
CHECK_UARCH(arch, 0, 6, 8, 12, NA, "Tiger Lake", UARCH_TIGER_LAKE, 10) // instlatx64
|
||||
CHECK_UARCH(arch, 0, 6, 8, 13, NA, "Tiger Lake", UARCH_TIGER_LAKE, 10) // instlatx64
|
||||
CHECK_UARCH(arch, 0, 4, 0, 0, NA, "i80486DX", UARCH_I486, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||
CHECK_UARCH(arch, 0, 4, 0, 1, NA, "i80486DX-50", UARCH_I486, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||
CHECK_UARCH(arch, 0, 4, 0, 2, NA, "i80486SX", UARCH_I486, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||
CHECK_UARCH(arch, 0, 4, 0, 3, NA, "i80486DX2", UARCH_I486, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||
CHECK_UARCH(arch, 0, 4, 0, 4, NA, "i80486SL", UARCH_I486, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||
CHECK_UARCH(arch, 0, 4, 0, 5, NA, "i80486SX2", UARCH_I486, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||
CHECK_UARCH(arch, 0, 4, 0, 7, NA, "i80486DX2WB", UARCH_I486, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||
CHECK_UARCH(arch, 0, 4, 0, 8, NA, "i80486DX4", UARCH_I486, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||
CHECK_UARCH(arch, 0, 4, 0, 9, NA, "i80486DX4WB", UARCH_I486, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||
CHECK_UARCH(arch, 0, 5, 0, 0, NA, "P5", UARCH_P5, 800)
|
||||
CHECK_UARCH(arch, 0, 5, 0, 1, NA, "P5", UARCH_P5, 800)
|
||||
CHECK_UARCH(arch, 0, 5, 0, 2, NA, "P54C", UARCH_P5, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||
CHECK_UARCH(arch, 0, 5, 0, 3, NA, "P24T (Overdrive)", UARCH_P5, 600) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||
CHECK_UARCH(arch, 0, 5, 0, 4, NA, "P55C (MMX)", UARCH_P5_MMX, 350) // https://www.cpu-world.com/CPUs/Pentium/TYPE-Pentium%20MMX.html
|
||||
CHECK_UARCH(arch, 0, 5, 0, 7, NA, "P54C", UARCH_P5, 350) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||
CHECK_UARCH(arch, 0, 5, 0, 8, NA, "Tillamook", UARCH_P5_MMX, 250) // http://instlatx64.atw.hu./
|
||||
CHECK_UARCH(arch, 0, 5, 0, 9, 0, "Lakemont", UARCH_LAKEMONT, 32)
|
||||
CHECK_UARCH(arch, 0, 5, 0, 9, NA, "P5 (MMX)", UARCH_P5_MMX, UNK)
|
||||
CHECK_UARCH(arch, 0, 5, 0, 10, 0, "Lakemont", UARCH_LAKEMONT, 32)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 1, 1, "P6", UARCH_P6_PRO, UNK)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 1, 2, "P6", UARCH_P6_PRO, UNK)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 1, 6, "P6", UARCH_P6_PRO, 350)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 1, 7, "P6", UARCH_P6_PRO, 350)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 1, 9, "P6", UARCH_P6_PRO, 350)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 0, NA, "P6 (Pentium II)", UARCH_P6_PENTIUM_II, UNK)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 1, NA, "P6 (Pentium II)", UARCH_P6_PENTIUM_II, UNK) // process depends on core
|
||||
CHECK_UARCH(arch, 0, 6, 0, 2, NA, "P6 (Pentium II)", UARCH_P6_PENTIUM_II, UNK)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 3, NA, "P6 (Klamath)", UARCH_P6_PENTIUM_II, 350) // http://instlatx64.atw.hu.
|
||||
CHECK_UARCH(arch, 0, 6, 0, 4, NA, "P6 (Pentium II)", UARCH_P6_PENTIUM_II, UNK)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 5, NA, "P6 (Deschutes)", UARCH_P6_PENTIUM_II, 250) // http://instlatx64.atw.hu.
|
||||
CHECK_UARCH(arch, 0, 6, 0, 6, NA, "P6 (Dixon)", UARCH_P6_PENTIUM_II, UNK) // http://instlatx64.atw.hu.
|
||||
CHECK_UARCH(arch, 0, 6, 0, 7, NA, "P6 (Katmai)", UARCH_P6_PENTIUM_III, 250) // Core names from: https://en.wikichip.org/wiki/intel/cpuid. NOTE: Xeon core names are different! https://www.techpowerup.com/cpu-specs/?generation=Intel+Pentium+III+Xeon
|
||||
CHECK_UARCH(arch, 0, 6, 0, 8, NA, "P6 (Coppermine)", UARCH_P6_PENTIUM_III, 180) // Also: https://en.wikipedia.org/wiki/Pentium_III
|
||||
CHECK_UARCH(arch, 0, 6, 0, 9, NA, "P6 (Pentium M)", UARCH_P6_PENTIUM_III, 130)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 10, NA, "P6 (Coppermine T)", UARCH_P6_PENTIUM_III, 180)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 11, NA, "P6 (Tualatin)", UARCH_P6_PENTIUM_III, 130)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 13, NA, "Dothan", UARCH_DOTHAN, UNK) // process depends on core
|
||||
CHECK_UARCH(arch, 0, 6, 0, 14, NA, "Yonah", UARCH_YONAH, 65)
|
||||
CHECK_UARCH(arch, 0, 6, 0, 15, NA, "Merom", UARCH_MEROM, 65)
|
||||
CHECK_UARCH(arch, 0, 6, 1, 5, NA, "Dothan", UARCH_DOTHAN, 90)
|
||||
CHECK_UARCH(arch, 0, 6, 1, 6, NA, "Merom", UARCH_MEROM, 65)
|
||||
CHECK_UARCH(arch, 0, 6, 1, 7, NA, "Penryn", UARCH_PENYR, 45)
|
||||
CHECK_UARCH(arch, 0, 6, 1, 10, NA, "Nehalem", UARCH_NEHALEM, 45)
|
||||
CHECK_UARCH(arch, 0, 6, 1, 12, NA, "Bonnell", UARCH_BONNELL, 45)
|
||||
CHECK_UARCH(arch, 0, 6, 1, 13, NA, "Penryn", UARCH_PENYR, 45)
|
||||
CHECK_UARCH(arch, 0, 6, 1, 14, NA, "Nehalem", UARCH_NEHALEM, 45)
|
||||
CHECK_UARCH(arch, 0, 6, 1, 15, NA, "Nehalem", UARCH_NEHALEM, 45)
|
||||
CHECK_UARCH(arch, 0, 6, 2, 5, NA, "Westmere", UARCH_WESTMERE, 32)
|
||||
CHECK_UARCH(arch, 0, 6, 2 , 6, NA, "Bonnell", UARCH_BONNELL, 45)
|
||||
CHECK_UARCH(arch, 0, 6, 2, 7, NA, "Saltwell", UARCH_SALTWELL, 32)
|
||||
CHECK_UARCH(arch, 0, 6, 2, 10, NA, "Sandy Bridge", UARCH_SANDY_BRIDGE, 32)
|
||||
CHECK_UARCH(arch, 0, 6, 2, 12, NA, "Westmere", UARCH_WESTMERE, 32)
|
||||
CHECK_UARCH(arch, 0, 6, 2, 13, NA, "Sandy Bridge", UARCH_SANDY_BRIDGE, 32)
|
||||
CHECK_UARCH(arch, 0, 6, 2, 14, NA, "Nehalem", UARCH_NEHALEM, 45)
|
||||
CHECK_UARCH(arch, 0, 6, 2, 15, NA, "Westmere", UARCH_WESTMERE, 32)
|
||||
CHECK_UARCH(arch, 0, 6, 3, 5, NA, "Saltwell", UARCH_SALTWELL, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 3, 6, NA, "Saltwell", UARCH_SALTWELL, 32)
|
||||
CHECK_UARCH(arch, 0, 6, 3, 7, NA, "Silvermont", UARCH_SILVERMONT, 22)
|
||||
CHECK_UARCH(arch, 0, 6, 3, 10, NA, "Ivy Bridge", UARCH_IVY_BRIDGE, 22)
|
||||
CHECK_UARCH(arch, 0, 6, 3, 12, NA, "Haswell", UARCH_HASWELL, 22)
|
||||
CHECK_UARCH(arch, 0, 6, 3, 13, NA, "Broadwell", UARCH_BROADWELL, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 3, 14, NA, "Ivy Bridge", UARCH_IVY_BRIDGE, 22)
|
||||
CHECK_UARCH(arch, 0, 6, 3, 15, NA, "Haswell", UARCH_HASWELL, 22)
|
||||
CHECK_UARCH(arch, 0, 6, 4, 5, NA, "Haswell", UARCH_HASWELL, 22)
|
||||
CHECK_UARCH(arch, 0, 6, 4, 6, NA, "Haswell", UARCH_HASWELL, 22)
|
||||
CHECK_UARCH(arch, 0, 6, 4, 7, NA, "Broadwell", UARCH_BROADWELL, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 4, 10, NA, "Silvermont", UARCH_SILVERMONT, 22) // no docs, but /proc/cpuinfo seen in wild
|
||||
CHECK_UARCH(arch, 0, 6, 4, 12, NA, "Airmont", UARCH_AIRMONT, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 4, 13, NA, "Silvermont", UARCH_SILVERMONT, 22)
|
||||
CHECK_UARCH(arch, 0, 6, 4, 14, 8, "Kaby Lake", UARCH_KABY_LAKE, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 4, 14, NA, "Skylake", UARCH_SKYLAKE, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 4, 15, NA, "Broadwell", UARCH_BROADWELL, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 5, 5, 6, "Cascade Lake", UARCH_CASCADE_LAKE, 14) // no docs, but example from Greg Stewart
|
||||
CHECK_UARCH(arch, 0, 6, 5, 5, 7, "Cascade Lake", UARCH_CASCADE_LAKE, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 5, 5, 10, "Cooper Lake", UARCH_COOPER_LAKE, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 5, 5, NA, "Skylake", UARCH_SKYLAKE, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 5, 6, NA, "Broadwell", UARCH_BROADWELL, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 5, 7, NA, "Knights Landing", UARCH_KNIGHTS_LANDING, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 5, 10, NA, "Silvermont", UARCH_SILVERMONT, 22) // no spec update; only MSR_CPUID_table* so far
|
||||
CHECK_UARCH(arch, 0, 6, 5, 12, NA, "Goldmont", UARCH_GOLDMONT, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 5, 13, NA, "Silvermont", UARCH_SILVERMONT, 22) // no spec update; only MSR_CPUID_table* so far
|
||||
CHECK_UARCH(arch, 0, 6, 5, 14, 8, "Kaby Lake", UARCH_KABY_LAKE, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 5, 14, NA, "Skylake", UARCH_SKYLAKE, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 5, 15, NA, "Goldmont", UARCH_GOLDMONT, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 6, 6, NA, "Palm Cove", UARCH_PALM_COVE, 10) // no spec update; only MSR_CPUID_table* so far
|
||||
CHECK_UARCH(arch, 0, 6, 6, 10, NA, "Sunny Cove", UARCH_SUNNY_COVE, 10) // no spec update; only MSR_CPUID_table* so far
|
||||
CHECK_UARCH(arch, 0, 6, 6, 12, NA, "Sunny Cove", UARCH_SUNNY_COVE, 10) // no spec update; only MSR_CPUID_table* so far
|
||||
CHECK_UARCH(arch, 0, 6, 7, 5, NA, "Airmont", UARCH_AIRMONT, 14) // no spec update; whispers & rumors
|
||||
CHECK_UARCH(arch, 0, 6, 7, 10, NA, "Goldmont Plus", UARCH_GOLDMONT_PLUS, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 7, 13, NA, "Sunny Cove", UARCH_SUNNY_COVE, 10) // no spec update; only MSR_CPUID_table* so far
|
||||
CHECK_UARCH(arch, 0, 6, 7, 14, NA, "Ice Lake", UARCH_ICE_LAKE, 10)
|
||||
CHECK_UARCH(arch, 0, 6, 8, 5, NA, "Knights Mill", UARCH_KNIGHTS_MILL, 14) // no spec update; only MSR_CPUID_table* so far
|
||||
CHECK_UARCH(arch, 0, 6, 8, 6, NA, "Tremont", UARCH_TREMONT, 10) // LX*
|
||||
CHECK_UARCH(arch, 0, 6, 8, 10, NA, "Tremont", UARCH_TREMONT, 10) // no spec update; only geekbench.com example
|
||||
CHECK_UARCH(arch, 0, 6, 8, 12, NA, "Tiger Lake", UARCH_TIGER_LAKE, 10) // instlatx64
|
||||
CHECK_UARCH(arch, 0, 6, 8, 13, NA, "Tiger Lake", UARCH_TIGER_LAKE, 10) // instlatx64
|
||||
// CHECK_UARCH(arch, 0, 6, 8, 14, 9, ...) It is not possible to determine uarch only from CPUID dump (can be Kaby Lake or Amber Lake)
|
||||
CHECK_UARCH(arch, 0, 6, 8, 14, 10, "Coffee Lake", UARCH_COFFEE_LAKE, 14) // wikichip
|
||||
CHECK_UARCH(arch, 0, 6, 8, 14, 11, "Whiskey Lake", UARCH_WHISKEY_LAKE, 14) // wikichip
|
||||
CHECK_UARCH(arch, 0, 6, 8, 14, 12, "Comet Lake", UARCH_COMET_LAKE, 14) // wikichip
|
||||
CHECK_UARCH(arch, 0, 6, 9, 6, NA, "Tremont", UARCH_TREMONT, 10) // LX*
|
||||
CHECK_UARCH(arch, 0, 6, 9, 7, NA, "Alder Lake", UARCH_ALDER_LAKE, 10) // instlatx64 (Alder Lake-S)
|
||||
CHECK_UARCH(arch, 0, 6, 9, 10, NA, "Alder Lake", UARCH_ALDER_LAKE, 10) // instlatx64 (Alder Lake-P)
|
||||
CHECK_UARCH(arch, 0, 6, 9, 12, NA, "Tremont", UARCH_TREMONT, 10) // LX*
|
||||
CHECK_UARCH(arch, 0, 6, 9, 13, NA, "Sunny Cove", UARCH_SUNNY_COVE, 10) // LX*
|
||||
CHECK_UARCH(arch, 0, 6, 9, 14, 9, "Kaby Lake", UARCH_KABY_LAKE, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 9, 14, 10, "Coffee Lake", UARCH_COFFEE_LAKE, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 9, 14, 11, "Coffee Lake", UARCH_COFFEE_LAKE, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 9, 14, 12, "Coffee Lake", UARCH_COFFEE_LAKE, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 9, 14, 13, "Coffee Lake", UARCH_COFFEE_LAKE, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 10, 5, NA, "Comet Lake", UARCH_COMET_LAKE, 14) // wikichip
|
||||
CHECK_UARCH(arch, 0, 6, 10, 6, NA, "Comet Lake", UARCH_COMET_LAKE, 14) // instlatx64.atw.hu (i7-10710U)
|
||||
CHECK_UARCH(arch, 0, 6, 10, 7, NA, "Rocket Lake", UARCH_ROCKET_LAKE, 14) // instlatx64.atw.hu (i7-11700K)
|
||||
CHECK_UARCH(arch, 0, 6, 11, 7, NA, "Raptor Lake", UARCH_RAPTOR_LAKE, 10) // instlatx64.atw.hu (i5-13600K)
|
||||
CHECK_UARCH(arch, 0, 11, 0, 0, NA, "Knights Ferry", UARCH_KNIGHTS_FERRY, 45) // found only on en.wikichip.org
|
||||
CHECK_UARCH(arch, 0, 11, 0, 1, NA, "Knights Corner", UARCH_KNIGHTS_CORNER, 22)
|
||||
CHECK_UARCH(arch, 0, 15, 0, 0, NA, "Willamette", UARCH_WILLAMETTE, 180)
|
||||
CHECK_UARCH(arch, 0, 15, 0, 1, NA, "Willamette", UARCH_WILLAMETTE, 180)
|
||||
CHECK_UARCH(arch, 0, 15, 0, 2, NA, "Northwood", UARCH_NORTHWOOD, 130)
|
||||
CHECK_UARCH(arch, 0, 15, 0, 3, NA, "Prescott", UARCH_PRESCOTT, 90)
|
||||
CHECK_UARCH(arch, 0, 15, 0, 4, NA, "Prescott", UARCH_PRESCOTT, 90)
|
||||
CHECK_UARCH(arch, 0, 15, 0, 6, NA, "Cedar Mill", UARCH_CEDAR_MILL, 65)
|
||||
CHECK_UARCH(arch, 1, 15, 0, 0, NA, "Itanium2", UARCH_ITANIUM2, 180)
|
||||
CHECK_UARCH(arch, 1, 15, 0, 1, NA, "Itanium2", UARCH_ITANIUM2, 130)
|
||||
CHECK_UARCH(arch, 1, 15, 0, 2, NA, "Itanium2", UARCH_ITANIUM2, 130)
|
||||
// CHECK_UARCH(arch, 0, 6, 8, 14, 10, ...) It is not possible to determine uarch only from CPUID dump (can be Kaby Lake R or Coffee Lake U)
|
||||
CHECK_UARCH(arch, 0, 6, 8, 14, 11, "Whiskey Lake", UARCH_WHISKEY_LAKE, 14) // wikichip
|
||||
CHECK_UARCH(arch, 0, 6, 8, 14, 12, "Comet Lake", UARCH_COMET_LAKE, 14) // wikichip
|
||||
CHECK_UARCH(arch, 0, 6, 9, 6, NA, "Tremont", UARCH_TREMONT, 10) // LX*
|
||||
CHECK_UARCH(arch, 0, 6, 9, 7, NA, "Alder Lake", UARCH_ALDER_LAKE, 10) // instlatx64 (Alder Lake-S)
|
||||
CHECK_UARCH(arch, 0, 6, 9, 10, NA, "Alder Lake", UARCH_ALDER_LAKE, 10) // instlatx64 (Alder Lake-P)
|
||||
CHECK_UARCH(arch, 0, 6, 9, 12, NA, "Tremont", UARCH_TREMONT, 10) // LX*
|
||||
CHECK_UARCH(arch, 0, 6, 9, 13, NA, "Sunny Cove", UARCH_SUNNY_COVE, 10) // LX*
|
||||
CHECK_UARCH(arch, 0, 6, 9, 14, 9, "Kaby Lake", UARCH_KABY_LAKE, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 9, 14, 10, "Coffee Lake", UARCH_COFFEE_LAKE, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 9, 14, 11, "Coffee Lake", UARCH_COFFEE_LAKE, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 9, 14, 12, "Coffee Lake", UARCH_COFFEE_LAKE, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 9, 14, 13, "Coffee Lake", UARCH_COFFEE_LAKE, 14)
|
||||
CHECK_UARCH(arch, 0, 6, 10, 5, NA, "Comet Lake", UARCH_COMET_LAKE, 14) // wikichip
|
||||
CHECK_UARCH(arch, 0, 6, 10, 6, NA, "Comet Lake", UARCH_COMET_LAKE, 14) // instlatx64.atw.hu (i7-10710U)
|
||||
CHECK_UARCH(arch, 0, 6, 10, 7, NA, "Rocket Lake", UARCH_ROCKET_LAKE, 14) // instlatx64.atw.hu (i7-11700K)
|
||||
CHECK_UARCH(arch, 0, 6, 11, 7, NA, "Raptor Lake", UARCH_RAPTOR_LAKE, 10) // instlatx64.atw.hu (i5-13600K)
|
||||
CHECK_UARCH(arch, 0, 6, 11, 10, NA, "Raptor Lake", UARCH_RAPTOR_LAKE, 10) // instlatx64.atw.hu (i7-1370P)
|
||||
CHECK_UARCH(arch, 0, 6, 11, 14, NA, "Alder Lake", UARCH_ALDER_LAKE, 10) // instlatx64.atw.hu (Alder Lake-N)
|
||||
CHECK_UARCH(arch, 0, 6, 11, 15, NA, "Raptor Lake", UARCH_RAPTOR_LAKE, 10) // instlatx64.atw.hu (i5-13500)
|
||||
CHECK_UARCH(arch, 0, 11, 0, 0, NA, "Knights Ferry", UARCH_KNIGHTS_FERRY, 45) // found only on en.wikichip.org
|
||||
CHECK_UARCH(arch, 0, 11, 0, 1, NA, "Knights Corner", UARCH_KNIGHTS_CORNER, 22)
|
||||
CHECK_UARCH(arch, 0, 15, 0, 0, NA, "Willamette", UARCH_WILLAMETTE, 180)
|
||||
CHECK_UARCH(arch, 0, 15, 0, 1, NA, "Willamette", UARCH_WILLAMETTE, 180)
|
||||
CHECK_UARCH(arch, 0, 15, 0, 2, NA, "Northwood", UARCH_NORTHWOOD, 130)
|
||||
CHECK_UARCH(arch, 0, 15, 0, 3, NA, "Prescott", UARCH_PRESCOTT, 90)
|
||||
CHECK_UARCH(arch, 0, 15, 0, 4, NA, "Prescott", UARCH_PRESCOTT, 90)
|
||||
CHECK_UARCH(arch, 0, 15, 0, 6, NA, "Cedar Mill", UARCH_CEDAR_MILL, 65)
|
||||
CHECK_UARCH(arch, 1, 15, 0, 0, NA, "Itanium2", UARCH_ITANIUM2, 180)
|
||||
CHECK_UARCH(arch, 1, 15, 0, 1, NA, "Itanium2", UARCH_ITANIUM2, 130)
|
||||
CHECK_UARCH(arch, 1, 15, 0, 2, NA, "Itanium2", UARCH_ITANIUM2, 130)
|
||||
UARCH_END
|
||||
|
||||
return arch;
|
||||
}
|
||||
|
||||
@@ -273,11 +297,16 @@ struct uarch* get_uarch_from_cpuid_amd(uint32_t ef, uint32_t f, uint32_t em, uin
|
||||
// ----------------------------------------------------------------------------- //
|
||||
// EF F EM M S //
|
||||
UARCH_START
|
||||
CHECK_UARCH(arch, 0, 4, 0, 3, NA, "Am486", UARCH_AM486, UNK)
|
||||
CHECK_UARCH(arch, 0, 4, 0, 7, NA, "Am486", UARCH_AM486, UNK)
|
||||
CHECK_UARCH(arch, 0, 4, 0, 8, NA, "Am486", UARCH_AM486, UNK)
|
||||
CHECK_UARCH(arch, 0, 4, 0, 9, NA, "Am486", UARCH_AM486, UNK)
|
||||
CHECK_UARCH(arch, 0, 4, NA, NA, NA, "Am5x86", UARCH_AM5X86, UNK)
|
||||
CHECK_UARCH(arch, 0, 4, 0, 3, NA, "Am486DX2", UARCH_AM486, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||
CHECK_UARCH(arch, 0, 4, 0, 7, NA, "Am486DX2WB", UARCH_AM486, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||
CHECK_UARCH(arch, 0, 4, 0, 8, NA, "Am486DX4", UARCH_AM486, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||
CHECK_UARCH(arch, 0, 4, 0, 9, NA, "Am486DX4WB", UARCH_AM486, UNK) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||
CHECK_UARCH(arch, 0, 4, 0, 14, NA, "Am5x86", UARCH_AM5X86, 350) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||
CHECK_UARCH(arch, 0, 4, 0, 15, NA, "Am5x86WB", UARCH_AM5X86, 350) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||
CHECK_UARCH(arch, 0, 5, 0, 0, NA, "SSA5 (K5)", UARCH_SSA5, 350) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||
CHECK_UARCH(arch, 0, 5, 0, 1, NA, "K5", UARCH_K5, 350) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||
CHECK_UARCH(arch, 0, 5, 0, 2, NA, "K5", UARCH_K5, 350) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||
CHECK_UARCH(arch, 0, 5, 0, 3, NA, "K5", UARCH_K5, 350) // https://sandpile.org/x86/cpuid.htm#level_0000_0001h
|
||||
CHECK_UARCH(arch, 0, 5, 0, 6, NA, "K6", UARCH_K6, 300)
|
||||
CHECK_UARCH(arch, 0, 5, 0, 7, NA, "K6", UARCH_K6, 250) // *p from sandpile.org
|
||||
CHECK_UARCH(arch, 0, 5, 0, 10, NA, "K7", UARCH_K7, 130) // Geode NX
|
||||
@@ -348,6 +377,7 @@ struct uarch* get_uarch_from_cpuid_amd(uint32_t ef, uint32_t f, uint32_t em, uin
|
||||
CHECK_UARCH(arch, 6, 15, 6, 5, NA, "Excavator", UARCH_EXCAVATOR, 28) // undocumented, but sample from Alexandros Couloumbis
|
||||
CHECK_UARCH(arch, 6, 15, 7, 0, NA, "Excavator", UARCH_EXCAVATOR, 28)
|
||||
CHECK_UARCH(arch, 7, 15, 0, 0, NA, "Jaguar", UARCH_JAGUAR, 28)
|
||||
CHECK_UARCH(arch, 7, 15, 1, NA, NA, "Jaguar", UARCH_JAGUAR, 14) // instlatx64 (PS4) Normal PS4 is 28nm, Slim and Pro are 16nm
|
||||
CHECK_UARCH(arch, 7, 15, 2, 6, NA, "Jaguar", UARCH_JAGUAR, 28) // AMD Cato (Xbox One?)
|
||||
CHECK_UARCH(arch, 7, 15, 3, 0, NA, "Puma 2014", UARCH_PUMA_2014, 28)
|
||||
CHECK_UARCH(arch, 8, 15, 0, 0, NA, "Zen", UARCH_ZEN, 14) // instlatx64 engr sample
|
||||
@@ -362,12 +392,43 @@ struct uarch* get_uarch_from_cpuid_amd(uint32_t ef, uint32_t f, uint32_t em, uin
|
||||
CHECK_UARCH(arch, 8, 15, 6, 0, NA, "Zen 2", UARCH_ZEN2, 7) // undocumented, geekbench.com example
|
||||
CHECK_UARCH(arch, 8, 15, 6, 8, NA, "Zen 2", UARCH_ZEN2, 7) // found on instlatx64
|
||||
CHECK_UARCH(arch, 8, 15, 7, 1, NA, "Zen 2", UARCH_ZEN2, 7) // samples from Steven Noonan and instlatx64
|
||||
CHECK_UARCH(arch, 8, 15, 8, 4, NA, "Zen 2", UARCH_ZEN2, 7) // instlatx64 (Xbox Series X?)
|
||||
CHECK_UARCH(arch, 8, 15, 9, 0, 2, "Zen 2", UARCH_ZEN2, 7) // Steam Deck (instlatx64)
|
||||
CHECK_UARCH(arch, 8, 15, 10, 0, NA, "Zen 2", UARCH_ZEN2, 6) // instlatx64
|
||||
CHECK_UARCH(arch, 10, 15, 0, 1, NA, "Zen 3", UARCH_ZEN3, 7) // instlatx64
|
||||
CHECK_UARCH(arch, 10, 15, 0, 8, NA, "Zen 3", UARCH_ZEN3, 7) // instlatx64
|
||||
CHECK_UARCH(arch, 10, 15, 1, 1, NA, "Zen 4", UARCH_ZEN4, 5) // instlatx64
|
||||
CHECK_UARCH(arch, 10, 15, 1, 8, NA, "Zen 4", UARCH_ZEN4, 5) // instlatx64
|
||||
CHECK_UARCH(arch, 10, 15, 2, 1, NA, "Zen 3", UARCH_ZEN3, 7) // instlatx64
|
||||
CHECK_UARCH(arch, 10, 15, 3, NA, NA, "Zen 3", UARCH_ZEN3, 7) // instlatx64
|
||||
CHECK_UARCH(arch, 10, 15, 4, 4, NA, "Zen 3+", UARCH_ZEN3_PLUS, 6) // instlatx64 (they say it is Zen3...)
|
||||
CHECK_UARCH(arch, 10, 15, 5, 0, NA, "Zen 3", UARCH_ZEN3, 7) // instlatx64
|
||||
CHECK_UARCH(arch, 10, 15, 6, 1, 2, "Zen 4", UARCH_ZEN4, 5) // instlatx64
|
||||
CHECK_UARCH(arch, 10, 15, 7, 4, 1, "Zen 4", UARCH_ZEN4, 4) // instlatx64
|
||||
CHECK_UARCH(arch, 10, 15, 7, 5, 2, "Zen 4", UARCH_ZEN4, 4) // instlatx64
|
||||
CHECK_UARCH(arch, 10, 15, 7, 8, 0, "Zen 4", UARCH_ZEN4, 4) // instlatx64
|
||||
CHECK_UARCH(arch, 10, 15, 8, NA, NA, "Zen 4", UARCH_ZEN4, 5) // instlatx64 (AMD MI300C)
|
||||
CHECK_UARCH(arch, 10, 15, 9, NA, NA, "Zen 4", UARCH_ZEN4, 5) // instlatx64 (AMD MI300A)
|
||||
CHECK_UARCH(arch, 10, 15, 10, NA, NA, "Zen 4c", UARCH_ZEN4C, 5) // instlatx64
|
||||
UARCH_END
|
||||
|
||||
return arch;
|
||||
}
|
||||
|
||||
struct uarch* get_uarch_from_cpuid_hygon(uint32_t ef, uint32_t f, uint32_t em, uint32_t m, int s) {
|
||||
struct uarch* arch = emalloc(sizeof(struct uarch));
|
||||
|
||||
// EF: Extended Family //
|
||||
// F: Family //
|
||||
// EM: Extended Model //
|
||||
// M: Model //
|
||||
// S: Stepping //
|
||||
// ----------------------------------------------------------------------------- //
|
||||
// EF F EM M S //
|
||||
UARCH_START
|
||||
// https://www.phoronix.com/news/Hygon-Dhyana-AMD-China-CPUs
|
||||
CHECK_UARCH(arch, 9, 15, 0, 1, NA, "Zen", UARCH_ZEN, UNK) // https://github.com/Dr-Noob/cpufetch/issues/244
|
||||
// CHECK_UARCH(arch, 9, 15, 0, 2, NA, "???", ?????????, UNK) // http://instlatx64.atw.hu/
|
||||
UARCH_END
|
||||
|
||||
return arch;
|
||||
@@ -375,10 +436,16 @@ struct uarch* get_uarch_from_cpuid_amd(uint32_t ef, uint32_t f, uint32_t em, uin
|
||||
|
||||
struct uarch* get_uarch_from_cpuid(struct cpuInfo* cpu, uint32_t dump, uint32_t ef, uint32_t f, uint32_t em, uint32_t m, int s) {
|
||||
if(cpu->cpu_vendor == CPU_VENDOR_INTEL) {
|
||||
struct uarch* arch = emalloc(sizeof(struct uarch));
|
||||
if(dump == 0x000806E9) {
|
||||
// It is not possible to determine uarch only from CPUID dump (can be Kaby Lake or Amber Lake)
|
||||
struct uarch* arch = emalloc(sizeof(struct uarch));
|
||||
if (cpu->cpu_name == NULL) {
|
||||
printErr("Unable to find uarch without CPU name");
|
||||
fill_uarch(arch, STRING_UNKNOWN, UARCH_UNKNOWN, UNK);
|
||||
return arch;
|
||||
}
|
||||
|
||||
// It is not possible to determine uarch only from CPUID dump (can be Kaby Lake or Amber Lake)
|
||||
// See issue https://github.com/Dr-Noob/cpufetch/issues/122
|
||||
if(strstr(cpu->cpu_name, "Y") != NULL) {
|
||||
fill_uarch(arch, "Amber Lake", UARCH_AMBER_LAKE, 14);
|
||||
}
|
||||
@@ -388,14 +455,107 @@ struct uarch* get_uarch_from_cpuid(struct cpuInfo* cpu, uint32_t dump, uint32_t
|
||||
|
||||
return arch;
|
||||
}
|
||||
else if (dump == 0x000806EA) {
|
||||
if (cpu->cpu_name == NULL) {
|
||||
printErr("Unable to find uarch without CPU name");
|
||||
fill_uarch(arch, STRING_UNKNOWN, UARCH_UNKNOWN, UNK);
|
||||
return arch;
|
||||
}
|
||||
|
||||
// It is not possible to determine uarch only from CPUID dump (can be Kaby Lake R or Coffee Lake U)
|
||||
// See issue https://github.com/Dr-Noob/cpufetch/issues/149
|
||||
if(strstr(cpu->cpu_name, "i5-8250U") != NULL ||
|
||||
strstr(cpu->cpu_name, "i5-8350U") != NULL ||
|
||||
strstr(cpu->cpu_name, "i7-8550U") != NULL ||
|
||||
strstr(cpu->cpu_name, "i7-8650U") != NULL) {
|
||||
fill_uarch(arch, "Kaby Lake", UARCH_KABY_LAKE, 14);
|
||||
}
|
||||
else {
|
||||
fill_uarch(arch, "Coffee Lake", UARCH_COFFEE_LAKE, 14);
|
||||
}
|
||||
|
||||
return arch;
|
||||
}
|
||||
return get_uarch_from_cpuid_intel(ef, f, em, m, s);
|
||||
}
|
||||
else
|
||||
else if(cpu->cpu_vendor == CPU_VENDOR_AMD) {
|
||||
return get_uarch_from_cpuid_amd(ef, f, em, m, s);
|
||||
}
|
||||
else if(cpu->cpu_vendor == CPU_VENDOR_HYGON) {
|
||||
return get_uarch_from_cpuid_hygon(ef, f, em, m, s);
|
||||
}
|
||||
else {
|
||||
printBug("Invalid CPU vendor: %d", cpu->cpu_vendor);
|
||||
return NULL;
|
||||
}
|
||||
}
|
||||
|
||||
// If we cannot get the CPU name from CPUID, try to infer it from uarch
|
||||
char* infer_cpu_name_from_uarch(struct uarch* arch) {
|
||||
char* cpu_name = NULL;
|
||||
if (arch == NULL) {
|
||||
printErr("infer_cpu_name_from_uarch: Unable to find CPU name");
|
||||
cpu_name = ecalloc(strlen(STRING_UNKNOWN) + 1, sizeof(char));
|
||||
strcpy(cpu_name, STRING_UNKNOWN);
|
||||
return cpu_name;
|
||||
}
|
||||
|
||||
char *str = NULL;
|
||||
|
||||
switch (arch->uarch) {
|
||||
// Intel
|
||||
case UARCH_I486:
|
||||
str = "Intel 486";
|
||||
break;
|
||||
case UARCH_P5:
|
||||
str = "Intel Pentium";
|
||||
break;
|
||||
case UARCH_P5_MMX:
|
||||
str = "Intel Pentium MMX";
|
||||
break;
|
||||
case UARCH_P6_PRO:
|
||||
str = "Intel Pentium Pro";
|
||||
break;
|
||||
case UARCH_P6_PENTIUM_II:
|
||||
str = "Intel Pentium II";
|
||||
break;
|
||||
case UARCH_P6_PENTIUM_III:
|
||||
str = "Intel Pentium III";
|
||||
break;
|
||||
|
||||
// AMD
|
||||
case UARCH_AM486:
|
||||
str = "AMD 486";
|
||||
break;
|
||||
case UARCH_AM5X86:
|
||||
str = "AMD 5x86";
|
||||
break;
|
||||
case UARCH_SSA5:
|
||||
str = "AMD 5k86";
|
||||
break;
|
||||
|
||||
default:
|
||||
printErr("Unable to find name from uarch: %d", arch->uarch);
|
||||
break;
|
||||
}
|
||||
|
||||
if (str == NULL) {
|
||||
cpu_name = ecalloc(strlen(STRING_UNKNOWN) + 1, sizeof(char));
|
||||
strcpy(cpu_name, STRING_UNKNOWN);
|
||||
}
|
||||
else {
|
||||
cpu_name = ecalloc(strlen(str) + 1, sizeof(char));
|
||||
strcpy(cpu_name, str);
|
||||
}
|
||||
|
||||
return cpu_name;
|
||||
}
|
||||
|
||||
bool vpus_are_AVX512(struct cpuInfo* cpu) {
|
||||
return cpu->arch->uarch != UARCH_ICE_LAKE && cpu->arch->uarch != UARCH_TIGER_LAKE;
|
||||
return cpu->arch->uarch != UARCH_ICE_LAKE &&
|
||||
cpu->arch->uarch != UARCH_TIGER_LAKE &&
|
||||
cpu->arch->uarch != UARCH_ZEN4 &&
|
||||
cpu->arch->uarch != UARCH_ZEN4C;
|
||||
}
|
||||
|
||||
bool is_knights_landing(struct cpuInfo* cpu) {
|
||||
@@ -431,6 +591,7 @@ int get_number_of_vpus(struct cpuInfo* cpu) {
|
||||
case UARCH_ZEN3:
|
||||
case UARCH_ZEN3_PLUS:
|
||||
case UARCH_ZEN4:
|
||||
case UARCH_ZEN4C:
|
||||
return 2;
|
||||
default:
|
||||
return 1;
|
||||
@@ -460,9 +621,6 @@ char* get_str_process(struct cpuInfo* cpu) {
|
||||
if(process == UNK) {
|
||||
snprintf(str, strlen(STRING_UNKNOWN)+1, STRING_UNKNOWN);
|
||||
}
|
||||
else if(process > 100) {
|
||||
sprintf(str, "%.2fum", (double)process/100);
|
||||
}
|
||||
else if(process > 0){
|
||||
sprintf(str, "%dnm", process);
|
||||
}
|
||||
|
||||
@@ -8,6 +8,7 @@
|
||||
struct uarch;
|
||||
|
||||
struct uarch* get_uarch_from_cpuid(struct cpuInfo* cpu, uint32_t dump, uint32_t ef, uint32_t f, uint32_t em, uint32_t m, int s);
|
||||
char* infer_cpu_name_from_uarch(struct uarch* arch);
|
||||
bool vpus_are_AVX512(struct cpuInfo* cpu);
|
||||
bool is_knights_landing(struct cpuInfo* cpu);
|
||||
int get_number_of_vpus(struct cpuInfo* cpu);
|
||||
|
||||
Reference in New Issue
Block a user