mirror of
https://github.com/google/cpu_features.git
synced 2025-04-28 07:23:37 +02:00
1012 lines
35 KiB
C
1012 lines
35 KiB
C
// Copyright 2017 Google Inc.
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
#include "cpuinfo_x86.h"
|
|
#include "internal/bit_utils.h"
|
|
#include "internal/cpuid_x86.h"
|
|
|
|
#include <stdbool.h>
|
|
#include <string.h>
|
|
|
|
#if !defined(CPU_FEATURES_ARCH_X86)
|
|
#error "Cannot compile cpuinfo_x86 on a non x86 platform."
|
|
#endif
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
// Definitions for CpuId and GetXCR0Eax.
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
#if defined(CPU_FEATURES_MOCK_CPUID_X86)
|
|
// Implementation will be provided by test/cpuinfo_x86_test.cc.
|
|
#elif defined(CPU_FEATURES_COMPILER_CLANG) || defined(CPU_FEATURES_COMPILER_GCC)
|
|
|
|
#include <cpuid.h>
|
|
|
|
Leaf CpuIdEx(uint32_t leaf_id, int ecx) {
|
|
Leaf leaf;
|
|
__cpuid_count(leaf_id, ecx, leaf.eax, leaf.ebx, leaf.ecx, leaf.edx);
|
|
return leaf;
|
|
}
|
|
|
|
uint32_t GetXCR0Eax(void) {
|
|
uint32_t eax, edx;
|
|
/* named form of xgetbv not supported on OSX, so must use byte form, see:
|
|
https://github.com/asmjit/asmjit/issues/78
|
|
*/
|
|
__asm(".byte 0x0F, 0x01, 0xd0" : "=a"(eax), "=d"(edx) : "c"(0));
|
|
return eax;
|
|
}
|
|
|
|
#elif defined(CPU_FEATURES_COMPILER_MSC)
|
|
|
|
#include <immintrin.h>
|
|
#include <intrin.h> // For __cpuidex()
|
|
|
|
Leaf CpuIdEx(uint32_t leaf_id, int ecx) {
|
|
Leaf leaf;
|
|
int data[4];
|
|
__cpuidex(data, leaf_id, ecx);
|
|
leaf.eax = data[0];
|
|
leaf.ebx = data[1];
|
|
leaf.ecx = data[2];
|
|
leaf.edx = data[3];
|
|
return leaf;
|
|
}
|
|
|
|
uint32_t GetXCR0Eax(void) { return (uint32_t)_xgetbv(0); }
|
|
|
|
#else
|
|
#error "Unsupported compiler, x86 cpuid requires either GCC, Clang or MSVC."
|
|
#endif
|
|
|
|
static Leaf CpuId(uint32_t leaf_id) { return CpuIdEx(leaf_id, 0); }
|
|
|
|
static const Leaf kEmptyLeaf;
|
|
|
|
static Leaf SafeCpuIdEx(uint32_t max_cpuid_leaf, uint32_t leaf_id, int ecx) {
|
|
if (leaf_id <= max_cpuid_leaf) {
|
|
return CpuIdEx(leaf_id, ecx);
|
|
} else {
|
|
return kEmptyLeaf;
|
|
}
|
|
}
|
|
|
|
static Leaf SafeCpuId(uint32_t max_cpuid_leaf, uint32_t leaf_id) {
|
|
return SafeCpuIdEx(max_cpuid_leaf, leaf_id, 0);
|
|
}
|
|
|
|
#define MASK_XMM 0x2
|
|
#define MASK_YMM 0x4
|
|
#define MASK_MASKREG 0x20
|
|
#define MASK_ZMM0_15 0x40
|
|
#define MASK_ZMM16_31 0x80
|
|
|
|
static bool HasMask(uint32_t value, uint32_t mask) {
|
|
return (value & mask) == mask;
|
|
}
|
|
|
|
// Checks that operating system saves and restores xmm registers during context
|
|
// switches.
|
|
static bool HasXmmOsXSave(uint32_t xcr0_eax) {
|
|
return HasMask(xcr0_eax, MASK_XMM);
|
|
}
|
|
|
|
// Checks that operating system saves and restores ymm registers during context
|
|
// switches.
|
|
static bool HasYmmOsXSave(uint32_t xcr0_eax) {
|
|
return HasMask(xcr0_eax, MASK_XMM | MASK_YMM);
|
|
}
|
|
|
|
// Checks that operating system saves and restores zmm registers during context
|
|
// switches.
|
|
static bool HasZmmOsXSave(uint32_t xcr0_eax) {
|
|
return HasMask(xcr0_eax, MASK_XMM | MASK_YMM | MASK_MASKREG | MASK_ZMM0_15 |
|
|
MASK_ZMM16_31);
|
|
}
|
|
|
|
static void SetVendor(const Leaf leaf, char* const vendor) {
|
|
*(uint32_t*)(vendor) = leaf.ebx;
|
|
*(uint32_t*)(vendor + 4) = leaf.edx;
|
|
*(uint32_t*)(vendor + 8) = leaf.ecx;
|
|
vendor[12] = '\0';
|
|
}
|
|
|
|
static int IsVendor(const Leaf leaf, const char* const name) {
|
|
const uint32_t ebx = *(const uint32_t*)(name);
|
|
const uint32_t edx = *(const uint32_t*)(name + 4);
|
|
const uint32_t ecx = *(const uint32_t*)(name + 8);
|
|
return leaf.ebx == ebx && leaf.ecx == ecx && leaf.edx == edx;
|
|
}
|
|
|
|
static const CacheLevelInfo kEmptyCacheLevelInfo;
|
|
|
|
static CacheLevelInfo MakeX86CacheLevelInfo(int level, CacheType cache_type,
|
|
int cache_size, int ways,
|
|
int line_size, int entries,
|
|
int partitioning) {
|
|
CacheLevelInfo info;
|
|
info.level = level;
|
|
info.cache_type = cache_type;
|
|
info.cache_size = cache_size;
|
|
info.ways = ways;
|
|
info.line_size = line_size;
|
|
info.tlb_entries = entries;
|
|
info.partitioning = partitioning;
|
|
return info;
|
|
}
|
|
|
|
static CacheLevelInfo GetCacheLevelInfo(const uint32_t reg) {
|
|
const int UNDEF = -1;
|
|
const int KiB = 1024;
|
|
const int MiB = 1024 * KiB;
|
|
switch (reg) {
|
|
case 0x01:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 4 * KiB, 4,
|
|
UNDEF, 32, 0);
|
|
case 0x02:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 4 * MiB, 0xFF,
|
|
UNDEF, 2, 0);
|
|
case 0x03:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 4 * KiB, 4,
|
|
UNDEF, 64, 0);
|
|
case 0x04:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 4 * MiB, 4,
|
|
UNDEF, 8, 0);
|
|
case 0x05:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 4 * MiB, 4,
|
|
UNDEF, 32, 0);
|
|
case 0x06:
|
|
return MakeX86CacheLevelInfo(1, CPU_FEATURE_CACHE_INSTRUCTION, 8 * KiB, 4,
|
|
32, UNDEF, 0);
|
|
case 0x08:
|
|
return MakeX86CacheLevelInfo(1, CPU_FEATURE_CACHE_INSTRUCTION, 16 * KiB,
|
|
4, 32, UNDEF, 0);
|
|
case 0x09:
|
|
return MakeX86CacheLevelInfo(1, CPU_FEATURE_CACHE_INSTRUCTION, 32 * KiB,
|
|
4, 64, UNDEF, 0);
|
|
case 0x0A:
|
|
return MakeX86CacheLevelInfo(1, CPU_FEATURE_CACHE_DATA, 8 * KiB, 2, 32,
|
|
UNDEF, 0);
|
|
case 0x0B:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 4 * MiB, 4,
|
|
UNDEF, 4, 0);
|
|
case 0x0C:
|
|
return MakeX86CacheLevelInfo(1, CPU_FEATURE_CACHE_DATA, 16 * KiB, 4, 32,
|
|
UNDEF, 0);
|
|
case 0x0D:
|
|
return MakeX86CacheLevelInfo(1, CPU_FEATURE_CACHE_DATA, 16 * KiB, 4, 64,
|
|
UNDEF, 0);
|
|
case 0x0E:
|
|
return MakeX86CacheLevelInfo(1, CPU_FEATURE_CACHE_DATA, 24 * KiB, 6, 64,
|
|
UNDEF, 0);
|
|
case 0x1D:
|
|
return MakeX86CacheLevelInfo(2, CPU_FEATURE_CACHE_DATA, 128 * KiB, 2, 64,
|
|
UNDEF, 0);
|
|
case 0x21:
|
|
return MakeX86CacheLevelInfo(2, CPU_FEATURE_CACHE_DATA, 256 * KiB, 8, 64,
|
|
UNDEF, 0);
|
|
case 0x22:
|
|
return MakeX86CacheLevelInfo(3, CPU_FEATURE_CACHE_DATA, 512 * KiB, 4, 64,
|
|
UNDEF, 2);
|
|
case 0x23:
|
|
return MakeX86CacheLevelInfo(3, CPU_FEATURE_CACHE_DATA, 1 * MiB, 8, 64,
|
|
UNDEF, 2);
|
|
case 0x24:
|
|
return MakeX86CacheLevelInfo(2, CPU_FEATURE_CACHE_DATA, 1 * MiB, 16, 64,
|
|
UNDEF, 0);
|
|
case 0x25:
|
|
return MakeX86CacheLevelInfo(3, CPU_FEATURE_CACHE_DATA, 2 * MiB, 8, 64,
|
|
UNDEF, 2);
|
|
case 0x29:
|
|
return MakeX86CacheLevelInfo(3, CPU_FEATURE_CACHE_DATA, 4 * MiB, 8, 64,
|
|
UNDEF, 2);
|
|
case 0x2C:
|
|
return MakeX86CacheLevelInfo(1, CPU_FEATURE_CACHE_DATA, 32 * KiB, 8, 64,
|
|
UNDEF, 0);
|
|
case 0x30:
|
|
return MakeX86CacheLevelInfo(1, CPU_FEATURE_CACHE_INSTRUCTION, 32 * KiB,
|
|
8, 64, UNDEF, 0);
|
|
case 0x40:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_DATA, UNDEF, UNDEF,
|
|
UNDEF, UNDEF, 0);
|
|
case 0x41:
|
|
return MakeX86CacheLevelInfo(2, CPU_FEATURE_CACHE_DATA, 128 * KiB, 4, 32,
|
|
UNDEF, 0);
|
|
case 0x42:
|
|
return MakeX86CacheLevelInfo(2, CPU_FEATURE_CACHE_DATA, 256 * KiB, 4, 32,
|
|
UNDEF, 0);
|
|
case 0x43:
|
|
return MakeX86CacheLevelInfo(2, CPU_FEATURE_CACHE_DATA, 512 * KiB, 4, 32,
|
|
UNDEF, 0);
|
|
case 0x44:
|
|
return MakeX86CacheLevelInfo(2, CPU_FEATURE_CACHE_DATA, 1 * MiB, 4, 32,
|
|
UNDEF, 0);
|
|
case 0x45:
|
|
return MakeX86CacheLevelInfo(2, CPU_FEATURE_CACHE_DATA, 2 * MiB, 4, 32,
|
|
UNDEF, 0);
|
|
case 0x46:
|
|
return MakeX86CacheLevelInfo(3, CPU_FEATURE_CACHE_DATA, 4 * MiB, 4, 64,
|
|
UNDEF, 0);
|
|
case 0x47:
|
|
return MakeX86CacheLevelInfo(3, CPU_FEATURE_CACHE_DATA, 8 * MiB, 8, 64,
|
|
UNDEF, 0);
|
|
case 0x48:
|
|
return MakeX86CacheLevelInfo(2, CPU_FEATURE_CACHE_DATA, 3 * MiB, 12, 64,
|
|
UNDEF, 0);
|
|
case 0x49:
|
|
return MakeX86CacheLevelInfo(2, CPU_FEATURE_CACHE_DATA, 4 * MiB, 16, 64,
|
|
UNDEF, 0);
|
|
case (0x49 | (1 << 8)):
|
|
return MakeX86CacheLevelInfo(3, CPU_FEATURE_CACHE_DATA, 4 * MiB, 16, 64,
|
|
UNDEF, 0);
|
|
case 0x4A:
|
|
return MakeX86CacheLevelInfo(3, CPU_FEATURE_CACHE_DATA, 6 * MiB, 12, 64,
|
|
UNDEF, 0);
|
|
case 0x4B:
|
|
return MakeX86CacheLevelInfo(3, CPU_FEATURE_CACHE_DATA, 8 * MiB, 16, 64,
|
|
UNDEF, 0);
|
|
case 0x4C:
|
|
return MakeX86CacheLevelInfo(3, CPU_FEATURE_CACHE_DATA, 12 * MiB, 12, 64,
|
|
UNDEF, 0);
|
|
case 0x4D:
|
|
return MakeX86CacheLevelInfo(3, CPU_FEATURE_CACHE_DATA, 16 * MiB, 16, 64,
|
|
UNDEF, 0);
|
|
case 0x4E:
|
|
return MakeX86CacheLevelInfo(2, CPU_FEATURE_CACHE_DATA, 6 * MiB, 24, 64,
|
|
UNDEF, 0);
|
|
case 0x4F:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 4 * KiB, UNDEF,
|
|
UNDEF, 32, 0);
|
|
case 0x50:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 4 * KiB, UNDEF,
|
|
UNDEF, 64, 0);
|
|
case 0x51:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 4 * KiB, UNDEF,
|
|
UNDEF, 128, 0);
|
|
case 0x52:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 4 * KiB, UNDEF,
|
|
UNDEF, 256, 0);
|
|
case 0x55:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 2 * MiB, 0xFF,
|
|
UNDEF, 7, 0);
|
|
case 0x56:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 4 * MiB, 4,
|
|
UNDEF, 16, 0);
|
|
case 0x57:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 4 * KiB, 4,
|
|
UNDEF, 16, 0);
|
|
case 0x59:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 4 * KiB, 0xFF,
|
|
UNDEF, 16, 0);
|
|
case 0x5A:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 2 * MiB, 4,
|
|
UNDEF, 32, 0);
|
|
case 0x5B:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 4 * KiB, UNDEF,
|
|
UNDEF, 64, 0);
|
|
case 0x5C:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 4 * KiB, UNDEF,
|
|
UNDEF, 128, 0);
|
|
case 0x5D:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 4, UNDEF,
|
|
UNDEF, 256, 0);
|
|
case 0x60:
|
|
return MakeX86CacheLevelInfo(1, CPU_FEATURE_CACHE_DATA, 16 * KiB, 8, 64,
|
|
UNDEF, 0);
|
|
case 0x61:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 4 * KiB, 0xFF,
|
|
UNDEF, 48, 0);
|
|
case 0x63:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 2 * MiB, 4,
|
|
UNDEF, 4, 0);
|
|
case 0x66:
|
|
return MakeX86CacheLevelInfo(1, CPU_FEATURE_CACHE_DATA, 8 * KiB, 4, 64,
|
|
UNDEF, 0);
|
|
case 0x67:
|
|
return MakeX86CacheLevelInfo(1, CPU_FEATURE_CACHE_DATA, 16 * KiB, 4, 64,
|
|
UNDEF, 0);
|
|
case 0x68:
|
|
return MakeX86CacheLevelInfo(1, CPU_FEATURE_CACHE_DATA, 32 * KiB, 4, 64,
|
|
UNDEF, 0);
|
|
case 0x70:
|
|
return MakeX86CacheLevelInfo(1, CPU_FEATURE_CACHE_INSTRUCTION, 12 * KiB,
|
|
8, UNDEF, UNDEF, 0);
|
|
case 0x71:
|
|
return MakeX86CacheLevelInfo(1, CPU_FEATURE_CACHE_INSTRUCTION, 16 * KiB,
|
|
8, UNDEF, UNDEF, 0);
|
|
case 0x72:
|
|
return MakeX86CacheLevelInfo(1, CPU_FEATURE_CACHE_INSTRUCTION, 32 * KiB,
|
|
8, UNDEF, UNDEF, 0);
|
|
case 0x76:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 2 * MiB, 0xFF,
|
|
UNDEF, 8, 0);
|
|
case 0x78:
|
|
return MakeX86CacheLevelInfo(2, CPU_FEATURE_CACHE_DATA, 1 * MiB, 4, 64,
|
|
UNDEF, 0);
|
|
case 0x79:
|
|
return MakeX86CacheLevelInfo(2, CPU_FEATURE_CACHE_DATA, 128 * KiB, 8, 64,
|
|
UNDEF, 2);
|
|
case 0x7A:
|
|
return MakeX86CacheLevelInfo(2, CPU_FEATURE_CACHE_DATA, 256 * KiB, 8, 64,
|
|
UNDEF, 2);
|
|
case 0x7B:
|
|
return MakeX86CacheLevelInfo(2, CPU_FEATURE_CACHE_DATA, 512 * KiB, 8, 64,
|
|
UNDEF, 2);
|
|
case 0x7C:
|
|
return MakeX86CacheLevelInfo(2, CPU_FEATURE_CACHE_DATA, 1 * MiB, 8, 64,
|
|
UNDEF, 2);
|
|
case 0x7D:
|
|
return MakeX86CacheLevelInfo(2, CPU_FEATURE_CACHE_DATA, 2 * MiB, 8, 64,
|
|
UNDEF, 0);
|
|
case 0x7F:
|
|
return MakeX86CacheLevelInfo(2, CPU_FEATURE_CACHE_DATA, 512 * KiB, 2, 64,
|
|
UNDEF, 0);
|
|
case 0x80:
|
|
return MakeX86CacheLevelInfo(2, CPU_FEATURE_CACHE_DATA, 512 * KiB, 8, 64,
|
|
UNDEF, 0);
|
|
case 0x82:
|
|
return MakeX86CacheLevelInfo(2, CPU_FEATURE_CACHE_DATA, 256 * KiB, 8, 32,
|
|
UNDEF, 0);
|
|
case 0x83:
|
|
return MakeX86CacheLevelInfo(2, CPU_FEATURE_CACHE_DATA, 512 * KiB, 8, 32,
|
|
UNDEF, 0);
|
|
case 0x84:
|
|
return MakeX86CacheLevelInfo(2, CPU_FEATURE_CACHE_DATA, 1 * MiB, 8, 32,
|
|
UNDEF, 0);
|
|
case 0x85:
|
|
return MakeX86CacheLevelInfo(2, CPU_FEATURE_CACHE_DATA, 2 * MiB, 8, 32,
|
|
UNDEF, 0);
|
|
case 0x86:
|
|
return MakeX86CacheLevelInfo(2, CPU_FEATURE_CACHE_DATA, 512 * KiB, 4, 32,
|
|
UNDEF, 0);
|
|
case 0x87:
|
|
return MakeX86CacheLevelInfo(2, CPU_FEATURE_CACHE_DATA, 1 * MiB, 8, 64,
|
|
UNDEF, 0);
|
|
case 0xA0:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_DTLB, 4 * KiB, 0xFF,
|
|
UNDEF, 32, 0);
|
|
case 0xB0:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 4 * KiB, 4,
|
|
UNDEF, 128, 0);
|
|
case 0xB1:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 2 * MiB, 4,
|
|
UNDEF, 8, 0);
|
|
case 0xB2:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 4 * KiB, 4,
|
|
UNDEF, 64, 0);
|
|
case 0xB3:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 4 * KiB, 4,
|
|
UNDEF, 128, 0);
|
|
case 0xB4:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 4 * KiB, 4,
|
|
UNDEF, 256, 0);
|
|
case 0xB5:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 4 * KiB, 8,
|
|
UNDEF, 64, 0);
|
|
case 0xB6:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 4 * KiB, 8,
|
|
UNDEF, 128, 0);
|
|
case 0xBA:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 4 * KiB, 4,
|
|
UNDEF, 64, 0);
|
|
case 0xC0:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_TLB, 4 * KiB, 4,
|
|
UNDEF, 8, 0);
|
|
case 0xC1:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_STLB, 4 * KiB, 8,
|
|
UNDEF, 1024, 0);
|
|
case 0xC2:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_DTLB, 4 * KiB, 4,
|
|
UNDEF, 16, 0);
|
|
case 0xC3:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_STLB, 4 * KiB, 6,
|
|
UNDEF, 1536, 0);
|
|
case 0xCA:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_STLB, 4 * KiB, 4,
|
|
UNDEF, 512, 0);
|
|
case 0xD0:
|
|
return MakeX86CacheLevelInfo(3, CPU_FEATURE_CACHE_DATA, 512 * KiB, 4, 64,
|
|
UNDEF, 0);
|
|
case 0xD1:
|
|
return MakeX86CacheLevelInfo(3, CPU_FEATURE_CACHE_DATA, 1 * MiB, 4, 64,
|
|
UNDEF, 0);
|
|
case 0xD2:
|
|
return MakeX86CacheLevelInfo(3, CPU_FEATURE_CACHE_DATA, 2 * MiB, 4, 64,
|
|
UNDEF, 0);
|
|
case 0xD6:
|
|
return MakeX86CacheLevelInfo(3, CPU_FEATURE_CACHE_DATA, 1 * MiB, 8, 64,
|
|
UNDEF, 0);
|
|
case 0xD7:
|
|
return MakeX86CacheLevelInfo(3, CPU_FEATURE_CACHE_DATA, 2 * MiB, 8, 64,
|
|
UNDEF, 0);
|
|
case 0xD8:
|
|
return MakeX86CacheLevelInfo(3, CPU_FEATURE_CACHE_DATA, 4 * MiB, 8, 64,
|
|
UNDEF, 0);
|
|
case 0xDC:
|
|
return MakeX86CacheLevelInfo(3, CPU_FEATURE_CACHE_DATA, 1 * 1536 * KiB,
|
|
12, 64, UNDEF, 0);
|
|
case 0xDD:
|
|
return MakeX86CacheLevelInfo(3, CPU_FEATURE_CACHE_DATA, 3 * MiB, 12, 64,
|
|
UNDEF, 0);
|
|
case 0xDE:
|
|
return MakeX86CacheLevelInfo(3, CPU_FEATURE_CACHE_DATA, 6 * MiB, 12, 64,
|
|
UNDEF, 0);
|
|
case 0xE2:
|
|
return MakeX86CacheLevelInfo(3, CPU_FEATURE_CACHE_DATA, 2 * MiB, 16, 64,
|
|
UNDEF, 0);
|
|
case 0xE3:
|
|
return MakeX86CacheLevelInfo(3, CPU_FEATURE_CACHE_DATA, 4 * MiB, 16, 64,
|
|
UNDEF, 0);
|
|
case 0xE4:
|
|
return MakeX86CacheLevelInfo(3, CPU_FEATURE_CACHE_DATA, 8 * MiB, 16, 64,
|
|
UNDEF, 0);
|
|
case 0xEA:
|
|
return MakeX86CacheLevelInfo(3, CPU_FEATURE_CACHE_DATA, 12 * MiB, 24, 64,
|
|
UNDEF, 0);
|
|
case 0xEB:
|
|
return MakeX86CacheLevelInfo(3, CPU_FEATURE_CACHE_DATA, 18 * MiB, 24, 64,
|
|
UNDEF, 0);
|
|
case 0xEC:
|
|
return MakeX86CacheLevelInfo(3, CPU_FEATURE_CACHE_DATA, 24 * MiB, 24, 64,
|
|
UNDEF, 0);
|
|
case 0xF0:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_PREFETCH, 64 * KiB,
|
|
UNDEF, UNDEF, UNDEF, 0);
|
|
case 0xF1:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_PREFETCH, 128 * KiB,
|
|
UNDEF, UNDEF, UNDEF, 0);
|
|
case 0xFF:
|
|
return MakeX86CacheLevelInfo(UNDEF, CPU_FEATURE_CACHE_NULL, UNDEF, UNDEF,
|
|
UNDEF, UNDEF, 0);
|
|
default:
|
|
return kEmptyCacheLevelInfo;
|
|
}
|
|
}
|
|
|
|
static void GetByteArrayFromRegister(uint32_t result[4], const uint32_t reg) {
|
|
for (int i = 0; i < 4; ++i) {
|
|
result[i] = ExtractBitRange(reg, (i + 1) * 8, i * 8);
|
|
}
|
|
}
|
|
|
|
static void ParseLeaf2(const int max_cpuid_leaf, CacheInfo* info) {
|
|
Leaf leaf = SafeCpuId(max_cpuid_leaf, 2);
|
|
uint32_t registers[] = {leaf.eax, leaf.ebx, leaf.ecx, leaf.edx};
|
|
for (int i = 0; i < 4; ++i) {
|
|
if (registers[i] & (1 << 31)) {
|
|
continue; // register does not contains valid information
|
|
}
|
|
uint32_t bytes[4];
|
|
GetByteArrayFromRegister(bytes, registers[i]);
|
|
for (int j = 0; j < 4; ++j) {
|
|
if (bytes[j] == 0xFF)
|
|
break; // leaf 4 should be used to fetch cache information
|
|
info->levels[info->size] = GetCacheLevelInfo(bytes[j]);
|
|
}
|
|
info->size++;
|
|
}
|
|
}
|
|
|
|
static void ParseLeaf4(const int max_cpuid_leaf, CacheInfo* info) {
|
|
info->size = 0;
|
|
for (int cache_id = 0; cache_id < CPU_FEATURES_MAX_CACHE_LEVEL; cache_id++) {
|
|
const Leaf leaf = SafeCpuIdEx(max_cpuid_leaf, 4, cache_id);
|
|
CacheType cache_type = ExtractBitRange(leaf.eax, 4, 0);
|
|
if (cache_type == CPU_FEATURE_CACHE_NULL) {
|
|
info->levels[cache_id] = kEmptyCacheLevelInfo;
|
|
continue;
|
|
}
|
|
int level = ExtractBitRange(leaf.eax, 7, 5);
|
|
int line_size = ExtractBitRange(leaf.ebx, 11, 0) + 1;
|
|
int partitioning = ExtractBitRange(leaf.ebx, 21, 12) + 1;
|
|
int ways = ExtractBitRange(leaf.ebx, 31, 22) + 1;
|
|
int entries = leaf.ecx + 1;
|
|
int cache_size = (ways * partitioning * line_size * (entries));
|
|
info->levels[cache_id] = MakeX86CacheLevelInfo(
|
|
level, cache_type, cache_size, ways, line_size, entries, partitioning);
|
|
info->size++;
|
|
}
|
|
}
|
|
|
|
// Reference https://en.wikipedia.org/wiki/CPUID.
|
|
static void ParseCpuId(const uint32_t max_cpuid_leaf, X86Info* info) {
|
|
const Leaf leaf_1 = SafeCpuId(max_cpuid_leaf, 1);
|
|
const Leaf leaf_7 = SafeCpuId(max_cpuid_leaf, 7);
|
|
|
|
const bool have_xsave = IsBitSet(leaf_1.ecx, 26);
|
|
const bool have_osxsave = IsBitSet(leaf_1.ecx, 27);
|
|
const uint32_t xcr0_eax = (have_xsave && have_osxsave) ? GetXCR0Eax() : 0;
|
|
const bool have_sse_os_support = HasXmmOsXSave(xcr0_eax);
|
|
const bool have_avx_os_support = HasYmmOsXSave(xcr0_eax);
|
|
const bool have_avx512_os_support = HasZmmOsXSave(xcr0_eax);
|
|
|
|
const uint32_t family = ExtractBitRange(leaf_1.eax, 11, 8);
|
|
const uint32_t extended_family = ExtractBitRange(leaf_1.eax, 27, 20);
|
|
const uint32_t model = ExtractBitRange(leaf_1.eax, 7, 4);
|
|
const uint32_t extended_model = ExtractBitRange(leaf_1.eax, 19, 16);
|
|
|
|
X86Features* const features = &info->features;
|
|
|
|
info->family = extended_family + family;
|
|
info->model = (extended_model << 4) + model;
|
|
info->stepping = ExtractBitRange(leaf_1.eax, 3, 0);
|
|
|
|
features->fpu = IsBitSet(leaf_1.edx, 0);
|
|
features->tsc = IsBitSet(leaf_1.edx, 4);
|
|
features->cx8 = IsBitSet(leaf_1.edx, 8);
|
|
features->clfsh = IsBitSet(leaf_1.edx, 19);
|
|
features->mmx = IsBitSet(leaf_1.edx, 23);
|
|
features->ss = IsBitSet(leaf_1.edx, 27);
|
|
features->pclmulqdq = IsBitSet(leaf_1.ecx, 1);
|
|
features->smx = IsBitSet(leaf_1.ecx, 6);
|
|
features->cx16 = IsBitSet(leaf_1.ecx, 13);
|
|
features->dca = IsBitSet(leaf_1.ecx, 18);
|
|
features->movbe = IsBitSet(leaf_1.ecx, 22);
|
|
features->popcnt = IsBitSet(leaf_1.ecx, 23);
|
|
features->aes = IsBitSet(leaf_1.ecx, 25);
|
|
features->f16c = IsBitSet(leaf_1.ecx, 29);
|
|
features->rdrnd = IsBitSet(leaf_1.ecx, 30);
|
|
features->sgx = IsBitSet(leaf_7.ebx, 2);
|
|
features->bmi1 = IsBitSet(leaf_7.ebx, 3);
|
|
features->hle = IsBitSet(leaf_7.ebx, 4);
|
|
features->bmi2 = IsBitSet(leaf_7.ebx, 8);
|
|
features->erms = IsBitSet(leaf_7.ebx, 9);
|
|
features->rtm = IsBitSet(leaf_7.ebx, 11);
|
|
features->rdseed = IsBitSet(leaf_7.ebx, 18);
|
|
features->clflushopt = IsBitSet(leaf_7.ebx, 23);
|
|
features->clwb = IsBitSet(leaf_7.ebx, 24);
|
|
features->sha = IsBitSet(leaf_7.ebx, 29);
|
|
features->vaes = IsBitSet(leaf_7.ecx, 9);
|
|
features->vpclmulqdq = IsBitSet(leaf_7.ecx, 10);
|
|
|
|
if (have_sse_os_support) {
|
|
features->sse = IsBitSet(leaf_1.edx, 25);
|
|
features->sse2 = IsBitSet(leaf_1.edx, 26);
|
|
features->sse3 = IsBitSet(leaf_1.ecx, 0);
|
|
features->ssse3 = IsBitSet(leaf_1.ecx, 9);
|
|
features->sse4_1 = IsBitSet(leaf_1.ecx, 19);
|
|
features->sse4_2 = IsBitSet(leaf_1.ecx, 20);
|
|
}
|
|
|
|
if (have_avx_os_support) {
|
|
features->fma3 = IsBitSet(leaf_1.ecx, 12);
|
|
features->avx = IsBitSet(leaf_1.ecx, 28);
|
|
features->avx2 = IsBitSet(leaf_7.ebx, 5);
|
|
}
|
|
|
|
if (have_avx512_os_support) {
|
|
features->avx512f = IsBitSet(leaf_7.ebx, 16);
|
|
features->avx512cd = IsBitSet(leaf_7.ebx, 28);
|
|
features->avx512er = IsBitSet(leaf_7.ebx, 27);
|
|
features->avx512pf = IsBitSet(leaf_7.ebx, 26);
|
|
features->avx512bw = IsBitSet(leaf_7.ebx, 30);
|
|
features->avx512dq = IsBitSet(leaf_7.ebx, 17);
|
|
features->avx512vl = IsBitSet(leaf_7.ebx, 31);
|
|
features->avx512ifma = IsBitSet(leaf_7.ebx, 21);
|
|
features->avx512vbmi = IsBitSet(leaf_7.ecx, 1);
|
|
features->avx512vbmi2 = IsBitSet(leaf_7.ecx, 6);
|
|
features->avx512vnni = IsBitSet(leaf_7.ecx, 11);
|
|
features->avx512bitalg = IsBitSet(leaf_7.ecx, 12);
|
|
features->avx512vpopcntdq = IsBitSet(leaf_7.ecx, 14);
|
|
features->avx512_4vnniw = IsBitSet(leaf_7.edx, 2);
|
|
features->avx512_4vbmi2 = IsBitSet(leaf_7.edx, 3);
|
|
}
|
|
}
|
|
|
|
static const X86Info kEmptyX86Info;
|
|
static const CacheInfo kEmptyCacheInfo;
|
|
|
|
X86Info GetX86Info(void) {
|
|
X86Info info = kEmptyX86Info;
|
|
const Leaf leaf_0 = CpuId(0);
|
|
const uint32_t max_cpuid_leaf = leaf_0.eax;
|
|
SetVendor(leaf_0, info.vendor);
|
|
if (IsVendor(leaf_0, "GenuineIntel") || IsVendor(leaf_0, "AuthenticAMD")) {
|
|
ParseCpuId(max_cpuid_leaf, &info);
|
|
}
|
|
return info;
|
|
}
|
|
|
|
CacheInfo GetX86CacheInfo(void) {
|
|
CacheInfo info = kEmptyCacheInfo;
|
|
const Leaf leaf_0 = CpuId(0);
|
|
const uint32_t max_cpuid_leaf = leaf_0.eax;
|
|
if (IsVendor(leaf_0, "GenuineIntel")) {
|
|
ParseLeaf2(max_cpuid_leaf, &info);
|
|
ParseLeaf4(max_cpuid_leaf, &info);
|
|
}
|
|
return info;
|
|
}
|
|
|
|
#define CPUID(FAMILY, MODEL) ((((FAMILY)&0xFF) << 8) | ((MODEL)&0xFF))
|
|
|
|
X86Microarchitecture GetX86Microarchitecture(const X86Info* info) {
|
|
if (memcmp(info->vendor, "GenuineIntel", sizeof(info->vendor)) == 0) {
|
|
switch (CPUID(info->family, info->model)) {
|
|
case CPUID(0x06, 0x35):
|
|
case CPUID(0x06, 0x36):
|
|
// https://en.wikipedia.org/wiki/Bonnell_(microarchitecture)
|
|
return INTEL_ATOM_BNL;
|
|
case CPUID(0x06, 0x37):
|
|
case CPUID(0x06, 0x4C):
|
|
// https://en.wikipedia.org/wiki/Silvermont
|
|
return INTEL_ATOM_SMT;
|
|
case CPUID(0x06, 0x5C):
|
|
// https://en.wikipedia.org/wiki/Goldmont
|
|
return INTEL_ATOM_GMT;
|
|
case CPUID(0x06, 0x0F):
|
|
case CPUID(0x06, 0x16):
|
|
// https://en.wikipedia.org/wiki/Intel_Core_(microarchitecture)
|
|
return INTEL_CORE;
|
|
case CPUID(0x06, 0x17):
|
|
case CPUID(0x06, 0x1D):
|
|
// https://en.wikipedia.org/wiki/Penryn_(microarchitecture)
|
|
return INTEL_PNR;
|
|
case CPUID(0x06, 0x1A):
|
|
case CPUID(0x06, 0x1E):
|
|
case CPUID(0x06, 0x1F):
|
|
case CPUID(0x06, 0x2E):
|
|
// https://en.wikipedia.org/wiki/Nehalem_(microarchitecture)
|
|
return INTEL_NHM;
|
|
case CPUID(0x06, 0x25):
|
|
case CPUID(0x06, 0x2C):
|
|
case CPUID(0x06, 0x2F):
|
|
// https://en.wikipedia.org/wiki/Westmere_(microarchitecture)
|
|
return INTEL_WSM;
|
|
case CPUID(0x06, 0x2A):
|
|
case CPUID(0x06, 0x2D):
|
|
// https://en.wikipedia.org/wiki/Sandy_Bridge#Models_and_steppings
|
|
return INTEL_SNB;
|
|
case CPUID(0x06, 0x3A):
|
|
case CPUID(0x06, 0x3E):
|
|
// https://en.wikipedia.org/wiki/Ivy_Bridge_(microarchitecture)#Models_and_steppings
|
|
return INTEL_IVB;
|
|
case CPUID(0x06, 0x3C):
|
|
case CPUID(0x06, 0x3F):
|
|
case CPUID(0x06, 0x45):
|
|
case CPUID(0x06, 0x46):
|
|
// https://en.wikipedia.org/wiki/Haswell_(microarchitecture)
|
|
return INTEL_HSW;
|
|
case CPUID(0x06, 0x3D):
|
|
case CPUID(0x06, 0x47):
|
|
case CPUID(0x06, 0x4F):
|
|
case CPUID(0x06, 0x56):
|
|
// https://en.wikipedia.org/wiki/Broadwell_(microarchitecture)
|
|
return INTEL_BDW;
|
|
case CPUID(0x06, 0x4E):
|
|
case CPUID(0x06, 0x55):
|
|
case CPUID(0x06, 0x5E):
|
|
// https://en.wikipedia.org/wiki/Skylake_(microarchitecture)
|
|
return INTEL_SKL;
|
|
case CPUID(0x06, 0x8E):
|
|
case CPUID(0x06, 0x9E):
|
|
// https://en.wikipedia.org/wiki/Kaby_Lake
|
|
return INTEL_KBL;
|
|
default:
|
|
return X86_UNKNOWN;
|
|
}
|
|
}
|
|
if (memcmp(info->vendor, "AuthenticAMD", sizeof(info->vendor)) == 0) {
|
|
switch (info->family) {
|
|
// https://en.wikipedia.org/wiki/List_of_AMD_CPU_microarchitectures
|
|
case 0x0F:
|
|
return AMD_HAMMER;
|
|
case 0x10:
|
|
return AMD_K10;
|
|
case 0x14:
|
|
return AMD_BOBCAT;
|
|
case 0x15:
|
|
return AMD_BULLDOZER;
|
|
case 0x16:
|
|
return AMD_JAGUAR;
|
|
case 0x17:
|
|
return AMD_ZEN;
|
|
default:
|
|
return X86_UNKNOWN;
|
|
}
|
|
}
|
|
return X86_UNKNOWN;
|
|
}
|
|
|
|
static void SetString(const uint32_t max_cpuid_ext_leaf, const uint32_t leaf_id,
|
|
char* buffer) {
|
|
const Leaf leaf = SafeCpuId(max_cpuid_ext_leaf, leaf_id);
|
|
// We allow calling memcpy from SetString which is only called when requesting
|
|
// X86BrandString.
|
|
memcpy(buffer, &leaf, sizeof(Leaf));
|
|
}
|
|
|
|
void FillX86BrandString(char brand_string[49]) {
|
|
const Leaf leaf_ext_0 = CpuId(0x80000000);
|
|
const uint32_t max_cpuid_leaf_ext = leaf_ext_0.eax;
|
|
SetString(max_cpuid_leaf_ext, 0x80000002, brand_string);
|
|
SetString(max_cpuid_leaf_ext, 0x80000003, brand_string + 16);
|
|
SetString(max_cpuid_leaf_ext, 0x80000004, brand_string + 32);
|
|
brand_string[48] = '\0';
|
|
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
// Introspection functions
|
|
|
|
int GetX86FeaturesEnumValue(const X86Features* features,
|
|
X86FeaturesEnum value) {
|
|
switch (value) {
|
|
case X86_FPU:
|
|
return features->fpu;
|
|
case X86_TSC:
|
|
return features->tsc;
|
|
case X86_CX8:
|
|
return features->cx8;
|
|
case X86_CLFSH:
|
|
return features->clfsh;
|
|
case X86_MMX:
|
|
return features->mmx;
|
|
case X86_AES:
|
|
return features->aes;
|
|
case X86_ERMS:
|
|
return features->erms;
|
|
case X86_F16C:
|
|
return features->f16c;
|
|
case X86_FMA3:
|
|
return features->fma3;
|
|
case X86_VAES:
|
|
return features->vaes;
|
|
case X86_VPCLMULQDQ:
|
|
return features->vpclmulqdq;
|
|
case X86_BMI1:
|
|
return features->bmi1;
|
|
case X86_HLE:
|
|
return features->hle;
|
|
case X86_BMI2:
|
|
return features->bmi2;
|
|
case X86_RTM:
|
|
return features->rtm;
|
|
case X86_RDSEED:
|
|
return features->rdseed;
|
|
case X86_CLFLUSHOPT:
|
|
return features->clflushopt;
|
|
case X86_CLWB:
|
|
return features->clwb;
|
|
case X86_SSE:
|
|
return features->sse;
|
|
case X86_SSE2:
|
|
return features->sse2;
|
|
case X86_SSE3:
|
|
return features->sse3;
|
|
case X86_SSSE3:
|
|
return features->ssse3;
|
|
case X86_SSE4_1:
|
|
return features->sse4_1;
|
|
case X86_SSE4_2:
|
|
return features->sse4_2;
|
|
case X86_AVX:
|
|
return features->avx;
|
|
case X86_AVX2:
|
|
return features->avx2;
|
|
case X86_AVX512F:
|
|
return features->avx512f;
|
|
case X86_AVX512CD:
|
|
return features->avx512cd;
|
|
case X86_AVX512ER:
|
|
return features->avx512er;
|
|
case X86_AVX512PF:
|
|
return features->avx512pf;
|
|
case X86_AVX512BW:
|
|
return features->avx512bw;
|
|
case X86_AVX512DQ:
|
|
return features->avx512dq;
|
|
case X86_AVX512VL:
|
|
return features->avx512vl;
|
|
case X86_AVX512IFMA:
|
|
return features->avx512ifma;
|
|
case X86_AVX512VBMI:
|
|
return features->avx512vbmi;
|
|
case X86_AVX512VBMI2:
|
|
return features->avx512vbmi2;
|
|
case X86_AVX512VNNI:
|
|
return features->avx512vnni;
|
|
case X86_AVX512BITALG:
|
|
return features->avx512bitalg;
|
|
case X86_AVX512VPOPCNTDQ:
|
|
return features->avx512vpopcntdq;
|
|
case X86_AVX512_4VNNIW:
|
|
return features->avx512_4vnniw;
|
|
case X86_AVX512_4VBMI2:
|
|
return features->avx512_4vbmi2;
|
|
case X86_PCLMULQDQ:
|
|
return features->pclmulqdq;
|
|
case X86_SMX:
|
|
return features->smx;
|
|
case X86_SGX:
|
|
return features->sgx;
|
|
case X86_CX16:
|
|
return features->cx16;
|
|
case X86_SHA:
|
|
return features->sha;
|
|
case X86_POPCNT:
|
|
return features->popcnt;
|
|
case X86_MOVBE:
|
|
return features->movbe;
|
|
case X86_RDRND:
|
|
return features->rdrnd;
|
|
case X86_DCA:
|
|
return features->dca;
|
|
case X86_SS:
|
|
return features->ss;
|
|
case X86_LAST_:
|
|
break;
|
|
}
|
|
return false;
|
|
}
|
|
|
|
const char* GetX86FeaturesEnumName(X86FeaturesEnum value) {
|
|
switch (value) {
|
|
case X86_FPU:
|
|
return "fpu";
|
|
case X86_TSC:
|
|
return "tsc";
|
|
case X86_CX8:
|
|
return "cx8";
|
|
case X86_CLFSH:
|
|
return "clfsh";
|
|
case X86_MMX:
|
|
return "mmx";
|
|
case X86_AES:
|
|
return "aes";
|
|
case X86_ERMS:
|
|
return "erms";
|
|
case X86_F16C:
|
|
return "f16c";
|
|
case X86_FMA3:
|
|
return "fma3";
|
|
case X86_VAES:
|
|
return "vaes";
|
|
case X86_VPCLMULQDQ:
|
|
return "vpclmulqdq";
|
|
case X86_BMI1:
|
|
return "bmi1";
|
|
case X86_HLE:
|
|
return "hle";
|
|
case X86_BMI2:
|
|
return "bmi2";
|
|
case X86_RTM:
|
|
return "rtm";
|
|
case X86_RDSEED:
|
|
return "rdseed";
|
|
case X86_CLFLUSHOPT:
|
|
return "clflushopt";
|
|
case X86_CLWB:
|
|
return "clwb";
|
|
case X86_SSE:
|
|
return "sse";
|
|
case X86_SSE2:
|
|
return "sse2";
|
|
case X86_SSE3:
|
|
return "sse3";
|
|
case X86_SSSE3:
|
|
return "ssse3";
|
|
case X86_SSE4_1:
|
|
return "sse4_1";
|
|
case X86_SSE4_2:
|
|
return "sse4_2";
|
|
case X86_AVX:
|
|
return "avx";
|
|
case X86_AVX2:
|
|
return "avx2";
|
|
case X86_AVX512F:
|
|
return "avx512f";
|
|
case X86_AVX512CD:
|
|
return "avx512cd";
|
|
case X86_AVX512ER:
|
|
return "avx512er";
|
|
case X86_AVX512PF:
|
|
return "avx512pf";
|
|
case X86_AVX512BW:
|
|
return "avx512bw";
|
|
case X86_AVX512DQ:
|
|
return "avx512dq";
|
|
case X86_AVX512VL:
|
|
return "avx512vl";
|
|
case X86_AVX512IFMA:
|
|
return "avx512ifma";
|
|
case X86_AVX512VBMI:
|
|
return "avx512vbmi";
|
|
case X86_AVX512VBMI2:
|
|
return "avx512vbmi2";
|
|
case X86_AVX512VNNI:
|
|
return "avx512vnni";
|
|
case X86_AVX512BITALG:
|
|
return "avx512bitalg";
|
|
case X86_AVX512VPOPCNTDQ:
|
|
return "avx512vpopcntdq";
|
|
case X86_AVX512_4VNNIW:
|
|
return "avx512_4vnniw";
|
|
case X86_AVX512_4VBMI2:
|
|
return "avx512_4vbmi2";
|
|
case X86_PCLMULQDQ:
|
|
return "pclmulqdq";
|
|
case X86_SMX:
|
|
return "smx";
|
|
case X86_SGX:
|
|
return "sgx";
|
|
case X86_CX16:
|
|
return "cx16";
|
|
case X86_SHA:
|
|
return "sha";
|
|
case X86_POPCNT:
|
|
return "popcnt";
|
|
case X86_MOVBE:
|
|
return "movbe";
|
|
case X86_RDRND:
|
|
return "rdrnd";
|
|
case X86_DCA:
|
|
return "dca";
|
|
case X86_SS:
|
|
return "ss";
|
|
case X86_LAST_:
|
|
break;
|
|
}
|
|
return "unknown_feature";
|
|
}
|
|
|
|
const char* GetX86MicroarchitectureName(X86Microarchitecture uarch) {
|
|
switch (uarch) {
|
|
case X86_UNKNOWN:
|
|
return "X86_UNKNOWN";
|
|
case INTEL_CORE:
|
|
return "INTEL_CORE";
|
|
case INTEL_PNR:
|
|
return "INTEL_PNR";
|
|
case INTEL_NHM:
|
|
return "INTEL_NHM";
|
|
case INTEL_ATOM_BNL:
|
|
return "INTEL_ATOM_BNL";
|
|
case INTEL_WSM:
|
|
return "INTEL_WSM";
|
|
case INTEL_SNB:
|
|
return "INTEL_SNB";
|
|
case INTEL_IVB:
|
|
return "INTEL_IVB";
|
|
case INTEL_ATOM_SMT:
|
|
return "INTEL_ATOM_SMT";
|
|
case INTEL_HSW:
|
|
return "INTEL_HSW";
|
|
case INTEL_BDW:
|
|
return "INTEL_BDW";
|
|
case INTEL_SKL:
|
|
return "INTEL_SKL";
|
|
case INTEL_ATOM_GMT:
|
|
return "INTEL_ATOM_GMT";
|
|
case INTEL_KBL:
|
|
return "INTEL_KBL";
|
|
case INTEL_CFL:
|
|
return "INTEL_CFL";
|
|
case INTEL_CNL:
|
|
return "INTEL_CNL";
|
|
case AMD_HAMMER:
|
|
return "AMD_HAMMER";
|
|
case AMD_K10:
|
|
return "AMD_K10";
|
|
case AMD_BOBCAT:
|
|
return "AMD_BOBCAT";
|
|
case AMD_BULLDOZER:
|
|
return "AMD_BULLDOZER";
|
|
case AMD_JAGUAR:
|
|
return "AMD_JAGUAR";
|
|
case AMD_ZEN:
|
|
return "AMD_ZEN";
|
|
}
|
|
return "unknown microarchitecture";
|
|
}
|