|  | // Copyright (c) 2012 The Chromium Authors. All rights reserved. | 
|  | // Use of this source code is governed by a BSD-style license that can be | 
|  | // found in the LICENSE file. | 
|  |  | 
|  | #include "base/cpu.h" | 
|  |  | 
|  | #include <stdlib.h> | 
|  | #include <string.h> | 
|  |  | 
|  | #include <algorithm> | 
|  |  | 
|  | #include "base/basictypes.h" | 
|  | #include "base/strings/string_piece.h" | 
|  | #include "build/build_config.h" | 
|  |  | 
|  | #if defined(ARCH_CPU_ARM_FAMILY) && (defined(OS_ANDROID) || defined(OS_LINUX)) | 
|  | #include "base/files/file_util.h" | 
|  | #include "base/lazy_instance.h" | 
|  | #endif | 
|  |  | 
|  | #if defined(ARCH_CPU_X86_FAMILY) | 
|  | #if defined(_MSC_VER) | 
|  | #include <intrin.h> | 
|  | #include <immintrin.h>  // For _xgetbv() | 
|  | #endif | 
|  | #endif | 
|  |  | 
|  | namespace base { | 
|  |  | 
|  | CPU::CPU() | 
|  | : signature_(0), | 
|  | type_(0), | 
|  | family_(0), | 
|  | model_(0), | 
|  | stepping_(0), | 
|  | ext_model_(0), | 
|  | ext_family_(0), | 
|  | has_mmx_(false), | 
|  | has_sse_(false), | 
|  | has_sse2_(false), | 
|  | has_sse3_(false), | 
|  | has_ssse3_(false), | 
|  | has_sse41_(false), | 
|  | has_sse42_(false), | 
|  | has_avx_(false), | 
|  | has_avx_hardware_(false), | 
|  | has_aesni_(false), | 
|  | has_non_stop_time_stamp_counter_(false), | 
|  | has_broken_neon_(false), | 
|  | cpu_vendor_("unknown") { | 
|  | Initialize(); | 
|  | } | 
|  |  | 
|  | namespace { | 
|  |  | 
|  | #if defined(ARCH_CPU_X86_FAMILY) | 
|  | #ifndef _MSC_VER | 
|  |  | 
|  | #if defined(__pic__) && defined(__i386__) | 
|  |  | 
|  | void __cpuid(int cpu_info[4], int info_type) { | 
|  | __asm__ volatile ( | 
|  | "mov %%ebx, %%edi\n" | 
|  | "cpuid\n" | 
|  | "xchg %%edi, %%ebx\n" | 
|  | : "=a"(cpu_info[0]), "=D"(cpu_info[1]), "=c"(cpu_info[2]), "=d"(cpu_info[3]) | 
|  | : "a"(info_type) | 
|  | ); | 
|  | } | 
|  |  | 
|  | #else | 
|  |  | 
|  | void __cpuid(int cpu_info[4], int info_type) { | 
|  | __asm__ volatile ( | 
|  | "cpuid \n\t" | 
|  | : "=a"(cpu_info[0]), "=b"(cpu_info[1]), "=c"(cpu_info[2]), "=d"(cpu_info[3]) | 
|  | : "a"(info_type) | 
|  | ); | 
|  | } | 
|  |  | 
|  | #endif | 
|  |  | 
|  | // _xgetbv returns the value of an Intel Extended Control Register (XCR). | 
|  | // Currently only XCR0 is defined by Intel so |xcr| should always be zero. | 
|  | uint64 _xgetbv(uint32 xcr) { | 
|  | uint32 eax, edx; | 
|  |  | 
|  | __asm__ volatile ("xgetbv" : "=a" (eax), "=d" (edx) : "c" (xcr)); | 
|  | return (static_cast<uint64>(edx) << 32) | eax; | 
|  | } | 
|  |  | 
|  | #endif  // !_MSC_VER | 
|  | #endif  // ARCH_CPU_X86_FAMILY | 
|  |  | 
|  | #if defined(ARCH_CPU_ARM_FAMILY) && (defined(OS_ANDROID) || defined(OS_LINUX)) | 
|  | class LazyCpuInfoValue { | 
|  | public: | 
|  | LazyCpuInfoValue() : has_broken_neon_(false) { | 
|  | // This function finds the value from /proc/cpuinfo under the key "model | 
|  | // name" or "Processor". "model name" is used in Linux 3.8 and later (3.7 | 
|  | // and later for arm64) and is shown once per CPU. "Processor" is used in | 
|  | // earler versions and is shown only once at the top of /proc/cpuinfo | 
|  | // regardless of the number CPUs. | 
|  | const char kModelNamePrefix[] = "model name\t: "; | 
|  | const char kProcessorPrefix[] = "Processor\t: "; | 
|  |  | 
|  | // This function also calculates whether we believe that this CPU has a | 
|  | // broken NEON unit based on these fields from cpuinfo: | 
|  | unsigned implementer = 0, architecture = 0, variant = 0, part = 0, | 
|  | revision = 0; | 
|  | const struct { | 
|  | const char key[17]; | 
|  | unsigned *result; | 
|  | } kUnsignedValues[] = { | 
|  | {"CPU implementer", &implementer}, | 
|  | {"CPU architecture", &architecture}, | 
|  | {"CPU variant", &variant}, | 
|  | {"CPU part", &part}, | 
|  | {"CPU revision", &revision}, | 
|  | }; | 
|  |  | 
|  | std::string contents; | 
|  | ReadFileToString(FilePath("/proc/cpuinfo"), &contents); | 
|  | DCHECK(!contents.empty()); | 
|  | if (contents.empty()) { | 
|  | return; | 
|  | } | 
|  |  | 
|  | std::istringstream iss(contents); | 
|  | std::string line; | 
|  | while (std::getline(iss, line)) { | 
|  | if (brand_.empty() && | 
|  | (line.compare(0, strlen(kModelNamePrefix), kModelNamePrefix) == 0 || | 
|  | line.compare(0, strlen(kProcessorPrefix), kProcessorPrefix) == 0)) { | 
|  | brand_.assign(line.substr(strlen(kModelNamePrefix))); | 
|  | } | 
|  |  | 
|  | for (size_t i = 0; i < arraysize(kUnsignedValues); i++) { | 
|  | const char *key = kUnsignedValues[i].key; | 
|  | const size_t len = strlen(key); | 
|  |  | 
|  | if (line.compare(0, len, key) == 0 && | 
|  | line.size() >= len + 1 && | 
|  | (line[len] == '\t' || line[len] == ' ' || line[len] == ':')) { | 
|  | size_t colon_pos = line.find(':', len); | 
|  | if (colon_pos == std::string::npos) { | 
|  | continue; | 
|  | } | 
|  |  | 
|  | const StringPiece line_sp(line); | 
|  | StringPiece value_sp = line_sp.substr(colon_pos + 1); | 
|  | while (!value_sp.empty() && | 
|  | (value_sp[0] == ' ' || value_sp[0] == '\t')) { | 
|  | value_sp = value_sp.substr(1); | 
|  | } | 
|  |  | 
|  | // The string may have leading "0x" or not, so we use strtoul to | 
|  | // handle that. | 
|  | char *endptr; | 
|  | std::string value(value_sp.as_string()); | 
|  | unsigned long int result = strtoul(value.c_str(), &endptr, 0); | 
|  | if (*endptr == 0 && result <= UINT_MAX) { | 
|  | *kUnsignedValues[i].result = result; | 
|  | } | 
|  | } | 
|  | } | 
|  | } | 
|  |  | 
|  | has_broken_neon_ = | 
|  | implementer == 0x51 && | 
|  | architecture == 7 && | 
|  | variant == 1 && | 
|  | part == 0x4d && | 
|  | revision == 0; | 
|  | } | 
|  |  | 
|  | const std::string& brand() const { return brand_; } | 
|  | bool has_broken_neon() const { return has_broken_neon_; } | 
|  |  | 
|  | private: | 
|  | std::string brand_; | 
|  | bool has_broken_neon_; | 
|  | DISALLOW_COPY_AND_ASSIGN(LazyCpuInfoValue); | 
|  | }; | 
|  |  | 
|  | base::LazyInstance<LazyCpuInfoValue>::Leaky g_lazy_cpuinfo = | 
|  | LAZY_INSTANCE_INITIALIZER; | 
|  |  | 
|  | #endif  // defined(ARCH_CPU_ARM_FAMILY) && (defined(OS_ANDROID) || | 
|  | // defined(OS_LINUX)) | 
|  |  | 
|  | }  // anonymous namespace | 
|  |  | 
|  | void CPU::Initialize() { | 
|  | #if defined(ARCH_CPU_X86_FAMILY) | 
|  | int cpu_info[4] = {-1}; | 
|  | char cpu_string[48]; | 
|  |  | 
|  | // __cpuid with an InfoType argument of 0 returns the number of | 
|  | // valid Ids in CPUInfo[0] and the CPU identification string in | 
|  | // the other three array elements. The CPU identification string is | 
|  | // not in linear order. The code below arranges the information | 
|  | // in a human readable form. The human readable order is CPUInfo[1] | | 
|  | // CPUInfo[3] | CPUInfo[2]. CPUInfo[2] and CPUInfo[3] are swapped | 
|  | // before using memcpy to copy these three array elements to cpu_string. | 
|  | __cpuid(cpu_info, 0); | 
|  | int num_ids = cpu_info[0]; | 
|  | std::swap(cpu_info[2], cpu_info[3]); | 
|  | memcpy(cpu_string, &cpu_info[1], 3 * sizeof(cpu_info[1])); | 
|  | cpu_vendor_.assign(cpu_string, 3 * sizeof(cpu_info[1])); | 
|  |  | 
|  | // Interpret CPU feature information. | 
|  | if (num_ids > 0) { | 
|  | __cpuid(cpu_info, 1); | 
|  | signature_ = cpu_info[0]; | 
|  | stepping_ = cpu_info[0] & 0xf; | 
|  | model_ = ((cpu_info[0] >> 4) & 0xf) + ((cpu_info[0] >> 12) & 0xf0); | 
|  | family_ = (cpu_info[0] >> 8) & 0xf; | 
|  | type_ = (cpu_info[0] >> 12) & 0x3; | 
|  | ext_model_ = (cpu_info[0] >> 16) & 0xf; | 
|  | ext_family_ = (cpu_info[0] >> 20) & 0xff; | 
|  | has_mmx_ =   (cpu_info[3] & 0x00800000) != 0; | 
|  | has_sse_ =   (cpu_info[3] & 0x02000000) != 0; | 
|  | has_sse2_ =  (cpu_info[3] & 0x04000000) != 0; | 
|  | has_sse3_ =  (cpu_info[2] & 0x00000001) != 0; | 
|  | has_ssse3_ = (cpu_info[2] & 0x00000200) != 0; | 
|  | has_sse41_ = (cpu_info[2] & 0x00080000) != 0; | 
|  | has_sse42_ = (cpu_info[2] & 0x00100000) != 0; | 
|  | has_avx_hardware_ = | 
|  | (cpu_info[2] & 0x10000000) != 0; | 
|  | // AVX instructions will generate an illegal instruction exception unless | 
|  | //   a) they are supported by the CPU, | 
|  | //   b) XSAVE is supported by the CPU and | 
|  | //   c) XSAVE is enabled by the kernel. | 
|  | // See http://software.intel.com/en-us/blogs/2011/04/14/is-avx-enabled | 
|  | // | 
|  | // In addition, we have observed some crashes with the xgetbv instruction | 
|  | // even after following Intel's example code. (See crbug.com/375968.) | 
|  | // Because of that, we also test the XSAVE bit because its description in | 
|  | // the CPUID documentation suggests that it signals xgetbv support. | 
|  | has_avx_ = | 
|  | has_avx_hardware_ && | 
|  | (cpu_info[2] & 0x04000000) != 0 /* XSAVE */ && | 
|  | (cpu_info[2] & 0x08000000) != 0 /* OSXSAVE */ && | 
|  | (_xgetbv(0) & 6) == 6 /* XSAVE enabled by kernel */; | 
|  | has_aesni_ = (cpu_info[2] & 0x02000000) != 0; | 
|  | } | 
|  |  | 
|  | // Get the brand string of the cpu. | 
|  | __cpuid(cpu_info, 0x80000000); | 
|  | const int parameter_end = 0x80000004; | 
|  | int max_parameter = cpu_info[0]; | 
|  |  | 
|  | if (cpu_info[0] >= parameter_end) { | 
|  | char* cpu_string_ptr = cpu_string; | 
|  |  | 
|  | for (int parameter = 0x80000002; parameter <= parameter_end && | 
|  | cpu_string_ptr < &cpu_string[sizeof(cpu_string)]; parameter++) { | 
|  | __cpuid(cpu_info, parameter); | 
|  | memcpy(cpu_string_ptr, cpu_info, sizeof(cpu_info)); | 
|  | cpu_string_ptr += sizeof(cpu_info); | 
|  | } | 
|  | cpu_brand_.assign(cpu_string, cpu_string_ptr - cpu_string); | 
|  | } | 
|  |  | 
|  | const int parameter_containing_non_stop_time_stamp_counter = 0x80000007; | 
|  | if (max_parameter >= parameter_containing_non_stop_time_stamp_counter) { | 
|  | __cpuid(cpu_info, parameter_containing_non_stop_time_stamp_counter); | 
|  | has_non_stop_time_stamp_counter_ = (cpu_info[3] & (1 << 8)) != 0; | 
|  | } | 
|  | #elif defined(ARCH_CPU_ARM_FAMILY) && (defined(OS_ANDROID) || defined(OS_LINUX)) | 
|  | cpu_brand_.assign(g_lazy_cpuinfo.Get().brand()); | 
|  | has_broken_neon_ = g_lazy_cpuinfo.Get().has_broken_neon(); | 
|  | #endif | 
|  | } | 
|  |  | 
|  | CPU::IntelMicroArchitecture CPU::GetIntelMicroArchitecture() const { | 
|  | if (has_avx()) return AVX; | 
|  | if (has_sse42()) return SSE42; | 
|  | if (has_sse41()) return SSE41; | 
|  | if (has_ssse3()) return SSSE3; | 
|  | if (has_sse3()) return SSE3; | 
|  | if (has_sse2()) return SSE2; | 
|  | if (has_sse()) return SSE; | 
|  | return PENTIUM; | 
|  | } | 
|  |  | 
|  | }  // namespace base |