| Index: src/cpu.cc
|
| diff --git a/src/cpu.cc b/src/cpu.cc
|
| new file mode 100644
|
| index 0000000000000000000000000000000000000000..d7c32dd88878d33467fb24a174699face2ece2c9
|
| --- /dev/null
|
| +++ b/src/cpu.cc
|
| @@ -0,0 +1,446 @@
|
| +// Copyright 2013 the V8 project authors. All rights reserved.
|
| +// Redistribution and use in source and binary forms, with or without
|
| +// modification, are permitted provided that the following conditions are
|
| +// met:
|
| +//
|
| +// * Redistributions of source code must retain the above copyright
|
| +// notice, this list of conditions and the following disclaimer.
|
| +// * Redistributions in binary form must reproduce the above
|
| +// copyright notice, this list of conditions and the following
|
| +// disclaimer in the documentation and/or other materials provided
|
| +// with the distribution.
|
| +// * Neither the name of Google Inc. nor the names of its
|
| +// contributors may be used to endorse or promote products derived
|
| +// from this software without specific prior written permission.
|
| +//
|
| +// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
| +// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
| +// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
| +// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
|
| +// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
|
| +// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
|
| +// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
|
| +// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
|
| +// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
| +// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
| +// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
| +
|
| +#include "cpu.h"
|
| +
|
| +#include <algorithm>
|
| +#include <cctype>
|
| +#include <cstdio>
|
| +#include <cstdlib>
|
| +#include <cstring>
|
| +
|
| +#include "checks.h"
|
| +
|
| +namespace v8 {
|
| +namespace internal {
|
| +
|
| +#if V8_HOST_ARCH_IA32 || V8_HOST_ARCH_X64
|
| +
|
| +#if V8_CC_MSVC
|
| +
|
| +#include <intrin.h> // NOLINT
|
| +
|
| +#elif defined(__i386__) && defined(__pic__)
|
| +
|
| +static V8_INLINE(void __cpuid(int cpu_info[4], int info_type)) {
|
| + __asm__ volatile (
|
| + "mov %%ebx, %%edi\n"
|
| + "cpuid\n"
|
| + "xchg %%edi, %%ebx\n"
|
| + : "=a"(cpu_info[0]), "=D"(cpu_info[1]), "=c"(cpu_info[2]), "=d"(cpu_info[3])
|
| + : "a"(info_type)
|
| + );
|
| +}
|
| +
|
| +#else // !V8_CC_MSVC || (!defined(__i386__) && !defined(__pic__))
|
| +
|
| +static void V8_INLINE(__cpuid(int cpu_info[4], int info_type)) {
|
| + __asm__ volatile (
|
| + "cpuid \n\t"
|
| + : "=a"(cpu_info[0]), "=b"(cpu_info[1]), "=c"(cpu_info[2]), "=d"(cpu_info[3])
|
| + : "a"(info_type)
|
| + );
|
| +}
|
| +
|
| +#endif
|
| +
|
| +#elif V8_HOST_ARCH_ARM || V8_HOST_ARCH_MIPS
|
| +
|
| +#if V8_HOST_ARCH_ARM
|
| +
|
| +// See <uapi/asm/hwcap.h> kernel header.
|
| +/*
|
| + * HWCAP flags - for elf_hwcap (in kernel) and AT_HWCAP
|
| + */
|
| +#define HWCAP_SWP (1 << 0)
|
| +#define HWCAP_HALF (1 << 1)
|
| +#define HWCAP_THUMB (1 << 2)
|
| +#define HWCAP_26BIT (1 << 3) /* Play it safe */
|
| +#define HWCAP_FAST_MULT (1 << 4)
|
| +#define HWCAP_FPA (1 << 5)
|
| +#define HWCAP_VFP (1 << 6)
|
| +#define HWCAP_EDSP (1 << 7)
|
| +#define HWCAP_JAVA (1 << 8)
|
| +#define HWCAP_IWMMXT (1 << 9)
|
| +#define HWCAP_CRUNCH (1 << 10)
|
| +#define HWCAP_THUMBEE (1 << 11)
|
| +#define HWCAP_NEON (1 << 12)
|
| +#define HWCAP_VFPv3 (1 << 13)
|
| +#define HWCAP_VFPv3D16 (1 << 14) /* also set for VFPv4-D16 */
|
| +#define HWCAP_TLS (1 << 15)
|
| +#define HWCAP_VFPv4 (1 << 16)
|
| +#define HWCAP_IDIVA (1 << 17)
|
| +#define HWCAP_IDIVT (1 << 18)
|
| +#define HWCAP_VFPD32 (1 << 19) /* set if VFP has 32 regs (not 16) */
|
| +#define HWCAP_IDIV (HWCAP_IDIVA | HWCAP_IDIVT)
|
| +#define HWCAP_LPAE (1 << 20)
|
| +
|
| +#define AT_HWCAP 16
|
| +
|
| +// Read the ELF HWCAP flags by parsing /proc/self/auxv.
|
| +static uint32_t ReadELFHWCaps() {
|
| + uint32_t result = 0;
|
| + FILE* fp = fopen("/proc/self/auxv", "r");
|
| + if (fp != NULL) {
|
| + struct { uint32_t tag; uint32_t value; } entry;
|
| + for (;;) {
|
| + size_t n = fread(&entry, sizeof(entry), 1, fp);
|
| + if (n == 0 || (entry.tag == 0 && entry.value == 0)) {
|
| + break;
|
| + }
|
| + if (entry.tag == AT_HWCAP) {
|
| + result = entry.value;
|
| + break;
|
| + }
|
| + }
|
| + fclose(fp);
|
| + }
|
| + return result;
|
| +}
|
| +
|
| +#endif // V8_HOST_ARCH_ARM
|
| +
|
| +// Extract the information exposed by the kernel via /proc/cpuinfo.
|
| +class CPUInfo V8_FINAL BASE_EMBEDDED {
|
| + public:
|
| + CPUInfo() : datalen_(0) {
|
| + // Get the size of the cpuinfo file by reading it until the end. This is
|
| + // required because files under /proc do not always return a valid size
|
| + // when using fseek(0, SEEK_END) + ftell(). Nor can the be mmap()-ed.
|
| + static const char PATHNAME[] = "/proc/cpuinfo";
|
| + FILE* fp = fopen(PATHNAME, "r");
|
| + if (fp != NULL) {
|
| + for (;;) {
|
| + char buffer[256];
|
| + size_t n = fread(buffer, 1, sizeof(buffer), fp);
|
| + if (n == 0) {
|
| + break;
|
| + }
|
| + datalen_ += n;
|
| + }
|
| + fclose(fp);
|
| + }
|
| +
|
| + // Read the contents of the cpuinfo file.
|
| + data_ = new char[datalen_ + 1];
|
| + fp = fopen(PATHNAME, "r");
|
| + if (fp != NULL) {
|
| + for (size_t offset = 0; offset < datalen_; ) {
|
| + size_t n = fread(data_ + offset, 1, datalen_ - offset, fp);
|
| + if (n == 0) {
|
| + break;
|
| + }
|
| + offset += n;
|
| + }
|
| + fclose(fp);
|
| + }
|
| +
|
| + // Zero-terminate the data.
|
| + data_[datalen_] = '\0';
|
| + }
|
| +
|
| + ~CPUInfo() {
|
| + delete[] data_;
|
| + }
|
| +
|
| + // Extract the content of a the first occurence of a given field in
|
| + // the content of the cpuinfo file and return it as a heap-allocated
|
| + // string that must be freed by the caller using delete[].
|
| + // Return NULL if not found.
|
| + char* ExtractField(const char* field) const {
|
| + ASSERT(field != NULL);
|
| +
|
| + // Look for first field occurence, and ensure it starts the line.
|
| + size_t fieldlen = strlen(field);
|
| + char* p = data_;
|
| + for (;;) {
|
| + p = strstr(p, field);
|
| + if (p == NULL) {
|
| + return NULL;
|
| + }
|
| + if (p == data_ || p[-1] == '\n') {
|
| + break;
|
| + }
|
| + p += fieldlen;
|
| + }
|
| +
|
| + // Skip to the first colon followed by a space.
|
| + p = strchr(p + fieldlen, ':');
|
| + if (p == NULL || !isspace(p[1])) {
|
| + return NULL;
|
| + }
|
| + p += 2;
|
| +
|
| + // Find the end of the line.
|
| + char* q = strchr(p, '\n');
|
| + if (q == NULL) {
|
| + q = data_ + datalen_;
|
| + }
|
| +
|
| + // Copy the line into a heap-allocated buffer.
|
| + size_t len = q - p;
|
| + char* result = new char[len + 1];
|
| + if (result != NULL) {
|
| + memcpy(result, p, len);
|
| + result[len] = '\0';
|
| + }
|
| + return result;
|
| + }
|
| +
|
| + private:
|
| + char* data_;
|
| + size_t datalen_;
|
| +};
|
| +
|
| +
|
| +// Checks that a space-separated list of items contains one given 'item'.
|
| +static bool HasListItem(const char* list, const char* item) {
|
| + ssize_t item_len = strlen(item);
|
| + const char* p = list;
|
| + if (p != NULL) {
|
| + while (*p != '\0') {
|
| + // Skip whitespace.
|
| + while (isspace(*p)) ++p;
|
| +
|
| + // Find end of current list item.
|
| + const char* q = p;
|
| + while (*q != '\0' && !isspace(*q)) ++q;
|
| +
|
| + if (item_len == q - p && memcmp(p, item, item_len) == 0) {
|
| + return true;
|
| + }
|
| +
|
| + // Skip to next item.
|
| + p = q;
|
| + }
|
| + }
|
| + return false;
|
| +}
|
| +
|
| +#endif // V8_HOST_ARCH_IA32 || V8_HOST_ARCH_X64
|
| +
|
| +CPU::CPU() : stepping_(0),
|
| + model_(0),
|
| + ext_model_(0),
|
| + family_(0),
|
| + ext_family_(0),
|
| + type_(0),
|
| + implementer_(0),
|
| + architecture_(0),
|
| + part_(0),
|
| + has_fpu_(false),
|
| + has_cmov_(false),
|
| + has_sahf_(false),
|
| + has_mmx_(false),
|
| + has_sse_(false),
|
| + has_sse2_(false),
|
| + has_sse3_(false),
|
| + has_ssse3_(false),
|
| + has_sse41_(false),
|
| + has_sse42_(false),
|
| + has_idiva_(false),
|
| + has_neon_(false),
|
| + has_thumbee_(false),
|
| + has_vfp_(false),
|
| + has_vfp3_(false),
|
| + has_vfp3_d32_(false) {
|
| + memcpy(vendor_, "Unknown", 8);
|
| +#if V8_HOST_ARCH_IA32 || V8_HOST_ARCH_X64
|
| + int cpu_info[4];
|
| +
|
| + // __cpuid with an InfoType argument of 0 returns the number of
|
| + // valid Ids in CPUInfo[0] and the CPU identification string in
|
| + // the other three array elements. The CPU identification string is
|
| + // not in linear order. The code below arranges the information
|
| + // in a human readable form. The human readable order is CPUInfo[1] |
|
| + // CPUInfo[3] | CPUInfo[2]. CPUInfo[2] and CPUInfo[3] are swapped
|
| + // before using memcpy to copy these three array elements to cpu_string.
|
| + __cpuid(cpu_info, 0);
|
| + unsigned num_ids = cpu_info[0];
|
| + std::swap(cpu_info[2], cpu_info[3]);
|
| + memcpy(vendor_, cpu_info + 1, 12);
|
| + vendor_[12] = '\0';
|
| +
|
| + // Interpret CPU feature information.
|
| + if (num_ids > 0) {
|
| + __cpuid(cpu_info, 1);
|
| + stepping_ = cpu_info[0] & 0xf;
|
| + model_ = ((cpu_info[0] >> 4) & 0xf) + ((cpu_info[0] >> 12) & 0xf0);
|
| + family_ = (cpu_info[0] >> 8) & 0xf;
|
| + type_ = (cpu_info[0] >> 12) & 0x3;
|
| + ext_model_ = (cpu_info[0] >> 16) & 0xf;
|
| + ext_family_ = (cpu_info[0] >> 20) & 0xff;
|
| + has_fpu_ = (cpu_info[3] & 0x00000001) != 0;
|
| + has_cmov_ = (cpu_info[3] & 0x00008000) != 0;
|
| + has_mmx_ = (cpu_info[3] & 0x00800000) != 0;
|
| + has_sse_ = (cpu_info[3] & 0x02000000) != 0;
|
| + has_sse2_ = (cpu_info[3] & 0x04000000) != 0;
|
| + has_sse3_ = (cpu_info[2] & 0x00000001) != 0;
|
| + has_ssse3_ = (cpu_info[2] & 0x00000200) != 0;
|
| + has_sse41_ = (cpu_info[2] & 0x00080000) != 0;
|
| + has_sse42_ = (cpu_info[2] & 0x00100000) != 0;
|
| + }
|
| +
|
| + // Query extended IDs.
|
| + __cpuid(cpu_info, 0x80000000);
|
| + unsigned num_ext_ids = cpu_info[0];
|
| +
|
| + // Interpret extended CPU feature information.
|
| + if (num_ext_ids > 0x80000000) {
|
| + __cpuid(cpu_info, 0x80000001);
|
| + // SAHF is always available in compat/legacy mode,
|
| + // but must be probed in long mode.
|
| +#if V8_HOST_ARCH_IA32
|
| + has_sahf_ = true;
|
| +#else
|
| + has_sahf_ = (cpu_info[2] & 0x00000001) != 0;
|
| +#endif
|
| + }
|
| +#elif V8_HOST_ARCH_ARM
|
| + CPUInfo cpu_info;
|
| +
|
| + // Extract implementor from the "CPU implementer" field.
|
| + char* implementer = cpu_info.ExtractField("CPU implementer");
|
| + if (implementer != NULL) {
|
| + char* end ;
|
| + implementer_ = strtol(implementer, &end, 0);
|
| + if (end == implementer) {
|
| + implementer_ = 0;
|
| + }
|
| + delete[] implementer;
|
| + }
|
| +
|
| + // Extract part number from the "CPU part" field.
|
| + char* part = cpu_info.ExtractField("CPU part");
|
| + if (part != NULL) {
|
| + char* end ;
|
| + part_ = strtol(part, &end, 0);
|
| + if (end == part) {
|
| + part_ = 0;
|
| + }
|
| + delete[] part;
|
| + }
|
| +
|
| + // Extract architecture from the "CPU Architecture" field.
|
| + // The list is well-known, unlike the the output of
|
| + // the 'Processor' field which can vary greatly.
|
| + // See the definition of the 'proc_arch' array in
|
| + // $KERNEL/arch/arm/kernel/setup.c and the 'c_show' function in
|
| + // same file.
|
| + char* architecture = cpu_info.ExtractField("CPU architecture");
|
| + if (architecture != NULL) {
|
| + char* end;
|
| + architecture_ = strtol(architecture, &end, 10);
|
| + if (end == architecture) {
|
| + architecture_ = 0;
|
| + }
|
| + delete[] architecture;
|
| +
|
| + // Unfortunately, it seems that certain ARMv6-based CPUs
|
| + // report an incorrect architecture number of 7!
|
| + //
|
| + // See http://code.google.com/p/android/issues/detail?id=10812
|
| + //
|
| + // We try to correct this by looking at the 'elf_format'
|
| + // field reported by the 'Processor' field, which is of the
|
| + // form of "(v7l)" for an ARMv7-based CPU, and "(v6l)" for
|
| + // an ARMv6-one. For example, the Raspberry Pi is one popular
|
| + // ARMv6 device that reports architecture 7.
|
| + if (architecture_ == 7) {
|
| + char* processor = cpu_info.ExtractField("Processor");
|
| + if (HasListItem(processor, "(v6l)")) {
|
| + architecture_ = 6;
|
| + }
|
| + delete[] processor;
|
| + }
|
| + }
|
| +
|
| + // Try to extract the list of CPU features from ELF hwcaps.
|
| + uint32_t hwcaps = ReadELFHWCaps();
|
| + if (hwcaps != 0) {
|
| + has_idiva_ = (hwcaps & HWCAP_IDIVA) != 0;
|
| + has_neon_ = (hwcaps & HWCAP_NEON) != 0;
|
| + has_thumbee_ = (hwcaps & HWCAP_THUMBEE) != 0;
|
| + has_vfp_ = (hwcaps & HWCAP_VFP) != 0;
|
| + has_vfp3_ = (hwcaps & (HWCAP_VFPv3 | HWCAP_VFPv3D16 | HWCAP_VFPv4)) != 0;
|
| + has_vfp3_d32_ = (has_vfp3_ && ((hwcaps & HWCAP_VFPv3D16) == 0 ||
|
| + (hwcaps & HWCAP_VFPD32) != 0));
|
| + } else {
|
| + // Try to fallback to "Features" CPUInfo field.
|
| + char* features = cpu_info.ExtractField("Features");
|
| + has_idiva_ = HasListItem(features, "idiva");
|
| + has_neon_ = HasListItem(features, "neon");
|
| + has_thumbee_ = HasListItem(features, "thumbee");
|
| + has_vfp_ = HasListItem(features, "vfp");
|
| + if (HasListItem(features, "vfpv3")) {
|
| + has_vfp3_ = true;
|
| + has_vfp3_d32_ = true;
|
| + } else if (HasListItem(features, "vfpv3d16")) {
|
| + has_vfp3_ = true;
|
| + }
|
| + delete[] features;
|
| + }
|
| +
|
| + // Some old kernels will report vfp not vfpv3. Here we make an attempt
|
| + // to detect vfpv3 by checking for vfp *and* neon, since neon is only
|
| + // available on architectures with vfpv3. Checking neon on its own is
|
| + // not enough as it is possible to have neon without vfp.
|
| + if (has_vfp_ && has_neon_) {
|
| + has_vfp3_ = true;
|
| + }
|
| +
|
| + // VFPv3 implies ARMv7, see ARM DDI 0406B, page A1-6.
|
| + if (architecture_ < 7 && has_vfp3_) {
|
| + architecture_ = 7;
|
| + }
|
| +
|
| + // ARMv7 implies ThumbEE.
|
| + if (architecture_ >= 7) {
|
| + has_thumbee_ = true;
|
| + }
|
| +
|
| + // The earliest architecture with ThumbEE is ARMv6T2.
|
| + if (has_thumbee_ && architecture_ < 6) {
|
| + architecture_ = 6;
|
| + }
|
| +
|
| + // We don't support any FPUs other than VFP.
|
| + has_fpu_ = has_vfp_;
|
| +#elif V8_HOST_ARCH_MIPS
|
| + // Simple detection of FPU at runtime for Linux.
|
| + // It is based on /proc/cpuinfo, which reveals hardware configuration
|
| + // to user-space applications. According to MIPS (early 2010), no similar
|
| + // facility is universally available on the MIPS architectures,
|
| + // so it's up to individual OSes to provide such.
|
| + CPUInfo cpu_info;
|
| + char* cpu_model = cpu_info.ExtractField("cpu model");
|
| + has_fpu_ = HasListItem(cpu_model, "FPU");
|
| + delete[] cpu_model;
|
| +#endif
|
| +}
|
| +
|
| +} } // namespace v8::internal
|
|
|