| OLD | NEW |
| 1 // Copyright (c) 2012 The Chromium Authors. All rights reserved. | 1 // Copyright (c) 2012 The Chromium Authors. All rights reserved. |
| 2 // Use of this source code is governed by a BSD-style license that can be | 2 // Use of this source code is governed by a BSD-style license that can be |
| 3 // found in the LICENSE file. | 3 // found in the LICENSE file. |
| 4 | 4 |
| 5 #include "base/cpu.h" | 5 #include "base/cpu.h" |
| 6 | 6 |
| 7 #include <string.h> | 7 #include <string.h> |
| 8 | 8 |
| 9 #include <algorithm> | 9 #include <algorithm> |
| 10 | 10 |
| 11 #include "base/basictypes.h" |
| 11 #include "build/build_config.h" | 12 #include "build/build_config.h" |
| 12 | 13 |
| 13 #if defined(ARCH_CPU_X86_FAMILY) | 14 #if defined(ARCH_CPU_X86_FAMILY) |
| 14 #if defined(_MSC_VER) | 15 #if defined(_MSC_VER) |
| 15 #include <intrin.h> | 16 #include <intrin.h> |
| 17 #include <immintrin.h> // For _xgetbv() |
| 16 #endif | 18 #endif |
| 17 #endif | 19 #endif |
| 18 | 20 |
| 19 namespace base { | 21 namespace base { |
| 20 | 22 |
| 21 CPU::CPU() | 23 CPU::CPU() |
| 22 : signature_(0), | 24 : signature_(0), |
| 23 type_(0), | 25 type_(0), |
| 24 family_(0), | 26 family_(0), |
| 25 model_(0), | 27 model_(0), |
| 26 stepping_(0), | 28 stepping_(0), |
| 27 ext_model_(0), | 29 ext_model_(0), |
| 28 ext_family_(0), | 30 ext_family_(0), |
| 29 has_mmx_(false), | 31 has_mmx_(false), |
| 30 has_sse_(false), | 32 has_sse_(false), |
| 31 has_sse2_(false), | 33 has_sse2_(false), |
| 32 has_sse3_(false), | 34 has_sse3_(false), |
| 33 has_ssse3_(false), | 35 has_ssse3_(false), |
| 34 has_sse41_(false), | 36 has_sse41_(false), |
| 35 has_sse42_(false), | 37 has_sse42_(false), |
| 38 has_avx_(false), |
| 39 has_avx_hardware_(false), |
| 36 has_non_stop_time_stamp_counter_(false), | 40 has_non_stop_time_stamp_counter_(false), |
| 37 cpu_vendor_("unknown") { | 41 cpu_vendor_("unknown") { |
| 38 Initialize(); | 42 Initialize(); |
| 39 } | 43 } |
| 40 | 44 |
| 45 namespace { |
| 46 |
| 41 #if defined(ARCH_CPU_X86_FAMILY) | 47 #if defined(ARCH_CPU_X86_FAMILY) |
| 42 #ifndef _MSC_VER | 48 #ifndef _MSC_VER |
| 43 | 49 |
| 44 #if defined(__pic__) && defined(__i386__) | 50 #if defined(__pic__) && defined(__i386__) |
| 45 | 51 |
| 46 void __cpuid(int cpu_info[4], int info_type) { | 52 void __cpuid(int cpu_info[4], int info_type) { |
| 47 __asm__ volatile ( | 53 __asm__ volatile ( |
| 48 "mov %%ebx, %%edi\n" | 54 "mov %%ebx, %%edi\n" |
| 49 "cpuid\n" | 55 "cpuid\n" |
| 50 "xchg %%edi, %%ebx\n" | 56 "xchg %%edi, %%ebx\n" |
| (...skipping 24 matching lines...) Expand all Loading... |
| 75 | 81 |
| 76 void __cpuidex(int cpu_info[4], int info_type, int info_index) { | 82 void __cpuidex(int cpu_info[4], int info_type, int info_index) { |
| 77 __asm__ volatile ( | 83 __asm__ volatile ( |
| 78 "cpuid \n\t" | 84 "cpuid \n\t" |
| 79 : "=a"(cpu_info[0]), "=b"(cpu_info[1]), "=c"(cpu_info[2]), "=d"(cpu_info[3]) | 85 : "=a"(cpu_info[0]), "=b"(cpu_info[1]), "=c"(cpu_info[2]), "=d"(cpu_info[3]) |
| 80 : "a"(info_type), "c"(info_index) | 86 : "a"(info_type), "c"(info_index) |
| 81 ); | 87 ); |
| 82 } | 88 } |
| 83 | 89 |
| 84 #endif | 90 #endif |
| 85 #endif // _MSC_VER | 91 |
| 92 // _xgetbv returns the value of an Intel Extended Control Register (XCR). |
| 93 // Currently only XCR0 is defined by Intel so |xcr| should always be zero. |
| 94 uint64 _xgetbv(uint32 xcr) { |
| 95 uint32 eax, edx; |
| 96 |
| 97 __asm__ volatile ("xgetbv" : "=a" (eax), "=d" (edx) : "c" (xcr)); |
| 98 return (static_cast<uint64>(edx) << 32) | eax; |
| 99 } |
| 100 |
| 101 #endif // !_MSC_VER |
| 86 #endif // ARCH_CPU_X86_FAMILY | 102 #endif // ARCH_CPU_X86_FAMILY |
| 87 | 103 |
| 104 } // anonymous namespace |
| 105 |
| 88 void CPU::Initialize() { | 106 void CPU::Initialize() { |
| 89 #if defined(ARCH_CPU_X86_FAMILY) | 107 #if defined(ARCH_CPU_X86_FAMILY) |
| 90 int cpu_info[4] = {-1}; | 108 int cpu_info[4] = {-1}; |
| 91 char cpu_string[48]; | 109 char cpu_string[48]; |
| 92 | 110 |
| 93 // __cpuid with an InfoType argument of 0 returns the number of | 111 // __cpuid with an InfoType argument of 0 returns the number of |
| 94 // valid Ids in CPUInfo[0] and the CPU identification string in | 112 // valid Ids in CPUInfo[0] and the CPU identification string in |
| 95 // the other three array elements. The CPU identification string is | 113 // the other three array elements. The CPU identification string is |
| 96 // not in linear order. The code below arranges the information | 114 // not in linear order. The code below arranges the information |
| 97 // in a human readable form. The human readable order is CPUInfo[1] | | 115 // in a human readable form. The human readable order is CPUInfo[1] | |
| 98 // CPUInfo[3] | CPUInfo[2]. CPUInfo[2] and CPUInfo[3] are swapped | 116 // CPUInfo[3] | CPUInfo[2]. CPUInfo[2] and CPUInfo[3] are swapped |
| 99 // before using memcpy to copy these three array elements to cpu_string. | 117 // before using memcpy to copy these three array elements to cpu_string. |
| 100 __cpuid(cpu_info, 0); | 118 __cpuid(cpu_info, 0); |
| 101 int num_ids = cpu_info[0]; | 119 int num_ids = cpu_info[0]; |
| 102 std::swap(cpu_info[2], cpu_info[3]); | 120 std::swap(cpu_info[2], cpu_info[3]); |
| 103 memcpy(cpu_string, &cpu_info[1], 3 * sizeof(cpu_info[1])); | 121 memcpy(cpu_string, &cpu_info[1], 3 * sizeof(cpu_info[1])); |
| 104 cpu_vendor_.assign(cpu_string, 3 * sizeof(cpu_info[1])); | 122 cpu_vendor_.assign(cpu_string, 3 * sizeof(cpu_info[1])); |
| 105 | 123 |
| 106 // Interpret CPU feature information. | 124 // Interpret CPU feature information. |
| 107 if (num_ids > 0) { | 125 if (num_ids > 0) { |
| 108 __cpuid(cpu_info, 1); | 126 __cpuid(cpu_info, 1); |
| 109 signature_ = cpu_info[0]; | 127 signature_ = cpu_info[0]; |
| 110 stepping_ = cpu_info[0] & 0xf; | 128 stepping_ = cpu_info[0] & 0xf; |
| 111 model_ = ((cpu_info[0] >> 4) & 0xf) + ((cpu_info[0] >> 12) & 0xf0); | 129 model_ = ((cpu_info[0] >> 4) & 0xf) + ((cpu_info[0] >> 12) & 0xf0); |
| 112 family_ = (cpu_info[0] >> 8) & 0xf; | 130 family_ = (cpu_info[0] >> 8) & 0xf; |
| 113 type_ = (cpu_info[0] >> 12) & 0x3; | 131 type_ = (cpu_info[0] >> 12) & 0x3; |
| 114 ext_model_ = (cpu_info[0] >> 16) & 0xf; | 132 ext_model_ = (cpu_info[0] >> 16) & 0xf; |
| 115 ext_family_ = (cpu_info[0] >> 20) & 0xff; | 133 ext_family_ = (cpu_info[0] >> 20) & 0xff; |
| 116 has_mmx_ = (cpu_info[3] & 0x00800000) != 0; | 134 has_mmx_ = (cpu_info[3] & 0x00800000) != 0; |
| 117 has_sse_ = (cpu_info[3] & 0x02000000) != 0; | 135 has_sse_ = (cpu_info[3] & 0x02000000) != 0; |
| 118 has_sse2_ = (cpu_info[3] & 0x04000000) != 0; | 136 has_sse2_ = (cpu_info[3] & 0x04000000) != 0; |
| 119 has_sse3_ = (cpu_info[2] & 0x00000001) != 0; | 137 has_sse3_ = (cpu_info[2] & 0x00000001) != 0; |
| 120 has_ssse3_ = (cpu_info[2] & 0x00000200) != 0; | 138 has_ssse3_ = (cpu_info[2] & 0x00000200) != 0; |
| 121 has_sse41_ = (cpu_info[2] & 0x00080000) != 0; | 139 has_sse41_ = (cpu_info[2] & 0x00080000) != 0; |
| 122 has_sse42_ = (cpu_info[2] & 0x00100000) != 0; | 140 has_sse42_ = (cpu_info[2] & 0x00100000) != 0; |
| 123 has_avx_ = (cpu_info[2] & 0x10000000) != 0; | 141 has_avx_hardware_ = |
| 142 (cpu_info[2] & 0x10000000) != 0; |
| 143 /* AVX instructions will generate an illegal instruction exception unless |
| 144 * a) they are supported by the CPU, |
| 145 * b) XSAVE is supported by the CPU and |
| 146 * c) XSAVE is enabled by the kernel. |
| 147 * See http://software.intel.com/en-us/blogs/2011/04/14/is-avx-enabled */ |
| 148 has_avx_ = |
| 149 has_avx_hardware_ && |
| 150 (cpu_info[2] & 0x08000000) == 0x08000000 /* OSXSAVE */ && |
| 151 (_xgetbv(0) & 6) == 6 /* XSAVE enabled by kernel */; |
| 124 } | 152 } |
| 125 | 153 |
| 126 // Get the brand string of the cpu. | 154 // Get the brand string of the cpu. |
| 127 __cpuid(cpu_info, 0x80000000); | 155 __cpuid(cpu_info, 0x80000000); |
| 128 const int parameter_end = 0x80000004; | 156 const int parameter_end = 0x80000004; |
| 129 int max_parameter = cpu_info[0]; | 157 int max_parameter = cpu_info[0]; |
| 130 | 158 |
| 131 if (cpu_info[0] >= parameter_end) { | 159 if (cpu_info[0] >= parameter_end) { |
| 132 char* cpu_string_ptr = cpu_string; | 160 char* cpu_string_ptr = cpu_string; |
| 133 | 161 |
| (...skipping 26 matching lines...) Expand all Loading... |
| 160 if (has_sse42()) return SSE42; | 188 if (has_sse42()) return SSE42; |
| 161 if (has_sse41()) return SSE41; | 189 if (has_sse41()) return SSE41; |
| 162 if (has_ssse3()) return SSSE3; | 190 if (has_ssse3()) return SSSE3; |
| 163 if (has_sse3()) return SSE3; | 191 if (has_sse3()) return SSE3; |
| 164 if (has_sse2()) return SSE2; | 192 if (has_sse2()) return SSE2; |
| 165 if (has_sse()) return SSE; | 193 if (has_sse()) return SSE; |
| 166 return PENTIUM; | 194 return PENTIUM; |
| 167 } | 195 } |
| 168 | 196 |
| 169 } // namespace base | 197 } // namespace base |
| OLD | NEW |