Chromium Code Reviews| OLD | NEW |
|---|---|
| 1 // Copyright (c) 2012 The Chromium Authors. All rights reserved. | 1 // Copyright (c) 2012 The Chromium Authors. All rights reserved. |
| 2 // Use of this source code is governed by a BSD-style license that can be | 2 // Use of this source code is governed by a BSD-style license that can be |
| 3 // found in the LICENSE file. | 3 // found in the LICENSE file. |
| 4 | 4 |
| 5 #include "base/cpu.h" | 5 #include "base/cpu.h" |
| 6 | 6 |
| 7 #include <string.h> | 7 #include <string.h> |
| 8 | 8 |
| 9 #include <algorithm> | 9 #include <algorithm> |
| 10 | 10 |
| 11 #include "base/basictypes.h" | |
| 11 #include "build/build_config.h" | 12 #include "build/build_config.h" |
| 12 | 13 |
| 13 #if defined(ARCH_CPU_X86_FAMILY) | 14 #if defined(ARCH_CPU_X86_FAMILY) |
| 14 #if defined(_MSC_VER) | 15 #if defined(_MSC_VER) |
| 15 #include <intrin.h> | 16 #include <intrin.h> |
| 17 #include <immintrin.h> // For _xgetbv() | |
| 16 #endif | 18 #endif |
| 17 #endif | 19 #endif |
| 18 | 20 |
| 19 namespace base { | 21 namespace base { |
| 20 | 22 |
| 21 CPU::CPU() | 23 CPU::CPU() |
| 22 : signature_(0), | 24 : signature_(0), |
| 23 type_(0), | 25 type_(0), |
| 24 family_(0), | 26 family_(0), |
| 25 model_(0), | 27 model_(0), |
| 26 stepping_(0), | 28 stepping_(0), |
| 27 ext_model_(0), | 29 ext_model_(0), |
| 28 ext_family_(0), | 30 ext_family_(0), |
| 29 has_mmx_(false), | 31 has_mmx_(false), |
| 30 has_sse_(false), | 32 has_sse_(false), |
| 31 has_sse2_(false), | 33 has_sse2_(false), |
| 32 has_sse3_(false), | 34 has_sse3_(false), |
| 33 has_ssse3_(false), | 35 has_ssse3_(false), |
| 34 has_sse41_(false), | 36 has_sse41_(false), |
| 35 has_sse42_(false), | 37 has_sse42_(false), |
| 38 has_avx_(false), | |
| 39 has_avx_hardware_(false), | |
| 36 has_non_stop_time_stamp_counter_(false), | 40 has_non_stop_time_stamp_counter_(false), |
| 37 cpu_vendor_("unknown") { | 41 cpu_vendor_("unknown") { |
| 38 Initialize(); | 42 Initialize(); |
| 39 } | 43 } |
| 40 | 44 |
| 45 namespace { | |
| 46 | |
| 41 #if defined(ARCH_CPU_X86_FAMILY) | 47 #if defined(ARCH_CPU_X86_FAMILY) |
| 42 #ifndef _MSC_VER | 48 #ifndef _MSC_VER |
| 43 | 49 |
| 44 #if defined(__pic__) && defined(__i386__) | 50 #if defined(__pic__) && defined(__i386__) |
| 45 | 51 |
| 46 void __cpuid(int cpu_info[4], int info_type) { | 52 void __cpuid(int cpu_info[4], int info_type) { |
| 47 __asm__ volatile ( | 53 __asm__ volatile ( |
| 48 "mov %%ebx, %%edi\n" | 54 "mov %%ebx, %%edi\n" |
| 49 "cpuid\n" | 55 "cpuid\n" |
| 50 "xchg %%edi, %%ebx\n" | 56 "xchg %%edi, %%ebx\n" |
| 51 : "=a"(cpu_info[0]), "=D"(cpu_info[1]), "=c"(cpu_info[2]), "=d"(cpu_info[3]) | 57 : "=a"(cpu_info[0]), "=D"(cpu_info[1]), "=c"(cpu_info[2]), "=d"(cpu_info[3]) |
| 52 : "a"(info_type) | 58 : "a"(info_type) |
| 53 ); | 59 ); |
| 54 } | 60 } |
| 55 | 61 |
| 56 void __cpuidex(int cpu_info[4], int info_type, int info_index) { | |
| 57 __asm__ volatile ( | |
| 58 "mov %%ebx, %%edi\n" | |
| 59 "cpuid\n" | |
| 60 "xchg %%edi, %%ebx\n" | |
| 61 : "=a"(cpu_info[0]), "=D"(cpu_info[1]), "=c"(cpu_info[2]), "=d"(cpu_info[3]) | |
| 62 : "a"(info_type), "c"(info_index) | |
| 63 ); | |
| 64 } | |
| 65 | |
| 66 #else | 62 #else |
| 67 | 63 |
| 68 void __cpuid(int cpu_info[4], int info_type) { | 64 void __cpuid(int cpu_info[4], int info_type) { |
| 69 __asm__ volatile ( | 65 __asm__ volatile ( |
| 70 "cpuid \n\t" | 66 "cpuid \n\t" |
| 71 : "=a"(cpu_info[0]), "=b"(cpu_info[1]), "=c"(cpu_info[2]), "=d"(cpu_info[3]) | 67 : "=a"(cpu_info[0]), "=b"(cpu_info[1]), "=c"(cpu_info[2]), "=d"(cpu_info[3]) |
| 72 : "a"(info_type) | 68 : "a"(info_type) |
| 73 ); | 69 ); |
| 74 } | 70 } |
| 75 | 71 |
| 76 void __cpuidex(int cpu_info[4], int info_type, int info_index) { | |
| 77 __asm__ volatile ( | |
| 78 "cpuid \n\t" | |
| 79 : "=a"(cpu_info[0]), "=b"(cpu_info[1]), "=c"(cpu_info[2]), "=d"(cpu_info[3]) | |
| 80 : "a"(info_type), "c"(info_index) | |
| 81 ); | |
| 82 } | |
| 83 | |
| 84 #endif | 72 #endif |
| 85 #endif // _MSC_VER | 73 |
| 74 // _xgetbv returns the value of an Intel Extended Control Register (XCR). | |
| 75 // Currently only XCR0 is defined by Intel so |xcr| should always be zero. | |
| 76 uint64 _xgetbv(uint32 xcr) { | |
| 77 uint32 eax, edx; | |
| 78 | |
| 79 __asm__ volatile ("xgetbv" : "=a" (eax), "=d" (edx) : "c" (xcr)); | |
| 80 return (static_cast<uint64>(edx) << 32) | eax; | |
| 81 } | |
| 82 | |
| 83 #endif // !_MSC_VER | |
| 86 #endif // ARCH_CPU_X86_FAMILY | 84 #endif // ARCH_CPU_X86_FAMILY |
| 87 | 85 |
| 86 } // anonymous namespace | |
| 87 | |
| 88 void CPU::Initialize() { | 88 void CPU::Initialize() { |
| 89 #if defined(ARCH_CPU_X86_FAMILY) | 89 #if defined(ARCH_CPU_X86_FAMILY) |
| 90 int cpu_info[4] = {-1}; | 90 int cpu_info[4] = {-1}; |
| 91 char cpu_string[48]; | 91 char cpu_string[48]; |
| 92 | 92 |
| 93 // __cpuid with an InfoType argument of 0 returns the number of | 93 // __cpuid with an InfoType argument of 0 returns the number of |
| 94 // valid Ids in CPUInfo[0] and the CPU identification string in | 94 // valid Ids in CPUInfo[0] and the CPU identification string in |
| 95 // the other three array elements. The CPU identification string is | 95 // the other three array elements. The CPU identification string is |
| 96 // not in linear order. The code below arranges the information | 96 // not in linear order. The code below arranges the information |
| 97 // in a human readable form. The human readable order is CPUInfo[1] | | 97 // in a human readable form. The human readable order is CPUInfo[1] | |
| 98 // CPUInfo[3] | CPUInfo[2]. CPUInfo[2] and CPUInfo[3] are swapped | 98 // CPUInfo[3] | CPUInfo[2]. CPUInfo[2] and CPUInfo[3] are swapped |
| 99 // before using memcpy to copy these three array elements to cpu_string. | 99 // before using memcpy to copy these three array elements to cpu_string. |
| 100 __cpuid(cpu_info, 0); | 100 __cpuid(cpu_info, 0); |
| 101 int num_ids = cpu_info[0]; | 101 int num_ids = cpu_info[0]; |
| 102 std::swap(cpu_info[2], cpu_info[3]); | 102 std::swap(cpu_info[2], cpu_info[3]); |
| 103 memcpy(cpu_string, &cpu_info[1], 3 * sizeof(cpu_info[1])); | 103 memcpy(cpu_string, &cpu_info[1], 3 * sizeof(cpu_info[1])); |
| 104 cpu_vendor_.assign(cpu_string, 3 * sizeof(cpu_info[1])); | 104 cpu_vendor_.assign(cpu_string, 3 * sizeof(cpu_info[1])); |
| 105 | 105 |
| 106 // Interpret CPU feature information. | 106 // Interpret CPU feature information. |
| 107 if (num_ids > 0) { | 107 if (num_ids > 0) { |
| 108 __cpuid(cpu_info, 1); | 108 __cpuid(cpu_info, 1); |
| 109 signature_ = cpu_info[0]; | 109 signature_ = cpu_info[0]; |
| 110 stepping_ = cpu_info[0] & 0xf; | 110 stepping_ = cpu_info[0] & 0xf; |
| 111 model_ = ((cpu_info[0] >> 4) & 0xf) + ((cpu_info[0] >> 12) & 0xf0); | 111 model_ = ((cpu_info[0] >> 4) & 0xf) + ((cpu_info[0] >> 12) & 0xf0); |
| 112 family_ = (cpu_info[0] >> 8) & 0xf; | 112 family_ = (cpu_info[0] >> 8) & 0xf; |
| 113 type_ = (cpu_info[0] >> 12) & 0x3; | 113 type_ = (cpu_info[0] >> 12) & 0x3; |
| 114 ext_model_ = (cpu_info[0] >> 16) & 0xf; | 114 ext_model_ = (cpu_info[0] >> 16) & 0xf; |
| 115 ext_family_ = (cpu_info[0] >> 20) & 0xff; | 115 ext_family_ = (cpu_info[0] >> 20) & 0xff; |
| 116 has_mmx_ = (cpu_info[3] & 0x00800000) != 0; | 116 has_mmx_ = (cpu_info[3] & 0x00800000) != 0; |
| 117 has_sse_ = (cpu_info[3] & 0x02000000) != 0; | 117 has_sse_ = (cpu_info[3] & 0x02000000) != 0; |
| 118 has_sse2_ = (cpu_info[3] & 0x04000000) != 0; | 118 has_sse2_ = (cpu_info[3] & 0x04000000) != 0; |
| 119 has_sse3_ = (cpu_info[2] & 0x00000001) != 0; | 119 has_sse3_ = (cpu_info[2] & 0x00000001) != 0; |
| 120 has_ssse3_ = (cpu_info[2] & 0x00000200) != 0; | 120 has_ssse3_ = (cpu_info[2] & 0x00000200) != 0; |
| 121 has_sse41_ = (cpu_info[2] & 0x00080000) != 0; | 121 has_sse41_ = (cpu_info[2] & 0x00080000) != 0; |
| 122 has_sse42_ = (cpu_info[2] & 0x00100000) != 0; | 122 has_sse42_ = (cpu_info[2] & 0x00100000) != 0; |
| 123 has_avx_ = (cpu_info[2] & 0x10000000) != 0; | 123 has_avx_hardware_ = |
| 124 (cpu_info[2] & 0x10000000) != 0; | |
| 125 /* AVX instructions will generate an illegal instruction exception unless | |
| 126 * a) they are supported by the CPU, | |
| 127 * b) XSAVE is supported by the CPU and | |
| 128 * c) XSAVE is enabled by the kernel. | |
| 129 * See http://software.intel.com/en-us/blogs/2011/04/14/is-avx-enabled */ | |
|
wtc
2013/11/21 21:03:44
Use C++ comment //.
agl
2013/11/22 16:22:35
Done.
| |
| 130 has_avx_ = | |
| 131 has_avx_hardware_ && | |
| 132 (cpu_info[2] & 0x08000000) == 0x08000000 /* OSXSAVE */ && | |
|
wtc
2013/11/21 21:03:44
Nit: since 0x08000000 has only one bit, you can ju
agl
2013/11/22 16:22:35
Done.
| |
| 133 (_xgetbv(0) & 6) == 6 /* XSAVE enabled by kernel */; | |
|
wtc
2013/11/21 21:03:44
Nit: indent by four spaces
agl
2013/11/22 16:22:35
Done.
| |
| 124 } | 134 } |
| 125 | 135 |
| 126 // Get the brand string of the cpu. | 136 // Get the brand string of the cpu. |
| 127 __cpuid(cpu_info, 0x80000000); | 137 __cpuid(cpu_info, 0x80000000); |
| 128 const int parameter_end = 0x80000004; | 138 const int parameter_end = 0x80000004; |
| 129 int max_parameter = cpu_info[0]; | 139 int max_parameter = cpu_info[0]; |
| 130 | 140 |
| 131 if (cpu_info[0] >= parameter_end) { | 141 if (cpu_info[0] >= parameter_end) { |
| 132 char* cpu_string_ptr = cpu_string; | 142 char* cpu_string_ptr = cpu_string; |
| 133 | 143 |
| (...skipping 26 matching lines...) Expand all Loading... | |
| 160 if (has_sse42()) return SSE42; | 170 if (has_sse42()) return SSE42; |
| 161 if (has_sse41()) return SSE41; | 171 if (has_sse41()) return SSE41; |
| 162 if (has_ssse3()) return SSSE3; | 172 if (has_ssse3()) return SSSE3; |
| 163 if (has_sse3()) return SSE3; | 173 if (has_sse3()) return SSE3; |
| 164 if (has_sse2()) return SSE2; | 174 if (has_sse2()) return SSE2; |
| 165 if (has_sse()) return SSE; | 175 if (has_sse()) return SSE; |
| 166 return PENTIUM; | 176 return PENTIUM; |
| 167 } | 177 } |
| 168 | 178 |
| 169 } // namespace base | 179 } // namespace base |
| OLD | NEW |