Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(2)

Side by Side Diff: source/cpu_id.cc

Issue 1503393004: Work around bug in xgetbv for Visual Studio. (Closed) Base URL: https://chromium.googlesource.com/libyuv/libyuv@master
Patch Set: use pragma to disable optimization for xgetbv intrinsic Created 5 years ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch
« no previous file with comments | « no previous file | no next file » | no next file with comments »
Toggle Intra-line Diffs ('i') | Expand Comments ('e') | Collapse Comments ('c') | Show Comments Hide Comments ('s')
OLDNEW
1 /* 1 /*
2 * Copyright 2011 The LibYuv Project Authors. All rights reserved. 2 * Copyright 2011 The LibYuv Project Authors. All rights reserved.
3 * 3 *
4 * Use of this source code is governed by a BSD-style license 4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source 5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found 6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may 7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree. 8 * be found in the AUTHORS file in the root of the source tree.
9 */ 9 */
10 10
(...skipping 30 matching lines...) Expand all
41 #else 41 #else
42 #define SAFEBUFFERS 42 #define SAFEBUFFERS
43 #endif 43 #endif
44 44
45 // Low level cpuid for X86. 45 // Low level cpuid for X86.
46 #if (defined(_M_IX86) || defined(_M_X64) || \ 46 #if (defined(_M_IX86) || defined(_M_X64) || \
47 defined(__i386__) || defined(__x86_64__)) && \ 47 defined(__i386__) || defined(__x86_64__)) && \
48 !defined(__pnacl__) && !defined(__CLR_VER) 48 !defined(__pnacl__) && !defined(__CLR_VER)
49 LIBYUV_API 49 LIBYUV_API
50 void CpuId(uint32 info_eax, uint32 info_ecx, uint32* cpu_info) { 50 void CpuId(uint32 info_eax, uint32 info_ecx, uint32* cpu_info) {
51 #if (defined(_MSC_VER) && !defined(__clang__)) && !defined(__clang__) 51 #if defined(_MSC_VER) && !defined(__clang__)
52 // Visual C version uses intrinsic or inline x86 assembly. 52 // Visual C version uses intrinsic or inline x86 assembly.
53 #if (_MSC_FULL_VER >= 160040219) 53 #if (_MSC_FULL_VER >= 160040219)
54 __cpuidex((int*)(cpu_info), info_eax, info_ecx); 54 __cpuidex((int*)(cpu_info), info_eax, info_ecx);
55 #elif defined(_M_IX86) 55 #elif defined(_M_IX86)
56 __asm { 56 __asm {
57 mov eax, info_eax 57 mov eax, info_eax
58 mov ecx, info_ecx 58 mov ecx, info_ecx
59 mov edi, cpu_info 59 mov edi, cpu_info
60 cpuid 60 cpuid
61 mov [edi], eax 61 mov [edi], eax
62 mov [edi + 4], ebx 62 mov [edi + 4], ebx
63 mov [edi + 8], ecx 63 mov [edi + 8], ecx
64 mov [edi + 12], edx 64 mov [edi + 12], edx
65 } 65 }
66 #else 66 #else // Visual C but not x86
67 if (info_ecx == 0) { 67 if (info_ecx == 0) {
68 __cpuid((int*)(cpu_info), info_eax); 68 __cpuid((int*)(cpu_info), info_eax);
69 } else { 69 } else {
70 cpu_info[3] = cpu_info[2] = cpu_info[1] = cpu_info[0] = 0; 70 cpu_info[3] = cpu_info[2] = cpu_info[1] = cpu_info[0] = 0;
71 } 71 }
72 #endif 72 #endif
73 // GCC version uses inline x86 assembly. 73 // GCC version uses inline x86 assembly.
74 #else // (defined(_MSC_VER) && !defined(__clang__)) && !defined(__clang__) 74 #else // defined(_MSC_VER) && !defined(__clang__)
75 uint32 info_ebx, info_edx; 75 uint32 info_ebx, info_edx;
76 asm volatile ( 76 asm volatile (
77 #if defined( __i386__) && defined(__PIC__) 77 #if defined( __i386__) && defined(__PIC__)
78 // Preserve ebx for fpic 32 bit. 78 // Preserve ebx for fpic 32 bit.
79 "mov %%ebx, %%edi \n" 79 "mov %%ebx, %%edi \n"
80 "cpuid \n" 80 "cpuid \n"
81 "xchg %%edi, %%ebx \n" 81 "xchg %%edi, %%ebx \n"
82 : "=D" (info_ebx), 82 : "=D" (info_ebx),
83 #else 83 #else
84 "cpuid \n" 84 "cpuid \n"
85 : "=b" (info_ebx), 85 : "=b" (info_ebx),
86 #endif // defined( __i386__) && defined(__PIC__) 86 #endif // defined( __i386__) && defined(__PIC__)
87 "+a" (info_eax), "+c" (info_ecx), "=d" (info_edx)); 87 "+a" (info_eax), "+c" (info_ecx), "=d" (info_edx));
88 cpu_info[0] = info_eax; 88 cpu_info[0] = info_eax;
89 cpu_info[1] = info_ebx; 89 cpu_info[1] = info_ebx;
90 cpu_info[2] = info_ecx; 90 cpu_info[2] = info_ecx;
91 cpu_info[3] = info_edx; 91 cpu_info[3] = info_edx;
92 #endif // (defined(_MSC_VER) && !defined(__clang__)) && !defined(__clang__) 92 #endif // defined(_MSC_VER) && !defined(__clang__)
93 } 93 }
94 #else // (defined(_M_IX86) || defined(_M_X64) ... 94 #else // (defined(_M_IX86) || defined(_M_X64) ...
95 LIBYUV_API 95 LIBYUV_API
96 void CpuId(uint32 eax, uint32 ecx, uint32* cpu_info) { 96 void CpuId(uint32 eax, uint32 ecx, uint32* cpu_info) {
97 cpu_info[0] = cpu_info[1] = cpu_info[2] = cpu_info[3] = 0; 97 cpu_info[0] = cpu_info[1] = cpu_info[2] = cpu_info[3] = 0;
98 } 98 }
99 #endif 99 #endif
100 100
101 // TODO(fbarchard): Enable xgetbv when validator supports it. 101 // For VS2010 and earlier emit can be used:
102 // _asm _emit 0x0f _asm _emit 0x01 _asm _emit 0xd0 // For VS2010 and earlier.
103 // __asm {
104 // xor ecx, ecx // xcr 0
105 // xgetbv
106 // mov xcr0, eax
107 // }
108 // For VS2013 and earlier 32 bit, the _xgetbv(0) optimizer produces bad code.
109 // https://code.google.com/p/libyuv/issues/detail?id=529
110 #if defined(_M_IX86) && (_MSC_VER < 1900)
111 #pragma optimize("g", off)
112 #endif
102 #if (defined(_M_IX86) || defined(_M_X64) || \ 113 #if (defined(_M_IX86) || defined(_M_X64) || \
103 defined(__i386__) || defined(__x86_64__)) && \ 114 defined(__i386__) || defined(__x86_64__)) && \
104 !defined(__pnacl__) && !defined(__CLR_VER) && !defined(__native_client__) 115 !defined(__pnacl__) && !defined(__CLR_VER) && !defined(__native_client__)
105 #define HAS_XGETBV 116 #define HAS_XGETBV
106 // X86 CPUs have xgetbv to detect OS saves high parts of ymm registers. 117 // X86 CPUs have xgetbv to detect OS saves high parts of ymm registers.
107 int GetXCR0() { 118 int GetXCR0() {
108 uint32 xcr0 = 0u; 119 uint32 xcr0 = 0u;
109 #if (defined(_MSC_VER) && !defined(__clang__)) && (_MSC_FULL_VER >= 160040219) 120 #if (_MSC_FULL_VER >= 160040219)
110 xcr0 = (uint32)(_xgetbv(0)); // VS2010 SP1 required. 121 xcr0 = (uint32)(_xgetbv(0)); // VS2010 SP1 required.
111 #elif defined(_M_IX86) && defined(_MSC_VER) && !defined(__clang__)
112 __asm {
113 xor ecx, ecx // xcr 0
114 _asm _emit 0x0f _asm _emit 0x01 _asm _emit 0xd0 // For VS2010 and earlier.
115 mov xcr0, eax
116 }
117 #elif defined(__i386__) || defined(__x86_64__) 122 #elif defined(__i386__) || defined(__x86_64__)
123 uint32 xcr0 = 0u;
118 asm(".byte 0x0f, 0x01, 0xd0" : "=a" (xcr0) : "c" (0) : "%edx"); 124 asm(".byte 0x0f, 0x01, 0xd0" : "=a" (xcr0) : "c" (0) : "%edx");
119 #endif // defined(__i386__) || defined(__x86_64__) 125 #endif // defined(__i386__) || defined(__x86_64__)
120 return xcr0; 126 return xcr0;
121 } 127 }
122 #endif // defined(_M_IX86) || defined(_M_X64) .. 128 #endif // defined(_M_IX86) || defined(_M_X64) ..
129 // Return optimization to previous setting, which is off for debug.
brucedawson 2015/12/09 01:53:34 I'd delete the ", which is off for debug." from th
fbarchard 2015/12/09 02:13:21 Done.
130 #if defined(_M_IX86) && (_MSC_VER < 1900)
131 #pragma optimize("g", on)
132 #endif
123 133
124 // based on libvpx arm_cpudetect.c 134 // based on libvpx arm_cpudetect.c
125 // For Arm, but public to allow testing on any CPU 135 // For Arm, but public to allow testing on any CPU
126 LIBYUV_API SAFEBUFFERS 136 LIBYUV_API SAFEBUFFERS
127 int ArmCpuCaps(const char* cpuinfo_name) { 137 int ArmCpuCaps(const char* cpuinfo_name) {
128 char cpuinfo_line[512]; 138 char cpuinfo_line[512];
129 FILE* f = fopen(cpuinfo_name, "r"); 139 FILE* f = fopen(cpuinfo_name, "r");
130 if (!f) { 140 if (!f) {
131 // Assume Neon if /proc/cpuinfo is unavailable. 141 // Assume Neon if /proc/cpuinfo is unavailable.
132 // This will occur for Chrome sandbox for Pepper or Render process. 142 // This will occur for Chrome sandbox for Pepper or Render process.
(...skipping 152 matching lines...) Expand 10 before | Expand all | Expand 10 after
285 // Note that use of this function is not thread safe. 295 // Note that use of this function is not thread safe.
286 LIBYUV_API 296 LIBYUV_API
287 void MaskCpuFlags(int enable_flags) { 297 void MaskCpuFlags(int enable_flags) {
288 cpu_info_ = InitCpuFlags() & enable_flags; 298 cpu_info_ = InitCpuFlags() & enable_flags;
289 } 299 }
290 300
291 #ifdef __cplusplus 301 #ifdef __cplusplus
292 } // extern "C" 302 } // extern "C"
293 } // namespace libyuv 303 } // namespace libyuv
294 #endif 304 #endif
OLDNEW
« no previous file with comments | « no previous file | no next file » | no next file with comments »

Powered by Google App Engine
This is Rietveld 408576698