OLD | NEW |
1 // Copyright (c) 2011 The Chromium Authors. All rights reserved. | 1 // Copyright (c) 2011 The Chromium Authors. All rights reserved. |
2 // Use of this source code is governed by a BSD-style license that can be | 2 // Use of this source code is governed by a BSD-style license that can be |
3 // found in the LICENSE file. | 3 // found in the LICENSE file. |
4 | 4 |
5 #include "base/threading/thread_local_storage.h" | 5 #include "base/threading/thread_local_storage.h" |
6 | 6 |
7 #include <windows.h> | 7 #include <windows.h> |
8 | 8 |
9 #include "base/logging.h" | 9 #include "base/logging.h" |
10 | 10 |
| 11 |
11 namespace base { | 12 namespace base { |
12 | 13 |
| 14 namespace { |
| 15 // The maximum number of 'slots' in our thread local storage stack. |
| 16 const int kThreadLocalStorageSize = 64; |
| 17 |
| 18 // The maximum number of times to try to clear slots by calling destructors. |
| 19 // Use pthread naming convention for clarity. |
| 20 const int kMaxDestructorIterations = kThreadLocalStorageSize; |
| 21 |
| 22 // An array of destructor function pointers for the slots. If a slot has a |
| 23 // destructor, it will be stored in its corresponding entry in this array. |
| 24 // The elements are volatile to ensure that when the compiler reads the value |
| 25 // to potentially call the destructor, it does so once, and that value is tested |
| 26 // for null-ness and then used. Yes, that would be a weird de-optimization, |
| 27 // but I can imagine some register machines where it was just as easy to |
| 28 // re-fetch an array element, and I want to be sure a call to free the key |
| 29 // (i.e., null out the destructor entry) that happens on a separate thread can't |
| 30 // hurt the racy calls to the destructors on another thread. |
| 31 volatile ThreadLocalStorage::TLSDestructorFunc |
| 32 g_tls_destructors[kThreadLocalStorageSize]; |
| 33 |
| 34 } // namespace anonymous |
| 35 |
13 // In order to make TLS destructors work, we need to keep function | 36 // In order to make TLS destructors work, we need to keep function |
14 // pointers to the destructor for each TLS that we allocate. | 37 // pointers to the destructor for each TLS that we allocate. |
15 // We make this work by allocating a single OS-level TLS, which | 38 // We make this work by allocating a single OS-level TLS, which |
16 // contains an array of slots for the application to use. In | 39 // contains an array of slots for the application to use. In |
17 // parallel, we also allocate an array of destructors, which we | 40 // parallel, we also allocate an array of destructors, which we |
18 // keep track of and call when threads terminate. | 41 // keep track of and call when threads terminate. |
19 | 42 |
20 // tls_key_ is the one native TLS that we use. It stores our | 43 // tls_key_ is the one native TLS that we use. It stores our |
21 // table. | 44 // table. |
22 long ThreadLocalStorage::tls_key_ = TLS_OUT_OF_INDEXES; | 45 long ThreadLocalStorage::tls_key_ = TLS_OUT_OF_INDEXES; |
23 | 46 |
24 // tls_max_ is the high-water-mark of allocated thread local storage. | 47 // tls_max_ is the high-water-mark of allocated thread local storage. |
25 // We intentionally skip 0 so that it is not confused with an | 48 // We intentionally skip 0 so that it is not confused with an |
26 // unallocated TLS slot. | 49 // unallocated TLS slot. |
27 long ThreadLocalStorage::tls_max_ = 1; | 50 long ThreadLocalStorage::tls_max_ = 1; |
28 | 51 |
29 // An array of destructor function pointers for the slots. If | |
30 // a slot has a destructor, it will be stored in its corresponding | |
31 // entry in this array. | |
32 ThreadLocalStorage::TLSDestructorFunc | |
33 ThreadLocalStorage::tls_destructors_[kThreadLocalStorageSize]; | |
34 | |
35 void** ThreadLocalStorage::Initialize() { | 52 void** ThreadLocalStorage::Initialize() { |
36 if (tls_key_ == TLS_OUT_OF_INDEXES) { | 53 if (tls_key_ == TLS_OUT_OF_INDEXES) { |
37 long value = TlsAlloc(); | 54 long value = TlsAlloc(); |
38 DCHECK(value != TLS_OUT_OF_INDEXES); | 55 DCHECK(value != TLS_OUT_OF_INDEXES); |
39 | 56 |
40 // Atomically test-and-set the tls_key. If the key is TLS_OUT_OF_INDEXES, | 57 // Atomically test-and-set the tls_key. If the key is TLS_OUT_OF_INDEXES, |
41 // go ahead and set it. Otherwise, do nothing, as another | 58 // go ahead and set it. Otherwise, do nothing, as another |
42 // thread already did our dirty work. | 59 // thread already did our dirty work. |
43 if (InterlockedCompareExchange(&tls_key_, value, TLS_OUT_OF_INDEXES) != | 60 if (InterlockedCompareExchange(&tls_key_, value, TLS_OUT_OF_INDEXES) != |
44 TLS_OUT_OF_INDEXES) { | 61 TLS_OUT_OF_INDEXES) { |
45 // We've been shortcut. Another thread replaced tls_key_ first so we need | 62 // We've been shortcut. Another thread replaced tls_key_ first so we need |
46 // to destroy our index and use the one the other thread got first. | 63 // to destroy our index and use the one the other thread got first. |
47 TlsFree(value); | 64 TlsFree(value); |
48 } | 65 } |
49 } | 66 } |
50 DCHECK(!TlsGetValue(tls_key_)); | 67 DCHECK(!TlsGetValue(tls_key_)); |
51 | 68 |
52 // Create an array to store our data. | 69 // Some allocators, such as TCMalloc, make use of thread local storage. |
| 70 // As a result, any attempt to call new (or malloc) will lazily cause such a |
| 71 // system to initialize, which will include registering for a TLS key. If we |
| 72 // are not careful here, then that request to create a key will call new back, |
| 73 // and we'll have an infinite loop. We avoid that as follows: |
| 74 // Use a stack allocated vector, so that we don't have dependence on our |
| 75 // allocator until our service is in place. (i.e., don't even call new until |
| 76 // after we're setup) |
| 77 void* stack_allocated_tls_data[kThreadLocalStorageSize]; |
| 78 memset(stack_allocated_tls_data, 0, sizeof(stack_allocated_tls_data)); |
| 79 // Ensure that any rentrant calls change the temp version. |
| 80 TlsSetValue(tls_key_, stack_allocated_tls_data); |
| 81 |
| 82 // Allocate an array to store our data. |
53 void** tls_data = new void*[kThreadLocalStorageSize]; | 83 void** tls_data = new void*[kThreadLocalStorageSize]; |
54 memset(tls_data, 0, sizeof(void*[kThreadLocalStorageSize])); | 84 memcpy(tls_data, stack_allocated_tls_data, sizeof(stack_allocated_tls_data)); |
55 TlsSetValue(tls_key_, tls_data); | 85 TlsSetValue(tls_key_, tls_data); |
56 return tls_data; | 86 return tls_data; |
57 } | 87 } |
58 | 88 |
59 ThreadLocalStorage::Slot::Slot(TLSDestructorFunc destructor) | 89 ThreadLocalStorage::Slot::Slot(TLSDestructorFunc destructor) |
60 : initialized_(false), | 90 : initialized_(false), |
61 slot_(0) { | 91 slot_(0) { |
62 Initialize(destructor); | 92 Initialize(destructor); |
63 } | 93 } |
64 | 94 |
65 bool ThreadLocalStorage::Slot::Initialize(TLSDestructorFunc destructor) { | 95 bool ThreadLocalStorage::Slot::Initialize(TLSDestructorFunc destructor) { |
66 if (tls_key_ == TLS_OUT_OF_INDEXES || !TlsGetValue(tls_key_)) | 96 if (tls_key_ == TLS_OUT_OF_INDEXES || !TlsGetValue(tls_key_)) |
67 ThreadLocalStorage::Initialize(); | 97 ThreadLocalStorage::Initialize(); |
68 | 98 |
69 // Grab a new slot. | 99 // Grab a new slot. |
70 slot_ = InterlockedIncrement(&tls_max_) - 1; | 100 slot_ = InterlockedIncrement(&tls_max_) - 1; |
| 101 DCHECK_GT(slot_, 0); |
71 if (slot_ >= kThreadLocalStorageSize) { | 102 if (slot_ >= kThreadLocalStorageSize) { |
72 NOTREACHED(); | 103 NOTREACHED(); |
73 return false; | 104 return false; |
74 } | 105 } |
75 | 106 |
76 // Setup our destructor. | 107 // Setup our destructor. |
77 tls_destructors_[slot_] = destructor; | 108 g_tls_destructors[slot_] = destructor; |
78 initialized_ = true; | 109 initialized_ = true; |
79 return true; | 110 return true; |
80 } | 111 } |
81 | 112 |
82 void ThreadLocalStorage::Slot::Free() { | 113 void ThreadLocalStorage::Slot::Free() { |
83 // At this time, we don't reclaim old indices for TLS slots. | 114 // At this time, we don't reclaim old indices for TLS slots. |
84 // So all we need to do is wipe the destructor. | 115 // So all we need to do is wipe the destructor. |
85 tls_destructors_[slot_] = NULL; | 116 DCHECK_GT(slot_, 0); |
| 117 DCHECK_LT(slot_, kThreadLocalStorageSize); |
| 118 g_tls_destructors[slot_] = NULL; |
| 119 slot_ = 0; |
86 initialized_ = false; | 120 initialized_ = false; |
87 } | 121 } |
88 | 122 |
89 void* ThreadLocalStorage::Slot::Get() const { | 123 void* ThreadLocalStorage::Slot::Get() const { |
90 void** tls_data = static_cast<void**>(TlsGetValue(tls_key_)); | 124 void** tls_data = static_cast<void**>(TlsGetValue(tls_key_)); |
91 if (!tls_data) | 125 if (!tls_data) |
92 tls_data = ThreadLocalStorage::Initialize(); | 126 tls_data = ThreadLocalStorage::Initialize(); |
93 DCHECK_GE(slot_, 0); | 127 DCHECK_GT(slot_, 0); |
94 DCHECK_LT(slot_, kThreadLocalStorageSize); | 128 DCHECK_LT(slot_, kThreadLocalStorageSize); |
95 return tls_data[slot_]; | 129 return tls_data[slot_]; |
96 } | 130 } |
97 | 131 |
98 void ThreadLocalStorage::Slot::Set(void* value) { | 132 void ThreadLocalStorage::Slot::Set(void* value) { |
99 void** tls_data = static_cast<void**>(TlsGetValue(tls_key_)); | 133 void** tls_data = static_cast<void**>(TlsGetValue(tls_key_)); |
100 if (!tls_data) | 134 if (!tls_data) |
101 tls_data = ThreadLocalStorage::Initialize(); | 135 tls_data = ThreadLocalStorage::Initialize(); |
102 DCHECK_GE(slot_, 0); | 136 DCHECK_GT(slot_, 0); |
103 DCHECK_LT(slot_, kThreadLocalStorageSize); | 137 DCHECK_LT(slot_, kThreadLocalStorageSize); |
104 tls_data[slot_] = value; | 138 tls_data[slot_] = value; |
105 } | 139 } |
106 | 140 |
107 void ThreadLocalStorage::ThreadExit() { | 141 void ThreadLocalStorage::ThreadExit() { |
108 if (tls_key_ == TLS_OUT_OF_INDEXES) | 142 if (tls_key_ == TLS_OUT_OF_INDEXES) |
109 return; | 143 return; |
110 | 144 |
111 void** tls_data = static_cast<void**>(TlsGetValue(tls_key_)); | 145 void** tls_data = static_cast<void**>(TlsGetValue(tls_key_)); |
112 | |
113 // Maybe we have never initialized TLS for this thread. | 146 // Maybe we have never initialized TLS for this thread. |
114 if (!tls_data) | 147 if (!tls_data) |
115 return; | 148 return; |
116 | 149 |
117 for (int slot = 0; slot < tls_max_; slot++) { | 150 // Some allocators, such as TCMalloc, use TLS. As a result, when a thread |
118 if (tls_destructors_[slot] != NULL) { | 151 // terminates, one of the destructor calls we make may be to shut down an |
119 void* value = tls_data[slot]; | 152 // allocator. We have to be careful that after we've shutdown all of the |
120 tls_destructors_[slot](value); | 153 // known destructors (perchance including an allocator), that we don't call |
| 154 // the allocator and cause it to resurrect itself (with no possibly destructor |
| 155 // call to follow). We handle this problem as follows: |
| 156 // Switch to using a stack allocated vector, so that we don't have dependence |
| 157 // on our allocator after we have called all g_tls_destructors. (i.e., don't |
| 158 // even call delete[] after we're done with destructors.) |
| 159 void* stack_allocated_tls_data[kThreadLocalStorageSize]; |
| 160 memcpy(stack_allocated_tls_data, tls_data, sizeof(stack_allocated_tls_data)); |
| 161 // Ensure that any re-entrant calls change the temp version. |
| 162 TlsSetValue(tls_key_, stack_allocated_tls_data); |
| 163 delete[] tls_data; // Our last dependence on an allocator. |
| 164 |
| 165 int remaining_attempts = kMaxDestructorIterations; |
| 166 bool need_to_scan_destructors = true; |
| 167 while (need_to_scan_destructors) { |
| 168 need_to_scan_destructors = false; |
| 169 // Try to destroy the first-created-slot (which is slot 1) in our last |
| 170 // destructor call. That user was able to function, and define a slot with |
| 171 // no other services running, so perhaps it is a basic service (like an |
| 172 // allocator) and should also be destroyed last. If we get the order wrong, |
| 173 // then we'll itterate several more times, so it is really not that |
| 174 // critical (but it might help). |
| 175 for (int slot = tls_max_ - 1; slot > 0; --slot) { |
| 176 void* value = stack_allocated_tls_data[slot]; |
| 177 if (value == NULL) |
| 178 continue; |
| 179 TLSDestructorFunc destructor = g_tls_destructors[slot]; |
| 180 if (destructor == NULL) |
| 181 continue; |
| 182 stack_allocated_tls_data[slot] = NULL; // pre-clear the slot. |
| 183 destructor(value); |
| 184 // Any destructor might have called a different service, which then set |
| 185 // a different slot to a non-NULL value. Hence we need to check |
| 186 // the whole vector again. This is a pthread standard. |
| 187 need_to_scan_destructors = true; |
| 188 } |
| 189 if (--remaining_attempts <= 0) { |
| 190 NOTREACHED(); // Destructors might not have been called. |
| 191 break; |
121 } | 192 } |
122 } | 193 } |
123 | 194 |
124 delete[] tls_data; | 195 // Remove our stack allocated vector. |
125 | |
126 // In case there are other "onexit" handlers... | |
127 TlsSetValue(tls_key_, NULL); | 196 TlsSetValue(tls_key_, NULL); |
128 } | 197 } |
129 | 198 |
130 } // namespace base | 199 } // namespace base |
131 | 200 |
132 // Thread Termination Callbacks. | 201 // Thread Termination Callbacks. |
133 // Windows doesn't support a per-thread destructor with its | 202 // Windows doesn't support a per-thread destructor with its |
134 // TLS primitives. So, we build it manually by inserting a | 203 // TLS primitives. So, we build it manually by inserting a |
135 // function to be called on each thread's exit. | 204 // function to be called on each thread's exit. |
136 // This magic is from http://www.codeproject.com/threads/tls.asp | 205 // This magic is from http://www.codeproject.com/threads/tls.asp |
(...skipping 55 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
192 #else // _WIN64 | 261 #else // _WIN64 |
193 | 262 |
194 #pragma data_seg(".CRT$XLB") | 263 #pragma data_seg(".CRT$XLB") |
195 PIMAGE_TLS_CALLBACK p_thread_callback_base = OnThreadExit; | 264 PIMAGE_TLS_CALLBACK p_thread_callback_base = OnThreadExit; |
196 | 265 |
197 // Reset the default section. | 266 // Reset the default section. |
198 #pragma data_seg() | 267 #pragma data_seg() |
199 | 268 |
200 #endif // _WIN64 | 269 #endif // _WIN64 |
201 } // extern "C" | 270 } // extern "C" |
OLD | NEW |