1 // Copyright 2015 The BoringSSL Authors
2 //
3 // Licensed under the Apache License, Version 2.0 (the "License");
4 // you may not use this file except in compliance with the License.
5 // You may obtain a copy of the License at
6 //
7 //     https://www.apache.org/licenses/LICENSE-2.0
8 //
9 // Unless required by applicable law or agreed to in writing, software
10 // distributed under the License is distributed on an "AS IS" BASIS,
11 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 // See the License for the specific language governing permissions and
13 // limitations under the License.
14 
15 // Ensure we can't call OPENSSL_malloc circularly.
16 #define _BORINGSSL_PROHIBIT_OPENSSL_MALLOC
17 #include "internal.h"
18 
19 #if defined(OPENSSL_WINDOWS_THREADS)
20 
21 #include <windows.h>
22 
23 #include <assert.h>
24 #include <stdlib.h>
25 #include <string.h>
26 
call_once_init(INIT_ONCE * once,void * arg,void ** out)27 static BOOL CALLBACK call_once_init(INIT_ONCE *once, void *arg, void **out) {
28   void (**init)(void) = (void (**)(void))arg;
29   (**init)();
30   return TRUE;
31 }
32 
CRYPTO_once(CRYPTO_once_t * once,void (* init)(void))33 void CRYPTO_once(CRYPTO_once_t *once, void (*init)(void)) {
34   if (!InitOnceExecuteOnce(once, call_once_init, &init, NULL)) {
35     abort();
36   }
37 }
38 
CRYPTO_MUTEX_init(CRYPTO_MUTEX * lock)39 void CRYPTO_MUTEX_init(CRYPTO_MUTEX *lock) { InitializeSRWLock(lock); }
40 
CRYPTO_MUTEX_lock_read(CRYPTO_MUTEX * lock)41 void CRYPTO_MUTEX_lock_read(CRYPTO_MUTEX *lock) { AcquireSRWLockShared(lock); }
42 
CRYPTO_MUTEX_lock_write(CRYPTO_MUTEX * lock)43 void CRYPTO_MUTEX_lock_write(CRYPTO_MUTEX *lock) {
44   AcquireSRWLockExclusive(lock);
45 }
46 
CRYPTO_MUTEX_unlock_read(CRYPTO_MUTEX * lock)47 void CRYPTO_MUTEX_unlock_read(CRYPTO_MUTEX *lock) {
48   ReleaseSRWLockShared(lock);
49 }
50 
CRYPTO_MUTEX_unlock_write(CRYPTO_MUTEX * lock)51 void CRYPTO_MUTEX_unlock_write(CRYPTO_MUTEX *lock) {
52   ReleaseSRWLockExclusive(lock);
53 }
54 
CRYPTO_MUTEX_cleanup(CRYPTO_MUTEX * lock)55 void CRYPTO_MUTEX_cleanup(CRYPTO_MUTEX *lock) {
56   // SRWLOCKs require no cleanup.
57 }
58 
59 static SRWLOCK g_destructors_lock = SRWLOCK_INIT;
60 static thread_local_destructor_t g_destructors[NUM_OPENSSL_THREAD_LOCALS];
61 
62 static CRYPTO_once_t g_thread_local_init_once = CRYPTO_ONCE_INIT;
63 static DWORD g_thread_local_key;
64 static int g_thread_local_failed;
65 
thread_local_init(void)66 static void thread_local_init(void) {
67   g_thread_local_key = TlsAlloc();
68   g_thread_local_failed = (g_thread_local_key == TLS_OUT_OF_INDEXES);
69 }
70 
thread_local_destructor(PVOID module,DWORD reason,PVOID reserved)71 static void NTAPI thread_local_destructor(PVOID module, DWORD reason,
72                                           PVOID reserved) {
73   // Only free memory on |DLL_THREAD_DETACH|, not |DLL_PROCESS_DETACH|. In
74   // VS2015's debug runtime, the C runtime has been unloaded by the time
75   // |DLL_PROCESS_DETACH| runs. See https://crbug.com/575795. This is consistent
76   // with |pthread_key_create| which does not call destructors on process exit,
77   // only thread exit.
78   if (reason != DLL_THREAD_DETACH) {
79     return;
80   }
81 
82   CRYPTO_once(&g_thread_local_init_once, thread_local_init);
83   if (g_thread_local_failed) {
84     return;
85   }
86 
87   void **pointers = (void **)TlsGetValue(g_thread_local_key);
88   if (pointers == NULL) {
89     return;
90   }
91 
92   thread_local_destructor_t destructors[NUM_OPENSSL_THREAD_LOCALS];
93 
94   AcquireSRWLockExclusive(&g_destructors_lock);
95   OPENSSL_memcpy(destructors, g_destructors, sizeof(destructors));
96   ReleaseSRWLockExclusive(&g_destructors_lock);
97 
98   for (unsigned i = 0; i < NUM_OPENSSL_THREAD_LOCALS; i++) {
99     if (destructors[i] != NULL) {
100       destructors[i](pointers[i]);
101     }
102   }
103 
104   free(pointers);
105 }
106 
107 // Thread Termination Callbacks.
108 //
109 // Windows doesn't support a per-thread destructor with its TLS primitives.
110 // So, we build it manually by inserting a function to be called on each
111 // thread's exit. This magic is from http://www.codeproject.com/threads/tls.asp
112 // and it works for VC++ 7.0 and later.
113 //
114 // Force a reference to _tls_used to make the linker create the TLS directory
115 // if it's not already there. (E.g. if __declspec(thread) is not used). Force
116 // a reference to p_thread_callback_boringssl to prevent whole program
117 // optimization from discarding the variable.
118 //
119 // Note, in the prefixed build, |p_thread_callback_boringssl| may be a macro.
120 #define STRINGIFY(x) #x
121 #define EXPAND_AND_STRINGIFY(x) STRINGIFY(x)
122 #ifdef _WIN64
123 __pragma(comment(linker, "/INCLUDE:_tls_used")) __pragma(comment(
124     linker, "/INCLUDE:" EXPAND_AND_STRINGIFY(p_thread_callback_boringssl)))
125 #else
126 __pragma(comment(linker, "/INCLUDE:__tls_used")) __pragma(comment(
127     linker, "/INCLUDE:_" EXPAND_AND_STRINGIFY(p_thread_callback_boringssl)))
128 #endif
129 
130 // .CRT$XLA to .CRT$XLZ is an array of PIMAGE_TLS_CALLBACK pointers that are
131 // called automatically by the OS loader code (not the CRT) when the module is
132 // loaded and on thread creation. They are NOT called if the module has been
133 // loaded by a LoadLibrary() call. It must have implicitly been loaded at
134 // process startup.
135 //
136 // By implicitly loaded, I mean that it is directly referenced by the main EXE
137 // or by one of its dependent DLLs. Delay-loaded DLL doesn't count as being
138 // implicitly loaded.
139 //
140 // See VC\crt\src\tlssup.c for reference.
141 
142 // The linker must not discard p_thread_callback_boringssl. (We force a
143 // reference to this variable with a linker /INCLUDE:symbol pragma to ensure
144 // that.) If this variable is discarded, the OnThreadExit function will never
145 // be called.
146 #ifdef _WIN64
147 
148 // .CRT section is merged with .rdata on x64 so it must be constant data.
149 #pragma const_seg(".CRT$XLC")
150     // clang-format off
151     // When defining a const variable, it must have external linkage to be sure
152     // the linker doesn't discard it.
153 extern "C" {
154   extern const PIMAGE_TLS_CALLBACK p_thread_callback_boringssl;
155 }
156 // clang-format on
157 const PIMAGE_TLS_CALLBACK p_thread_callback_boringssl = thread_local_destructor;
158 // Reset the default section.
159 #pragma const_seg()
160 
161 #else
162 
163 #pragma data_seg(".CRT$XLC")
164     // clang-format off
165 extern "C" {
166   extern PIMAGE_TLS_CALLBACK p_thread_callback_boringssl;
167 }
168 // clang-format on
169 PIMAGE_TLS_CALLBACK p_thread_callback_boringssl = thread_local_destructor;
170 // Reset the default section.
171 #pragma data_seg()
172 
173 #endif  // _WIN64
174 
get_thread_locals(void)175 static void **get_thread_locals(void) {
176   // |TlsGetValue| clears the last error even on success, so that callers may
177   // distinguish it successfully returning NULL or failing. It is documented to
178   // never fail if the argument is a valid index from |TlsAlloc|, so we do not
179   // need to handle this.
180   //
181   // However, this error-mangling behavior interferes with the caller's use of
182   // |GetLastError|. In particular |SSL_get_error| queries the error queue to
183   // determine whether the caller should look at the OS's errors. To avoid
184   // destroying state, save and restore the Windows error.
185   //
186   // https://msdn.microsoft.com/en-us/library/windows/desktop/ms686812(v=vs.85).aspx
187   DWORD last_error = GetLastError();
188   void **ret = reinterpret_cast<void **>(TlsGetValue(g_thread_local_key));
189   SetLastError(last_error);
190   return ret;
191 }
192 
CRYPTO_get_thread_local(thread_local_data_t index)193 void *CRYPTO_get_thread_local(thread_local_data_t index) {
194   CRYPTO_once(&g_thread_local_init_once, thread_local_init);
195   if (g_thread_local_failed) {
196     return NULL;
197   }
198 
199   void **pointers = get_thread_locals();
200   if (pointers == NULL) {
201     return NULL;
202   }
203   return pointers[index];
204 }
205 
CRYPTO_set_thread_local(thread_local_data_t index,void * value,thread_local_destructor_t destructor)206 int CRYPTO_set_thread_local(thread_local_data_t index, void *value,
207                             thread_local_destructor_t destructor) {
208   CRYPTO_once(&g_thread_local_init_once, thread_local_init);
209   if (g_thread_local_failed) {
210     destructor(value);
211     return 0;
212   }
213 
214   void **pointers = get_thread_locals();
215   if (pointers == NULL) {
216     pointers = reinterpret_cast<void **>(
217         malloc(sizeof(void *) * NUM_OPENSSL_THREAD_LOCALS));
218     if (pointers == NULL) {
219       destructor(value);
220       return 0;
221     }
222     OPENSSL_memset(pointers, 0, sizeof(void *) * NUM_OPENSSL_THREAD_LOCALS);
223     if (TlsSetValue(g_thread_local_key, pointers) == 0) {
224       free(pointers);
225       destructor(value);
226       return 0;
227     }
228   }
229 
230   AcquireSRWLockExclusive(&g_destructors_lock);
231   g_destructors[index] = destructor;
232   ReleaseSRWLockExclusive(&g_destructors_lock);
233 
234   pointers[index] = value;
235   return 1;
236 }
237 
238 #endif  // OPENSSL_WINDOWS_THREADS
239