• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /*
2  * Copyright (C) 2008 The Android Open Source Project
3  * All rights reserved.
4  *
5  * Redistribution and use in source and binary forms, with or without
6  * modification, are permitted provided that the following conditions
7  * are met:
8  *  * Redistributions of source code must retain the above copyright
9  *    notice, this list of conditions and the following disclaimer.
10  *  * Redistributions in binary form must reproduce the above copyright
11  *    notice, this list of conditions and the following disclaimer in
12  *    the documentation and/or other materials provided with the
13  *    distribution.
14  *
15  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
16  * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
17  * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
18  * FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
19  * COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
20  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
21  * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS
22  * OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
23  * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
24  * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
25  * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26  * SUCH DAMAGE.
27  */
28 
29 #include <pthread.h>
30 
31 #include <errno.h>
32 #include <string.h>
33 #include <sys/mman.h>
34 #include <unistd.h>
35 
36 #include "pthread_internal.h"
37 
38 #include <async_safe/log.h>
39 
40 #include "private/bionic_macros.h"
41 #include "private/bionic_prctl.h"
42 #include "private/bionic_ssp.h"
43 #include "private/bionic_tls.h"
44 #include "private/ErrnoRestorer.h"
45 
46 // x86 uses segment descriptors rather than a direct pointer to TLS.
47 #if defined(__i386__)
48 #include <asm/ldt.h>
49 void __init_user_desc(struct user_desc*, bool, void*);
50 #endif
51 
52 // This code is used both by each new pthread and the code that initializes the main thread.
__init_tls(pthread_internal_t * thread)53 bool __init_tls(pthread_internal_t* thread) {
54   // Slot 0 must point to itself. The x86 Linux kernel reads the TLS from %fs:0.
55   thread->tls[TLS_SLOT_SELF] = thread->tls;
56   thread->tls[TLS_SLOT_THREAD_ID] = thread;
57 
58   // Add a guard page before and after.
59   size_t allocation_size = BIONIC_TLS_SIZE + 2 * PAGE_SIZE;
60   void* allocation = mmap(nullptr, allocation_size, PROT_NONE, MAP_PRIVATE | MAP_ANONYMOUS, -1, 0);
61   if (allocation == MAP_FAILED) {
62     async_safe_format_log(ANDROID_LOG_WARN, "libc",
63                           "pthread_create failed: couldn't allocate TLS: %s", strerror(errno));
64     return false;
65   }
66 
67   prctl(PR_SET_VMA, PR_SET_VMA_ANON_NAME, allocation, allocation_size, "bionic TLS guard");
68 
69   // Carve out the writable TLS section.
70   thread->bionic_tls = reinterpret_cast<bionic_tls*>(static_cast<char*>(allocation) + PAGE_SIZE);
71   if (mprotect(thread->bionic_tls, BIONIC_TLS_SIZE, PROT_READ | PROT_WRITE) != 0) {
72     async_safe_format_log(ANDROID_LOG_WARN, "libc",
73                           "pthread_create failed: couldn't mprotect TLS: %s", strerror(errno));
74     munmap(allocation, allocation_size);
75     return false;
76   }
77 
78   prctl(PR_SET_VMA, PR_SET_VMA_ANON_NAME, thread->bionic_tls, BIONIC_TLS_SIZE, "bionic TLS");
79   return true;
80 }
81 
__init_thread_stack_guard(pthread_internal_t * thread)82 void __init_thread_stack_guard(pthread_internal_t* thread) {
83   // GCC looks in the TLS for the stack guard on x86, so copy it there from our global.
84   thread->tls[TLS_SLOT_STACK_GUARD] = reinterpret_cast<void*>(__stack_chk_guard);
85 }
86 
__init_alternate_signal_stack(pthread_internal_t * thread)87 void __init_alternate_signal_stack(pthread_internal_t* thread) {
88   // Create and set an alternate signal stack.
89   void* stack_base = mmap(NULL, SIGNAL_STACK_SIZE, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0);
90   if (stack_base != MAP_FAILED) {
91 
92     // Create a guard page to catch stack overflows in signal handlers.
93     if (mprotect(stack_base, PAGE_SIZE, PROT_NONE) == -1) {
94       munmap(stack_base, SIGNAL_STACK_SIZE);
95       return;
96     }
97     stack_t ss;
98     ss.ss_sp = reinterpret_cast<uint8_t*>(stack_base) + PAGE_SIZE;
99     ss.ss_size = SIGNAL_STACK_SIZE - PAGE_SIZE;
100     ss.ss_flags = 0;
101     sigaltstack(&ss, NULL);
102     thread->alternate_signal_stack = stack_base;
103 
104     // We can only use const static allocated string for mapped region name, as Android kernel
105     // uses the string pointer directly when dumping /proc/pid/maps.
106     prctl(PR_SET_VMA, PR_SET_VMA_ANON_NAME, ss.ss_sp, ss.ss_size, "thread signal stack");
107     prctl(PR_SET_VMA, PR_SET_VMA_ANON_NAME, stack_base, PAGE_SIZE, "thread signal stack guard page");
108   }
109 }
110 
__init_thread(pthread_internal_t * thread)111 int __init_thread(pthread_internal_t* thread) {
112   int error = 0;
113 
114   if (__predict_true((thread->attr.flags & PTHREAD_ATTR_FLAG_DETACHED) == 0)) {
115     atomic_init(&thread->join_state, THREAD_NOT_JOINED);
116   } else {
117     atomic_init(&thread->join_state, THREAD_DETACHED);
118   }
119 
120   // Set the scheduling policy/priority of the thread.
121   if (thread->attr.sched_policy != SCHED_NORMAL) {
122     sched_param param;
123     param.sched_priority = thread->attr.sched_priority;
124     if (sched_setscheduler(thread->tid, thread->attr.sched_policy, &param) == -1) {
125 #if defined(__LP64__)
126       // For backwards compatibility reasons, we only report failures on 64-bit devices.
127       error = errno;
128 #endif
129       async_safe_format_log(ANDROID_LOG_WARN, "libc",
130                             "pthread_create sched_setscheduler call failed: %s", strerror(errno));
131     }
132   }
133 
134   thread->cleanup_stack = NULL;
135 
136   return error;
137 }
138 
__create_thread_mapped_space(size_t mmap_size,size_t stack_guard_size)139 static void* __create_thread_mapped_space(size_t mmap_size, size_t stack_guard_size) {
140   // Create a new private anonymous map.
141   int prot = PROT_READ | PROT_WRITE;
142   int flags = MAP_PRIVATE | MAP_ANONYMOUS | MAP_NORESERVE;
143   void* space = mmap(NULL, mmap_size, prot, flags, -1, 0);
144   if (space == MAP_FAILED) {
145     async_safe_format_log(ANDROID_LOG_WARN,
146                       "libc",
147                       "pthread_create failed: couldn't allocate %zu-bytes mapped space: %s",
148                       mmap_size, strerror(errno));
149     return NULL;
150   }
151 
152   // Stack is at the lower end of mapped space, stack guard region is at the lower end of stack.
153   // Set the stack guard region to PROT_NONE, so we can detect thread stack overflow.
154   if (mprotect(space, stack_guard_size, PROT_NONE) == -1) {
155     async_safe_format_log(ANDROID_LOG_WARN, "libc",
156                           "pthread_create failed: couldn't mprotect PROT_NONE %zu-byte stack guard region: %s",
157                           stack_guard_size, strerror(errno));
158     munmap(space, mmap_size);
159     return NULL;
160   }
161   prctl(PR_SET_VMA, PR_SET_VMA_ANON_NAME, space, stack_guard_size, "thread stack guard page");
162 
163   return space;
164 }
165 
__allocate_thread(pthread_attr_t * attr,pthread_internal_t ** threadp,void ** child_stack)166 static int __allocate_thread(pthread_attr_t* attr, pthread_internal_t** threadp, void** child_stack) {
167   size_t mmap_size;
168   uint8_t* stack_top;
169 
170   if (attr->stack_base == NULL) {
171     // The caller didn't provide a stack, so allocate one.
172     // Make sure the stack size and guard size are multiples of PAGE_SIZE.
173     mmap_size = BIONIC_ALIGN(attr->stack_size + sizeof(pthread_internal_t), PAGE_SIZE);
174     attr->guard_size = BIONIC_ALIGN(attr->guard_size, PAGE_SIZE);
175     attr->stack_base = __create_thread_mapped_space(mmap_size, attr->guard_size);
176     if (attr->stack_base == NULL) {
177       return EAGAIN;
178     }
179     stack_top = reinterpret_cast<uint8_t*>(attr->stack_base) + mmap_size;
180   } else {
181     // Remember the mmap size is zero and we don't need to free it.
182     mmap_size = 0;
183     stack_top = reinterpret_cast<uint8_t*>(attr->stack_base) + attr->stack_size;
184   }
185 
186   // Mapped space(or user allocated stack) is used for:
187   //   pthread_internal_t
188   //   thread stack (including guard page)
189 
190   // To safely access the pthread_internal_t and thread stack, we need to find a 16-byte aligned boundary.
191   stack_top = reinterpret_cast<uint8_t*>(
192                 (reinterpret_cast<uintptr_t>(stack_top) - sizeof(pthread_internal_t)) & ~0xf);
193 
194   pthread_internal_t* thread = reinterpret_cast<pthread_internal_t*>(stack_top);
195   if (mmap_size == 0) {
196     // If thread was not allocated by mmap(), it may not have been cleared to zero.
197     // So assume the worst and zero it.
198     memset(thread, 0, sizeof(pthread_internal_t));
199   }
200   attr->stack_size = stack_top - reinterpret_cast<uint8_t*>(attr->stack_base);
201 
202   thread->mmap_size = mmap_size;
203   thread->attr = *attr;
204   if (!__init_tls(thread)) {
205     if (thread->mmap_size != 0) munmap(thread->attr.stack_base, thread->mmap_size);
206     return EAGAIN;
207   }
208   __init_thread_stack_guard(thread);
209 
210   *threadp = thread;
211   *child_stack = stack_top;
212   return 0;
213 }
214 
__pthread_start(void * arg)215 static int __pthread_start(void* arg) {
216   pthread_internal_t* thread = reinterpret_cast<pthread_internal_t*>(arg);
217 
218   // Wait for our creating thread to release us. This lets it have time to
219   // notify gdb about this thread before we start doing anything.
220   // This also provides the memory barrier needed to ensure that all memory
221   // accesses previously made by the creating thread are visible to us.
222   thread->startup_handshake_lock.lock();
223 
224   __init_alternate_signal_stack(thread);
225 
226   void* result = thread->start_routine(thread->start_routine_arg);
227   pthread_exit(result);
228 
229   return 0;
230 }
231 
232 // A dummy start routine for pthread_create failures where we've created a thread but aren't
233 // going to run user code on it. We swap out the user's start routine for this and take advantage
234 // of the regular thread teardown to free up resources.
__do_nothing(void *)235 static void* __do_nothing(void*) {
236   return NULL;
237 }
238 
pthread_create(pthread_t * thread_out,pthread_attr_t const * attr,void * (* start_routine)(void *),void * arg)239 int pthread_create(pthread_t* thread_out, pthread_attr_t const* attr,
240                    void* (*start_routine)(void*), void* arg) {
241   ErrnoRestorer errno_restorer;
242 
243   pthread_attr_t thread_attr;
244   if (attr == NULL) {
245     pthread_attr_init(&thread_attr);
246   } else {
247     thread_attr = *attr;
248     attr = NULL; // Prevent misuse below.
249   }
250 
251   pthread_internal_t* thread = NULL;
252   void* child_stack = NULL;
253   int result = __allocate_thread(&thread_attr, &thread, &child_stack);
254   if (result != 0) {
255     return result;
256   }
257 
258   // Create a lock for the thread to wait on once it starts so we can keep
259   // it from doing anything until after we notify the debugger about it
260   //
261   // This also provides the memory barrier we need to ensure that all
262   // memory accesses previously performed by this thread are visible to
263   // the new thread.
264   thread->startup_handshake_lock.init(false);
265   thread->startup_handshake_lock.lock();
266 
267   thread->start_routine = start_routine;
268   thread->start_routine_arg = arg;
269 
270   thread->set_cached_pid(getpid());
271 
272   int flags = CLONE_VM | CLONE_FS | CLONE_FILES | CLONE_SIGHAND | CLONE_THREAD | CLONE_SYSVSEM |
273       CLONE_SETTLS | CLONE_PARENT_SETTID | CLONE_CHILD_CLEARTID;
274   void* tls = reinterpret_cast<void*>(thread->tls);
275 #if defined(__i386__)
276   // On x86 (but not x86-64), CLONE_SETTLS takes a pointer to a struct user_desc rather than
277   // a pointer to the TLS itself.
278   user_desc tls_descriptor;
279   __init_user_desc(&tls_descriptor, false, tls);
280   tls = &tls_descriptor;
281 #endif
282   int rc = clone(__pthread_start, child_stack, flags, thread, &(thread->tid), tls, &(thread->tid));
283   if (rc == -1) {
284     int clone_errno = errno;
285     // We don't have to unlock the mutex at all because clone(2) failed so there's no child waiting to
286     // be unblocked, but we're about to unmap the memory the mutex is stored in, so this serves as a
287     // reminder that you can't rewrite this function to use a ScopedPthreadMutexLocker.
288     thread->startup_handshake_lock.unlock();
289     if (thread->mmap_size != 0) {
290       munmap(thread->attr.stack_base, thread->mmap_size);
291     }
292     async_safe_format_log(ANDROID_LOG_WARN, "libc", "pthread_create failed: clone failed: %s",
293                           strerror(errno));
294     return clone_errno;
295   }
296 
297   int init_errno = __init_thread(thread);
298   if (init_errno != 0) {
299     // Mark the thread detached and replace its start_routine with a no-op.
300     // Letting the thread run is the easiest way to clean up its resources.
301     atomic_store(&thread->join_state, THREAD_DETACHED);
302     __pthread_internal_add(thread);
303     thread->start_routine = __do_nothing;
304     thread->startup_handshake_lock.unlock();
305     return init_errno;
306   }
307 
308   // Publish the pthread_t and unlock the mutex to let the new thread start running.
309   *thread_out = __pthread_internal_add(thread);
310   thread->startup_handshake_lock.unlock();
311 
312   return 0;
313 }
314