1/*
2 * Copyright (C) 2008 The Android Open Source Project
3 * All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions
7 * are met:
8 *  * Redistributions of source code must retain the above copyright
9 *    notice, this list of conditions and the following disclaimer.
10 *  * Redistributions in binary form must reproduce the above copyright
11 *    notice, this list of conditions and the following disclaimer in
12 *    the documentation and/or other materials provided with the
13 *    distribution.
14 *
15 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
16 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
17 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
18 * FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
19 * COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
20 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
21 * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS
22 * OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
23 * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
24 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
25 * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26 * SUCH DAMAGE.
27 */
28
29#include <pthread.h>
30
31#include <errno.h>
32#include <string.h>
33#include <sys/mman.h>
34#include <unistd.h>
35
36#include "pthread_internal.h"
37
38#include <async_safe/log.h>
39
40#include "private/bionic_defs.h"
41#include "private/bionic_macros.h"
42#include "private/bionic_prctl.h"
43#include "private/bionic_ssp.h"
44#include "private/bionic_tls.h"
45#include "private/ErrnoRestorer.h"
46
47// x86 uses segment descriptors rather than a direct pointer to TLS.
48#if defined(__i386__)
49#include <asm/ldt.h>
50void __init_user_desc(struct user_desc*, bool, void*);
51#endif
52
53// This code is used both by each new pthread and the code that initializes the main thread.
54bool __init_tls(pthread_internal_t* thread) {
55  // Slot 0 must point to itself. The x86 Linux kernel reads the TLS from %fs:0.
56  thread->tls[TLS_SLOT_SELF] = thread->tls;
57  thread->tls[TLS_SLOT_THREAD_ID] = thread;
58
59  // Add a guard before and after.
60  size_t allocation_size = BIONIC_TLS_SIZE + (2 * PTHREAD_GUARD_SIZE);
61  void* allocation = mmap(nullptr, allocation_size, PROT_NONE, MAP_PRIVATE | MAP_ANONYMOUS, -1, 0);
62  if (allocation == MAP_FAILED) {
63    async_safe_format_log(ANDROID_LOG_WARN, "libc",
64                          "pthread_create failed: couldn't allocate TLS: %s", strerror(errno));
65    return false;
66  }
67
68  prctl(PR_SET_VMA, PR_SET_VMA_ANON_NAME, allocation, allocation_size, "bionic TLS guard");
69
70  // Carve out the writable TLS section.
71  thread->bionic_tls = reinterpret_cast<bionic_tls*>(static_cast<char*>(allocation) +
72                                                     PTHREAD_GUARD_SIZE);
73  if (mprotect(thread->bionic_tls, BIONIC_TLS_SIZE, PROT_READ | PROT_WRITE) != 0) {
74    async_safe_format_log(ANDROID_LOG_WARN, "libc",
75                          "pthread_create failed: couldn't mprotect TLS: %s", strerror(errno));
76    munmap(allocation, allocation_size);
77    return false;
78  }
79
80  prctl(PR_SET_VMA, PR_SET_VMA_ANON_NAME, thread->bionic_tls, BIONIC_TLS_SIZE, "bionic TLS");
81  return true;
82}
83
84void __init_thread_stack_guard(pthread_internal_t* thread) {
85  // GCC looks in the TLS for the stack guard on x86, so copy it there from our global.
86  thread->tls[TLS_SLOT_STACK_GUARD] = reinterpret_cast<void*>(__stack_chk_guard);
87}
88
89void __init_alternate_signal_stack(pthread_internal_t* thread) {
90  // Create and set an alternate signal stack.
91  void* stack_base = mmap(NULL, SIGNAL_STACK_SIZE, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0);
92  if (stack_base != MAP_FAILED) {
93    // Create a guard to catch stack overflows in signal handlers.
94    if (mprotect(stack_base, PTHREAD_GUARD_SIZE, PROT_NONE) == -1) {
95      munmap(stack_base, SIGNAL_STACK_SIZE);
96      return;
97    }
98    stack_t ss;
99    ss.ss_sp = reinterpret_cast<uint8_t*>(stack_base) + PTHREAD_GUARD_SIZE;
100    ss.ss_size = SIGNAL_STACK_SIZE - PTHREAD_GUARD_SIZE;
101    ss.ss_flags = 0;
102    sigaltstack(&ss, NULL);
103    thread->alternate_signal_stack = stack_base;
104
105    // We can only use const static allocated string for mapped region name, as Android kernel
106    // uses the string pointer directly when dumping /proc/pid/maps.
107    prctl(PR_SET_VMA, PR_SET_VMA_ANON_NAME, ss.ss_sp, ss.ss_size, "thread signal stack");
108    prctl(PR_SET_VMA, PR_SET_VMA_ANON_NAME, stack_base, PTHREAD_GUARD_SIZE, "thread signal stack guard");
109  }
110}
111
112int __init_thread(pthread_internal_t* thread) {
113  thread->cleanup_stack = nullptr;
114
115  if (__predict_true((thread->attr.flags & PTHREAD_ATTR_FLAG_DETACHED) == 0)) {
116    atomic_init(&thread->join_state, THREAD_NOT_JOINED);
117  } else {
118    atomic_init(&thread->join_state, THREAD_DETACHED);
119  }
120
121  // Set the scheduling policy/priority of the thread if necessary.
122  bool need_set = true;
123  int policy;
124  sched_param param;
125  if ((thread->attr.flags & PTHREAD_ATTR_FLAG_INHERIT) != 0) {
126    // Unless the parent has SCHED_RESET_ON_FORK set, we've already inherited from the parent.
127    policy = sched_getscheduler(0);
128    need_set = ((policy & SCHED_RESET_ON_FORK) != 0);
129    if (need_set) {
130      if (policy == -1) {
131        async_safe_format_log(ANDROID_LOG_WARN, "libc",
132                              "pthread_create sched_getscheduler failed: %s", strerror(errno));
133        return errno;
134      }
135      if (sched_getparam(0, &param) == -1) {
136        async_safe_format_log(ANDROID_LOG_WARN, "libc",
137                              "pthread_create sched_getparam failed: %s", strerror(errno));
138        return errno;
139      }
140    }
141  } else {
142    policy = thread->attr.sched_policy;
143    param.sched_priority = thread->attr.sched_priority;
144  }
145  // Backwards compatibility: before P, Android didn't have pthread_attr_setinheritsched,
146  // and our behavior was neither of the POSIX behaviors.
147  if ((thread->attr.flags & (PTHREAD_ATTR_FLAG_INHERIT|PTHREAD_ATTR_FLAG_EXPLICIT)) == 0) {
148    need_set = (thread->attr.sched_policy != SCHED_NORMAL);
149  }
150  if (need_set) {
151    if (sched_setscheduler(thread->tid, policy, &param) == -1) {
152      async_safe_format_log(ANDROID_LOG_WARN, "libc",
153                            "pthread_create sched_setscheduler(%d, {%d}) call failed: %s", policy,
154                            param.sched_priority, strerror(errno));
155#if defined(__LP64__)
156      // For backwards compatibility reasons, we only report failures on 64-bit devices.
157      return errno;
158#endif
159    }
160  }
161
162  return 0;
163}
164
165static void* __create_thread_mapped_space(size_t mmap_size, size_t stack_guard_size) {
166  // Create a new private anonymous map.
167  int prot = PROT_READ | PROT_WRITE;
168  int flags = MAP_PRIVATE | MAP_ANONYMOUS | MAP_NORESERVE;
169  void* space = mmap(NULL, mmap_size, prot, flags, -1, 0);
170  if (space == MAP_FAILED) {
171    async_safe_format_log(ANDROID_LOG_WARN,
172                      "libc",
173                      "pthread_create failed: couldn't allocate %zu-bytes mapped space: %s",
174                      mmap_size, strerror(errno));
175    return NULL;
176  }
177
178  // Stack is at the lower end of mapped space, stack guard region is at the lower end of stack.
179  // Set the stack guard region to PROT_NONE, so we can detect thread stack overflow.
180  if (mprotect(space, stack_guard_size, PROT_NONE) == -1) {
181    async_safe_format_log(ANDROID_LOG_WARN, "libc",
182                          "pthread_create failed: couldn't mprotect PROT_NONE %zu-byte stack guard region: %s",
183                          stack_guard_size, strerror(errno));
184    munmap(space, mmap_size);
185    return NULL;
186  }
187  prctl(PR_SET_VMA, PR_SET_VMA_ANON_NAME, space, stack_guard_size, "thread stack guard");
188
189  return space;
190}
191
192static int __allocate_thread(pthread_attr_t* attr, pthread_internal_t** threadp, void** child_stack) {
193  size_t mmap_size;
194  uint8_t* stack_top;
195
196  if (attr->stack_base == NULL) {
197    // The caller didn't provide a stack, so allocate one.
198    // Make sure the stack size and guard size are multiples of PAGE_SIZE.
199    if (__builtin_add_overflow(attr->stack_size, attr->guard_size, &mmap_size)) return EAGAIN;
200    if (__builtin_add_overflow(mmap_size, sizeof(pthread_internal_t), &mmap_size)) return EAGAIN;
201    mmap_size = __BIONIC_ALIGN(mmap_size, PAGE_SIZE);
202    attr->guard_size = __BIONIC_ALIGN(attr->guard_size, PAGE_SIZE);
203    attr->stack_base = __create_thread_mapped_space(mmap_size, attr->guard_size);
204    if (attr->stack_base == NULL) {
205      return EAGAIN;
206    }
207    stack_top = reinterpret_cast<uint8_t*>(attr->stack_base) + mmap_size;
208  } else {
209    // Remember the mmap size is zero and we don't need to free it.
210    mmap_size = 0;
211    stack_top = reinterpret_cast<uint8_t*>(attr->stack_base) + attr->stack_size;
212  }
213
214  // Mapped space(or user allocated stack) is used for:
215  //   pthread_internal_t
216  //   thread stack (including guard)
217
218  // To safely access the pthread_internal_t and thread stack, we need to find a 16-byte aligned boundary.
219  stack_top = reinterpret_cast<uint8_t*>(
220                (reinterpret_cast<uintptr_t>(stack_top) - sizeof(pthread_internal_t)) & ~0xf);
221
222  pthread_internal_t* thread = reinterpret_cast<pthread_internal_t*>(stack_top);
223  if (mmap_size == 0) {
224    // If thread was not allocated by mmap(), it may not have been cleared to zero.
225    // So assume the worst and zero it.
226    memset(thread, 0, sizeof(pthread_internal_t));
227  }
228  attr->stack_size = stack_top - reinterpret_cast<uint8_t*>(attr->stack_base);
229
230  thread->mmap_size = mmap_size;
231  thread->attr = *attr;
232  if (!__init_tls(thread)) {
233    if (thread->mmap_size != 0) munmap(thread->attr.stack_base, thread->mmap_size);
234    return EAGAIN;
235  }
236  __init_thread_stack_guard(thread);
237
238  *threadp = thread;
239  *child_stack = stack_top;
240  return 0;
241}
242
243static int __pthread_start(void* arg) {
244  pthread_internal_t* thread = reinterpret_cast<pthread_internal_t*>(arg);
245
246  // Wait for our creating thread to release us. This lets it have time to
247  // notify gdb about this thread before we start doing anything.
248  // This also provides the memory barrier needed to ensure that all memory
249  // accesses previously made by the creating thread are visible to us.
250  thread->startup_handshake_lock.lock();
251
252  __init_alternate_signal_stack(thread);
253
254  void* result = thread->start_routine(thread->start_routine_arg);
255  pthread_exit(result);
256
257  return 0;
258}
259
260// A dummy start routine for pthread_create failures where we've created a thread but aren't
261// going to run user code on it. We swap out the user's start routine for this and take advantage
262// of the regular thread teardown to free up resources.
263static void* __do_nothing(void*) {
264  return NULL;
265}
266
267
268__BIONIC_WEAK_FOR_NATIVE_BRIDGE
269int pthread_create(pthread_t* thread_out, pthread_attr_t const* attr,
270                   void* (*start_routine)(void*), void* arg) {
271  ErrnoRestorer errno_restorer;
272
273  pthread_attr_t thread_attr;
274  if (attr == NULL) {
275    pthread_attr_init(&thread_attr);
276  } else {
277    thread_attr = *attr;
278    attr = NULL; // Prevent misuse below.
279  }
280
281  pthread_internal_t* thread = NULL;
282  void* child_stack = NULL;
283  int result = __allocate_thread(&thread_attr, &thread, &child_stack);
284  if (result != 0) {
285    return result;
286  }
287
288  // Create a lock for the thread to wait on once it starts so we can keep
289  // it from doing anything until after we notify the debugger about it
290  //
291  // This also provides the memory barrier we need to ensure that all
292  // memory accesses previously performed by this thread are visible to
293  // the new thread.
294  thread->startup_handshake_lock.init(false);
295  thread->startup_handshake_lock.lock();
296
297  thread->start_routine = start_routine;
298  thread->start_routine_arg = arg;
299
300  thread->set_cached_pid(getpid());
301
302  int flags = CLONE_VM | CLONE_FS | CLONE_FILES | CLONE_SIGHAND | CLONE_THREAD | CLONE_SYSVSEM |
303      CLONE_SETTLS | CLONE_PARENT_SETTID | CLONE_CHILD_CLEARTID;
304  void* tls = reinterpret_cast<void*>(thread->tls);
305#if defined(__i386__)
306  // On x86 (but not x86-64), CLONE_SETTLS takes a pointer to a struct user_desc rather than
307  // a pointer to the TLS itself.
308  user_desc tls_descriptor;
309  __init_user_desc(&tls_descriptor, false, tls);
310  tls = &tls_descriptor;
311#endif
312  int rc = clone(__pthread_start, child_stack, flags, thread, &(thread->tid), tls, &(thread->tid));
313  if (rc == -1) {
314    int clone_errno = errno;
315    // We don't have to unlock the mutex at all because clone(2) failed so there's no child waiting to
316    // be unblocked, but we're about to unmap the memory the mutex is stored in, so this serves as a
317    // reminder that you can't rewrite this function to use a ScopedPthreadMutexLocker.
318    thread->startup_handshake_lock.unlock();
319    if (thread->mmap_size != 0) {
320      munmap(thread->attr.stack_base, thread->mmap_size);
321    }
322    async_safe_format_log(ANDROID_LOG_WARN, "libc", "pthread_create failed: clone failed: %s",
323                          strerror(clone_errno));
324    return clone_errno;
325  }
326
327  int init_errno = __init_thread(thread);
328  if (init_errno != 0) {
329    // Mark the thread detached and replace its start_routine with a no-op.
330    // Letting the thread run is the easiest way to clean up its resources.
331    atomic_store(&thread->join_state, THREAD_DETACHED);
332    __pthread_internal_add(thread);
333    thread->start_routine = __do_nothing;
334    thread->startup_handshake_lock.unlock();
335    return init_errno;
336  }
337
338  // Publish the pthread_t and unlock the mutex to let the new thread start running.
339  *thread_out = __pthread_internal_add(thread);
340  thread->startup_handshake_lock.unlock();
341
342  return 0;
343}
344