/*
 * Copyright (C) 2008 The Android Open Source Project
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 *  * Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 *  * Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in
 *    the documentation and/or other materials provided with the
 *    distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
 * FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
 * COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
 * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS
 * OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
 * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
 * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */

#include <pthread.h>

#include <errno.h>
#include <string.h>
#include <sys/mman.h>
#include <unistd.h>

#include "pthread_internal.h"

#include <async_safe/log.h>

#include "private/bionic_defs.h"
#include "private/bionic_macros.h"
#include "private/bionic_prctl.h"
#include "private/bionic_ssp.h"
#include "private/bionic_tls.h"
#include "private/ErrnoRestorer.h"

// x86 uses segment descriptors rather than a direct pointer to TLS.
#if defined(__i386__)
#include <asm/ldt.h>
void __init_user_desc(struct user_desc*, bool, void*);
#endif

// This code is used both by each new pthread and the code that initializes the main thread.
bool __init_tls(pthread_internal_t* thread) {
  // Slot 0 must point to itself. The x86 Linux kernel reads the TLS from %fs:0.
  thread->tls[TLS_SLOT_SELF] = thread->tls;
  thread->tls[TLS_SLOT_THREAD_ID] = thread;

  // Add a guard before and after.
  size_t allocation_size = BIONIC_TLS_SIZE + (2 * PTHREAD_GUARD_SIZE);
  void* allocation = mmap(nullptr, allocation_size, PROT_NONE, MAP_PRIVATE | MAP_ANONYMOUS, -1, 0);
  if (allocation == MAP_FAILED) {
    async_safe_format_log(ANDROID_LOG_WARN, "libc",
                          "pthread_create failed: couldn't allocate TLS: %s", strerror(errno));
    return false;
  }

  prctl(PR_SET_VMA, PR_SET_VMA_ANON_NAME, allocation, allocation_size, "bionic TLS guard");

  // Carve out the writable TLS section.
  thread->bionic_tls = reinterpret_cast<bionic_tls*>(static_cast<char*>(allocation) +
                                                     PTHREAD_GUARD_SIZE);
  if (mprotect(thread->bionic_tls, BIONIC_TLS_SIZE, PROT_READ | PROT_WRITE) != 0) {
    async_safe_format_log(ANDROID_LOG_WARN, "libc",
                          "pthread_create failed: couldn't mprotect TLS: %s", strerror(errno));
    munmap(allocation, allocation_size);
    return false;
  }

  prctl(PR_SET_VMA, PR_SET_VMA_ANON_NAME, thread->bionic_tls, BIONIC_TLS_SIZE, "bionic TLS");
  return true;
}
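// The allocation made by __init_tls() ends up laid out like this (an informal
// sketch; the actual sizes are defined in bionic's private TLS headers):
//
//   low address   +--------------------------+
//                 | guard (PROT_NONE)        |  PTHREAD_GUARD_SIZE
//                 +--------------------------+
//                 | bionic_tls (read/write)  |  BIONIC_TLS_SIZE
//                 +--------------------------+
//                 | guard (PROT_NONE)        |  PTHREAD_GUARD_SIZE
//   high address  +--------------------------+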
void __init_thread_stack_guard(pthread_internal_t* thread) {
  // GCC looks in the TLS for the stack guard on x86, so copy it there from our global.
  thread->tls[TLS_SLOT_STACK_GUARD] = reinterpret_cast<void*>(__stack_chk_guard);
}

void __init_alternate_signal_stack(pthread_internal_t* thread) {
  // Create and set an alternate signal stack.
  void* stack_base = mmap(NULL, SIGNAL_STACK_SIZE, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0);
  if (stack_base != MAP_FAILED) {
    // Create a guard to catch stack overflows in signal handlers.
    if (mprotect(stack_base, PTHREAD_GUARD_SIZE, PROT_NONE) == -1) {
      munmap(stack_base, SIGNAL_STACK_SIZE);
      return;
    }
    stack_t ss;
    ss.ss_sp = reinterpret_cast<uint8_t*>(stack_base) + PTHREAD_GUARD_SIZE;
    ss.ss_size = SIGNAL_STACK_SIZE - PTHREAD_GUARD_SIZE;
    ss.ss_flags = 0;
    sigaltstack(&ss, NULL);
    thread->alternate_signal_stack = stack_base;

    // We can only use a static const string for the mapped region name, because the Android
    // kernel uses the string pointer directly when dumping /proc/pid/maps.
    prctl(PR_SET_VMA, PR_SET_VMA_ANON_NAME, ss.ss_sp, ss.ss_size, "thread signal stack");
    prctl(PR_SET_VMA, PR_SET_VMA_ANON_NAME, stack_base, PTHREAD_GUARD_SIZE, "thread signal stack guard");
  }
}

int __init_thread(pthread_internal_t* thread) {
  thread->cleanup_stack = nullptr;

  if (__predict_true((thread->attr.flags & PTHREAD_ATTR_FLAG_DETACHED) == 0)) {
    atomic_init(&thread->join_state, THREAD_NOT_JOINED);
  } else {
    atomic_init(&thread->join_state, THREAD_DETACHED);
  }

  // Set the scheduling policy/priority of the thread if necessary.
  bool need_set = true;
  int policy;
  sched_param param;
  if ((thread->attr.flags & PTHREAD_ATTR_FLAG_INHERIT) != 0) {
    // Unless the parent has SCHED_RESET_ON_FORK set, we've already inherited from the parent.
    policy = sched_getscheduler(0);
    need_set = ((policy & SCHED_RESET_ON_FORK) != 0);
    if (need_set) {
      if (policy == -1) {
        async_safe_format_log(ANDROID_LOG_WARN, "libc",
                              "pthread_create sched_getscheduler failed: %s", strerror(errno));
        return errno;
      }
      if (sched_getparam(0, &param) == -1) {
        async_safe_format_log(ANDROID_LOG_WARN, "libc",
                              "pthread_create sched_getparam failed: %s", strerror(errno));
        return errno;
      }
    }
  } else {
    policy = thread->attr.sched_policy;
    param.sched_priority = thread->attr.sched_priority;
  }
  // Backwards compatibility: before P, Android didn't have pthread_attr_setinheritsched,
  // and our behavior was neither of the POSIX behaviors.
  if ((thread->attr.flags & (PTHREAD_ATTR_FLAG_INHERIT|PTHREAD_ATTR_FLAG_EXPLICIT)) == 0) {
    need_set = (thread->attr.sched_policy != SCHED_NORMAL);
  }
  if (need_set) {
    if (sched_setscheduler(thread->tid, policy, &param) == -1) {
      async_safe_format_log(ANDROID_LOG_WARN, "libc",
                            "pthread_create sched_setscheduler(%d, {%d}) call failed: %s", policy,
                            param.sched_priority, strerror(errno));
#if defined(__LP64__)
      // For backwards compatibility reasons, we only report failures on 64-bit devices.
      return errno;
#endif
    }
  }

  return 0;
}
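// For reference, the PTHREAD_ATTR_FLAG_EXPLICIT path in __init_thread() above is what a
// caller reaches with code along these lines (an illustrative sketch only; error handling
// omitted, and real-time policies such as SCHED_FIFO typically require privileges):
//
//   pthread_attr_t attr;
//   pthread_attr_init(&attr);
//   pthread_attr_setinheritsched(&attr, PTHREAD_EXPLICIT_SCHED);
//   pthread_attr_setschedpolicy(&attr, SCHED_FIFO);
//   sched_param param = {};
//   param.sched_priority = 1;
//   pthread_attr_setschedparam(&attr, &param);
//   pthread_create(&thread, &attr, start_routine, arg);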
static void* __create_thread_mapped_space(size_t mmap_size, size_t stack_guard_size) {
  // Create a new private anonymous map.
  int prot = PROT_READ | PROT_WRITE;
  int flags = MAP_PRIVATE | MAP_ANONYMOUS | MAP_NORESERVE;
  void* space = mmap(NULL, mmap_size, prot, flags, -1, 0);
  if (space == MAP_FAILED) {
    async_safe_format_log(ANDROID_LOG_WARN,
                          "libc",
                          "pthread_create failed: couldn't allocate %zu-byte mapped space: %s",
                          mmap_size, strerror(errno));
    return NULL;
  }

  // Stack is at the lower end of mapped space, stack guard region is at the lower end of stack.
  // Set the stack guard region to PROT_NONE, so we can detect thread stack overflow.
  if (mprotect(space, stack_guard_size, PROT_NONE) == -1) {
    async_safe_format_log(ANDROID_LOG_WARN, "libc",
                          "pthread_create failed: couldn't mprotect PROT_NONE %zu-byte stack guard region: %s",
                          stack_guard_size, strerror(errno));
    munmap(space, mmap_size);
    return NULL;
  }
  prctl(PR_SET_VMA, PR_SET_VMA_ANON_NAME, space, stack_guard_size, "thread stack guard");

  return space;
}

static int __allocate_thread(pthread_attr_t* attr, pthread_internal_t** threadp, void** child_stack) {
  size_t mmap_size;
  uint8_t* stack_top;

  if (attr->stack_base == NULL) {
    // The caller didn't provide a stack, so allocate one.
    // Make sure the stack size and guard size are multiples of PAGE_SIZE.
    if (__builtin_add_overflow(attr->stack_size, attr->guard_size, &mmap_size)) return EAGAIN;
    if (__builtin_add_overflow(mmap_size, sizeof(pthread_internal_t), &mmap_size)) return EAGAIN;
    mmap_size = __BIONIC_ALIGN(mmap_size, PAGE_SIZE);
    attr->guard_size = __BIONIC_ALIGN(attr->guard_size, PAGE_SIZE);
    attr->stack_base = __create_thread_mapped_space(mmap_size, attr->guard_size);
    if (attr->stack_base == NULL) {
      return EAGAIN;
    }
    stack_top = reinterpret_cast<uint8_t*>(attr->stack_base) + mmap_size;
  } else {
    // Remember that the mmap size is zero, so we don't need to free it.
    mmap_size = 0;
    stack_top = reinterpret_cast<uint8_t*>(attr->stack_base) + attr->stack_size;
  }

  // Mapped space (or the user-allocated stack) is used for:
  //   pthread_internal_t
  //   thread stack (including guard)

  // To safely access the pthread_internal_t and thread stack, we need to find a 16-byte aligned boundary.
  stack_top = reinterpret_cast<uint8_t*>(
                (reinterpret_cast<uintptr_t>(stack_top) - sizeof(pthread_internal_t)) & ~0xf);

  pthread_internal_t* thread = reinterpret_cast<pthread_internal_t*>(stack_top);
  if (mmap_size == 0) {
    // If thread was not allocated by mmap(), it may not have been cleared to zero.
    // So assume the worst and zero it.
    memset(thread, 0, sizeof(pthread_internal_t));
  }
  attr->stack_size = stack_top - reinterpret_cast<uint8_t*>(attr->stack_base);

  thread->mmap_size = mmap_size;
  thread->attr = *attr;
  if (!__init_tls(thread)) {
    if (thread->mmap_size != 0) munmap(thread->attr.stack_base, thread->mmap_size);
    return EAGAIN;
  }
  __init_thread_stack_guard(thread);

  *threadp = thread;
  *child_stack = stack_top;
  return 0;
}
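// When the caller didn't supply a stack, the mapping created by __allocate_thread()
// above looks roughly like this (a sketch; the 16-byte alignment adjustment applied
// to stack_top is omitted):
//
//   low address   +-----------------------------+
//                 | stack guard (PROT_NONE)     |  attr->guard_size
//                 +-----------------------------+
//                 | thread stack (grows down)   |
//                 +-----------------------------+
//                 | pthread_internal_t          |
//   high address  +-----------------------------+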
static int __pthread_start(void* arg) {
  pthread_internal_t* thread = reinterpret_cast<pthread_internal_t*>(arg);

  // Wait for our creating thread to release us. This lets it have time to
  // notify gdb about this thread before we start doing anything.
  // This also provides the memory barrier needed to ensure that all memory
  // accesses previously made by the creating thread are visible to us.
  thread->startup_handshake_lock.lock();

  __init_alternate_signal_stack(thread);

  void* result = thread->start_routine(thread->start_routine_arg);
  pthread_exit(result);

  return 0;
}

// A dummy start routine for pthread_create failures where we've created a thread but aren't
// going to run user code on it. We swap out the user's start routine for this and take advantage
// of the regular thread teardown to free up resources.
static void* __do_nothing(void*) {
  return NULL;
}

__BIONIC_WEAK_FOR_NATIVE_BRIDGE
int pthread_create(pthread_t* thread_out, pthread_attr_t const* attr,
                   void* (*start_routine)(void*), void* arg) {
  ErrnoRestorer errno_restorer;

  pthread_attr_t thread_attr;
  if (attr == NULL) {
    pthread_attr_init(&thread_attr);
  } else {
    thread_attr = *attr;
    attr = NULL; // Prevent misuse below.
  }

  pthread_internal_t* thread = NULL;
  void* child_stack = NULL;
  int result = __allocate_thread(&thread_attr, &thread, &child_stack);
  if (result != 0) {
    return result;
  }

  // Create a lock for the thread to wait on once it starts so we can keep
  // it from doing anything until after we notify the debugger about it.
  //
  // This also provides the memory barrier we need to ensure that all
  // memory accesses previously performed by this thread are visible to
  // the new thread.
  thread->startup_handshake_lock.init(false);
  thread->startup_handshake_lock.lock();

  thread->start_routine = start_routine;
  thread->start_routine_arg = arg;

  thread->set_cached_pid(getpid());

  int flags = CLONE_VM | CLONE_FS | CLONE_FILES | CLONE_SIGHAND | CLONE_THREAD | CLONE_SYSVSEM |
              CLONE_SETTLS | CLONE_PARENT_SETTID | CLONE_CHILD_CLEARTID;
  void* tls = reinterpret_cast<void*>(thread->tls);
#if defined(__i386__)
  // On x86 (but not x86-64), CLONE_SETTLS takes a pointer to a struct user_desc rather than
  // a pointer to the TLS itself.
  user_desc tls_descriptor;
  __init_user_desc(&tls_descriptor, false, tls);
  tls = &tls_descriptor;
#endif
  int rc = clone(__pthread_start, child_stack, flags, thread, &(thread->tid), tls, &(thread->tid));
  if (rc == -1) {
    int clone_errno = errno;
    // We don't have to unlock the mutex at all because clone(2) failed, so there's no child
    // waiting to be unblocked. But we're about to unmap the memory the mutex is stored in, so
    // this serves as a reminder that you can't rewrite this function to use a
    // ScopedPthreadMutexLocker.
    thread->startup_handshake_lock.unlock();
    if (thread->mmap_size != 0) {
      munmap(thread->attr.stack_base, thread->mmap_size);
    }
    async_safe_format_log(ANDROID_LOG_WARN, "libc", "pthread_create failed: clone failed: %s",
                          strerror(clone_errno));
    return clone_errno;
  }

  int init_errno = __init_thread(thread);
  if (init_errno != 0) {
    // Mark the thread detached and replace its start_routine with a no-op.
    // Letting the thread run is the easiest way to clean up its resources.
    atomic_store(&thread->join_state, THREAD_DETACHED);
    __pthread_internal_add(thread);
    thread->start_routine = __do_nothing;
    thread->startup_handshake_lock.unlock();
    return init_errno;
  }

  // Publish the pthread_t and unlock the mutex to let the new thread start running.
  *thread_out = __pthread_internal_add(thread);
  thread->startup_handshake_lock.unlock();

  return 0;
}
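// For orientation, the startup handshake between pthread_create() and the new thread
// runs roughly as follows (an informational summary of the code above, not normative):
//
//   parent: init handshake lock -> lock it -> clone() -> __init_thread() ->
//           __pthread_internal_add() -> unlock (releases the child)
//   child:  __pthread_start() blocks on the lock -> sets up the alternate
//           signal stack -> runs start_routine -> pthread_exit()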