mirror of
https://github.com/jart/cosmopolitan.git
synced 2025-02-01 03:53:33 +00:00
494 lines
17 KiB
C
494 lines
17 KiB
C
/*-*- mode:c;indent-tabs-mode:nil;c-basic-offset:2;tab-width:8;coding:utf-8 -*-│
|
|
│vi: set net ft=c ts=2 sts=2 sw=2 fenc=utf-8 :vi│
|
|
╞══════════════════════════════════════════════════════════════════════════════╡
|
|
│ Copyright 2021 Justine Alexandra Roberts Tunney │
|
|
│ │
|
|
│ Permission to use, copy, modify, and/or distribute this software for │
|
|
│ any purpose with or without fee is hereby granted, provided that the │
|
|
│ above copyright notice and this permission notice appear in all copies. │
|
|
│ │
|
|
│ THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL │
|
|
│ WARRANTIES WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED │
|
|
│ WARRANTIES OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE │
|
|
│ AUTHOR BE LIABLE FOR ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL │
|
|
│ DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR │
|
|
│ PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER │
|
|
│ TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR │
|
|
│ PERFORMANCE OF THIS SOFTWARE. │
|
|
╚─────────────────────────────────────────────────────────────────────────────*/
|
|
#include "libc/assert.h"
|
|
#include "libc/calls/calls.h"
|
|
#include "libc/calls/internal.h"
|
|
#include "libc/calls/strace.internal.h"
|
|
#include "libc/calls/struct/ucontext-netbsd.internal.h"
|
|
#include "libc/dce.h"
|
|
#include "libc/errno.h"
|
|
#include "libc/intrin/asan.internal.h"
|
|
#include "libc/intrin/kprintf.h"
|
|
#include "libc/intrin/spinlock.h"
|
|
#include "libc/intrin/threaded.h"
|
|
#include "libc/nt/runtime.h"
|
|
#include "libc/nt/thread.h"
|
|
#include "libc/nt/thunk/msabi.h"
|
|
#include "libc/runtime/runtime.h"
|
|
#include "libc/sysv/consts/clone.h"
|
|
#include "libc/sysv/consts/nr.h"
|
|
#include "libc/sysv/consts/nrlinux.h"
|
|
#include "libc/sysv/errfuns.h"
|
|
#include "libc/thread/freebsd.internal.h"
|
|
#include "libc/thread/xnu.internal.h"
|
|
|
|
STATIC_YOINK("gettid"); // for kprintf()
|
|
|
|
#define __NR_thr_new 455
|
|
#define __NR_clone_linux 56
|
|
#define __NR__lwp_create 309
|
|
#define __NR_getcontext_netbsd 307
|
|
#define __NR_bsdthread_create 0x02000168
|
|
#define __NR_thread_fast_set_cthread_self 0x03000003
|
|
#define PTHREAD_START_CUSTOM_XNU 0x01000000
|
|
#define LWP_DETACHED 0x00000040
|
|
#define LWP_SUSPENDED 0x00000080
|
|
|
|
static char tibdefault[64];
|
|
|
|
struct WinThread {
|
|
uint32_t tid;
|
|
int flags;
|
|
int *ctid;
|
|
void *tls;
|
|
int (*func)(void *);
|
|
void *arg;
|
|
};
|
|
|
|
uint32_t WinThreadThunk(void *warg);
|
|
asm(".section\t.text.windows,\"ax\",@progbits\n\t"
|
|
".local\tWinThreadThunk\n"
|
|
"WinThreadThunk:\n\t"
|
|
"xor\t%ebp,%ebp\n\t"
|
|
"mov\t%rcx,%rdi\n\t"
|
|
"mov\t%rcx,%rsp\n\t"
|
|
"and\t$-16,%rsp\n\t"
|
|
"call\tWinThreadMain\n\t"
|
|
".size\tWinThreadThunk,.-WinThreadThunk\n\t"
|
|
".previous");
|
|
__attribute__((__used__, __no_reorder__))
|
|
|
|
static textwindows wontreturn void
|
|
WinThreadMain(struct WinThread *wt) {
|
|
int rc;
|
|
if (wt->flags & CLONE_SETTLS) {
|
|
TlsSetValue(__tls_index, wt->tls);
|
|
}
|
|
if (wt->flags & CLONE_CHILD_SETTID) {
|
|
*wt->ctid = wt->tid;
|
|
}
|
|
rc = wt->func(wt->arg);
|
|
_Exit1(rc);
|
|
}
|
|
|
|
static textwindows int CloneWindows(int (*func)(void *), char *stk,
|
|
size_t stksz, int flags, void *arg,
|
|
void *tls, size_t tlssz, int *ctid) {
|
|
int64_t h;
|
|
struct WinThread *wt;
|
|
wt = (struct WinThread *)(((intptr_t)(stk + stksz) -
|
|
sizeof(struct WinThread)) &
|
|
-alignof(struct WinThread));
|
|
wt->flags = flags;
|
|
wt->ctid = ctid;
|
|
wt->func = func;
|
|
wt->arg = arg;
|
|
wt->tls = tls;
|
|
if ((h = CreateThread(0, 0, WinThreadThunk, wt, 0, &wt->tid))) {
|
|
CloseHandle(h);
|
|
return wt->tid;
|
|
} else {
|
|
return -1;
|
|
}
|
|
}
|
|
|
|
void XnuThreadThunk(void *pthread, int machport, void *(*func)(void *),
|
|
void *arg, intptr_t *stack, unsigned flags);
|
|
asm(".local\tXnuThreadThunk\n"
|
|
"XnuThreadThunk:\n\t"
|
|
"xor\t%ebp,%ebp\n\t"
|
|
"mov\t%r8,%rsp\n\t"
|
|
"jmp\tXnuThreadMain\n\t"
|
|
".size\tXnuThreadThunk,.-XnuThreadThunk");
|
|
__attribute__((__used__, __no_reorder__))
|
|
|
|
static wontreturn void
|
|
XnuThreadMain(void *pthread, int tid, int (*func)(void *arg), void *arg,
|
|
intptr_t *sp, unsigned flags) {
|
|
int rc;
|
|
sp[1] = tid;
|
|
_spunlock(sp);
|
|
if (sp[4] & CLONE_SETTLS) {
|
|
// XNU uses the same 0x30 offset as the WIN32 TIB x64. They told the
|
|
// Go team at Google that they Apply stands by our ability to use it
|
|
// https://github.com/golang/go/issues/23617#issuecomment-376662373
|
|
asm volatile("syscall"
|
|
: "=a"(rc)
|
|
: "0"(__NR_thread_fast_set_cthread_self), "D"(sp[3] - 0x30)
|
|
: "rcx", "r11", "memory", "cc");
|
|
}
|
|
if (sp[4] & CLONE_CHILD_SETTID) {
|
|
*(int *)sp[2] = tid;
|
|
}
|
|
rc = func(arg);
|
|
_Exit1(rc);
|
|
}
|
|
|
|
static int CloneXnu(int (*fn)(void *), char *stk, size_t stksz, int flags,
|
|
void *arg, void *tls, size_t tlssz, int *ctid) {
|
|
int rc;
|
|
bool failed;
|
|
intptr_t *sp;
|
|
static bool once;
|
|
static int broken;
|
|
if (!once) {
|
|
if (bsdthread_register(XnuThreadThunk, 0, 0, 0, 0, 0, 0) == -1) {
|
|
broken = errno;
|
|
}
|
|
once = true;
|
|
}
|
|
if (broken) {
|
|
errno = broken;
|
|
return -1;
|
|
}
|
|
sp = (intptr_t *)(stk + stksz);
|
|
*--sp = 0; // 5 padding
|
|
*--sp = flags; // 4 clone() flags
|
|
*--sp = (intptr_t)tls; // 3 thread local storage
|
|
*--sp = (intptr_t)ctid; // 2 child tid api
|
|
*--sp = 0; // 1 receives tid
|
|
*--sp = 0; // 0 lock
|
|
_seizelock(sp); // TODO: How can we get the tid without locking?
|
|
if ((rc = bsdthread_create(fn, arg, sp, 0, PTHREAD_START_CUSTOM_XNU)) != -1) {
|
|
_spinlock(sp);
|
|
rc = sp[1];
|
|
}
|
|
return rc;
|
|
}
|
|
|
|
void FreebsdThreadThunk(void *sp) wontreturn;
|
|
asm(".local\tFreebsdThreadThunk\n"
|
|
"FreebsdThreadThunk:\n\t"
|
|
"xor\t%ebp,%ebp\n\t"
|
|
"mov\t%rdi,%rsp\n\t"
|
|
"jmp\tFreebsdThreadMain\n\t"
|
|
".size\tFreebsdThreadThunk,.-FreebsdThreadThunk");
|
|
__attribute__((__used__, __no_reorder__))
|
|
|
|
static wontreturn void
|
|
FreebsdThreadMain(intptr_t *sp) {
|
|
int rc;
|
|
if (sp[3] & CLONE_CHILD_SETTID) {
|
|
*(int *)sp[2] = sp[4];
|
|
}
|
|
rc = ((int (*)(intptr_t))sp[0])(sp[1]);
|
|
_Exit1(rc);
|
|
}
|
|
|
|
static int CloneFreebsd(int (*func)(void *), char *stk, size_t stksz, int flags,
|
|
void *arg, void *tls, size_t tlssz, int *ctid) {
|
|
int ax;
|
|
bool failed;
|
|
int64_t tid;
|
|
intptr_t *sp;
|
|
sp = (intptr_t *)(stk + stksz);
|
|
*--sp = 0; // 5 [padding]
|
|
*--sp = 0; // 4 [child_tid]
|
|
*--sp = flags; // 3
|
|
*--sp = (intptr_t)ctid; // 2
|
|
*--sp = (intptr_t)arg; // 1
|
|
*--sp = (intptr_t)func; // 0
|
|
struct thr_param params = {
|
|
.start_func = FreebsdThreadThunk,
|
|
.arg = sp,
|
|
.stack_base = stk,
|
|
.stack_size = stksz,
|
|
.tls_base = flags & CLONE_SETTLS ? tls : 0,
|
|
.tls_size = flags & CLONE_SETTLS ? tlssz : 0,
|
|
.child_tid = sp + 4,
|
|
.parent_tid = &tid,
|
|
};
|
|
asm volatile(CFLAG_ASM("syscall")
|
|
: CFLAG_CONSTRAINT(failed), "=a"(ax)
|
|
: "1"(__NR_thr_new), "D"(¶ms), "S"(sizeof(params))
|
|
: "rcx", "rdx", "r8", "r9", "r10", "r11", "memory");
|
|
if (failed) {
|
|
errno = ax;
|
|
tid = -1;
|
|
}
|
|
return tid;
|
|
}
|
|
|
|
struct __tfork {
|
|
void *tf_tcb;
|
|
int32_t *tf_tid;
|
|
void *tf_stack;
|
|
};
|
|
|
|
int __tfork(struct __tfork *params, size_t psize, intptr_t *stack);
|
|
asm(".section\t.privileged,\"ax\",@progbits\n\t"
|
|
".local\t__tfork\n"
|
|
"__tfork:\n\t"
|
|
"push\t$8\n\t"
|
|
"pop\t%rax\n\t"
|
|
"mov\t%rdx,%r8\n\t"
|
|
"syscall\n\t"
|
|
"jc\t1f\n\t"
|
|
"test\t%eax,%eax\n\t"
|
|
"jz\t2f\n\t"
|
|
"ret\n1:\t"
|
|
"neg\t%eax\n\t"
|
|
"ret\n2:\t"
|
|
"xor\t%ebp,%ebp\n\t"
|
|
"mov\t%r8,%rsp\n\t"
|
|
"mov\t%r8,%rdi\n\t"
|
|
"jmp\tOpenbsdThreadMain\n\t"
|
|
".size\t__tfork,.-__tfork\n\t"
|
|
".previous");
|
|
__attribute__((__used__, __no_reorder__))
|
|
|
|
static privileged wontreturn void
|
|
OpenbsdThreadMain(intptr_t *sp) {
|
|
int rc;
|
|
rc = ((int (*)(intptr_t))sp[0])(sp[1]);
|
|
_Exit1(rc);
|
|
}
|
|
|
|
static int CloneOpenbsd(int (*func)(void *), char *stk, size_t stksz, int flags,
|
|
void *arg, void *tls, size_t tlssz, int *ctid) {
|
|
int tid;
|
|
intptr_t *sp;
|
|
struct __tfork params;
|
|
sp = (intptr_t *)(stk + stksz);
|
|
*--sp = flags; // 3
|
|
*--sp = (intptr_t)ctid; // 2
|
|
*--sp = (intptr_t)arg; // 1
|
|
*--sp = (intptr_t)func; // 0
|
|
params.tf_stack = sp;
|
|
params.tf_tcb = flags & CLONE_SETTLS ? tls : 0;
|
|
params.tf_tid = flags & CLONE_CHILD_SETTID ? ctid : 0;
|
|
if ((tid = __tfork(¶ms, sizeof(params), sp)) < 0) {
|
|
errno = -tid;
|
|
tid = -1;
|
|
}
|
|
return tid;
|
|
}
|
|
|
|
static wontreturn void NetbsdThreadMain(void *arg, int (*func)(void *arg),
|
|
int *tid, int *ctid, int flags) {
|
|
int rc;
|
|
if (flags & CLONE_CHILD_SETTID) {
|
|
*ctid = *tid;
|
|
}
|
|
rc = func(arg);
|
|
_Exit1(rc);
|
|
}
|
|
|
|
static int CloneNetbsd(int (*func)(void *), char *stk, size_t stksz, int flags,
|
|
void *arg, void *tls, size_t tlssz, int *ctid) {
|
|
// NetBSD has its own clone() and it works, but it's technically a
|
|
// second-class API, intended to help Linux folks migrate to this!
|
|
// We put it on the thread's stack, to avoid locking this function
|
|
// so its stack doesn't scope. The ucontext struct needs 784 bytes
|
|
bool failed;
|
|
int ax, *tid;
|
|
intptr_t dx, sp;
|
|
static bool once;
|
|
static int broken;
|
|
struct ucontext_netbsd *ctx;
|
|
static struct ucontext_netbsd netbsd_clone_template;
|
|
if (!once) {
|
|
asm volatile(CFLAG_ASM("syscall")
|
|
: CFLAG_CONSTRAINT(failed), "=a"(ax)
|
|
: "1"(__NR_getcontext_netbsd), "D"(&netbsd_clone_template)
|
|
: "rcx", "rdx", "r11", "memory");
|
|
if (failed) {
|
|
broken = ax;
|
|
}
|
|
once = true;
|
|
}
|
|
if (broken) {
|
|
errno = broken;
|
|
return -1;
|
|
}
|
|
sp = (intptr_t)(stk + stksz);
|
|
sp -= sizeof(int);
|
|
tid = (int *)sp;
|
|
sp -= sizeof(*ctx);
|
|
sp = sp & -alignof(*ctx);
|
|
ctx = (struct ucontext_netbsd *)sp;
|
|
memcpy(ctx, &netbsd_clone_template, sizeof(*ctx));
|
|
ctx->uc_link = 0;
|
|
ctx->uc_mcontext.rbp = 0;
|
|
ctx->uc_mcontext.rsp = sp;
|
|
ctx->uc_mcontext.rip = (intptr_t)NetbsdThreadMain;
|
|
ctx->uc_mcontext.rdi = (intptr_t)arg;
|
|
ctx->uc_mcontext.rsi = (intptr_t)func;
|
|
ctx->uc_mcontext.rdx = (intptr_t)tid;
|
|
ctx->uc_mcontext.rcx = (intptr_t)ctid;
|
|
ctx->uc_mcontext.r8 = flags;
|
|
ctx->uc_flags |= _UC_STACK;
|
|
ctx->uc_stack.ss_sp = stk;
|
|
ctx->uc_stack.ss_size = stksz;
|
|
ctx->uc_stack.ss_flags = 0;
|
|
if (flags & CLONE_SETTLS) {
|
|
ctx->uc_flags |= _UC_TLSBASE;
|
|
ctx->uc_mcontext._mc_tlsbase = (intptr_t)tls;
|
|
}
|
|
asm volatile(CFLAG_ASM("syscall")
|
|
: CFLAG_CONSTRAINT(failed), "=a"(ax), "=d"(dx)
|
|
: "1"(__NR__lwp_create), "D"(ctx), "S"(LWP_DETACHED), "2"(tid)
|
|
: "rcx", "r11", "memory");
|
|
if (!failed) {
|
|
return *tid;
|
|
} else {
|
|
errno = ax;
|
|
return -1;
|
|
}
|
|
}
|
|
|
|
static int CloneLinux(int (*func)(void *), char *stk, size_t stksz, int flags,
|
|
void *arg, int *ptid, void *tls, size_t tlssz,
|
|
int *ctid) {
|
|
int ax;
|
|
register int *r8 asm("r8") = tls;
|
|
register int *r10 asm("r10") = ctid;
|
|
register void *r9 asm("r9") = func;
|
|
intptr_t *stack = (intptr_t *)(stk + stksz);
|
|
*--stack = (intptr_t)arg;
|
|
asm volatile("syscall\n\t"
|
|
"test\t%0,%0\n\t"
|
|
"jnz\t1f\n\t"
|
|
"xor\t%%ebp,%%ebp\n\t"
|
|
"pop\t%%rdi\n\t" // arg
|
|
"call\t*%%r9\n\t" // func
|
|
"xchg\t%%eax,%%edi\n\t"
|
|
"jmp\t_Exit1\n1:"
|
|
: "=a"(ax)
|
|
: "0"(__NR_clone_linux), "D"(flags), "S"(stack), "r"(r10),
|
|
"r"(r8), "r"(r9)
|
|
: "rcx", "r11", "memory");
|
|
if (ax > -4096u) errno = -ax, ax = -1;
|
|
return ax;
|
|
}
|
|
|
|
/**
|
|
* Creates thread.
|
|
*
|
|
* Threads are created in a detached manner. They currently can't be
|
|
* synchronized using wait() or posix signals. Threads created by this
|
|
* function should be synchronized using shared memory operations.
|
|
*
|
|
* Any memory that's required by this system call wrapper is allocated
|
|
* to the top of your stack. This is normally about 64 bytes, although
|
|
* on NetBSD it's currently 800.
|
|
*
|
|
* Your function is called from within the stack you specify. A return
|
|
* address is pushed onto your stack, that causes returning to jump to
|
|
* _Exit1() which terminates the thread. Even though the callback says
|
|
* it supports a return code, that'll only work on Linux and Windows.
|
|
*
|
|
* The `tls` parameter is for thread-local storage. If you specify this
|
|
* then clone() will implicitly rewire libc (e.g. errno) to use TLS:
|
|
*
|
|
* static char tib[64];
|
|
* __initialize_tls(tib);
|
|
* __install_tls(tib);
|
|
*
|
|
* If you want a main process TLS size that's larger call it manually.
|
|
* Once you've done the above and/or started creating your own threads
|
|
* you'll be able to access your `tls` thread information block, using
|
|
*
|
|
* char *p = __get_tls();
|
|
* printf("errno is %d\n", *(int *)(p + 0x3c));
|
|
*
|
|
* This function follows the same ABI convention as the Linux userspace
|
|
* libraries, with a few small changes. The varargs has been removed to
|
|
* help prevent broken code, and the stack size and tls size parameters
|
|
* are introduced for compatibility with FreeBSD.
|
|
*
|
|
* To keep this system call lightweight, only the thread creation use
|
|
* case is polyfilled across platforms. For example, if you want fork
|
|
* that works on OpenBSD for example, don't do it with clone(SIGCHLD)
|
|
* and please just call fork(). Even if you do that on Linux, it will
|
|
* effectively work around libc features like atfork(), so that means
|
|
* other calls like getpid() may return incorrect values.
|
|
*
|
|
* @param func is your callback function
|
|
* @param stk points to the bottom of a caller allocated stack, which
|
|
* must be allocated via mmap() using the MAP_STACK flag, or else
|
|
* you won't get optimal performance and it won't work on OpenBSD
|
|
* @param stksz is the size of that stack in bytes, we recommend that
|
|
* that this be set to GetStackSize() or else memory safety tools
|
|
* like kprintf() can't do as good and quick of a job; this value
|
|
* must be 16-aligned plus it must be at least 4192 bytes in size
|
|
* and it's advised to have the bottom-most page, be a guard page
|
|
* @param flags should have:
|
|
* - `CLONE_THREAD|CLONE_VM|CLONE_FS|CLONE_FILES|CLONE_SIGHAND`
|
|
* and may optionally bitwise any of the following:
|
|
* - `CLONE_CHILD_SETTID` is needed too if you use `ctid`
|
|
* - `CLONE_SETTLS` is needed too if you set `tls`
|
|
* @param arg will be passed to your callback
|
|
* @param tls may be used to set the thread local storage segment;
|
|
* this parameter is ignored if `CLONE_SETTLS` is not set
|
|
* @param tlssz is the size of tls in bytes which must be at least 64
|
|
* @param ctid lets the child receive its thread id without having to
|
|
* call gettid() and is ignored if `CLONE_CHILD_SETTID` isn't set
|
|
* @return tid of child on success, or -1 w/ errno
|
|
* @threadsafe
|
|
*/
|
|
int clone(int (*func)(void *), void *stk, size_t stksz, int flags, void *arg,
|
|
int *ptid, void *tls, size_t tlssz, int *ctid) {
|
|
int rc;
|
|
|
|
__threaded = true;
|
|
if (tls && !__tls_enabled) {
|
|
__initialize_tls(tibdefault);
|
|
__install_tls(tibdefault);
|
|
}
|
|
|
|
if (IsAsan() &&
|
|
((stksz > PAGESIZE &&
|
|
!__asan_is_valid((char *)stk + PAGESIZE, stksz - PAGESIZE)) ||
|
|
((flags & CLONE_SETTLS) && !__asan_is_valid(tls, tlssz)) ||
|
|
((flags & CLONE_SETTLS) && !__asan_is_valid(tls, sizeof(long))) ||
|
|
((flags & CLONE_PARENT_SETTID) &&
|
|
!__asan_is_valid(ptid, sizeof(*ptid))) ||
|
|
((flags & CLONE_CHILD_SETTID) &&
|
|
!__asan_is_valid(ctid, sizeof(*ctid))))) {
|
|
rc = efault();
|
|
} else if (!IsTiny() &&
|
|
(((flags & CLONE_VM) && (stksz < PAGESIZE || (stksz & 15))) ||
|
|
((flags & CLONE_SETTLS) && (tlssz < 64 || (tlssz & 7))))) {
|
|
rc = einval();
|
|
} else if (IsLinux()) {
|
|
rc = CloneLinux(func, stk, stksz, flags, arg, ptid, tls, tlssz, ctid);
|
|
} else if (!IsTiny() && (flags & ~(CLONE_SETTLS | CLONE_PARENT_SETTID |
|
|
CLONE_CHILD_SETTID)) !=
|
|
(CLONE_THREAD | CLONE_VM | CLONE_FS |
|
|
CLONE_FILES | CLONE_SIGHAND)) {
|
|
rc = einval();
|
|
} else if (IsXnu()) {
|
|
rc = CloneXnu(func, stk, stksz, flags, arg, tls, tlssz, ctid);
|
|
} else if (IsFreebsd()) {
|
|
rc = CloneFreebsd(func, stk, stksz, flags, arg, tls, tlssz, ctid);
|
|
} else if (IsNetbsd()) {
|
|
rc = CloneNetbsd(func, stk, stksz, flags, arg, tls, tlssz, ctid);
|
|
} else if (IsOpenbsd()) {
|
|
rc = CloneOpenbsd(func, stk, stksz, flags, arg, tls, tlssz, ctid);
|
|
} else if (IsWindows()) {
|
|
rc = CloneWindows(func, stk, stksz, flags, arg, tls, tlssz, ctid);
|
|
} else {
|
|
rc = enosys();
|
|
}
|
|
|
|
STRACE("clone(%p, %p, %'zu, %#x, %p, %p, %p, %'zu, %p) → %d", func, stk,
|
|
stksz, flags, arg, ptid, tls, tlssz, ctid, rc);
|
|
return rc;
|
|
}
|