mirror of
https://github.com/jart/cosmopolitan.git
synced 2025-01-31 19:43:32 +00:00
b1d9d11be1
This change simplifies the thread-local storage support code. On Windows and Mac OS X the startup latency of __enable_tls() has been reduced from 30ms to 1ms. On Windows, TLS memory accesses will now go much faster due to better self-modifying code that prevents a function call and acquires our thread information block pointer in a single instruction.
173 lines
5.7 KiB
C
173 lines
5.7 KiB
C
/*-*- mode:c;indent-tabs-mode:nil;c-basic-offset:2;tab-width:8;coding:utf-8 -*-│
|
|
│vi: set net ft=c ts=2 sts=2 sw=2 fenc=utf-8 :vi│
|
|
╞══════════════════════════════════════════════════════════════════════════════╡
|
|
│ Copyright 2021 Justine Alexandra Roberts Tunney │
|
|
│ │
|
|
│ Permission to use, copy, modify, and/or distribute this software for │
|
|
│ any purpose with or without fee is hereby granted, provided that the │
|
|
│ above copyright notice and this permission notice appear in all copies. │
|
|
│ │
|
|
│ THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL │
|
|
│ WARRANTIES WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED │
|
|
│ WARRANTIES OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE │
|
|
│ AUTHOR BE LIABLE FOR ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL │
|
|
│ DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR │
|
|
│ PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER │
|
|
│ TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR │
|
|
│ PERFORMANCE OF THIS SOFTWARE. │
|
|
╚─────────────────────────────────────────────────────────────────────────────*/
|
|
#include "libc/calls/calls.h"
|
|
#include "libc/calls/struct/timespec.h"
|
|
#include "libc/dce.h"
|
|
#include "libc/errno.h"
|
|
#include "libc/intrin/kprintf.h"
|
|
#include "libc/intrin/spinlock.h"
|
|
#include "libc/intrin/wait0.internal.h"
|
|
#include "libc/log/backtrace.internal.h"
|
|
#include "libc/macros.internal.h"
|
|
#include "libc/mem/mem.h"
|
|
#include "libc/nexgen32e/gettls.h"
|
|
#include "libc/nexgen32e/nexgen32e.h"
|
|
#include "libc/runtime/internal.h"
|
|
#include "libc/runtime/runtime.h"
|
|
#include "libc/runtime/stack.h"
|
|
#include "libc/runtime/symbols.internal.h"
|
|
#include "libc/stdio/stdio.h"
|
|
#include "libc/sysv/consts/clock.h"
|
|
#include "libc/sysv/consts/clone.h"
|
|
#include "libc/sysv/consts/map.h"
|
|
#include "libc/sysv/consts/o.h"
|
|
#include "libc/sysv/consts/prot.h"
|
|
#include "libc/sysv/consts/sig.h"
|
|
#include "libc/testlib/ezbench.h"
|
|
#include "libc/testlib/testlib.h"
|
|
#include "libc/thread/spawn.h"
|
|
#include "libc/time/time.h"
|
|
|
|
// Scratch state shared between the main thread and the spawned threads.
int x;    // reset to 0 by SetUp(); CloneTest1() stores 42 here
int me;   // gettid() of the thread that ran SetUp()
int tid;  // NOTE(review): never assigned in the visible source, so it stays 0
_Atomic(int) thechilde;  // NOTE(review): not referenced in the visible source
|
|
|
|
/**
 * Constructor that runs before main() and restricts the test process.
 *
 * pledge() is asked for the "stdio rpath thread" promises. Its result
 * is not checked; errno is cleared afterwards so that whatever the call
 * may have left there cannot trip the `ASSERT_EQ(0, errno)` checks in
 * the tests below.
 */
__attribute__((__constructor__)) static void init(void) {
  pledge("stdio rpath thread", 0);
  errno = 0;
}
|
|
|
|
/**
 * Fills in the fixed fields of a 64-byte thread information block.
 *
 * Fields written, as byte offsets into `tib`:
 *
 *   - 0x00: address of `tib` itself
 *   - 0x30: address of `tib` itself
 *   - 0x38: thread id, set to -1
 *   - 0x3c: int set to 0 (NOTE(review): presumably the per-thread errno
 *           slot; confirm against the runtime's TIB layout)
 *
 * All other bytes of the block are left untouched. The stores go through
 * `intptr_t *` and `int *`, so `tib` must be suitably aligned for those
 * types.
 *
 * @param tib is the block to initialize, or NULL
 * @return `tib` as given; a NULL argument is passed straight through
 */
void *__initialize_tls(char tib[64]) {
  intptr_t self;
  if (!tib) return tib;
  self = (intptr_t)tib;
  *(intptr_t *)(tib + 0x00) = self;
  *(intptr_t *)(tib + 0x30) = self;
  *(int *)(tib + 0x38) = -1;  // tid
  *(int *)(tib + 0x3c) = 0;
  return tib;
}
|
|
|
|
void SetUp(void) {
|
|
x = 0;
|
|
me = gettid();
|
|
}
|
|
|
|
/**
 * Counterpart to SetUp(); intentionally empty, nothing to clean up.
 */
void TearDown(void) {
}
|
|
|
|
/**
 * No-op callback with a thread-entry style signature.
 *
 * @param arg is ignored
 * @return 0 always
 */
int DoNothing(void *arg) {
  (void)arg;  // unused on purpose
  return 0;
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
// TEST THREADS WORK
|
|
|
|
int CloneTest1(void *arg, int tid) {
|
|
intptr_t rsp, top, bot;
|
|
CheckStackIsAligned();
|
|
// PrintBacktraceUsingSymbols(2, __builtin_frame_address(0),
|
|
// GetSymbolTable());
|
|
rsp = (intptr_t)__builtin_frame_address(0);
|
|
bot = ROUNDDOWN((intptr_t)rsp, GetStackSize());
|
|
top = bot + GetStackSize();
|
|
ASSERT_GT(rsp, bot); // check we're on stack
|
|
ASSERT_LT(rsp, top); // check we're on stack
|
|
ASSERT_GT(rsp, top - 256); // check we're near top of stack
|
|
ASSERT_TRUE(IS2POW(GetStackSize()));
|
|
ASSERT_EQ(0, bot & (GetStackSize() - 1));
|
|
x = 42;
|
|
ASSERT_EQ(23, (intptr_t)arg);
|
|
ASSERT_NE(gettid(), getpid());
|
|
return 0;
|
|
}
|
|
|
|
TEST(clone, test1) {
|
|
int ptid = 0;
|
|
struct spawn th;
|
|
ASSERT_SYS(0, 0, _spawn(CloneTest1, (void *)23, &th));
|
|
ASSERT_SYS(0, 0, _join(&th));
|
|
ASSERT_NE(gettid(), tid);
|
|
ASSERT_EQ(tid, ptid);
|
|
ASSERT_EQ(42, x);
|
|
ASSERT_NE(me, tid);
|
|
ASSERT_EQ(0, errno);
|
|
errno = 31337;
|
|
ASSERT_EQ(31337, errno);
|
|
errno = 0;
|
|
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
// TEST THREADS CAN ISSUE SYSTEM CALLS WITH INDEPENDENT ERRNOS
|
|
|
|
// Start gate: CloneTestSys() threads spin until this becomes nonzero; the
// spawning test sets it to 1 once all of its threads have been created.
_Atomic(int) sysbarrier;
|
|
|
|
int CloneTestSys(void *arg, int tid) {
|
|
int i, id = (intptr_t)arg;
|
|
CheckStackIsAligned();
|
|
while (!sysbarrier) asm("pause");
|
|
for (i = 0; i < 20; ++i) {
|
|
switch (id % 3) {
|
|
case 0:
|
|
errno = 123;
|
|
open(0, 0);
|
|
asm("pause");
|
|
ASSERT_EQ(EFAULT, errno);
|
|
break;
|
|
case 1:
|
|
errno = 123;
|
|
dup(-1);
|
|
asm("pause");
|
|
ASSERT_EQ(EBADF, errno);
|
|
break;
|
|
case 2:
|
|
errno = 123;
|
|
dup3(0, 0, 0);
|
|
asm("pause");
|
|
ASSERT_EQ(EINVAL, errno);
|
|
break;
|
|
default:
|
|
unreachable;
|
|
}
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
TEST(clone, tlsSystemCallsErrno_wontClobberMainThreadBecauseTls) {
|
|
int i;
|
|
struct spawn th[8];
|
|
ASSERT_EQ(0, errno);
|
|
for (i = 0; i < 8; ++i) {
|
|
ASSERT_SYS(0, 0, _spawn(CloneTestSys, (void *)(intptr_t)i, th + i));
|
|
}
|
|
sysbarrier = 1;
|
|
for (i = 0; i < 8; ++i) {
|
|
ASSERT_SYS(0, 0, _join(th + i));
|
|
}
|
|
ASSERT_EQ(0, errno);
|
|
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
// BENCHMARK
|
|
|
|
BENCH(clone, bench) {
|
|
char *volatile tp;
|
|
errno_t *volatile ep;
|
|
EZBENCH2("__errno_location", donothing, (ep = __errno_location()));
|
|
EZBENCH2("__get_tls_privileged", donothing, (tp = __get_tls_privileged()));
|
|
EZBENCH2("__get_tls", donothing, (tp = __get_tls()));
|
|
}
|