From 31a5a2bb2fa9bdd8710af5f9ea99068ab86fb9e8 Mon Sep 17 00:00:00 2001 From: Jameson Nash Date: Thu, 4 Apr 2019 14:03:04 -0400 Subject: [PATCH] tasks,debugging: make it possible to get the backtrace of a task This should work for any non-copy stack task. To make it work better, this now switches to the JL_HAVE_UNW_CONTEXT by default. Ulso export the list of all live (currently running or suspended) tasks which have real stacks (the non-copy-stack tasks) which were started by the current thread. --- src/gc-stacks.c | 23 +++- src/julia.expmap | 1 + src/julia.h | 9 +- src/julia_threads.h | 39 ++++-- src/partr.c | 2 +- src/signals-unix.c | 1 + src/stackwalk.c | 74 ++++++++++- src/task.c | 301 ++++++++++++++++++++++++-------------------- 8 files changed, 295 insertions(+), 155 deletions(-) diff --git a/src/gc-stacks.c b/src/gc-stacks.c index 815bc062ec261..8c2f9b4320ab1 100644 --- a/src/gc-stacks.c +++ b/src/gc-stacks.c @@ -215,8 +215,12 @@ void sweep_stack_pools(void) continue; while (1) { jl_task_t *t = (jl_task_t*)lst[n]; + assert(jl_is_task(t)); if (gc_marked(jl_astaggedvalue(t)->bits.gc)) { - n++; + if (t->stkbuf == NULL) + ndel++; // jl_release_task_stack called + else + n++; } else { ndel++; @@ -236,3 +240,20 @@ void sweep_stack_pools(void) live_tasks->len -= ndel; } } + +JL_DLLEXPORT jl_array_t *jl_live_tasks(void) +{ + jl_ptls_t ptls = jl_get_ptls_states(); + arraylist_t *live_tasks = &ptls->heap.live_tasks; + size_t i, l; + jl_array_t *a; + do { + l = live_tasks->len; + a = jl_alloc_vec_any(l + 1); // may gc + } while (l != live_tasks->len); + void **lst = live_tasks->items; + ((void**)jl_array_data(a))[0] = ptls->root_task; + for (i = 0; i < l; i++) + ((void**)jl_array_data(a))[i + 1] = lst[i]; + return a; +} diff --git a/src/julia.expmap b/src/julia.expmap index f0b808d8db1f6..162978abcbc49 100644 --- a/src/julia.expmap +++ b/src/julia.expmap @@ -30,6 +30,7 @@ add_library_mapping; utf8proc_*; jlbacktrace; + jlbacktracet; julia_type_to_llvm; _IO_stdin_used; __ZN4llvm23createLowerSimdLoopPassEv; diff --git a/src/julia.h b/src/julia.h index c6de10f286da0..1095298e34346 100644 --- a/src/julia.h +++ b/src/julia.h @@ -1770,7 +1770,14 @@ typedef struct _jl_task_t { uint8_t sticky; // record whether this Task can be migrated to a new thread // hidden state: - jl_ucontext_t ctx; // saved thread state + union { + jl_ucontext_t ctx; // saved thread state +#ifdef _OS_WINDOWS_ + jl_ucontext_t copy_stack_ctx; +#else + struct jl_stack_context_t copy_stack_ctx; +#endif + }; void *stkbuf; // malloc'd memory (either copybuf or stack) size_t bufsz; // actual sizeof stkbuf unsigned int copy_stack:31; // sizeof stack for copybuf diff --git a/src/julia_threads.h b/src/julia_threads.h index 6040a593300c1..fcf0b395c2eba 100644 --- a/src/julia_threads.h +++ b/src/julia_threads.h @@ -16,8 +16,9 @@ // Options for task switching algorithm (in order of preference): // JL_HAVE_ASM -- mostly setjmp -// JL_HAVE_ASYNCIFY -- task switching based on the binaryen asyncify transform -// JL_HAVE_UNW_CONTEXT -- hybrid of libunwind for start, setjmp for resume +// JL_HAVE_ASM && JL_HAVE_UNW_CONTEXT -- libunwind-based +// JL_HAVE_UNW_CONTEXT -- libunwind-based +// JL_HAVE_ASYNCIFY -- task switching based on the binary asyncify transform // JL_HAVE_UCONTEXT -- posix standard API, requires syscall for resume // JL_HAVE_SIGALTSTACK -- requires several syscall for start, setjmp for resume @@ -33,21 +34,25 @@ typedef win32_ucontext_t jl_ucontext_t; #if (defined(_CPU_X86_64_) || defined(_CPU_X86_) || defined(_CPU_AARCH64_) || \ defined(_CPU_ARM_) || defined(_CPU_PPC64_)) #define JL_HAVE_ASM -#elif defined(_OS_DARWIN_) +#endif +#if defined(_OS_DARWIN_) #define JL_HAVE_UNW_CONTEXT #elif defined(_OS_LINUX_) -#define JL_HAVE_UCONTEXT +#define JL_HAVE_UNW_CONTEXT #elif defined(_OS_EMSCRIPTEN_) #define JL_HAVE_ASYNCIFY -#else -#define JL_HAVE_UNW_CONTEXT +#elif !defined(JL_HAVE_ASM) +#define JL_HAVE_UNW_CONTEXT // optimistically? #endif #endif -#if defined(JL_HAVE_ASM) || defined(JL_HAVE_SIGALTSTACK) -typedef struct { + +struct jl_stack_context_t { jl_jmp_buf uc_mcontext; -} jl_ucontext_t; +}; + +#if (!defined(JL_HAVE_UNW_CONTEXT) && defined(JL_HAVE_ASM)) || defined(JL_HAVE_SIGALTSTACK) +typedef struct jl_stack_context_t jl_ucontext_t; #endif #if defined(JL_HAVE_ASYNCIFY) typedef struct { @@ -59,9 +64,13 @@ typedef struct { void *stacktop; } jl_ucontext_t; #endif -#if defined(JL_HAVE_UCONTEXT) || defined(JL_HAVE_UNW_CONTEXT) +#if defined(JL_HAVE_UNW_CONTEXT) #define UNW_LOCAL_ONLY #include +typedef unw_context_t jl_ucontext_t; +#endif +#if defined(JL_HAVE_UCONTEXT) +#include typedef ucontext_t jl_ucontext_t; #endif #endif @@ -192,7 +201,15 @@ struct _jl_tls_states_t { struct _jl_task_t *root_task; void *stackbase; size_t stacksize; - jl_ucontext_t base_ctx; // base context of stack + union { + jl_ucontext_t base_ctx; // base context of stack + // This hack is needed to support always_copy_stacks: +#ifdef _OS_WINDOWS_ + jl_ucontext_t copy_stack_ctx; +#else + struct jl_stack_context_t copy_stack_ctx; +#endif + }; jl_jmp_buf *safe_restore; // Temp storage for exception thrown in signal handler. Not rooted. struct _jl_value_t *sig_exception; diff --git a/src/partr.c b/src/partr.c index 61e28814c233e..160c504898b6a 100644 --- a/src/partr.c +++ b/src/partr.c @@ -40,7 +40,7 @@ uint64_t io_wakeup_leave; JL_DLLEXPORT int jl_set_task_tid(jl_task_t *task, int tid) JL_NOTSAFEPOINT { // Try to acquire the lock on this task. - int16_t was = task->tid; + int16_t was = jl_atomic_load_relaxed(&task->tid); if (was == tid) return 1; if (was == -1) diff --git a/src/signals-unix.c b/src/signals-unix.c index c3d93735d1168..e64aa8ba14450 100644 --- a/src/signals-unix.c +++ b/src/signals-unix.c @@ -41,6 +41,7 @@ #include "julia_assert.h" +// helper function for returning the unw_context_t inside a ucontext_t static bt_context_t *jl_to_bt_context(void *sigctx) { #ifdef __APPLE__ diff --git a/src/stackwalk.c b/src/stackwalk.c index ecff626e9a03e..23d9fb03771fe 100644 --- a/src/stackwalk.c +++ b/src/stackwalk.c @@ -713,8 +713,68 @@ void jl_print_bt_entry_codeloc(jl_bt_element_t *bt_entry) JL_NOTSAFEPOINT } } +extern bt_context_t *jl_to_bt_context(void *sigctx); + +void jl_rec_backtrace(jl_task_t *t) +{ + jl_ptls_t ptls = jl_get_ptls_states(); + ptls->bt_size = 0; + if (t == ptls->current_task) { + ptls->bt_size = rec_backtrace(ptls->bt_data, JL_MAX_BT_SIZE, 0); + return; + } + if (t->copy_stack || !t->started || t->stkbuf == NULL) + return; + int old = jl_atomic_compare_exchange(&t->tid, -1, ptls->tid); + if (old != -1 && old != ptls->tid) + return; + bt_context_t *context = NULL; +#if defined(_OS_WINDOWS_) + bt_context_t c; + memset(c, 0, sizeof(c)); + jl_jmp_buf *mctx = &t->uc_mcontext; +#if defined(_CPU_X86_64_) + c.Rbx = mctx->Rbx; + c.Rsp = mctx->Rsp; + c.Rbp = mctx->Rbp; + c.Rsi = mctx->Rsi; + c.Rdi = mctx->Rdi; + c.R12 = mctx->R12; + c.R13 = mctx->R13; + c.R14 = mctx->R14; + c.R15 = mctx->R15; + c.Rip = mctx->Rip; + c.Xmm6 = mctx->Xmm6; + c.Xmm7 = mctx->Xmm7; + c.Xmm8 = mctx->Xmm8; + c.Xmm9 = mctx->Xmm9; + c.Xmm10 = mctx->Xmm10; + c.Xmm11 = mctx->Xmm11; + c.Xmm12 = mctx->Xmm12; + c.Xmm13 = mctx->Xmm13; + c.Xmm14 = mctx->Xmm14; + c.Xmm15 = mctx->Xmm15; +#else + c.Eip = mctx->Eip; + c.Esp = mctx->Esp; + c.Ebp = mctx->Ebp; +#endif + context = &c; +#elif defined(JL_HAVE_UNW_CONTEXT) + context = &t->ctx; +#elif defined(JL_HAVE_UCONTEXT) + context = jl_to_bt_context(&t->ctx); +#else +#endif + if (context) + ptls->bt_size = rec_backtrace_ctx(ptls->bt_data, JL_MAX_BT_SIZE, context, t->gcstack, 0); + if (old == -1) + jl_atomic_store_relaxed(&t->tid, old); +} + //-------------------------------------------------- // Tools for interactive debugging in gdb + JL_DLLEXPORT void jl_gdblookup(void* ip) { jl_print_native_codeloc((uintptr_t)ip); @@ -726,9 +786,19 @@ JL_DLLEXPORT void jlbacktrace(void) JL_NOTSAFEPOINT jl_excstack_t *s = jl_get_ptls_states()->current_task->excstack; if (!s) return; - size_t bt_size = jl_excstack_bt_size(s, s->top); + size_t i, bt_size = jl_excstack_bt_size(s, s->top); jl_bt_element_t *bt_data = jl_excstack_bt_data(s, s->top); - for (size_t i = 0; i < bt_size; i += jl_bt_entry_size(bt_data + i)) { + for (i = 0; i < bt_size; i += jl_bt_entry_size(bt_data + i)) { + jl_print_bt_entry_codeloc(bt_data + i); + } +} +JL_DLLEXPORT void jlbacktracet(jl_task_t *t) +{ + jl_ptls_t ptls = jl_get_ptls_states(); + jl_rec_backtrace(t); + size_t i, bt_size = ptls->bt_size; + jl_bt_element_t *bt_data = ptls->bt_data; + for (i = 0; i < bt_size; i += jl_bt_entry_size(bt_data + i)) { jl_print_bt_entry_codeloc(bt_data + i); } } diff --git a/src/task.c b/src/task.c index 9d88306dd4eee..e51f492a8f301 100644 --- a/src/task.c +++ b/src/task.c @@ -54,10 +54,6 @@ static inline void sanitizer_finish_switch_fiber(void) {} #if defined(_OS_WINDOWS_) volatile int jl_in_stackwalk = 0; -#else -#ifdef JL_HAVE_UCONTEXT -#include -#endif #endif // empirically, jl_finish_task needs about 64k stack space to infer/run @@ -83,13 +79,9 @@ jl_sym_t *runnable_sym; extern size_t jl_page_size; static char *jl_alloc_fiber(jl_ucontext_t *t, size_t *ssize, jl_task_t *owner) JL_NOTSAFEPOINT; -STATIC_OR_JS void jl_set_fiber(jl_ucontext_t *t); -STATIC_OR_JS void jl_start_fiber(jl_ucontext_t *lastt, jl_ucontext_t *t); -STATIC_OR_JS void jl_swap_fiber(jl_ucontext_t *lastt, jl_ucontext_t *t); - -#ifdef JL_HAVE_UNW_CONTEXT -static JL_THREAD_LOCAL unw_cursor_t jl_basecursor; -#endif +STATIC_OR_JS inline void jl_set_fiber(jl_ucontext_t *t); +STATIC_OR_JS inline void jl_start_fiber(jl_ucontext_t *lastt, jl_ucontext_t *t); +STATIC_OR_JS inline void jl_swap_fiber(jl_ucontext_t *lastt, jl_ucontext_t *t); #ifdef ALWAYS_COPY_STACKS # ifndef COPY_STACKS @@ -100,7 +92,10 @@ static int always_copy_stacks = 1; static int always_copy_stacks = 0; #endif -#ifdef COPY_STACKS + +#if defined(JL_HAVE_UNW_CONTEXT) +extern int unw_getcontext(unw_context_t*) __attribute__((__nothrow__,__returns_twice__)); +#endif static void memcpy_a16(uint64_t *to, uint64_t *from, size_t nb) { @@ -152,21 +147,41 @@ static void NOINLINE JL_NORETURN restore_stack(jl_task_t *t, jl_ptls_t ptls, cha memcpy_a16((uint64_t*)_x, (uint64_t*)_y, nb); // destroys all but the current stackframe sanitizer_start_switch_fiber(t->stkbuf, t->bufsz); - jl_set_fiber(&t->ctx); +#if defined(_OS_WINDOWS_) + jl_setcontext(t->ctx); +#else + jl_longjmp(t->copy_stack_ctx.uc_mcontext, 1); +#endif abort(); // unreachable } + static void restore_stack2(jl_task_t *t, jl_ptls_t ptls, jl_task_t *lastt) { + assert(t->copy_stack && !lastt->copy_stack); size_t nb = t->copy_stack; char *_x = (char*)ptls->stackbase - nb; void *_y = t->stkbuf; assert(_x != NULL && _y != NULL); memcpy_a16((uint64_t*)_x, (uint64_t*)_y, nb); // destroys all but the current stackframe +#if defined(JL_HAVE_UNW_CONTEXT) + int r = unw_getcontext(&lastt->ctx); + if (r == 1) + return; + if (r < 0) + abort(); +#elif defined(JL_HAVE_ASM) || defined(JL_HAVE_SIGALTSTACK) || defined(_OS_WINDOWS_) + if (jl_setjmp(lastt->copy_stack_ctx.uc_mcontext, 0)) + return; +#else +#error COPY_STACKS is incompatible with this platform +#endif sanitizer_start_switch_fiber(t->stkbuf, t->bufsz); - jl_swap_fiber(&lastt->ctx, &t->ctx); - sanitizer_finish_switch_fiber(); -} +#if defined(_OS_WINDOWS_) + jl_setcontext(t->ctx); +#else + jl_longjmp(t->copy_stack_ctx.uc_mcontext, 1); #endif +} /* Rooted by the base module */ static jl_function_t *task_done_hook_func JL_GLOBALLY_ROOTED = NULL; @@ -288,7 +303,10 @@ static void ctx_switch(jl_ptls_t ptls) t->copy_stack = 1; t->sticky = 1; t->bufsz = 0; - memcpy(&t->ctx, &ptls->base_ctx, sizeof(t->ctx)); + if (always_copy_stacks) + memcpy(&t->copy_stack_ctx, &ptls->copy_stack_ctx, sizeof(t->copy_stack_ctx)); + else + memcpy(&t->ctx, &ptls->base_ctx, sizeof(t->ctx)); #else jl_throw(jl_memory_exception); #endif @@ -308,7 +326,7 @@ static void ctx_switch(jl_ptls_t ptls) #ifdef COPY_STACKS if (lastt->copy_stack) { // save the old copy-stack save_stack(ptls, lastt, pt); // allocates (gc-safepoint, and can also fail) - if (jl_setjmp(lastt->ctx.uc_mcontext, 0)) { + if (jl_setjmp(lastt->copy_stack_ctx.uc_mcontext, 0)) { sanitizer_finish_switch_fiber(); // TODO: mutex unlock the thread we just switched from return; @@ -363,11 +381,15 @@ static void ctx_switch(jl_ptls_t ptls) } else { sanitizer_start_switch_fiber(t->stkbuf, t->bufsz); - if (always_copy_stacks) { + if (t->copy_stack && always_copy_stacks) { #ifdef COPY_STACKS - jl_longjmp(ptls->base_ctx.uc_mcontext, 1); - abort(); // unreachable +#if defined(_OS_WINDOWS_) + jl_setcontext(t->ctx); +#else + jl_longjmp(t->copy_stack_ctx.uc_mcontext, 1); +#endif #endif + abort(); // unreachable } else { jl_start_fiber(lastt_ctx, &t->ctx); sanitizer_finish_switch_fiber(); @@ -597,7 +619,9 @@ JL_DLLEXPORT jl_task_t *jl_new_task(jl_function_t *start, jl_value_t *completion memset(&t->ctx, 0, sizeof(t->ctx)); #endif #ifdef COPY_STACKS - if (t->copy_stack) + if (always_copy_stacks) + memcpy(&t->copy_stack_ctx, &ptls->copy_stack_ctx, sizeof(t->copy_stack_ctx)); + else if (t->copy_stack) memcpy(&t->ctx, &ptls->base_ctx, sizeof(t->ctx)); #endif return t; @@ -661,10 +685,13 @@ void jl_init_tasks(void) JL_GC_DISABLED else if (!strcmp(acs, "0") || !strcmp(acs, "no")) always_copy_stacks = 0; else { - jl_printf(JL_STDERR, "invalid JULIA_COPY_STACKS value: %s\n", acs); - exit(1); + jl_errorf("invalid JULIA_COPY_STACKS value: %s", acs); } } +#ifndef COPY_STACKS + if (always_copy_stacks) + jl_error(JL_STDERR, "Julia built without COPY_STACKS support"); +#endif } STATIC_OR_JS void NOINLINE JL_NORETURN start_task(void) @@ -723,7 +750,6 @@ skip_pop_exception:; #if defined(JL_HAVE_UCONTEXT) #ifdef _OS_WINDOWS_ #define setcontext jl_setcontext -#define getcontext jl_getcontext #define swapcontext jl_swapcontext #define makecontext jl_makecontext #endif @@ -762,112 +788,128 @@ static void jl_set_fiber(jl_ucontext_t *t) { setcontext(t); } -static void jl_init_basefiber(size_t ssize) -{ - jl_ptls_t ptls = jl_get_ptls_states(); - char *stkbuf = jl_alloc_fiber(&ptls->base_ctx, &ssize, NULL); - ptls->stackbase = stkbuf + ssize; - ptls->stacksize = ssize; -} #endif -#if defined(JL_HAVE_UNW_CONTEXT) -static void start_basefiber(void) -{ - jl_ptls_t ptls = jl_get_ptls_states(); - if (jl_setjmp(ptls->base_ctx.uc_mcontext, 0)) - start_task(); // sanitizer_finish_switch_fiber is part of start_task - sanitizer_start_switch_fiber(jl_root_task->stkbuf, jl_root_task->bufsz); - jl_longjmp(jl_root_task->ctx.uc_mcontext, 1); - abort(); // unreachable -} -#if defined(_CPU_X86_) || defined(_CPU_X86_64_) -#define PUSH_RET(ctx, stk) \ - do { \ - stk -= sizeof(uintptr_t); \ - *(uintptr_t*)stk = 0; /* push null RIP/EIP onto the stack */ \ - } while (0) -#elif defined(_CPU_ARM_) -#define PUSH_RET(ctx, stk) \ - unw_set_reg(ctx, UNW_ARM_R14, 0) /* put NULL into the LR */ -#else -#error please define how to simulate a CALL on this platform -#endif -static char *jl_alloc_fiber(unw_context_t *t, size_t *ssize, jl_task_t *owner) +#if defined(JL_HAVE_UNW_CONTEXT) || defined(JL_HAVE_ASM) +static char *jl_alloc_fiber(jl_ucontext_t *t, size_t *ssize, jl_task_t *owner) { char *stkbuf = (char*)jl_malloc_stack(ssize, owner); if (stkbuf == NULL) return NULL; - char *stk = stkbuf; - stk += *ssize; - PUSH_RET(&jl_basecursor, stk); - if (unw_set_reg(&jl_basecursor, UNW_REG_SP, (uintptr_t)stk) != 0) { - jl_free_stack((void*)stkbuf, *ssize); - jl_error("unw_set_reg UNW_REG_SP failed"); - } - uintptr_t fn; - if (t == &ptls->base_ctx) - fn = (uintptr_t)&start_basefiber; - else - fn = (uintptr_t)&start_task; - if (unw_set_reg(&jl_basecursor, UNW_REG_IP, fn) != 0) { - jl_free_stack((void*)stkbuf, *ssize); - jl_error("unw_set_reg UNW_REG_IP failed"); - } +#ifndef __clang_analyzer__ + ((char**)t)[0] = stkbuf; // stash the stack pointer somewhere for start_fiber + ((size_t*)t)[1] = *ssize; // stash the stack size somewhere for start_fiber +#endif return stkbuf; } -static void jl_start_fiber(unw_context_t *lastt, unw_context_t *t) +#endif + +#if defined(JL_HAVE_UNW_CONTEXT) +#if defined(_CPU_X86_64_) +#define UNW_REG_RETURN UNW_X86_64_RAX +#elif defined(_CPU_X86_) +#define UNW_REG_RETURN UNW_X86_EAX +#elif defined(_CPU_AARCH64_) +#define UNW_REG_RETURN UNW_AARCH64_X0 +#elif defined(_CPU_ARM_) +#define UNW_REG_RETURN UNW_ARM_R0 +#elif defined(_CPU_PPC64_) +#define UNW_REG_RETURN UNW_PPC64_R3 +#else +#error +#endif +static inline void jl_unw_swapcontext(unw_context_t *old, unw_cursor_t *c) { - if (lastt && jl_setjmp(lastt->uc_mcontext, 0)) + if (unw_set_reg(c, UNW_REG_RETURN, 1)) + abort(); + int r = unw_getcontext(old); + if (r == 1) return; - unw_resume(&jl_basecursor); // (doesn't return) + if (r < 0) + abort(); + unw_resume(c); } static void jl_swap_fiber(unw_context_t *lastt, unw_context_t *t) +{ + unw_cursor_t c; + if (unw_init_local(&c, t)) + abort(); + jl_unw_swapcontext(lastt, &c); +} +static void jl_set_fiber(unw_context_t *t) +{ + unw_cursor_t c; + if (unw_init_local(&c, t)) + abort(); + if (unw_set_reg(&c, UNW_REG_RETURN, 1)) + abort(); + unw_resume(&c); +} +#elif defined(JL_HAVE_ASM) +static void jl_swap_fiber(jl_ucontext_t *lastt, jl_ucontext_t *t) { if (jl_setjmp(lastt->uc_mcontext, 0)) return; jl_longjmp(t->uc_mcontext, 1); // (doesn't return) } -static void jl_set_fiber(unw_context_t *t) +static void jl_set_fiber(jl_ucontext_t *t) { jl_longjmp(t->uc_mcontext, 1); } -static void jl_init_basefiber(size_t ssize) -{ - int r = unw_getcontext(&ptls->base_ctx); - if (r != 0) - jl_error("unw_getcontext failed"); - r = unw_init_local(&jl_basecursor, &ptls->base_ctx); - if (r != 0) - jl_error("unw_init_local failed"); -#ifdef COPY_STACKS - jl_ptls_t ptls = jl_get_ptls_states(); - char *stkbuf = jl_alloc_fiber(&ptls->base_ctx, &ssize, NULL); - ptls->stackbase = stkbuf + ssize; - ptls->stacksize = ssize; - sanitizer_start_switch_fiber(stkbuf, sksize); - jl_start_fiber(jl_root_task, &ptls->base_ctx); // finishes initializing jl_basectx - sanitizer_finish_switch_fiber(); #endif + +#if defined(JL_HAVE_UNW_CONTEXT) && !defined(JL_HAVE_ASM) +#if defined(_CPU_X86_) || defined(_CPU_X86_64_) +#define PUSH_RET(ctx, stk) \ + do { \ + stk -= sizeof(uintptr_t); \ + *(uintptr_t*)stk = 0; /* push null RIP/EIP onto the stack */ \ + } while (0) +#elif defined(_CPU_ARM_) +#define PUSH_RET(ctx, stk) \ + unw_set_reg(ctx, UNW_ARM_R14, 0) /* put NULL into the LR */ +#else +#error please define how to simulate a CALL on this platform +#endif +static void jl_start_fiber(unw_context_t *lastt, unw_context_t *t) +{ + unw_cursor_t c; + char *stk = ((char**)t)[0]; + size_t ssize = ((size_t*)t)[1]; + uintptr_t fn = (uintptr_t)&start_task; + stk += ssize; + if (unw_getcontext(t)) + abort(); + if (unw_init_local(&c, t)) + abort(); + PUSH_RET(&c, stk); + if (unw_set_reg(&c, UNW_REG_SP, (uintptr_t)stk)) + abort(); + if (unw_set_reg(&c, UNW_REG_IP, fn)) + abort(); + if (lastt) + jl_unw_swapcontext(lastt, &c); + else + unw_resume(&c); // (doesn't return) } #endif #if defined(JL_HAVE_ASM) -static char *jl_alloc_fiber(jl_ucontext_t *t, size_t *ssize, jl_task_t *owner) -{ - char *stkbuf = (char*)jl_malloc_stack(ssize, owner); - if (stkbuf == NULL) - return NULL; -#ifndef __clang_analyzer__ - ((char**)t)[0] = stkbuf; // stash the stack pointer somewhere for start_fiber - ((size_t*)t)[1] = *ssize; // stash the stack size somewhere for start_fiber -#endif - return stkbuf; -} static void jl_start_fiber(jl_ucontext_t *lastt, jl_ucontext_t *t) { +#ifdef JL_HAVE_UNW_CONTEXT + if (lastt) { + int r = unw_getcontext(lastt); + if (r == 1) + return; + if (r < 0) + abort(); + } +#else if (lastt && jl_setjmp(lastt->uc_mcontext, 0)) return; +#endif + char *stk = ((char**)t)[0]; size_t ssize = ((size_t*)t)[1]; uintptr_t fn = (uintptr_t)&start_task; @@ -936,32 +978,13 @@ static void jl_start_fiber(jl_ucontext_t *lastt, jl_ucontext_t *t) #endif __builtin_unreachable(); } -static void jl_swap_fiber(jl_ucontext_t *lastt, jl_ucontext_t *t) -{ - if (jl_setjmp(lastt->uc_mcontext, 0)) - return; - jl_longjmp(t->uc_mcontext, 1); // (doesn't return) -} -static void jl_set_fiber(jl_ucontext_t *t) -{ - jl_longjmp(t->uc_mcontext, 1); -} -static void jl_init_basefiber(size_t ssize) -{ -#ifdef COPY_STACKS - jl_ptls_t ptls = jl_get_ptls_states(); - char *stkbuf = jl_alloc_fiber(&ptls->base_ctx, &ssize, NULL); - ptls->stackbase = stkbuf + ssize; - ptls->stacksize = ssize; -#endif -} #endif #if defined(JL_HAVE_SIGALTSTACK) static void start_basefiber(void) { jl_ptls_t ptls = jl_get_ptls_states(); - if (jl_setjmp(ptls->base_ctx.uc_mcontext, 0)) + if (jl_setjmp(ptls->base_ctx, 0)) start_task(); // sanitizer_finish_switch_fiber is part of start_task } static char *jl_alloc_fiber(jl_ucontext_t *t, size_t *ssize, jl_task_t *owner) @@ -1014,8 +1037,10 @@ static char *jl_alloc_fiber(jl_ucontext_t *t, size_t *ssize, jl_task_t *owner) jl_free_stack(stk, *ssize); jl_error("sigprocmask failed"); } - memcpy(&t, &ptls->base_ctx, sizeof(ptls->base_ctx)); - memcpy(&ptls->base_ctx, &base_ctx, sizeof(ptls->base_ctx)); + if (&ptls->base_ctx != t) { + memcpy(t, &ptls->base_ctx, sizeof(ptls->base_ctx)); + memcpy(&ptls->base_ctx, &base_ctx, sizeof(ptls->base_ctx)); // restore COPY_STACKS context + } return (char*)stk; } static void jl_start_fiber(jl_ucontext_t *lastt, jl_ucontext_t *t) @@ -1034,22 +1059,10 @@ static void jl_set_fiber(jl_ucontext_t *t) { jl_longjmp(t->uc_mcontext, 1); } -static void jl_init_basefiber(size_t ssize) -{ -#ifdef COPY_STACKS - jl_ptls_t ptls = jl_get_ptls_states(); - char *stkbuf = jl_alloc_fiber(jl_root_task, &ssize, NULL); - ptls->stackbase = stkbuf + ssize; - ptls->stacksize = ssize; - memcpy(&ptls->base_ctx, &jl_root_task->ctx, sizeof(ptls->base_ctx)); -#endif } #endif #if defined(JL_HAVE_ASYNCIFY) -static void jl_init_basefiber(size_t ssize) -{ -} static char *jl_alloc_fiber(jl_ucontext_t *t, size_t *ssize, jl_task_t *owner) JL_NOTSAFEPOINT { void *stk = jl_malloc_stack(ssize, owner); @@ -1108,16 +1121,25 @@ void jl_init_root_task(void *stack_lo, void *stack_hi) arraylist_new(&ptls->current_task->locks, 0); #ifdef COPY_STACKS + // initialize the base_ctx from which all future copy_stacks will be copies if (always_copy_stacks) { + // when this is set, we will attempt to corrupt the process stack to switch tasks, + // although this is unreliable, and thus not recommended ptls->stackbase = stack_hi; ptls->stacksize = ssize; - if (jl_setjmp(ptls->base_ctx.uc_mcontext, 0)) +#ifdef _OS_WINDOWS_ + ptls->copy_stack_ctx.uc_stack.ss_sp = stack_hi; + ptls->copy_stack_ctx.uc_stack.ss_size = ssize; +#endif + if (jl_setjmp(ptls->copy_stack_ctx.uc_mcontext, 0)) start_task(); // sanitizer_finish_switch_fiber is part of start_task return; } + ssize = JL_STACK_SIZE; + char *stkbuf = jl_alloc_fiber(&ptls->base_ctx, &ssize, NULL); + ptls->stackbase = stkbuf + ssize; + ptls->stacksize = ssize; #endif - - jl_init_basefiber(JL_STACK_SIZE); } JL_DLLEXPORT int jl_is_task_started(jl_task_t *t) @@ -1174,6 +1196,7 @@ JL_DLLEXPORT void jl_gdb_dump_threadinfo(void) } #endif + #ifdef __cplusplus } #endif