https://github.com/JuliaLang/julia
Tip revision: 8bc794d1aee3c65a75c4fdb129035b4682c1cce8 authored by Keno Fischer on 12 May 2018, 19:38:04 UTC
[NewOptimizer] Fix codegen test
[NewOptimizer] Fix codegen test
Tip revision: 8bc794d
task.c
// This file is a part of Julia. License is MIT: https://julialang.org/license
/*
task.c
lightweight processes (symmetric coroutines)
*/
//// enable this for ifndef COPY_STACKS to work on linux
//#ifdef _FORTIFY_SOURCE
//// disable __longjmp_chk validation so that we can jump between stacks
//#pragma push_macro("_FORTIFY_SOURCE")
//#undef _FORTIFY_SOURCE
//#include <setjmp.h>
//#pragma pop_macro("_FORTIFY_SOURCE")
//#endif
#include "platform.h"
#include <stdlib.h>
#include <string.h>
#include <signal.h>
#include <errno.h>
#include <inttypes.h>
#include "julia.h"
#include "julia_internal.h"
#include "threading.h"
#include "julia_assert.h"
#ifdef __cplusplus
extern "C" {
#endif
#if defined(_OS_WINDOWS_)
#include <winbase.h>
#include <malloc.h>
volatile int jl_in_stackwalk = 0;
#else
#include <unistd.h>
#include <sys/mman.h> // for mprotect
#include <dlfcn.h> // for dladdr
#endif
/* This probing code is derived from Douglas Jones' user thread library */
/* true if stack grows up, false if down */
static int _stack_grows_up;
/* the offset of the beginning of the stack frame in a function */
static size_t _frame_offset;
struct _probe_data {
intptr_t low_bound; /* below probe on stack */
intptr_t probe_local; /* local to probe on stack */
intptr_t high_bound; /* above probe on stack */
intptr_t prior_local; /* value of probe_local from earlier call */
jl_jmp_buf probe_env; /* saved environment of probe */
jl_jmp_buf probe_sameAR; /* second environment saved by same call */
jl_jmp_buf probe_samePC; /* environment saved on previous call */
jl_jmp_buf * ref_probe; /* switches between probes */
};
static void boundhigh(struct _probe_data *p)
{
int c;
p->high_bound = (intptr_t)&c;
}
static void probe(struct _probe_data *p)
{
p->prior_local = p->probe_local;
p->probe_local = (intptr_t)&p;
jl_setjmp( *(p->ref_probe), 0 );
p->ref_probe = &p->probe_env;
jl_setjmp( p->probe_sameAR, 0 );
boundhigh(p);
}
static void boundlow(struct _probe_data *p)
{
p->low_bound = (intptr_t)&p;
probe(p);
}
// we need this function to exist so we can measure its stack frame!
static void NOINLINE_DECL(fill(struct _probe_data *p));
static void fill(struct _probe_data *p)
{
boundlow(p);
}
static void _infer_direction_from(int *first_addr)
{
int second;
_stack_grows_up = (first_addr < &second);
}
static void _infer_stack_direction(void)
{
int first;
_infer_direction_from(&first);
}
static int mangle_pointers;
static void _probe_arch(void)
{
struct _probe_data p;
memset(p.probe_env, 0, sizeof(jl_jmp_buf));
memset(p.probe_sameAR, 0, sizeof(jl_jmp_buf));
memset(p.probe_samePC, 0, sizeof(jl_jmp_buf));
p.ref_probe = &p.probe_samePC;
_infer_stack_direction();
/* do a probe with filler on stack */
fill(&p);
/* do a probe without filler */
boundlow(&p);
#if defined(__linux__) && defined(__i386__)
jl_ptls_t ptls = jl_get_ptls_states();
char **s = (char**)p.ref_probe;
mangle_pointers = !(s[4] > ptls->stack_lo &&
s[4] < ptls->stack_hi);
#elif defined(__linux__) && defined(__x86_64__)
jl_ptls_t ptls = jl_get_ptls_states();
char **s = (char**)p.ref_probe;
mangle_pointers = !(s[6] > ptls->stack_lo &&
s[6] < ptls->stack_hi);
#else
mangle_pointers = 0;
#endif
intptr_t prior_diff = p.probe_local - p.prior_local;
_frame_offset = labs(prior_diff);
}
/* end probing code */
static jl_sym_t *done_sym;
static jl_sym_t *failed_sym;
static jl_sym_t *runnable_sym;
extern size_t jl_page_size;
jl_datatype_t *jl_task_type;
#ifdef COPY_STACKS
#if (defined(_CPU_X86_64_) || defined(_CPU_X86_) || defined(_CPU_AARCH64_) || defined(_CPU_ARM_)) && !defined(_COMPILER_MICROSOFT_)
#define ASM_COPY_STACKS
#endif
static void NOINLINE save_stack(jl_ptls_t ptls, jl_task_t *lastt, jl_task_t **pt)
{
if (lastt->state == done_sym || lastt->state == failed_sym)
return;
char *frame_addr = (char*)jl_get_frame_addr();
char *stackbase = (char*)ptls->stackbase;
size_t nb = stackbase > frame_addr ? stackbase - frame_addr : 0;
char *buf;
if (lastt->stkbuf == NULL || lastt->bufsz < nb) {
buf = (char*)jl_gc_alloc_buf(ptls, nb);
lastt->stkbuf = buf;
lastt->bufsz = nb;
}
else {
buf = (char*)lastt->stkbuf;
}
lastt->ssize = nb;
*pt = lastt; // clear the gc-root for the target task before copying the stack for saving
memcpy(buf, frame_addr, nb);
// this task's stack could have been modified after
// it was marked by an incremental collection
// move the barrier back instead of walking it again here
jl_gc_wb_back(lastt);
}
static void NOINLINE restore_stack(jl_ptls_t ptls, char *p)
{
jl_task_t *t = ptls->current_task;
char *_x = (char*)ptls->stackbase - t->ssize;
if (!p) {
p = _x;
if ((char*)&_x > _x) {
p = (char*)alloca((char*)&_x - _x);
}
restore_stack(ptls, p); // pass p to ensure the compiler can't tailcall this
}
assert(t->stkbuf != NULL);
memcpy(_x, t->stkbuf, t->ssize); // destroys all but the current stackframe
jl_longjmp(t->ctx, 1);
}
#endif
static jl_function_t *task_done_hook_func=NULL;
static void JL_NORETURN finish_task(jl_task_t *t, jl_value_t *resultval)
{
jl_ptls_t ptls = jl_get_ptls_states();
JL_SIGATOMIC_BEGIN();
if (t->exception != jl_nothing)
t->state = failed_sym;
else
t->state = done_sym;
t->result = resultval;
jl_gc_wb(t, t->result);
// TODO: early free of t->stkbuf
#ifdef COPY_STACKS
t->stkbuf = (void*)(intptr_t)-1;
#endif
// ensure that state is cleared
ptls->in_finalizer = 0;
ptls->in_pure_callback = 0;
jl_get_ptls_states()->world_age = jl_world_counter;
if (ptls->tid != 0) {
// For now, only thread 0 runs the task scheduler.
// The others return to the thread loop
ptls->root_task->result = jl_nothing;
jl_task_t *task = ptls->root_task;
jl_switchto(&task);
gc_debug_critical_error();
abort();
}
if (task_done_hook_func == NULL) {
task_done_hook_func = (jl_function_t*)jl_get_global(jl_base_module,
jl_symbol("task_done_hook"));
}
if (task_done_hook_func != NULL) {
jl_value_t *args[2] = {task_done_hook_func, (jl_value_t*)t};
JL_TRY {
jl_apply(args, 2);
}
JL_CATCH {
jl_no_exc_handler(jl_exception_in_transit);
}
}
gc_debug_critical_error();
abort();
}
static void record_backtrace(void)
{
jl_ptls_t ptls = jl_get_ptls_states();
ptls->bt_size = rec_backtrace(ptls->bt_data, JL_MAX_BT_SIZE);
}
static void NOINLINE JL_NORETURN JL_USED_FUNC start_task(void)
{
jl_ptls_t ptls = jl_get_ptls_states();
// this runs the first time we switch to a task
jl_task_t *t = ptls->current_task;
jl_value_t *res;
t->started = 1;
if (t->exception != jl_nothing) {
record_backtrace();
res = t->exception;
}
else {
JL_TRY {
if (ptls->defer_signal) {
ptls->defer_signal = 0;
jl_sigint_safepoint(ptls);
}
JL_TIMING(ROOT);
ptls->world_age = jl_world_counter;
res = jl_apply(&t->start, 1);
}
JL_CATCH {
res = ptls->exception_in_transit;
t->exception = res;
jl_gc_wb(t, res);
}
}
finish_task(t, res);
gc_debug_critical_error();
abort();
}
#ifdef COPY_STACKS
void NOINLINE jl_set_base_ctx(char *__stk)
{
jl_ptls_t ptls = jl_get_ptls_states();
ptls->stackbase = (char*)(((uintptr_t)__stk + sizeof(*__stk))&-16); // also ensures stackbase is 16-byte aligned
#ifndef ASM_COPY_STACKS
if (jl_setjmp(ptls->base_ctx, 0)) {
start_task();
}
#endif
}
#endif
JL_DLLEXPORT void julia_init(JL_IMAGE_SEARCH rel)
{
// keep this function small, since we want to keep the stack frame
// leading up to this also quite small
#ifdef COPY_STACKS
char __stk;
jl_set_base_ctx(&__stk); // separate function, to record the size of a stack frame
#endif
_julia_init(rel);
}
static void ctx_switch(jl_ptls_t ptls, jl_task_t **pt)
{
jl_task_t *t = *pt;
assert(t != ptls->current_task);
#ifdef ENABLE_TIMINGS
jl_timing_block_t *blk = ptls->current_task->timing_stack;
if (blk)
jl_timing_block_stop(blk);
#endif
if (!jl_setjmp(ptls->current_task->ctx, 0)) {
// backtraces don't survive task switches, see e.g. issue #12485
ptls->bt_size = 0;
jl_task_t *lastt = ptls->current_task;
#ifdef COPY_STACKS
save_stack(ptls, lastt, pt); // allocates (gc-safepoint, and can also fail)
#else
*pt = lastt; // can't fail after here: clear the gc-root for the target task now
#endif
// set up global state for new task
lastt->gcstack = ptls->pgcstack;
lastt->world_age = ptls->world_age;
ptls->pgcstack = t->gcstack;
ptls->world_age = t->world_age;
#ifdef JULIA_ENABLE_THREADING
// If the current task is not holding any locks, free the locks list
// so that it can be GC'd without leaking memory
arraylist_t *locks = &ptls->current_task->locks;
if (locks->len == 0 && locks->items != locks->_space) {
arraylist_free(locks);
arraylist_new(locks, 0);
}
#endif
// restore task's current module, looking at parent tasks
// if it hasn't set one.
jl_task_t *last = t;
while (last->current_module == NULL && last != ptls->root_task) {
last = last->parent;
}
if (last->current_module != NULL) {
ptls->current_module = last->current_module;
}
ptls->current_task = t;
#ifdef COPY_STACKS
if (t->stkbuf) {
restore_stack(ptls, NULL);
}
else {
#ifdef ASM_COPY_STACKS
// Start the task without `setjmp`
void *stackbase = ptls->stackbase;
#ifdef _CPU_X86_64_
#ifdef _OS_WINDOWS_
stackbase = (char*)stackbase - 0x20;
#endif
asm(" movq %0, %%rsp;\n"
" xorq %%rbp, %%rbp;\n"
" push %%rbp;\n" // instead of RSP
" jmp %P1;\n" // call `start_task` with fake stack frame
" ud2"
: : "r"(stackbase), "i"(&start_task) : "memory" );
#elif defined(_CPU_X86_)
asm(" movl %0, %%esp;\n"
" xorl %%ebp, %%ebp;\n"
" push %%ebp;\n" // instead of ESP
" jmp %P1;\n" // call `start_task` with fake stack frame
" ud2"
: : "r"(stackbase), "X"(&start_task) : "memory" );
#elif defined(_CPU_AARCH64_)
asm(" mov sp, %0;\n"
" mov x29, xzr;\n" // Clear link register (x29) and frame pointer
" mov x30, xzr;\n" // (x30) to terminate unwinder.
" b %1;\n" // call `start_task` with fake stack frame
" brk #0x1" // abort
: : "r"(stackbase), "S"(&start_task) : "memory" );
#elif defined(_CPU_ARM_)
// A "i" constraint on `&start_task` works only on clang and not on GCC.
asm(" mov sp, %0;\n"
" mov lr, #0;\n" // Clear link register (lr) and frame pointer
" mov fp, #0;\n" // (fp) to terminate unwinder.
" b start_task;\n" // call `start_task` with fake stack frame
" udf #0" // abort
: : "r"(stackbase) : "memory" );
#else
#error ASM_COPY_STACKS not supported on this cpu architecture
#endif
#else // ASM_COPY_STACKS
jl_longjmp(ptls->base_ctx, 1);
#endif
jl_unreachable();
}
#else
jl_longjmp(t->ctx, 1);
#endif
}
#ifdef ENABLE_TIMINGS
assert(blk == jl_current_task->timing_stack);
if (blk)
jl_timing_block_start(blk);
#endif
}
JL_DLLEXPORT void jl_switchto(jl_task_t **pt)
{
jl_ptls_t ptls = jl_get_ptls_states();
jl_task_t *t = *pt;
if (t == ptls->current_task) {
return;
}
if (t->state == done_sym || t->state == failed_sym ||
(t->stkbuf == (void*)(intptr_t)-1)) {
ptls->current_task->exception = t->exception;
ptls->current_task->result = t->result;
return;
}
if (ptls->in_finalizer)
jl_error("task switch not allowed from inside gc finalizer");
if (ptls->in_pure_callback)
jl_error("task switch not allowed from inside staged nor pure functions");
sig_atomic_t defer_signal = ptls->defer_signal;
int8_t gc_state = jl_gc_unsafe_enter(ptls);
ctx_switch(ptls, pt);
jl_gc_unsafe_leave(ptls, gc_state);
sig_atomic_t other_defer_signal = ptls->defer_signal;
ptls->defer_signal = defer_signal;
if (other_defer_signal && !defer_signal)
jl_sigint_safepoint(ptls);
}
#ifndef COPY_STACKS
#ifdef __linux__
#if defined(__i386__)
static intptr_t ptr_mangle(intptr_t p)
{
intptr_t ret;
asm(" movl %1, %%eax;\n"
" xorl %%gs:0x18, %%eax;"
" roll $9, %%eax;"
" movl %%eax, %0;"
: "=r"(ret) : "r"(p) : "%eax");
return ret;
}
static intptr_t ptr_demangle(intptr_t p)
{
intptr_t ret;
asm(" movl %1, %%eax;\n"
" rorl $9, %%eax;"
" xorl %%gs:0x18, %%eax;"
" movl %%eax, %0;"
: "=r"(ret) : "r"(p) : "%eax" );
return ret;
}
#elif defined(__x86_64__)
static intptr_t ptr_mangle(intptr_t p)
{
intptr_t ret;
asm(" movq %1, %%rax;\n"
" xorq %%fs:0x30, %%rax;"
" rolq $17, %%rax;"
" movq %%rax, %0;"
: "=r"(ret) : "r"(p) : "%rax");
return ret;
}
static intptr_t ptr_demangle(intptr_t p)
{
intptr_t ret;
asm(" movq %1, %%rax;\n"
" rorq $17, %%rax;"
" xorq %%fs:0x30, %%rax;"
" movq %%rax, %0;"
: "=r"(ret) : "r"(p) : "%rax" );
return ret;
}
#endif
#endif //__linux__
/* rebase any values in saved state to the new stack */
static void rebase_state(jl_jmp_buf *ctx, intptr_t local_sp, intptr_t new_sp)
{
intptr_t *s = (intptr_t*)ctx;
intptr_t diff = new_sp - local_sp; /* subtract old base, and add new base */
#if defined(__linux__) && defined(__i386__)
s[3] += diff;
if (mangle_pointers)
s[4] = ptr_mangle(ptr_demangle(s[4])+diff);
else
s[4] += diff;
#elif defined(__linux__) && defined(__x86_64__)
if (mangle_pointers) {
s[1] = ptr_mangle(ptr_demangle(s[1])+diff);
s[6] = ptr_mangle(ptr_demangle(s[6])+diff);
}
else {
s[1] += diff;
s[6] += diff;
}
#elif defined(__APPLE__) && defined(__i386__)
s[8] += diff;
s[9] += diff;
#elif defined(__APPLE__) && defined(__x86_64__)
s[1] += diff;
s[2] += diff;
#else
#error "COPY_STACKS must be defined on this platform."
#endif
}
static void init_task(jl_task_t *t, char *stack)
{
if (jl_setjmp(t->ctx, 0)) {
start_task();
}
// this runs when the task is created
intptr_t local_sp = (intptr_t)&t;
intptr_t new_sp = (intptr_t)stack + t->ssize - _frame_offset;
#ifdef _P64
// SP must be 16-byte aligned
new_sp = new_sp&-16;
local_sp = local_sp&-16;
#endif
memcpy((void*)new_sp, (void*)local_sp, _frame_offset);
rebase_state(&t->ctx, local_sp, new_sp);
}
#endif /* !COPY_STACKS */
jl_timing_block_t *jl_pop_timing_block(jl_timing_block_t *cur_block);
JL_DLLEXPORT JL_NORETURN void jl_no_exc_handler(jl_value_t *e)
{
jl_printf(JL_STDERR, "fatal: error thrown and no exception handler available.\n");
jl_static_show(JL_STDERR, e);
jl_printf(JL_STDERR, "\n");
jlbacktrace();
jl_exit(1);
}
// yield to exception handler
void JL_NORETURN throw_internal(jl_value_t *e)
{
jl_ptls_t ptls = jl_get_ptls_states();
ptls->io_wait = 0;
if (ptls->safe_restore)
jl_longjmp(*ptls->safe_restore, 1);
jl_gc_unsafe_enter(ptls);
assert(e != NULL);
ptls->exception_in_transit = e;
jl_handler_t *eh = ptls->current_task->eh;
if (eh != NULL) {
#ifdef ENABLE_TIMINGS
jl_timing_block_t *cur_block = ptls->current_task->timing_stack;
while (cur_block && eh->timing_stack != cur_block) {
cur_block = jl_pop_timing_block(cur_block);
}
assert(cur_block == eh->timing_stack);
#endif
jl_longjmp(eh->eh_ctx, 1);
}
else {
jl_no_exc_handler(e);
}
assert(0);
}
// record backtrace and raise an error
JL_DLLEXPORT void jl_throw(jl_value_t *e)
{
jl_ptls_t ptls = jl_get_ptls_states();
assert(e != NULL);
if (!ptls->safe_restore)
record_backtrace();
throw_internal(e);
}
JL_DLLEXPORT void jl_rethrow(void)
{
jl_ptls_t ptls = jl_get_ptls_states();
throw_internal(ptls->exception_in_transit);
}
JL_DLLEXPORT void jl_rethrow_other(jl_value_t *e)
{
throw_internal(e);
}
JL_DLLEXPORT jl_task_t *jl_new_task(jl_function_t *start, size_t ssize)
{
jl_ptls_t ptls = jl_get_ptls_states();
size_t pagesz = jl_page_size;
jl_task_t *t = (jl_task_t*)jl_gc_alloc(ptls, sizeof(jl_task_t),
jl_task_type);
#ifndef COPY_STACKS
if (ssize == 0) // unspecified -- pick some default size
ssize = 1*1024*1024; // 1M (for now)
#endif
ssize = LLT_ALIGN(ssize, pagesz);
t->ssize = ssize;
t->current_module = NULL;
t->parent = ptls->current_task;
t->tls = jl_nothing;
t->state = runnable_sym;
t->start = start;
t->result = jl_nothing;
t->donenotify = jl_nothing;
t->exception = jl_nothing;
t->backtrace = jl_nothing;
// Inherit logger state from parent task
t->logstate = ptls->current_task->logstate;
// there is no active exception handler available on this stack yet
t->eh = NULL;
t->gcstack = NULL;
t->stkbuf = NULL;
t->tid = 0;
t->started = 0;
#ifdef ENABLE_TIMINGS
t->timing_stack = NULL;
#endif
#ifdef COPY_STACKS
t->bufsz = 0;
#else
JL_GC_PUSH1(&t);
size_t stkbuf_sz = ssize + pagesz + (pagesz - 1);
char *stk = (char*)jl_gc_alloc_buf(ptls, stkbuf_sz);
t->stkbuf = stk;
jl_gc_wb_buf(t, t->stkbuf, stkbuf_sz);
stk = (char*)LLT_ALIGN((uintptr_t)stk, pagesz);
// add a guard page to detect stack overflow
if (mprotect(stk, pagesz-1, PROT_NONE) == -1)
jl_errorf("mprotect: %s", strerror(errno));
stk += pagesz;
init_task(t, stk);
jl_gc_add_finalizer((jl_value_t*)t, jl_unprotect_stack_func);
JL_GC_POP();
#endif
#ifdef JULIA_ENABLE_THREADING
arraylist_new(&t->locks, 0);
#endif
return t;
}
#ifndef COPY_STACKS
static void jl_unprotect_stack(jl_task_t *t)
{
size_t pagesz = jl_page_size;
char *stk = (char*)LLT_ALIGN((uintptr_t)t->stkbuf, pagesz);
// unprotect stack so it can be reallocated for something else
mprotect(stk, pagesz - 1, PROT_READ|PROT_WRITE);
}
#endif
JL_DLLEXPORT jl_value_t *jl_get_current_task(void)
{
jl_ptls_t ptls = jl_get_ptls_states();
return (jl_value_t*)ptls->current_task;
}
jl_function_t *jl_unprotect_stack_func;
// Do one-time initializations for task system
void jl_init_tasks(void)
{
_probe_arch();
jl_task_type = (jl_datatype_t*)
jl_new_datatype(jl_symbol("Task"),
NULL,
jl_any_type,
jl_emptysvec,
jl_perm_symsvec(9,
"parent",
"storage",
"state",
"donenotify",
"result",
"exception",
"backtrace",
"logstate",
"code"),
jl_svec(9,
jl_any_type,
jl_any_type,
jl_sym_type,
jl_any_type,
jl_any_type,
jl_any_type,
jl_any_type,
jl_any_type,
jl_any_type),
0, 1, 8);
jl_svecset(jl_task_type->types, 0, (jl_value_t*)jl_task_type);
done_sym = jl_symbol("done");
failed_sym = jl_symbol("failed");
runnable_sym = jl_symbol("runnable");
#ifndef COPY_STACKS
jl_unprotect_stack_func = jl_box_voidpointer(&jl_unprotect_stack);
#endif
}
// Initialize a root task using the given stack.
void jl_init_root_task(void *stack, size_t ssize)
{
jl_ptls_t ptls = jl_get_ptls_states();
ptls->current_task = (jl_task_t*)jl_gc_alloc(ptls, sizeof(jl_task_t),
jl_task_type);
#ifdef COPY_STACKS
ptls->current_task->ssize = 0; // size of saved piece
ptls->current_task->bufsz = 0;
ptls->current_task->stkbuf = NULL;
#else
ptls->current_task->ssize = ssize;
ptls->current_task->stkbuf = stack;
#endif
ptls->current_task->started = 1;
ptls->current_task->parent = ptls->current_task;
ptls->current_task->current_module = ptls->current_module;
ptls->current_task->tls = jl_nothing;
ptls->current_task->state = runnable_sym;
ptls->current_task->start = NULL;
ptls->current_task->result = jl_nothing;
ptls->current_task->donenotify = jl_nothing;
ptls->current_task->exception = jl_nothing;
ptls->current_task->backtrace = jl_nothing;
ptls->current_task->logstate = jl_nothing;
ptls->current_task->eh = NULL;
ptls->current_task->gcstack = NULL;
ptls->current_task->tid = ptls->tid;
#ifdef JULIA_ENABLE_THREADING
arraylist_new(&ptls->current_task->locks, 0);
#endif
ptls->root_task = ptls->current_task;
ptls->exception_in_transit = (jl_value_t*)jl_nothing;
}
JL_DLLEXPORT int jl_is_task_started(jl_task_t *t)
{
return t->started;
}
#ifdef __cplusplus
}
#endif