Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Revert "linux: workaround to avoid deadlock inside dl_iterate_phdr in glibc" #57059

Open
wants to merge 1 commit into
base: master
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
3 changes: 2 additions & 1 deletion src/julia_internal.h
Original file line number Diff line number Diff line change
Expand Up @@ -208,7 +208,8 @@ JL_DLLEXPORT void jl_lock_profile(void) JL_NOTSAFEPOINT JL_NOTSAFEPOINT_ENTER;
JL_DLLEXPORT void jl_unlock_profile(void) JL_NOTSAFEPOINT JL_NOTSAFEPOINT_LEAVE;
JL_DLLEXPORT void jl_lock_profile_wr(void) JL_NOTSAFEPOINT JL_NOTSAFEPOINT_ENTER;
JL_DLLEXPORT void jl_unlock_profile_wr(void) JL_NOTSAFEPOINT JL_NOTSAFEPOINT_LEAVE;
void jl_with_stackwalk_lock(void (*f)(void*) JL_NOTSAFEPOINT, void *ctx) JL_NOTSAFEPOINT;
int jl_lock_stackwalk(void) JL_NOTSAFEPOINT JL_NOTSAFEPOINT_ENTER;
void jl_unlock_stackwalk(int lockret) JL_NOTSAFEPOINT JL_NOTSAFEPOINT_LEAVE;

arraylist_t *jl_get_all_tasks_arraylist(void) JL_NOTSAFEPOINT;
typedef struct {
Expand Down
9 changes: 6 additions & 3 deletions src/signals-mach.c
Original file line number Diff line number Diff line change
Expand Up @@ -714,10 +714,13 @@ static void jl_unlock_profile_mach(int dlsymlock, int keymgr_locked)
jl_unlock_profile();
}

void jl_with_stackwalk_lock(void (*f)(void*), void *ctx)
int jl_lock_stackwalk(void)
{
return jl_lock_profile_mach(1);
}

void jl_unlock_stackwalk(int lockret)
{
int lockret = jl_lock_profile_mach(1);
f(ctx);
jl_unlock_profile_mach(1, lockret);
}

Expand Down
186 changes: 86 additions & 100 deletions src/signals-unix.c
Original file line number Diff line number Diff line change
Expand Up @@ -308,27 +308,20 @@ int exc_reg_is_write_fault(uintptr_t esr) {
#else
#include <poll.h>
#include <sys/eventfd.h>
#include <link.h>

typedef struct {
void (*f)(void*) JL_NOTSAFEPOINT;
void *ctx;
} callback_t;
static int with_dl_iterate_phdr_lock(struct dl_phdr_info *info, size_t size, void *data)
int jl_lock_stackwalk(void)
{
jl_lock_profile();
callback_t *callback = (callback_t*)data;
callback->f(callback->ctx);
jl_unlock_profile();
return 1; // only call this once
return 0;
}

void jl_with_stackwalk_lock(void (*f)(void*), void *ctx)
void jl_unlock_stackwalk(int lockret)
{
callback_t callback = {f, ctx};
dl_iterate_phdr(with_dl_iterate_phdr_lock, &callback);
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

On FreeBSD, can you just replace this call with int rtld_locks[MAX_RTLD_LOCKS]; jl_lock_profile(); _rtld_atfork_pre(rtld_locks); f(ctx); _rtld_atfork_post(rtld_locks); jl_unlock_profile();

Copy link
Member Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Looks like even though _rtld_atfork_pre is accessible from libc, there's no corresponding header that's included in a standard system installation that has a prototype for it nor a definition for MAX_RTLD_LOCKS. 😔

Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

It's here, if you have this rtld_lock.h header, or you can just copy-paste the relevant lines from it:
https://github.com/lattera/freebsd/blob/401a161083850a9a4ce916f37520c084cff1543b/libexec/rtld-elf/rtld_lock.h#L48

Copy link
Member Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Right, what I mean is that it's in the system source files (as in your link) but those aren't included in a standard installation, so I don't have the definitions available from an existing file on my machine. I'm compiling now with this change:

diff --git a/src/signals-unix.c b/src/signals-unix.c
index 91d3378068..e1f1d70a80 100644
--- a/src/signals-unix.c
+++ b/src/signals-unix.c
@@ -41,6 +41,12 @@
 #include <sys/event.h>
 #endif

+#if defined(_OS_FREEBSD_)
+#define MAX_RTLS_LOCKS 8
+extern void _rtld_atfork_pre(int*);
+extern void _rtld_atfork_post(int*);
+#endif
+
 // 8M signal stack, same as default stack size (though we barely use this)
 static const size_t sig_stack_size = 8 * 1024 * 1024;

@@ -325,8 +331,17 @@ static int with_dl_iterate_phdr_lock(struct dl_phdr_info *info, size_t size, voi

 void jl_with_stackwalk_lock(void (*f)(void*), void *ctx)
 {
+#if defined(_OS_FREEBSD_)
+    int rtld_locks[MAX_RTLD_LOCKS];
+    jl_lock_profile();
+    _rtld_atfork_pre(rtld_locks);
+    f(ctx);
+    _rtld_atfork_post(rtld_locks);
+    jl_unlock_profile();
+#else
     callback_t callback = {f, ctx};
     dl_iterate_phdr(with_dl_iterate_phdr_lock, &callback);
+#endif
 }

 #if defined(_OS_LINUX_) && (defined(_CPU_X86_64_) || defined(_CPU_X86_))

Any idea what tests need to be run to trigger this specific deadlock or should I just run all of them?

Copy link
Member Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Looks like that didn't fix it, I still hit a deadlock.

Copy link
Member

@vtjnash vtjnash Jan 17, 2025

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

okay, if that doesn't work, then the other alternative is to block the thread from receiving the profile signal:

sigset_t sset, oset;
sigemptyset(&sset);
sigaddset(&sset, SIGUSR2);
pthread_sigmask(SIG_BLOCK, &sset, &oset);
f(ctx);
pthread_sigmask(SIG_SETMASK, &oset, NULL);

(in this case, this doesn't really need to be freebsd-specific either, and can be used on linux too)

Copy link
Member Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Do you mean like this?:

diff --git a/src/signals-unix.c b/src/signals-unix.c
index 91d3378068..ad2ad87140 100644
--- a/src/signals-unix.c
+++ b/src/signals-unix.c
@@ -325,8 +325,12 @@ static int with_dl_iterate_phdr_lock(struct dl_phdr_info *info, size_t size, voi

 void jl_with_stackwalk_lock(void (*f)(void*), void *ctx)
 {
-    callback_t callback = {f, ctx};
-    dl_iterate_phdr(with_dl_iterate_phdr_lock, &callback);
+    sigset_t sset, oset;
+    sigemptyset(&sset);
+    sigaddset(&sset, SIGUSR2);
+    pthread_sigmask(SIG_BLOCK, &sset, &oset);
+    f(ctx);
+    pthread_sigmask(SIG_SETMASK, &oset, NULL);
 }

 #if defined(_OS_LINUX_) && (defined(_CPU_X86_64_) || defined(_CPU_X86_))

Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

yes

(void)lockret;
jl_unlock_profile();
}


#if defined(_OS_LINUX_) && (defined(_CPU_X86_64_) || defined(_CPU_X86_))
int is_write_fault(void *context) {
ucontext_t *ctx = (ucontext_t*)context;
Expand Down Expand Up @@ -442,7 +435,7 @@ JL_NO_ASAN static void segv_handler(int sig, siginfo_t *info, void *context)
}

pthread_mutex_t in_signal_lock; // shared with jl_delete_thread
static bt_context_t *usr2_signal_context; // protected by in_signal_lock
static bt_context_t *signal_context; // protected by in_signal_lock
static int exit_signal_cond = -1;
static int signal_caught_cond = -1;
static int signals_inflight = 0;
Expand Down Expand Up @@ -514,7 +507,7 @@ int jl_thread_suspend_and_get_state(int tid, int timeout, bt_context_t *ctx)
request = jl_atomic_load_acquire(&ptls2->signal_request);
assert(request == 0 || request == -1); (void) request;
jl_atomic_store_release(&ptls2->signal_request, 4); // prepare to resume normally, but later code may change this
*ctx = *usr2_signal_context;
*ctx = *signal_context;
return 1;
}

Expand Down Expand Up @@ -594,8 +587,8 @@ void usr2_handler(int sig, siginfo_t *info, void *ctx)
if (!jl_atomic_cmpswap(&ptls->signal_request, &request, -1))
return;
if (request == 1) {
usr2_signal_context = jl_to_bt_context(ctx);
// acknowledge that we saw the signal_request and set usr2_signal_context
signal_context = jl_to_bt_context(ctx);
// acknowledge that we saw the signal_request and set signal_context
int err;
eventfd_t got = 1;
err = write(signal_caught_cond, &got, sizeof(eventfd_t));
Expand All @@ -609,7 +602,7 @@ void usr2_handler(int sig, siginfo_t *info, void *ctx)
if (err != sizeof(eventfd_t)) abort();
assert(got == 1);
request = jl_atomic_exchange(&ptls->signal_request, -1);
usr2_signal_context = NULL;
signal_context = NULL;
assert(request == 2 || request == 3 || request == 4);
}
int err;
Expand Down Expand Up @@ -813,7 +806,7 @@ void trigger_profile_peek(void)
jl_safe_printf("\n======================================================================================\n");
jl_safe_printf("Information request received. A stacktrace will print followed by a %.1f second profile\n", profile_peek_duration);
jl_safe_printf("======================================================================================\n");
if (profile_bt_size_max == 0) {
if (profile_bt_size_max == 0){
// If the buffer hasn't been initialized, initialize with default size
// Keep these values synchronized with Profile.default_init()
if (jl_profile_init(10000000, 1000000) == -1) {
Expand All @@ -828,93 +821,59 @@ void trigger_profile_peek(void)
profile_autostop_time = jl_hrtime() + (profile_peek_duration * 1e9);
}

#if !defined(JL_DISABLE_LIBUNWIND)

static jl_bt_element_t signal_bt_data[JL_MAX_BT_SIZE + 1];
static size_t signal_bt_size = 0;
static void do_critical_profile(void *ctx)
// assumes holding `jl_lock_stackwalk`
void jl_profile_thread_unix(int tid, bt_context_t *signal_context)
{
bt_context_t signal_context;
// sample each thread, round-robin style in reverse order
// (so that thread zero gets notified last)
int nthreads = jl_atomic_load_acquire(&jl_n_threads);
for (int i = nthreads; i-- > 0; ) {
// notify thread to stop
if (!jl_thread_suspend_and_get_state(i, 1, &signal_context))
continue;

// do backtrace on thread contexts for critical signals
// this part must be signal-handler safe
signal_bt_size += rec_backtrace_ctx(signal_bt_data + signal_bt_size,
JL_MAX_BT_SIZE / nthreads - 1,
&signal_context, NULL);
signal_bt_data[signal_bt_size++].uintptr = 0;
jl_thread_resume(i);
if (jl_profile_is_buffer_full()) {
// Buffer full: Delete the timer
jl_profile_stop_timer();
return;
}
}

static void do_profile(void *ctx)
{
bt_context_t signal_context;
int nthreads = jl_atomic_load_acquire(&jl_n_threads);
int *randperm = profile_get_randperm(nthreads);
for (int idx = nthreads; idx-- > 0; ) {
// Stop the threads in the random order.
int tid = randperm[idx];
// do backtrace for profiler
if (!profile_running)
return;
if (jl_profile_is_buffer_full()) {
// Buffer full: Delete the timer
jl_profile_stop_timer();
return;
}
// notify thread to stop
if (!jl_thread_suspend_and_get_state(tid, 1, &signal_context))
return;
// unwinding can fail, so keep track of the current state
// and restore from the SEGV handler if anything happens.
jl_jmp_buf *old_buf = jl_get_safe_restore();
jl_jmp_buf buf;

jl_set_safe_restore(&buf);
if (jl_setjmp(buf, 0)) {
jl_safe_printf("WARNING: profiler attempt to access an invalid memory location\n");
}
else {
// Get backtrace data
profile_bt_size_cur += rec_backtrace_ctx((jl_bt_element_t*)profile_bt_data_prof + profile_bt_size_cur,
profile_bt_size_max - profile_bt_size_cur - 1, &signal_context, NULL);
}
jl_set_safe_restore(old_buf);
// notify thread to stop
if (!jl_thread_suspend_and_get_state(tid, 1, signal_context))
return;
// unwinding can fail, so keep track of the current state
// and restore from the SEGV handler if anything happens.
jl_jmp_buf *old_buf = jl_get_safe_restore();
jl_jmp_buf buf;

jl_set_safe_restore(&buf);
if (jl_setjmp(buf, 0)) {
jl_safe_printf("WARNING: profiler attempt to access an invalid memory location\n");
} else {
// Get backtrace data
profile_bt_size_cur += rec_backtrace_ctx((jl_bt_element_t*)profile_bt_data_prof + profile_bt_size_cur,
profile_bt_size_max - profile_bt_size_cur - 1, signal_context, NULL);
}
jl_set_safe_restore(old_buf);

jl_ptls_t ptls2 = jl_atomic_load_relaxed(&jl_all_tls_states)[tid];
jl_ptls_t ptls2 = jl_atomic_load_relaxed(&jl_all_tls_states)[tid];

// store threadid but add 1 as 0 is preserved to indicate end of block
profile_bt_data_prof[profile_bt_size_cur++].uintptr = ptls2->tid + 1;
// store threadid but add 1 as 0 is preserved to indicate end of block
profile_bt_data_prof[profile_bt_size_cur++].uintptr = ptls2->tid + 1;

// store task id (never null)
profile_bt_data_prof[profile_bt_size_cur++].jlvalue = (jl_value_t*)jl_atomic_load_relaxed(&ptls2->current_task);
// store task id (never null)
profile_bt_data_prof[profile_bt_size_cur++].jlvalue = (jl_value_t*)jl_atomic_load_relaxed(&ptls2->current_task);

// store cpu cycle clock
profile_bt_data_prof[profile_bt_size_cur++].uintptr = cycleclock();
// store cpu cycle clock
profile_bt_data_prof[profile_bt_size_cur++].uintptr = cycleclock();

// store whether thread is sleeping (don't ever encode a state as `0` since is preserved to indicate end of block)
int state = jl_atomic_load_relaxed(&ptls2->sleep_check_state) == 0 ? PROFILE_STATE_THREAD_NOT_SLEEPING : PROFILE_STATE_THREAD_SLEEPING;
profile_bt_data_prof[profile_bt_size_cur++].uintptr = state;
// store whether thread is sleeping (don't ever encode a state as `0` since is preserved to indicate end of block)
int state = jl_atomic_load_relaxed(&ptls2->sleep_check_state) == 0 ? PROFILE_STATE_THREAD_NOT_SLEEPING : PROFILE_STATE_THREAD_SLEEPING;
profile_bt_data_prof[profile_bt_size_cur++].uintptr = state;

// Mark the end of this block with two 0's
profile_bt_data_prof[profile_bt_size_cur++].uintptr = 0;
profile_bt_data_prof[profile_bt_size_cur++].uintptr = 0;
// Mark the end of this block with two 0's
profile_bt_data_prof[profile_bt_size_cur++].uintptr = 0;
profile_bt_data_prof[profile_bt_size_cur++].uintptr = 0;

// notify thread to resume
jl_thread_resume(tid);
}
// notify thread to resume
jl_thread_resume(tid);
}
#endif

static void *signal_listener(void *arg)
{
static jl_bt_element_t bt_data[JL_MAX_BT_SIZE + 1];
static size_t bt_size = 0;
sigset_t sset;
int sig, critical, profile;
jl_sigsetset(&sset);
Expand Down Expand Up @@ -1046,18 +1005,46 @@ static void *signal_listener(void *arg)
}
}

signal_bt_size = 0;
int nthreads = jl_atomic_load_acquire(&jl_n_threads);
bt_size = 0;
#if !defined(JL_DISABLE_LIBUNWIND)
bt_context_t signal_context;
if (critical) {
jl_with_stackwalk_lock(do_critical_profile, NULL);
int lockret = jl_lock_stackwalk();
// sample each thread, round-robin style in reverse order
// (so that thread zero gets notified last)
for (int i = nthreads; i-- > 0; ) {
// notify thread to stop
if (!jl_thread_suspend_and_get_state(i, 1, &signal_context))
continue;

// do backtrace on thread contexts for critical signals
// this part must be signal-handler safe
bt_size += rec_backtrace_ctx(bt_data + bt_size,
JL_MAX_BT_SIZE / nthreads - 1,
&signal_context, NULL);
bt_data[bt_size++].uintptr = 0;
jl_thread_resume(i);
}
jl_unlock_stackwalk(lockret);
}
else if (profile) {
if (profile_all_tasks) {
// Don't take the stackwalk lock here since it's already taken in `jl_rec_backtrace`
jl_profile_task();
}
else {
jl_with_stackwalk_lock(do_profile, NULL);
int lockret = jl_lock_stackwalk();
int *randperm = profile_get_randperm(nthreads);
for (int idx = nthreads; idx-- > 0; ) {
// Stop the threads in the random order.
int i = randperm[idx];
// do backtrace for profiler
if (profile_running) {
jl_profile_thread_unix(i, &signal_context);
}
}
jl_unlock_stackwalk(lockret);
}
}
#ifndef HAVE_MACH
Expand All @@ -1078,12 +1065,11 @@ static void *signal_listener(void *arg)
//#if defined(_POSIX_C_SOURCE) && _POSIX_C_SOURCE >= 199309L && !HAVE_KEVENT
// si_code = info.si_code;
//#endif
jl_exit_thread0(sig, signal_bt_data, signal_bt_size);
jl_exit_thread0(sig, bt_data, bt_size);
}
else if (critical) {
// critical in this case actually means SIGINFO request
#ifndef SIGINFO // SIGINFO already prints something similar automatically
int nthreads = jl_atomic_load_acquire(&jl_n_threads);
int n_threads_running = 0;
for (int idx = nthreads; idx-- > 0; ) {
jl_ptls_t ptls2 = jl_atomic_load_relaxed(&jl_all_tls_states)[idx];
Expand All @@ -1094,8 +1080,8 @@ static void *signal_listener(void *arg)

jl_safe_printf("\nsignal (%d): %s\n", sig, strsignal(sig));
size_t i;
for (i = 0; i < signal_bt_size; i += jl_bt_entry_size(signal_bt_data + i)) {
jl_print_bt_entry_codeloc(signal_bt_data + i);
for (i = 0; i < bt_size; i += jl_bt_entry_size(bt_data + i)) {
jl_print_bt_entry_codeloc(bt_data + i);
}
}
}
Expand Down
19 changes: 7 additions & 12 deletions src/signals-win.c
Original file line number Diff line number Diff line change
Expand Up @@ -383,25 +383,20 @@ void jl_thread_resume(int tid)
}
}

void jl_lock_stackwalk(void)
int jl_lock_stackwalk(void)
{
uv_mutex_lock(&jl_in_stackwalk);
jl_lock_profile();
return 0;
}

void jl_unlock_stackwalk(void)
void jl_unlock_stackwalk(int lockret)
{
(void)lockret;
jl_unlock_profile();
uv_mutex_unlock(&jl_in_stackwalk);
}

void jl_with_stackwalk_lock(void (*f)(void*), void *ctx)
{
jl_lock_stackwalk();
f(ctx);
jl_unlock_stackwalk();
}


static DWORD WINAPI profile_bt( LPVOID lparam )
{
Expand All @@ -421,10 +416,10 @@ static DWORD WINAPI profile_bt( LPVOID lparam )
}
else {
// TODO: bring this up to parity with other OS by adding loop over tid here
jl_lock_stackwalk();
int lockret = jl_lock_stackwalk();
CONTEXT ctxThread;
if (!jl_thread_suspend_and_get_state(0, 0, &ctxThread)) {
jl_unlock_stackwalk();
jl_unlock_stackwalk(lockret);
fputs("failed to suspend main thread. aborting profiling.", stderr);
jl_profile_stop_timer();
break;
Expand All @@ -451,7 +446,7 @@ static DWORD WINAPI profile_bt( LPVOID lparam )
// Mark the end of this block with two 0's
profile_bt_data_prof[profile_bt_size_cur++].uintptr = 0;
profile_bt_data_prof[profile_bt_size_cur++].uintptr = 0;
jl_unlock_stackwalk();
jl_unlock_stackwalk(lockret);
jl_thread_resume(0);
jl_check_profile_autostop();
}
Expand Down
Loading
Loading