From 66871c5a06d723f8350935ced1e88d8cc929d809 Mon Sep 17 00:00:00 2001 From: KJ Tsanaktsidis Date: Sun, 21 May 2023 22:29:16 +1000 Subject: Fix busy-loop when waiting for file descriptors to close When one thread is closing a file descriptor whilst another thread is concurrently reading it, we need to wait for the reading thread to be done with it to prevent a potential EBADF (or, worse, file descriptor reuse). At the moment, that is done by keeping a list of threads still using the file descriptor in io_close_fptr. It then continually calls rb_thread_schedule() in fptr_finalize_flush until said list is empty. That busy-looping seems to behave rather poorly on some OS's, particulary FreeBSD. It can cause the TestIO#test_race_gets_and_close test to fail (even with its very long 200 second timeout) because the closing thread starves out the using thread. To fix that, I introduce the concept of struct rb_io_close_wait_list; a list of threads still using a file descriptor that we want to close. We call `rb_notify_fd_close` to let the thread scheduler know we're closing a FD, which fills the list with threads. Then, we call rb_notify_fd_close_wait which will block the thread until all of the still-using threads are done. This is implemented with a condition variable sleep, so no busy-looping is required. --- thread.c | 50 +++++++++++++++++++++++++++++++++++++++++++------- 1 file changed, 43 insertions(+), 7 deletions(-) (limited to 'thread.c') diff --git a/thread.c b/thread.c index a99e2318ab..409ec7435a 100644 --- a/thread.c +++ b/thread.c @@ -155,6 +155,7 @@ struct waiting_fd { struct ccan_list_node wfd_node; /* <=> vm.waiting_fds */ rb_thread_t *th; int fd; + struct rb_io_close_wait_list *busy; }; /********************************************************************************/ @@ -1672,7 +1673,8 @@ rb_thread_io_blocking_region(rb_blocking_function_t *func, void *data1, int fd) struct waiting_fd waiting_fd = { .fd = fd, - .th = rb_ec_thread_ptr(ec) + .th = rb_ec_thread_ptr(ec), + .busy = NULL, }; // `errno` is only valid when there is an actual error - but we can't @@ -1702,7 +1704,14 @@ rb_thread_io_blocking_region(rb_blocking_function_t *func, void *data1, int fd) */ RB_VM_LOCK_ENTER(); { + if (waiting_fd.busy) { + rb_native_mutex_lock(&waiting_fd.busy->mu); + } ccan_list_del(&waiting_fd.wfd_node); + if (waiting_fd.busy) { + rb_native_cond_broadcast(&waiting_fd.busy->cv); + rb_native_mutex_unlock(&waiting_fd.busy->mu); + } } RB_VM_LOCK_LEAVE(); @@ -2461,10 +2470,12 @@ rb_ec_reset_raised(rb_execution_context_t *ec) } int -rb_notify_fd_close(int fd, struct ccan_list_head *busy) +rb_notify_fd_close(int fd, struct rb_io_close_wait_list *busy) { rb_vm_t *vm = GET_THREAD()->vm; struct waiting_fd *wfd = 0, *next; + ccan_list_head_init(&busy->list); + int has_any; RB_VM_LOCK_ENTER(); { @@ -2474,27 +2485,52 @@ rb_notify_fd_close(int fd, struct ccan_list_head *busy) VALUE err; ccan_list_del(&wfd->wfd_node); - ccan_list_add(busy, &wfd->wfd_node); + ccan_list_add(&busy->list, &wfd->wfd_node); + wfd->busy = busy; err = th->vm->special_exceptions[ruby_error_stream_closed]; rb_threadptr_pending_interrupt_enque(th, err); rb_threadptr_interrupt(th); } } } + has_any = !ccan_list_empty(&busy->list); + if (has_any) { + rb_native_mutex_initialize(&busy->mu); + rb_native_cond_initialize(&busy->cv); + } RB_VM_LOCK_LEAVE(); - return !ccan_list_empty(busy); + return has_any; +} + +void +rb_notify_fd_close_wait(struct rb_io_close_wait_list *busy) +{ + rb_native_mutex_lock(&busy->mu); + while (!ccan_list_empty(&busy->list)) { + rb_native_cond_wait(&busy->cv, &busy->mu); + }; + rb_native_mutex_unlock(&busy->mu); + rb_native_mutex_destroy(&busy->mu); + rb_native_cond_destroy(&busy->cv); +} + +static void* +call_notify_fd_close_wait_nogvl(void *arg) +{ + struct rb_io_close_wait_list *busy = (struct rb_io_close_wait_list *)arg; + rb_notify_fd_close_wait(busy); + return NULL; } void rb_thread_fd_close(int fd) { - struct ccan_list_head busy; + struct rb_io_close_wait_list busy; - ccan_list_head_init(&busy); if (rb_notify_fd_close(fd, &busy)) { - do rb_thread_schedule(); while (!ccan_list_empty(&busy)); + rb_thread_call_without_gvl(call_notify_fd_close_wait_nogvl, &busy, RUBY_UBF_IO, 0); } } -- cgit v1.2.3