On Fri, Apr 23, 2021 at 11:26 AM Rainer Jung <rainer.j...@kippdata.de> wrote: > > When compiling and running make check for latest head of APU 1.6.x in > preparation of httpd release testing, I observe very frequent hangs > during testqueue and testpass. > > It seems the hang happens only for APU 1.6.x head, but not for APU 1.6.1. > > The hangs seem not to depend on the exact APR version. I observed them > with 1.6.5, 1.7.0, 1.6.x head and 1.7.x head. > > I have not yet tested APU 1.7.x head. > > I can see them on RHEL 6, SLES 11, 12 and 15 and Solaris. It seems they > do not happen on RHEL 7 and 8. > > Here are some stacks:
Thanks, Rainer, for the details. Does the attached patch (for 1.6.x) fix the hang? Regards, Yann.
Index: misc/apr_thread_pool.c =================================================================== --- misc/apr_thread_pool.c (revision 1889124) +++ misc/apr_thread_pool.c (working copy) @@ -46,8 +46,9 @@ struct apr_thread_list_elt { APR_RING_ENTRY(apr_thread_list_elt) link; apr_thread_t *thd; - volatile void *current_owner; - volatile enum { TH_RUN, TH_STOP, TH_PROBATION } state; + void *current_owner; + enum { TH_RUN, TH_STOP, TH_PROBATION } state; + int signal_work_done; }; APR_RING_HEAD(apr_thread_list, apr_thread_list_elt); @@ -78,7 +79,6 @@ struct apr_thread_pool apr_thread_cond_t *all_done; apr_thread_mutex_t *lock; volatile int terminated; - int waiting_work_done; struct apr_thread_pool_tasks *recycled_tasks; struct apr_thread_list *recycled_thds; apr_thread_pool_task_t *task_idx[TASK_PRIORITY_SEGS]; @@ -254,6 +254,7 @@ static struct apr_thread_list_elt *elt_new(apr_thr APR_RING_ELEM_INIT(elt, link); elt->thd = t; elt->current_owner = NULL; + elt->signal_work_done = 0; elt->state = TH_RUN; return elt; } @@ -311,10 +312,9 @@ static void *APR_THREAD_FUNC thread_pool_func(apr_ APR_RING_INSERT_TAIL(me->recycled_tasks, task, apr_thread_pool_task, link); elt->current_owner = NULL; - if (me->waiting_work_done) { + if (elt->signal_work_done) { + elt->signal_work_done = 0; apr_thread_cond_signal(me->work_done); - apr_thread_mutex_unlock(me->lock); - apr_thread_mutex_lock(me->lock); } } while (elt->state != TH_STOP); APR_RING_REMOVE(elt, link); @@ -426,15 +426,14 @@ APU_DECLARE(apr_status_t) apr_thread_pool_create(a return rv; apr_pool_pre_cleanup_register(tp->pool, tp, thread_pool_cleanup); - while (init_threads) { - /* Grab the mutex as apr_thread_create() and thread_pool_func() will - * allocate from (*me)->pool. This is dangerous if there are multiple - * initial threads to create. - */ - apr_thread_mutex_lock(tp->lock); + /* Grab the mutex as apr_thread_create() and thread_pool_func() will + * allocate from (*me)->pool. 
This is dangerous if there are multiple + * initial threads to create. + */ + apr_thread_mutex_lock(tp->lock); + while (init_threads--) { rv = apr_thread_create(&t, NULL, thread_pool_func, tp, tp->pool); if (APR_SUCCESS != rv) { - apr_thread_mutex_unlock(tp->lock); break; } tp->thd_cnt++; @@ -441,9 +440,8 @@ APU_DECLARE(apr_status_t) apr_thread_pool_create(a if (tp->thd_cnt > tp->thd_high) { tp->thd_high = tp->thd_cnt; } - apr_thread_mutex_unlock(tp->lock); - --init_threads; } + apr_thread_mutex_unlock(tp->lock); if (rv == APR_SUCCESS) { *me = tp; @@ -748,7 +746,7 @@ static void wait_on_busy_threads(apr_thread_pool_t elt = APR_RING_FIRST(me->busy_thds); while (elt != APR_RING_SENTINEL(me->busy_thds, apr_thread_list_elt, link)) { - if (owner && elt->current_owner != owner) { + if (owner ? owner != elt->current_owner : !elt->current_owner) { elt = APR_RING_NEXT(elt, link); continue; } @@ -764,9 +762,8 @@ static void wait_on_busy_threads(apr_thread_pool_t #endif #endif - me->waiting_work_done = 1; + elt->signal_work_done = 1; apr_thread_cond_wait(me->work_done, me->lock); - me->waiting_work_done = 0; /* Restart */ elt = APR_RING_FIRST(me->busy_thds);