Module: xenomai-3
Branch: wip/prioceil
Commit: 5902ea95bccd08d2b5161cfd61fcfb5709941cc6
URL:    
http://git.xenomai.org/?p=xenomai-3.git;a=commit;h=5902ea95bccd08d2b5161cfd61fcfb5709941cc6

Author: Philippe Gerum <r...@xenomai.org>
Date:   Tue Mar  1 12:50:29 2016 +0100

cobalt/thread: fix SMP race with xnthread_join()

The situation below would cause a kernel crash on any earlier 3.x
release, with ktask implemented in a dynamically loaded/unloaded
module:

CPU0:  rtdm_task_destroy(ktask)
       ...
       rmmod(module)

CPU1:  ktask()
       ...
       ...
       __xnthread_test_cancel()
           do_exit()
              (last) schedule()
                 OOPS: prev still treading on stale memory

In this case, the module would be unmapped too early, before the
cancelled task can ultimately schedule away.

The changes also fix a stale reference from the joiner thread to the
former ->idtag field, after the joinee's TCB has been dropped.

---

 include/cobalt/kernel/thread.h |    6 +-
 kernel/cobalt/thread.c         |  136 ++++++++++++++++++++++++++++++++--------
 2 files changed, 113 insertions(+), 29 deletions(-)

diff --git a/include/cobalt/kernel/thread.h b/include/cobalt/kernel/thread.h
index f25c6d0..e08a0a2 100644
--- a/include/cobalt/kernel/thread.h
+++ b/include/cobalt/kernel/thread.h
@@ -19,6 +19,7 @@
 #ifndef _COBALT_KERNEL_THREAD_H
 #define _COBALT_KERNEL_THREAD_H
 
+#include <linux/wait.h>
 #include <linux/sched.h>
 #include <linux/sched/rt.h>
 #include <cobalt/kernel/list.h>
@@ -107,9 +108,6 @@ struct xnthread {
        struct list_head quota_expired;
        struct list_head quota_next;
 #endif
-
-       unsigned int idtag;     /* Unique ID tag */
-
        cpumask_t affinity;     /* Processor affinity. */
 
        int bprio;              /* Base priority (before PIP boost) */
@@ -184,6 +182,8 @@ struct xnthread {
 
        struct xnthread_personality *personality;
 
+       struct completion exited;
+
 #ifdef CONFIG_XENO_OPT_DEBUG
        const char *exe_path;   /* Executable path */
        u32 proghash;           /* Hash value for exe_path */
diff --git a/kernel/cobalt/thread.c b/kernel/cobalt/thread.c
index ca02e94..aaf868a 100644
--- a/kernel/cobalt/thread.c
+++ b/kernel/cobalt/thread.c
@@ -23,6 +23,7 @@
 #include <linux/kthread.h>
 #include <linux/wait.h>
 #include <linux/signal.h>
+#include <linux/pid.h>
 #include <cobalt/kernel/sched.h>
 #include <cobalt/kernel/timer.h>
 #include <cobalt/kernel/synch.h>
@@ -40,16 +41,14 @@
 #include <asm-generic/xenomai/mayday.h>
 #include "debug.h"
 
+static DECLARE_WAIT_QUEUE_HEAD(join_all);
+
 /**
  * @ingroup cobalt_core
  * @defgroup cobalt_core_thread Thread services
  * @{
  */
 
-static DECLARE_WAIT_QUEUE_HEAD(nkjoinq);
-
-static unsigned int idtags;
-
 static void timeout_handler(struct xntimer *timer)
 {
        struct xnthread *thread = container_of(timer, struct xnthread, rtimer);
@@ -158,20 +157,13 @@ int __xnthread_init(struct xnthread *thread,
                    const union xnsched_policy_param *sched_param)
 {
        int flags = attr->flags, ret, gravity;
-       spl_t s;
 
        flags &= ~XNSUSP;
 #ifndef CONFIG_XENO_ARCH_FPU
        flags &= ~XNFPU;
 #endif
-       if (flags & XNROOT)
-               thread->idtag = 0;
-       else {
-               xnlock_get_irqsave(&nklock, s);
-               thread->idtag = ++idtags ?: 1;
-               xnlock_put_irqrestore(&nklock, s);
+       if ((flags & XNROOT) == 0)
                flags |= XNDORMANT;
-       }
 
        if (attr->name)
                ksformat(thread->name,
@@ -207,6 +199,7 @@ int __xnthread_init(struct xnthread *thread,
        /* These will be filled by xnthread_start() */
        thread->entry = NULL;
        thread->cookie = NULL;
+       init_completion(&thread->exited);
 
        gravity = flags & XNUSER ? XNTIMER_UGRAVITY : XNTIMER_KGRAVITY;
        xntimer_init(&thread->rtimer, &nkclock, timeout_handler,
@@ -484,8 +477,6 @@ static inline void cleanup_tcb(struct xnthread *thread) /* 
nklock held, irqs off
                xnthread_clear_state(thread, XNREADY);
        }
 
-       thread->idtag = 0;
-
        if (xnthread_test_state(thread, XNPEND))
                xnsynch_forget_sleeper(thread);
 
@@ -525,10 +516,15 @@ void __xnthread_cleanup(struct xnthread *curr)
        cleanup_tcb(curr);
        xnlock_put_irqrestore(&nklock, s);
 
+       /* Wake up the joiner if any (we can't have more than one). */
+       complete(&curr->exited);
+
+       /* Notify our exit to xnthread_killall() if need be. */
+       if (waitqueue_active(&join_all))
+               wake_up(&join_all);
+
        /* Finalize last since this incurs releasing the TCB. */
        xnthread_run_handler_stack(curr, finalize_thread);
-
-       wake_up(&nkjoinq);
 }
 
 /*
@@ -1587,6 +1583,40 @@ out:
 }
 EXPORT_SYMBOL_GPL(xnthread_cancel);
 
+struct wait_grace_struct {
+       struct completion done;
+       struct rcu_head rcu;
+};
+
+static void grace_elapsed(struct rcu_head *head)
+{
+       struct wait_grace_struct *wgs;
+
+       wgs = container_of(head, struct wait_grace_struct, rcu);
+       complete(&wgs->done);
+}
+
+static void wait_grace_period(struct pid *pid)
+{
+       struct wait_grace_struct wait = {
+               .done = COMPLETION_INITIALIZER_ONSTACK(wait.done),
+       };
+       struct task_struct *p;
+
+       init_rcu_head_on_stack(&wait.rcu);
+       
+       for (;;) {
+               call_rcu(&wait.rcu, grace_elapsed);
+               wait_for_completion(&wait.done);
+               rcu_read_lock();
+               p = pid_task(pid, PIDTYPE_PID);
+               rcu_read_unlock();
+               if (p == NULL)
+                       break;
+               reinit_completion(&wait.done);
+       }
+}
+
 /**
  * @fn void xnthread_join(struct xnthread *thread, bool uninterruptible)
  * @brief Join with a terminated thread.
@@ -1604,7 +1634,7 @@ EXPORT_SYMBOL_GPL(xnthread_cancel);
  * @param thread The descriptor address of the thread to join with.
  *
  * @param uninterruptible Boolean telling whether the service should
- * wait for completion uninterruptible if called from secondary mode.
+ * wait for completion uninterruptible.
  *
  * @return 0 is returned on success. Otherwise, the following error
  * codes indicate the cause of the failure:
@@ -1624,7 +1654,8 @@ int xnthread_join(struct xnthread *thread, bool 
uninterruptible)
 {
        struct xnthread *curr = xnthread_current();
        int ret = 0, switched = 0;
-       unsigned int tag;
+       struct pid *pid;
+       pid_t tpid;
        spl_t s;
 
        XENO_BUG_ON(COBALT, xnthread_test_state(thread, XNROOT));
@@ -1639,13 +1670,13 @@ int xnthread_join(struct xnthread *thread, bool 
uninterruptible)
                goto out;
        }
 
-       tag = thread->idtag;
-       if (xnthread_test_info(thread, XNDORMANT) || tag == 0)
+       if (xnthread_test_info(thread, XNDORMANT))
                goto out;
 
        trace_cobalt_thread_join(thread);
 
        xnthread_set_state(thread, XNJOINED);
+       tpid = xnthread_host_pid(thread);
        
        if (!xnthread_test_state(curr, XNRELAX|XNROOT)) {
                xnlock_put_irqrestore(&nklock, s);
@@ -1654,12 +1685,65 @@ int xnthread_join(struct xnthread *thread, bool 
uninterruptible)
        } else
                xnlock_put_irqrestore(&nklock, s);
 
+       /*
+        * Since in theory, we might be sleeping there for a long
+        * time, we get a reference on the pid struct holding our
+        * target, then we check for its existence upon wake up.
+        */
+       pid = find_get_pid(tpid);
+       if (pid == NULL)
+               goto done;
+
+       /*
+        * We have a tricky issue to deal with, which involves code
+        * relying on the assumption that a destroyed thread will have
+        * scheduled away from do_exit() before xnthread_join()
+        * returns. A typical example is illustrated by the following
+        * sequence, with a RTDM kernel task implemented in a
+        * dynamically loaded module:
+        *
+        * CPU0:  rtdm_task_destroy(ktask)
+        *           xnthread_cancel(ktask)
+        *           xnthread_join(ktask)
+        *        ...<back to user>..
+        *        rmmod(module)
+        *
+        * CPU1:  in ktask()
+        *        ...
+        *        ...
+        *          __xnthread_test_cancel()
+        *             do_exit()
+         *                schedule()
+        *
+        * In such a sequence, the code on CPU0 would expect the RTDM
+        * task to have scheduled away upon return from
+        * rtdm_task_destroy(), so that unmapping the destroyed task
+        * code and data memory when unloading the module is always
+        * safe.
+        *
+        * To address this, the joiner first waits for the joinee to
+        * signal completion from the Cobalt thread cleanup handler
+        * (__xnthread_cleanup), then waits for a full RCU grace
+        * period to have elapsed. Since the completion signal is sent
+        * on behalf of do_exit(), we may assume that the joinee has
+        * scheduled away before the grace period ends.
+        */
        if (uninterruptible)
-               wait_event(nkjoinq, thread->idtag != tag);
-       else if (wait_event_interruptible(nkjoinq,
-                                         thread->idtag != tag))
-               return -EINTR;
+               wait_for_completion(&thread->exited);
+       else {
+               ret = wait_for_completion_interruptible(&thread->exited);
+               if (ret < 0) {
+                       put_pid(pid);
+                       return -EINTR;
+               }
+       }
+
+       /* Make sure the joinee has scheduled away ultimately. */
+       wait_grace_period(pid);
 
+       put_pid(pid);
+done:
+       ret = 0;
        if (switched)
                ret = xnthread_harden();
 
@@ -2561,13 +2645,13 @@ int xnthread_killall(int grace, int mask)
                       nrkilled);
 
        if (grace > 0) {
-               ret = wait_event_interruptible_timeout(nkjoinq,
+               ret = wait_event_interruptible_timeout(join_all,
                                                       cobalt_nrthreads == 
count,
                                                       grace * HZ);
                if (ret == 0)
                        return -EAGAIN;
        } else
-               ret = wait_event_interruptible(nkjoinq,
+               ret = wait_event_interruptible(join_all,
                                               cobalt_nrthreads == count);
 
        if (XENO_DEBUG(COBALT))


_______________________________________________
Xenomai-git mailing list
Xenomai-git@xenomai.org
https://xenomai.org/mailman/listinfo/xenomai-git

Reply via email to