On Sun, Jun 19, 2022 at 01:26:27PM +0200, Stephan Mending wrote:
> Hi, 
> it crashed again. 
> Here is the dmesg, this time the kernel had debugging symbols enabled. 
> 
> [...]
> ic0 at ichiic0
> spdmem0 at iic0 addr 0x50: 2GB DDR3 SDRAM PC3-12800 SO-DIMM
> isa0 at pcib0
> isadma0 at isa0
> vga0 at isa0 port 0x3b0/48 iomem 0xa0000/131072
> wsdisplay at vga0 not configured
> pcppi0 at isa0 port 0x61
> spkr0 at pcppi0
> wbsio0 at isa0 port 0x2e/2: NCT5104D rev 0x53
> wbsio0 port 0xa10/2 not configured
> vmm0 at mainbus0: VMX/EPT
> run0 at uhub0 port 4 configuration 1 interface 0 "Ralink 802.11 n WLAN" rev 
> 2.0
> 0/1.01 addr 2
> run0: MAC/BBP RT5592 (rev 0x0222), RF RT5592 (MIMO 2T2R), address 
> d8:61:62:37:5
> 6:c8       
> uhub2 at uhub1 port 1 configuration 1 interface 0 "Intel Rate Matching Hub" 
> rev
>  2.00/0.04 addr 2
>  vscsi0 at root
>  scsibus2 at vscsi0: 256 targets
>  softraid0 at root
>  scsibus3 at softraid0: 256 targets
>  root on sd0a (7ec83d15890e2a71.a) swap on sd0b dump on sd0b
>  inteldrm0: 1024x768, 32bpp
>  wsdisplay0 at inteldrm0 mux 1
>  wsdisplay0: screen 0-5 added (std, vt100 emulation)
>  kernel: protection fault trap, code=0
>  Stopped at      icmp_mtudisc_timeout+0x77 
> [/usr/src/sys/netinet/ip_icmp.c:1072]
>  :       movq    0(%rax),%rcx
>  ddb{0}> ddb{0}>
>  ddb{0}> bt          
>  icmp_mtudisc_timeout(fffffd807a4e0620,0) at icmp_mtudisc_timeout+0x77 
> [/usr/src
>  /sys/netinet/ip_icmp.c:1072]
>  rt_timer_timer(ffffffff82324248) at rt_timer_timer+0x1cc 
> [/usr/src/sys/net/rout
>  e.c:1551]
>  softclock_thread(ffff8000fffff260) at softclock_thread+0x13b 
> [/usr/src/sys/kern
>  /kern_timeout.c:681]
>  end trace frame: 0x0, count: -3
>  ddb{0}> call db_show_rtentry(fffffd807a4e0620, 0, 0)      
>  Symbol not found
> 
> I'd love to know whats going wrong here.
> 

This is a race condition in the rttimer code that was introduced by bluhm@
when he added the mutex around the global list.
Can you try the diff below which is a refactor I did some time ago which
changes this and uses a per route timeout instead of the global one. With
this we should not have this use after free anymore.

-- 
:wq Claudio

Index: net/route.c
===================================================================
RCS file: /cvs/src/sys/net/route.c,v
retrieving revision 1.410
diff -u -p -r1.410 route.c
--- net/route.c 5 May 2022 13:57:40 -0000       1.410
+++ net/route.c 13 May 2022 11:49:00 -0000
@@ -1361,7 +1361,16 @@ rt_ifa_purge_walker(struct rtentry *rt, 
  */
 
 struct mutex                   rttimer_mtx;
-LIST_HEAD(, rttimer_queue)     rttimer_queue_head;     /* [T] */
+
+struct rttimer {
+       TAILQ_ENTRY(rttimer)    rtt_next;       /* [T] entry on timer queue */
+       LIST_ENTRY(rttimer)     rtt_link;       /* [T] timers per rtentry */
+       struct timeout          rtt_timeout;    /* [I] timeout for this entry */
+       struct rttimer_queue    *rtt_queue;     /* [I] back pointer to queue */
+       struct rtentry          *rtt_rt;        /* [T] back pointer to route */
+       time_t                  rtt_expire;     /* [I] rt expire time */
+       u_int                   rtt_tableid;    /* [I] rtable id of rtt_rt */
+};
 
 #define RTTIMER_CALLOUT(r)     {                                       \
        if (r->rtt_queue->rtq_func != NULL) {                           \
@@ -1388,15 +1397,9 @@ LIST_HEAD(, rttimer_queue)       rttimer_queue
 void
 rt_timer_init(void)
 {
-       static struct timeout   rt_timer_timeout;
-
        pool_init(&rttimer_pool, sizeof(struct rttimer), 0,
            IPL_MPFLOOR, 0, "rttmr", NULL);
-
        mtx_init(&rttimer_mtx, IPL_MPFLOOR);
-       LIST_INIT(&rttimer_queue_head);
-       timeout_set_proc(&rt_timer_timeout, rt_timer_timer, &rt_timer_timeout);
-       timeout_add_sec(&rt_timer_timeout, 1);
 }
 
 void
@@ -1407,10 +1410,6 @@ rt_timer_queue_init(struct rttimer_queue
        rtq->rtq_count = 0;
        rtq->rtq_func = func;
        TAILQ_INIT(&rtq->rtq_head);
-
-       mtx_enter(&rttimer_mtx);
-       LIST_INSERT_HEAD(&rttimer_queue_head, rtq, rtq_link);
-       mtx_leave(&rttimer_mtx);
 }
 
 void
@@ -1453,6 +1452,25 @@ rt_timer_queue_count(struct rttimer_queu
        return (rtq->rtq_count);
 }
 
+static inline struct rttimer *
+rt_timer_unlink(struct rttimer *r)
+{
+       MUTEX_ASSERT_LOCKED(&rttimer_mtx);
+
+       LIST_REMOVE(r, rtt_link);
+       r->rtt_rt = NULL;
+
+       if (timeout_del(&r->rtt_timeout) == 0) {
+               /* timeout fired, so rt_timer_timer will do the cleanup */
+               return NULL;
+       }
+
+       TAILQ_REMOVE(&r->rtt_queue->rtq_head, r, rtt_next);
+       KASSERT(r->rtt_queue->rtq_count > 0);
+       r->rtt_queue->rtq_count--;
+       return r;
+}
+
 void
 rt_timer_remove_all(struct rtentry *rt)
 {
@@ -1462,11 +1480,9 @@ rt_timer_remove_all(struct rtentry *rt)
        TAILQ_INIT(&rttlist);
        mtx_enter(&rttimer_mtx);
        while ((r = LIST_FIRST(&rt->rt_timer)) != NULL) {
-               LIST_REMOVE(r, rtt_link);
-               TAILQ_REMOVE(&r->rtt_queue->rtq_head, r, rtt_next);
-               TAILQ_INSERT_TAIL(&rttlist, r, rtt_next);
-               KASSERT(r->rtt_queue->rtq_count > 0);
-               r->rtt_queue->rtq_count--;
+               r = rt_timer_unlink(r);
+               if (r != NULL)
+                       TAILQ_INSERT_TAIL(&rttlist, r, rtt_next);
        }
        mtx_leave(&rttimer_mtx);
 
@@ -1476,41 +1492,52 @@ rt_timer_remove_all(struct rtentry *rt)
        }
 }
 
+time_t
+rt_timer_get_expire(const struct rtentry *rt)
+{
+       const struct rttimer    *r;
+       time_t                   expire = 0;
+       
+       mtx_enter(&rttimer_mtx);
+       LIST_FOREACH(r, &rt->rt_timer, rtt_link) {
+               if (expire == 0 || expire > r->rtt_expire)
+                       expire = r->rtt_expire;
+       }
+       mtx_leave(&rttimer_mtx);
+
+       return expire;
+}
+
 int
 rt_timer_add(struct rtentry *rt, struct rttimer_queue *queue, u_int rtableid)
 {
        struct rttimer  *r, *rnew;
-       time_t           current_time;
 
        rnew = pool_get(&rttimer_pool, PR_NOWAIT | PR_ZERO);
        if (rnew == NULL)
                return (ENOBUFS);
 
-       current_time = getuptime();
-
        rnew->rtt_rt = rt;
-       rnew->rtt_time = current_time;
        rnew->rtt_queue = queue;
        rnew->rtt_tableid = rtableid;
+       rnew->rtt_expire = getuptime() + queue->rtq_timeout;
+       timeout_set_proc(&rnew->rtt_timeout, rt_timer_timer, rnew);
 
        mtx_enter(&rttimer_mtx);
-       rt->rt_expire = current_time + queue->rtq_timeout;
        /*
         * If there's already a timer with this action, destroy it before
         * we add a new one.
         */
        LIST_FOREACH(r, &rt->rt_timer, rtt_link) {
                if (r->rtt_queue == queue) {
-                       LIST_REMOVE(r, rtt_link);
-                       TAILQ_REMOVE(&r->rtt_queue->rtq_head, r, rtt_next);
-                       KASSERT(r->rtt_queue->rtq_count > 0);
-                       r->rtt_queue->rtq_count--;
+                       r = rt_timer_unlink(r);
                        break;  /* only one per list, so we can quit... */
                }
        }
 
        LIST_INSERT_HEAD(&rt->rt_timer, rnew, rtt_link);
        TAILQ_INSERT_TAIL(&queue->rtq_head, rnew, rtt_next);
+       timeout_add_sec(&rnew->rtt_timeout, queue->rtq_timeout);
        rnew->rtt_queue->rtq_count++;
        mtx_leave(&rttimer_mtx);
 
@@ -1523,37 +1550,25 @@ rt_timer_add(struct rtentry *rt, struct 
 void
 rt_timer_timer(void *arg)
 {
-       struct timeout          *to = (struct timeout *)arg;
-       struct rttimer_queue    *rtq;
-       struct rttimer          *r;
-       TAILQ_HEAD(, rttimer)    rttlist;
-       time_t                   current_time;
-
-       current_time = getuptime();
-       TAILQ_INIT(&rttlist);
+       struct rttimer          *r = arg;
+       struct rttimer_queue    *rtq = r->rtt_queue;
 
        NET_LOCK();
        mtx_enter(&rttimer_mtx);
-       LIST_FOREACH(rtq, &rttimer_queue_head, rtq_link) {
-               while ((r = TAILQ_FIRST(&rtq->rtq_head)) != NULL &&
-                   (r->rtt_time + rtq->rtq_timeout) < current_time) {
-                       LIST_REMOVE(r, rtt_link);
-                       TAILQ_REMOVE(&rtq->rtq_head, r, rtt_next);
-                       TAILQ_INSERT_TAIL(&rttlist, r, rtt_next);
-                       KASSERT(rtq->rtq_count > 0);
-                       rtq->rtq_count--;
-               }
-       }
+
+       if (r->rtt_rt != NULL)
+               LIST_REMOVE(r, rtt_link);
+       TAILQ_REMOVE(&rtq->rtq_head, r, rtt_next);
+       KASSERT(rtq->rtq_count > 0);
+       rtq->rtq_count--;
+
        mtx_leave(&rttimer_mtx);
 
-       while ((r = TAILQ_FIRST(&rttlist)) != NULL) {
-               TAILQ_REMOVE(&rttlist, r, rtt_next);
+       if (r->rtt_rt != NULL)
                RTTIMER_CALLOUT(r);
-               pool_put(&rttimer_pool, r);
-       }
        NET_UNLOCK();
 
-       timeout_add_sec(to, 1);
+       pool_put(&rttimer_pool, r);
 }
 
 #ifdef MPLS
Index: net/route.h
===================================================================
RCS file: /cvs/src/sys/net/route.h,v
retrieving revision 1.194
diff -u -p -r1.194 route.h
--- net/route.h 5 May 2022 13:57:40 -0000       1.194
+++ net/route.h 13 May 2022 11:49:18 -0000
@@ -92,6 +92,8 @@ struct rt_metrics {
 #include <sys/queue.h>
 #include <net/rtable.h>
 
+struct rttimer;
+
 /*
  * We distinguish between routes to hosts and routes to networks,
  * preferring the former if available.  For each route we infer
@@ -405,15 +407,6 @@ rtstat_inc(enum rtstat_counters c)
  * add,timer} functions all used with the kind permission of BSDI.
  * These allow functions to be called for routes at specific times.
  */
-struct rttimer {
-       TAILQ_ENTRY(rttimer)    rtt_next;       /* [T] entry on timer queue */
-       LIST_ENTRY(rttimer)     rtt_link;       /* [T] timers per rtentry */
-       struct rttimer_queue    *rtt_queue;     /* [T] back pointer to queue */
-       struct rtentry          *rtt_rt;        /* [I] back pointer to route */
-       time_t                  rtt_time;       /* [I] when timer registered */
-       u_int                   rtt_tableid;    /* [I] rtable id of rtt_rt */
-};
-
 struct rttimer_queue {
        TAILQ_HEAD(, rttimer)           rtq_head;       /* [T] */
        LIST_ENTRY(rttimer_queue)       rtq_link;       /* [T] */
@@ -461,6 +454,7 @@ void                rt_timer_init(void);
 int            rt_timer_add(struct rtentry *,
                    struct rttimer_queue *, u_int);
 void           rt_timer_remove_all(struct rtentry *);
+time_t         rt_timer_get_expire(const struct rtentry *);
 void           rt_timer_queue_init(struct rttimer_queue *, int,
                    void(*)(struct rtentry *, u_int));
 void           rt_timer_queue_change(struct rttimer_queue *, int);
Index: net/rtsock.c
===================================================================
RCS file: /cvs/src/sys/net/rtsock.c,v
retrieving revision 1.331
diff -u -p -r1.331 rtsock.c
--- net/rtsock.c        27 Jun 2022 08:15:38 -0000      1.331
+++ net/rtsock.c        27 Jun 2022 14:00:22 -0000
@@ -132,7 +132,7 @@ int          rtm_xaddrs(caddr_t, caddr_t, struc
 int             rtm_validate_proposal(struct rt_addrinfo *);
 void            rtm_setmetrics(u_long, const struct rt_metrics *,
                     struct rt_kmetrics *);
-void            rtm_getmetrics(const struct rt_kmetrics *,
+void            rtm_getmetrics(const struct rtentry *,
                     struct rt_metrics *);
 
 int             sysctl_iflist(int, struct walkarg *);
@@ -674,7 +674,7 @@ rtm_report(struct rtentry *rt, u_char ty
        rtm->rtm_flags = rt->rt_flags;
        rtm->rtm_pid = curproc->p_p->ps_pid;
        rtm->rtm_seq = seq;
-       rtm_getmetrics(&rt->rt_rmx, &rtm->rtm_rmx);
+       rtm_getmetrics(rt, &rtm->rtm_rmx);
        rtm->rtm_addrs = info.rti_addrs;
 #ifdef MPLS
        rtm->rtm_mpls = info.rti_mpls;
@@ -1391,11 +1391,14 @@ rtm_setmetrics(u_long which, const struc
 }
 
 void
-rtm_getmetrics(const struct rt_kmetrics *in, struct rt_metrics *out)
+rtm_getmetrics(const struct rtentry *rt, struct rt_metrics *out)
 {
+       const struct rt_kmetrics *in = &rt->rt_rmx;
        int64_t expire;
 
        expire = in->rmx_expire;
+       if (expire == 0)
+               expire = rt_timer_get_expire(rt);
        if (expire != 0) {
                expire -= getuptime();
                expire += gettime();
@@ -1998,7 +2001,7 @@ sysctl_dumpentry(struct rtentry *rt, voi
                rtm->rtm_pid = curproc->p_p->ps_pid;
                rtm->rtm_flags = RTF_DONE | rt->rt_flags;
                rtm->rtm_priority = rt->rt_priority & RTP_MASK;
-               rtm_getmetrics(&rt->rt_rmx, &rtm->rtm_rmx);
+               rtm_getmetrics(rt, &rtm->rtm_rmx);
                /* Do not account the routing table's reference. */
                rtm->rtm_rmx.rmx_refcnt = rt->rt_refcnt - 1;
                rtm->rtm_index = rt->rt_ifidx;

Reply via email to