Hi,

To fix the KASSERT(la != NULL) we have to protect the rt_llinfo
with a mutex.  The idea is to keep rt_llinfo and RTF_LLINFO consistent.
Also do not put the mutex in the fast path.

ok?

bluhm

Index: netinet/if_ether.c
===================================================================
RCS file: /data/mirror/openbsd/cvs/src/sys/netinet/if_ether.c,v
retrieving revision 1.250
diff -u -p -r1.250 if_ether.c
--- netinet/if_ether.c  27 Jun 2022 20:47:10 -0000      1.250
+++ netinet/if_ether.c  28 Jun 2022 14:00:12 -0000
@@ -101,6 +101,8 @@ void arpreply(struct ifnet *, struct mbu
     unsigned int);
 
 struct niqueue arpinq = NIQUEUE_INITIALIZER(50, NETISR_ARP);
+
+/* llinfo_arp live time, rt_llinfo and RTF_LLINFO are protected by arp_mtx */
 struct mutex arp_mtx = MUTEX_INITIALIZER(IPL_SOFTNET);
 
 LIST_HEAD(, llinfo_arp) arp_list; /* [mN] list of all llinfo_arp structures */
@@ -155,7 +157,7 @@ void
 arp_rtrequest(struct ifnet *ifp, int req, struct rtentry *rt)
 {
        struct sockaddr *gate = rt->rt_gateway;
-       struct llinfo_arp *la = (struct llinfo_arp *)rt->rt_llinfo;
+       struct llinfo_arp *la;
        time_t uptime;
 
        NET_ASSERT_LOCKED();
@@ -171,7 +173,7 @@ arp_rtrequest(struct ifnet *ifp, int req
                        rt->rt_expire = 0;
                        break;
                }
-               if ((rt->rt_flags & RTF_LOCAL) && !la)
+               if ((rt->rt_flags & RTF_LOCAL) && rt->rt_llinfo == NULL)
                        rt->rt_expire = 0;
                /*
                 * Announce a new entry if requested or warn the user
@@ -192,44 +194,54 @@ arp_rtrequest(struct ifnet *ifp, int req
                }
                satosdl(gate)->sdl_type = ifp->if_type;
                satosdl(gate)->sdl_index = ifp->if_index;
-               if (la != NULL)
-                       break; /* This happens on a route change */
                /*
                 * Case 2:  This route may come from cloning, or a manual route
                 * add with a LL address.
                 */
                la = pool_get(&arp_pool, PR_NOWAIT | PR_ZERO);
-               rt->rt_llinfo = (caddr_t)la;
                if (la == NULL) {
                        log(LOG_DEBUG, "%s: pool get failed\n", __func__);
                        break;
                }
 
+               mtx_enter(&arp_mtx);
+               if (rt->rt_llinfo != NULL) {
+                       /* we lost the race, another thread has entered it */
+                       mtx_leave(&arp_mtx);
+                       printf("%s: llinfo exists\n", __func__);
+                       pool_put(&arp_pool, la);
+                       break;
+               }
                mq_init(&la->la_mq, LA_HOLD_QUEUE, IPL_SOFTNET);
+               rt->rt_llinfo = (caddr_t)la;
                la->la_rt = rt;
                rt->rt_flags |= RTF_LLINFO;
+               LIST_INSERT_HEAD(&arp_list, la, la_list);
                if ((rt->rt_flags & RTF_LOCAL) == 0)
                        rt->rt_expire = uptime;
-               mtx_enter(&arp_mtx);
-               LIST_INSERT_HEAD(&arp_list, la, la_list);
                mtx_leave(&arp_mtx);
+
                break;
 
        case RTM_DELETE:
-               if (la == NULL)
-                       break;
                mtx_enter(&arp_mtx);
+               la = (struct llinfo_arp *)rt->rt_llinfo;
+               if (la == NULL) {
+                       /* we lost the race, another thread has removed it */
+                       mtx_leave(&arp_mtx);
+                       printf("%s: llinfo missing\n", __func__);
+                       break;
+               }
                LIST_REMOVE(la, la_list);
-               mtx_leave(&arp_mtx);
                rt->rt_llinfo = NULL;
                rt->rt_flags &= ~RTF_LLINFO;
                atomic_sub_int(&la_hold_total, mq_purge(&la->la_mq));
+               mtx_leave(&arp_mtx);
+
                pool_put(&arp_pool, la);
                break;
 
        case RTM_INVALIDATE:
-               if (la == NULL)
-                       break;
                if (!ISSET(rt->rt_flags, RTF_LOCAL))
                        arpinvalidate(rt);
                break;
@@ -363,8 +375,6 @@ arpresolve(struct ifnet *ifp, struct rte
                goto bad;
        }
 
-       la = (struct llinfo_arp *)rt->rt_llinfo;
-       KASSERT(la != NULL);
 
        /*
         * Check the address family and length is valid, the address
@@ -372,13 +382,27 @@ arpresolve(struct ifnet *ifp, struct rte
         */
        if ((rt->rt_expire == 0 || rt->rt_expire > uptime) &&
            sdl->sdl_family == AF_LINK && sdl->sdl_alen != 0) {
+               int refresh = 0;
+
                memcpy(desten, LLADDR(sdl), sdl->sdl_alen);
 
                /* refresh ARP entry when timeout gets close */
                if (rt->rt_expire != 0 &&
-                   rt->rt_expire - arpt_keep / 8 < uptime &&
-                   la->la_refreshed + 30 < uptime) {
-                       la->la_refreshed = uptime;
+                   rt->rt_expire - arpt_keep / 8 < uptime) {
+
+                       mtx_enter(&arp_mtx);
+                       if (ISSET(rt->rt_flags, RTF_LLINFO)) {
+                               la = (struct llinfo_arp *)rt->rt_llinfo;
+                               KASSERT(la != NULL);
+
+                               if (la->la_refreshed + 30 < uptime) {
+                                       la->la_refreshed = uptime;
+                                       refresh = 1;
+                               }
+                       }
+                       mtx_leave(&arp_mtx);
+               }
+               if (refresh) {
                        arprequest(ifp,
                            &satosin(rt->rt_ifa->ifa_addr)->sin_addr.s_addr,
                            &satosin(dst)->sin_addr.s_addr,
@@ -724,12 +748,19 @@ arpcache(struct ifnet *ifp, struct ether
 void
 arpinvalidate(struct rtentry *rt)
 {
-       struct llinfo_arp *la = (struct llinfo_arp *)rt->rt_llinfo;
+       struct llinfo_arp *la;
        struct sockaddr_dl *sdl = satosdl(rt->rt_gateway);
 
+       mtx_enter(&arp_mtx);
+       la = (struct llinfo_arp *)rt->rt_llinfo;
+       if (la == NULL) {
+               mtx_leave(&arp_mtx);
+               return;
+       }
        atomic_sub_int(&la_hold_total, mq_purge(&la->la_mq));
        sdl->sdl_alen = 0;
        la->la_asked = 0;
+       mtx_leave(&arp_mtx);
 }
 
 /*

Reply via email to