I didn't experiment.  The dpif-linux fds have the advantage of being
static and unchanging from one iteration to the next.  It might be worth
a try later.

On Thu, Nov 24, 2011 at 10:28:45AM -0800, Justin Pettit wrote:
> Looks good.  Do you think there's benefit in using epoll in the main
> poll library?
> 
> --Justin
> 
> 
> On Nov 22, 2011, at 3:12 PM, Ben Pfaff wrote:
> 
> > epoll appears to be much more efficient than poll() at least for
> > static file descriptor sets.  I can't otherwise explain why this
> > patch increases netperf CRR performance by 20% above the previous
> > commit, which is also about a 19% overall improvement versus
> > the baseline from before the poll_fd_woke() optimization was
> > removed.
> > ---
> > lib/dpif-linux.c |   54 
> > +++++++++++++++++++++++++++++++-----------------------
> > 1 files changed, 31 insertions(+), 23 deletions(-)
> > 
> > diff --git a/lib/dpif-linux.c b/lib/dpif-linux.c
> > index 75e4301..d71fa2a 100644
> > --- a/lib/dpif-linux.c
> > +++ b/lib/dpif-linux.c
> > @@ -31,6 +31,7 @@
> > #include <poll.h>
> > #include <stdlib.h>
> > #include <strings.h>
> > +#include <sys/epoll.h>
> > #include <sys/stat.h>
> > #include <unistd.h>
> > 
> > @@ -140,6 +141,7 @@ struct dpif_linux {
> >     struct nl_sock *upcall_socks[N_UPCALL_SOCKS];
> >     uint32_t nonempty_socks;
> >     unsigned int listen_mask;
> > +    int epoll_fd;
> > 
> >     /* Change notification. */
> >     struct sset changed_ports;  /* Ports that have changed. */
> > @@ -274,6 +276,7 @@ open_dpif(const struct dpif_linux_dp *dp, struct dpif 
> > **dpifp)
> >     dpif = xzalloc(sizeof *dpif);
> >     dpif->port_notifier = nln_notifier_create(nln, dpif_linux_port_changed,
> >                                               dpif);
> > +    dpif->epoll_fd = -1;
> > 
> >     dpif_init(&dpif->dpif, &dpif_linux_class, dp->name,
> >               dp->dp_ifindex, dp->dp_ifindex);
> > @@ -294,6 +297,10 @@ destroy_upcall_socks(struct dpif_linux *dpif)
> > {
> >     int i;
> > 
> > +    if (dpif->epoll_fd >= 0) {
> > +        close(dpif->epoll_fd);
> > +        dpif->epoll_fd = -1;
> > +    }
> >     for (i = 0; i < N_UPCALL_SOCKS; i++) {
> >         nl_sock_destroy(dpif->upcall_socks[i]);
> >         dpif->upcall_socks[i] = NULL;
> > @@ -1005,12 +1012,28 @@ dpif_linux_recv_set_mask(struct dpif *dpif_, int 
> > listen_mask)
> >         int i;
> >         int error;
> > 
> > +        dpif->epoll_fd = epoll_create(N_UPCALL_SOCKS);
> > +        if (dpif->epoll_fd < 0) {
> > +            return errno;
> > +        }
> > +
> >         for (i = 0; i < N_UPCALL_SOCKS; i++) {
> > +            struct epoll_event event;
> > +
> >             error = nl_sock_create(NETLINK_GENERIC, &dpif->upcall_socks[i]);
> >             if (error) {
> >                 destroy_upcall_socks(dpif);
> >                 return error;
> >             }
> > +
> > +            event.events = EPOLLIN;
> > +            event.data.u32 = i;
> > +            if (epoll_ctl(dpif->epoll_fd, EPOLL_CTL_ADD,
> > +                          nl_sock_fd(dpif->upcall_socks[i]), &event) < 0) {
> > +                error = errno;
> > +                destroy_upcall_socks(dpif);
> > +                return error;
> > +            }
> >         }
> > 
> >         dpif->nonempty_socks = 0;
> > @@ -1100,36 +1123,24 @@ dpif_linux_recv(struct dpif *dpif_, struct 
> > dpif_upcall *upcall)
> >     }
> > 
> >     if (!dpif->nonempty_socks) {
> > -        struct pollfd pfds[N_UPCALL_SOCKS];
> > +        struct epoll_event events[N_UPCALL_SOCKS];
> >         int retval;
> >         int i;
> > 
> > -        for (i = 0; i < N_UPCALL_SOCKS; i++) {
> > -            pfds[i].fd = nl_sock_fd(dpif->upcall_socks[i]);
> > -            pfds[i].events = POLLIN;
> > -            pfds[i].revents = 0;
> > -        }
> > -
> >         do {
> > -            retval = poll(pfds, N_UPCALL_SOCKS, 0);
> > +            retval = epoll_wait(dpif->epoll_fd, events, N_UPCALL_SOCKS, 0);
> >         } while (retval < 0 && errno == EINTR);
> >         if (retval < 0) {
> >             static struct vlog_rate_limit rl = VLOG_RATE_LIMIT_INIT(1, 1);
> > -            VLOG_WARN_RL(&rl, "poll failed (%s)", strerror(errno));
> > -        } else if (!retval) {
> > -            return EAGAIN;
> > +            VLOG_WARN_RL(&rl, "epoll_wait failed (%s)", strerror(errno));
> >         }
> > 
> > -        for (i = 0; i < N_UPCALL_SOCKS; i++) {
> > -            if (pfds[i].revents) {
> > -                dpif->nonempty_socks |= 1u << i;
> > -            }
> > +        for (i = 0; i < retval; i++) {
> > +            dpif->nonempty_socks |= 1u << events[i].data.u32;
> >         }
> > -
> > -        assert(dpif->nonempty_socks);
> >     }
> > 
> > -    do {
> > +    while (dpif->nonempty_socks) {
> >         int indx = ffs(dpif->nonempty_socks) - 1;
> >         struct nl_sock *upcall_sock = dpif->upcall_socks[indx];
> > 
> > @@ -1163,7 +1174,7 @@ dpif_linux_recv(struct dpif *dpif_, struct 
> > dpif_upcall *upcall)
> >                 return error;
> >             }
> >         }
> > -    } while (dpif->nonempty_socks);
> > +    }
> > 
> >     return EAGAIN;
> > }
> > @@ -1172,15 +1183,12 @@ static void
> > dpif_linux_recv_wait(struct dpif *dpif_)
> > {
> >     struct dpif_linux *dpif = dpif_linux_cast(dpif_);
> > -    int i;
> > 
> >     if (!dpif->listen_mask) {
> >        return;
> >     }
> > 
> > -    for (i = 0; i < N_UPCALL_SOCKS; i++) {
> > -        nl_sock_wait(dpif->upcall_socks[i], POLLIN);
> > -    }
> > +    poll_fd_wait(dpif->epoll_fd, POLLIN);
> > }
> > 
> > static void
> > -- 
> > 1.7.4.4
> > 
> > _______________________________________________
> > dev mailing list
> > dev@openvswitch.org
> > http://openvswitch.org/mailman/listinfo/dev
> 
_______________________________________________
dev mailing list
dev@openvswitch.org
http://openvswitch.org/mailman/listinfo/dev

Reply via email to