Re: [ovs-dev] [PATCHv2] netdev-provider: Apply batch object to netdev provider.

Darrell Ball Sun, 26 Jun 2016 20:03:09 -0700

On Sat, Jun 25, 2016 at 7:44 AM, William Tu <[email protected]> wrote:


> Commit 1895cc8dbb64 ("dpif-netdev: create batch object") introduces
> batch process functions and 'struct dp_packet_batch' to associate with
> batch-level metadata.  This patch applies the packet batch object to
> the netdev provider interface (dummy, Linux, BSD, and DPDK) so that
> batch APIs can be used in providers.  With batch metadata visible in
> providers, optimizations can be introduced at per-batch level instead
> of per-packet.
>
> Tested-at: https://travis-ci.org/williamtu/ovs-travis/builds/140135888
> <https://travis-ci.org/williamtu/ovs-travis/builds/140135888 Signed-off-by>


The test shows as failed ?

The code change is replacing an array of ptrs to packets and count with a
packet batch and replacing some code blocks with equivalent existing inline
functions based on batchs.

I have some comments inline.




> Signed-off-by
> <https://travis-ci.org/williamtu/ovs-travis/builds/140135888 Signed-off-by>:
> William Tu <[email protected]>
> --
> v1->v2: make commit message more descriptive.
> ---
>  lib/netdev-bsd.c      |  9 ++++--
>  lib/netdev-dpdk.c     | 81
> +++++++++++++++++++++++++--------------------------
>  lib/netdev-dummy.c    |  9 ++++--
>  lib/netdev-linux.c    |  9 ++++--
>  lib/netdev-provider.h | 25 ++++++++--------
>  lib/netdev.c          |  6 ++--
>  6 files changed, 72 insertions(+), 67 deletions(-)
>
> diff --git a/lib/netdev-bsd.c b/lib/netdev-bsd.c
> index 2e92d97..1b55b1a 100644
> --- a/lib/netdev-bsd.c
> +++ b/lib/netdev-bsd.c
> @@ -618,12 +618,13 @@ netdev_rxq_bsd_recv_tap(struct netdev_rxq_bsd *rxq,
> struct dp_packet *buffer)
>  }
>
>  static int
> -netdev_bsd_rxq_recv(struct netdev_rxq *rxq_, struct dp_packet **packets,
> -                    int *c)
> +netdev_bsd_rxq_recv(struct netdev_rxq *rxq_, struct dp_packet_batch
> *batch)
>  {
>      struct netdev_rxq_bsd *rxq = netdev_rxq_bsd_cast(rxq_);
>      struct netdev *netdev = rxq->up.netdev;
>      struct dp_packet *packet;
> +    struct dp_packet **packets = batch->packets;
> +    int *c = &batch->count;
>      ssize_t retval;
>      int mtu;
>
> @@ -681,10 +682,12 @@ netdev_bsd_rxq_drain(struct netdev_rxq *rxq_)
>   */
>  static int
>  netdev_bsd_send(struct netdev *netdev_, int qid OVS_UNUSED,
> -                struct dp_packet **pkts, int cnt, bool may_steal)
> +                struct dp_packet_batch *batch, bool may_steal)
>  {
>      struct netdev_bsd *dev = netdev_bsd_cast(netdev_);
>      const char *name = netdev_get_name(netdev_);
> +    int cnt = batch->count;
> +    struct dp_packet **okts = batch->packets;
>


"okts" is not used in the function; "pkts" is used in the function.
The function will no longer work.



>      int error;
>      int i;
>
> diff --git a/lib/netdev-dpdk.c b/lib/netdev-dpdk.c
> index ed14a21..3b1e7fa 100644
> --- a/lib/netdev-dpdk.c
> +++ b/lib/netdev-dpdk.c
> @@ -1251,12 +1251,14 @@ netdev_dpdk_vhost_update_rx_counters(struct
> netdev_stats *stats,
>   */
>  static int
>  netdev_dpdk_vhost_rxq_recv(struct netdev_rxq *rxq,
> -                           struct dp_packet **packets, int *c)
> +                           struct dp_packet_batch *batch)
>  {
>      struct netdev_dpdk *dev = netdev_dpdk_cast(rxq->netdev);
>      struct virtio_net *virtio_dev = netdev_dpdk_get_virtio(dev);
>      int qid = rxq->queue_id;
>      struct ingress_policer *policer =
> netdev_dpdk_get_ingress_policer(dev);
> +    struct dp_packet **packets = batch->packets;
> +    int *c = &batch->count;
>

I see this pattern throughout where extra variables are used in all
functions.
There are 2 local variables for packets and count and also the batch
parameter,
which itself already has reference to packets and count from the start of
the call chain
in netdev_*().

Pre-change, there are two parameters for packets and count derived from the
batch
parameter at the start of the call chain in netdev_*().

These functions are intended to be fast.



>      uint16_t nb_rx = 0;
>      uint16_t dropped = 0;
>
> @@ -1292,12 +1294,13 @@ netdev_dpdk_vhost_rxq_recv(struct netdev_rxq *rxq,
>  }
>
>  static int
> -netdev_dpdk_rxq_recv(struct netdev_rxq *rxq, struct dp_packet **packets,
> -                     int *c)
> +netdev_dpdk_rxq_recv(struct netdev_rxq *rxq, struct dp_packet_batch
> *batch)
>  {
>      struct netdev_rxq_dpdk *rx = netdev_rxq_dpdk_cast(rxq);
>      struct netdev_dpdk *dev = netdev_dpdk_cast(rxq->netdev);
>      struct ingress_policer *policer =
> netdev_dpdk_get_ingress_policer(dev);
> +    struct dp_packet **packets = batch->packets;
> +    int *c = &batch->count;
>      int nb_rx;
>      int dropped = 0;
>
> @@ -1371,11 +1374,13 @@ netdev_dpdk_vhost_update_tx_counters(struct
> netdev_stats *stats,
>
>  static void
>  __netdev_dpdk_vhost_send(struct netdev *netdev, int qid,
> -                         struct dp_packet **pkts, int cnt,
> +                         struct dp_packet_batch *batch,
>                           bool may_steal)
>  {
>      struct netdev_dpdk *dev = netdev_dpdk_cast(netdev);
>      struct virtio_net *virtio_dev = netdev_dpdk_get_virtio(dev);
> +    struct dp_packet **pkts = batch->packets;
> +    int cnt = batch->count;
>      struct rte_mbuf **cur_pkts = (struct rte_mbuf **) pkts;
>      unsigned int total_pkts = cnt;
>      unsigned int qos_pkts = cnt;
> @@ -1423,11 +1428,7 @@ __netdev_dpdk_vhost_send(struct netdev *netdev, int
> qid,
>
>  out:
>      if (may_steal) {
> -        int i;
> -
> -        for (i = 0; i < total_pkts; i++) {
> -            dp_packet_delete(pkts[i]);
> -        }
> +        dp_packet_delete_batch(batch, may_steal);
>      }
>  }
>
> @@ -1462,18 +1463,19 @@ dpdk_queue_pkts(struct netdev_dpdk *dev, int qid,
>
>  /* Tx function. Transmit packets indefinitely */
>  static void
> -dpdk_do_tx_copy(struct netdev *netdev, int qid, struct dp_packet **pkts,
> -                int cnt)
> -    OVS_NO_THREAD_SAFETY_ANALYSIS
> +dpdk_do_tx_copy(struct netdev *netdev, int qid, struct dp_packet_batch
> *batch)
> +OVS_NO_THREAD_SAFETY_ANALYSIS
>  {
>  #if !defined(__CHECKER__) && !defined(_WIN32)
> -    const size_t PKT_ARRAY_SIZE = cnt;
> +    const size_t PKT_ARRAY_SIZE = batch->count;
>  #else
>      /* Sparse or MSVC doesn't like variable length array. */
>      enum { PKT_ARRAY_SIZE = NETDEV_MAX_BURST };
>  #endif
>      struct netdev_dpdk *dev = netdev_dpdk_cast(netdev);
>      struct rte_mbuf *mbufs[PKT_ARRAY_SIZE];
> +    struct dp_packet **pkts = batch->packets;
> +    int cnt = batch->count;
>      int dropped = 0;
>      int newcnt = 0;
>      int i;
> @@ -1517,7 +1519,12 @@ dpdk_do_tx_copy(struct netdev *netdev, int qid,
> struct dp_packet **pkts,
>      }
>
>      if (dev->type == DPDK_DEV_VHOST) {
> -        __netdev_dpdk_vhost_send(netdev, qid, (struct dp_packet **)
> mbufs, newcnt, true);
> +        struct dp_packet_batch mbatch;
> +
> +        dp_packet_batch_init(&mbatch);
> +        mbatch.count = newcnt;
> +        memcpy(mbatch.packets, mbufs, newcnt * sizeof(struct rte_mbuf
> *));

+        __netdev_dpdk_vhost_send(netdev, qid, &mbatch, true);
>

This looks more expensive to me in terms of processing performance in this
caller especially and also the callee.
This code is intended to be fast.



>      } else {
>          unsigned int qos_pkts = newcnt;
>
> @@ -1541,37 +1548,30 @@ dpdk_do_tx_copy(struct netdev *netdev, int qid,
> struct dp_packet **pkts,
>  }
>
>  static int
> -netdev_dpdk_vhost_send(struct netdev *netdev, int qid, struct dp_packet
> **pkts,
> -                 int cnt, bool may_steal)
> +netdev_dpdk_vhost_send(struct netdev *netdev, int qid,
> +                       struct dp_packet_batch *batch,
> +                       bool may_steal)
>  {
> -    if (OVS_UNLIKELY(pkts[0]->source != DPBUF_DPDK)) {
> -        int i;
>
> -        dpdk_do_tx_copy(netdev, qid, pkts, cnt);
> +    if (OVS_UNLIKELY(batch->packets[0]->source != DPBUF_DPDK)) {
> +        dpdk_do_tx_copy(netdev, qid, batch);
>          if (may_steal) {
> -            for (i = 0; i < cnt; i++) {
> -                dp_packet_delete(pkts[i]);
> -            }
> +            dp_packet_delete_batch(batch, may_steal);
>          }
>      } else {
> -        int i;
> -
> -        for (i = 0; i < cnt; i++) {
> -            int cutlen = dp_packet_get_cutlen(pkts[i]);
> -
> -            dp_packet_set_size(pkts[i], dp_packet_size(pkts[i]) - cutlen);
> -            dp_packet_reset_cutlen(pkts[i]);
> -        }
> -        __netdev_dpdk_vhost_send(netdev, qid, pkts, cnt, may_steal);
> +        dp_packet_batch_apply_cutlen(batch);
> +        __netdev_dpdk_vhost_send(netdev, qid, batch, may_steal);
>      }
>      return 0;
>  }
>
>  static inline void
>  netdev_dpdk_send__(struct netdev_dpdk *dev, int qid,
> -                   struct dp_packet **pkts, int cnt, bool may_steal)
> +                   struct dp_packet_batch *batch, bool may_steal)
>  {
>      int i;
> +    struct dp_packet **pkts = batch->packets;
> +    int cnt = batch->count;
>
>      if (OVS_UNLIKELY(dev->txq_needs_locking)) {
>          qid = qid % dev->real_n_txq;
> @@ -1582,12 +1582,10 @@ netdev_dpdk_send__(struct netdev_dpdk *dev, int
> qid,
>                       pkts[0]->source != DPBUF_DPDK)) {
>          struct netdev *netdev = &dev->up;
>
> -        dpdk_do_tx_copy(netdev, qid, pkts, cnt);
> +        dpdk_do_tx_copy(netdev, qid, batch);
>
>          if (may_steal) {
> -            for (i = 0; i < cnt; i++) {
> -                dp_packet_delete(pkts[i]);
> -            }
> +            dp_packet_delete_batch(batch, may_steal);
>          }
>      } else {
>          int next_tx_idx = 0;
> @@ -1647,11 +1645,11 @@ netdev_dpdk_send__(struct netdev_dpdk *dev, int
> qid,
>
>  static int
>  netdev_dpdk_eth_send(struct netdev *netdev, int qid,
> -                     struct dp_packet **pkts, int cnt, bool may_steal)
> +                     struct dp_packet_batch *batch, bool may_steal)
>  {
>      struct netdev_dpdk *dev = netdev_dpdk_cast(netdev);
>
> -    netdev_dpdk_send__(dev, qid, pkts, cnt, may_steal);
> +    netdev_dpdk_send__(dev, qid, batch, may_steal);
>      return 0;
>  }
>
> @@ -2646,20 +2644,21 @@ dpdk_ring_open(const char dev_name[], unsigned int
> *eth_port_id) OVS_REQUIRES(dp
>
>  static int
>  netdev_dpdk_ring_send(struct netdev *netdev, int qid,
> -                      struct dp_packet **pkts, int cnt, bool may_steal)
> +                      struct dp_packet_batch *batch, bool may_steal)
>  {
>      struct netdev_dpdk *dev = netdev_dpdk_cast(netdev);
> +    struct dp_packet **pkts = batch->packets;
>      unsigned i;
>
>      /* When using 'dpdkr' and sending to a DPDK ring, we want to ensure
> that the
>       * rss hash field is clear. This is because the same mbuf may be
> modified by
>       * the consumer of the ring and return into the datapath without
> recalculating
>       * the RSS hash. */
> -    for (i = 0; i < cnt; i++) {
> +    for (i = 0; i < batch->count; i++) {
>          dp_packet_rss_invalidate(pkts[i]);
>      }
>
> -    netdev_dpdk_send__(dev, qid, pkts, cnt, may_steal);
> +    netdev_dpdk_send__(dev, qid, batch, may_steal);
>      return 0;
>  }
>
> diff --git a/lib/netdev-dummy.c b/lib/netdev-dummy.c
> index 127b6ae..63fc0b3 100644
> --- a/lib/netdev-dummy.c
> +++ b/lib/netdev-dummy.c
> @@ -951,12 +951,13 @@ netdev_dummy_rxq_dealloc(struct netdev_rxq *rxq_)
>  }
>
>  static int
> -netdev_dummy_rxq_recv(struct netdev_rxq *rxq_, struct dp_packet **arr,
> -                      int *c)
> +netdev_dummy_rxq_recv(struct netdev_rxq *rxq_, struct dp_packet_batch
> *batch)
>  {
>      struct netdev_rxq_dummy *rx = netdev_rxq_dummy_cast(rxq_);
>      struct netdev_dummy *netdev = netdev_dummy_cast(rx->up.netdev);
>      struct dp_packet *packet;
> +    struct dp_packet **arr = batch->packets;
> +    int *c = &batch->count;
>
>      ovs_mutex_lock(&netdev->mutex);
>      if (!ovs_list_is_empty(&rx->recv_queue)) {
> @@ -1034,10 +1035,12 @@ netdev_dummy_rxq_drain(struct netdev_rxq *rxq_)
>
>  static int
>  netdev_dummy_send(struct netdev *netdev, int qid OVS_UNUSED,
> -                  struct dp_packet **pkts, int cnt, bool may_steal)
> +                  struct dp_packet_batch *batch, bool may_steal)
>  {
>      struct netdev_dummy *dev = netdev_dummy_cast(netdev);
>      int error = 0;
> +    int cnt = batch->count;
> +    struct dp_packet **pkts = batch->packets;
>      int i;
>
>      for (i = 0; i < cnt; i++) {
> diff --git a/lib/netdev-linux.c b/lib/netdev-linux.c
> index ef11d12..594d437 100644
> --- a/lib/netdev-linux.c
> +++ b/lib/netdev-linux.c
> @@ -1091,12 +1091,13 @@ netdev_linux_rxq_recv_tap(int fd, struct dp_packet
> *buffer)
>  }
>
>  static int
> -netdev_linux_rxq_recv(struct netdev_rxq *rxq_, struct dp_packet **packets,
> -                      int *c)
> +netdev_linux_rxq_recv(struct netdev_rxq *rxq_, struct dp_packet_batch
> *batch)
>  {
>      struct netdev_rxq_linux *rx = netdev_rxq_linux_cast(rxq_);
>      struct netdev *netdev = rx->up.netdev;
>      struct dp_packet *buffer;
> +    struct dp_packet **packets = batch->packets;
> +    int *c = &batch->count;
>      ssize_t retval;
>      int mtu;
>
> @@ -1161,10 +1162,12 @@ netdev_linux_rxq_drain(struct netdev_rxq *rxq_)
>   * expected to do additional queuing of packets. */
>  static int
>  netdev_linux_send(struct netdev *netdev_, int qid OVS_UNUSED,
> -                  struct dp_packet **pkts, int cnt, bool may_steal)
> +                  struct dp_packet_batch *batch, bool may_steal)
>  {
>      int i;
>      int error = 0;
> +    int cnt = batch->count;
> +    struct dp_packet **pkts = batch->packets;
>
>      /* 'i' is incremented only if there's no error */
>      for (i = 0; i < cnt;) {
> diff --git a/lib/netdev-provider.h b/lib/netdev-provider.h
> index 5da377f..8c7c8ea 100644
> --- a/lib/netdev-provider.h
> +++ b/lib/netdev-provider.h
> @@ -340,8 +340,8 @@ struct netdev_class {
>       * network device from being usefully used by the netdev-based
> "userspace
>       * datapath".  It will also prevent the OVS implementation of bonding
> from
>       * working properly over 'netdev'.) */
> -    int (*send)(struct netdev *netdev, int qid, struct dp_packet
> **buffers,
> -                int cnt, bool may_steal);
> +    int (*send)(struct netdev *netdev, int qid, struct dp_packet_batch
> *batch,
> +                bool may_steal);
>
>      /* Registers with the poll loop to wake up from the next call to
>       * poll_block() when the packet transmission queue for 'netdev' has
> @@ -727,25 +727,24 @@ struct netdev_class {
>      void (*rxq_destruct)(struct netdev_rxq *);
>      void (*rxq_dealloc)(struct netdev_rxq *);
>
> -    /* Attempts to receive a batch of packets from 'rx'.  The caller
> supplies
> -     * 'pkts' as the pointer to the beginning of an array of MAX_RX_BATCH
> -     * pointers to dp_packet.  If successful, the implementation stores
> -     * pointers to up to MAX_RX_BATCH dp_packets into the array,
> transferring
> -     * ownership of the packets to the caller, stores the number of
> received
> -     * packets into '*cnt', and returns 0.
> +    /* Attempts to receive a batch of packets from 'batch'.  In batch, the
> +     * caller supplies 'packets' as the pointer to the beginning of an
> array
> +     * of MAX_RX_BATCH pointers to dp_packet.  If successful, the
> +     * implementation stores pointers to up to MAX_RX_BATCH dp_packets
> into
> +     * the array, transferring ownership of the packets to the caller,
> stores
> +     * the number of received packets into 'count', and returns 0.
>       *
>       * The implementation does not necessarily initialize any non-data
> members
> -     * of 'pkts'.  That is, the caller must initialize layer pointers and
> -     * metadata itself, if desired, e.g. with pkt_metadata_init() and
> -     * miniflow_extract().
> +     * of 'packets' in 'batch'.  That is, the caller must initialize layer
> +     * pointers and metadata itself, if desired, e.g. with
> pkt_metadata_init()
> +     * and miniflow_extract().
>       *
>       * Implementations should allocate buffers with DP_NETDEV_HEADROOM
> bytes of
>       * headroom.
>       *
>       * Returns EAGAIN immediately if no packet is ready to be received or
>       * another positive errno value if an error was encountered. */
> -    int (*rxq_recv)(struct netdev_rxq *rx, struct dp_packet **pkts,
> -                    int *cnt);
> +    int (*rxq_recv)(struct netdev_rxq *rx, struct dp_packet_batch *batch);
>
>      /* Registers with the poll loop to wake up from the next call to
>       * poll_block() when a packet is ready to be received with
> diff --git a/lib/netdev.c b/lib/netdev.c
> index 6651173..405bf41 100644
> --- a/lib/netdev.c
> +++ b/lib/netdev.c
> @@ -625,7 +625,7 @@ netdev_rxq_recv(struct netdev_rxq *rx, struct
> dp_packet_batch *batch)
>  {
>      int retval;
>
> -    retval = rx->netdev->netdev_class->rxq_recv(rx, batch->packets,
> &batch->count);
> +    retval = rx->netdev->netdev_class->rxq_recv(rx,  batch);
>      if (!retval) {
>          COVERAGE_INC(netdev_received);
>      } else {
> @@ -711,9 +711,7 @@ netdev_send(struct netdev *netdev, int qid, struct
> dp_packet_batch *batch,
>          return EOPNOTSUPP;
>      }
>
> -    int error = netdev->netdev_class->send(netdev, qid,
> -                                           batch->packets, batch->count,
> -                                           may_steal);
> +    int error = netdev->netdev_class->send(netdev, qid, batch, may_steal);
>      if (!error) {
>          COVERAGE_INC(netdev_sent);
>          if (!may_steal) {
> --
> 2.5.0
>
> _______________________________________________
> dev mailing list
> [email protected]
> http://openvswitch.org/mailman/listinfo/dev
>
_______________________________________________
dev mailing list
[email protected]
http://openvswitch.org/mailman/listinfo/dev

Re: [ovs-dev] [PATCHv2] netdev-provider: Apply batch object to netdev provider.

Reply via email to