Enable nanosecond-precision timestamps for both live capture and pcap
file reading.

Replace pcap_open_live() with the pcap_create()/pcap_activate() API,
which allows setting PCAP_TSTAMP_PRECISION_NANO before
activation. Similarly, use pcap_open_offline_with_tstamp_precision()
for reading pcap files. The pcap_pkthdr timestamp field, despite being
declared as struct timeval, actually contains nanoseconds (not
microseconds) when nanosecond precision is requested.

Make receive timestamp offloading conditional: timestamps are now only
written to the mbuf dynamic field when RTE_ETH_RX_OFFLOAD_TIMESTAMP is
enabled. Previously, timestamps were unconditionally added to every
received packet.

Other related changes:
* Defer timestamp dynfield registration from probe to device start,
  and only when timestamp offloading is enabled
* Add read_clock dev_op returning current UTC time
  for timestamp correlation
* Move per-burst timestamp calculation outside the packet loop in
  tx_dumper
* Enable immediate mode and improve error reporting
  in live capture setup

Signed-off-by: Stephen Hemminger <[email protected]>
---
 doc/guides/rel_notes/release_26_03.rst |   2 +
 drivers/net/pcap/pcap_ethdev.c         | 129 +++++++++++++++++++------
 2 files changed, 102 insertions(+), 29 deletions(-)

diff --git a/doc/guides/rel_notes/release_26_03.rst 
b/doc/guides/rel_notes/release_26_03.rst
index 4e31d85e50..a1536033f7 100644
--- a/doc/guides/rel_notes/release_26_03.rst
+++ b/doc/guides/rel_notes/release_26_03.rst
@@ -59,6 +59,8 @@ New Features
 
   * Added support for setting MTU in single interface mode.
   * Added support for VLAN insertion and stripping.
+  * Receive timestamp offload is only done if offload flag set.
+  * Receive timestamps support nanosecond precision.
   * Changed transmit burst to always return the number of packets requested.
     Failed sends are counted as transmit errors.
 
diff --git a/drivers/net/pcap/pcap_ethdev.c b/drivers/net/pcap/pcap_ethdev.c
index 85225fca2d..1c53a47bc6 100644
--- a/drivers/net/pcap/pcap_ethdev.c
+++ b/drivers/net/pcap/pcap_ethdev.c
@@ -27,13 +27,12 @@
 #include <rte_mbuf_dyn.h>
 #include <bus_vdev_driver.h>
 #include <rte_os_shim.h>
+#include <rte_time.h>
 
 #include "pcap_osdep.h"
 
 #define RTE_ETH_PCAP_SNAPSHOT_LEN 65535
 #define RTE_ETH_PCAP_SNAPLEN (RTE_ETHER_MAX_JUMBO_FRAME_LEN - 
RTE_ETHER_CRC_LEN)
-#define RTE_ETH_PCAP_PROMISC 1
-#define RTE_ETH_PCAP_TIMEOUT -1
 
 #define ETH_PCAP_RX_PCAP_ARG  "rx_pcap"
 #define ETH_PCAP_TX_PCAP_ARG  "tx_pcap"
@@ -77,6 +76,7 @@ struct pcap_rx_queue {
        uint16_t port_id;
        uint16_t queue_id;
        bool vlan_strip;
+       bool timestamp_offloading;
        struct rte_mempool *mb_pool;
        struct queue_stat rx_stat;
        struct queue_missed_stat missed_stat;
@@ -105,6 +105,7 @@ struct pmd_internals {
        bool phy_mac;
        bool infinite_rx;
        bool vlan_strip;
+       bool timestamp_offloading;
 };
 
 struct pmd_process_private {
@@ -339,10 +340,20 @@ eth_pcap_rx(void *queue, struct rte_mbuf **bufs, uint16_t 
nb_pkts)
                if (pcap_q->vlan_strip)
                        rte_vlan_strip(mbuf);
 
-               uint64_t us = (uint64_t)header->ts.tv_sec * US_PER_S + 
header->ts.tv_usec;
+               if (pcap_q->timestamp_offloading) {
+                       /*
+                        * Although time stamp in struct pcap_pkthdr is defined 
as struct timeval,
+                        * it really is a timespec with nanosecond resolution.
+                        */
+                       uint64_t ns = (uint64_t)header->ts.tv_sec * NSEC_PER_SEC
+                               +  header->ts.tv_usec;
+
+                       *RTE_MBUF_DYNFIELD(mbuf, timestamp_dynfield_offset,
+                                          rte_mbuf_timestamp_t *) = ns;
+
+                       mbuf->ol_flags |= timestamp_rx_dynflag;
+               }
 
-               *RTE_MBUF_DYNFIELD(mbuf, timestamp_dynfield_offset, 
rte_mbuf_timestamp_t *) = us;
-               mbuf->ol_flags |= timestamp_rx_dynflag;
                mbuf->port = pcap_q->port_id;
                bufs[num_rx] = mbuf;
                num_rx++;
@@ -362,14 +373,13 @@ eth_null_rx(void *queue __rte_unused,
        return 0;
 }
 
-#define NSEC_PER_SEC   1000000000L
-
 /*
  * This function stores nanoseconds in `tv_usec` field of `struct timeval`,
  * because `ts` goes directly to nanosecond-precision dump.
  */
 static inline void
-calculate_timestamp(struct timeval *ts) {
+calculate_timestamp(struct timeval *ts)
+{
        uint64_t cycles;
        struct timespec cur_time;
 
@@ -420,6 +430,9 @@ eth_pcap_tx_dumper(void *queue, struct rte_mbuf **bufs, 
uint16_t nb_pkts)
        if (unlikely(dumper == NULL || nb_pkts == 0))
                return 0;
 
+       /* all packets in burst have same timestamp */
+       calculate_timestamp(&header.ts);
+
        /* writes the nb_pkts packets to the previously opened pcap file dumper 
*/
        for (i = 0; i < nb_pkts; i++) {
                struct rte_mbuf *mbuf = bufs[i];
@@ -433,7 +446,6 @@ eth_pcap_tx_dumper(void *queue, struct rte_mbuf **bufs, 
uint16_t nb_pkts)
                                continue;
                }
 
-               calculate_timestamp(&header.ts);
                header.len = len;
                header.caplen = len;
 
@@ -536,22 +548,60 @@ eth_pcap_tx(void *queue, struct rte_mbuf **bufs, uint16_t 
nb_pkts)
  * pcap_open_live wrapper function
  */
 static inline int
-open_iface_live(const char *iface, pcap_t **pcap) {
-       *pcap = pcap_open_live(iface, RTE_ETH_PCAP_SNAPLEN,
-                       RTE_ETH_PCAP_PROMISC, RTE_ETH_PCAP_TIMEOUT, errbuf);
+open_iface_live(const char *iface, pcap_t **pcap)
+{
+       pcap_t *pc;
+       int status;
 
-       if (*pcap == NULL) {
-               PMD_LOG(ERR, "Couldn't open %s: %s", iface, errbuf);
-               return -1;
+       pc = pcap_create(iface, errbuf);
+       if (pc == NULL) {
+               PMD_LOG(ERR, "Couldn't create %s: %s", iface, errbuf);
+               goto error;
        }
 
-       if (pcap_setnonblock(*pcap, 1, errbuf)) {
+       status = pcap_set_tstamp_precision(pc, PCAP_TSTAMP_PRECISION_NANO);
+       if (status != 0)
+               PMD_LOG(WARNING, "%s: Could not set to ns precision: %s",
+                       iface, pcap_statustostr(status));
+
+       status = pcap_set_immediate_mode(pc, 1);
+       if (status != 0)
+               PMD_LOG(WARNING, "%s: Could not set to immediate mode: %s",
+                       iface, pcap_statustostr(status));
+
+       status = pcap_set_promisc(pc, 1);
+       if (status != 0)
+               PMD_LOG(WARNING, "%s: Could not set to promiscuous: %s",
+                       iface, pcap_statustostr(status));
+
+       status = pcap_set_snaplen(pc, RTE_ETH_PCAP_SNAPSHOT_LEN);
+       if (status != 0)
+               PMD_LOG(WARNING, "%s: Could not set snapshot length: %s",
+                       iface, pcap_statustostr(status));
+
+       status = pcap_activate(pc);
+       if (status < 0) {
+               char *cp = pcap_geterr(pc);
+
+               if (status == PCAP_ERROR)
+                       PMD_LOG(ERR, "%s: could not activate: %s", iface, cp);
+               else
+                       PMD_LOG(ERR, "%s: %s (%s)", iface, 
pcap_statustostr(status), cp);
+               goto error;
+       }
+
+       if (pcap_setnonblock(pc, 1, errbuf)) {
                PMD_LOG(ERR, "Couldn't set non-blocking on %s: %s", iface, 
errbuf);
-               pcap_close(*pcap);
-               return -1;
+               goto error;
        }
 
+       *pcap = pc;
        return 0;
+
+error:
+       if (pc != NULL)
+               pcap_close(pc);
+       return -1;
 }
 
 static int
@@ -598,7 +648,8 @@ open_single_tx_pcap(const char *pcap_filename, 
pcap_dumper_t **dumper)
 static int
 open_single_rx_pcap(const char *pcap_filename, pcap_t **pcap)
 {
-       *pcap = pcap_open_offline(pcap_filename, errbuf);
+       *pcap = pcap_open_offline_with_tstamp_precision(pcap_filename,
+                                                       
PCAP_TSTAMP_PRECISION_NANO, errbuf);
        if (*pcap == NULL) {
                PMD_LOG(ERR, "Couldn't open %s: %s", pcap_filename,
                        errbuf);
@@ -635,6 +686,15 @@ eth_dev_start(struct rte_eth_dev *dev)
        struct pcap_tx_queue *tx;
        struct pcap_rx_queue *rx;
 
+       if (internals->timestamp_offloading) {
+               int ret = 
rte_mbuf_dyn_rx_timestamp_register(&timestamp_dynfield_offset,
+                                                            
&timestamp_rx_dynflag);
+               if (ret != 0) {
+                       PMD_LOG(ERR, "Failed to register Rx timestamp 
field/flag");
+                       return ret;
+               }
+       }
+
        /* Special iface case. Single pcap is open and shared between tx/rx. */
        if (internals->single_iface) {
                tx = &internals->tx_queue[0];
@@ -757,6 +817,7 @@ eth_dev_configure(struct rte_eth_dev *dev)
        const struct rte_eth_rxmode *rxmode = &dev_conf->rxmode;
 
        internals->vlan_strip = !!(rxmode->offloads & 
RTE_ETH_RX_OFFLOAD_VLAN_STRIP);
+       internals->timestamp_offloading = !!(rxmode->offloads & 
RTE_ETH_RX_OFFLOAD_TIMESTAMP);
        return 0;
 }
 
@@ -776,7 +837,8 @@ eth_dev_info(struct rte_eth_dev *dev,
        dev_info->max_mtu = RTE_ETH_PCAP_SNAPLEN;
        dev_info->tx_offload_capa = RTE_ETH_TX_OFFLOAD_MULTI_SEGS |
                RTE_ETH_TX_OFFLOAD_VLAN_INSERT;
-       dev_info->rx_offload_capa = RTE_ETH_RX_OFFLOAD_VLAN_STRIP;
+       dev_info->rx_offload_capa = RTE_ETH_RX_OFFLOAD_VLAN_STRIP |
+               RTE_ETH_RX_OFFLOAD_TIMESTAMP;
 
        return 0;
 }
@@ -925,6 +987,7 @@ eth_rx_queue_setup(struct rte_eth_dev *dev,
        pcap_q->queue_id = rx_queue_id;
        pcap_q->vlan_strip = internals->vlan_strip;
        dev->data->rx_queues[rx_queue_id] = pcap_q;
+       pcap_q->timestamp_offloading = internals->timestamp_offloading;
 
        if (internals->infinite_rx) {
                struct pmd_process_private *pp;
@@ -1046,6 +1109,17 @@ eth_mtu_set(struct rte_eth_dev *dev, uint16_t mtu)
        return 0;
 }
 
+/* Timestamp values in receive packets from libpcap are in nanoseconds */
+static int
+ns_read_clock(struct rte_eth_dev *dev __rte_unused, uint64_t *timestamp)
+{
+       struct timespec cur_time;
+
+       timespec_get(&cur_time, TIME_UTC);
+       *timestamp = rte_timespec_to_ns(&cur_time);
+       return 0;
+}
+
 static const struct eth_dev_ops ops = {
        .dev_start = eth_dev_start,
        .dev_stop = eth_dev_stop,
@@ -1062,6 +1136,7 @@ static const struct eth_dev_ops ops = {
        .mtu_set = eth_mtu_set,
        .stats_get = eth_stats_get,
        .stats_reset = eth_stats_reset,
+       .read_clock = ns_read_clock,
 };
 
 static int
@@ -1461,15 +1536,11 @@ pmd_pcap_probe(struct rte_vdev_device *dev)
        name = rte_vdev_device_name(dev);
        PMD_LOG(INFO, "Initializing pmd_pcap for %s", name);
 
-       timespec_get(&start_time, TIME_UTC);
-       start_cycles = rte_get_timer_cycles();
-       hz = rte_get_timer_hz();
-
-       ret = rte_mbuf_dyn_rx_timestamp_register(&timestamp_dynfield_offset,
-                       &timestamp_rx_dynflag);
-       if (ret != 0) {
-               PMD_LOG(ERR, "Failed to register Rx timestamp field/flag");
-               return -1;
+       /* Record info for timestamps on first probe */
+       if (hz == 0) {
+               timespec_get(&start_time, TIME_UTC);
+               start_cycles = rte_get_timer_cycles();
+               hz = rte_get_timer_hz();
        }
 
        if (rte_eal_process_type() == RTE_PROC_SECONDARY) {
-- 
2.51.0

Reply via email to