The mlx4 NIC expects the lkey in big-endian format. Store the lkey in this
format to avoid byte-order conversions in the Tx fast path.

Signed-off-by: Ophir Munk <ophi...@mellanox.com>
---
 drivers/net/mlx4/mlx4_rxtx.c | 14 ++++++--------
 drivers/net/mlx4/mlx4_rxtx.h | 10 ++++++----
 2 files changed, 12 insertions(+), 12 deletions(-)

diff --git a/drivers/net/mlx4/mlx4_rxtx.c b/drivers/net/mlx4/mlx4_rxtx.c
index ae37f9b..4e06cca 100644
--- a/drivers/net/mlx4/mlx4_rxtx.c
+++ b/drivers/net/mlx4/mlx4_rxtx.c
@@ -260,10 +260,10 @@ uint32_t mlx4_txq_add_mr(struct txq *txq, struct rte_mempool *mp, uint32_t i)
        /* Store the new entry. */
        txq->mp2mr[i].mp = mp;
        txq->mp2mr[i].mr = mr;
-       txq->mp2mr[i].lkey = mr->lkey;
+       txq->mp2mr[i].be_lkey = rte_cpu_to_be_32(mr->lkey);
        DEBUG("%p: new MR lkey for MP \"%s\" (%p): 0x%08" PRIu32,
-             (void *)txq, mp->name, (void *)mp, txq->mp2mr[i].lkey);
-       return txq->mp2mr[i].lkey;
+             (void *)txq, mp->name, (void *)mp, mr->lkey);
+       return txq->mp2mr[i].be_lkey;
 }
 
 /**
@@ -289,7 +289,6 @@ mlx4_post_send(struct txq *txq, struct rte_mbuf *pkt)
                uint16_t flags16[2];
        } srcrb;
        uint32_t head_idx = sq->head & sq->txbb_cnt_mask;
-       uint32_t lkey;
        uintptr_t addr;
        uint32_t owner_opcode = MLX4_OPCODE_SEND;
        uint32_t byte_count;
@@ -323,10 +322,10 @@ mlx4_post_send(struct txq *txq, struct rte_mbuf *pkt)
                if (unlikely(dseg >= (struct mlx4_wqe_data_seg *)sq->eob))
                        dseg = (struct mlx4_wqe_data_seg *)sq->buf;
                dseg->addr = rte_cpu_to_be_64(addr);
-               /* Memory region key for this memory pool. */
-               lkey = mlx4_txq_mp2mr(txq, mlx4_txq_mb2mp(buf));
+               /* Memory region key (big endian) for this memory pool. */
+               dseg->lkey = mlx4_txq_mp2mr(txq, mlx4_txq_mb2mp(buf));
 #ifndef NDEBUG
-               if (unlikely(lkey == (uint32_t)-1)) {
+               if (unlikely(dseg->lkey == rte_cpu_to_be_32((uint32_t)-1))) {
                        /* MR does not exist. */
                        DEBUG("%p: unable to get MP <-> MR association",
                              (void *)txq);
@@ -341,7 +340,6 @@ mlx4_post_send(struct txq *txq, struct rte_mbuf *pkt)
                        return -EFAULT;
                }
 #endif /* NDEBUG */
-               dseg->lkey = rte_cpu_to_be_32(lkey);
                if (likely(buf->data_len)) {
                        byte_count = rte_cpu_to_be_32(buf->data_len);
                } else {
diff --git a/drivers/net/mlx4/mlx4_rxtx.h b/drivers/net/mlx4/mlx4_rxtx.h
index 719ef45..8d39afb 100644
--- a/drivers/net/mlx4/mlx4_rxtx.h
+++ b/drivers/net/mlx4/mlx4_rxtx.h
@@ -135,7 +135,7 @@ struct txq {
        struct {
                const struct rte_mempool *mp; /**< Cached memory pool. */
                struct ibv_mr *mr; /**< Memory region (for mp). */
-               uint32_t lkey; /**< mr->lkey copy. */
+               uint32_t be_lkey; /**< mr->lkey copy. (big endian) */
        } mp2mr[MLX4_PMD_TX_MP_CACHE]; /**< MP to MR translation table. */
        struct priv *priv; /**< Back pointer to private data. */
        unsigned int socket; /**< CPU socket ID for allocations. */
@@ -220,9 +220,11 @@ mlx4_txq_mp2mr(struct txq *txq, struct rte_mempool *mp)
                        break;
                }
                if (txq->mp2mr[i].mp == mp) {
-                       assert(txq->mp2mr[i].lkey != (uint32_t)-1);
-                       assert(txq->mp2mr[i].mr->lkey == txq->mp2mr[i].lkey);
-                       return txq->mp2mr[i].lkey;
+                       assert(txq->mp2mr[i].be_lkey !=
+                               rte_cpu_to_be_32((uint32_t)-1));
+                       assert(txq->mp2mr[i].mr->lkey ==
+                               rte_be_to_cpu_32(txq->mp2mr[i].be_lkey));
+                       return txq->mp2mr[i].be_lkey;
                }
        }
        return mlx4_txq_add_mr(txq, mp, i);
-- 
2.7.4

Reply via email to