Wednesday, October 31, 2018 9:11 AM, Dekel Peled:
> Subject: [dpdk-dev] [PATCH v7 7/7] net/mlx5: add caching of encap decap
> actions
> 
> Make flow encap and decap Verbs actions cacheable resources.
> Reuse 17.11 PR 876.

No one knows what is PR 876 in the mailing list, also this code is not in 17.11 
community. 
Need to make a proper commit log here explains how you do the caching and why 
it is needed. 

> 
> Signed-off-by: Dekel Peled <dek...@mellanox.com>
> ---
>  drivers/net/mlx5/mlx5.h         |   1 +
>  drivers/net/mlx5/mlx5_flow.h    |  18 ++-
>  drivers/net/mlx5/mlx5_flow_dv.c | 265 ++++++++++++++++++++++++++---
> -----------
>  3 files changed, 193 insertions(+), 91 deletions(-)
> 
> diff --git a/drivers/net/mlx5/mlx5.h b/drivers/net/mlx5/mlx5.h index
> 74d87c0..0422803 100644
> --- a/drivers/net/mlx5/mlx5.h
> +++ b/drivers/net/mlx5/mlx5.h
> @@ -219,6 +219,7 @@ struct priv {
>       /* Verbs Indirection tables. */
>       LIST_HEAD(ind_tables, mlx5_ind_table_ibv) ind_tbls;
>       LIST_HEAD(matchers, mlx5_flow_dv_matcher) matchers;
> +     LIST_HEAD(encap_decap, mlx5_flow_dv_encap_decap_resource)
> +encaps_decaps;
>       uint32_t link_speed_capa; /* Link speed capabilities. */
>       struct mlx5_xstats_ctrl xstats_ctrl; /* Extended stats control. */
>       int primary_socket; /* Unix socket for primary process. */ diff --git
> a/drivers/net/mlx5/mlx5_flow.h b/drivers/net/mlx5/mlx5_flow.h index
> 908123f..25cd9c5 100644
> --- a/drivers/net/mlx5/mlx5_flow.h
> +++ b/drivers/net/mlx5/mlx5_flow.h
> @@ -170,6 +170,7 @@ struct mlx5_flow_dv_match_params {  };
> 
>  #define MLX5_DV_MAX_NUMBER_OF_ACTIONS 8
> +#define MLX5_ENCAP_MAX_LEN 132
> 
>  /* Matcher structure. */
>  struct mlx5_flow_dv_matcher {
> @@ -183,6 +184,19 @@ struct mlx5_flow_dv_matcher {
>       struct mlx5_flow_dv_match_params mask; /**< Matcher mask. */  };
> 
> +/* Encap/decap resource structure. */
> +struct mlx5_flow_dv_encap_decap_resource {
> +     LIST_ENTRY(mlx5_flow_dv_encap_decap_resource) next;
> +     /* Pointer to next element. */
> +     rte_atomic32_t refcnt; /**< Reference counter. */
> +     struct ibv_flow_action *verbs_action;
> +     /**< Verbs encap/decap action object. */
> +     uint8_t buf[MLX5_ENCAP_MAX_LEN];
> +     size_t size;
> +     uint8_t reformat_type;
> +     uint8_t ft_type;
> +};
> +
>  /* DV flows structure. */
>  struct mlx5_flow_dv {
>       uint64_t hash_fields; /**< Fields that participate in the hash. */ @@
> -191,12 +205,12 @@ struct mlx5_flow_dv {
>       struct mlx5_flow_dv_matcher *matcher; /**< Cache to matcher. */
>       struct mlx5_flow_dv_match_params value;
>       /**< Holds the value that the packet is compared to. */
> +     struct mlx5_flow_dv_encap_decap_resource *encap_decap;
> +     /**< Pointer to encap/decap resource in cache. */
>       struct ibv_flow *flow; /**< Installed flow. */  #ifdef
> HAVE_IBV_FLOW_DV_SUPPORT
>       struct mlx5dv_flow_action_attr
> actions[MLX5_DV_MAX_NUMBER_OF_ACTIONS];
>       /**< Action list. */
> -     struct ibv_flow_action *encap_decap_verbs_action;
> -     /**< Verbs encap/decap object. */
>  #endif
>       int actions_n; /**< number of actions. */  }; diff --git
> a/drivers/net/mlx5/mlx5_flow_dv.c b/drivers/net/mlx5/mlx5_flow_dv.c
> index d1c811f..818b30c 100644
> --- a/drivers/net/mlx5/mlx5_flow_dv.c
> +++ b/drivers/net/mlx5/mlx5_flow_dv.c
> @@ -34,8 +34,6 @@
> 
>  #ifdef HAVE_IBV_FLOW_DV_SUPPORT
> 
> -#define MLX5_ENCAP_MAX_LEN 132
> -
>  /**
>   * Validate META item.
>   *
> @@ -271,6 +269,77 @@
>       return 0;
>  }
> 
> +
> +/**
> + * Find existing encap/decap resource or create and register a new one.
> + *
> + * @param dev[in, out]
> + *   Pointer to rte_eth_dev structure.
> + * @param[in, out] resource
> + *   Pointer to encap/decap resource.
> + * @parm[in, out] dev_flow
> + *   Pointer to the dev_flow.
> + * @param[out] error
> + *   pointer to error structure.
> + *
> + * @return
> + *   0 on success otherwise -errno and errno is set.
> + */
> +static int
> +flow_dv_encap_decap_resource_register
> +                     (struct rte_eth_dev *dev,
> +                      struct mlx5_flow_dv_encap_decap_resource
> *resource,
> +                      struct mlx5_flow *dev_flow,
> +                      struct rte_flow_error *error)
> +{
> +     struct priv *priv = dev->data->dev_private;
> +     struct mlx5_flow_dv_encap_decap_resource *cache_resource;
> +
> +     /* Lookup a matching resource from cache. */
> +     LIST_FOREACH(cache_resource, &priv->encaps_decaps, next) {
> +             if (resource->reformat_type == cache_resource-
> >reformat_type &&
> +                 resource->ft_type == cache_resource->ft_type &&
> +                 resource->size == cache_resource->size &&
> +                 !memcmp((const void *)resource->buf,
> +                         (const void *)cache_resource->buf,
> +                         resource->size)) {
> +                     DRV_LOG(DEBUG, "encap/decap resource %p: refcnt
> %d++",
> +                             (void *)cache_resource,
> +                             rte_atomic32_read(&cache_resource-
> >refcnt));
> +                     rte_atomic32_inc(&cache_resource->refcnt);
> +                     dev_flow->dv.encap_decap = cache_resource;
> +                     return 0;
> +             }
> +     }
> +     /* Register new encap/decap resource. */
> +     cache_resource = rte_calloc(__func__, 1, sizeof(*cache_resource),
> 0);
> +     if (!cache_resource)
> +             return rte_flow_error_set(error, ENOMEM,
> +
> RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
> +                                       "cannot allocate resource
> memory");
> +     *cache_resource = *resource;
> +     cache_resource->verbs_action =
> +             mlx5_glue->dv_create_flow_action_packet_reformat
> +                     (priv->ctx, cache_resource->size,
> +                      (cache_resource->size ? cache_resource->buf :
> NULL),
> +                      cache_resource->reformat_type,
> +                      cache_resource->ft_type);
> +     if (!cache_resource->verbs_action) {
> +             rte_free(cache_resource);
> +             return rte_flow_error_set(error, ENOMEM,
> +
> RTE_FLOW_ERROR_TYPE_UNSPECIFIED,
> +                                       NULL, "cannot create action");
> +     }
> +     rte_atomic32_init(&cache_resource->refcnt);
> +     rte_atomic32_inc(&cache_resource->refcnt);
> +     LIST_INSERT_HEAD(&priv->encaps_decaps, cache_resource, next);
> +     dev_flow->dv.encap_decap = cache_resource;
> +     DRV_LOG(DEBUG, "new encap/decap resource %p: refcnt %d++",
> +             (void *)cache_resource,
> +             rte_atomic32_read(&cache_resource->refcnt));
> +     return 0;
> +}
> +
>  /**
>   * Get the size of specific rte_flow_item_type
>   *
> @@ -505,31 +574,33 @@
>   *   Pointer to rte_eth_dev structure.
>   * @param[in] action
>   *   Pointer to action structure.
> + * @param[in, out] dev_flow
> + *   Pointer to the mlx5_flow.
>   * @param[out] error
>   *   Pointer to the error structure.
>   *
>   * @return
> - *   Pointer to action on success, NULL otherwise and rte_errno is set.
> + *   0 on success, a negative errno value otherwise and rte_errno is set.
>   */
> -static struct ibv_flow_action *
> +static int
>  flow_dv_create_action_l2_encap(struct rte_eth_dev *dev,
>                              const struct rte_flow_action *action,
> +                            struct mlx5_flow *dev_flow,
>                              struct rte_flow_error *error)  {
> -     struct ibv_flow_action *verbs_action = NULL;
>       const struct rte_flow_item *encap_data;
>       const struct rte_flow_action_raw_encap *raw_encap_data;
> -     struct priv *priv = dev->data->dev_private;
> -     uint8_t buf[MLX5_ENCAP_MAX_LEN];
> -     uint8_t *buf_ptr = buf;
> -     size_t size = 0;
> -     int convert_result = 0;
> +     struct mlx5_flow_dv_encap_decap_resource res = {
> +             .reformat_type =
> +
>       MLX5DV_FLOW_ACTION_PACKET_REFORMAT_TYPE_L2_TO_L2_TU
> NNEL,
> +             .ft_type = MLX5DV_FLOW_TABLE_TYPE_NIC_TX,
> +     };
> 
>       if (action->type == RTE_FLOW_ACTION_TYPE_RAW_ENCAP) {
>               raw_encap_data =
>                       (const struct rte_flow_action_raw_encap *)action-
> >conf;
> -             buf_ptr = raw_encap_data->data;
> -             size = raw_encap_data->size;
> +             res.size = raw_encap_data->size;
> +             memcpy(res.buf, raw_encap_data->data, res.size);
>       } else {
>               if (action->type ==
> RTE_FLOW_ACTION_TYPE_VXLAN_ENCAP)
>                       encap_data =
> @@ -539,19 +610,15 @@
>                       encap_data =
>                               ((const struct rte_flow_action_nvgre_encap
> *)
>                                               action->conf)->definition;
> -             convert_result = flow_dv_convert_encap_data(encap_data,
> buf,
> -                                                         &size, error);
> -             if (convert_result)
> -                     return NULL;
> +             if (flow_dv_convert_encap_data(encap_data, res.buf,
> +                                            &res.size, error))
> +                     return -rte_errno;
>       }
> -     verbs_action = mlx5_glue-
> >dv_create_flow_action_packet_reformat
> -             (priv->ctx, size, buf_ptr,
> -
> MLX5DV_FLOW_ACTION_PACKET_REFORMAT_TYPE_L2_TO_L2_TUNNEL,
> -              MLX5DV_FLOW_TABLE_TYPE_NIC_TX);
> -     if (!verbs_action)
> -             rte_flow_error_set(error, EINVAL,
> RTE_FLOW_ERROR_TYPE_ACTION,
> -                                NULL, "cannot create L2 encap action");
> -     return verbs_action;
> +     if (flow_dv_encap_decap_resource_register(dev, &res, dev_flow,
> error))
> +             return rte_flow_error_set(error, EINVAL,
> +                                       RTE_FLOW_ERROR_TYPE_ACTION,
> +                                       NULL, "can't create L2 encap
> action");
> +     return 0;
>  }
> 
>  /**
> @@ -559,27 +626,31 @@
>   *
>   * @param[in] dev
>   *   Pointer to rte_eth_dev structure.
> + * @param[in, out] dev_flow
> + *   Pointer to the mlx5_flow.
>   * @param[out] error
>   *   Pointer to the error structure.
>   *
>   * @return
> - *   Pointer to action on success, NULL otherwise and rte_errno is set.
> + *   0 on success, a negative errno value otherwise and rte_errno is set.
>   */
> -static struct ibv_flow_action *
> +static int
>  flow_dv_create_action_l2_decap(struct rte_eth_dev *dev,
> +                            struct mlx5_flow *dev_flow,
>                              struct rte_flow_error *error)  {
> -     struct ibv_flow_action *verbs_action = NULL;
> -     struct priv *priv = dev->data->dev_private;
> +     struct mlx5_flow_dv_encap_decap_resource res = {
> +             .size = 0,
> +             .reformat_type =
> +
>       MLX5DV_FLOW_ACTION_PACKET_REFORMAT_TYPE_L2_TUNNEL_T
> O_L2,
> +             .ft_type = MLX5DV_FLOW_TABLE_TYPE_NIC_RX,
> +     };
> 
> -     verbs_action = mlx5_glue-
> >dv_create_flow_action_packet_reformat
> -             (priv->ctx, 0, NULL,
> -
> MLX5DV_FLOW_ACTION_PACKET_REFORMAT_TYPE_L2_TUNNEL_TO_L2,
> -              MLX5DV_FLOW_TABLE_TYPE_NIC_RX);
> -     if (!verbs_action)
> -             rte_flow_error_set(error, EINVAL,
> RTE_FLOW_ERROR_TYPE_ACTION,
> -                                NULL, "cannot create L2 decap action");
> -     return verbs_action;
> +     if (flow_dv_encap_decap_resource_register(dev, &res, dev_flow,
> error))
> +             return rte_flow_error_set(error, EINVAL,
> +                                       RTE_FLOW_ERROR_TYPE_ACTION,
> +                                       NULL, "can't create L2 decap
> action");
> +     return 0;
>  }
> 
>  /**
> @@ -589,41 +660,39 @@
>   *   Pointer to rte_eth_dev structure.
>   * @param[in] action
>   *   Pointer to action structure.
> + * @param[in, out] dev_flow
> + *   Pointer to the mlx5_flow.
>   * @param[in] attr
>   *   Pointer to the flow attributes.
>   * @param[out] error
>   *   Pointer to the error structure.
>   *
>   * @return
> - *   Pointer to action on success, NULL otherwise and rte_errno is set.
> + *   0 on success, a negative errno value otherwise and rte_errno is set.
>   */
> -static struct ibv_flow_action *
> +static int
>  flow_dv_create_action_raw_encap(struct rte_eth_dev *dev,
>                               const struct rte_flow_action *action,
> +                             struct mlx5_flow *dev_flow,
>                               const struct rte_flow_attr *attr,
>                               struct rte_flow_error *error)
>  {
> -     struct ibv_flow_action *verbs_action = NULL;
>       const struct rte_flow_action_raw_encap *encap_data;
> -     struct priv *priv = dev->data->dev_private;
> -     enum mlx5dv_flow_action_packet_reformat_type reformat_type;
> -     enum mlx5dv_flow_table_type ft_type;
> +     struct mlx5_flow_dv_encap_decap_resource res;
> 
>       encap_data = (const struct rte_flow_action_raw_encap *)action-
> >conf;
> -     reformat_type = attr->egress ?
> +     res.size = encap_data->size;
> +     memcpy(res.buf, encap_data->data, res.size);
> +     res.reformat_type = attr->egress ?
> 
>       MLX5DV_FLOW_ACTION_PACKET_REFORMAT_TYPE_L2_TO_L3_TU
> NNEL :
> 
>       MLX5DV_FLOW_ACTION_PACKET_REFORMAT_TYPE_L3_TUNNEL_T
> O_L2;
> -     ft_type = attr->egress ?
> -                     MLX5DV_FLOW_TABLE_TYPE_NIC_TX :
> -                     MLX5DV_FLOW_TABLE_TYPE_NIC_RX;
> -     verbs_action = mlx5_glue-
> >dv_create_flow_action_packet_reformat
> -                             (priv->ctx, encap_data->size,
> -                             (encap_data->size ? encap_data->data :
> NULL),
> -                             reformat_type, ft_type);
> -     if (!verbs_action)
> -             rte_flow_error_set(error, EINVAL,
> RTE_FLOW_ERROR_TYPE_ACTION,
> -                                NULL, "cannot create encap action");
> -     return verbs_action;
> +     res.ft_type = attr->egress ? MLX5DV_FLOW_TABLE_TYPE_NIC_TX :
> +                                  MLX5DV_FLOW_TABLE_TYPE_NIC_RX;
> +     if (flow_dv_encap_decap_resource_register(dev, &res, dev_flow,
> error))
> +             return rte_flow_error_set(error, EINVAL,
> +                                       RTE_FLOW_ERROR_TYPE_ACTION,
> +                                       NULL, "can't create encap action");
> +     return 0;
>  }
> 
>  /**
> @@ -1689,15 +1758,13 @@
>               break;
>       case RTE_FLOW_ACTION_TYPE_VXLAN_ENCAP:
>       case RTE_FLOW_ACTION_TYPE_NVGRE_ENCAP:
> +             if (flow_dv_create_action_l2_encap(dev, action,
> +                                                dev_flow, error))
> +                     return -rte_errno;
>               dev_flow->dv.actions[actions_n].type =
>                       MLX5DV_FLOW_ACTION_IBV_FLOW_ACTION;
>               dev_flow->dv.actions[actions_n].action =
> -                             flow_dv_create_action_l2_encap(dev,
> action,
> -                                                            error);
> -             if (!(dev_flow->dv.actions[actions_n].action))
> -                     return -rte_errno;
> -             dev_flow->dv.encap_decap_verbs_action =
> -                     dev_flow->dv.actions[actions_n].action;
> +                     dev_flow->dv.encap_decap->verbs_action;
>               flow->actions |= action->type ==
>                                RTE_FLOW_ACTION_TYPE_VXLAN_ENCAP ?
>                                MLX5_FLOW_ACTION_VXLAN_ENCAP :
> @@ -1706,14 +1773,12 @@
>               break;
>       case RTE_FLOW_ACTION_TYPE_VXLAN_DECAP:
>       case RTE_FLOW_ACTION_TYPE_NVGRE_DECAP:
> +             if (flow_dv_create_action_l2_decap(dev, dev_flow, error))
> +                     return -rte_errno;
>               dev_flow->dv.actions[actions_n].type =
>                       MLX5DV_FLOW_ACTION_IBV_FLOW_ACTION;
>               dev_flow->dv.actions[actions_n].action =
> -                             flow_dv_create_action_l2_decap(dev,
> error);
> -             if (!(dev_flow->dv.actions[actions_n].action))
> -                     return -rte_errno;
> -             dev_flow->dv.encap_decap_verbs_action =
> -                     dev_flow->dv.actions[actions_n].action;
> +                     dev_flow->dv.encap_decap->verbs_action;
>               flow->actions |= action->type ==
>                                RTE_FLOW_ACTION_TYPE_VXLAN_DECAP ?
>                                MLX5_FLOW_ACTION_VXLAN_DECAP :
> @@ -1723,27 +1788,23 @@
>       case RTE_FLOW_ACTION_TYPE_RAW_ENCAP:
>               /* Handle encap action with preceding decap */
>               if (flow->actions & MLX5_FLOW_ACTION_RAW_DECAP) {
> +                     if (flow_dv_create_action_raw_encap(dev, action,
> +                                                         dev_flow,
> +                                                         attr, error))
> +                             return -rte_errno;
>                       dev_flow->dv.actions[actions_n].type =
> 
>       MLX5DV_FLOW_ACTION_IBV_FLOW_ACTION;
>                       dev_flow->dv.actions[actions_n].action =
> -                                     flow_dv_create_action_raw_encap
> -                                                             (dev, action,
> -                                                              attr, error);
> -                     if (!(dev_flow->dv.actions[actions_n].action))
> -                             return -rte_errno;
> -                     dev_flow->dv.encap_decap_verbs_action =
> -                             dev_flow->dv.actions[actions_n].action;
> +                                     dev_flow->dv.encap_decap-
> >verbs_action;
>               } else {
>                       /* Handle encap action without preceding decap */
> +                     if (flow_dv_create_action_l2_encap(dev, action,
> +                                                        dev_flow, error))
> +                             return -rte_errno;
>                       dev_flow->dv.actions[actions_n].type =
> 
>       MLX5DV_FLOW_ACTION_IBV_FLOW_ACTION;
>                       dev_flow->dv.actions[actions_n].action =
> -                                     flow_dv_create_action_l2_encap
> -                                                     (dev, action, error);
> -                     if (!(dev_flow->dv.actions[actions_n].action))
> -                             return -rte_errno;
> -                     dev_flow->dv.encap_decap_verbs_action =
> -                             dev_flow->dv.actions[actions_n].action;
> +                                     dev_flow->dv.encap_decap-
> >verbs_action;
>               }
>               flow->actions |= MLX5_FLOW_ACTION_RAW_ENCAP;
>               actions_n++;
> @@ -1756,15 +1817,13 @@
>               }
>               /* Handle decap action only if it isn't followed by encap */
>               if (action_ptr->type !=
> RTE_FLOW_ACTION_TYPE_RAW_ENCAP) {
> +                     if (flow_dv_create_action_l2_decap(dev, dev_flow,
> +                                                        error))
> +                             return -rte_errno;
>                       dev_flow->dv.actions[actions_n].type =
> 
>       MLX5DV_FLOW_ACTION_IBV_FLOW_ACTION;
>                       dev_flow->dv.actions[actions_n].action =
> -
>       flow_dv_create_action_l2_decap(dev,
> -                                                                    error);
> -                     if (!(dev_flow->dv.actions[actions_n].action))
> -                             return -rte_errno;
> -                     dev_flow->dv.encap_decap_verbs_action =
> -                             dev_flow->dv.actions[actions_n].action;
> +                                     dev_flow->dv.encap_decap-
> >verbs_action;
>                       actions_n++;
>               }
>               /* If decap is followed by encap, handle it at encap case. */
> @@ -2074,6 +2133,37 @@  }
> 
>  /**
> + * Release an encap/decap resource.
> + *
> + * @param flow
> + *   Pointer to mlx5_flow.
> + *
> + * @return
> + *   1 while a reference on it exists, 0 when freed.
> + */
> +static int
> +flow_dv_encap_decap_resource_release(struct mlx5_flow *flow) {
> +     struct mlx5_flow_dv_encap_decap_resource *cache_resource =
> +                                             flow->dv.encap_decap;
> +
> +     assert(cache_resource->verbs_action);
> +     DRV_LOG(DEBUG, "encap/decap resource %p: refcnt %d--",
> +             (void *)cache_resource,
> +             rte_atomic32_read(&cache_resource->refcnt));
> +     if (rte_atomic32_dec_and_test(&cache_resource->refcnt)) {
> +             claim_zero(mlx5_glue->destroy_flow_action
> +                             (cache_resource->verbs_action));
> +             LIST_REMOVE(cache_resource, next);
> +             rte_free(cache_resource);
> +             DRV_LOG(DEBUG, "encap/decap resource %p: removed",
> +                     cache_resource);
> +             return 0;
> +     }
> +     return 1;
> +}
> +
> +/**
>   * Remove the flow from the NIC but keeps it in memory.
>   *
>   * @param[in] dev
> @@ -2128,11 +2218,8 @@
>               LIST_REMOVE(dev_flow, next);
>               if (dev_flow->dv.matcher)
>                       flow_dv_matcher_release(dev, dev_flow);
> -             if (dev_flow->dv.encap_decap_verbs_action) {
> -                     claim_zero(mlx5_glue->destroy_flow_action
> -                             (dev_flow->dv.encap_decap_verbs_action));
> -                     dev_flow->dv.encap_decap_verbs_action = NULL;
> -             }
> +             if (dev_flow->dv.encap_decap)
> +
>       flow_dv_encap_decap_resource_release(dev_flow);
>               rte_free(dev_flow);
>       }
>  }
> --
> 1.8.3.1

Reply via email to