> -----Original Message-----
> From: Guo, Junfeng <junfeng....@intel.com>
> Sent: Thursday, October 28, 2021 5:14 PM
> To: Zhang, Qi Z <qi.z.zh...@intel.com>; Wu, Jingjing <jingjing...@intel.com>;
> Xing, Beilei <beilei.x...@intel.com>
> Cc: dev@dpdk.org; Yigit, Ferruh <ferruh.yi...@intel.com>; Xu, Ting
> <ting...@intel.com>; Guo, Junfeng <junfeng....@intel.com>
> Subject: [PATCH v7 4/4] net/ice: enable protocol agnostic flow offloading in
> FDIR
>
> Protocol agnostic flow offloading in Flow Director is enabled by this patch
> based on the Parser Library, using existing rte_flow raw API.
>
> Note that the raw flow requires:
> 1. byte string of raw target packet bits.
> 2. byte string of mask of target packet.
>
> Here is an example:
> FDIR matching ipv4 dst addr with 1.2.3.4 and redirect to queue 3:
>
> flow create 0 ingress pattern raw \
> pattern spec \
> 0000000000000000000000000800450000140000400040100000000000000
> 1020304 \ pattern mask \
> 000000000000000000000000000000000000000000000000000000000000ff
> ffffff \ / end actions queue index 3 / mark id 3 / end
>
> Note that mask of some key bits (e.g., 0x0800 to indicate ipv4 proto) is
> optional in our cases. To avoid redundancy, we just omit the mask of 0x0800
> (with 0xFFFF) in the mask byte string example. The prefix '0x' for the spec
> and
> mask byte (hex) strings are also omitted here.
>
> Signed-off-by: Junfeng Guo <junfeng....@intel.com>
> ---
> doc/guides/rel_notes/release_21_11.rst | 1 +
> drivers/net/ice/ice_ethdev.h | 17 ++
> drivers/net/ice/ice_fdir_filter.c | 260 +++++++++++++++++++++++++
> drivers/net/ice/ice_generic_flow.c | 7 +
> drivers/net/ice/ice_generic_flow.h | 3 +
> 5 files changed, 288 insertions(+)
>
> diff --git a/doc/guides/rel_notes/release_21_11.rst
> b/doc/guides/rel_notes/release_21_11.rst
> index 9c13ceed1c..cc449a4340 100644
> --- a/doc/guides/rel_notes/release_21_11.rst
> +++ b/doc/guides/rel_notes/release_21_11.rst
> @@ -167,6 +167,7 @@ New Features
>
> * **Updated Intel ice driver.**
>
> + * Added protocol agnostic flow offloading support in Flow Director.
> * Added 1PPS out support by a devargs.
> * Added IPv4 and L4 (TCP/UDP/SCTP) checksum hash support in RSS flow.
> * Added DEV_RX_OFFLOAD_TIMESTAMP support.
> diff --git a/drivers/net/ice/ice_ethdev.h b/drivers/net/ice/ice_ethdev.h index
> 599e0028f7..441242ee89 100644
> --- a/drivers/net/ice/ice_ethdev.h
> +++ b/drivers/net/ice/ice_ethdev.h
> @@ -318,6 +318,11 @@ struct ice_fdir_filter_conf {
> uint64_t input_set_o; /* used for non-tunnel or tunnel outer fields */
> uint64_t input_set_i; /* only for tunnel inner fields */
> uint32_t mark_flag;
> +
> + struct ice_parser_profile *prof;
> + const u8 *pkt_buf;
> + bool parser_ena;
> + u8 pkt_len;
> };
>
> #define ICE_MAX_FDIR_FILTER_NUM (1024 * 16)
> @@ -487,6 +492,17 @@ struct ice_devargs {
> uint8_t pps_out_ena;
> };
>
> +/**
> + * Structure to store fdir fv entry.
> + */
> +struct ice_fdir_prof_info {
> + struct LIST_ENTRY_TYPE l_entry;
> +
> + struct ice_parser_profile prof;
> + u16 ptg;
> + u64 fdir_actived_cnt;
> +};
> +
> /**
> * Structure to store private data for each PF/VF instance.
> */
> @@ -509,6 +525,7 @@ struct ice_adapter {
> struct rte_timecounter rx_tstamp_tc;
> struct rte_timecounter tx_tstamp_tc;
> bool ptp_ena;
> + struct LIST_HEAD_TYPE fdir_prof_list;
> #ifdef RTE_ARCH_X86
> bool rx_use_avx2;
> bool rx_use_avx512;
> diff --git a/drivers/net/ice/ice_fdir_filter.c
> b/drivers/net/ice/ice_fdir_filter.c
> index bd627e3aa8..bcf105d1bd 100644
> --- a/drivers/net/ice/ice_fdir_filter.c
> +++ b/drivers/net/ice/ice_fdir_filter.c
> @@ -107,6 +107,7 @@
> ICE_INSET_NAT_T_ESP_SPI)
>
> static struct ice_pattern_match_item ice_fdir_pattern_list[] = {
> + {pattern_raw, ICE_INSET_NONE,
> ICE_INSET_NONE, ICE_INSET_NONE},
> {pattern_ethertype, ICE_FDIR_INSET_ETH,
> ICE_INSET_NONE, ICE_INSET_NONE},
> {pattern_eth_ipv4, ICE_FDIR_INSET_ETH_IPV4,
> ICE_INSET_NONE, ICE_INSET_NONE},
> {pattern_eth_ipv4_udp,
> ICE_FDIR_INSET_ETH_IPV4_UDP,
> ICE_INSET_NONE, ICE_INSET_NONE},
> @@ -1158,6 +1159,8 @@ ice_fdir_init(struct ice_adapter *ad)
> if (ret)
> return ret;
>
> + INIT_LIST_HEAD(&ad->fdir_prof_list);
> +
> parser = &ice_fdir_parser;
>
> return ice_register_parser(parser, ad); @@ -1188,6 +1191,24 @@
> ice_fdir_is_tunnel_profile(enum ice_fdir_tunnel_type tunnel_type)
> return 0;
> }
>
> +static int
> +ice_fdir_add_del_raw(struct ice_pf *pf,
> + struct ice_fdir_filter_conf *filter,
> + bool add)
> +{
> + struct ice_hw *hw = ICE_PF_TO_HW(pf);
> +
> + unsigned char *pkt = (unsigned char *)pf->fdir.prg_pkt;
> + rte_memcpy(pkt, filter->pkt_buf, filter->pkt_len);
> +
> + struct ice_fltr_desc desc;
> + memset(&desc, 0, sizeof(desc));
> + filter->input.comp_report = ICE_FXD_FLTR_QW0_COMP_REPORT_SW;
> + ice_fdir_get_prgm_desc(hw, &filter->input, &desc, add);
> +
> + return ice_fdir_programming(pf, &desc); }
> +
> static int
> ice_fdir_add_del_filter(struct ice_pf *pf,
> struct ice_fdir_filter_conf *filter, @@ -1303,6
> +1324,100 @@
> ice_fdir_create_filter(struct ice_adapter *ad,
> struct ice_fdir_fltr_pattern key;
> bool is_tun;
> int ret;
> + int i;
> +
> + if (filter->parser_ena) {
> + struct ice_hw *hw = ICE_PF_TO_HW(pf);
> +
> + int id = ice_find_first_bit(filter->prof->ptypes, UINT16_MAX);
> + u16 ctrl_vsi = pf->fdir.fdir_vsi->idx;
> + u16 main_vsi = pf->main_vsi->idx;
> + bool fv_found = false;
> + u16 vsi_num;
> +
> + struct ice_fdir_prof_info *pi;
> + LIST_FOR_EACH_ENTRY(pi, &ad->fdir_prof_list,
> + ice_fdir_prof_info, l_entry) {
> + if (pi->ptg != hw->blk[ICE_BLK_FD].xlt1.t[id])
> + continue;
> + if (!pi->fdir_actived_cnt) {
> + vsi_num = ice_get_hw_vsi_num(hw, ctrl_vsi);
> + ret = ice_rem_prof_id_flow(hw, ICE_BLK_FD,
> + vsi_num, id);
It looks like you delay the "profile remove" until the next call to
ice_fdir_add_del_filter.
Why not just do it at the exact moment that fdir_actived_cnt reaches 0?
> + if (ret)
> + return -rte_errno;
> +
> + vsi_num = ice_get_hw_vsi_num(hw, main_vsi);
> + ret = ice_rem_prof_id_flow(hw, ICE_BLK_FD,
> + vsi_num, id);
> + if (ret)
> + return -rte_errno;
> +
> + LIST_DEL(&pi->l_entry);
> + continue;
> + }
> + for (i = 0; i < ICE_MAX_FV_WORDS; i++)
> + if (pi->prof.fv[i].proto_id !=
> + filter->prof->fv[i].proto_id ||
> + pi->prof.fv[i].offset !=
> + filter->prof->fv[i].offset)
> + break;
> + if (i == ICE_MAX_FV_WORDS) {
> + fv_found = true;
> + pi->fdir_actived_cnt++;
> + break;
> + }
> + }
> +
> + if (!fv_found) {
> + ret = ice_flow_set_hw_prof(hw, main_vsi, ctrl_vsi,
> + filter->prof, ICE_BLK_FD);
> + if (ret)
> + return -rte_errno;
> + }
> +
> + ret = ice_fdir_add_del_raw(pf, filter, true);
> + if (ret)
> + return -rte_errno;
> +
> + if (!fv_found) {
> + pi = (struct ice_fdir_prof_info *)
> + ice_malloc(hw, sizeof(*pi));
> + if (!pi)
> + return ICE_ERR_NO_MEMORY;
> +
> + memset(&pi->prof, 0, sizeof(pi->prof));
> +
> + for (i = 0; i < filter->prof->fv_num; i++) {
> + pi->prof.fv[i].proto_id =
> + filter->prof->fv[i].proto_id;
> + pi->prof.fv[i].offset =
> + filter->prof->fv[i].offset;
> + pi->prof.fv[i].spec = filter->prof->fv[i].spec;
> + pi->prof.fv[i].msk = filter->prof->fv[i].msk;
> + }
> + pi->ptg = hw->blk[ICE_BLK_FD].xlt1.t[id];
> + pi->fdir_actived_cnt = 1;
> +
> + LIST_ADD(&pi->l_entry, &ad->fdir_prof_list);
> + }
> +
> + if (filter->mark_flag == 1)
> + ice_fdir_rx_parsing_enable(ad, 1);
> +
> + entry = rte_zmalloc("fdir_entry", sizeof(*entry), 0);
> + if (!entry)
> + return -rte_errno;
> +
> + rte_memcpy(entry, filter, sizeof(*filter));
> +
> + filter->prof = NULL;
> + filter->pkt_buf = NULL;
> +
> + flow->rule = entry;
> +
> + return 0;
> + }
>
> ice_fdir_extract_fltr_key(&key, filter);
> node = ice_fdir_entry_lookup(fdir_info, &key); @@ -1397,6 +1512,44
> @@ ice_fdir_destroy_filter(struct ice_adapter *ad,
>
> filter = (struct ice_fdir_filter_conf *)flow->rule;
>
> + if (filter->parser_ena) {
> + struct ice_hw *hw = ICE_PF_TO_HW(pf);
> +
> + ret = ice_fdir_add_del_raw(pf, filter, false);
> + if (ret)
> + return -rte_errno;
> +
> + int id = ice_find_first_bit(filter->prof->ptypes, UINT16_MAX);
> + int i;
> + struct ice_fdir_prof_info *pi;
> + LIST_FOR_EACH_ENTRY(pi, &ad->fdir_prof_list,
> + ice_fdir_prof_info, l_entry) {
> + if (pi->ptg != hw->blk[ICE_BLK_FD].xlt1.t[id])
> + continue;
> + for (i = 0; i < ICE_MAX_FV_WORDS; i++)
> + if (pi->prof.fv[i].proto_id !=
> + filter->prof->fv[i].proto_id ||
> + pi->prof.fv[i].offset !=
> + filter->prof->fv[i].offset)
> + break;
> + if (i == ICE_MAX_FV_WORDS) {
> + pi->fdir_actived_cnt--;
Here you can remove the profile.
> + break;
> + }
> + }
Can all of the above be moved into ice_fdir_add_del_filter? This would make
the add/delete implementation symmetric.
> +
> + if (filter->mark_flag == 1)
> + ice_fdir_rx_parsing_enable(ad, 0);
> +
> + flow->rule = NULL;
> + filter->prof = NULL;
> + filter->pkt_buf = NULL;
> +
> + rte_free(filter);
> +
> + return 0;
> + }
> +
> is_tun = ice_fdir_is_tunnel_profile(filter->tunnel_type);
>
> if (filter->counter) {
> @@ -1675,6 +1828,7 @@ ice_fdir_parse_pattern(__rte_unused struct
> ice_adapter *ad,
> enum rte_flow_item_type l3 = RTE_FLOW_ITEM_TYPE_END;
> enum rte_flow_item_type l4 = RTE_FLOW_ITEM_TYPE_END;
> enum ice_fdir_tunnel_type tunnel_type =
> ICE_FDIR_TUNNEL_TYPE_NONE;
> + const struct rte_flow_item_raw *raw_spec, *raw_mask;
> const struct rte_flow_item_eth *eth_spec, *eth_mask;
> const struct rte_flow_item_ipv4 *ipv4_spec, *ipv4_last, *ipv4_mask;
> const struct rte_flow_item_ipv6 *ipv6_spec, *ipv6_mask; @@ -1702,6
> +1856,9 @@ ice_fdir_parse_pattern(__rte_unused struct ice_adapter *ad,
> struct ice_fdir_extra *p_ext_data;
> struct ice_fdir_v4 *p_v4 = NULL;
> struct ice_fdir_v6 *p_v6 = NULL;
> + struct ice_parser_result rslt;
> + struct ice_parser *psr;
> + uint8_t item_num = 0;
>
> for (item = pattern; item->type != RTE_FLOW_ITEM_TYPE_END; item++) {
> if (item->type == RTE_FLOW_ITEM_TYPE_VXLAN) @@ -1713,6
> +1870,7 @@ ice_fdir_parse_pattern(__rte_unused struct ice_adapter *ad,
> item->type == RTE_FLOW_ITEM_TYPE_GTP_PSC) {
> is_outer = false;
> }
> + item_num++;
> }
>
> /* This loop parse flow pattern and distinguish Non-tunnel and tunnel
> @@ -1733,6 +1891,101 @@ ice_fdir_parse_pattern(__rte_unused struct
> ice_adapter *ad,
> &input_set_i : &input_set_o;
>
> switch (item_type) {
> + case RTE_FLOW_ITEM_TYPE_RAW:
> + raw_spec = item->spec;
> + raw_mask = item->mask;
> +
> + if (item_num != 1)
> + break;
> +
> + /* convert raw spec & mask from byte string to int */
> + unsigned char *tmp_spec =
> + (uint8_t *)(uintptr_t)raw_spec->pattern;
> + unsigned char *tmp_mask =
> + (uint8_t *)(uintptr_t)raw_mask->pattern;
> + uint16_t udp_port = 0;
> + uint16_t tmp_val = 0;
> + uint8_t pkt_len = 0;
> + uint8_t tmp = 0;
> + int i, j;
> +
> + pkt_len = strlen((char *)(uintptr_t)raw_spec->pattern);
> + if (strlen((char *)(uintptr_t)raw_mask->pattern) !=
> + pkt_len)
> + return -rte_errno;
> +
> + for (i = 0, j = 0; i < pkt_len; i += 2, j++) {
> + tmp = tmp_spec[i];
> + if (tmp >= 'a' && tmp <= 'f')
> + tmp_val = tmp - 'a' + 10;
> + if (tmp >= 'A' && tmp <= 'F')
> + tmp_val = tmp - 'A' + 10;
> + if (tmp >= '0' && tmp <= '9')
> + tmp_val = tmp - '0';
> +
> + tmp_val *= 16;
> + tmp = tmp_spec[i + 1];
> + if (tmp >= 'a' && tmp <= 'f')
> + tmp_spec[j] = tmp_val + tmp - 'a' + 10;
> + if (tmp >= 'A' && tmp <= 'F')
> + tmp_spec[j] = tmp_val + tmp - 'A' + 10;
> + if (tmp >= '0' && tmp <= '9')
> + tmp_spec[j] = tmp_val + tmp - '0';
> +
> + tmp = tmp_mask[i];
> + if (tmp >= 'a' && tmp <= 'f')
> + tmp_val = tmp - 'a' + 10;
> + if (tmp >= 'A' && tmp <= 'F')
> + tmp_val = tmp - 'A' + 10;
> + if (tmp >= '0' && tmp <= '9')
> + tmp_val = tmp - '0';
> +
> + tmp_val *= 16;
> + tmp = tmp_mask[i + 1];
> + if (tmp >= 'a' && tmp <= 'f')
> + tmp_mask[j] = tmp_val + tmp - 'a' + 10;
> + if (tmp >= 'A' && tmp <= 'F')
> + tmp_mask[j] = tmp_val + tmp - 'A' + 10;
> + if (tmp >= '0' && tmp <= '9')
> + tmp_mask[j] = tmp_val + tmp - '0';
> + }
> +
> + pkt_len /= 2;
> +
> + if (ice_parser_create(&ad->hw, &psr))
> + return -rte_errno;
> + if (ice_get_open_tunnel_port(&ad->hw, TNL_VXLAN,
> + &udp_port))
> + ice_parser_vxlan_tunnel_set(psr, udp_port,
> + true);
> + if (ice_parser_run(psr, tmp_spec, pkt_len, &rslt))
> + return -rte_errno;
> + ice_parser_destroy(psr);
> +
> + if (!tmp_mask)
> + return -rte_errno;
> +
> + filter->prof = (struct ice_parser_profile *)
> + ice_malloc(&ad->hw, sizeof(*filter->prof));
> + if (!filter->prof)
> + return -ENOMEM;
> +
> + if (ice_parser_profile_init(&rslt, tmp_spec, tmp_mask,
> + pkt_len, ICE_BLK_FD, true, filter->prof))
> + return -rte_errno;
> +
> + u8 *pkt_buf = (u8 *)ice_malloc(&ad->hw, pkt_len + 1);
> + if (!pkt_buf)
> + return -ENOMEM;
> + rte_memcpy(pkt_buf, tmp_spec, pkt_len);
> + filter->pkt_buf = pkt_buf;
> +
> + filter->pkt_len = pkt_len;
> +
> + filter->parser_ena = true;
> +
> + break;
> +
> case RTE_FLOW_ITEM_TYPE_ETH:
> flow_type = ICE_FLTR_PTYPE_NON_IP_L2;
> eth_spec = item->spec;
> @@ -2198,6 +2451,7 @@ ice_fdir_parse(struct ice_adapter *ad,
> struct ice_fdir_filter_conf *filter = &pf->fdir.conf;
> struct ice_pattern_match_item *item = NULL;
> uint64_t input_set;
> + bool raw = false;
> int ret;
>
> memset(filter, 0, sizeof(*filter));
> @@ -2213,7 +2467,13 @@ ice_fdir_parse(struct ice_adapter *ad,
> ret = ice_fdir_parse_pattern(ad, pattern, error, filter);
> if (ret)
> goto error;
> +
> + if (item->pattern_list[0] == RTE_FLOW_ITEM_TYPE_RAW)
> + raw = true;
> +
> input_set = filter->input_set_o | filter->input_set_i;
> + input_set = raw ? ~input_set : input_set;
> +
> if (!input_set || filter->input_set_o &
> ~(item->input_set_mask_o | ICE_INSET_ETHERTYPE) ||
> filter->input_set_i & ~item->input_set_mask_i) { diff --git
> a/drivers/net/ice/ice_generic_flow.c b/drivers/net/ice/ice_generic_flow.c
> index 02f854666a..d3391c86c0 100644
> --- a/drivers/net/ice/ice_generic_flow.c
> +++ b/drivers/net/ice/ice_generic_flow.c
> @@ -65,6 +65,12 @@ enum rte_flow_item_type pattern_empty[] = {
> RTE_FLOW_ITEM_TYPE_END,
> };
>
> +/* raw */
> +enum rte_flow_item_type pattern_raw[] = {
> + RTE_FLOW_ITEM_TYPE_RAW,
> + RTE_FLOW_ITEM_TYPE_END,
> +};
> +
> /* L2 */
> enum rte_flow_item_type pattern_ethertype[] = {
> RTE_FLOW_ITEM_TYPE_ETH,
> @@ -2081,6 +2087,7 @@ struct ice_ptype_match { };
>
> static struct ice_ptype_match ice_ptype_map[] = {
> + {pattern_raw, ICE_PTYPE_IPV4_PAY},
> {pattern_eth_ipv4, ICE_PTYPE_IPV4_PAY},
> {pattern_eth_ipv4_udp, ICE_PTYPE_IPV4_UDP_PAY},
> {pattern_eth_ipv4_tcp, ICE_PTYPE_IPV4_TCP_PAY},
> diff --git a/drivers/net/ice/ice_generic_flow.h
> b/drivers/net/ice/ice_generic_flow.h
> index 8845a3e156..1b030c0466 100644
> --- a/drivers/net/ice/ice_generic_flow.h
> +++ b/drivers/net/ice/ice_generic_flow.h
> @@ -124,6 +124,9 @@
> /* empty pattern */
> extern enum rte_flow_item_type pattern_empty[];
>
> +/* raw pattern */
> +extern enum rte_flow_item_type pattern_raw[];
> +
> /* L2 */
> extern enum rte_flow_item_type pattern_ethertype[]; extern enum
> rte_flow_item_type pattern_ethertype_vlan[];
> --
> 2.25.1