[dpdk-dev] [PATCH v2 18/20] net/mlx5: add flow GRE item
Yongseok Koh
yskoh at mellanox.com
Sat Jul 7 01:46:11 CEST 2018
On Wed, Jun 27, 2018 at 05:07:50PM +0200, Nelio Laranjeiro wrote:
> Signed-off-by: Nelio Laranjeiro <nelio.laranjeiro at 6wind.com>
> ---
> drivers/net/mlx5/mlx5_flow.c | 191 ++++++++++++++++++++++++++++++++++-
> 1 file changed, 186 insertions(+), 5 deletions(-)
>
> diff --git a/drivers/net/mlx5/mlx5_flow.c b/drivers/net/mlx5/mlx5_flow.c
> index 47c55b426..636aaabe8 100644
> --- a/drivers/net/mlx5/mlx5_flow.c
> +++ b/drivers/net/mlx5/mlx5_flow.c
> @@ -54,6 +54,7 @@ extern const struct eth_dev_ops mlx5_dev_ops_isolate;
> /* Pattern tunnel Layer bits. */
> #define MLX5_FLOW_LAYER_VXLAN (1u << 12)
> #define MLX5_FLOW_LAYER_VXLAN_GPE (1u << 13)
> +#define MLX5_FLOW_LAYER_GRE (1u << 14)
>
> /* Outer Masks. */
> #define MLX5_FLOW_LAYER_OUTER_L3 \
> @@ -66,7 +67,8 @@ extern const struct eth_dev_ops mlx5_dev_ops_isolate;
>
> /* Tunnel masks. */
> #define MLX5_FLOW_LAYER_TUNNEL \
> - (MLX5_FLOW_LAYER_VXLAN | MLX5_FLOW_LAYER_VXLAN_GPE)
> + (MLX5_FLOW_LAYER_VXLAN | MLX5_FLOW_LAYER_VXLAN_GPE | \
> + MLX5_FLOW_LAYER_GRE)
>
> /* Inner Masks. */
> #define MLX5_FLOW_LAYER_INNER_L3 \
> @@ -215,6 +217,9 @@ static const struct rte_flow_expand_node mlx5_support_expansion[] = {
> },
> };
>
> +/* Tunnel protocol values. */
> +#define MLX5_PROTOCOL_GRE 47
How about using IPPROTO_GRE instead?
> +
> /** Handles information leading to a drop fate. */
> struct mlx5_flow_verbs {
> LIST_ENTRY(mlx5_flow_verbs) next;
> @@ -1005,12 +1010,23 @@ mlx5_flow_item_ipv6(const struct rte_flow_item *item, struct rte_flow *flow,
> item,
> "L3 cannot follow an L4"
> " layer");
> + /*
> + * IPv6 is not recognised by the NIC inside a GRE tunnel.
> + * Such support has to be disabled as the rule will be
> + * accepted. Tested with Mellanox OFED 4.3-3.0.2.1
> + */
This comment doesn't look appropriate. Do you think it is a bug of OFED/FW,
which can be fixed? Or, is it a HW erratum? Let's talk offline.
> + if (tunnel && layers & MLX5_FLOW_LAYER_GRE)
> + return rte_flow_error_set(error, ENOTSUP,
> + RTE_FLOW_ERROR_TYPE_ITEM,
> + item,
> + "IPv6 inside a GRE tunnel is"
> + " not recognised.");
> if (!mask)
> mask = &rte_flow_item_ipv6_mask;
> - ret = mlx5_flow_item_validate(item, (const uint8_t *)mask,
> - (const uint8_t *)&nic_mask,
> - sizeof(struct rte_flow_item_ipv6),
> - error);
> + ret = mlx5_flow_item_validate
> + (item, (const uint8_t *)mask,
> + (const uint8_t *)&nic_mask,
> + sizeof(struct rte_flow_item_ipv6), error);
> if (ret < 0)
> return ret;
> }
> @@ -1411,6 +1427,168 @@ mlx5_flow_item_vxlan_gpe(struct rte_eth_dev *dev,
> return size;
> }
>
> +/**
> + * Update the protocol in Verbs IPv4 spec.
> + *
> + * @param attr[in, out]
> + * Pointer to Verbs attributes structure.
> + * @param protocol[in]
> + * Protocol value to set if none is present in the specification.
> + */
> +static void
> +mlx5_flow_item_gre_ipv4_protocol_update(struct ibv_flow_attr *attr,
> + uint8_t protocol)
> +{
> + unsigned int i;
> + const enum ibv_flow_spec_type search = IBV_FLOW_SPEC_IPV4_EXT;
> + struct ibv_spec_header *hdr = (struct ibv_spec_header *)
> + ((uint8_t *)attr + sizeof(struct ibv_flow_attr));
> +
> + if (!attr)
> + return;
> + for (i = 0; i != attr->num_of_specs; ++i) {
> + if (hdr->type == search) {
> + struct ibv_flow_spec_ipv4_ext *ip =
> + (struct ibv_flow_spec_ipv4_ext *)hdr;
> +
> + if (!ip->val.proto) {
> + ip->val.proto = protocol;
> + ip->mask.proto = 0xff;
> + }
> + break;
> + }
> + hdr = (struct ibv_spec_header *)((uint8_t *)hdr + hdr->size);
> + }
> +}
> +
> +/**
> + * Update the protocol in Verbs IPv6 spec.
> + *
> + * @param attr[in, out]
> + * Pointer to Verbs attributes structure.
> + * @param protocol[in]
> + * Protocol value to set if none is present in the specification.
> + */
> +static void
> +mlx5_flow_item_gre_ipv6_protocol_update(struct ibv_flow_attr *attr,
> + uint8_t protocol)
How about consolidating the two funcs -
mlx5_flow_item_gre_ipv6_protocol_update() and
mlx5_flow_item_gre_ipv4_protocol_update()? There are many things in common.
> +{
> + unsigned int i;
> + const enum ibv_flow_spec_type search = IBV_FLOW_SPEC_IPV6;
> + struct ibv_spec_header *hdr = (struct ibv_spec_header *)
> + ((uint8_t *)attr + sizeof(struct ibv_flow_attr));
> +
> + if (!attr)
> + return;
> + for (i = 0; i != attr->num_of_specs; ++i) {
> + if (hdr->type == search) {
> + struct ibv_flow_spec_ipv6 *ip =
> + (struct ibv_flow_spec_ipv6 *)hdr;
> +
> + if (!ip->val.next_hdr) {
What if protocol in IP header does have wrong value other than 47 (IPPROTO_GRE)?
Shouldn't we have a validation check for it in mlx5_flow_item_gre()?
> + ip->val.next_hdr = protocol;
> + ip->mask.next_hdr = 0xff;
> + }
> + break;
> + }
> + hdr = (struct ibv_spec_header *)((uint8_t *)hdr + hdr->size);
> + }
> +}
> +
> +/**
> + * Validate GRE layer and possibly create the Verbs specification.
> + *
> + * @param dev
> + * Pointer to Ethernet device.
> + * @param item[in]
> + * Item specification.
> + * @param flow[in, out]
> + * Pointer to flow structure.
> + * @param flow_size[in]
> + * Size in bytes of the available space for to store the flow information.
> + * @param error
> + * Pointer to error structure.
> + *
> + * @return
> + * size in bytes necessary for the conversion, a negative errno value
> + * otherwise and rte_errno is set.
> + */
> +static int
> +mlx5_flow_item_gre(const struct rte_flow_item *item,
> + struct rte_flow *flow, const size_t flow_size,
> + struct rte_flow_error *error)
> +{
> + struct mlx5_flow_verbs *verbs = flow->cur_verbs;
> + const struct rte_flow_item_gre *spec = item->spec;
> + const struct rte_flow_item_gre *mask = item->mask;
> + const uint32_t layers = mlx5_flow_layers(flow);
> +#ifdef HAVE_IBV_DEVICE_MPLS_SUPPORT
> + unsigned int size = sizeof(struct ibv_flow_spec_gre);
> + struct ibv_flow_spec_gre tunnel = {
> + .type = IBV_FLOW_SPEC_GRE,
> + .size = size,
> + };
> +#else
> + unsigned int size = sizeof(struct ibv_flow_spec_tunnel);
> + struct ibv_flow_spec_tunnel tunnel = {
> + .type = IBV_FLOW_SPEC_VXLAN_TUNNEL,
> + .size = size,
> + };
> +#endif
> + int ret;
> +
> + if (layers & MLX5_FLOW_LAYER_TUNNEL)
> + return rte_flow_error_set(error, ENOTSUP,
> + RTE_FLOW_ERROR_TYPE_ITEM,
> + item,
> + "a tunnel is already present");
> + if (!(layers & MLX5_FLOW_LAYER_OUTER_L3))
> + return rte_flow_error_set(error, ENOTSUP,
> + RTE_FLOW_ERROR_TYPE_ITEM,
> + item,
> + "L3 Layer is missing");
> + if (!mask)
> + mask = &rte_flow_item_gre_mask;
> + ret = mlx5_flow_item_validate
> + (item, (const uint8_t *)mask,
> + (const uint8_t *)&rte_flow_item_gre_mask,
> + sizeof(struct rte_flow_item_gre), error);
> + if (ret < 0)
> + return ret;
> +#ifdef HAVE_IBV_DEVICE_MPLS_SUPPORT
> + if (spec) {
> + tunnel.val.c_ks_res0_ver = spec->c_rsvd0_ver;
> + tunnel.val.protocol = spec->protocol;
> + tunnel.mask.c_ks_res0_ver = mask->c_rsvd0_ver;
> + tunnel.mask.protocol = mask->protocol;
> + /* Remove unwanted bits from values. */
> + tunnel.val.c_ks_res0_ver &= tunnel.mask.c_ks_res0_ver;
> + tunnel.val.protocol &= tunnel.mask.protocol;
> + tunnel.val.key &= tunnel.mask.key;
> + }
> +#else
> + if (spec && (spec->protocol & mask->protocol))
> + return rte_flow_error_set(error, ENOTSUP,
> + RTE_FLOW_ERROR_TYPE_ITEM,
> + item,
> + "without MPLS support the"
> + " specification cannot be used for"
> + " filtering");
> +#endif /* !HAVE_IBV_DEVICE_MPLS_SUPPORT */
> + if (size <= flow_size) {
> + if (layers & MLX5_FLOW_LAYER_OUTER_L3_IPV4)
> + mlx5_flow_item_gre_ipv4_protocol_update
> + (verbs->attr, MLX5_PROTOCOL_GRE);
> + else
> + mlx5_flow_item_gre_ipv6_protocol_update
> + (verbs->attr, MLX5_PROTOCOL_GRE);
> + mlx5_flow_spec_verbs_add(flow, &tunnel, size);
> + }
> + mlx5_flow_layers_update(flow, MLX5_FLOW_LAYER_GRE);
> + flow->ptype = RTE_PTYPE_TUNNEL_GRE;
> + return size;
> +}
> +
> /**
> * Validate items provided by the user.
> *
> @@ -1469,6 +1647,9 @@ mlx5_flow_items(struct rte_eth_dev *dev,
> ret = mlx5_flow_item_vxlan_gpe(dev, items, flow,
> remain, error);
> break;
> + case RTE_FLOW_ITEM_TYPE_GRE:
> + ret = mlx5_flow_item_gre(items, flow, remain, error);
> + break;
> default:
> return rte_flow_error_set(error, ENOTSUP,
> RTE_FLOW_ERROR_TYPE_ITEM,
> --
> 2.18.0
>
More information about the dev
mailing list