DPDK patches and discussions
 help / color / mirror / Atom feed
From: Nithin Dabilpuram <nithind1988@gmail.com>
To: pbhagavatula@marvell.com
Cc: jerinj@marvell.com, ndabilpuram@marvell.com,
	 Kiran Kumar K <kirankumark@marvell.com>,
	Zhirun Yan <zhirun.yan@intel.com>,
	dev@dpdk.org
Subject: Re: [PATCH v4] node: add IPv4 reassembly node
Date: Fri, 8 Sep 2023 11:07:36 +0530	[thread overview]
Message-ID: <CAMuDWKQ2KF0mOeGidfqf-6+5vmqWFtmWS8Xa8NFLht+LW+HkZw@mail.gmail.com> (raw)
In-Reply-To: <20230727143656.10260-1-pbhagavatula@marvell.com>

Acked-by: Nithin Dabilpuram <ndabilpuram@marvell.com>


On Thu, Jul 27, 2023 at 8:07 PM <pbhagavatula@marvell.com> wrote:
>
> From: Pavan Nikhilesh <pbhagavatula@marvell.com>
>
> Add IPv4 reassembly node.
>
> Signed-off-by: Pavan Nikhilesh <pbhagavatula@marvell.com>
> ---
>  v4 Changes:
>  - Add packet drop node as the 0th edge.
>  - Free deathrow packets to packet drop node.
>  v3 Changes:
>  - Actually include the changes that fix compilation.
>  v2 Changes:
>  - Fix compilation.
>
>  doc/guides/prog_guide/graph_lib.rst |   8 ++
>  lib/node/ethdev_rx.c                |   1 +
>  lib/node/ethdev_rx_priv.h           |   1 +
>  lib/node/ip4_reassembly.c           | 186 ++++++++++++++++++++++++++++
>  lib/node/ip4_reassembly_priv.h      |  28 +++++
>  lib/node/meson.build                |   3 +-
>  lib/node/rte_node_ip4_api.h         |  37 ++++++
>  lib/node/version.map                |   1 +
>  8 files changed, 264 insertions(+), 1 deletion(-)
>  create mode 100644 lib/node/ip4_reassembly.c
>  create mode 100644 lib/node/ip4_reassembly_priv.h
>
> diff --git a/doc/guides/prog_guide/graph_lib.rst b/doc/guides/prog_guide/graph_lib.rst
> index e7b6e12004..10d146e2f6 100644
> --- a/doc/guides/prog_guide/graph_lib.rst
> +++ b/doc/guides/prog_guide/graph_lib.rst
> @@ -453,6 +453,14 @@ to determine the L2 header to be written to the packet before sending
>  the packet out to a particular ethdev_tx node.
>  ``rte_node_ip4_rewrite_add()`` is control path API to add next-hop info.
>
> +ip4_reassembly
> +~~~~~~~~~~~~~~
> +This node is an intermediate node that reassembles ipv4 fragmented packets,
> +non-fragmented packets pass through the node un-effected. The node rewrites
> +it's stream and moves it to the next node.
> +The fragment table and death row table should be setup via the
> +``rte_node_ip4_reassembly_configure`` API.
> +
>  ip6_lookup
>  ~~~~~~~~~~
>  This node is an intermediate node that does LPM lookup for the received
> diff --git a/lib/node/ethdev_rx.c b/lib/node/ethdev_rx.c
> index d131034991..3e8fac1df4 100644
> --- a/lib/node/ethdev_rx.c
> +++ b/lib/node/ethdev_rx.c
> @@ -215,6 +215,7 @@ static struct rte_node_register ethdev_rx_node_base = {
>         .next_nodes = {
>                 [ETHDEV_RX_NEXT_PKT_CLS] = "pkt_cls",
>                 [ETHDEV_RX_NEXT_IP4_LOOKUP] = "ip4_lookup",
> +               [ETHDEV_RX_NEXT_IP4_REASSEMBLY] = "ip4_reassembly",
>         },
>  };
>
> diff --git a/lib/node/ethdev_rx_priv.h b/lib/node/ethdev_rx_priv.h
> index 7f24cf962e..574a76c2a6 100644
> --- a/lib/node/ethdev_rx_priv.h
> +++ b/lib/node/ethdev_rx_priv.h
> @@ -39,6 +39,7 @@ struct ethdev_rx_node_elem {
>  enum ethdev_rx_next_nodes {
>         ETHDEV_RX_NEXT_IP4_LOOKUP,
>         ETHDEV_RX_NEXT_PKT_CLS,
> +       ETHDEV_RX_NEXT_IP4_REASSEMBLY,
>         ETHDEV_RX_NEXT_MAX,
>  };
>
> diff --git a/lib/node/ip4_reassembly.c b/lib/node/ip4_reassembly.c
> new file mode 100644
> index 0000000000..04823cc596
> --- /dev/null
> +++ b/lib/node/ip4_reassembly.c
> @@ -0,0 +1,186 @@
> +/* SPDX-License-Identifier: BSD-3-Clause
> + * Copyright(C) 2023 Marvell.
> + */
> +
> +#include <arpa/inet.h>
> +#include <stdlib.h>
> +#include <sys/socket.h>
> +
> +#include <rte_cycles.h>
> +#include <rte_debug.h>
> +#include <rte_ethdev.h>
> +#include <rte_ether.h>
> +#include <rte_graph.h>
> +#include <rte_graph_worker.h>
> +#include <rte_ip.h>
> +#include <rte_ip_frag.h>
> +#include <rte_mbuf.h>
> +#include <rte_tcp.h>
> +#include <rte_udp.h>
> +
> +#include "rte_node_ip4_api.h"
> +
> +#include "ip4_reassembly_priv.h"
> +#include "node_private.h"
> +
> +struct ip4_reassembly_elem {
> +       struct ip4_reassembly_elem *next;
> +       struct ip4_reassembly_ctx ctx;
> +       rte_node_t node_id;
> +};
> +
> +/* IP4 reassembly global data struct */
> +struct ip4_reassembly_node_main {
> +       struct ip4_reassembly_elem *head;
> +};
> +
> +typedef struct ip4_reassembly_ctx ip4_reassembly_ctx_t;
> +typedef struct ip4_reassembly_elem ip4_reassembly_elem_t;
> +
> +static struct ip4_reassembly_node_main ip4_reassembly_main;
> +
> +static uint16_t
> +ip4_reassembly_node_process(struct rte_graph *graph, struct rte_node *node, void **objs,
> +                           uint16_t nb_objs)
> +{
> +#define PREFETCH_OFFSET 4
> +       struct rte_mbuf *mbuf, *mbuf_out;
> +       struct rte_ip_frag_death_row *dr;
> +       struct ip4_reassembly_ctx *ctx;
> +       struct rte_ipv4_hdr *ipv4_hdr;
> +       struct rte_ip_frag_tbl *tbl;
> +       void **to_next, **to_free;
> +       uint16_t idx = 0;
> +       int i;
> +
> +       ctx = (struct ip4_reassembly_ctx *)node->ctx;
> +
> +       /* Get core specific reassembly tbl */
> +       tbl = ctx->tbl;
> +       dr = ctx->dr;
> +
> +       for (i = 0; i < PREFETCH_OFFSET && i < nb_objs; i++) {
> +               rte_prefetch0(rte_pktmbuf_mtod_offset((struct rte_mbuf *)objs[i], void *,
> +                                                     sizeof(struct rte_ether_hdr)));
> +       }
> +
> +       to_next = node->objs;
> +       for (i = 0; i < nb_objs - PREFETCH_OFFSET; i++) {
> +#if RTE_GRAPH_BURST_SIZE > 64
> +               /* Prefetch next-next mbufs */
> +               if (likely(i + 8 < nb_objs))
> +                       rte_prefetch0(objs[i + 8]);
> +#endif
> +               rte_prefetch0(rte_pktmbuf_mtod_offset((struct rte_mbuf *)objs[i + PREFETCH_OFFSET],
> +                                                     void *, sizeof(struct rte_ether_hdr)));
> +               mbuf = (struct rte_mbuf *)objs[i];
> +
> +               ipv4_hdr = rte_pktmbuf_mtod_offset(mbuf, struct rte_ipv4_hdr *,
> +                                                  sizeof(struct rte_ether_hdr));
> +               if (rte_ipv4_frag_pkt_is_fragmented(ipv4_hdr)) {
> +                       /* prepare mbuf: setup l2_len/l3_len. */
> +                       mbuf->l2_len = sizeof(struct rte_ether_hdr);
> +                       mbuf->l3_len = sizeof(struct rte_ipv4_hdr);
> +
> +                       mbuf_out = rte_ipv4_frag_reassemble_packet(tbl, dr, mbuf, rte_rdtsc(),
> +                                                                  ipv4_hdr);
> +               } else {
> +                       mbuf_out = mbuf;
> +               }
> +
> +               if (mbuf_out)
> +                       to_next[idx++] = (void *)mbuf_out;
> +       }
> +
> +       for (; i < nb_objs; i++) {
> +               mbuf = (struct rte_mbuf *)objs[i];
> +
> +               ipv4_hdr = rte_pktmbuf_mtod_offset(mbuf, struct rte_ipv4_hdr *,
> +                                                  sizeof(struct rte_ether_hdr));
> +               if (rte_ipv4_frag_pkt_is_fragmented(ipv4_hdr)) {
> +                       /* prepare mbuf: setup l2_len/l3_len. */
> +                       mbuf->l2_len = sizeof(struct rte_ether_hdr);
> +                       mbuf->l3_len = sizeof(struct rte_ipv4_hdr);
> +
> +                       mbuf_out = rte_ipv4_frag_reassemble_packet(tbl, dr, mbuf, rte_rdtsc(),
> +                                                                  ipv4_hdr);
> +               } else {
> +                       mbuf_out = mbuf;
> +               }
> +
> +               if (mbuf_out)
> +                       to_next[idx++] = (void *)mbuf_out;
> +       }
> +       node->idx = idx;
> +       rte_node_next_stream_move(graph, node, 1);
> +       if (dr->cnt) {
> +               to_free = rte_node_next_stream_get(graph, node,
> +                                                  RTE_NODE_IP4_REASSEMBLY_NEXT_PKT_DROP, dr->cnt);
> +               rte_memcpy(to_free, dr->row, dr->cnt * sizeof(to_free[0]));
> +               rte_node_next_stream_put(graph, node, RTE_NODE_IP4_REASSEMBLY_NEXT_PKT_DROP,
> +                                        dr->cnt);
> +               idx += dr->cnt;
> +               dr->cnt = 0;
> +       }
> +
> +       return idx;
> +}
> +
> +int
> +rte_node_ip4_reassembly_configure(struct rte_node_ip4_reassembly_cfg *cfg, uint16_t cnt)
> +{
> +       ip4_reassembly_elem_t *elem;
> +       int i;
> +
> +       for (i = 0; i < cnt; i++) {
> +               elem = malloc(sizeof(ip4_reassembly_elem_t));
> +               if (elem == NULL)
> +                       return -ENOMEM;
> +               elem->ctx.dr = cfg[i].dr;
> +               elem->ctx.tbl = cfg[i].tbl;
> +               elem->node_id = cfg[i].node_id;
> +               elem->next = ip4_reassembly_main.head;
> +               ip4_reassembly_main.head = elem;
> +       }
> +
> +       return 0;
> +}
> +
> +static int
> +ip4_reassembly_node_init(const struct rte_graph *graph, struct rte_node *node)
> +{
> +       ip4_reassembly_ctx_t *ctx = (ip4_reassembly_ctx_t *)node->ctx;
> +       ip4_reassembly_elem_t *elem = ip4_reassembly_main.head;
> +
> +       RTE_SET_USED(graph);
> +       while (elem) {
> +               if (elem->node_id == node->id) {
> +                       /* Update node specific context */
> +                       memcpy(ctx, &elem->ctx, sizeof(ip4_reassembly_ctx_t));
> +                       break;
> +               }
> +               elem = elem->next;
> +       }
> +
> +       return 0;
> +}
> +
> +static struct rte_node_register ip4_reassembly_node = {
> +       .process = ip4_reassembly_node_process,
> +       .name = "ip4_reassembly",
> +
> +       .init = ip4_reassembly_node_init,
> +
> +       .nb_edges = RTE_NODE_IP4_REASSEMBLY_NEXT_PKT_DROP + 1,
> +       .next_nodes = {
> +               [RTE_NODE_IP4_REASSEMBLY_NEXT_PKT_DROP] = "pkt_drop",
> +       },
> +};
> +
> +struct rte_node_register *
> +ip4_reassembly_node_get(void)
> +{
> +       return &ip4_reassembly_node;
> +}
> +
> +RTE_NODE_REGISTER(ip4_reassembly_node);
> diff --git a/lib/node/ip4_reassembly_priv.h b/lib/node/ip4_reassembly_priv.h
> new file mode 100644
> index 0000000000..1fa70274ba
> --- /dev/null
> +++ b/lib/node/ip4_reassembly_priv.h
> @@ -0,0 +1,28 @@
> +/* SPDX-License-Identifier: BSD-3-Clause
> + * Copyright(C) 2023 Marvell International Ltd.
> + */
> +
> +#ifndef __INCLUDE_IP4_REASSEMBLY_PRIV_H__
> +#define __INCLUDE_IP4_REASSEMBLY_PRIV_H__
> +
> +/**
> + * @internal
> + *
> + * Ip4_reassembly context structure.
> + */
> +struct ip4_reassembly_ctx {
> +       struct rte_ip_frag_tbl *tbl;
> +       struct rte_ip_frag_death_row *dr;
> +};
> +
> +/**
> + * @internal
> + *
> + * Get the IP4 reassembly node
> + *
> + * @return
> + *   Pointer to the IP4 reassembly node.
> + */
> +struct rte_node_register *ip4_reassembly_node_get(void);
> +
> +#endif /* __INCLUDE_IP4_REASSEMBLY_PRIV_H__ */
> diff --git a/lib/node/meson.build b/lib/node/meson.build
> index 2fa7c1c8f3..72474c0856 100644
> --- a/lib/node/meson.build
> +++ b/lib/node/meson.build
> @@ -13,6 +13,7 @@ sources = files(
>          'ethdev_tx.c',
>          'ip4_lookup.c',
>          'ip4_rewrite.c',
> +       'ip4_reassembly.c',
>          'ip6_lookup.c',
>          'ip6_rewrite.c',
>          'kernel_rx.c',
> @@ -30,4 +31,4 @@ headers = files(
>
>  # Strict-aliasing rules are violated by uint8_t[] to context size casts.
>  cflags += '-fno-strict-aliasing'
> -deps += ['graph', 'mbuf', 'lpm', 'ethdev', 'mempool', 'cryptodev']
> +deps += ['graph', 'mbuf', 'lpm', 'ethdev', 'mempool', 'cryptodev', 'ip_frag']
> diff --git a/lib/node/rte_node_ip4_api.h b/lib/node/rte_node_ip4_api.h
> index 3397da0ae8..8d8e4c41b2 100644
> --- a/lib/node/rte_node_ip4_api.h
> +++ b/lib/node/rte_node_ip4_api.h
> @@ -22,6 +22,8 @@ extern "C" {
>  #include <rte_common.h>
>  #include <rte_compat.h>
>
> +#include <rte_graph.h>
> +
>  /**
>   * IP4 lookup next nodes.
>   */
> @@ -34,6 +36,27 @@ enum rte_node_ip4_lookup_next {
>         /**< Number of next nodes of lookup node. */
>  };
>
> +/**
> + * IP4 reassembly next nodes.
> + */
> +enum rte_node_ip4_reassembly_next {
> +       RTE_NODE_IP4_REASSEMBLY_NEXT_PKT_DROP,
> +       /**< Packet drop node. */
> +};
> +
> +/**
> + * Reassembly configure structure.
> + * @see rte_node_ip4_reassembly_configure
> + */
> +struct rte_node_ip4_reassembly_cfg {
> +       struct rte_ip_frag_tbl *tbl;
> +       /**< Reassembly fragmentation table. */
> +       struct rte_ip_frag_death_row *dr;
> +       /**< Reassembly deathrow table. */
> +       rte_node_t node_id;
> +       /**< Node identifier to configure. */
> +};
> +
>  /**
>   * Add ipv4 route to lookup table.
>   *
> @@ -72,6 +95,20 @@ __rte_experimental
>  int rte_node_ip4_rewrite_add(uint16_t next_hop, uint8_t *rewrite_data,
>                              uint8_t rewrite_len, uint16_t dst_port);
>
> +/**
> + * Add reassembly node configuration data.
> + *
> + * @param cfg
> + *   Pointer to the configuration structure.
> + * @param cnt
> + *   Number of configuration structures passed.
> + *
> + * @return
> + *   0 on success, negative otherwise.
> + */
> +__rte_experimental
> +int rte_node_ip4_reassembly_configure(struct rte_node_ip4_reassembly_cfg *cfg, uint16_t cnt);
> +
>  #ifdef __cplusplus
>  }
>  #endif
> diff --git a/lib/node/version.map b/lib/node/version.map
> index 40df308bfe..c10e2e78ea 100644
> --- a/lib/node/version.map
> +++ b/lib/node/version.map
> @@ -4,6 +4,7 @@ EXPERIMENTAL {
>         rte_node_eth_config;
>         rte_node_ip4_route_add;
>         rte_node_ip4_rewrite_add;
> +       rte_node_ip4_reassembly_configure;
>         rte_node_ip6_rewrite_add;
>         rte_node_ip6_route_add;
>         rte_node_logtype;
> --
> 2.25.1
>

  reply	other threads:[~2023-09-08  5:37 UTC|newest]

Thread overview: 7+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2023-06-01 19:42 [PATCH] " pbhagavatula
2023-06-02 16:48 ` [PATCH v2] " pbhagavatula
2023-06-05 11:26   ` [PATCH v3] node: add ipv4 " pbhagavatula
2023-06-06  6:14     ` Nithin Dabilpuram
2023-07-27 14:36     ` [PATCH v4] node: add IPv4 " pbhagavatula
2023-09-08  5:37       ` Nithin Dabilpuram [this message]
2023-10-17 11:16         ` Thomas Monjalon

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=CAMuDWKQ2KF0mOeGidfqf-6+5vmqWFtmWS8Xa8NFLht+LW+HkZw@mail.gmail.com \
    --to=nithind1988@gmail.com \
    --cc=dev@dpdk.org \
    --cc=jerinj@marvell.com \
    --cc=kirankumark@marvell.com \
    --cc=ndabilpuram@marvell.com \
    --cc=pbhagavatula@marvell.com \
    --cc=zhirun.yan@intel.com \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).