> -----Original Message-----
> From: Kavanagh, Mark B
> Sent: Monday, October 2, 2017 5:46 PM
> To: dev@dpdk.org
> Cc: Hu, Jiayu <jiayu...@intel.com>; Tan, Jianfeng <jianfeng....@intel.com>; 
> Ananyev, Konstantin <konstantin.anan...@intel.com>; Yigit,
> Ferruh <ferruh.yi...@intel.com>; tho...@monjalon.net; Kavanagh, Mark B 
> <mark.b.kavan...@intel.com>
> Subject: [PATCH v6 5/6] app/testpmd: enable TCP/IPv4, VxLAN and GRE GSO
> 
> From: Jiayu Hu <jiayu...@intel.com>
> 
> This patch adds GSO support to the csum forwarding engine. Oversized
> packets transmitted over a GSO-enabled port will undergo segmentation
> (with the exception of packet-types unsupported by the GSO library).
> GSO support is disabled by default.
> 
> GSO support may be toggled on a per-port basis, using the command:
> 
>         "set port <port_id> gso on|off"
> 
> The maximum packet length (including the packet header and payload) for
> GSO segments may be set with the command:
> 
>         "set gso segsz <length>"
> 
> Show GSO configuration for a given port with the command:
> 
>       "show port <port_id> gso"
> 
> Signed-off-by: Jiayu Hu <jiayu...@intel.com>
> Signed-off-by: Mark Kavanagh <mark.b.kavan...@intel.com>
> ---
>  app/test-pmd/cmdline.c                      | 178 
> ++++++++++++++++++++++++++++
>  app/test-pmd/config.c                       |  24 ++++
>  app/test-pmd/csumonly.c                     |  69 ++++++++++-
>  app/test-pmd/testpmd.c                      |  13 ++
>  app/test-pmd/testpmd.h                      |  10 ++
>  doc/guides/testpmd_app_ug/testpmd_funcs.rst |  46 +++++++
>  6 files changed, 335 insertions(+), 5 deletions(-)
> 
> diff --git a/app/test-pmd/cmdline.c b/app/test-pmd/cmdline.c
> index ccdf239..05b0ce8 100644
> --- a/app/test-pmd/cmdline.c
> +++ b/app/test-pmd/cmdline.c
> @@ -431,6 +431,17 @@ static void cmd_help_long_parsed(void *parsed_result,
>                       "    Set max flow number and max packet number per-flow"
>                       " for GRO.\n\n"
> 
> +                     "set port (port_id) gso (on|off)"
> +                     "    Enable or disable Generic Segmentation Offload in"
> +                     " csum forwarding engine.\n\n"
> +
> +                     "set gso segsz (length)\n"
> +                     "    Set max packet length for output GSO segments,"
> +                     " including packet header and payload.\n\n"

Probably a  good future improvement would be to allow user to specify gso_type 
too.

> +
> +                     "show port (port_id) gso\n"
> +                     "    Show GSO configuration.\n\n"
> +
>                       "set fwd (%s)\n"
>                       "    Set packet forwarding mode.\n\n"
> 
> @@ -3967,6 +3978,170 @@ struct cmd_gro_set_result {
>       },
>  };
> 
> +/* *** ENABLE/DISABLE GSO *** */
> +struct cmd_gso_enable_result {
> +     cmdline_fixed_string_t cmd_set;
> +     cmdline_fixed_string_t cmd_port;
> +     cmdline_fixed_string_t cmd_keyword;
> +     cmdline_fixed_string_t cmd_mode;
> +     uint8_t cmd_pid;
> +};
> +
> +static void
> +cmd_gso_enable_parsed(void *parsed_result,
> +             __attribute__((unused)) struct cmdline *cl,
> +             __attribute__((unused)) void *data)
> +{
> +     struct cmd_gso_enable_result *res;
> +
> +     res = parsed_result;
> +     if (!strcmp(res->cmd_keyword, "gso"))
> +             setup_gso(res->cmd_mode, res->cmd_pid);
> +}
> +
> +cmdline_parse_token_string_t cmd_gso_enable_set =
> +     TOKEN_STRING_INITIALIZER(struct cmd_gso_enable_result,
> +                     cmd_set, "set");
> +cmdline_parse_token_string_t cmd_gso_enable_port =
> +     TOKEN_STRING_INITIALIZER(struct cmd_gso_enable_result,
> +                     cmd_port, "port");
> +cmdline_parse_token_string_t cmd_gso_enable_keyword =
> +     TOKEN_STRING_INITIALIZER(struct cmd_gso_enable_result,
> +                     cmd_keyword, "gso");
> +cmdline_parse_token_string_t cmd_gso_enable_mode =
> +     TOKEN_STRING_INITIALIZER(struct cmd_gso_enable_result,
> +                     cmd_mode, "on#off");
> +cmdline_parse_token_num_t cmd_gso_enable_pid =
> +     TOKEN_NUM_INITIALIZER(struct cmd_gso_enable_result,
> +                     cmd_pid, UINT8);
> +
> +cmdline_parse_inst_t cmd_gso_enable = {
> +     .f = cmd_gso_enable_parsed,
> +     .data = NULL,
> +     .help_str = "set port <port_id> gso on|off",
> +     .tokens = {
> +             (void *)&cmd_gso_enable_set,
> +             (void *)&cmd_gso_enable_port,
> +             (void *)&cmd_gso_enable_pid,
> +             (void *)&cmd_gso_enable_keyword,
> +             (void *)&cmd_gso_enable_mode,
> +             NULL,
> +     },
> +};
> +
> +/* *** SET MAX PACKET LENGTH FOR GSO SEGMENTS *** */
> +struct cmd_gso_size_result {
> +     cmdline_fixed_string_t cmd_set;
> +     cmdline_fixed_string_t cmd_keyword;
> +     cmdline_fixed_string_t cmd_segsz;
> +     uint16_t cmd_size;
> +};
> +
> +static void
> +cmd_gso_size_parsed(void *parsed_result,
> +                    __attribute__((unused)) struct cmdline *cl,
> +                    __attribute__((unused)) void *data)
> +{
> +     struct cmd_gso_size_result *res = parsed_result;
> +
> +     if (test_done == 0) {
> +             printf("Before setting GSO segsz, please first stop 
> fowarding\n");
> +             return;
> +     }
> +
> +     if (!strcmp(res->cmd_keyword, "gso") &&
> +                     !strcmp(res->cmd_segsz, "segsz")) {
> +             if (res->cmd_size == 0) {

As your gso_size includes packet header too, you probably shouldn't allow 
gso_size less
then some minimal value of l2_len + l3_len + l4_len + ...
Another alternative change gso_ctx.gso_size to count only payload size.

> +                     printf("gso_size should be larger than 0."
> +                                     " Please input a legal value\n");
> +             } else
> +                     gso_max_segment_size = res->cmd_size;
> +     }
> +}
> +
> +cmdline_parse_token_string_t cmd_gso_size_set =
> +     TOKEN_STRING_INITIALIZER(struct cmd_gso_size_result,
> +                             cmd_set, "set");
> +cmdline_parse_token_string_t cmd_gso_size_keyword =
> +     TOKEN_STRING_INITIALIZER(struct cmd_gso_size_result,
> +                             cmd_keyword, "gso");
> +cmdline_parse_token_string_t cmd_gso_size_segsz =
> +     TOKEN_STRING_INITIALIZER(struct cmd_gso_size_result,
> +                             cmd_segsz, "segsz");
> +cmdline_parse_token_num_t cmd_gso_size_size =
> +     TOKEN_NUM_INITIALIZER(struct cmd_gso_size_result,
> +                             cmd_size, UINT16);
> +
> +cmdline_parse_inst_t cmd_gso_size = {
> +     .f = cmd_gso_size_parsed,
> +     .data = NULL,
> +     .help_str = "set gso segsz <length>",
> +     .tokens = {
> +             (void *)&cmd_gso_size_set,
> +             (void *)&cmd_gso_size_keyword,
> +             (void *)&cmd_gso_size_segsz,
> +             (void *)&cmd_gso_size_size,
> +             NULL,
> +     },
> +};
> +
> +/* *** SHOW GSO CONFIGURATION *** */
> +struct cmd_gso_show_result {
> +     cmdline_fixed_string_t cmd_show;
> +     cmdline_fixed_string_t cmd_port;
> +     cmdline_fixed_string_t cmd_keyword;
> +     uint8_t cmd_pid;
> +};
> +
> +static void
> +cmd_gso_show_parsed(void *parsed_result,
> +                    __attribute__((unused)) struct cmdline *cl,
> +                    __attribute__((unused)) void *data)
> +{
> +     struct cmd_gso_show_result *res = parsed_result;
> +
> +     if (!rte_eth_dev_is_valid_port(res->cmd_pid)) {
> +             printf("invalid port id %u\n", res->cmd_pid);
> +             return;
> +     }
> +     if (!strcmp(res->cmd_keyword, "gso")) {
> +             if (gso_ports[res->cmd_pid].enable) {
> +                     printf("Max GSO'd packet size: %uB\n"
> +                                     "Supported GSO types: TCP/IPv4, "
> +                                     "VxLAN with inner TCP/IPv4 packet, "
> +                                     "GRE with inner TCP/IPv4  packet\n",
> +                                     gso_max_segment_size);
> +             } else
> +                     printf("GSO is not enabled on Port %u\n", res->cmd_pid);
> +     }
> +}
> +
> +cmdline_parse_token_string_t cmd_gso_show_show =
> +TOKEN_STRING_INITIALIZER(struct cmd_gso_show_result,
> +             cmd_show, "show");
> +cmdline_parse_token_string_t cmd_gso_show_port =
> +TOKEN_STRING_INITIALIZER(struct cmd_gso_show_result,
> +             cmd_port, "port");
> +cmdline_parse_token_string_t cmd_gso_show_keyword =
> +     TOKEN_STRING_INITIALIZER(struct cmd_gso_show_result,
> +                             cmd_keyword, "gso");
> +cmdline_parse_token_num_t cmd_gso_show_pid =
> +     TOKEN_NUM_INITIALIZER(struct cmd_gso_show_result,
> +                             cmd_pid, UINT8);
> +
> +cmdline_parse_inst_t cmd_gso_show = {
> +     .f = cmd_gso_show_parsed,
> +     .data = NULL,
> +     .help_str = "show port <port_id> gso",
> +     .tokens = {
> +             (void *)&cmd_gso_show_show,
> +             (void *)&cmd_gso_show_port,
> +             (void *)&cmd_gso_show_pid,
> +             (void *)&cmd_gso_show_keyword,
> +             NULL,
> +     },
> +};
> +
>  /* *** ENABLE/DISABLE FLUSH ON RX STREAMS *** */
>  struct cmd_set_flush_rx {
>       cmdline_fixed_string_t set;
> @@ -14255,6 +14430,9 @@ struct cmd_cmdfile_result {
>       (cmdline_parse_inst_t *)&cmd_tunnel_tso_show,
>       (cmdline_parse_inst_t *)&cmd_enable_gro,
>       (cmdline_parse_inst_t *)&cmd_gro_set,
> +     (cmdline_parse_inst_t *)&cmd_gso_enable,
> +     (cmdline_parse_inst_t *)&cmd_gso_size,
> +     (cmdline_parse_inst_t *)&cmd_gso_show,
>       (cmdline_parse_inst_t *)&cmd_link_flow_control_set,
>       (cmdline_parse_inst_t *)&cmd_link_flow_control_set_rx,
>       (cmdline_parse_inst_t *)&cmd_link_flow_control_set_tx,
> diff --git a/app/test-pmd/config.c b/app/test-pmd/config.c
> index 3ae3e1c..88d09d0 100644
> --- a/app/test-pmd/config.c
> +++ b/app/test-pmd/config.c
> @@ -2454,6 +2454,30 @@ struct igb_ring_desc_16_bytes {
>       }
>  }
> 
> +void
> +setup_gso(const char *mode, uint8_t port_id)
> +{
> +     if (!rte_eth_dev_is_valid_port(port_id)) {
> +             printf("invalid port id %u\n", port_id);
> +             return;
> +     }
> +     if (strcmp(mode, "on") == 0) {
> +             if (test_done == 0) {
> +                     printf("before enabling GSO,"
> +                                     " please stop forwarding first\n");
> +                     return;
> +             }
> +             gso_ports[port_id].enable = 1;
> +     } else if (strcmp(mode, "off") == 0) {
> +             if (test_done == 0) {
> +                     printf("before disabling GSO,"
> +                                     " please stop forwarding first\n");
> +                     return;
> +             }
> +             gso_ports[port_id].enable = 0;
> +     }
> +}
> +
>  char*
>  list_pkt_forwarding_modes(void)
>  {
> diff --git a/app/test-pmd/csumonly.c b/app/test-pmd/csumonly.c
> index 90c8119..bd1a287 100644
> --- a/app/test-pmd/csumonly.c
> +++ b/app/test-pmd/csumonly.c
> @@ -70,6 +70,8 @@
>  #include <rte_string_fns.h>
>  #include <rte_flow.h>
>  #include <rte_gro.h>
> +#include <rte_gso.h>
> +
>  #include "testpmd.h"
> 
>  #define IP_DEFTTL  64   /* from RFC 1340. */
> @@ -91,6 +93,7 @@
>  /* structure that caches offload info for the current packet */
>  struct testpmd_offload_info {
>       uint16_t ethertype;
> +     uint8_t gso_enable;
>       uint16_t l2_len;
>       uint16_t l3_len;
>       uint16_t l4_len;
> @@ -381,6 +384,8 @@ struct simple_gre_hdr {
>                               get_udptcp_checksum(l3_hdr, tcp_hdr,
>                                       info->ethertype);
>               }
> +             if (info->gso_enable)
> +                     ol_flags |= PKT_TX_TCP_SEG;
>       } else if (info->l4_proto == IPPROTO_SCTP) {
>               sctp_hdr = (struct sctp_hdr *)((char *)l3_hdr + info->l3_len);
>               sctp_hdr->cksum = 0;
> @@ -627,6 +632,9 @@ struct simple_gre_hdr {
>  pkt_burst_checksum_forward(struct fwd_stream *fs)
>  {
>       struct rte_mbuf *pkts_burst[MAX_PKT_BURST];
> +     struct rte_mbuf *gso_segments[GSO_MAX_PKT_BURST];
> +     struct rte_gso_ctx *gso_ctx;
> +     struct rte_mbuf **tx_pkts_burst;
>       struct rte_port *txp;
>       struct rte_mbuf *m, *p;
>       struct ether_hdr *eth_hdr;
> @@ -634,13 +642,15 @@ struct simple_gre_hdr {
>       uint16_t nb_rx;
>       uint16_t nb_tx;
>       uint16_t nb_prep;
> -     uint16_t i;
> +     uint16_t i, j;
>       uint64_t rx_ol_flags, tx_ol_flags;
>       uint16_t testpmd_ol_flags;
>       uint32_t retry;
>       uint32_t rx_bad_ip_csum;
>       uint32_t rx_bad_l4_csum;
>       struct testpmd_offload_info info;
> +     uint16_t nb_segments = 0;
> +     int ret;
> 
>  #ifdef RTE_TEST_PMD_RECORD_CORE_CYCLES
>       uint64_t start_tsc;
> @@ -674,6 +684,8 @@ struct simple_gre_hdr {
>       memset(&info, 0, sizeof(info));
>       info.tso_segsz = txp->tso_segsz;
>       info.tunnel_tso_segsz = txp->tunnel_tso_segsz;
> +     if (gso_ports[fs->tx_port].enable)
> +             info.gso_enable = 1;
> 
>       for (i = 0; i < nb_rx; i++) {
>               if (likely(i < nb_rx - 1))
> @@ -851,13 +863,59 @@ struct simple_gre_hdr {
>               }
>       }
> 
> +     if (gso_ports[fs->tx_port].enable == 0)
> +             tx_pkts_burst = pkts_burst;
> +     else {
> +             gso_ctx = &(current_fwd_lcore()->gso_ctx);
> +             gso_ctx->gso_size = gso_max_segment_size;
> +             for (i = 0; i < nb_rx; i++) {

It seems quite a lot of code to handle an error case, which I suppose
will happen pretty rare.
Why not just:

ret = rte_gso_segment(pkts_burst[i], gso_ctx,
                                        &gso_segments[nb_segments],
                                        RTE_DIM(gso_segments) - nb_segments);
If (ret < 0)  {
    RTE_LOG(DEBUG, ....);
     rte_free(pkts_burst[i]);
} else
   nb_segments += ret;



> +                     if (unlikely(nb_rx - i >= GSO_MAX_PKT_BURST -
> +                                             nb_segments)) {
> +                             /*
> +                              * insufficient space in gso_segments,
> +                              * stop GSO.
> +                              */
> +                             for (j = i; j < GSO_MAX_PKT_BURST -
> +                                             nb_segments; j++) {
> +                                     pkts_burst[j]->ol_flags &=
> +                                             (~PKT_TX_TCP_SEG);
> +                                     gso_segments[nb_segments++] =
> +                                             pkts_burst[j];
> +                             }
> +                             for (; j < nb_rx; j++)
> +                                     rte_pktmbuf_free(pkts_burst[j]);
> +                             break;
> +                     }
> +                     ret = rte_gso_segment(pkts_burst[i], gso_ctx,
> +                                     &gso_segments[nb_segments],
> +                                     GSO_MAX_PKT_BURST - nb_segments);
> +                     if (ret >= 1)
> +                             nb_segments += ret;
> +                     else if (ret < 0) {
> +                             /*
> +                              * insufficient MBUFs or space in
> +                              * gso_segments, stop GSO.
> +                              */
> +                             for (j = i; j < nb_rx; j++) {
> +                                     pkts_burst[j]->ol_flags &=
> +                                             (~PKT_TX_TCP_SEG);
> +                                     gso_segments[nb_segments++] =
> +                                             pkts_burst[j];
> +                             }
> +                             break;
> +                     }
> +             }
> +             tx_pkts_burst = gso_segments;
> +             nb_rx = nb_segments;
> +     }
> +
>       nb_prep = rte_eth_tx_prepare(fs->tx_port, fs->tx_queue,
> -                     pkts_burst, nb_rx);
> +                     tx_pkts_burst, nb_rx);
>       if (nb_prep != nb_rx)
>               printf("Preparing packet burst to transmit failed: %s\n",
>                               rte_strerror(rte_errno));
> 
> -     nb_tx = rte_eth_tx_burst(fs->tx_port, fs->tx_queue, pkts_burst,
> +     nb_tx = rte_eth_tx_burst(fs->tx_port, fs->tx_queue, tx_pkts_burst,
>                       nb_prep);
> 
>       /*
> @@ -868,7 +926,7 @@ struct simple_gre_hdr {
>               while (nb_tx < nb_rx && retry++ < burst_tx_retry_num) {
>                       rte_delay_us(burst_tx_delay_time);
>                       nb_tx += rte_eth_tx_burst(fs->tx_port, fs->tx_queue,
> -                                     &pkts_burst[nb_tx], nb_rx - nb_tx);
> +                                     &tx_pkts_burst[nb_tx], nb_rx - nb_tx);
>               }
>       }
>       fs->tx_packets += nb_tx;
> @@ -881,9 +939,10 @@ struct simple_gre_hdr {
>       if (unlikely(nb_tx < nb_rx)) {
>               fs->fwd_dropped += (nb_rx - nb_tx);
>               do {
> -                     rte_pktmbuf_free(pkts_burst[nb_tx]);
> +                     rte_pktmbuf_free(tx_pkts_burst[nb_tx]);
>               } while (++nb_tx < nb_rx);
>       }
> +
>  #ifdef RTE_TEST_PMD_RECORD_CORE_CYCLES
>       end_tsc = rte_rdtsc();
>       core_cycles = (end_tsc - start_tsc);
> diff --git a/app/test-pmd/testpmd.c b/app/test-pmd/testpmd.c
> index e097ee0..97e349d 100644
> --- a/app/test-pmd/testpmd.c
> +++ b/app/test-pmd/testpmd.c
> @@ -400,6 +400,9 @@ static int eth_event_callback(uint8_t port_id,
>   */
>  static int all_ports_started(void);
> 
> +struct gso_status gso_ports[RTE_MAX_ETHPORTS];
> +uint16_t gso_max_segment_size = ETHER_MAX_LEN - ETHER_CRC_LEN;
> +
>  /*
>   * Helper function to check if socket is already discovered.
>   * If yes, return positive value. If not, return zero.
> @@ -570,6 +573,7 @@ static int eth_event_callback(uint8_t port_id,
>       unsigned int nb_mbuf_per_pool;
>       lcoreid_t  lc_id;
>       uint8_t port_per_socket[RTE_MAX_NUMA_NODES];
> +     uint32_t gso_types = 0;
> 
>       memset(port_per_socket,0,RTE_MAX_NUMA_NODES);
> 
> @@ -654,6 +658,8 @@ static int eth_event_callback(uint8_t port_id,
> 
>       init_port_config();
> 
> +     gso_types = DEV_TX_OFFLOAD_TCP_TSO | DEV_TX_OFFLOAD_VXLAN_TNL_TSO |
> +             DEV_TX_OFFLOAD_GRE_TNL_TSO;
>       /*
>        * Records which Mbuf pool to use by each logical core, if needed.
>        */
> @@ -664,6 +670,13 @@ static int eth_event_callback(uint8_t port_id,
>               if (mbp == NULL)
>                       mbp = mbuf_pool_find(0);
>               fwd_lcores[lc_id]->mbp = mbp;
> +             /* initialize GSO context */
> +             fwd_lcores[lc_id]->gso_ctx.direct_pool = mbp;
> +             fwd_lcores[lc_id]->gso_ctx.indirect_pool = mbp;
> +             fwd_lcores[lc_id]->gso_ctx.gso_types = gso_types;
> +             fwd_lcores[lc_id]->gso_ctx.gso_size = ETHER_MAX_LEN -
> +                     ETHER_CRC_LEN;
> +             fwd_lcores[lc_id]->gso_ctx.ipid_flag = !RTE_GSO_IPID_FIXED;

Just
fwd_lcores[lc_id]->gso_ctx.ipid_flag = 0;
should do here.

Konstantin

Reply via email to