On 12/28/2018 9:03 PM, Konstantin Ananyev wrote: > Right now ipsec-secgw always enables TX offloads > (DEV_TX_OFFLOAD_MULTI_SEGS, DEV_TX_OFFLOAD_SECURITY), > even when they are not requested by the config. > That causes many PMD to choose full-featured TX function, > which in many cases is much slower then one without offloads. > That patch adds ability for the user to disable unneeded HW offloads. > If DEV_TX_OFFLOAD_IPV4_CKSUM is disabled by user, then > SW version of ip cksum calculation is used. > That allows to use vector TX function, when inline-ipsec is not > requested. > > Signed-off-by: Remy Horton <remy.hor...@intel.com> > Signed-off-by: Konstantin Ananyev <konstantin.anan...@intel.com> > Acked-by: Radu Nicolau <radu.nico...@intel.com> > --- > doc/guides/sample_app_ug/ipsec_secgw.rst | 12 +++ > examples/ipsec-secgw/ipsec-secgw.c | 126 ++++++++++++++++++++--- > examples/ipsec-secgw/ipsec.h | 6 ++ > examples/ipsec-secgw/sa.c | 35 +++++++ > 4 files changed, 164 insertions(+), 15 deletions(-) > > diff --git a/doc/guides/sample_app_ug/ipsec_secgw.rst > b/doc/guides/sample_app_ug/ipsec_secgw.rst > index 4869a011d..244bde2de 100644 > --- a/doc/guides/sample_app_ug/ipsec_secgw.rst > +++ b/doc/guides/sample_app_ug/ipsec_secgw.rst > @@ -95,6 +95,8 @@ The application has a number of command line options:: > -p PORTMASK -P -u PORTMASK -j FRAMESIZE > --config (port,queue,lcore)[,(port,queue,lcore] > --single-sa SAIDX > + --rxoffload MASK > + --txoffload MASK > -f CONFIG_FILE_PATH > > Where: > @@ -119,6 +121,16 @@ Where: > on both Inbound and Outbound. This option is meant for > debugging/performance > purposes. > > +* ``--rxoffload MASK``: RX HW offload capabilities to enable/use on this > port > + (bitmask of DEV_RX_OFFLOAD_* values). It is an optional parameter and > + allows user to disable some of the RX HW offload capabilities. > + By default all HW RX offloads are enabled. > + > +* ``--txoffload MASK``: TX HW offload capabilities to enable/use on this > port > + (bitmask of DEV_TX_OFFLOAD_* values). It is an optional parameter and > + allows user to disable some of the TX HW offload capabilities. > + By default all HW TX offloads are enabled. > + by default all should not be enabled. It should remain as it was before your patchset. It would be good if you can add a link to ethdev section where it explain different offloads available.
If anyone needs to change the default behavior, a patch need to be submitted to add that. > * ``-f CONFIG_FILE_PATH``: the full path of text-based file containing all > configuration items for running the application (See Configuration file > syntax section below). ``-f CONFIG_FILE_PATH`` **must** be specified. > diff --git a/examples/ipsec-secgw/ipsec-secgw.c > b/examples/ipsec-secgw/ipsec-secgw.c > index 1bc0b5b50..f5db3da0c 100644 > --- a/examples/ipsec-secgw/ipsec-secgw.c > +++ b/examples/ipsec-secgw/ipsec-secgw.c > @@ -124,6 +124,8 @@ struct ethaddr_info ethaddr_tbl[RTE_MAX_ETHPORTS] = { > #define CMD_LINE_OPT_CONFIG "config" > #define CMD_LINE_OPT_SINGLE_SA "single-sa" > #define CMD_LINE_OPT_CRYPTODEV_MASK "cryptodev_mask" > +#define CMD_LINE_OPT_RX_OFFLOAD "rxoffload" > +#define CMD_LINE_OPT_TX_OFFLOAD "txoffload" > > enum { > /* long options mapped to a short option */ > @@ -135,12 +137,16 @@ enum { > CMD_LINE_OPT_CONFIG_NUM, > CMD_LINE_OPT_SINGLE_SA_NUM, > CMD_LINE_OPT_CRYPTODEV_MASK_NUM, > + CMD_LINE_OPT_RX_OFFLOAD_NUM, > + CMD_LINE_OPT_TX_OFFLOAD_NUM, > }; > > static const struct option lgopts[] = { > {CMD_LINE_OPT_CONFIG, 1, 0, CMD_LINE_OPT_CONFIG_NUM}, > {CMD_LINE_OPT_SINGLE_SA, 1, 0, CMD_LINE_OPT_SINGLE_SA_NUM}, > {CMD_LINE_OPT_CRYPTODEV_MASK, 1, 0, CMD_LINE_OPT_CRYPTODEV_MASK_NUM}, > + {CMD_LINE_OPT_RX_OFFLOAD, 1, 0, CMD_LINE_OPT_RX_OFFLOAD_NUM}, > + {CMD_LINE_OPT_TX_OFFLOAD, 1, 0, CMD_LINE_OPT_TX_OFFLOAD_NUM}, > {NULL, 0, 0, 0} > }; > > @@ -155,6 +161,13 @@ static uint32_t single_sa; > static uint32_t single_sa_idx; > static uint32_t frame_size; > > +/* > + * RX/TX HW offload capabilities to enable/use on ethernet ports. > + * By default all capabilities are enabled. > + */ > +static uint64_t dev_rx_offload = UINT64_MAX; > +static uint64_t dev_tx_offload = UINT64_MAX; > + > struct lcore_rx_queue { > uint16_t port_id; > uint8_t queue_id; > @@ -208,8 +221,6 @@ static struct rte_eth_conf port_conf = { > }, > .txmode = { > .mq_mode = ETH_MQ_TX_NONE, > - .offloads = (DEV_TX_OFFLOAD_IPV4_CKSUM | > - DEV_TX_OFFLOAD_MULTI_SEGS), > }, > }; > > @@ -315,7 +326,8 @@ prepare_traffic(struct rte_mbuf **pkts, struct > ipsec_traffic *t, > } > > static inline void > -prepare_tx_pkt(struct rte_mbuf *pkt, uint16_t port) > +prepare_tx_pkt(struct rte_mbuf *pkt, uint16_t port, > + const struct lcore_conf *qconf) > { > struct ip *ip; > struct ether_hdr *ethhdr; > @@ -325,14 +337,19 @@ prepare_tx_pkt(struct rte_mbuf *pkt, uint16_t port) > ethhdr = (struct ether_hdr *)rte_pktmbuf_prepend(pkt, ETHER_HDR_LEN); > > if (ip->ip_v == IPVERSION) { > - pkt->ol_flags |= PKT_TX_IP_CKSUM | PKT_TX_IPV4; > + pkt->ol_flags |= qconf->outbound.ipv4_offloads; > pkt->l3_len = sizeof(struct ip); > pkt->l2_len = ETHER_HDR_LEN; > > ip->ip_sum = 0; > + > + /* calculate IPv4 cksum in SW */ > + if ((pkt->ol_flags & PKT_TX_IP_CKSUM) == 0) > + ip->ip_sum = rte_ipv4_cksum((struct ipv4_hdr *)ip); > + something is not correct, on my hardware I still see rte_ipv4_cksum getting called. This result in around 2% drop due to this patch. > ethhdr->ether_type = rte_cpu_to_be_16(ETHER_TYPE_IPv4); > } else { > - pkt->ol_flags |= PKT_TX_IPV6; > + pkt->ol_flags |= qconf->outbound.ipv6_offloads; > pkt->l3_len = sizeof(struct ip6_hdr); > pkt->l2_len = ETHER_HDR_LEN; > > @@ -346,18 +363,19 @@ prepare_tx_pkt(struct rte_mbuf *pkt, uint16_t port) > } > > static inline void > -prepare_tx_burst(struct rte_mbuf *pkts[], uint16_t nb_pkts, uint16_t port) > +prepare_tx_burst(struct rte_mbuf *pkts[], uint16_t nb_pkts, uint16_t port, > + const struct lcore_conf *qconf) > { > int32_t i; > const int32_t prefetch_offset = 2; > > for (i = 0; i < (nb_pkts - prefetch_offset); i++) { > rte_mbuf_prefetch_part2(pkts[i + prefetch_offset]); > - prepare_tx_pkt(pkts[i], port); > + prepare_tx_pkt(pkts[i], port, qconf); > } > /* Process left packets */ > for (; i < nb_pkts; i++) > - prepare_tx_pkt(pkts[i], port); > + prepare_tx_pkt(pkts[i], port, qconf); > } > > /* Send burst of packets on an output interface */ > @@ -371,7 +389,7 @@ send_burst(struct lcore_conf *qconf, uint16_t n, uint16_t > port) > queueid = qconf->tx_queue_id[port]; > m_table = (struct rte_mbuf **)qconf->tx_mbufs[port].m_table; > > - prepare_tx_burst(m_table, n, port); > + prepare_tx_burst(m_table, n, port, qconf); > > ret = rte_eth_tx_burst(port, queueid, m_table, n); > if (unlikely(ret < n)) { > @@ -954,6 +972,8 @@ print_usage(const char *prgname) > " --config (port,queue,lcore)[,(port,queue,lcore)]" > " [--single-sa SAIDX]" > " [--cryptodev_mask MASK]" > + " [--" CMD_LINE_OPT_RX_OFFLOAD " RX_OFFLOAD_MASK]" > + " [--" CMD_LINE_OPT_TX_OFFLOAD " TX_OFFLOAD_MASK]" > "\n\n" > " -p PORTMASK: Hexadecimal bitmask of ports to configure\n" > " -P : Enable promiscuous mode\n" > @@ -966,10 +986,31 @@ print_usage(const char *prgname) > " bypassing the SP\n" > " --cryptodev_mask MASK: Hexadecimal bitmask of the crypto\n" > " devices to configure\n" > + " --" CMD_LINE_OPT_RX_OFFLOAD > + ": bitmask of the RX HW offload capabilities to enable/use\n" > + " (DEV_RX_OFFLOAD_*)\n" > + " --" CMD_LINE_OPT_TX_OFFLOAD > + ": bitmask of the TX HW offload capabilities to enable/use\n" > + " (DEV_TX_OFFLOAD_*)\n" > "\n", > prgname); > } > > +static int > +parse_mask(const char *str, uint64_t *val) > +{ > + char *end; > + unsigned long t; > + > + errno = 0; > + t = strtoul(str, &end, 0); > + if (errno != 0 || end[0] != 0) > + return -EINVAL; > + > + *val = t; > + return 0; > +} > + > static int32_t > parse_portmask(const char *portmask) > { > @@ -1156,6 +1197,24 @@ parse_args(int32_t argc, char **argv) > /* else */ > enabled_cryptodev_mask = ret; > break; > + case CMD_LINE_OPT_RX_OFFLOAD_NUM: > + ret = parse_mask(optarg, &dev_rx_offload); > + if (ret != 0) { > + printf("Invalid argument for \'%s\': %s\n", > + CMD_LINE_OPT_RX_OFFLOAD, optarg); > + print_usage(prgname); > + return -1; > + } > + break; > + case CMD_LINE_OPT_TX_OFFLOAD_NUM: > + ret = parse_mask(optarg, &dev_tx_offload); > + if (ret != 0) { > + printf("Invalid argument for \'%s\': %s\n", > + CMD_LINE_OPT_TX_OFFLOAD, optarg); > + print_usage(prgname); > + return -1; > + } > + break; > default: > print_usage(prgname); > return -1; > @@ -1543,7 +1602,7 @@ cryptodevs_init(void) > } > > static void > -port_init(uint16_t portid) > +port_init(uint16_t portid, uint64_t req_rx_offloads, uint64_t > req_tx_offloads) > { > struct rte_eth_dev_info dev_info; > struct rte_eth_txconf *txconf; > @@ -1556,6 +1615,10 @@ port_init(uint16_t portid) > > rte_eth_dev_info_get(portid, &dev_info); > > + /* limit allowed HW offloafs, as user requested */ > + dev_info.rx_offload_capa &= dev_rx_offload; > + dev_info.tx_offload_capa &= dev_tx_offload; > + > printf("Configuring device port %u:\n", portid); > > rte_eth_macaddr_get(portid, ðaddr); > @@ -1584,14 +1647,38 @@ port_init(uint16_t portid) > local_port_conf.rxmode.offloads |= DEV_RX_OFFLOAD_JUMBO_FRAME; > } > > - if (dev_info.rx_offload_capa & DEV_RX_OFFLOAD_SECURITY) > - local_port_conf.rxmode.offloads |= DEV_RX_OFFLOAD_SECURITY; > - if (dev_info.tx_offload_capa & DEV_TX_OFFLOAD_SECURITY) > - local_port_conf.txmode.offloads |= DEV_TX_OFFLOAD_SECURITY; > + local_port_conf.rxmode.offloads |= req_rx_offloads; > + local_port_conf.txmode.offloads |= req_tx_offloads; > + > + /* Check that all required capabilities are supported */ > + if ((local_port_conf.rxmode.offloads & dev_info.rx_offload_capa) != > + local_port_conf.rxmode.offloads) > + rte_exit(EXIT_FAILURE, > + "Error: port %u required RX offloads: 0x%" PRIx64 > + ", avaialbe RX offloads: 0x%" PRIx64 "\n", > + portid, local_port_conf.rxmode.offloads, > + dev_info.rx_offload_capa); > + > + if ((local_port_conf.txmode.offloads & dev_info.tx_offload_capa) != > + local_port_conf.txmode.offloads) > + rte_exit(EXIT_FAILURE, > + "Error: port %u required TX offloads: 0x%" PRIx64 > + ", avaialbe TX offloads: 0x%" PRIx64 "\n", > + portid, local_port_conf.txmode.offloads, > + dev_info.tx_offload_capa); > + > if (dev_info.tx_offload_capa & DEV_TX_OFFLOAD_MBUF_FAST_FREE) > local_port_conf.txmode.offloads |= > DEV_TX_OFFLOAD_MBUF_FAST_FREE; > > + if (dev_info.tx_offload_capa & DEV_TX_OFFLOAD_IPV4_CKSUM) > + local_port_conf.txmode.offloads |= DEV_TX_OFFLOAD_IPV4_CKSUM; > + > + printf("port %u configurng rx_offloads=0x%" PRIx64 > + ", tx_offloads=0x%" PRIx64 "\n", > + portid, local_port_conf.rxmode.offloads, > + local_port_conf.txmode.offloads); > + > local_port_conf.rx_adv_conf.rss_conf.rss_hf &= > dev_info.flow_type_rss_offloads; > if (local_port_conf.rx_adv_conf.rss_conf.rss_hf != > @@ -1639,6 +1726,13 @@ port_init(uint16_t portid) > > qconf = &lcore_conf[lcore_id]; > qconf->tx_queue_id[portid] = tx_queueid; > + > + /* Pre-populate pkt offloads based on capabilities */ > + qconf->outbound.ipv4_offloads = PKT_TX_IPV4; > + qconf->outbound.ipv6_offloads = PKT_TX_IPV6; > + if (req_tx_offloads & DEV_TX_OFFLOAD_IPV4_CKSUM) > + qconf->outbound.ipv4_offloads |= PKT_TX_IP_CKSUM; I believe this is the issue, this should not be req_tx_offload. req_tx_offloads cannot have DEV_TX_OFFLOAD_IPV4_CKSUM set for lookaside mode. > + > tx_queueid++; > > /* init RX queues */ > @@ -1749,6 +1843,7 @@ main(int32_t argc, char **argv) > uint32_t lcore_id; > uint8_t socket_id; > uint16_t portid; > + uint64_t req_rx_offloads, req_tx_offloads; > > /* init EAL */ > ret = rte_eal_init(argc, argv); > @@ -1804,7 +1899,8 @@ main(int32_t argc, char **argv) > if ((enabled_port_mask & (1 << portid)) == 0) > continue; > > - port_init(portid); > + sa_check_offloads(portid, &req_rx_offloads, &req_tx_offloads); > + port_init(portid, req_rx_offloads, req_tx_offloads); > } > > cryptodevs_init(); > diff --git a/examples/ipsec-secgw/ipsec.h b/examples/ipsec-secgw/ipsec.h > index c998c8076..9b1586f52 100644 > --- a/examples/ipsec-secgw/ipsec.h > +++ b/examples/ipsec-secgw/ipsec.h > @@ -146,6 +146,8 @@ struct ipsec_ctx { > struct rte_mempool *session_pool; > struct rte_mbuf *ol_pkts[MAX_PKT_BURST] __rte_aligned(sizeof(void *)); > uint16_t ol_pkts_cnt; > + uint64_t ipv4_offloads; > + uint64_t ipv6_offloads; > }; > > struct cdev_key { > @@ -239,4 +241,8 @@ sa_init(struct socket_ctx *ctx, int32_t socket_id); > void > rt_init(struct socket_ctx *ctx, int32_t socket_id); > > +int > +sa_check_offloads(uint16_t port_id, uint64_t *rx_offloads, > + uint64_t *tx_offloads); > + > #endif /* __IPSEC_H__ */ > diff --git a/examples/ipsec-secgw/sa.c b/examples/ipsec-secgw/sa.c > index d2d3550a4..f6271bc60 100644 > --- a/examples/ipsec-secgw/sa.c > +++ b/examples/ipsec-secgw/sa.c > @@ -1017,3 +1017,38 @@ outbound_sa_lookup(struct sa_ctx *sa_ctx, uint32_t > sa_idx[], > for (i = 0; i < nb_pkts; i++) > sa[i] = &sa_ctx->sa[sa_idx[i]]; > } > + > +/* > + * Select HW offloads to be used. > + */ > +int > +sa_check_offloads(uint16_t port_id, uint64_t *rx_offloads, > + uint64_t *tx_offloads) > +{ > + struct ipsec_sa *rule; > + uint32_t idx_sa; > + > + *rx_offloads = 0; > + *tx_offloads = 0; > + > + /* Check for inbound rules that use offloads and use this port */ > + for (idx_sa = 0; idx_sa < nb_sa_in; idx_sa++) { > + rule = &sa_in[idx_sa]; > + if ((rule->type == RTE_SECURITY_ACTION_TYPE_INLINE_CRYPTO || > + rule->type == > + RTE_SECURITY_ACTION_TYPE_INLINE_PROTOCOL) > + && rule->portid == port_id) > + *rx_offloads |= DEV_RX_OFFLOAD_SECURITY; > + } > + > + /* Check for outbound rules that use offloads and use this port */ > + for (idx_sa = 0; idx_sa < nb_sa_out; idx_sa++) { > + rule = &sa_out[idx_sa]; > + if ((rule->type == RTE_SECURITY_ACTION_TYPE_INLINE_CRYPTO || > + rule->type == > + RTE_SECURITY_ACTION_TYPE_INLINE_PROTOCOL) > + && rule->portid == port_id) > + *tx_offloads |= DEV_TX_OFFLOAD_SECURITY; > + } > + return 0; > +}