> -----Original Message----- > From: Maciej Fijalkowski <maciej.fijalkow...@intel.com> > Sent: Tuesday, November 24, 2020 21:52 > To: Camelia Alexandra Groza <camelia.gr...@nxp.com> > Cc: k...@kernel.org; bro...@redhat.com; sa...@kernel.org; > da...@davemloft.net; Madalin Bucur (OSS) > <madalin.bu...@oss.nxp.com>; Ioana Ciornei <ioana.cior...@nxp.com>; > netdev@vger.kernel.org > Subject: Re: [PATCH net-next v4 4/7] dpaa_eth: add XDP_TX support > > On Mon, Nov 23, 2020 at 07:36:22PM +0200, Camelia Groza wrote: > > Use an xdp_frame structure for managing the frame. Store a backpointer to > > the structure at the start of the buffer before enqueueing for cleanup > > on TX confirmation. Reserve DPAA_TX_PRIV_DATA_SIZE bytes from the frame > > size shared with the XDP program for this purpose. Use the XDP > > API for freeing the buffer when it returns to the driver on the TX > > confirmation path. > > > > The frame queues are shared with the netstack. > > Can you also provide the info from cover letter about locklessness (is > that even a word?) in here?
Sure. > One question below and: > > Reviewed-by: Maciej Fijalkowski <maciej.fijalkow...@intel.com> > > > > > This approach will be reused for XDP REDIRECT. > > > > Acked-by: Madalin Bucur <madalin.bu...@oss.nxp.com> > > Signed-off-by: Camelia Groza <camelia.gr...@nxp.com> > > --- > > Changes in v4: > > - call xdp_rxq_info_is_reg() before unregistering > > - minor cleanups (remove unneeded variable, print error code) > > - add more details in the commit message > > - did not call qman_destroy_fq() in case of xdp_rxq_info_reg() failure > > since it would lead to a double free of the fq resources > > > > drivers/net/ethernet/freescale/dpaa/dpaa_eth.c | 128 > ++++++++++++++++++++++++- > > drivers/net/ethernet/freescale/dpaa/dpaa_eth.h | 2 + > > 2 files changed, 125 insertions(+), 5 deletions(-) > > > > diff --git a/drivers/net/ethernet/freescale/dpaa/dpaa_eth.c > b/drivers/net/ethernet/freescale/dpaa/dpaa_eth.c > > index ee076f4..0deffcc 100644 > > --- a/drivers/net/ethernet/freescale/dpaa/dpaa_eth.c > > +++ b/drivers/net/ethernet/freescale/dpaa/dpaa_eth.c > > @@ -1130,6 +1130,24 @@ static int dpaa_fq_init(struct dpaa_fq *dpaa_fq, > bool td_enable) > > > > dpaa_fq->fqid = qman_fq_fqid(fq); > > > > + if (dpaa_fq->fq_type == FQ_TYPE_RX_DEFAULT || > > + dpaa_fq->fq_type == FQ_TYPE_RX_PCD) { > > + err = xdp_rxq_info_reg(&dpaa_fq->xdp_rxq, dpaa_fq- > >net_dev, > > + dpaa_fq->fqid); > > + if (err) { > > + dev_err(dev, "xdp_rxq_info_reg() = %d\n", err); > > + return err; > > + } > > + > > + err = xdp_rxq_info_reg_mem_model(&dpaa_fq->xdp_rxq, > > + MEM_TYPE_PAGE_ORDER0, > NULL); > > + if (err) { > > + dev_err(dev, "xdp_rxq_info_reg_mem_model() = > %d\n", err); > > + xdp_rxq_info_unreg(&dpaa_fq->xdp_rxq); > > + return err; > > + } > > + } > > + > > return 0; > > } > > > > @@ -1159,6 +1177,11 @@ static int dpaa_fq_free_entry(struct device > *dev, struct qman_fq *fq) > > } > > } > > > > + if ((dpaa_fq->fq_type == FQ_TYPE_RX_DEFAULT || > > + dpaa_fq->fq_type == FQ_TYPE_RX_PCD) && 
> > + xdp_rxq_info_is_reg(&dpaa_fq->xdp_rxq)) > > + xdp_rxq_info_unreg(&dpaa_fq->xdp_rxq); > > + > > qman_destroy_fq(fq); > > list_del(&dpaa_fq->list); > > > > @@ -1625,6 +1648,9 @@ static int dpaa_eth_refill_bpools(struct dpaa_priv > *priv) > > * > > * Return the skb backpointer, since for S/G frames the buffer containing > > it > > * gets freed here. > > + * > > + * No skb backpointer is set when transmitting XDP frames. Cleanup the > buffer > > + * and return NULL in this case. > > */ > > static struct sk_buff *dpaa_cleanup_tx_fd(const struct dpaa_priv *priv, > > const struct qm_fd *fd, bool ts) > > @@ -1664,13 +1690,21 @@ static struct sk_buff > *dpaa_cleanup_tx_fd(const struct dpaa_priv *priv, > > } > > } else { > > dma_unmap_single(priv->tx_dma_dev, addr, > > - priv->tx_headroom + > qm_fd_get_length(fd), > > + qm_fd_get_offset(fd) + > qm_fd_get_length(fd), > > dma_dir); > > } > > > > swbp = (struct dpaa_eth_swbp *)vaddr; > > skb = swbp->skb; > > > > + /* No skb backpointer is set when running XDP. An xdp_frame > > + * backpointer is saved instead. 
> > + */ > > + if (!skb) { > > + xdp_return_frame(swbp->xdpf); > > + return NULL; > > + } > > + > > /* DMA unmapping is required before accessing the HW provided > info */ > > if (ts && priv->tx_tstamp && > > skb_shinfo(skb)->tx_flags & SKBTX_HW_TSTAMP) { > > @@ -2350,11 +2384,76 @@ static enum qman_cb_dqrr_result > rx_error_dqrr(struct qman_portal *portal, > > return qman_cb_dqrr_consume; > > } > > > > +static int dpaa_xdp_xmit_frame(struct net_device *net_dev, > > + struct xdp_frame *xdpf) > > +{ > > + struct dpaa_priv *priv = netdev_priv(net_dev); > > + struct rtnl_link_stats64 *percpu_stats; > > + struct dpaa_percpu_priv *percpu_priv; > > + struct dpaa_eth_swbp *swbp; > > + struct netdev_queue *txq; > > + void *buff_start; > > + struct qm_fd fd; > > + dma_addr_t addr; > > + int err; > > + > > + percpu_priv = this_cpu_ptr(priv->percpu_priv); > > + percpu_stats = &percpu_priv->stats; > > + > > + if (xdpf->headroom < DPAA_TX_PRIV_DATA_SIZE) { > > + err = -EINVAL; > > + goto out_error; > > + } > > + > > + buff_start = xdpf->data - xdpf->headroom; > > + > > + /* Leave empty the skb backpointer at the start of the buffer. > > + * Save the XDP frame for easy cleanup on confirmation. > > + */ > > + swbp = (struct dpaa_eth_swbp *)buff_start; > > + swbp->skb = NULL; > > + swbp->xdpf = xdpf; > > + > > + qm_fd_clear_fd(&fd); > > + fd.bpid = FSL_DPAA_BPID_INV; > > + fd.cmd |= cpu_to_be32(FM_FD_CMD_FCO); > > + qm_fd_set_contig(&fd, xdpf->headroom, xdpf->len); > > + > > + addr = dma_map_single(priv->tx_dma_dev, buff_start, > > + xdpf->headroom + xdpf->len, > > + DMA_TO_DEVICE); > > Not sure if I asked that. What is the purpose for including the headroom > in frame being set? I would expect to take into account only frame from > xdpf->data. The xdpf headroom becomes the fd's offset, the area before the data where the backpointers for cleanup are stored. This area isn't sent out with the frame. 
> > + if (unlikely(dma_mapping_error(priv->tx_dma_dev, addr))) { > > + err = -EINVAL; > > + goto out_error; > > + } > > + > > + qm_fd_addr_set64(&fd, addr); > > + > > + /* Bump the trans_start */ > > + txq = netdev_get_tx_queue(net_dev, smp_processor_id()); > > + txq->trans_start = jiffies; > > + > > + err = dpaa_xmit(priv, percpu_stats, smp_processor_id(), &fd); > > + if (err) { > > + dma_unmap_single(priv->tx_dma_dev, addr, > > + qm_fd_get_offset(&fd) + > qm_fd_get_length(&fd), > > + DMA_TO_DEVICE); > > + goto out_error; > > + } > > + > > + return 0; > > + > > +out_error: > > + percpu_stats->tx_errors++; > > + return err; > > +} > > + > > static u32 dpaa_run_xdp(struct dpaa_priv *priv, struct qm_fd *fd, void > *vaddr, > > - unsigned int *xdp_meta_len) > > + struct dpaa_fq *dpaa_fq, unsigned int > *xdp_meta_len) > > { > > ssize_t fd_off = qm_fd_get_offset(fd); > > struct bpf_prog *xdp_prog; > > + struct xdp_frame *xdpf; > > struct xdp_buff xdp; > > u32 xdp_act; > > > > @@ -2370,7 +2469,8 @@ static u32 dpaa_run_xdp(struct dpaa_priv *priv, > struct qm_fd *fd, void *vaddr, > > xdp.data_meta = xdp.data; > > xdp.data_hard_start = xdp.data - XDP_PACKET_HEADROOM; > > xdp.data_end = xdp.data + qm_fd_get_length(fd); > > - xdp.frame_sz = DPAA_BP_RAW_SIZE; > > + xdp.frame_sz = DPAA_BP_RAW_SIZE - DPAA_TX_PRIV_DATA_SIZE; > > + xdp.rxq = &dpaa_fq->xdp_rxq; > > > > xdp_act = bpf_prog_run_xdp(xdp_prog, &xdp); > > > > @@ -2381,6 +2481,22 @@ static u32 dpaa_run_xdp(struct dpaa_priv *priv, > struct qm_fd *fd, void *vaddr, > > case XDP_PASS: > > *xdp_meta_len = xdp.data - xdp.data_meta; > > break; > > + case XDP_TX: > > + /* We can access the full headroom when sending the frame > > + * back out > > + */ > > + xdp.data_hard_start = vaddr; > > + xdp.frame_sz = DPAA_BP_RAW_SIZE; > > + xdpf = xdp_convert_buff_to_frame(&xdp); > > + if (unlikely(!xdpf)) { > > + free_pages((unsigned long)vaddr, 0); > > + break; > > + } > > + > > + if (dpaa_xdp_xmit_frame(priv->net_dev, xdpf)) > > + 
xdp_return_frame_rx_napi(xdpf); > > + > > + break; > > default: > > bpf_warn_invalid_xdp_action(xdp_act); > > fallthrough; > > @@ -2415,6 +2531,7 @@ static enum qman_cb_dqrr_result > rx_default_dqrr(struct qman_portal *portal, > > u32 fd_status, hash_offset; > > struct qm_sg_entry *sgt; > > struct dpaa_bp *dpaa_bp; > > + struct dpaa_fq *dpaa_fq; > > struct dpaa_priv *priv; > > struct sk_buff *skb; > > int *count_ptr; > > @@ -2423,9 +2540,10 @@ static enum qman_cb_dqrr_result > rx_default_dqrr(struct qman_portal *portal, > > u32 hash; > > u64 ns; > > > > + dpaa_fq = container_of(fq, struct dpaa_fq, fq_base); > > fd_status = be32_to_cpu(fd->status); > > fd_format = qm_fd_get_format(fd); > > - net_dev = ((struct dpaa_fq *)fq)->net_dev; > > + net_dev = dpaa_fq->net_dev; > > priv = netdev_priv(net_dev); > > dpaa_bp = dpaa_bpid2pool(dq->fd.bpid); > > if (!dpaa_bp) > > @@ -2494,7 +2612,7 @@ static enum qman_cb_dqrr_result > rx_default_dqrr(struct qman_portal *portal, > > > > if (likely(fd_format == qm_fd_contig)) { > > xdp_act = dpaa_run_xdp(priv, (struct qm_fd *)fd, vaddr, > > - &xdp_meta_len); > > + dpaa_fq, &xdp_meta_len); > > if (xdp_act != XDP_PASS) { > > percpu_stats->rx_packets++; > > percpu_stats->rx_bytes += qm_fd_get_length(fd); > > diff --git a/drivers/net/ethernet/freescale/dpaa/dpaa_eth.h > b/drivers/net/ethernet/freescale/dpaa/dpaa_eth.h > > index 94e8613..5c8d52a 100644 > > --- a/drivers/net/ethernet/freescale/dpaa/dpaa_eth.h > > +++ b/drivers/net/ethernet/freescale/dpaa/dpaa_eth.h > > @@ -68,6 +68,7 @@ struct dpaa_fq { > > u16 channel; > > u8 wq; > > enum dpaa_fq_type fq_type; > > + struct xdp_rxq_info xdp_rxq; > > }; > > > > struct dpaa_fq_cbs { > > @@ -150,6 +151,7 @@ struct dpaa_buffer_layout { > > */ > > struct dpaa_eth_swbp { > > struct sk_buff *skb; > > + struct xdp_frame *xdpf; > > }; > > > > struct dpaa_priv { > > -- > > 1.9.1 > >