> -----Original Message-----
> From: Thomas Monjalon <tho...@monjalon.net>
> Sent: Tuesday, November 3, 2020 2:14
> To: dev@dpdk.org
> Cc: ferruh.yi...@intel.com; david.march...@redhat.com;
> bruce.richard...@intel.com; olivier.m...@6wind.com;
> andrew.rybche...@oktetlabs.ru; jer...@marvell.com; Slava Ovsiienko
> <viachesl...@nvidia.com>; Ruifeng Wang <ruifeng.w...@arm.com>; David
> Christensen <d...@linux.vnet.ibm.com>; Matan Azrad <ma...@nvidia.com>;
> Shahaf Shuler <shah...@nvidia.com>; Konstantin Ananyev
> <konstantin.anan...@intel.com>
> Subject: [PATCH v3 07/16] net/mlx5: switch Rx timestamp to dynamic mbuf
> field
> 
> The mbuf timestamp is moved to a dynamic field in order to allow removal of
> the deprecated static field.
> The related mbuf flag is also replaced.
> 
> The dynamic offset and flag are stored in struct mlx5_rxq_data to favor cache
> locality.
> 
> Signed-off-by: Thomas Monjalon <tho...@monjalon.net>
> Reviewed-by: Ruifeng Wang <ruifeng.w...@arm.com>
> Reviewed-by: David Christensen <d...@linux.vnet.ibm.com>
Reviewed-by: Viacheslav Ovsiienko <viachesl...@nvidia.com>

> ---
>  drivers/net/mlx5/mlx5_rxq.c              |  8 +++++
>  drivers/net/mlx5/mlx5_rxtx.c             |  4 +--
>  drivers/net/mlx5/mlx5_rxtx.h             | 19 +++++++++++
>  drivers/net/mlx5/mlx5_rxtx_vec_altivec.h | 41 +++++++++++-----------
>  drivers/net/mlx5/mlx5_rxtx_vec_neon.h    | 43 ++++++++++++------------
>  drivers/net/mlx5/mlx5_rxtx_vec_sse.h     | 35 +++++++++----------
>  6 files changed, 90 insertions(+), 60 deletions(-)
> 
> diff --git a/drivers/net/mlx5/mlx5_rxq.c b/drivers/net/mlx5/mlx5_rxq.c index
> f1d8373079..52519910ee 100644
> --- a/drivers/net/mlx5/mlx5_rxq.c
> +++ b/drivers/net/mlx5/mlx5_rxq.c
> @@ -1492,7 +1492,15 @@ mlx5_rxq_new(struct rte_eth_dev *dev, uint16_t
> idx, uint16_t desc,
>       mlx5_max_lro_msg_size_adjust(dev, idx, max_lro_size);
>       /* Toggle RX checksum offload if hardware supports it. */
>       tmpl->rxq.csum = !!(offloads & DEV_RX_OFFLOAD_CHECKSUM);
> +     /* Configure Rx timestamp. */
>       tmpl->rxq.hw_timestamp = !!(offloads &
> DEV_RX_OFFLOAD_TIMESTAMP);
> +     tmpl->rxq.timestamp_rx_flag = 0;
> +     if (tmpl->rxq.hw_timestamp &&
> rte_mbuf_dyn_rx_timestamp_register(
> +                     &tmpl->rxq.timestamp_offset,
> +                     &tmpl->rxq.timestamp_rx_flag) != 0) {
> +             DRV_LOG(ERR, "Cannot register Rx timestamp field/flag");
> +             goto error;
> +     }
>       /* Configure VLAN stripping. */
>       tmpl->rxq.vlan_strip = !!(offloads & DEV_RX_OFFLOAD_VLAN_STRIP);
>       /* By default, FCS (CRC) is stripped by hardware. */ diff --git
> a/drivers/net/mlx5/mlx5_rxtx.c b/drivers/net/mlx5/mlx5_rxtx.c index
> e86468b67a..b577aab00b 100644
> --- a/drivers/net/mlx5/mlx5_rxtx.c
> +++ b/drivers/net/mlx5/mlx5_rxtx.c
> @@ -1287,8 +1287,8 @@ rxq_cq_to_mbuf(struct mlx5_rxq_data *rxq, struct
> rte_mbuf *pkt,
> 
>               if (rxq->rt_timestamp)
>                       ts = mlx5_txpp_convert_rx_ts(rxq->sh, ts);
> -             pkt->timestamp = ts;
> -             pkt->ol_flags |= PKT_RX_TIMESTAMP;
> +             mlx5_timestamp_set(pkt, rxq->timestamp_offset, ts);
> +             pkt->ol_flags |= rxq->timestamp_rx_flag;
>       }
>  }
> 
> diff --git a/drivers/net/mlx5/mlx5_rxtx.h b/drivers/net/mlx5/mlx5_rxtx.h index
> 674296ee98..e9eca36b40 100644
> --- a/drivers/net/mlx5/mlx5_rxtx.h
> +++ b/drivers/net/mlx5/mlx5_rxtx.h
> @@ -151,6 +151,8 @@ struct mlx5_rxq_data {
>       /* CQ (UAR) access lock required for 32bit implementations */  #endif
>       uint32_t tunnel; /* Tunnel information. */
> +     int timestamp_offset; /* Dynamic mbuf field for timestamp. */
> +     uint64_t timestamp_rx_flag; /* Dynamic mbuf flag for timestamp. */
>       uint64_t flow_meta_mask;
>       int32_t flow_meta_offset;
>  } __rte_cache_aligned;
> @@ -681,4 +683,21 @@ mlx5_txpp_convert_tx_ts(struct
> mlx5_dev_ctx_shared *sh, uint64_t mts)
>       return ci;
>  }
> 
> +/**
> + * Set timestamp in mbuf dynamic field.
> + *
> + * @param mbuf
> + *   Structure to write into.
> + * @param offset
> + *   Dynamic field offset in mbuf structure.
> + * @param timestamp
> + *   Value to write.
> + */
> +static __rte_always_inline void
> +mlx5_timestamp_set(struct rte_mbuf *mbuf, int offset,
> +             rte_mbuf_timestamp_t timestamp)
> +{
> +     *RTE_MBUF_DYNFIELD(mbuf, offset, rte_mbuf_timestamp_t *) =
> timestamp;
> +}
> +
>  #endif /* RTE_PMD_MLX5_RXTX_H_ */
> diff --git a/drivers/net/mlx5/mlx5_rxtx_vec_altivec.h
> b/drivers/net/mlx5/mlx5_rxtx_vec_altivec.h
> index 6bf0c9b540..171d7bb0f8 100644
> --- a/drivers/net/mlx5/mlx5_rxtx_vec_altivec.h
> +++ b/drivers/net/mlx5/mlx5_rxtx_vec_altivec.h
> @@ -330,13 +330,13 @@ rxq_cq_to_ptype_oflags_v(struct mlx5_rxq_data
> *rxq,
>       vector unsigned char ol_flags = (vector unsigned char)
>               (vector unsigned int){
>                       rxq->rss_hash * PKT_RX_RSS_HASH |
> -                             rxq->hw_timestamp * PKT_RX_TIMESTAMP,
> +                             rxq->hw_timestamp * rxq-
> >timestamp_rx_flag,
>                       rxq->rss_hash * PKT_RX_RSS_HASH |
> -                             rxq->hw_timestamp * PKT_RX_TIMESTAMP,
> +                             rxq->hw_timestamp * rxq-
> >timestamp_rx_flag,
>                       rxq->rss_hash * PKT_RX_RSS_HASH |
> -                             rxq->hw_timestamp * PKT_RX_TIMESTAMP,
> +                             rxq->hw_timestamp * rxq-
> >timestamp_rx_flag,
>                       rxq->rss_hash * PKT_RX_RSS_HASH |
> -                             rxq->hw_timestamp * PKT_RX_TIMESTAMP};
> +                             rxq->hw_timestamp * rxq-
> >timestamp_rx_flag};
>       vector unsigned char cv_flags;
>       const vector unsigned char zero = (vector unsigned char){0};
>       const vector unsigned char ptype_mask = @@ -1025,31 +1025,32 @@
> rxq_burst_v(struct mlx5_rxq_data *rxq, struct rte_mbuf **pkts, uint16_t
> pkts_n,
>               /* D.5 fill in mbuf - rearm_data and packet_type. */
>               rxq_cq_to_ptype_oflags_v(rxq, cqes, opcode, &pkts[pos]);
>               if (rxq->hw_timestamp) {
> +                     int offset = rxq->timestamp_offset;
>                       if (rxq->rt_timestamp) {
>                               struct mlx5_dev_ctx_shared *sh = rxq->sh;
>                               uint64_t ts;
> 
>                               ts = rte_be_to_cpu_64(cq[pos].timestamp);
> -                             pkts[pos]->timestamp =
> -                                     mlx5_txpp_convert_rx_ts(sh, ts);
> +                             mlx5_timestamp_set(pkts[pos], offset,
> +                                     mlx5_txpp_convert_rx_ts(sh, ts));
>                               ts = rte_be_to_cpu_64(cq[pos +
> p1].timestamp);
> -                             pkts[pos + 1]->timestamp =
> -                                     mlx5_txpp_convert_rx_ts(sh, ts);
> +                             mlx5_timestamp_set(pkts[pos + 1], offset,
> +                                     mlx5_txpp_convert_rx_ts(sh, ts));
>                               ts = rte_be_to_cpu_64(cq[pos +
> p2].timestamp);
> -                             pkts[pos + 2]->timestamp =
> -                                     mlx5_txpp_convert_rx_ts(sh, ts);
> +                             mlx5_timestamp_set(pkts[pos + 2], offset,
> +                                     mlx5_txpp_convert_rx_ts(sh, ts));
>                               ts = rte_be_to_cpu_64(cq[pos +
> p3].timestamp);
> -                             pkts[pos + 3]->timestamp =
> -                                     mlx5_txpp_convert_rx_ts(sh, ts);
> +                             mlx5_timestamp_set(pkts[pos + 3], offset,
> +                                     mlx5_txpp_convert_rx_ts(sh, ts));
>                       } else {
> -                             pkts[pos]->timestamp = rte_be_to_cpu_64
> -                                             (cq[pos].timestamp);
> -                             pkts[pos + 1]->timestamp = rte_be_to_cpu_64
> -                                             (cq[pos + p1].timestamp);
> -                             pkts[pos + 2]->timestamp = rte_be_to_cpu_64
> -                                             (cq[pos + p2].timestamp);
> -                             pkts[pos + 3]->timestamp = rte_be_to_cpu_64
> -                                             (cq[pos + p3].timestamp);
> +                             mlx5_timestamp_set(pkts[pos], offset,
> +
>       rte_be_to_cpu_64(cq[pos].timestamp));
> +                             mlx5_timestamp_set(pkts[pos + 1], offset,
> +                                     rte_be_to_cpu_64(cq[pos +
> p1].timestamp));
> +                             mlx5_timestamp_set(pkts[pos + 2], offset,
> +                                     rte_be_to_cpu_64(cq[pos +
> p2].timestamp));
> +                             mlx5_timestamp_set(pkts[pos + 3], offset,
> +                                     rte_be_to_cpu_64(cq[pos +
> p3].timestamp));
>                       }
>               }
>               if (rxq->dynf_meta) {
> diff --git a/drivers/net/mlx5/mlx5_rxtx_vec_neon.h
> b/drivers/net/mlx5/mlx5_rxtx_vec_neon.h
> index d122dad4fe..436b247ade 100644
> --- a/drivers/net/mlx5/mlx5_rxtx_vec_neon.h
> +++ b/drivers/net/mlx5/mlx5_rxtx_vec_neon.h
> @@ -271,7 +271,7 @@ rxq_cq_to_ptype_oflags_v(struct mlx5_rxq_data *rxq,
>       uint32x4_t pinfo, cv_flags;
>       uint32x4_t ol_flags =
>               vdupq_n_u32(rxq->rss_hash * PKT_RX_RSS_HASH |
> -                         rxq->hw_timestamp * PKT_RX_TIMESTAMP);
> +                         rxq->hw_timestamp * rxq->timestamp_rx_flag);
>       const uint32x4_t ptype_ol_mask = { 0x106, 0x106, 0x106, 0x106 };
>       const uint8x16_t cv_flag_sel = {
>               0,
> @@ -697,6 +697,7 @@ rxq_burst_v(struct mlx5_rxq_data *rxq, struct
> rte_mbuf **pkts, uint16_t pkts_n,
>               rxq_cq_to_ptype_oflags_v(rxq, ptype_info, flow_tag,
>                                        opcode, &elts[pos]);
>               if (rxq->hw_timestamp) {
> +                     int offset = rxq->timestamp_offset;
>                       if (rxq->rt_timestamp) {
>                               struct mlx5_dev_ctx_shared *sh = rxq->sh;
>                               uint64_t ts;
> @@ -704,36 +705,36 @@ rxq_burst_v(struct mlx5_rxq_data *rxq, struct
> rte_mbuf **pkts, uint16_t pkts_n,
>                               ts = rte_be_to_cpu_64
>                                       (container_of(p0, struct mlx5_cqe,
>                                                     pkt_info)->timestamp);
> -                             elts[pos]->timestamp =
> -                                     mlx5_txpp_convert_rx_ts(sh, ts);
> +                             mlx5_timestamp_set(elts[pos], offset,
> +                                     mlx5_txpp_convert_rx_ts(sh, ts));
>                               ts = rte_be_to_cpu_64
>                                       (container_of(p1, struct mlx5_cqe,
>                                                     pkt_info)->timestamp);
> -                             elts[pos + 1]->timestamp =
> -                                     mlx5_txpp_convert_rx_ts(sh, ts);
> +                             mlx5_timestamp_set(elts[pos + 1], offset,
> +                                     mlx5_txpp_convert_rx_ts(sh, ts));
>                               ts = rte_be_to_cpu_64
>                                       (container_of(p2, struct mlx5_cqe,
>                                                     pkt_info)->timestamp);
> -                             elts[pos + 2]->timestamp =
> -                                     mlx5_txpp_convert_rx_ts(sh, ts);
> +                             mlx5_timestamp_set(elts[pos + 2], offset,
> +                                     mlx5_txpp_convert_rx_ts(sh, ts));
>                               ts = rte_be_to_cpu_64
>                                       (container_of(p3, struct mlx5_cqe,
>                                                     pkt_info)->timestamp);
> -                             elts[pos + 3]->timestamp =
> -                                     mlx5_txpp_convert_rx_ts(sh, ts);
> +                             mlx5_timestamp_set(elts[pos + 3], offset,
> +                                     mlx5_txpp_convert_rx_ts(sh, ts));
>                       } else {
> -                             elts[pos]->timestamp = rte_be_to_cpu_64
> -                                     (container_of(p0, struct mlx5_cqe,
> -                                                   pkt_info)->timestamp);
> -                             elts[pos + 1]->timestamp = rte_be_to_cpu_64
> -                                     (container_of(p1, struct mlx5_cqe,
> -                                                   pkt_info)->timestamp);
> -                             elts[pos + 2]->timestamp = rte_be_to_cpu_64
> -                                     (container_of(p2, struct mlx5_cqe,
> -                                                   pkt_info)->timestamp);
> -                             elts[pos + 3]->timestamp = rte_be_to_cpu_64
> -                                     (container_of(p3, struct mlx5_cqe,
> -                                                   pkt_info)->timestamp);
> +                             mlx5_timestamp_set(elts[pos], offset,
> +                                     rte_be_to_cpu_64(container_of(p0,
> +                                     struct mlx5_cqe, pkt_info)-
> >timestamp));
> +                             mlx5_timestamp_set(elts[pos + 1], offset,
> +                                     rte_be_to_cpu_64(container_of(p1,
> +                                     struct mlx5_cqe, pkt_info)-
> >timestamp));
> +                             mlx5_timestamp_set(elts[pos + 2], offset,
> +                                     rte_be_to_cpu_64(container_of(p2,
> +                                     struct mlx5_cqe, pkt_info)-
> >timestamp));
> +                             mlx5_timestamp_set(elts[pos + 3], offset,
> +                                     rte_be_to_cpu_64(container_of(p3,
> +                                     struct mlx5_cqe, pkt_info)-
> >timestamp));
>                       }
>               }
>               if (rxq->dynf_meta) {
> diff --git a/drivers/net/mlx5/mlx5_rxtx_vec_sse.h
> b/drivers/net/mlx5/mlx5_rxtx_vec_sse.h
> index 0bbcbeefff..ae4439efc7 100644
> --- a/drivers/net/mlx5/mlx5_rxtx_vec_sse.h
> +++ b/drivers/net/mlx5/mlx5_rxtx_vec_sse.h
> @@ -251,7 +251,7 @@ rxq_cq_to_ptype_oflags_v(struct mlx5_rxq_data *rxq,
> __m128i cqes[4],
>       __m128i pinfo0, pinfo1;
>       __m128i pinfo, ptype;
>       __m128i ol_flags = _mm_set1_epi32(rxq->rss_hash *
> PKT_RX_RSS_HASH |
> -                                       rxq->hw_timestamp *
> PKT_RX_TIMESTAMP);
> +                                       rxq->hw_timestamp * rxq-
> >timestamp_rx_flag);
>       __m128i cv_flags;
>       const __m128i zero = _mm_setzero_si128();
>       const __m128i ptype_mask =
> @@ -656,31 +656,32 @@ rxq_burst_v(struct mlx5_rxq_data *rxq, struct
> rte_mbuf **pkts, uint16_t pkts_n,
>               /* D.5 fill in mbuf - rearm_data and packet_type. */
>               rxq_cq_to_ptype_oflags_v(rxq, cqes, opcode, &pkts[pos]);
>               if (rxq->hw_timestamp) {
> +                     int offset = rxq->timestamp_offset;
>                       if (rxq->rt_timestamp) {
>                               struct mlx5_dev_ctx_shared *sh = rxq->sh;
>                               uint64_t ts;
> 
>                               ts = rte_be_to_cpu_64(cq[pos].timestamp);
> -                             pkts[pos]->timestamp =
> -                                     mlx5_txpp_convert_rx_ts(sh, ts);
> +                             mlx5_timestamp_set(pkts[pos], offset,
> +                                     mlx5_txpp_convert_rx_ts(sh, ts));
>                               ts = rte_be_to_cpu_64(cq[pos +
> p1].timestamp);
> -                             pkts[pos + 1]->timestamp =
> -                                     mlx5_txpp_convert_rx_ts(sh, ts);
> +                             mlx5_timestamp_set(pkts[pos + 1], offset,
> +                                     mlx5_txpp_convert_rx_ts(sh, ts));
>                               ts = rte_be_to_cpu_64(cq[pos +
> p2].timestamp);
> -                             pkts[pos + 2]->timestamp =
> -                                     mlx5_txpp_convert_rx_ts(sh, ts);
> +                             mlx5_timestamp_set(pkts[pos + 2], offset,
> +                                     mlx5_txpp_convert_rx_ts(sh, ts));
>                               ts = rte_be_to_cpu_64(cq[pos +
> p3].timestamp);
> -                             pkts[pos + 3]->timestamp =
> -                                     mlx5_txpp_convert_rx_ts(sh, ts);
> +                             mlx5_timestamp_set(pkts[pos + 3], offset,
> +                                     mlx5_txpp_convert_rx_ts(sh, ts));
>                       } else {
> -                             pkts[pos]->timestamp = rte_be_to_cpu_64
> -                                             (cq[pos].timestamp);
> -                             pkts[pos + 1]->timestamp = rte_be_to_cpu_64
> -                                             (cq[pos + p1].timestamp);
> -                             pkts[pos + 2]->timestamp = rte_be_to_cpu_64
> -                                             (cq[pos + p2].timestamp);
> -                             pkts[pos + 3]->timestamp = rte_be_to_cpu_64
> -                                             (cq[pos + p3].timestamp);
> +                             mlx5_timestamp_set(pkts[pos], offset,
> +
>       rte_be_to_cpu_64(cq[pos].timestamp));
> +                             mlx5_timestamp_set(pkts[pos + 1], offset,
> +                                     rte_be_to_cpu_64(cq[pos +
> p1].timestamp));
> +                             mlx5_timestamp_set(pkts[pos + 2], offset,
> +                                     rte_be_to_cpu_64(cq[pos +
> p2].timestamp));
> +                             mlx5_timestamp_set(pkts[pos + 3], offset,
> +                                     rte_be_to_cpu_64(cq[pos +
> p3].timestamp));
>                       }
>               }
>               if (rxq->dynf_meta) {
> --
> 2.28.0

Reply via email to