net/mlx5: switch Rx timestamp to dynamic mbuf field
authorThomas Monjalon <thomas@monjalon.net>
Thu, 29 Oct 2020 03:53:38 +0000 (04:53 +0100)
committerThomas Monjalon <thomas@monjalon.net>
Tue, 3 Nov 2020 15:21:15 +0000 (16:21 +0100)
The mbuf timestamp is moved to a dynamic field
in order to allow removal of the deprecated static field.
The related mbuf flag is also replaced.

The dynamic offset and flag are stored in struct mlx5_rxq_data
to favor cache locality.

Signed-off-by: Thomas Monjalon <thomas@monjalon.net>
Reviewed-by: Ruifeng Wang <ruifeng.wang@arm.com>
Reviewed-by: David Christensen <drc@linux.vnet.ibm.com>
Acked-by: Viacheslav Ovsiienko <viacheslavo@nvidia.com>
Acked-by: David Marchand <david.marchand@redhat.com>
Acked-by: Olivier Matz <olivier.matz@6wind.com>
drivers/net/mlx5/mlx5_rxq.c
drivers/net/mlx5/mlx5_rxtx.c
drivers/net/mlx5/mlx5_rxtx.h
drivers/net/mlx5/mlx5_rxtx_vec_altivec.h
drivers/net/mlx5/mlx5_rxtx_vec_neon.h
drivers/net/mlx5/mlx5_rxtx_vec_sse.h

index f1d8373..5251991 100644 (file)
@@ -1492,7 +1492,15 @@ mlx5_rxq_new(struct rte_eth_dev *dev, uint16_t idx, uint16_t desc,
        mlx5_max_lro_msg_size_adjust(dev, idx, max_lro_size);
        /* Toggle RX checksum offload if hardware supports it. */
        tmpl->rxq.csum = !!(offloads & DEV_RX_OFFLOAD_CHECKSUM);
+       /* Configure Rx timestamp. */
        tmpl->rxq.hw_timestamp = !!(offloads & DEV_RX_OFFLOAD_TIMESTAMP);
+       tmpl->rxq.timestamp_rx_flag = 0;
+       if (tmpl->rxq.hw_timestamp && rte_mbuf_dyn_rx_timestamp_register(
+                       &tmpl->rxq.timestamp_offset,
+                       &tmpl->rxq.timestamp_rx_flag) != 0) {
+               DRV_LOG(ERR, "Cannot register Rx timestamp field/flag");
+               goto error;
+       }
        /* Configure VLAN stripping. */
        tmpl->rxq.vlan_strip = !!(offloads & DEV_RX_OFFLOAD_VLAN_STRIP);
        /* By default, FCS (CRC) is stripped by hardware. */
index e86468b..b577aab 100644 (file)
@@ -1287,8 +1287,8 @@ rxq_cq_to_mbuf(struct mlx5_rxq_data *rxq, struct rte_mbuf *pkt,
 
                if (rxq->rt_timestamp)
                        ts = mlx5_txpp_convert_rx_ts(rxq->sh, ts);
-               pkt->timestamp = ts;
-               pkt->ol_flags |= PKT_RX_TIMESTAMP;
+               mlx5_timestamp_set(pkt, rxq->timestamp_offset, ts);
+               pkt->ol_flags |= rxq->timestamp_rx_flag;
        }
 }
 
index 674296e..e9eca36 100644 (file)
@@ -151,6 +151,8 @@ struct mlx5_rxq_data {
        /* CQ (UAR) access lock required for 32bit implementations */
 #endif
        uint32_t tunnel; /* Tunnel information. */
+       int timestamp_offset; /* Dynamic mbuf field for timestamp. */
+       uint64_t timestamp_rx_flag; /* Dynamic mbuf flag for timestamp. */
        uint64_t flow_meta_mask;
        int32_t flow_meta_offset;
 } __rte_cache_aligned;
@@ -681,4 +683,21 @@ mlx5_txpp_convert_tx_ts(struct mlx5_dev_ctx_shared *sh, uint64_t mts)
        return ci;
 }
 
+/**
+ * Set timestamp in mbuf dynamic field.
+ *
+ * @param mbuf
+ *   Structure to write into.
+ * @param offset
+ *   Dynamic field offset in mbuf structure.
+ * @param timestamp
+ *   Value to write.
+ */
+static __rte_always_inline void
+mlx5_timestamp_set(struct rte_mbuf *mbuf, int offset,
+               rte_mbuf_timestamp_t timestamp)
+{
+       *RTE_MBUF_DYNFIELD(mbuf, offset, rte_mbuf_timestamp_t *) = timestamp;
+}
+
 #endif /* RTE_PMD_MLX5_RXTX_H_ */
index 6bf0c9b..171d7bb 100644 (file)
@@ -330,13 +330,13 @@ rxq_cq_to_ptype_oflags_v(struct mlx5_rxq_data *rxq,
        vector unsigned char ol_flags = (vector unsigned char)
                (vector unsigned int){
                        rxq->rss_hash * PKT_RX_RSS_HASH |
-                               rxq->hw_timestamp * PKT_RX_TIMESTAMP,
+                               rxq->hw_timestamp * rxq->timestamp_rx_flag,
                        rxq->rss_hash * PKT_RX_RSS_HASH |
-                               rxq->hw_timestamp * PKT_RX_TIMESTAMP,
+                               rxq->hw_timestamp * rxq->timestamp_rx_flag,
                        rxq->rss_hash * PKT_RX_RSS_HASH |
-                               rxq->hw_timestamp * PKT_RX_TIMESTAMP,
+                               rxq->hw_timestamp * rxq->timestamp_rx_flag,
                        rxq->rss_hash * PKT_RX_RSS_HASH |
-                               rxq->hw_timestamp * PKT_RX_TIMESTAMP};
+                               rxq->hw_timestamp * rxq->timestamp_rx_flag};
        vector unsigned char cv_flags;
        const vector unsigned char zero = (vector unsigned char){0};
        const vector unsigned char ptype_mask =
@@ -1025,31 +1025,32 @@ rxq_burst_v(struct mlx5_rxq_data *rxq, struct rte_mbuf **pkts, uint16_t pkts_n,
                /* D.5 fill in mbuf - rearm_data and packet_type. */
                rxq_cq_to_ptype_oflags_v(rxq, cqes, opcode, &pkts[pos]);
                if (rxq->hw_timestamp) {
+                       int offset = rxq->timestamp_offset;
                        if (rxq->rt_timestamp) {
                                struct mlx5_dev_ctx_shared *sh = rxq->sh;
                                uint64_t ts;
 
                                ts = rte_be_to_cpu_64(cq[pos].timestamp);
-                               pkts[pos]->timestamp =
-                                       mlx5_txpp_convert_rx_ts(sh, ts);
+                               mlx5_timestamp_set(pkts[pos], offset,
+                                       mlx5_txpp_convert_rx_ts(sh, ts));
                                ts = rte_be_to_cpu_64(cq[pos + p1].timestamp);
-                               pkts[pos + 1]->timestamp =
-                                       mlx5_txpp_convert_rx_ts(sh, ts);
+                               mlx5_timestamp_set(pkts[pos + 1], offset,
+                                       mlx5_txpp_convert_rx_ts(sh, ts));
                                ts = rte_be_to_cpu_64(cq[pos + p2].timestamp);
-                               pkts[pos + 2]->timestamp =
-                                       mlx5_txpp_convert_rx_ts(sh, ts);
+                               mlx5_timestamp_set(pkts[pos + 2], offset,
+                                       mlx5_txpp_convert_rx_ts(sh, ts));
                                ts = rte_be_to_cpu_64(cq[pos + p3].timestamp);
-                               pkts[pos + 3]->timestamp =
-                                       mlx5_txpp_convert_rx_ts(sh, ts);
+                               mlx5_timestamp_set(pkts[pos + 3], offset,
+                                       mlx5_txpp_convert_rx_ts(sh, ts));
                        } else {
-                               pkts[pos]->timestamp = rte_be_to_cpu_64
-                                               (cq[pos].timestamp);
-                               pkts[pos + 1]->timestamp = rte_be_to_cpu_64
-                                               (cq[pos + p1].timestamp);
-                               pkts[pos + 2]->timestamp = rte_be_to_cpu_64
-                                               (cq[pos + p2].timestamp);
-                               pkts[pos + 3]->timestamp = rte_be_to_cpu_64
-                                               (cq[pos + p3].timestamp);
+                               mlx5_timestamp_set(pkts[pos], offset,
+                                       rte_be_to_cpu_64(cq[pos].timestamp));
+                               mlx5_timestamp_set(pkts[pos + 1], offset,
+                                       rte_be_to_cpu_64(cq[pos + p1].timestamp));
+                               mlx5_timestamp_set(pkts[pos + 2], offset,
+                                       rte_be_to_cpu_64(cq[pos + p2].timestamp));
+                               mlx5_timestamp_set(pkts[pos + 3], offset,
+                                       rte_be_to_cpu_64(cq[pos + p3].timestamp));
                        }
                }
                if (rxq->dynf_meta) {
index d122dad..436b247 100644 (file)
@@ -271,7 +271,7 @@ rxq_cq_to_ptype_oflags_v(struct mlx5_rxq_data *rxq,
        uint32x4_t pinfo, cv_flags;
        uint32x4_t ol_flags =
                vdupq_n_u32(rxq->rss_hash * PKT_RX_RSS_HASH |
-                           rxq->hw_timestamp * PKT_RX_TIMESTAMP);
+                           rxq->hw_timestamp * rxq->timestamp_rx_flag);
        const uint32x4_t ptype_ol_mask = { 0x106, 0x106, 0x106, 0x106 };
        const uint8x16_t cv_flag_sel = {
                0,
@@ -697,6 +697,7 @@ rxq_burst_v(struct mlx5_rxq_data *rxq, struct rte_mbuf **pkts, uint16_t pkts_n,
                rxq_cq_to_ptype_oflags_v(rxq, ptype_info, flow_tag,
                                         opcode, &elts[pos]);
                if (rxq->hw_timestamp) {
+                       int offset = rxq->timestamp_offset;
                        if (rxq->rt_timestamp) {
                                struct mlx5_dev_ctx_shared *sh = rxq->sh;
                                uint64_t ts;
@@ -704,36 +705,36 @@ rxq_burst_v(struct mlx5_rxq_data *rxq, struct rte_mbuf **pkts, uint16_t pkts_n,
                                ts = rte_be_to_cpu_64
                                        (container_of(p0, struct mlx5_cqe,
                                                      pkt_info)->timestamp);
-                               elts[pos]->timestamp =
-                                       mlx5_txpp_convert_rx_ts(sh, ts);
+                               mlx5_timestamp_set(elts[pos], offset,
+                                       mlx5_txpp_convert_rx_ts(sh, ts));
                                ts = rte_be_to_cpu_64
                                        (container_of(p1, struct mlx5_cqe,
                                                      pkt_info)->timestamp);
-                               elts[pos + 1]->timestamp =
-                                       mlx5_txpp_convert_rx_ts(sh, ts);
+                               mlx5_timestamp_set(elts[pos + 1], offset,
+                                       mlx5_txpp_convert_rx_ts(sh, ts));
                                ts = rte_be_to_cpu_64
                                        (container_of(p2, struct mlx5_cqe,
                                                      pkt_info)->timestamp);
-                               elts[pos + 2]->timestamp =
-                                       mlx5_txpp_convert_rx_ts(sh, ts);
+                               mlx5_timestamp_set(elts[pos + 2], offset,
+                                       mlx5_txpp_convert_rx_ts(sh, ts));
                                ts = rte_be_to_cpu_64
                                        (container_of(p3, struct mlx5_cqe,
                                                      pkt_info)->timestamp);
-                               elts[pos + 3]->timestamp =
-                                       mlx5_txpp_convert_rx_ts(sh, ts);
+                               mlx5_timestamp_set(elts[pos + 3], offset,
+                                       mlx5_txpp_convert_rx_ts(sh, ts));
                        } else {
-                               elts[pos]->timestamp = rte_be_to_cpu_64
-                                       (container_of(p0, struct mlx5_cqe,
-                                                     pkt_info)->timestamp);
-                               elts[pos + 1]->timestamp = rte_be_to_cpu_64
-                                       (container_of(p1, struct mlx5_cqe,
-                                                     pkt_info)->timestamp);
-                               elts[pos + 2]->timestamp = rte_be_to_cpu_64
-                                       (container_of(p2, struct mlx5_cqe,
-                                                     pkt_info)->timestamp);
-                               elts[pos + 3]->timestamp = rte_be_to_cpu_64
-                                       (container_of(p3, struct mlx5_cqe,
-                                                     pkt_info)->timestamp);
+                               mlx5_timestamp_set(elts[pos], offset,
+                                       rte_be_to_cpu_64(container_of(p0,
+                                       struct mlx5_cqe, pkt_info)->timestamp));
+                               mlx5_timestamp_set(elts[pos + 1], offset,
+                                       rte_be_to_cpu_64(container_of(p1,
+                                       struct mlx5_cqe, pkt_info)->timestamp));
+                               mlx5_timestamp_set(elts[pos + 2], offset,
+                                       rte_be_to_cpu_64(container_of(p2,
+                                       struct mlx5_cqe, pkt_info)->timestamp));
+                               mlx5_timestamp_set(elts[pos + 3], offset,
+                                       rte_be_to_cpu_64(container_of(p3,
+                                       struct mlx5_cqe, pkt_info)->timestamp));
                        }
                }
                if (rxq->dynf_meta) {
index 0bbcbee..ae4439e 100644 (file)
@@ -251,7 +251,7 @@ rxq_cq_to_ptype_oflags_v(struct mlx5_rxq_data *rxq, __m128i cqes[4],
        __m128i pinfo0, pinfo1;
        __m128i pinfo, ptype;
        __m128i ol_flags = _mm_set1_epi32(rxq->rss_hash * PKT_RX_RSS_HASH |
-                                         rxq->hw_timestamp * PKT_RX_TIMESTAMP);
+                                         rxq->hw_timestamp * rxq->timestamp_rx_flag);
        __m128i cv_flags;
        const __m128i zero = _mm_setzero_si128();
        const __m128i ptype_mask =
@@ -656,31 +656,32 @@ rxq_burst_v(struct mlx5_rxq_data *rxq, struct rte_mbuf **pkts, uint16_t pkts_n,
                /* D.5 fill in mbuf - rearm_data and packet_type. */
                rxq_cq_to_ptype_oflags_v(rxq, cqes, opcode, &pkts[pos]);
                if (rxq->hw_timestamp) {
+                       int offset = rxq->timestamp_offset;
                        if (rxq->rt_timestamp) {
                                struct mlx5_dev_ctx_shared *sh = rxq->sh;
                                uint64_t ts;
 
                                ts = rte_be_to_cpu_64(cq[pos].timestamp);
-                               pkts[pos]->timestamp =
-                                       mlx5_txpp_convert_rx_ts(sh, ts);
+                               mlx5_timestamp_set(pkts[pos], offset,
+                                       mlx5_txpp_convert_rx_ts(sh, ts));
                                ts = rte_be_to_cpu_64(cq[pos + p1].timestamp);
-                               pkts[pos + 1]->timestamp =
-                                       mlx5_txpp_convert_rx_ts(sh, ts);
+                               mlx5_timestamp_set(pkts[pos + 1], offset,
+                                       mlx5_txpp_convert_rx_ts(sh, ts));
                                ts = rte_be_to_cpu_64(cq[pos + p2].timestamp);
-                               pkts[pos + 2]->timestamp =
-                                       mlx5_txpp_convert_rx_ts(sh, ts);
+                               mlx5_timestamp_set(pkts[pos + 2], offset,
+                                       mlx5_txpp_convert_rx_ts(sh, ts));
                                ts = rte_be_to_cpu_64(cq[pos + p3].timestamp);
-                               pkts[pos + 3]->timestamp =
-                                       mlx5_txpp_convert_rx_ts(sh, ts);
+                               mlx5_timestamp_set(pkts[pos + 3], offset,
+                                       mlx5_txpp_convert_rx_ts(sh, ts));
                        } else {
-                               pkts[pos]->timestamp = rte_be_to_cpu_64
-                                               (cq[pos].timestamp);
-                               pkts[pos + 1]->timestamp = rte_be_to_cpu_64
-                                               (cq[pos + p1].timestamp);
-                               pkts[pos + 2]->timestamp = rte_be_to_cpu_64
-                                               (cq[pos + p2].timestamp);
-                               pkts[pos + 3]->timestamp = rte_be_to_cpu_64
-                                               (cq[pos + p3].timestamp);
+                               mlx5_timestamp_set(pkts[pos], offset,
+                                       rte_be_to_cpu_64(cq[pos].timestamp));
+                               mlx5_timestamp_set(pkts[pos + 1], offset,
+                                       rte_be_to_cpu_64(cq[pos + p1].timestamp));
+                               mlx5_timestamp_set(pkts[pos + 2], offset,
+                                       rte_be_to_cpu_64(cq[pos + p2].timestamp));
+                               mlx5_timestamp_set(pkts[pos + 3], offset,
+                                       rte_be_to_cpu_64(cq[pos + p3].timestamp));
                        }
                }
                if (rxq->dynf_meta) {