/* SPDX-License-Identifier: BSD-3-Clause
 * Copyright 2018-2019 Cisco Systems, Inc. All rights reserved.
 */
#include <stdlib.h>
#include <fcntl.h>
#include <unistd.h>
#include <sys/types.h>
#include <sys/socket.h>
#include <sys/un.h>
#include <sys/ioctl.h>
#include <sys/mman.h>
#include <linux/if_ether.h>
#include <errno.h>
#include <sys/eventfd.h>
#include <rte_version.h>
#include <rte_mbuf.h>
#include <rte_ether.h>
#include <rte_ethdev_driver.h>
#include <rte_ethdev_vdev.h>
#include <rte_malloc.h>
#include <rte_kvargs.h>
#include <rte_bus_vdev.h>
#include <rte_string_fns.h>
#include <rte_errno.h>
#include <rte_memory.h>
#include <rte_memzone.h>
#include <rte_eal_memconfig.h>
#include "rte_eth_memif.h"
#include "memif_socket.h"
#define ETH_MEMIF_ID_ARG                "id"
#define ETH_MEMIF_ROLE_ARG              "role"
#define ETH_MEMIF_PKT_BUFFER_SIZE_ARG   "bsize"
#define ETH_MEMIF_RING_SIZE_ARG         "rsize"
#define ETH_MEMIF_SOCKET_ARG            "socket"
#define ETH_MEMIF_MAC_ARG               "mac"
#define ETH_MEMIF_ZC_ARG                "zero-copy"
#define ETH_MEMIF_SECRET_ARG            "secret"
static const char * const valid_arguments[] = {
        ETH_MEMIF_ID_ARG,
        ETH_MEMIF_ROLE_ARG,
        ETH_MEMIF_PKT_BUFFER_SIZE_ARG,
        ETH_MEMIF_RING_SIZE_ARG,
        ETH_MEMIF_SOCKET_ARG,
        ETH_MEMIF_MAC_ARG,
        ETH_MEMIF_ZC_ARG,
        ETH_MEMIF_SECRET_ARG,
        NULL
};
static const struct rte_eth_link pmd_link = {
        .link_speed = ETH_SPEED_NUM_10G,
        .link_duplex = ETH_LINK_FULL_DUPLEX,
        .link_status = ETH_LINK_DOWN,
        .link_autoneg = ETH_LINK_AUTONEG
};
#define MEMIF_MP_SEND_REGION            "memif_mp_send_region"

static int memif_region_init_zc(const struct rte_memseg_list *msl,
                                const struct rte_memseg *ms, void *arg);
const char *
memif_version(void)
{
        return ("memif-" RTE_STR(MEMIF_VERSION_MAJOR) "." RTE_STR(MEMIF_VERSION_MINOR));
}
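/*
 * Multi-process region sharing: the primary process registers an
 * MEMIF_MP_SEND_REGION action (see rte_pmd_memif_probe()) and answers each
 * request in memif_mp_send_region() by replying with the region size and its
 * file descriptor, so a secondary process can mmap the same shared memory.
 */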
/* Message header to synchronize regions */
struct mp_region_msg {
        char port_name[RTE_DEV_NAME_MAX_LEN];
        memif_region_index_t idx;
        memif_region_size_t size;
};
static int
memif_mp_send_region(const struct rte_mp_msg *msg, const void *peer)
{
        struct rte_eth_dev *dev;
        struct pmd_process_private *proc_private;
        const struct mp_region_msg *msg_param = (const struct mp_region_msg *)msg->param;
        struct rte_mp_msg reply;
        struct mp_region_msg *reply_param = (struct mp_region_msg *)reply.param;
        uint16_t port_id;
        int ret;

        /* Get requested port */
        ret = rte_eth_dev_get_port_by_name(msg_param->port_name, &port_id);
        if (ret) {
                MIF_LOG(ERR, "Failed to get port id for %s",
                        msg_param->port_name);
                return -1;
        }
        dev = &rte_eth_devices[port_id];
        proc_private = dev->process_private;

        memset(&reply, 0, sizeof(reply));
        strlcpy(reply.name, msg->name, sizeof(reply.name));
        reply_param->idx = msg_param->idx;
        if (proc_private->regions[msg_param->idx] != NULL) {
                reply_param->size = proc_private->regions[msg_param->idx]->region_size;
                reply.fds[0] = proc_private->regions[msg_param->idx]->fd;
                reply.num_fds = 1;
        }
        reply.len_param = sizeof(*reply_param);
        if (rte_mp_reply(&reply, peer) < 0) {
                MIF_LOG(ERR, "Failed to reply to an add region request");
                return -1;
        }

        return 0;
}
/*
 * Request regions
 * Called by the secondary process when the port's link status goes up.
 */
static int
memif_mp_request_regions(struct rte_eth_dev *dev)
{
        int ret, i;
        struct timespec timeout = {.tv_sec = 5, .tv_nsec = 0};
        struct rte_mp_msg msg, *reply;
        struct rte_mp_reply replies;
        struct mp_region_msg *msg_param = (struct mp_region_msg *)msg.param;
        struct mp_region_msg *reply_param;
        struct memif_region *r;
        struct pmd_process_private *proc_private = dev->process_private;
        struct pmd_internals *pmd = dev->data->dev_private;
        /* in case of zero-copy slave, only request region 0 */
        uint16_t max_region_num = (pmd->flags & ETH_MEMIF_FLAG_ZERO_COPY) ?
                                   1 : ETH_MEMIF_MAX_REGION_NUM;

        MIF_LOG(DEBUG, "Requesting memory regions");

        for (i = 0; i < max_region_num; i++) {
                /* Prepare the message */
                memset(&msg, 0, sizeof(msg));
                strlcpy(msg.name, MEMIF_MP_SEND_REGION, sizeof(msg.name));
                strlcpy(msg_param->port_name, dev->data->name,
                        sizeof(msg_param->port_name));
                msg_param->idx = i;
                msg.len_param = sizeof(*msg_param);

                /* Send message */
                ret = rte_mp_request_sync(&msg, &replies, &timeout);
                if (ret < 0 || replies.nb_received != 1) {
                        MIF_LOG(ERR, "Failed to send mp msg: %d",
                                rte_errno);
                        return -1;
                }

                reply = &replies.msgs[0];
                reply_param = (struct mp_region_msg *)reply->param;

                if (reply_param->size > 0) {
                        r = rte_zmalloc("region", sizeof(struct memif_region), 0);
                        if (r == NULL) {
                                MIF_LOG(ERR, "Failed to alloc memif region.");
                                free(reply);
                                return -ENOMEM;
                        }
                        r->region_size = reply_param->size;
                        if (reply->num_fds < 1) {
                                MIF_LOG(ERR, "Missing file descriptor.");
                                free(reply);
                                return -1;
                        }
                        r->fd = reply->fds[0];
                        r->addr = NULL;

                        proc_private->regions[reply_param->idx] = r;
                        proc_private->regions_num++;
                }
                free(reply);
        }

        if (pmd->flags & ETH_MEMIF_FLAG_ZERO_COPY) {
                ret = rte_memseg_walk(memif_region_init_zc, (void *)proc_private);
                if (ret < 0)
                        return ret;
        }

        return memif_connect(dev);
}
static int
memif_dev_info(struct rte_eth_dev *dev __rte_unused, struct rte_eth_dev_info *dev_info)
{
        dev_info->max_mac_addrs = 1;
        dev_info->max_rx_pktlen = (uint32_t)ETH_FRAME_LEN;
        dev_info->max_rx_queues = ETH_MEMIF_MAX_NUM_Q_PAIRS;
        dev_info->max_tx_queues = ETH_MEMIF_MAX_NUM_Q_PAIRS;
        dev_info->min_rx_bufsize = 0;

        return 0;
}
static memif_ring_t *
memif_get_ring(struct pmd_internals *pmd, struct pmd_process_private *proc_private,
               memif_ring_type_t type, uint16_t ring_num)
{
        /* rings only in region 0 */
        void *p = proc_private->regions[0]->addr;
        int ring_size = sizeof(memif_ring_t) + sizeof(memif_desc_t) *
            (1 << pmd->run.log2_ring_size);

        p = (uint8_t *)p + (ring_num + type * pmd->run.num_s2m_rings) * ring_size;

        return (memif_ring_t *)p;
}
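/*
 * Illustrative region 0 layout (assuming log2_ring_size = 10 and one ring
 * pair): each ring takes sizeof(memif_ring_t) + 1024 * sizeof(memif_desc_t)
 * bytes; S2M rings come first, M2S rings follow, and in non-zero-copy mode
 * the packet buffers start at pkt_buffer_offset right after the rings.
 */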
static memif_region_offset_t
memif_get_ring_offset(struct rte_eth_dev *dev, struct memif_queue *mq,
                      memif_ring_type_t type, uint16_t num)
{
        struct pmd_internals *pmd = dev->data->dev_private;
        struct pmd_process_private *proc_private = dev->process_private;

        return ((uint8_t *)memif_get_ring(pmd, proc_private, type, num) -
                (uint8_t *)proc_private->regions[mq->region]->addr);
}
static memif_ring_t *
memif_get_ring_from_queue(struct pmd_process_private *proc_private,
                          struct memif_queue *mq)
{
        struct memif_region *r;

        r = proc_private->regions[mq->region];
        if (r == NULL)
                return NULL;

        return (memif_ring_t *)((uint8_t *)r->addr + mq->ring_offset);
}
static void *
memif_get_buffer(struct pmd_process_private *proc_private, memif_desc_t *d)
{
        return ((uint8_t *)proc_private->regions[d->region]->addr + d->offset);
}
/* Free mbufs received by master */
static void
memif_free_stored_mbufs(struct pmd_process_private *proc_private, struct memif_queue *mq)
{
        uint16_t cur_tail;
        uint16_t mask = (1 << mq->log2_ring_size) - 1;
        memif_ring_t *ring = memif_get_ring_from_queue(proc_private, mq);

        /* FIXME: improve performance */
        /* The ring->tail acts as a guard variable between Tx and Rx
         * threads, so using load-acquire pairs with store-release
         * in function eth_memif_rx for S2M queues.
         */
        cur_tail = __atomic_load_n(&ring->tail, __ATOMIC_ACQUIRE);
        while (mq->last_tail != cur_tail) {
                RTE_MBUF_PREFETCH_TO_FREE(mq->buffers[(mq->last_tail + 1) & mask]);
                /* Decrement refcnt and free mbuf. (current segment) */
                rte_mbuf_refcnt_update(mq->buffers[mq->last_tail & mask], -1);
                rte_pktmbuf_free_seg(mq->buffers[mq->last_tail & mask]);
                mq->last_tail++;
        }
}
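/* Note: the refcnt decrement above pairs with the rte_mbuf_refcnt_update(mbuf, 1)
 * done in memif_tx_one_zc() when the buffer was handed over to the master.
 */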
static int
memif_pktmbuf_chain(struct rte_mbuf *head, struct rte_mbuf *cur_tail,
                    struct rte_mbuf *tail)
{
        /* Check for number-of-segments-overflow */
        if (unlikely(head->nb_segs + tail->nb_segs > RTE_MBUF_MAX_NB_SEGS))
                return -EOVERFLOW;

        /* Chain 'tail' onto the old tail */
        cur_tail->next = tail;

        /* accumulate number of segments and total length. */
        head->nb_segs = (uint16_t)(head->nb_segs + tail->nb_segs);

        tail->pkt_len = tail->data_len;
        head->pkt_len += tail->pkt_len;

        return 0;
}
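/*
 * Copy-mode receive burst. Packets are copied out of the shared-memory ring
 * into freshly allocated mbufs: a slave polls S2M rings (the consumer
 * advances ring->tail), a master polls M2S rings and refills the descriptors
 * for its peer (the consumer advances ring->head in the refill step).
 */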
static uint16_t
eth_memif_rx(void *queue, struct rte_mbuf **bufs, uint16_t nb_pkts)
{
        struct memif_queue *mq = queue;
        struct pmd_internals *pmd = rte_eth_devices[mq->in_port].data->dev_private;
        struct pmd_process_private *proc_private =
                rte_eth_devices[mq->in_port].process_private;
        memif_ring_t *ring = memif_get_ring_from_queue(proc_private, mq);
        uint16_t cur_slot, last_slot, n_slots, ring_size, mask, s0;
        uint16_t n_rx_pkts = 0;
        uint16_t mbuf_size = rte_pktmbuf_data_room_size(mq->mempool) -
                RTE_PKTMBUF_HEADROOM;
        uint16_t src_len, src_off, dst_len, dst_off, cp_len;
        memif_ring_type_t type = mq->type;
        memif_desc_t *d0;
        struct rte_mbuf *mbuf, *mbuf_head, *mbuf_tail;
        uint64_t b;
        ssize_t size __rte_unused;
        uint16_t head;
        int ret;
        struct rte_eth_link link;

        if (unlikely((pmd->flags & ETH_MEMIF_FLAG_CONNECTED) == 0))
                return 0;
        if (unlikely(ring == NULL)) {
                /* Secondary process will attempt to request regions. */
                ret = rte_eth_link_get(mq->in_port, &link);
                if (ret < 0)
                        MIF_LOG(ERR, "Failed to get port %u link info: %s",
                                mq->in_port, rte_strerror(-ret));
                return 0;
        }

        /* consume interrupt */
        if ((ring->flags & MEMIF_RING_FLAG_MASK_INT) == 0)
                size = read(mq->intr_handle.fd, &b, sizeof(b));

        ring_size = 1 << mq->log2_ring_size;
        mask = ring_size - 1;

        if (type == MEMIF_RING_S2M) {
                cur_slot = mq->last_head;
                last_slot = __atomic_load_n(&ring->head, __ATOMIC_ACQUIRE);
        } else {
                cur_slot = mq->last_tail;
                last_slot = __atomic_load_n(&ring->tail, __ATOMIC_ACQUIRE);
        }

        if (cur_slot == last_slot)
                goto refill;
        n_slots = last_slot - cur_slot;

        while (n_slots && n_rx_pkts < nb_pkts) {
                mbuf_head = rte_pktmbuf_alloc(mq->mempool);
                if (unlikely(mbuf_head == NULL))
                        goto no_free_bufs;
                mbuf = mbuf_head;
                mbuf->port = mq->in_port;

next_slot:
                s0 = cur_slot & mask;
                d0 = &ring->desc[s0];

                src_len = d0->length;
                dst_off = 0;
                src_off = 0;

                do {
                        dst_len = mbuf_size - dst_off;
                        if (dst_len == 0) {
                                dst_off = 0;
                                dst_len = mbuf_size;

                                /* store pointer to tail */
                                mbuf_tail = mbuf;
                                mbuf = rte_pktmbuf_alloc(mq->mempool);
                                if (unlikely(mbuf == NULL))
                                        goto no_free_bufs;
                                mbuf->port = mq->in_port;
                                ret = memif_pktmbuf_chain(mbuf_head, mbuf_tail, mbuf);
                                if (unlikely(ret < 0)) {
                                        MIF_LOG(ERR, "number-of-segments-overflow");
                                        rte_pktmbuf_free(mbuf);
                                        goto no_free_bufs;
                                }
                        }
                        cp_len = RTE_MIN(dst_len, src_len);

                        rte_pktmbuf_data_len(mbuf) += cp_len;
                        rte_pktmbuf_pkt_len(mbuf) = rte_pktmbuf_data_len(mbuf);
                        if (mbuf != mbuf_head)
                                rte_pktmbuf_pkt_len(mbuf_head) += cp_len;

                        memcpy(rte_pktmbuf_mtod_offset(mbuf, void *, dst_off),
                               (uint8_t *)memif_get_buffer(proc_private, d0) + src_off,
                               cp_len);

                        src_off += cp_len;
                        dst_off += cp_len;
                        src_len -= cp_len;
                } while (src_len);

                cur_slot++;
                n_slots--;

                if (d0->flags & MEMIF_DESC_FLAG_NEXT)
                        goto next_slot;

                mq->n_bytes += rte_pktmbuf_pkt_len(mbuf_head);
                *bufs++ = mbuf_head;
                n_rx_pkts++;
        }

no_free_bufs:
        if (type == MEMIF_RING_S2M) {
                __atomic_store_n(&ring->tail, cur_slot, __ATOMIC_RELEASE);
                mq->last_head = cur_slot;
        } else {
                mq->last_tail = cur_slot;
        }

refill:
        if (type == MEMIF_RING_M2S) {
                /* ring->head is updated by the receiver and this function
                 * is called in the context of receiver thread. The loads in
                 * the receiver do not need to synchronize with its own stores.
                 */
                head = __atomic_load_n(&ring->head, __ATOMIC_RELAXED);
                n_slots = ring_size - head + mq->last_tail;

                while (n_slots--) {
                        s0 = head++ & mask;
                        d0 = &ring->desc[s0];
                        d0->length = pmd->run.pkt_buffer_size;
                }
                __atomic_store_n(&ring->head, head, __ATOMIC_RELEASE);
        }

        mq->n_pkts += n_rx_pkts;
        return n_rx_pkts;
}
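/*
 * Zero-copy receive burst. Descriptors point directly into DPDK memseg
 * memory, so the mbufs stored in mq->buffers are handed to the application
 * as-is; the ring is then refilled with newly allocated mbufs whose data
 * addresses are published back to the peer through the descriptors.
 */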
static uint16_t
eth_memif_rx_zc(void *queue, struct rte_mbuf **bufs, uint16_t nb_pkts)
{
        struct memif_queue *mq = queue;
        struct pmd_internals *pmd = rte_eth_devices[mq->in_port].data->dev_private;
        struct pmd_process_private *proc_private =
                rte_eth_devices[mq->in_port].process_private;
        memif_ring_t *ring = memif_get_ring_from_queue(proc_private, mq);
        uint16_t cur_slot, last_slot, n_slots, ring_size, mask, s0, head;
        uint16_t n_rx_pkts = 0;
        memif_desc_t *d0;
        struct rte_mbuf *mbuf, *mbuf_tail;
        struct rte_mbuf *mbuf_head = NULL;
        int ret;
        struct rte_eth_link link;

        if (unlikely((pmd->flags & ETH_MEMIF_FLAG_CONNECTED) == 0))
                return 0;
        if (unlikely(ring == NULL)) {
                /* Secondary process will attempt to request regions. */
                rte_eth_link_get(mq->in_port, &link);
                return 0;
        }

        /* consume interrupt */
        if ((ring->flags & MEMIF_RING_FLAG_MASK_INT) == 0) {
                uint64_t b;
                ssize_t size __rte_unused;
                size = read(mq->intr_handle.fd, &b, sizeof(b));
        }

        ring_size = 1 << mq->log2_ring_size;
        mask = ring_size - 1;

        cur_slot = mq->last_tail;
        /* The ring->tail acts as a guard variable between Tx and Rx
         * threads, so using load-acquire pairs with store-release
         * to synchronize it between threads.
         */
        last_slot = __atomic_load_n(&ring->tail, __ATOMIC_ACQUIRE);
        if (cur_slot == last_slot)
                goto refill;
        n_slots = last_slot - cur_slot;

        while (n_slots && n_rx_pkts < nb_pkts) {
                s0 = cur_slot & mask;

                d0 = &ring->desc[s0];
                mbuf_head = mq->buffers[s0];
                mbuf = mbuf_head;

next_slot:
                /* prefetch next descriptor */
                if (n_rx_pkts + 1 < nb_pkts)
                        rte_prefetch0(&ring->desc[(cur_slot + 1) & mask]);

                mbuf->port = mq->in_port;
                rte_pktmbuf_data_len(mbuf) = d0->length;
                rte_pktmbuf_pkt_len(mbuf) = rte_pktmbuf_data_len(mbuf);

                mq->n_bytes += rte_pktmbuf_data_len(mbuf);

                cur_slot++;
                n_slots--;
                if (d0->flags & MEMIF_DESC_FLAG_NEXT) {
                        s0 = cur_slot & mask;
                        d0 = &ring->desc[s0];
                        mbuf_tail = mbuf;
                        mbuf = mq->buffers[s0];
                        ret = memif_pktmbuf_chain(mbuf_head, mbuf_tail, mbuf);
                        if (unlikely(ret < 0)) {
                                MIF_LOG(ERR, "number-of-segments-overflow");
                                goto refill;
                        }
                        goto next_slot;
                }

                *bufs++ = mbuf_head;
                n_rx_pkts++;
        }

        mq->last_tail = cur_slot;

/* Supply master with new buffers */
refill:
        /* ring->head is updated by the receiver and this function
         * is called in the context of receiver thread. The loads in
         * the receiver do not need to synchronize with its own stores.
         */
        head = __atomic_load_n(&ring->head, __ATOMIC_RELAXED);
        n_slots = ring_size - head + mq->last_tail;

        if (n_slots < 32)
                goto no_free_mbufs;

        ret = rte_pktmbuf_alloc_bulk(mq->mempool, &mq->buffers[head & mask], n_slots);
        if (unlikely(ret < 0))
                goto no_free_mbufs;

        while (n_slots--) {
                s0 = head++ & mask;
                if (n_slots > 0)
                        rte_prefetch0(mq->buffers[head & mask]);
                d0 = &ring->desc[s0];
                /* store buffer header */
                mbuf = mq->buffers[s0];
                /* populate descriptor */
                d0->length = rte_pktmbuf_data_room_size(mq->mempool) -
                                RTE_PKTMBUF_HEADROOM;
                d0->region = 1;
                d0->offset = rte_pktmbuf_mtod(mbuf, uint8_t *) -
                        (uint8_t *)proc_private->regions[d0->region]->addr;
        }
no_free_mbufs:
        /* The ring->head acts as a guard variable between Tx and Rx
         * threads, so using store-release pairs with load-acquire
         * in function eth_memif_tx.
         */
        __atomic_store_n(&ring->head, head, __ATOMIC_RELEASE);

        mq->n_pkts += n_rx_pkts;

        return n_rx_pkts;
}
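/*
 * Copy-mode transmit burst: packet data is copied into the shared-memory
 * buffers described by the ring, chaining descriptors with
 * MEMIF_DESC_FLAG_NEXT when one buffer cannot hold the whole packet.
 */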
static uint16_t
eth_memif_tx(void *queue, struct rte_mbuf **bufs, uint16_t nb_pkts)
{
        struct memif_queue *mq = queue;
        struct pmd_internals *pmd = rte_eth_devices[mq->in_port].data->dev_private;
        struct pmd_process_private *proc_private =
                rte_eth_devices[mq->in_port].process_private;
        memif_ring_t *ring = memif_get_ring_from_queue(proc_private, mq);
        uint16_t slot, saved_slot, n_free, ring_size, mask, n_tx_pkts = 0;
        uint16_t src_len, src_off, dst_len, dst_off, cp_len;
        memif_ring_type_t type = mq->type;
        memif_desc_t *d0;
        struct rte_mbuf *mbuf;
        struct rte_mbuf *mbuf_head;
        uint64_t a;
        ssize_t size;
        struct rte_eth_link link;

        if (unlikely((pmd->flags & ETH_MEMIF_FLAG_CONNECTED) == 0))
                return 0;
        if (unlikely(ring == NULL)) {
                int ret;

                /* Secondary process will attempt to request regions. */
                ret = rte_eth_link_get(mq->in_port, &link);
                if (ret < 0)
                        MIF_LOG(ERR, "Failed to get port %u link info: %s",
                                mq->in_port, rte_strerror(-ret));
                return 0;
        }

        ring_size = 1 << mq->log2_ring_size;
        mask = ring_size - 1;

        if (type == MEMIF_RING_S2M) {
                /* For S2M queues ring->head is updated by the sender and
                 * this function is called in the context of sending thread.
                 * The loads in the sender do not need to synchronize with
                 * its own stores. Hence, the following load can be a
                 * relaxed load.
                 */
                slot = __atomic_load_n(&ring->head, __ATOMIC_RELAXED);
                n_free = ring_size - slot +
                                __atomic_load_n(&ring->tail, __ATOMIC_ACQUIRE);
        } else {
                /* For M2S queues ring->tail is updated by the sender and
                 * this function is called in the context of sending thread.
                 * The loads in the sender do not need to synchronize with
                 * its own stores. Hence, the following load can be a
                 * relaxed load.
                 */
                slot = __atomic_load_n(&ring->tail, __ATOMIC_RELAXED);
                n_free = __atomic_load_n(&ring->head, __ATOMIC_ACQUIRE) - slot;
        }

        while (n_tx_pkts < nb_pkts && n_free) {
                mbuf_head = *bufs++;
                mbuf = mbuf_head;

                saved_slot = slot;
                d0 = &ring->desc[slot & mask];
                dst_off = 0;
                dst_len = (type == MEMIF_RING_S2M) ?
                        pmd->run.pkt_buffer_size : d0->length;

next_in_chain:
                src_off = 0;
                src_len = rte_pktmbuf_data_len(mbuf);

                while (src_len) {
                        if (dst_len == 0) {
                                if (n_free) {
                                        slot++;
                                        n_free--;
                                        d0->flags |= MEMIF_DESC_FLAG_NEXT;
                                        d0 = &ring->desc[slot & mask];
                                        dst_off = 0;
                                        dst_len = (type == MEMIF_RING_S2M) ?
                                                pmd->run.pkt_buffer_size : d0->length;
                                        d0->flags = 0;
                                } else {
                                        slot = saved_slot;
                                        goto no_free_slots;
                                }
                        }
                        cp_len = RTE_MIN(dst_len, src_len);

                        memcpy((uint8_t *)memif_get_buffer(proc_private, d0) + dst_off,
                               rte_pktmbuf_mtod_offset(mbuf, void *, src_off),
                               cp_len);

                        mq->n_bytes += cp_len;
                        src_off += cp_len;
                        dst_off += cp_len;
                        src_len -= cp_len;
                        dst_len -= cp_len;

                        d0->length = dst_off;
                }

                if (rte_pktmbuf_is_contiguous(mbuf) == 0) {
                        mbuf = mbuf->next;
                        goto next_in_chain;
                }

                n_tx_pkts++;
                slot++;
                n_free--;
                rte_pktmbuf_free(mbuf_head);
        }

no_free_slots:
        if (type == MEMIF_RING_S2M)
                __atomic_store_n(&ring->head, slot, __ATOMIC_RELEASE);
        else
                __atomic_store_n(&ring->tail, slot, __ATOMIC_RELEASE);

        if ((ring->flags & MEMIF_RING_FLAG_MASK_INT) == 0) {
                a = 1;
                size = write(mq->intr_handle.fd, &a, sizeof(a));
                if (unlikely(size < 0)) {
                        MIF_LOG(WARNING,
                                "Failed to send interrupt. %s", strerror(errno));
                }
        }

        mq->n_pkts += n_tx_pkts;
        return n_tx_pkts;
}
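/*
 * Enqueue a single (possibly multi-segment) mbuf onto a zero-copy S2M ring.
 * Returns the number of slots consumed, or 0 if the segment chain does not
 * fit into the free slots available.
 */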
static int
memif_tx_one_zc(struct pmd_process_private *proc_private, struct memif_queue *mq,
                memif_ring_t *ring, struct rte_mbuf *mbuf, const uint16_t mask,
                uint16_t slot, uint16_t n_free)
{
        memif_desc_t *d0;
        int used_slots = 1;

next_in_chain:
        /* store pointer to mbuf to free it later */
        mq->buffers[slot & mask] = mbuf;
        /* Increment refcnt to make sure the buffer is not freed before master
         * receives it. (current segment)
         */
        rte_mbuf_refcnt_update(mbuf, 1);
        /* populate descriptor */
        d0 = &ring->desc[slot & mask];
        d0->length = rte_pktmbuf_data_len(mbuf);
        /* FIXME: get region index */
        d0->region = 1;
        d0->offset = rte_pktmbuf_mtod(mbuf, uint8_t *) -
                (uint8_t *)proc_private->regions[d0->region]->addr;
        d0->flags = 0;

        /* check if buffer is chained */
        if (rte_pktmbuf_is_contiguous(mbuf) == 0) {
                if (n_free < 2)
                        return 0;
                /* mark buffer as chained */
                d0->flags |= MEMIF_DESC_FLAG_NEXT;
                /* advance mbuf */
                mbuf = mbuf->next;

                /* update counters */
                used_slots++;
                slot++;
                n_free--;
                goto next_in_chain;
        }

        return used_slots;
}
static uint16_t
eth_memif_tx_zc(void *queue, struct rte_mbuf **bufs, uint16_t nb_pkts)
{
        struct memif_queue *mq = queue;
        struct pmd_internals *pmd = rte_eth_devices[mq->in_port].data->dev_private;
        struct pmd_process_private *proc_private =
                rte_eth_devices[mq->in_port].process_private;
        memif_ring_t *ring = memif_get_ring_from_queue(proc_private, mq);
        uint16_t slot, n_free, ring_size, mask, n_tx_pkts = 0;
        struct rte_eth_link link;

        if (unlikely((pmd->flags & ETH_MEMIF_FLAG_CONNECTED) == 0))
                return 0;
        if (unlikely(ring == NULL)) {
                /* Secondary process will attempt to request regions. */
                rte_eth_link_get(mq->in_port, &link);
                return 0;
        }

        ring_size = 1 << mq->log2_ring_size;
        mask = ring_size - 1;

        /* free mbufs received by master */
        memif_free_stored_mbufs(proc_private, mq);

        /* ring type always MEMIF_RING_S2M */
        /* For S2M queues ring->head is updated by the sender and
         * this function is called in the context of sending thread.
         * The loads in the sender do not need to synchronize with
         * its own stores. Hence, the following load can be a
         * relaxed load.
         */
        slot = __atomic_load_n(&ring->head, __ATOMIC_RELAXED);
        n_free = ring_size - slot + mq->last_tail;

        int used_slots;

        while (n_free && (n_tx_pkts < nb_pkts)) {
                while ((n_free > 4) && ((nb_pkts - n_tx_pkts) > 4)) {
                        if ((nb_pkts - n_tx_pkts) > 8) {
                                rte_prefetch0(*bufs + 4);
                                rte_prefetch0(*bufs + 5);
                                rte_prefetch0(*bufs + 6);
                                rte_prefetch0(*bufs + 7);
                        }
                        used_slots = memif_tx_one_zc(proc_private, mq, ring, *bufs++,
                                mask, slot, n_free);
                        if (unlikely(used_slots < 1))
                                goto no_free_slots;
                        n_tx_pkts++;
                        slot += used_slots;
                        n_free -= used_slots;

                        used_slots = memif_tx_one_zc(proc_private, mq, ring, *bufs++,
                                mask, slot, n_free);
                        if (unlikely(used_slots < 1))
                                goto no_free_slots;
                        n_tx_pkts++;
                        slot += used_slots;
                        n_free -= used_slots;

                        used_slots = memif_tx_one_zc(proc_private, mq, ring, *bufs++,
                                mask, slot, n_free);
                        if (unlikely(used_slots < 1))
                                goto no_free_slots;
                        n_tx_pkts++;
                        slot += used_slots;
                        n_free -= used_slots;

                        used_slots = memif_tx_one_zc(proc_private, mq, ring, *bufs++,
                                mask, slot, n_free);
                        if (unlikely(used_slots < 1))
                                goto no_free_slots;
                        n_tx_pkts++;
                        slot += used_slots;
                        n_free -= used_slots;
                }
                used_slots = memif_tx_one_zc(proc_private, mq, ring, *bufs++,
                        mask, slot, n_free);
                if (unlikely(used_slots < 1))
                        goto no_free_slots;
                n_tx_pkts++;
                slot += used_slots;
                n_free -= used_slots;
        }

no_free_slots:
        /* ring type always MEMIF_RING_S2M */
        /* The ring->head acts as a guard variable between Tx and Rx
         * threads, so using store-release pairs with load-acquire
         * in function eth_memif_rx for S2M rings.
         */
        __atomic_store_n(&ring->head, slot, __ATOMIC_RELEASE);

        /* Send interrupt, if enabled. */
        if ((ring->flags & MEMIF_RING_FLAG_MASK_INT) == 0) {
                uint64_t a = 1;
                ssize_t size = write(mq->intr_handle.fd, &a, sizeof(a));
                if (unlikely(size < 0)) {
                        MIF_LOG(WARNING,
                                "Failed to send interrupt. %s", strerror(errno));
                }
        }

        /* increment queue counters */
        mq->n_pkts += n_tx_pkts;

        return n_tx_pkts;
}
static void
memif_free_regions(struct rte_eth_dev *dev)
{
        struct pmd_process_private *proc_private = dev->process_private;
        struct pmd_internals *pmd = dev->data->dev_private;
        int i;
        struct memif_region *r;

        /* regions are allocated contiguously, so it's
         * enough to loop until 'proc_private->regions_num'
         */
        for (i = 0; i < proc_private->regions_num; i++) {
                r = proc_private->regions[i];
                if (r != NULL) {
                        /* Zero-copy regions (i > 0) map DPDK memsegs; don't unmap them */
                        if (i > 0 && (pmd->flags & ETH_MEMIF_FLAG_ZERO_COPY)) {
                                r->addr = NULL;
                                if (r->fd > 0)
                                        close(r->fd);
                        }
                        if (r->addr != NULL) {
                                munmap(r->addr, r->region_size);
                                if (r->fd > 0) {
                                        close(r->fd);
                                        r->fd = -1;
                                }
                        }
                        rte_free(r);
                        proc_private->regions[i] = NULL;
                }
        }
        proc_private->regions_num = 0;
}
static int
memif_region_init_zc(const struct rte_memseg_list *msl, const struct rte_memseg *ms,
                     void *arg)
{
        struct pmd_process_private *proc_private = (struct pmd_process_private *)arg;
        struct memif_region *r;

        if (proc_private->regions_num < 1) {
                MIF_LOG(ERR, "Missing descriptor region");
                return -1;
        }

        r = proc_private->regions[proc_private->regions_num - 1];

        if (r->addr != msl->base_va)
                r = proc_private->regions[++proc_private->regions_num - 1];

        if (r == NULL) {
                r = rte_zmalloc("region", sizeof(struct memif_region), 0);
                if (r == NULL) {
                        MIF_LOG(ERR, "Failed to alloc memif region.");
                        return -ENOMEM;
                }

                r->addr = msl->base_va;
                r->region_size = ms->len;
                r->fd = rte_memseg_get_fd(ms);
                if (r->fd < 0)
                        return -1;
                r->pkt_buffer_offset = 0;

                proc_private->regions[proc_private->regions_num - 1] = r;
        } else {
                r->region_size += ms->len;
        }

        return 0;
}
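/*
 * Create a shared-memory region backed by a sealed memfd. Layout: all rings
 * first (S2M then M2S), then the packet buffers when has_buffers is set
 * (non-zero-copy mode); in zero-copy mode region 0 holds only descriptors.
 */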
static int
memif_region_init_shm(struct rte_eth_dev *dev, uint8_t has_buffers)
{
        struct pmd_internals *pmd = dev->data->dev_private;
        struct pmd_process_private *proc_private = dev->process_private;
        char shm_name[ETH_MEMIF_SHM_NAME_SIZE];
        int ret = 0;
        struct memif_region *r;

        if (proc_private->regions_num >= ETH_MEMIF_MAX_REGION_NUM) {
                MIF_LOG(ERR, "Too many regions.");
                return -1;
        }

        r = rte_zmalloc("region", sizeof(struct memif_region), 0);
        if (r == NULL) {
                MIF_LOG(ERR, "Failed to alloc memif region.");
                return -ENOMEM;
        }

        /* calculate buffer offset */
        r->pkt_buffer_offset = (pmd->run.num_s2m_rings + pmd->run.num_m2s_rings) *
            (sizeof(memif_ring_t) + sizeof(memif_desc_t) *
            (1 << pmd->run.log2_ring_size));

        r->region_size = r->pkt_buffer_offset;
        /* if region has buffers, add buffers size to region_size */
        if (has_buffers == 1)
                r->region_size += (uint32_t)(pmd->run.pkt_buffer_size *
                        (1 << pmd->run.log2_ring_size) *
                        (pmd->run.num_s2m_rings +
                         pmd->run.num_m2s_rings));

        memset(shm_name, 0, sizeof(char) * ETH_MEMIF_SHM_NAME_SIZE);
        snprintf(shm_name, ETH_MEMIF_SHM_NAME_SIZE, "memif_region_%d",
                 proc_private->regions_num);

        r->fd = memfd_create(shm_name, MFD_ALLOW_SEALING);
        if (r->fd < 0) {
                MIF_LOG(ERR, "Failed to create shm file: %s.", strerror(errno));
                ret = -1;
                goto error;
        }

        ret = fcntl(r->fd, F_ADD_SEALS, F_SEAL_SHRINK);
        if (ret < 0) {
                MIF_LOG(ERR, "Failed to add seals to shm file: %s.", strerror(errno));
                goto error;
        }

        ret = ftruncate(r->fd, r->region_size);
        if (ret < 0) {
                MIF_LOG(ERR, "Failed to truncate shm file: %s.", strerror(errno));
                goto error;
        }

        r->addr = mmap(NULL, r->region_size, PROT_READ |
                       PROT_WRITE, MAP_SHARED, r->fd, 0);
        if (r->addr == MAP_FAILED) {
                MIF_LOG(ERR, "Failed to mmap shm region: %s.", strerror(errno));
                ret = -1;
                goto error;
        }

        proc_private->regions[proc_private->regions_num] = r;
        proc_private->regions_num++;

        return ret;

error:
        if (r->fd > 0)
                close(r->fd);
        r->fd = -1;

        return ret;
}
static int
memif_regions_init(struct rte_eth_dev *dev)
{
        struct pmd_internals *pmd = dev->data->dev_private;
        int ret;

        /*
         * Zero-copy exposes DPDK memory.
         * Each memseg list will be represented by a memif region.
         * Zero-copy region indexing: memseg list idx + 1,
         * as we already have region 0 reserved for descriptors.
         */
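        /* E.g. (illustrative) with two memseg lists: region 0 = descriptors
         * (memfd), region 1 = memseg list 0, region 2 = memseg list 1.
         */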
        if (pmd->flags & ETH_MEMIF_FLAG_ZERO_COPY) {
                /* create region idx 0 containing descriptors */
                ret = memif_region_init_shm(dev, 0);
                if (ret < 0)
                        return ret;
                ret = rte_memseg_walk(memif_region_init_zc, (void *)dev->process_private);
                if (ret < 0)
                        return ret;
        } else {
                /* create one memory region containing rings and buffers */
                ret = memif_region_init_shm(dev, /* has buffers */ 1);
                if (ret < 0)
                        return ret;
        }

        return 0;
}
static void
memif_init_rings(struct rte_eth_dev *dev)
{
        struct pmd_internals *pmd = dev->data->dev_private;
        struct pmd_process_private *proc_private = dev->process_private;
        memif_ring_t *ring;
        int i, j;
        uint16_t slot;

        for (i = 0; i < pmd->run.num_s2m_rings; i++) {
                ring = memif_get_ring(pmd, proc_private, MEMIF_RING_S2M, i);
                __atomic_store_n(&ring->head, 0, __ATOMIC_RELAXED);
                __atomic_store_n(&ring->tail, 0, __ATOMIC_RELAXED);
                ring->cookie = MEMIF_COOKIE;
                ring->flags = 0;

                if (pmd->flags & ETH_MEMIF_FLAG_ZERO_COPY)
                        continue;

                for (j = 0; j < (1 << pmd->run.log2_ring_size); j++) {
                        slot = i * (1 << pmd->run.log2_ring_size) + j;
                        ring->desc[j].region = 0;
                        ring->desc[j].offset =
                                proc_private->regions[0]->pkt_buffer_offset +
                                (uint32_t)(slot * pmd->run.pkt_buffer_size);
                        ring->desc[j].length = pmd->run.pkt_buffer_size;
                }
        }

        for (i = 0; i < pmd->run.num_m2s_rings; i++) {
                ring = memif_get_ring(pmd, proc_private, MEMIF_RING_M2S, i);
                __atomic_store_n(&ring->head, 0, __ATOMIC_RELAXED);
                __atomic_store_n(&ring->tail, 0, __ATOMIC_RELAXED);
                ring->cookie = MEMIF_COOKIE;
                ring->flags = 0;

                if (pmd->flags & ETH_MEMIF_FLAG_ZERO_COPY)
                        continue;

                for (j = 0; j < (1 << pmd->run.log2_ring_size); j++) {
                        slot = (i + pmd->run.num_s2m_rings) *
                                (1 << pmd->run.log2_ring_size) + j;
                        ring->desc[j].region = 0;
                        ring->desc[j].offset =
                                proc_private->regions[0]->pkt_buffer_offset +
                                (uint32_t)(slot * pmd->run.pkt_buffer_size);
                        ring->desc[j].length = pmd->run.pkt_buffer_size;
                }
        }
}
/* called only by slave */
static int
memif_init_queues(struct rte_eth_dev *dev)
{
        struct pmd_internals *pmd = dev->data->dev_private;
        struct memif_queue *mq;
        int i;

        for (i = 0; i < pmd->run.num_s2m_rings; i++) {
                mq = dev->data->tx_queues[i];
                mq->log2_ring_size = pmd->run.log2_ring_size;
                /* queues located only in region 0 */
                mq->region = 0;
                mq->ring_offset = memif_get_ring_offset(dev, mq, MEMIF_RING_S2M, i);
                mq->last_head = 0;
                mq->last_tail = 0;
                mq->intr_handle.fd = eventfd(0, EFD_NONBLOCK);
                if (mq->intr_handle.fd < 0) {
                        MIF_LOG(WARNING,
                                "Failed to create eventfd for tx queue %d: %s.", i,
                                strerror(errno));
                }
                mq->buffers = NULL;
                if (pmd->flags & ETH_MEMIF_FLAG_ZERO_COPY) {
                        mq->buffers = rte_zmalloc("bufs", sizeof(struct rte_mbuf *) *
                                                  (1 << mq->log2_ring_size), 0);
                        if (mq->buffers == NULL)
                                return -ENOMEM;
                }
        }

        for (i = 0; i < pmd->run.num_m2s_rings; i++) {
                mq = dev->data->rx_queues[i];
                mq->log2_ring_size = pmd->run.log2_ring_size;
                /* queues located only in region 0 */
                mq->region = 0;
                mq->ring_offset = memif_get_ring_offset(dev, mq, MEMIF_RING_M2S, i);
                mq->last_head = 0;
                mq->last_tail = 0;
                mq->intr_handle.fd = eventfd(0, EFD_NONBLOCK);
                if (mq->intr_handle.fd < 0) {
                        MIF_LOG(WARNING,
                                "Failed to create eventfd for rx queue %d: %s.", i,
                                strerror(errno));
                }
                mq->buffers = NULL;
                if (pmd->flags & ETH_MEMIF_FLAG_ZERO_COPY) {
                        mq->buffers = rte_zmalloc("bufs", sizeof(struct rte_mbuf *) *
                                                  (1 << mq->log2_ring_size), 0);
                        if (mq->buffers == NULL)
                                return -ENOMEM;
                }
        }
        return 0;
}
static int
memif_init_regions_and_queues(struct rte_eth_dev *dev)
{
        int ret;

        ret = memif_regions_init(dev);
        if (ret < 0)
                return ret;

        memif_init_rings(dev);

        ret = memif_init_queues(dev);
        if (ret < 0)
                return ret;

        return 0;
}
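/*
 * Finalize the connection on either role: mmap any regions received over the
 * control channel, verify ring cookies, reset ring pointers and bring the
 * link up.
 */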
int
memif_connect(struct rte_eth_dev *dev)
{
        struct pmd_internals *pmd = dev->data->dev_private;
        struct pmd_process_private *proc_private = dev->process_private;
        struct memif_region *mr;
        struct memif_queue *mq;
        memif_ring_t *ring;
        int i;

        for (i = 0; i < proc_private->regions_num; i++) {
                mr = proc_private->regions[i];
                if (mr != NULL) {
                        if (mr->addr == NULL) {
                                if (mr->fd < 0)
                                        return -1;
                                mr->addr = mmap(NULL, mr->region_size,
                                                PROT_READ | PROT_WRITE,
                                                MAP_SHARED, mr->fd, 0);
                                if (mr->addr == MAP_FAILED) {
                                        MIF_LOG(ERR, "mmap failed: %s\n",
                                                strerror(errno));
                                        return -1;
                                }
                        }
                        if (i > 0 && (pmd->flags & ETH_MEMIF_FLAG_ZERO_COPY)) {
                                /* close memseg file */
                                close(mr->fd);
                                mr->fd = -1;
                        }
                }
        }

        if (rte_eal_process_type() == RTE_PROC_PRIMARY) {
                for (i = 0; i < pmd->run.num_s2m_rings; i++) {
                        mq = (pmd->role == MEMIF_ROLE_SLAVE) ?
                            dev->data->tx_queues[i] : dev->data->rx_queues[i];
                        ring = memif_get_ring_from_queue(proc_private, mq);
                        if (ring == NULL || ring->cookie != MEMIF_COOKIE) {
                                MIF_LOG(ERR, "Wrong ring");
                                return -1;
                        }
                        __atomic_store_n(&ring->head, 0, __ATOMIC_RELAXED);
                        __atomic_store_n(&ring->tail, 0, __ATOMIC_RELAXED);
                        mq->last_head = 0;
                        mq->last_tail = 0;
                        /* enable polling mode */
                        if (pmd->role == MEMIF_ROLE_MASTER)
                                ring->flags = MEMIF_RING_FLAG_MASK_INT;
                }
                for (i = 0; i < pmd->run.num_m2s_rings; i++) {
                        mq = (pmd->role == MEMIF_ROLE_SLAVE) ?
                            dev->data->rx_queues[i] : dev->data->tx_queues[i];
                        ring = memif_get_ring_from_queue(proc_private, mq);
                        if (ring == NULL || ring->cookie != MEMIF_COOKIE) {
                                MIF_LOG(ERR, "Wrong ring");
                                return -1;
                        }
                        __atomic_store_n(&ring->head, 0, __ATOMIC_RELAXED);
                        __atomic_store_n(&ring->tail, 0, __ATOMIC_RELAXED);
                        mq->last_head = 0;
                        mq->last_tail = 0;
                        /* enable polling mode */
                        if (pmd->role == MEMIF_ROLE_SLAVE)
                                ring->flags = MEMIF_RING_FLAG_MASK_INT;
                }

                pmd->flags &= ~ETH_MEMIF_FLAG_CONNECTING;
                pmd->flags |= ETH_MEMIF_FLAG_CONNECTED;
                dev->data->dev_link.link_status = ETH_LINK_UP;
        }
        MIF_LOG(INFO, "Connected.");
        return 0;
}
static int
memif_dev_start(struct rte_eth_dev *dev)
{
        struct pmd_internals *pmd = dev->data->dev_private;
        int ret = 0;

        switch (pmd->role) {
        case MEMIF_ROLE_SLAVE:
                ret = memif_connect_slave(dev);
                break;
        case MEMIF_ROLE_MASTER:
                ret = memif_connect_master(dev);
                break;
        default:
                MIF_LOG(ERR, "Unknown role: %d.", pmd->role);
                ret = -1;
                break;
        }

        return ret;
}
static void
memif_dev_close(struct rte_eth_dev *dev)
{
        struct pmd_internals *pmd = dev->data->dev_private;
        int i;

        if (rte_eal_process_type() == RTE_PROC_PRIMARY) {
                memif_msg_enq_disconnect(pmd->cc, "Device closed", 0);
                memif_disconnect(dev);

                for (i = 0; i < dev->data->nb_rx_queues; i++)
                        (*dev->dev_ops->rx_queue_release)(dev->data->rx_queues[i]);
                for (i = 0; i < dev->data->nb_tx_queues; i++)
                        (*dev->dev_ops->tx_queue_release)(dev->data->tx_queues[i]);

                memif_socket_remove_device(dev);
        } else {
                memif_disconnect(dev);
        }

        rte_free(dev->process_private);
}
static int
memif_dev_configure(struct rte_eth_dev *dev)
{
        struct pmd_internals *pmd = dev->data->dev_private;

        /*
         * SLAVE - TXQ
         * MASTER - RXQ
         */
        pmd->cfg.num_s2m_rings = (pmd->role == MEMIF_ROLE_SLAVE) ?
                                  dev->data->nb_tx_queues : dev->data->nb_rx_queues;

        /*
         * SLAVE - RXQ
         * MASTER - TXQ
         */
        pmd->cfg.num_m2s_rings = (pmd->role == MEMIF_ROLE_SLAVE) ?
                                  dev->data->nb_rx_queues : dev->data->nb_tx_queues;

        return 0;
}
static int
memif_tx_queue_setup(struct rte_eth_dev *dev,
                     uint16_t qid,
                     uint16_t nb_tx_desc __rte_unused,
                     unsigned int socket_id __rte_unused,
                     const struct rte_eth_txconf *tx_conf __rte_unused)
{
        struct pmd_internals *pmd = dev->data->dev_private;
        struct memif_queue *mq;

        mq = rte_zmalloc("tx-queue", sizeof(struct memif_queue), 0);
        if (mq == NULL) {
                MIF_LOG(ERR, "Failed to allocate tx queue id: %u", qid);
                return -ENOMEM;
        }

        mq->type =
            (pmd->role == MEMIF_ROLE_SLAVE) ? MEMIF_RING_S2M : MEMIF_RING_M2S;
        mq->n_pkts = 0;
        mq->n_bytes = 0;
        mq->intr_handle.fd = -1;
        mq->intr_handle.type = RTE_INTR_HANDLE_EXT;
        mq->in_port = dev->data->port_id;
        dev->data->tx_queues[qid] = mq;

        return 0;
}
static int
memif_rx_queue_setup(struct rte_eth_dev *dev,
                     uint16_t qid,
                     uint16_t nb_rx_desc __rte_unused,
                     unsigned int socket_id __rte_unused,
                     const struct rte_eth_rxconf *rx_conf __rte_unused,
                     struct rte_mempool *mb_pool)
{
        struct pmd_internals *pmd = dev->data->dev_private;
        struct memif_queue *mq;

        mq = rte_zmalloc("rx-queue", sizeof(struct memif_queue), 0);
        if (mq == NULL) {
                MIF_LOG(ERR, "Failed to allocate rx queue id: %u", qid);
                return -ENOMEM;
        }

        mq->type = (pmd->role == MEMIF_ROLE_SLAVE) ? MEMIF_RING_M2S : MEMIF_RING_S2M;
        mq->n_pkts = 0;
        mq->n_bytes = 0;
        mq->intr_handle.fd = -1;
        mq->intr_handle.type = RTE_INTR_HANDLE_EXT;
        mq->mempool = mb_pool;
        mq->in_port = dev->data->port_id;
        dev->data->rx_queues[qid] = mq;

        return 0;
}
static void
memif_queue_release(void *queue)
{
        struct memif_queue *mq = (struct memif_queue *)queue;

        if (!mq)
                return;

        rte_free(mq);
}
static int
memif_link_update(struct rte_eth_dev *dev,
                  int wait_to_complete __rte_unused)
{
        struct pmd_process_private *proc_private;

        if (rte_eal_process_type() == RTE_PROC_SECONDARY) {
                proc_private = dev->process_private;
                if (dev->data->dev_link.link_status == ETH_LINK_UP &&
                    proc_private->regions_num == 0) {
                        memif_mp_request_regions(dev);
                } else if (dev->data->dev_link.link_status == ETH_LINK_DOWN &&
                           proc_private->regions_num > 0) {
                        memif_free_regions(dev);
                }
        }
        return 0;
}
static int
memif_stats_get(struct rte_eth_dev *dev, struct rte_eth_stats *stats)
{
        struct pmd_internals *pmd = dev->data->dev_private;
        struct memif_queue *mq;
        int i;
        uint8_t tmp, nq;

        stats->ipackets = 0;
        stats->ibytes = 0;
        stats->opackets = 0;
        stats->obytes = 0;

        tmp = (pmd->role == MEMIF_ROLE_SLAVE) ? pmd->run.num_s2m_rings :
            pmd->run.num_m2s_rings;
        nq = (tmp < RTE_ETHDEV_QUEUE_STAT_CNTRS) ? tmp :
            RTE_ETHDEV_QUEUE_STAT_CNTRS;

        /* RX stats */
        for (i = 0; i < nq; i++) {
                mq = dev->data->rx_queues[i];
                stats->q_ipackets[i] = mq->n_pkts;
                stats->q_ibytes[i] = mq->n_bytes;
                stats->ipackets += mq->n_pkts;
                stats->ibytes += mq->n_bytes;
        }

        tmp = (pmd->role == MEMIF_ROLE_SLAVE) ? pmd->run.num_m2s_rings :
            pmd->run.num_s2m_rings;
        nq = (tmp < RTE_ETHDEV_QUEUE_STAT_CNTRS) ? tmp :
            RTE_ETHDEV_QUEUE_STAT_CNTRS;

        /* TX stats */
        for (i = 0; i < nq; i++) {
                mq = dev->data->tx_queues[i];
                stats->q_opackets[i] = mq->n_pkts;
                stats->q_obytes[i] = mq->n_bytes;
                stats->opackets += mq->n_pkts;
                stats->obytes += mq->n_bytes;
        }
        return 0;
}
static int
memif_stats_reset(struct rte_eth_dev *dev)
{
        struct pmd_internals *pmd = dev->data->dev_private;
        int i;
        struct memif_queue *mq;

        for (i = 0; i < pmd->run.num_s2m_rings; i++) {
                mq = (pmd->role == MEMIF_ROLE_SLAVE) ? dev->data->tx_queues[i] :
                    dev->data->rx_queues[i];
                mq->n_pkts = 0;
                mq->n_bytes = 0;
        }
        for (i = 0; i < pmd->run.num_m2s_rings; i++) {
                mq = (pmd->role == MEMIF_ROLE_SLAVE) ? dev->data->rx_queues[i] :
                    dev->data->tx_queues[i];
                mq->n_pkts = 0;
                mq->n_bytes = 0;
        }

        return 0;
}
static int
memif_rx_queue_intr_enable(struct rte_eth_dev *dev __rte_unused,
                           uint16_t qid __rte_unused)
{
        MIF_LOG(WARNING, "Interrupt mode not supported.");

        return -1;
}

static int
memif_rx_queue_intr_disable(struct rte_eth_dev *dev, uint16_t qid __rte_unused)
{
        struct pmd_internals *pmd __rte_unused = dev->data->dev_private;

        return 0;
}
static const struct eth_dev_ops ops = {
        .dev_start = memif_dev_start,
        .dev_close = memif_dev_close,
        .dev_infos_get = memif_dev_info,
        .dev_configure = memif_dev_configure,
        .tx_queue_setup = memif_tx_queue_setup,
        .rx_queue_setup = memif_rx_queue_setup,
        .rx_queue_release = memif_queue_release,
        .tx_queue_release = memif_queue_release,
        .rx_queue_intr_enable = memif_rx_queue_intr_enable,
        .rx_queue_intr_disable = memif_rx_queue_intr_disable,
        .link_update = memif_link_update,
        .stats_get = memif_stats_get,
        .stats_reset = memif_stats_reset,
};
static int
memif_create(struct rte_vdev_device *vdev, enum memif_role_t role,
             memif_interface_id_t id, uint32_t flags,
             const char *socket_filename,
             memif_log2_ring_size_t log2_ring_size,
             uint16_t pkt_buffer_size, const char *secret,
             struct rte_ether_addr *ether_addr)
{
        int ret = 0;
        struct rte_eth_dev *eth_dev;
        struct rte_eth_dev_data *data;
        struct pmd_internals *pmd;
        struct pmd_process_private *process_private;
        const unsigned int numa_node = vdev->device.numa_node;
        const char *name = rte_vdev_device_name(vdev);

        eth_dev = rte_eth_vdev_allocate(vdev, sizeof(*pmd));
        if (eth_dev == NULL) {
                MIF_LOG(ERR, "%s: Unable to allocate device struct.", name);
                return -1;
        }

        process_private = (struct pmd_process_private *)
                rte_zmalloc(name, sizeof(struct pmd_process_private),
                            RTE_CACHE_LINE_SIZE);

        if (process_private == NULL) {
                MIF_LOG(ERR, "Failed to alloc memory for process private");
                return -1;
        }
        eth_dev->process_private = process_private;

        pmd = eth_dev->data->dev_private;
        memset(pmd, 0, sizeof(*pmd));

        pmd->id = id;
        pmd->flags = flags;
        pmd->flags |= ETH_MEMIF_FLAG_DISABLED;
        pmd->role = role;
        /* Zero-copy flag irrelevant to master. */
        if (pmd->role == MEMIF_ROLE_MASTER)
                pmd->flags &= ~ETH_MEMIF_FLAG_ZERO_COPY;

        ret = memif_socket_init(eth_dev, socket_filename);
        if (ret < 0)
                return ret;

        memset(pmd->secret, 0, sizeof(char) * ETH_MEMIF_SECRET_SIZE);
        if (secret != NULL)
                strlcpy(pmd->secret, secret, sizeof(pmd->secret));

        pmd->cfg.log2_ring_size = log2_ring_size;
        /* set in .dev_configure() */
        pmd->cfg.num_s2m_rings = 0;
        pmd->cfg.num_m2s_rings = 0;

        pmd->cfg.pkt_buffer_size = pkt_buffer_size;
        rte_spinlock_init(&pmd->cc_lock);

        data = eth_dev->data;
        data->dev_private = pmd;
        data->numa_node = numa_node;
        data->dev_link = pmd_link;
        data->mac_addrs = ether_addr;
        data->promiscuous = 1;

        eth_dev->dev_ops = &ops;
        eth_dev->device = &vdev->device;
        if (pmd->flags & ETH_MEMIF_FLAG_ZERO_COPY) {
                eth_dev->rx_pkt_burst = eth_memif_rx_zc;
                eth_dev->tx_pkt_burst = eth_memif_tx_zc;
        } else {
                eth_dev->rx_pkt_burst = eth_memif_rx;
                eth_dev->tx_pkt_burst = eth_memif_tx;
        }

        rte_eth_dev_probing_finish(eth_dev);

        return 0;
}
static int
memif_set_role(const char *key __rte_unused, const char *value,
               void *extra_args)
{
        enum memif_role_t *role = (enum memif_role_t *)extra_args;

        if (strstr(value, "master") != NULL) {
                *role = MEMIF_ROLE_MASTER;
        } else if (strstr(value, "slave") != NULL) {
                *role = MEMIF_ROLE_SLAVE;
        } else {
                MIF_LOG(ERR, "Unknown role: %s.", value);
                return -EINVAL;
        }
        return 0;
}
static int
memif_set_zc(const char *key __rte_unused, const char *value, void *extra_args)
{
        uint32_t *flags = (uint32_t *)extra_args;

        if (strstr(value, "yes") != NULL) {
                if (!rte_mcfg_get_single_file_segments()) {
                        MIF_LOG(ERR, "Zero-copy doesn't support multi-file segments.");
                        return -ENOTSUP;
                }
                *flags |= ETH_MEMIF_FLAG_ZERO_COPY;
        } else if (strstr(value, "no") != NULL) {
                *flags &= ~ETH_MEMIF_FLAG_ZERO_COPY;
        } else {
                MIF_LOG(ERR, "Failed to parse zero-copy param: %s.", value);
                return -EINVAL;
        }
        return 0;
}
static int
memif_set_id(const char *key __rte_unused, const char *value, void *extra_args)
{
        memif_interface_id_t *id = (memif_interface_id_t *)extra_args;

        /* even if parsing fails, 0 is a valid id */
        *id = strtoul(value, NULL, 10);
        return 0;
}
static int
memif_set_bs(const char *key __rte_unused, const char *value, void *extra_args)
{
        unsigned long tmp;
        uint16_t *pkt_buffer_size = (uint16_t *)extra_args;

        tmp = strtoul(value, NULL, 10);
        if (tmp == 0 || tmp > 0xFFFF) {
                MIF_LOG(ERR, "Invalid buffer size: %s.", value);
                return -EINVAL;
        }
        *pkt_buffer_size = tmp;
        return 0;
}
static int
memif_set_rs(const char *key __rte_unused, const char *value, void *extra_args)
{
        unsigned long tmp;
        memif_log2_ring_size_t *log2_ring_size =
            (memif_log2_ring_size_t *)extra_args;

        tmp = strtoul(value, NULL, 10);
        if (tmp == 0 || tmp > ETH_MEMIF_MAX_LOG2_RING_SIZE) {
                MIF_LOG(ERR, "Invalid ring size: %s (max %u).",
                        value, ETH_MEMIF_MAX_LOG2_RING_SIZE);
                return -EINVAL;
        }
        *log2_ring_size = tmp;
        return 0;
}
/* check if directory exists and if we have permission to read/write */
static int
memif_check_socket_filename(const char *filename)
{
        char *dir = NULL, *tmp;
        uint32_t idx;
        int ret = 0;

        if (strlen(filename) >= MEMIF_SOCKET_UN_SIZE) {
                MIF_LOG(ERR, "Unix socket address too long (max 108).");
                return -1;
        }

        tmp = strrchr(filename, '/');
        if (tmp != NULL) {
                idx = tmp - filename;
                dir = rte_zmalloc("memif_tmp", sizeof(char) * (idx + 1), 0);
                if (dir == NULL) {
                        MIF_LOG(ERR, "Failed to allocate memory.");
                        return -1;
                }
                strlcpy(dir, filename, sizeof(char) * (idx + 1));
        }

        if (dir == NULL || (faccessat(-1, dir, F_OK | R_OK |
                                      W_OK, AT_EACCESS) < 0)) {
                MIF_LOG(ERR, "Invalid socket directory.");
                ret = -EINVAL;
        }

        if (dir != NULL)
                rte_free(dir);

        return ret;
}
static int
memif_set_socket_filename(const char *key __rte_unused, const char *value,
                          void *extra_args)
{
        const char **socket_filename = (const char **)extra_args;

        *socket_filename = value;
        return memif_check_socket_filename(*socket_filename);
}
static int
memif_set_mac(const char *key __rte_unused, const char *value, void *extra_args)
{
        struct rte_ether_addr *ether_addr = (struct rte_ether_addr *)extra_args;

        if (rte_ether_unformat_addr(value, ether_addr) < 0)
                MIF_LOG(WARNING, "Failed to parse mac '%s'.", value);
        return 0;
}
static int
memif_set_secret(const char *key __rte_unused, const char *value, void *extra_args)
{
        const char **secret = (const char **)extra_args;

        *secret = value;
        return 0;
}
static int
rte_pmd_memif_probe(struct rte_vdev_device *vdev)
{
        RTE_BUILD_BUG_ON(sizeof(memif_msg_t) != 128);
        RTE_BUILD_BUG_ON(sizeof(memif_desc_t) != 16);
        int ret = 0;
        struct rte_kvargs *kvlist;
        const char *name = rte_vdev_device_name(vdev);
        enum memif_role_t role = MEMIF_ROLE_SLAVE;
        memif_interface_id_t id = 0;
        uint16_t pkt_buffer_size = ETH_MEMIF_DEFAULT_PKT_BUFFER_SIZE;
        memif_log2_ring_size_t log2_ring_size = ETH_MEMIF_DEFAULT_RING_SIZE;
        const char *socket_filename = ETH_MEMIF_DEFAULT_SOCKET_FILENAME;
        uint32_t flags = 0;
        const char *secret = NULL;
        struct rte_ether_addr *ether_addr = rte_zmalloc("",
                sizeof(struct rte_ether_addr), 0);
        struct rte_eth_dev *eth_dev;

        rte_eth_random_addr(ether_addr->addr_bytes);

        MIF_LOG(INFO, "Initialize MEMIF: %s.", name);

        if (rte_eal_process_type() == RTE_PROC_SECONDARY) {
                eth_dev = rte_eth_dev_attach_secondary(name);
                if (!eth_dev) {
                        MIF_LOG(ERR, "Failed to probe %s", name);
                        return -1;
                }

                eth_dev->dev_ops = &ops;
                eth_dev->device = &vdev->device;
                eth_dev->rx_pkt_burst = eth_memif_rx;
                eth_dev->tx_pkt_burst = eth_memif_tx;

                if (!rte_eal_primary_proc_alive(NULL)) {
                        MIF_LOG(ERR, "Primary process is missing");
                        return -1;
                }

                eth_dev->process_private = (struct pmd_process_private *)
                        rte_zmalloc(name,
                                sizeof(struct pmd_process_private),
                                RTE_CACHE_LINE_SIZE);
                if (eth_dev->process_private == NULL) {
                        MIF_LOG(ERR,
                                "Failed to alloc memory for process private");
                        return -1;
                }

                rte_eth_dev_probing_finish(eth_dev);

                return 0;
        }

        ret = rte_mp_action_register(MEMIF_MP_SEND_REGION, memif_mp_send_region);
        /*
         * Primary process can continue probing, but secondary process won't
         * be able to get memory regions information
         */
        if (ret < 0 && rte_errno != EEXIST)
                MIF_LOG(WARNING, "Failed to register mp action callback: %s",
                        strerror(rte_errno));

        kvlist = rte_kvargs_parse(rte_vdev_device_args(vdev), valid_arguments);

        /* parse parameters */
        if (kvlist != NULL) {
                ret = rte_kvargs_process(kvlist, ETH_MEMIF_ROLE_ARG,
                                         &memif_set_role, &role);
                if (ret < 0)
                        goto exit;
                ret = rte_kvargs_process(kvlist, ETH_MEMIF_ID_ARG,
                                         &memif_set_id, &id);
                if (ret < 0)
                        goto exit;
                ret = rte_kvargs_process(kvlist, ETH_MEMIF_PKT_BUFFER_SIZE_ARG,
                                         &memif_set_bs, &pkt_buffer_size);
                if (ret < 0)
                        goto exit;
                ret = rte_kvargs_process(kvlist, ETH_MEMIF_RING_SIZE_ARG,
                                         &memif_set_rs, &log2_ring_size);
                if (ret < 0)
                        goto exit;
                ret = rte_kvargs_process(kvlist, ETH_MEMIF_SOCKET_ARG,
                                         &memif_set_socket_filename,
                                         (void *)(&socket_filename));
                if (ret < 0)
                        goto exit;
                ret = rte_kvargs_process(kvlist, ETH_MEMIF_MAC_ARG,
                                         &memif_set_mac, ether_addr);
                if (ret < 0)
                        goto exit;
                ret = rte_kvargs_process(kvlist, ETH_MEMIF_ZC_ARG,
                                         &memif_set_zc, &flags);
                if (ret < 0)
                        goto exit;
                ret = rte_kvargs_process(kvlist, ETH_MEMIF_SECRET_ARG,
                                         &memif_set_secret, (void *)(&secret));
                if (ret < 0)
                        goto exit;
        }

        /* create interface */
        ret = memif_create(vdev, role, id, flags, socket_filename,
                           log2_ring_size, pkt_buffer_size, secret, ether_addr);

exit:
        if (kvlist != NULL)
                rte_kvargs_free(kvlist);

        return ret;
}
static int
rte_pmd_memif_remove(struct rte_vdev_device *vdev)
{
        struct rte_eth_dev *eth_dev;

        eth_dev = rte_eth_dev_allocated(rte_vdev_device_name(vdev));
        if (eth_dev == NULL)
                return 0;

        rte_eth_dev_close(eth_dev->data->port_id);

        return 0;
}
static struct rte_vdev_driver pmd_memif_drv = {
        .probe = rte_pmd_memif_probe,
        .remove = rte_pmd_memif_remove,
};

RTE_PMD_REGISTER_VDEV(net_memif, pmd_memif_drv);
RTE_PMD_REGISTER_PARAM_STRING(net_memif,
                              ETH_MEMIF_ID_ARG "=<int>"
                              ETH_MEMIF_ROLE_ARG "=master|slave"
                              ETH_MEMIF_PKT_BUFFER_SIZE_ARG "=<int>"
                              ETH_MEMIF_RING_SIZE_ARG "=<int>"
                              ETH_MEMIF_SOCKET_ARG "=<string>"
                              ETH_MEMIF_MAC_ARG "=xx:xx:xx:xx:xx:xx"
                              ETH_MEMIF_ZC_ARG "=yes|no"
                              ETH_MEMIF_SECRET_ARG "=<string>");
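/*
 * Example usage (illustrative): connect two testpmd instances over a shared
 * memif socket, one per role:
 *   testpmd -l 0-1 --vdev=net_memif0,role=master,socket=/tmp/memif.sock -- -i
 *   testpmd -l 2-3 --file-prefix=mif \
 *           --vdev=net_memif0,role=slave,socket=/tmp/memif.sock -- -i
 * The socket path must reside in a directory writable by the process; see
 * memif_check_socket_filename().
 */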
RTE_LOG_REGISTER(memif_logtype, pmd.net.memif, NOTICE);