1 /* SPDX-License-Identifier: BSD-3-Clause
2 * Copyright 2018-2019 Cisco Systems, Inc. All rights reserved.
9 #include <sys/socket.h>
10 #include <sys/ioctl.h>
13 #include <rte_version.h>
15 #include <rte_ether.h>
16 #include <ethdev_driver.h>
17 #include <ethdev_vdev.h>
18 #include <rte_malloc.h>
19 #include <rte_kvargs.h>
20 #include <rte_bus_vdev.h>
22 #include <rte_jhash.h>
23 #include <rte_string_fns.h>
25 #include "rte_eth_memif.h"
26 #include "memif_socket.h"
// Forward declaration of the control-channel interrupt callback that is
// defined later in this file and registered with rte_intr_callback_register().
28 static void memif_intr_handler(void *arg);
// Send one control message on socket fd with sendmsg().
// The payload is always a full memif_msg_t; the ancillary buffer is sized
// for exactly one int so that descriptor afd can travel as SCM_RIGHTS data.
// Returns whatever sendmsg() returns.
// NOTE(review): the iov/cmsg declarations and the condition guarding the
// SCM_RIGHTS setup are not visible in this excerpt - confirm against the
// full file.
31 memif_msg_send(int fd, memif_msg_t *msg, int afd)
33 struct msghdr mh = { 0 };
36 char ctl[CMSG_SPACE(sizeof(int))];
// Single I/O vector covering the whole fixed-size message.
38 iov[0].iov_base = msg;
39 iov[0].iov_len = sizeof(memif_msg_t);
// Build one SOL_SOCKET/SCM_RIGHTS control header whose data is afd.
44 memset(&ctl, 0, sizeof(ctl));
46 mh.msg_controllen = sizeof(ctl);
47 cmsg = CMSG_FIRSTHDR(&mh);
48 cmsg->cmsg_len = CMSG_LEN(sizeof(int));
49 cmsg->cmsg_level = SOL_SOCKET;
50 cmsg->cmsg_type = SCM_RIGHTS;
51 rte_memcpy(CMSG_DATA(cmsg), &afd, sizeof(int));
54 return sendmsg(fd, &mh, 0);
// Send the message at the head of cc->msg_queue on the control channel's
// file descriptor and unlink that element from the queue.
// A send is treated as failed unless exactly sizeof(memif_msg_t) bytes were
// written; the failure is logged together with strerror(errno).
// NOTE(review): the empty-queue handling, the return values and whether the
// element is removed on failure are not visible here - confirm.
58 memif_msg_send_from_queue(struct memif_control_channel *cc)
62 struct memif_msg_queue_elt *e;
64 e = TAILQ_FIRST(&cc->msg_queue);
68 size = memif_msg_send(rte_intr_fd_get(cc->intr_handle), &e->msg,
70 if (size != sizeof(memif_msg_t)) {
71 MIF_LOG(ERR, "sendmsg fail: %s.", strerror(errno));
74 MIF_LOG(DEBUG, "Sent msg type %u.", e->msg.type);
76 TAILQ_REMOVE(&cc->msg_queue, e, next);
// Allocate a zero-filled message queue element with rte_zmalloc() and append
// it to the tail of cc->msg_queue.
// Returns a pointer to a queue element (per the declared return type); an
// allocation failure is logged.
// NOTE(review): the failure return value is not visible in this excerpt;
// callers in this file compare the result against NULL.
82 static struct memif_msg_queue_elt *
83 memif_msg_enq(struct memif_control_channel *cc)
85 struct memif_msg_queue_elt *e;
87 e = rte_zmalloc("memif_msg", sizeof(struct memif_msg_queue_elt), 0);
89 MIF_LOG(ERR, "Failed to allocate control message.");
94 TAILQ_INSERT_TAIL(&cc->msg_queue, e, next);
// Queue a DISCONNECT control message on cc.
// When reason is non-NULL it is copied (truncating, always terminated by
// strlcpy) into the message and, if a device is attached to the channel,
// also into that device's local_disc_string.
// NOTE(review): the remaining parameter(s) after reason, the guard that logs
// "Missing control channel." and the return values are not visible here.
100 memif_msg_enq_disconnect(struct memif_control_channel *cc, const char *reason,
103 struct memif_msg_queue_elt *e;
104 struct pmd_internals *pmd;
105 memif_msg_disconnect_t *d;
108 MIF_LOG(DEBUG, "Missing control channel.");
112 e = memif_msg_enq(cc);
114 MIF_LOG(WARNING, "Failed to enqueue disconnect message.");
118 d = &e->msg.disconnect;
120 e->msg.type = MEMIF_MSG_TYPE_DISCONNECT;
123 if (reason != NULL) {
124 strlcpy((char *)d->string, reason, sizeof(d->string));
// Remember the locally generated reason on the device as well.
125 if (cc->dev != NULL) {
126 pmd = cc->dev->data->dev_private;
127 strlcpy(pmd->local_disc_string, reason,
128 sizeof(pmd->local_disc_string));
// Queue a HELLO control message on cc that advertises this side's limits:
// MEMIF_VERSION as both minimum and maximum version, the maximum ring counts,
// the maximum region number (ETH_MEMIF_MAX_REGION_NUM - 1) and the maximum
// log2 ring size. The name field is filled from rte_version().
// NOTE(review): the assignment of h and the NULL check on e are not visible
// in this excerpt - confirm.
134 memif_msg_enq_hello(struct memif_control_channel *cc)
136 struct memif_msg_queue_elt *e = memif_msg_enq(cc);
137 memif_msg_hello_t *h;
144 e->msg.type = MEMIF_MSG_TYPE_HELLO;
145 h->min_version = MEMIF_VERSION;
146 h->max_version = MEMIF_VERSION;
147 h->max_c2s_ring = ETH_MEMIF_MAX_NUM_Q_PAIRS;
148 h->max_s2c_ring = ETH_MEMIF_MAX_NUM_Q_PAIRS;
149 h->max_region = ETH_MEMIF_MAX_REGION_NUM - 1;
150 h->max_log2_ring_size = ETH_MEMIF_MAX_LOG2_RING_SIZE;
152 strlcpy((char *)h->name, rte_version(), sizeof(h->name));
// Process a HELLO message from the peer.
// If MEMIF_VERSION falls outside the peer's [min_version, max_version] range
// a disconnect with reason "Incompatible memif version" is queued.
// Otherwise the run-time parameters are negotiated as the minimum of what
// the peer advertises and what is configured locally, and the peer's name is
// stored in pmd->remote_name.
// NOTE(review): return values are not visible in this excerpt.
158 memif_msg_receive_hello(struct rte_eth_dev *dev, memif_msg_t *msg)
160 struct pmd_internals *pmd = dev->data->dev_private;
161 memif_msg_hello_t *h = &msg->hello;
163 if (h->min_version > MEMIF_VERSION || h->max_version < MEMIF_VERSION) {
164 memif_msg_enq_disconnect(pmd->cc, "Incompatible memif version", 0);
168 /* Set parameters for active connection */
// The advertised ring maxima are incremented by one before comparison -
// presumably they are highest indices rather than counts; TODO confirm.
169 pmd->run.num_c2s_rings = RTE_MIN(h->max_c2s_ring + 1,
170 pmd->cfg.num_c2s_rings);
171 pmd->run.num_s2c_rings = RTE_MIN(h->max_s2c_ring + 1,
172 pmd->cfg.num_s2c_rings);
173 pmd->run.log2_ring_size = RTE_MIN(h->max_log2_ring_size,
174 pmd->cfg.log2_ring_size);
// The packet buffer size is taken from local configuration only.
175 pmd->run.pkt_buffer_size = pmd->cfg.pkt_buffer_size;
177 strlcpy(pmd->remote_name, (char *)h->name, sizeof(pmd->remote_name));
179 MIF_LOG(DEBUG, "Connecting to %s.", pmd->remote_name);
// Process an INIT message received on a control channel.
// Rejections (each queues a disconnect with the quoted reason):
//   - version differs from MEMIF_VERSION   -> "Incompatible memif version"
//   - channel has no socket                -> "Device error"
//   - matching device already connecting or connected -> "Already connected"
//   - mode is not ethernet                 -> "Only ethernet mode supported"
//   - local secret set but peer sent none  -> "Secret required"
//   - secrets differ                       -> "Incorrect secret"
//   - no device with the requested id      -> "ID not found"
// A device matches when it is not disabled, has the requested id and has the
// server role. On success the device is flagged ETH_MEMIF_FLAG_CONNECTING.
// NOTE(review): the assignment of dev inside the loop, the statements that
// bind cc to the device and the return values are not visible here.
185 memif_msg_receive_init(struct memif_control_channel *cc, memif_msg_t *msg)
187 memif_msg_init_t *i = &msg->init;
188 struct memif_socket_dev_list_elt *elt;
189 struct pmd_internals *pmd;
190 struct rte_eth_dev *dev;
192 if (i->version != MEMIF_VERSION) {
193 memif_msg_enq_disconnect(cc, "Incompatible memif version", 0);
197 if (cc->socket == NULL) {
198 memif_msg_enq_disconnect(cc, "Device error", 0);
202 /* Find device with requested ID */
203 TAILQ_FOREACH(elt, &cc->socket->dev_queue, next) {
205 pmd = dev->data->dev_private;
206 if (((pmd->flags & ETH_MEMIF_FLAG_DISABLED) == 0) &&
207 (pmd->id == i->id) && (pmd->role == MEMIF_ROLE_SERVER)) {
208 if (pmd->flags & (ETH_MEMIF_FLAG_CONNECTING |
209 ETH_MEMIF_FLAG_CONNECTED)) {
210 memif_msg_enq_disconnect(cc,
211 "Already connected", 0);
215 /* assign control channel to device */
219 if (i->mode != MEMIF_INTERFACE_MODE_ETHERNET) {
220 memif_msg_enq_disconnect(pmd->cc,
221 "Only ethernet mode supported",
226 strlcpy(pmd->remote_name, (char *)i->name,
227 sizeof(pmd->remote_name));
// A secret is enforced only when one is configured locally; the comparison
// covers at most ETH_MEMIF_SECRET_SIZE bytes.
229 if (*pmd->secret != '\0') {
230 if (*i->secret == '\0') {
231 memif_msg_enq_disconnect(pmd->cc,
232 "Secret required", 0);
235 if (strncmp(pmd->secret, (char *)i->secret,
236 ETH_MEMIF_SECRET_SIZE) != 0) {
237 memif_msg_enq_disconnect(pmd->cc,
238 "Incorrect secret", 0);
243 pmd->flags |= ETH_MEMIF_FLAG_CONNECTING;
248 /* ID not found on this socket */
249 MIF_LOG(DEBUG, "ID %u not found.", i->id);
250 memif_msg_enq_disconnect(cc, "ID not found", 0);
// Process an ADD_REGION message: record a new shared-memory region slot in
// the process-private region table.
// The index is accepted only when it is below ETH_MEMIF_MAX_REGION_NUM,
// equals the current regions_num (so regions must arrive in order) and the
// slot is still empty; otherwise a disconnect with reason
// "Invalid region index" is queued.
// NOTE(review): the trailing parameter(s), the check that produces
// "Missing region fd", the storing of the fd and the return values are not
// visible in this excerpt.
255 memif_msg_receive_add_region(struct rte_eth_dev *dev, memif_msg_t *msg,
258 struct pmd_internals *pmd = dev->data->dev_private;
259 struct pmd_process_private *proc_private = dev->process_private;
260 memif_msg_add_region_t *ar = &msg->add_region;
261 struct memif_region *r;
264 memif_msg_enq_disconnect(pmd->cc, "Missing region fd", 0);
268 if (ar->index >= ETH_MEMIF_MAX_REGION_NUM ||
269 ar->index != proc_private->regions_num ||
270 proc_private->regions[ar->index] != NULL) {
271 memif_msg_enq_disconnect(pmd->cc, "Invalid region index", 0);
275 r = rte_zmalloc("region", sizeof(struct memif_region), 0);
277 memif_msg_enq_disconnect(pmd->cc, "Failed to alloc memif region.", 0);
282 r->region_size = ar->size;
// Publish the region and bump the count so the next index is expected.
285 proc_private->regions[ar->index] = r;
286 proc_private->regions_num++;
// Process an ADD_RING message: validate the ring index against the locally
// configured ring count for its direction, count the ring in pmd->run, and
// store the ring description (interrupt fd, log2 size, region, offset) in
// the matching queue.
// A ring flagged MEMIF_MSG_ADD_RING_FLAG_C2S is bound to rx_queues[index];
// any other ring is bound to tx_queues[index].
// NOTE(review): the check that produces "Missing interrupt fd", the handling
// of a failing rte_intr_fd_set() and the return values are not visible here.
292 memif_msg_receive_add_ring(struct rte_eth_dev *dev, memif_msg_t *msg, int fd)
294 struct pmd_internals *pmd = dev->data->dev_private;
295 memif_msg_add_ring_t *ar = &msg->add_ring;
296 struct memif_queue *mq;
299 memif_msg_enq_disconnect(pmd->cc, "Missing interrupt fd", 0);
303 /* check if we have enough queues */
304 if (ar->flags & MEMIF_MSG_ADD_RING_FLAG_C2S) {
305 if (ar->index >= pmd->cfg.num_c2s_rings) {
306 memif_msg_enq_disconnect(pmd->cc, "Invalid ring index", 0);
309 pmd->run.num_c2s_rings++;
311 if (ar->index >= pmd->cfg.num_s2c_rings) {
312 memif_msg_enq_disconnect(pmd->cc, "Invalid ring index", 0);
315 pmd->run.num_s2c_rings++;
318 mq = (ar->flags & MEMIF_MSG_ADD_RING_FLAG_C2S) ?
319 dev->data->rx_queues[ar->index] : dev->data->tx_queues[ar->index];
321 if (rte_intr_fd_set(mq->intr_handle, fd))
324 mq->log2_ring_size = ar->log2_ring_size;
325 mq->region = ar->region;
326 mq->ring_offset = ar->offset;
// Process a CONNECT message: call memif_connect() for the device, then store
// the peer's interface name in pmd->remote_if_name and log it.
// NOTE(review): how the memif_connect() result is checked and what is
// returned are not visible in this excerpt.
332 memif_msg_receive_connect(struct rte_eth_dev *dev, memif_msg_t *msg)
334 struct pmd_internals *pmd = dev->data->dev_private;
335 memif_msg_connect_t *c = &msg->connect;
338 ret = memif_connect(dev);
342 strlcpy(pmd->remote_if_name, (char *)c->if_name,
343 sizeof(pmd->remote_if_name));
344 MIF_LOG(INFO, "Remote interface %s connected.", pmd->remote_if_name);
// Process a CONNECTED message: call memif_connect() for the device, then
// store the peer's interface name in pmd->remote_if_name and log it.
// Mirrors memif_msg_receive_connect() but reads the "connected" message body.
// NOTE(review): how the memif_connect() result is checked and what is
// returned are not visible in this excerpt.
350 memif_msg_receive_connected(struct rte_eth_dev *dev, memif_msg_t *msg)
352 struct pmd_internals *pmd = dev->data->dev_private;
353 memif_msg_connected_t *c = &msg->connected;
356 ret = memif_connect(dev);
360 strlcpy(pmd->remote_if_name, (char *)c->if_name,
361 sizeof(pmd->remote_if_name));
362 MIF_LOG(INFO, "Remote interface %s connected.", pmd->remote_if_name);
// Process a DISCONNECT message from the peer: store the peer's reason in
// pmd->remote_disc_string, log it, clear the local disconnect string and
// tear the connection down with memif_disconnect().
// NOTE(review): the return value is not visible in this excerpt.
368 memif_msg_receive_disconnect(struct rte_eth_dev *dev, memif_msg_t *msg)
370 struct pmd_internals *pmd = dev->data->dev_private;
371 memif_msg_disconnect_t *d = &msg->disconnect;
// Wipe any stale reason before copying the new one.
373 memset(pmd->remote_disc_string, 0, sizeof(pmd->remote_disc_string));
374 strlcpy(pmd->remote_disc_string, (char *)d->string,
375 sizeof(pmd->remote_disc_string));
377 MIF_LOG(INFO, "Disconnect received: %s", pmd->remote_disc_string);
// The disconnect was initiated remotely, so no local reason applies. The
// length comes from the buffer itself instead of a hard-coded byte count, so
// it cannot drift if the buffer size changes.
379 memset(pmd->local_disc_string, 0, sizeof(pmd->local_disc_string));
380 memif_disconnect(dev);
// Queue an ACK control message on the device's control channel.
// NOTE(review): the NULL check on e and the return values are not visible
// in this excerpt.
385 memif_msg_enq_ack(struct rte_eth_dev *dev)
387 struct pmd_internals *pmd = dev->data->dev_private;
388 struct memif_msg_queue_elt *e = memif_msg_enq(pmd->cc);
392 e->msg.type = MEMIF_MSG_TYPE_ACK;
// Queue an INIT control message on the device's control channel, carrying
// MEMIF_VERSION, ethernet interface mode, rte_version() as the name and,
// when one is configured, the shared secret.
// NOTE(review): i is derived from e in its initializer, before any NULL
// check on e that may follow; that check, the id assignment and the return
// values are not visible in this excerpt - confirm.
398 memif_msg_enq_init(struct rte_eth_dev *dev)
400 struct pmd_internals *pmd = dev->data->dev_private;
401 struct memif_msg_queue_elt *e = memif_msg_enq(pmd->cc);
402 memif_msg_init_t *i = &e->msg.init;
408 e->msg.type = MEMIF_MSG_TYPE_INIT;
409 i->version = MEMIF_VERSION;
411 i->mode = MEMIF_INTERFACE_MODE_ETHERNET;
413 strlcpy((char *)i->name, rte_version(), sizeof(i->name));
// The secret field is written only when a secret is configured; the queue
// element is zero-allocated by memif_msg_enq(), so it is empty otherwise.
415 if (*pmd->secret != '\0')
416 strlcpy((char *)i->secret, pmd->secret, sizeof(i->secret));
// Queue an ADD_REGION control message describing region idx of the
// process-private region table; the message size field is taken from the
// region's region_size.
// NOTE(review): the NULL check on e, the assignment of the region fd and
// index, and the return values are not visible in this excerpt.
422 memif_msg_enq_add_region(struct rte_eth_dev *dev, uint8_t idx)
424 struct pmd_internals *pmd = dev->data->dev_private;
425 struct pmd_process_private *proc_private = dev->process_private;
426 struct memif_msg_queue_elt *e = memif_msg_enq(pmd->cc);
427 memif_msg_add_region_t *ar;
428 struct memif_region *mr = proc_private->regions[idx];
433 ar = &e->msg.add_region;
434 e->msg.type = MEMIF_MSG_TYPE_ADD_REGION;
437 ar->size = mr->region_size;
// Queue an ADD_RING control message for ring idx of the given type.
// A MEMIF_RING_C2S ring is described from tx_queues[idx], any other type
// from rx_queues[idx]. The queue's interrupt fd is attached to the queue
// element (e->fd), and offset, region and log2 ring size are copied into the
// message. The C2S flag is set for C2S rings; private_hdr_size is always 0.
// NOTE(review): the NULL check on e, the index assignment and the return
// values are not visible in this excerpt.
443 memif_msg_enq_add_ring(struct rte_eth_dev *dev, uint8_t idx,
444 memif_ring_type_t type)
446 struct pmd_internals *pmd = dev->data->dev_private;
447 struct memif_msg_queue_elt *e = memif_msg_enq(pmd->cc);
448 struct memif_queue *mq;
449 memif_msg_add_ring_t *ar;
454 ar = &e->msg.add_ring;
455 mq = (type == MEMIF_RING_C2S) ? dev->data->tx_queues[idx] :
456 dev->data->rx_queues[idx];
458 e->msg.type = MEMIF_MSG_TYPE_ADD_RING;
459 e->fd = rte_intr_fd_get(mq->intr_handle);
461 ar->offset = mq->ring_offset;
462 ar->region = mq->region;
463 ar->log2_ring_size = mq->log2_ring_size;
464 ar->flags = (type == MEMIF_RING_C2S) ? MEMIF_MSG_ADD_RING_FLAG_C2S : 0;
465 ar->private_hdr_size = 0;
// Queue a CONNECT control message whose if_name is the ethdev's name
// (dev->data->name), truncated to the field size by strlcpy().
// NOTE(review): the NULL check on e, the assignment of c and the return
// values are not visible in this excerpt.
471 memif_msg_enq_connect(struct rte_eth_dev *dev)
473 struct pmd_internals *pmd = dev->data->dev_private;
474 struct memif_msg_queue_elt *e = memif_msg_enq(pmd->cc);
475 memif_msg_connect_t *c;
481 e->msg.type = MEMIF_MSG_TYPE_CONNECT;
482 strlcpy((char *)c->if_name, dev->data->name, sizeof(c->if_name));
// Queue a CONNECTED control message whose if_name is the ethdev's name
// (dev->data->name), truncated to the field size by strlcpy().
// NOTE(review): the NULL check on e and the return values are not visible
// in this excerpt.
488 memif_msg_enq_connected(struct rte_eth_dev *dev)
490 struct pmd_internals *pmd = dev->data->dev_private;
491 struct memif_msg_queue_elt *e = memif_msg_enq(pmd->cc);
492 memif_msg_connected_t *c;
497 c = &e->msg.connected;
498 e->msg.type = MEMIF_MSG_TYPE_CONNECTED;
499 strlcpy((char *)c->if_name, dev->data->name, sizeof(c->if_name));
// Cleanup callback passed to rte_intr_callback_unregister_pending() in this
// file. arg is the control channel.
// It closes the channel's fd, unlinks every element still in the message
// queue and frees the channel's interrupt instance.
// NOTE(review): the statements that free each queue element and the control
// channel itself are not visible in this excerpt - confirm.
505 memif_intr_unregister_handler(struct rte_intr_handle *intr_handle, void *arg)
507 struct memif_msg_queue_elt *elt;
508 struct memif_control_channel *cc = arg;
510 /* close control channel fd */
511 close(rte_intr_fd_get(intr_handle));
512 /* clear message queue */
513 while ((elt = TAILQ_FIRST(&cc->msg_queue)) != NULL) {
514 TAILQ_REMOVE(&cc->msg_queue, elt, next);
517 rte_intr_instance_free(cc->intr_handle);
518 /* free control channel */
// Tear down the connection state of a memif device.
// Steps visible here:
//   1. mark the link down and clear the CONNECTING/CONNECTED flags;
//   2. under pmd->cc_lock, if a control channel exists: drop every queued
//      message except DISCONNECT, send the head of the queue, warn if
//      anything is left, then unregister the control-channel callback
//      (switching to the pending variant on -EAGAIN, i.e. when called from
//      inside the callback) and close the fd / free the interrupt instance
//      when unregistration reported success (ret > 0);
//   3. close the interrupt fd of every configured ring and set it to -1;
//   4. free the shared-memory regions, zero pmd->run and log.
// NOTE(review): several statements (freeing removed elements, the "continue"
// paths for missing queues, resetting pmd->cc, declarations of i and ret)
// are not visible in this excerpt.
523 memif_disconnect(struct rte_eth_dev *dev)
525 struct pmd_internals *pmd = dev->data->dev_private;
526 struct memif_msg_queue_elt *elt, *next;
527 struct memif_queue *mq;
528 struct rte_intr_handle *ih;
532 dev->data->dev_link.link_status = RTE_ETH_LINK_DOWN;
533 pmd->flags &= ~ETH_MEMIF_FLAG_CONNECTING;
534 pmd->flags &= ~ETH_MEMIF_FLAG_CONNECTED;
536 rte_spinlock_lock(&pmd->cc_lock);
537 if (pmd->cc != NULL) {
538 /* Clear control message queue (except disconnect message if any). */
// The successor is fetched before a possible removal so the walk stays valid.
539 for (elt = TAILQ_FIRST(&pmd->cc->msg_queue); elt != NULL; elt = next) {
540 next = TAILQ_NEXT(elt, next);
541 if (elt->msg.type != MEMIF_MSG_TYPE_DISCONNECT) {
542 TAILQ_REMOVE(&pmd->cc->msg_queue, elt, next);
546 /* send disconnect message (if there is any in queue) */
547 memif_msg_send_from_queue(pmd->cc);
549 /* at this point, there should be no more messages in queue */
550 if (TAILQ_FIRST(&pmd->cc->msg_queue) != NULL) {
552 "Unexpected message(s) in message queue.");
555 ih = pmd->cc->intr_handle;
// NOTE(review): "> 0" treats descriptor 0 as "no fd" - confirm intended.
556 if (rte_intr_fd_get(ih) > 0) {
557 ret = rte_intr_callback_unregister(ih,
561 * If callback is active (disconnecting based on
562 * received control message).
564 if (ret == -EAGAIN) {
565 ret = rte_intr_callback_unregister_pending(ih,
568 memif_intr_unregister_handler);
569 } else if (ret > 0) {
570 close(rte_intr_fd_get(ih));
571 rte_intr_instance_free(ih);
577 "Failed to unregister control channel callback.");
580 rte_spinlock_unlock(&pmd->cc_lock);
582 /* unconfig interrupts */
// C2S rings: taken from tx_queues for the client role, rx_queues otherwise.
583 for (i = 0; i < pmd->cfg.num_c2s_rings; i++) {
584 if (pmd->role == MEMIF_ROLE_CLIENT) {
585 if (dev->data->tx_queues != NULL)
586 mq = dev->data->tx_queues[i];
590 if (dev->data->rx_queues != NULL)
591 mq = dev->data->rx_queues[i];
596 if (rte_intr_fd_get(mq->intr_handle) > 0) {
597 close(rte_intr_fd_get(mq->intr_handle));
598 rte_intr_fd_set(mq->intr_handle, -1);
// S2C rings: taken from tx_queues for the server role, rx_queues otherwise.
601 for (i = 0; i < pmd->cfg.num_s2c_rings; i++) {
602 if (pmd->role == MEMIF_ROLE_SERVER) {
603 if (dev->data->tx_queues != NULL)
604 mq = dev->data->tx_queues[i];
608 if (dev->data->rx_queues != NULL)
609 mq = dev->data->rx_queues[i];
614 if (rte_intr_fd_get(mq->intr_handle) > 0) {
615 close(rte_intr_fd_get(mq->intr_handle));
616 rte_intr_fd_set(mq->intr_handle, -1);
620 memif_free_regions(dev);
622 /* reset connection configuration */
623 memset(&pmd->run, 0, sizeof(pmd->run));
625 MIF_LOG(DEBUG, "Disconnected, id: %d, role: %s.", pmd->id,
626 (pmd->role == MEMIF_ROLE_SERVER) ? "server" : "client");
// Receive one control message from the channel's socket with recvmsg() and
// dispatch it by message type.
// The control buffer has room for one passed file descriptor (SCM_RIGHTS)
// and one credentials record (SCM_CREDENTIALS); both are extracted from the
// ancillary data when present.
// A message whose size is not exactly sizeof(memif_msg_t) is rejected, and
// any message other than INIT on a channel that has no device yet queues a
// disconnect with reason "Unexpected message".
// Dispatch as visible here:
//   HELLO      -> receive_hello, init regions and queues, then queue INIT,
//                 one ADD_REGION per region, one ADD_RING per c2s and s2c
//                 ring, and CONNECT
//   INIT / ADD_REGION / ADD_RING -> matching receive handler, then queue ACK
//   CONNECT    -> receive_connect, then queue CONNECTED
//   CONNECTED  -> receive_connected
//   DISCONNECT -> receive_disconnect
//   other      -> queue disconnect "Unknown message type"
// NOTE(review): the switch statement, the error checks between steps, the
// ring-type arguments and the return values are not visible in this excerpt.
630 memif_msg_receive(struct memif_control_channel *cc)
632 char ctl[CMSG_SPACE(sizeof(int)) +
633 CMSG_SPACE(sizeof(struct ucred))] = { 0 };
634 struct msghdr mh = { 0 };
636 memif_msg_t msg = { 0 };
639 struct ucred *cr __rte_unused;
641 struct cmsghdr *cmsg;
644 struct pmd_internals *pmd;
645 struct pmd_process_private *proc_private;
647 iov[0].iov_base = (void *)&msg;
648 iov[0].iov_len = sizeof(memif_msg_t);
651 mh.msg_control = ctl;
652 mh.msg_controllen = sizeof(ctl);
654 size = recvmsg(rte_intr_fd_get(cc->intr_handle), &mh, 0);
655 if (size != sizeof(memif_msg_t)) {
656 MIF_LOG(DEBUG, "Invalid message size = %zd", size);
658 /* 0 means end-of-file, negative size means error,
659 * don't send further disconnect message in such cases.
661 memif_msg_enq_disconnect(cc, "Invalid message size", 0);
664 MIF_LOG(DEBUG, "Received msg type: %u.", msg.type);
666 cmsg = CMSG_FIRSTHDR(&mh);
668 if (cmsg->cmsg_level == SOL_SOCKET) {
669 if (cmsg->cmsg_type == SCM_CREDENTIALS)
670 cr = (struct ucred *)CMSG_DATA(cmsg);
671 else if (cmsg->cmsg_type == SCM_RIGHTS)
672 rte_memcpy(&afd, CMSG_DATA(cmsg), sizeof(int));
674 cmsg = CMSG_NXTHDR(&mh, cmsg);
677 if (cc->dev == NULL && msg.type != MEMIF_MSG_TYPE_INIT) {
678 MIF_LOG(DEBUG, "Unexpected message.");
679 memif_msg_enq_disconnect(cc, "Unexpected message", 0);
683 /* get device from hash data */
685 case MEMIF_MSG_TYPE_ACK:
687 case MEMIF_MSG_TYPE_HELLO:
688 ret = memif_msg_receive_hello(cc->dev, &msg);
691 ret = memif_init_regions_and_queues(cc->dev);
694 ret = memif_msg_enq_init(cc->dev);
697 pmd = cc->dev->data->dev_private;
698 proc_private = cc->dev->process_private;
699 for (i = 0; i < proc_private->regions_num; i++) {
700 ret = memif_msg_enq_add_region(cc->dev, i);
704 for (i = 0; i < pmd->run.num_c2s_rings; i++) {
705 ret = memif_msg_enq_add_ring(cc->dev, i,
710 for (i = 0; i < pmd->run.num_s2c_rings; i++) {
711 ret = memif_msg_enq_add_ring(cc->dev, i,
716 ret = memif_msg_enq_connect(cc->dev);
720 case MEMIF_MSG_TYPE_INIT:
722 * This cc does not have an interface asociated with it.
723 * If suitable interface is found it will be assigned here.
725 ret = memif_msg_receive_init(cc, &msg);
728 ret = memif_msg_enq_ack(cc->dev);
732 case MEMIF_MSG_TYPE_ADD_REGION:
733 ret = memif_msg_receive_add_region(cc->dev, &msg, afd);
736 ret = memif_msg_enq_ack(cc->dev);
740 case MEMIF_MSG_TYPE_ADD_RING:
741 ret = memif_msg_receive_add_ring(cc->dev, &msg, afd);
744 ret = memif_msg_enq_ack(cc->dev);
748 case MEMIF_MSG_TYPE_CONNECT:
749 ret = memif_msg_receive_connect(cc->dev, &msg);
752 ret = memif_msg_enq_connected(cc->dev);
756 case MEMIF_MSG_TYPE_CONNECTED:
757 ret = memif_msg_receive_connected(cc->dev, &msg);
759 case MEMIF_MSG_TYPE_DISCONNECT:
760 ret = memif_msg_receive_disconnect(cc->dev, &msg);
765 memif_msg_enq_disconnect(cc, "Unknown message type", 0);
// Interrupt callback for a control channel; arg is the
// memif_control_channel.
// It receives and dispatches one message, then:
//   - if the channel still has no device, sends the head of the message
//     queue and schedules unregistration of this callback with
//     memif_intr_unregister_handler as the cleanup hook;
//   - otherwise sends the head of the message queue.
// The trailing statements form the failure path: a channel without a device
// only logs a warning, otherwise the device is disconnected.
// NOTE(review): the checks on ret, the early returns and the label that
// introduces the failure path are not visible in this excerpt.
775 memif_intr_handler(void *arg)
777 struct memif_control_channel *cc = arg;
780 ret = memif_msg_receive(cc);
781 /* if driver failed to assign device */
782 if (cc->dev == NULL) {
783 memif_msg_send_from_queue(cc);
784 ret = rte_intr_callback_unregister_pending(cc->intr_handle,
787 memif_intr_unregister_handler);
790 "Failed to unregister control channel callback.");
793 /* if memif_msg_receive failed */
797 ret = memif_msg_send_from_queue(cc);
804 if (cc->dev == NULL) {
805 MIF_LOG(WARNING, "eth dev not allocated");
808 memif_disconnect(cc->dev);
// Interrupt callback for a listener socket; arg is the memif_socket.
// It accepts one pending connection, allocates a zeroed control channel with
// its own interrupt instance (fd = accepted socket, type
// RTE_INTR_HANDLE_EXT), registers memif_intr_handler for it, then queues and
// sends a HELLO message.
// The final statement belongs to the error path, which frees the interrupt
// instance.
// NOTE(review): the assignments that bind cc to the socket, the error
// checks and gotos, and the rest of the cleanup path (closing sockfd,
// freeing cc) are not visible in this excerpt.
812 memif_listener_handler(void *arg)
814 struct memif_socket *socket = arg;
817 struct sockaddr_un client;
818 struct memif_control_channel *cc;
821 addr_len = sizeof(client);
822 sockfd = accept(rte_intr_fd_get(socket->intr_handle),
823 (struct sockaddr *)&client, (socklen_t *)&addr_len);
826 "Failed to accept connection request on socket fd %d",
827 rte_intr_fd_get(socket->intr_handle));
831 MIF_LOG(DEBUG, "%s: Connection request accepted.", socket->filename);
833 cc = rte_zmalloc("memif-cc", sizeof(struct memif_control_channel), 0);
835 MIF_LOG(ERR, "Failed to allocate control channel.");
839 /* Allocate interrupt instance */
840 cc->intr_handle = rte_intr_instance_alloc(RTE_INTR_INSTANCE_F_SHARED);
841 if (cc->intr_handle == NULL) {
842 MIF_LOG(ERR, "Failed to allocate intr handle");
846 if (rte_intr_fd_set(cc->intr_handle, sockfd))
849 if (rte_intr_type_set(cc->intr_handle, RTE_INTR_HANDLE_EXT))
854 TAILQ_INIT(&cc->msg_queue);
856 ret = rte_intr_callback_register(cc->intr_handle, memif_intr_handler,
859 MIF_LOG(ERR, "Failed to register control channel callback.");
// The HELLO message is queued and sent on the freshly accepted connection.
863 ret = memif_msg_enq_hello(cc);
865 MIF_LOG(ERR, "Failed to enqueue hello message.");
868 ret = memif_msg_send_from_queue(cc);
880 rte_intr_instance_free(cc->intr_handle);
// Allocate and initialise a memif_socket for the given key (socket name).
// The structure stores the listener flag and a copy of the name, and starts
// with an empty device queue.
// Visible socket setup: create an AF_UNIX SOCK_SEQPACKET socket, build the
// address (abstract form: leading NUL byte followed by the name; otherwise
// the name is used as the path), enable SO_PASSCRED, bind, listen with a
// backlog of 1, then wrap the fd in an interrupt instance and register
// memif_listener_handler on it.
// On failure the error is logged with strerror(errno) and the interrupt
// instance is freed.
// NOTE(review): which of these steps are conditional on "listener" and
// "is_abstract", the remaining cleanup and the return statements are not
// visible in this excerpt.
885 static struct memif_socket *
886 memif_socket_create(char *key, uint8_t listener, bool is_abstract)
888 struct memif_socket *sock;
889 struct sockaddr_un un = { 0 };
895 sock = rte_zmalloc("memif-socket", sizeof(struct memif_socket), 0);
897 MIF_LOG(ERR, "Failed to allocate memory for memif socket");
901 sock->listener = listener;
902 strlcpy(sock->filename, key, MEMIF_SOCKET_UN_SIZE);
903 TAILQ_INIT(&sock->dev_queue);
906 sockfd = socket(AF_UNIX, SOCK_SEQPACKET, 0);
910 un.sun_family = AF_UNIX;
912 /* abstract address */
913 un.sun_path[0] = '\0';
914 strlcpy(un.sun_path + 1, sock->filename, MEMIF_SOCKET_UN_SIZE - 1);
// Address length = bytes preceding sun_path + the leading NUL + name length,
// with the path part capped at MEMIF_SOCKET_UN_SIZE.
915 sunlen = RTE_MIN(1 + strlen(sock->filename),
916 MEMIF_SOCKET_UN_SIZE) +
917 sizeof(un) - sizeof(un.sun_path);
920 strlcpy(un.sun_path, sock->filename, MEMIF_SOCKET_UN_SIZE);
923 ret = setsockopt(sockfd, SOL_SOCKET, SO_PASSCRED, &on,
928 ret = bind(sockfd, (struct sockaddr *)&un, sunlen);
932 ret = listen(sockfd, 1);
936 MIF_LOG(DEBUG, "Memif listener socket %s created.", sock->filename);
938 /* Allocate interrupt instance */
940 rte_intr_instance_alloc(RTE_INTR_INSTANCE_F_SHARED);
941 if (sock->intr_handle == NULL) {
942 MIF_LOG(ERR, "Failed to allocate intr handle");
946 if (rte_intr_fd_set(sock->intr_handle, sockfd))
949 if (rte_intr_type_set(sock->intr_handle, RTE_INTR_HANDLE_EXT))
952 ret = rte_intr_callback_register(sock->intr_handle,
953 memif_listener_handler, sock);
955 MIF_LOG(ERR, "Failed to register interrupt "
956 "callback for listener socket");
964 MIF_LOG(ERR, "Failed to setup socket %s: %s", key, strerror(errno));
966 rte_intr_instance_free(sock->intr_handle);
// Create the hash table that maps socket names to memif_socket objects.
// Keys are fixed-size buffers of MEMIF_SOCKET_UN_SIZE bytes hashed with
// rte_jhash; the table holds up to 256 entries and may be allocated on any
// NUMA socket.
// Returns the result of rte_hash_create().
974 static struct rte_hash *
975 memif_create_socket_hash(void)
977 struct rte_hash_parameters params = { 0 };
979 params.name = MEMIF_SOCKET_HASH_NAME;
980 params.entries = 256;
981 params.key_len = MEMIF_SOCKET_UN_SIZE;
982 params.hash_func = rte_jhash;
983 params.hash_func_init_val = 0;
984 params.socket_id = SOCKET_ID_ANY;
// Pass the address of the parameter block; the argument had been corrupted
// into a pilcrow character by an encoding round-trip.
985 return rte_hash_create(&params);
// Attach a device to the memif socket named socket_filename.
// The socket hash is looked up by name and created if needed. The name is
// copied into a zero-filled MEMIF_SOCKET_UN_SIZE buffer that serves as the
// hash key. A socket object is created (as listener unless the device has
// the client role) and added to the hash, pmd->socket_filename is pointed at
// the socket's own name storage, and the device is appended to the socket's
// device queue.
// Two devices with the same id and the same role on one socket are rejected.
// NOTE(review): the conditions around the lookup/creation, the assignment of
// elt->dev and the return values are not visible in this excerpt.
989 memif_socket_init(struct rte_eth_dev *dev, const char *socket_filename)
991 struct pmd_internals *pmd = dev->data->dev_private;
992 struct memif_socket *socket = NULL;
993 struct memif_socket_dev_list_elt *elt;
994 struct pmd_internals *tmp_pmd;
995 struct rte_hash *hash;
997 char key[MEMIF_SOCKET_UN_SIZE];
999 hash = rte_hash_find_existing(MEMIF_SOCKET_HASH_NAME);
1001 hash = memif_create_socket_hash();
1003 MIF_LOG(ERR, "Failed to create memif socket hash.");
// The hash is created with a fixed key length of MEMIF_SOCKET_UN_SIZE, so
// the bytes after the string must be zeroed to be deterministic.
1008 memset(key, 0, MEMIF_SOCKET_UN_SIZE);
1009 strlcpy(key, socket_filename, MEMIF_SOCKET_UN_SIZE);
1010 ret = rte_hash_lookup_data(hash, key, (void **)&socket);
1012 socket = memif_socket_create(key,
1013 (pmd->role == MEMIF_ROLE_CLIENT) ? 0 : 1,
1014 pmd->flags & ETH_MEMIF_FLAG_SOCKET_ABSTRACT);
1017 ret = rte_hash_add_key_data(hash, key, socket);
1019 MIF_LOG(ERR, "Failed to add socket to socket hash.");
1023 pmd->socket_filename = socket->filename;
1025 TAILQ_FOREACH(elt, &socket->dev_queue, next) {
1026 tmp_pmd = elt->dev->data->dev_private;
1027 if (tmp_pmd->id == pmd->id && tmp_pmd->role == pmd->role) {
1028 MIF_LOG(ERR, "Two interfaces with the same id (%d) can "
1029 "not have the same role.", pmd->id);
1034 elt = rte_malloc("pmd-queue", sizeof(struct memif_socket_dev_list_elt), 0);
1036 MIF_LOG(ERR, "Failed to add device to socket device list.");
1040 TAILQ_INSERT_TAIL(&socket->dev_queue, elt, next);
// Detach a device from its memif socket.
// The socket is found through the socket hash using pmd->socket_filename;
// the device's entry is unlinked from the socket's device queue and
// pmd->socket_filename is cleared.
// When the queue becomes empty the socket is removed from the hash; for a
// listener on a non-abstract socket the socket file is deleted, and the
// socket's interrupt instance is freed unless the device has the client
// role.
// NOTE(review): the early exits (missing hash, NULL filename, failed
// lookup), the freeing of the list element and of the socket object are not
// visible in this excerpt.
1046 memif_socket_remove_device(struct rte_eth_dev *dev)
1048 struct pmd_internals *pmd = dev->data->dev_private;
1049 struct memif_socket *socket = NULL;
1050 struct memif_socket_dev_list_elt *elt, *next;
1051 struct rte_hash *hash;
1054 hash = rte_hash_find_existing(MEMIF_SOCKET_HASH_NAME);
1058 if (pmd->socket_filename == NULL)
1061 if (rte_hash_lookup_data(hash, pmd->socket_filename, (void **)&socket) < 0)
// The successor is fetched before a possible removal so the walk stays valid.
1064 for (elt = TAILQ_FIRST(&socket->dev_queue); elt != NULL; elt = next) {
1065 next = TAILQ_NEXT(elt, next);
1066 if (elt->dev == dev) {
1067 TAILQ_REMOVE(&socket->dev_queue, elt, next);
1069 pmd->socket_filename = NULL;
1073 /* remove socket, if this was the last device using it */
1074 if (TAILQ_EMPTY(&socket->dev_queue)) {
1075 rte_hash_del_key(hash, socket->filename);
1076 if (socket->listener && !(pmd->flags & ETH_MEMIF_FLAG_SOCKET_ABSTRACT)) {
1077 /* remove listener socket file,
1078 * so we can create new one later.
1080 ret = remove(socket->filename);
1082 MIF_LOG(ERR, "Failed to remove socket file: %s",
1085 if (pmd->role != MEMIF_ROLE_CLIENT)
1086 rte_intr_instance_free(socket->intr_handle);
// Prepare a server-role device for incoming connections: clear both the
// local and the remote disconnect strings and clear the
// ETH_MEMIF_FLAG_DISABLED flag. memif_msg_receive_init() only matches devices
// that do not have this flag set.
// NOTE(review): the return value is not visible in this excerpt.
1092 memif_connect_server(struct rte_eth_dev *dev)
1094 struct pmd_internals *pmd = dev->data->dev_private;
1096 memset(pmd->local_disc_string, 0, ETH_MEMIF_DISC_STRING_SIZE);
1097 memset(pmd->remote_disc_string, 0, ETH_MEMIF_DISC_STRING_SIZE);
1098 pmd->flags &= ~ETH_MEMIF_FLAG_DISABLED;
1103 memif_connect_client(struct rte_eth_dev *dev)
1108 struct sockaddr_un sun = { 0 };
1109 struct pmd_internals *pmd = dev->data->dev_private;
1111 memset(pmd->local_disc_string, 0, ETH_MEMIF_DISC_STRING_SIZE);
1112 memset(pmd->remote_disc_string, 0, ETH_MEMIF_DISC_STRING_SIZE);
1113 pmd->flags &= ~ETH_MEMIF_FLAG_DISABLED;
1115 sockfd = socket(AF_UNIX, SOCK_SEQPACKET, 0);
1117 MIF_LOG(ERR, "Failed to open socket.");
1121 sun.sun_family = AF_UNIX;
1122 sunlen = sizeof(struct sockaddr_un);
1123 if (pmd->flags & ETH_MEMIF_FLAG_SOCKET_ABSTRACT) {
1124 /* abstract address */
1125 sun.sun_path[0] = '\0';
1126 strlcpy(sun.sun_path + 1, pmd->socket_filename, MEMIF_SOCKET_UN_SIZE - 1);
1127 sunlen = RTE_MIN(strlen(pmd->socket_filename) + 1,
1128 MEMIF_SOCKET_UN_SIZE) +
1129 sizeof(sun) - sizeof(sun.sun_path);
1131 strlcpy(sun.sun_path, pmd->socket_filename, MEMIF_SOCKET_UN_SIZE);
1134 ret = connect(sockfd, (struct sockaddr *)&sun, sunlen);
1136 MIF_LOG(ERR, "Failed to connect socket: %s.", pmd->socket_filename);
1140 MIF_LOG(DEBUG, "Memif socket: %s connected.", pmd->socket_filename);
1142 pmd->cc = rte_zmalloc("memif-cc",
1143 sizeof(struct memif_control_channel), 0);
1144 if (pmd->cc == NULL) {
1145 MIF_LOG(ERR, "Failed to allocate control channel.");
1149 /* Allocate interrupt instance */
1150 pmd->cc->intr_handle =
1151 rte_intr_instance_alloc(RTE_INTR_INSTANCE_F_SHARED);
1152 if (pmd->cc->intr_handle == NULL) {
1153 MIF_LOG(ERR, "Failed to allocate intr handle");
1157 if (rte_intr_fd_set(pmd->cc->intr_handle, sockfd))
1160 if (rte_intr_type_set(pmd->cc->intr_handle, RTE_INTR_HANDLE_EXT))
1163 pmd->cc->socket = NULL;
1165 TAILQ_INIT(&pmd->cc->msg_queue);
1167 ret = rte_intr_callback_register(pmd->cc->intr_handle,
1168 memif_intr_handler, pmd->cc);
1170 MIF_LOG(ERR, "Failed to register interrupt callback for control fd");
1181 if (pmd->cc != NULL) {
1182 rte_intr_instance_free(pmd->cc->intr_handle);