1 /* SPDX-License-Identifier: BSD-3-Clause
2 * Copyright 2018-2019 Cisco Systems, Inc. All rights reserved.
9 #include <sys/socket.h>
10 #include <sys/ioctl.h>
13 #include <rte_version.h>
15 #include <rte_ether.h>
16 #include <ethdev_driver.h>
17 #include <ethdev_vdev.h>
18 #include <rte_malloc.h>
19 #include <rte_kvargs.h>
20 #include <rte_bus_vdev.h>
22 #include <rte_jhash.h>
23 #include <rte_string_fns.h>
25 #include "rte_eth_memif.h"
26 #include "memif_socket.h"
28 static void memif_intr_handler(void *arg);
/*
 * Send one control message on a memif control socket.
 *
 * fd  - socket descriptor handed to sendmsg()
 * msg - message to transmit; exactly sizeof(memif_msg_t) bytes are sent
 * afd - descriptor value placed in an SOL_SOCKET/SCM_RIGHTS control message
 *
 * Returns the value of sendmsg().
 * NOTE(review): the condition deciding whether the control message is
 * attached at all is not part of the visible lines - confirm in the full file.
 */
31 memif_msg_send(int fd, memif_msg_t *msg, int afd)
33 struct msghdr mh = { 0 };
/* room for one control message whose payload is a single int */
36 char ctl[CMSG_SPACE(sizeof(int))];
38 iov[0].iov_base = msg;
39 iov[0].iov_len = sizeof(memif_msg_t);
44 memset(&ctl, 0, sizeof(ctl));
46 mh.msg_controllen = sizeof(ctl);
47 cmsg = CMSG_FIRSTHDR(&mh);
48 cmsg->cmsg_len = CMSG_LEN(sizeof(int));
49 cmsg->cmsg_level = SOL_SOCKET;
50 cmsg->cmsg_type = SCM_RIGHTS;
/* the control payload is the descriptor value itself */
51 rte_memcpy(CMSG_DATA(cmsg), &afd, sizeof(int));
54 return sendmsg(fd, &mh, 0);
/*
 * Transmit the message at the head of a control channel's queue.
 *
 * The head element is sent with memif_msg_send() on the fd of the channel's
 * interrupt handle.  A result other than sizeof(memif_msg_t) is logged as an
 * error together with strerror(errno); a debug line reports the type of the
 * sent message.  The element is unlinked from the queue after the send.
 * NOTE(review): the return values and the handling of an empty queue or a
 * negative fd are not part of the visible lines.
 */
58 memif_msg_send_from_queue(struct memif_control_channel *cc)
62 struct memif_msg_queue_elt *e;
64 e = TAILQ_FIRST(&cc->msg_queue);
68 if (rte_intr_fd_get(cc->intr_handle) < 0)
71 size = memif_msg_send(rte_intr_fd_get(cc->intr_handle), &e->msg,
/* anything but a full memif_msg_t counts as a failed send */
73 if (size != sizeof(memif_msg_t)) {
74 MIF_LOG(ERR, "sendmsg fail: %s.", strerror(errno));
77 MIF_LOG(DEBUG, "Sent msg type %u.", e->msg.type);
79 TAILQ_REMOVE(&cc->msg_queue, e, next);
/*
 * Allocate a zero-initialised queue element with rte_zmalloc() and append it
 * to the tail of the control channel's message queue.  An allocation failure
 * is logged.  The callers in this file fill in the message through the
 * returned pointer.
 */
85 static struct memif_msg_queue_elt *
86 memif_msg_enq(struct memif_control_channel *cc)
88 struct memif_msg_queue_elt *e;
90 e = rte_zmalloc("memif_msg", sizeof(struct memif_msg_queue_elt), 0);
92 MIF_LOG(ERR, "Failed to allocate control message.");
97 TAILQ_INSERT_TAIL(&cc->msg_queue, e, next);
/*
 * Queue a DISCONNECT message on a control channel.
 *
 * When a reason is given it is copied into the message and, if the channel is
 * bound to a device, also kept in that device's local_disc_string.
 * NOTE(review): the parameter(s) following reason and the return values are
 * not part of the visible lines; the callers in this file pass 0 as the third
 * argument.
 */
103 memif_msg_enq_disconnect(struct memif_control_channel *cc, const char *reason,
106 struct memif_msg_queue_elt *e;
107 struct pmd_internals *pmd;
108 memif_msg_disconnect_t *d;
111 MIF_LOG(DEBUG, "Missing control channel.");
115 e = memif_msg_enq(cc);
117 MIF_LOG(WARNING, "Failed to enqueue disconnect message.");
121 d = &e->msg.disconnect;
123 e->msg.type = MEMIF_MSG_TYPE_DISCONNECT;
126 if (reason != NULL) {
/* both copies are bounded by the size of their destination buffer */
127 strlcpy((char *)d->string, reason, sizeof(d->string));
128 if (cc->dev != NULL) {
129 pmd = cc->dev->data->dev_private;
130 strlcpy(pmd->local_disc_string, reason,
131 sizeof(pmd->local_disc_string));
/*
 * Queue the HELLO message that advertises this side's limits: MEMIF_VERSION
 * as both minimum and maximum version, the ring, region and log2 ring size
 * limits, and rte_version() as the name.
 * NOTE(review): the assignment of h and the return values are not part of the
 * visible lines.
 */
137 memif_msg_enq_hello(struct memif_control_channel *cc)
139 struct memif_msg_queue_elt *e = memif_msg_enq(cc);
140 memif_msg_hello_t *h;
147 e->msg.type = MEMIF_MSG_TYPE_HELLO;
148 h->min_version = MEMIF_VERSION;
149 h->max_version = MEMIF_VERSION;
150 h->max_c2s_ring = ETH_MEMIF_MAX_NUM_Q_PAIRS;
151 h->max_s2c_ring = ETH_MEMIF_MAX_NUM_Q_PAIRS;
/* NOTE(review): only the region limit is reduced by one - presumably a zero-based maximum index; confirm */
152 h->max_region = ETH_MEMIF_MAX_REGION_NUM - 1;
153 h->max_log2_ring_size = ETH_MEMIF_MAX_LOG2_RING_SIZE;
155 strlcpy((char *)h->name, rte_version(), sizeof(h->name));
/*
 * Process the peer's HELLO message.
 *
 * A peer whose [min_version, max_version] range does not include
 * MEMIF_VERSION gets a DISCONNECT queued.  The run-time ring counts and log2
 * ring size are set to the smaller of the peer's advertised limit (ring
 * limits plus one) and the local configuration; the packet buffer size is
 * taken from the local configuration.  The peer's name is stored in
 * pmd->remote_name and logged.
 * NOTE(review): the return statements are not part of the visible lines.
 */
161 memif_msg_receive_hello(struct rte_eth_dev *dev, memif_msg_t *msg)
163 struct pmd_internals *pmd = dev->data->dev_private;
164 memif_msg_hello_t *h = &msg->hello;
166 if (h->min_version > MEMIF_VERSION || h->max_version < MEMIF_VERSION) {
167 memif_msg_enq_disconnect(pmd->cc, "Incompatible memif version", 0);
171 /* Set parameters for active connection */
172 pmd->run.num_c2s_rings = RTE_MIN(h->max_c2s_ring + 1,
173 pmd->cfg.num_c2s_rings);
174 pmd->run.num_s2c_rings = RTE_MIN(h->max_s2c_ring + 1,
175 pmd->cfg.num_s2c_rings);
176 pmd->run.log2_ring_size = RTE_MIN(h->max_log2_ring_size,
177 pmd->cfg.log2_ring_size);
178 pmd->run.pkt_buffer_size = pmd->cfg.pkt_buffer_size;
180 strlcpy(pmd->remote_name, (char *)h->name, sizeof(pmd->remote_name));
182 MIF_LOG(DEBUG, "Connecting to %s.", pmd->remote_name);
/*
 * Process an INIT message arriving on a control channel.
 *
 * The message must carry MEMIF_VERSION and the channel must belong to a
 * socket.  The socket's device list is searched for a device that is not
 * disabled, has the server role and the requested id.  A match is refused
 * when it is already connecting or connected, when the peer asks for a mode
 * other than ethernet, or when a locally configured secret is absent from or
 * different in the message.  The visible lines also store the peer name and
 * set ETH_MEMIF_FLAG_CONNECTING on the device.  When no device matches,
 * "ID not found" is queued as the disconnect reason.
 * NOTE(review): the return statements and the lines that bind cc to the
 * device are not part of the visible lines.
 */
188 memif_msg_receive_init(struct memif_control_channel *cc, memif_msg_t *msg)
190 memif_msg_init_t *i = &msg->init;
191 struct memif_socket_dev_list_elt *elt;
192 struct pmd_internals *pmd;
193 struct rte_eth_dev *dev;
195 if (i->version != MEMIF_VERSION) {
196 memif_msg_enq_disconnect(cc, "Incompatible memif version", 0);
200 if (cc->socket == NULL) {
201 memif_msg_enq_disconnect(cc, "Device error", 0);
205 /* Find device with requested ID */
206 TAILQ_FOREACH(elt, &cc->socket->dev_queue, next) {
208 pmd = dev->data->dev_private;
209 if (((pmd->flags & ETH_MEMIF_FLAG_DISABLED) == 0) &&
210 (pmd->id == i->id) && (pmd->role == MEMIF_ROLE_SERVER)) {
211 if (pmd->flags & (ETH_MEMIF_FLAG_CONNECTING |
212 ETH_MEMIF_FLAG_CONNECTED)) {
213 memif_msg_enq_disconnect(cc,
214 "Already connected", 0);
218 /* assign control channel to device */
222 if (i->mode != MEMIF_INTERFACE_MODE_ETHERNET) {
223 memif_msg_enq_disconnect(pmd->cc,
224 "Only ethernet mode supported",
229 strlcpy(pmd->remote_name, (char *)i->name,
230 sizeof(pmd->remote_name));
/* a secret is only enforced when one is configured locally */
232 if (*pmd->secret != '\0') {
233 if (*i->secret == '\0') {
234 memif_msg_enq_disconnect(pmd->cc,
235 "Secret required", 0);
/* compares at most ETH_MEMIF_SECRET_SIZE bytes of the two secrets */
238 if (strncmp(pmd->secret, (char *)i->secret,
239 ETH_MEMIF_SECRET_SIZE) != 0) {
240 memif_msg_enq_disconnect(pmd->cc,
241 "Incorrect secret", 0);
246 pmd->flags |= ETH_MEMIF_FLAG_CONNECTING;
251 /* ID not found on this socket */
252 MIF_LOG(DEBUG, "ID %u not found.", i->id);
253 memif_msg_enq_disconnect(cc, "ID not found", 0);
/*
 * Process an ADD_REGION message: record a new memory region.
 *
 * The region index must be below ETH_MEMIF_MAX_REGION_NUM, equal to the
 * current region count and refer to an empty slot.  A zeroed memif_region is
 * allocated, given the size from the message, stored in the slot and counted.
 * Each rejected case queues a DISCONNECT carrying the reason.
 * NOTE(review): the rest of the parameter list, the fd handling and the
 * return statements are not part of the visible lines.
 */
258 memif_msg_receive_add_region(struct rte_eth_dev *dev, memif_msg_t *msg,
261 struct pmd_internals *pmd = dev->data->dev_private;
262 struct pmd_process_private *proc_private = dev->process_private;
263 memif_msg_add_region_t *ar = &msg->add_region;
264 struct memif_region *r;
267 memif_msg_enq_disconnect(pmd->cc, "Missing region fd", 0);
/* the bound is tested first, so regions[] is never indexed out of range */
271 if (ar->index >= ETH_MEMIF_MAX_REGION_NUM ||
272 ar->index != proc_private->regions_num ||
273 proc_private->regions[ar->index] != NULL) {
274 memif_msg_enq_disconnect(pmd->cc, "Invalid region index", 0);
278 r = rte_zmalloc("region", sizeof(struct memif_region), 0);
280 memif_msg_enq_disconnect(pmd->cc, "Failed to alloc memif region.", 0);
285 r->region_size = ar->size;
288 proc_private->regions[ar->index] = r;
289 proc_private->regions_num++;
/*
 * Process an ADD_RING message: attach ring parameters to a local queue.
 *
 * The ring index is checked against the configured number of rings for its
 * direction and the matching run-time ring counter is incremented.  Rings
 * flagged C2S map to rx_queues[index], all others to tx_queues[index].  The
 * received fd is set as the queue's interrupt fd, and the log2 ring size,
 * region and ring offset are copied from the message.
 * NOTE(review): the fd validity test and the return statements are not part
 * of the visible lines.
 */
295 memif_msg_receive_add_ring(struct rte_eth_dev *dev, memif_msg_t *msg, int fd)
297 struct pmd_internals *pmd = dev->data->dev_private;
298 memif_msg_add_ring_t *ar = &msg->add_ring;
299 struct memif_queue *mq;
302 memif_msg_enq_disconnect(pmd->cc, "Missing interrupt fd", 0);
306 /* check if we have enough queues */
307 if (ar->flags & MEMIF_MSG_ADD_RING_FLAG_C2S) {
308 if (ar->index >= pmd->cfg.num_c2s_rings) {
309 memif_msg_enq_disconnect(pmd->cc, "Invalid ring index", 0);
312 pmd->run.num_c2s_rings++;
314 if (ar->index >= pmd->cfg.num_s2c_rings) {
315 memif_msg_enq_disconnect(pmd->cc, "Invalid ring index", 0);
318 pmd->run.num_s2c_rings++;
/* on the receiving side a C2S ring is an rx queue, any other ring a tx queue */
321 mq = (ar->flags & MEMIF_MSG_ADD_RING_FLAG_C2S) ?
322 dev->data->rx_queues[ar->index] : dev->data->tx_queues[ar->index];
324 if (rte_intr_fd_set(mq->intr_handle, fd))
327 mq->log2_ring_size = ar->log2_ring_size;
328 mq->region = ar->region;
329 mq->ring_offset = ar->offset;
/*
 * Process a CONNECT message: run memif_connect() for the device, then store
 * the peer's interface name in pmd->remote_if_name and log it.
 * NOTE(review): how the memif_connect() result is checked is not part of the
 * visible lines.
 */
335 memif_msg_receive_connect(struct rte_eth_dev *dev, memif_msg_t *msg)
337 struct pmd_internals *pmd = dev->data->dev_private;
338 memif_msg_connect_t *c = &msg->connect;
341 ret = memif_connect(dev);
345 strlcpy(pmd->remote_if_name, (char *)c->if_name,
346 sizeof(pmd->remote_if_name));
347 MIF_LOG(INFO, "Remote interface %s connected.", pmd->remote_if_name);
/*
 * Process a CONNECTED message: run memif_connect() for the device, then store
 * the peer's interface name in pmd->remote_if_name and log it.
 * NOTE(review): how the memif_connect() result is checked is not part of the
 * visible lines.
 */
353 memif_msg_receive_connected(struct rte_eth_dev *dev, memif_msg_t *msg)
355 struct pmd_internals *pmd = dev->data->dev_private;
356 memif_msg_connected_t *c = &msg->connected;
359 ret = memif_connect(dev);
363 strlcpy(pmd->remote_if_name, (char *)c->if_name,
364 sizeof(pmd->remote_if_name));
365 MIF_LOG(INFO, "Remote interface %s connected.", pmd->remote_if_name);
/*
 * Handle a DISCONNECT message received from the peer.
 *
 * The peer's reason string is stored in pmd->remote_disc_string (the buffer
 * is cleared first and the copy is bounded by its size) and logged.  The
 * local reason string is then cleared and the device is torn down with
 * memif_disconnect().
 */
371 memif_msg_receive_disconnect(struct rte_eth_dev *dev, memif_msg_t *msg)
373 struct pmd_internals *pmd = dev->data->dev_private;
374 memif_msg_disconnect_t *d = &msg->disconnect;
376 memset(pmd->remote_disc_string, 0, sizeof(pmd->remote_disc_string));
377 strlcpy(pmd->remote_disc_string, (char *)d->string,
378 sizeof(pmd->remote_disc_string));
380 MIF_LOG(INFO, "Disconnect received: %s", pmd->remote_disc_string);
/* size the clear from the buffer itself instead of a hard-coded byte count */
382 memset(pmd->local_disc_string, 0, sizeof(pmd->local_disc_string));
383 memif_disconnect(dev);
/*
 * Queue an ACK message on the device's control channel.
 * NOTE(review): the check of the allocated element and the return values are
 * not part of the visible lines.
 */
388 memif_msg_enq_ack(struct rte_eth_dev *dev)
390 struct pmd_internals *pmd = dev->data->dev_private;
391 struct memif_msg_queue_elt *e = memif_msg_enq(pmd->cc);
395 e->msg.type = MEMIF_MSG_TYPE_ACK;
/*
 * Queue an INIT message on the device's control channel.
 *
 * The message carries MEMIF_VERSION, the ethernet interface mode and
 * rte_version() as the name; the secret is included only when one is
 * configured on the device.
 * NOTE(review): the declaration and assignment of i, any further fields and
 * the return values are not part of the visible lines.
 */
401 memif_msg_enq_init(struct rte_eth_dev *dev)
403 struct pmd_internals *pmd = dev->data->dev_private;
404 struct memif_msg_queue_elt *e = memif_msg_enq(pmd->cc);
410 e->msg.type = MEMIF_MSG_TYPE_INIT;
411 i->version = MEMIF_VERSION;
413 i->mode = MEMIF_INTERFACE_MODE_ETHERNET;
415 strlcpy((char *)i->name, rte_version(), sizeof(i->name));
/* an empty local secret leaves the message field untouched */
417 if (*pmd->secret != '\0')
418 strlcpy((char *)i->secret, pmd->secret, sizeof(i->secret));
/*
 * Queue an ADD_REGION message describing region idx of this process.
 *
 * The region size is taken from proc_private->regions[idx].
 * NOTE(review): the remaining message fields and the return values are not
 * part of the visible lines.
 */
424 memif_msg_enq_add_region(struct rte_eth_dev *dev, uint8_t idx)
426 struct pmd_internals *pmd = dev->data->dev_private;
427 struct pmd_process_private *proc_private = dev->process_private;
428 struct memif_msg_queue_elt *e = memif_msg_enq(pmd->cc);
429 memif_msg_add_region_t *ar;
430 struct memif_region *mr = proc_private->regions[idx];
435 ar = &e->msg.add_region;
436 e->msg.type = MEMIF_MSG_TYPE_ADD_REGION;
439 ar->size = mr->region_size;
/*
 * Queue an ADD_RING message describing one local ring.
 *
 * dev  - device owning the queues
 * idx  - queue index
 * type - MEMIF_RING_C2S selects tx_queues[idx]; any other value selects
 *        rx_queues[idx]
 *
 * The queue's interrupt fd is stored in the queue element (e->fd); offset,
 * region and log2 ring size are copied from the queue, and the C2S flag is
 * set for C2S rings.
 * NOTE(review): the index field and the return values are not part of the
 * visible lines.
 */
445 memif_msg_enq_add_ring(struct rte_eth_dev *dev, uint8_t idx,
446 memif_ring_type_t type)
448 struct pmd_internals *pmd = dev->data->dev_private;
449 struct memif_msg_queue_elt *e = memif_msg_enq(pmd->cc);
450 struct memif_queue *mq;
451 memif_msg_add_ring_t *ar;
456 ar = &e->msg.add_ring;
/* on the sending side a C2S ring is a tx queue, any other ring an rx queue */
457 mq = (type == MEMIF_RING_C2S) ? dev->data->tx_queues[idx] :
458 dev->data->rx_queues[idx];
460 e->msg.type = MEMIF_MSG_TYPE_ADD_RING;
461 e->fd = rte_intr_fd_get(mq->intr_handle);
463 ar->offset = mq->ring_offset;
464 ar->region = mq->region;
465 ar->log2_ring_size = mq->log2_ring_size;
466 ar->flags = (type == MEMIF_RING_C2S) ? MEMIF_MSG_ADD_RING_FLAG_C2S : 0;
467 ar->private_hdr_size = 0;
/*
 * Queue a CONNECT message carrying the device name (dev->data->name) as the
 * interface name.
 * NOTE(review): the assignment of c and the return values are not part of the
 * visible lines.
 */
473 memif_msg_enq_connect(struct rte_eth_dev *dev)
475 struct pmd_internals *pmd = dev->data->dev_private;
476 struct memif_msg_queue_elt *e = memif_msg_enq(pmd->cc);
477 memif_msg_connect_t *c;
483 e->msg.type = MEMIF_MSG_TYPE_CONNECT;
484 strlcpy((char *)c->if_name, dev->data->name, sizeof(c->if_name));
/*
 * Queue a CONNECTED message carrying the device name (dev->data->name) as the
 * interface name.
 * NOTE(review): the check of the allocated element and the return values are
 * not part of the visible lines.
 */
490 memif_msg_enq_connected(struct rte_eth_dev *dev)
492 struct pmd_internals *pmd = dev->data->dev_private;
493 struct memif_msg_queue_elt *e = memif_msg_enq(pmd->cc);
494 memif_msg_connected_t *c;
499 c = &e->msg.connected;
500 e->msg.type = MEMIF_MSG_TYPE_CONNECTED;
501 strlcpy((char *)c->if_name, dev->data->name, sizeof(c->if_name));
/*
 * Tear down a control channel; arg is the memif_control_channel.
 *
 * This file passes the function to rte_intr_callback_unregister_pending().
 * It closes the channel fd when that fd is valid (>= 0), drains the message
 * queue and frees the channel's interrupt instance.
 * NOTE(review): the freeing of the queue elements and of the channel itself
 * is not part of the visible lines.
 */
507 memif_intr_unregister_handler(struct rte_intr_handle *intr_handle, void *arg)
509 struct memif_msg_queue_elt *elt;
510 struct memif_control_channel *cc = arg;
512 /* close control channel fd */
513 if (rte_intr_fd_get(intr_handle) >= 0)
514 close(rte_intr_fd_get(intr_handle));
515 /* clear message queue */
516 while ((elt = TAILQ_FIRST(&cc->msg_queue)) != NULL) {
517 TAILQ_REMOVE(&cc->msg_queue, elt, next);
520 rte_intr_instance_free(cc->intr_handle);
521 /* free control channel */
/*
 * Bring a memif device down and release its connection state.
 *
 * - marks the link down and clears the CONNECTING and CONNECTED flags
 * - under pmd->cc_lock: removes every queued control message except
 *   DISCONNECT, sends the head of the queue with memif_msg_send_from_queue()
 *   and unregisters the control channel interrupt callback
 * - closes the interrupt fd of the c2s and s2c queues and resets it to -1
 * - frees the regions and zeroes pmd->run
 * NOTE(review): several statements (declarations, else branches, freeing of
 * removed elements) are not part of the visible lines.
 */
526 memif_disconnect(struct rte_eth_dev *dev)
528 struct pmd_internals *pmd = dev->data->dev_private;
529 struct memif_msg_queue_elt *elt, *next;
530 struct memif_queue *mq;
531 struct rte_intr_handle *ih;
535 dev->data->dev_link.link_status = RTE_ETH_LINK_DOWN;
536 pmd->flags &= ~ETH_MEMIF_FLAG_CONNECTING;
537 pmd->flags &= ~ETH_MEMIF_FLAG_CONNECTED;
539 rte_spinlock_lock(&pmd->cc_lock);
540 if (pmd->cc != NULL) {
541 /* Clear control message queue (except disconnect message if any). */
542 for (elt = TAILQ_FIRST(&pmd->cc->msg_queue); elt != NULL; elt = next) {
/* fetch the successor first: elt may be unlinked below */
543 next = TAILQ_NEXT(elt, next);
544 if (elt->msg.type != MEMIF_MSG_TYPE_DISCONNECT) {
545 TAILQ_REMOVE(&pmd->cc->msg_queue, elt, next);
549 /* send disconnect message (if there is any in queue) */
550 memif_msg_send_from_queue(pmd->cc);
552 /* at this point, there should be no more messages in queue */
553 if (TAILQ_FIRST(&pmd->cc->msg_queue) != NULL) {
555 "Unexpected message(s) in message queue.");
558 ih = pmd->cc->intr_handle;
/* NOTE(review): the test is "> 0", so fd 0 is treated like no fd, while memif_intr_unregister_handler() tests ">= 0" - confirm intent */
559 if (rte_intr_fd_get(ih) > 0) {
560 ret = rte_intr_callback_unregister(ih,
564 * If callback is active (disconnecting based on
565 * received control message).
567 if (ret == -EAGAIN) {
568 ret = rte_intr_callback_unregister_pending(ih,
571 memif_intr_unregister_handler);
572 } else if (ret > 0) {
573 close(rte_intr_fd_get(ih));
574 rte_intr_instance_free(ih);
580 "Failed to unregister control channel callback.");
583 rte_spinlock_unlock(&pmd->cc_lock);
585 /* unconfig interrupts */
586 for (i = 0; i < pmd->cfg.num_c2s_rings; i++) {
/* for c2s rings the client branch uses tx_queues[i]; the other visible branch uses rx_queues[i] */
587 if (pmd->role == MEMIF_ROLE_CLIENT) {
588 if (dev->data->tx_queues != NULL)
589 mq = dev->data->tx_queues[i];
593 if (dev->data->rx_queues != NULL)
594 mq = dev->data->rx_queues[i];
599 if (rte_intr_fd_get(mq->intr_handle) > 0) {
600 close(rte_intr_fd_get(mq->intr_handle));
601 rte_intr_fd_set(mq->intr_handle, -1);
604 for (i = 0; i < pmd->cfg.num_s2c_rings; i++) {
/* for s2c rings the server branch uses tx_queues[i]; the other visible branch uses rx_queues[i] */
605 if (pmd->role == MEMIF_ROLE_SERVER) {
606 if (dev->data->tx_queues != NULL)
607 mq = dev->data->tx_queues[i];
611 if (dev->data->rx_queues != NULL)
612 mq = dev->data->rx_queues[i];
617 if (rte_intr_fd_get(mq->intr_handle) > 0) {
618 close(rte_intr_fd_get(mq->intr_handle));
619 rte_intr_fd_set(mq->intr_handle, -1);
623 memif_free_regions(dev);
625 /* reset connection configuration */
626 memset(&pmd->run, 0, sizeof(pmd->run));
628 MIF_LOG(DEBUG, "Disconnected, id: %d, role: %s.", pmd->id,
629 (pmd->role == MEMIF_ROLE_SERVER) ? "server" : "client");
/*
 * Receive one control message from a control channel and dispatch on its type.
 *
 * The message is read with recvmsg() into a memif_msg_t, together with a
 * control buffer sized for an int and a struct ucred.  SOL_SOCKET control
 * messages are scanned: an SCM_CREDENTIALS payload is referenced through cr
 * and an SCM_RIGHTS payload is copied into afd.  A channel without a device
 * accepts only INIT; any other type queues "Unexpected message".
 *
 * Per message type, as far as visible here:
 *   HELLO      - memif_msg_receive_hello(), memif_init_regions_and_queues(),
 *                then INIT, one ADD_REGION per region, one ADD_RING per c2s
 *                and per s2c ring, and CONNECT are queued
 *   INIT, ADD_REGION, ADD_RING
 *              - the receive function runs, then an ACK is queued
 *   CONNECT    - the receive function runs, then CONNECTED is queued
 *   CONNECTED, DISCONNECT
 *              - handled by their receive functions
 * The last visible branch queues "Unknown message type" as disconnect reason.
 * NOTE(review): the error checks between these calls, the switch labels that
 * were dropped and the return statements are not part of the visible lines.
 */
633 memif_msg_receive(struct memif_control_channel *cc)
/* control buffer for one int (a passed fd) plus one struct ucred */
635 char ctl[CMSG_SPACE(sizeof(int)) +
636 CMSG_SPACE(sizeof(struct ucred))] = { 0 };
637 struct msghdr mh = { 0 };
639 memif_msg_t msg = { 0 };
642 struct ucred *cr __rte_unused;
644 struct cmsghdr *cmsg;
647 struct pmd_internals *pmd;
648 struct pmd_process_private *proc_private;
650 iov[0].iov_base = (void *)&msg;
651 iov[0].iov_len = sizeof(memif_msg_t);
654 mh.msg_control = ctl;
655 mh.msg_controllen = sizeof(ctl);
657 if (rte_intr_fd_get(cc->intr_handle) < 0)
660 size = recvmsg(rte_intr_fd_get(cc->intr_handle), &mh, 0);
661 if (size != sizeof(memif_msg_t)) {
662 MIF_LOG(DEBUG, "Invalid message size = %zd", size);
664 /* 0 means end-of-file, negative size means error,
665 * don't send further disconnect message in such cases.
667 memif_msg_enq_disconnect(cc, "Invalid message size", 0);
670 MIF_LOG(DEBUG, "Received msg type: %u.", msg.type);
672 cmsg = CMSG_FIRSTHDR(&mh);
674 if (cmsg->cmsg_level == SOL_SOCKET) {
675 if (cmsg->cmsg_type == SCM_CREDENTIALS)
676 cr = (struct ucred *)CMSG_DATA(cmsg);
677 else if (cmsg->cmsg_type == SCM_RIGHTS)
678 rte_memcpy(&afd, CMSG_DATA(cmsg), sizeof(int));
680 cmsg = CMSG_NXTHDR(&mh, cmsg);
683 if (cc->dev == NULL && msg.type != MEMIF_MSG_TYPE_INIT) {
684 MIF_LOG(DEBUG, "Unexpected message.");
685 memif_msg_enq_disconnect(cc, "Unexpected message", 0);
689 /* get device from hash data */
691 case MEMIF_MSG_TYPE_ACK:
693 case MEMIF_MSG_TYPE_HELLO:
694 ret = memif_msg_receive_hello(cc->dev, &msg);
697 ret = memif_init_regions_and_queues(cc->dev);
700 ret = memif_msg_enq_init(cc->dev);
703 pmd = cc->dev->data->dev_private;
704 proc_private = cc->dev->process_private;
/* describe every region and ring to the peer before asking it to connect */
705 for (i = 0; i < proc_private->regions_num; i++) {
706 ret = memif_msg_enq_add_region(cc->dev, i);
710 for (i = 0; i < pmd->run.num_c2s_rings; i++) {
711 ret = memif_msg_enq_add_ring(cc->dev, i,
716 for (i = 0; i < pmd->run.num_s2c_rings; i++) {
717 ret = memif_msg_enq_add_ring(cc->dev, i,
722 ret = memif_msg_enq_connect(cc->dev);
726 case MEMIF_MSG_TYPE_INIT:
728 * This cc does not have an interface associated with it.
729 * If suitable interface is found it will be assigned here.
731 ret = memif_msg_receive_init(cc, &msg);
734 ret = memif_msg_enq_ack(cc->dev);
738 case MEMIF_MSG_TYPE_ADD_REGION:
739 ret = memif_msg_receive_add_region(cc->dev, &msg, afd);
742 ret = memif_msg_enq_ack(cc->dev);
746 case MEMIF_MSG_TYPE_ADD_RING:
747 ret = memif_msg_receive_add_ring(cc->dev, &msg, afd);
750 ret = memif_msg_enq_ack(cc->dev);
754 case MEMIF_MSG_TYPE_CONNECT:
755 ret = memif_msg_receive_connect(cc->dev, &msg);
758 ret = memif_msg_enq_connected(cc->dev);
762 case MEMIF_MSG_TYPE_CONNECTED:
763 ret = memif_msg_receive_connected(cc->dev, &msg);
765 case MEMIF_MSG_TYPE_DISCONNECT:
766 ret = memif_msg_receive_disconnect(cc->dev, &msg);
771 memif_msg_enq_disconnect(cc, "Unknown message type", 0);
/*
 * Interrupt callback of a control channel; arg is the memif_control_channel.
 *
 * Runs memif_msg_receive().  If the channel has no device afterwards, the
 * head of the message queue is sent and the callback is scheduled for removal
 * with memif_intr_unregister_handler() as the cleanup function.  Otherwise
 * the head of the message queue is sent.  The final visible lines warn when
 * the channel has no device and call memif_disconnect() on cc->dev.
 * NOTE(review): the conditions and jumps that lead to the disconnect path are
 * not part of the visible lines.
 */
781 memif_intr_handler(void *arg)
783 struct memif_control_channel *cc = arg;
786 ret = memif_msg_receive(cc);
787 /* if driver failed to assign device */
788 if (cc->dev == NULL) {
789 memif_msg_send_from_queue(cc);
790 ret = rte_intr_callback_unregister_pending(cc->intr_handle,
793 memif_intr_unregister_handler);
796 "Failed to unregister control channel callback.");
799 /* if memif_msg_receive failed */
803 ret = memif_msg_send_from_queue(cc);
810 if (cc->dev == NULL) {
811 MIF_LOG(WARNING, "eth dev not allocated");
814 memif_disconnect(cc->dev);
/*
 * Interrupt callback of a listener socket; arg is the memif_socket.
 *
 * Accepts a pending connection, allocates a zeroed control channel and a
 * shared interrupt instance for the accepted fd (type RTE_INTR_HANDLE_EXT),
 * registers memif_intr_handler() on it, then queues and sends the HELLO
 * message.  The visible cleanup line frees the channel's interrupt instance.
 * NOTE(review): the error checks, the remaining channel setup and the rest of
 * the cleanup are not part of the visible lines.
 */
818 memif_listener_handler(void *arg)
820 struct memif_socket *socket = arg;
823 struct sockaddr_un client;
824 struct memif_control_channel *cc;
827 addr_len = sizeof(client);
828 sockfd = accept(rte_intr_fd_get(socket->intr_handle),
829 (struct sockaddr *)&client, (socklen_t *)&addr_len);
832 "Failed to accept connection request on socket fd %d",
833 rte_intr_fd_get(socket->intr_handle));
837 MIF_LOG(DEBUG, "%s: Connection request accepted.", socket->filename);
839 cc = rte_zmalloc("memif-cc", sizeof(struct memif_control_channel), 0);
841 MIF_LOG(ERR, "Failed to allocate control channel.");
845 /* Allocate interrupt instance */
846 cc->intr_handle = rte_intr_instance_alloc(RTE_INTR_INSTANCE_F_SHARED);
847 if (cc->intr_handle == NULL) {
848 MIF_LOG(ERR, "Failed to allocate intr handle");
852 if (rte_intr_fd_set(cc->intr_handle, sockfd))
855 if (rte_intr_type_set(cc->intr_handle, RTE_INTR_HANDLE_EXT))
860 TAILQ_INIT(&cc->msg_queue);
862 ret = rte_intr_callback_register(cc->intr_handle, memif_intr_handler,
865 MIF_LOG(ERR, "Failed to register control channel callback.");
/* the server side opens the handshake: HELLO is queued and sent right away */
869 ret = memif_msg_enq_hello(cc);
871 MIF_LOG(ERR, "Failed to enqueue hello message.");
874 ret = memif_msg_send_from_queue(cc);
886 rte_intr_instance_free(cc->intr_handle);
891 static struct memif_socket *
892 memif_socket_create(char *key, uint8_t listener, bool is_abstract)
894 struct memif_socket *sock;
895 struct sockaddr_un un = { 0 };
901 sock = rte_zmalloc("memif-socket", sizeof(struct memif_socket), 0);
903 MIF_LOG(ERR, "Failed to allocate memory for memif socket");
907 sock->listener = listener;
908 strlcpy(sock->filename, key, MEMIF_SOCKET_UN_SIZE);
909 TAILQ_INIT(&sock->dev_queue);
912 sockfd = socket(AF_UNIX, SOCK_SEQPACKET, 0);
916 un.sun_family = AF_UNIX;
918 /* abstract address */
919 un.sun_path[0] = '\0';
920 strlcpy(un.sun_path + 1, sock->filename, MEMIF_SOCKET_UN_SIZE - 1);
921 sunlen = RTE_MIN(1 + strlen(sock->filename),
922 MEMIF_SOCKET_UN_SIZE) +
923 sizeof(un) - sizeof(un.sun_path);
926 strlcpy(un.sun_path, sock->filename, MEMIF_SOCKET_UN_SIZE);
929 ret = setsockopt(sockfd, SOL_SOCKET, SO_PASSCRED, &on,
934 ret = bind(sockfd, (struct sockaddr *)&un, sunlen);
938 ret = listen(sockfd, 1);
942 MIF_LOG(DEBUG, "Memif listener socket %s created.", sock->filename);
944 /* Allocate interrupt instance */
946 rte_intr_instance_alloc(RTE_INTR_INSTANCE_F_SHARED);
947 if (sock->intr_handle == NULL) {
948 MIF_LOG(ERR, "Failed to allocate intr handle");
952 if (rte_intr_fd_set(sock->intr_handle, sockfd))
955 if (rte_intr_type_set(sock->intr_handle, RTE_INTR_HANDLE_EXT))
958 ret = rte_intr_callback_register(sock->intr_handle,
959 memif_listener_handler, sock);
961 MIF_LOG(ERR, "Failed to register interrupt "
962 "callback for listener socket");
970 MIF_LOG(ERR, "Failed to setup socket %s: %s", key, strerror(errno));
972 rte_intr_instance_free(sock->intr_handle);
/*
 * Create the hash table that maps socket file names to memif sockets.
 *
 * The table is named MEMIF_SOCKET_HASH_NAME, holds up to 256 entries, uses
 * fixed-size keys of MEMIF_SOCKET_UN_SIZE bytes hashed with rte_jhash
 * (initial value 0) and may be allocated on any NUMA socket.
 *
 * Returns the result of rte_hash_create().
 */
980 static struct rte_hash *
981 memif_create_socket_hash(void)
983 struct rte_hash_parameters params = { 0 };
985 params.name = MEMIF_SOCKET_HASH_NAME;
986 params.entries = 256;
987 params.key_len = MEMIF_SOCKET_UN_SIZE;
988 params.hash_func = rte_jhash;
989 params.hash_func_init_val = 0;
990 params.socket_id = SOCKET_ID_ANY;
/* pass the address of the parameter block */
991 return rte_hash_create(&params);
/*
 * Attach a device to the memif socket identified by socket_filename.
 *
 * Sockets are kept in the hash named MEMIF_SOCKET_HASH_NAME.  The visible
 * lines look the hash up with rte_hash_find_existing() and create it with
 * memif_create_socket_hash(), look the socket up by key and create/add it
 * with memif_socket_create() and rte_hash_add_key_data(), point
 * pmd->socket_filename at the socket's own filename buffer, reject a second
 * device with the same id and role on the socket, and append a new list
 * element to the socket's device queue.
 * NOTE(review): the conditions guarding the create paths, the filling of the
 * new list element and the return values are not part of the visible lines.
 */
995 memif_socket_init(struct rte_eth_dev *dev, const char *socket_filename)
997 struct pmd_internals *pmd = dev->data->dev_private;
998 struct memif_socket *socket = NULL;
999 struct memif_socket_dev_list_elt *elt;
1000 struct pmd_internals *tmp_pmd;
1001 struct rte_hash *hash;
1003 char key[MEMIF_SOCKET_UN_SIZE];
1005 hash = rte_hash_find_existing(MEMIF_SOCKET_HASH_NAME);
1007 hash = memif_create_socket_hash();
1009 MIF_LOG(ERR, "Failed to create memif socket hash.");
/* the hash key length is the whole buffer, so clear the bytes after the name */
1014 memset(key, 0, MEMIF_SOCKET_UN_SIZE);
1015 strlcpy(key, socket_filename, MEMIF_SOCKET_UN_SIZE);
1016 ret = rte_hash_lookup_data(hash, key, (void **)&socket);
1018 socket = memif_socket_create(key,
1019 (pmd->role == MEMIF_ROLE_CLIENT) ? 0 : 1,
1020 pmd->flags & ETH_MEMIF_FLAG_SOCKET_ABSTRACT);
1023 ret = rte_hash_add_key_data(hash, key, socket);
1025 MIF_LOG(ERR, "Failed to add socket to socket hash.");
1029 pmd->socket_filename = socket->filename;
/* an id may be used once per role on a socket */
1031 TAILQ_FOREACH(elt, &socket->dev_queue, next) {
1032 tmp_pmd = elt->dev->data->dev_private;
1033 if (tmp_pmd->id == pmd->id && tmp_pmd->role == pmd->role) {
1034 MIF_LOG(ERR, "Two interfaces with the same id (%d) can "
1035 "not have the same role.", pmd->id);
1040 elt = rte_malloc("pmd-queue", sizeof(struct memif_socket_dev_list_elt), 0);
1042 MIF_LOG(ERR, "Failed to add device to socket device list.");
1046 TAILQ_INSERT_TAIL(&socket->dev_queue, elt, next);
/*
 * Detach a device from its memif socket.
 *
 * The socket is found in the MEMIF_SOCKET_HASH_NAME hash through
 * pmd->socket_filename.  The device's entry is unlinked from the socket's
 * device list and pmd->socket_filename is reset to NULL.  When the list is
 * empty afterwards, the socket is deleted from the hash, the socket file of a
 * non-abstract listener is removed (a failure is logged), and the socket's
 * interrupt instance is freed unless the device role is client.
 * NOTE(review): the early returns and the freeing of the list element and of
 * the socket are not part of the visible lines.
 */
1052 memif_socket_remove_device(struct rte_eth_dev *dev)
1054 struct pmd_internals *pmd = dev->data->dev_private;
1055 struct memif_socket *socket = NULL;
1056 struct memif_socket_dev_list_elt *elt, *next;
1057 struct rte_hash *hash;
1060 hash = rte_hash_find_existing(MEMIF_SOCKET_HASH_NAME);
1064 if (pmd->socket_filename == NULL)
1067 if (rte_hash_lookup_data(hash, pmd->socket_filename, (void **)&socket) < 0)
1070 for (elt = TAILQ_FIRST(&socket->dev_queue); elt != NULL; elt = next) {
/* fetch the successor first: elt may be unlinked below */
1071 next = TAILQ_NEXT(elt, next);
1072 if (elt->dev == dev) {
1073 TAILQ_REMOVE(&socket->dev_queue, elt, next);
1075 pmd->socket_filename = NULL;
1079 /* remove socket, if this was the last device using it */
1080 if (TAILQ_EMPTY(&socket->dev_queue)) {
1081 rte_hash_del_key(hash, socket->filename);
1082 if (socket->listener && !(pmd->flags & ETH_MEMIF_FLAG_SOCKET_ABSTRACT)) {
1083 /* remove listener socket file,
1084 * so we can create new one later.
1086 ret = remove(socket->filename);
1088 MIF_LOG(ERR, "Failed to remove socket file: %s",
1091 if (pmd->role != MEMIF_ROLE_CLIENT)
1092 rte_intr_instance_free(socket->intr_handle);
/*
 * Prepare a server-role device for incoming connections: both disconnect
 * reason strings are cleared and ETH_MEMIF_FLAG_DISABLED is removed from the
 * device flags.
 * NOTE(review): the return value is not part of the visible lines.
 */
1098 memif_connect_server(struct rte_eth_dev *dev)
1100 struct pmd_internals *pmd = dev->data->dev_private;
1102 memset(pmd->local_disc_string, 0, ETH_MEMIF_DISC_STRING_SIZE);
1103 memset(pmd->remote_disc_string, 0, ETH_MEMIF_DISC_STRING_SIZE);
1104 pmd->flags &= ~ETH_MEMIF_FLAG_DISABLED;
/*
 * Connect a client-role device to the socket named by pmd->socket_filename.
 *
 * Both disconnect reason strings are cleared and ETH_MEMIF_FLAG_DISABLED is
 * removed.  An AF_UNIX/SOCK_SEQPACKET socket is opened and connected, using
 * the abstract address form when ETH_MEMIF_FLAG_SOCKET_ABSTRACT is set.  A
 * zeroed control channel with a shared interrupt instance (type
 * RTE_INTR_HANDLE_EXT) is then created for the fd, and memif_intr_handler()
 * is registered on it.  The visible cleanup frees the interrupt instance of
 * an allocated channel.
 * NOTE(review): the error jumps, the rest of the cleanup and the return
 * values are not part of the visible lines.
 */
1109 memif_connect_client(struct rte_eth_dev *dev)
1114 struct sockaddr_un sun = { 0 };
1115 struct pmd_internals *pmd = dev->data->dev_private;
1117 memset(pmd->local_disc_string, 0, ETH_MEMIF_DISC_STRING_SIZE);
1118 memset(pmd->remote_disc_string, 0, ETH_MEMIF_DISC_STRING_SIZE);
1119 pmd->flags &= ~ETH_MEMIF_FLAG_DISABLED;
1121 sockfd = socket(AF_UNIX, SOCK_SEQPACKET, 0);
1123 MIF_LOG(ERR, "Failed to open socket.");
1127 sun.sun_family = AF_UNIX;
/* default length; replaced below for an abstract address */
1128 sunlen = sizeof(struct sockaddr_un);
1129 if (pmd->flags & ETH_MEMIF_FLAG_SOCKET_ABSTRACT) {
1130 /* abstract address */
1131 sun.sun_path[0] = '\0';
1132 strlcpy(sun.sun_path + 1, pmd->socket_filename, MEMIF_SOCKET_UN_SIZE - 1);
1133 sunlen = RTE_MIN(strlen(pmd->socket_filename) + 1,
1134 MEMIF_SOCKET_UN_SIZE) +
1135 sizeof(sun) - sizeof(sun.sun_path);
1137 strlcpy(sun.sun_path, pmd->socket_filename, MEMIF_SOCKET_UN_SIZE);
1140 ret = connect(sockfd, (struct sockaddr *)&sun, sunlen);
1142 MIF_LOG(ERR, "Failed to connect socket: %s.", pmd->socket_filename);
1146 MIF_LOG(DEBUG, "Memif socket: %s connected.", pmd->socket_filename);
1148 pmd->cc = rte_zmalloc("memif-cc",
1149 sizeof(struct memif_control_channel), 0);
1150 if (pmd->cc == NULL) {
1151 MIF_LOG(ERR, "Failed to allocate control channel.");
1155 /* Allocate interrupt instance */
1156 pmd->cc->intr_handle =
1157 rte_intr_instance_alloc(RTE_INTR_INSTANCE_F_SHARED);
1158 if (pmd->cc->intr_handle == NULL) {
1159 MIF_LOG(ERR, "Failed to allocate intr handle");
1163 if (rte_intr_fd_set(pmd->cc->intr_handle, sockfd))
1166 if (rte_intr_type_set(pmd->cc->intr_handle, RTE_INTR_HANDLE_EXT))
/* a client-side channel is not tied to a listener socket */
1169 pmd->cc->socket = NULL;
1171 TAILQ_INIT(&pmd->cc->msg_queue);
1173 ret = rte_intr_callback_register(pmd->cc->intr_handle,
1174 memif_intr_handler, pmd->cc);
1176 MIF_LOG(ERR, "Failed to register interrupt callback for control fd");
1187 if (pmd->cc != NULL) {
1188 rte_intr_instance_free(pmd->cc->intr_handle);