net/memif: support multi-process
[dpdk.git] / drivers / net / memif / rte_eth_memif.c
1 /* SPDX-License-Identifier: BSD-3-Clause
2  * Copyright 2018-2019 Cisco Systems, Inc.  All rights reserved.
3  */
4
5 #include <stdlib.h>
6 #include <fcntl.h>
7 #include <unistd.h>
8 #include <sys/types.h>
9 #include <sys/socket.h>
10 #include <sys/un.h>
11 #include <sys/ioctl.h>
12 #include <sys/mman.h>
13 #include <linux/if_ether.h>
14 #include <errno.h>
15 #include <sys/eventfd.h>
16
17 #include <rte_version.h>
18 #include <rte_mbuf.h>
19 #include <rte_ether.h>
20 #include <rte_ethdev_driver.h>
21 #include <rte_ethdev_vdev.h>
22 #include <rte_malloc.h>
23 #include <rte_kvargs.h>
24 #include <rte_bus_vdev.h>
25 #include <rte_string_fns.h>
26
27 #include "rte_eth_memif.h"
28 #include "memif_socket.h"
29
30 #define ETH_MEMIF_ID_ARG                "id"
31 #define ETH_MEMIF_ROLE_ARG              "role"
32 #define ETH_MEMIF_PKT_BUFFER_SIZE_ARG   "bsize"
33 #define ETH_MEMIF_RING_SIZE_ARG         "rsize"
34 #define ETH_MEMIF_SOCKET_ARG            "socket"
35 #define ETH_MEMIF_MAC_ARG               "mac"
36 #define ETH_MEMIF_ZC_ARG                "zero-copy"
37 #define ETH_MEMIF_SECRET_ARG            "secret"
38
39 static const char * const valid_arguments[] = {
40         ETH_MEMIF_ID_ARG,
41         ETH_MEMIF_ROLE_ARG,
42         ETH_MEMIF_PKT_BUFFER_SIZE_ARG,
43         ETH_MEMIF_RING_SIZE_ARG,
44         ETH_MEMIF_SOCKET_ARG,
45         ETH_MEMIF_MAC_ARG,
46         ETH_MEMIF_ZC_ARG,
47         ETH_MEMIF_SECRET_ARG,
48         NULL
49 };
50
51 #define MEMIF_MP_SEND_REGION            "memif_mp_send_region"
52
53 const char *
54 memif_version(void)
55 {
56         return ("memif-" RTE_STR(MEMIF_VERSION_MAJOR) "." RTE_STR(MEMIF_VERSION_MINOR));
57 }
58
59 /* Message header to synchronize regions */
60 struct mp_region_msg {
61         char port_name[RTE_DEV_NAME_MAX_LEN];
62         memif_region_index_t idx;
63         memif_region_size_t size;
64 };
65
66 static int
67 memif_mp_send_region(const struct rte_mp_msg *msg, const void *peer)
68 {
69         struct rte_eth_dev *dev;
70         struct pmd_process_private *proc_private;
71         const struct mp_region_msg *msg_param = (const struct mp_region_msg *)msg->param;
72         struct rte_mp_msg reply;
73         struct mp_region_msg *reply_param = (struct mp_region_msg *)reply.param;
74         uint16_t port_id;
75         int ret;
76
77         /* Get requested port */
78         ret = rte_eth_dev_get_port_by_name(msg_param->port_name, &port_id);
79         if (ret) {
80                 MIF_LOG(ERR, "Failed to get port id for %s",
81                         msg_param->port_name);
82                 return -1;
83         }
84         dev = &rte_eth_devices[port_id];
85         proc_private = dev->process_private;
86
87         memset(&reply, 0, sizeof(reply));
88         strlcpy(reply.name, msg->name, sizeof(reply.name));
89         reply_param->idx = msg_param->idx;
90         if (proc_private->regions[msg_param->idx] != NULL) {
91                 reply_param->size = proc_private->regions[msg_param->idx]->region_size;
92                 reply.fds[0] = proc_private->regions[msg_param->idx]->fd;
93                 reply.num_fds = 1;
94         }
95         reply.len_param = sizeof(*reply_param);
96         if (rte_mp_reply(&reply, peer) < 0) {
97                 MIF_LOG(ERR, "Failed to reply to an add region request");
98                 return -1;
99         }
100
101         return 0;
102 }
103
104 /*
105  * Request regions
106  * Called by secondary process, when ports link status goes up.
107  */
108 static int
109 memif_mp_request_regions(struct rte_eth_dev *dev)
110 {
111         int ret, i;
112         struct timespec timeout = {.tv_sec = 5, .tv_nsec = 0};
113         struct rte_mp_msg msg, *reply;
114         struct rte_mp_reply replies;
115         struct mp_region_msg *msg_param = (struct mp_region_msg *)msg.param;
116         struct mp_region_msg *reply_param;
117         struct memif_region *r;
118         struct pmd_process_private *proc_private = dev->process_private;
119
120         MIF_LOG(DEBUG, "Requesting memory regions");
121
122         for (i = 0; i < ETH_MEMIF_MAX_REGION_NUM; i++) {
123                 /* Prepare the message */
124                 memset(&msg, 0, sizeof(msg));
125                 strlcpy(msg.name, MEMIF_MP_SEND_REGION, sizeof(msg.name));
126                 strlcpy(msg_param->port_name, dev->data->name,
127                         sizeof(msg_param->port_name));
128                 msg_param->idx = i;
129                 msg.len_param = sizeof(*msg_param);
130
131                 /* Send message */
132                 ret = rte_mp_request_sync(&msg, &replies, &timeout);
133                 if (ret < 0 || replies.nb_received != 1) {
134                         MIF_LOG(ERR, "Failed to send mp msg: %d",
135                                 rte_errno);
136                         return -1;
137                 }
138
139                 reply = &replies.msgs[0];
140                 reply_param = (struct mp_region_msg *)reply->param;
141
142                 if (reply_param->size > 0) {
143                         r = rte_zmalloc("region", sizeof(struct memif_region), 0);
144                         if (r == NULL) {
145                                 MIF_LOG(ERR, "Failed to alloc memif region.");
146                                 free(reply);
147                                 return -ENOMEM;
148                         }
149                         r->region_size = reply_param->size;
150                         if (reply->num_fds < 1) {
151                                 MIF_LOG(ERR, "Missing file descriptor.");
152                                 free(reply);
153                                 return -1;
154                         }
155                         r->fd = reply->fds[0];
156                         r->addr = NULL;
157
158                         proc_private->regions[reply_param->idx] = r;
159                         proc_private->regions_num++;
160                 }
161                 free(reply);
162         }
163
164         return memif_connect(dev);
165 }
166
167 static void
168 memif_dev_info(struct rte_eth_dev *dev __rte_unused, struct rte_eth_dev_info *dev_info)
169 {
170         dev_info->max_mac_addrs = 1;
171         dev_info->max_rx_pktlen = (uint32_t)ETH_FRAME_LEN;
172         dev_info->max_rx_queues = ETH_MEMIF_MAX_NUM_Q_PAIRS;
173         dev_info->max_tx_queues = ETH_MEMIF_MAX_NUM_Q_PAIRS;
174         dev_info->min_rx_bufsize = 0;
175 }
176
177 static memif_ring_t *
178 memif_get_ring(struct pmd_internals *pmd, struct pmd_process_private *proc_private,
179                memif_ring_type_t type, uint16_t ring_num)
180 {
181         /* rings only in region 0 */
182         void *p = proc_private->regions[0]->addr;
183         int ring_size = sizeof(memif_ring_t) + sizeof(memif_desc_t) *
184             (1 << pmd->run.log2_ring_size);
185
186         p = (uint8_t *)p + (ring_num + type * pmd->run.num_s2m_rings) * ring_size;
187
188         return (memif_ring_t *)p;
189 }
190
191 static memif_region_offset_t
192 memif_get_ring_offset(struct rte_eth_dev *dev, struct memif_queue *mq,
193                       memif_ring_type_t type, uint16_t num)
194 {
195         struct pmd_internals *pmd = dev->data->dev_private;
196         struct pmd_process_private *proc_private = dev->process_private;
197
198         return ((uint8_t *)memif_get_ring(pmd, proc_private, type, num) -
199                 (uint8_t *)proc_private->regions[mq->region]->addr);
200 }
201
202 static memif_ring_t *
203 memif_get_ring_from_queue(struct pmd_process_private *proc_private,
204                           struct memif_queue *mq)
205 {
206         struct memif_region *r;
207
208         r = proc_private->regions[mq->region];
209         if (r == NULL)
210                 return NULL;
211
212         return (memif_ring_t *)((uint8_t *)r->addr + mq->ring_offset);
213 }
214
215 static void *
216 memif_get_buffer(struct pmd_process_private *proc_private, memif_desc_t *d)
217 {
218         return ((uint8_t *)proc_private->regions[d->region]->addr + d->offset);
219 }
220
221 static int
222 memif_pktmbuf_chain(struct rte_mbuf *head, struct rte_mbuf *cur_tail,
223                     struct rte_mbuf *tail)
224 {
225         /* Check for number-of-segments-overflow */
226         if (unlikely(head->nb_segs + tail->nb_segs > RTE_MBUF_MAX_NB_SEGS))
227                 return -EOVERFLOW;
228
229         /* Chain 'tail' onto the old tail */
230         cur_tail->next = tail;
231
232         /* accumulate number of segments and total length. */
233         head->nb_segs = (uint16_t)(head->nb_segs + tail->nb_segs);
234
235         tail->pkt_len = tail->data_len;
236         head->pkt_len += tail->pkt_len;
237
238         return 0;
239 }
240
241 static uint16_t
242 eth_memif_rx(void *queue, struct rte_mbuf **bufs, uint16_t nb_pkts)
243 {
244         struct memif_queue *mq = queue;
245         struct pmd_internals *pmd = rte_eth_devices[mq->in_port].data->dev_private;
246         struct pmd_process_private *proc_private =
247                 rte_eth_devices[mq->in_port].process_private;
248         memif_ring_t *ring = memif_get_ring_from_queue(proc_private, mq);
249         uint16_t cur_slot, last_slot, n_slots, ring_size, mask, s0;
250         uint16_t n_rx_pkts = 0;
251         uint16_t mbuf_size = rte_pktmbuf_data_room_size(mq->mempool) -
252                 RTE_PKTMBUF_HEADROOM;
253         uint16_t src_len, src_off, dst_len, dst_off, cp_len;
254         memif_ring_type_t type = mq->type;
255         memif_desc_t *d0;
256         struct rte_mbuf *mbuf, *mbuf_head, *mbuf_tail;
257         uint64_t b;
258         ssize_t size __rte_unused;
259         uint16_t head;
260         int ret;
261         struct rte_eth_link link;
262
263         if (unlikely((pmd->flags & ETH_MEMIF_FLAG_CONNECTED) == 0))
264                 return 0;
265         if (unlikely(ring == NULL)) {
266                 /* Secondary process will attempt to request regions. */
267                 rte_eth_link_get(mq->in_port, &link);
268                 return 0;
269         }
270
271         /* consume interrupt */
272         if ((ring->flags & MEMIF_RING_FLAG_MASK_INT) == 0)
273                 size = read(mq->intr_handle.fd, &b, sizeof(b));
274
275         ring_size = 1 << mq->log2_ring_size;
276         mask = ring_size - 1;
277
278         cur_slot = (type == MEMIF_RING_S2M) ? mq->last_head : mq->last_tail;
279         last_slot = (type == MEMIF_RING_S2M) ? ring->head : ring->tail;
280         if (cur_slot == last_slot)
281                 goto refill;
282         n_slots = last_slot - cur_slot;
283
284         while (n_slots && n_rx_pkts < nb_pkts) {
285                 mbuf_head = rte_pktmbuf_alloc(mq->mempool);
286                 if (unlikely(mbuf_head == NULL))
287                         goto no_free_bufs;
288                 mbuf = mbuf_head;
289                 mbuf->port = mq->in_port;
290
291 next_slot:
292                 s0 = cur_slot & mask;
293                 d0 = &ring->desc[s0];
294
295                 src_len = d0->length;
296                 dst_off = 0;
297                 src_off = 0;
298
299                 do {
300                         dst_len = mbuf_size - dst_off;
301                         if (dst_len == 0) {
302                                 dst_off = 0;
303                                 dst_len = mbuf_size;
304
305                                 /* store pointer to tail */
306                                 mbuf_tail = mbuf;
307                                 mbuf = rte_pktmbuf_alloc(mq->mempool);
308                                 if (unlikely(mbuf == NULL))
309                                         goto no_free_bufs;
310                                 mbuf->port = mq->in_port;
311                                 ret = memif_pktmbuf_chain(mbuf_head, mbuf_tail, mbuf);
312                                 if (unlikely(ret < 0)) {
313                                         MIF_LOG(ERR, "number-of-segments-overflow");
314                                         rte_pktmbuf_free(mbuf);
315                                         goto no_free_bufs;
316                                 }
317                         }
318                         cp_len = RTE_MIN(dst_len, src_len);
319
320                         rte_pktmbuf_data_len(mbuf) += cp_len;
321                         rte_pktmbuf_pkt_len(mbuf) = rte_pktmbuf_data_len(mbuf);
322                         if (mbuf != mbuf_head)
323                                 rte_pktmbuf_pkt_len(mbuf_head) += cp_len;
324
325                         memcpy(rte_pktmbuf_mtod_offset(mbuf, void *, dst_off),
326                                (uint8_t *)memif_get_buffer(proc_private, d0) +
327                                src_off, cp_len);
328
329                         src_off += cp_len;
330                         dst_off += cp_len;
331                         src_len -= cp_len;
332                 } while (src_len);
333
334                 cur_slot++;
335                 n_slots--;
336
337                 if (d0->flags & MEMIF_DESC_FLAG_NEXT)
338                         goto next_slot;
339
340                 mq->n_bytes += rte_pktmbuf_pkt_len(mbuf_head);
341                 *bufs++ = mbuf_head;
342                 n_rx_pkts++;
343         }
344
345 no_free_bufs:
346         if (type == MEMIF_RING_S2M) {
347                 rte_mb();
348                 ring->tail = cur_slot;
349                 mq->last_head = cur_slot;
350         } else {
351                 mq->last_tail = cur_slot;
352         }
353
354 refill:
355         if (type == MEMIF_RING_M2S) {
356                 head = ring->head;
357                 n_slots = ring_size - head + mq->last_tail;
358
359                 while (n_slots--) {
360                         s0 = head++ & mask;
361                         d0 = &ring->desc[s0];
362                         d0->length = pmd->run.pkt_buffer_size;
363                 }
364                 rte_mb();
365                 ring->head = head;
366         }
367
368         mq->n_pkts += n_rx_pkts;
369         return n_rx_pkts;
370 }
371
372 static uint16_t
373 eth_memif_tx(void *queue, struct rte_mbuf **bufs, uint16_t nb_pkts)
374 {
375         struct memif_queue *mq = queue;
376         struct pmd_internals *pmd = rte_eth_devices[mq->in_port].data->dev_private;
377         struct pmd_process_private *proc_private =
378                 rte_eth_devices[mq->in_port].process_private;
379         memif_ring_t *ring = memif_get_ring_from_queue(proc_private, mq);
380         uint16_t slot, saved_slot, n_free, ring_size, mask, n_tx_pkts = 0;
381         uint16_t src_len, src_off, dst_len, dst_off, cp_len;
382         memif_ring_type_t type = mq->type;
383         memif_desc_t *d0;
384         struct rte_mbuf *mbuf;
385         struct rte_mbuf *mbuf_head;
386         uint64_t a;
387         ssize_t size;
388         struct rte_eth_link link;
389
390         if (unlikely((pmd->flags & ETH_MEMIF_FLAG_CONNECTED) == 0))
391                 return 0;
392         if (unlikely(ring == NULL)) {
393                 /* Secondary process will attempt to request regions. */
394                 rte_eth_link_get(mq->in_port, &link);
395                 return 0;
396         }
397
398         ring_size = 1 << mq->log2_ring_size;
399         mask = ring_size - 1;
400
401         n_free = ring->tail - mq->last_tail;
402         mq->last_tail += n_free;
403         slot = (type == MEMIF_RING_S2M) ? ring->head : ring->tail;
404
405         if (type == MEMIF_RING_S2M)
406                 n_free = ring_size - ring->head + mq->last_tail;
407         else
408                 n_free = ring->head - ring->tail;
409
410         while (n_tx_pkts < nb_pkts && n_free) {
411                 mbuf_head = *bufs++;
412                 mbuf = mbuf_head;
413
414                 saved_slot = slot;
415                 d0 = &ring->desc[slot & mask];
416                 dst_off = 0;
417                 dst_len = (type == MEMIF_RING_S2M) ?
418                         pmd->run.pkt_buffer_size : d0->length;
419
420 next_in_chain:
421                 src_off = 0;
422                 src_len = rte_pktmbuf_data_len(mbuf);
423
424                 while (src_len) {
425                         if (dst_len == 0) {
426                                 if (n_free) {
427                                         slot++;
428                                         n_free--;
429                                         d0->flags |= MEMIF_DESC_FLAG_NEXT;
430                                         d0 = &ring->desc[slot & mask];
431                                         dst_off = 0;
432                                         dst_len = (type == MEMIF_RING_S2M) ?
433                                             pmd->run.pkt_buffer_size : d0->length;
434                                         d0->flags = 0;
435                                 } else {
436                                         slot = saved_slot;
437                                         goto no_free_slots;
438                                 }
439                         }
440                         cp_len = RTE_MIN(dst_len, src_len);
441
442                         memcpy((uint8_t *)memif_get_buffer(proc_private, d0) + dst_off,
443                                rte_pktmbuf_mtod_offset(mbuf, void *, src_off),
444                                cp_len);
445
446                         mq->n_bytes += cp_len;
447                         src_off += cp_len;
448                         dst_off += cp_len;
449                         src_len -= cp_len;
450                         dst_len -= cp_len;
451
452                         d0->length = dst_off;
453                 }
454
455                 if (rte_pktmbuf_is_contiguous(mbuf) == 0) {
456                         mbuf = mbuf->next;
457                         goto next_in_chain;
458                 }
459
460                 n_tx_pkts++;
461                 slot++;
462                 n_free--;
463                 rte_pktmbuf_free(mbuf_head);
464         }
465
466 no_free_slots:
467         rte_mb();
468         if (type == MEMIF_RING_S2M)
469                 ring->head = slot;
470         else
471                 ring->tail = slot;
472
473         if ((ring->flags & MEMIF_RING_FLAG_MASK_INT) == 0) {
474                 a = 1;
475                 size = write(mq->intr_handle.fd, &a, sizeof(a));
476                 if (unlikely(size < 0)) {
477                         MIF_LOG(WARNING,
478                                 "Failed to send interrupt. %s", strerror(errno));
479                 }
480         }
481
482         mq->n_err += nb_pkts - n_tx_pkts;
483         mq->n_pkts += n_tx_pkts;
484         return n_tx_pkts;
485 }
486
487 void
488 memif_free_regions(struct pmd_process_private *proc_private)
489 {
490         int i;
491         struct memif_region *r;
492
493         MIF_LOG(DEBUG, "Free memory regions");
494         /* regions are allocated contiguously, so it's
495          * enough to loop until 'proc_private->regions_num'
496          */
497         for (i = 0; i < proc_private->regions_num; i++) {
498                 r = proc_private->regions[i];
499                 if (r != NULL) {
500                         if (r->addr != NULL) {
501                                 munmap(r->addr, r->region_size);
502                                 if (r->fd > 0) {
503                                         close(r->fd);
504                                         r->fd = -1;
505                                 }
506                         }
507                         rte_free(r);
508                         proc_private->regions[i] = NULL;
509                 }
510         }
511         proc_private->regions_num = 0;
512 }
513
514 static int
515 memif_region_init_shm(struct rte_eth_dev *dev, uint8_t has_buffers)
516 {
517         struct pmd_internals *pmd = dev->data->dev_private;
518         struct pmd_process_private *proc_private = dev->process_private;
519         char shm_name[ETH_MEMIF_SHM_NAME_SIZE];
520         int ret = 0;
521         struct memif_region *r;
522
523         if (proc_private->regions_num >= ETH_MEMIF_MAX_REGION_NUM) {
524                 MIF_LOG(ERR, "Too many regions.");
525                 return -1;
526         }
527
528         r = rte_zmalloc("region", sizeof(struct memif_region), 0);
529         if (r == NULL) {
530                 MIF_LOG(ERR, "Failed to alloc memif region.");
531                 return -ENOMEM;
532         }
533
534         /* calculate buffer offset */
535         r->pkt_buffer_offset = (pmd->run.num_s2m_rings + pmd->run.num_m2s_rings) *
536             (sizeof(memif_ring_t) + sizeof(memif_desc_t) *
537             (1 << pmd->run.log2_ring_size));
538
539         r->region_size = r->pkt_buffer_offset;
540         /* if region has buffers, add buffers size to region_size */
541         if (has_buffers == 1)
542                 r->region_size += (uint32_t)(pmd->run.pkt_buffer_size *
543                         (1 << pmd->run.log2_ring_size) *
544                         (pmd->run.num_s2m_rings +
545                          pmd->run.num_m2s_rings));
546
547         memset(shm_name, 0, sizeof(char) * ETH_MEMIF_SHM_NAME_SIZE);
548         snprintf(shm_name, ETH_MEMIF_SHM_NAME_SIZE, "memif_region_%d",
549                  proc_private->regions_num);
550
551         r->fd = memfd_create(shm_name, MFD_ALLOW_SEALING);
552         if (r->fd < 0) {
553                 MIF_LOG(ERR, "Failed to create shm file: %s.", strerror(errno));
554                 ret = -1;
555                 goto error;
556         }
557
558         ret = fcntl(r->fd, F_ADD_SEALS, F_SEAL_SHRINK);
559         if (ret < 0) {
560                 MIF_LOG(ERR, "Failed to add seals to shm file: %s.", strerror(errno));
561                 goto error;
562         }
563
564         ret = ftruncate(r->fd, r->region_size);
565         if (ret < 0) {
566                 MIF_LOG(ERR, "Failed to truncate shm file: %s.", strerror(errno));
567                 goto error;
568         }
569
570         r->addr = mmap(NULL, r->region_size, PROT_READ |
571                        PROT_WRITE, MAP_SHARED, r->fd, 0);
572         if (r->addr == MAP_FAILED) {
573                 MIF_LOG(ERR, "Failed to mmap shm region: %s.", strerror(ret));
574                 ret = -1;
575                 goto error;
576         }
577
578         proc_private->regions[proc_private->regions_num] = r;
579         proc_private->regions_num++;
580
581         return ret;
582
583 error:
584         if (r->fd > 0)
585                 close(r->fd);
586         r->fd = -1;
587
588         return ret;
589 }
590
591 static int
592 memif_regions_init(struct rte_eth_dev *dev)
593 {
594         int ret;
595
596         /* create one buffer region */
597         ret = memif_region_init_shm(dev, /* has buffer */ 1);
598         if (ret < 0)
599                 return ret;
600
601         return 0;
602 }
603
604 static void
605 memif_init_rings(struct rte_eth_dev *dev)
606 {
607         struct pmd_internals *pmd = dev->data->dev_private;
608         struct pmd_process_private *proc_private = dev->process_private;
609         memif_ring_t *ring;
610         int i, j;
611         uint16_t slot;
612
613         for (i = 0; i < pmd->run.num_s2m_rings; i++) {
614                 ring = memif_get_ring(pmd, proc_private, MEMIF_RING_S2M, i);
615                 ring->head = 0;
616                 ring->tail = 0;
617                 ring->cookie = MEMIF_COOKIE;
618                 ring->flags = 0;
619                 for (j = 0; j < (1 << pmd->run.log2_ring_size); j++) {
620                         slot = i * (1 << pmd->run.log2_ring_size) + j;
621                         ring->desc[j].region = 0;
622                         ring->desc[j].offset =
623                                 proc_private->regions[0]->pkt_buffer_offset +
624                                 (uint32_t)(slot * pmd->run.pkt_buffer_size);
625                         ring->desc[j].length = pmd->run.pkt_buffer_size;
626                 }
627         }
628
629         for (i = 0; i < pmd->run.num_m2s_rings; i++) {
630                 ring = memif_get_ring(pmd, proc_private, MEMIF_RING_M2S, i);
631                 ring->head = 0;
632                 ring->tail = 0;
633                 ring->cookie = MEMIF_COOKIE;
634                 ring->flags = 0;
635                 for (j = 0; j < (1 << pmd->run.log2_ring_size); j++) {
636                         slot = (i + pmd->run.num_s2m_rings) *
637                             (1 << pmd->run.log2_ring_size) + j;
638                         ring->desc[j].region = 0;
639                         ring->desc[j].offset =
640                                 proc_private->regions[0]->pkt_buffer_offset +
641                                 (uint32_t)(slot * pmd->run.pkt_buffer_size);
642                         ring->desc[j].length = pmd->run.pkt_buffer_size;
643                 }
644         }
645 }
646
647 /* called only by slave */
648 static void
649 memif_init_queues(struct rte_eth_dev *dev)
650 {
651         struct pmd_internals *pmd = dev->data->dev_private;
652         struct memif_queue *mq;
653         int i;
654
655         for (i = 0; i < pmd->run.num_s2m_rings; i++) {
656                 mq = dev->data->tx_queues[i];
657                 mq->log2_ring_size = pmd->run.log2_ring_size;
658                 /* queues located only in region 0 */
659                 mq->region = 0;
660                 mq->ring_offset = memif_get_ring_offset(dev, mq, MEMIF_RING_S2M, i);
661                 mq->last_head = 0;
662                 mq->last_tail = 0;
663                 mq->intr_handle.fd = eventfd(0, EFD_NONBLOCK);
664                 if (mq->intr_handle.fd < 0) {
665                         MIF_LOG(WARNING,
666                                 "Failed to create eventfd for tx queue %d: %s.", i,
667                                 strerror(errno));
668                 }
669         }
670
671         for (i = 0; i < pmd->run.num_m2s_rings; i++) {
672                 mq = dev->data->rx_queues[i];
673                 mq->log2_ring_size = pmd->run.log2_ring_size;
674                 /* queues located only in region 0 */
675                 mq->region = 0;
676                 mq->ring_offset = memif_get_ring_offset(dev, mq, MEMIF_RING_M2S, i);
677                 mq->last_head = 0;
678                 mq->last_tail = 0;
679                 mq->intr_handle.fd = eventfd(0, EFD_NONBLOCK);
680                 if (mq->intr_handle.fd < 0) {
681                         MIF_LOG(WARNING,
682                                 "Failed to create eventfd for rx queue %d: %s.", i,
683                                 strerror(errno));
684                 }
685         }
686 }
687
688 int
689 memif_init_regions_and_queues(struct rte_eth_dev *dev)
690 {
691         int ret;
692
693         ret = memif_regions_init(dev);
694         if (ret < 0)
695                 return ret;
696
697         memif_init_rings(dev);
698
699         memif_init_queues(dev);
700
701         return 0;
702 }
703
704 int
705 memif_connect(struct rte_eth_dev *dev)
706 {
707         struct pmd_internals *pmd = dev->data->dev_private;
708         struct pmd_process_private *proc_private = dev->process_private;
709         struct memif_region *mr;
710         struct memif_queue *mq;
711         memif_ring_t *ring;
712         int i;
713
714         for (i = 0; i < proc_private->regions_num; i++) {
715                 mr = proc_private->regions[i];
716                 if (mr != NULL) {
717                         if (mr->addr == NULL) {
718                                 if (mr->fd < 0)
719                                         return -1;
720                                 mr->addr = mmap(NULL, mr->region_size,
721                                                 PROT_READ | PROT_WRITE,
722                                                 MAP_SHARED, mr->fd, 0);
723                                 if (mr->addr == NULL)
724                                         return -1;
725                         }
726                 }
727         }
728
729         if (rte_eal_process_type() == RTE_PROC_PRIMARY) {
730                 for (i = 0; i < pmd->run.num_s2m_rings; i++) {
731                         mq = (pmd->role == MEMIF_ROLE_SLAVE) ?
732                             dev->data->tx_queues[i] : dev->data->rx_queues[i];
733                         ring = memif_get_ring_from_queue(proc_private, mq);
734                         if (ring == NULL || ring->cookie != MEMIF_COOKIE) {
735                                 MIF_LOG(ERR, "Wrong ring");
736                                 return -1;
737                         }
738                         ring->head = 0;
739                         ring->tail = 0;
740                         mq->last_head = 0;
741                         mq->last_tail = 0;
742                         /* enable polling mode */
743                         if (pmd->role == MEMIF_ROLE_MASTER)
744                                 ring->flags = MEMIF_RING_FLAG_MASK_INT;
745                 }
746                 for (i = 0; i < pmd->run.num_m2s_rings; i++) {
747                         mq = (pmd->role == MEMIF_ROLE_SLAVE) ?
748                             dev->data->rx_queues[i] : dev->data->tx_queues[i];
749                         ring = memif_get_ring_from_queue(proc_private, mq);
750                         if (ring == NULL || ring->cookie != MEMIF_COOKIE) {
751                                 MIF_LOG(ERR, "Wrong ring");
752                                 return -1;
753                         }
754                         ring->head = 0;
755                         ring->tail = 0;
756                         mq->last_head = 0;
757                         mq->last_tail = 0;
758                         /* enable polling mode */
759                         if (pmd->role == MEMIF_ROLE_SLAVE)
760                                 ring->flags = MEMIF_RING_FLAG_MASK_INT;
761                 }
762
763                 pmd->flags &= ~ETH_MEMIF_FLAG_CONNECTING;
764                 pmd->flags |= ETH_MEMIF_FLAG_CONNECTED;
765                 dev->data->dev_link.link_status = ETH_LINK_UP;
766         }
767         MIF_LOG(INFO, "Connected.");
768         return 0;
769 }
770
771 static int
772 memif_dev_start(struct rte_eth_dev *dev)
773 {
774         struct pmd_internals *pmd = dev->data->dev_private;
775         int ret = 0;
776
777         switch (pmd->role) {
778         case MEMIF_ROLE_SLAVE:
779                 ret = memif_connect_slave(dev);
780                 break;
781         case MEMIF_ROLE_MASTER:
782                 ret = memif_connect_master(dev);
783                 break;
784         default:
785                 MIF_LOG(ERR, "%s: Unknown role: %d.",
786                         rte_vdev_device_name(pmd->vdev), pmd->role);
787                 ret = -1;
788                 break;
789         }
790
791         return ret;
792 }
793
794 static void
795 memif_dev_close(struct rte_eth_dev *dev)
796 {
797         struct pmd_internals *pmd = dev->data->dev_private;
798         int i;
799
800         if (rte_eal_process_type() == RTE_PROC_PRIMARY) {
801                 memif_msg_enq_disconnect(pmd->cc, "Device closed", 0);
802                 memif_disconnect(dev);
803
804                 for (i = 0; i < dev->data->nb_rx_queues; i++)
805                         (*dev->dev_ops->rx_queue_release)(dev->data->rx_queues[i]);
806                 for (i = 0; i < dev->data->nb_tx_queues; i++)
807                         (*dev->dev_ops->tx_queue_release)(dev->data->tx_queues[i]);
808
809                 memif_socket_remove_device(dev);
810         } else {
811                 memif_disconnect(dev);
812         }
813
814         rte_free(dev->process_private);
815 }
816
817 static int
818 memif_dev_configure(struct rte_eth_dev *dev)
819 {
820         struct pmd_internals *pmd = dev->data->dev_private;
821
822         /*
823          * SLAVE - TXQ
824          * MASTER - RXQ
825          */
826         pmd->cfg.num_s2m_rings = (pmd->role == MEMIF_ROLE_SLAVE) ?
827                                   dev->data->nb_tx_queues : dev->data->nb_rx_queues;
828
829         /*
830          * SLAVE - RXQ
831          * MASTER - TXQ
832          */
833         pmd->cfg.num_m2s_rings = (pmd->role == MEMIF_ROLE_SLAVE) ?
834                                   dev->data->nb_rx_queues : dev->data->nb_tx_queues;
835
836         return 0;
837 }
838
839 static int
840 memif_tx_queue_setup(struct rte_eth_dev *dev,
841                      uint16_t qid,
842                      uint16_t nb_tx_desc __rte_unused,
843                      unsigned int socket_id __rte_unused,
844                      const struct rte_eth_txconf *tx_conf __rte_unused)
845 {
846         struct pmd_internals *pmd = dev->data->dev_private;
847         struct memif_queue *mq;
848
849         mq = rte_zmalloc("tx-queue", sizeof(struct memif_queue), 0);
850         if (mq == NULL) {
851                 MIF_LOG(ERR, "%s: Failed to allocate tx queue id: %u",
852                         rte_vdev_device_name(pmd->vdev), qid);
853                 return -ENOMEM;
854         }
855
856         mq->type =
857             (pmd->role == MEMIF_ROLE_SLAVE) ? MEMIF_RING_S2M : MEMIF_RING_M2S;
858         mq->n_pkts = 0;
859         mq->n_bytes = 0;
860         mq->n_err = 0;
861         mq->intr_handle.fd = -1;
862         mq->intr_handle.type = RTE_INTR_HANDLE_EXT;
863         dev->data->tx_queues[qid] = mq;
864
865         return 0;
866 }
867
868 static int
869 memif_rx_queue_setup(struct rte_eth_dev *dev,
870                      uint16_t qid,
871                      uint16_t nb_rx_desc __rte_unused,
872                      unsigned int socket_id __rte_unused,
873                      const struct rte_eth_rxconf *rx_conf __rte_unused,
874                      struct rte_mempool *mb_pool)
875 {
876         struct pmd_internals *pmd = dev->data->dev_private;
877         struct memif_queue *mq;
878
879         mq = rte_zmalloc("rx-queue", sizeof(struct memif_queue), 0);
880         if (mq == NULL) {
881                 MIF_LOG(ERR, "%s: Failed to allocate rx queue id: %u",
882                         rte_vdev_device_name(pmd->vdev), qid);
883                 return -ENOMEM;
884         }
885
886         mq->type = (pmd->role == MEMIF_ROLE_SLAVE) ? MEMIF_RING_M2S : MEMIF_RING_S2M;
887         mq->n_pkts = 0;
888         mq->n_bytes = 0;
889         mq->n_err = 0;
890         mq->intr_handle.fd = -1;
891         mq->intr_handle.type = RTE_INTR_HANDLE_EXT;
892         mq->mempool = mb_pool;
893         mq->in_port = dev->data->port_id;
894         dev->data->rx_queues[qid] = mq;
895
896         return 0;
897 }
898
899 static void
900 memif_queue_release(void *queue)
901 {
902         struct memif_queue *mq = (struct memif_queue *)queue;
903
904         if (!mq)
905                 return;
906
907         rte_free(mq);
908 }
909
910 static int
911 memif_link_update(struct rte_eth_dev *dev,
912                   int wait_to_complete __rte_unused)
913 {
914         struct pmd_process_private *proc_private;
915
916         if (rte_eal_process_type() == RTE_PROC_SECONDARY) {
917                 proc_private = dev->process_private;
918                 if (dev->data->dev_link.link_status == ETH_LINK_UP &&
919                                 proc_private->regions_num == 0) {
920                         memif_mp_request_regions(dev);
921                 } else if (dev->data->dev_link.link_status == ETH_LINK_DOWN &&
922                                 proc_private->regions_num > 0) {
923                         memif_free_regions(proc_private);
924                 }
925         }
926         return 0;
927 }
928
929 static int
930 memif_stats_get(struct rte_eth_dev *dev, struct rte_eth_stats *stats)
931 {
932         struct pmd_internals *pmd = dev->data->dev_private;
933         struct memif_queue *mq;
934         int i;
935         uint8_t tmp, nq;
936
937         stats->ipackets = 0;
938         stats->ibytes = 0;
939         stats->opackets = 0;
940         stats->obytes = 0;
941         stats->oerrors = 0;
942
943         tmp = (pmd->role == MEMIF_ROLE_SLAVE) ? pmd->run.num_s2m_rings :
944             pmd->run.num_m2s_rings;
945         nq = (tmp < RTE_ETHDEV_QUEUE_STAT_CNTRS) ? tmp :
946             RTE_ETHDEV_QUEUE_STAT_CNTRS;
947
948         /* RX stats */
949         for (i = 0; i < nq; i++) {
950                 mq = dev->data->rx_queues[i];
951                 stats->q_ipackets[i] = mq->n_pkts;
952                 stats->q_ibytes[i] = mq->n_bytes;
953                 stats->ipackets += mq->n_pkts;
954                 stats->ibytes += mq->n_bytes;
955         }
956
957         tmp = (pmd->role == MEMIF_ROLE_SLAVE) ? pmd->run.num_m2s_rings :
958             pmd->run.num_s2m_rings;
959         nq = (tmp < RTE_ETHDEV_QUEUE_STAT_CNTRS) ? tmp :
960             RTE_ETHDEV_QUEUE_STAT_CNTRS;
961
962         /* TX stats */
963         for (i = 0; i < nq; i++) {
964                 mq = dev->data->tx_queues[i];
965                 stats->q_opackets[i] = mq->n_pkts;
966                 stats->q_obytes[i] = mq->n_bytes;
967                 stats->opackets += mq->n_pkts;
968                 stats->obytes += mq->n_bytes;
969                 stats->oerrors += mq->n_err;
970         }
971         return 0;
972 }
973
974 static void
975 memif_stats_reset(struct rte_eth_dev *dev)
976 {
977         struct pmd_internals *pmd = dev->data->dev_private;
978         int i;
979         struct memif_queue *mq;
980
981         for (i = 0; i < pmd->run.num_s2m_rings; i++) {
982                 mq = (pmd->role == MEMIF_ROLE_SLAVE) ? dev->data->tx_queues[i] :
983                     dev->data->rx_queues[i];
984                 mq->n_pkts = 0;
985                 mq->n_bytes = 0;
986                 mq->n_err = 0;
987         }
988         for (i = 0; i < pmd->run.num_m2s_rings; i++) {
989                 mq = (pmd->role == MEMIF_ROLE_SLAVE) ? dev->data->rx_queues[i] :
990                     dev->data->tx_queues[i];
991                 mq->n_pkts = 0;
992                 mq->n_bytes = 0;
993                 mq->n_err = 0;
994         }
995 }
996
997 static int
998 memif_rx_queue_intr_enable(struct rte_eth_dev *dev __rte_unused,
999                            uint16_t qid __rte_unused)
1000 {
1001         MIF_LOG(WARNING, "Interrupt mode not supported.");
1002
1003         return -1;
1004 }
1005
1006 static int
1007 memif_rx_queue_intr_disable(struct rte_eth_dev *dev, uint16_t qid __rte_unused)
1008 {
1009         struct pmd_internals *pmd __rte_unused = dev->data->dev_private;
1010
1011         return 0;
1012 }
1013
1014 static const struct eth_dev_ops ops = {
1015         .dev_start = memif_dev_start,
1016         .dev_close = memif_dev_close,
1017         .dev_infos_get = memif_dev_info,
1018         .dev_configure = memif_dev_configure,
1019         .tx_queue_setup = memif_tx_queue_setup,
1020         .rx_queue_setup = memif_rx_queue_setup,
1021         .rx_queue_release = memif_queue_release,
1022         .tx_queue_release = memif_queue_release,
1023         .rx_queue_intr_enable = memif_rx_queue_intr_enable,
1024         .rx_queue_intr_disable = memif_rx_queue_intr_disable,
1025         .link_update = memif_link_update,
1026         .stats_get = memif_stats_get,
1027         .stats_reset = memif_stats_reset,
1028 };
1029
1030 static int
1031 memif_create(struct rte_vdev_device *vdev, enum memif_role_t role,
1032              memif_interface_id_t id, uint32_t flags,
1033              const char *socket_filename,
1034              memif_log2_ring_size_t log2_ring_size,
1035              uint16_t pkt_buffer_size, const char *secret,
1036              struct rte_ether_addr *ether_addr)
1037 {
1038         int ret = 0;
1039         struct rte_eth_dev *eth_dev;
1040         struct rte_eth_dev_data *data;
1041         struct pmd_internals *pmd;
1042         struct pmd_process_private *process_private;
1043         const unsigned int numa_node = vdev->device.numa_node;
1044         const char *name = rte_vdev_device_name(vdev);
1045
1046         if (flags & ETH_MEMIF_FLAG_ZERO_COPY) {
1047                 MIF_LOG(ERR, "Zero-copy slave not supported.");
1048                 return -1;
1049         }
1050
1051         eth_dev = rte_eth_vdev_allocate(vdev, sizeof(*pmd));
1052         if (eth_dev == NULL) {
1053                 MIF_LOG(ERR, "%s: Unable to allocate device struct.", name);
1054                 return -1;
1055         }
1056
1057         process_private = (struct pmd_process_private *)
1058                 rte_zmalloc(name, sizeof(struct pmd_process_private),
1059                             RTE_CACHE_LINE_SIZE);
1060
1061         if (process_private == NULL) {
1062                 MIF_LOG(ERR, "Failed to alloc memory for process private");
1063                 return -1;
1064         }
1065         eth_dev->process_private = process_private;
1066
1067         pmd = eth_dev->data->dev_private;
1068         memset(pmd, 0, sizeof(*pmd));
1069
1070         pmd->id = id;
1071         pmd->flags = flags;
1072         pmd->flags |= ETH_MEMIF_FLAG_DISABLED;
1073         pmd->role = role;
1074
1075         ret = memif_socket_init(eth_dev, socket_filename);
1076         if (ret < 0)
1077                 return ret;
1078
1079         memset(pmd->secret, 0, sizeof(char) * ETH_MEMIF_SECRET_SIZE);
1080         if (secret != NULL)
1081                 strlcpy(pmd->secret, secret, sizeof(pmd->secret));
1082
1083         pmd->cfg.log2_ring_size = log2_ring_size;
1084         /* set in .dev_configure() */
1085         pmd->cfg.num_s2m_rings = 0;
1086         pmd->cfg.num_m2s_rings = 0;
1087
1088         pmd->cfg.pkt_buffer_size = pkt_buffer_size;
1089
1090         data = eth_dev->data;
1091         data->dev_private = pmd;
1092         data->numa_node = numa_node;
1093         data->mac_addrs = ether_addr;
1094
1095         eth_dev->dev_ops = &ops;
1096         eth_dev->device = &vdev->device;
1097         eth_dev->rx_pkt_burst = eth_memif_rx;
1098         eth_dev->tx_pkt_burst = eth_memif_tx;
1099
1100         eth_dev->data->dev_flags &= RTE_ETH_DEV_CLOSE_REMOVE;
1101
1102         rte_eth_dev_probing_finish(eth_dev);
1103
1104         return 0;
1105 }
1106
1107 static int
1108 memif_set_role(const char *key __rte_unused, const char *value,
1109                void *extra_args)
1110 {
1111         enum memif_role_t *role = (enum memif_role_t *)extra_args;
1112
1113         if (strstr(value, "master") != NULL) {
1114                 *role = MEMIF_ROLE_MASTER;
1115         } else if (strstr(value, "slave") != NULL) {
1116                 *role = MEMIF_ROLE_SLAVE;
1117         } else {
1118                 MIF_LOG(ERR, "Unknown role: %s.", value);
1119                 return -EINVAL;
1120         }
1121         return 0;
1122 }
1123
1124 static int
1125 memif_set_zc(const char *key __rte_unused, const char *value, void *extra_args)
1126 {
1127         uint32_t *flags = (uint32_t *)extra_args;
1128
1129         if (strstr(value, "yes") != NULL) {
1130                 *flags |= ETH_MEMIF_FLAG_ZERO_COPY;
1131         } else if (strstr(value, "no") != NULL) {
1132                 *flags &= ~ETH_MEMIF_FLAG_ZERO_COPY;
1133         } else {
1134                 MIF_LOG(ERR, "Failed to parse zero-copy param: %s.", value);
1135                 return -EINVAL;
1136         }
1137         return 0;
1138 }
1139
1140 static int
1141 memif_set_id(const char *key __rte_unused, const char *value, void *extra_args)
1142 {
1143         memif_interface_id_t *id = (memif_interface_id_t *)extra_args;
1144
1145         /* even if parsing fails, 0 is a valid id */
1146         *id = strtoul(value, NULL, 10);
1147         return 0;
1148 }
1149
1150 static int
1151 memif_set_bs(const char *key __rte_unused, const char *value, void *extra_args)
1152 {
1153         unsigned long tmp;
1154         uint16_t *pkt_buffer_size = (uint16_t *)extra_args;
1155
1156         tmp = strtoul(value, NULL, 10);
1157         if (tmp == 0 || tmp > 0xFFFF) {
1158                 MIF_LOG(ERR, "Invalid buffer size: %s.", value);
1159                 return -EINVAL;
1160         }
1161         *pkt_buffer_size = tmp;
1162         return 0;
1163 }
1164
1165 static int
1166 memif_set_rs(const char *key __rte_unused, const char *value, void *extra_args)
1167 {
1168         unsigned long tmp;
1169         memif_log2_ring_size_t *log2_ring_size =
1170             (memif_log2_ring_size_t *)extra_args;
1171
1172         tmp = strtoul(value, NULL, 10);
1173         if (tmp == 0 || tmp > ETH_MEMIF_MAX_LOG2_RING_SIZE) {
1174                 MIF_LOG(ERR, "Invalid ring size: %s (max %u).",
1175                         value, ETH_MEMIF_MAX_LOG2_RING_SIZE);
1176                 return -EINVAL;
1177         }
1178         *log2_ring_size = tmp;
1179         return 0;
1180 }
1181
1182 /* check if directory exists and if we have permission to read/write */
1183 static int
1184 memif_check_socket_filename(const char *filename)
1185 {
1186         char *dir = NULL, *tmp;
1187         uint32_t idx;
1188         int ret = 0;
1189
1190         tmp = strrchr(filename, '/');
1191         if (tmp != NULL) {
1192                 idx = tmp - filename;
1193                 dir = rte_zmalloc("memif_tmp", sizeof(char) * (idx + 1), 0);
1194                 if (dir == NULL) {
1195                         MIF_LOG(ERR, "Failed to allocate memory.");
1196                         return -1;
1197                 }
1198                 strlcpy(dir, filename, sizeof(char) * (idx + 1));
1199         }
1200
1201         if (dir == NULL || (faccessat(-1, dir, F_OK | R_OK |
1202                                         W_OK, AT_EACCESS) < 0)) {
1203                 MIF_LOG(ERR, "Invalid socket directory.");
1204                 ret = -EINVAL;
1205         }
1206
1207         if (dir != NULL)
1208                 rte_free(dir);
1209
1210         return ret;
1211 }
1212
1213 static int
1214 memif_set_socket_filename(const char *key __rte_unused, const char *value,
1215                           void *extra_args)
1216 {
1217         const char **socket_filename = (const char **)extra_args;
1218
1219         *socket_filename = value;
1220         return memif_check_socket_filename(*socket_filename);
1221 }
1222
1223 static int
1224 memif_set_mac(const char *key __rte_unused, const char *value, void *extra_args)
1225 {
1226         struct rte_ether_addr *ether_addr = (struct rte_ether_addr *)extra_args;
1227         int ret = 0;
1228
1229         ret = sscanf(value, "%hhx:%hhx:%hhx:%hhx:%hhx:%hhx",
1230                &ether_addr->addr_bytes[0], &ether_addr->addr_bytes[1],
1231                &ether_addr->addr_bytes[2], &ether_addr->addr_bytes[3],
1232                &ether_addr->addr_bytes[4], &ether_addr->addr_bytes[5]);
1233         if (ret != 6)
1234                 MIF_LOG(WARNING, "Failed to parse mac '%s'.", value);
1235         return 0;
1236 }
1237
1238 static int
1239 memif_set_secret(const char *key __rte_unused, const char *value, void *extra_args)
1240 {
1241         const char **secret = (const char **)extra_args;
1242
1243         *secret = value;
1244         return 0;
1245 }
1246
1247 static int
1248 rte_pmd_memif_probe(struct rte_vdev_device *vdev)
1249 {
1250         RTE_BUILD_BUG_ON(sizeof(memif_msg_t) != 128);
1251         RTE_BUILD_BUG_ON(sizeof(memif_desc_t) != 16);
1252         int ret = 0;
1253         struct rte_kvargs *kvlist;
1254         const char *name = rte_vdev_device_name(vdev);
1255         enum memif_role_t role = MEMIF_ROLE_SLAVE;
1256         memif_interface_id_t id = 0;
1257         uint16_t pkt_buffer_size = ETH_MEMIF_DEFAULT_PKT_BUFFER_SIZE;
1258         memif_log2_ring_size_t log2_ring_size = ETH_MEMIF_DEFAULT_RING_SIZE;
1259         const char *socket_filename = ETH_MEMIF_DEFAULT_SOCKET_FILENAME;
1260         uint32_t flags = 0;
1261         const char *secret = NULL;
1262         struct rte_ether_addr *ether_addr = rte_zmalloc("",
1263                 sizeof(struct rte_ether_addr), 0);
1264         struct rte_eth_dev *eth_dev;
1265
1266         rte_eth_random_addr(ether_addr->addr_bytes);
1267
1268         MIF_LOG(INFO, "Initialize MEMIF: %s.", name);
1269
1270         if (rte_eal_process_type() == RTE_PROC_SECONDARY) {
1271                 eth_dev = rte_eth_dev_attach_secondary(name);
1272                 if (!eth_dev) {
1273                         MIF_LOG(ERR, "Failed to probe %s", name);
1274                         return -1;
1275                 }
1276
1277                 eth_dev->dev_ops = &ops;
1278                 eth_dev->device = &vdev->device;
1279                 eth_dev->rx_pkt_burst = eth_memif_rx;
1280                 eth_dev->tx_pkt_burst = eth_memif_rx;
1281
1282                 if (!rte_eal_primary_proc_alive(NULL)) {
1283                         MIF_LOG(ERR, "Primary process is missing");
1284                         return -1;
1285                 }
1286
1287                 eth_dev->process_private = (struct pmd_process_private *)
1288                         rte_zmalloc(name,
1289                                 sizeof(struct pmd_process_private),
1290                                 RTE_CACHE_LINE_SIZE);
1291                 if (eth_dev->process_private == NULL) {
1292                         MIF_LOG(ERR,
1293                                 "Failed to alloc memory for process private");
1294                         return -1;
1295                 }
1296
1297                 rte_eth_dev_probing_finish(eth_dev);
1298
1299                 return 0;
1300         }
1301
1302         ret = rte_mp_action_register(MEMIF_MP_SEND_REGION, memif_mp_send_region);
1303         /*
1304          * Primary process can continue probing, but secondary process won't
1305          * be able to get memory regions information
1306          */
1307         if (ret < 0 && rte_errno != EEXIST)
1308                 MIF_LOG(WARNING, "Failed to register mp action callback: %s",
1309                         strerror(rte_errno));
1310
1311         kvlist = rte_kvargs_parse(rte_vdev_device_args(vdev), valid_arguments);
1312
1313         /* parse parameters */
1314         if (kvlist != NULL) {
1315                 ret = rte_kvargs_process(kvlist, ETH_MEMIF_ROLE_ARG,
1316                                          &memif_set_role, &role);
1317                 if (ret < 0)
1318                         goto exit;
1319                 ret = rte_kvargs_process(kvlist, ETH_MEMIF_ID_ARG,
1320                                          &memif_set_id, &id);
1321                 if (ret < 0)
1322                         goto exit;
1323                 ret = rte_kvargs_process(kvlist, ETH_MEMIF_PKT_BUFFER_SIZE_ARG,
1324                                          &memif_set_bs, &pkt_buffer_size);
1325                 if (ret < 0)
1326                         goto exit;
1327                 ret = rte_kvargs_process(kvlist, ETH_MEMIF_RING_SIZE_ARG,
1328                                          &memif_set_rs, &log2_ring_size);
1329                 if (ret < 0)
1330                         goto exit;
1331                 ret = rte_kvargs_process(kvlist, ETH_MEMIF_SOCKET_ARG,
1332                                          &memif_set_socket_filename,
1333                                          (void *)(&socket_filename));
1334                 if (ret < 0)
1335                         goto exit;
1336                 ret = rte_kvargs_process(kvlist, ETH_MEMIF_MAC_ARG,
1337                                          &memif_set_mac, ether_addr);
1338                 if (ret < 0)
1339                         goto exit;
1340                 ret = rte_kvargs_process(kvlist, ETH_MEMIF_ZC_ARG,
1341                                          &memif_set_zc, &flags);
1342                 if (ret < 0)
1343                         goto exit;
1344                 ret = rte_kvargs_process(kvlist, ETH_MEMIF_SECRET_ARG,
1345                                          &memif_set_secret, (void *)(&secret));
1346                 if (ret < 0)
1347                         goto exit;
1348         }
1349
1350         /* create interface */
1351         ret = memif_create(vdev, role, id, flags, socket_filename,
1352                            log2_ring_size, pkt_buffer_size, secret, ether_addr);
1353
1354 exit:
1355         if (kvlist != NULL)
1356                 rte_kvargs_free(kvlist);
1357         return ret;
1358 }
1359
1360 static int
1361 rte_pmd_memif_remove(struct rte_vdev_device *vdev)
1362 {
1363         struct rte_eth_dev *eth_dev;
1364
1365         eth_dev = rte_eth_dev_allocated(rte_vdev_device_name(vdev));
1366         if (eth_dev == NULL)
1367                 return 0;
1368
1369         rte_eth_dev_close(eth_dev->data->port_id);
1370
1371         return 0;
1372 }
1373
1374 static struct rte_vdev_driver pmd_memif_drv = {
1375         .probe = rte_pmd_memif_probe,
1376         .remove = rte_pmd_memif_remove,
1377 };
1378
1379 RTE_PMD_REGISTER_VDEV(net_memif, pmd_memif_drv);
1380
1381 RTE_PMD_REGISTER_PARAM_STRING(net_memif,
1382                               ETH_MEMIF_ID_ARG "=<int>"
1383                               ETH_MEMIF_ROLE_ARG "=master|slave"
1384                               ETH_MEMIF_PKT_BUFFER_SIZE_ARG "=<int>"
1385                               ETH_MEMIF_RING_SIZE_ARG "=<int>"
1386                               ETH_MEMIF_SOCKET_ARG "=<string>"
1387                               ETH_MEMIF_MAC_ARG "=xx:xx:xx:xx:xx:xx"
1388                               ETH_MEMIF_ZC_ARG "=yes|no"
1389                               ETH_MEMIF_SECRET_ARG "=<string>");
1390
1391 int memif_logtype;
1392
1393 RTE_INIT(memif_init_log)
1394 {
1395         memif_logtype = rte_log_register("pmd.net.memif");
1396         if (memif_logtype >= 0)
1397                 rte_log_set_level(memif_logtype, RTE_LOG_NOTICE);
1398 }