ring: fix memory leak when detaching
[dpdk.git] / drivers / net / ring / rte_eth_ring.c
/*-
 *   BSD LICENSE
 *
 *   Copyright(c) 2010-2015 Intel Corporation. All rights reserved.
 *   All rights reserved.
 *
 *   Redistribution and use in source and binary forms, with or without
 *   modification, are permitted provided that the following conditions
 *   are met:
 *
 *     * Redistributions of source code must retain the above copyright
 *       notice, this list of conditions and the following disclaimer.
 *     * Redistributions in binary form must reproduce the above copyright
 *       notice, this list of conditions and the following disclaimer in
 *       the documentation and/or other materials provided with the
 *       distribution.
 *     * Neither the name of Intel Corporation nor the names of its
 *       contributors may be used to endorse or promote products derived
 *       from this software without specific prior written permission.
 *
 *   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 *   "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 *   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 *   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 *   OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 *   SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 *   LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 *   DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 *   THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 *   (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 *   OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */

#include "rte_eth_ring.h"
#include <rte_mbuf.h>
#include <rte_ethdev.h>
#include <rte_malloc.h>
#include <rte_memcpy.h>
#include <rte_memzone.h>
#include <rte_string_fns.h>
#include <rte_dev.h>
#include <rte_kvargs.h>
#include <rte_errno.h>

#define ETH_RING_NUMA_NODE_ACTION_ARG   "nodeaction"
#define ETH_RING_ACTION_CREATE          "CREATE"
#define ETH_RING_ACTION_ATTACH          "ATTACH"

static const char *valid_arguments[] = {
        ETH_RING_NUMA_NODE_ACTION_ARG,
        NULL
};

struct ring_queue {
        struct rte_ring *rng;
        rte_atomic64_t rx_pkts;
        rte_atomic64_t tx_pkts;
        rte_atomic64_t err_pkts;
};

struct pmd_internals {
        unsigned nb_rx_queues;
        unsigned nb_tx_queues;

        struct ring_queue rx_ring_queues[RTE_PMD_RING_MAX_RX_RINGS];
        struct ring_queue tx_ring_queues[RTE_PMD_RING_MAX_TX_RINGS];

        struct ether_addr address;
};


static const char *drivername = "Rings PMD";
static struct rte_eth_link pmd_link = {
                .link_speed = 10000,
                .link_duplex = ETH_LINK_FULL_DUPLEX,
                .link_status = 0
};

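/*
 * RX burst: dequeue up to nb_bufs mbufs from the queue's backing ring and
 * update the receive counter (atomically unless the ring is single-consumer).
 */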
static uint16_t
eth_ring_rx(void *q, struct rte_mbuf **bufs, uint16_t nb_bufs)
{
        void **ptrs = (void *)&bufs[0];
        struct ring_queue *r = q;
        const uint16_t nb_rx = (uint16_t)rte_ring_dequeue_burst(r->rng,
                        ptrs, nb_bufs);
        if (r->rng->flags & RING_F_SC_DEQ)
                r->rx_pkts.cnt += nb_rx;
        else
                rte_atomic64_add(&(r->rx_pkts), nb_rx);
        return nb_rx;
}

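/*
 * TX burst: enqueue up to nb_bufs mbufs onto the queue's backing ring;
 * packets that do not fit are counted as errors. Counters are updated
 * atomically unless the ring is single-producer.
 */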
static uint16_t
eth_ring_tx(void *q, struct rte_mbuf **bufs, uint16_t nb_bufs)
{
        void **ptrs = (void *)&bufs[0];
        struct ring_queue *r = q;
        const uint16_t nb_tx = (uint16_t)rte_ring_enqueue_burst(r->rng,
                        ptrs, nb_bufs);
        if (r->rng->flags & RING_F_SP_ENQ) {
                r->tx_pkts.cnt += nb_tx;
                r->err_pkts.cnt += nb_bufs - nb_tx;
        } else {
                rte_atomic64_add(&(r->tx_pkts), nb_tx);
                rte_atomic64_add(&(r->err_pkts), nb_bufs - nb_tx);
        }
        return nb_tx;
}

static int
eth_dev_configure(struct rte_eth_dev *dev __rte_unused) { return 0; }

static int
eth_dev_start(struct rte_eth_dev *dev)
{
        dev->data->dev_link.link_status = 1;
        return 0;
}

static void
eth_dev_stop(struct rte_eth_dev *dev)
{
        dev->data->dev_link.link_status = 0;
}

static int
eth_dev_set_link_down(struct rte_eth_dev *dev)
{
        dev->data->dev_link.link_status = 0;
        return 0;
}

static int
eth_dev_set_link_up(struct rte_eth_dev *dev)
{
        dev->data->dev_link.link_status = 1;
        return 0;
}

static int
eth_rx_queue_setup(struct rte_eth_dev *dev, uint16_t rx_queue_id,
                                    uint16_t nb_rx_desc __rte_unused,
                                    unsigned int socket_id __rte_unused,
                                    const struct rte_eth_rxconf *rx_conf __rte_unused,
                                    struct rte_mempool *mb_pool __rte_unused)
{
        struct pmd_internals *internals = dev->data->dev_private;
        dev->data->rx_queues[rx_queue_id] = &internals->rx_ring_queues[rx_queue_id];
        return 0;
}

static int
eth_tx_queue_setup(struct rte_eth_dev *dev, uint16_t tx_queue_id,
                                    uint16_t nb_tx_desc __rte_unused,
                                    unsigned int socket_id __rte_unused,
                                    const struct rte_eth_txconf *tx_conf __rte_unused)
{
        struct pmd_internals *internals = dev->data->dev_private;
        dev->data->tx_queues[tx_queue_id] = &internals->tx_ring_queues[tx_queue_id];
        return 0;
}


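/* Report device capabilities; queue limits reflect the rings supplied at creation. */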
static void
eth_dev_info(struct rte_eth_dev *dev,
                struct rte_eth_dev_info *dev_info)
{
        struct pmd_internals *internals = dev->data->dev_private;
        dev_info->driver_name = drivername;
        dev_info->max_mac_addrs = 1;
        dev_info->max_rx_pktlen = (uint32_t)-1;
        dev_info->max_rx_queues = (uint16_t)internals->nb_rx_queues;
        dev_info->max_tx_queues = (uint16_t)internals->nb_tx_queues;
        dev_info->min_rx_bufsize = 0;
        dev_info->pci_dev = NULL;
}

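/* Aggregate per-queue RX/TX/error counters into the device-level stats. */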
static void
eth_stats_get(struct rte_eth_dev *dev, struct rte_eth_stats *igb_stats)
{
        unsigned i;
        unsigned long rx_total = 0, tx_total = 0, tx_err_total = 0;
        const struct pmd_internals *internal = dev->data->dev_private;

        for (i = 0; i < RTE_ETHDEV_QUEUE_STAT_CNTRS &&
                        i < internal->nb_rx_queues; i++) {
                igb_stats->q_ipackets[i] = internal->rx_ring_queues[i].rx_pkts.cnt;
                rx_total += igb_stats->q_ipackets[i];
        }

        for (i = 0; i < RTE_ETHDEV_QUEUE_STAT_CNTRS &&
                        i < internal->nb_tx_queues; i++) {
                igb_stats->q_opackets[i] = internal->tx_ring_queues[i].tx_pkts.cnt;
                igb_stats->q_errors[i] = internal->tx_ring_queues[i].err_pkts.cnt;
                tx_total += igb_stats->q_opackets[i];
                tx_err_total += igb_stats->q_errors[i];
        }

        igb_stats->ipackets = rx_total;
        igb_stats->opackets = tx_total;
        igb_stats->oerrors = tx_err_total;
}

static void
eth_stats_reset(struct rte_eth_dev *dev)
{
        unsigned i;
        struct pmd_internals *internal = dev->data->dev_private;
        for (i = 0; i < internal->nb_rx_queues; i++)
                internal->rx_ring_queues[i].rx_pkts.cnt = 0;
        for (i = 0; i < internal->nb_tx_queues; i++) {
                internal->tx_ring_queues[i].tx_pkts.cnt = 0;
                internal->tx_ring_queues[i].err_pkts.cnt = 0;
        }
}

static void
eth_mac_addr_remove(struct rte_eth_dev *dev __rte_unused,
        uint32_t index __rte_unused)
{
}

static void
eth_mac_addr_add(struct rte_eth_dev *dev __rte_unused,
        struct ether_addr *mac_addr __rte_unused,
        uint32_t index __rte_unused,
        uint32_t vmdq __rte_unused)
{
}

static void
eth_queue_release(void *q __rte_unused) { ; }
static int
eth_link_update(struct rte_eth_dev *dev __rte_unused,
                int wait_to_complete __rte_unused) { return 0; }

static const struct eth_dev_ops ops = {
        .dev_start = eth_dev_start,
        .dev_stop = eth_dev_stop,
        .dev_set_link_up = eth_dev_set_link_up,
        .dev_set_link_down = eth_dev_set_link_down,
        .dev_configure = eth_dev_configure,
        .dev_infos_get = eth_dev_info,
        .rx_queue_setup = eth_rx_queue_setup,
        .tx_queue_setup = eth_tx_queue_setup,
        .rx_queue_release = eth_queue_release,
        .tx_queue_release = eth_queue_release,
        .link_update = eth_link_update,
        .stats_get = eth_stats_get,
        .stats_reset = eth_stats_reset,
        .mac_addr_remove = eth_mac_addr_remove,
        .mac_addr_add = eth_mac_addr_add,
};

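/*
 * Create an ethdev backed by the given arrays of RX and TX rings.
 * Returns the new port id on success, or -1 with rte_errno set on failure.
 */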
int
rte_eth_from_rings(const char *name, struct rte_ring *const rx_queues[],
                const unsigned nb_rx_queues,
                struct rte_ring *const tx_queues[],
                const unsigned nb_tx_queues,
                const unsigned numa_node)
{
        struct rte_eth_dev_data *data = NULL;
        struct pmd_internals *internals = NULL;
        struct rte_eth_dev *eth_dev = NULL;

        unsigned i;

        /* do some parameter checking */
        if (rx_queues == NULL && nb_rx_queues > 0) {
                rte_errno = EINVAL;
                goto error;
        }
        if (tx_queues == NULL && nb_tx_queues > 0) {
                rte_errno = EINVAL;
                goto error;
        }
        if (nb_rx_queues > RTE_PMD_RING_MAX_RX_RINGS) {
                rte_errno = EINVAL;
                goto error;
        }
        if (nb_tx_queues > RTE_PMD_RING_MAX_TX_RINGS) {
                rte_errno = EINVAL;
                goto error;
        }

        RTE_LOG(INFO, PMD, "Creating rings-backed ethdev on numa socket %u\n",
                        numa_node);

        /* now do all data allocation - for eth_dev structure, dummy pci driver
         * and internal (private) data
         */
        data = rte_zmalloc_socket(name, sizeof(*data), 0, numa_node);
        if (data == NULL) {
                rte_errno = ENOMEM;
                goto error;
        }

        data->rx_queues = rte_zmalloc_socket(name, sizeof(void *) * nb_rx_queues,
                        0, numa_node);
        if (data->rx_queues == NULL) {
                rte_errno = ENOMEM;
                goto error;
        }

        data->tx_queues = rte_zmalloc_socket(name, sizeof(void *) * nb_tx_queues,
                        0, numa_node);
        if (data->tx_queues == NULL) {
                rte_errno = ENOMEM;
                goto error;
        }

        internals = rte_zmalloc_socket(name, sizeof(*internals), 0, numa_node);
        if (internals == NULL) {
                rte_errno = ENOMEM;
                goto error;
        }

        /* reserve an ethdev entry */
        eth_dev = rte_eth_dev_allocate(name, RTE_ETH_DEV_VIRTUAL);
        if (eth_dev == NULL) {
                rte_errno = ENOSPC;
                goto error;
        }

        /* now put it all together
         * - store queue data in internals,
         * - store numa_node info in eth_dev_data
         * - point eth_dev_data to internals
         * - and point eth_dev structure to new eth_dev_data structure
         */
        /* NOTE: we'll replace the data element of the originally allocated
         * eth_dev so the rings are local per-process */

        internals->nb_rx_queues = nb_rx_queues;
        internals->nb_tx_queues = nb_tx_queues;
        for (i = 0; i < nb_rx_queues; i++) {
                internals->rx_ring_queues[i].rng = rx_queues[i];
                data->rx_queues[i] = &internals->rx_ring_queues[i];
        }
        for (i = 0; i < nb_tx_queues; i++) {
                internals->tx_ring_queues[i].rng = tx_queues[i];
                data->tx_queues[i] = &internals->tx_ring_queues[i];
        }

        data->dev_private = internals;
        data->port_id = eth_dev->data->port_id;
        memmove(data->name, eth_dev->data->name, sizeof(data->name));
        data->nb_rx_queues = (uint16_t)nb_rx_queues;
        data->nb_tx_queues = (uint16_t)nb_tx_queues;
        data->dev_link = pmd_link;
        data->mac_addrs = &internals->address;

        eth_dev->data = data;
        eth_dev->driver = NULL;
        eth_dev->dev_ops = &ops;
        eth_dev->data->dev_flags = RTE_ETH_DEV_DETACHABLE;
        eth_dev->data->kdrv = RTE_KDRV_NONE;
        eth_dev->data->drv_name = drivername;
        eth_dev->data->numa_node = numa_node;

        TAILQ_INIT(&(eth_dev->link_intr_cbs));

        /* finally assign rx and tx ops */
        eth_dev->rx_pkt_burst = eth_ring_rx;
        eth_dev->tx_pkt_burst = eth_ring_tx;

        return data->port_id;

error:
        if (data) {
                rte_free(data->rx_queues);
                rte_free(data->tx_queues);
        }
        rte_free(data);
        rte_free(internals);

        return -1;
}

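/* Convenience wrapper: use a single ring for both RX and TX. */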
int
rte_eth_from_ring(struct rte_ring *r)
{
        return rte_eth_from_rings(r->name, &r, 1, &r, 1,
                        r->memzone ? r->memzone->socket_id : SOCKET_ID_ANY);
}

enum dev_action {
        DEV_CREATE,
        DEV_ATTACH
};

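/*
 * Create (or, for ATTACH, look up) the rings backing a new port and
 * register the ethdev. The same rings are used for both RX and TX.
 */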
static int
eth_dev_ring_create(const char *name, const unsigned numa_node,
                enum dev_action action)
{
        /* rx and tx are so-called from the point of view of the first port.
         * They are inverted from the point of view of the second port.
         */
        struct rte_ring *rxtx[RTE_PMD_RING_MAX_RX_RINGS];
        unsigned i;
        char rng_name[RTE_RING_NAMESIZE];
        unsigned num_rings = RTE_MIN(RTE_PMD_RING_MAX_RX_RINGS,
                        RTE_PMD_RING_MAX_TX_RINGS);

        for (i = 0; i < num_rings; i++) {
                snprintf(rng_name, sizeof(rng_name), "ETH_RXTX%u_%s", i, name);
                rxtx[i] = (action == DEV_CREATE) ?
                                rte_ring_create(rng_name, 1024, numa_node,
                                                RING_F_SP_ENQ|RING_F_SC_DEQ) :
                                rte_ring_lookup(rng_name);
                if (rxtx[i] == NULL)
                        return -1;
        }

        if (rte_eth_from_rings(name, rxtx, num_rings, rxtx, num_rings, numa_node) < 0)
                return -1;

        return 0;
}

struct node_action_pair {
        char name[PATH_MAX];
        unsigned node;
        enum dev_action action;
};

struct node_action_list {
        unsigned total;
        unsigned count;
        struct node_action_pair *list;
};

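/*
 * Parse one "nodeaction" kvarg of the form name:node:action, where action
 * is either CREATE or ATTACH, and append it to the node_action_list.
 */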
static int parse_kvlist(const char *key __rte_unused, const char *value, void *data)
{
        struct node_action_list *info = data;
        int ret;
        char *name;
        char *action;
        char *node;
        char *end;

        name = strdup(value);

        ret = -EINVAL;

        if (!name) {
                RTE_LOG(WARNING, PMD, "command line parameter is empty for ring pmd!\n");
                goto out;
        }

        node = strchr(name, ':');
        if (!node) {
                RTE_LOG(WARNING, PMD, "could not parse node value from %s\n", name);
                goto out;
        }

        *node = '\0';
        node++;

        action = strchr(node, ':');
        if (!action) {
                RTE_LOG(WARNING, PMD, "could not parse action value from %s\n", node);
                goto out;
        }

        *action = '\0';
        action++;

        /*
         * Need to do some sanity checking here
         */

        if (strcmp(action, ETH_RING_ACTION_ATTACH) == 0)
                info->list[info->count].action = DEV_ATTACH;
        else if (strcmp(action, ETH_RING_ACTION_CREATE) == 0)
                info->list[info->count].action = DEV_CREATE;
        else
                goto out;

        errno = 0;
        info->list[info->count].node = strtol(node, &end, 10);

        if ((errno != 0) || (*end != '\0')) {
                RTE_LOG(WARNING, PMD, "node value %s is unparseable as a number\n", node);
                goto out;
        }

        snprintf(info->list[info->count].name, sizeof(info->list[info->count].name), "%s", name);

        info->count++;

        ret = 0;
out:
        free(name);
        return ret;
}

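/*
 * Vdev init entry point: with no parameters, create a ring-backed port on
 * the caller's NUMA node (falling back to attach if creation fails);
 * otherwise create or attach ports according to the parsed "nodeaction"
 * arguments.
 */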
static int
rte_pmd_ring_devinit(const char *name, const char *params)
{
        struct rte_kvargs *kvlist = NULL;
        int ret = 0;
        struct node_action_list *info = NULL;

        RTE_LOG(INFO, PMD, "Initializing pmd_ring for %s\n", name);

        if (params == NULL || params[0] == '\0') {
                ret = eth_dev_ring_create(name, rte_socket_id(), DEV_CREATE);
                if (ret == -1) {
                        RTE_LOG(INFO, PMD,
                                "Attach to pmd_ring for %s\n", name);
                        ret = eth_dev_ring_create(name, rte_socket_id(),
                                                  DEV_ATTACH);
                }
        } else {
                kvlist = rte_kvargs_parse(params, valid_arguments);

                if (!kvlist) {
                        RTE_LOG(INFO, PMD, "Ignoring unsupported parameters when creating"
                                        " rings-backed ethernet device\n");
                        ret = eth_dev_ring_create(name, rte_socket_id(),
                                                  DEV_CREATE);
                        if (ret == -1) {
                                RTE_LOG(INFO, PMD,
                                        "Attach to pmd_ring for %s\n",
                                        name);
                                ret = eth_dev_ring_create(name, rte_socket_id(),
                                                          DEV_ATTACH);
                        }
                        return ret;
                } else {
                        ret = rte_kvargs_count(kvlist, ETH_RING_NUMA_NODE_ACTION_ARG);
                        info = rte_zmalloc("struct node_action_list",
                                           sizeof(struct node_action_list) +
                                           (sizeof(struct node_action_pair) * ret),
                                           0);
                        if (!info) {
                                ret = -ENOMEM;
                                goto out_free;
                        }

                        info->total = ret;
                        info->list = (struct node_action_pair *)(info + 1);

                        ret = rte_kvargs_process(kvlist, ETH_RING_NUMA_NODE_ACTION_ARG,
                                                 parse_kvlist, info);

                        if (ret < 0)
                                goto out_free;

                        for (info->count = 0; info->count < info->total; info->count++) {
                                ret = eth_dev_ring_create(name,
                                                          info->list[info->count].node,
                                                          info->list[info->count].action);
                                if ((ret == -1) &&
                                    (info->list[info->count].action == DEV_CREATE)) {
                                        RTE_LOG(INFO, PMD,
                                                "Attach to pmd_ring for %s\n",
                                                name);
                                        ret = eth_dev_ring_create(name,
                                                        info->list[info->count].node,
                                                        DEV_ATTACH);
                                }
                        }
                }
        }

out_free:
        rte_kvargs_free(kvlist);
        rte_free(info);
        return ret;
}

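/*
 * Vdev uninit entry point: stop the port, free the queue arrays and private
 * data allocated in rte_eth_from_rings() so that detaching does not leak
 * memory, then release the ethdev entry.
 */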
static int
rte_pmd_ring_devuninit(const char *name)
{
        struct rte_eth_dev *eth_dev = NULL;

        RTE_LOG(INFO, PMD, "Un-Initializing pmd_ring for %s\n", name);

        if (name == NULL)
                return -EINVAL;

        /* find an ethdev entry */
        eth_dev = rte_eth_dev_allocated(name);
        if (eth_dev == NULL)
                return -ENODEV;

        eth_dev_stop(eth_dev);

        if (eth_dev->data) {
                rte_free(eth_dev->data->rx_queues);
                rte_free(eth_dev->data->tx_queues);
                rte_free(eth_dev->data->dev_private);
        }
        rte_free(eth_dev->data);

        rte_eth_dev_release_port(eth_dev);
        return 0;
}

static struct rte_driver pmd_ring_drv = {
        .name = "eth_ring",
        .type = PMD_VDEV,
        .init = rte_pmd_ring_devinit,
        .uninit = rte_pmd_ring_devuninit,
};

PMD_REGISTER_DRIVER(pmd_ring_drv);