bus/fslmc: support multi VFIO group
[dpdk.git] / drivers / bus / fslmc / fslmc_bus.c
1 /* SPDX-License-Identifier: BSD-3-Clause
2  *
3  *   Copyright 2016,2018-2019 NXP
4  *
5  */
6
7 #include <string.h>
8 #include <dirent.h>
9 #include <stdbool.h>
10
11 #include <rte_log.h>
12 #include <rte_bus.h>
13 #include <rte_malloc.h>
14 #include <rte_devargs.h>
15 #include <rte_memcpy.h>
16 #include <rte_ethdev_driver.h>
17
18 #include <rte_fslmc.h>
19 #include <fslmc_vfio.h>
20 #include "fslmc_logs.h"
21
22 #include <dpaax_iova_table.h>
23
/* Log type identifier for fslmc bus messages; assigned in fslmc_init_log() */
int dpaa2_logtype_bus;

/* sysfs directory of the IOMMU groups (not referenced in the visible part
 * of this file)
 */
#define VFIO_IOMMU_GROUP_PATH "/sys/kernel/iommu_groups"
/* Bus name token; stringified with RTE_STR() in rte_fslmc_parse() and passed
 * to RTE_REGISTER_BUS()
 */
#define FSLMC_BUS_NAME  fslmc

/* Tentative definition; the initialised definition is at the end of the file */
struct rte_fslmc_bus rte_fslmc_bus;
/* Set to 1 by rte_fslmc_probe() when the EAL IOVA mode is RTE_IOVA_VA */
uint8_t dpaa2_virt_mode;
31
32 uint32_t
33 rte_fslmc_get_device_count(enum rte_dpaa2_dev_type device_type)
34 {
35         if (device_type >= DPAA2_DEVTYPE_MAX)
36                 return 0;
37         return rte_fslmc_bus.device_count[device_type];
38 }
39
/* Per-lcore variable dpaa2_held_bufs of type struct dpaa2_portal_dqrr */
RTE_DEFINE_PER_LCORE(struct dpaa2_portal_dqrr, dpaa2_held_bufs);
41
42 static void
43 cleanup_fslmc_device_list(void)
44 {
45         struct rte_dpaa2_device *dev;
46         struct rte_dpaa2_device *t_dev;
47
48         TAILQ_FOREACH_SAFE(dev, &rte_fslmc_bus.device_list, next, t_dev) {
49                 TAILQ_REMOVE(&rte_fslmc_bus.device_list, dev, next);
50                 free(dev);
51                 dev = NULL;
52         }
53 }
54
55 static int
56 compare_dpaa2_devname(struct rte_dpaa2_device *dev1,
57                       struct rte_dpaa2_device *dev2)
58 {
59         int comp;
60
61         if (dev1->dev_type > dev2->dev_type) {
62                 comp = 1;
63         } else if (dev1->dev_type < dev2->dev_type) {
64                 comp = -1;
65         } else {
66                 /* Check the ID as types match */
67                 if (dev1->object_id > dev2->object_id)
68                         comp = 1;
69                 else if (dev1->object_id < dev2->object_id)
70                         comp = -1;
71                 else
72                         comp = 0; /* Duplicate device name */
73         }
74
75         return comp;
76 }
77
78 static void
79 insert_in_device_list(struct rte_dpaa2_device *newdev)
80 {
81         int comp, inserted = 0;
82         struct rte_dpaa2_device *dev = NULL;
83         struct rte_dpaa2_device *tdev = NULL;
84
85         TAILQ_FOREACH_SAFE(dev, &rte_fslmc_bus.device_list, next, tdev) {
86                 comp = compare_dpaa2_devname(newdev, dev);
87                 if (comp < 0) {
88                         TAILQ_INSERT_BEFORE(dev, newdev, next);
89                         inserted = 1;
90                         break;
91                 }
92         }
93
94         if (!inserted)
95                 TAILQ_INSERT_TAIL(&rte_fslmc_bus.device_list, newdev, next);
96 }
97
98 static struct rte_devargs *
99 fslmc_devargs_lookup(struct rte_dpaa2_device *dev)
100 {
101         struct rte_devargs *devargs;
102         char dev_name[32];
103
104         RTE_EAL_DEVARGS_FOREACH("fslmc", devargs) {
105                 devargs->bus->parse(devargs->name, &dev_name);
106                 if (strcmp(dev_name, dev->device.name) == 0) {
107                         DPAA2_BUS_INFO("**Devargs matched %s", dev_name);
108                         return devargs;
109                 }
110         }
111         return NULL;
112 }
113
114 static void
115 dump_device_list(void)
116 {
117         struct rte_dpaa2_device *dev;
118         uint32_t global_log_level;
119         int local_log_level;
120
121         /* Only if the log level has been set to Debugging, print list */
122         global_log_level = rte_log_get_global_level();
123         local_log_level = rte_log_get_level(dpaa2_logtype_bus);
124         if (global_log_level == RTE_LOG_DEBUG ||
125             local_log_level == RTE_LOG_DEBUG) {
126                 DPAA2_BUS_LOG(DEBUG, "List of devices scanned on bus:");
127                 TAILQ_FOREACH(dev, &rte_fslmc_bus.device_list, next) {
128                         DPAA2_BUS_LOG(DEBUG, "\t\t%s", dev->device.name);
129                 }
130         }
131 }
132
133 static int
134 scan_one_fslmc_device(char *dev_name)
135 {
136         char *dup_dev_name, *t_ptr;
137         struct rte_dpaa2_device *dev = NULL;
138         int ret = -1;
139
140         if (!dev_name)
141                 return ret;
142
143         /* Ignore the Container name itself */
144         if (!strncmp("dprc", dev_name, 4))
145                 return 0;
146
147         /* Creating a temporary copy to perform cut-parse over string */
148         dup_dev_name = strdup(dev_name);
149         if (!dup_dev_name) {
150                 DPAA2_BUS_ERR("Unable to allocate device name memory");
151                 return -ENOMEM;
152         }
153
154         /* For all other devices, we allocate rte_dpaa2_device.
155          * For those devices where there is no driver, probe would release
156          * the memory associated with the rte_dpaa2_device after necessary
157          * initialization.
158          */
159         dev = calloc(1, sizeof(struct rte_dpaa2_device));
160         if (!dev) {
161                 DPAA2_BUS_ERR("Unable to allocate device object");
162                 free(dup_dev_name);
163                 return -ENOMEM;
164         }
165
166         dev->device.bus = &rte_fslmc_bus.bus;
167
168         /* Parse the device name and ID */
169         t_ptr = strtok(dup_dev_name, ".");
170         if (!t_ptr) {
171                 DPAA2_BUS_ERR("Invalid device found: (%s)", dup_dev_name);
172                 ret = -EINVAL;
173                 goto cleanup;
174         }
175         if (!strncmp("dpni", t_ptr, 4))
176                 dev->dev_type = DPAA2_ETH;
177         else if (!strncmp("dpseci", t_ptr, 6))
178                 dev->dev_type = DPAA2_CRYPTO;
179         else if (!strncmp("dpcon", t_ptr, 5))
180                 dev->dev_type = DPAA2_CON;
181         else if (!strncmp("dpbp", t_ptr, 4))
182                 dev->dev_type = DPAA2_BPOOL;
183         else if (!strncmp("dpio", t_ptr, 4))
184                 dev->dev_type = DPAA2_IO;
185         else if (!strncmp("dpci", t_ptr, 4))
186                 dev->dev_type = DPAA2_CI;
187         else if (!strncmp("dpmcp", t_ptr, 5))
188                 dev->dev_type = DPAA2_MPORTAL;
189         else if (!strncmp("dpdmai", t_ptr, 6))
190                 dev->dev_type = DPAA2_QDMA;
191         else if (!strncmp("dpdmux", t_ptr, 6))
192                 dev->dev_type = DPAA2_MUX;
193         else if (!strncmp("dprtc", t_ptr, 5))
194                 dev->dev_type = DPAA2_DPRTC;
195         else
196                 dev->dev_type = DPAA2_UNKNOWN;
197
198         t_ptr = strtok(NULL, ".");
199         if (!t_ptr) {
200                 DPAA2_BUS_ERR("Skipping invalid device (%s)", dup_dev_name);
201                 ret = 0;
202                 goto cleanup;
203         }
204
205         sscanf(t_ptr, "%hu", &dev->object_id);
206         dev->device.name = strdup(dev_name);
207         if (!dev->device.name) {
208                 DPAA2_BUS_ERR("Unable to clone device name. Out of memory");
209                 ret = -ENOMEM;
210                 goto cleanup;
211         }
212         dev->device.devargs = fslmc_devargs_lookup(dev);
213
214         /* Update the device found into the device_count table */
215         rte_fslmc_bus.device_count[dev->dev_type]++;
216
217         /* Add device in the fslmc device list */
218         insert_in_device_list(dev);
219
220         /* Don't need the duplicated device filesystem entry anymore */
221         if (dup_dev_name)
222                 free(dup_dev_name);
223
224         return 0;
225 cleanup:
226         if (dup_dev_name)
227                 free(dup_dev_name);
228         if (dev)
229                 free(dev);
230         return ret;
231 }
232
233 static int
234 rte_fslmc_parse(const char *name, void *addr)
235 {
236         uint16_t dev_id;
237         char *t_ptr;
238         char *sep = NULL;
239         uint8_t sep_exists = 0;
240
241         DPAA2_BUS_DEBUG("Parsing dev=(%s)", name);
242
243         /* There are multiple ways this can be called, with bus:dev, name=dev
244          * or just dev. In all cases, the 'addr' is actually a string.
245          */
246         sep = strchr(name, ':');
247         if (!sep) {
248                 /* check for '=' */
249                 sep = strchr(name, '=');
250                 if (!sep)
251                         sep_exists = 0;
252                 else
253                         sep_exists = 1;
254         } else
255                 sep_exists = 1;
256
257         /* Check if starting part if either of 'fslmc:' or 'name=', separator
258          * exists.
259          */
260         if (sep_exists) {
261                 /* If either of "fslmc" or "name" are starting part */
262                 if (!strncmp(name, RTE_STR(FSLMC_BUS_NAME),
263                              strlen(RTE_STR(FSLMC_BUS_NAME))) ||
264                    (!strncmp(name, "name", strlen("name")))) {
265                         goto jump_out;
266                 } else {
267                         DPAA2_BUS_DEBUG("Invalid device for matching (%s).",
268                                         name);
269                         goto err_out;
270                 }
271         } else
272                 sep = strdup(name);
273
274 jump_out:
275         /* Validate device name */
276         if (strncmp("dpni", sep, 4) &&
277             strncmp("dpseci", sep, 6) &&
278             strncmp("dpcon", sep, 5) &&
279             strncmp("dpbp", sep, 4) &&
280             strncmp("dpio", sep, 4) &&
281             strncmp("dpci", sep, 4) &&
282             strncmp("dpmcp", sep, 5) &&
283             strncmp("dpdmai", sep, 6) &&
284             strncmp("dpdmux", sep, 6)) {
285                 DPAA2_BUS_DEBUG("Unknown or unsupported device (%s)", sep);
286                 goto err_out;
287         }
288
289         t_ptr = strchr(sep, '.');
290         if (!t_ptr || sscanf(t_ptr + 1, "%hu", &dev_id) != 1) {
291                 DPAA2_BUS_ERR("Missing device id in device name (%s)", sep);
292                 goto err_out;
293         }
294
295         if (addr)
296                 strcpy(addr, sep);
297
298         return 0;
299 err_out:
300         if (!sep_exists && sep)
301                 free(sep);
302         return -EINVAL;
303 }
304
305 static int
306 rte_fslmc_scan(void)
307 {
308         int ret;
309         int device_count = 0;
310         char fslmc_dirpath[PATH_MAX];
311         DIR *dir;
312         struct dirent *entry;
313         static int process_once;
314         int groupid;
315
316         if (process_once) {
317                 DPAA2_BUS_DEBUG("Fslmc bus already scanned. Not rescanning");
318                 return 0;
319         }
320         process_once = 1;
321
322         ret = fslmc_get_container_group(&groupid);
323         if (ret != 0)
324                 goto scan_fail;
325
326         /* Scan devices on the group */
327         sprintf(fslmc_dirpath, "%s/%s", SYSFS_FSL_MC_DEVICES, fslmc_container);
328         dir = opendir(fslmc_dirpath);
329         if (!dir) {
330                 DPAA2_BUS_ERR("Unable to open VFIO group directory");
331                 goto scan_fail;
332         }
333
334         while ((entry = readdir(dir)) != NULL) {
335                 if (entry->d_name[0] == '.' || entry->d_type != DT_DIR)
336                         continue;
337
338                 ret = scan_one_fslmc_device(entry->d_name);
339                 if (ret != 0) {
340                         /* Error in parsing directory - exit gracefully */
341                         goto scan_fail_cleanup;
342                 }
343                 device_count += 1;
344         }
345
346         closedir(dir);
347
348         DPAA2_BUS_INFO("FSLMC Bus scan completed");
349         /* If debugging is enabled, device list is dumped to log output */
350         dump_device_list();
351
352         return 0;
353
354 scan_fail_cleanup:
355         closedir(dir);
356
357         /* Remove all devices in the list */
358         cleanup_fslmc_device_list();
359 scan_fail:
360         DPAA2_BUS_DEBUG("FSLMC Bus Not Available. Skipping (%d)", ret);
361         /* Irrespective of failure, scan only return success */
362         return 0;
363 }
364
365 static int
366 rte_fslmc_match(struct rte_dpaa2_driver *dpaa2_drv,
367                 struct rte_dpaa2_device *dpaa2_dev)
368 {
369         if (dpaa2_drv->drv_type == dpaa2_dev->dev_type)
370                 return 0;
371
372         return 1;
373 }
374
375 static int
376 rte_fslmc_probe(void)
377 {
378         int ret = 0;
379         int probe_all;
380
381         struct rte_dpaa2_device *dev;
382         struct rte_dpaa2_driver *drv;
383
384         if (TAILQ_EMPTY(&rte_fslmc_bus.device_list))
385                 return 0;
386
387         ret = fslmc_vfio_setup_group();
388         if (ret) {
389                 DPAA2_BUS_ERR("Unable to setup VFIO %d", ret);
390                 return 0;
391         }
392
393         /* Map existing segments as well as, in case of hotpluggable memory,
394          * install callback handler.
395          */
396         if (rte_eal_process_type() == RTE_PROC_PRIMARY) {
397                 ret = rte_fslmc_vfio_dmamap();
398                 if (ret) {
399                         DPAA2_BUS_ERR("Unable to DMA map existing VAs: (%d)",
400                                       ret);
401                         /* Not continuing ahead */
402                         DPAA2_BUS_ERR("FSLMC VFIO Mapping failed");
403                         return 0;
404                 }
405         }
406
407         ret = fslmc_vfio_process_group();
408         if (ret) {
409                 DPAA2_BUS_ERR("Unable to setup devices %d", ret);
410                 return 0;
411         }
412
413         probe_all = rte_fslmc_bus.bus.conf.scan_mode != RTE_BUS_SCAN_WHITELIST;
414
415         /* In case of PA, the FD addresses returned by qbman APIs are physical
416          * addresses, which need conversion into equivalent VA address for
417          * rte_mbuf. For that, a table (a serial array, in memory) is used to
418          * increase translation efficiency.
419          * This has to be done before probe as some device initialization
420          * (during) probe allocate memory (dpaa2_sec) which needs to be pinned
421          * to this table.
422          *
423          * Error is ignored as relevant logs are handled within dpaax and
424          * handling for unavailable dpaax table too is transparent to caller.
425          *
426          * And, the IOVA table is only applicable in case of PA mode.
427          */
428         if (rte_eal_iova_mode() == RTE_IOVA_PA)
429                 dpaax_iova_table_populate();
430
431         TAILQ_FOREACH(dev, &rte_fslmc_bus.device_list, next) {
432                 TAILQ_FOREACH(drv, &rte_fslmc_bus.driver_list, next) {
433                         ret = rte_fslmc_match(drv, dev);
434                         if (ret)
435                                 continue;
436
437                         if (!drv->probe)
438                                 continue;
439
440                         if (rte_dev_is_probed(&dev->device))
441                                 continue;
442
443                         if (dev->device.devargs &&
444                           dev->device.devargs->policy == RTE_DEV_BLACKLISTED) {
445                                 DPAA2_BUS_LOG(DEBUG, "%s Blacklisted, skipping",
446                                               dev->device.name);
447                                 continue;
448                         }
449
450                         if (probe_all ||
451                            (dev->device.devargs &&
452                            dev->device.devargs->policy ==
453                            RTE_DEV_WHITELISTED)) {
454                                 ret = drv->probe(drv, dev);
455                                 if (ret) {
456                                         DPAA2_BUS_ERR("Unable to probe");
457                                 } else {
458                                         dev->driver = drv;
459                                         dev->device.driver = &drv->driver;
460                                 }
461                         }
462                         break;
463                 }
464         }
465
466         if (rte_eal_iova_mode() == RTE_IOVA_VA)
467                 dpaa2_virt_mode = 1;
468
469         return 0;
470 }
471
472 static struct rte_device *
473 rte_fslmc_find_device(const struct rte_device *start, rte_dev_cmp_t cmp,
474                       const void *data)
475 {
476         const struct rte_dpaa2_device *dstart;
477         struct rte_dpaa2_device *dev;
478
479         DPAA2_BUS_DEBUG("Finding a device named %s\n", (const char *)data);
480
481         /* find_device is always called with an opaque object which should be
482          * passed along to the 'cmp' function iterating over all device obj
483          * on the bus.
484          */
485
486         if (start != NULL) {
487                 dstart = RTE_DEV_TO_FSLMC_CONST(start);
488                 dev = TAILQ_NEXT(dstart, next);
489         } else {
490                 dev = TAILQ_FIRST(&rte_fslmc_bus.device_list);
491         }
492         while (dev != NULL) {
493                 if (cmp(&dev->device, data) == 0) {
494                         DPAA2_BUS_DEBUG("Found device (%s)\n",
495                                         dev->device.name);
496                         return &dev->device;
497                 }
498                 dev = TAILQ_NEXT(dev, next);
499         }
500
501         return NULL;
502 }
503
504 /*register a fslmc bus based dpaa2 driver */
505 void
506 rte_fslmc_driver_register(struct rte_dpaa2_driver *driver)
507 {
508         RTE_VERIFY(driver);
509
510         TAILQ_INSERT_TAIL(&rte_fslmc_bus.driver_list, driver, next);
511         /* Update Bus references */
512         driver->fslmc_bus = &rte_fslmc_bus;
513 }
514
515 /*un-register a fslmc bus based dpaa2 driver */
516 void
517 rte_fslmc_driver_unregister(struct rte_dpaa2_driver *driver)
518 {
519         struct rte_fslmc_bus *fslmc_bus;
520
521         fslmc_bus = driver->fslmc_bus;
522
523         /* Cleanup the PA->VA Translation table; From whereever this function
524          * is called from.
525          */
526         if (rte_eal_iova_mode() == RTE_IOVA_PA)
527                 dpaax_iova_table_depopulate();
528
529         TAILQ_REMOVE(&fslmc_bus->driver_list, driver, next);
530         /* Update Bus references */
531         driver->fslmc_bus = NULL;
532 }
533
534 /*
535  * All device has iova as va
536  */
537 static inline int
538 fslmc_all_device_support_iova(void)
539 {
540         int ret = 0;
541         struct rte_dpaa2_device *dev;
542         struct rte_dpaa2_driver *drv;
543
544         TAILQ_FOREACH(dev, &rte_fslmc_bus.device_list, next) {
545                 TAILQ_FOREACH(drv, &rte_fslmc_bus.driver_list, next) {
546                         ret = rte_fslmc_match(drv, dev);
547                         if (ret)
548                                 continue;
549                         /* if the driver is not supporting IOVA */
550                         if (!(drv->drv_flags & RTE_DPAA2_DRV_IOVA_AS_VA))
551                                 return 0;
552                 }
553         }
554         return 1;
555 }
556
557 /*
558  * Get iommu class of DPAA2 devices on the bus.
559  */
560 static enum rte_iova_mode
561 rte_dpaa2_get_iommu_class(void)
562 {
563         bool is_vfio_noiommu_enabled = 1;
564         bool has_iova_va;
565
566         if (TAILQ_EMPTY(&rte_fslmc_bus.device_list))
567                 return RTE_IOVA_DC;
568
569 #ifdef RTE_LIBRTE_DPAA2_USE_PHYS_IOVA
570         return RTE_IOVA_PA;
571 #endif
572
573         /* check if all devices on the bus support Virtual addressing or not */
574         has_iova_va = fslmc_all_device_support_iova();
575
576 #ifdef VFIO_PRESENT
577         is_vfio_noiommu_enabled = rte_vfio_noiommu_is_enabled() == true ?
578                                                 true : false;
579 #endif
580
581         if (has_iova_va && !is_vfio_noiommu_enabled)
582                 return RTE_IOVA_VA;
583
584         return RTE_IOVA_PA;
585 }
586
587 static int
588 fslmc_bus_plug(struct rte_device *dev __rte_unused)
589 {
590         /* No operation is performed while plugging the device */
591         return 0;
592 }
593
594 static int
595 fslmc_bus_unplug(struct rte_device *dev __rte_unused)
596 {
597         /* No operation is performed while unplugging the device */
598         return 0;
599 }
600
601 static void *
602 fslmc_bus_dev_iterate(const void *start, const char *str,
603                       const struct rte_dev_iterator *it __rte_unused)
604 {
605         const struct rte_dpaa2_device *dstart;
606         struct rte_dpaa2_device *dev;
607         char *dup, *dev_name = NULL;
608
609         /* Expectation is that device would be name=device_name */
610         if (strncmp(str, "name=", 5) != 0) {
611                 DPAA2_BUS_DEBUG("Invalid device string (%s)\n", str);
612                 return NULL;
613         }
614
615         /* Now that name=device_name format is available, split */
616         dup = strdup(str);
617         dev_name = dup + strlen("name=");
618
619         if (start != NULL) {
620                 dstart = RTE_DEV_TO_FSLMC_CONST(start);
621                 dev = TAILQ_NEXT(dstart, next);
622         } else {
623                 dev = TAILQ_FIRST(&rte_fslmc_bus.device_list);
624         }
625
626         while (dev != NULL) {
627                 if (strcmp(dev->device.name, dev_name) == 0) {
628                         free(dup);
629                         return &dev->device;
630                 }
631                 dev = TAILQ_NEXT(dev, next);
632         }
633
634         free(dup);
635         return NULL;
636 }
637
/* The fslmc bus instance: wires the bus callbacks defined in this file and
 * starts with empty device and driver lists and zeroed device counters.
 */
struct rte_fslmc_bus rte_fslmc_bus = {
        .bus = {
                .scan = rte_fslmc_scan,
                .probe = rte_fslmc_probe,
                .parse = rte_fslmc_parse,
                .find_device = rte_fslmc_find_device,
                .get_iommu_class = rte_dpaa2_get_iommu_class,
                .plug = fslmc_bus_plug,
                .unplug = fslmc_bus_unplug,
                .dev_iterate = fslmc_bus_dev_iterate,
        },
        .device_list = TAILQ_HEAD_INITIALIZER(rte_fslmc_bus.device_list),
        .driver_list = TAILQ_HEAD_INITIALIZER(rte_fslmc_bus.driver_list),
        .device_count = {0},
};

/* Register the bus under the name given by FSLMC_BUS_NAME */
RTE_REGISTER_BUS(FSLMC_BUS_NAME, rte_fslmc_bus.bus);
655
656 RTE_INIT(fslmc_init_log)
657 {
658         /* Bus level logs */
659         dpaa2_logtype_bus = rte_log_register("bus.fslmc");
660         if (dpaa2_logtype_bus >= 0)
661                 rte_log_set_level(dpaa2_logtype_bus, RTE_LOG_NOTICE);
662 }