4 * Copyright(c) 2010-2015 Intel Corporation. All rights reserved.
5 * Copyright 2013-2014 6WIND S.A.
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
12 * * Redistributions of source code must retain the above copyright
13 * notice, this list of conditions and the following disclaimer.
14 * * Redistributions in binary form must reproduce the above copyright
15 * notice, this list of conditions and the following disclaimer in
16 * the documentation and/or other materials provided with the
18 * * Neither the name of Intel Corporation nor the names of its
19 * contributors may be used to endorse or promote products derived
20 * from this software without specific prior written permission.
22 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
23 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
24 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
25 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
26 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
27 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
28 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
29 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
30 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
31 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
32 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
52 #include <sys/queue.h>
56 #include <rte_debug.h>
57 #include <rte_interrupts.h>
61 /** Pathname of PCI devices directory. */
62 const char *pci_get_sysfs_path(void);
64 /** Formatting string for PCI device identifier: Ex: 0000:00:01.0 */
65 #define PCI_PRI_FMT "%.4" PRIx16 ":%.2" PRIx8 ":%.2" PRIx8 ".%" PRIx8
/**
 * Size in bytes of a buffer holding a formatted PCI device identifier,
 * including the terminating NUL (sizeof of a string literal counts it).
 * The template reserves eight hex digits for the domain, although
 * PCI_PRI_FMT only pads the domain to four digits.
 */
66 #define PCI_PRI_STR_SIZE sizeof("XXXXXXXX:XX:XX.X")
68 /** Short formatting string, without domain, for PCI device: Ex: 00:01.0 */
69 #define PCI_SHORT_PRI_FMT "%.2" PRIx8 ":%.2" PRIx8 ".%" PRIx8
71 /** Nb. of values in PCI device identifier format string. */
72 #define PCI_FMT_NVAL 4
74 /** Nb. of values in PCI resource format. */
75 #define PCI_RESOURCE_FMT_NVAL 3
77 /** Maximum number of PCI resources. */
78 #define PCI_MAX_RESOURCE 6
80 /* Forward declarations */
81 struct rte_pci_device;
82 struct rte_pci_driver;
84 /** List of PCI devices */
85 TAILQ_HEAD(rte_pci_device_list, rte_pci_device);
86 /** List of PCI drivers */
87 TAILQ_HEAD(rte_pci_driver_list, rte_pci_driver);
89 /* PCI Bus iterators */
90 #define FOREACH_DEVICE_ON_PCIBUS(p) \
91 TAILQ_FOREACH(p, &(rte_pci_bus.device_list), next)
93 #define FOREACH_DRIVER_ON_PCIBUS(p) \
94 TAILQ_FOREACH(p, &(rte_pci_bus.driver_list), next)
97 * A structure describing an ID for a PCI driver. Each driver provides a
98 * table of these IDs for each device that it supports.
101 uint32_t class_id; /**< Class ID (class, subclass, pi) or RTE_CLASS_ANY_ID. */
102 uint16_t vendor_id; /**< Vendor ID or PCI_ANY_ID. */
103 uint16_t device_id; /**< Device ID or PCI_ANY_ID. */
104 uint16_t subsystem_vendor_id; /**< Subsystem vendor ID or PCI_ANY_ID. */
105 uint16_t subsystem_device_id; /**< Subsystem device ID or PCI_ANY_ID. */
109 * A structure describing the location of a PCI device.
111 struct rte_pci_addr {
112 uint32_t domain; /**< Domain number (first field of the printed address). */
113 uint8_t bus; /**< Bus number. */
114 uint8_t devid; /**< Device number on the bus; this is a position, not the device_id of struct rte_pci_id. */
115 uint8_t function; /**< Function number (last field of the printed address). */
121 * A structure describing a PCI device.
123 struct rte_pci_device {
124 TAILQ_ENTRY(rte_pci_device) next; /**< Linkage to the next probed PCI device. */
125 struct rte_device device; /**< Embedded core device; RTE_DEV_TO_PCI() maps a pointer to it back to this structure. */
126 struct rte_pci_addr addr; /**< PCI location (domain, bus, devid, function). */
127 struct rte_pci_id id; /**< PCI ID (class, vendor, device and subsystem IDs). */
128 struct rte_mem_resource mem_resource[PCI_MAX_RESOURCE];
129 /**< PCI memory resources, PCI_MAX_RESOURCE entries. */
130 struct rte_intr_handle intr_handle; /**< Interrupt handle. */
131 struct rte_pci_driver *driver; /**< Associated driver. */
132 uint16_t max_vfs; /**< SR-IOV is enabled if not zero. */
133 enum rte_kernel_driver kdrv; /**< Kernel driver passthrough. */
134 char name[PCI_PRI_STR_SIZE+1]; /**< PCI location as ASCII text; one byte larger than PCI_PRI_STR_SIZE. */
139 * Helper macro for drivers that need to convert to struct rte_pci_device.
141 #define RTE_DEV_TO_PCI(ptr) container_of(ptr, struct rte_pci_device, device)
143 /** Wildcard for the 16-bit ID fields of struct rte_pci_id (vendor, device, subsystem vendor, subsystem device). */
144 #define PCI_ANY_ID (0xffff)
/** Wildcard for the class_id field of struct rte_pci_id (class, subclass, pi); the low 24 bits are all set. */
145 #define RTE_CLASS_ANY_ID (0xffffff)
148 /** C++ macro used to help build tables of device IDs */
149 #define RTE_PCI_DEVICE(vend, dev) \
156 /** Macro used to help build tables of device IDs */
157 #define RTE_PCI_DEVICE(vend, dev) \
158 .class_id = RTE_CLASS_ANY_ID, \
159 .vendor_id = (vend), \
160 .device_id = (dev), \
161 .subsystem_vendor_id = PCI_ANY_ID, \
162 .subsystem_device_id = PCI_ANY_ID
166 * Initialisation function for the driver called during PCI probing.
168 typedef int (pci_probe_t)(struct rte_pci_driver *, struct rte_pci_device *);
171 * Uninitialisation function for the driver called during hotplugging.
173 typedef int (pci_remove_t)(struct rte_pci_device *);
176 * A structure describing a PCI driver.
178 struct rte_pci_driver {
179 TAILQ_ENTRY(rte_pci_driver) next; /**< Linkage to the next driver in the list. */
180 struct rte_driver driver; /**< Embedded core driver. */
181 struct rte_pci_bus *bus; /**< PCI bus reference. */
182 pci_probe_t *probe; /**< Device probe function, called during PCI probing. */
183 pci_remove_t *remove; /**< Device remove function, called during hotplugging. */
184 const struct rte_pci_id *id_table; /**< ID table, NULL terminated. */
185 uint32_t drv_flags; /**< Flags controlling handling of device (presumably RTE_PCI_DRV_* bits - confirm). */
189 * Structure describing the PCI bus
192 struct rte_bus bus; /**< Inherit the generic class */
193 struct rte_pci_device_list device_list; /**< List of PCI devices */
194 struct rte_pci_driver_list driver_list; /**< List of PCI drivers */
197 /** Device needs PCI BAR mapping (done with either IGB_UIO or VFIO) */
198 #define RTE_PCI_DRV_NEED_MAPPING 0x0001
199 /** Device driver supports link state interrupt */
200 #define RTE_PCI_DRV_INTR_LSC 0x0008
201 /** Device driver supports device removal interrupt */
202 #define RTE_PCI_DRV_INTR_RMV 0x0010
203 /** Device driver needs to keep mapped resources if unsupported dev detected */
204 #define RTE_PCI_DRV_KEEP_MAPPED_RES 0x0020
205 /** Device driver supports IOVA as VA */
206 #define RTE_PCI_DRV_IOVA_AS_VA 0X0040
209 * A structure describing a PCI mapping.
220 * A structure describing a mapped PCI resource.
221 * For multi-process we need to reproduce all PCI mappings in secondary
222 * processes, so save them in a tailq.
224 struct mapped_pci_resource {
225 TAILQ_ENTRY(mapped_pci_resource) next;
227 struct rte_pci_addr pci_addr;
230 struct pci_map maps[PCI_MAX_RESOURCE];
233 /** mapped pci device list */
234 TAILQ_HEAD(mapped_pci_res_list, mapped_pci_resource);
236 /**
 * Internal use only - macro used by the PCI address parsing functions.
 *
 * Parses one hexadecimal field of a PCI address with strtoul() (base 16).
 * The field is rejected when strtoul() reports an error through errno, when
 * the character following the parsed digits is not dlm, or when the value is
 * greater than lim. An accepted value is stored in fd, cast to the type of
 * fd.
 *
 * in:  string to parse.
 * fd:  lvalue that receives the parsed value.
 * lim: largest value accepted for the field.
 * dlm: character expected right after the field (0 for end of string).
 *
 * NOTE(review): the checks shown never compare end with in, so a field with
 * no digits looks like it would be accepted as 0 - confirm.
 */
237 #define GET_PCIADDR_FIELD(in, fd, lim, dlm) \
242 val = strtoul((in), &end, 16); \
243 if (errno != 0 || end[0] != (dlm) || val > (lim)) \
245 (fd) = (typeof (fd))val; \
250 * Utility function to produce a PCI Bus-Device-Function value
251 * given a string representation. Assumes that the BDF is provided without
252 * a domain prefix (i.e. domain returned is always 0)
255 * The input string to be parsed. Should have the format XX:XX.X
257 * The PCI Bus-Device-Function address to be returned. Domain will always be
260 * 0 on success, negative on error.
263 eal_parse_pci_BDF(const char *input, struct rte_pci_addr *dev_addr)
/* The domain is never read from the input; it is forced to 0 up front. */
265 dev_addr->domain = 0;
/*
 * Bus, devid and function are parsed in that order as hexadecimal fields,
 * expecting ':' after the bus and '.' after the devid. Each field is capped
 * only by the range of its uint8_t destination.
 * NOTE(review): PCI device and function numbers are normally narrower than
 * 8 bits - confirm whether tighter limits are wanted.
 */
266 GET_PCIADDR_FIELD(input, dev_addr->bus, UINT8_MAX, ':');
267 GET_PCIADDR_FIELD(input, dev_addr->devid, UINT8_MAX, '.');
/* A delimiter of 0 requires the string to end right after the function. */
268 GET_PCIADDR_FIELD(input, dev_addr->function, UINT8_MAX, 0);
273 * Utility function to produce a PCI Bus-Device-Function value
274 * given a string representation. Assumes that the BDF is provided including
278 * The input string to be parsed. Should have the format XXXX:XX:XX.X
280 * The PCI Bus-Device-Function address to be returned
282 * 0 on success, negative on error.
285 eal_parse_pci_DomBDF(const char *input, struct rte_pci_addr *dev_addr)
/*
 * The four invocations parse domain, bus, devid and function in that order,
 * expecting ':', ':', '.' and end of string after them respectively.
 *
 * NOTE(review): the domain is limited to UINT16_MAX here, while
 * rte_pci_addr.domain is a uint32_t and PCI_PRI_STR_SIZE leaves room for
 * eight hex digits - confirm the 16-bit cap is intended.
 */
287 GET_PCIADDR_FIELD(input, dev_addr->domain, UINT16_MAX, ':');
288 GET_PCIADDR_FIELD(input, dev_addr->bus, UINT8_MAX, ':');
289 GET_PCIADDR_FIELD(input, dev_addr->devid, UINT8_MAX, '.');
290 GET_PCIADDR_FIELD(input, dev_addr->function, UINT8_MAX, 0);
293 #undef GET_PCIADDR_FIELD
296 * Utility function to write a pci device name, this device name can later be
297 * used to retrieve the corresponding rte_pci_addr using eal_parse_pci_*
301 * The PCI Bus-Device-Function address
303 * The output buffer string
305 * The output buffer size
308 rte_pci_device_name(const struct rte_pci_addr *addr,
309 char *output, size_t size)
/* The caller's buffer must hold a full identifier, terminating NUL included. */
311 RTE_VERIFY(size >= PCI_PRI_STR_SIZE);
/*
 * Writes domain:bus:devid.function into output. Only a negative snprintf()
 * result is treated as a failure; the returned length is not compared with
 * size.
 * NOTE(review): PCI_PRI_FMT formats the domain with PRIx16 while
 * addr->domain is a uint32_t - confirm the conversion specifier is intended.
 */
312 RTE_VERIFY(snprintf(output, size, PCI_PRI_FMT,
313 addr->domain, addr->bus,
314 addr->devid, addr->function) >= 0);
317 /* Compare two PCI device addresses. */
319 * Utility function to compare two PCI device addresses.
322 * The PCI Bus-Device-Function address to compare
324 * The PCI Bus-Device-Function address to compare
326 * 0 on equal PCI address.
327 * Positive if addr is greater than addr2.
328 * Negative if addr is less than addr2, or on error.
331 rte_eal_compare_pci_addr(const struct rte_pci_addr *addr,
332 const struct rte_pci_addr *addr2)
334 uint64_t dev_addr, dev_addr2;
/* NULL arguments are checked before either address is dereferenced. */
336 if ((addr == NULL) || (addr2 == NULL))
/*
 * Fold each address into one 64-bit key: function in bits 0-7, devid in
 * bits 8-15, bus in bits 16-23 and domain from bit 24 upwards. The domain is
 * widened to uint64_t before the shift so that none of its 32 bits are lost.
 */
339 dev_addr = ((uint64_t)addr->domain << 24) |
340 (addr->bus << 16) | (addr->devid << 8) | addr->function;
341 dev_addr2 = ((uint64_t)addr2->domain << 24) |
342 (addr2->bus << 16) | (addr2->devid << 8) | addr2->function;
/*
 * Comparing the keys as integers orders addresses by domain first, then bus,
 * then devid, then function.
 */
344 if (dev_addr > dev_addr2)
346 else if (dev_addr < dev_addr2)
353 * Scan the content of the PCI bus, and the devices in the devices
357 * 0 on success, negative on error
359 int rte_pci_scan(void);
372 * Match the PCI Driver and Device using the ID Table
375 * PCI driver from which ID table would be extracted
377 * PCI device to match against the driver
379 * 1 for successful match
380 * 0 for unsuccessful match
383 rte_pci_match(const struct rte_pci_driver *pci_drv,
384 const struct rte_pci_device *pci_dev);
388 * Get iommu class of PCI devices on the bus.
389 * And return their preferred iova mapping mode.
392 * - enum rte_iova_mode.
395 rte_pci_get_iommu_class(void);
398 * Map the PCI device resources in user space virtual memory address
400 * Note that driver should not call this function when flag
401 * RTE_PCI_DRV_NEED_MAPPING is set, as EAL will do that for
405 * A pointer to a rte_pci_device structure describing the device
409 * 0 on success, negative on error and positive if no driver
410 * is found for the device.
412 int rte_pci_map_device(struct rte_pci_device *dev);
418 * A pointer to a rte_pci_device structure describing the device
421 void rte_pci_unmap_device(struct rte_pci_device *dev);
425 * Map a particular resource from a file.
427 * @param requested_addr
428 * The starting address for the new mapping range.
430 * The file descriptor.
432 * The offset for the mapping range.
434 * The size for the mapping range.
435 * @param additional_flags
436 * The additional flags for the mapping range.
438 * - On success, the function returns a pointer to the mapped area.
439 * - On error, the value MAP_FAILED is returned.
441 void *pci_map_resource(void *requested_addr, int fd, off_t offset,
442 size_t size, int additional_flags);
446 * Unmap a particular resource.
448 * @param requested_addr
449 * The address for the unmapping range.
451 * The size for the unmapping range.
453 void pci_unmap_resource(void *requested_addr, size_t size);
456 * Probe the single PCI device.
458 * Scan the content of the PCI bus, and find the pci device specified by pci
459 * address, then call the probe() function for registered driver that has a
460 * matching entry in its id_table for discovered device.
463 * The PCI Bus-Device-Function address to probe.
466 * - Negative on error.
468 int rte_pci_probe_one(const struct rte_pci_addr *addr);
471 * Close the single PCI device.
473 * Scan the content of the PCI bus, and find the pci device specified by pci
474 * address, then call the remove() function for registered driver that has a
475 * matching entry in its id_table for discovered device.
478 * The PCI Bus-Device-Function address to close.
481 * - Negative on error.
483 int rte_pci_detach(const struct rte_pci_addr *addr);
486 * Dump the content of the PCI bus.
489 * A pointer to a file for output
491 void rte_pci_dump(FILE *f);
494 * Register a PCI driver.
497 * A pointer to a rte_pci_driver structure describing the driver
500 void rte_pci_register(struct rte_pci_driver *driver);
502 /** Helper for PCI device registration from driver (eth, crypto) instance */
503 #define RTE_PMD_REGISTER_PCI(nm, pci_drv) \
504 RTE_INIT(pciinitfn_ ##nm); \
505 static void pciinitfn_ ##nm(void) \
507 (pci_drv).driver.name = RTE_STR(nm);\
508 rte_pci_register(&pci_drv); \
510 RTE_PMD_EXPORT_NAME(nm, __COUNTER__)
513 * Unregister a PCI driver.
516 * A pointer to a rte_pci_driver structure describing the driver
517 * to be unregistered.
519 void rte_pci_unregister(struct rte_pci_driver *driver);
522 * Read PCI config space.
525 * A pointer to a rte_pci_device structure describing the device
528 * A data buffer where the bytes should be read into
530 * The length of the data buffer.
532 * The offset into PCI config space
534 int rte_pci_read_config(const struct rte_pci_device *device,
535 void *buf, size_t len, off_t offset);
538 * Write PCI config space.
541 * A pointer to a rte_pci_device structure describing the device
544 * A data buffer containing the bytes that should be written
546 * The length of the data buffer.
548 * The offset into PCI config space
550 int rte_pci_write_config(const struct rte_pci_device *device,
551 const void *buf, size_t len, off_t offset);
554 * A structure used to access io resources for a pci device.
555 * rte_pci_ioport is arch, os, driver specific, and should not be used outside
558 struct rte_pci_ioport {
559 struct rte_pci_device *dev;
561 uint64_t len; /* only filled for memory mapped ports */
565 * Initialize a rte_pci_ioport object for a pci device io resource.
567 * This object is then used to gain access to those io resources (see below).
570 * A pointer to a rte_pci_device structure describing the device
573 * Index of the io pci resource we want to access.
575 * The rte_pci_ioport object to be initialized.
577 * 0 on success, negative on error.
579 int rte_pci_ioport_map(struct rte_pci_device *dev, int bar,
580 struct rte_pci_ioport *p);
583 * Release any resources used in a rte_pci_ioport object.
586 * The rte_pci_ioport object to be uninitialized.
588 * 0 on success, negative on error.
590 int rte_pci_ioport_unmap(struct rte_pci_ioport *p);
593 * Read from an I/O PCI resource.
596 * The rte_pci_ioport object from which we want to read.
598 * A data buffer where the bytes should be read into
600 * The length of the data buffer.
602 * The offset into the pci io resource.
604 void rte_pci_ioport_read(struct rte_pci_ioport *p,
605 void *data, size_t len, off_t offset);
608 * Write to an I/O PCI resource.
611 * The rte_pci_ioport object to which we want to write.
613 * A data buffer containing the bytes to be written
615 * The length of the data buffer.
617 * The offset into the pci io resource.
619 void rte_pci_ioport_write(struct rte_pci_ioport *p,
620 const void *data, size_t len, off_t offset);
626 #endif /* _RTE_PCI_H_ */