-/*-
- * BSD LICENSE
- *
- * Copyright(c) 2010-2014 Intel Corporation. All rights reserved.
- * All rights reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions
- * are met:
- *
- * * Redistributions of source code must retain the above copyright
- * notice, this list of conditions and the following disclaimer.
- * * Redistributions in binary form must reproduce the above copyright
- * notice, this list of conditions and the following disclaimer in
- * the documentation and/or other materials provided with the
- * distribution.
- * * Neither the name of Intel Corporation nor the names of its
- * contributors may be used to endorse or promote products derived
- * from this software without specific prior written permission.
- *
- * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
- * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
- * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
- * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
- * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
- * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
- * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
- * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
- * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
- * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(c) 2010-2018 Intel Corporation
*/
#ifndef _EAL_PRIVATE_H_
#include <stdbool.h>
#include <stdint.h>
#include <stdio.h>
-#include <rte_pci.h>
+
+#include <rte_dev.h>
+#include <rte_lcore.h>
+#include <rte_memory.h>
+
+/**
+ * Structure storing the internal per-lcore configuration: thread
+ * identifier, master/slave communication pipes, the function to call
+ * together with its argument and return value, the lcore state, and
+ * placement information (socket, core, role, cpuset).
+ */
+struct lcore_config {
+ pthread_t thread_id; /**< pthread identifier */
+ int pipe_master2slave[2]; /**< communication pipe, master to slave */
+ int pipe_slave2master[2]; /**< communication pipe, slave to master */
+
+ lcore_function_t * volatile f; /**< function to call */
+ void * volatile arg; /**< argument of the function */
+ volatile int ret; /**< return value of the function */
+
+ volatile enum rte_lcore_state_t state; /**< lcore state */
+ unsigned int socket_id; /**< physical socket id for this lcore */
+ unsigned int core_id; /**< core number on socket for this lcore */
+ int core_index; /**< relative index, starting from 0 */
+ uint8_t core_role; /**< role of core, e.g. OFF, RTE, SERVICE */
+
+ rte_cpuset_t cpuset; /**< CPU set this lcore has affinity to */
+};
+
+/** Per-lcore configuration array (RTE_MAX_LCORE entries); declared here, defined elsewhere. */
+extern struct lcore_config lcore_config[RTE_MAX_LCORE];
+
+/**
+ * The global RTE configuration structure.
+ *
+ * Holds lcore and NUMA node bookkeeping, the process type, the IOVA mode
+ * and a pointer to the memory configuration. The structure is declared
+ * with __rte_packed.
+ */
+struct rte_config {
+ uint32_t master_lcore; /**< Id of the master lcore. */
+ uint32_t lcore_count; /**< Number of available logical cores. */
+ uint32_t numa_node_count; /**< Number of detected NUMA nodes. */
+ uint32_t numa_nodes[RTE_MAX_NUMA_NODES]; /**< List of detected NUMA nodes. */
+ uint32_t service_lcore_count;/**< Number of available service cores. */
+ enum rte_lcore_role_t lcore_role[RTE_MAX_LCORE]; /**< Role of each lcore. */
+
+ /** Process type: primary or secondary. */
+ enum rte_proc_type_t process_type;
+
+ /** IOVA mapping mode: PA or VA. */
+ enum rte_iova_mode iova_mode;
+
+ /**
+ * Pointer to the memory configuration, which may be shared across
+ * multiple DPDK instances.
+ */
+ struct rte_mem_config *mem_config;
+} __rte_packed;
+
+/**
+ * Get the global configuration structure.
+ *
+ * @return
+ * A pointer to the global configuration structure.
+ */
+struct rte_config *rte_eal_get_configuration(void);
/**
* Initialize the memzone subsystem (private to eal).
*/
int rte_eal_cpu_init(void);
+/**
+ * Create memseg lists
+ *
+ * This function is private to EAL.
+ *
+ * Preallocate virtual memory.
+ *
+ * @return
+ * 0 on success, negative on error
+ */
+int rte_eal_memseg_init(void);
+
/**
* Map memory
*
*/
int rte_eal_log_init(const char *id, int facility);
-struct rte_pci_driver;
-struct rte_pci_device;
+/**
+ * Save the log regexp for later
+ */
+int rte_log_save_regexp(const char *type, int priority);
+int rte_log_save_pattern(const char *pattern, int priority);
/**
- * Probe the PCI bus
+ * Init tail queues for non-EAL library structures. This is to allow
+ * the rings, mempools, etc. lists to be shared among multiple processes
+ *
+ * This function is private to EAL
*
* @return
- * - 0 on success.
- * - !0 on error.
+ * 0 on success, negative on error
*/
-int
-rte_pci_probe(void);
+int rte_eal_tailqs_init(void);
/**
- * Scan the content of the PCI bus, and the devices in the devices
- * list
+ * Init interrupt handling.
+ *
+ * This function is private to EAL.
*
* @return
* 0 on success, negative on error
*/
-int rte_pci_scan(void);
+int rte_eal_intr_init(void);
/**
- * Probe the single PCI device.
+ * Init alarm mechanism. This allows a callback to be called after
+ * a specific time.
*
- * Scan the content of the PCI bus, and find the pci device specified by pci
- * address, then call the probe() function for registered driver that has a
- * matching entry in its id_table for discovered device.
+ * This function is private to EAL.
*
- * @param addr
- * The PCI Bus-Device-Function address to probe.
* @return
- * - 0 on success.
- * - Negative on error.
+ * 0 on success, negative on error
*/
-int rte_pci_probe_one(const struct rte_pci_addr *addr);
+int rte_eal_alarm_init(void);
/**
- * Close the single PCI device.
+ * Check whether a kernel module (e.g. vfio, vfio_iommu_type1)
+ * is loaded.
*
- * Scan the content of the PCI bus, and find the pci device specified by pci
- * address, then call the remove() function for registered driver that has a
- * matching entry in its id_table for discovered device.
+ * @param module_name
+ * Name of the module to check.
*
- * @param addr
- * The PCI Bus-Device-Function address to close.
* @return
- * - 0 on success.
- * - Negative on error.
+ * -1 if an error occurred (NULL pointer or open failure)
+ * 0 if the module is not loaded
+ * 1 if the module is loaded
*/
-int rte_pci_detach(const struct rte_pci_addr *addr);
+int rte_eal_check_module(const char *module_name);
/**
- * Find the name of a PCI device.
+ * Memory reservation flags.
*/
-void pci_name_set(struct rte_pci_device *dev);
+enum eal_mem_reserve_flags {
+ /**
+ * Reserve hugepages. May be unsupported by some platforms.
+ */
+ EAL_RESERVE_HUGEPAGES = 1 << 0,
+ /**
+ * Force reserving memory at the requested address.
+ * This can be a destructive action depending on the implementation.
+ *
+ * @see RTE_MAP_FORCE_ADDRESS for description of possible consequences
+ * (although implementations are not required to use it).
+ */
+ EAL_RESERVE_FORCE_ADDRESS = 1 << 1
+};
/**
- * Add a PCI device to the PCI Bus (append to PCI Device list). This function
- * also updates the bus references of the PCI Device (and the generic device
- * object embedded within.
+ * Get virtual area of specified size from the OS.
+ *
+ * This function is private to the EAL.
+ *
+ * @param requested_addr
+ * Address where to request address space.
+ * @param size
+ * Size of requested area.
+ * @param page_sz
+ * Page size on which to align requested virtual area.
+ * @param flags
+ * EAL_VIRTUAL_AREA_* flags.
+ * @param reserve_flags
+ * Extra flags passed directly to eal_mem_reserve().
*
- * @param pci_dev
- * PCI device to add
- * @return void
+ * @return
+ * Virtual area address if successful.
+ * NULL if unsuccessful.
+ */
+
+#define EAL_VIRTUAL_AREA_ADDR_IS_HINT (1 << 0)
+/**< don't fail if cannot get exact requested address. */
+#define EAL_VIRTUAL_AREA_ALLOW_SHRINK (1 << 1)
+/**< try getting smaller sized (decrement by page size) virtual areas if cannot
+ * get area of requested size.
+ */
+#define EAL_VIRTUAL_AREA_UNMAP (1 << 2)
+/**< immediately unmap reserved virtual area. */
+void *
+eal_get_virtual_area(void *requested_addr, size_t *size,
+ size_t page_sz, int flags, int reserve_flags);
+
+/**
+ * Initialize a memory segment list and create its backing storage.
+ *
+ * @param msl
+ * Memory segment list to be filled.
+ * @param name
+ * Name for the backing storage.
+ * @param page_sz
+ * Size of segment pages in the MSL.
+ * @param n_segs
+ * Number of segments.
+ * @param socket_id
+ * Socket ID. Must not be SOCKET_ID_ANY.
+ * @param heap
+ * Mark MSL as pointing to a heap.
+ * @return
+ * 0 on success, (-1) on failure and rte_errno is set.
*/
-void rte_pci_add_device(struct rte_pci_device *pci_dev);
+int
+eal_memseg_list_init_named(struct rte_memseg_list *msl, const char *name,
+ uint64_t page_sz, int n_segs, int socket_id, bool heap);
/**
- * Insert a PCI device in the PCI Bus at a particular location in the device
- * list. It also updates the PCI Bus reference of the new devices to be
- * inserted.
+ * Initialize memory segment list and create its backing storage
+ * with a name corresponding to MSL parameters.
*
- * @param exist_pci_dev
- * Existing PCI device in PCI Bus
- * @param new_pci_dev
- * PCI device to be added before exist_pci_dev
- * @return void
+ * @param type_msl_idx
+ * Index of the MSL among other MSLs of the same socket and page size.
+ *
+ * @see eal_memseg_list_init_named for remaining parameters description.
*/
-void rte_pci_insert_device(struct rte_pci_device *exist_pci_dev,
- struct rte_pci_device *new_pci_dev);
+int
+eal_memseg_list_init(struct rte_memseg_list *msl, uint64_t page_sz,
+ int n_segs, int socket_id, int type_msl_idx, bool heap);
/**
- * Remove a PCI device from the PCI Bus. This sets to NULL the bus references
- * in the PCI device object as well as the generic device object.
+ * Reserve VA space for a memory segment list
+ * previously initialized with eal_memseg_list_init().
*
- * @param pci_device
- * PCI device to be removed from PCI Bus
- * @return void
+ * @param msl
+ * Initialized memory segment list with page size defined.
+ * @param reserve_flags
+ * Extra memory reservation flags. Can be 0 if unnecessary.
+ * @return
+ * 0 on success, (-1) on failure and rte_errno is set.
*/
-void rte_pci_remove_device(struct rte_pci_device *pci_device);
+int
+eal_memseg_list_alloc(struct rte_memseg_list *msl, int reserve_flags);
/**
- * Update a pci device object by asking the kernel for the latest information.
- *
- * This function is private to EAL.
+ * Populate MSL, each segment is one page long.
*
+ * @param msl
+ * Initialized memory segment list with page size defined.
* @param addr
- * The PCI Bus-Device-Function address to look for
- * @return
- * - 0 on success.
- * - negative on error.
+ * Starting address of list segments.
+ * @param n_segs
+ * Number of segments to populate.
*/
-int pci_update_device(const struct rte_pci_addr *addr);
+void
+eal_memseg_list_populate(struct rte_memseg_list *msl, void *addr, int n_segs);
/**
- * Unbind kernel driver for this device
- *
- * This function is private to EAL.
+ * Get cpu core_id.
*
- * @return
- * 0 on success, negative on error
+ * This function is private to the EAL.
*/
-int pci_unbind_kernel_driver(struct rte_pci_device *dev);
+unsigned eal_cpu_core_id(unsigned lcore_id);
/**
- * Map the PCI resource of a PCI device in virtual memory
+ * Check if cpu is present.
*
- * This function is private to EAL.
+ * This function is private to the EAL.
+ */
+int eal_cpu_detected(unsigned lcore_id);
+
+/**
+ * Set TSC frequency from precise value or estimation
*
- * @return
- * 0 on success, negative on error
+ * This function is private to the EAL.
*/
-int pci_uio_map_resource(struct rte_pci_device *dev);
+void set_tsc_freq(void);
/**
- * Unmap the PCI resource of a PCI device
+ * Get precise TSC frequency from system
*
- * This function is private to EAL.
+ * This function is private to the EAL.
*/
-void pci_uio_unmap_resource(struct rte_pci_device *dev);
+uint64_t get_tsc_freq(void);
/**
- * Allocate uio resource for PCI device
+ * Get TSC frequency if the architecture supports it.
*
- * This function is private to EAL.
+ * This function is private to the EAL.
*
- * @param dev
- * PCI device to allocate uio resource
- * @param uio_res
- * Pointer to uio resource.
- * If the function returns 0, the pointer will be filled.
* @return
- * 0 on success, negative on error
+ * The number of TSC cycles in one second.
+ * Returns zero if the architecture support is not available.
*/
-int pci_uio_alloc_resource(struct rte_pci_device *dev,
- struct mapped_pci_resource **uio_res);
+uint64_t get_tsc_freq_arch(void);
/**
- * Free uio resource for PCI device
+ * Prepare physical memory mapping
+ * i.e. hugepages on Linux and
+ * contigmem on BSD.
*
- * This function is private to EAL.
+ * This function is private to the EAL.
+ */
+int rte_eal_hugepage_init(void);
+
+/**
+ * Creates memory mapping in secondary process
+ * i.e. hugepages on Linux and
+ * contigmem on BSD.
*
- * @param dev
- * PCI device to free uio resource
- * @param uio_res
- * Pointer to uio resource.
+ * This function is private to the EAL.
*/
-void pci_uio_free_resource(struct rte_pci_device *dev,
- struct mapped_pci_resource *uio_res);
+int rte_eal_hugepage_attach(void);
/**
- * Map device memory to uio resource
+ * Find a bus capable of identifying a device.
*
- * This function is private to EAL.
+ * @param str
+ * A device identifier (PCI address, virtual PMD name, ...).
*
- * @param dev
- * PCI device that has memory information.
- * @param res_idx
- * Memory resource index of the PCI device.
- * @param uio_res
- * uio resource that will keep mapping information.
- * @param map_idx
- * Mapping information index of the uio resource.
* @return
- * 0 on success, negative on error
+ * A valid bus handle if found.
+ * NULL if no bus is able to parse this device.
*/
-int pci_uio_map_resource_by_index(struct rte_pci_device *dev, int res_idx,
- struct mapped_pci_resource *uio_res, int map_idx);
+struct rte_bus *rte_bus_find_by_device_name(const char *str);
/**
- * Init tail queues for non-EAL library structures. This is to allow
- * the rings, mempools, etc. lists to be shared among multiple processes
- *
- * This function is private to EAL
+ * Create the unix channel for primary/secondary communication.
*
* @return
- * 0 on success, negative on error
+ * 0 on success;
+ * (<0) on failure.
*/
-int rte_eal_tailqs_init(void);
+int rte_mp_channel_init(void);
/**
- * Init interrupt handling.
+ * Primary/secondary communication cleanup.
+ */
+void rte_mp_channel_cleanup(void);
+
+/**
+ * @internal
+ * Parse a device string and store its information in an
+ * rte_devargs structure.
*
- * This function is private to EAL.
+ * A device description is split by layers of abstraction of the device:
+ * bus, class and driver. Each layer will offer a set of properties that
+ * can be applied either to configure or recognize a device.
+ *
+ * This function will parse those properties and prepare the rte_devargs
+ * to be given to each layer for processing.
+ *
+ * Note: if the "data" field of the devargs points to devstr,
+ * then no dynamic allocation is performed and the rte_devargs
+ * can be safely discarded.
+ *
+ * Otherwise ``data`` will hold a workable copy of devstr, that will be
+ * used by layers descriptors within rte_devargs. In this case,
+ * any rte_devargs should be cleaned-up before being freed.
+ *
+ * @param devargs
+ * rte_devargs structure to fill.
+ *
+ * @param devstr
+ * Device string.
*
* @return
- * 0 on success, negative on error
+ * 0 on success.
+ * Negative errno values on error (rte_errno is set).
*/
-int rte_eal_intr_init(void);
+int
+rte_devargs_layers_parse(struct rte_devargs *devargs,
+ const char *devstr);
-/**
- * Init alarm mechanism. This is to allow a callback be called after
- * specific time.
- *
- * This function is private to EAL.
+/**
+ * Probe a device in the local process.
*
+ * @param devargs
+ * Device arguments including bus, class and driver properties.
+ * @param new_dev
+ * Output: the newly probed device.
* @return
- * 0 on success, negative on error
+ * 0 on success, negative on error.
*/
-int rte_eal_alarm_init(void);
+int local_dev_probe(const char *devargs, struct rte_device **new_dev);
/**
- * Function is to check if the kernel module(like, vfio, vfio_iommu_type1,
- * etc.) loaded.
- *
- * @param module_name
- * The module's name which need to be checked
+ * Hotplug remove a given device from a specific bus at local process.
*
+ * @param dev
+ * Data structure of the device to remove.
* @return
- * -1 means some error happens(NULL pointer or open failure)
- * 0 means the module not loaded
- * 1 means the module loaded
+ * 0 on success, negative on error.
*/
-int rte_eal_check_module(const char *module_name);
+int local_dev_remove(struct rte_device *dev);
/**
- * Get cpu core_id.
+ * Iterate over all buses to find the corresponding bus to handle the sigbus
+ * error.
+ * @param failure_addr
+ * Pointer of the fault address of the sigbus error.
*
- * This function is private to the EAL.
+ * @return
+ * 0 if the sigbus was handled successfully.
+ * -1 if handling the sigbus failed.
+ * 1 if no bus can handle the sigbus.
*/
-unsigned eal_cpu_core_id(unsigned lcore_id);
+int rte_bus_sigbus_handler(const void *failure_addr);
/**
- * Check if cpu is present.
+ * @internal
+ * Register the sigbus handler.
*
- * This function is private to the EAL.
+ * @return
+ * - On success, zero.
+ * - On failure, a negative value.
*/
-int eal_cpu_detected(unsigned lcore_id);
+int
+dev_sigbus_handler_register(void);
/**
- * Set TSC frequency from precise value or estimation
+ * @internal
+ * Unregister the sigbus handler.
*
- * This function is private to the EAL.
+ * @return
+ * - On success, zero.
+ * - On failure, a negative value.
*/
-void set_tsc_freq(void);
+int
+dev_sigbus_handler_unregister(void);
/**
- * Get precise TSC frequency from system
+ * Get OS-specific EAL mapping base address.
+ */
+uint64_t
+eal_get_baseaddr(void);
+
+void *
+eal_malloc_no_trace(const char *type, size_t size, unsigned int align);
+
+void eal_free_no_trace(void *addr);
+
+/** Options for eal_file_open(). */
+enum eal_open_flags {
+ /**
+ * Open file for reading.
+ * The value is 0, so this is not a testable bit:
+ * (flags & EAL_OPEN_READONLY) is always 0.
+ */
+ EAL_OPEN_READONLY = 0x00,
+ /** Open file for reading and writing. */
+ EAL_OPEN_READWRITE = 0x02,
+ /**
+ * Create the file if it doesn't exist.
+ * New files are only accessible to the owner (0600 equivalent).
+ */
+ EAL_OPEN_CREATE = 0x04
+};
+
+/**
+ * Open or create a file.
*
- * This function is private to the EAL.
+ * @param path
+ * Path to the file.
+ * @param flags
+ * A combination of eal_open_flags controlling operation and FD behavior.
+ * @return
+ * Open file descriptor on success, (-1) on failure and rte_errno is set.
*/
-uint64_t get_tsc_freq(void);
+int
+eal_file_open(const char *path, int flags);
+
+/** File locking operation. */
+enum eal_flock_op {
+ EAL_FLOCK_SHARED, /**< Acquire a shared lock. */
+ EAL_FLOCK_EXCLUSIVE, /**< Acquire an exclusive lock. */
+ EAL_FLOCK_UNLOCK /**< Release a previously taken lock. */
+};
+
+/** Behavior on file locking conflict. */
+enum eal_flock_mode {
+ EAL_FLOCK_WAIT, /**< Wait until the file gets unlocked to lock it. */
+ EAL_FLOCK_RETURN /**< Return immediately if the file is locked. */
+};
/**
- * Get TSC frequency if the architecture supports.
+ * Lock or unlock the file.
*
- * This function is private to the EAL.
+ * On failure @code rte_errno @endcode is set to the error code
+ * specified by POSIX flock(3) description.
*
+ * @param fd
+ * Opened file descriptor.
+ * @param op
+ * Operation to perform.
+ * @param mode
+ * Behavior on conflict.
* @return
- * The number of TSC cycles in one second.
- * Returns zero if the architecture support is not available.
+ * 0 on success, (-1) on failure.
*/
-uint64_t get_tsc_freq_arch(void);
+int
+eal_file_lock(int fd, enum eal_flock_op op, enum eal_flock_mode mode);
/**
- * Prepare physical memory mapping
- * i.e. hugepages on Linux and
- * contigmem on BSD.
+ * Truncate or extend the file to the specified size.
*
- * This function is private to the EAL.
+ * On failure @code rte_errno @endcode is set to the error code
+ * specified by POSIX ftruncate(3) description.
+ *
+ * @param fd
+ * Opened file descriptor.
+ * @param size
+ * Desired file size.
+ * @return
+ * 0 on success, (-1) on failure.
*/
-int rte_eal_hugepage_init(void);
+int
+eal_file_truncate(int fd, ssize_t size);
/**
- * Creates memory mapping in secondary process
- * i.e. hugepages on Linux and
- * contigmem on BSD.
+ * Reserve a region of virtual memory.
*
- * This function is private to the EAL.
+ * Use eal_mem_free() to free reserved memory.
+ *
+ * @param requested_addr
+ * A desired reservation address which must be page-aligned.
+ * The system might not respect it.
+ * NULL means the address will be chosen by the system.
+ * @param size
+ * Reservation size. Must be a multiple of system page size.
+ * @param flags
+ * Reservation options, a combination of eal_mem_reserve_flags.
+ * @return
+ * Starting address of the reserved area on success, NULL on failure.
+ * Callers must not access this memory until remapping it.
*/
-int rte_eal_hugepage_attach(void);
+void *
+eal_mem_reserve(void *requested_addr, size_t size, int flags);
/**
- * Find a bus capable of identifying a device.
+ * Free memory obtained by eal_mem_reserve() or eal_mem_alloc().
*
- * @param str
- * A device identifier (PCI address, virtual PMD name, ...).
+ * If *virt* and *size* describe a part of the reserved region,
+ * only this part of the region is freed (accurately up to the system
+ * page size). If *virt* points to allocated memory, *size* must match
+ * the one specified on allocation. The behavior is undefined
+ * if the memory pointed by *virt* is obtained from another source
+ * than listed above.
*
+ * @param virt
+ * A virtual address in a region previously reserved.
+ * @param size
+ * Number of bytes to unreserve.
+ */
+void
+eal_mem_free(void *virt, size_t size);
+
+/**
+ * Configure memory region inclusion into dumps.
+ *
+ * @param virt
+ * Starting address of the region.
+ * @param size
+ * Size of the region.
+ * @param dump
+ * True to include memory into dumps, false to exclude.
* @return
- * A valid bus handle if found.
- * NULL if no bus is able to parse this device.
+ * 0 on success, (-1) on failure and rte_errno is set.
*/
-struct rte_bus *rte_bus_find_by_device_name(const char *str);
+int
+eal_mem_set_dump(void *virt, size_t size, bool dump);
#endif /* _EAL_PRIVATE_H_ */