eal/bsd: rename bsdapp to freebsd
[dpdk.git] / lib / librte_eal / linuxapp / eal / eal.c
index e59ac65..13f4016 100644 (file)
@@ -13,7 +13,9 @@
 #include <syslog.h>
 #include <getopt.h>
 #include <sys/file.h>
+#include <dirent.h>
 #include <fcntl.h>
+#include <fnmatch.h>
 #include <stddef.h>
 #include <errno.h>
 #include <limits.h>
@@ -48,6 +50,7 @@
 #include <rte_atomic.h>
 #include <malloc_heap.h>
 #include <rte_vfio.h>
+#include <rte_option.h>
 
 #include "eal_private.h"
 #include "eal_thread.h"
@@ -122,7 +125,7 @@ eal_create_runtime_dir(void)
 
        /* create prefix-specific subdirectory under DPDK runtime dir */
        ret = snprintf(runtime_dir, sizeof(runtime_dir), "%s/%s",
-                       tmp, internal_config.hugefile_prefix);
+                       tmp, eal_get_hugefile_prefix());
        if (ret < 0 || ret == sizeof(runtime_dir)) {
                RTE_LOG(ERR, EAL, "Error creating prefix-specific runtime path name\n");
                return -1;
@@ -148,8 +151,93 @@ eal_create_runtime_dir(void)
        return 0;
 }
 
+/*
+ * Remove stale files from the runtime directory: an entry matching one of
+ * the filters below is unlinked when an exclusive non-blocking flock() on it
+ * succeeds. The directory itself stays locked for the duration of the scan.
+ * Returns 0 on success, -1 if the directory cannot be opened, locked or read.
+ */
+int
+eal_clean_runtime_dir(void)
+{
+       DIR *dir;
+       struct dirent *dirent;
+       int dir_fd, fd, err;
+       static const char * const filters[] = {
+               "fbarray_*",
+               "mp_socket_*"
+       };
+
+       /* open directory */
+       dir = opendir(runtime_dir);
+       if (!dir) {
+               err = errno; /* save before logging can overwrite it */
+               RTE_LOG(ERR, EAL, "Unable to open runtime directory %s\n",
+                               runtime_dir);
+               goto error;
+       }
+       dir_fd = dirfd(dir);
+
+       /* lock the directory before doing anything, to avoid races */
+       if (flock(dir_fd, LOCK_EX) < 0) {
+               err = errno;
+               RTE_LOG(ERR, EAL, "Unable to lock runtime directory %s\n",
+                       runtime_dir);
+               goto error;
+       }
+
+       errno = 0; /* so a NULL below never reports a stale error code */
+       dirent = readdir(dir);
+       if (!dirent) {
+               err = errno;
+               RTE_LOG(ERR, EAL, "Unable to read runtime directory %s\n",
+                               runtime_dir);
+               goto error;
+       }
+
+       /* every path through the body ends by advancing to the next entry */
+       for (; dirent != NULL; dirent = readdir(dir)) {
+               unsigned int f_idx;
+               bool skip = true;
+
+               /* skip files that don't match the patterns */
+               for (f_idx = 0; f_idx < RTE_DIM(filters); f_idx++) {
+                       if (fnmatch(filters[f_idx], dirent->d_name, 0) == 0) {
+                               skip = false;
+                               break;
+                       }
+               }
+               if (skip)
+                       continue;
+
+               /* try and lock the file; skip it if it cannot be opened */
+               fd = openat(dir_fd, dirent->d_name, O_RDONLY);
+               if (fd == -1)
+                       continue;
+
+               /* non-blocking lock: if it can be taken, remove the file */
+               if (flock(fd, LOCK_EX | LOCK_NB) != -1)
+                       unlinkat(dir_fd, dirent->d_name, 0);
+               close(fd);
+       }
+
+       /* closedir closes dir_fd and drops the lock */
+       closedir(dir);
+       return 0;
+
+error:
+       /* dir is NULL only when opendir() itself failed */
+       if (dir)
+               closedir(dir);
+
+       RTE_LOG(ERR, EAL, "Error while clearing runtime dir: %s\n",
+               strerror(err));
+
+       return -1;
+}
+
 const char *
-eal_get_runtime_dir(void)
+rte_eal_get_runtime_dir(void)
 {
        return runtime_dir;
 }
@@ -263,6 +351,8 @@ rte_eal_config_create(void)
         * processes could later map the config into this exact location */
        rte_config.mem_config->mem_cfg_addr = (uintptr_t) rte_mem_cfg_addr;
 
+       rte_config.mem_config->dma_maskbits = 0;
+
 }
 
 /* attach to an existing shared memory config */
@@ -352,6 +442,24 @@ eal_proc_type_detect(void)
        return ptype;
 }
 
+/* store internal_config's legacy_mem/single_file_segments in shared config */
+static void
+eal_update_mem_config(void)
+{
+       struct rte_mem_config *dst = rte_eal_get_configuration()->mem_config;
+       dst->single_file_segments = internal_config.single_file_segments;
+       dst->legacy_mem = internal_config.legacy_mem;
+}
+
+/* load legacy_mem/single_file_segments from shared config to internal_config */
+static void
+eal_update_internal_config(void)
+{
+       struct rte_mem_config *src = rte_eal_get_configuration()->mem_config;
+       internal_config.single_file_segments = src->single_file_segments;
+       internal_config.legacy_mem = src->legacy_mem;
+}
+
 /* Sets up rte_config structure with the pointer to shared memory config.*/
 static void
 rte_config_init(void)
@@ -361,11 +469,13 @@ rte_config_init(void)
        switch (rte_config.process_type){
        case RTE_PROC_PRIMARY:
                rte_eal_config_create();
+               eal_update_mem_config();
                break;
        case RTE_PROC_SECONDARY:
                rte_eal_config_attach();
                rte_eal_mcfg_wait_complete(rte_config.mem_config);
                rte_eal_config_reattach();
+               eal_update_internal_config();
                break;
        case RTE_PROC_AUTO:
        case RTE_PROC_INVALID:
@@ -408,6 +518,7 @@ eal_usage(const char *prgname)
               "  --"OPT_VFIO_INTR"         Interrupt mode for VFIO (legacy|msi|msix)\n"
               "  --"OPT_LEGACY_MEM"        Legacy memory mode (no dynamic allocation, contiguous segments)\n"
               "  --"OPT_SINGLE_FILE_SEGMENTS" Put all hugepage memory in single files\n"
+              "  --"OPT_MATCH_ALLOCATIONS" Free hugepages exactly as allocated\n"
               "\n");
        /* Allow the application to print its usage message too if hook is set */
        if ( rte_application_usage_hook ) {
@@ -471,10 +582,6 @@ eal_parse_socket_arg(char *strval, volatile uint64_t *socket_arg)
                socket_arg[i] = val;
        }
 
-       /* check if we have a positive amount of total memory */
-       if (total_mem == 0)
-               return -1;
-
        return 0;
 }
 
@@ -580,12 +687,20 @@ eal_parse_args(int argc, char **argv)
 
        argvopt = argv;
        optind = 1;
+       opterr = 0;
 
        while ((opt = getopt_long(argc, argvopt, eal_short_options,
                                  eal_long_options, &option_index)) != EOF) {
 
-               /* getopt is not happy, stop right now */
+               /*
+                * getopt didn't recognise the option, let's parse the
+                * registered options to see if the flag is valid
+                */
                if (opt == '?') {
+                       ret = rte_option_parse(argv[optind-1]);
+                       if (ret == 0)
+                               continue;
+
                        eal_usage(prgname);
                        ret = -1;
                        goto out;
@@ -608,13 +723,31 @@ eal_parse_args(int argc, char **argv)
                        exit(EXIT_SUCCESS);
 
                case OPT_HUGE_DIR_NUM:
-                       internal_config.hugepage_dir = strdup(optarg);
+               {
+                       char *hdir = strdup(optarg);
+                       if (hdir == NULL)
+                               RTE_LOG(ERR, EAL, "Could not store hugepage directory\n");
+                       else {
+                               /* free old hugepage dir */
+                               if (internal_config.hugepage_dir != NULL)
+                                       free(internal_config.hugepage_dir);
+                               internal_config.hugepage_dir = hdir;
+                       }
                        break;
-
+               }
                case OPT_FILE_PREFIX_NUM:
-                       internal_config.hugefile_prefix = strdup(optarg);
+               {
+                       char *prefix = strdup(optarg);
+                       if (prefix == NULL)
+                               RTE_LOG(ERR, EAL, "Could not store file prefix\n");
+                       else {
+                               /* free old prefix */
+                               if (internal_config.hugefile_prefix != NULL)
+                                       free(internal_config.hugefile_prefix);
+                               internal_config.hugefile_prefix = prefix;
+                       }
                        break;
-
+               }
                case OPT_SOCKET_MEM_NUM:
                        if (eal_parse_socket_arg(optarg,
                                        internal_config.socket_mem) < 0) {
@@ -664,8 +797,23 @@ eal_parse_args(int argc, char **argv)
                        break;
 
                case OPT_MBUF_POOL_OPS_NAME_NUM:
-                       internal_config.user_mbuf_pool_ops_name =
-                           strdup(optarg);
+               {
+                       char *ops_name = strdup(optarg);
+                       if (ops_name == NULL)
+                               RTE_LOG(ERR, EAL, "Could not store mbuf pool ops name\n");
+                       else {
+                               /* free old ops name */
+                               if (internal_config.user_mbuf_pool_ops_name !=
+                                               NULL)
+                                       free(internal_config.user_mbuf_pool_ops_name);
+
+                               internal_config.user_mbuf_pool_ops_name =
+                                               ops_name;
+                       }
+                       break;
+               }
+               case OPT_MATCH_ALLOCATIONS_NUM:
+                       internal_config.match_allocations = 1;
                        break;
 
                default:
@@ -725,6 +873,9 @@ check_socket(const struct rte_memseg_list *msl, void *arg)
 {
        int *socket_id = arg;
 
+       if (msl->external)
+               return 0;
+
        return *socket_id == msl->socket_id;
 }
 
@@ -793,7 +944,8 @@ rte_eal_init(int argc, char **argv)
        int i, fctret, ret;
        pthread_t thread_id;
        static rte_atomic32_t run_once = RTE_ATOMIC32_INIT(0);
-       const char *logid;
+       const char *p;
+       static char logid[PATH_MAX];
        char cpuset[RTE_CPU_AFFINITY_STR_LEN];
        char thread_name[RTE_MAX_THREAD_NAME_LEN];
 
@@ -810,9 +962,8 @@ rte_eal_init(int argc, char **argv)
                return -1;
        }
 
-       logid = strrchr(argv[0], '/');
-       logid = strdup(logid ? logid + 1: argv[0]);
-
+       p = strrchr(argv[0], '/');
+       strlcpy(logid, p ? p + 1 : argv[0], sizeof(logid));
        thread_id = pthread_self();
 
        eal_reset_internal_config(&internal_config);
@@ -835,7 +986,7 @@ rte_eal_init(int argc, char **argv)
        }
 
        if (eal_plugins_init() < 0) {
-               rte_eal_init_alert("Cannot init plugins\n");
+               rte_eal_init_alert("Cannot init plugins");
                rte_errno = EINVAL;
                rte_atomic32_clear(&run_once);
                return -1;
@@ -850,7 +1001,7 @@ rte_eal_init(int argc, char **argv)
        rte_config_init();
 
        if (rte_eal_intr_init() < 0) {
-               rte_eal_init_alert("Cannot init interrupt-handling thread\n");
+               rte_eal_init_alert("Cannot init interrupt-handling thread");
                return -1;
        }
 
@@ -858,30 +1009,43 @@ rte_eal_init(int argc, char **argv)
         * bus through mp channel in the secondary process before the bus scan.
         */
        if (rte_mp_channel_init() < 0) {
-               rte_eal_init_alert("failed to init mp channel\n");
+               rte_eal_init_alert("failed to init mp channel");
                if (rte_eal_process_type() == RTE_PROC_PRIMARY) {
                        rte_errno = EFAULT;
                        return -1;
                }
        }
 
+       /* register multi-process action callbacks for hotplug */
+       if (rte_mp_dev_hotplug_init() < 0) {
+               rte_eal_init_alert("failed to register mp callback for hotplug");
+               return -1;
+       }
+
        if (rte_bus_scan()) {
-               rte_eal_init_alert("Cannot scan the buses for devices\n");
+               rte_eal_init_alert("Cannot scan the buses for devices");
                rte_errno = ENODEV;
                rte_atomic32_clear(&run_once);
                return -1;
        }
 
-       /* autodetect the iova mapping mode (default is iova_pa) */
-       rte_eal_get_configuration()->iova_mode = rte_bus_get_iommu_class();
-
-       /* Workaround for KNI which requires physical address to work */
-       if (rte_eal_get_configuration()->iova_mode == RTE_IOVA_VA &&
-                       rte_eal_check_module("rte_kni") == 1) {
-               rte_eal_get_configuration()->iova_mode = RTE_IOVA_PA;
-               RTE_LOG(WARNING, EAL,
-                       "Some devices want IOVA as VA but PA will be used because.. "
-                       "KNI module inserted\n");
+       /* if no EAL option "--iova-mode=<pa|va>", use bus IOVA scheme */
+       if (internal_config.iova_mode == RTE_IOVA_DC) {
+               /* autodetect the IOVA mapping mode (default is RTE_IOVA_PA) */
+               rte_eal_get_configuration()->iova_mode =
+                       rte_bus_get_iommu_class();
+
+               /* Workaround for KNI which requires physical address to work */
+               if (rte_eal_get_configuration()->iova_mode == RTE_IOVA_VA &&
+                               rte_eal_check_module("rte_kni") == 1) {
+                       rte_eal_get_configuration()->iova_mode = RTE_IOVA_PA;
+                       RTE_LOG(WARNING, EAL,
+                               "Some devices want IOVA as VA but PA will be used because.. "
+                               "KNI module inserted\n");
+               }
+       } else {
+               rte_eal_get_configuration()->iova_mode =
+                       internal_config.iova_mode;
        }
 
        if (internal_config.no_hugetlbfs == 0) {
@@ -924,7 +1088,7 @@ rte_eal_init(int argc, char **argv)
 
 #ifdef VFIO_PRESENT
        if (rte_eal_vfio_setup() < 0) {
-               rte_eal_init_alert("Cannot init VFIO\n");
+               rte_eal_init_alert("Cannot init VFIO");
                rte_errno = EAGAIN;
                rte_atomic32_clear(&run_once);
                return -1;
@@ -935,13 +1099,13 @@ rte_eal_init(int argc, char **argv)
         * initialize memzones first.
         */
        if (rte_eal_memzone_init() < 0) {
-               rte_eal_init_alert("Cannot init memzone\n");
+               rte_eal_init_alert("Cannot init memzone");
                rte_errno = ENODEV;
                return -1;
        }
 
        if (rte_eal_memory_init() < 0) {
-               rte_eal_init_alert("Cannot init memory\n");
+               rte_eal_init_alert("Cannot init memory");
                rte_errno = ENOMEM;
                return -1;
        }
@@ -950,25 +1114,25 @@ rte_eal_init(int argc, char **argv)
        eal_hugedirs_unlock();
 
        if (rte_eal_malloc_heap_init() < 0) {
-               rte_eal_init_alert("Cannot init malloc heap\n");
+               rte_eal_init_alert("Cannot init malloc heap");
                rte_errno = ENODEV;
                return -1;
        }
 
        if (rte_eal_tailqs_init() < 0) {
-               rte_eal_init_alert("Cannot init tail queues for objects\n");
+               rte_eal_init_alert("Cannot init tail queues for objects");
                rte_errno = EFAULT;
                return -1;
        }
 
        if (rte_eal_alarm_init() < 0) {
-               rte_eal_init_alert("Cannot init interrupt-handling thread\n");
+               rte_eal_init_alert("Cannot init interrupt-handling thread");
                /* rte_eal_alarm_init sets rte_errno on failure. */
                return -1;
        }
 
        if (rte_eal_timer_init() < 0) {
-               rte_eal_init_alert("Cannot init HPET or TSC timers\n");
+               rte_eal_init_alert("Cannot init HPET or TSC timers");
                rte_errno = ENOTSUP;
                return -1;
        }
@@ -979,8 +1143,8 @@ rte_eal_init(int argc, char **argv)
 
        ret = eal_thread_dump_affinity(cpuset, sizeof(cpuset));
 
-       RTE_LOG(DEBUG, EAL, "Master lcore %u is ready (tid=%x;cpuset=[%s%s])\n",
-               rte_config.master_lcore, (int)thread_id, cpuset,
+       RTE_LOG(DEBUG, EAL, "Master lcore %u is ready (tid=%zx;cpuset=[%s%s])\n",
+               rte_config.master_lcore, (uintptr_t)thread_id, cpuset,
                ret == 0 ? "" : "...");
 
        RTE_LCORE_FOREACH_SLAVE(i) {
@@ -1022,14 +1186,14 @@ rte_eal_init(int argc, char **argv)
        /* initialize services so vdevs register service during bus_probe. */
        ret = rte_service_init();
        if (ret) {
-               rte_eal_init_alert("rte_service_init() failed\n");
+               rte_eal_init_alert("rte_service_init() failed");
                rte_errno = ENOEXEC;
                return -1;
        }
 
        /* Probe all the buses and devices/drivers on them */
        if (rte_bus_probe()) {
-               rte_eal_init_alert("Cannot probe devices\n");
+               rte_eal_init_alert("Cannot probe devices");
                rte_errno = ENOTSUP;
                return -1;
        }
@@ -1049,8 +1213,26 @@ rte_eal_init(int argc, char **argv)
                return -1;
        }
 
+       /*
+        * Clean up unused files in runtime directory. We do this at the end of
+        * init and not at the beginning because we want to clean stuff up
+        * whether we are primary or secondary process, but we cannot remove
+        * primary process' files because secondary should be able to run even
+        * if primary process is dead.
+        *
+        * In no_shconf mode, no runtime directory is created in the first
+        * place, so no cleanup needed.
+        */
+       if (!internal_config.no_shconf && eal_clean_runtime_dir() < 0) {
+               rte_eal_init_alert("Cannot clear runtime directory");
+               return -1;
+       }
+
        rte_eal_mcfg_complete();
 
+       /* Call each registered callback, if enabled */
+       rte_option_init();
+
        return fctret;
 }
 
@@ -1059,7 +1241,12 @@ mark_freeable(const struct rte_memseg_list *msl, const struct rte_memseg *ms,
                void *arg __rte_unused)
 {
        /* ms is const, so find this memseg */
-       struct rte_memseg *found = rte_mem_virt2memseg(ms->addr, msl);
+       struct rte_memseg *found;
+
+       if (msl->external)
+               return 0;
+
+       found = rte_mem_virt2memseg(ms->addr, msl);
 
        found->flags &= ~RTE_MEMSEG_FLAG_DO_NOT_FREE;
 
@@ -1075,6 +1262,8 @@ rte_eal_cleanup(void)
        if (rte_eal_process_type() == RTE_PROC_PRIMARY)
                rte_memseg_walk(mark_freeable, NULL);
        rte_service_finalize();
+       rte_mp_channel_cleanup();
+       eal_cleanup_config(&internal_config);
        return 0;
 }