drivers: remove direct access to interrupt handle
[dpdk.git] / drivers / raw / ifpga / ifpga_rawdev.c
index fef89e6..8d9db58 100644 (file)
@@ -8,9 +8,10 @@
 #include <unistd.h>
 #include <sys/types.h>
 #include <fcntl.h>
+#include <sys/ioctl.h>
+#include <sys/epoll.h>
 #include <rte_log.h>
 #include <rte_bus.h>
-#include <rte_eal_memconfig.h>
 #include <rte_malloc.h>
 #include <rte_devargs.h>
 #include <rte_memcpy.h>
@@ -18,7 +19,7 @@
 #include <rte_bus_pci.h>
 #include <rte_kvargs.h>
 #include <rte_alarm.h>
-
+#include <rte_interrupts.h>
 #include <rte_errno.h>
 #include <rte_per_lcore.h>
 #include <rte_memory.h>
 #include <rte_eal.h>
 #include <rte_common.h>
 #include <rte_bus_vdev.h>
+#include <rte_string_fns.h>
+#include <rte_pmd_i40e.h>
 
 #include "base/opae_hw_api.h"
+#include "base/opae_ifpga_hw_api.h"
+#include "base/ifpga_api.h"
 #include "rte_rawdev.h"
 #include "rte_rawdev_pmd.h"
 #include "rte_bus_ifpga.h"
@@ -36,8 +41,6 @@
 #include "ifpga_rawdev.h"
 #include "ipn3ke_rawdev_api.h"
 
-int ifpga_rawdev_logtype;
-
 #define PCI_VENDOR_ID_INTEL          0x8086
 /* PCI Device ID */
 #define PCIE_DEVICE_ID_PF_INT_5_X    0xBCBD
@@ -63,6 +66,501 @@ static const struct rte_pci_id pci_ifpga_map[] = {
        { .vendor_id = 0, /* sentinel */ },
 };
 
+static struct ifpga_rawdev ifpga_rawdevices[IFPGA_RAWDEV_NUM];
+
+static int ifpga_monitor_start;
+static pthread_t ifpga_monitor_start_thread;
+
+#define IFPGA_MAX_IRQ 12
+/* 0 for FME interrupt, others are reserved for AFU irq */
+static struct rte_intr_handle *ifpga_irq_handle[IFPGA_MAX_IRQ];
+
+static struct ifpga_rawdev *
+ifpga_rawdev_allocate(struct rte_rawdev *rawdev);
+static int set_surprise_link_check_aer(
+               struct ifpga_rawdev *ifpga_rdev, int force_disable);
+static int ifpga_pci_find_next_ext_capability(unsigned int fd,
+                                             int start, uint32_t cap);
+static int ifpga_pci_find_ext_capability(unsigned int fd, uint32_t cap);
+
+struct ifpga_rawdev *
+ifpga_rawdev_get(const struct rte_rawdev *rawdev)
+{
+       struct ifpga_rawdev *dev;
+       unsigned int i;
+
+       if (rawdev == NULL)
+               return NULL;
+
+       for (i = 0; i < IFPGA_RAWDEV_NUM; i++) {
+               dev = &ifpga_rawdevices[i];
+               if (dev->rawdev == rawdev)
+                       return dev;
+       }
+
+       return NULL;
+}
+
+static inline uint8_t
+ifpga_rawdev_find_free_device_index(void)
+{
+       uint16_t dev_id;
+
+       for (dev_id = 0; dev_id < IFPGA_RAWDEV_NUM; dev_id++) {
+               if (ifpga_rawdevices[dev_id].rawdev == NULL)
+                       return dev_id;
+       }
+
+       return IFPGA_RAWDEV_NUM;
+}
+static struct ifpga_rawdev *
+ifpga_rawdev_allocate(struct rte_rawdev *rawdev)
+{
+       struct ifpga_rawdev *dev;
+       uint16_t dev_id;
+
+       dev = ifpga_rawdev_get(rawdev);
+       if (dev != NULL) {
+               IFPGA_RAWDEV_PMD_ERR("Event device already allocated!");
+               return NULL;
+       }
+
+       dev_id = ifpga_rawdev_find_free_device_index();
+       if (dev_id == IFPGA_RAWDEV_NUM) {
+               IFPGA_RAWDEV_PMD_ERR("Reached maximum number of raw devices");
+               return NULL;
+       }
+
+       dev = &ifpga_rawdevices[dev_id];
+       dev->rawdev = rawdev;
+       dev->dev_id = dev_id;
+
+       return dev;
+}
+
+static int
+ifpga_pci_find_next_ext_capability(unsigned int fd, int start, uint32_t cap)
+{
+       uint32_t header;
+       int ttl;
+       int pos = RTE_PCI_CFG_SPACE_SIZE;
+       int ret;
+
+       /* minimum 8 bytes per capability */
+       ttl = (RTE_PCI_CFG_SPACE_EXP_SIZE - RTE_PCI_CFG_SPACE_SIZE) / 8;
+
+       if (start)
+               pos = start;
+       ret = pread(fd, &header, sizeof(header), pos);
+       if (ret == -1)
+               return -1;
+
+       /*
+        * If we have no capabilities, this is indicated by cap ID,
+        * cap version and next pointer all being 0.
+        */
+       if (header == 0)
+               return 0;
+
+       while (ttl-- > 0) {
+               if (RTE_PCI_EXT_CAP_ID(header) == cap && pos != start)
+                       return pos;
+
+               pos = RTE_PCI_EXT_CAP_NEXT(header);
+               if (pos < RTE_PCI_CFG_SPACE_SIZE)
+                       break;
+               ret = pread(fd, &header, sizeof(header), pos);
+               if (ret == -1)
+                       return -1;
+       }
+
+       return 0;
+}
+
+static int
+ifpga_pci_find_ext_capability(unsigned int fd, uint32_t cap)
+{
+       return ifpga_pci_find_next_ext_capability(fd, 0, cap);
+}
+
+static int ifpga_get_dev_vendor_id(const char *bdf,
+       uint32_t *dev_id, uint32_t *vendor_id)
+{
+       int fd;
+       char path[1024];
+       int ret;
+       uint32_t header;
+
+       strlcpy(path, "/sys/bus/pci/devices/", sizeof(path));
+       strlcat(path, bdf, sizeof(path));
+       strlcat(path, "/config", sizeof(path));
+       fd = open(path, O_RDWR);
+       if (fd < 0)
+               return -1;
+       ret = pread(fd, &header, sizeof(header), 0);
+       if (ret == -1) {
+               close(fd);
+               return -1;
+       }
+       (*vendor_id) = header & 0xffff;
+       (*dev_id) = (header >> 16) & 0xffff;
+       close(fd);
+
+       return 0;
+}
+static int ifpga_rawdev_fill_info(struct ifpga_rawdev *ifpga_dev,
+       const char *bdf)
+{
+       char path[1024] = "/sys/bus/pci/devices/0000:";
+       char link[1024], link1[1024];
+       char dir[1024] = "/sys/devices/";
+       char *c;
+       int ret;
+       char sub_brg_bdf[4][16];
+       int point;
+       DIR *dp = NULL;
+       struct dirent *entry;
+       int i, j;
+
+       unsigned int dom, bus, dev;
+       int func;
+       uint32_t dev_id, vendor_id;
+
+       strlcat(path, bdf, sizeof(path));
+       memset(link, 0, sizeof(link));
+       memset(link1, 0, sizeof(link1));
+       ret = readlink(path, link, (sizeof(link)-1));
+       if ((ret < 0) || ((unsigned int)ret > (sizeof(link)-1)))
+               return -1;
+       link[ret] = 0;   /* terminate string with null character */
+       strlcpy(link1, link, sizeof(link1));
+       memset(ifpga_dev->parent_bdf, 0, 16);
+       point = strlen(link);
+       if (point < 39)
+               return -1;
+       point -= 39;
+       link[point] = 0;
+       if (point < 12)
+               return -1;
+       point -= 12;
+       rte_memcpy(ifpga_dev->parent_bdf, &link[point], 12);
+
+       point = strlen(link1);
+       if (point < 26)
+               return -1;
+       point -= 26;
+       link1[point] = 0;
+       if (point < 12)
+               return -1;
+       point -= 12;
+       c = strchr(link1, 'p');
+       if (!c)
+               return -1;
+       strlcat(dir, c, sizeof(dir));
+
+       /* scan folder */
+       dp = opendir(dir);
+       if (dp == NULL)
+               return -1;
+       i = 0;
+       while ((entry = readdir(dp)) != NULL) {
+               if (i >= 4)
+                       break;
+               if (entry->d_name[0] == '.')
+                       continue;
+               if (strlen(entry->d_name) > 12)
+                       continue;
+               if (sscanf(entry->d_name, "%x:%x:%x.%d",
+                       &dom, &bus, &dev, &func) < 4)
+                       continue;
+               else {
+                       strlcpy(sub_brg_bdf[i],
+                               entry->d_name,
+                               sizeof(sub_brg_bdf[i]));
+                       i++;
+               }
+       }
+       closedir(dp);
+
+       /* get fpga and fvl */
+       j = 0;
+       for (i = 0; i < 4; i++) {
+               strlcpy(link, dir, sizeof(link));
+               strlcat(link, "/", sizeof(link));
+               strlcat(link, sub_brg_bdf[i], sizeof(link));
+               dp = opendir(link);
+               if (dp == NULL)
+                       return -1;
+               while ((entry = readdir(dp)) != NULL) {
+                       if (j >= 8)
+                               break;
+                       if (entry->d_name[0] == '.')
+                               continue;
+
+                       if (strlen(entry->d_name) > 12)
+                               continue;
+                       if (sscanf(entry->d_name, "%x:%x:%x.%d",
+                               &dom, &bus, &dev, &func) < 4)
+                               continue;
+                       else {
+                               if (ifpga_get_dev_vendor_id(entry->d_name,
+                                       &dev_id, &vendor_id))
+                                       continue;
+                               if (vendor_id == 0x8086 &&
+                                       (dev_id == 0x0CF8 ||
+                                       dev_id == 0x0D58 ||
+                                       dev_id == 0x1580)) {
+                                       strlcpy(ifpga_dev->fvl_bdf[j],
+                                               entry->d_name,
+                                               sizeof(ifpga_dev->fvl_bdf[j]));
+                                       j++;
+                               }
+                       }
+               }
+               closedir(dp);
+       }
+
+       return 0;
+}
+
+#define HIGH_FATAL(_sens, value)\
+       (((_sens)->flags & OPAE_SENSOR_HIGH_FATAL_VALID) &&\
+        (value > (_sens)->high_fatal))
+
+#define HIGH_WARN(_sens, value)\
+       (((_sens)->flags & OPAE_SENSOR_HIGH_WARN_VALID) &&\
+        (value > (_sens)->high_warn))
+
+#define LOW_FATAL(_sens, value)\
+       (((_sens)->flags & OPAE_SENSOR_LOW_FATAL_VALID) &&\
+        (value > (_sens)->low_fatal))
+
+#define LOW_WARN(_sens, value)\
+       (((_sens)->flags & OPAE_SENSOR_LOW_WARN_VALID) &&\
+        (value > (_sens)->low_warn))
+
+#define AUX_VOLTAGE_WARN 11400
+
+static int
+ifpga_monitor_sensor(struct rte_rawdev *raw_dev,
+              bool *gsd_start)
+{
+       struct opae_adapter *adapter;
+       struct opae_manager *mgr;
+       struct opae_sensor_info *sensor;
+       unsigned int value;
+       int ret;
+
+       adapter = ifpga_rawdev_get_priv(raw_dev);
+       if (!adapter)
+               return -ENODEV;
+
+       mgr = opae_adapter_get_mgr(adapter);
+       if (!mgr)
+               return -ENODEV;
+
+       opae_mgr_for_each_sensor(mgr, sensor) {
+               if (!(sensor->flags & OPAE_SENSOR_VALID))
+                       goto fail;
+
+               ret = opae_mgr_get_sensor_value(mgr, sensor, &value);
+               if (ret)
+                       goto fail;
+
+               if (value == 0xdeadbeef) {
+                       IFPGA_RAWDEV_PMD_ERR("dev_id %d sensor %s value %x\n",
+                                       raw_dev->dev_id, sensor->name, value);
+                       continue;
+               }
+
+               /* monitor temperature sensors */
+               if (!strcmp(sensor->name, "Board Temperature") ||
+                               !strcmp(sensor->name, "FPGA Die Temperature")) {
+                       IFPGA_RAWDEV_PMD_INFO("read sensor %s %d %d %d\n",
+                                       sensor->name, value, sensor->high_warn,
+                                       sensor->high_fatal);
+
+                       if (HIGH_WARN(sensor, value) ||
+                               LOW_WARN(sensor, value)) {
+                               IFPGA_RAWDEV_PMD_INFO("%s reach theshold %d\n",
+                                       sensor->name, value);
+                               *gsd_start = true;
+                               break;
+                       }
+               }
+
+               /* monitor 12V AUX sensor */
+               if (!strcmp(sensor->name, "12V AUX Voltage")) {
+                       if (value < AUX_VOLTAGE_WARN) {
+                               IFPGA_RAWDEV_PMD_INFO(
+                                       "%s reach theshold %d mV\n",
+                                       sensor->name, value);
+                               *gsd_start = true;
+                               break;
+                       }
+               }
+       }
+
+       return 0;
+fail:
+       return -EFAULT;
+}
+
+static int set_surprise_link_check_aer(
+       struct ifpga_rawdev *ifpga_rdev, int force_disable)
+{
+       struct rte_rawdev *rdev;
+       int fd = -1;
+       char path[1024];
+       int pos;
+       int ret;
+       uint32_t data;
+       bool enable = 0;
+       uint32_t aer_new0, aer_new1;
+
+       if (!ifpga_rdev) {
+               printf("\n device does not exist\n");
+               return -EFAULT;
+       }
+
+       rdev = ifpga_rdev->rawdev;
+       if (ifpga_rdev->aer_enable)
+               return -EFAULT;
+       if (ifpga_monitor_sensor(rdev, &enable))
+               return -EFAULT;
+       if (enable || force_disable) {
+               IFPGA_RAWDEV_PMD_ERR("Set AER, pls graceful shutdown\n");
+               ifpga_rdev->aer_enable = 1;
+               /* get bridge fd */
+               strlcpy(path, "/sys/bus/pci/devices/", sizeof(path));
+               strlcat(path, ifpga_rdev->parent_bdf, sizeof(path));
+               strlcat(path, "/config", sizeof(path));
+               fd = open(path, O_RDWR);
+               if (fd < 0)
+                       goto end;
+               pos = ifpga_pci_find_ext_capability(fd, RTE_PCI_EXT_CAP_ID_ERR);
+               if (!pos)
+                       goto end;
+               /* save previout ECAP_AER+0x08 */
+               ret = pread(fd, &data, sizeof(data), pos+0x08);
+               if (ret == -1)
+                       goto end;
+               ifpga_rdev->aer_old[0] = data;
+               /* save previout ECAP_AER+0x14 */
+               ret = pread(fd, &data, sizeof(data), pos+0x14);
+               if (ret == -1)
+                       goto end;
+               ifpga_rdev->aer_old[1] = data;
+
+               /* set ECAP_AER+0x08 to 0xFFFFFFFF */
+               data = 0xffffffff;
+               ret = pwrite(fd, &data, 4, pos+0x08);
+               if (ret == -1)
+                       goto end;
+               /* set ECAP_AER+0x14 to 0xFFFFFFFF */
+               ret = pwrite(fd, &data, 4, pos+0x14);
+               if (ret == -1)
+                       goto end;
+
+               /* read current ECAP_AER+0x08 */
+               ret = pread(fd, &data, sizeof(data), pos+0x08);
+               if (ret == -1)
+                       goto end;
+               aer_new0 = data;
+               /* read current ECAP_AER+0x14 */
+               ret = pread(fd, &data, sizeof(data), pos+0x14);
+               if (ret == -1)
+                       goto end;
+               aer_new1 = data;
+
+               if (fd != -1)
+                       close(fd);
+
+               printf(">>>>>>Set AER %x,%x %x,%x\n",
+                       ifpga_rdev->aer_old[0], ifpga_rdev->aer_old[1],
+                       aer_new0, aer_new1);
+
+               return 1;
+               }
+
+end:
+       if (fd != -1)
+               close(fd);
+       return -EFAULT;
+}
+
+static void *
+ifpga_rawdev_gsd_handle(__rte_unused void *param)
+{
+       struct ifpga_rawdev *ifpga_rdev;
+       int i;
+       int gsd_enable, ret;
+#define MS 1000
+
+       while (1) {
+               gsd_enable = 0;
+               for (i = 0; i < IFPGA_RAWDEV_NUM; i++) {
+                       ifpga_rdev = &ifpga_rawdevices[i];
+                       if (ifpga_rdev->rawdev) {
+                               ret = set_surprise_link_check_aer(ifpga_rdev,
+                                       gsd_enable);
+                               if (ret == 1 && !gsd_enable) {
+                                       gsd_enable = 1;
+                                       i = -1;
+                               }
+                       }
+               }
+
+               if (gsd_enable)
+                       printf(">>>>>>Pls Shutdown APP\n");
+
+               rte_delay_us(100 * MS);
+       }
+
+       return NULL;
+}
+
+static int
+ifpga_monitor_start_func(void)
+{
+       int ret;
+
+       if (ifpga_monitor_start == 0) {
+               ret = rte_ctrl_thread_create(&ifpga_monitor_start_thread,
+                                            "ifpga-monitor", NULL,
+                                            ifpga_rawdev_gsd_handle, NULL);
+               if (ret != 0) {
+                       IFPGA_RAWDEV_PMD_ERR(
+                               "Fail to create ifpga nonitor thread");
+                       return -1;
+               }
+               ifpga_monitor_start = 1;
+       }
+
+       return 0;
+}
+static int
+ifpga_monitor_stop_func(void)
+{
+       int ret;
+
+       if (ifpga_monitor_start == 1) {
+               ret = pthread_cancel(ifpga_monitor_start_thread);
+               if (ret)
+                       IFPGA_RAWDEV_PMD_ERR("Can't cancel the thread");
+
+               ret = pthread_join(ifpga_monitor_start_thread, NULL);
+               if (ret)
+                       IFPGA_RAWDEV_PMD_ERR("Can't join the thread");
+
+               ifpga_monitor_start = 0;
+
+               return ret;
+       }
+
+       return 0;
+}
+
 static int
 ifpga_fill_afu_dev(struct opae_accelerator *acc,
                struct rte_afu_device *afu_dev)
@@ -101,9 +599,10 @@ ifpga_fill_afu_dev(struct opae_accelerator *acc,
        return 0;
 }
 
-static void
+static int
 ifpga_rawdev_info_get(struct rte_rawdev *dev,
-                                    rte_rawdev_obj_t dev_info)
+                     rte_rawdev_obj_t dev_info,
+                     size_t dev_info_size)
 {
        struct opae_adapter *adapter;
        struct opae_accelerator *acc;
@@ -115,14 +614,14 @@ ifpga_rawdev_info_get(struct rte_rawdev *dev,
 
        IFPGA_RAWDEV_PMD_FUNC_TRACE();
 
-       if (!dev_info) {
+       if (!dev_info || dev_info_size != sizeof(*afu_dev)) {
                IFPGA_RAWDEV_PMD_ERR("Invalid request");
-               return;
+               return -EINVAL;
        }
 
        adapter = ifpga_rawdev_get_priv(dev);
        if (!adapter)
-               return;
+               return -ENOENT;
 
        afu_dev = dev_info;
        afu_dev->rawdev = dev;
@@ -134,7 +633,7 @@ ifpga_rawdev_info_get(struct rte_rawdev *dev,
 
                if (ifpga_fill_afu_dev(acc, afu_dev)) {
                        IFPGA_RAWDEV_PMD_ERR("cannot get info\n");
-                       return;
+                       return -ENOENT;
                }
        }
 
@@ -144,21 +643,21 @@ ifpga_rawdev_info_get(struct rte_rawdev *dev,
                /* get LineSide BAR Index */
                if (opae_manager_get_eth_group_region_info(mgr, 0,
                        &opae_lside_eth_info)) {
-                       return;
+                       return -ENOENT;
                }
                lside_bar_idx = opae_lside_eth_info.mem_idx;
 
                /* get NICSide BAR Index */
                if (opae_manager_get_eth_group_region_info(mgr, 1,
                        &opae_nside_eth_info)) {
-                       return;
+                       return -ENOENT;
                }
                nside_bar_idx = opae_nside_eth_info.mem_idx;
 
                if (lside_bar_idx >= PCI_MAX_RESOURCE ||
                        nside_bar_idx >= PCI_MAX_RESOURCE ||
                        lside_bar_idx == nside_bar_idx)
-                       return;
+                       return -ENOENT;
 
                /* fill LineSide BAR Index */
                afu_dev->mem_resource[lside_bar_idx].phys_addr =
@@ -176,11 +675,13 @@ ifpga_rawdev_info_get(struct rte_rawdev *dev,
                afu_dev->mem_resource[nside_bar_idx].addr =
                        opae_nside_eth_info.addr;
        }
+       return 0;
 }
 
 static int
 ifpga_rawdev_configure(const struct rte_rawdev *dev,
-               rte_rawdev_obj_t config)
+               rte_rawdev_obj_t config,
+               size_t config_size __rte_unused)
 {
        IFPGA_RAWDEV_PMD_FUNC_TRACE();
 
@@ -215,6 +716,16 @@ ifpga_rawdev_stop(struct rte_rawdev *dev)
 static int
 ifpga_rawdev_close(struct rte_rawdev *dev)
 {
+       struct opae_adapter *adapter;
+
+       if (dev) {
+               adapter = ifpga_rawdev_get_priv(dev);
+               if (adapter) {
+                       opae_adapter_destroy(adapter);
+                       opae_adapter_data_free(adapter->data);
+               }
+       }
+
        return dev ? 0:1;
 }
 
@@ -275,7 +786,7 @@ rte_fpga_do_pr(struct rte_rawdev *rawdev, int port_id,
        int file_fd;
        int ret = 0;
        ssize_t buffer_size;
-       void *buffer;
+       void *buffer, *buf_to_free;
        u64 pr_error;
 
        if (!file_name)
@@ -307,6 +818,7 @@ rte_fpga_do_pr(struct rte_rawdev *rawdev, int port_id,
                ret = -ENOMEM;
                goto close_fd;
        }
+       buf_to_free = buffer;
 
        /*read the raw data*/
        if (buffer_size != read(file_fd, (void *)buffer, buffer_size)) {
@@ -324,8 +836,8 @@ rte_fpga_do_pr(struct rte_rawdev *rawdev, int port_id,
        }
 
 free_buffer:
-       if (buffer)
-               rte_free(buffer);
+       if (buf_to_free)
+               rte_free(buf_to_free);
 close_fd:
        close(file_fd);
        file_fd = 0;
@@ -337,6 +849,8 @@ ifpga_rawdev_pr(struct rte_rawdev *dev,
        rte_rawdev_obj_t pr_conf)
 {
        struct opae_adapter *adapter;
+       struct opae_manager *mgr;
+       struct opae_board_info *info;
        struct rte_afu_pr_conf *afu_pr_conf;
        int ret;
        struct uuid uuid;
@@ -363,21 +877,40 @@ ifpga_rawdev_pr(struct rte_rawdev *dev,
                }
        }
 
-       acc = opae_adapter_get_acc(adapter, afu_pr_conf->afu_id.port);
-       if (!acc)
-               return -ENODEV;
+       mgr = opae_adapter_get_mgr(adapter);
+       if (!mgr) {
+               IFPGA_RAWDEV_PMD_ERR("opae_manager of opae_adapter is NULL");
+               return -1;
+       }
 
-       ret = opae_acc_get_uuid(acc, &uuid);
-       if (ret)
-               return ret;
+       if (ifpga_mgr_ops.get_board_info(mgr, &info)) {
+               IFPGA_RAWDEV_PMD_ERR("ifpga manager get_board_info fail!");
+               return -1;
+       }
 
-       memcpy(&afu_pr_conf->afu_id.uuid.uuid_low, uuid.b, sizeof(u64));
-       memcpy(&afu_pr_conf->afu_id.uuid.uuid_high, uuid.b + 8, sizeof(u64));
+       if (info->lightweight) {
+               /* set uuid to all 0, when fpga is lightweight image */
+               memset(&afu_pr_conf->afu_id.uuid.uuid_low, 0, sizeof(u64));
+               memset(&afu_pr_conf->afu_id.uuid.uuid_high, 0, sizeof(u64));
+       } else {
+               acc = opae_adapter_get_acc(adapter, afu_pr_conf->afu_id.port);
+               if (!acc)
+                       return -ENODEV;
+
+               ret = opae_acc_get_uuid(acc, &uuid);
+               if (ret)
+                       return ret;
 
-       IFPGA_RAWDEV_PMD_INFO("%s: uuid_l=0x%lx, uuid_h=0x%lx\n", __func__,
-               (unsigned long)afu_pr_conf->afu_id.uuid.uuid_low,
-               (unsigned long)afu_pr_conf->afu_id.uuid.uuid_high);
+               rte_memcpy(&afu_pr_conf->afu_id.uuid.uuid_low, uuid.b,
+                       sizeof(u64));
+               rte_memcpy(&afu_pr_conf->afu_id.uuid.uuid_high, uuid.b + 8,
+                       sizeof(u64));
 
+               IFPGA_RAWDEV_PMD_INFO("%s: uuid_l=0x%lx, uuid_h=0x%lx\n",
+                       __func__,
+                       (unsigned long)afu_pr_conf->afu_id.uuid.uuid_low,
+                       (unsigned long)afu_pr_conf->afu_id.uuid.uuid_high);
+               }
        return 0;
 }
 
@@ -605,12 +1138,333 @@ static const struct rte_rawdev_ops ifpga_rawdev_ops = {
        .dev_selftest = NULL,
 };
 
+static int
+ifpga_get_fme_error_prop(struct opae_manager *mgr,
+               u64 prop_id, u64 *val)
+{
+       struct feature_prop prop;
+
+       prop.feature_id = IFPGA_FME_FEATURE_ID_GLOBAL_ERR;
+       prop.prop_id = prop_id;
+
+       if (opae_manager_ifpga_get_prop(mgr, &prop))
+               return -EINVAL;
+
+       *val = prop.data;
+
+       return 0;
+}
+
+static int
+ifpga_set_fme_error_prop(struct opae_manager *mgr,
+               u64 prop_id, u64 val)
+{
+       struct feature_prop prop;
+
+       prop.feature_id = IFPGA_FME_FEATURE_ID_GLOBAL_ERR;
+       prop.prop_id = prop_id;
+
+       prop.data = val;
+
+       if (opae_manager_ifpga_set_prop(mgr, &prop))
+               return -EINVAL;
+
+       return 0;
+}
+
+static int
+fme_err_read_seu_emr(struct opae_manager *mgr)
+{
+       u64 val;
+       int ret;
+
+       ret = ifpga_get_fme_error_prop(mgr, FME_ERR_PROP_SEU_EMR_LOW, &val);
+       if (ret)
+               return -EINVAL;
+
+       IFPGA_RAWDEV_PMD_INFO("seu emr low: 0x%" PRIx64 "\n", val);
+
+       ret = ifpga_get_fme_error_prop(mgr, FME_ERR_PROP_SEU_EMR_HIGH, &val);
+       if (ret)
+               return -EINVAL;
+
+       IFPGA_RAWDEV_PMD_INFO("seu emr high: 0x%" PRIx64 "\n", val);
+
+       return 0;
+}
+
+static int fme_clear_warning_intr(struct opae_manager *mgr)
+{
+       u64 val;
+
+       if (ifpga_set_fme_error_prop(mgr, FME_ERR_PROP_INJECT_ERRORS, 0))
+               return -EINVAL;
+
+       if (ifpga_get_fme_error_prop(mgr, FME_ERR_PROP_NONFATAL_ERRORS, &val))
+               return -EINVAL;
+       if ((val & 0x40) != 0)
+               IFPGA_RAWDEV_PMD_INFO("clean not done\n");
+
+       return 0;
+}
+
+static int fme_clean_fme_error(struct opae_manager *mgr)
+{
+       u64 val;
+
+       if (ifpga_get_fme_error_prop(mgr, FME_ERR_PROP_ERRORS, &val))
+               return -EINVAL;
+
+       IFPGA_RAWDEV_PMD_DEBUG("before clean 0x%" PRIx64 "\n", val);
+
+       ifpga_set_fme_error_prop(mgr, FME_ERR_PROP_CLEAR, val);
+
+       if (ifpga_get_fme_error_prop(mgr, FME_ERR_PROP_ERRORS, &val))
+               return -EINVAL;
+
+       IFPGA_RAWDEV_PMD_DEBUG("after clean 0x%" PRIx64 "\n", val);
+
+       return 0;
+}
+
+static int
+fme_err_handle_error0(struct opae_manager *mgr)
+{
+       struct feature_fme_error0 fme_error0;
+       u64 val;
+
+       if (ifpga_get_fme_error_prop(mgr, FME_ERR_PROP_ERRORS, &val))
+               return -EINVAL;
+
+       if (fme_clean_fme_error(mgr))
+               return -EINVAL;
+
+       fme_error0.csr = val;
+
+       if (fme_error0.fabric_err)
+               IFPGA_RAWDEV_PMD_ERR("Fabric error\n");
+       else if (fme_error0.fabfifo_overflow)
+               IFPGA_RAWDEV_PMD_ERR("Fabric fifo under/overflow error\n");
+       else if (fme_error0.afu_acc_mode_err)
+               IFPGA_RAWDEV_PMD_ERR("AFU PF/VF access mismatch detected\n");
+       else if (fme_error0.pcie0cdc_parity_err)
+               IFPGA_RAWDEV_PMD_ERR("PCIe0 CDC Parity Error\n");
+       else if (fme_error0.cvlcdc_parity_err)
+               IFPGA_RAWDEV_PMD_ERR("CVL CDC Parity Error\n");
+       else if (fme_error0.fpgaseuerr)
+               fme_err_read_seu_emr(mgr);
+
+       /* clean the errors */
+       if (ifpga_set_fme_error_prop(mgr, FME_ERR_PROP_ERRORS, val))
+               return -EINVAL;
+
+       return 0;
+}
+
+static int
+fme_err_handle_catfatal_error(struct opae_manager *mgr)
+{
+       struct feature_fme_ras_catfaterror fme_catfatal;
+       u64 val;
+
+       if (ifpga_get_fme_error_prop(mgr, FME_ERR_PROP_CATFATAL_ERRORS, &val))
+               return -EINVAL;
+
+       fme_catfatal.csr = val;
+
+       if (fme_catfatal.cci_fatal_err)
+               IFPGA_RAWDEV_PMD_ERR("CCI error detected\n");
+       else if (fme_catfatal.fabric_fatal_err)
+               IFPGA_RAWDEV_PMD_ERR("Fabric fatal error detected\n");
+       else if (fme_catfatal.pcie_poison_err)
+               IFPGA_RAWDEV_PMD_ERR("Poison error from PCIe ports\n");
+       else if (fme_catfatal.inject_fata_err)
+               IFPGA_RAWDEV_PMD_ERR("Injected Fatal Error\n");
+       else if (fme_catfatal.crc_catast_err)
+               IFPGA_RAWDEV_PMD_ERR("a catastrophic EDCRC error\n");
+       else if (fme_catfatal.injected_catast_err)
+               IFPGA_RAWDEV_PMD_ERR("Injected Catastrophic Error\n");
+       else if (fme_catfatal.bmc_seu_catast_err)
+               fme_err_read_seu_emr(mgr);
+
+       return 0;
+}
+
+static int
+fme_err_handle_nonfaterror(struct opae_manager *mgr)
+{
+       struct feature_fme_ras_nonfaterror nonfaterr;
+       u64 val;
+
+       if (ifpga_get_fme_error_prop(mgr, FME_ERR_PROP_NONFATAL_ERRORS, &val))
+               return -EINVAL;
+
+       nonfaterr.csr = val;
+
+       if (nonfaterr.temp_thresh_ap1)
+               IFPGA_RAWDEV_PMD_INFO("Temperature threshold triggered AP1\n");
+       else if (nonfaterr.temp_thresh_ap2)
+               IFPGA_RAWDEV_PMD_INFO("Temperature threshold triggered AP2\n");
+       else if (nonfaterr.pcie_error)
+               IFPGA_RAWDEV_PMD_INFO("an error has occurred in pcie\n");
+       else if (nonfaterr.portfatal_error)
+               IFPGA_RAWDEV_PMD_INFO("fatal error occurred in AFU port.\n");
+       else if (nonfaterr.proc_hot)
+               IFPGA_RAWDEV_PMD_INFO("a ProcHot event\n");
+       else if (nonfaterr.afu_acc_mode_err)
+               IFPGA_RAWDEV_PMD_INFO("an AFU PF/VF access mismatch\n");
+       else if (nonfaterr.injected_nonfata_err) {
+               IFPGA_RAWDEV_PMD_INFO("Injected Warning Error\n");
+               fme_clear_warning_intr(mgr);
+       } else if (nonfaterr.temp_thresh_AP6)
+               IFPGA_RAWDEV_PMD_INFO("Temperature threshold triggered AP6\n");
+       else if (nonfaterr.power_thresh_AP1)
+               IFPGA_RAWDEV_PMD_INFO("Power threshold triggered AP1\n");
+       else if (nonfaterr.power_thresh_AP2)
+               IFPGA_RAWDEV_PMD_INFO("Power threshold triggered AP2\n");
+       else if (nonfaterr.mbp_err)
+               IFPGA_RAWDEV_PMD_INFO("an MBP event\n");
+
+       return 0;
+}
+
+static void
+fme_interrupt_handler(void *param)
+{
+       struct opae_manager *mgr = (struct opae_manager *)param;
+
+       IFPGA_RAWDEV_PMD_INFO("%s interrupt occurred\n", __func__);
+
+       fme_err_handle_error0(mgr);
+       fme_err_handle_nonfaterror(mgr);
+       fme_err_handle_catfatal_error(mgr);
+}
+
+int
+ifpga_unregister_msix_irq(enum ifpga_irq_type type,
+               int vec_start, rte_intr_callback_fn handler, void *arg)
+{
+       struct rte_intr_handle *intr_handle;
+       int rc, i;
+
+       if (type == IFPGA_FME_IRQ)
+               intr_handle = ifpga_irq_handle[0];
+       else if (type == IFPGA_AFU_IRQ)
+               intr_handle = ifpga_irq_handle[vec_start + 1];
+       else
+               return 0;
+
+       rte_intr_efd_disable(intr_handle);
+
+       rc = rte_intr_callback_unregister(intr_handle, handler, arg);
+
+       for (i = 0; i < IFPGA_MAX_IRQ; i++)
+               rte_intr_instance_free(ifpga_irq_handle[i]);
+       return rc;
+}
+
+int
+ifpga_register_msix_irq(struct rte_rawdev *dev, int port_id,
+               enum ifpga_irq_type type, int vec_start, int count,
+               rte_intr_callback_fn handler, const char *name,
+               void *arg)
+{
+       int ret;
+       struct rte_intr_handle *intr_handle;
+       struct opae_adapter *adapter;
+       struct opae_manager *mgr;
+       struct opae_accelerator *acc;
+       int *intr_efds = NULL, nb_intr, i;
+
+       for (i = 0; i < IFPGA_MAX_IRQ; i++) {
+               ifpga_irq_handle[i] =
+                       rte_intr_instance_alloc(RTE_INTR_INSTANCE_F_PRIVATE);
+               if (ifpga_irq_handle[i] == NULL)
+                       return -ENOMEM;
+       }
+
+       adapter = ifpga_rawdev_get_priv(dev);
+       if (!adapter)
+               return -ENODEV;
+
+       mgr = opae_adapter_get_mgr(adapter);
+       if (!mgr)
+               return -ENODEV;
+
+       if (type == IFPGA_FME_IRQ) {
+               intr_handle = ifpga_irq_handle[0];
+               count = 1;
+       } else if (type == IFPGA_AFU_IRQ) {
+               intr_handle = ifpga_irq_handle[vec_start + 1];
+       } else {
+               return -EINVAL;
+       }
+
+       if (rte_intr_type_set(intr_handle, RTE_INTR_HANDLE_VFIO_MSIX))
+               return -rte_errno;
+
+       ret = rte_intr_efd_enable(intr_handle, count);
+       if (ret)
+               return -ENODEV;
+
+       if (rte_intr_fd_set(intr_handle,
+                       rte_intr_efds_index_get(intr_handle, 0)))
+               return -rte_errno;
+
+       IFPGA_RAWDEV_PMD_DEBUG("register %s irq, vfio_fd=%d, fd=%d\n",
+                       name, rte_intr_dev_fd_get(intr_handle),
+                       rte_intr_fd_get(intr_handle));
+
+       if (type == IFPGA_FME_IRQ) {
+               struct fpga_fme_err_irq_set err_irq_set;
+               err_irq_set.evtfd = rte_intr_efds_index_get(intr_handle,
+                                                                  0);
+
+               ret = opae_manager_ifpga_set_err_irq(mgr, &err_irq_set);
+               if (ret)
+                       return -EINVAL;
+       } else if (type == IFPGA_AFU_IRQ) {
+               acc = opae_adapter_get_acc(adapter, port_id);
+               if (!acc)
+                       return -EINVAL;
+
+               nb_intr = rte_intr_nb_intr_get(intr_handle);
+
+               intr_efds = calloc(nb_intr, sizeof(int));
+               if (!intr_efds)
+                       return -ENOMEM;
+
+               for (i = 0; i < nb_intr; i++)
+                       intr_efds[i] = rte_intr_efds_index_get(intr_handle, i);
+
+               ret = opae_acc_set_irq(acc, vec_start, count, intr_efds);
+               if (ret) {
+                       free(intr_efds);
+                       return -EINVAL;
+               }
+       }
+
+       /* register interrupt handler using DPDK API */
+       ret = rte_intr_callback_register(intr_handle,
+                       handler, (void *)arg);
+       if (ret) {
+               free(intr_efds);
+               return -EINVAL;
+       }
+
+       IFPGA_RAWDEV_PMD_INFO("success register %s interrupt\n", name);
+
+       free(intr_efds);
+       return 0;
+}
+
 static int
 ifpga_rawdev_create(struct rte_pci_device *pci_dev,
                        int socket_id)
 {
        int ret = 0;
        struct rte_rawdev *rawdev = NULL;
+       struct ifpga_rawdev *dev = NULL;
        struct opae_adapter *adapter = NULL;
        struct opae_manager *mgr = NULL;
        struct opae_adapter_data_pci *data = NULL;
@@ -624,7 +1478,7 @@ ifpga_rawdev_create(struct rte_pci_device *pci_dev,
        }
 
        memset(name, 0, sizeof(name));
-       snprintf(name, RTE_RAWDEV_NAME_MAX_LEN, "IFPGA:%x:%02x.%x",
+       snprintf(name, RTE_RAWDEV_NAME_MAX_LEN, IFPGA_RAWDEV_NAME_FMT,
                pci_dev->addr.bus, pci_dev->addr.devid, pci_dev->addr.function);
 
        IFPGA_RAWDEV_PMD_INFO("Init %s on NUMA node %d", name, rte_socket_id());
@@ -638,6 +1492,17 @@ ifpga_rawdev_create(struct rte_pci_device *pci_dev,
                goto cleanup;
        }
 
+       ipn3ke_bridge_func.get_ifpga_rawdev = ifpga_rawdev_get;
+       ipn3ke_bridge_func.set_i40e_sw_dev = rte_pmd_i40e_set_switch_dev;
+
+       dev = ifpga_rawdev_allocate(rawdev);
+       if (dev == NULL) {
+               IFPGA_RAWDEV_PMD_ERR("Unable to allocate ifpga_rawdevice");
+               ret = -EINVAL;
+               goto cleanup;
+       }
+       dev->aer_enable = 0;
+
        /* alloc OPAE_FPGA_PCI data to register to OPAE hardware level API */
        data = opae_adapter_data_alloc(OPAE_FPGA_PCI);
        if (!data) {
@@ -653,6 +1518,10 @@ ifpga_rawdev_create(struct rte_pci_device *pci_dev,
        }
        data->device_id = pci_dev->id.device_id;
        data->vendor_id = pci_dev->id.vendor_id;
+       data->bus = pci_dev->addr.bus;
+       data->devid = pci_dev->addr.devid;
+       data->function = pci_dev->addr.function;
+       data->vfio_dev_fd = rte_intr_dev_fd_get(pci_dev->intr_handle);
 
        adapter = rawdev->dev_private;
        /* create a opae_adapter based on above device data */
@@ -678,6 +1547,11 @@ ifpga_rawdev_create(struct rte_pci_device *pci_dev,
                IFPGA_RAWDEV_PMD_INFO("this is a PF function");
        }
 
+       ret = ifpga_register_msix_irq(rawdev, 0, IFPGA_FME_IRQ, 0, 0,
+                       fme_interrupt_handler, "fme_irq", mgr);
+       if (ret)
+               goto free_adapter_data;
+
        return ret;
 
 free_adapter_data:
@@ -697,6 +1571,8 @@ ifpga_rawdev_destroy(struct rte_pci_device *pci_dev)
        struct rte_rawdev *rawdev;
        char name[RTE_RAWDEV_NAME_MAX_LEN];
        struct opae_adapter *adapter;
+       struct opae_manager *mgr;
+       struct ifpga_rawdev *dev;
 
        if (!pci_dev) {
                IFPGA_RAWDEV_PMD_ERR("Invalid pci_dev of the device!");
@@ -705,7 +1581,7 @@ ifpga_rawdev_destroy(struct rte_pci_device *pci_dev)
        }
 
        memset(name, 0, sizeof(name));
-       snprintf(name, RTE_RAWDEV_NAME_MAX_LEN, "IFPGA:%x:%02x.%x",
+       snprintf(name, RTE_RAWDEV_NAME_MAX_LEN, IFPGA_RAWDEV_NAME_FMT,
                pci_dev->addr.bus, pci_dev->addr.devid, pci_dev->addr.function);
 
        IFPGA_RAWDEV_PMD_INFO("Closing %s on NUMA node %d",
@@ -716,13 +1592,21 @@ ifpga_rawdev_destroy(struct rte_pci_device *pci_dev)
                IFPGA_RAWDEV_PMD_ERR("Invalid device name (%s)", name);
                return -EINVAL;
        }
+       dev = ifpga_rawdev_get(rawdev);
+       if (dev)
+               dev->rawdev = NULL;
 
        adapter = ifpga_rawdev_get_priv(rawdev);
        if (!adapter)
                return -ENODEV;
 
-       opae_adapter_data_free(adapter->data);
-       opae_adapter_free(adapter);
+       mgr = opae_adapter_get_mgr(adapter);
+       if (!mgr)
+               return -ENODEV;
+
+       if (ifpga_unregister_msix_irq(IFPGA_FME_IRQ, 0,
+                               fme_interrupt_handler, mgr) < 0)
+               return -EINVAL;
 
        /* rte_rawdev_close is called by pmd_release */
        ret = rte_rawdev_pmd_release(rawdev);
@@ -743,6 +1627,7 @@ ifpga_rawdev_pci_probe(struct rte_pci_driver *pci_drv __rte_unused,
 static int
 ifpga_rawdev_pci_remove(struct rte_pci_device *pci_dev)
 {
+       ifpga_monitor_stop_func();
        return ifpga_rawdev_destroy(pci_dev);
 }
 
@@ -756,13 +1641,7 @@ static struct rte_pci_driver rte_ifpga_rawdev_pmd = {
 RTE_PMD_REGISTER_PCI(ifpga_rawdev_pci_driver, rte_ifpga_rawdev_pmd);
 RTE_PMD_REGISTER_PCI_TABLE(ifpga_rawdev_pci_driver, rte_ifpga_rawdev_pmd);
 RTE_PMD_REGISTER_KMOD_DEP(ifpga_rawdev_pci_driver, "* igb_uio | uio_pci_generic | vfio-pci");
-
-RTE_INIT(ifpga_rawdev_init_log)
-{
-       ifpga_rawdev_logtype = rte_log_register("driver.raw.init");
-       if (ifpga_rawdev_logtype >= 0)
-               rte_log_set_level(ifpga_rawdev_logtype, RTE_LOG_NOTICE);
-}
+RTE_LOG_REGISTER_DEFAULT(ifpga_rawdev_logtype, NOTICE);
 
 static const char * const valid_args[] = {
 #define IFPGA_ARG_NAME         "ifpga"
@@ -774,13 +1653,32 @@ static const char * const valid_args[] = {
        NULL
 };
 
+static int ifpga_rawdev_get_string_arg(const char *key __rte_unused,
+       const char *value, void *extra_args)
+{
+       int size;
+       if (!value || !extra_args)
+               return -EINVAL;
+
+       size = strlen(value) + 1;
+       *(char **)extra_args = rte_malloc(NULL, size, RTE_CACHE_LINE_SIZE);
+       if (!*(char **)extra_args)
+               return -ENOMEM;
+
+       strlcpy(*(char **)extra_args, value, size);
+
+       return 0;
+}
 static int
 ifpga_cfg_probe(struct rte_vdev_device *dev)
 {
        struct rte_devargs *devargs;
        struct rte_kvargs *kvlist = NULL;
+       struct rte_rawdev *rawdev = NULL;
+       struct ifpga_rawdev *ifpga_dev;
        int port;
        char *name = NULL;
+       const char *bdf;
        char dev_name[RTE_RAWDEV_NAME_MAX_LEN];
        int ret = -1;
 
@@ -794,7 +1692,8 @@ ifpga_cfg_probe(struct rte_vdev_device *dev)
 
        if (rte_kvargs_count(kvlist, IFPGA_ARG_NAME) == 1) {
                if (rte_kvargs_process(kvlist, IFPGA_ARG_NAME,
-                                      &rte_ifpga_get_string_arg, &name) < 0) {
+                                      &ifpga_rawdev_get_string_arg,
+                                      &name) < 0) {
                        IFPGA_RAWDEV_PMD_ERR("error to parse %s",
                                     IFPGA_ARG_NAME);
                        goto end;
@@ -820,6 +1719,19 @@ ifpga_cfg_probe(struct rte_vdev_device *dev)
                goto end;
        }
 
+       memset(dev_name, 0, sizeof(dev_name));
+       snprintf(dev_name, RTE_RAWDEV_NAME_MAX_LEN, "IFPGA:%s", name);
+       rawdev = rte_rawdev_pmd_get_named_dev(dev_name);
+       if (!rawdev)
+               goto end;
+       ifpga_dev = ifpga_rawdev_get(rawdev);
+       if (!ifpga_dev)
+               goto end;
+       bdf = name;
+       ifpga_rawdev_fill_info(ifpga_dev, bdf);
+
+       ifpga_monitor_start_func();
+
        memset(dev_name, 0, sizeof(dev_name));
        snprintf(dev_name, RTE_RAWDEV_NAME_MAX_LEN, "%d|%s",
        port, name);
@@ -855,3 +1767,33 @@ RTE_PMD_REGISTER_PARAM_STRING(ifpga_rawdev_cfg,
        "ifpga=<string> "
        "port=<int> "
        "afu_bts=<path>");
+
+struct rte_pci_bus *ifpga_get_pci_bus(void)
+{
+       return rte_ifpga_rawdev_pmd.bus;
+}
+
+int ifpga_rawdev_partial_reconfigure(struct rte_rawdev *dev, int port,
+       const char *file)
+{
+       if (!dev) {
+               IFPGA_RAWDEV_PMD_ERR("Input parameter is invalid");
+               return -EINVAL;
+       }
+
+       return rte_fpga_do_pr(dev, port, file);
+}
+
+void ifpga_rawdev_cleanup(void)
+{
+       struct ifpga_rawdev *dev;
+       unsigned int i;
+
+       for (i = 0; i < IFPGA_RAWDEV_NUM; i++) {
+               dev = &ifpga_rawdevices[i];
+               if (dev->rawdev) {
+                       rte_rawdev_pmd_release(dev->rawdev);
+                       dev->rawdev = NULL;
+               }
+       }
+}