ethdev: add namespace
[dpdk.git] / drivers / net / mlx5 / linux / mlx5_ethdev_os.c
index 3d3dd2e..9d0e491 100644 (file)
@@ -24,8 +24,7 @@
 #include <sys/un.h>
 #include <time.h>
 
-#include <rte_atomic.h>
-#include <rte_ethdev_driver.h>
+#include <ethdev_driver.h>
 #include <rte_bus_pci.h>
 #include <rte_mbuf.h>
 #include <rte_common.h>
@@ -129,6 +128,17 @@ struct ethtool_link_settings {
 #define ETHTOOL_LINK_MODE_200000baseCR4_Full_BIT 2 /* 66 - 64 */
 #endif
 
+/* Get the netdev interface index of a SubFunction device from its name. */
+int
+mlx5_auxiliary_get_ifindex(const char *sf_name)
+{
+       char netdev[IF_NAMESIZE] = { 0 };
+       int rc;
+
+       rc = mlx5_auxiliary_get_child_name(sf_name, "/net", netdev,
+                                          sizeof(netdev));
+       return rc != 0 ? -rte_errno : (int)if_nametoindex(netdev);
+}
 
 /**
  * Get interface name from private structure.
@@ -144,13 +154,17 @@ struct ethtool_link_settings {
  *   0 on success, a negative errno value otherwise and rte_errno is set.
  */
 int
-mlx5_get_ifname(const struct rte_eth_dev *dev, char (*ifname)[IF_NAMESIZE])
+mlx5_get_ifname(const struct rte_eth_dev *dev, char (*ifname)[MLX5_NAMESIZE])
 {
        struct mlx5_priv *priv = dev->data->dev_private;
        unsigned int ifindex;
 
        MLX5_ASSERT(priv);
        MLX5_ASSERT(priv->sh);
+       if (priv->master && priv->sh->bond.ifindex > 0) {
+               memcpy(ifname, priv->sh->bond.ifname, MLX5_NAMESIZE);
+               return 0;
+       }
        ifindex = mlx5_ifindex(dev);
        if (!ifindex) {
                if (!priv->representor)
@@ -166,10 +180,10 @@ mlx5_get_ifname(const struct rte_eth_dev *dev, char (*ifname)[IF_NAMESIZE])
 }
 
 /**
- * Perform ifreq ioctl() on associated Ethernet device.
+ * Perform ifreq ioctl() on associated netdev ifname.
  *
- * @param[in] dev
- *   Pointer to Ethernet device.
+ * @param[in] ifname
+ *   Pointer to netdev name.
  * @param req
  *   Request number to pass to ioctl().
  * @param[out] ifr
@@ -179,7 +193,7 @@ mlx5_get_ifname(const struct rte_eth_dev *dev, char (*ifname)[IF_NAMESIZE])
  *   0 on success, a negative errno value otherwise and rte_errno is set.
  */
 static int
-mlx5_ifreq(const struct rte_eth_dev *dev, int req, struct ifreq *ifr)
+mlx5_ifreq_by_ifname(const char *ifname, int req, struct ifreq *ifr)
 {
        int sock = socket(PF_INET, SOCK_DGRAM, IPPROTO_IP);
        int ret = 0;
@@ -188,9 +202,7 @@ mlx5_ifreq(const struct rte_eth_dev *dev, int req, struct ifreq *ifr)
                rte_errno = errno;
                return -rte_errno;
        }
-       ret = mlx5_get_ifname(dev, &ifr->ifr_name);
-       if (ret)
-               goto error;
+       rte_strscpy(ifr->ifr_name, ifname, sizeof(ifr->ifr_name));
        ret = ioctl(sock, req, ifr);
        if (ret == -1) {
                rte_errno = errno;
@@ -203,6 +215,31 @@ error:
        return -rte_errno;
 }
 
+/**
+ * Issue an ifreq ioctl() against the netdev backing an Ethernet device.
+ *
+ * The name comes from mlx5_get_ifname(); mlx5_ifreq_by_ifname() does the I/O.
+ *
+ * @param[in] dev
+ *   Pointer to Ethernet device.
+ * @param req
+ *   Request number to pass to ioctl().
+ * @param[out] ifr
+ *   Interface request structure output buffer.
+ *
+ * @return
+ *   0 on success, a negative errno value otherwise and rte_errno is set.
+ */
+static int
+mlx5_ifreq(const struct rte_eth_dev *dev, int req, struct ifreq *ifr)
+{
+       char netdev_name[sizeof(ifr->ifr_name)];
+
+       if (mlx5_get_ifname(dev, &netdev_name) != 0)
+               return -rte_errno;
+       return mlx5_ifreq_by_ifname(netdev_name, req, ifr);
+}
+
 /**
  * Get device MTU.
  *
@@ -287,7 +324,7 @@ int
 mlx5_read_clock(struct rte_eth_dev *dev, uint64_t *clock)
 {
        struct mlx5_priv *priv = dev->data->dev_private;
-       struct ibv_context *ctx = priv->sh->ctx;
+       struct ibv_context *ctx = priv->sh->cdev->ctx;
        struct ibv_values_ex values;
        int err = 0;
 
@@ -320,7 +357,7 @@ mlx5_find_master_dev(struct rte_eth_dev *dev)
        priv = dev->data->dev_private;
        domain_id = priv->domain_id;
        MLX5_ASSERT(priv->representor);
-       MLX5_ETH_FOREACH_DEV(port_id, priv->pci_dev) {
+       MLX5_ETH_FOREACH_DEV(port_id, dev->device) {
                struct mlx5_priv *opriv =
                        rte_eth_devices[port_id].data->dev_private;
                if (opriv &&
@@ -402,31 +439,24 @@ mlx5_link_update_unlocked_gset(struct rte_eth_dev *dev,
        }
        link_speed = ethtool_cmd_speed(&edata);
        if (link_speed == -1)
-               dev_link.link_speed = ETH_SPEED_NUM_NONE;
+               dev_link.link_speed = RTE_ETH_SPEED_NUM_UNKNOWN;
        else
                dev_link.link_speed = link_speed;
        priv->link_speed_capa = 0;
-       if (edata.supported & SUPPORTED_Autoneg)
-               priv->link_speed_capa |= ETH_LINK_SPEED_AUTONEG;
        if (edata.supported & (SUPPORTED_1000baseT_Full |
                               SUPPORTED_1000baseKX_Full))
-               priv->link_speed_capa |= ETH_LINK_SPEED_1G;
+               priv->link_speed_capa |= RTE_ETH_LINK_SPEED_1G;
        if (edata.supported & SUPPORTED_10000baseKR_Full)
-               priv->link_speed_capa |= ETH_LINK_SPEED_10G;
+               priv->link_speed_capa |= RTE_ETH_LINK_SPEED_10G;
        if (edata.supported & (SUPPORTED_40000baseKR4_Full |
                               SUPPORTED_40000baseCR4_Full |
                               SUPPORTED_40000baseSR4_Full |
                               SUPPORTED_40000baseLR4_Full))
-               priv->link_speed_capa |= ETH_LINK_SPEED_40G;
+               priv->link_speed_capa |= RTE_ETH_LINK_SPEED_40G;
        dev_link.link_duplex = ((edata.duplex == DUPLEX_HALF) ?
-                               ETH_LINK_HALF_DUPLEX : ETH_LINK_FULL_DUPLEX);
+                               RTE_ETH_LINK_HALF_DUPLEX : RTE_ETH_LINK_FULL_DUPLEX);
        dev_link.link_autoneg = !(dev->data->dev_conf.link_speeds &
-                       ETH_LINK_SPEED_FIXED);
-       if (((dev_link.link_speed && !dev_link.link_status) ||
-            (!dev_link.link_speed && dev_link.link_status))) {
-               rte_errno = EAGAIN;
-               return -rte_errno;
-       }
+                       RTE_ETH_LINK_SPEED_FIXED);
        *link = dev_link;
        return 0;
 }
@@ -514,48 +544,46 @@ mlx5_link_update_unlocked_gs(struct rte_eth_dev *dev,
                        dev->data->port_id, strerror(rte_errno));
                return ret;
        }
-       dev_link.link_speed = (ecmd->speed == UINT32_MAX) ? ETH_SPEED_NUM_NONE :
-                                                           ecmd->speed;
+       dev_link.link_speed = (ecmd->speed == UINT32_MAX) ?
+                               RTE_ETH_SPEED_NUM_UNKNOWN : ecmd->speed;
        sc = ecmd->link_mode_masks[0] |
                ((uint64_t)ecmd->link_mode_masks[1] << 32);
        priv->link_speed_capa = 0;
-       if (sc & MLX5_BITSHIFT(ETHTOOL_LINK_MODE_Autoneg_BIT))
-               priv->link_speed_capa |= ETH_LINK_SPEED_AUTONEG;
        if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_1000baseT_Full_BIT) |
                  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_1000baseKX_Full_BIT)))
-               priv->link_speed_capa |= ETH_LINK_SPEED_1G;
+               priv->link_speed_capa |= RTE_ETH_LINK_SPEED_1G;
        if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_10000baseKX4_Full_BIT) |
                  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_10000baseKR_Full_BIT) |
                  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_10000baseR_FEC_BIT)))
-               priv->link_speed_capa |= ETH_LINK_SPEED_10G;
+               priv->link_speed_capa |= RTE_ETH_LINK_SPEED_10G;
        if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_20000baseMLD2_Full_BIT) |
                  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_20000baseKR2_Full_BIT)))
-               priv->link_speed_capa |= ETH_LINK_SPEED_20G;
+               priv->link_speed_capa |= RTE_ETH_LINK_SPEED_20G;
        if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_40000baseKR4_Full_BIT) |
                  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_40000baseCR4_Full_BIT) |
                  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_40000baseSR4_Full_BIT) |
                  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_40000baseLR4_Full_BIT)))
-               priv->link_speed_capa |= ETH_LINK_SPEED_40G;
+               priv->link_speed_capa |= RTE_ETH_LINK_SPEED_40G;
        if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_56000baseKR4_Full_BIT) |
                  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_56000baseCR4_Full_BIT) |
                  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_56000baseSR4_Full_BIT) |
                  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_56000baseLR4_Full_BIT)))
-               priv->link_speed_capa |= ETH_LINK_SPEED_56G;
+               priv->link_speed_capa |= RTE_ETH_LINK_SPEED_56G;
        if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_25000baseCR_Full_BIT) |
                  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_25000baseKR_Full_BIT) |
                  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_25000baseSR_Full_BIT)))
-               priv->link_speed_capa |= ETH_LINK_SPEED_25G;
+               priv->link_speed_capa |= RTE_ETH_LINK_SPEED_25G;
        if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_50000baseCR2_Full_BIT) |
                  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_50000baseKR2_Full_BIT)))
-               priv->link_speed_capa |= ETH_LINK_SPEED_50G;
+               priv->link_speed_capa |= RTE_ETH_LINK_SPEED_50G;
        if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_100000baseKR4_Full_BIT) |
                  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_100000baseSR4_Full_BIT) |
                  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_100000baseCR4_Full_BIT) |
                  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_100000baseLR4_ER4_Full_BIT)))
-               priv->link_speed_capa |= ETH_LINK_SPEED_100G;
+               priv->link_speed_capa |= RTE_ETH_LINK_SPEED_100G;
        if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_200000baseKR4_Full_BIT) |
                  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_200000baseSR4_Full_BIT)))
-               priv->link_speed_capa |= ETH_LINK_SPEED_200G;
+               priv->link_speed_capa |= RTE_ETH_LINK_SPEED_200G;
 
        sc = ecmd->link_mode_masks[2] |
                ((uint64_t)ecmd->link_mode_masks[3] << 32);
@@ -563,16 +591,11 @@ mlx5_link_update_unlocked_gs(struct rte_eth_dev *dev,
                  MLX5_BITSHIFT
                       (ETHTOOL_LINK_MODE_200000baseLR4_ER4_FR4_Full_BIT) |
                  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_200000baseDR4_Full_BIT)))
-               priv->link_speed_capa |= ETH_LINK_SPEED_200G;
+               priv->link_speed_capa |= RTE_ETH_LINK_SPEED_200G;
        dev_link.link_duplex = ((ecmd->duplex == DUPLEX_HALF) ?
-                               ETH_LINK_HALF_DUPLEX : ETH_LINK_FULL_DUPLEX);
+                               RTE_ETH_LINK_HALF_DUPLEX : RTE_ETH_LINK_FULL_DUPLEX);
        dev_link.link_autoneg = !(dev->data->dev_conf.link_speeds &
-                                 ETH_LINK_SPEED_FIXED);
-       if (((dev_link.link_speed && !dev_link.link_status) ||
-            (!dev_link.link_speed && dev_link.link_status))) {
-               rte_errno = EAGAIN;
-               return -rte_errno;
-       }
+                                 RTE_ETH_LINK_SPEED_FIXED);
        *link = dev_link;
        return 0;
 }
@@ -654,13 +677,13 @@ mlx5_dev_get_flow_ctrl(struct rte_eth_dev *dev, struct rte_eth_fc_conf *fc_conf)
        }
        fc_conf->autoneg = ethpause.autoneg;
        if (ethpause.rx_pause && ethpause.tx_pause)
-               fc_conf->mode = RTE_FC_FULL;
+               fc_conf->mode = RTE_ETH_FC_FULL;
        else if (ethpause.rx_pause)
-               fc_conf->mode = RTE_FC_RX_PAUSE;
+               fc_conf->mode = RTE_ETH_FC_RX_PAUSE;
        else if (ethpause.tx_pause)
-               fc_conf->mode = RTE_FC_TX_PAUSE;
+               fc_conf->mode = RTE_ETH_FC_TX_PAUSE;
        else
-               fc_conf->mode = RTE_FC_NONE;
+               fc_conf->mode = RTE_ETH_FC_NONE;
        return 0;
 }
 
@@ -686,14 +709,14 @@ mlx5_dev_set_flow_ctrl(struct rte_eth_dev *dev, struct rte_eth_fc_conf *fc_conf)
 
        ifr.ifr_data = (void *)&ethpause;
        ethpause.autoneg = fc_conf->autoneg;
-       if (((fc_conf->mode & RTE_FC_FULL) == RTE_FC_FULL) ||
-           (fc_conf->mode & RTE_FC_RX_PAUSE))
+       if (((fc_conf->mode & RTE_ETH_FC_FULL) == RTE_ETH_FC_FULL) ||
+           (fc_conf->mode & RTE_ETH_FC_RX_PAUSE))
                ethpause.rx_pause = 1;
        else
                ethpause.rx_pause = 0;
 
-       if (((fc_conf->mode & RTE_FC_FULL) == RTE_FC_FULL) ||
-           (fc_conf->mode & RTE_FC_TX_PAUSE))
+       if (((fc_conf->mode & RTE_ETH_FC_FULL) == RTE_ETH_FC_FULL) ||
+           (fc_conf->mode & RTE_ETH_FC_TX_PAUSE))
                ethpause.tx_pause = 1;
        else
                ethpause.tx_pause = 0;
@@ -732,7 +755,7 @@ mlx5_dev_interrupt_device_fatal(struct mlx5_dev_ctx_shared *sh)
                dev = &rte_eth_devices[sh->port[i].ih_port_id];
                MLX5_ASSERT(dev);
                if (dev->data->dev_conf.intr_conf.rmv)
-                       _rte_eth_dev_callback_process
+                       rte_eth_dev_callback_process
                                (dev, RTE_ETH_EVENT_INTR_RMV, NULL);
        }
 }
@@ -755,7 +778,7 @@ mlx5_dev_interrupt_handler(void *cb_arg)
                struct rte_eth_dev *dev;
                uint32_t tmp;
 
-               if (mlx5_glue->get_async_event(sh->ctx, &event))
+               if (mlx5_glue->get_async_event(sh->cdev->ctx, &event))
                        break;
                /* Retrieve and check IB port index. */
                tmp = (uint32_t)event.element.port_num;
@@ -808,7 +831,7 @@ mlx5_dev_interrupt_handler(void *cb_arg)
                                usleep(0);
                                continue;
                        }
-                       _rte_eth_dev_callback_process
+                       rte_eth_dev_callback_process
                                (dev, RTE_ETH_EVENT_INTR_LSC, NULL);
                        continue;
                }
@@ -967,7 +990,7 @@ mlx5_is_removed(struct rte_eth_dev *dev)
        struct ibv_device_attr device_attr;
        struct mlx5_priv *priv = dev->data->dev_private;
 
-       if (mlx5_glue->query_device(priv->sh->ctx, &device_attr) == EIO)
+       if (mlx5_glue->query_device(priv->sh->cdev->ctx, &device_attr) == EIO)
                return 1;
        return 0;
 }
@@ -1017,9 +1040,14 @@ mlx5_sysfs_check_switch_info(bool device_dir,
        case MLX5_PHYS_PORT_NAME_TYPE_PFHPF:
                /* Fallthrough */
        case MLX5_PHYS_PORT_NAME_TYPE_PFVF:
+               /* Fallthrough */
+       case MLX5_PHYS_PORT_NAME_TYPE_PFSF:
                /* New representors naming schema. */
                switch_info->representor = 1;
                break;
+       default:
+               switch_info->master = device_dir;
+               break;
        }
 }
 
@@ -1101,6 +1129,58 @@ mlx5_sysfs_switch_info(unsigned int ifindex, struct mlx5_switch_info *info)
        return 0;
 }
 
+/**
+ * Get bond information associated with network interface.
+ *
+ * @param pf_ifindex
+ *   Network interface index of the bond slave interface.
+ * @param[out] ifindex
+ *   Pointer to bond ifindex, may be NULL.
+ * @param[out] ifname
+ *   Pointer to bond ifname (at least IF_NAMESIZE bytes), may be NULL.
+ *
+ * @return
+ *   0 on success, a negative errno value otherwise and rte_errno is set.
+ */
+int
+mlx5_sysfs_bond_info(unsigned int pf_ifindex, unsigned int *ifindex,
+                    char *ifname)
+{
+       char name[IF_NAMESIZE];
+       FILE *file;
+       unsigned int index;
+       int ret, err;
+
+       if (!if_indextoname(pf_ifindex, name) || !strlen(name)) {
+               rte_errno = errno;
+               return -rte_errno;
+       }
+       MKSTR(bond_if, "/sys/class/net/%s/master/ifindex", name);
+       /* Read the bond ifindex exposed under the slave's sysfs master entry. */
+       file = fopen(bond_if, "rb");
+       if (file == NULL) {
+               rte_errno = errno;
+               return -rte_errno;
+       }
+       errno = 0;
+       ret = fscanf(file, "%u", &index);
+       err = errno; /* Save before fclose() can overwrite it. */
+       fclose(file);
+       if (ret != 1) {
+               /* A matching failure or an empty file leaves errno unset. */
+               rte_errno = err ? err : EINVAL;
+               return -rte_errno;
+       }
+       if (ifindex)
+               *ifindex = index;
+       /* Resolve the bond device name from its interface index. */
+       if (ifname && !if_indextoname(index, ifname)) {
+               rte_errno = errno;
+               return -rte_errno;
+       }
+       return 0;
+}
+
 /**
  * DPDK callback to retrieve plug-in module EEPROM information (type and size).
  *
@@ -1124,7 +1204,7 @@ mlx5_get_module_info(struct rte_eth_dev *dev,
        };
        int ret = 0;
 
-       if (!dev || !modinfo) {
+       if (!dev) {
                DRV_LOG(WARNING, "missing argument, cannot get module info");
                rte_errno = EINVAL;
                return -rte_errno;
@@ -1158,7 +1238,7 @@ int mlx5_get_module_eeprom(struct rte_eth_dev *dev,
        struct ifreq ifr;
        int ret = 0;
 
-       if (!dev || !info) {
+       if (!dev) {
                DRV_LOG(WARNING, "missing argument, cannot get module eeprom");
                rte_errno = EINVAL;
                return -rte_errno;
@@ -1193,6 +1273,8 @@ int mlx5_get_module_eeprom(struct rte_eth_dev *dev,
  *
  * @param dev
  *   Pointer to Ethernet device.
+ * @param[in] pf
+ *   PF index in case of bonding device, -1 otherwise
  * @param[out] stats
  *   Counters table output buffer.
  *
@@ -1200,8 +1282,8 @@ int mlx5_get_module_eeprom(struct rte_eth_dev *dev,
  *   0 on success and stats is filled, negative errno value otherwise and
  *   rte_errno is set.
  */
-int
-mlx5_os_read_dev_counters(struct rte_eth_dev *dev, uint64_t *stats)
+static int
+_mlx5_os_read_dev_counters(struct rte_eth_dev *dev, int pf, uint64_t *stats)
 {
        struct mlx5_priv *priv = dev->data->dev_private;
        struct mlx5_xstats_ctrl *xstats_ctrl = &priv->xstats_ctrl;
@@ -1215,7 +1297,11 @@ mlx5_os_read_dev_counters(struct rte_eth_dev *dev, uint64_t *stats)
        et_stats->cmd = ETHTOOL_GSTATS;
        et_stats->n_stats = xstats_ctrl->stats_n;
        ifr.ifr_data = (caddr_t)et_stats;
-       ret = mlx5_ifreq(dev, SIOCETHTOOL, &ifr);
+       if (pf >= 0)
+               ret = mlx5_ifreq_by_ifname(priv->sh->bond.ports[pf].ifname,
+                                          SIOCETHTOOL, &ifr);
+       else
+               ret = mlx5_ifreq(dev, SIOCETHTOOL, &ifr);
        if (ret) {
                DRV_LOG(WARNING,
                        "port %u unable to read statistic values from device",
@@ -1223,23 +1309,60 @@ mlx5_os_read_dev_counters(struct rte_eth_dev *dev, uint64_t *stats)
                return ret;
        }
        for (i = 0; i != xstats_ctrl->mlx5_stats_n; ++i) {
-               if (xstats_ctrl->info[i].dev) {
-                       ret = mlx5_os_read_dev_stat(priv,
-                                           xstats_ctrl->info[i].ctr_name,
-                                           &stats[i]);
-                       /* return last xstats counter if fail to read. */
-                       if (ret == 0)
-                               xstats_ctrl->xstats[i] = stats[i];
-                       else
-                               stats[i] = xstats_ctrl->xstats[i];
-               } else {
-                       stats[i] = (uint64_t)
-                               et_stats->data[xstats_ctrl->dev_table_idx[i]];
-               }
+               if (xstats_ctrl->info[i].dev)
+                       continue;
+               stats[i] += (uint64_t)
+                           et_stats->data[xstats_ctrl->dev_table_idx[i]];
        }
        return 0;
 }
 
+/**
+ * Read device counters.
+ *
+ * Bonding masters sum the ifreq counters of every bonding member port.
+ *
+ * @param dev
+ *   Pointer to Ethernet device.
+ * @param[out] stats
+ *   Counters table output buffer.
+ *
+ * @return
+ *   0 on success and stats is filled, negative errno value otherwise and
+ *   rte_errno is set.
+ */
+int
+mlx5_os_read_dev_counters(struct rte_eth_dev *dev, uint64_t *stats)
+{
+       struct mlx5_priv *priv = dev->data->dev_private;
+       struct mlx5_xstats_ctrl *xstats_ctrl = &priv->xstats_ctrl;
+       int ret = 0, i;
+
+       memset(stats, 0, sizeof(*stats) * xstats_ctrl->mlx5_stats_n);
+       /* Read ifreq counters. */
+       if (priv->master && priv->pf_bond >= 0) {
+               /* Sum xstats from bonding device member ports. */
+               for (i = 0; ret == 0 && i < priv->sh->bond.n_port; i++)
+                       ret = _mlx5_os_read_dev_counters(dev, i, stats);
+       } else {
+               ret = _mlx5_os_read_dev_counters(dev, -1, stats);
+       }
+       if (ret)
+               return ret;
+       /* Read IB counters. */
+       for (i = 0; i != xstats_ctrl->mlx5_stats_n; ++i) {
+               if (!xstats_ctrl->info[i].dev)
+                       continue;
+               /* Cache fresh values; reuse the last one if the read fails. */
+               if (mlx5_os_read_dev_stat(priv, xstats_ctrl->info[i].ctr_name,
+                                         &stats[i]) == 0)
+                       xstats_ctrl->xstats[i] = stats[i];
+               else
+                       stats[i] = xstats_ctrl->xstats[i];
+       }
+       return 0;
+}
+
 /**
  * Query the number of statistics provided by ETHTOOL.
  *
@@ -1253,13 +1376,19 @@ mlx5_os_read_dev_counters(struct rte_eth_dev *dev, uint64_t *stats)
 int
 mlx5_os_get_stats_n(struct rte_eth_dev *dev)
 {
+       struct mlx5_priv *priv = dev->data->dev_private;
        struct ethtool_drvinfo drvinfo;
        struct ifreq ifr;
        int ret;
 
        drvinfo.cmd = ETHTOOL_GDRVINFO;
        ifr.ifr_data = (caddr_t)&drvinfo;
-       ret = mlx5_ifreq(dev, SIOCETHTOOL, &ifr);
+       if (priv->master && priv->pf_bond >= 0)
+               /* Bonding PF. */
+               ret = mlx5_ifreq_by_ifname(priv->sh->bond.ports[0].ifname,
+                                          SIOCETHTOOL, &ifr);
+       else
+               ret = mlx5_ifreq(dev, SIOCETHTOOL, &ifr);
        if (ret) {
                DRV_LOG(WARNING, "port %u unable to query number of statistics",
                        dev->data->port_id);
@@ -1270,71 +1399,71 @@ mlx5_os_get_stats_n(struct rte_eth_dev *dev)
 
 static const struct mlx5_counter_ctrl mlx5_counters_init[] = {
        {
-               .dpdk_name = "rx_port_unicast_bytes",
+               .dpdk_name = "rx_unicast_bytes",
                .ctr_name = "rx_vport_unicast_bytes",
        },
        {
-               .dpdk_name = "rx_port_multicast_bytes",
+               .dpdk_name = "rx_multicast_bytes",
                .ctr_name = "rx_vport_multicast_bytes",
        },
        {
-               .dpdk_name = "rx_port_broadcast_bytes",
+               .dpdk_name = "rx_broadcast_bytes",
                .ctr_name = "rx_vport_broadcast_bytes",
        },
        {
-               .dpdk_name = "rx_port_unicast_packets",
+               .dpdk_name = "rx_unicast_packets",
                .ctr_name = "rx_vport_unicast_packets",
        },
        {
-               .dpdk_name = "rx_port_multicast_packets",
+               .dpdk_name = "rx_multicast_packets",
                .ctr_name = "rx_vport_multicast_packets",
        },
        {
-               .dpdk_name = "rx_port_broadcast_packets",
+               .dpdk_name = "rx_broadcast_packets",
                .ctr_name = "rx_vport_broadcast_packets",
        },
        {
-               .dpdk_name = "tx_port_unicast_bytes",
+               .dpdk_name = "tx_unicast_bytes",
                .ctr_name = "tx_vport_unicast_bytes",
        },
        {
-               .dpdk_name = "tx_port_multicast_bytes",
+               .dpdk_name = "tx_multicast_bytes",
                .ctr_name = "tx_vport_multicast_bytes",
        },
        {
-               .dpdk_name = "tx_port_broadcast_bytes",
+               .dpdk_name = "tx_broadcast_bytes",
                .ctr_name = "tx_vport_broadcast_bytes",
        },
        {
-               .dpdk_name = "tx_port_unicast_packets",
+               .dpdk_name = "tx_unicast_packets",
                .ctr_name = "tx_vport_unicast_packets",
        },
        {
-               .dpdk_name = "tx_port_multicast_packets",
+               .dpdk_name = "tx_multicast_packets",
                .ctr_name = "tx_vport_multicast_packets",
        },
        {
-               .dpdk_name = "tx_port_broadcast_packets",
+               .dpdk_name = "tx_broadcast_packets",
                .ctr_name = "tx_vport_broadcast_packets",
        },
        {
-               .dpdk_name = "rx_wqe_err",
+               .dpdk_name = "rx_wqe_errors",
                .ctr_name = "rx_wqe_err",
        },
        {
-               .dpdk_name = "rx_crc_errors_phy",
+               .dpdk_name = "rx_phy_crc_errors",
                .ctr_name = "rx_crc_errors_phy",
        },
        {
-               .dpdk_name = "rx_in_range_len_errors_phy",
+               .dpdk_name = "rx_phy_in_range_len_errors",
                .ctr_name = "rx_in_range_len_errors_phy",
        },
        {
-               .dpdk_name = "rx_symbol_err_phy",
+               .dpdk_name = "rx_phy_symbol_errors",
                .ctr_name = "rx_symbol_err_phy",
        },
        {
-               .dpdk_name = "tx_errors_phy",
+               .dpdk_name = "tx_phy_errors",
                .ctr_name = "tx_errors_phy",
        },
        {
@@ -1343,44 +1472,44 @@ static const struct mlx5_counter_ctrl mlx5_counters_init[] = {
                .dev = 1,
        },
        {
-               .dpdk_name = "tx_packets_phy",
+               .dpdk_name = "tx_phy_packets",
                .ctr_name = "tx_packets_phy",
        },
        {
-               .dpdk_name = "rx_packets_phy",
+               .dpdk_name = "rx_phy_packets",
                .ctr_name = "rx_packets_phy",
        },
        {
-               .dpdk_name = "tx_discards_phy",
+               .dpdk_name = "tx_phy_discard_packets",
                .ctr_name = "tx_discards_phy",
        },
        {
-               .dpdk_name = "rx_discards_phy",
+               .dpdk_name = "rx_phy_discard_packets",
                .ctr_name = "rx_discards_phy",
        },
        {
-               .dpdk_name = "tx_bytes_phy",
+               .dpdk_name = "tx_phy_bytes",
                .ctr_name = "tx_bytes_phy",
        },
        {
-               .dpdk_name = "rx_bytes_phy",
+               .dpdk_name = "rx_phy_bytes",
                .ctr_name = "rx_bytes_phy",
        },
        /* Representor only */
        {
-               .dpdk_name = "rx_packets",
+               .dpdk_name = "rx_vport_packets",
                .ctr_name = "vport_rx_packets",
        },
        {
-               .dpdk_name = "rx_bytes",
+               .dpdk_name = "rx_vport_bytes",
                .ctr_name = "vport_rx_bytes",
        },
        {
-               .dpdk_name = "tx_packets",
+               .dpdk_name = "tx_vport_packets",
                .ctr_name = "vport_tx_packets",
        },
        {
-               .dpdk_name = "tx_bytes",
+               .dpdk_name = "tx_vport_bytes",
                .ctr_name = "vport_tx_bytes",
        },
 };
@@ -1430,7 +1559,12 @@ mlx5_os_stats_init(struct rte_eth_dev *dev)
        strings->string_set = ETH_SS_STATS;
        strings->len = dev_stats_n;
        ifr.ifr_data = (caddr_t)strings;
-       ret = mlx5_ifreq(dev, SIOCETHTOOL, &ifr);
+       if (priv->master && priv->pf_bond >= 0)
+               /* Bonding master. */
+               ret = mlx5_ifreq_by_ifname(priv->sh->bond.ports[0].ifname,
+                                          SIOCETHTOOL, &ifr);
+       else
+               ret = mlx5_ifreq(dev, SIOCETHTOOL, &ifr);
        if (ret) {
                DRV_LOG(WARNING, "port %u unable to get statistic names",
                        dev->data->port_id);
@@ -1496,4 +1630,3 @@ mlx5_get_mac(struct rte_eth_dev *dev, uint8_t (*mac)[RTE_ETHER_ADDR_LEN])
        memcpy(mac, request.ifr_hwaddr.sa_data, RTE_ETHER_ADDR_LEN);
        return 0;
 }
-