net/hns3: support device reset
[dpdk.git] / drivers / net / hns3 / hns3_intr.c
index 3cf52a2..9e2d811 100644 (file)
                        hw->reset.stats.merge_cnt++;    \
        } while (0)
 
+static const char *reset_string[HNS3_MAX_RESET] = {
+       "none", "vf_func", "vf_pf_func", "vf_full", "flr",
+       "vf_global", "pf_func", "global", "IMP",
+};
+
 const struct hns3_hw_error mac_afifo_tnl_int[] = {
        { .int_msk = BIT(0), .msg = "egu_cge_afifo_ecc_1bit_err",
          .reset_level = HNS3_NONE_RESET },
@@ -652,3 +657,510 @@ hns3_handle_msix_error(struct hns3_adapter *hns, uint64_t *levels)
 out:
        rte_free(desc);
 }
+
+int
+hns3_reset_init(struct hns3_hw *hw)
+{
+       rte_spinlock_init(&hw->lock);
+       hw->reset.level = HNS3_NONE_RESET;
+       hw->reset.stage = RESET_STAGE_NONE;
+       hw->reset.request = 0;
+       hw->reset.pending = 0;
+       rte_atomic16_init(&hw->reset.resetting);
+       rte_atomic16_init(&hw->reset.disable_cmd);
+       hw->reset.wait_data = rte_zmalloc("wait_data",
+                                         sizeof(struct hns3_wait_data), 0);
+       if (!hw->reset.wait_data) {
+               PMD_INIT_LOG(ERR, "Failed to allocate memory for wait_data");
+               return -ENOMEM;
+       }
+       return 0;
+}
+
+void
+hns3_schedule_reset(struct hns3_adapter *hns)
+{
+       struct hns3_hw *hw = &hns->hw;
+
+       /* Reschedule the reset process after successful initialization */
+       if (hw->adapter_state == HNS3_NIC_UNINITIALIZED) {
+               rte_atomic16_set(&hns->hw.reset.schedule, SCHEDULE_PENDING);
+               return;
+       }
+
+       if (hw->adapter_state >= HNS3_NIC_CLOSED)
+               return;
+
+       /* Schedule restart alarm if it is not scheduled yet */
+       if (rte_atomic16_read(&hns->hw.reset.schedule) == SCHEDULE_REQUESTED)
+               return;
+       if (rte_atomic16_read(&hns->hw.reset.schedule) == SCHEDULE_DEFERRED)
+               rte_eal_alarm_cancel(hw->reset.ops->reset_service, hns);
+       rte_atomic16_set(&hns->hw.reset.schedule, SCHEDULE_REQUESTED);
+
+       rte_eal_alarm_set(SWITCH_CONTEXT_US, hw->reset.ops->reset_service, hns);
+}
+
+void
+hns3_schedule_delayed_reset(struct hns3_adapter *hns)
+{
+#define DEFERRED_SCHED_US (3 * MSEC_PER_SEC * USEC_PER_MSEC)
+       struct hns3_hw *hw = &hns->hw;
+
+       /* Do nothing if it is uninited or closed */
+       if (hw->adapter_state == HNS3_NIC_UNINITIALIZED ||
+           hw->adapter_state >= HNS3_NIC_CLOSED) {
+               return;
+       }
+
+       if (rte_atomic16_read(&hns->hw.reset.schedule) != SCHEDULE_NONE)
+               return;
+       rte_atomic16_set(&hns->hw.reset.schedule, SCHEDULE_DEFERRED);
+       rte_eal_alarm_set(DEFERRED_SCHED_US, hw->reset.ops->reset_service, hns);
+}
+
+void
+hns3_wait_callback(void *param)
+{
+       struct hns3_wait_data *data = (struct hns3_wait_data *)param;
+       struct hns3_adapter *hns = data->hns;
+       struct hns3_hw *hw = &hns->hw;
+       uint64_t msec;
+       bool done;
+
+       data->count--;
+       if (data->check_completion) {
+               /*
+                * Check if the current time exceeds the deadline
+                * or a pending reset coming, or reset during close.
+                */
+               msec = get_timeofday_ms();
+               if (msec > data->end_ms || is_reset_pending(hns) ||
+                   hw->adapter_state == HNS3_NIC_CLOSING) {
+                       done = false;
+                       data->count = 0;
+               } else
+                       done = data->check_completion(hw);
+       } else
+               done = true;
+
+       if (!done && data->count > 0) {
+               rte_eal_alarm_set(data->interval, hns3_wait_callback, data);
+               return;
+       }
+       if (done)
+               data->result = HNS3_WAIT_SUCCESS;
+       else {
+               hns3_err(hw, "%s wait timeout at stage %d",
+                        reset_string[hw->reset.level], hw->reset.stage);
+               data->result = HNS3_WAIT_TIMEOUT;
+       }
+       hns3_schedule_reset(hns);
+}
+
+void
+hns3_notify_reset_ready(struct hns3_hw *hw, bool enable)
+{
+       uint32_t reg_val;
+
+       reg_val = hns3_read_dev(hw, HNS3_CMDQ_TX_DEPTH_REG);
+       if (enable)
+               reg_val |= HNS3_NIC_SW_RST_RDY;
+       else
+               reg_val &= ~HNS3_NIC_SW_RST_RDY;
+
+       hns3_write_dev(hw, HNS3_CMDQ_TX_DEPTH_REG, reg_val);
+}
+
+int
+hns3_reset_req_hw_reset(struct hns3_adapter *hns)
+{
+       struct hns3_hw *hw = &hns->hw;
+
+       if (hw->reset.wait_data->result == HNS3_WAIT_UNKNOWN) {
+               hw->reset.wait_data->hns = hns;
+               hw->reset.wait_data->check_completion = NULL;
+               hw->reset.wait_data->interval = HNS3_RESET_SYNC_US;
+               hw->reset.wait_data->count = 1;
+               hw->reset.wait_data->result = HNS3_WAIT_REQUEST;
+               rte_eal_alarm_set(hw->reset.wait_data->interval,
+                                 hns3_wait_callback, hw->reset.wait_data);
+               return -EAGAIN;
+       } else if (hw->reset.wait_data->result == HNS3_WAIT_REQUEST)
+               return -EAGAIN;
+
+       /* inform hardware that preparatory work is done */
+       hns3_notify_reset_ready(hw, true);
+       return 0;
+}
+
+static void
+hns3_clear_reset_level(struct hns3_hw *hw, uint64_t *levels)
+{
+       uint64_t merge_cnt = hw->reset.stats.merge_cnt;
+       int64_t tmp;
+
+       switch (hw->reset.level) {
+       case HNS3_IMP_RESET:
+               hns3_atomic_clear_bit(HNS3_IMP_RESET, levels);
+               tmp = hns3_test_and_clear_bit(HNS3_GLOBAL_RESET, levels);
+               HNS3_CHECK_MERGE_CNT(tmp);
+               tmp = hns3_test_and_clear_bit(HNS3_FUNC_RESET, levels);
+               HNS3_CHECK_MERGE_CNT(tmp);
+               break;
+       case HNS3_GLOBAL_RESET:
+               hns3_atomic_clear_bit(HNS3_GLOBAL_RESET, levels);
+               tmp = hns3_test_and_clear_bit(HNS3_FUNC_RESET, levels);
+               HNS3_CHECK_MERGE_CNT(tmp);
+               break;
+       case HNS3_FUNC_RESET:
+               hns3_atomic_clear_bit(HNS3_FUNC_RESET, levels);
+               break;
+       case HNS3_VF_RESET:
+               hns3_atomic_clear_bit(HNS3_VF_RESET, levels);
+               tmp = hns3_test_and_clear_bit(HNS3_VF_PF_FUNC_RESET, levels);
+               HNS3_CHECK_MERGE_CNT(tmp);
+               tmp = hns3_test_and_clear_bit(HNS3_VF_FUNC_RESET, levels);
+               HNS3_CHECK_MERGE_CNT(tmp);
+               break;
+       case HNS3_VF_FULL_RESET:
+               hns3_atomic_clear_bit(HNS3_VF_FULL_RESET, levels);
+               tmp = hns3_test_and_clear_bit(HNS3_VF_FUNC_RESET, levels);
+               HNS3_CHECK_MERGE_CNT(tmp);
+               break;
+       case HNS3_VF_PF_FUNC_RESET:
+               hns3_atomic_clear_bit(HNS3_VF_PF_FUNC_RESET, levels);
+               tmp = hns3_test_and_clear_bit(HNS3_VF_FUNC_RESET, levels);
+               HNS3_CHECK_MERGE_CNT(tmp);
+               break;
+       case HNS3_VF_FUNC_RESET:
+               hns3_atomic_clear_bit(HNS3_VF_FUNC_RESET, levels);
+               break;
+       case HNS3_FLR_RESET:
+               hns3_atomic_clear_bit(HNS3_FLR_RESET, levels);
+               break;
+       case HNS3_NONE_RESET:
+       default:
+               return;
+       };
+       if (merge_cnt != hw->reset.stats.merge_cnt)
+               hns3_warn(hw,
+                         "No need to do low-level reset after %s reset. "
+                         "merge cnt: %" PRIx64 " total merge cnt: %" PRIx64,
+                         reset_string[hw->reset.level],
+                         hw->reset.stats.merge_cnt - merge_cnt,
+                         hw->reset.stats.merge_cnt);
+}
+
+static bool
+hns3_reset_err_handle(struct hns3_adapter *hns)
+{
+#define MAX_RESET_FAIL_CNT 5
+
+       struct hns3_hw *hw = &hns->hw;
+
+       if (hw->adapter_state == HNS3_NIC_CLOSING)
+               goto reset_fail;
+
+       if (is_reset_pending(hns)) {
+               hw->reset.attempts = 0;
+               hw->reset.stats.fail_cnt++;
+               hns3_warn(hw, "%s reset fail because new Reset is pending "
+                             "attempts:%" PRIx64,
+                         reset_string[hw->reset.level],
+                         hw->reset.stats.fail_cnt);
+               hw->reset.level = HNS3_NONE_RESET;
+               return true;
+       }
+
+       hw->reset.attempts++;
+       if (hw->reset.attempts < MAX_RESET_FAIL_CNT) {
+               hns3_atomic_set_bit(hw->reset.level, &hw->reset.pending);
+               hns3_warn(hw, "%s retry to reset attempts: %d",
+                         reset_string[hw->reset.level],
+                         hw->reset.attempts);
+               return true;
+       }
+
+       if (rte_atomic16_read(&hw->reset.disable_cmd))
+               hns3_cmd_init(hw);
+reset_fail:
+       hw->reset.attempts = 0;
+       hw->reset.stats.fail_cnt++;
+       hns3_warn(hw, "%s reset fail fail_cnt:%" PRIx64 " success_cnt:%" PRIx64
+                 " global_cnt:%" PRIx64 " imp_cnt:%" PRIx64
+                 " request_cnt:%" PRIx64 " exec_cnt:%" PRIx64
+                 " merge_cnt:%" PRIx64,
+                 reset_string[hw->reset.level], hw->reset.stats.fail_cnt,
+                 hw->reset.stats.success_cnt, hw->reset.stats.global_cnt,
+                 hw->reset.stats.imp_cnt, hw->reset.stats.request_cnt,
+                 hw->reset.stats.exec_cnt, hw->reset.stats.merge_cnt);
+
+       /* IMP no longer waiting the ready flag */
+       hns3_notify_reset_ready(hw, true);
+       return false;
+}
+
+static int
+hns3_reset_pre(struct hns3_adapter *hns)
+{
+       struct hns3_hw *hw = &hns->hw;
+       struct timeval tv;
+       int ret;
+
+       if (hw->reset.stage == RESET_STAGE_NONE) {
+               rte_atomic16_set(&hns->hw.reset.resetting, 1);
+               hw->reset.stage = RESET_STAGE_DOWN;
+               ret = hw->reset.ops->stop_service(hns);
+               gettimeofday(&tv, NULL);
+               if (ret) {
+                       hns3_warn(hw, "Reset step1 down fail=%d time=%ld.%.6ld",
+                                 ret, tv.tv_sec, tv.tv_usec);
+                       return ret;
+               }
+               hns3_warn(hw, "Reset step1 down success time=%ld.%.6ld",
+                         tv.tv_sec, tv.tv_usec);
+               hw->reset.stage = RESET_STAGE_PREWAIT;
+       }
+       if (hw->reset.stage == RESET_STAGE_PREWAIT) {
+               ret = hw->reset.ops->prepare_reset(hns);
+               gettimeofday(&tv, NULL);
+               if (ret) {
+                       hns3_warn(hw,
+                                 "Reset step2 prepare wait fail=%d time=%ld.%.6ld",
+                                 ret, tv.tv_sec, tv.tv_usec);
+                       return ret;
+               }
+               hns3_warn(hw, "Reset step2 prepare wait success time=%ld.%.6ld",
+                         tv.tv_sec, tv.tv_usec);
+               hw->reset.stage = RESET_STAGE_REQ_HW_RESET;
+               hw->reset.wait_data->result = HNS3_WAIT_UNKNOWN;
+       }
+       return 0;
+}
+
+static int
+hns3_reset_post(struct hns3_adapter *hns)
+{
+#define TIMEOUT_RETRIES_CNT    5
+       struct hns3_hw *hw = &hns->hw;
+       struct timeval tv_delta;
+       struct timeval tv;
+       int ret = 0;
+
+       if (hw->adapter_state == HNS3_NIC_CLOSING) {
+               hns3_warn(hw, "Don't do reset_post during closing, just uninit cmd");
+               hns3_cmd_uninit(hw);
+               return -EPERM;
+       }
+
+       if (hw->reset.stage == RESET_STAGE_DEV_INIT) {
+               rte_spinlock_lock(&hw->lock);
+               if (hw->reset.mbuf_deferred_free) {
+                       hns3_dev_release_mbufs(hns);
+                       hw->reset.mbuf_deferred_free = false;
+               }
+               ret = hw->reset.ops->reinit_dev(hns);
+               rte_spinlock_unlock(&hw->lock);
+               gettimeofday(&tv, NULL);
+               if (ret) {
+                       hns3_warn(hw, "Reset step5 devinit fail=%d retries=%d",
+                                 ret, hw->reset.retries);
+                       goto err;
+               }
+               hns3_warn(hw, "Reset step5 devinit success time=%ld.%.6ld",
+                         tv.tv_sec, tv.tv_usec);
+               hw->reset.retries = 0;
+               hw->reset.stage = RESET_STAGE_RESTORE;
+               rte_eal_alarm_set(SWITCH_CONTEXT_US,
+                                 hw->reset.ops->reset_service, hns);
+               return -EAGAIN;
+       }
+       if (hw->reset.stage == RESET_STAGE_RESTORE) {
+               rte_spinlock_lock(&hw->lock);
+               ret = hw->reset.ops->restore_conf(hns);
+               rte_spinlock_unlock(&hw->lock);
+               gettimeofday(&tv, NULL);
+               if (ret) {
+                       hns3_warn(hw,
+                                 "Reset step6 restore fail=%d retries=%d",
+                                 ret, hw->reset.retries);
+                       goto err;
+               }
+               hns3_warn(hw, "Reset step6 restore success time=%ld.%.6ld",
+                         tv.tv_sec, tv.tv_usec);
+               hw->reset.retries = 0;
+               hw->reset.stage = RESET_STAGE_DONE;
+       }
+       if (hw->reset.stage == RESET_STAGE_DONE) {
+               /* IMP will wait ready flag before reset */
+               hns3_notify_reset_ready(hw, false);
+               hns3_clear_reset_level(hw, &hw->reset.pending);
+               rte_atomic16_clear(&hns->hw.reset.resetting);
+               hw->reset.attempts = 0;
+               hw->reset.stats.success_cnt++;
+               hw->reset.stage = RESET_STAGE_NONE;
+               hw->reset.ops->start_service(hns);
+               gettimeofday(&tv, NULL);
+               timersub(&tv, &hw->reset.start_time, &tv_delta);
+               hns3_warn(hw, "%s reset done fail_cnt:%" PRIx64
+                         " success_cnt:%" PRIx64 " global_cnt:%" PRIx64
+                         " imp_cnt:%" PRIx64 " request_cnt:%" PRIx64
+                         " exec_cnt:%" PRIx64 " merge_cnt:%" PRIx64,
+                         reset_string[hw->reset.level],
+                         hw->reset.stats.fail_cnt, hw->reset.stats.success_cnt,
+                         hw->reset.stats.global_cnt, hw->reset.stats.imp_cnt,
+                         hw->reset.stats.request_cnt, hw->reset.stats.exec_cnt,
+                         hw->reset.stats.merge_cnt);
+               hns3_warn(hw,
+                         "%s reset done delta %ld ms time=%ld.%.6ld",
+                         reset_string[hw->reset.level],
+                         tv_delta.tv_sec * MSEC_PER_SEC +
+                         tv_delta.tv_usec / USEC_PER_MSEC,
+                         tv.tv_sec, tv.tv_usec);
+               hw->reset.level = HNS3_NONE_RESET;
+       }
+       return 0;
+
+err:
+       if (ret == -ETIME) {
+               hw->reset.retries++;
+               if (hw->reset.retries < TIMEOUT_RETRIES_CNT) {
+                       rte_eal_alarm_set(HNS3_RESET_SYNC_US,
+                                         hw->reset.ops->reset_service, hns);
+                       return -EAGAIN;
+               }
+       }
+       hw->reset.retries = 0;
+       return -EIO;
+}
+
+/*
+ * There are three scenarios as follows:
+ * When the reset is not in progress, the reset process starts.
+ * During the reset process, if the reset level has not changed,
+ * the reset process continues; otherwise, the reset process is aborted.
+ *     hw->reset.level   new_level          action
+ *     HNS3_NONE_RESET  HNS3_XXXX_RESET    start reset
+ *     HNS3_XXXX_RESET  HNS3_XXXX_RESET    continue reset
+ *     HNS3_LOW_RESET   HNS3_HIGH_RESET    abort
+ */
+int
+hns3_reset_process(struct hns3_adapter *hns, enum hns3_reset_level new_level)
+{
+       struct hns3_hw *hw = &hns->hw;
+       struct timeval tv_delta;
+       struct timeval tv;
+       int ret;
+
+       if (hw->reset.level == HNS3_NONE_RESET) {
+               hw->reset.level = new_level;
+               hw->reset.stats.exec_cnt++;
+               gettimeofday(&hw->reset.start_time, NULL);
+               hns3_warn(hw, "Start %s reset time=%ld.%.6ld",
+                         reset_string[hw->reset.level],
+                         hw->reset.start_time.tv_sec,
+                         hw->reset.start_time.tv_usec);
+       }
+
+       if (is_reset_pending(hns)) {
+               gettimeofday(&tv, NULL);
+               hns3_warn(hw,
+                         "%s reset is aborted by high level time=%ld.%.6ld",
+                         reset_string[hw->reset.level], tv.tv_sec, tv.tv_usec);
+               if (hw->reset.wait_data->result == HNS3_WAIT_REQUEST)
+                       rte_eal_alarm_cancel(hns3_wait_callback,
+                                            hw->reset.wait_data);
+               ret = -EBUSY;
+               goto err;
+       }
+
+       ret = hns3_reset_pre(hns);
+       if (ret)
+               goto err;
+
+       if (hw->reset.stage == RESET_STAGE_REQ_HW_RESET) {
+               ret = hns3_reset_req_hw_reset(hns);
+               if (ret == -EAGAIN)
+                       return ret;
+               gettimeofday(&tv, NULL);
+               hns3_warn(hw,
+                         "Reset step3 request IMP reset success time=%ld.%.6ld",
+                         tv.tv_sec, tv.tv_usec);
+               hw->reset.stage = RESET_STAGE_WAIT;
+               hw->reset.wait_data->result = HNS3_WAIT_UNKNOWN;
+       }
+       if (hw->reset.stage == RESET_STAGE_WAIT) {
+               ret = hw->reset.ops->wait_hardware_ready(hns);
+               if (ret)
+                       goto retry;
+               gettimeofday(&tv, NULL);
+               hns3_warn(hw, "Reset step4 reset wait success time=%ld.%.6ld",
+                         tv.tv_sec, tv.tv_usec);
+               hw->reset.stage = RESET_STAGE_DEV_INIT;
+       }
+
+       ret = hns3_reset_post(hns);
+       if (ret)
+               goto retry;
+
+       return 0;
+retry:
+       if (ret == -EAGAIN)
+               return ret;
+err:
+       hns3_clear_reset_level(hw, &hw->reset.pending);
+       if (hns3_reset_err_handle(hns)) {
+               hw->reset.stage = RESET_STAGE_PREWAIT;
+               hns3_schedule_reset(hns);
+       } else {
+               rte_spinlock_lock(&hw->lock);
+               if (hw->reset.mbuf_deferred_free) {
+                       hns3_dev_release_mbufs(hns);
+                       hw->reset.mbuf_deferred_free = false;
+               }
+               rte_spinlock_unlock(&hw->lock);
+               rte_atomic16_clear(&hns->hw.reset.resetting);
+               hw->reset.stage = RESET_STAGE_NONE;
+               gettimeofday(&tv, NULL);
+               timersub(&tv, &hw->reset.start_time, &tv_delta);
+               hns3_warn(hw, "%s reset fail delta %ld ms time=%ld.%.6ld",
+                         reset_string[hw->reset.level],
+                         tv_delta.tv_sec * MSEC_PER_SEC +
+                         tv_delta.tv_usec / USEC_PER_MSEC,
+                         tv.tv_sec, tv.tv_usec);
+               hw->reset.level = HNS3_NONE_RESET;
+       }
+
+       return -EIO;
+}
+
+/*
+ * The reset process can only be terminated after handshake with IMP(step3),
+ * so that IMP can complete the reset process normally.
+ */
+void
+hns3_reset_abort(struct hns3_adapter *hns)
+{
+       struct hns3_hw *hw = &hns->hw;
+       struct timeval tv;
+       int i;
+
+       for (i = 0; i < HNS3_QUIT_RESET_CNT; i++) {
+               if (hw->reset.level == HNS3_NONE_RESET)
+                       break;
+               rte_delay_ms(HNS3_QUIT_RESET_DELAY_MS);
+       }
+
+       /* IMP no longer waiting the ready flag */
+       hns3_notify_reset_ready(hw, true);
+
+       rte_eal_alarm_cancel(hw->reset.ops->reset_service, hns);
+       rte_eal_alarm_cancel(hns3_wait_callback, hw->reset.wait_data);
+
+       if (hw->reset.level != HNS3_NONE_RESET) {
+               gettimeofday(&tv, NULL);
+               hns3_err(hw, "Failed to terminate reset: %s time=%ld.%.6ld",
+                        reset_string[hw->reset.level], tv.tv_sec, tv.tv_usec);
+       }
+}