eal: rename power monitor condition member
[dpdk.git] / drivers / event / dlb / dlb.c
index 95b7bbe..a65f708 100644 (file)
@@ -72,6 +72,25 @@ static struct rte_event_dev_info evdev_dlb_default_info = {
 struct process_local_port_data
 dlb_port[DLB_MAX_NUM_PORTS][NUM_DLB_PORT_TYPES];
 
+static inline uint16_t
+dlb_event_enqueue_delayed(void *event_port,
+                         const struct rte_event events[]);
+
+static inline uint16_t
+dlb_event_enqueue_burst_delayed(void *event_port,
+                               const struct rte_event events[],
+                               uint16_t num);
+
+static inline uint16_t
+dlb_event_enqueue_new_burst_delayed(void *event_port,
+                                   const struct rte_event events[],
+                                   uint16_t num);
+
+static inline uint16_t
+dlb_event_enqueue_forward_burst_delayed(void *event_port,
+                                       const struct rte_event events[],
+                                       uint16_t num);
+
 static int
 dlb_hw_query_resources(struct dlb_eventdev *dlb)
 {
@@ -140,6 +159,9 @@ dlb_free_qe_mem(struct dlb_port *qm_port)
 
        rte_free(qm_port->consume_qe);
        qm_port->consume_qe = NULL;
+
+       rte_memzone_free(dlb_port[qm_port->id][PORT_TYPE(qm_port)].mz);
+       dlb_port[qm_port->id][PORT_TYPE(qm_port)].mz = NULL;
 }
 
 static int
@@ -978,7 +1000,6 @@ dlb_hw_create_ldb_port(struct dlb_eventdev *dlb,
        /* The credit window is one high water mark of QEs */
        qm_port->dir_pushcount_at_credit_expiry = 0;
        qm_port->cached_dir_credits = cfg.dir_credit_high_watermark;
-       qm_port->cq_depth = cfg.cq_depth;
        /* CQs with depth < 8 use an 8-entry queue, but withhold credits so
         * the effective depth is smaller.
         */
@@ -1003,6 +1024,33 @@ dlb_hw_create_ldb_port(struct dlb_eventdev *dlb,
 
        qm_port->dequeue_depth = dequeue_depth;
 
+       /* When using the reserved token scheme, token_pop_thresh is
+        * initially 2 * dequeue_depth. Once the tokens are reserved,
+        * the enqueue code re-assigns it to dequeue_depth.
+        */
+       qm_port->token_pop_thresh = cq_depth;
+
+       /* When the deferred scheduling vdev arg is selected, use deferred pop
+        * for all single-entry CQs.
+        */
+       if (cfg.cq_depth == 1 || (cfg.cq_depth == 2 && use_rsvd_token_scheme)) {
+               if (dlb->defer_sched)
+                       qm_port->token_pop_mode = DEFERRED_POP;
+       }
+
+       /* The default enqueue functions do not include delayed-pop support for
+        * performance reasons.
+        */
+       if (qm_port->token_pop_mode == DELAYED_POP) {
+               dlb->event_dev->enqueue = dlb_event_enqueue_delayed;
+               dlb->event_dev->enqueue_burst =
+                       dlb_event_enqueue_burst_delayed;
+               dlb->event_dev->enqueue_new_burst =
+                       dlb_event_enqueue_new_burst_delayed;
+               dlb->event_dev->enqueue_forward_burst =
+                       dlb_event_enqueue_forward_burst_delayed;
+       }
+
        qm_port->owed_tokens = 0;
        qm_port->issued_releases = 0;
 
@@ -1163,6 +1211,8 @@ dlb_hw_create_dir_port(struct dlb_eventdev *dlb,
 
        qm_port->dequeue_depth = dequeue_depth;
 
+       /* Directed ports are auto-pop, by default. */
+       qm_port->token_pop_mode = AUTO_POP;
        qm_port->owed_tokens = 0;
        qm_port->issued_releases = 0;
 
@@ -2572,6 +2622,30 @@ dlb_event_build_hcws(struct dlb_port *qm_port,
        }
 }
 
+static inline void
+dlb_construct_token_pop_qe(struct dlb_port *qm_port, int idx)
+{
+       struct dlb_cq_pop_qe *qe = (void *)qm_port->qe4;
+       int num = qm_port->owed_tokens;
+
+       if (qm_port->use_rsvd_token_scheme) {
+               /* Check if there's a deficit of reserved tokens, and return
+                * early if there are no (unreserved) tokens to consume.
+                */
+               if (num <= qm_port->cq_rsvd_token_deficit) {
+                       qm_port->cq_rsvd_token_deficit -= num;
+                       qm_port->owed_tokens = 0;
+                       return;
+               }
+               num -= qm_port->cq_rsvd_token_deficit;
+               qm_port->cq_rsvd_token_deficit = 0;
+       }
+
+       qe[idx].cmd_byte = DLB_POP_CMD_BYTE;
+       qe[idx].tokens = num - 1;
+       qm_port->owed_tokens = 0;
+}
+
 static __rte_always_inline void
 dlb_pp_write(struct dlb_enqueue_qe *qe4,
             struct process_local_port_data *port_data)
@@ -2638,7 +2712,8 @@ dlb_consume_qe_immediate(struct dlb_port *qm_port, int num)
 static inline uint16_t
 __dlb_event_enqueue_burst(void *event_port,
                          const struct rte_event events[],
-                         uint16_t num)
+                         uint16_t num,
+                         bool use_delayed)
 {
        struct dlb_eventdev_port *ev_port = event_port;
        struct dlb_port *qm_port = &ev_port->qm_port;
@@ -2666,6 +2741,35 @@ __dlb_event_enqueue_burst(void *event_port,
 
                for (; j < DLB_NUM_QES_PER_CACHE_LINE && (i + j) < num; j++) {
                        const struct rte_event *ev = &events[i + j];
+                       int16_t thresh = qm_port->token_pop_thresh;
+
+                       if (use_delayed &&
+                           qm_port->token_pop_mode == DELAYED_POP &&
+                           (ev->op == RTE_EVENT_OP_FORWARD ||
+                            ev->op == RTE_EVENT_OP_RELEASE) &&
+                           qm_port->issued_releases >= thresh - 1) {
+                               /* Insert the token pop QE and break out. This
+                                * may result in a partial HCW, but that is
+                                * simpler than supporting arbitrary QE
+                                * insertion.
+                                */
+                               dlb_construct_token_pop_qe(qm_port, j);
+
+                               /* Reset the releases for the next QE batch */
+                               qm_port->issued_releases -= thresh;
+
+                               /* When using delayed token pop mode, the
+                                * initial token threshold is the full CQ
+                                * depth. After the first token pop, we need to
+                                * reset it to the dequeue_depth.
+                                */
+                               qm_port->token_pop_thresh =
+                                       qm_port->dequeue_depth;
+
+                               pop_offs = 1;
+                               j++;
+                               break;
+                       }
 
                        if (dlb_event_enqueue_prep(ev_port, qm_port, ev,
                                                   port_data, &sched_types[j],
@@ -2701,14 +2805,29 @@ dlb_event_enqueue_burst(void *event_port,
                        const struct rte_event events[],
                        uint16_t num)
 {
-       return __dlb_event_enqueue_burst(event_port, events, num);
+       return __dlb_event_enqueue_burst(event_port, events, num, false);
+}
+
+static inline uint16_t
+dlb_event_enqueue_burst_delayed(void *event_port,
+                               const struct rte_event events[],
+                               uint16_t num)
+{
+       return __dlb_event_enqueue_burst(event_port, events, num, true);
 }
 
 static inline uint16_t
 dlb_event_enqueue(void *event_port,
                  const struct rte_event events[])
 {
-       return __dlb_event_enqueue_burst(event_port, events, 1);
+       return __dlb_event_enqueue_burst(event_port, events, 1, false);
+}
+
+static inline uint16_t
+dlb_event_enqueue_delayed(void *event_port,
+                         const struct rte_event events[])
+{
+       return __dlb_event_enqueue_burst(event_port, events, 1, true);
 }
 
 static uint16_t
@@ -2716,7 +2835,15 @@ dlb_event_enqueue_new_burst(void *event_port,
                            const struct rte_event events[],
                            uint16_t num)
 {
-       return __dlb_event_enqueue_burst(event_port, events, num);
+       return __dlb_event_enqueue_burst(event_port, events, num, false);
+}
+
+static uint16_t
+dlb_event_enqueue_new_burst_delayed(void *event_port,
+                                   const struct rte_event events[],
+                                   uint16_t num)
+{
+       return __dlb_event_enqueue_burst(event_port, events, num, true);
 }
 
 static uint16_t
@@ -2724,7 +2851,15 @@ dlb_event_enqueue_forward_burst(void *event_port,
                                const struct rte_event events[],
                                uint16_t num)
 {
-       return __dlb_event_enqueue_burst(event_port, events, num);
+       return __dlb_event_enqueue_burst(event_port, events, num, false);
+}
+
+static uint16_t
+dlb_event_enqueue_forward_burst_delayed(void *event_port,
+                                       const struct rte_event events[],
+                                       uint16_t num)
+{
+       return __dlb_event_enqueue_burst(event_port, events, num, true);
 }
 
 static __rte_always_inline int
@@ -3026,6 +3161,7 @@ dlb_dequeue_wait(struct dlb_eventdev *dlb,
                /* Interrupts not supported by PF PMD */
                return 1;
        } else if (dlb->umwait_allowed) {
+               struct rte_power_monitor_cond pmc;
                volatile struct dlb_dequeue_qe *cq_base;
                union {
                        uint64_t raw_qe[2];
@@ -3046,9 +3182,12 @@ dlb_dequeue_wait(struct dlb_eventdev *dlb,
                else
                        expected_value = 0;
 
-               rte_power_monitor(monitor_addr, expected_value,
-                                 qe_mask.raw_qe[1], timeout + start_ticks,
-                                 sizeof(uint64_t));
+               pmc.addr = monitor_addr;
+               pmc.val = expected_value;
+               pmc.mask = qe_mask.raw_qe[1];
+               pmc.size = sizeof(uint64_t);
+
+               rte_power_monitor(&pmc, timeout + start_ticks);
 
                DLB_INC_STAT(ev_port->stats.traffic.rx_umonitor_umwait, 1);
        } else {
@@ -3124,7 +3263,8 @@ dlb_hw_dequeue(struct dlb_eventdev *dlb,
 
        qm_port->owed_tokens += num;
 
-       dlb_consume_qe_immediate(qm_port, num);
+       if (num && qm_port->token_pop_mode == AUTO_POP)
+               dlb_consume_qe_immediate(qm_port, num);
 
        ev_port->outstanding_releases += num;
 
@@ -3249,7 +3389,8 @@ dlb_hw_dequeue_sparse(struct dlb_eventdev *dlb,
 
        qm_port->owed_tokens += num;
 
-       dlb_consume_qe_immediate(qm_port, num);
+       if (num && qm_port->token_pop_mode == AUTO_POP)
+               dlb_consume_qe_immediate(qm_port, num);
 
        ev_port->outstanding_releases += num;
 
@@ -3293,6 +3434,28 @@ dlb_event_release(struct dlb_eventdev *dlb, uint8_t port_id, int n)
                qm_port->qe4[3].cmd_byte = 0;
 
                for (; j < DLB_NUM_QES_PER_CACHE_LINE && (i + j) < n; j++) {
+                       int16_t thresh = qm_port->token_pop_thresh;
+
+                       if (qm_port->token_pop_mode == DELAYED_POP &&
+                           qm_port->issued_releases >= thresh - 1) {
+                               /* Insert the token pop QE */
+                               dlb_construct_token_pop_qe(qm_port, j);
+
+                               /* Reset the releases for the next QE batch */
+                               qm_port->issued_releases -= thresh;
+
+                               /* When using delayed token pop mode, the
+                                * initial token threshold is the full CQ
+                                * depth. After the first token pop, we need to
+                                * reset it to the dequeue_depth.
+                                */
+                               qm_port->token_pop_thresh =
+                                       qm_port->dequeue_depth;
+
+                               pop_offs = 1;
+                               j++;
+                               break;
+                       }
 
                        qm_port->qe4[j].cmd_byte = DLB_COMP_CMD_BYTE;
                        qm_port->issued_releases++;
@@ -3325,6 +3488,7 @@ dlb_event_dequeue_burst(void *event_port, struct rte_event *ev, uint16_t num,
                        uint64_t wait)
 {
        struct dlb_eventdev_port *ev_port = event_port;
+       struct dlb_port *qm_port = &ev_port->qm_port;
        struct dlb_eventdev *dlb = ev_port->dlb;
        uint16_t cnt;
        int ret;
@@ -3344,6 +3508,10 @@ dlb_event_dequeue_burst(void *event_port, struct rte_event *ev, uint16_t num,
                DLB_INC_STAT(ev_port->stats.tx_implicit_rel, out_rels);
        }
 
+       if (qm_port->token_pop_mode == DEFERRED_POP &&
+                       qm_port->owed_tokens)
+               dlb_consume_qe_immediate(qm_port, qm_port->owed_tokens);
+
        cnt = dlb_hw_dequeue(dlb, ev_port, ev, num, wait);
 
        DLB_INC_STAT(ev_port->stats.traffic.total_polls, 1);
@@ -3362,6 +3530,7 @@ dlb_event_dequeue_burst_sparse(void *event_port, struct rte_event *ev,
                               uint16_t num, uint64_t wait)
 {
        struct dlb_eventdev_port *ev_port = event_port;
+       struct dlb_port *qm_port = &ev_port->qm_port;
        struct dlb_eventdev *dlb = ev_port->dlb;
        uint16_t cnt;
        int ret;
@@ -3381,6 +3550,10 @@ dlb_event_dequeue_burst_sparse(void *event_port, struct rte_event *ev,
                DLB_INC_STAT(ev_port->stats.tx_implicit_rel, out_rels);
        }
 
+       if (qm_port->token_pop_mode == DEFERRED_POP &&
+           qm_port->owed_tokens)
+               dlb_consume_qe_immediate(qm_port, qm_port->owed_tokens);
+
        cnt = dlb_hw_dequeue_sparse(dlb, ev_port, ev, num, wait);
 
        DLB_INC_STAT(ev_port->stats.traffic.total_polls, 1);
@@ -3637,6 +3810,40 @@ dlb_eventdev_close(struct rte_eventdev *dev)
        return 0;
 }
 
+static void
+dlb_eventdev_port_release(void *port)
+{
+       struct dlb_eventdev_port *ev_port = port;
+
+       if (ev_port) {
+               struct dlb_port *qm_port = &ev_port->qm_port;
+
+               if (qm_port->config_state == DLB_CONFIGURED)
+                       dlb_free_qe_mem(qm_port);
+       }
+}
+
+static void
+dlb_eventdev_queue_release(struct rte_eventdev *dev, uint8_t id)
+{
+       RTE_SET_USED(dev);
+       RTE_SET_USED(id);
+
+       /* This function intentionally left blank. */
+}
+
+static int
+dlb_eventdev_timeout_ticks(struct rte_eventdev *dev, uint64_t ns,
+                          uint64_t *timeout_ticks)
+{
+       RTE_SET_USED(dev);
+       uint64_t cycles_per_ns = rte_get_timer_hz() / 1E9;
+
+       *timeout_ticks = ns * cycles_per_ns;
+
+       return 0;
+}
+
 void
 dlb_entry_points_init(struct rte_eventdev *dev)
 {
@@ -3651,16 +3858,20 @@ dlb_entry_points_init(struct rte_eventdev *dev)
                .queue_def_conf   = dlb_eventdev_queue_default_conf_get,
                .port_def_conf    = dlb_eventdev_port_default_conf_get,
                .queue_setup      = dlb_eventdev_queue_setup,
+               .queue_release    = dlb_eventdev_queue_release,
                .port_setup       = dlb_eventdev_port_setup,
+               .port_release     = dlb_eventdev_port_release,
                .port_link        = dlb_eventdev_port_link,
                .port_unlink      = dlb_eventdev_port_unlink,
                .port_unlinks_in_progress =
                                    dlb_eventdev_port_unlinks_in_progress,
+               .timeout_ticks    = dlb_eventdev_timeout_ticks,
                .dump             = dlb_eventdev_dump,
                .xstats_get       = dlb_eventdev_xstats_get,
                .xstats_get_names = dlb_eventdev_xstats_get_names,
                .xstats_get_by_name = dlb_eventdev_xstats_get_by_name,
                .xstats_reset       = dlb_eventdev_xstats_reset,
+               .dev_selftest     = test_dlb_eventdev,
        };
 
        /* Expose PMD's eventdev interface */
@@ -3687,7 +3898,7 @@ dlb_primary_eventdev_probe(struct rte_eventdev *dev,
                           struct dlb_devargs *dlb_args)
 {
        struct dlb_eventdev *dlb;
-       int err;
+       int err, i;
 
        dlb = dev->data->dev_private;
 
@@ -3736,6 +3947,10 @@ dlb_primary_eventdev_probe(struct rte_eventdev *dev,
                return err;
        }
 
+       /* Initialize each port's token pop mode */
+       for (i = 0; i < DLB_MAX_NUM_PORTS; i++)
+               dlb->ev_ports[i].qm_port.token_pop_mode = AUTO_POP;
+
        rte_spinlock_init(&dlb->qm_instance.resource_lock);
 
        dlb_iface_low_level_io_init(dlb);