net/ice: fix flow redirect
[dpdk.git] / drivers / event / octeontx2 / otx2_tim_evdev.c
index c668e26..6da8b14 100644 (file)
@@ -9,7 +9,7 @@
 #include "otx2_evdev.h"
 #include "otx2_tim_evdev.h"
 
-static struct rte_event_timer_adapter_ops otx2_tim_ops;
+static struct event_timer_adapter_ops otx2_tim_ops;
 
 static inline int
 tim_get_msix_offsets(void)
@@ -34,25 +34,26 @@ tim_set_fp_ops(struct otx2_tim_ring *tim_ring)
 {
        uint8_t prod_flag = !tim_ring->prod_type_sp;
 
-       /* [MOD/AND] [DFB/FB] [SP][MP]*/
+       /* [DFB/FB] [SP][MP]*/
        const rte_event_timer_arm_burst_t arm_burst[2][2][2] = {
-#define FP(_name,  _f3, _f2, _f1, flags) \
-               [_f3][_f2][_f1] = otx2_tim_arm_burst_ ## _name,
-TIM_ARM_FASTPATH_MODES
+#define FP(_name, _f3, _f2, _f1, flags)                                        \
+       [_f3][_f2][_f1] = otx2_tim_arm_burst_##_name,
+               TIM_ARM_FASTPATH_MODES
 #undef FP
        };
 
        const rte_event_timer_arm_tmo_tick_burst_t arm_tmo_burst[2][2] = {
-#define FP(_name, _f2, _f1, flags) \
-               [_f2][_f1] = otx2_tim_arm_tmo_tick_burst_ ## _name,
-TIM_ARM_TMO_FASTPATH_MODES
+#define FP(_name, _f2, _f1, flags)                                             \
+       [_f2][_f1] = otx2_tim_arm_tmo_tick_burst_##_name,
+               TIM_ARM_TMO_FASTPATH_MODES
 #undef FP
        };
 
-       otx2_tim_ops.arm_burst = arm_burst[tim_ring->optimized]
-                               [tim_ring->ena_dfb][prod_flag];
-       otx2_tim_ops.arm_tmo_tick_burst = arm_tmo_burst[tim_ring->optimized]
-                               [tim_ring->ena_dfb];
+       otx2_tim_ops.arm_burst =
+               arm_burst[tim_ring->enable_stats][tim_ring->ena_dfb][prod_flag];
+       otx2_tim_ops.arm_tmo_tick_burst =
+               arm_tmo_burst[tim_ring->enable_stats][tim_ring->ena_dfb];
+       otx2_tim_ops.cancel_burst = otx2_tim_timer_cancel_burst;
 }
 
 static void
@@ -62,56 +63,12 @@ otx2_tim_ring_info_get(const struct rte_event_timer_adapter *adptr,
        struct otx2_tim_ring *tim_ring = adptr->data->adapter_priv;
 
        adptr_info->max_tmo_ns = tim_ring->max_tout;
-       adptr_info->min_resolution_ns = tim_ring->tck_nsec;
+       adptr_info->min_resolution_ns = tim_ring->ena_periodic ?
+               tim_ring->max_tout : tim_ring->tck_nsec;
        rte_memcpy(&adptr_info->conf, &adptr->data->conf,
                   sizeof(struct rte_event_timer_adapter_conf));
 }
 
-static void
-tim_optimze_bkt_param(struct otx2_tim_ring *tim_ring)
-{
-       uint64_t tck_nsec;
-       uint32_t hbkts;
-       uint32_t lbkts;
-
-       hbkts = rte_align32pow2(tim_ring->nb_bkts);
-       tck_nsec = RTE_ALIGN_MUL_CEIL(tim_ring->max_tout / (hbkts - 1), 10);
-
-       if ((tck_nsec < TICK2NSEC(OTX2_TIM_MIN_TMO_TKS,
-                                 tim_ring->tenns_clk_freq) ||
-           hbkts > OTX2_TIM_MAX_BUCKETS))
-               hbkts = 0;
-
-       lbkts = rte_align32prevpow2(tim_ring->nb_bkts);
-       tck_nsec = RTE_ALIGN_MUL_CEIL((tim_ring->max_tout / (lbkts - 1)), 10);
-
-       if ((tck_nsec < TICK2NSEC(OTX2_TIM_MIN_TMO_TKS,
-                                 tim_ring->tenns_clk_freq) ||
-           lbkts > OTX2_TIM_MAX_BUCKETS))
-               lbkts = 0;
-
-       if (!hbkts && !lbkts)
-               return;
-
-       if (!hbkts) {
-               tim_ring->nb_bkts = lbkts;
-               goto end;
-       } else if (!lbkts) {
-               tim_ring->nb_bkts = hbkts;
-               goto end;
-       }
-
-       tim_ring->nb_bkts = (hbkts - tim_ring->nb_bkts) <
-               (tim_ring->nb_bkts - lbkts) ? hbkts : lbkts;
-end:
-       tim_ring->optimized = true;
-       tim_ring->tck_nsec = RTE_ALIGN_MUL_CEIL((tim_ring->max_tout /
-                                               (tim_ring->nb_bkts - 1)), 10);
-       otx2_tim_dbg("Optimized configured values");
-       otx2_tim_dbg("Nb_bkts  : %" PRIu32 "", tim_ring->nb_bkts);
-       otx2_tim_dbg("Tck_nsec : %" PRIu64 "", tim_ring->tck_nsec);
-}
-
 static int
 tim_chnk_pool_create(struct otx2_tim_ring *tim_ring,
                     struct rte_event_timer_adapter_conf *rcfg)
@@ -121,9 +78,10 @@ tim_chnk_pool_create(struct otx2_tim_ring *tim_ring,
        char pool_name[25];
        int rc;
 
+       cache_sz /= rte_lcore_count();
        /* Create chunk pool. */
        if (rcfg->flags & RTE_EVENT_TIMER_ADAPTER_F_SP_PUT) {
-               mp_flags = MEMPOOL_F_SP_PUT | MEMPOOL_F_SC_GET;
+               mp_flags = RTE_MEMPOOL_F_SP_PUT | RTE_MEMPOOL_F_SC_GET;
                otx2_tim_dbg("Using single producer mode");
                tim_ring->prod_type_sp = true;
        }
@@ -134,11 +92,12 @@ tim_chnk_pool_create(struct otx2_tim_ring *tim_ring,
        if (cache_sz > RTE_MEMPOOL_CACHE_MAX_SIZE)
                cache_sz = RTE_MEMPOOL_CACHE_MAX_SIZE;
 
+       cache_sz = cache_sz != 0 ? cache_sz : 2;
+       tim_ring->nb_chunks += (cache_sz * rte_lcore_count());
        if (!tim_ring->disable_npa) {
-               /* NPA need not have cache as free is not visible to SW */
                tim_ring->chunk_pool = rte_mempool_create_empty(pool_name,
                                tim_ring->nb_chunks, tim_ring->chunk_sz,
-                               0, 0, rte_socket_id(), mp_flags);
+                               cache_sz, 0, rte_socket_id(), mp_flags);
 
                if (tim_ring->chunk_pool == NULL) {
                        otx2_err("Unable to create chunkpool.");
@@ -160,7 +119,7 @@ tim_chnk_pool_create(struct otx2_tim_ring *tim_ring,
                }
                tim_ring->aura = npa_lf_aura_handle_to_aura(
                                tim_ring->chunk_pool->pool_id);
-               tim_ring->ena_dfb = 0;
+               tim_ring->ena_dfb = tim_ring->ena_periodic ? 1 : 0;
        } else {
                tim_ring->chunk_pool = rte_mempool_create(pool_name,
                                tim_ring->nb_chunks, tim_ring->chunk_sz,
@@ -251,8 +210,8 @@ otx2_tim_ring_create(struct rte_event_timer_adapter *adptr)
        struct tim_ring_req *free_req;
        struct tim_lf_alloc_req *req;
        struct tim_lf_alloc_rsp *rsp;
-       uint64_t nb_timers;
-       int rc;
+       uint8_t is_periodic;
+       int i, rc;
 
        if (dev == NULL)
                return -ENODEV;
@@ -282,6 +241,20 @@ otx2_tim_ring_create(struct rte_event_timer_adapter *adptr)
                }
        }
 
+       is_periodic = 0;
+       if (rcfg->flags & RTE_EVENT_TIMER_ADAPTER_F_PERIODIC) {
+               if (rcfg->max_tmo_ns &&
+                   rcfg->max_tmo_ns != rcfg->timer_tick_ns) {
+                       rc = -ERANGE;
+                       goto rng_mem_err;
+               }
+
+               /* Use 2 buckets to avoid contention */
+               rcfg->max_tmo_ns = rcfg->timer_tick_ns;
+               rcfg->timer_tick_ns /= 2;
+               is_periodic = 1;
+       }
+
        tim_ring = rte_zmalloc("otx2_tim_prv", sizeof(struct otx2_tim_ring), 0);
        if (tim_ring == NULL) {
                rc =  -ENOMEM;
@@ -294,26 +267,36 @@ otx2_tim_ring_create(struct rte_event_timer_adapter *adptr)
        tim_ring->clk_src = (int)rcfg->clk_src;
        tim_ring->ring_id = adptr->data->id;
        tim_ring->tck_nsec = RTE_ALIGN_MUL_CEIL(rcfg->timer_tick_ns, 10);
-       tim_ring->max_tout = rcfg->max_tmo_ns;
+       tim_ring->max_tout = is_periodic ?
+               rcfg->timer_tick_ns * 2 : rcfg->max_tmo_ns;
        tim_ring->nb_bkts = (tim_ring->max_tout / tim_ring->tck_nsec);
        tim_ring->chunk_sz = dev->chunk_sz;
-       nb_timers = rcfg->nb_timers;
+       tim_ring->nb_timers = rcfg->nb_timers;
        tim_ring->disable_npa = dev->disable_npa;
-
-       tim_ring->nb_chunks = nb_timers / OTX2_TIM_NB_CHUNK_SLOTS(
-                                                       tim_ring->chunk_sz);
-       tim_ring->nb_chunk_slots = OTX2_TIM_NB_CHUNK_SLOTS(tim_ring->chunk_sz);
-
-       /* Try to optimize the bucket parameters. */
-       if ((rcfg->flags & RTE_EVENT_TIMER_ADAPTER_F_ADJUST_RES)) {
-               if (rte_is_power_of_2(tim_ring->nb_bkts))
-                       tim_ring->optimized = true;
-               else
-                       tim_optimze_bkt_param(tim_ring);
+       tim_ring->ena_periodic = is_periodic;
+       tim_ring->enable_stats = dev->enable_stats;
+
+       for (i = 0; i < dev->ring_ctl_cnt ; i++) {
+               struct otx2_tim_ctl *ring_ctl = &dev->ring_ctl_data[i];
+
+               if (ring_ctl->ring == tim_ring->ring_id) {
+                       tim_ring->chunk_sz = ring_ctl->chunk_slots ?
+                               ((uint32_t)(ring_ctl->chunk_slots + 1) *
+                                OTX2_TIM_CHUNK_ALIGNMENT) : tim_ring->chunk_sz;
+                       tim_ring->enable_stats = ring_ctl->enable_stats;
+                       tim_ring->disable_npa = ring_ctl->disable_npa;
+               }
        }
 
-       tim_ring->nb_chunks = tim_ring->nb_chunks * tim_ring->nb_bkts;
-       /* Create buckets. */
+       if (tim_ring->disable_npa) {
+               tim_ring->nb_chunks =
+                       tim_ring->nb_timers /
+                       OTX2_TIM_NB_CHUNK_SLOTS(tim_ring->chunk_sz);
+               tim_ring->nb_chunks = tim_ring->nb_chunks * tim_ring->nb_bkts;
+       } else {
+               tim_ring->nb_chunks = tim_ring->nb_timers;
+       }
+       tim_ring->nb_chunk_slots = OTX2_TIM_NB_CHUNK_SLOTS(tim_ring->chunk_sz);
        tim_ring->bkt = rte_zmalloc("otx2_tim_bucket", (tim_ring->nb_bkts) *
                                    sizeof(struct otx2_tim_bkt),
                                    RTE_CACHE_LINE_SIZE);
@@ -329,7 +312,7 @@ otx2_tim_ring_create(struct rte_event_timer_adapter *adptr)
        cfg_req->ring = tim_ring->ring_id;
        cfg_req->bigendian = false;
        cfg_req->clocksource = tim_ring->clk_src;
-       cfg_req->enableperiodic = false;
+       cfg_req->enableperiodic = tim_ring->ena_periodic;
        cfg_req->enabledontfreebuffer = tim_ring->ena_dfb;
        cfg_req->bucketsize = tim_ring->nb_bkts;
        cfg_req->chunksize = tim_ring->chunk_sz;
@@ -357,10 +340,15 @@ otx2_tim_ring_create(struct rte_event_timer_adapter *adptr)
        tim_set_fp_ops(tim_ring);
 
        /* Update SSO xae count. */
-       sso_updt_xae_cnt(sso_pmd_priv(dev->event_dev), (void *)&nb_timers,
+       sso_updt_xae_cnt(sso_pmd_priv(dev->event_dev), (void *)tim_ring,
                         RTE_EVENT_TYPE_TIMER);
        sso_xae_reconfigure(dev->event_dev);
 
+       otx2_tim_dbg("Total memory used %"PRIu64"MB\n",
+                       (uint64_t)(((tim_ring->nb_chunks * tim_ring->chunk_sz)
+                       + (tim_ring->nb_bkts * sizeof(struct otx2_tim_bkt))) /
+                       BIT_ULL(20)));
+
        return rc;
 
 chnk_mem_err:
@@ -374,6 +362,86 @@ rng_mem_err:
        return rc;
 }
 
+static void
+otx2_tim_calibrate_start_tsc(struct otx2_tim_ring *tim_ring)
+{
+#define OTX2_TIM_CALIB_ITER    1E6
+       uint32_t real_bkt, bucket;
+       int icount, ecount = 0;
+       uint64_t bkt_cyc;
+
+       for (icount = 0; icount < OTX2_TIM_CALIB_ITER; icount++) {
+               real_bkt = otx2_read64(tim_ring->base + TIM_LF_RING_REL) >> 44;
+               bkt_cyc = tim_cntvct();
+               bucket = (bkt_cyc - tim_ring->ring_start_cyc) /
+                                                       tim_ring->tck_int;
+               bucket = bucket % (tim_ring->nb_bkts);
+               tim_ring->ring_start_cyc = bkt_cyc - (real_bkt *
+                                                       tim_ring->tck_int);
+               if (bucket != real_bkt)
+                       ecount++;
+       }
+       tim_ring->last_updt_cyc = bkt_cyc;
+       otx2_tim_dbg("Bucket mispredict %3.2f distance %d\n",
+                    100 - (((double)(icount - ecount) / (double)icount) * 100),
+                    bucket - real_bkt);
+}
+
+static int
+otx2_tim_ring_start(const struct rte_event_timer_adapter *adptr)
+{
+       struct otx2_tim_ring *tim_ring = adptr->data->adapter_priv;
+       struct otx2_tim_evdev *dev = tim_priv_get();
+       struct tim_enable_rsp *rsp;
+       struct tim_ring_req *req;
+       int rc;
+
+       if (dev == NULL)
+               return -ENODEV;
+
+       req = otx2_mbox_alloc_msg_tim_enable_ring(dev->mbox);
+       req->ring = tim_ring->ring_id;
+
+       rc = otx2_mbox_process_msg(dev->mbox, (void **)&rsp);
+       if (rc < 0) {
+               tim_err_desc(rc);
+               goto fail;
+       }
+       tim_ring->ring_start_cyc = rsp->timestarted;
+       tim_ring->tck_int = NSEC2TICK(tim_ring->tck_nsec, tim_cntfrq());
+       tim_ring->tot_int = tim_ring->tck_int * tim_ring->nb_bkts;
+       tim_ring->fast_div = rte_reciprocal_value_u64(tim_ring->tck_int);
+       tim_ring->fast_bkt = rte_reciprocal_value_u64(tim_ring->nb_bkts);
+
+       otx2_tim_calibrate_start_tsc(tim_ring);
+
+fail:
+       return rc;
+}
+
+static int
+otx2_tim_ring_stop(const struct rte_event_timer_adapter *adptr)
+{
+       struct otx2_tim_ring *tim_ring = adptr->data->adapter_priv;
+       struct otx2_tim_evdev *dev = tim_priv_get();
+       struct tim_ring_req *req;
+       int rc;
+
+       if (dev == NULL)
+               return -ENODEV;
+
+       req = otx2_mbox_alloc_msg_tim_disable_ring(dev->mbox);
+       req->ring = tim_ring->ring_id;
+
+       rc = otx2_mbox_process(dev->mbox);
+       if (rc < 0) {
+               tim_err_desc(rc);
+               rc = -EBUSY;
+       }
+
+       return rc;
+}
+
 static int
 otx2_tim_ring_free(struct rte_event_timer_adapter *adptr)
 {
@@ -403,24 +471,56 @@ otx2_tim_ring_free(struct rte_event_timer_adapter *adptr)
        return 0;
 }
 
+static int
+otx2_tim_stats_get(const struct rte_event_timer_adapter *adapter,
+                  struct rte_event_timer_adapter_stats *stats)
+{
+       struct otx2_tim_ring *tim_ring = adapter->data->adapter_priv;
+       uint64_t bkt_cyc = tim_cntvct() - tim_ring->ring_start_cyc;
+
+       stats->evtim_exp_count = __atomic_load_n(&tim_ring->arm_cnt,
+                                                __ATOMIC_RELAXED);
+       stats->ev_enq_count = stats->evtim_exp_count;
+       stats->adapter_tick_count = rte_reciprocal_divide_u64(bkt_cyc,
+                               &tim_ring->fast_div);
+       return 0;
+}
+
+static int
+otx2_tim_stats_reset(const struct rte_event_timer_adapter *adapter)
+{
+       struct otx2_tim_ring *tim_ring = adapter->data->adapter_priv;
+
+       __atomic_store_n(&tim_ring->arm_cnt, 0, __ATOMIC_RELAXED);
+       return 0;
+}
+
 int
 otx2_tim_caps_get(const struct rte_eventdev *evdev, uint64_t flags,
-                 uint32_t *caps,
-                 const struct rte_event_timer_adapter_ops **ops)
+                 uint32_t *caps, const struct event_timer_adapter_ops **ops)
 {
        struct otx2_tim_evdev *dev = tim_priv_get();
 
        RTE_SET_USED(flags);
+
        if (dev == NULL)
                return -ENODEV;
 
        otx2_tim_ops.init = otx2_tim_ring_create;
        otx2_tim_ops.uninit = otx2_tim_ring_free;
+       otx2_tim_ops.start = otx2_tim_ring_start;
+       otx2_tim_ops.stop = otx2_tim_ring_stop;
        otx2_tim_ops.get_info   = otx2_tim_ring_info_get;
 
+       if (dev->enable_stats) {
+               otx2_tim_ops.stats_get   = otx2_tim_stats_get;
+               otx2_tim_ops.stats_reset = otx2_tim_stats_reset;
+       }
+
        /* Store evdev pointer for later use. */
        dev->event_dev = (struct rte_eventdev *)(uintptr_t)evdev;
-       *caps = RTE_EVENT_TIMER_ADAPTER_CAP_INTERNAL_PORT;
+       *caps = RTE_EVENT_TIMER_ADAPTER_CAP_INTERNAL_PORT |
+               RTE_EVENT_TIMER_ADAPTER_CAP_PERIODIC;
        *ops = &otx2_tim_ops;
 
        return 0;
@@ -428,6 +528,88 @@ otx2_tim_caps_get(const struct rte_eventdev *evdev, uint64_t flags,
 
 #define OTX2_TIM_DISABLE_NPA   "tim_disable_npa"
 #define OTX2_TIM_CHNK_SLOTS    "tim_chnk_slots"
+#define OTX2_TIM_STATS_ENA     "tim_stats_ena"
+#define OTX2_TIM_RINGS_LMT     "tim_rings_lmt"
+#define OTX2_TIM_RING_CTL      "tim_ring_ctl"
+
+static void
+tim_parse_ring_param(char *value, void *opaque)
+{
+       struct otx2_tim_evdev *dev = opaque;
+       struct otx2_tim_ctl ring_ctl = {0};
+       char *tok = strtok(value, "-");
+       struct otx2_tim_ctl *old_ptr;
+       uint16_t *val;
+
+       val = (uint16_t *)&ring_ctl;
+
+       if (!strlen(value))
+               return;
+
+       while (tok != NULL) {
+               *val = atoi(tok);
+               tok = strtok(NULL, "-");
+               val++;
+       }
+
+       if (val != (&ring_ctl.enable_stats + 1)) {
+               otx2_err(
+               "Invalid ring param expected [ring-chunk_sz-disable_npa-enable_stats]");
+               return;
+       }
+
+       dev->ring_ctl_cnt++;
+       old_ptr = dev->ring_ctl_data;
+       dev->ring_ctl_data = rte_realloc(dev->ring_ctl_data,
+                                        sizeof(struct otx2_tim_ctl) *
+                                        dev->ring_ctl_cnt, 0);
+       if (dev->ring_ctl_data == NULL) {
+               dev->ring_ctl_data = old_ptr;
+               dev->ring_ctl_cnt--;
+               return;
+       }
+
+       dev->ring_ctl_data[dev->ring_ctl_cnt - 1] = ring_ctl;
+}
+
+static void
+tim_parse_ring_ctl_list(const char *value, void *opaque)
+{
+       char *s = strdup(value);
+       char *start = NULL;
+       char *end = NULL;
+       char *f = s;
+
+       while (*s) {
+               if (*s == '[')
+                       start = s;
+               else if (*s == ']')
+                       end = s;
+
+               if (start && start < end) {
+                       *end = 0;
+                       tim_parse_ring_param(start + 1, opaque);
+                       start = end;
+                       s = end;
+               }
+               s++;
+       }
+
+       free(f);
+}
+
+static int
+tim_parse_kvargs_dict(const char *key, const char *value, void *opaque)
+{
+       RTE_SET_USED(key);
+
+       /* Dict format [ring-chunk_sz-disable_npa-enable_stats] use '-' as ','
+        * isn't allowed. 0 represents default.
+        */
+       tim_parse_ring_ctl_list(value, opaque);
+
+       return 0;
+}
 
 static void
 tim_parse_devargs(struct rte_devargs *devargs, struct otx2_tim_evdev *dev)
@@ -445,6 +627,14 @@ tim_parse_devargs(struct rte_devargs *devargs, struct otx2_tim_evdev *dev)
                           &parse_kvargs_flag, &dev->disable_npa);
        rte_kvargs_process(kvlist, OTX2_TIM_CHNK_SLOTS,
                           &parse_kvargs_value, &dev->chunk_slots);
+       rte_kvargs_process(kvlist, OTX2_TIM_STATS_ENA, &parse_kvargs_flag,
+                          &dev->enable_stats);
+       rte_kvargs_process(kvlist, OTX2_TIM_RINGS_LMT, &parse_kvargs_value,
+                          &dev->min_ring_cnt);
+       rte_kvargs_process(kvlist, OTX2_TIM_RING_CTL,
+                          &tim_parse_kvargs_dict, &dev);
+
+       rte_kvargs_free(kvlist);
 }
 
 void
@@ -482,7 +672,8 @@ otx2_tim_init(struct rte_pci_device *pci_dev, struct otx2_dev *cmn_dev)
                goto mz_free;
        }
 
-       dev->nb_rings = rsrc_cnt->tim;
+       dev->nb_rings = dev->min_ring_cnt ?
+               RTE_MIN(dev->min_ring_cnt, rsrc_cnt->tim) : rsrc_cnt->tim;
 
        if (!dev->nb_rings) {
                otx2_tim_dbg("No TIM Logical functions provisioned.");