event/cnxk: add external clock support for timer
[dpdk.git] / drivers / event / cnxk / cnxk_tim_evdev.c
index 62a15a4..5d52a39 100644 (file)
@@ -2,10 +2,12 @@
  * Copyright(C) 2021 Marvell.
  */
 
+#include <math.h>
+
 #include "cnxk_eventdev.h"
 #include "cnxk_tim_evdev.h"
 
-static struct rte_event_timer_adapter_ops cnxk_tim_ops;
+static struct event_timer_adapter_ops cnxk_tim_ops;
 
 static int
 cnxk_tim_chnk_pool_create(struct cnxk_tim_ring *tim_ring,
@@ -19,7 +21,7 @@ cnxk_tim_chnk_pool_create(struct cnxk_tim_ring *tim_ring,
        cache_sz /= rte_lcore_count();
        /* Create chunk pool. */
        if (rcfg->flags & RTE_EVENT_TIMER_ADAPTER_F_SP_PUT) {
-               mp_flags = MEMPOOL_F_SP_PUT | MEMPOOL_F_SC_GET;
+               mp_flags = RTE_MEMPOOL_F_SP_PUT | RTE_MEMPOOL_F_SC_GET;
                plt_tim_dbg("Using single producer mode");
                tim_ring->prod_type_sp = true;
        }
@@ -27,8 +29,8 @@ cnxk_tim_chnk_pool_create(struct cnxk_tim_ring *tim_ring,
        snprintf(pool_name, sizeof(pool_name), "cnxk_tim_chunk_pool%d",
                 tim_ring->ring_id);
 
-       if (cache_sz > RTE_MEMPOOL_CACHE_MAX_SIZE)
-               cache_sz = RTE_MEMPOOL_CACHE_MAX_SIZE;
+       if (cache_sz > CNXK_TIM_MAX_POOL_CACHE_SZ)
+               cache_sz = CNXK_TIM_MAX_POOL_CACHE_SZ;
        cache_sz = cache_sz != 0 ? cache_sz : 2;
        tim_ring->nb_chunks += (cache_sz * rte_lcore_count());
        if (!tim_ring->disable_npa) {
@@ -81,21 +83,25 @@ cnxk_tim_set_fp_ops(struct cnxk_tim_ring *tim_ring)
 {
        uint8_t prod_flag = !tim_ring->prod_type_sp;
 
-       /* [DFB/FB] [SP][MP]*/
-       const rte_event_timer_arm_burst_t arm_burst[2][2] = {
-#define FP(_name, _f2, _f1, flags) [_f2][_f1] = cnxk_tim_arm_burst_##_name,
+       /* [STATS] [DFB/FB] [SP][MP]*/
+       const rte_event_timer_arm_burst_t arm_burst[2][2][2] = {
+#define FP(_name, _f3, _f2, _f1, flags)                                        \
+       [_f3][_f2][_f1] = cnxk_tim_arm_burst_##_name,
                TIM_ARM_FASTPATH_MODES
 #undef FP
        };
 
-       const rte_event_timer_arm_tmo_tick_burst_t arm_tmo_burst[2] = {
-#define FP(_name, _f1, flags) [_f1] = cnxk_tim_arm_tmo_tick_burst_##_name,
+       const rte_event_timer_arm_tmo_tick_burst_t arm_tmo_burst[2][2] = {
+#define FP(_name, _f2, _f1, flags)                                             \
+       [_f2][_f1] = cnxk_tim_arm_tmo_tick_burst_##_name,
                TIM_ARM_TMO_FASTPATH_MODES
 #undef FP
        };
 
-       cnxk_tim_ops.arm_burst = arm_burst[tim_ring->ena_dfb][prod_flag];
-       cnxk_tim_ops.arm_tmo_tick_burst = arm_tmo_burst[tim_ring->ena_dfb];
+       cnxk_tim_ops.arm_burst =
+               arm_burst[tim_ring->enable_stats][tim_ring->ena_dfb][prod_flag];
+       cnxk_tim_ops.arm_tmo_tick_burst =
+               arm_tmo_burst[tim_ring->enable_stats][tim_ring->ena_dfb];
        cnxk_tim_ops.cancel_burst = cnxk_tim_timer_cancel_burst;
 }
 
@@ -111,13 +117,90 @@ cnxk_tim_ring_info_get(const struct rte_event_timer_adapter *adptr,
                   sizeof(struct rte_event_timer_adapter_conf));
 }
 
+/* Sort ref_arr[] into ascending order using adjacent swaps. Each swap is
+ * mirrored on arr1[], arr2[] and arr3[] so the four arrays stay aligned by
+ * index. After every swap the scan starts again from the first element.
+ */
+static inline void
+sort_multi_array(double ref_arr[], uint64_t arr1[], uint64_t arr2[],
+                uint64_t arr3[], uint8_t sz)
+{
+       const int last = sz - 1;
+       int idx = 0;
+
+       while (idx < last) {
+               const int nxt = idx + 1;
+
+               /* Pair already in order: move on to the next pair. */
+               if (!(ref_arr[idx] > ref_arr[nxt])) {
+                       idx = nxt;
+                       continue;
+               }
+
+               PLT_SWAP(ref_arr[idx], ref_arr[nxt]);
+               PLT_SWAP(arr1[idx], arr1[nxt]);
+               PLT_SWAP(arr2[idx], arr2[nxt]);
+               PLT_SWAP(arr3[idx], arr3[nxt]);
+
+               /* Out-of-order pair fixed: rescan from the beginning. */
+               idx = 0;
+       }
+}
+
+/* Collect sz candidate tick counts around req_tck, stepping one tick at a
+ * time forward (mov_fwd == true) or backward (mov_fwd == false).
+ *
+ * For sample i the search starts from the previous sample's tick count
+ * (req_tck for the first sample) and stops at the first tick count whose
+ * rounded duration ns[i] is an exact multiple of
+ * (uint64_t)cnxk_tim_ns_per_tck(clk_freq).
+ *
+ * tck[]  - out: candidate tick counts.
+ * ns[]   - out: round(tck[i] * tck_ns).
+ * diff[] - out: absolute difference between ns[i] and the unrounded
+ *          tck[i] * tck_ns.
+ * dst[]  - out: distance in ticks between tck[i] and req_tck.
+ *
+ * NOTE(review): the modulo divisor is a truncated helper result; if it can
+ * be 0 the loop condition divides by zero - confirm the helper's range.
+ */
+static inline void
+populate_sample(uint64_t tck[], uint64_t ns[], double diff[], uint64_t dst[],
+               uint64_t req_tck, uint64_t clk_freq, double tck_ns, uint8_t sz,
+               bool mov_fwd)
+{
+       int i;
+
+       for (i = 0; i < sz; i++) {
+               /* Continue searching from where the previous sample stopped. */
+               tck[i] = i ? tck[i - 1] : req_tck;
+               do {
+                       mov_fwd ? tck[i]++ : tck[i]--;
+                       ns[i] = round((double)tck[i] * tck_ns);
+                       /* NOTE(review): 'continue' inside do/while jumps to
+                        * the loop condition below, so this test does not
+                        * change which tick count is selected.
+                        */
+                       if (round((double)tck[i] * tck_ns) >
+                           ((double)tck[i] * tck_ns))
+                               continue;
+               } while (ns[i] % (uint64_t)cnxk_tim_ns_per_tck(clk_freq));
+               /* |ns[i] - tck[i] * tck_ns|, written as max - min. */
+               diff[i] = PLT_MAX((double)ns[i], (double)tck[i] * tck_ns) -
+                         PLT_MIN((double)ns[i], (double)tck[i] * tck_ns);
+               dst[i] = mov_fwd ? tck[i] - req_tck : req_tck - tck[i];
+       }
+}
+
+/* Replace *req_tck / *req_ns with a nearby candidate from populate_sample().
+ *
+ * MAX_SAMPLES candidates are gathered above and below *req_tck, and each set
+ * is ordered by ascending rounding error with sort_multi_array(). Walking
+ * both sets in that order, the i-th lower candidate is taken when it is
+ * closer to the request than the i-th upper one, its tick count exceeds
+ * m_tck and max_tmo / min_ns[i] is at most
+ * TIM_MAX_BUCKET_SIZE - TIM_MIN_BUCKET_SIZE; otherwise the i-th upper
+ * candidate is taken when max_tmo / max_ns[i] is below that limit.
+ * If no candidate qualifies, *req_tck and *req_ns are left unchanged.
+ *
+ * req_ns   - in/out: tick duration in nanoseconds.
+ * req_tck  - in/out: tick duration in clock cycles.
+ * tck_ns   - nanoseconds per clock cycle used for the conversion.
+ * clk_freq - clock frequency, forwarded to populate_sample().
+ * max_tmo  - maximum timeout in nanoseconds.
+ * m_tck    - lower bound (exclusive) for an accepted lower candidate.
+ *
+ * NOTE(review): min_ns[i] / max_ns[i] are used as divisors without a zero
+ * check - confirm they cannot be 0 for valid inputs.
+ */
+static void
+tim_adjust_resolution(uint64_t *req_ns, uint64_t *req_tck, double tck_ns,
+                     uint64_t clk_freq, uint64_t max_tmo, uint64_t m_tck)
+{
+/* Defined inside the function body but, being a macro, stays defined for the
+ * rest of the translation unit.
+ */
+#define MAX_SAMPLES 5
+       double rmax_diff[MAX_SAMPLES], rmin_diff[MAX_SAMPLES];
+       uint64_t min_tck[MAX_SAMPLES], max_tck[MAX_SAMPLES];
+       uint64_t min_dst[MAX_SAMPLES], max_dst[MAX_SAMPLES];
+       uint64_t min_ns[MAX_SAMPLES], max_ns[MAX_SAMPLES];
+       int i;
+
+       /* Candidates above the request, best rounding error first. */
+       populate_sample(max_tck, max_ns, rmax_diff, max_dst, *req_tck, clk_freq,
+                       tck_ns, MAX_SAMPLES, true);
+       sort_multi_array(rmax_diff, max_dst, max_tck, max_ns, MAX_SAMPLES);
+
+       /* Candidates below the request, best rounding error first. */
+       populate_sample(min_tck, min_ns, rmin_diff, min_dst, *req_tck, clk_freq,
+                       tck_ns, MAX_SAMPLES, false);
+       sort_multi_array(rmin_diff, min_dst, min_tck, min_ns, MAX_SAMPLES);
+
+       for (i = 0; i < MAX_SAMPLES; i++) {
+               if (min_dst[i] < max_dst[i] && min_tck[i] > m_tck &&
+                   (max_tmo / min_ns[i]) <=
+                           (TIM_MAX_BUCKET_SIZE - TIM_MIN_BUCKET_SIZE)) {
+                       *req_tck = min_tck[i];
+                       *req_ns = min_ns[i];
+                       break;
+               } else if ((max_tmo / max_ns[i]) <
+                          (TIM_MAX_BUCKET_SIZE - TIM_MIN_BUCKET_SIZE)) {
+                       *req_tck = max_tck[i];
+                       *req_ns = max_ns[i];
+                       break;
+               }
+       }
+}
+
 static int
 cnxk_tim_ring_create(struct rte_event_timer_adapter *adptr)
 {
        struct rte_event_timer_adapter_conf *rcfg = &adptr->data->conf;
        struct cnxk_tim_evdev *dev = cnxk_tim_priv_get();
+       uint64_t min_intvl_ns, min_intvl_cyc;
        struct cnxk_tim_ring *tim_ring;
-       int rc;
+       enum roc_tim_clk_src clk_src;
+       uint64_t clk_freq = 0;
+       int i, rc;
 
        if (dev == NULL)
                return -ENODEV;
@@ -135,30 +218,87 @@ cnxk_tim_ring_create(struct rte_event_timer_adapter *adptr)
                goto tim_ring_free;
        }
 
-       if (NSEC2TICK(RTE_ALIGN_MUL_CEIL(
-                             rcfg->timer_tick_ns,
-                             cnxk_tim_min_resolution_ns(cnxk_tim_cntfrq())),
-                     cnxk_tim_cntfrq()) <
-           cnxk_tim_min_tmo_ticks(cnxk_tim_cntfrq())) {
-               if (rcfg->flags & RTE_EVENT_TIMER_ADAPTER_F_ADJUST_RES)
-                       rcfg->timer_tick_ns = TICK2NSEC(
-                               cnxk_tim_min_tmo_ticks(cnxk_tim_cntfrq()),
-                               cnxk_tim_cntfrq());
-               else {
+       clk_src = cnxk_tim_convert_clk_src(rcfg->clk_src);
+       if (clk_src == ROC_TIM_CLK_SRC_INVALID) {
+               plt_err("Invalid clock source");
+               goto tim_hw_free;
+       }
+
+       rc = cnxk_tim_get_clk_freq(dev, clk_src, &clk_freq);
+       if (rc < 0) {
+               plt_err("Failed to get clock frequency");
+               goto tim_hw_free;
+       }
+
+       rc = roc_tim_lf_interval(&dev->tim, clk_src, clk_freq, &min_intvl_ns,
+                                &min_intvl_cyc);
+       if (rc < 0) {
+               plt_err("Failed to get min interval details");
+               goto tim_hw_free;
+       }
+
+       if (rcfg->timer_tick_ns < min_intvl_ns) {
+               if (rcfg->flags & RTE_EVENT_TIMER_ADAPTER_F_ADJUST_RES) {
+                       rcfg->timer_tick_ns = min_intvl_ns;
+               } else {
                        rc = -ERANGE;
                        goto tim_hw_free;
                }
        }
+
+       if (rcfg->timer_tick_ns > rcfg->max_tmo_ns) {
+               plt_err("Max timeout to too high");
+               rc = -ERANGE;
+               goto tim_hw_free;
+       }
+
+       tim_ring->tck_nsec =
+               round(RTE_ALIGN_MUL_NEAR((long double)rcfg->timer_tick_ns,
+                                        cnxk_tim_ns_per_tck(clk_freq)));
+       if (log10(clk_freq) - floor(log10(clk_freq)) != 0.0) {
+               uint64_t req_ns, req_tck;
+               double tck_ns;
+
+               req_ns = tim_ring->tck_nsec;
+               tck_ns = NSECPERSEC / clk_freq;
+               req_tck = round(rcfg->timer_tick_ns / tck_ns);
+               tim_adjust_resolution(&req_ns, &req_tck, tck_ns, clk_freq,
+                                     rcfg->max_tmo_ns, min_intvl_cyc);
+               if ((tim_ring->tck_nsec != req_ns) &&
+                   !(rcfg->flags & RTE_EVENT_TIMER_ADAPTER_F_ADJUST_RES)) {
+                       rc = -ERANGE;
+                       goto tim_hw_free;
+               }
+               tim_ring->tck_nsec = ceil(req_tck * tck_ns);
+       }
+
+       tim_ring->tck_int = round((long double)tim_ring->tck_nsec /
+                                 cnxk_tim_ns_per_tck(clk_freq));
+       tim_ring->tck_nsec =
+               ceil(tim_ring->tck_int * cnxk_tim_ns_per_tck(clk_freq));
+
        tim_ring->ring_id = adptr->data->id;
-       tim_ring->clk_src = (int)rcfg->clk_src;
-       tim_ring->tck_nsec = RTE_ALIGN_MUL_CEIL(
-               rcfg->timer_tick_ns,
-               cnxk_tim_min_resolution_ns(cnxk_tim_cntfrq()));
+       tim_ring->clk_src = clk_src;
        tim_ring->max_tout = rcfg->max_tmo_ns;
        tim_ring->nb_bkts = (tim_ring->max_tout / tim_ring->tck_nsec);
        tim_ring->nb_timers = rcfg->nb_timers;
        tim_ring->chunk_sz = dev->chunk_sz;
        tim_ring->disable_npa = dev->disable_npa;
+       tim_ring->enable_stats = dev->enable_stats;
+
+       for (i = 0; i < dev->ring_ctl_cnt; i++) {
+               struct cnxk_tim_ctl *ring_ctl = &dev->ring_ctl_data[i];
+
+               if (ring_ctl->ring == tim_ring->ring_id) {
+                       tim_ring->chunk_sz =
+                               ring_ctl->chunk_slots ?
+                                       ((uint32_t)(ring_ctl->chunk_slots + 1) *
+                                        CNXK_TIM_CHUNK_ALIGNMENT) :
+                                             tim_ring->chunk_sz;
+                       tim_ring->enable_stats = ring_ctl->enable_stats;
+                       tim_ring->disable_npa = ring_ctl->disable_npa;
+               }
+       }
 
        if (tim_ring->disable_npa) {
                tim_ring->nb_chunks =
@@ -182,11 +322,9 @@ cnxk_tim_ring_create(struct rte_event_timer_adapter *adptr)
        if (rc < 0)
                goto tim_bkt_free;
 
-       rc = roc_tim_lf_config(
-               &dev->tim, tim_ring->ring_id,
-               cnxk_tim_convert_clk_src(tim_ring->clk_src), 0, 0,
-               tim_ring->nb_bkts, tim_ring->chunk_sz,
-               NSEC2TICK(tim_ring->tck_nsec, cnxk_tim_cntfrq()));
+       rc = roc_tim_lf_config(&dev->tim, tim_ring->ring_id, clk_src, 0, 0,
+                              tim_ring->nb_bkts, tim_ring->chunk_sz,
+                              tim_ring->tck_int, tim_ring->tck_nsec, clk_freq);
        if (rc < 0) {
                plt_err("Failed to configure timer ring");
                goto tim_chnk_free;
@@ -241,26 +379,242 @@ cnxk_tim_ring_free(struct rte_event_timer_adapter *adptr)
        return 0;
 }
 
+/* Re-base tim_ring->ring_start_cyc against the bucket index read from the
+ * TIM_LF_RING_REL register.
+ *
+ * Each iteration reads the register (bits 44 and up are taken as the bucket
+ * index), samples cnxk_tim_cntvct(), computes the bucket predicted from the
+ * current ring_start_cyc, and then rewrites ring_start_cyc so that the
+ * sampled cycle count maps onto the bucket that was read. Mismatches between
+ * the predicted and the read bucket are counted and reported through
+ * plt_tim_dbg(). The last sampled cycle count is stored in last_updt_cyc.
+ */
+static void
+cnxk_tim_calibrate_start_tsc(struct cnxk_tim_ring *tim_ring)
+{
+/* NOTE(review): 1E6 is a double constant, so the loop bound below is compared
+ * in floating point.
+ */
+#define CNXK_TIM_CALIB_ITER 1E6
+       uint32_t real_bkt, bucket;
+       int icount, ecount = 0;
+       uint64_t bkt_cyc;
+
+       for (icount = 0; icount < CNXK_TIM_CALIB_ITER; icount++) {
+               real_bkt = plt_read64(tim_ring->base + TIM_LF_RING_REL) >> 44;
+               bkt_cyc = cnxk_tim_cntvct();
+               /* Bucket predicted from the current start-cycle estimate. */
+               bucket = (bkt_cyc - tim_ring->ring_start_cyc) /
+                        tim_ring->tck_int;
+               bucket = bucket % (tim_ring->nb_bkts);
+               /* Shift the start so bkt_cyc lands on the bucket just read. */
+               tim_ring->ring_start_cyc =
+                       bkt_cyc - (real_bkt * tim_ring->tck_int);
+               if (bucket != real_bkt)
+                       ecount++;
+       }
+       tim_ring->last_updt_cyc = bkt_cyc;
+       /* NOTE(review): bucket - real_bkt is an unsigned (uint32_t) difference
+        * printed with %d.
+        */
+       plt_tim_dbg("Bucket mispredict %3.2f distance %d\n",
+                   100 - (((double)(icount - ecount) / (double)icount) * 100),
+                   bucket - real_bkt);
+}
+
+/* Adapter start callback: enable the ring through roc_tim_lf_enable(), derive
+ * the per-ring constants that depend on tck_int and nb_bkts, then calibrate
+ * the ring start cycle.
+ *
+ * Returns -ENODEV when the TIM device private data is not available, the
+ * negative value from roc_tim_lf_enable() on failure, otherwise that call's
+ * non-negative result.
+ */
+static int
+cnxk_tim_ring_start(const struct rte_event_timer_adapter *adptr)
+{
+       struct cnxk_tim_ring *tim_ring = adptr->data->adapter_priv;
+       struct cnxk_tim_evdev *dev = cnxk_tim_priv_get();
+       int rc;
+
+       if (dev == NULL)
+               return -ENODEV;
+
+       /* presumably fills ring_start_cyc with the ring's start cycle -
+        * confirm against roc_tim_lf_enable().
+        */
+       rc = roc_tim_lf_enable(&dev->tim, tim_ring->ring_id,
+                              &tim_ring->ring_start_cyc, NULL);
+       if (rc < 0)
+               return rc;
+
+       /* Total cycles covered by all buckets, plus reciprocal constants for
+        * dividing by tck_int and nb_bkts.
+        */
+       tim_ring->tot_int = tim_ring->tck_int * tim_ring->nb_bkts;
+       tim_ring->fast_div = rte_reciprocal_value_u64(tim_ring->tck_int);
+       tim_ring->fast_bkt = rte_reciprocal_value_u64(tim_ring->nb_bkts);
+
+       cnxk_tim_calibrate_start_tsc(tim_ring);
+
+       return rc;
+}
+
+/* Adapter stop callback: disable the ring through roc_tim_lf_disable().
+ *
+ * Returns -ENODEV when the TIM device private data is not available,
+ * otherwise the result of roc_tim_lf_disable(); a negative result is also
+ * logged with plt_err().
+ */
+static int
+cnxk_tim_ring_stop(const struct rte_event_timer_adapter *adptr)
+{
+       struct cnxk_tim_ring *ring = adptr->data->adapter_priv;
+       struct cnxk_tim_evdev *tim_dev = cnxk_tim_priv_get();
+       int ret;
+
+       if (tim_dev == NULL)
+               return -ENODEV;
+
+       ret = roc_tim_lf_disable(&tim_dev->tim, ring->ring_id);
+       if (ret >= 0)
+               return ret;
+
+       plt_err("Failed to disable timer ring");
+       return ret;
+}
+
+/* Fill *stats for the adapter's ring.
+ *
+ * evtim_exp_count and ev_enq_count both report the ring's arm counter;
+ * adapter_tick_count is the number of cycles since ring_start_cyc divided by
+ * the tick interval (through the precomputed fast_div reciprocal).
+ * Always returns 0.
+ */
+static int
+cnxk_tim_stats_get(const struct rte_event_timer_adapter *adapter,
+                  struct rte_event_timer_adapter_stats *stats)
+{
+       struct cnxk_tim_ring *ring = adapter->data->adapter_priv;
+       /* Sample the counter first, before touching the arm counter. */
+       const uint64_t elapsed_cyc = cnxk_tim_cntvct() - ring->ring_start_cyc;
+
+       stats->evtim_exp_count =
+               __atomic_load_n(&ring->arm_cnt, __ATOMIC_RELAXED);
+       stats->ev_enq_count = stats->evtim_exp_count;
+
+       stats->adapter_tick_count =
+               rte_reciprocal_divide_u64(elapsed_cyc, &ring->fast_div);
+
+       return 0;
+}
+
+/* Reset the adapter's statistics by storing 0 into the ring's arm counter
+ * (relaxed atomic store). Always returns 0.
+ */
+static int
+cnxk_tim_stats_reset(const struct rte_event_timer_adapter *adapter)
+{
+       struct cnxk_tim_ring *tim_ring = adapter->data->adapter_priv;
+
+       __atomic_store_n(&tim_ring->arm_cnt, 0, __ATOMIC_RELAXED);
+       return 0;
+}
+
+/* Timer adapter capability query.
+ *
+ * Populates the file-scope cnxk_tim_ops table, remembers the event device in
+ * the TIM private data, reports RTE_EVENT_TIMER_ADAPTER_CAP_INTERNAL_PORT
+ * through *caps and returns the ops table through *ops.
+ *
+ * Returns 0 on success or -ENODEV when the TIM device private data is not
+ * available. The flags argument is unused.
+ */
 int
 cnxk_tim_caps_get(const struct rte_eventdev *evdev, uint64_t flags,
-                 uint32_t *caps,
-                 const struct rte_event_timer_adapter_ops **ops)
+                 uint32_t *caps, const struct event_timer_adapter_ops **ops)
 {
        struct cnxk_tim_evdev *dev = cnxk_tim_priv_get();
 
        RTE_SET_USED(flags);
-       RTE_SET_USED(ops);
 
        if (dev == NULL)
                return -ENODEV;
 
        cnxk_tim_ops.init = cnxk_tim_ring_create;
        cnxk_tim_ops.uninit = cnxk_tim_ring_free;
+       cnxk_tim_ops.start = cnxk_tim_ring_start;
+       cnxk_tim_ops.stop = cnxk_tim_ring_stop;
        cnxk_tim_ops.get_info = cnxk_tim_ring_info_get;
 
+       /* Stats callbacks are installed only when the device-level
+        * enable_stats flag is set.
+        */
+       if (dev->enable_stats) {
+               cnxk_tim_ops.stats_get = cnxk_tim_stats_get;
+               cnxk_tim_ops.stats_reset = cnxk_tim_stats_reset;
+       }
+
        /* Store evdev pointer for later use. */
        dev->event_dev = (struct rte_eventdev *)(uintptr_t)evdev;
        *caps = RTE_EVENT_TIMER_ADAPTER_CAP_INTERNAL_PORT;
+       *ops = &cnxk_tim_ops;
+
+       return 0;
+}
+
+/* Parse one "ring-chunk_sz-disable_npa-enable_stats" entry and append it to
+ * dev->ring_ctl_data.
+ *
+ * value  - NUL-terminated entry text without the surrounding brackets; it is
+ *          tokenized in place with strtok().
+ * opaque - struct cnxk_tim_evdev whose ring control list is extended.
+ *
+ * Exactly four '-' separated fields are accepted; any other count is
+ * reported with plt_err() and the entry is ignored. An empty entry is
+ * ignored silently. If the list cannot be grown the entry is dropped and the
+ * existing list is kept.
+ */
+static void
+cnxk_tim_parse_ring_param(char *value, void *opaque)
+{
+       struct cnxk_tim_evdev *dev = opaque;
+       struct cnxk_tim_ctl ring_ctl = {0};
+       /* Fields are filled through a uint16_t cursor that starts at the
+        * beginning of ring_ctl; one past enable_stats marks the end.
+        * NOTE(review): assumes struct cnxk_tim_ctl holds only contiguous
+        * uint16_t members ending at enable_stats - confirm in the header.
+        */
+       uint16_t *const val_end = &ring_ctl.enable_stats + 1;
+       uint16_t *val = (uint16_t *)&ring_ctl;
+       struct cnxk_tim_ctl *new_data;
+       char *tok;
+
+       if (!strlen(value))
+               return;
+
+       /* Stop at the last field so extra tokens cannot write past ring_ctl. */
+       tok = strtok(value, "-");
+       while (tok != NULL && val != val_end) {
+               *val = atoi(tok);
+               tok = strtok(NULL, "-");
+               val++;
+       }
+
+       /* Too few fields leave val short of the end; too many leave a token. */
+       if (tok != NULL || val != val_end) {
+               plt_err("Invalid ring param expected [ring-chunk_sz-disable_npa-enable_stats]");
+               return;
+       }
+
+       /* Grow through a temporary so the old list survives a failed realloc. */
+       new_data = rte_realloc(dev->ring_ctl_data,
+                              sizeof(struct cnxk_tim_ctl) *
+                                      (dev->ring_ctl_cnt + 1),
+                              0);
+       if (new_data == NULL)
+               return;
+
+       new_data[dev->ring_ctl_cnt] = ring_ctl;
+       dev->ring_ctl_data = new_data;
+       dev->ring_ctl_cnt++;
+}
+
+/* Split a list such as "[a-b-c-d][e-f-g-h]" into its bracketed entries and
+ * pass the text between each '[' ... ']' pair to
+ * cnxk_tim_parse_ring_param().
+ *
+ * value  - list text; it is duplicated, so the caller's string is untouched.
+ * opaque - forwarded unchanged to cnxk_tim_parse_ring_param().
+ */
+static void
+cnxk_tim_parse_ring_ctl_list(const char *value, void *opaque)
+{
+       char *dup = strdup(value);
+       char *start = NULL;
+       char *end = NULL;
+       char *s;
+
+       if (dup == NULL)
+               return;
+
+       /* The cursor advances in the loop header, so skipping an ordinary
+        * character with 'continue' still moves on to the next one.
+        */
+       for (s = dup; *s; s++) {
+               if (*s == '[')
+                       start = s;
+               else if (*s == ']')
+                       end = s;
+               else
+                       continue;
+
+               /* Only compare once both brackets have been seen. */
+               if (start && end && start < end) {
+                       /* Terminate the entry at ']' and parse after '['. */
+                       *end = 0;
+                       cnxk_tim_parse_ring_param(start + 1, opaque);
+                       /* start == end from here on, so a stray ']' cannot
+                        * trigger another parse until a new '[' is seen.
+                        */
+                       start = end;
+                       s = end;
+               }
+       }
+
+       /* Single exit: the duplicate is released for empty input as well. */
+       free(dup);
+}
+
+/* kvargs handler for the ring control list: forwards the value and opaque
+ * pointer to cnxk_tim_parse_ring_ctl_list(). The key is unused and the
+ * handler always returns 0.
+ */
+static int
+cnxk_tim_parse_kvargs_dict(const char *key, const char *value, void *opaque)
+{
+       RTE_SET_USED(key);
+
+       /* Dict format is [ring-chunk_sz-disable_npa-enable_stats]; '-' is the
+        * field separator because ',' isn't allowed. 0 represents default.
+        */
+       cnxk_tim_parse_ring_ctl_list(value, opaque);
+
+       return 0;
+}
+
+/* Parse a '-' separated list of external clock frequencies into
+ * dev->ext_clk_freq[].
+ *
+ * Tokens are assigned, in order, to the GPIO, PTP and SYNCE clock sources;
+ * each token is converted with strtoull() in base 10. Tokens beyond the
+ * third are ignored, and an empty value leaves the table untouched.
+ *
+ * value  - list text; it is duplicated, so the caller's string is untouched.
+ * opaque - struct cnxk_tim_evdev whose ext_clk_freq[] table is filled.
+ */
+static void
+cnxk_tim_parse_clk_list(const char *value, void *opaque)
+{
+       /* ROC_TIM_CLK_SRC_INVALID terminates the list of accepted sources. */
+       enum roc_tim_clk_src src[] = {ROC_TIM_CLK_SRC_GPIO, ROC_TIM_CLK_SRC_PTP,
+                                     ROC_TIM_CLK_SRC_SYNCE,
+                                     ROC_TIM_CLK_SRC_INVALID};
+       struct cnxk_tim_evdev *dev = opaque;
+       char *str = strdup(value);
+       char *tok;
+       int i = 0;
+
+       if (str == NULL)
+               return;
+
+       /* An empty string yields no tokens, so it reaches free() below
+        * instead of returning early with the duplicate still allocated.
+        */
+       tok = strtok(str, "-");
+       while (tok != NULL && src[i] != ROC_TIM_CLK_SRC_INVALID) {
+               dev->ext_clk_freq[src[i]] = strtoull(tok, NULL, 10);
+               tok = strtok(NULL, "-");
+               i++;
+       }
+
+       free(str);
+}
+
+/* kvargs handler for the external clock list: forwards the value and opaque
+ * pointer to cnxk_tim_parse_clk_list(). The key is unused and the handler
+ * always returns 0.
+ */
+static int
+cnxk_tim_parse_kvargs_dsv(const char *key, const char *value, void *opaque)
+{
+       RTE_SET_USED(key);
+
+       /* DSV format is GPIO-PTP-SYNCE-BTS; '-' is the field separator
+        * because ',' isn't allowed. 0 represents default.
+        * NOTE(review): cnxk_tim_parse_clk_list() in this file lists only the
+        * GPIO, PTP and SYNCE sources - confirm whether BTS is handled.
+        */
+       cnxk_tim_parse_clk_list(value, opaque);
 
        return 0;
 }
@@ -281,8 +635,14 @@ cnxk_tim_parse_devargs(struct rte_devargs *devargs, struct cnxk_tim_evdev *dev)
                           &dev->disable_npa);
        rte_kvargs_process(kvlist, CNXK_TIM_CHNK_SLOTS, &parse_kvargs_value,
                           &dev->chunk_slots);
+       rte_kvargs_process(kvlist, CNXK_TIM_STATS_ENA, &parse_kvargs_flag,
+                          &dev->enable_stats);
        rte_kvargs_process(kvlist, CNXK_TIM_RINGS_LMT, &parse_kvargs_value,
                           &dev->min_ring_cnt);
+       rte_kvargs_process(kvlist, CNXK_TIM_RING_CTL,
+                          &cnxk_tim_parse_kvargs_dict, &dev);
+       rte_kvargs_process(kvlist, CNXK_TIM_EXT_CLK, &cnxk_tim_parse_kvargs_dsv,
+                          dev);
 
        rte_kvargs_free(kvlist);
 }
@@ -331,7 +691,7 @@ cnxk_tim_fini(void)
 {
        struct cnxk_tim_evdev *dev = cnxk_tim_priv_get();
 
-       if (rte_eal_process_type() != RTE_PROC_PRIMARY)
+       if (dev == NULL || rte_eal_process_type() != RTE_PROC_PRIMARY)
                return;
 
        roc_tim_fini(&dev->tim);