1 /* SPDX-License-Identifier: BSD-3-Clause
2 * Copyright(c) 2021 HiSilicon Limited
7 #include <rte_bus_vdev.h>
8 #include <rte_cycles.h>
10 #include <rte_kvargs.h>
11 #include <rte_lcore.h>
13 #include <rte_malloc.h>
14 #include <rte_memcpy.h>
16 #include <rte_dmadev_pmd.h>
18 #include "skeleton_dmadev.h"
/* Register the log type used by this driver; its default level is INFO. */
20 RTE_LOG_REGISTER_DEFAULT(skeldma_logtype, INFO);
/* Driver log helper: forwards to rte_log() on skeldma_logtype, wrapping the
 * caller's format string with a "%s(): " prefix and a trailing newline.
 * NOTE(review): the continuation line supplying the arguments is not visible
 * here; the "%s" is presumably filled with the function name -- confirm.
 */
21 #define SKELDMA_LOG(level, fmt, args...) \
22 rte_log(RTE_LOG_ ## level, skeldma_logtype, "%s(): " fmt "\n", \
/* Fill dev_info with the capabilities and limits of the skeleton device:
 * a capability mask that includes at least memory-to-memory transfers and
 * the copy operation, exactly one virtual channel, and a descriptor count
 * range of SKELDMA_MIN_DESC..SKELDMA_MAX_DESC. info_sz is not used.
 * NOTE(review): part of the dev_capa expression and the return statement
 * are not visible in this view.
 */
26 skeldma_info_get(const struct rte_dma_dev *dev, struct rte_dma_info *dev_info,
/* Bounds reported through dev_info->max_desc and dev_info->min_desc. */
29 #define SKELDMA_MAX_DESC 8192
30 #define SKELDMA_MIN_DESC 32
33 RTE_SET_USED(info_sz);
35 dev_info->dev_capa = RTE_DMA_CAPA_MEM_TO_MEM |
37 RTE_DMA_CAPA_OPS_COPY;
38 dev_info->max_vchans = 1;
39 dev_info->max_desc = SKELDMA_MAX_DESC;
40 dev_info->min_desc = SKELDMA_MIN_DESC;
/* Device configure callback. In the visible part of the body the only
 * action is marking conf_sz as unused.
 * NOTE(review): the remaining parameters, any other statements and the
 * return value are not visible in this view.
 */
46 skeldma_configure(struct rte_dma_dev *dev, const struct rte_dma_conf *conf,
51 RTE_SET_USED(conf_sz);
/* Thread entry point that performs the queued copies on the CPU.
 * param is the struct rte_dma_dev this thread serves. The loop runs until
 * hw->exit_flag is set and, on each iteration, tries to dequeue one
 * descriptor from the running ring.
 * NOTE(review): the branch on the dequeue result, the idle-counter
 * increment and the return statement are not visible in this view.
 */
56 cpucopy_thread(void *param)
/* Idle back-off tuning: zero_req_count threshold and sleep time in us. */
58 #define SLEEP_THRESHOLD 10000
59 #define SLEEP_US_VAL 10
61 struct rte_dma_dev *dev = param;
62 struct skeldma_hw *hw = dev->data->dev_private;
63 struct skeldma_desc *desc = NULL;
66 while (!hw->exit_flag) {
67 ret = rte_ring_dequeue(hw->desc_running, (void **)&desc);
/* A counter value of 0 is replaced by the threshold (presumably a guard
 * against counter wrap-around -- confirm); once the counter is at or above
 * the threshold the thread sleeps for SLEEP_US_VAL microseconds.
 */
70 if (hw->zero_req_count == 0)
71 hw->zero_req_count = SLEEP_THRESHOLD;
72 if (hw->zero_req_count >= SLEEP_THRESHOLD)
73 rte_delay_us_sleep(SLEEP_US_VAL);
/* Work path: clear the idle counter, copy desc->len bytes from src to dst,
 * bump completed_count and hand the descriptor to the completed ring. The
 * RELEASE ordering pairs with the ACQUIRE load of completed_count in
 * skeldma_vchan_status().
 */
77 hw->zero_req_count = 0;
78 rte_memcpy(desc->dst, desc->src, desc->len);
79 __atomic_add_fetch(&hw->completed_count, 1, __ATOMIC_RELEASE);
80 (void)rte_ring_enqueue(hw->desc_completed, (void *)desc);
/* Drain ring: while it still holds entries, dequeue one descriptor and
 * enqueue it onto hw->desc_empty. The results of both ring operations are
 * deliberately ignored.
 */
87 fflush_ring(struct skeldma_hw *hw, struct rte_ring *ring)
89 struct skeldma_desc *desc = NULL;
90 while (rte_ring_count(ring) > 0) {
91 (void)rte_ring_dequeue(ring, (void **)&desc);
92 (void)rte_ring_enqueue(hw->desc_empty, (void *)desc);
/* Device start callback.
 * - Logs an error when hw->desc_mem is NULL, i.e. no vchan has been set up.
 * - Moves every descriptor from the pending, running and completed rings
 *   back to the empty ring and resets last_ridx, the submitted/completed
 *   counters, the idle counter and exit_flag.
 * - Creates a control thread named "dma_skel_<dev_id>" that runs
 *   cpucopy_thread() with dev as its argument.
 * - When hw->lcore_id is not -1, sets the thread's affinity to the cpuset
 *   of that lcore and logs an error on failure.
 * NOTE(review): the return statements and the error checks on ret are not
 * visible in this view.
 */
97 skeldma_start(struct rte_dma_dev *dev)
99 struct skeldma_hw *hw = dev->data->dev_private;
100 char name[RTE_MAX_THREAD_NAME_LEN];
104 if (hw->desc_mem == NULL) {
105 SKELDMA_LOG(ERR, "Vchan was not setup, start fail!");
109 /* Reset the dmadev to a known state, include:
110 * 1) fflush pending/running/completed ring to empty ring.
111 * 2) init ring idx to zero.
112 * 3) init running statistics.
113 * 4) mark cpucopy task exit_flag to false.
115 fflush_ring(hw, hw->desc_pending);
116 fflush_ring(hw, hw->desc_running);
117 fflush_ring(hw, hw->desc_completed);
119 hw->last_ridx = hw->ridx - 1;
120 hw->submitted_count = 0;
121 hw->zero_req_count = 0;
122 hw->completed_count = 0;
123 hw->exit_flag = false;
127 snprintf(name, sizeof(name), "dma_skel_%d", dev->data->dev_id);
128 ret = rte_ctrl_thread_create(&hw->thread, name, NULL,
129 cpucopy_thread, dev);
131 SKELDMA_LOG(ERR, "Start cpucopy thread fail!");
135 if (hw->lcore_id != -1) {
136 cpuset = rte_lcore_cpuset(hw->lcore_id);
137 ret = pthread_setaffinity_np(hw->thread, sizeof(cpuset),
141 "Set thread affinity lcore = %d fail!",
/* Device stop callback: raises exit_flag so the loop in cpucopy_thread()
 * terminates, then cancels the worker thread and waits for it to finish.
 */
149 skeldma_stop(struct rte_dma_dev *dev)
151 struct skeldma_hw *hw = dev->data->dev_private;
153 hw->exit_flag = true;
/* The results of pthread_cancel() and pthread_join() are not checked. */
156 (void)pthread_cancel(hw->thread);
157 pthread_join(hw->thread, NULL);
/* Allocate the descriptor array and the four descriptor rings of a vchan.
 * - Allocates nb_desc zeroed descriptors, cache-line aligned, on
 *   hw->socket_id and logs an error if that fails.
 * - Creates the empty, pending, running and completed rings, each sized
 *   nb_desc with the RING_F_SP_ENQ | RING_F_SC_DEQ flags and named
 *   "dma_skel_desc_{empty,pend,run,comp}_<dev_id>".
 * - If any ring could not be created, logs an error and frees all four.
 * - Otherwise enqueues nb_desc - 1 descriptors onto the empty ring and
 *   stores the four rings in hw.
 * NOTE(review): the return statements, the assignment of hw->desc_mem and
 * whether desc is freed on the ring-failure path are not visible here.
 */
163 vchan_setup(struct skeldma_hw *hw, int16_t dev_id, uint16_t nb_desc)
165 char name[RTE_RING_NAMESIZE];
166 struct skeldma_desc *desc;
167 struct rte_ring *empty;
168 struct rte_ring *pending;
169 struct rte_ring *running;
170 struct rte_ring *completed;
173 desc = rte_zmalloc_socket(NULL, nb_desc * sizeof(struct skeldma_desc),
174 RTE_CACHE_LINE_SIZE, hw->socket_id);
176 SKELDMA_LOG(ERR, "Malloc dma skeleton desc fail!");
/* The same name buffer is reused for each of the four ring names. */
180 snprintf(name, RTE_RING_NAMESIZE, "dma_skel_desc_empty_%d", dev_id);
181 empty = rte_ring_create(name, nb_desc, hw->socket_id,
182 RING_F_SP_ENQ | RING_F_SC_DEQ);
183 snprintf(name, RTE_RING_NAMESIZE, "dma_skel_desc_pend_%d", dev_id);
184 pending = rte_ring_create(name, nb_desc, hw->socket_id,
185 RING_F_SP_ENQ | RING_F_SC_DEQ);
186 snprintf(name, RTE_RING_NAMESIZE, "dma_skel_desc_run_%d", dev_id);
187 running = rte_ring_create(name, nb_desc, hw->socket_id,
188 RING_F_SP_ENQ | RING_F_SC_DEQ);
189 snprintf(name, RTE_RING_NAMESIZE, "dma_skel_desc_comp_%d", dev_id);
190 completed = rte_ring_create(name, nb_desc, hw->socket_id,
191 RING_F_SP_ENQ | RING_F_SC_DEQ);
/* All rings are created before any result is checked, so the cleanup below
 * calls rte_ring_free() on every ring, including those that are NULL.
 */
192 if (empty == NULL || pending == NULL || running == NULL ||
194 SKELDMA_LOG(ERR, "Create dma skeleton desc ring fail!");
195 rte_ring_free(empty);
196 rte_ring_free(pending);
197 rte_ring_free(running);
198 rte_ring_free(completed);
203 /* The real usable ring size is *count-1* instead of *count* to
204 * differentiate a free ring from an empty ring.
205 * @see rte_ring_create
207 for (i = 0; i < nb_desc - 1; i++)
208 (void)rte_ring_enqueue(empty, (void *)(desc + i));
211 hw->desc_empty = empty;
212 hw->desc_pending = pending;
213 hw->desc_running = running;
214 hw->desc_completed = completed;
/* Release the vchan resources held in hw: free the descriptor memory, free
 * the four descriptor rings and set each ring pointer to NULL.
 * NOTE(review): the statement guarded by the desc_mem == NULL check
 * (presumably an early return) and any reset of hw->desc_mem after the
 * free are not visible in this view -- confirm.
 */
220 vchan_release(struct skeldma_hw *hw)
222 if (hw->desc_mem == NULL)
225 rte_free(hw->desc_mem);
227 rte_ring_free(hw->desc_empty);
228 hw->desc_empty = NULL;
229 rte_ring_free(hw->desc_pending);
230 hw->desc_pending = NULL;
231 rte_ring_free(hw->desc_running);
232 hw->desc_running = NULL;
233 rte_ring_free(hw->desc_completed);
234 hw->desc_completed = NULL;
/* Device close callback: releases the vchan resources stored in the
 * device's private data via vchan_release().
 */
238 skeldma_close(struct rte_dma_dev *dev)
240 /* The device already stopped */
241 vchan_release(dev->data->dev_private);
/* Virtual channel setup callback: logs an error when conf->nb_desc is not
 * a power of two, otherwise hands hw, the device id and nb_desc to
 * vchan_setup() and returns its result. conf_sz is not used.
 * NOTE(review): the error return and any statement between the check and
 * the vchan_setup() call are not visible in this view.
 */
246 skeldma_vchan_setup(struct rte_dma_dev *dev, uint16_t vchan,
247 const struct rte_dma_vchan_conf *conf,
250 struct skeldma_hw *hw = dev->data->dev_private;
253 RTE_SET_USED(conf_sz);
255 if (!rte_is_power_of_2(conf->nb_desc)) {
256 SKELDMA_LOG(ERR, "Number of desc must be power of 2!");
261 return vchan_setup(hw, dev->data->dev_id, conf->nb_desc);
/* Report whether the virtual channel is idle or active through *status.
 * The default is RTE_DMA_VCHAN_IDLE; it becomes RTE_DMA_VCHAN_ACTIVE when
 * the submitted and completed counters differ, or when zero_req_count is 0
 * (the value cpucopy_thread() stores right before performing a copy).
 */
265 skeldma_vchan_status(const struct rte_dma_dev *dev,
266 uint16_t vchan, enum rte_dma_vchan_status *status)
268 struct skeldma_hw *hw = dev->data->dev_private;
272 *status = RTE_DMA_VCHAN_IDLE;
/* ACQUIRE load pairs with the RELEASE increment in cpucopy_thread(). */
273 if (hw->submitted_count != __atomic_load_n(&hw->completed_count, __ATOMIC_ACQUIRE)
274 || hw->zero_req_count == 0)
275 *status = RTE_DMA_VCHAN_ACTIVE;
/* Copy the driver's submitted and completed counters into stats.
 * stats_sz is not used.
 * NOTE(review): completed_count is read with a plain load here, whereas
 * skeldma_vchan_status() reads it with __atomic_load_n(); consider making
 * the two consistent.
 */
280 skeldma_stats_get(const struct rte_dma_dev *dev, uint16_t vchan,
281 struct rte_dma_stats *stats, uint32_t stats_sz)
283 struct skeldma_hw *hw = dev->data->dev_private;
286 RTE_SET_USED(stats_sz);
288 stats->submitted = hw->submitted_count;
289 stats->completed = hw->completed_count;
/* Reset the driver's submitted and completed counters to zero. */
296 skeldma_stats_reset(struct rte_dma_dev *dev, uint16_t vchan)
298 struct skeldma_hw *hw = dev->data->dev_private;
302 hw->submitted_count = 0;
303 hw->completed_count = 0;
/* Dump driver state for debugging: lcore id, socket id, the entry count of
 * each descriptor ring, the next/last ring indexes and the submitted and
 * completed counters.
 * NOTE(review): the output calls that consume these format strings
 * (presumably writing to f) are not visible in this view.
 */
309 skeldma_dump(const struct rte_dma_dev *dev, FILE *f)
/* Entry count of a ring, or 0 when the ring pointer is NULL. */
311 #define GET_RING_COUNT(ring) ((ring) ? (rte_ring_count(ring)) : 0)
313 struct skeldma_hw *hw = dev->data->dev_private;
318 " desc_empty_ring_count: %u\n"
319 " desc_pending_ring_count: %u\n"
320 " desc_running_ring_count: %u\n"
321 " desc_completed_ring_count: %u\n",
322 hw->lcore_id, hw->socket_id,
323 GET_RING_COUNT(hw->desc_empty),
324 GET_RING_COUNT(hw->desc_pending),
325 GET_RING_COUNT(hw->desc_running),
326 GET_RING_COUNT(hw->desc_completed));
328 " next_ring_idx: %u\n"
329 " last_ring_idx: %u\n"
330 " submitted_count: %" PRIu64 "\n"
331 " completed_count: %" PRIu64 "\n",
332 hw->ridx, hw->last_ridx,
333 hw->submitted_count, hw->completed_count);
/* Hand work to the copy thread: descriptors waiting in the pending ring are
 * moved to the running ring, and desc is enqueued onto the running ring.
 * The number of pending descriptors is sampled once, on entry.
 * NOTE(review): the loop construct driven by count and any condition on
 * desc are not visible in this view.
 */
339 submit(struct skeldma_hw *hw, struct skeldma_desc *desc)
341 uint16_t count = rte_ring_count(hw->desc_pending);
342 struct skeldma_desc *pend_desc = NULL;
345 (void)rte_ring_dequeue(hw->desc_pending, (void **)&pend_desc);
346 (void)rte_ring_enqueue(hw->desc_running, (void *)pend_desc);
351 (void)rte_ring_enqueue(hw->desc_running, (void *)desc);
/* Fast-path copy enqueue: takes a free descriptor from the empty ring,
 * records the source and destination addresses and the current ring index
 * in it, queues it, and increments submitted_count.
 * NOTE(review): the handling of a failed dequeue, the assignment of the
 * length, the statement taken when RTE_DMA_OP_FLAG_SUBMIT is set, the ring
 * index update and the return value are not visible in this view.
 */
355 skeldma_copy(void *dev_private, uint16_t vchan,
356 rte_iova_t src, rte_iova_t dst,
357 uint32_t length, uint64_t flags)
359 struct skeldma_hw *hw = dev_private;
360 struct skeldma_desc *desc;
366 ret = rte_ring_dequeue(hw->desc_empty, (void **)&desc);
/* The IOVA values are used directly as CPU pointers for the copy. */
369 desc->src = (void *)(uintptr_t)src;
370 desc->dst = (void *)(uintptr_t)dst;
372 desc->ridx = hw->ridx;
373 if (flags & RTE_DMA_OP_FLAG_SUBMIT)
376 (void)rte_ring_enqueue(hw->desc_pending, (void *)desc);
377 hw->submitted_count++;
/* Fast-path submit callback operating on the driver's private data.
 * NOTE(review): everything after the hw assignment is not visible in this
 * view, so the action taken cannot be described from here.
 */
383 skeldma_submit(void *dev_private, uint16_t vchan)
385 struct skeldma_hw *hw = dev_private;
/* Fast-path completion poll: processes up to nb_cpls descriptors from the
 * completed ring, bounded by what the ring currently holds, and returns
 * each one to the empty ring. The ring index of the last processed
 * descriptor is saved in hw->last_ridx and written to *last_idx; when
 * nothing was processed, *last_idx is the previously saved value.
 * has_error is not used.
 * NOTE(review): the index increment and the return value are not visible
 * in this view.
 */
392 skeldma_completed(void *dev_private,
393 uint16_t vchan, const uint16_t nb_cpls,
394 uint16_t *last_idx, bool *has_error)
396 struct skeldma_hw *hw = dev_private;
397 struct skeldma_desc *desc = NULL;
402 RTE_SET_USED(has_error);
404 count = RTE_MIN(nb_cpls, rte_ring_count(hw->desc_completed));
405 while (index < count) {
406 (void)rte_ring_dequeue(hw->desc_completed, (void **)&desc);
/* Only the final descriptor of this batch updates the reported index. */
407 if (index == count - 1) {
408 hw->last_ridx = desc->ridx;
409 *last_idx = desc->ridx;
412 (void)rte_ring_enqueue(hw->desc_empty, (void *)desc);
414 if (unlikely(count == 0))
415 *last_idx = hw->last_ridx;
/* Fast-path completion poll with per-operation status: processes up to
 * nb_cpls descriptors from the completed ring, bounded by what the ring
 * currently holds, stores RTE_DMA_STATUS_SUCCESSFUL in status[] for each,
 * and returns each descriptor to the empty ring. The ring index of the
 * last processed descriptor is saved in hw->last_ridx and written to
 * *last_idx; when nothing was processed, *last_idx is the previously saved
 * value.
 * NOTE(review): the return value is not visible in this view.
 */
421 skeldma_completed_status(void *dev_private,
422 uint16_t vchan, const uint16_t nb_cpls,
423 uint16_t *last_idx, enum rte_dma_status_code *status)
425 struct skeldma_hw *hw = dev_private;
426 struct skeldma_desc *desc = NULL;
432 count = RTE_MIN(nb_cpls, rte_ring_count(hw->desc_completed));
433 while (index < count) {
434 (void)rte_ring_dequeue(hw->desc_completed, (void **)&desc);
/* Only the final descriptor of this batch updates the reported index. */
435 if (index == count - 1) {
436 hw->last_ridx = desc->ridx;
437 *last_idx = desc->ridx;
/* Every operation is reported as successful; index advances here. */
439 status[index++] = RTE_DMA_STATUS_SUCCESSFUL;
440 (void)rte_ring_enqueue(hw->desc_empty, (void *)desc);
442 if (unlikely(count == 0))
443 *last_idx = hw->last_ridx;
/* Return the number of descriptors currently held in the empty ring, i.e.
 * how many more operations can be enqueued right now.
 */
449 skeldma_burst_capacity(const void *dev_private, uint16_t vchan)
451 const struct skeldma_hw *hw = dev_private;
454 return rte_ring_count(hw->desc_empty);
/* Control-path callback table installed as dev->dev_ops in
 * skeldma_create(); it maps each dmadev operation to this driver's
 * implementation.
 */
457 static const struct rte_dma_dev_ops skeldma_ops = {
458 .dev_info_get = skeldma_info_get,
459 .dev_configure = skeldma_configure,
460 .dev_start = skeldma_start,
461 .dev_stop = skeldma_stop,
462 .dev_close = skeldma_close,
464 .vchan_setup = skeldma_vchan_setup,
465 .vchan_status = skeldma_vchan_status,
467 .stats_get = skeldma_stats_get,
468 .stats_reset = skeldma_stats_reset,
470 .dev_dump = skeldma_dump,
/* Create a skeleton dmadev named name on top of vdev.
 * The socket is that of lcore_id, or the caller's socket when lcore_id is
 * negative. Allocates the dmadev with room for struct skeldma_hw, installs
 * the control-path ops and the fast-path function pointers, records the
 * lcore and socket ids in the private data and marks the device ready.
 * Returns the new device id on success.
 * NOTE(review): the failure return after the allocation error log is not
 * visible in this view.
 */
474 skeldma_create(const char *name, struct rte_vdev_device *vdev, int lcore_id)
476 struct rte_dma_dev *dev;
477 struct skeldma_hw *hw;
480 socket_id = (lcore_id < 0) ? rte_socket_id() :
481 rte_lcore_to_socket_id(lcore_id);
482 dev = rte_dma_pmd_allocate(name, socket_id, sizeof(struct skeldma_hw));
484 SKELDMA_LOG(ERR, "Unable to allocate dmadev: %s", name);
488 dev->device = &vdev->device;
489 dev->dev_ops = &skeldma_ops;
/* Fast-path entry points receive the private data pointer directly. */
490 dev->fp_obj->dev_private = dev->data->dev_private;
491 dev->fp_obj->copy = skeldma_copy;
492 dev->fp_obj->submit = skeldma_submit;
493 dev->fp_obj->completed = skeldma_completed;
494 dev->fp_obj->completed_status = skeldma_completed_status;
495 dev->fp_obj->burst_capacity = skeldma_burst_capacity;
497 hw = dev->data->dev_private;
498 hw->lcore_id = lcore_id;
499 hw->socket_id = socket_id;
501 dev->state = RTE_DMA_DEV_READY;
503 return dev->data->dev_id;
/* Destroy the dmadev called name by releasing it through
 * rte_dma_pmd_release(); that call's result is returned unchanged.
 */
507 skeldma_destroy(const char *name)
509 return rte_dma_pmd_release(name);
/* kvargs handler for the lcore argument: converts value to an int and, if
 * it lies in [0, RTE_MAX_LCORE), stores it through opaque (treated as an
 * int pointer). Out-of-range values leave the target untouched.
 * NOTE(review): atoi() cannot report conversion errors; non-numeric text
 * yields 0, which passes the range check and selects lcore 0. Consider
 * strtol() with end-pointer validation.
 * NOTE(review): the remaining parameters and the return value are not
 * visible in this view.
 */
513 skeldma_parse_lcore(const char *key __rte_unused,
517 int lcore_id = atoi(value);
518 if (lcore_id >= 0 && lcore_id < RTE_MAX_LCORE)
519 *(int *)opaque = lcore_id;
/* Parse the vdev argument string and update *lcore_id from the
 * SKELDMA_ARG_LCORE key. The argument string is checked for NULL/empty
 * first; otherwise it is parsed against the accepted key list, the lcore
 * handler is run, the resulting value is logged and the kvargs list freed.
 * NOTE(review): the statements taken for missing arguments or a failed
 * rte_kvargs_parse() (presumably early returns) are not visible here.
 */
524 skeldma_parse_vdev_args(struct rte_vdev_device *vdev, int *lcore_id)
526 static const char *const args[] = {
531 struct rte_kvargs *kvlist;
534 params = rte_vdev_device_args(vdev);
535 if (params == NULL || params[0] == '\0')
538 kvlist = rte_kvargs_parse(params, args);
/* The result of rte_kvargs_process() is deliberately ignored. */
542 (void)rte_kvargs_process(kvlist, SKELDMA_ARG_LCORE,
543 skeldma_parse_lcore, lcore_id);
544 SKELDMA_LOG(INFO, "Parse lcore_id = %d", *lcore_id);
546 rte_kvargs_free(kvlist);
/* vdev probe callback: obtains the device name, logs an error when the
 * process is not the primary one, parses the vdev arguments for an lcore
 * id and creates the dmadev. Returns the negative result of
 * skeldma_create() on failure and 0 otherwise.
 * NOTE(review): the initial value of lcore_id, the name validation and the
 * return taken in a non-primary process are not visible in this view.
 */
550 skeldma_probe(struct rte_vdev_device *vdev)
556 name = rte_vdev_device_name(vdev);
560 if (rte_eal_process_type() != RTE_PROC_PRIMARY) {
561 SKELDMA_LOG(ERR, "Multiple process not supported for %s", name);
565 skeldma_parse_vdev_args(vdev, &lcore_id);
567 ret = skeldma_create(name, vdev, lcore_id);
569 SKELDMA_LOG(INFO, "Create %s dmadev with lcore-id %d",
/* skeldma_create() returns the device id on success; map that to 0. */
572 return ret < 0 ? ret : 0;
/* vdev remove callback: looks up the device name, destroys the matching
 * dmadev through skeldma_destroy() and logs the removal.
 * NOTE(review): the condition guarding the log message and the return
 * value are not visible in this view.
 */
576 skeldma_remove(struct rte_vdev_device *vdev)
581 name = rte_vdev_device_name(vdev);
585 ret = skeldma_destroy(name);
587 SKELDMA_LOG(INFO, "Remove %s dmadev", name);
/* vdev driver descriptor: wires the probe and remove callbacks and sets
 * the RTE_VDEV_DRV_NEED_IOVA_AS_VA driver flag.
 */
592 static struct rte_vdev_driver skeldma_pmd_drv = {
593 .probe = skeldma_probe,
594 .remove = skeldma_remove,
595 .drv_flags = RTE_VDEV_DRV_NEED_IOVA_AS_VA,
/* Register the driver under the vdev name dma_skeleton and publish its
 * parameter string.
 * NOTE(review): the string advertises the lcore value as <uint16>, while
 * skeldma_parse_lcore() only accepts values below RTE_MAX_LCORE.
 */
598 RTE_PMD_REGISTER_VDEV(dma_skeleton, skeldma_pmd_drv);
599 RTE_PMD_REGISTER_PARAM_STRING(dma_skeleton,
600 SKELDMA_ARG_LCORE "=<uint16> ");