/* SPDX-License-Identifier: BSD-3-Clause
 * Copyright 2019 Mellanox Technologies, Ltd
 */

#include <errno.h>

#include <rte_malloc.h>
#include <rte_hash_crc.h>
#include <rte_errno.h>

#include "mlx5_utils.h"

struct mlx5_hlist *
mlx5_hlist_create(const char *name, uint32_t size)
{
	struct mlx5_hlist *h;
	uint32_t act_size;
	uint32_t alloc_size;

	if (!size)
		return NULL;
	/* Align to the next power of 2, 32bits integer is enough now. */
	if (!rte_is_power_of_2(size)) {
		act_size = rte_align32pow2(size);
		DRV_LOG(WARNING, "Size 0x%" PRIX32 " is not power of 2, will "
			"be aligned to 0x%" PRIX32 ".", size, act_size);
	} else {
		act_size = size;
	}
	alloc_size = sizeof(struct mlx5_hlist) +
		     sizeof(struct mlx5_hlist_head) * act_size;
	/* Using zmalloc, then no need to initialize the heads. */
	h = rte_zmalloc(name, alloc_size, RTE_CACHE_LINE_SIZE);
	if (!h) {
		DRV_LOG(ERR, "No memory for hash list %s creation",
			name ? name : "None");
		return NULL;
	}
	if (name)
		snprintf(h->name, MLX5_HLIST_NAMESIZE, "%s", name);
	h->table_sz = act_size;
	h->mask = act_size - 1;
	DRV_LOG(DEBUG, "Hash list with %s size 0x%" PRIX32 " is created.",
		h->name, act_size);
	return h;
}
struct mlx5_hlist_entry *
mlx5_hlist_lookup(struct mlx5_hlist *h, uint64_t key)
{
	uint32_t idx;
	struct mlx5_hlist_head *first;
	struct mlx5_hlist_entry *node;

	MLX5_ASSERT(h);
	idx = rte_hash_crc_8byte(key, 0) & h->mask;
	first = &h->heads[idx];
	LIST_FOREACH(node, first, next) {
		if (node->key == key)
			return node;
	}
	return NULL;
}
int
mlx5_hlist_insert(struct mlx5_hlist *h, struct mlx5_hlist_entry *entry)
{
	uint32_t idx;
	struct mlx5_hlist_head *first;
	struct mlx5_hlist_entry *node;

	MLX5_ASSERT(h && entry);
	idx = rte_hash_crc_8byte(entry->key, 0) & h->mask;
	first = &h->heads[idx];
	/* No need to reuse the lookup function. */
	LIST_FOREACH(node, first, next) {
		if (node->key == entry->key)
			return -EEXIST;
	}
	LIST_INSERT_HEAD(first, entry, next);
	return 0;
}
void
mlx5_hlist_remove(struct mlx5_hlist *h __rte_unused,
		  struct mlx5_hlist_entry *entry)
{
	MLX5_ASSERT(entry && entry->next.le_prev);
	LIST_REMOVE(entry, next);
	/* Set to NULL to avoid removing the entry more than once. */
	entry->next.le_prev = NULL;
}
void
mlx5_hlist_destroy(struct mlx5_hlist *h,
		   mlx5_hlist_destroy_callback_fn cb, void *ctx)
{
	uint32_t idx;
	struct mlx5_hlist_entry *entry;

	MLX5_ASSERT(h);
	for (idx = 0; idx < h->table_sz; ++idx) {
		/* No LIST_FOREACH_SAFE, using while instead. */
		while (!LIST_EMPTY(&h->heads[idx])) {
			entry = LIST_FIRST(&h->heads[idx]);
			LIST_REMOVE(entry, next);
			/*
			 * The user owns the whole element that contains the
			 * data entry, so the cleanup and freeing are the
			 * user's duty: the hlist entry may not be placed at
			 * the beginning of the element (though that is the
			 * suggested layout). Otherwise the default free
			 * function is used.
			 */
			if (cb)
				cb(entry, ctx);
			else
				rte_free(entry);
		}
	}
	rte_free(h);
}
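/*
 * Usage sketch (illustrative only, compiled out by default): how a caller
 * embeds struct mlx5_hlist_entry at the start of its own structure and
 * drives the hash list API. The guard macro and the example type are
 * hypothetical, not part of the driver.
 */
#ifdef MLX5_UTILS_USAGE_EXAMPLES
struct example_node {
	struct mlx5_hlist_entry entry; /* First, so rte_free() on it works. */
	uint32_t payload;
};

static int
example_hlist_usage(void)
{
	struct mlx5_hlist *h = mlx5_hlist_create("example", 64);
	struct example_node *node;

	if (!h)
		return -ENOMEM;
	node = rte_zmalloc(NULL, sizeof(*node), 0);
	if (!node) {
		mlx5_hlist_destroy(h, NULL, NULL);
		return -ENOMEM;
	}
	node->entry.key = 0xcafe;
	node->payload = 42;
	if (mlx5_hlist_insert(h, &node->entry)) {
		/* A duplicated key is rejected with -EEXIST. */
		rte_free(node);
		mlx5_hlist_destroy(h, NULL, NULL);
		return -EEXIST;
	}
	MLX5_ASSERT(mlx5_hlist_lookup(h, 0xcafe) == &node->entry);
	/* Entries still linked are freed by mlx5_hlist_destroy(). */
	mlx5_hlist_destroy(h, NULL, NULL);
	return 0;
}
#endif /* MLX5_UTILS_USAGE_EXAMPLES */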
static inline void
mlx5_ipool_lock(struct mlx5_indexed_pool *pool)
{
	if (pool->cfg.need_lock)
		rte_spinlock_lock(&pool->lock);
}

static inline void
mlx5_ipool_unlock(struct mlx5_indexed_pool *pool)
{
	if (pool->cfg.need_lock)
		rte_spinlock_unlock(&pool->lock);
}
static inline uint32_t
mlx5_trunk_idx_get(struct mlx5_indexed_pool *pool, uint32_t entry_idx)
{
	struct mlx5_indexed_pool_config *cfg = &pool->cfg;
	uint32_t trunk_idx = 0;
	uint32_t i;

	if (!cfg->grow_trunk)
		return entry_idx / cfg->trunk_size;
	if (entry_idx >= pool->grow_tbl[cfg->grow_trunk - 1]) {
		trunk_idx = (entry_idx - pool->grow_tbl[cfg->grow_trunk - 1]) /
			    (cfg->trunk_size << (cfg->grow_shift *
			    cfg->grow_trunk)) + cfg->grow_trunk;
	} else {
		for (i = 0; i < cfg->grow_trunk; i++) {
			if (entry_idx < pool->grow_tbl[i])
				break;
		}
		trunk_idx = i;
	}
	return trunk_idx;
}
static inline uint32_t
mlx5_trunk_size_get(struct mlx5_indexed_pool *pool, uint32_t trunk_idx)
{
	struct mlx5_indexed_pool_config *cfg = &pool->cfg;

	return cfg->trunk_size << (cfg->grow_shift *
	       (trunk_idx > cfg->grow_trunk ? cfg->grow_trunk : trunk_idx));
}
static inline uint32_t
mlx5_trunk_idx_offset_get(struct mlx5_indexed_pool *pool, uint32_t trunk_idx)
{
	struct mlx5_indexed_pool_config *cfg = &pool->cfg;
	uint32_t offset = 0;

	if (!trunk_idx)
		return 0;
	if (!cfg->grow_trunk)
		return cfg->trunk_size * trunk_idx;
	if (trunk_idx < cfg->grow_trunk)
		offset = pool->grow_tbl[trunk_idx - 1];
	else
		offset = pool->grow_tbl[cfg->grow_trunk - 1] +
			 (cfg->trunk_size << (cfg->grow_shift *
			 cfg->grow_trunk)) * (trunk_idx - cfg->grow_trunk);
	return offset;
}
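/*
 * Worked example of the grow geometry handled by the three helpers above
 * (illustrative numbers, not a configuration used by the driver): with
 * trunk_size = 16, grow_shift = 1 and grow_trunk = 3, trunk sizes are
 * 16, 32, 64 and then 128 for every further trunk, so
 * grow_tbl = {16, 48, 112}. Trunk 3 starts at entry offset 112 and trunk 4
 * at 112 + 128 = 240, and mlx5_trunk_idx_get(pool, 200) yields
 * (200 - 112) / 128 + 3 = 3.
 */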
struct mlx5_indexed_pool *
mlx5_ipool_create(struct mlx5_indexed_pool_config *cfg)
{
	struct mlx5_indexed_pool *pool;
	uint32_t i;

	if (!cfg || !cfg->size || (!cfg->malloc ^ !cfg->free) ||
	    (cfg->trunk_size && ((cfg->trunk_size & (cfg->trunk_size - 1)) ||
	    ((__builtin_ffs(cfg->trunk_size) + TRUNK_IDX_BITS) > 32))))
		return NULL;
	pool = rte_zmalloc("mlx5_ipool", sizeof(*pool) + cfg->grow_trunk *
			   sizeof(pool->grow_tbl[0]), RTE_CACHE_LINE_SIZE);
	if (!pool)
		return NULL;
	pool->cfg = *cfg;
	if (!pool->cfg.trunk_size)
		pool->cfg.trunk_size = MLX5_IPOOL_DEFAULT_TRUNK_SIZE;
	if (!cfg->malloc && !cfg->free) {
		pool->cfg.malloc = rte_malloc_socket;
		pool->cfg.free = rte_free;
	}
	pool->free_list = TRUNK_INVALID;
	if (pool->cfg.need_lock)
		rte_spinlock_init(&pool->lock);
	/*
	 * Initialize the dynamic grow trunk size lookup table to have a quick
	 * lookup for the trunk entry index offset.
	 */
	for (i = 0; i < cfg->grow_trunk; i++) {
		pool->grow_tbl[i] = cfg->trunk_size << (cfg->grow_shift * i);
		if (i > 0)
			pool->grow_tbl[i] += pool->grow_tbl[i - 1];
	}
	return pool;
}
static int
mlx5_ipool_grow(struct mlx5_indexed_pool *pool)
{
	struct mlx5_indexed_trunk *trunk;
	struct mlx5_indexed_trunk **trunk_tmp;
	struct mlx5_indexed_trunk **p;
	size_t trunk_size = 0;
	size_t data_size;
	size_t bmp_size;
	uint32_t idx;

	if (pool->n_trunk_valid == TRUNK_MAX_IDX)
		return -ENOMEM;
	if (pool->n_trunk_valid == pool->n_trunk) {
		/* No free trunk flags, expand trunk list. */
		int n_grow = pool->n_trunk_valid ? pool->n_trunk :
			     RTE_CACHE_LINE_SIZE / sizeof(void *);

		p = pool->cfg.malloc(pool->cfg.type,
				     (pool->n_trunk_valid + n_grow) *
				     sizeof(struct mlx5_indexed_trunk *),
				     RTE_CACHE_LINE_SIZE, rte_socket_id());
		if (!p)
			return -ENOMEM;
		if (pool->trunks)
			memcpy(p, pool->trunks, pool->n_trunk_valid *
			       sizeof(struct mlx5_indexed_trunk *));
		memset(RTE_PTR_ADD(p, pool->n_trunk_valid * sizeof(void *)), 0,
		       n_grow * sizeof(void *));
		trunk_tmp = pool->trunks;
		pool->trunks = p;
		if (trunk_tmp)
			pool->cfg.free(trunk_tmp);
		pool->n_trunk += n_grow;
	}
	if (!pool->cfg.release_mem_en) {
		idx = pool->n_trunk_valid;
	} else {
		/* Find the first available slot in the trunk list. */
		for (idx = 0; idx < pool->n_trunk; idx++)
			if (pool->trunks[idx] == NULL)
				break;
	}
	trunk_size += sizeof(*trunk);
	data_size = mlx5_trunk_size_get(pool, idx);
	bmp_size = rte_bitmap_get_memory_footprint(data_size);
	/* rte_bitmap requires memory to be cacheline aligned. */
	trunk_size += RTE_CACHE_LINE_ROUNDUP(data_size * pool->cfg.size);
	trunk_size += bmp_size;
	trunk = pool->cfg.malloc(pool->cfg.type, trunk_size,
				 RTE_CACHE_LINE_SIZE, rte_socket_id());
	if (!trunk)
		return -ENOMEM;
	pool->trunks[idx] = trunk;
	trunk->idx = idx;
	trunk->free = data_size;
	trunk->prev = TRUNK_INVALID;
	trunk->next = TRUNK_INVALID;
	MLX5_ASSERT(pool->free_list == TRUNK_INVALID);
	pool->free_list = idx;
	/* Mark all entries as available. */
	trunk->bmp = rte_bitmap_init_with_all_set(data_size, &trunk->data
		     [RTE_CACHE_LINE_ROUNDUP(data_size * pool->cfg.size)],
		     bmp_size);
	MLX5_ASSERT(trunk->bmp);
	pool->n_trunk_valid++;
#ifdef POOL_DEBUG
	pool->trunk_new++;
	pool->trunk_avail++;
#endif
	return 0;
}
void *
mlx5_ipool_malloc(struct mlx5_indexed_pool *pool, uint32_t *idx)
{
	struct mlx5_indexed_trunk *trunk;
	uint64_t slab = 0;
	uint32_t iidx = 0;
	void *p;

	mlx5_ipool_lock(pool);
	if (pool->free_list == TRUNK_INVALID) {
		/* If no available trunks, grow a new one. */
		if (mlx5_ipool_grow(pool)) {
			mlx5_ipool_unlock(pool);
			return NULL;
		}
	}
	MLX5_ASSERT(pool->free_list != TRUNK_INVALID);
	trunk = pool->trunks[pool->free_list];
	MLX5_ASSERT(trunk->free);
	if (!rte_bitmap_scan(trunk->bmp, &iidx, &slab)) {
		mlx5_ipool_unlock(pool);
		return NULL;
	}
	MLX5_ASSERT(slab);
	iidx += __builtin_ctzll(slab);
	MLX5_ASSERT(iidx != UINT32_MAX);
	MLX5_ASSERT(iidx < mlx5_trunk_size_get(pool, trunk->idx));
	rte_bitmap_clear(trunk->bmp, iidx);
	p = &trunk->data[iidx * pool->cfg.size];
	iidx += mlx5_trunk_idx_offset_get(pool, trunk->idx);
	iidx += 1; /* Non-zero index. */
	trunk->free--;
	if (!trunk->free) {
		/* Full trunk is removed from the free list. */
		MLX5_ASSERT(pool->free_list == trunk->idx);
		pool->free_list = trunk->next;
		if (trunk->next != TRUNK_INVALID)
			pool->trunks[trunk->next]->prev = TRUNK_INVALID;
		trunk->prev = TRUNK_INVALID;
		trunk->next = TRUNK_INVALID;
	}
	*idx = iidx;
#ifdef POOL_DEBUG
	pool->n_entry++;
#endif
	mlx5_ipool_unlock(pool);
	return p;
}
void *
mlx5_ipool_zmalloc(struct mlx5_indexed_pool *pool, uint32_t *idx)
{
	void *entry = mlx5_ipool_malloc(pool, idx);

	if (entry)
		memset(entry, 0, pool->cfg.size);
	return entry;
}
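/*
 * Usage sketch (illustrative only, compiled out by default): a full
 * allocate/get/free cycle on an indexed pool. The guard macro and the
 * configuration values are hypothetical, not part of the driver.
 */
#ifdef MLX5_UTILS_USAGE_EXAMPLES
static int
example_ipool_usage(void)
{
	struct mlx5_indexed_pool_config cfg = {
		.size = sizeof(uint64_t), /* Entry size in bytes. */
		.trunk_size = 64,	  /* Must be a power of 2. */
		.need_lock = 1,
		.type = "example_pool",
		/* .malloc/.free left NULL, the defaults are installed. */
	};
	struct mlx5_indexed_pool *pool = mlx5_ipool_create(&cfg);
	uint32_t idx = 0;
	uint64_t *entry;

	if (!pool)
		return -EINVAL;
	entry = mlx5_ipool_zmalloc(pool, &idx);
	if (!entry) {
		mlx5_ipool_destroy(pool);
		return -ENOMEM;
	}
	*entry = 0xdead;
	/* The returned index is non-zero and maps back to the entry. */
	MLX5_ASSERT(mlx5_ipool_get(pool, idx) == entry);
	mlx5_ipool_free(pool, idx);
	mlx5_ipool_destroy(pool);
	return 0;
}
#endif /* MLX5_UTILS_USAGE_EXAMPLES */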
void
mlx5_ipool_free(struct mlx5_indexed_pool *pool, uint32_t idx)
{
	struct mlx5_indexed_trunk *trunk;
	uint32_t trunk_idx;
	uint32_t entry_idx;

	if (!idx)
		return;
	idx -= 1;
	mlx5_ipool_lock(pool);
	trunk_idx = mlx5_trunk_idx_get(pool, idx);
	if ((!pool->cfg.release_mem_en && trunk_idx >= pool->n_trunk_valid) ||
	    (pool->cfg.release_mem_en && trunk_idx >= pool->n_trunk))
		goto out;
	trunk = pool->trunks[trunk_idx];
	if (!trunk)
		goto out;
	entry_idx = idx - mlx5_trunk_idx_offset_get(pool, trunk->idx);
	if (trunk_idx != trunk->idx ||
	    rte_bitmap_get(trunk->bmp, entry_idx))
		goto out;
	rte_bitmap_set(trunk->bmp, entry_idx);
	trunk->free++;
	if (pool->cfg.release_mem_en &&
	    trunk->free == mlx5_trunk_size_get(pool, trunk->idx)) {
		if (pool->free_list == trunk->idx)
			pool->free_list = trunk->next;
		if (trunk->next != TRUNK_INVALID)
			pool->trunks[trunk->next]->prev = trunk->prev;
		if (trunk->prev != TRUNK_INVALID)
			pool->trunks[trunk->prev]->next = trunk->next;
		pool->cfg.free(trunk);
		pool->trunks[trunk_idx] = NULL;
		pool->n_trunk_valid--;
#ifdef POOL_DEBUG
		pool->trunk_avail--;
		pool->trunk_free++;
#endif
		if (pool->n_trunk_valid == 0) {
			pool->cfg.free(pool->trunks);
			pool->trunks = NULL;
			pool->n_trunk = 0;
		}
	} else if (trunk->free == 1) {
		/* Put into free trunk list head. */
		MLX5_ASSERT(pool->free_list != trunk->idx);
		trunk->next = pool->free_list;
		trunk->prev = TRUNK_INVALID;
		if (pool->free_list != TRUNK_INVALID)
			pool->trunks[pool->free_list]->prev = trunk->idx;
		pool->free_list = trunk->idx;
	}
#ifdef POOL_DEBUG
	pool->n_entry--;
#endif
out:
	mlx5_ipool_unlock(pool);
}
void *
mlx5_ipool_get(struct mlx5_indexed_pool *pool, uint32_t idx)
{
	struct mlx5_indexed_trunk *trunk;
	void *p = NULL;
	uint32_t trunk_idx;
	uint32_t entry_idx;

	if (!idx)
		return NULL;
	idx -= 1;
	mlx5_ipool_lock(pool);
	trunk_idx = mlx5_trunk_idx_get(pool, idx);
	if ((!pool->cfg.release_mem_en && trunk_idx >= pool->n_trunk_valid) ||
	    (pool->cfg.release_mem_en && trunk_idx >= pool->n_trunk))
		goto out;
	trunk = pool->trunks[trunk_idx];
	if (!trunk)
		goto out;
	entry_idx = idx - mlx5_trunk_idx_offset_get(pool, trunk->idx);
	if (trunk_idx != trunk->idx ||
	    rte_bitmap_get(trunk->bmp, entry_idx))
		goto out;
	p = &trunk->data[entry_idx * pool->cfg.size];
out:
	mlx5_ipool_unlock(pool);
	return p;
}
int
mlx5_ipool_destroy(struct mlx5_indexed_pool *pool)
{
	struct mlx5_indexed_trunk **trunks;
	uint32_t i;

	MLX5_ASSERT(pool);
	mlx5_ipool_lock(pool);
	trunks = pool->trunks;
	for (i = 0; i < pool->n_trunk; i++) {
		if (trunks[i])
			pool->cfg.free(trunks[i]);
	}
	if (pool->trunks)
		pool->cfg.free(pool->trunks);
	mlx5_ipool_unlock(pool);
	rte_free(pool);
	return 0;
}
void
mlx5_ipool_dump(struct mlx5_indexed_pool *pool)
{
	printf("Pool %s entry size %u, trunks %u, %u entry per trunk, "
	       "total: %u\n",
	       pool->cfg.type, pool->cfg.size, pool->n_trunk_valid,
	       pool->cfg.trunk_size, pool->n_trunk_valid);
#ifdef POOL_DEBUG
	printf("Pool %s entry %u, trunk alloc %u, empty: %u, "
	       "available %u free %u\n",
	       pool->cfg.type, pool->n_entry, pool->trunk_new,
	       pool->trunk_empty, pool->trunk_avail, pool->trunk_free);
#endif
}
struct mlx5_l3t_tbl *
mlx5_l3t_create(enum mlx5_l3t_type type)
{
	struct mlx5_l3t_tbl *tbl;
	struct mlx5_indexed_pool_config l3t_ip_cfg = {
		.trunk_size = 16,
		.grow_trunk = 6,
		.grow_shift = 1,
		.need_lock = 0,
		.release_mem_en = 1,
		.malloc = rte_malloc_socket,
		.free = rte_free,
	};

	if (type >= MLX5_L3T_TYPE_MAX) {
		rte_errno = EINVAL;
		return NULL;
	}
	tbl = rte_zmalloc(NULL, sizeof(struct mlx5_l3t_tbl), 1);
	if (!tbl) {
		rte_errno = ENOMEM;
		return NULL;
	}
	tbl->type = type;
	switch (type) {
	case MLX5_L3T_TYPE_WORD:
		l3t_ip_cfg.size = sizeof(struct mlx5_l3t_entry_word) +
				  sizeof(uint16_t) * MLX5_L3T_ET_SIZE;
		l3t_ip_cfg.type = "mlx5_l3t_e_tbl_w";
		break;
	case MLX5_L3T_TYPE_DWORD:
		l3t_ip_cfg.size = sizeof(struct mlx5_l3t_entry_dword) +
				  sizeof(uint32_t) * MLX5_L3T_ET_SIZE;
		l3t_ip_cfg.type = "mlx5_l3t_e_tbl_dw";
		break;
	case MLX5_L3T_TYPE_QWORD:
		l3t_ip_cfg.size = sizeof(struct mlx5_l3t_entry_qword) +
				  sizeof(uint64_t) * MLX5_L3T_ET_SIZE;
		l3t_ip_cfg.type = "mlx5_l3t_e_tbl_qw";
		break;
	default:
		l3t_ip_cfg.size = sizeof(struct mlx5_l3t_entry_ptr) +
				  sizeof(void *) * MLX5_L3T_ET_SIZE;
		l3t_ip_cfg.type = "mlx5_l3t_e_tbl_ptr";
		break;
	}
	tbl->eip = mlx5_ipool_create(&l3t_ip_cfg);
	if (!tbl->eip) {
		rte_errno = ENOMEM;
		rte_free(tbl);
		tbl = NULL;
	}
	return tbl;
}
void
mlx5_l3t_destroy(struct mlx5_l3t_tbl *tbl)
{
	struct mlx5_l3t_level_tbl *g_tbl, *m_tbl;
	uint32_t i, j;

	if (!tbl)
		return;
	g_tbl = tbl->tbl;
	if (g_tbl) {
		for (i = 0; i < MLX5_L3T_GT_SIZE; i++) {
			m_tbl = g_tbl->tbl[i];
			if (!m_tbl)
				continue;
			for (j = 0; j < MLX5_L3T_MT_SIZE; j++) {
				if (!m_tbl->tbl[j])
					continue;
				MLX5_ASSERT(!((struct mlx5_l3t_entry_word *)
					    m_tbl->tbl[j])->ref_cnt);
				mlx5_ipool_free(tbl->eip,
						((struct mlx5_l3t_entry_word *)
						m_tbl->tbl[j])->idx);
				m_tbl->tbl[j] = NULL;
				if (!(--m_tbl->ref_cnt))
					break;
			}
			MLX5_ASSERT(!m_tbl->ref_cnt);
			rte_free(g_tbl->tbl[i]);
			g_tbl->tbl[i] = NULL;
			if (!(--g_tbl->ref_cnt))
				break;
		}
		MLX5_ASSERT(!g_tbl->ref_cnt);
		rte_free(g_tbl);
		tbl->tbl = NULL;
	}
	mlx5_ipool_destroy(tbl->eip);
	rte_free(tbl);
}
int32_t
mlx5_l3t_get_entry(struct mlx5_l3t_tbl *tbl, uint32_t idx,
		   union mlx5_l3t_data *data)
{
	struct mlx5_l3t_level_tbl *g_tbl, *m_tbl;
	void *e_tbl;
	uint32_t entry_idx;

	g_tbl = tbl->tbl;
	if (!g_tbl)
		return -1;
	m_tbl = g_tbl->tbl[(idx >> MLX5_L3T_GT_OFFSET) & MLX5_L3T_GT_MASK];
	if (!m_tbl)
		return -1;
	e_tbl = m_tbl->tbl[(idx >> MLX5_L3T_MT_OFFSET) & MLX5_L3T_MT_MASK];
	if (!e_tbl)
		return -1;
	entry_idx = idx & MLX5_L3T_ET_MASK;
	switch (tbl->type) {
	case MLX5_L3T_TYPE_WORD:
		data->word = ((struct mlx5_l3t_entry_word *)e_tbl)->entry
			     [entry_idx];
		break;
	case MLX5_L3T_TYPE_DWORD:
		data->dword = ((struct mlx5_l3t_entry_dword *)e_tbl)->entry
			      [entry_idx];
		break;
	case MLX5_L3T_TYPE_QWORD:
		data->qword = ((struct mlx5_l3t_entry_qword *)e_tbl)->entry
			      [entry_idx];
		break;
	default:
		data->ptr = ((struct mlx5_l3t_entry_ptr *)e_tbl)->entry
			    [entry_idx];
		break;
	}
	return 0;
}
void
mlx5_l3t_clear_entry(struct mlx5_l3t_tbl *tbl, uint32_t idx)
{
	struct mlx5_l3t_level_tbl *g_tbl, *m_tbl;
	struct mlx5_l3t_entry_word *w_e_tbl;
	struct mlx5_l3t_entry_dword *dw_e_tbl;
	struct mlx5_l3t_entry_qword *qw_e_tbl;
	struct mlx5_l3t_entry_ptr *ptr_e_tbl;
	void *e_tbl;
	uint32_t entry_idx;
	uint64_t ref_cnt;

	g_tbl = tbl->tbl;
	if (!g_tbl)
		return;
	m_tbl = g_tbl->tbl[(idx >> MLX5_L3T_GT_OFFSET) & MLX5_L3T_GT_MASK];
	if (!m_tbl)
		return;
	e_tbl = m_tbl->tbl[(idx >> MLX5_L3T_MT_OFFSET) & MLX5_L3T_MT_MASK];
	if (!e_tbl)
		return;
	entry_idx = idx & MLX5_L3T_ET_MASK;
	switch (tbl->type) {
	case MLX5_L3T_TYPE_WORD:
		w_e_tbl = (struct mlx5_l3t_entry_word *)e_tbl;
		w_e_tbl->entry[entry_idx] = 0;
		ref_cnt = --w_e_tbl->ref_cnt;
		break;
	case MLX5_L3T_TYPE_DWORD:
		dw_e_tbl = (struct mlx5_l3t_entry_dword *)e_tbl;
		dw_e_tbl->entry[entry_idx] = 0;
		ref_cnt = --dw_e_tbl->ref_cnt;
		break;
	case MLX5_L3T_TYPE_QWORD:
		qw_e_tbl = (struct mlx5_l3t_entry_qword *)e_tbl;
		qw_e_tbl->entry[entry_idx] = 0;
		ref_cnt = --qw_e_tbl->ref_cnt;
		break;
	default:
		ptr_e_tbl = (struct mlx5_l3t_entry_ptr *)e_tbl;
		ptr_e_tbl->entry[entry_idx] = NULL;
		ref_cnt = --ptr_e_tbl->ref_cnt;
		break;
	}
	if (!ref_cnt) {
		mlx5_ipool_free(tbl->eip,
				((struct mlx5_l3t_entry_word *)e_tbl)->idx);
		m_tbl->tbl[(idx >> MLX5_L3T_MT_OFFSET) & MLX5_L3T_MT_MASK] =
									NULL;
		if (!(--m_tbl->ref_cnt)) {
			rte_free(m_tbl);
			g_tbl->tbl
			[(idx >> MLX5_L3T_GT_OFFSET) & MLX5_L3T_GT_MASK] =
									NULL;
			if (!(--g_tbl->ref_cnt)) {
				rte_free(g_tbl);
				tbl->tbl = NULL;
			}
		}
	}
}
int32_t
mlx5_l3t_set_entry(struct mlx5_l3t_tbl *tbl, uint32_t idx,
		   union mlx5_l3t_data *data)
{
	struct mlx5_l3t_level_tbl *g_tbl, *m_tbl;
	struct mlx5_l3t_entry_word *w_e_tbl;
	struct mlx5_l3t_entry_dword *dw_e_tbl;
	struct mlx5_l3t_entry_qword *qw_e_tbl;
	struct mlx5_l3t_entry_ptr *ptr_e_tbl;
	void *e_tbl;
	uint32_t entry_idx, tbl_idx = 0;

	/* Check the global table, create it if empty. */
	g_tbl = tbl->tbl;
	if (!g_tbl) {
		g_tbl = rte_zmalloc(NULL, sizeof(struct mlx5_l3t_level_tbl) +
				    sizeof(void *) * MLX5_L3T_GT_SIZE, 1);
		if (!g_tbl) {
			rte_errno = ENOMEM;
			return -1;
		}
		tbl->tbl = g_tbl;
	}
	/*
	 * Check the middle table, create it if empty. Ref_cnt will be
	 * increased if a new sub table is created.
	 */
	m_tbl = g_tbl->tbl[(idx >> MLX5_L3T_GT_OFFSET) & MLX5_L3T_GT_MASK];
	if (!m_tbl) {
		m_tbl = rte_zmalloc(NULL, sizeof(struct mlx5_l3t_level_tbl) +
				    sizeof(void *) * MLX5_L3T_MT_SIZE, 1);
		if (!m_tbl) {
			rte_errno = ENOMEM;
			return -1;
		}
		g_tbl->tbl[(idx >> MLX5_L3T_GT_OFFSET) & MLX5_L3T_GT_MASK] =
									m_tbl;
		g_tbl->ref_cnt++;
	}
	/*
	 * Check the entry table, create it if empty. Ref_cnt will be
	 * increased if a new sub entry table is created.
	 */
	e_tbl = m_tbl->tbl[(idx >> MLX5_L3T_MT_OFFSET) & MLX5_L3T_MT_MASK];
	if (!e_tbl) {
		e_tbl = mlx5_ipool_zmalloc(tbl->eip, &tbl_idx);
		if (!e_tbl) {
			rte_errno = ENOMEM;
			return -1;
		}
		((struct mlx5_l3t_entry_word *)e_tbl)->idx = tbl_idx;
		m_tbl->tbl[(idx >> MLX5_L3T_MT_OFFSET) & MLX5_L3T_MT_MASK] =
									e_tbl;
		m_tbl->ref_cnt++;
	}
	entry_idx = idx & MLX5_L3T_ET_MASK;
	switch (tbl->type) {
	case MLX5_L3T_TYPE_WORD:
		w_e_tbl = (struct mlx5_l3t_entry_word *)e_tbl;
		w_e_tbl->entry[entry_idx] = data->word;
		w_e_tbl->ref_cnt++;
		break;
	case MLX5_L3T_TYPE_DWORD:
		dw_e_tbl = (struct mlx5_l3t_entry_dword *)e_tbl;
		dw_e_tbl->entry[entry_idx] = data->dword;
		dw_e_tbl->ref_cnt++;
		break;
	case MLX5_L3T_TYPE_QWORD:
		qw_e_tbl = (struct mlx5_l3t_entry_qword *)e_tbl;
		qw_e_tbl->entry[entry_idx] = data->qword;
		qw_e_tbl->ref_cnt++;
		break;
	default:
		ptr_e_tbl = (struct mlx5_l3t_entry_ptr *)e_tbl;
		ptr_e_tbl->entry[entry_idx] = data->ptr;
		ptr_e_tbl->ref_cnt++;
		break;
	}
	return 0;
}
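/*
 * Usage sketch (illustrative only, compiled out by default): storing and
 * retrieving one dword through the three-level table. The guard macro is
 * hypothetical, not part of the driver.
 */
#ifdef MLX5_UTILS_USAGE_EXAMPLES
static int
example_l3t_usage(void)
{
	struct mlx5_l3t_tbl *tbl = mlx5_l3t_create(MLX5_L3T_TYPE_DWORD);
	union mlx5_l3t_data data = { .dword = 0x12345678 };
	union mlx5_l3t_data out = { .dword = 0 };

	if (!tbl)
		return -rte_errno;
	/* The level tables along the index path are created on demand. */
	if (mlx5_l3t_set_entry(tbl, 0x1234, &data))
		goto error;
	if (mlx5_l3t_get_entry(tbl, 0x1234, &out))
		goto error;
	MLX5_ASSERT(out.dword == data.dword);
	/* Clearing the last entry releases the sub tables again. */
	mlx5_l3t_clear_entry(tbl, 0x1234);
	mlx5_l3t_destroy(tbl);
	return 0;
error:
	mlx5_l3t_destroy(tbl);
	return -rte_errno;
}
#endif /* MLX5_UTILS_USAGE_EXAMPLES */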