#ifndef _RTE_RCU_QSBR_H_
#define _RTE_RCU_QSBR_H_

#include <stdbool.h>
#include <stdio.h>
#include <stdint.h>
#include <inttypes.h>

#include <rte_common.h>
#include <rte_debug.h>
#include <rte_atomic.h>
#include <rte_ring.h>
#include <rte_pause.h>

extern int rte_rcu_log_type;
#if RTE_LOG_DP_LEVEL >= RTE_LOG_DEBUG
#define __RTE_RCU_DP_LOG(level, fmt, args...) \
	rte_log(RTE_LOG_ ## level, rte_rcu_log_type, \
		"%s(): " fmt "\n", __func__, ## args)
#else
#define __RTE_RCU_DP_LOG(level, fmt, args...)
#endif
#if defined(RTE_LIBRTE_RCU_DEBUG)
#define __RTE_RCU_IS_LOCK_CNT_ZERO(v, thread_id, level, fmt, args...) do {\
	if (v->qsbr_cnt[thread_id].lock_cnt) \
		rte_log(RTE_LOG_ ## level, rte_rcu_log_type, \
			"%s(): " fmt "\n", __func__, ## args); \
} while (0)
#else
#define __RTE_RCU_IS_LOCK_CNT_ZERO(v, thread_id, level, fmt, args...)
#endif
#define __RTE_QSBR_THRID_ARRAY_ELM_SIZE (sizeof(uint64_t) * 8)
#define __RTE_QSBR_THRID_ARRAY_SIZE(max_threads) \
	RTE_ALIGN(RTE_ALIGN_MUL_CEIL(max_threads, \
		__RTE_QSBR_THRID_ARRAY_ELM_SIZE) >> 3, RTE_CACHE_LINE_SIZE)
#define __RTE_QSBR_THRID_ARRAY_ELM(v, i) ((uint64_t *) \
	((struct rte_rcu_qsbr_cnt *)(v + 1) + v->max_threads) + i)
#define __RTE_QSBR_THRID_INDEX_SHIFT 6
#define __RTE_QSBR_THRID_MASK 0x3f
#define RTE_QSBR_THRID_INVALID 0xffffffff
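
/*
 * Illustrative sketch (not part of this header): how a thread_id maps onto
 * the registered-thread bitmap using the shift/mask macros above. For
 * example, thread_id 70 lands in 64-bit word 1 (70 >> 6) at bit 6 (70 & 0x3f).
 * The helper name is hypothetical.
 */
static inline void
app_thrid_to_bitmap_pos(unsigned int thread_id,
		uint32_t *elem_idx, uint32_t *bit)
{
	/* Index of the 64-bit word holding this thread's registration bit. */
	*elem_idx = thread_id >> __RTE_QSBR_THRID_INDEX_SHIFT;
	/* Bit position of the thread within that word. */
	*bit = thread_id & __RTE_QSBR_THRID_MASK;
}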
/* Worker thread counter */
struct rte_rcu_qsbr_cnt {
	uint64_t cnt;
	/**< Quiescent state counter. Value 0 indicates the thread is offline;
	 *   64b wide to avoid handling counter overflow.
	 */
	uint32_t lock_cnt;
	/**< Lock counter. Used when RTE_LIBRTE_RCU_DEBUG is enabled */
} __rte_cache_aligned;
#define __RTE_QSBR_CNT_THR_OFFLINE 0
#define __RTE_QSBR_CNT_INIT 1
#define __RTE_QSBR_CNT_MAX ((uint64_t)~0)
#define __RTE_QSBR_TOKEN_SIZE sizeof(uint64_t)
/* RTE Quiescent State variable structure. */
struct rte_rcu_qsbr {
	uint64_t token __rte_cache_aligned;
	/**< Counter to allow multiple simultaneous quiescent state queries */
	uint64_t acked_token;
	/**< Least token acked by all the threads in the last call to
	 *   rte_rcu_qsbr_check API.
	 */

	uint32_t num_elems __rte_cache_aligned;
	/**< Number of elements in the thread ID array */
	uint32_t num_threads;
	/**< Number of threads currently using this QS variable */
	uint32_t max_threads;
	/**< Maximum number of threads using this QS variable */

	struct rte_rcu_qsbr_cnt qsbr_cnt[0] __rte_cache_aligned;
	/**< Quiescent state counter array of 'max_threads' elements */
} __rte_cache_aligned;
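
/*
 * Illustrative sketch (not part of this header): allocating and initializing
 * a QSBR variable from application code that includes rte_rcu_qsbr.h and
 * rte_malloc.h. Using rte_zmalloc() is an assumption made for the example;
 * any zeroed, cache-line aligned allocation works.
 */
static struct rte_rcu_qsbr *
app_qsbr_alloc(uint32_t max_threads)
{
	struct rte_rcu_qsbr *v;
	size_t sz;

	/* Size depends on max_threads (counter array + thread ID bitmap). */
	sz = rte_rcu_qsbr_get_memsize(max_threads);
	v = rte_zmalloc(NULL, sz, RTE_CACHE_LINE_SIZE);
	if (v == NULL)
		return NULL;

	if (rte_rcu_qsbr_init(v, max_threads) != 0) {
		rte_free(v);
		return NULL;
	}

	return v;
}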
#define RTE_RCU_QSBR_DQ_NAMESIZE RTE_RING_NAMESIZE
#define RTE_RCU_QSBR_DQ_MT_UNSAFE 1
/* Callback invoked by the defer queue to free resources whose grace period
 * has expired: 'p' is the pointer supplied when the queue was created, 'e'
 * points to the resource data stored in the queue and 'n' is the number of
 * resources to free.
 */
typedef void (*rte_rcu_qsbr_free_resource_t)(void *p, void *e, unsigned int n);

/* Parameters used when creating the defer queue (members not referenced in
 * this excerpt are elided).
 */
struct rte_rcu_qsbr_dq_parameters {
	/* ... */
	uint32_t trigger_reclaim_limit;
	/**< Trigger automatic reclamation once at least this many resources
	 *   are waiting in the defer queue.
	 */
	uint32_t max_reclaim_size;
	/**< Maximum number of resources to reclaim in one go. */
	rte_rcu_qsbr_free_resource_t free_fn;
	/**< Function called to free the resources. */
	struct rte_rcu_qsbr *v;
	/**< RCU QSBR variable to use for this defer queue */
};

/* RTE defer queue structure: holds entries removed from the data structure
 * but not yet freed.
 */
struct rte_rcu_qsbr_dq;
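
/*
 * Illustrative sketch (not part of this header): a writer unlinks an entry
 * from its data structure and defers freeing it through the defer queue
 * instead of blocking for the grace period itself. 'struct app_entry' and
 * app_unlink() are hypothetical application names, and the queue is assumed
 * to have been created with esize == sizeof(void *).
 */
struct app_entry;                          /* hypothetical application type */
void app_unlink(struct app_entry *entry);  /* hypothetical: remove from the structure */

static inline int
app_writer_delete_deferred(struct rte_rcu_qsbr_dq *dq, struct app_entry *entry)
{
	app_unlink(entry);

	/* Copy the pointer into the defer queue; the queue's free_fn callback
	 * frees it once all readers have gone through a quiescent state.
	 */
	return rte_rcu_qsbr_dq_enqueue(dq, &entry);
}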
static __rte_experimental __rte_always_inline void
rte_rcu_qsbr_thread_online(struct rte_rcu_qsbr *v, unsigned int thread_id)
{
	uint64_t t;

	RTE_ASSERT(v != NULL && thread_id < v->max_threads);

	__RTE_RCU_IS_LOCK_CNT_ZERO(v, thread_id, ERR, "Lock counter %u\n",
				v->qsbr_cnt[thread_id].lock_cnt);

	/* Copy the current token and report it as this thread's counter. */
	t = __atomic_load_n(&v->token, __ATOMIC_RELAXED);
	__atomic_store_n(&v->qsbr_cnt[thread_id].cnt, t, __ATOMIC_RELAXED);

	/* Store-load barrier: later loads of the shared data structure must
	 * not move above the store to 'cnt', otherwise the writer may miss
	 * that this reader is online.
	 */
#ifdef RTE_ARCH_X86_64
	/* rte_smp_mb() is lighter than a SEQ_CST fence on x86 */
	rte_smp_mb();
#else
	__atomic_thread_fence(__ATOMIC_SEQ_CST);
#endif
}
static __rte_experimental __rte_always_inline void
rte_rcu_qsbr_thread_offline(struct rte_rcu_qsbr *v, unsigned int thread_id)
{
	RTE_ASSERT(v != NULL && thread_id < v->max_threads);

	__RTE_RCU_IS_LOCK_CNT_ZERO(v, thread_id, ERR, "Lock counter %u\n",
				v->qsbr_cnt[thread_id].lock_cnt);

	/* The store-release ensures prior loads of the shared data structure
	 * complete before the thread is marked offline.
	 */
	__atomic_store_n(&v->qsbr_cnt[thread_id].cnt,
		__RTE_QSBR_CNT_THR_OFFLINE, __ATOMIC_RELEASE);
}
static __rte_experimental __rte_always_inline void
rte_rcu_qsbr_lock(__rte_unused struct rte_rcu_qsbr *v,
			__rte_unused unsigned int thread_id)
{
	RTE_ASSERT(v != NULL && thread_id < v->max_threads);

#if defined(RTE_LIBRTE_RCU_DEBUG)
	/* Increment the per-thread lock counter */
	__atomic_fetch_add(&v->qsbr_cnt[thread_id].lock_cnt,
				1, __ATOMIC_ACQUIRE);
#endif
}
static __rte_experimental __rte_always_inline void
rte_rcu_qsbr_unlock(__rte_unused struct rte_rcu_qsbr *v,
			__rte_unused unsigned int thread_id)
{
	RTE_ASSERT(v != NULL && thread_id < v->max_threads);

#if defined(RTE_LIBRTE_RCU_DEBUG)
	/* Decrement the per-thread lock counter */
	__atomic_fetch_sub(&v->qsbr_cnt[thread_id].lock_cnt,
				1, __ATOMIC_RELEASE);

	__RTE_RCU_IS_LOCK_CNT_ZERO(v, thread_id, WARNING,
				"Lock counter %u. Nested locks?\n",
				v->qsbr_cnt[thread_id].lock_cnt);
#endif
}
static __rte_experimental __rte_always_inline uint64_t
rte_rcu_qsbr_start(struct rte_rcu_qsbr *v)
{
	uint64_t t;

	RTE_ASSERT(v != NULL);

	/* Release prior writes to the shared data structure before the new
	 * token becomes visible to the readers.
	 */
	t = __atomic_add_fetch(&v->token, 1, __ATOMIC_RELEASE);

	return t;
}
static __rte_experimental __rte_always_inline void
rte_rcu_qsbr_quiescent(struct rte_rcu_qsbr *v, unsigned int thread_id)
{
	uint64_t t;

	RTE_ASSERT(v != NULL && thread_id < v->max_threads);

	__RTE_RCU_IS_LOCK_CNT_ZERO(v, thread_id, ERR, "Lock counter %u\n",
				v->qsbr_cnt[thread_id].lock_cnt);

	/* Acquire the token released by rte_rcu_qsbr_start(); later loads of
	 * the shared data structure must not move above this load.
	 */
	t = __atomic_load_n(&v->token, __ATOMIC_ACQUIRE);

	/* Inform the writer that updates are visible to this reader.
	 * Prior loads of the shared data structure must not move beyond
	 * this store; hence the store-release.
	 */
	if (t != __atomic_load_n(&v->qsbr_cnt[thread_id].cnt, __ATOMIC_RELAXED))
		__atomic_store_n(&v->qsbr_cnt[thread_id].cnt,
					 t, __ATOMIC_RELEASE);

	__RTE_RCU_DP_LOG(DEBUG, "%s: update: token = %"PRIu64", Thread ID = %d",
		__func__, t, thread_id);
}
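
/*
 * Illustrative reader-side sketch (not part of this header): a typical
 * polling-thread loop built on the inline functions above. app_keep_running()
 * and app_lookup() are hypothetical application calls; registration uses the
 * rte_rcu_qsbr_thread_register()/unregister() APIs declared further below.
 */
int app_keep_running(void);   /* hypothetical termination condition */
void app_lookup(void);        /* hypothetical read-side access */

static void
app_reader_loop(struct rte_rcu_qsbr *v, unsigned int thread_id)
{
	rte_rcu_qsbr_thread_register(v, thread_id);
	rte_rcu_qsbr_thread_online(v, thread_id);

	while (app_keep_running()) {
		rte_rcu_qsbr_lock(v, thread_id);   /* no-op unless RCU debug is enabled */
		app_lookup();                      /* read the shared data structure */
		rte_rcu_qsbr_unlock(v, thread_id);

		/* Report a quiescent state once no references are held. */
		rte_rcu_qsbr_quiescent(v, thread_id);
	}

	rte_rcu_qsbr_thread_offline(v, thread_id);
	rte_rcu_qsbr_thread_unregister(v, thread_id);
}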
/* Check the quiescent state counters of registered threads only, assuming
 * that not all threads have registered.
 */
static __rte_always_inline int
__rte_rcu_qsbr_check_selective(struct rte_rcu_qsbr *v, uint64_t t, bool wait)
{
	uint32_t i, j, id;
	uint64_t bmap;
	uint64_t c;
	uint64_t *reg_thread_id;
	uint64_t acked_token = __RTE_QSBR_CNT_MAX;

	for (i = 0, reg_thread_id = __RTE_QSBR_THRID_ARRAY_ELM(v, 0);
		i < v->num_elems;
		i++, reg_thread_id++) {
		/* Load the registered thread bitmap before the counters. */
		bmap = __atomic_load_n(reg_thread_id, __ATOMIC_ACQUIRE);
		id = i << __RTE_QSBR_THRID_INDEX_SHIFT;

		while (bmap) {
			j = __builtin_ctzl(bmap);
			__RTE_RCU_DP_LOG(DEBUG,
				"%s: check: token = %"PRIu64", wait = %d, Bit Map = 0x%"PRIx64", Thread ID = %d",
				__func__, t, wait, bmap, id + j);
			c = __atomic_load_n(
					&v->qsbr_cnt[id + j].cnt,
					__ATOMIC_ACQUIRE);
			__RTE_RCU_DP_LOG(DEBUG,
				"%s: status: token = %"PRIu64", wait = %d, Thread QS cnt = %"PRIu64", Thread ID = %d",
				__func__, t, wait, c, id + j);

			/* 64b counter; wrap-around is not checked. */
			if (unlikely(c !=
				__RTE_QSBR_CNT_THR_OFFLINE && c < t)) {
				/* This thread is not in quiescent state */
				if (!wait)
					return 0;

				rte_pause();
				/* This thread might have unregistered.
				 * Re-read the bitmap.
				 */
				bmap = __atomic_load_n(reg_thread_id,
						__ATOMIC_ACQUIRE);
				continue;
			}

			/* In quiescent state: track the least acked token. */
			if (c != __RTE_QSBR_CNT_THR_OFFLINE && acked_token > c)
				acked_token = c;

			bmap &= ~(1UL << j);
		}
	}

	/* All readers checked; update the least acknowledged token. */
	if (acked_token != __RTE_QSBR_CNT_MAX)
		__atomic_store_n(&v->acked_token, acked_token,
			__ATOMIC_RELAXED);

	return 1;
}
/* Check the quiescent state counters of all threads, assuming that all the
 * reader threads have registered.
 */
static __rte_always_inline int
__rte_rcu_qsbr_check_all(struct rte_rcu_qsbr *v, uint64_t t, bool wait)
{
	uint32_t i;
	struct rte_rcu_qsbr_cnt *cnt;
	uint64_t c;
	uint64_t acked_token = __RTE_QSBR_CNT_MAX;

	for (i = 0, cnt = v->qsbr_cnt; i < v->max_threads; i++, cnt++) {
		__RTE_RCU_DP_LOG(DEBUG,
			"%s: check: token = %"PRIu64", wait = %d, Thread ID = %d",
			__func__, t, wait, i);
		while (1) {
			c = __atomic_load_n(&cnt->cnt, __ATOMIC_ACQUIRE);
			__RTE_RCU_DP_LOG(DEBUG,
				"%s: status: token = %"PRIu64", wait = %d, Thread QS cnt = %"PRIu64", Thread ID = %d",
				__func__, t, wait, c, i);

			/* 64b counter; wrap-around is not checked. */
			if (likely(c == __RTE_QSBR_CNT_THR_OFFLINE || c >= t))
				break;

			/* This thread is not in quiescent state */
			if (!wait)
				return 0;

			rte_pause();
		}

		/* In quiescent state: track the least acked token. */
		if (likely(c != __RTE_QSBR_CNT_THR_OFFLINE && acked_token > c))
			acked_token = c;
	}

	/* All readers checked; update the least acknowledged token. */
	if (acked_token != __RTE_QSBR_CNT_MAX)
		__atomic_store_n(&v->acked_token, acked_token,
			__ATOMIC_RELAXED);

	return 1;
}
static __rte_experimental __rte_always_inline int
rte_rcu_qsbr_check(struct rte_rcu_qsbr *v, uint64_t t, bool wait)
{
	RTE_ASSERT(v != NULL);

	/* Check if all readers have already acknowledged this token. */
	if (likely(t <= v->acked_token)) {
		__RTE_RCU_DP_LOG(DEBUG,
			"%s: check: token = %"PRIu64", wait = %d",
			__func__, t, wait);
		__RTE_RCU_DP_LOG(DEBUG,
			"%s: status: least acked token = %"PRIu64,
			__func__, v->acked_token);
		return 1;
	}

	if (likely(v->num_threads == v->max_threads))
		return __rte_rcu_qsbr_check_all(v, t, wait);
	else
		return __rte_rcu_qsbr_check_selective(v, t, wait);
}
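
/*
 * Illustrative writer-side sketch (not part of this header): remove an entry
 * from the shared structure, then wait for all readers before freeing it.
 * 'struct app_node', app_remove() and app_free() are hypothetical.
 */
struct app_node;                        /* hypothetical application type */
void app_remove(struct app_node *n);    /* hypothetical: unlink from the structure */
void app_free(struct app_node *n);      /* hypothetical: release the memory */

static void
app_writer_delete_blocking(struct rte_rcu_qsbr *v, struct app_node *n)
{
	uint64_t token;

	app_remove(n);                      /* readers can no longer find 'n' */
	token = rte_rcu_qsbr_start(v);      /* start the grace period */
	rte_rcu_qsbr_check(v, token, true); /* wait until all readers acked */
	app_free(n);                        /* now safe to free */
}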
__rte_experimental
struct rte_rcu_qsbr_dq *
rte_rcu_qsbr_dq_create(const struct rte_rcu_qsbr_dq_parameters *params);
__rte_experimental
int
rte_rcu_qsbr_dq_reclaim(struct rte_rcu_qsbr_dq *dq, unsigned int n,
		unsigned int *freed, unsigned int *pending,
		unsigned int *available);
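
/*
 * Illustrative sketch (not part of this header): explicitly reclaim up to 32
 * resources whose grace period has expired, e.g. from a housekeeping thread.
 * The counts are only printed here, and the batch size is an arbitrary choice
 * for the example.
 */
static inline void
app_dq_reclaim_some(struct rte_rcu_qsbr_dq *dq)
{
	unsigned int freed, pending, available;

	if (rte_rcu_qsbr_dq_reclaim(dq, 32, &freed, &pending,
			&available) == 0)
		printf("reclaimed %u, %u still pending, %u slots free\n",
			freed, pending, available);
}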
/* Remaining public API declared by this header. */

__rte_experimental
size_t
rte_rcu_qsbr_get_memsize(uint32_t max_threads);

__rte_experimental
int
rte_rcu_qsbr_init(struct rte_rcu_qsbr *v, uint32_t max_threads);

__rte_experimental
int
rte_rcu_qsbr_thread_register(struct rte_rcu_qsbr *v, unsigned int thread_id);

__rte_experimental
int
rte_rcu_qsbr_thread_unregister(struct rte_rcu_qsbr *v, unsigned int thread_id);

__rte_experimental
void
rte_rcu_qsbr_synchronize(struct rte_rcu_qsbr *v, unsigned int thread_id);

__rte_experimental
int
rte_rcu_qsbr_dump(FILE *f, struct rte_rcu_qsbr *v);

__rte_experimental
int
rte_rcu_qsbr_dq_enqueue(struct rte_rcu_qsbr_dq *dq, void *e);

__rte_experimental
int
rte_rcu_qsbr_dq_delete(struct rte_rcu_qsbr_dq *dq);

#endif /* _RTE_RCU_QSBR_H_ */