DPDK 17.08.2
rte_ring.h
/*-
 *   BSD LICENSE
 *
 *   Copyright(c) 2010-2017 Intel Corporation. All rights reserved.
 *   All rights reserved.
 *
 *   Redistribution and use in source and binary forms, with or without
 *   modification, are permitted provided that the following conditions
 *   are met:
 *
 *     * Redistributions of source code must retain the above copyright
 *       notice, this list of conditions and the following disclaimer.
 *     * Redistributions in binary form must reproduce the above copyright
 *       notice, this list of conditions and the following disclaimer in
 *       the documentation and/or other materials provided with the
 *       distribution.
 *     * Neither the name of Intel Corporation nor the names of its
 *       contributors may be used to endorse or promote products derived
 *       from this software without specific prior written permission.
 *
 *   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 *   "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 *   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 *   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 *   OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 *   SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 *   LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 *   DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 *   THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 *   (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 *   OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */

/*
 * Derived from FreeBSD's bufring.h
 *
 **************************************************************************
 *
 * Copyright (c) 2007-2009 Kip Macy kmacy@freebsd.org
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 * 1. Redistributions of source code must retain the above copyright notice,
 *    this list of conditions and the following disclaimer.
 *
 * 2. The name of Kip Macy nor the names of other
 *    contributors may be used to endorse or promote products derived from
 *    this software without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 *
 ***************************************************************************/

#ifndef _RTE_RING_H_
#define _RTE_RING_H_

#ifdef __cplusplus
extern "C" {
#endif

#include <stdio.h>
#include <stdint.h>
#include <sys/queue.h>
#include <errno.h>
#include <rte_common.h>
#include <rte_memory.h>
#include <rte_lcore.h>
#include <rte_atomic.h>
#include <rte_branch_prediction.h>
#include <rte_memzone.h>
#include <rte_pause.h>

#define RTE_TAILQ_RING_NAME "RTE_RING"

enum rte_ring_queue_behavior {
    RTE_RING_QUEUE_FIXED = 0, /* Enq/Deq a fixed number of items from a ring */
    RTE_RING_QUEUE_VARIABLE   /* Enq/Deq as many items as possible from ring */
};

#define RTE_RING_MZ_PREFIX "RG_"

#define RTE_RING_NAMESIZE (RTE_MEMZONE_NAMESIZE - \
                           sizeof(RTE_RING_MZ_PREFIX) + 1)

struct rte_memzone; /* forward declaration, so as not to require memzone.h */

#if RTE_CACHE_LINE_SIZE < 128
#define PROD_ALIGN (RTE_CACHE_LINE_SIZE * 2)
#define CONS_ALIGN (RTE_CACHE_LINE_SIZE * 2)
#else
#define PROD_ALIGN RTE_CACHE_LINE_SIZE
#define CONS_ALIGN RTE_CACHE_LINE_SIZE
#endif

/* structure to hold a pair of head/tail values and other metadata */
struct rte_ring_headtail {
    volatile uint32_t head;  /* producer/consumer head */
    volatile uint32_t tail;  /* producer/consumer tail */
    uint32_t single;         /* true if single producer/consumer */
};

struct rte_ring {
    /*
     * Note: this field kept the RTE_MEMZONE_NAMESIZE size due to ABI
     * compatibility requirements, it could be changed to RTE_RING_NAMESIZE
     * next time the ABI changes
     */
    char name[RTE_MEMZONE_NAMESIZE] __rte_cache_aligned; /* Name of the ring. */
    int flags;                         /* Flags supplied at creation. */
    const struct rte_memzone *memzone; /* Memzone, if any, containing the rte_ring */
    uint32_t size;                     /* Size of ring. */
    uint32_t mask;                     /* Mask (size-1) of ring. */
    uint32_t capacity;                 /* Usable size of ring */

    /* Ring producer status. */
    struct rte_ring_headtail prod __rte_aligned(PROD_ALIGN);

    /* Ring consumer status. */
    struct rte_ring_headtail cons __rte_aligned(CONS_ALIGN);
};

#define RING_F_SP_ENQ 0x0001 /* The default enqueue is "single-producer". */
#define RING_F_SC_DEQ 0x0002 /* The default dequeue is "single-consumer". */
#define RING_F_EXACT_SZ 0x0004 /* Ring holds exactly the requested number of entries. */
#define RTE_RING_SZ_MASK (unsigned)(0x0fffffff)

/* @internal defines for passing to the enqueue/dequeue worker functions */
#define __IS_SP 1
#define __IS_MP 0
#define __IS_SC 1
#define __IS_MC 0

ssize_t rte_ring_get_memsize(unsigned count);

int rte_ring_init(struct rte_ring *r, const char *name, unsigned count,
                  unsigned flags);

struct rte_ring *rte_ring_create(const char *name, unsigned count,
                                 int socket_id, unsigned flags);
void rte_ring_free(struct rte_ring *r);

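/*
 * Illustrative sketch (not part of the original header): creating a ring at
 * initialization time. The name "example_ring" and the size of 1024 are
 * arbitrary assumptions; RING_F_SP_ENQ | RING_F_SC_DEQ restricts the ring to
 * one producer and one consumer thread.
 */
static struct rte_ring *
example_ring_setup(void)
{
    /* With the default (power-of-2) sizing, a ring of size 1024 can hold at
     * most 1023 entries; pass RING_F_EXACT_SZ to get exactly 1024 usable. */
    struct rte_ring *r = rte_ring_create("example_ring", 1024,
                                         rte_socket_id(),
                                         RING_F_SP_ENQ | RING_F_SC_DEQ);
    if (r == NULL)
        return NULL; /* creation failed, e.g. name already exists or no memory */
    return r;
}
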
void rte_ring_dump(FILE *f, const struct rte_ring *r);

/* the actual enqueue of pointers on the ring.
 * Placed here since identical code needed in both
 * single and multi producer enqueue functions */
#define ENQUEUE_PTRS(r, ring_start, prod_head, obj_table, n, obj_type) do { \
    unsigned int i; \
    const uint32_t size = (r)->size; \
    uint32_t idx = prod_head & (r)->mask; \
    obj_type *ring = (obj_type *)ring_start; \
    if (likely(idx + n < size)) { \
        for (i = 0; i < (n & ((~(unsigned)0x3))); i += 4, idx += 4) { \
            ring[idx] = obj_table[i]; \
            ring[idx + 1] = obj_table[i + 1]; \
            ring[idx + 2] = obj_table[i + 2]; \
            ring[idx + 3] = obj_table[i + 3]; \
        } \
        switch (n & 0x3) { \
        case 3: \
            ring[idx++] = obj_table[i++]; /* fallthrough */ \
        case 2: \
            ring[idx++] = obj_table[i++]; /* fallthrough */ \
        case 1: \
            ring[idx++] = obj_table[i++]; \
        } \
    } else { \
        for (i = 0; idx < size; i++, idx++) \
            ring[idx] = obj_table[i]; \
        for (idx = 0; i < n; i++, idx++) \
            ring[idx] = obj_table[i]; \
    } \
} while (0)

/* the actual copy of pointers on the ring to obj_table.
 * Placed here since identical code needed in both
 * single and multi consumer dequeue functions */
#define DEQUEUE_PTRS(r, ring_start, cons_head, obj_table, n, obj_type) do { \
    unsigned int i; \
    uint32_t idx = cons_head & (r)->mask; \
    const uint32_t size = (r)->size; \
    obj_type *ring = (obj_type *)ring_start; \
    if (likely(idx + n < size)) { \
        for (i = 0; i < (n & (~(unsigned)0x3)); i += 4, idx += 4) { \
            obj_table[i] = ring[idx]; \
            obj_table[i + 1] = ring[idx + 1]; \
            obj_table[i + 2] = ring[idx + 2]; \
            obj_table[i + 3] = ring[idx + 3]; \
        } \
        switch (n & 0x3) { \
        case 3: \
            obj_table[i++] = ring[idx++]; /* fallthrough */ \
        case 2: \
            obj_table[i++] = ring[idx++]; /* fallthrough */ \
        case 1: \
            obj_table[i++] = ring[idx++]; \
        } \
    } else { \
        for (i = 0; idx < size; i++, idx++) \
            obj_table[i] = ring[idx]; \
        for (idx = 0; i < n; i++, idx++) \
            obj_table[i] = ring[idx]; \
    } \
} while (0)

static __rte_always_inline void
update_tail(struct rte_ring_headtail *ht, uint32_t old_val, uint32_t new_val,
            uint32_t single)
{
    /*
     * If there are other enqueues/dequeues in progress that preceded us,
     * we need to wait for them to complete
     */
    if (!single)
        while (unlikely(ht->tail != old_val))
            rte_pause();

    ht->tail = new_val;
}

static __rte_always_inline unsigned int
__rte_ring_move_prod_head(struct rte_ring *r, int is_sp,
        unsigned int n, enum rte_ring_queue_behavior behavior,
        uint32_t *old_head, uint32_t *new_head,
        uint32_t *free_entries)
{
    const uint32_t capacity = r->capacity;
    unsigned int max = n;
    int success;

    do {
        /* Reset n to the initial burst count */
        n = max;

        *old_head = r->prod.head;
        const uint32_t cons_tail = r->cons.tail;
        /*
         * The subtraction is done between two unsigned 32bits value
         * (the result is always modulo 32 bits even if we have
         * *old_head > cons_tail). So 'free_entries' is always between 0
         * and capacity (which is < size).
         */
        *free_entries = (capacity + cons_tail - *old_head);

        /* check that we have enough room in ring */
        if (unlikely(n > *free_entries))
            n = (behavior == RTE_RING_QUEUE_FIXED) ?
                    0 : *free_entries;

        if (n == 0)
            return 0;

        *new_head = *old_head + n;
        if (is_sp)
            r->prod.head = *new_head, success = 1;
        else
            success = rte_atomic32_cmpset(&r->prod.head,
                    *old_head, *new_head);
    } while (unlikely(success == 0));
    return n;
}

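/*
 * Illustrative sketch (not part of the original header): the unsigned 32-bit
 * subtraction above stays correct even after the head/tail counters wrap
 * around UINT32_MAX, because the difference is taken modulo 2^32. The values
 * below are made-up examples.
 */
static inline uint32_t
example_free_entries(uint32_t capacity, uint32_t cons_tail, uint32_t prod_head)
{
    /* e.g. capacity = 1024, cons_tail = 4294967290 (not yet wrapped),
     * prod_head = 10 (already wrapped): 16 entries are in use, and
     * (1024 + 4294967290 - 10) mod 2^32 = 1008 entries are free. */
    return capacity + cons_tail - prod_head;
}
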
static __rte_always_inline unsigned int
__rte_ring_do_enqueue(struct rte_ring *r, void * const *obj_table,
        unsigned int n, enum rte_ring_queue_behavior behavior,
        int is_sp, unsigned int *free_space)
{
    uint32_t prod_head, prod_next;
    uint32_t free_entries;

    n = __rte_ring_move_prod_head(r, is_sp, n, behavior,
            &prod_head, &prod_next, &free_entries);
    if (n == 0)
        goto end;

    ENQUEUE_PTRS(r, &r[1], prod_head, obj_table, n, void *);
    rte_smp_wmb();

    update_tail(&r->prod, prod_head, prod_next, is_sp);
end:
    if (free_space != NULL)
        *free_space = free_entries - n;
    return n;
}

static __rte_always_inline unsigned int
__rte_ring_move_cons_head(struct rte_ring *r, int is_sc,
        unsigned int n, enum rte_ring_queue_behavior behavior,
        uint32_t *old_head, uint32_t *new_head,
        uint32_t *entries)
{
    unsigned int max = n;
    int success;

    /* move cons.head atomically */
    do {
        /* Restore n as it may change every loop */
        n = max;

        *old_head = r->cons.head;
        const uint32_t prod_tail = r->prod.tail;
        /* The subtraction is done between two unsigned 32bits value
         * (the result is always modulo 32 bits even if we have
         * cons_head > prod_tail). So 'entries' is always between 0
         * and size(ring)-1. */
        *entries = (prod_tail - *old_head);

        /* Set the actual entries for dequeue */
        if (n > *entries)
            n = (behavior == RTE_RING_QUEUE_FIXED) ? 0 : *entries;

        if (unlikely(n == 0))
            return 0;

        *new_head = *old_head + n;
        if (is_sc)
            r->cons.head = *new_head, success = 1;
        else
            success = rte_atomic32_cmpset(&r->cons.head, *old_head,
                    *new_head);
    } while (unlikely(success == 0));
    return n;
}

static __rte_always_inline unsigned int
__rte_ring_do_dequeue(struct rte_ring *r, void **obj_table,
        unsigned int n, enum rte_ring_queue_behavior behavior,
        int is_sc, unsigned int *available)
{
    uint32_t cons_head, cons_next;
    uint32_t entries;

    n = __rte_ring_move_cons_head(r, is_sc, n, behavior,
            &cons_head, &cons_next, &entries);
    if (n == 0)
        goto end;

    DEQUEUE_PTRS(r, &r[1], cons_head, obj_table, n, void *);
    rte_smp_rmb();

    update_tail(&r->cons, cons_head, cons_next, is_sc);

end:
    if (available != NULL)
        *available = entries - n;
    return n;
}

static __rte_always_inline unsigned int
rte_ring_mp_enqueue_bulk(struct rte_ring *r, void * const *obj_table,
        unsigned int n, unsigned int *free_space)
{
    return __rte_ring_do_enqueue(r, obj_table, n, RTE_RING_QUEUE_FIXED,
            __IS_MP, free_space);
}

static __rte_always_inline unsigned int
rte_ring_sp_enqueue_bulk(struct rte_ring *r, void * const *obj_table,
        unsigned int n, unsigned int *free_space)
{
    return __rte_ring_do_enqueue(r, obj_table, n, RTE_RING_QUEUE_FIXED,
            __IS_SP, free_space);
}

static __rte_always_inline unsigned int
rte_ring_enqueue_bulk(struct rte_ring *r, void * const *obj_table,
        unsigned int n, unsigned int *free_space)
{
    return __rte_ring_do_enqueue(r, obj_table, n, RTE_RING_QUEUE_FIXED,
            r->prod.single, free_space);
}

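/*
 * Illustrative sketch (not part of the original header): bulk enqueue is
 * all-or-nothing, so a return value of 0 means none of the objects were
 * placed on the ring. The wrapper name and error-handling policy here are
 * assumptions.
 */
static inline int
example_enqueue_bulk(struct rte_ring *r, void *objs[], unsigned int count)
{
    unsigned int free_space;

    if (rte_ring_enqueue_bulk(r, objs, count, &free_space) == 0)
        return -ENOBUFS;  /* ring too full to take 'count' objects at once */
    /* free_space now holds the number of slots left after the enqueue */
    return 0;
}
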
static __rte_always_inline int
rte_ring_mp_enqueue(struct rte_ring *r, void *obj)
{
    return rte_ring_mp_enqueue_bulk(r, &obj, 1, NULL) ? 0 : -ENOBUFS;
}

static __rte_always_inline int
rte_ring_sp_enqueue(struct rte_ring *r, void *obj)
{
    return rte_ring_sp_enqueue_bulk(r, &obj, 1, NULL) ? 0 : -ENOBUFS;
}

static __rte_always_inline int
rte_ring_enqueue(struct rte_ring *r, void *obj)
{
    return rte_ring_enqueue_bulk(r, &obj, 1, NULL) ? 0 : -ENOBUFS;
}

static __rte_always_inline unsigned int
rte_ring_mc_dequeue_bulk(struct rte_ring *r, void **obj_table,
        unsigned int n, unsigned int *available)
{
    return __rte_ring_do_dequeue(r, obj_table, n, RTE_RING_QUEUE_FIXED,
            __IS_MC, available);
}

static __rte_always_inline unsigned int
rte_ring_sc_dequeue_bulk(struct rte_ring *r, void **obj_table,
        unsigned int n, unsigned int *available)
{
    return __rte_ring_do_dequeue(r, obj_table, n, RTE_RING_QUEUE_FIXED,
            __IS_SC, available);
}

static __rte_always_inline unsigned int
rte_ring_dequeue_bulk(struct rte_ring *r, void **obj_table, unsigned int n,
        unsigned int *available)
{
    return __rte_ring_do_dequeue(r, obj_table, n, RTE_RING_QUEUE_FIXED,
            r->cons.single, available);
}

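/*
 * Illustrative sketch (not part of the original header): like the bulk
 * enqueue, the bulk dequeue is all-or-nothing; it returns 0 when fewer than
 * 'count' objects are available and leaves the ring untouched. The wrapper
 * name is an assumption.
 */
static inline int
example_dequeue_bulk(struct rte_ring *r, void *objs[], unsigned int count)
{
    unsigned int remaining;

    if (rte_ring_dequeue_bulk(r, objs, count, &remaining) == 0)
        return -ENOENT;   /* fewer than 'count' objects on the ring */
    /* remaining now holds the number of objects still left on the ring */
    return 0;
}
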
static __rte_always_inline int
rte_ring_mc_dequeue(struct rte_ring *r, void **obj_p)
{
    return rte_ring_mc_dequeue_bulk(r, obj_p, 1, NULL) ? 0 : -ENOENT;
}

static __rte_always_inline int
rte_ring_sc_dequeue(struct rte_ring *r, void **obj_p)
{
    return rte_ring_sc_dequeue_bulk(r, obj_p, 1, NULL) ? 0 : -ENOENT;
}

static __rte_always_inline int
rte_ring_dequeue(struct rte_ring *r, void **obj_p)
{
    return rte_ring_dequeue_bulk(r, obj_p, 1, NULL) ? 0 : -ENOENT;
}

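/*
 * Illustrative sketch (not part of the original header): single-object
 * enqueue/dequeue returns 0 on success and a negative errno on failure
 * (-ENOBUFS when the ring is full, -ENOENT when it is empty). The function
 * name is an assumption.
 */
static inline void
example_single_object(struct rte_ring *r, void *obj)
{
    void *out = NULL;

    if (rte_ring_enqueue(r, obj) < 0) {
        /* ring full: drop, retry later, or back-pressure the producer */
        return;
    }
    if (rte_ring_dequeue(r, &out) == 0) {
        /* out now points to the oldest object on the ring (FIFO order) */
    }
}
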
static inline unsigned
rte_ring_count(const struct rte_ring *r)
{
    uint32_t prod_tail = r->prod.tail;
    uint32_t cons_tail = r->cons.tail;
    uint32_t count = (prod_tail - cons_tail) & r->mask;
    return (count > r->capacity) ? r->capacity : count;
}

static inline unsigned
rte_ring_free_count(const struct rte_ring *r)
{
    return r->capacity - rte_ring_count(r);
}

static inline int
rte_ring_full(const struct rte_ring *r)
{
    return rte_ring_free_count(r) == 0;
}

static inline int
rte_ring_empty(const struct rte_ring *r)
{
    return rte_ring_count(r) == 0;
}

static inline unsigned int
rte_ring_get_size(const struct rte_ring *r)
{
    return r->size;
}

static inline unsigned int
rte_ring_get_capacity(const struct rte_ring *r)
{
    return r->capacity;
}

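/*
 * Illustrative sketch (not part of the original header): the state queries
 * above are snapshots only; with concurrent producers or consumers the
 * values may already be stale when they are used. The function name is an
 * assumption.
 */
static inline void
example_ring_stats(const struct rte_ring *r, FILE *f)
{
    fprintf(f, "size=%u capacity=%u used=%u free=%u full=%d empty=%d\n",
            rte_ring_get_size(r), rte_ring_get_capacity(r),
            rte_ring_count(r), rte_ring_free_count(r),
            rte_ring_full(r), rte_ring_empty(r));
}
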
void rte_ring_list_dump(FILE *f);

struct rte_ring *rte_ring_lookup(const char *name);

static __rte_always_inline unsigned
rte_ring_mp_enqueue_burst(struct rte_ring *r, void * const *obj_table,
        unsigned int n, unsigned int *free_space)
{
    return __rte_ring_do_enqueue(r, obj_table, n,
            RTE_RING_QUEUE_VARIABLE, __IS_MP, free_space);
}

static __rte_always_inline unsigned
rte_ring_sp_enqueue_burst(struct rte_ring *r, void * const *obj_table,
        unsigned int n, unsigned int *free_space)
{
    return __rte_ring_do_enqueue(r, obj_table, n,
            RTE_RING_QUEUE_VARIABLE, __IS_SP, free_space);
}

static __rte_always_inline unsigned
rte_ring_enqueue_burst(struct rte_ring *r, void * const *obj_table,
        unsigned int n, unsigned int *free_space)
{
    return __rte_ring_do_enqueue(r, obj_table, n, RTE_RING_QUEUE_VARIABLE,
            r->prod.single, free_space);
}

static __rte_always_inline unsigned
rte_ring_mc_dequeue_burst(struct rte_ring *r, void **obj_table,
        unsigned int n, unsigned int *available)
{
    return __rte_ring_do_dequeue(r, obj_table, n,
            RTE_RING_QUEUE_VARIABLE, __IS_MC, available);
}

static __rte_always_inline unsigned
rte_ring_sc_dequeue_burst(struct rte_ring *r, void **obj_table,
        unsigned int n, unsigned int *available)
{
    return __rte_ring_do_dequeue(r, obj_table, n,
            RTE_RING_QUEUE_VARIABLE, __IS_SC, available);
}

static __rte_always_inline unsigned
rte_ring_dequeue_burst(struct rte_ring *r, void **obj_table,
        unsigned int n, unsigned int *available)
{
    return __rte_ring_do_dequeue(r, obj_table, n,
            RTE_RING_QUEUE_VARIABLE,
            r->cons.single, available);
}

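/*
 * Illustrative sketch (not part of the original header): a typical consumer
 * loop using the burst API, which dequeues "up to" a batch of objects per
 * call instead of failing when fewer are available. EXAMPLE_BURST and
 * example_process() stand in for the application's batch size and per-object
 * work.
 */
#define EXAMPLE_BURST 32

static inline void
example_consume_loop(struct rte_ring *r,
        void (*example_process)(void *obj))
{
    void *objs[EXAMPLE_BURST];
    unsigned int i, nb;

    for (;;) {
        nb = rte_ring_dequeue_burst(r, objs, EXAMPLE_BURST, NULL);
        if (nb == 0)
            break;            /* ring drained for now */
        for (i = 0; i < nb; i++)
            example_process(objs[i]);
    }
}
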
#ifdef __cplusplus
}
#endif

#endif /* _RTE_RING_H_ */