DPDK  23.03.0
rte_vhost.h
Go to the documentation of this file.
1 /* SPDX-License-Identifier: BSD-3-Clause
2  * Copyright(c) 2010-2017 Intel Corporation
3  */
4 
5 #ifndef _RTE_VHOST_H_
6 #define _RTE_VHOST_H_
7 
13 #include <stdbool.h>
14 #include <stdint.h>
15 #include <sys/eventfd.h>
16 
17 #include <rte_compat.h>
18 #include <rte_memory.h>
19 #include <rte_mempool.h>
20 
21 #ifdef __cplusplus
22 extern "C" {
23 #endif
24 
25 #ifndef __cplusplus
26 /* These are not C++-aware. */
27 #include <linux/vhost.h>
28 #include <linux/virtio_ring.h>
29 #include <linux/virtio_net.h>
30 #endif
31 
/*
 * Option bits named RTE_VHOST_USER_*: each macro is a distinct single bit of
 * an unsigned 64-bit value (1ULL << n), so several can be OR-ed into one mask.
 * NOTE(review): presumably these are the values accepted by the `flags`
 * argument of rte_vhost_driver_register() -- confirm.
 */
32 #define RTE_VHOST_USER_CLIENT (1ULL << 0)
33 #define RTE_VHOST_USER_NO_RECONNECT (1ULL << 1)
34 #define RTE_VHOST_USER_RESERVED_1 (1ULL << 2)
35 #define RTE_VHOST_USER_IOMMU_SUPPORT (1ULL << 3)
36 #define RTE_VHOST_USER_POSTCOPY_SUPPORT (1ULL << 4)
37 /* support mbuf with external buffer attached */
38 #define RTE_VHOST_USER_EXTBUF_SUPPORT (1ULL << 5)
39 /* support only linear buffers (no chained mbufs) */
40 #define RTE_VHOST_USER_LINEARBUF_SUPPORT (1ULL << 6)
41 #define RTE_VHOST_USER_ASYNC_COPY (1ULL << 7)
42 #define RTE_VHOST_USER_NET_COMPLIANT_OL_FLAGS (1ULL << 8)
43 #define RTE_VHOST_USER_NET_STATS_ENABLE (1ULL << 9)
44 
45 /* Features: fallback values; each macro is defined only if the name is not already defined. */
/* NOTE(review): presumably the virtio feature bit numbers normally supplied by the <linux/virtio_*.h> headers included above -- confirm. */
46 #ifndef VIRTIO_NET_F_GUEST_ANNOUNCE
47  #define VIRTIO_NET_F_GUEST_ANNOUNCE 21
48 #endif
49 
50 #ifndef VIRTIO_NET_F_MQ
51  #define VIRTIO_NET_F_MQ 22
52 #endif
53 
54 #ifndef VIRTIO_NET_F_MTU
55  #define VIRTIO_NET_F_MTU 3
56 #endif
57 
58 #ifndef VIRTIO_F_ANY_LAYOUT
59  #define VIRTIO_F_ANY_LAYOUT 27
60 #endif
61 
/*
 * Fallback values for the VHOST_USER_PROTOCOL_F_* names; each macro is
 * defined only if the name is not already defined. The values present here
 * are 0-5, 7-12 and 16; 6 and 13-15 have no macro in this listing.
 * NOTE(review): presumably bit positions within the protocol-features mask
 * handled by rte_vhost_driver_set_protocol_features() and
 * rte_vhost_driver_get_protocol_features() -- confirm.
 */
63 #ifndef VHOST_USER_PROTOCOL_F_MQ
64 #define VHOST_USER_PROTOCOL_F_MQ 0
65 #endif
66 
67 #ifndef VHOST_USER_PROTOCOL_F_LOG_SHMFD
68 #define VHOST_USER_PROTOCOL_F_LOG_SHMFD 1
69 #endif
70 
71 #ifndef VHOST_USER_PROTOCOL_F_RARP
72 #define VHOST_USER_PROTOCOL_F_RARP 2
73 #endif
74 
75 #ifndef VHOST_USER_PROTOCOL_F_REPLY_ACK
76 #define VHOST_USER_PROTOCOL_F_REPLY_ACK 3
77 #endif
78 
79 #ifndef VHOST_USER_PROTOCOL_F_NET_MTU
80 #define VHOST_USER_PROTOCOL_F_NET_MTU 4
81 #endif
82 
83 #ifndef VHOST_USER_PROTOCOL_F_BACKEND_REQ
84 #define VHOST_USER_PROTOCOL_F_BACKEND_REQ 5
85 #endif
86 
87 #ifndef VHOST_USER_PROTOCOL_F_CRYPTO_SESSION
88 #define VHOST_USER_PROTOCOL_F_CRYPTO_SESSION 7
89 #endif
90 
91 #ifndef VHOST_USER_PROTOCOL_F_PAGEFAULT
92 #define VHOST_USER_PROTOCOL_F_PAGEFAULT 8
93 #endif
94 
95 #ifndef VHOST_USER_PROTOCOL_F_CONFIG
96 #define VHOST_USER_PROTOCOL_F_CONFIG 9
97 #endif
98 
99 #ifndef VHOST_USER_PROTOCOL_F_BACKEND_SEND_FD
100 #define VHOST_USER_PROTOCOL_F_BACKEND_SEND_FD 10
101 #endif
102 
103 #ifndef VHOST_USER_PROTOCOL_F_HOST_NOTIFIER
104 #define VHOST_USER_PROTOCOL_F_HOST_NOTIFIER 11
105 #endif
106 
107 #ifndef VHOST_USER_PROTOCOL_F_INFLIGHT_SHMFD
108 #define VHOST_USER_PROTOCOL_F_INFLIGHT_SHMFD 12
109 #endif
110 
111 #ifndef VHOST_USER_PROTOCOL_F_STATUS
112 #define VHOST_USER_PROTOCOL_F_STATUS 16
113 #endif
114 
/*
 * Fallback value (30), defined only if the name is not already defined.
 * NOTE(review): presumably the feature bit that advertises vhost-user
 * protocol-feature negotiation -- confirm.
 */
116 #ifndef VHOST_USER_F_PROTOCOL_FEATURES
117 #define VHOST_USER_F_PROTOCOL_FEATURES 30
118 #endif
119 
/* NOTE(review): presumably the maximum number of vhost devices, i.e. a bound on `vid` -- confirm against the implementation. */
120 #define RTE_MAX_VHOST_DEVICE 1024
121 
/* NOTE(review): presumably the values written to `*type` by rte_vhost_driver_get_vdpa_dev_type() -- confirm. */
122 #define RTE_VHOST_VDPA_DEVICE_TYPE_NET 0
123 #define RTE_VHOST_VDPA_DEVICE_TYPE_BLK 1
124 
125 struct rte_vdpa_device;
126 
/*
 * One region of guest memory. rte_vhost_va_from_guest_pa() treats a region
 * as covering guest physical addresses
 * [guest_phys_addr, guest_phys_addr + size) and maps an address inside it
 * to host_user_addr plus the offset from guest_phys_addr.
 */
131 struct rte_vhost_mem_region {
132  uint64_t guest_phys_addr; /* first guest physical address of the region */
133  uint64_t guest_user_addr; /* not read in this header */
134  uint64_t host_user_addr; /* host address that corresponds to guest_phys_addr */
135  uint64_t size; /* length of the region in bytes */
136  void *mmap_addr; /* NOTE(review): presumably the base of the mmap() backing the region -- confirm */
137  uint64_t mmap_size; /* NOTE(review): presumably the length of that mapping -- confirm */
138  int fd; /* NOTE(review): presumably the file descriptor behind the mapping -- confirm */
139 };
140 
/*
 * Table of guest memory regions: a count followed by a flexible array.
 * rte_vhost_va_from_guest_pa() scans regions[0 .. nregions-1].
 */
144 struct rte_vhost_memory {
145  uint32_t nregions; /* number of entries in regions[] that are scanned */
146  struct rte_vhost_mem_region regions[]; /* flexible array member; storage follows the struct */
147 };
148 
/* Element type of the desc[] flexible array in struct rte_vhost_inflight_info_split. */
149 struct rte_vhost_inflight_desc_split {
150  uint8_t inflight;
151  uint8_t padding[5]; /* explicit padding: together with `inflight` fills offsets 0-5, so `next` sits at offset 6 */
152  uint16_t next;
153  uint64_t counter; /* begins at offset 8; the members add up to 16 bytes with no implicit padding */
154 };
155 
/*
 * Fixed 16-byte header (one 64-bit and four 16-bit members) followed by a
 * flexible array of struct rte_vhost_inflight_desc_split entries.
 * NOTE(review): desc_num presumably gives the number of desc[] entries -- confirm.
 */
156 struct rte_vhost_inflight_info_split {
157  uint64_t features;
158  uint16_t version;
159  uint16_t desc_num;
160  uint16_t last_inflight_io;
161  uint16_t used_idx;
162  struct rte_vhost_inflight_desc_split desc[]; /* flexible array member; storage follows the header */
163 };
164 
/*
 * Element type of the desc[] flexible array in struct rte_vhost_inflight_info_packed.
 * With natural alignment the members pack into 32 bytes without implicit padding.
 */
165 struct rte_vhost_inflight_desc_packed {
166  uint8_t inflight;
167  uint8_t padding; /* explicit padding byte so `next` is 2-byte aligned */
168  uint16_t next;
169  uint16_t last;
170  uint16_t num;
171  uint64_t counter;
/* NOTE(review): id/flags/len/addr have the widths of a packed-ring descriptor's fields; presumably a copy of that descriptor -- confirm against struct vring_packed_desc. */
172  uint16_t id;
173  uint16_t flags;
174  uint32_t len;
175  uint64_t addr;
176 };
177 
/*
 * Header followed by a flexible array of struct rte_vhost_inflight_desc_packed entries.
 * NOTE(review): each old_* member is presumably a saved copy of its
 * non-old counterpart, and desc_num presumably counts desc[] entries -- confirm.
 */
178 struct rte_vhost_inflight_info_packed {
179  uint64_t features;
180  uint16_t version;
181  uint16_t desc_num;
182  uint16_t free_head;
183  uint16_t old_free_head;
184  uint16_t used_idx;
185  uint16_t old_used_idx;
186  uint8_t used_wrap_counter;
187  uint8_t old_used_wrap_counter;
188  uint8_t padding[7]; /* explicit padding; the fixed members end at offset 29, so with 8-byte alignment of desc[] the array starts at offset 32 */
189  struct rte_vhost_inflight_desc_packed desc[]; /* flexible array member; storage follows the header */
190 };
191 
/* Element type of the list pointed to by rte_vhost_resubmit_info.resubmit_list. */
192 struct rte_vhost_resubmit_desc {
193  uint16_t index;
194  uint64_t counter; /* 64-bit member after a 16-bit one: ABIs with natural alignment insert 6 bytes of implicit padding before it */
195 };
196 
/*
 * A pointer to struct rte_vhost_resubmit_desc entries plus a 16-bit count.
 * NOTE(review): resubmit_num presumably is the number of entries reachable
 * through resubmit_list -- confirm.
 */
197 struct rte_vhost_resubmit_info {
198  struct rte_vhost_resubmit_desc *resubmit_list;
199  uint16_t resubmit_num;
200 };
201 
/*
 * Per-ring inflight bookkeeping; this is the type of the `vring` argument of
 * rte_vhost_get_vhost_ring_inflight().
 */
202 struct rte_vhost_ring_inflight {
203  union { /* anonymous union: both pointers share one slot, so only one view is meaningful at a time */
204  struct rte_vhost_inflight_info_split *inflight_split;
205  struct rte_vhost_inflight_info_packed *inflight_packed;
206  };
207 
208  struct rte_vhost_resubmit_info *resubmit_inflight;
209 };
210 
/*
 * Description of one vring; this is the type of the `vring` argument of
 * rte_vhost_get_vhost_vring(). Each anonymous union overlays two pointer
 * members, so desc/desc_packed, avail/driver_event and used/device_event
 * are alternative views of the same pointer slot.
 */
211 struct rte_vhost_vring {
212  union {
213  struct vring_desc *desc;
214  struct vring_packed_desc *desc_packed;
215  };
216  union {
217  struct vring_avail *avail;
218  struct vring_packed_desc_event *driver_event;
219  };
220  union {
221  struct vring_used *used;
222  struct vring_packed_desc_event *device_event;
223  };
224  uint64_t log_guest_addr;
225 
/* NOTE(review): callfd and kickfd are presumably eventfd descriptors (this header includes <sys/eventfd.h>) -- confirm. */
227  int callfd;
228 
229  int kickfd;
230  uint16_t size;
231 };
232 
/* Result codes returned by an rte_vhost_msg_handle callback. */
236 enum rte_vhost_msg_result {
237  /* Message handling failed */
238  RTE_VHOST_MSG_RESULT_ERR = -1,
239  /* Message handling successful */
240  RTE_VHOST_MSG_RESULT_OK = 0,
241  /* Message handling successful and reply prepared */
242  RTE_VHOST_MSG_RESULT_REPLY = 1,
243  /* Message not handled */
244  RTE_VHOST_MSG_RESULT_NOT_HANDLED, /* no initializer: takes the next value, 2 */
245 };
246 
/*
 * Pointer-to-function type for message callbacks: takes a device id `vid`
 * and an untyped `msg` pointer and returns an enum rte_vhost_msg_result.
 * It is the type of the pre_msg_handle and post_msg_handle members.
 */
261 typedef enum rte_vhost_msg_result (*rte_vhost_msg_handle)(int vid, void *msg);
262 
/*
 * Pair of message callbacks; this is the type of the `ops` argument of
 * rte_vhost_extern_callback_register().
 */
266 struct rte_vhost_user_extern_ops {
267  /* Called prior to the frontend message handling. */
268  rte_vhost_msg_handle pre_msg_handle;
269  /* Called after the frontend message handling. */
270  rte_vhost_msg_handle post_msg_handle;
271 };
272 
/*
 * Table of callbacks; this is the type of the `ops` argument of
 * rte_vhost_driver_callback_register(). Every callback receives the device
 * id `vid`. NOTE(review): when each callback fires is not visible in this
 * listing; the member names suggest device, connection, vring-state and
 * feature-change events -- confirm against the library documentation.
 */
276 struct rte_vhost_device_ops {
277  int (*new_device)(int vid);
278  void (*destroy_device)(int vid);
280  int (*vring_state_changed)(int vid, uint16_t queue_id, int enable);
288  int (*features_changed)(int vid, uint64_t features);
289 
290  int (*new_connection)(int vid);
291  void (*destroy_connection)(int vid);
292 
299  void (*guest_notified)(int vid);
300 
301  void *reserved[1]; /* one spare pointer-sized slot */
302 };
303 
/*
 * Type of the `pmc` argument of rte_vhost_get_monitor_addr().
 * NOTE(review): the member comments were dropped from this listing;
 * presumably `addr` is the location to watch, `val`/`mask` the comparison
 * value and mask, `size` the access width in bytes and `match` the
 * match/mismatch selector -- confirm against the library documentation.
 */
307 struct rte_vhost_power_monitor_cond {
309  volatile void *addr;
314  uint64_t val;
316  uint64_t mask;
320  uint8_t size;
326  uint8_t match;
327 };
328 
330 #define RTE_VHOST_STATS_NAME_SIZE 64
331 
/*
 * One (id, value) pair; this is the element type of the `stats` argument of
 * rte_vhost_vring_stats_get().
 * NOTE(review): `id` presumably indexes the names returned by
 * rte_vhost_vring_stats_get_names() -- confirm.
 */
340 struct rte_vhost_stat {
341  uint64_t id;
342  uint64_t value;
343 };
344 
353 };
354 
/*
 * Translate a guest physical address into the corresponding host address.
 *
 * Scans mem->regions[0 .. nregions-1] in order and uses the first region
 * whose range [guest_phys_addr, guest_phys_addr + size) contains gpa.
 *
 * mem: region table to search.
 * gpa: guest physical address to translate.
 * len: in/out. On entry, the number of bytes the caller wants. On a hit it
 *      is lowered to the bytes left in the region after gpa when the request
 *      is larger, otherwise left unchanged. On a miss it is set to 0.
 *
 * Returns gpa - guest_phys_addr + host_user_addr for the matching region,
 * or 0 when no region contains gpa.
 *
 * NOTE(review): guest_phys_addr + size is evaluated in uint64_t and would
 * wrap for a region that ends at 2^64 -- confirm regions are validated
 * before they reach this table.
 */
367 static __rte_always_inline uint64_t
368 rte_vhost_va_from_guest_pa(struct rte_vhost_memory *mem,
369  uint64_t gpa, uint64_t *len)
370 {
371  struct rte_vhost_mem_region *r;
372  uint32_t i;
373 
374  for (i = 0; i < mem->nregions; i++) {
375  r = &mem->regions[i];
376  if (gpa >= r->guest_phys_addr &&
377  gpa < r->guest_phys_addr + r->size) {
378 
/* Clamp the request so it does not run past the end of this region. */
379  if (unlikely(*len > r->guest_phys_addr + r->size - gpa))
380  *len = r->guest_phys_addr + r->size - gpa;
381 
382  return gpa - r->guest_phys_addr +
383  r->host_user_addr;
384  }
385  }
/* No region contains gpa: report zero usable bytes and a zero address. */
386  *len = 0;
387 
388  return 0;
389 }
390 
/*
 * Non-zero when bit number VHOST_F_LOG_ALL is set in `features`; the argument
 * is parenthesised and evaluated once. VHOST_F_LOG_ALL is not defined in this
 * listing -- NOTE(review): presumably it comes from <linux/vhost.h>; confirm.
 */
391 #define RTE_VHOST_NEED_LOG(features) ((features) & (1ULL << VHOST_F_LOG_ALL))
392 
411 void rte_vhost_log_write(int vid, uint64_t addr, uint64_t len);
412 
431 void rte_vhost_log_used_vring(int vid, uint16_t vring_idx,
432  uint64_t offset, uint64_t len);
433 
434 int rte_vhost_enable_guest_notification(int vid, uint16_t queue_id, int enable);
435 
440 int rte_vhost_driver_register(const char *path, uint64_t flags);
441 
442 /* Unregister vhost driver. This is only meaningful to vhost user. */
443 int rte_vhost_driver_unregister(const char *path);
444 
455 int
456 rte_vhost_driver_attach_vdpa_device(const char *path,
457  struct rte_vdpa_device *dev);
458 
467 int
468 rte_vhost_driver_detach_vdpa_device(const char *path);
469 
478 struct rte_vdpa_device *
479 rte_vhost_driver_get_vdpa_device(const char *path);
480 
491 __rte_experimental
492 int
493 rte_vhost_driver_get_vdpa_dev_type(const char *path, uint32_t *type);
494 
505 int rte_vhost_driver_set_features(const char *path, uint64_t features);
506 
522 int rte_vhost_driver_enable_features(const char *path, uint64_t features);
523 
536 int rte_vhost_driver_disable_features(const char *path, uint64_t features);
537 
548 int rte_vhost_driver_get_features(const char *path, uint64_t *features);
549 
/*
 * Takes a socket `path` and a 64-bit `protocol_features` value; returns int.
 * NOTE(review): presumably sets the protocol-feature mask for the driver
 * registered at `path`; the return convention is not visible here -- confirm.
 */
560 int
561 rte_vhost_driver_set_protocol_features(const char *path,
562  uint64_t protocol_features);
563 
/*
 * Takes a socket `path` and a pointer to a 64-bit output; returns int.
 * NOTE(review): presumably stores the driver's protocol-feature mask in
 * `*protocol_features`; the return convention is not visible here -- confirm.
 */
574 int
575 rte_vhost_driver_get_protocol_features(const char *path,
576  uint64_t *protocol_features);
577 
588 int
589 rte_vhost_driver_get_queue_num(const char *path, uint32_t *queue_num);
590 
601 int rte_vhost_get_negotiated_features(int vid, uint64_t *features);
602 
/*
 * Takes a device id `vid` and a pointer to a 64-bit output; returns int.
 * Marked __rte_experimental.
 * NOTE(review): presumably stores the protocol features negotiated for the
 * device in `*protocol_features`; return convention not visible here -- confirm.
 */
613 __rte_experimental
614 int
615 rte_vhost_get_negotiated_protocol_features(int vid,
616  uint64_t *protocol_features);
617 
618 /* Register callbacks. */
619 int rte_vhost_driver_callback_register(const char *path,
620  struct rte_vhost_device_ops const * const ops);
621 
633 int rte_vhost_driver_start(const char *path);
634 
648 int rte_vhost_get_mtu(int vid, uint16_t *mtu);
649 
660 int rte_vhost_get_numa_node(int vid);
661 
671 uint16_t rte_vhost_get_vring_num(int vid);
672 
687 int rte_vhost_get_ifname(int vid, char *buf, size_t len);
688 
700 uint16_t rte_vhost_avail_entries(int vid, uint16_t queue_id);
701 
702 struct rte_mbuf;
703 struct rte_mempool;
720 uint16_t rte_vhost_enqueue_burst(int vid, uint16_t queue_id,
721  struct rte_mbuf **pkts, uint16_t count);
722 
740 uint16_t rte_vhost_dequeue_burst(int vid, uint16_t queue_id,
741  struct rte_mempool *mbuf_pool, struct rte_mbuf **pkts, uint16_t count);
742 
757 int rte_vhost_get_mem_table(int vid, struct rte_vhost_memory **mem);
758 
771 int rte_vhost_get_vhost_vring(int vid, uint16_t vring_idx,
772  struct rte_vhost_vring *vring);
773 
786 int
787 rte_vhost_get_vhost_ring_inflight(int vid, uint16_t vring_idx,
788  struct rte_vhost_ring_inflight *vring);
789 
805 int
806 rte_vhost_set_inflight_desc_split(int vid, uint16_t vring_idx,
807  uint16_t idx);
808 
827 int
828 rte_vhost_set_inflight_desc_packed(int vid, uint16_t vring_idx,
829  uint16_t head, uint16_t last, uint16_t *inflight_entry);
830 
/*
 * Takes a device id, a vring index and a 16-bit `idx`; returns int.
 * NOTE(review): presumably records `idx` as the last inflight I/O of a split
 * ring (compare last_inflight_io in struct rte_vhost_inflight_info_split) --
 * confirm.
 */
843 int
844 rte_vhost_set_last_inflight_io_split(int vid,
845  uint16_t vring_idx, uint16_t idx);
846 
/*
 * Takes a device id, a vring index and a 16-bit `head`; returns int.
 * NOTE(review): presumably the packed-ring counterpart of
 * rte_vhost_set_last_inflight_io_split() -- confirm.
 */
862 int
863 rte_vhost_set_last_inflight_io_packed(int vid,
864  uint16_t vring_idx, uint16_t head);
865 
880 int
881 rte_vhost_clr_inflight_desc_split(int vid, uint16_t vring_idx,
882  uint16_t last_used_idx, uint16_t idx);
883 
896 int
897 rte_vhost_clr_inflight_desc_packed(int vid, uint16_t vring_idx,
898  uint16_t head);
899 
911 int rte_vhost_vring_call(int vid, uint16_t vring_idx);
912 
925 __rte_experimental
926 int rte_vhost_vring_call_nonblock(int vid, uint16_t vring_idx);
927 
938 uint32_t rte_vhost_rx_queue_count(int vid, uint16_t qid);
939 
952 __rte_experimental
953 int
954 rte_vhost_get_monitor_addr(int vid, uint16_t queue_id,
955  struct rte_vhost_power_monitor_cond *pmc);
956 
969 int
970 rte_vhost_get_log_base(int vid, uint64_t *log_base, uint64_t *log_size);
971 
986 int
987 rte_vhost_get_vring_base(int vid, uint16_t queue_id,
988  uint16_t *last_avail_idx, uint16_t *last_used_idx);
989 
/*
 * Same parameter list as rte_vhost_get_vring_base(): a device id, a queue id
 * and two 16-bit output pointers; returns int.
 * NOTE(review): presumably fills the outputs from the inflight information
 * rather than from the live ring -- confirm.
 */
1008 int
1009 rte_vhost_get_vring_base_from_inflight(int vid,
1010  uint16_t queue_id, uint16_t *last_avail_idx, uint16_t *last_used_idx);
1011 
1026 int
1027 rte_vhost_set_vring_base(int vid, uint16_t queue_id,
1028  uint16_t last_avail_idx, uint16_t last_used_idx);
1029 
/*
 * Takes a device id, a const pointer to a struct rte_vhost_user_extern_ops
 * and an untyped `ctx` pointer; returns int.
 * NOTE(review): presumably registers the pre/post message callbacks for the
 * device; how `ctx` is used is not visible here -- confirm.
 */
1042 int
1043 rte_vhost_extern_callback_register(int vid,
1044  struct rte_vhost_user_extern_ops const * const ops, void *ctx);
1045 
1054 struct rte_vdpa_device *
1055 rte_vhost_get_vdpa_device(int vid);
1056 
1067 __rte_experimental
1068 int
1069 rte_vhost_backend_config_change(int vid, bool need_reply);
1070 
1094 int
1095 rte_vhost_vring_stats_get_names(int vid, uint16_t queue_id,
1096  struct rte_vhost_stat_name *name, unsigned int size);
1097 
1121 int
1122 rte_vhost_vring_stats_get(int vid, uint16_t queue_id,
1123  struct rte_vhost_stat *stats, unsigned int n);
1124 
1137 int
1138 rte_vhost_vring_stats_reset(int vid, uint16_t queue_id);
1139 
1140 #ifdef __cplusplus
1141 }
1142 #endif
1143 
1144 #endif /* _RTE_VHOST_H_ */
int rte_vhost_driver_start(const char *path)
#define __rte_always_inline
Definition: rte_common.h:255
__rte_experimental int rte_vhost_get_negotiated_protocol_features(int vid, uint64_t *protocol_features)
int rte_vhost_driver_register(const char *path, uint64_t flags)
uint16_t rte_vhost_avail_entries(int vid, uint16_t queue_id)
int rte_vhost_vring_stats_reset(int vid, uint16_t queue_id)
int rte_vhost_driver_disable_features(const char *path, uint64_t features)
struct rte_vdpa_device * rte_vhost_get_vdpa_device(int vid)
void rte_vhost_log_used_vring(int vid, uint16_t vring_idx, uint64_t offset, uint64_t len)
#define RTE_VHOST_STATS_NAME_SIZE
Definition: rte_vhost.h:330
int rte_vhost_get_vhost_vring(int vid, uint16_t vring_idx, struct rte_vhost_vring *vring)
int rte_vhost_set_inflight_desc_packed(int vid, uint16_t vring_idx, uint16_t head, uint16_t last, uint16_t *inflight_entry)
int rte_vhost_clr_inflight_desc_packed(int vid, uint16_t vring_idx, uint16_t head)
uint16_t rte_vhost_enqueue_burst(int vid, uint16_t queue_id, struct rte_mbuf **pkts, uint16_t count)
int rte_vhost_get_vhost_ring_inflight(int vid, uint16_t vring_idx, struct rte_vhost_ring_inflight *vring)
int rte_vhost_driver_get_protocol_features(const char *path, uint64_t *protocol_features)
int rte_vhost_set_last_inflight_io_packed(int vid, uint16_t vring_idx, uint16_t head)
int rte_vhost_get_mtu(int vid, uint16_t *mtu)
int rte_vhost_driver_detach_vdpa_device(const char *path)
int rte_vhost_driver_set_protocol_features(const char *path, uint64_t protocol_features)
uint64_t id
Definition: rte_vhost.h:341
int rte_vhost_vring_stats_get(int vid, uint16_t queue_id, struct rte_vhost_stat *stats, unsigned int n)
static __rte_always_inline uint64_t rte_vhost_va_from_guest_pa(struct rte_vhost_memory *mem, uint64_t gpa, uint64_t *len)
Definition: rte_vhost.h:368
#define unlikely(x)
uint16_t rte_vhost_get_vring_num(int vid)
__rte_experimental int rte_vhost_vring_call_nonblock(int vid, uint16_t vring_idx)
int rte_vhost_extern_callback_register(int vid, struct rte_vhost_user_extern_ops const *const ops, void *ctx)
__rte_experimental int rte_vhost_get_monitor_addr(int vid, uint16_t queue_id, struct rte_vhost_power_monitor_cond *pmc)
int rte_vhost_get_numa_node(int vid)
int rte_vhost_set_inflight_desc_split(int vid, uint16_t vring_idx, uint16_t idx)
int rte_vhost_get_mem_table(int vid, struct rte_vhost_memory **mem)
int rte_vhost_driver_attach_vdpa_device(const char *path, struct rte_vdpa_device *dev)
__rte_experimental int rte_vhost_driver_get_vdpa_dev_type(const char *path, uint32_t *type)
int rte_vhost_set_last_inflight_io_split(int vid, uint16_t vring_idx, uint16_t idx)
int rte_vhost_vring_call(int vid, uint16_t vring_idx)
int rte_vhost_get_negotiated_features(int vid, uint64_t *features)
struct rte_vdpa_device * rte_vhost_driver_get_vdpa_device(const char *path)
rte_vhost_msg_result
Definition: rte_vhost.h:236
int rte_vhost_set_vring_base(int vid, uint16_t queue_id, uint16_t last_avail_idx, uint16_t last_used_idx)
int rte_vhost_clr_inflight_desc_split(int vid, uint16_t vring_idx, uint16_t last_used_idx, uint16_t idx)
int rte_vhost_get_log_base(int vid, uint64_t *log_base, uint64_t *log_size)
int rte_vhost_vring_stats_get_names(int vid, uint16_t queue_id, struct rte_vhost_stat_name *name, unsigned int size)
uint32_t rte_vhost_rx_queue_count(int vid, uint16_t qid)
uint64_t value
Definition: rte_vhost.h:342
__rte_experimental int rte_vhost_backend_config_change(int vid, bool need_reply)
uint16_t rte_vhost_dequeue_burst(int vid, uint16_t queue_id, struct rte_mempool *mbuf_pool, struct rte_mbuf **pkts, uint16_t count)
int rte_vhost_get_vring_base(int vid, uint16_t queue_id, uint16_t *last_avail_idx, uint16_t *last_used_idx)
int rte_vhost_driver_get_features(const char *path, uint64_t *features)
int rte_vhost_driver_get_queue_num(const char *path, uint32_t *queue_num)
int rte_vhost_driver_set_features(const char *path, uint64_t features)
int rte_vhost_get_ifname(int vid, char *buf, size_t len)
int rte_vhost_get_vring_base_from_inflight(int vid, uint16_t queue_id, uint16_t *last_avail_idx, uint16_t *last_used_idx)
enum rte_vhost_msg_result(* rte_vhost_msg_handle)(int vid, void *msg)
Definition: rte_vhost.h:261
int rte_vhost_driver_enable_features(const char *path, uint64_t features)
void rte_vhost_log_write(int vid, uint64_t addr, uint64_t len)