blob: 868f34434ce27077f70c569dce036b09e72499a3 [file] [log] [blame]
/*
 * Copyright (c) 2015 Cisco and/or its affiliates.
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at:
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
15#ifndef __VIRTIO_VHOST_USER_H__
16#define __VIRTIO_VHOST_USER_H__
Mohsin Kazmia7a22812020-08-31 17:17:16 +020017
18#include <vnet/devices/virtio/virtio_std.h>
19#include <vnet/devices/virtio/vhost_std.h>
20
/* vhost-user data structures */
22
/* Capacity of the fixed-size guest memory region arrays. */
#define VHOST_MEMORY_MAX_NREGIONS 8

/*
 * Size in bytes of the vhost-user message header.
 * NOTE(review): presumably the request/flags/size fields that precede the
 * payload in vhost_user_msg_t -- confirm against the users of this macro.
 */
#define VHOST_USER_MSG_HDR_SZ 12

/* Capacity of the per-device vring arrays: 8 TX + 8 RX. */
#define VHOST_VRING_MAX_N 16
/*
 * Map a queue id to a vring index: the RX macro yields the even index
 * 2 * qid and the TX macro yields the odd index 2 * qid + 1.
 *
 * The argument is parenthesized so that an expression argument such as
 * VHOST_VRING_IDX_RX (q + 1) is multiplied as a whole instead of being
 * split by operator precedence.
 */
#define VHOST_VRING_IDX_RX(qid) (2 * (qid))
#define VHOST_VRING_IDX_TX(qid) (2 * (qid) + 1)
Ed Warnickecb9cada2015-12-08 15:45:58 -070028
/*
 * NOTE(review): presumably the payload bit signalling that a vring
 * kick/call/err message carries no file descriptor -- confirm against the
 * vhost-user protocol specification.
 */
#define VHOST_USER_VRING_NOFD_MASK 0x100

/* Bit positions (not masks) used to build the feature words below. */
#define VHOST_USER_PROTOCOL_F_MQ 0
#define VHOST_USER_PROTOCOL_F_LOG_SHMFD 1
#define VHOST_VRING_F_LOG 0

/* Mask combining the MQ and LOG_SHMFD protocol feature bits. */
#define VHOST_USER_PROTOCOL_FEATURES \
  ((1ULL << VHOST_USER_PROTOCOL_F_LOG_SHMFD) | \
   (1ULL << VHOST_USER_PROTOCOL_F_MQ))
Shesha Sreenivasamurthyb8f45b32016-02-03 09:38:36 -080037
/*
 * Emit a VLIB_LOG_LEVEL_DEBUG message on vhost_user_main.log_default.
 *
 *   dev  pointer expression whose hw_if_index member is passed, together
 *        with vnet_get_main (), to format_vnet_hw_if_index_name for the
 *        "%U: " prefix
 *   f    string literal; it is concatenated onto the "%U: " prefix
 *   ...  arguments consumed by f
 *
 * The body is wrapped in do { } while (0) so the macro expands to exactly
 * one statement and is safe in an unbraced if/else. The caller supplies
 * the terminating semicolon.
 */
#define vu_log_debug(dev, f, ...) \
  do \
    { \
      vlib_log (VLIB_LOG_LEVEL_DEBUG, vhost_user_main.log_default, \
                "%U: " f, format_vnet_hw_if_index_name, vnet_get_main (), \
                (dev)->hw_if_index, ##__VA_ARGS__); \
    } \
  while (0)
Mohsin Kazmie7cde312018-06-26 17:20:11 +020044
/*
 * Emit a VLIB_LOG_LEVEL_WARNING message on vhost_user_main.log_default.
 *
 *   dev  pointer expression whose hw_if_index member is passed, together
 *        with vnet_get_main (), to format_vnet_hw_if_index_name for the
 *        "%U: " prefix
 *   f    string literal; it is concatenated onto the "%U: " prefix
 *   ...  arguments consumed by f
 *
 * The body is wrapped in do { } while (0) so the macro expands to exactly
 * one statement and is safe in an unbraced if/else. The caller supplies
 * the terminating semicolon.
 */
#define vu_log_warn(dev, f, ...) \
  do \
    { \
      vlib_log (VLIB_LOG_LEVEL_WARNING, vhost_user_main.log_default, \
                "%U: " f, format_vnet_hw_if_index_name, vnet_get_main (), \
                (dev)->hw_if_index, ##__VA_ARGS__); \
    } \
  while (0)
/*
 * Emit a VLIB_LOG_LEVEL_ERR message on vhost_user_main.log_default.
 *
 *   dev  pointer expression whose hw_if_index member is passed, together
 *        with vnet_get_main (), to format_vnet_hw_if_index_name for the
 *        "%U: " prefix
 *   f    string literal; it is concatenated onto the "%U: " prefix
 *   ...  arguments consumed by f
 *
 * The body is wrapped in do { } while (0) so the macro expands to exactly
 * one statement and is safe in an unbraced if/else. The caller supplies
 * the terminating semicolon.
 */
#define vu_log_err(dev, f, ...) \
  do \
    { \
      vlib_log (VLIB_LOG_LEVEL_ERR, vhost_user_main.log_default, \
                "%U: " f, format_vnet_hw_if_index_name, vnet_get_main (), \
                (dev)->hw_if_index, ##__VA_ARGS__); \
    } \
  while (0)
Mohsin Kazmie7cde312018-06-26 17:20:11 +020057
/*
 * Translate an index into file_main.file_pool into a file descriptor.
 *
 * Evaluates to -1 when unixfd_idx is the all-ones value of its own type,
 * otherwise to the file_descriptor member of the pool element at that
 * index. The argument is evaluated exactly once.
 *
 * The all-ones sentinel is cast to the argument's type before comparing,
 * so the check also holds for index types narrower than int (a plain
 * "!= ~0" compares against the int value -1 after promotion and can
 * never match for such types).
 */
#define UNIX_GET_FD(unixfd_idx) ({ \
    __typeof__ (unixfd_idx) _unix_get_fd_idx = (unixfd_idx); \
    (_unix_get_fd_idx != (__typeof__ (_unix_get_fd_idx)) ~0) ? \
      pool_elt_at_index (file_main.file_pool, \
                         _unix_get_fd_idx)->file_descriptor : -1; })
63
/*
 * Trace flag table. Each row is _ (name, listed index, description).
 */
#define foreach_virtio_trace_flags \
  _ (SIMPLE_CHAINED, 0, "Simple descriptor chaining") \
  _ (SINGLE_DESC, 1, "Single descriptor packet") \
  _ (INDIRECT, 2, "Indirect descriptor") \
  _ (MAP_ERROR, 4, "Memory mapping error")

/*
 * VIRTIO_TRACE_F_<name> enumerators generated from the table above.
 *
 * Only the name column is used here, so the enumerators take the implicit
 * values 0, 1, 2, 3 in table order. VIRTIO_TRACE_F_MAP_ERROR is therefore
 * 3 even though the table lists 4 for it.
 */
typedef enum
{
#define _(name, listed_idx, descr) VIRTIO_TRACE_F_##name,
  foreach_virtio_trace_flags
#undef _
} virtio_trace_flag_t;
76
/* Host-side offload feature mask: checksum, TSO4, TSO6 and UFO. */
#define FEATURE_VIRTIO_NET_F_HOST_TSO_FEATURE_BITS \
  (VIRTIO_FEATURE (VIRTIO_NET_F_CSUM) | \
   VIRTIO_FEATURE (VIRTIO_NET_F_HOST_TSO4) | \
   VIRTIO_FEATURE (VIRTIO_NET_F_HOST_TSO6) | \
   VIRTIO_FEATURE (VIRTIO_NET_F_HOST_UFO))

/* Guest-side offload feature mask: checksum, TSO4, TSO6 and UFO. */
#define FEATURE_VIRTIO_NET_F_GUEST_TSO_FEATURE_BITS \
  (VIRTIO_FEATURE (VIRTIO_NET_F_GUEST_CSUM) | \
   VIRTIO_FEATURE (VIRTIO_NET_F_GUEST_TSO4) | \
   VIRTIO_FEATURE (VIRTIO_NET_F_GUEST_TSO6) | \
   VIRTIO_FEATURE (VIRTIO_NET_F_GUEST_UFO))

/* Union of the host-side and guest-side masks above. */
#define FEATURE_VIRTIO_NET_F_HOST_GUEST_TSO_FEATURE_BITS \
  (FEATURE_VIRTIO_NET_F_GUEST_TSO_FEATURE_BITS | \
   FEATURE_VIRTIO_NET_F_HOST_TSO_FEATURE_BITS)
92
Damjan Marion00a9dca2016-08-17 17:05:46 +020093int vhost_user_create_if (vnet_main_t * vnm, vlib_main_t * vm,
94 const char *sock_filename, u8 is_server,
95 u32 * sw_if_index, u64 feature_mask,
Steven Luong4208a4c2019-05-06 08:51:56 -070096 u8 renumber, u32 custom_dev_instance, u8 * hwaddr,
Steven Luongbc0d9ff2020-03-23 09:34:59 -070097 u8 enable_gso, u8 enable_packed);
Damjan Marion00a9dca2016-08-17 17:05:46 +020098int vhost_user_modify_if (vnet_main_t * vnm, vlib_main_t * vm,
99 const char *sock_filename, u8 is_server,
100 u32 sw_if_index, u64 feature_mask,
Steven Luong4208a4c2019-05-06 08:51:56 -0700101 u8 renumber, u32 custom_dev_instance,
Steven Luongbc0d9ff2020-03-23 09:34:59 -0700102 u8 enable_gso, u8 enable_packed);
Damjan Marion00a9dca2016-08-17 17:05:46 +0200103int vhost_user_delete_if (vnet_main_t * vnm, vlib_main_t * vm,
104 u32 sw_if_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700105
/* *INDENT-OFF* */
Damjan Marion00a9dca2016-08-17 17:05:46 +0200107typedef struct vhost_user_memory_region
108{
Ed Warnickecb9cada2015-12-08 15:45:58 -0700109 u64 guest_phys_addr;
110 u64 memory_size;
111 u64 userspace_addr;
112 u64 mmap_offset;
Pierre Pfistere21c5282016-09-21 08:04:59 +0100113} __attribute ((packed)) vhost_user_memory_region_t;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700114
Damjan Marion00a9dca2016-08-17 17:05:46 +0200115typedef struct vhost_user_memory
116{
Ed Warnickecb9cada2015-12-08 15:45:58 -0700117 u32 nregions;
118 u32 padding;
119 vhost_user_memory_region_t regions[VHOST_MEMORY_MAX_NREGIONS];
Pierre Pfistere21c5282016-09-21 08:04:59 +0100120} __attribute ((packed)) vhost_user_memory_t;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700121
/*
 * vhost-user request codes. The values are spelled out explicitly;
 * VHOST_USER_MAX is one past the last defined request.
 */
typedef enum vhost_user_req
{
  VHOST_USER_NONE = 0,

  /* features and ownership */
  VHOST_USER_GET_FEATURES = 1,
  VHOST_USER_SET_FEATURES = 2,
  VHOST_USER_SET_OWNER = 3,
  VHOST_USER_RESET_OWNER = 4,

  /* memory table and logging */
  VHOST_USER_SET_MEM_TABLE = 5,
  VHOST_USER_SET_LOG_BASE = 6,
  VHOST_USER_SET_LOG_FD = 7,

  /* vring setup */
  VHOST_USER_SET_VRING_NUM = 8,
  VHOST_USER_SET_VRING_ADDR = 9,
  VHOST_USER_SET_VRING_BASE = 10,
  VHOST_USER_GET_VRING_BASE = 11,
  VHOST_USER_SET_VRING_KICK = 12,
  VHOST_USER_SET_VRING_CALL = 13,
  VHOST_USER_SET_VRING_ERR = 14,

  /* protocol features and multiqueue */
  VHOST_USER_GET_PROTOCOL_FEATURES = 15,
  VHOST_USER_SET_PROTOCOL_FEATURES = 16,
  VHOST_USER_GET_QUEUE_NUM = 17,
  VHOST_USER_SET_VRING_ENABLE = 18,

  VHOST_USER_MAX
} vhost_user_req_t;
145
Ed Warnickecb9cada2015-12-08 15:45:58 -0700146typedef struct vhost_user_msg {
Damjan Marion00a9dca2016-08-17 17:05:46 +0200147 vhost_user_req_t request;
148 u32 flags;
149 u32 size;
150 union
151 {
152 u64 u64;
153 vhost_vring_state_t state;
154 vhost_vring_addr_t addr;
155 vhost_user_memory_t memory;
156 vhost_user_log_t log;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700157 };
158} __attribute ((packed)) vhost_user_msg_t;
/* *INDENT-ON* */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700160
Damjan Marion00a9dca2016-08-17 17:05:46 +0200161typedef struct
162{
Pierre Pfistere21c5282016-09-21 08:04:59 +0100163 CLIB_CACHE_LINE_ALIGN_MARK (cacheline0);
Steven97878892017-08-29 09:23:26 -0700164 u16 qsz_mask;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700165 u16 last_avail_idx;
166 u16 last_used_idx;
Pierre Pfistere21c5282016-09-21 08:04:59 +0100167 u16 n_since_last_int;
Steven Luongbc0d9ff2020-03-23 09:34:59 -0700168 union
169 {
170 vring_desc_t *desc;
171 vring_packed_desc_t *packed_desc;
172 };
173 union
174 {
175 vring_avail_t *avail;
176 vring_desc_event_t *avail_event;
177 };
178 union
179 {
180 vring_used_t *used;
181 vring_desc_event_t *used_event;
182 };
Steven Luong4442f7c2019-10-02 07:33:48 -0700183 uword desc_user_addr;
184 uword used_user_addr;
185 uword avail_user_addr;
Pierre Pfistere21c5282016-09-21 08:04:59 +0100186 f64 int_deadline;
187 u8 started;
188 u8 enabled;
189 u8 log_used;
190 //Put non-runtime in a different cache line
191 CLIB_CACHE_LINE_ALIGN_MARK (cacheline1);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700192 int errfd;
193 u32 callfd_idx;
Pierre Pfistere21c5282016-09-21 08:04:59 +0100194 u32 kickfd_idx;
195 u64 log_guest_addr;
Stevenf3b53642017-05-01 14:03:02 -0700196
197 /* The rx queue policy (interrupt/adaptive/polling) for this queue */
198 u32 mode;
Steven Luong67f935e2019-02-01 10:23:56 -0800199
200 /*
201 * It contains the device queue number. -1 if it does not. The idea is
202 * to not invoke vnet_hw_interface_assign_rx_thread and
203 * vnet_hw_interface_unassign_rx_thread more than once for the duration of
204 * the interface even if it is disconnected and reconnected.
205 */
206 i16 qid;
Steven Luongbc0d9ff2020-03-23 09:34:59 -0700207
208 u16 used_wrap_counter;
209 u16 avail_wrap_counter;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700210} vhost_user_vring_t;
211
/*
 * Event codes for starting and stopping a timer.
 * NOTE(review): presumably delivered to the send-interrupt process node --
 * confirm against the code that signals them.
 */
#define VHOST_USER_EVENT_START_TIMER 1
#define VHOST_USER_EVENT_STOP_TIMER 2
Steven7312cc72017-03-15 21:18:55 -0700214
Damjan Marion00a9dca2016-08-17 17:05:46 +0200215typedef struct
216{
217 CLIB_CACHE_LINE_ALIGN_MARK (cacheline0);
Juraj Slobodab192feb2018-10-01 12:42:07 +0200218 u32 is_ready;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700219 u32 admin_up;
Pierre Pfisterdbb3c252016-11-22 10:33:34 +0000220 u32 unix_server_index;
Damjan Marion56dd5432017-09-08 19:52:02 +0200221 u32 clib_file_index;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700222 char sock_filename[256];
223 int sock_errno;
Steven5445f5f2017-04-25 16:16:00 -0700224 uword if_index;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700225 u32 hw_if_index, sw_if_index;
Damjan Marion00a9dca2016-08-17 17:05:46 +0200226
Pierre Pfistere21c5282016-09-21 08:04:59 +0100227 //Feature negotiation
Ed Warnickecb9cada2015-12-08 15:45:58 -0700228 u64 features;
229 u64 feature_mask;
Yoann Desmouceaux4667c222016-02-24 22:51:00 +0100230 u64 protocol_features;
Pierre Pfistere21c5282016-09-21 08:04:59 +0100231
232 //Memory region information
233 u32 nregions;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700234 vhost_user_memory_region_t regions[VHOST_MEMORY_MAX_NREGIONS];
Damjan Marion00a9dca2016-08-17 17:05:46 +0200235 void *region_mmap_addr[VHOST_MEMORY_MAX_NREGIONS];
Damjan Marion37623702016-09-20 11:25:27 +0200236 u64 region_guest_addr_lo[VHOST_MEMORY_MAX_NREGIONS];
237 u64 region_guest_addr_hi[VHOST_MEMORY_MAX_NREGIONS];
Ed Warnickecb9cada2015-12-08 15:45:58 -0700238 u32 region_mmap_fd[VHOST_MEMORY_MAX_NREGIONS];
Pierre Pfistere21c5282016-09-21 08:04:59 +0100239
240 //Virtual rings
241 vhost_user_vring_t vrings[VHOST_VRING_MAX_N];
242 volatile u32 *vring_locks[VHOST_VRING_MAX_N];
243
Ed Warnickecb9cada2015-12-08 15:45:58 -0700244 int virtio_net_hdr_sz;
245 int is_any_layout;
Yoann Desmouceaux4667c222016-02-24 22:51:00 +0100246
Damjan Marion00a9dca2016-08-17 17:05:46 +0200247 void *log_base_addr;
Yoann Desmouceaux4667c222016-02-24 22:51:00 +0100248 u64 log_size;
Pierre Pfistere21c5282016-09-21 08:04:59 +0100249
250 /* Whether to use spinlock or per_cpu_tx_qid assignment */
251 u8 use_tx_spinlock;
252 u16 *per_cpu_tx_qid;
Steven Luong4208a4c2019-05-06 08:51:56 -0700253
254 u8 enable_gso;
Steven Luongbc0d9ff2020-03-23 09:34:59 -0700255
256 /* Packed ring configured */
257 u8 enable_packed;
258
Ed Warnickecb9cada2015-12-08 15:45:58 -0700259} vhost_user_intf_t;
260
Damjan Marion00a9dca2016-08-17 17:05:46 +0200261typedef struct
262{
Pierre Pfisterd3eb90e2016-11-29 15:36:14 +0000263 uword dst;
264 uword src;
265 u32 len;
266} vhost_copy_t;
267
268typedef struct
269{
270 u16 qid; /** The interface queue index (Not the virtio vring idx) */
271 u16 device_index; /** The device index */
272 u32 virtio_ring_flags; /** Runtime queue flags **/
273 u16 first_desc_len; /** Length of the first data descriptor **/
274 virtio_net_hdr_mrg_rxbuf_t hdr; /** Virtio header **/
275} vhost_trace_t;
276
/* Capacities of the vhost_cpu_t arrays, expressed in vlib frame sizes. */
#define VHOST_USER_RX_BUFFERS_N (2 * VLIB_FRAME_SIZE + 2)
#define VHOST_USER_COPY_ARRAY_N (4 * VLIB_FRAME_SIZE)
279
280typedef struct
281{
Pierre Pfisterd3eb90e2016-11-29 15:36:14 +0000282 u32 rx_buffers_len;
283 u32 rx_buffers[VHOST_USER_RX_BUFFERS_N];
284
285 virtio_net_hdr_mrg_rxbuf_t tx_headers[VLIB_FRAME_SIZE];
286 vhost_copy_t copy[VHOST_USER_COPY_ARRAY_N];
287
288 /* This is here so it doesn't end-up
289 * using stack or registers. */
290 vhost_trace_t *current_trace;
Steven Luongbc0d9ff2020-03-23 09:34:59 -0700291
292 u32 *to_next_list;
293 vlib_buffer_t **rx_buffers_pdesc;
Pierre Pfistere21c5282016-09-21 08:04:59 +0100294} vhost_cpu_t;
295
296typedef struct
297{
Steven5445f5f2017-04-25 16:16:00 -0700298 mhash_t if_index_by_sock_name;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700299 u32 mtu_bytes;
Damjan Marion00a9dca2016-08-17 17:05:46 +0200300 vhost_user_intf_t *vhost_user_interfaces;
Damjan Marion00a9dca2016-08-17 17:05:46 +0200301 u32 *show_dev_instance_by_real_dev_instance;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700302 u32 coalesce_frames;
303 f64 coalesce_time;
304 int dont_dump_vhost_user_memory;
Damjan Marion0dafaa72016-09-20 23:21:02 +0200305
Pierre Pfistere21c5282016-09-21 08:04:59 +0100306 /** Per-CPU data for vhost-user */
307 vhost_cpu_t *cpus;
Pierre Pfisterdbb3c252016-11-22 10:33:34 +0000308
309 /** Pseudo random iterator */
310 u32 random;
Steven7312cc72017-03-15 21:18:55 -0700311
Stevenf3b53642017-05-01 14:03:02 -0700312 /* The number of rx interface/queue pairs in interrupt mode */
313 u32 ifq_count;
Steven388e51a2017-06-01 12:49:23 -0700314
Jerome Tollet2f54c272018-10-02 11:41:11 +0200315 /* logging */
316 vlib_log_class_t log_default;
Steven Luong4208a4c2019-05-06 08:51:56 -0700317
318 /* gso interface count */
319 u32 gso_count;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700320} vhost_user_main_t;
321
Damjan Marion00a9dca2016-08-17 17:05:46 +0200322typedef struct
323{
324 u8 if_name[64];
325 u32 sw_if_index;
326 u32 virtio_net_hdr_sz;
327 u64 features;
328 u8 is_server;
329 u8 sock_filename[256];
330 u32 num_regions;
331 int sock_errno;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700332} vhost_user_intf_details_t;
333
Damjan Marion00a9dca2016-08-17 17:05:46 +0200334int vhost_user_dump_ifs (vnet_main_t * vnm, vlib_main_t * vm,
335 vhost_user_intf_details_t ** out_vuids);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700336
Mohsin Kazmie7cde312018-06-26 17:20:11 +0200337extern vlib_node_registration_t vhost_user_send_interrupt_node;
338extern vnet_device_class_t vhost_user_device_class;
339extern vlib_node_registration_t vhost_user_input_node;
340extern vhost_user_main_t vhost_user_main;
341
Ed Warnickecb9cada2015-12-08 15:45:58 -0700342#endif
Damjan Marion00a9dca2016-08-17 17:05:46 +0200343
/*
 * fd.io coding-style-patch-verification: ON
 *
 * Local Variables:
 * eval: (c-set-style "gnu")
 * End:
 */