blob: 7dadfed23340b02efefa4cb9ec5291a33f59e6d2 [file] [log] [blame]
Ed Warnickecb9cada2015-12-08 15:45:58 -07001/*
2 * Copyright (c) 2015 Cisco and/or its affiliates.
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at:
6 *
7 * http://www.apache.org/licenses/LICENSE-2.0
8 *
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
14 */
15#ifndef __VIRTIO_VHOST_USER_H__
16#define __VIRTIO_VHOST_USER_H__
17/* vhost-user data structures */
18
/* Sizing limits used by the vhost-user structures in this header. */
#define VHOST_MEMORY_MAX_NREGIONS 8
#define VHOST_USER_MSG_HDR_SZ 12
#define VHOST_VRING_MAX_SIZE 32768
#define VHOST_VRING_MAX_N 16	/* 8 TX + 8 RX */

/*
 * Map a queue id to a vring index: RX uses index 2 * qid and TX uses
 * 2 * qid + 1.  The argument is parenthesized so that an expression
 * argument such as VHOST_VRING_IDX_TX (q + 1) expands to 2 * (q + 1) + 1
 * rather than 2 * q + 1 + 1.
 */
#define VHOST_VRING_IDX_RX(qid) (2 * (qid))
#define VHOST_VRING_IDX_TX(qid) (2 * (qid) + 1)
Ed Warnickecb9cada2015-12-08 15:45:58 -070025
/* Mask constants. */
#define VHOST_USER_VRING_NOFD_MASK 0x100
#define VHOST_USER_REPLY_MASK (0x1 << 2)

/* Descriptor flag values (VIRTQ_DESC_F_*). */
#define VIRTQ_DESC_F_NEXT 1
#define VIRTQ_DESC_F_INDIRECT 4

/* Bit positions (not masks) of the individual protocol features. */
#define VHOST_USER_PROTOCOL_F_MQ 0
#define VHOST_USER_PROTOCOL_F_LOG_SHMFD 1

#define VHOST_VRING_F_LOG 0

/* Bit position of the "protocol features" feature. */
#define VHOST_USER_F_PROTOCOL_FEATURES 30

/* Bitmask built from the two protocol feature bits above: MQ | LOG_SHMFD. */
#define VHOST_USER_PROTOCOL_FEATURES                    \
  ((1ULL << VHOST_USER_PROTOCOL_F_MQ)                   \
   | (1ULL << VHOST_USER_PROTOCOL_F_LOG_SHMFD))
Shesha Sreenivasamurthyb8f45b32016-02-03 09:38:36 -080038
/* If multiqueue is provided by host, then we support it. */
/* Multiqueue control constants. */
#define VIRTIO_NET_CTRL_MQ 4
#define VIRTIO_NET_CTRL_MQ_VQ_PAIRS_SET 0

/* Bounds named for the number of virtqueue pairs: 1 .. 0x8000. */
#define VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MIN 1
#define VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MAX 0x8000
Ed Warnickecb9cada2015-12-08 15:45:58 -070044
/* Notification / interrupt suppression flag values (both are bit 0). */
#define VRING_AVAIL_F_NO_INTERRUPT 1
#define VRING_USED_F_NO_NOTIFY 1
Pierre Pfistere21c5282016-09-21 08:04:59 +010047
/*
 * Log a DEBUG-level message through vhost_user_main.log_default.
 *
 * dev: pointer to an object with a hw_if_index member; that index is
 *      passed to format_vnet_hw_if_index_name to build the "%U: " prefix.
 * f:   format string.  It must be a string literal because it is pasted
 *      after the "%U: " prefix by literal concatenation.
 * ...: optional arguments consumed by f.
 *
 * The body is wrapped in do { } while (0) so that the macro expands to a
 * single statement: it is safe in an unbraced if/else and must be
 * terminated with a semicolon by the caller.  dev is parenthesized so an
 * expression argument is dereferenced as a whole.
 */
#define vu_log_debug(dev, f, ...)                                       \
  do                                                                    \
    {                                                                   \
      vlib_log (VLIB_LOG_LEVEL_DEBUG, vhost_user_main.log_default,      \
                "%U: " f, format_vnet_hw_if_index_name,                 \
                vnet_get_main (), (dev)->hw_if_index, ##__VA_ARGS__);   \
    }                                                                   \
  while (0)
Mohsin Kazmie7cde312018-06-26 17:20:11 +020054
/*
 * Log a WARNING-level message through vhost_user_main.log_default.
 *
 * dev: pointer to an object with a hw_if_index member; that index is
 *      passed to format_vnet_hw_if_index_name to build the "%U: " prefix.
 * f:   format string.  It must be a string literal because it is pasted
 *      after the "%U: " prefix by literal concatenation.
 * ...: optional arguments consumed by f.
 *
 * The body is wrapped in do { } while (0) so that the macro expands to a
 * single statement: it is safe in an unbraced if/else and must be
 * terminated with a semicolon by the caller.  dev is parenthesized so an
 * expression argument is dereferenced as a whole.
 */
#define vu_log_warn(dev, f, ...)                                        \
  do                                                                    \
    {                                                                   \
      vlib_log (VLIB_LOG_LEVEL_WARNING, vhost_user_main.log_default,    \
                "%U: " f, format_vnet_hw_if_index_name,                 \
                vnet_get_main (), (dev)->hw_if_index, ##__VA_ARGS__);   \
    }                                                                   \
  while (0)
/*
 * Log an ERR-level message through vhost_user_main.log_default.
 *
 * dev: pointer to an object with a hw_if_index member; that index is
 *      passed to format_vnet_hw_if_index_name to build the "%U: " prefix.
 * f:   format string.  It must be a string literal because it is pasted
 *      after the "%U: " prefix by literal concatenation.
 * ...: optional arguments consumed by f.
 *
 * The body is wrapped in do { } while (0) so that the macro expands to a
 * single statement: it is safe in an unbraced if/else and must be
 * terminated with a semicolon by the caller.  dev is parenthesized so an
 * expression argument is dereferenced as a whole.
 */
#define vu_log_err(dev, f, ...)                                         \
  do                                                                    \
    {                                                                   \
      vlib_log (VLIB_LOG_LEVEL_ERR, vhost_user_main.log_default,        \
                "%U: " f, format_vnet_hw_if_index_name,                 \
                vnet_get_main (), (dev)->hw_if_index, ##__VA_ARGS__);   \
    }                                                                   \
  while (0)
Mohsin Kazmie7cde312018-06-26 17:20:11 +020067
/*
 * Translate an index into file_main.file_pool to the file descriptor stored
 * in that pool element.  An index equal to ~0 yields -1 instead of a pool
 * lookup.  The argument is evaluated exactly once.
 */
#define UNIX_GET_FD(unixfd_idx)                                         \
  ({                                                                    \
    typeof (unixfd_idx) _vu_file_idx = (unixfd_idx);                    \
    (_vu_file_idx == ~0) ?                                              \
      -1 :                                                              \
      pool_elt_at_index (file_main.file_pool,                           \
                         _vu_file_idx)->file_descriptor;                \
  })
73
/*
 * Trace flags as (name, index, description) triples.  The list is expanded
 * by defining _(n, i, s) before referencing it.
 */
#define foreach_virtio_trace_flags                          \
  _ (SIMPLE_CHAINED, 0, "Simple descriptor chaining")       \
  _ (SINGLE_DESC, 1, "Single descriptor packet")            \
  _ (INDIRECT, 2, "Indirect descriptor")                    \
  _ (MAP_ERROR, 4, "Memory mapping error")

/*
 * VIRTIO_TRACE_F_<name> takes the index declared in the table above.
 * Previously the index column was ignored and the enumerators were numbered
 * implicitly, which made VIRTIO_TRACE_F_MAP_ERROR equal to 3 although the
 * table declares 4.  Assigning the index explicitly keeps the enum and the
 * table in agreement, in the same way virtio_net_feature_t does.
 */
typedef enum
{
#define _(n,i,s) VIRTIO_TRACE_F_##n = (i),
  foreach_virtio_trace_flags
#undef _
} virtio_trace_flag_t;
86
/*
 * Feature list as (name, bit number) pairs.  The list is expanded by
 * defining _(name, bit) before referencing it.
 */
#define foreach_virtio_net_feature              \
  _ (VIRTIO_NET_F_MRG_RXBUF, 15)                \
  _ (VIRTIO_NET_F_CTRL_VQ, 17)                  \
  _ (VIRTIO_NET_F_GUEST_ANNOUNCE, 21)           \
  _ (VIRTIO_NET_F_MQ, 22)                       \
  _ (VHOST_F_LOG_ALL, 26)                       \
  _ (VIRTIO_F_ANY_LAYOUT, 27)                   \
  _ (VIRTIO_F_INDIRECT_DESC, 28)                \
  _ (VHOST_USER_F_PROTOCOL_FEATURES, 30)        \
  _ (VIRTIO_F_VERSION_1, 32)

/* FEAT_<name> equals the bit number listed for <name> above. */
typedef enum
{
#define _(feat, bit) FEAT_##feat = (bit),
  foreach_virtio_net_feature
#undef _
} virtio_net_feature_t;
104
Damjan Marion00a9dca2016-08-17 17:05:46 +0200105int vhost_user_create_if (vnet_main_t * vnm, vlib_main_t * vm,
106 const char *sock_filename, u8 is_server,
107 u32 * sw_if_index, u64 feature_mask,
Stevenf3b53642017-05-01 14:03:02 -0700108 u8 renumber, u32 custom_dev_instance, u8 * hwaddr);
Damjan Marion00a9dca2016-08-17 17:05:46 +0200109int vhost_user_modify_if (vnet_main_t * vnm, vlib_main_t * vm,
110 const char *sock_filename, u8 is_server,
111 u32 sw_if_index, u64 feature_mask,
Stevenf3b53642017-05-01 14:03:02 -0700112 u8 renumber, u32 custom_dev_instance);
Damjan Marion00a9dca2016-08-17 17:05:46 +0200113int vhost_user_delete_if (vnet_main_t * vnm, vlib_main_t * vm,
114 u32 sw_if_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700115
Pierre Pfistere21c5282016-09-21 08:04:59 +0100116/* *INDENT-OFF* */
Damjan Marion00a9dca2016-08-17 17:05:46 +0200117typedef struct vhost_user_memory_region
118{
Ed Warnickecb9cada2015-12-08 15:45:58 -0700119 u64 guest_phys_addr;
120 u64 memory_size;
121 u64 userspace_addr;
122 u64 mmap_offset;
Pierre Pfistere21c5282016-09-21 08:04:59 +0100123} __attribute ((packed)) vhost_user_memory_region_t;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700124
Damjan Marion00a9dca2016-08-17 17:05:46 +0200125typedef struct vhost_user_memory
126{
Ed Warnickecb9cada2015-12-08 15:45:58 -0700127 u32 nregions;
128 u32 padding;
129 vhost_user_memory_region_t regions[VHOST_MEMORY_MAX_NREGIONS];
Pierre Pfistere21c5282016-09-21 08:04:59 +0100130} __attribute ((packed)) vhost_user_memory_t;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700131
Damjan Marion00a9dca2016-08-17 17:05:46 +0200132typedef struct
133{
Pierre Pfistere21c5282016-09-21 08:04:59 +0100134 u32 index, num;
135} __attribute ((packed)) vhost_vring_state_t;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700136
Damjan Marion00a9dca2016-08-17 17:05:46 +0200137typedef struct
138{
Pierre Pfistere21c5282016-09-21 08:04:59 +0100139 u32 index, flags;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700140 u64 desc_user_addr, used_user_addr, avail_user_addr, log_guest_addr;
Pierre Pfistere21c5282016-09-21 08:04:59 +0100141} __attribute ((packed)) vhost_vring_addr_t;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700142
Damjan Marion00a9dca2016-08-17 17:05:46 +0200143typedef struct vhost_user_log
144{
Yoann Desmouceaux4667c222016-02-24 22:51:00 +0100145 u64 size;
146 u64 offset;
Pierre Pfistere21c5282016-09-21 08:04:59 +0100147} __attribute ((packed)) vhost_user_log_t;
Yoann Desmouceaux4667c222016-02-24 22:51:00 +0100148
/*
 * Request codes.  Values are assigned explicitly from 0 to 18;
 * VHOST_USER_MAX is one past the last request code.
 */
typedef enum vhost_user_req
{
  VHOST_USER_NONE                  = 0,
  VHOST_USER_GET_FEATURES          = 1,
  VHOST_USER_SET_FEATURES          = 2,
  VHOST_USER_SET_OWNER             = 3,
  VHOST_USER_RESET_OWNER           = 4,
  VHOST_USER_SET_MEM_TABLE         = 5,
  VHOST_USER_SET_LOG_BASE          = 6,
  VHOST_USER_SET_LOG_FD            = 7,
  VHOST_USER_SET_VRING_NUM         = 8,
  VHOST_USER_SET_VRING_ADDR        = 9,
  VHOST_USER_SET_VRING_BASE        = 10,
  VHOST_USER_GET_VRING_BASE        = 11,
  VHOST_USER_SET_VRING_KICK        = 12,
  VHOST_USER_SET_VRING_CALL        = 13,
  VHOST_USER_SET_VRING_ERR         = 14,
  VHOST_USER_GET_PROTOCOL_FEATURES = 15,
  VHOST_USER_SET_PROTOCOL_FEATURES = 16,
  VHOST_USER_GET_QUEUE_NUM         = 17,
  VHOST_USER_SET_VRING_ENABLE      = 18,
  VHOST_USER_MAX
} vhost_user_req_t;
172
/* vring_desc: I/O buffer descriptor (packed). */
typedef struct
{
  /* packet data buffer address */
  uint64_t addr;
  /* packet data buffer size */
  uint32_t len;
  /* descriptor flags */
  uint16_t flags;
  /* optional index of the next descriptor in the chain */
  uint16_t next;
} __attribute__ ((packed)) vring_desc_t;
181
Damjan Marion00a9dca2016-08-17 17:05:46 +0200182typedef struct
183{
Ed Warnickecb9cada2015-12-08 15:45:58 -0700184 uint16_t flags;
Pierre Pfistere21c5282016-09-21 08:04:59 +0100185 volatile uint16_t idx;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700186 uint16_t ring[VHOST_VRING_MAX_SIZE];
187} __attribute ((packed)) vring_avail_t;
188
Damjan Marion00a9dca2016-08-17 17:05:46 +0200189typedef struct
190{
Ed Warnickecb9cada2015-12-08 15:45:58 -0700191 uint16_t flags;
192 uint16_t idx;
Damjan Marion00a9dca2016-08-17 17:05:46 +0200193 struct /* vring_used_elem */
194 {
195 uint32_t id;
196 uint32_t len;
197 } ring[VHOST_VRING_MAX_SIZE];
Ed Warnickecb9cada2015-12-08 15:45:58 -0700198} __attribute ((packed)) vring_used_t;
199
Damjan Marion00a9dca2016-08-17 17:05:46 +0200200typedef struct
201{
Ed Warnickecb9cada2015-12-08 15:45:58 -0700202 u8 flags;
203 u8 gso_type;
204 u16 hdr_len;
205 u16 gso_size;
206 u16 csum_start;
207 u16 csum_offset;
208} __attribute ((packed)) virtio_net_hdr_t;
209
210typedef struct {
211 virtio_net_hdr_t hdr;
212 u16 num_buffers;
213} __attribute ((packed)) virtio_net_hdr_mrg_rxbuf_t;
214
215typedef struct vhost_user_msg {
Damjan Marion00a9dca2016-08-17 17:05:46 +0200216 vhost_user_req_t request;
217 u32 flags;
218 u32 size;
219 union
220 {
221 u64 u64;
222 vhost_vring_state_t state;
223 vhost_vring_addr_t addr;
224 vhost_user_memory_t memory;
225 vhost_user_log_t log;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700226 };
227} __attribute ((packed)) vhost_user_msg_t;
Damjan Marion00a9dca2016-08-17 17:05:46 +0200228/* *INDENT-ON* */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700229
Damjan Marion00a9dca2016-08-17 17:05:46 +0200230typedef struct
231{
Pierre Pfistere21c5282016-09-21 08:04:59 +0100232 CLIB_CACHE_LINE_ALIGN_MARK (cacheline0);
Steven97878892017-08-29 09:23:26 -0700233 u16 qsz_mask;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700234 u16 last_avail_idx;
235 u16 last_used_idx;
Pierre Pfistere21c5282016-09-21 08:04:59 +0100236 u16 n_since_last_int;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700237 vring_desc_t *desc;
238 vring_avail_t *avail;
239 vring_used_t *used;
Pierre Pfistere21c5282016-09-21 08:04:59 +0100240 f64 int_deadline;
241 u8 started;
242 u8 enabled;
243 u8 log_used;
244 //Put non-runtime in a different cache line
245 CLIB_CACHE_LINE_ALIGN_MARK (cacheline1);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700246 int errfd;
247 u32 callfd_idx;
Pierre Pfistere21c5282016-09-21 08:04:59 +0100248 u32 kickfd_idx;
249 u64 log_guest_addr;
Stevenf3b53642017-05-01 14:03:02 -0700250
251 /* The rx queue policy (interrupt/adaptive/polling) for this queue */
252 u32 mode;
Steven Luong67f935e2019-02-01 10:23:56 -0800253
254 /*
255 * It contains the device queue number. -1 if it does not. The idea is
256 * to not invoke vnet_hw_interface_assign_rx_thread and
257 * vnet_hw_interface_unassign_rx_thread more than once for the duration of
258 * the interface even if it is disconnected and reconnected.
259 */
260 i16 qid;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700261} vhost_user_vring_t;
262
/* Event codes for starting and stopping the timer. */
#define VHOST_USER_EVENT_START_TIMER 1
#define VHOST_USER_EVENT_STOP_TIMER  2
Steven7312cc72017-03-15 21:18:55 -0700265
Damjan Marion00a9dca2016-08-17 17:05:46 +0200266typedef struct
267{
268 CLIB_CACHE_LINE_ALIGN_MARK (cacheline0);
Juraj Slobodab192feb2018-10-01 12:42:07 +0200269 u32 is_ready;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700270 u32 admin_up;
Pierre Pfisterdbb3c252016-11-22 10:33:34 +0000271 u32 unix_server_index;
Damjan Marion56dd5432017-09-08 19:52:02 +0200272 u32 clib_file_index;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700273 char sock_filename[256];
274 int sock_errno;
Steven5445f5f2017-04-25 16:16:00 -0700275 uword if_index;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700276 u32 hw_if_index, sw_if_index;
Damjan Marion00a9dca2016-08-17 17:05:46 +0200277
Pierre Pfistere21c5282016-09-21 08:04:59 +0100278 //Feature negotiation
Ed Warnickecb9cada2015-12-08 15:45:58 -0700279 u64 features;
280 u64 feature_mask;
Yoann Desmouceaux4667c222016-02-24 22:51:00 +0100281 u64 protocol_features;
Pierre Pfistere21c5282016-09-21 08:04:59 +0100282
283 //Memory region information
284 u32 nregions;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700285 vhost_user_memory_region_t regions[VHOST_MEMORY_MAX_NREGIONS];
Damjan Marion00a9dca2016-08-17 17:05:46 +0200286 void *region_mmap_addr[VHOST_MEMORY_MAX_NREGIONS];
Damjan Marion37623702016-09-20 11:25:27 +0200287 u64 region_guest_addr_lo[VHOST_MEMORY_MAX_NREGIONS];
288 u64 region_guest_addr_hi[VHOST_MEMORY_MAX_NREGIONS];
Ed Warnickecb9cada2015-12-08 15:45:58 -0700289 u32 region_mmap_fd[VHOST_MEMORY_MAX_NREGIONS];
Pierre Pfistere21c5282016-09-21 08:04:59 +0100290
291 //Virtual rings
292 vhost_user_vring_t vrings[VHOST_VRING_MAX_N];
293 volatile u32 *vring_locks[VHOST_VRING_MAX_N];
294
Ed Warnickecb9cada2015-12-08 15:45:58 -0700295 int virtio_net_hdr_sz;
296 int is_any_layout;
Yoann Desmouceaux4667c222016-02-24 22:51:00 +0100297
Damjan Marion00a9dca2016-08-17 17:05:46 +0200298 void *log_base_addr;
Yoann Desmouceaux4667c222016-02-24 22:51:00 +0100299 u64 log_size;
Pierre Pfistere21c5282016-09-21 08:04:59 +0100300
301 /* Whether to use spinlock or per_cpu_tx_qid assignment */
302 u8 use_tx_spinlock;
303 u16 *per_cpu_tx_qid;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700304} vhost_user_intf_t;
305
Damjan Marion00a9dca2016-08-17 17:05:46 +0200306typedef struct
307{
Pierre Pfisterd3eb90e2016-11-29 15:36:14 +0000308 uword dst;
309 uword src;
310 u32 len;
311} vhost_copy_t;
312
313typedef struct
314{
315 u16 qid; /** The interface queue index (Not the virtio vring idx) */
316 u16 device_index; /** The device index */
317 u32 virtio_ring_flags; /** Runtime queue flags **/
318 u16 first_desc_len; /** Length of the first data descriptor **/
319 virtio_net_hdr_mrg_rxbuf_t hdr; /** Virtio header **/
320} vhost_trace_t;
321
322
/* Array sizes, both derived from VLIB_FRAME_SIZE. */
#define VHOST_USER_RX_BUFFERS_N (2 * VLIB_FRAME_SIZE + 2)
#define VHOST_USER_COPY_ARRAY_N (4 * VLIB_FRAME_SIZE)
325
326typedef struct
327{
Pierre Pfisterd3eb90e2016-11-29 15:36:14 +0000328 u32 rx_buffers_len;
329 u32 rx_buffers[VHOST_USER_RX_BUFFERS_N];
330
331 virtio_net_hdr_mrg_rxbuf_t tx_headers[VLIB_FRAME_SIZE];
332 vhost_copy_t copy[VHOST_USER_COPY_ARRAY_N];
333
334 /* This is here so it doesn't end-up
335 * using stack or registers. */
336 vhost_trace_t *current_trace;
Pierre Pfistere21c5282016-09-21 08:04:59 +0100337} vhost_cpu_t;
338
339typedef struct
340{
Steven5445f5f2017-04-25 16:16:00 -0700341 mhash_t if_index_by_sock_name;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700342 u32 mtu_bytes;
Damjan Marion00a9dca2016-08-17 17:05:46 +0200343 vhost_user_intf_t *vhost_user_interfaces;
Damjan Marion00a9dca2016-08-17 17:05:46 +0200344 u32 *show_dev_instance_by_real_dev_instance;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700345 u32 coalesce_frames;
346 f64 coalesce_time;
347 int dont_dump_vhost_user_memory;
Damjan Marion0dafaa72016-09-20 23:21:02 +0200348
Pierre Pfistere21c5282016-09-21 08:04:59 +0100349 /** Per-CPU data for vhost-user */
350 vhost_cpu_t *cpus;
Pierre Pfisterdbb3c252016-11-22 10:33:34 +0000351
352 /** Pseudo random iterator */
353 u32 random;
Steven7312cc72017-03-15 21:18:55 -0700354
Stevenf3b53642017-05-01 14:03:02 -0700355 /* The number of rx interface/queue pairs in interrupt mode */
356 u32 ifq_count;
Steven388e51a2017-06-01 12:49:23 -0700357
Jerome Tollet2f54c272018-10-02 11:41:11 +0200358 /* logging */
359 vlib_log_class_t log_default;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700360} vhost_user_main_t;
361
Damjan Marion00a9dca2016-08-17 17:05:46 +0200362typedef struct
363{
364 u8 if_name[64];
365 u32 sw_if_index;
366 u32 virtio_net_hdr_sz;
367 u64 features;
368 u8 is_server;
369 u8 sock_filename[256];
370 u32 num_regions;
371 int sock_errno;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700372} vhost_user_intf_details_t;
373
Damjan Marion00a9dca2016-08-17 17:05:46 +0200374int vhost_user_dump_ifs (vnet_main_t * vnm, vlib_main_t * vm,
375 vhost_user_intf_details_t ** out_vuids);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700376
Mohsin Kazmie7cde312018-06-26 17:20:11 +0200377extern vlib_node_registration_t vhost_user_send_interrupt_node;
378extern vnet_device_class_t vhost_user_device_class;
379extern vlib_node_registration_t vhost_user_input_node;
380extern vhost_user_main_t vhost_user_main;
381
Ed Warnickecb9cada2015-12-08 15:45:58 -0700382#endif
Damjan Marion00a9dca2016-08-17 17:05:46 +0200383
384/*
385 * fd.io coding-style-patch-verification: ON
386 *
387 * Local Variables:
388 * eval: (c-set-style "gnu")
389 * End:
390 */