blob: 2cb301ce291e0f963aa638e08c91adc1ff752bbd [file] [log] [blame]
Ed Warnickecb9cada2015-12-08 15:45:58 -07001/*
2 * Copyright (c) 2015 Cisco and/or its affiliates.
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at:
6 *
7 * http://www.apache.org/licenses/LICENSE-2.0
8 *
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
14 */
15#ifndef __included_dpdk_h__
16#define __included_dpdk_h__
17
18/* $$$$ We should rename always_inline -> clib_always_inline */
19#undef always_inline
20
21#include <rte_config.h>
22
23#include <rte_common.h>
24#include <rte_dev.h>
25#include <rte_log.h>
26#include <rte_memory.h>
Ed Warnickecb9cada2015-12-08 15:45:58 -070027#include <rte_memzone.h>
28#include <rte_tailq.h>
29#include <rte_eal.h>
30#include <rte_per_lcore.h>
31#include <rte_launch.h>
32#include <rte_atomic.h>
33#include <rte_cycles.h>
34#include <rte_prefetch.h>
35#include <rte_lcore.h>
36#include <rte_per_lcore.h>
37#include <rte_branch_prediction.h>
38#include <rte_interrupts.h>
39#include <rte_pci.h>
40#include <rte_random.h>
41#include <rte_debug.h>
42#include <rte_ether.h>
43#include <rte_ethdev.h>
44#include <rte_ring.h>
45#include <rte_mempool.h>
46#include <rte_mbuf.h>
Damjan Marione90892e2016-02-23 19:20:28 +010047#ifdef RTE_LIBRTE_KNI
Ed Warnickecb9cada2015-12-08 15:45:58 -070048#include <rte_kni.h>
Damjan Marione90892e2016-02-23 19:20:28 +010049#endif
Ed Warnickecb9cada2015-12-08 15:45:58 -070050#include <rte_virtio_net.h>
51#include <rte_pci_dev_ids.h>
52#include <rte_version.h>
John Lod9bf9ab2016-02-25 11:17:55 -050053#include <rte_eth_bond.h>
Ed Warnickecb9cada2015-12-08 15:45:58 -070054
55#include <vnet/unix/pcap.h>
56#include <vnet/devices/virtio/vhost-user.h>
57
/*
 * Re-establish always_inline, which is #undef'd above before the DPDK
 * headers are included.  When CLIB_DEBUG > 0 it is a plain "static inline";
 * otherwise the always_inline attribute is added as well.
 */
#if CLIB_DEBUG > 0
#define always_inline static inline
#else
#define always_inline static inline __attribute__ ((__always_inline__))
#endif
63
Damjan Marion1f0da172016-07-13 22:44:18 +020064#if RTE_VERSION < RTE_VERSION_NUM(16, 7, 0, 0)
65#define DPDK_VHOST_USER 1
66#else
67#define DPDK_VHOST_USER 0
68#endif
69
Damjan Marionc68b4cb2016-05-25 20:11:33 +020070#include <vlib/pci/pci.h>
71
/* Mbuf count constant: 16 << 10 == 16384. */
#define NB_MBUF   (16 << 10)
Ed Warnickecb9cada2015-12-08 15:45:58 -070073
Damjan Marionb8abf872016-03-14 20:02:35 +010074extern vnet_device_class_t dpdk_device_class;
Jean-Mickael Guerin8941ec22016-03-04 14:14:21 +010075extern vlib_node_registration_t dpdk_input_node;
Jean-Mickael Guerin8941ec22016-03-04 14:14:21 +010076extern vlib_node_registration_t handoff_dispatch_node;
Ed Warnickecb9cada2015-12-08 15:45:58 -070077
/*
 * Table of known poll-mode drivers (PMDs).
 * Each entry is _(string, suffix); the user defines _() before expanding
 * the table.  The string is presumably the driver name as reported by
 * DPDK -- confirm against the code that matches on it.
 */
#define foreach_dpdk_pmd                \
  _ ("rte_nicvf_pmd", THUNDERX)         \
  _ ("rte_em_pmd", E1000EM)             \
  _ ("rte_igb_pmd", IGB)                \
  _ ("rte_igbvf_pmd", IGBVF)            \
  _ ("rte_ixgbe_pmd", IXGBE)            \
  _ ("rte_ixgbevf_pmd", IXGBEVF)        \
  _ ("rte_i40e_pmd", I40E)              \
  _ ("rte_i40evf_pmd", I40EVF)          \
  _ ("rte_virtio_pmd", VIRTIO)          \
  _ ("rte_enic_pmd", ENIC)              \
  _ ("rte_vmxnet3_pmd", VMXNET3)        \
  _ ("AF_PACKET PMD", AF_PACKET)        \
  _ ("rte_bond_pmd", BOND)              \
  _ ("rte_pmd_fm10k", FM10K)            \
  _ ("rte_cxgbe_pmd", CXGBE)            \
  _ ("rte_dpaa2_dpni", DPAA2)

/*
 * PMD identifiers: VNET_DPDK_PMD_NONE (0), then one VNET_DPDK_PMD_<suffix>
 * per foreach_dpdk_pmd entry in table order, then VNET_DPDK_PMD_UNKNOWN.
 */
typedef enum
{
  VNET_DPDK_PMD_NONE,
#define _(s,f) VNET_DPDK_PMD_##f,
  foreach_dpdk_pmd
#undef _
    VNET_DPDK_PMD_UNKNOWN,      /* must be last */
} dpdk_pmd_t;
104
/* Port type classification stored in dpdk_device_t.port_type. */
typedef enum
{
  VNET_DPDK_PORT_TYPE_ETH_1G,
  VNET_DPDK_PORT_TYPE_ETH_10G,
  VNET_DPDK_PORT_TYPE_ETH_40G,
  VNET_DPDK_PORT_TYPE_ETH_BOND,
  VNET_DPDK_PORT_TYPE_ETH_SWITCH,
  VNET_DPDK_PORT_TYPE_AF_PACKET,
  VNET_DPDK_PORT_TYPE_UNKNOWN,
} dpdk_port_type_t;
115
Damjan Marion25665672016-08-16 18:56:08 +0200116typedef struct
117{
Ed Warnickecb9cada2015-12-08 15:45:58 -0700118 f64 deadline;
Damjan Marion25665672016-08-16 18:56:08 +0200119 vlib_frame_t *frame;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700120} dpdk_frame_t;
121
122#define DPDK_EFD_MAX_DISCARD_RATE 10
123
Damjan Marion25665672016-08-16 18:56:08 +0200124typedef struct
125{
Ed Warnickecb9cada2015-12-08 15:45:58 -0700126 u16 last_burst_sz;
127 u16 max_burst_sz;
128 u32 full_frames_cnt;
129 u32 consec_full_frames_cnt;
130 u32 congestion_cnt;
131 u64 last_poll_time;
132 u64 max_poll_delay;
133 u32 discard_cnt;
134 u32 total_packet_cnt;
135} dpdk_efd_agent_t;
136
#if DPDK_VHOST_USER
/* Per-vring vhost-user state: file descriptors, interrupt and counters. */
typedef struct
{
  int callfd;
  int kickfd;
  int errfd;
  int enabled;
  u32 callfd_idx;
  u32 n_since_last_int;
  f64 int_deadline;
  u64 packets;
  u64 bytes;
} dpdk_vu_vring;

/*
 * Per-interface vhost-user state: socket information, feature mask, the
 * vring array (two entries per queue pair) and per-memory-region tables.
 */
typedef struct
{
  u32 is_up;
  u32 unix_fd;
  u32 unix_file_index;
  u32 client_fd;
  char sock_filename[256];
  int sock_errno;
  u8 sock_is_server;
  u8 active;

  u64 feature_mask;
  u32 num_vrings;
  dpdk_vu_vring vrings[VHOST_MAX_QUEUE_PAIRS * 2];
  u64 region_addr[VHOST_MEMORY_MAX_NREGIONS];
  u32 region_fd[VHOST_MEMORY_MAX_NREGIONS];
  u64 region_offset[VHOST_MEMORY_MAX_NREGIONS];
} dpdk_vu_intf_t;
#endif
Ed Warnickecb9cada2015-12-08 15:45:58 -0700170
Damjan Marion25665672016-08-16 18:56:08 +0200171typedef void (*dpdk_flowcontrol_callback_t) (vlib_main_t * vm,
172 u32 hw_if_index, u32 n_packets);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700173
174/*
175 * The header for the tx_vector in dpdk_device_t.
176 * Head and tail are indexes into the tx_vector and are of type
177 * u64 so they never overflow.
178 */
Damjan Marion25665672016-08-16 18:56:08 +0200179typedef struct
180{
Ed Warnickecb9cada2015-12-08 15:45:58 -0700181 u64 tx_head;
182 u64 tx_tail;
183} tx_ring_hdr_t;
184
Damjan Marion25665672016-08-16 18:56:08 +0200185typedef struct
186{
187 CLIB_CACHE_LINE_ALIGN_MARK (cacheline0);
Damjan Marion85cdbd02016-02-12 18:00:23 +0100188 volatile u32 **lockp;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700189
190 /* Instance ID */
191 u32 device_index;
192
193 u32 vlib_hw_if_index;
194 u32 vlib_sw_if_index;
195
196 /* next node index if we decide to steal the rx graph arc */
197 u32 per_interface_next_index;
198
199 /* dpdk rte_mbuf rx and tx vectors, VLIB_FRAME_SIZE */
Damjan Marion25665672016-08-16 18:56:08 +0200200 struct rte_mbuf ***tx_vectors; /* one per worker thread */
201 struct rte_mbuf ***rx_vectors;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700202
203 /* vector of traced contexts, per device */
Damjan Marion25665672016-08-16 18:56:08 +0200204 u32 *d_trace_buffers;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700205
Ed Warnickecb9cada2015-12-08 15:45:58 -0700206 dpdk_pmd_t pmd:8;
207 i8 cpu_socket;
208
Damjan Marionb28e4982016-08-22 22:34:38 +0200209 u16 flags;
Damjan Marion56431702016-09-19 13:18:09 +0200210#define DPDK_DEVICE_FLAG_ADMIN_UP (1 << 0)
211#define DPDK_DEVICE_FLAG_PROMISC (1 << 1)
212#define DPDK_DEVICE_FLAG_PMD (1 << 2)
213#define DPDK_DEVICE_FLAG_KNI (1 << 3)
214#define DPDK_DEVICE_FLAG_VHOST_USER (1 << 4)
Damjan Mariona7cc4472016-09-19 13:31:49 +0200215#define DPDK_DEVICE_FLAG_HAVE_SUBIF (1 << 5)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700216
Damjan Marion25665672016-08-16 18:56:08 +0200217 CLIB_CACHE_LINE_ALIGN_MARK (cacheline1);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700218
Damjan Marion25665672016-08-16 18:56:08 +0200219 u8 *interface_name_suffix;
Damjan Marion32f7bc12016-07-21 03:42:37 -0700220
Damjan Mariona7cc4472016-09-19 13:31:49 +0200221 /* number of sub-interfaces */
222 u16 num_subifs;
223
Ed Warnickecb9cada2015-12-08 15:45:58 -0700224 /* PMD related */
225 u16 tx_q_used;
226 u16 rx_q_used;
227 u16 nb_rx_desc;
228 u16 nb_tx_desc;
Damjan Marion25665672016-08-16 18:56:08 +0200229 u16 *cpu_socket_id_by_queue;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700230 struct rte_eth_conf port_conf;
231 struct rte_eth_txconf tx_conf;
232
233 /* KNI related */
234 struct rte_kni *kni;
235 u8 kni_port_id;
236
Damjan Marion1f0da172016-07-13 22:44:18 +0200237#if DPDK_VHOST_USER
Ed Warnickecb9cada2015-12-08 15:45:58 -0700238 /* vhost-user related */
239 u32 vu_if_id;
Damjan Marion25665672016-08-16 18:56:08 +0200240 struct virtio_net vu_vhost_dev;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700241 u32 vu_is_running;
242 dpdk_vu_intf_t *vu_intf;
Damjan Marion1f0da172016-07-13 22:44:18 +0200243#endif
Ed Warnickecb9cada2015-12-08 15:45:58 -0700244
245 /* af_packet */
246 u8 af_packet_port_id;
247
248 struct rte_eth_link link;
249 f64 time_last_link_update;
250
251 struct rte_eth_stats stats;
252 struct rte_eth_stats last_stats;
Sean Hopea4f16a02016-03-28 13:11:31 -0400253 struct rte_eth_stats last_cleared_stats;
Damjan Marion1f0da172016-07-13 22:44:18 +0200254#if RTE_VERSION >= RTE_VERSION_NUM(16, 7, 0, 0)
Damjan Marion25665672016-08-16 18:56:08 +0200255 struct rte_eth_xstat *xstats;
256 struct rte_eth_xstat *last_cleared_xstats;
Damjan Marion1f0da172016-07-13 22:44:18 +0200257#else
Damjan Marion25665672016-08-16 18:56:08 +0200258 struct rte_eth_xstats *xstats;
259 struct rte_eth_xstats *last_cleared_xstats;
Damjan Marion1f0da172016-07-13 22:44:18 +0200260#endif
Ed Warnickecb9cada2015-12-08 15:45:58 -0700261 f64 time_last_stats_update;
262 dpdk_port_type_t port_type;
263
264 dpdk_efd_agent_t efd_agent;
Damjan Marion25665672016-08-16 18:56:08 +0200265 u8 need_txlock; /* Used by VNET_DPDK_DEV_VHOST_USER */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700266} dpdk_device_t;
267
Bud Grisee0ef46b2016-03-30 15:54:58 -0400268
#define DPDK_TX_RING_SIZE (4 * 1024)

/*
 * Stats and link polling intervals, each with a 1 msec minimum.
 * The 10.0 and 3.0 values are presumably in seconds, given the
 * "1msec" annotation on 0.001.
 */
#define DPDK_STATS_POLL_INTERVAL      (10.0)
#define DPDK_MIN_STATS_POLL_INTERVAL  (0.001)   /* 1msec */

#define DPDK_LINK_POLL_INTERVAL       (3.0)
#define DPDK_MIN_LINK_POLL_INTERVAL   (0.001)   /* 1msec */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700276
Damjan Marion25665672016-08-16 18:56:08 +0200277typedef struct
278{
279 CLIB_CACHE_LINE_ALIGN_MARK (cacheline0);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700280
281 /* total input packet counter */
282 u64 aggregate_rx_packets;
283} dpdk_worker_t;
284
Damjan Marion25665672016-08-16 18:56:08 +0200285typedef struct
286{
Ed Warnickecb9cada2015-12-08 15:45:58 -0700287 u32 device;
288 u16 queue_id;
289} dpdk_device_and_queue_t;
290
/* Early-Fast-Discard (EFD) */
/* Mode bits: DISABLED is zero, the three *_ENABLED values are distinct bits. */
#define DPDK_EFD_DISABLED                       0
#define DPDK_EFD_DISCARD_ENABLED                (1 << 0)
#define DPDK_EFD_MONITOR_ENABLED                (1 << 1)
#define DPDK_EFD_DROPALL_ENABLED                (1 << 2)

/* Default thresholds */
#define DPDK_EFD_DEFAULT_DEVICE_QUEUE_HI_THRESH_PCT    90
#define DPDK_EFD_DEFAULT_CONSEC_FULL_FRAMES_HI_THRESH  6
299
Damjan Marion25665672016-08-16 18:56:08 +0200300typedef struct dpdk_efd_t
301{
Ed Warnickecb9cada2015-12-08 15:45:58 -0700302 u16 enabled;
303 u16 queue_hi_thresh;
304 u16 consec_full_frames_hi_thresh;
305 u16 pad;
306} dpdk_efd_t;
307
Damjan Marionc68b4cb2016-05-25 20:11:33 +0200308#define foreach_dpdk_device_config_item \
309 _ (num_rx_queues) \
Damjan Marion39da6212016-06-06 13:21:04 +0200310 _ (num_tx_queues) \
311 _ (num_rx_desc) \
Srivatsa Sangli820e3632016-06-14 13:10:55 -0700312 _ (num_tx_desc) \
313 _ (rss_fn)
Damjan Marionc68b4cb2016-05-25 20:11:33 +0200314
Damjan Marion25665672016-08-16 18:56:08 +0200315typedef struct
316{
317 vlib_pci_addr_t pci_addr;
318 u8 is_blacklisted;
319 u8 vlan_strip_offload;
John Loce3e9712016-07-07 13:54:44 -0400320#define DPDK_DEVICE_VLAN_STRIP_DEFAULT 0
321#define DPDK_DEVICE_VLAN_STRIP_OFF 1
322#define DPDK_DEVICE_VLAN_STRIP_ON 2
323
Damjan Marionc68b4cb2016-05-25 20:11:33 +0200324#define _(x) uword x;
325 foreach_dpdk_device_config_item
326#undef _
Damjan Marion0b140722016-06-14 00:36:09 +0200327 clib_bitmap_t * workers;
Damjan Marionc68b4cb2016-05-25 20:11:33 +0200328} dpdk_device_config_t;
329
Damjan Marion25665672016-08-16 18:56:08 +0200330typedef struct
331{
Ed Warnickecb9cada2015-12-08 15:45:58 -0700332
Damjan Marion64ae6692016-05-25 18:40:13 +0200333 /* Config stuff */
Damjan Marion25665672016-08-16 18:56:08 +0200334 u8 **eal_init_args;
335 u8 *eal_init_args_str;
336 u8 *uio_driver_name;
Damjan Marion64ae6692016-05-25 18:40:13 +0200337 u8 no_multi_seg;
338 u8 enable_tcp_udp_checksum;
339
340 /* Required config parameters */
341 u8 coremask_set_manually;
342 u8 nchannels_set_manually;
343 u32 coremask;
344 u32 nchannels;
345 u32 num_mbufs;
Damjan Marion25665672016-08-16 18:56:08 +0200346 u8 num_kni; /* while kni_init allows u32, port_id in callback fn is only u8 */
Damjan Marion64ae6692016-05-25 18:40:13 +0200347
348 /*
349 * format interface names ala xxxEthernet%d/%d/%d instead of
Damjan Marion137c7c62016-07-06 22:52:49 +0200350 * xxxEthernet%x/%x/%x.
Damjan Marion64ae6692016-05-25 18:40:13 +0200351 */
352 u8 interface_name_format_decimal;
353
354 /* virtio vhost-user switch */
355 u8 use_virtio_vhost;
356
357 /* vhost-user coalescence frames config */
358 u32 vhost_coalesce_frames;
359 f64 vhost_coalesce_time;
360
Damjan Marionc68b4cb2016-05-25 20:11:33 +0200361 /* per-device config */
362 dpdk_device_config_t default_devconf;
Damjan Marion25665672016-08-16 18:56:08 +0200363 dpdk_device_config_t *dev_confs;
364 uword *device_config_index_by_pci_addr;
Damjan Marionc68b4cb2016-05-25 20:11:33 +0200365
Damjan Marion64ae6692016-05-25 18:40:13 +0200366} dpdk_config_main_t;
367
368dpdk_config_main_t dpdk_config_main;
369
Damjan Marion25665672016-08-16 18:56:08 +0200370typedef struct
371{
Damjan Marion64ae6692016-05-25 18:40:13 +0200372
Ed Warnickecb9cada2015-12-08 15:45:58 -0700373 /* Devices */
Damjan Marion25665672016-08-16 18:56:08 +0200374 dpdk_device_t *devices;
375 dpdk_device_and_queue_t **devices_by_cpu;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700376
377 /* per-thread recycle lists */
Damjan Marion25665672016-08-16 18:56:08 +0200378 u32 **recycle;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700379
Dave Barachd81566f2016-02-15 11:34:13 -0500380 /* buffer flags template, configurable to enable/disable tcp / udp cksum */
381 u32 buffer_flags_template;
382
Ed Warnickecb9cada2015-12-08 15:45:58 -0700383 /* flow control callback. If 0 then flow control is disabled */
384 dpdk_flowcontrol_callback_t flowcontrol_callback;
385
386 /* vlib buffer free list, must be same size as an rte_mbuf */
387 u32 vlib_buffer_free_list_index;
388
Ed Warnickecb9cada2015-12-08 15:45:58 -0700389 /* dpdk worker "threads" */
Damjan Marion25665672016-08-16 18:56:08 +0200390 dpdk_worker_t *workers;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700391
Ed Warnickecb9cada2015-12-08 15:45:58 -0700392
393 /* Ethernet input node index */
394 u32 ethernet_input_node_index;
395
Ed Warnickecb9cada2015-12-08 15:45:58 -0700396 /* pcap tracing [only works if (CLIB_DEBUG > 0)] */
397 int tx_pcap_enable;
398 pcap_main_t pcap_main;
Damjan Marion25665672016-08-16 18:56:08 +0200399 u8 *pcap_filename;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700400 u32 pcap_sw_if_index;
401 u32 pcap_pkts_to_capture;
402
Ed Warnickecb9cada2015-12-08 15:45:58 -0700403 /* hashes */
Damjan Marion25665672016-08-16 18:56:08 +0200404 uword *dpdk_device_by_kni_port_id;
405 uword *vu_sw_if_index_by_listener_fd;
406 uword *vu_sw_if_index_by_sock_fd;
407 u32 *vu_inactive_interfaces_device_index;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700408
409 u32 next_vu_if_id;
410
411 /* efd (early-fast-discard) settings */
412 dpdk_efd_t efd;
413
414 /*
415 * flag indicating that a posted admin up/down
416 * (via post_sw_interface_set_flags) is in progress
417 */
418 u8 admin_up_down_in_progress;
419
Damjan Marionc68b4cb2016-05-25 20:11:33 +0200420 u8 use_rss;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700421
422 /* which cpus are running dpdk-input */
423 int input_cpu_first_index;
424 int input_cpu_count;
425
Bud Grise02301ef2016-02-24 16:09:05 -0500426 /* control interval of dpdk link state and stat polling */
427 f64 link_state_poll_interval;
428 f64 stat_poll_interval;
429
Dave Barach08602d12016-06-04 14:10:59 -0400430 /* Sleep for this many MS after each device poll */
431 u32 poll_sleep;
432
Ed Warnickecb9cada2015-12-08 15:45:58 -0700433 /* convenience */
Damjan Marion25665672016-08-16 18:56:08 +0200434 vlib_main_t *vlib_main;
435 vnet_main_t *vnet_main;
436 dpdk_config_main_t *conf;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700437} dpdk_main_t;
438
439dpdk_main_t dpdk_main;
440
/*
 * Next-node indices for received packets.  DPDK_RX_N_NEXT is the number of
 * entries and must stay last.
 */
typedef enum
{
  DPDK_RX_NEXT_IP4_INPUT,
  DPDK_RX_NEXT_IP6_INPUT,
  DPDK_RX_NEXT_MPLS_INPUT,
  DPDK_RX_NEXT_ETHERNET_INPUT,
  DPDK_RX_NEXT_DROP,
  DPDK_RX_N_NEXT,
} dpdk_rx_next_t;
450
Damjan Marion25665672016-08-16 18:56:08 +0200451typedef struct
452{
Damjan Marion7f620972016-02-25 16:00:11 +0100453 u32 buffer_index;
454 u16 device_index;
455 u8 queue_index;
456 struct rte_mbuf mb;
457 /* Copy of VLIB buffer; packet data stored in pre_data. */
458 vlib_buffer_t buffer;
459} dpdk_tx_dma_trace_t;
460
Damjan Marion25665672016-08-16 18:56:08 +0200461typedef struct
462{
Damjan Marion7f620972016-02-25 16:00:11 +0100463 u32 buffer_index;
464 u16 device_index;
465 u16 queue_index;
466 struct rte_mbuf mb;
Damjan Marion25665672016-08-16 18:56:08 +0200467 vlib_buffer_t buffer; /* Copy of VLIB buffer; pkt data stored in pre_data. */
468 u8 data[256]; /* First 256 data bytes, used for hexdump */
Damjan Marion7f620972016-02-25 16:00:11 +0100469} dpdk_rx_dma_trace_t;
470
Ed Warnickecb9cada2015-12-08 15:45:58 -0700471void vnet_buffer_needs_dpdk_mb (vlib_buffer_t * b);
472
473void dpdk_set_next_node (dpdk_rx_next_t, char *);
474
Damjan Marion25665672016-08-16 18:56:08 +0200475clib_error_t *dpdk_set_mac_address (vnet_hw_interface_t * hi, char *address);
Christian Dechamplain2073cfe2016-02-19 12:26:57 -0500476
Damjan Marion25665672016-08-16 18:56:08 +0200477clib_error_t *dpdk_set_mc_filter (vnet_hw_interface_t * hi,
478 struct ether_addr mc_addr_vec[], int naddr);
Christian Dechamplain2073cfe2016-02-19 12:26:57 -0500479
Ed Warnickecb9cada2015-12-08 15:45:58 -0700480void dpdk_thread_input (dpdk_main_t * dm, dpdk_device_t * xd);
481
Damjan Marion25665672016-08-16 18:56:08 +0200482clib_error_t *dpdk_port_setup (dpdk_main_t * dm, dpdk_device_t * xd);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700483
Damjan Marion25665672016-08-16 18:56:08 +0200484void dpdk_set_flowcontrol_callback (vlib_main_t * vm,
485 dpdk_flowcontrol_callback_t callback);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700486
487u32 dpdk_interface_tx_vector (vlib_main_t * vm, u32 dev_instance);
488
Damjan Marion25665672016-08-16 18:56:08 +0200489void set_efd_bitmap (u8 * bitmap, u32 value, u32 op);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700490
Damjan Marion25665672016-08-16 18:56:08 +0200491struct rte_mbuf *dpdk_replicate_packet_mb (vlib_buffer_t * b);
492struct rte_mbuf *dpdk_zerocopy_replicate_packet_mb (vlib_buffer_t * b);
Keith Burns (alagalah)52fc44d2016-03-25 09:38:50 -0700493
/*
 * Table of error counters.  Each entry is _(suffix, description string);
 * the user defines _() before expanding the table.
 */
#define foreach_dpdk_error                                              \
  _(NONE, "no error")                                                   \
  _(RX_PACKET_ERROR, "Rx packet errors")                                \
  _(RX_BAD_FCS, "Rx bad fcs")                                           \
  _(L4_CHECKSUM_ERROR, "Rx L4 checksum errors")                         \
  _(IP_CHECKSUM_ERROR, "Rx ip checksum errors")                         \
  _(RX_ALLOC_FAIL, "rx buf alloc from free list failed")                \
  _(RX_ALLOC_NO_PHYSMEM, "rx buf alloc failed no physmem")              \
  _(RX_ALLOC_DROP_PKTS, "rx packets dropped due to alloc error")        \
  _(IPV4_EFD_DROP_PKTS, "IPV4 Early Fast Discard rx drops")             \
  _(IPV6_EFD_DROP_PKTS, "IPV6 Early Fast Discard rx drops")             \
  _(MPLS_EFD_DROP_PKTS, "MPLS Early Fast Discard rx drops")             \
  _(VLAN_EFD_DROP_PKTS, "VLAN Early Fast Discard rx drops")

/*
 * Error indices: one DPDK_ERROR_<suffix> per foreach_dpdk_error entry in
 * table order, followed by DPDK_N_ERROR (the number of entries).
 */
typedef enum
{
#define _(f,s) DPDK_ERROR_##f,
  foreach_dpdk_error
#undef _
    DPDK_N_ERROR,
} dpdk_error_t;
515
516/*
517 * Increment EFD drop counter
518 */
Damjan Marion25665672016-08-16 18:56:08 +0200519static_always_inline void
520increment_efd_drop_counter (vlib_main_t * vm, u32 counter_index, u32 count)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700521{
Damjan Marion25665672016-08-16 18:56:08 +0200522 vlib_node_t *my_n;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700523
Damjan Marion25665672016-08-16 18:56:08 +0200524 my_n = vlib_get_node (vm, dpdk_input_node.index);
525 vm->error_main.counters[my_n->error_heap_index + counter_index] += count;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700526}
527
Bud Grise02301ef2016-02-24 16:09:05 -0500528int dpdk_set_stat_poll_interval (f64 interval);
529int dpdk_set_link_state_poll_interval (f64 interval);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700530void dpdk_update_link_state (dpdk_device_t * xd, f64 now);
Damjan Marion25665672016-08-16 18:56:08 +0200531void dpdk_device_lock_init (dpdk_device_t * xd);
532void dpdk_device_lock_free (dpdk_device_t * xd);
533void dpdk_efd_update_counters (dpdk_device_t * xd, u32 n_buffers,
534 u16 enabled);
535u32 is_efd_discardable (vlib_thread_main_t * tm, vlib_buffer_t * b0,
536 struct rte_mbuf *mb);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700537
Damjan Marion1f0da172016-07-13 22:44:18 +0200538#if DPDK_VHOST_USER
Ed Warnickecb9cada2015-12-08 15:45:58 -0700539/* dpdk vhost-user interrupt management */
Damjan Marion25665672016-08-16 18:56:08 +0200540u8 dpdk_vhost_user_want_interrupt (dpdk_device_t * xd, int idx);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700541void dpdk_vhost_user_send_interrupt (vlib_main_t * vm, dpdk_device_t * xd,
Damjan Marion25665672016-08-16 18:56:08 +0200542 int idx);
Damjan Marion1f0da172016-07-13 22:44:18 +0200543#endif
Ed Warnickecb9cada2015-12-08 15:45:58 -0700544
545
Damjan Marion25665672016-08-16 18:56:08 +0200546static inline u64
547vnet_get_aggregate_rx_packets (void)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700548{
Damjan Marion25665672016-08-16 18:56:08 +0200549 dpdk_main_t *dm = &dpdk_main;
550 u64 sum = 0;
551 dpdk_worker_t *dw;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700552
Damjan Marion25665672016-08-16 18:56:08 +0200553 vec_foreach (dw, dm->workers) sum += dw->aggregate_rx_packets;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700554
Damjan Marion25665672016-08-16 18:56:08 +0200555 return sum;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700556}
557
558void dpdk_rx_trace (dpdk_main_t * dm,
Damjan Marion25665672016-08-16 18:56:08 +0200559 vlib_node_runtime_t * node,
560 dpdk_device_t * xd,
561 u16 queue_id, u32 * buffers, uword n_buffers);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700562
563#define EFD_OPERATION_LESS_THAN 0
564#define EFD_OPERATION_GREATER_OR_EQUAL 1
565
Damjan Marion25665672016-08-16 18:56:08 +0200566void efd_config (u32 enabled,
567 u32 ip_prec, u32 ip_op,
568 u32 mpls_exp, u32 mpls_op, u32 vlan_cos, u32 vlan_op);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700569
Damjan Marion25665672016-08-16 18:56:08 +0200570void post_sw_interface_set_flags (vlib_main_t * vm, u32 sw_if_index,
571 u32 flags);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700572
#if DPDK_VHOST_USER
/* vhost-user API; declared only when DPDK_VHOST_USER is non-zero. */
typedef struct vhost_user_memory vhost_user_memory_t;

void dpdk_vhost_user_process_init (void **ctx);
void dpdk_vhost_user_process_cleanup (void *ctx);
uword dpdk_vhost_user_process_if (vlib_main_t * vm, dpdk_device_t * xd,
                                  void *ctx);

// vhost-user calls
int dpdk_vhost_user_create_if (vnet_main_t * vnm, vlib_main_t * vm,
                               const char *sock_filename,
                               u8 is_server,
                               u32 * sw_if_index,
                               u64 feature_mask,
                               u8 renumber, u32 custom_dev_instance,
                               u8 * hwaddr);
int dpdk_vhost_user_modify_if (vnet_main_t * vnm, vlib_main_t * vm,
                               const char *sock_filename,
                               u8 is_server,
                               u32 sw_if_index,
                               u64 feature_mask,
                               u8 renumber, u32 custom_dev_instance);
int dpdk_vhost_user_delete_if (vnet_main_t * vnm, vlib_main_t * vm,
                               u32 sw_if_index);
int dpdk_vhost_user_dump_ifs (vnet_main_t * vnm, vlib_main_t * vm,
                              vhost_user_intf_details_t ** out_vuids);
#endif
Ed Warnickecb9cada2015-12-08 15:45:58 -0700600
601u32 dpdk_get_admin_up_down_in_progress (void);
602
Todd Foggoa (tfoggoa)a30d40d2016-03-17 16:54:30 -0400603u32 dpdk_num_mbufs (void);
604
Damjan Marion25665672016-08-16 18:56:08 +0200605dpdk_pmd_t dpdk_get_pmd_type (vnet_hw_interface_t * hi);
Todd Foggoa (tfoggoa)a30d40d2016-03-17 16:54:30 -0400606
Damjan Marion25665672016-08-16 18:56:08 +0200607i8 dpdk_get_cpu_socket (vnet_hw_interface_t * hi);
Todd Foggoa (tfoggoa)a30d40d2016-03-17 16:54:30 -0400608
Damjan Marion25665672016-08-16 18:56:08 +0200609void *dpdk_input_multiarch_select ();
610void *dpdk_input_rss_multiarch_select ();
611void *dpdk_input_efd_multiarch_select ();
Ed Warnickecb9cada2015-12-08 15:45:58 -0700612
Damjan Marion25665672016-08-16 18:56:08 +0200613clib_error_t *dpdk_get_hw_interface_stats (u32 hw_if_index,
614 struct rte_eth_stats *dest);
Sean Hopea4f16a02016-03-28 13:11:31 -0400615
Damjan Marion7f620972016-02-25 16:00:11 +0100616format_function_t format_dpdk_device_name;
617format_function_t format_dpdk_device;
618format_function_t format_dpdk_tx_dma_trace;
619format_function_t format_dpdk_rx_dma_trace;
620format_function_t format_dpdk_rte_mbuf;
621format_function_t format_dpdk_rx_rte_mbuf;
622unformat_function_t unformat_socket_mem;
Damjan Marion25665672016-08-16 18:56:08 +0200623clib_error_t *unformat_rss_fn (unformat_input_t * input, uword * rss_fn);
Damjan Marion7f620972016-02-25 16:00:11 +0100624
Damjan Marionaa04a0f2016-04-01 12:34:24 +0200625
/*
 * Take the address of one entry point per PMD enabled in the DPDK build
 * configuration (RTE_LIBRTE_* macros).  Each address is stored into a
 * volatile function pointer that is never called; the store only creates a
 * reference to the symbol.  With no RTE_LIBRTE_* macro defined the function
 * body is empty.
 */
static inline void
dpdk_pmd_constructor_init (void)
{
  /* Add references to DPDK Driver Constructor functions to get the dynamic
   * loader to pull in the driver library & run the constructors.
   */
#define _(d)                                            \
  do {                                                  \
    void devinitfn_ ##d(void);                          \
    __attribute__((unused)) void (* volatile pf)(void); \
    pf = devinitfn_ ##d;                                \
  } while (0)

#ifdef RTE_LIBRTE_EM_PMD
  _(em_pmd_drv);
#endif
#ifdef RTE_LIBRTE_IGB_PMD
  _(pmd_igb_drv);
#endif
#ifdef RTE_LIBRTE_IXGBE_PMD
  _(rte_ixgbe_driver);
#endif
#ifdef RTE_LIBRTE_I40E_PMD
  _(rte_i40e_driver);
  _(rte_i40evf_driver);
#endif
#ifdef RTE_LIBRTE_FM10K_PMD
  _(rte_fm10k_driver);
#endif
#ifdef RTE_LIBRTE_VIRTIO_PMD
  _(rte_virtio_driver);
#endif
#ifdef RTE_LIBRTE_VMXNET3_PMD
  _(rte_vmxnet3_driver);
#endif
#ifdef RTE_LIBRTE_VICE_PMD
  _(rte_vice_driver);
#endif
#ifdef RTE_LIBRTE_ENIC_PMD
  _(rte_enic_driver);
#endif
#ifdef RTE_LIBRTE_PMD_AF_PACKET
  _(pmd_af_packet_drv);
#endif
#ifdef RTE_LIBRTE_CXGBE_PMD
  _(rte_cxgbe_driver);
#endif
#ifdef RTE_LIBRTE_PMD_BOND
  _(bond_drv);
#endif
#ifdef RTE_LIBRTE_DPAA2_PMD
  _(pmd_dpaa2_drv);
#endif
#undef _

/*
 * At the moment, the ThunderX NIC driver doesn't have
 * an entry point named "devinitfn_rte_xxx_driver"
 */
#define _(d)                                            \
  do {                                                  \
    void d(void);                                       \
    __attribute__((unused)) void (* volatile pf)(void); \
    pf = d;                                             \
  } while (0)

#ifdef RTE_LIBRTE_THUNDERVNIC_PMD
  _(rte_nicvf_pmd_init);
#endif
#undef _
}
694
Todd Foggoae3eefff2016-05-20 22:10:34 -0400695uword
696admin_up_down_process (vlib_main_t * vm,
Damjan Marion25665672016-08-16 18:56:08 +0200697 vlib_node_runtime_t * rt, vlib_frame_t * f);
Todd Foggoae3eefff2016-05-20 22:10:34 -0400698
Ed Warnickecb9cada2015-12-08 15:45:58 -0700699#endif /* __included_dpdk_h__ */
Damjan Marion25665672016-08-16 18:56:08 +0200700
701/*
702 * fd.io coding-style-patch-verification: ON
703 *
704 * Local Variables:
705 * eval: (c-set-style "gnu")
706 * End:
707 */