blob: 91c3988b439cd01340c614aa9f19b7eb2f53a350 [file] [log] [blame]
Damjan Marion83243a02016-02-29 13:09:30 +01001/*
2 *------------------------------------------------------------------
3 * af_packet.c - linux kernel packet interface
4 *
5 * Copyright (c) 2016 Cisco and/or its affiliates.
6 * Licensed under the Apache License, Version 2.0 (the "License");
7 * you may not use this file except in compliance with the License.
8 * You may obtain a copy of the License at:
9 *
10 * http://www.apache.org/licenses/LICENSE-2.0
11 *
12 * Unless required by applicable law or agreed to in writing, software
13 * distributed under the License is distributed on an "AS IS" BASIS,
14 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15 * See the License for the specific language governing permissions and
16 * limitations under the License.
17 *------------------------------------------------------------------
18 */
19
20#include <linux/if_ether.h>
21#include <linux/if_packet.h>
22
23#include <vlib/vlib.h>
24#include <vlib/unix/unix.h>
25#include <vnet/ip/ip.h>
26#include <vnet/ethernet/ethernet.h>
27
28#include <vnet/devices/af_packet/af_packet.h>
29
/* Set to 1 to have DBG_SOCK() report socket setup problems via clib_warning. */
#define AF_PACKET_DEBUG_SOCKET 0

/*
 * TX ring geometry requested from the kernel: one block holding
 * AF_PACKET_TX_FRAMES_PER_BLOCK frames of AF_PACKET_TX_FRAME_SIZE bytes each.
 */
#define AF_PACKET_TX_FRAMES_PER_BLOCK 1024
#define AF_PACKET_TX_FRAME_SIZE (2048 * 5)
#define AF_PACKET_TX_BLOCK_NR 1
#define AF_PACKET_TX_FRAME_NR (AF_PACKET_TX_BLOCK_NR * \
                               AF_PACKET_TX_FRAMES_PER_BLOCK)
#define AF_PACKET_TX_BLOCK_SIZE (AF_PACKET_TX_FRAME_SIZE * \
                                 AF_PACKET_TX_FRAMES_PER_BLOCK)

/* RX ring geometry, laid out the same way as the TX ring above. */
#define AF_PACKET_RX_FRAMES_PER_BLOCK 1024
#define AF_PACKET_RX_FRAME_SIZE (2048 * 5)
#define AF_PACKET_RX_BLOCK_NR 1
#define AF_PACKET_RX_FRAME_NR (AF_PACKET_RX_BLOCK_NR * \
                               AF_PACKET_RX_FRAMES_PER_BLOCK)
#define AF_PACKET_RX_BLOCK_SIZE (AF_PACKET_RX_FRAME_SIZE * \
                                 AF_PACKET_RX_FRAMES_PER_BLOCK)

/*
 * Debug logging helper.  Both variants expand to a single statement without
 * a trailing semicolon, so "if (x) DBG_SOCK (...); else ..." parses the same
 * way whether debugging is enabled or not.
 */
#if AF_PACKET_DEBUG_SOCKET == 1
#define DBG_SOCK(args...) do { clib_warning (args); } while (0)
#else
#define DBG_SOCK(args...) do { } while (0)
#endif

/* Defined in net/if.h, but that header clashes with the dpdk headers. */
unsigned int if_nametoindex (const char *ifname);

typedef struct tpacket_req tpacket_req_t;
58
59static u32
Damjan Marion00a9dca2016-08-17 17:05:46 +020060af_packet_eth_flag_change (vnet_main_t * vnm, vnet_hw_interface_t * hi,
61 u32 flags)
Damjan Marion83243a02016-02-29 13:09:30 +010062{
63 /* nothing for now */
64 return 0;
65}
66
Damjan Marion00a9dca2016-08-17 17:05:46 +020067static clib_error_t *
68af_packet_fd_read_ready (unix_file_t * uf)
Damjan Marion83243a02016-02-29 13:09:30 +010069{
Damjan Marion00a9dca2016-08-17 17:05:46 +020070 vlib_main_t *vm = vlib_get_main ();
71 af_packet_main_t *apm = &af_packet_main;
Damjan Marion83243a02016-02-29 13:09:30 +010072 u32 idx = uf->private_data;
73
Damjan Marion00a9dca2016-08-17 17:05:46 +020074 apm->pending_input_bitmap =
75 clib_bitmap_set (apm->pending_input_bitmap, idx, 1);
Damjan Marion83243a02016-02-29 13:09:30 +010076
77 /* Schedule the rx node */
78 vlib_node_set_interrupt_pending (vm, af_packet_input_node.index);
79
80 return 0;
81}
82
83static int
Damjan Marion00a9dca2016-08-17 17:05:46 +020084create_packet_v2_sock (u8 * name, tpacket_req_t * rx_req,
85 tpacket_req_t * tx_req, int *fd, u8 ** ring)
Damjan Marion83243a02016-02-29 13:09:30 +010086{
87 int ret, err;
88 struct sockaddr_ll sll;
89 uint host_if_index;
90 int ver = TPACKET_V2;
Damjan Marion00a9dca2016-08-17 17:05:46 +020091 socklen_t req_sz = sizeof (struct tpacket_req);
Damjan Marion83243a02016-02-29 13:09:30 +010092 u32 ring_sz = rx_req->tp_block_size * rx_req->tp_block_nr +
Damjan Marion00a9dca2016-08-17 17:05:46 +020093 tx_req->tp_block_size * tx_req->tp_block_nr;
Damjan Marion83243a02016-02-29 13:09:30 +010094
Damjan Marion00a9dca2016-08-17 17:05:46 +020095 host_if_index = if_nametoindex ((const char *) name);
Damjan Marion83243a02016-02-29 13:09:30 +010096
97 if (!host_if_index)
98 {
Damjan Marion00a9dca2016-08-17 17:05:46 +020099 DBG_SOCK ("Wrong host interface name");
Damjan Marion83243a02016-02-29 13:09:30 +0100100 ret = VNET_API_ERROR_INVALID_INTERFACE;
101 goto error;
102 }
103
Damjan Marion00a9dca2016-08-17 17:05:46 +0200104 if ((*fd = socket (AF_PACKET, SOCK_RAW, htons (ETH_P_ALL))) < 0)
Damjan Marion83243a02016-02-29 13:09:30 +0100105 {
Damjan Marion00a9dca2016-08-17 17:05:46 +0200106 DBG_SOCK ("Failed to create socket");
Damjan Marion83243a02016-02-29 13:09:30 +0100107 ret = VNET_API_ERROR_SYSCALL_ERROR_1;
108 goto error;
109 }
110
Damjan Marion00a9dca2016-08-17 17:05:46 +0200111 if ((err =
112 setsockopt (*fd, SOL_PACKET, PACKET_VERSION, &ver, sizeof (ver))) < 0)
Damjan Marion83243a02016-02-29 13:09:30 +0100113 {
Damjan Marion00a9dca2016-08-17 17:05:46 +0200114 DBG_SOCK ("Failed to set rx packet interface version");
Damjan Marion83243a02016-02-29 13:09:30 +0100115 ret = VNET_API_ERROR_SYSCALL_ERROR_1;
116 goto error;
117 }
118
119 int opt = 1;
Damjan Marion00a9dca2016-08-17 17:05:46 +0200120 if ((err =
121 setsockopt (*fd, SOL_PACKET, PACKET_LOSS, &opt, sizeof (opt))) < 0)
Damjan Marion83243a02016-02-29 13:09:30 +0100122 {
Damjan Marion00a9dca2016-08-17 17:05:46 +0200123 DBG_SOCK ("Failed to set packet tx ring error handling option");
Damjan Marion83243a02016-02-29 13:09:30 +0100124 ret = VNET_API_ERROR_SYSCALL_ERROR_1;
125 goto error;
126 }
127
Damjan Marion00a9dca2016-08-17 17:05:46 +0200128 if ((err =
129 setsockopt (*fd, SOL_PACKET, PACKET_RX_RING, rx_req, req_sz)) < 0)
Damjan Marion83243a02016-02-29 13:09:30 +0100130 {
Damjan Marion00a9dca2016-08-17 17:05:46 +0200131 DBG_SOCK ("Failed to set packet rx ring options");
Damjan Marion83243a02016-02-29 13:09:30 +0100132 ret = VNET_API_ERROR_SYSCALL_ERROR_1;
133 goto error;
134 }
135
Damjan Marion00a9dca2016-08-17 17:05:46 +0200136 if ((err =
137 setsockopt (*fd, SOL_PACKET, PACKET_TX_RING, tx_req, req_sz)) < 0)
Damjan Marion83243a02016-02-29 13:09:30 +0100138 {
Damjan Marion00a9dca2016-08-17 17:05:46 +0200139 DBG_SOCK ("Failed to set packet rx ring options");
Damjan Marion83243a02016-02-29 13:09:30 +0100140 ret = VNET_API_ERROR_SYSCALL_ERROR_1;
141 goto error;
142 }
143
Damjan Marion00a9dca2016-08-17 17:05:46 +0200144 *ring =
145 mmap (NULL, ring_sz, PROT_READ | PROT_WRITE, MAP_SHARED | MAP_LOCKED, *fd,
146 0);
Damjan Marion83243a02016-02-29 13:09:30 +0100147 if (*ring == MAP_FAILED)
148 {
Damjan Marion00a9dca2016-08-17 17:05:46 +0200149 DBG_SOCK ("mmap failure");
Damjan Marion83243a02016-02-29 13:09:30 +0100150 ret = VNET_API_ERROR_SYSCALL_ERROR_1;
151 goto error;
152 }
153
Damjan Marion00a9dca2016-08-17 17:05:46 +0200154 memset (&sll, 0, sizeof (sll));
Damjan Marion83243a02016-02-29 13:09:30 +0100155 sll.sll_family = PF_PACKET;
Damjan Marion00a9dca2016-08-17 17:05:46 +0200156 sll.sll_protocol = htons (ETH_P_ALL);
Damjan Marion83243a02016-02-29 13:09:30 +0100157 sll.sll_ifindex = host_if_index;
158
Damjan Marion00a9dca2016-08-17 17:05:46 +0200159 if ((err = bind (*fd, (struct sockaddr *) &sll, sizeof (sll))) < 0)
Damjan Marion83243a02016-02-29 13:09:30 +0100160 {
Damjan Marion00a9dca2016-08-17 17:05:46 +0200161 DBG_SOCK ("Failed to bind rx packet socket (error %d)", err);
Damjan Marion83243a02016-02-29 13:09:30 +0100162 ret = VNET_API_ERROR_SYSCALL_ERROR_1;
163 goto error;
164 }
165
166 return 0;
167error:
Dave Barach16ad6ae2016-07-28 17:55:30 -0400168 if (*fd >= 0)
Damjan Marion00a9dca2016-08-17 17:05:46 +0200169 close (*fd);
Peter Leidba76f22016-04-08 08:16:31 -0700170 *fd = -1;
Damjan Marion83243a02016-02-29 13:09:30 +0100171 return ret;
172}
173
174int
Damjan Marion00a9dca2016-08-17 17:05:46 +0200175af_packet_create_if (vlib_main_t * vm, u8 * host_if_name, u8 * hw_addr_set,
176 u32 * sw_if_index)
Damjan Marion83243a02016-02-29 13:09:30 +0100177{
Damjan Marion00a9dca2016-08-17 17:05:46 +0200178 af_packet_main_t *apm = &af_packet_main;
Damjan Marion83243a02016-02-29 13:09:30 +0100179 int ret, fd = -1;
Damjan Marion00a9dca2016-08-17 17:05:46 +0200180 struct tpacket_req *rx_req = 0;
181 struct tpacket_req *tx_req = 0;
182 u8 *ring = 0;
183 af_packet_if_t *apif = 0;
Damjan Marion83243a02016-02-29 13:09:30 +0100184 u8 hw_addr[6];
Damjan Marion00a9dca2016-08-17 17:05:46 +0200185 clib_error_t *error;
186 vnet_sw_interface_t *sw;
187 vnet_main_t *vnm = vnet_get_main ();
188 uword *p;
Damjan Marion83243a02016-02-29 13:09:30 +0100189 uword if_index;
Ivan Kellybfe737a2016-10-07 18:02:43 +0200190 u8 *host_if_name_dup = vec_dup (host_if_name);
Damjan Marion83243a02016-02-29 13:09:30 +0100191
192 p = mhash_get (&apm->if_index_by_host_if_name, host_if_name);
193 if (p)
194 {
195 return VNET_API_ERROR_SUBIF_ALREADY_EXISTS;
196 }
197
Damjan Marion00a9dca2016-08-17 17:05:46 +0200198 vec_validate (rx_req, 0);
Damjan Marion83243a02016-02-29 13:09:30 +0100199 rx_req->tp_block_size = AF_PACKET_RX_BLOCK_SIZE;
200 rx_req->tp_frame_size = AF_PACKET_RX_FRAME_SIZE;
201 rx_req->tp_block_nr = AF_PACKET_RX_BLOCK_NR;
202 rx_req->tp_frame_nr = AF_PACKET_RX_FRAME_NR;
203
Damjan Marion00a9dca2016-08-17 17:05:46 +0200204 vec_validate (tx_req, 0);
Damjan Marion83243a02016-02-29 13:09:30 +0100205 tx_req->tp_block_size = AF_PACKET_TX_BLOCK_SIZE;
206 tx_req->tp_frame_size = AF_PACKET_TX_FRAME_SIZE;
207 tx_req->tp_block_nr = AF_PACKET_TX_BLOCK_NR;
208 tx_req->tp_frame_nr = AF_PACKET_TX_FRAME_NR;
209
Damjan Marion00a9dca2016-08-17 17:05:46 +0200210 ret = create_packet_v2_sock (host_if_name, rx_req, tx_req, &fd, &ring);
Damjan Marion83243a02016-02-29 13:09:30 +0100211
212 if (ret != 0)
213 goto error;
214
215 /* So far everything looks good, let's create interface */
Damjan Marion048ee2e2016-03-16 22:59:21 +0100216 pool_get (apm->interfaces, apif);
Damjan Marion83243a02016-02-29 13:09:30 +0100217 if_index = apif - apm->interfaces;
218
219 apif->fd = fd;
220 apif->rx_ring = ring;
221 apif->tx_ring = ring + rx_req->tp_block_size * rx_req->tp_block_nr;
222 apif->rx_req = rx_req;
223 apif->tx_req = tx_req;
Ivan Kellybfe737a2016-10-07 18:02:43 +0200224 apif->host_if_name = host_if_name_dup;
Dave Barach13f3c452016-03-29 11:56:41 -0400225 apif->per_interface_next_index = ~0;
Peter Leidba76f22016-04-08 08:16:31 -0700226 apif->next_tx_frame = 0;
227 apif->next_rx_frame = 0;
Damjan Marion83243a02016-02-29 13:09:30 +0100228
229 {
Damjan Marion00a9dca2016-08-17 17:05:46 +0200230 unix_file_t template = { 0 };
Damjan Marion83243a02016-02-29 13:09:30 +0100231 template.read_function = af_packet_fd_read_ready;
232 template.file_descriptor = fd;
233 template.private_data = if_index;
234 template.flags = UNIX_FILE_EVENT_EDGE_TRIGGERED;
235 apif->unix_file_index = unix_file_add (&unix_main, &template);
236 }
237
238 /*use configured or generate random MAC address */
239 if (hw_addr_set)
Damjan Marion00a9dca2016-08-17 17:05:46 +0200240 clib_memcpy (hw_addr, hw_addr_set, 6);
Damjan Marion83243a02016-02-29 13:09:30 +0100241 else
242 {
Damjan Marion00a9dca2016-08-17 17:05:46 +0200243 f64 now = vlib_time_now (vm);
Damjan Marion83243a02016-02-29 13:09:30 +0100244 u32 rnd;
245 rnd = (u32) (now * 1e6);
246 rnd = random_u32 (&rnd);
247
Damjan Marion00a9dca2016-08-17 17:05:46 +0200248 clib_memcpy (hw_addr + 2, &rnd, sizeof (rnd));
Damjan Marion83243a02016-02-29 13:09:30 +0100249 hw_addr[0] = 2;
250 hw_addr[1] = 0xfe;
251 }
252
Damjan Marion00a9dca2016-08-17 17:05:46 +0200253 error = ethernet_register_interface (vnm, af_packet_device_class.index,
254 if_index, hw_addr, &apif->hw_if_index,
255 af_packet_eth_flag_change);
Damjan Marion83243a02016-02-29 13:09:30 +0100256
257 if (error)
258 {
Damjan Marion00a9dca2016-08-17 17:05:46 +0200259 memset (apif, 0, sizeof (*apif));
260 pool_put (apm->interfaces, apif);
Damjan Marion83243a02016-02-29 13:09:30 +0100261 clib_error_report (error);
262 ret = VNET_API_ERROR_SYSCALL_ERROR_1;
263 goto error;
264 }
265
266 sw = vnet_get_hw_sw_interface (vnm, apif->hw_if_index);
267 apif->sw_if_index = sw->sw_if_index;
268
269 vnet_hw_interface_set_flags (vnm, apif->hw_if_index,
270 VNET_HW_INTERFACE_FLAG_LINK_UP);
271
Ivan Kellybfe737a2016-10-07 18:02:43 +0200272 mhash_set_mem (&apm->if_index_by_host_if_name, host_if_name_dup, &if_index,
273 0);
Pierre Pfister78ea9c22016-05-23 12:51:54 +0100274 if (sw_if_index)
275 *sw_if_index = apif->sw_if_index;
Damjan Marion83243a02016-02-29 13:09:30 +0100276 return 0;
277
278error:
Ivan Kellybfe737a2016-10-07 18:02:43 +0200279 vec_free (host_if_name_dup);
Damjan Marion00a9dca2016-08-17 17:05:46 +0200280 vec_free (rx_req);
281 vec_free (tx_req);
Damjan Marion83243a02016-02-29 13:09:30 +0100282 return ret;
283}
284
Peter Leidba76f22016-04-08 08:16:31 -0700285int
Damjan Marion00a9dca2016-08-17 17:05:46 +0200286af_packet_delete_if (vlib_main_t * vm, u8 * host_if_name)
Peter Leidba76f22016-04-08 08:16:31 -0700287{
Damjan Marion00a9dca2016-08-17 17:05:46 +0200288 vnet_main_t *vnm = vnet_get_main ();
Peter Leidba76f22016-04-08 08:16:31 -0700289 af_packet_main_t *apm = &af_packet_main;
290 af_packet_if_t *apif;
291 uword *p;
292 uword if_index;
293 u32 ring_sz;
294
Damjan Marion00a9dca2016-08-17 17:05:46 +0200295 p = mhash_get (&apm->if_index_by_host_if_name, host_if_name);
296 if (p == NULL)
297 {
298 clib_warning ("Host interface %s does not exist", host_if_name);
299 return VNET_API_ERROR_SYSCALL_ERROR_1;
300 }
301 apif = pool_elt_at_index (apm->interfaces, p[0]);
Peter Leidba76f22016-04-08 08:16:31 -0700302 if_index = apif - apm->interfaces;
303
304 /* bring down the interface */
Damjan Marion00a9dca2016-08-17 17:05:46 +0200305 vnet_hw_interface_set_flags (vnm, apif->hw_if_index, 0);
Peter Leidba76f22016-04-08 08:16:31 -0700306
307 /* clean up */
Damjan Marion00a9dca2016-08-17 17:05:46 +0200308 if (apif->unix_file_index != ~0)
309 {
310 unix_file_del (&unix_main, unix_main.file_pool + apif->unix_file_index);
311 apif->unix_file_index = ~0;
312 }
Eyal Barif298ecf2016-09-19 18:47:39 +0300313 else
314 close (apif->fd);
315
Peter Leidba76f22016-04-08 08:16:31 -0700316 ring_sz = apif->rx_req->tp_block_size * apif->rx_req->tp_block_nr +
Damjan Marion00a9dca2016-08-17 17:05:46 +0200317 apif->tx_req->tp_block_size * apif->tx_req->tp_block_nr;
318 if (munmap (apif->rx_ring, ring_sz))
319 clib_warning ("Host interface %s could not free rx/tx ring",
320 host_if_name);
Peter Leidba76f22016-04-08 08:16:31 -0700321 apif->rx_ring = NULL;
322 apif->tx_ring = NULL;
Peter Leidba76f22016-04-08 08:16:31 -0700323 apif->fd = -1;
324
Damjan Marion00a9dca2016-08-17 17:05:46 +0200325 vec_free (apif->rx_req);
Peter Leidba76f22016-04-08 08:16:31 -0700326 apif->rx_req = NULL;
Damjan Marion00a9dca2016-08-17 17:05:46 +0200327 vec_free (apif->tx_req);
Peter Leidba76f22016-04-08 08:16:31 -0700328 apif->tx_req = NULL;
329
Damjan Marion00a9dca2016-08-17 17:05:46 +0200330 vec_free (apif->host_if_name);
Peter Leidba76f22016-04-08 08:16:31 -0700331 apif->host_if_name = NULL;
332
Damjan Marion00a9dca2016-08-17 17:05:46 +0200333 mhash_unset (&apm->if_index_by_host_if_name, host_if_name, &if_index);
Peter Leidba76f22016-04-08 08:16:31 -0700334
Damjan Marion00a9dca2016-08-17 17:05:46 +0200335 ethernet_delete_interface (vnm, apif->hw_if_index);
Peter Leidba76f22016-04-08 08:16:31 -0700336
Damjan Marion00a9dca2016-08-17 17:05:46 +0200337 pool_put (apm->interfaces, apif);
Peter Leidba76f22016-04-08 08:16:31 -0700338
339 return 0;
340}
341
Damjan Marion83243a02016-02-29 13:09:30 +0100342static clib_error_t *
343af_packet_init (vlib_main_t * vm)
344{
Damjan Marion00a9dca2016-08-17 17:05:46 +0200345 af_packet_main_t *apm = &af_packet_main;
Damjan Marion553f6bd2016-09-07 11:54:22 +0200346 vlib_thread_main_t *tm = vlib_get_thread_main ();
Damjan Marion83243a02016-02-29 13:09:30 +0100347
348 memset (apm, 0, sizeof (af_packet_main_t));
349
350 mhash_init_vec_string (&apm->if_index_by_host_if_name, sizeof (uword));
351
Damjan Marion553f6bd2016-09-07 11:54:22 +0200352 vec_validate_aligned (apm->rx_buffers, tm->n_vlib_mains - 1,
353 CLIB_CACHE_LINE_BYTES);
354
Damjan Marion83243a02016-02-29 13:09:30 +0100355 return 0;
356}
357
358VLIB_INIT_FUNCTION (af_packet_init);
Damjan Marion00a9dca2016-08-17 17:05:46 +0200359
360/*
361 * fd.io coding-style-patch-verification: ON
362 *
363 * Local Variables:
364 * eval: (c-set-style "gnu")
365 * End:
366 */