blob: db3ea332fbd6c25a17f0e175f2a3aef304d7a4d8 [file] [log] [blame]
Alexander Popovsky (apopovsk)4a7e58b2016-10-05 22:31:23 -07001/*
2 * Copyright (c) 2016 Cisco and/or its affiliates.
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at:
6 *
7 * http://www.apache.org/licenses/LICENSE-2.0
8 *
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
14 */
15
16/**
17 * @file
18 * @brief Local TCP/IP stack punt infrastructure.
19 *
Ole Troanf7a55ad2017-05-16 14:59:29 +020020 * Provides a set of VPP nodes together with the relevant APIs and CLI
Alexander Popovsky (apopovsk)4a7e58b2016-10-05 22:31:23 -070021 * commands in order to adjust and dispatch packets from the VPP data plane
22 * to the local TCP/IP stack
23 */
Ole Troanf7a55ad2017-05-16 14:59:29 +020024
25#include <vnet/ip/ip.h>
Alexander Popovsky (apopovsk)4a7e58b2016-10-05 22:31:23 -070026#include <vlib/vlib.h>
27#include <vnet/pg/pg.h>
Dave Barach68b0fb02017-02-28 15:15:56 -050028#include <vnet/udp/udp.h>
Pierre Pfister7fe51f32017-09-20 08:48:36 +020029#include <vnet/tcp/tcp.h>
Alexander Popovsky (apopovsk)4a7e58b2016-10-05 22:31:23 -070030#include <vnet/ip/punt.h>
Ole Troanf7a55ad2017-05-16 14:59:29 +020031#include <vppinfra/sparse_vec.h>
32#include <vlib/unix/unix.h>
Alexander Popovsky (apopovsk)4a7e58b2016-10-05 22:31:23 -070033
Ole Troanf7a55ad2017-05-16 14:59:29 +020034#include <stdio.h>
35#include <unistd.h>
36#include <sys/socket.h>
37#include <sys/un.h>
Marco Varlese22349832017-09-08 10:40:34 +020038#include <sys/uio.h>
Ole Troanf7a55ad2017-05-16 14:59:29 +020039#include <stdlib.h>
40#include <stdbool.h>
41
/* Next-node table of the UDP punt nodes, as (symbol, graph node name). */
#define foreach_punt_next                       \
  _ (PUNT, "error-punt")

/* Next indices expanded from foreach_punt_next; PUNT_N_NEXT is their count. */
typedef enum
{
#define _(sym, node_name) PUNT_NEXT_##sym,
  foreach_punt_next
#undef _
    PUNT_N_NEXT,
} punt_next_t;
52
/* Next indices used by the "punt-socket-rx" node registration. */
enum punt_socket_rx_next_e
{
  PUNT_SOCKET_RX_NEXT_INTERFACE_OUTPUT, /* "interface-output" */
  PUNT_SOCKET_RX_NEXT_IP4_LOOKUP,       /* "ip4-lookup" */
  PUNT_SOCKET_RX_NEXT_IP6_LOOKUP,       /* "ip6-lookup" */
  PUNT_SOCKET_RX_N_NEXT                 /* number of next nodes */
};
60
Alexander Popovsky (apopovsk)4a7e58b2016-10-05 22:31:23 -070061vlib_node_registration_t udp4_punt_node;
62vlib_node_registration_t udp6_punt_node;
Ole Troanf7a55ad2017-05-16 14:59:29 +020063vlib_node_registration_t udp4_punt_socket_node;
64vlib_node_registration_t udp6_punt_socket_node;
65static vlib_node_registration_t punt_socket_rx_node;
66
67punt_main_t punt_main;
68
69char *
70vnet_punt_get_server_pathname (void)
71{
72 punt_main_t *pm = &punt_main;
73 return pm->sun_path;
74}
Alexander Popovsky (apopovsk)4a7e58b2016-10-05 22:31:23 -070075
76/** @brief IPv4/IPv6 UDP punt node main loop.
77
78 This is the main loop inline function for IPv4/IPv6 UDP punt
79 transition node.
80
81 @param vm vlib_main_t corresponding to the current thread
82 @param node vlib_node_runtime_t
83 @param frame vlib_frame_t whose contents should be dispatched
84 @param is_ipv4 indicates if called for IPv4 or IPv6 node
85*/
86always_inline uword
87udp46_punt_inline (vlib_main_t * vm,
88 vlib_node_runtime_t * node,
89 vlib_frame_t * from_frame, int is_ip4)
90{
91 u32 n_left_from, *from, *to_next;
92 word advance;
93
94 from = vlib_frame_vector_args (from_frame);
95 n_left_from = from_frame->n_vectors;
96
97 /* udp[46]_lookup hands us the data payload, not the IP header */
98 if (is_ip4)
99 advance = -(sizeof (ip4_header_t) + sizeof (udp_header_t));
100 else
101 advance = -(sizeof (ip6_header_t) + sizeof (udp_header_t));
102
103 while (n_left_from > 0)
104 {
105 u32 n_left_to_next;
106
107 vlib_get_next_frame (vm, node, PUNT_NEXT_PUNT, to_next, n_left_to_next);
108
109 while (n_left_from > 0 && n_left_to_next > 0)
110 {
111 u32 bi0;
112 vlib_buffer_t *b0;
113
114 bi0 = from[0];
115 to_next[0] = bi0;
116 from += 1;
117 to_next += 1;
118 n_left_from -= 1;
119 n_left_to_next -= 1;
120
121 b0 = vlib_get_buffer (vm, bi0);
122 vlib_buffer_advance (b0, advance);
123 b0->error = node->errors[PUNT_ERROR_UDP_PORT];
124 }
125
126 vlib_put_next_frame (vm, node, PUNT_NEXT_PUNT, n_left_to_next);
127 }
128
129 return from_frame->n_vectors;
130}
131
132static char *punt_error_strings[] = {
133#define punt_error(n,s) s,
134#include "punt_error.def"
135#undef punt_error
136};
137
138/** @brief IPv4 UDP punt node.
139 @node ip4-udp-punt
140
141 This is the IPv4 UDP punt transition node. It is registered as a next
142 node for the "ip4-udp-lookup" handling UDP port(s) requested for punt.
143 The buffer's current data pointer is adjusted to the original packet
144 IPv4 header. All buffers are dispatched to "error-punt".
145
146 @param vm vlib_main_t corresponding to the current thread
147 @param node vlib_node_runtime_t
148 @param frame vlib_frame_t whose contents should be dispatched
149
150 @par Graph mechanics: next index usage
151
152 @em Sets:
153 - <code>vnet_buffer(b)->current_data</code>
154 - <code>vnet_buffer(b)->current_len</code>
155
156 <em>Next Index:</em>
157 - Dispatches the packet to the "error-punt" node
158*/
159static uword
160udp4_punt (vlib_main_t * vm,
161 vlib_node_runtime_t * node, vlib_frame_t * from_frame)
162{
163 return udp46_punt_inline (vm, node, from_frame, 1 /* is_ip4 */ );
164}
165
166/** @brief IPv6 UDP punt node.
167 @node ip6-udp-punt
168
169 This is the IPv6 UDP punt transition node. It is registered as a next
170 node for the "ip6-udp-lookup" handling UDP port(s) requested for punt.
171 The buffer's current data pointer is adjusted to the original packet
172 IPv6 header. All buffers are dispatched to "error-punt".
173
174 @param vm vlib_main_t corresponding to the current thread
175 @param node vlib_node_runtime_t
176 @param frame vlib_frame_t whose contents should be dispatched
177
178 @par Graph mechanics: next index usage
179
180 @em Sets:
181 - <code>vnet_buffer(b)->current_data</code>
182 - <code>vnet_buffer(b)->current_len</code>
183
184 <em>Next Index:</em>
185 - Dispatches the packet to the "error-punt" node
186*/
187static uword
188udp6_punt (vlib_main_t * vm,
189 vlib_node_runtime_t * node, vlib_frame_t * from_frame)
190{
191 return udp46_punt_inline (vm, node, from_frame, 0 /* is_ip4 */ );
192}
193
194/* *INDENT-OFF* */
195VLIB_REGISTER_NODE (udp4_punt_node) = {
196 .function = udp4_punt,
197 .name = "ip4-udp-punt",
198 /* Takes a vector of packets. */
199 .vector_size = sizeof (u32),
200
201 .n_errors = PUNT_N_ERROR,
202 .error_strings = punt_error_strings,
203
204 .n_next_nodes = PUNT_N_NEXT,
205 .next_nodes = {
206#define _(s,n) [PUNT_NEXT_##s] = n,
207 foreach_punt_next
208#undef _
209 },
210};
211
Dave Barachd7cb1b52016-12-09 09:52:16 -0500212VLIB_NODE_FUNCTION_MULTIARCH (udp4_punt_node, udp4_punt);
Alexander Popovsky (apopovsk)4a7e58b2016-10-05 22:31:23 -0700213
214VLIB_REGISTER_NODE (udp6_punt_node) = {
215 .function = udp6_punt,
216 .name = "ip6-udp-punt",
217 /* Takes a vector of packets. */
218 .vector_size = sizeof (u32),
219
220 .n_errors = PUNT_N_ERROR,
221 .error_strings = punt_error_strings,
222
223 .n_next_nodes = PUNT_N_NEXT,
224 .next_nodes = {
225#define _(s,n) [PUNT_NEXT_##s] = n,
226 foreach_punt_next
227#undef _
228 },
229};
Alexander Popovsky (apopovsk)4a7e58b2016-10-05 22:31:23 -0700230
Dave Barachd7cb1b52016-12-09 09:52:16 -0500231VLIB_NODE_FUNCTION_MULTIARCH (udp6_punt_node, udp6_punt);;
232
Ole Troanf7a55ad2017-05-16 14:59:29 +0200233/* *INDENT-ON* */
234
Klement Sekera3c37ad52017-11-03 10:25:23 +0100235static punt_client_t *
236punt_client_get (bool is_ip4, u16 port)
Ole Troanf7a55ad2017-05-16 14:59:29 +0200237{
238 punt_main_t *pm = &punt_main;
Klement Sekera3c37ad52017-11-03 10:25:23 +0100239 punt_client_t *v =
240 is_ip4 ? pm->clients_by_dst_port4 : pm->clients_by_dst_port6;
Ole Troanf7a55ad2017-05-16 14:59:29 +0200241
242 u16 i = sparse_vec_index (v, port);
243 if (i == SPARSE_VEC_INVALID_INDEX)
244 return 0;
245
Klement Sekera3c37ad52017-11-03 10:25:23 +0100246 return &vec_elt (v, i);
247}
248
249static struct sockaddr_un *
250punt_socket_get (bool is_ip4, u16 port)
251{
252 punt_client_t *v = punt_client_get (is_ip4, port);
253 if (v)
254 return &v->caddr;
255
256 return NULL;
Ole Troanf7a55ad2017-05-16 14:59:29 +0200257}
258
259static void
260punt_socket_register (bool is_ip4, u8 protocol, u16 port,
261 char *client_pathname)
262{
263 punt_main_t *pm = &punt_main;
264 punt_client_t c, *n;
265 punt_client_t *v = is_ip4 ? pm->clients_by_dst_port4 :
266 pm->clients_by_dst_port6;
267
268 memset (&c, 0, sizeof (c));
269 memcpy (c.caddr.sun_path, client_pathname, sizeof (c.caddr.sun_path));
270 c.caddr.sun_family = AF_UNIX;
271 c.port = port;
272 n = sparse_vec_validate (v, port);
273 n[0] = c;
274}
275
276/* $$$$ Just leaves the mapping in place for now */
277static void
278punt_socket_unregister (bool is_ip4, u8 protocol, u16 port)
279{
280 return;
281}
282
Klement Sekera3c37ad52017-11-03 10:25:23 +0100283typedef struct
284{
285 punt_client_t client;
286 u8 is_midchain;
287} udp_punt_trace_t;
288
289u8 *
290format_udp_punt_trace (u8 * s, va_list * args)
291{
292 CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *);
293 CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *);
294 udp_punt_trace_t *t = va_arg (*args, udp_punt_trace_t *);
295 u32 indent = format_get_indent (s);
296 s = format (s, "to: %s", t->client.caddr.sun_path);
297 if (t->is_midchain)
298 {
299 s = format (s, "\n%U(buffer is part of chain)", format_white_space,
300 indent);
301 }
302 return s;
303}
304
Ole Troanf7a55ad2017-05-16 14:59:29 +0200305always_inline uword
306udp46_punt_socket_inline (vlib_main_t * vm,
307 vlib_node_runtime_t * node,
308 vlib_frame_t * frame, bool is_ip4)
309{
310 u32 *buffers = vlib_frame_args (frame);
311 uword n_packets = frame->n_vectors;
312 struct iovec *iovecs = 0;
313 punt_main_t *pm = &punt_main;
314 int i;
315
316 u32 node_index = is_ip4 ? udp4_punt_socket_node.index :
317 udp6_punt_socket_node.index;
318
319 for (i = 0; i < n_packets; i++)
320 {
321 struct iovec *iov;
322 vlib_buffer_t *b;
323 uword l;
324 punt_packetdesc_t packetdesc;
325
326 b = vlib_get_buffer (vm, buffers[i]);
327
328 /* Reverse UDP Punt advance */
329 udp_header_t *udp;
330 if (is_ip4)
331 {
332 vlib_buffer_advance (b, -(sizeof (ip4_header_t) +
333 sizeof (udp_header_t)));
334 ip4_header_t *ip = vlib_buffer_get_current (b);
335 udp = (udp_header_t *) (ip + 1);
336 }
337 else
338 {
339 vlib_buffer_advance (b, -(sizeof (ip6_header_t) +
340 sizeof (udp_header_t)));
341 ip6_header_t *ip = vlib_buffer_get_current (b);
342 udp = (udp_header_t *) (ip + 1);
343 }
344
345 u16 port = clib_net_to_host_u16 (udp->dst_port);
346
347 /*
348 * Find registerered client
349 * If no registered client, drop packet and count
350 */
351 struct sockaddr_un *caddr;
352 caddr = punt_socket_get (is_ip4, port);
353 if (!caddr)
354 {
355 vlib_node_increment_counter (vm, node_index,
356 PUNT_ERROR_SOCKET_TX_ERROR, 1);
357 goto error;
358 }
359
Klement Sekera3c37ad52017-11-03 10:25:23 +0100360 punt_client_t *c = NULL;
361 if (PREDICT_FALSE (b->flags & VLIB_BUFFER_IS_TRACED))
362 {
Klement Sekerab7163082017-11-08 04:13:49 +0100363 c = punt_client_get (is_ip4, port);
Klement Sekera3c37ad52017-11-03 10:25:23 +0100364 udp_punt_trace_t *t;
365 t = vlib_add_trace (vm, node, b, sizeof (t[0]));
366 clib_memcpy (&t->client, c, sizeof (t->client));
367 }
368
Ole Troanf7a55ad2017-05-16 14:59:29 +0200369 /* Re-set iovecs if present. */
370 if (iovecs)
371 _vec_len (iovecs) = 0;
372
373 /* Add packet descriptor */
374 packetdesc.sw_if_index = vnet_buffer (b)->sw_if_index[VLIB_RX];
375 packetdesc.action = 0;
376 vec_add2 (iovecs, iov, 1);
377 iov->iov_base = &packetdesc;
378 iov->iov_len = sizeof (packetdesc);
379
380 /** VLIB buffer chain -> Unix iovec(s). */
381 vlib_buffer_advance (b, -(sizeof (ethernet_header_t)));
382 vec_add2 (iovecs, iov, 1);
383 iov->iov_base = b->data + b->current_data;
384 iov->iov_len = l = b->current_length;
385
386 if (PREDICT_FALSE (b->flags & VLIB_BUFFER_NEXT_PRESENT))
387 {
388 do
389 {
390 b = vlib_get_buffer (vm, b->next_buffer);
Klement Sekera3c37ad52017-11-03 10:25:23 +0100391 if (PREDICT_FALSE (b->flags & VLIB_BUFFER_IS_TRACED))
392 {
Klement Sekerab7163082017-11-08 04:13:49 +0100393 if (PREDICT_FALSE (!c))
394 {
395 c = punt_client_get (is_ip4, port);
396 }
Klement Sekera3c37ad52017-11-03 10:25:23 +0100397 udp_punt_trace_t *t;
398 t = vlib_add_trace (vm, node, b, sizeof (t[0]));
399 clib_memcpy (&t->client, c, sizeof (t->client));
400 t->is_midchain = 1;
401 }
Ole Troanf7a55ad2017-05-16 14:59:29 +0200402
403 vec_add2 (iovecs, iov, 1);
404
405 iov->iov_base = b->data + b->current_data;
406 iov->iov_len = b->current_length;
407 l += b->current_length;
408 }
409 while (b->flags & VLIB_BUFFER_NEXT_PRESENT);
410 }
411
412 struct msghdr msg = {
413 .msg_name = caddr,
414 .msg_namelen = sizeof (*caddr),
415 .msg_iov = iovecs,
416 .msg_iovlen = vec_len (iovecs),
417 };
418
Klement Sekera6bd0bc32017-11-08 12:18:21 +0100419 if (sendmsg (pm->socket_fd, &msg, 0) < (ssize_t) l)
Ole Troanf7a55ad2017-05-16 14:59:29 +0200420 vlib_node_increment_counter (vm, node_index,
421 PUNT_ERROR_SOCKET_TX_ERROR, 1);
422 }
423
424error:
Klement Sekera0dc11a12017-11-03 06:39:28 +0100425 vlib_buffer_free (vm, buffers, n_packets);
Ole Troanf7a55ad2017-05-16 14:59:29 +0200426
427 return n_packets;
428}
429
430static uword
431udp4_punt_socket (vlib_main_t * vm,
432 vlib_node_runtime_t * node, vlib_frame_t * from_frame)
433{
434 return udp46_punt_socket_inline (vm, node, from_frame, true /* is_ip4 */ );
435}
436
437static uword
438udp6_punt_socket (vlib_main_t * vm,
439 vlib_node_runtime_t * node, vlib_frame_t * from_frame)
440{
441 return udp46_punt_socket_inline (vm, node, from_frame, false /* is_ip4 */ );
442}
443
444
445/* *INDENT-OFF* */
446VLIB_REGISTER_NODE (udp4_punt_socket_node) = {
447 .function = udp4_punt_socket,
448 .name = "ip4-udp-punt-socket",
Klement Sekera3c37ad52017-11-03 10:25:23 +0100449 .format_trace = format_udp_punt_trace,
Ole Troanf7a55ad2017-05-16 14:59:29 +0200450 .flags = VLIB_NODE_FLAG_IS_DROP,
451 /* Takes a vector of packets. */
452 .vector_size = sizeof (u32),
453 .n_errors = PUNT_N_ERROR,
454 .error_strings = punt_error_strings,
455};
456VLIB_REGISTER_NODE (udp6_punt_socket_node) = {
457 .function = udp6_punt_socket,
458 .name = "ip6-udp-punt-socket",
Klement Sekera3c37ad52017-11-03 10:25:23 +0100459 .format_trace = format_udp_punt_trace,
Ole Troanf7a55ad2017-05-16 14:59:29 +0200460 .flags = VLIB_NODE_FLAG_IS_DROP,
461 .vector_size = sizeof (u32),
462 .n_errors = PUNT_N_ERROR,
463 .error_strings = punt_error_strings,
464};
465/* *INDENT-ON* */
466
467typedef struct
468{
469 enum punt_action_e action;
470 u32 sw_if_index;
471} punt_trace_t;
472
473static u8 *
474format_punt_trace (u8 * s, va_list * va)
475{
476 CLIB_UNUSED (vlib_main_t * vm) = va_arg (*va, vlib_main_t *);
477 CLIB_UNUSED (vlib_node_t * node) = va_arg (*va, vlib_node_t *);
478 vnet_main_t *vnm = vnet_get_main ();
479 punt_trace_t *t = va_arg (*va, punt_trace_t *);
480 s = format (s, "%U Action: %d", format_vnet_sw_if_index_name,
481 vnm, t->sw_if_index, t->action);
482 return s;
483}
484
485static uword
486punt_socket_rx_fd (vlib_main_t * vm, vlib_node_runtime_t * node, u32 fd)
487{
488 const uword buffer_size = VLIB_BUFFER_DATA_SIZE;
489 u32 n_trace = vlib_get_trace_count (vm, node);
490 u32 next = node->cached_next_index;
491 u32 n_left_to_next, next_index;
492 u32 *to_next;
493 u32 error = PUNT_ERROR_NONE;
494 vlib_get_next_frame (vm, node, next, to_next, n_left_to_next);
495
496 /* $$$$ Only dealing with one buffer at the time for now */
497
498 u32 bi;
499 vlib_buffer_t *b;
500 punt_packetdesc_t packetdesc;
501 ssize_t size;
502 struct iovec io[2];
503
504 if (vlib_buffer_alloc (vm, &bi, 1) != 1)
505 {
506 error = PUNT_ERROR_NOBUFFER;
507 goto error;
508 }
509
510 b = vlib_get_buffer (vm, bi);
511 io[0].iov_base = &packetdesc;
512 io[0].iov_len = sizeof (packetdesc);
513 io[1].iov_base = b->data;
514 io[1].iov_len = buffer_size;
515
516 size = readv (fd, io, 2);
517 /* We need at least the packet descriptor plus a header */
518 if (size <= (int) (sizeof (packetdesc) + sizeof (ip4_header_t)))
519 {
520 vlib_buffer_free (vm, &bi, 1);
521 error = PUNT_ERROR_READV;
522 goto error;
523 }
524
525 b->flags = VNET_BUFFER_F_LOCALLY_ORIGINATED;
526 b->current_length = size - sizeof (packetdesc);
527
528 VLIB_BUFFER_TRACE_TRAJECTORY_INIT (b);
529
530 switch (packetdesc.action)
531 {
532 case PUNT_L2:
533 vnet_buffer (b)->sw_if_index[VLIB_TX] = packetdesc.sw_if_index;
534 next_index = PUNT_SOCKET_RX_NEXT_INTERFACE_OUTPUT;
535 break;
536
537 case PUNT_IP4_ROUTED:
538 vnet_buffer (b)->sw_if_index[VLIB_RX] = packetdesc.sw_if_index;
539 vnet_buffer (b)->sw_if_index[VLIB_TX] = ~0;
540 next_index = PUNT_SOCKET_RX_NEXT_IP4_LOOKUP;
541 break;
542
543 case PUNT_IP6_ROUTED:
544 vnet_buffer (b)->sw_if_index[VLIB_RX] = packetdesc.sw_if_index;
545 vnet_buffer (b)->sw_if_index[VLIB_TX] = ~0;
546 next_index = PUNT_SOCKET_RX_NEXT_IP6_LOOKUP;
547 break;
548
549 default:
550 error = PUNT_ERROR_ACTION;
551 vlib_buffer_free (vm, &bi, 1);
552 goto error;
553 }
554
555 if (PREDICT_FALSE (n_trace > 0))
556 {
557 punt_trace_t *t;
558 vlib_trace_buffer (vm, node, next_index, b, 1 /* follow_chain */ );
559 vlib_set_trace_count (vm, node, --n_trace);
560 t = vlib_add_trace (vm, node, b, sizeof (*t));
561 t->sw_if_index = packetdesc.sw_if_index;
562 t->action = packetdesc.action;
563 }
564
565 to_next[0] = bi;
566 to_next++;
567 n_left_to_next--;
568
569 vlib_validate_buffer_enqueue_x1 (vm, node, next, to_next, n_left_to_next,
570 bi, next_index);
571 vlib_put_next_frame (vm, node, next, n_left_to_next);
572 return 1;
573
574error:
575 vlib_node_increment_counter (vm, punt_socket_rx_node.index, error, 1);
576 return 0;
577}
578
579static uword
580punt_socket_rx (vlib_main_t * vm,
581 vlib_node_runtime_t * node, vlib_frame_t * frame)
582{
583 punt_main_t *pm = &punt_main;
584 u32 total_count = 0;
585 int i;
586
587 for (i = 0; i < vec_len (pm->ready_fds); i++)
588 {
589 total_count += punt_socket_rx_fd (vm, node, pm->ready_fds[i]);
590 vec_del1 (pm->ready_fds, i);
591 }
592 return total_count;
593}
594
595VLIB_REGISTER_NODE (punt_socket_rx_node, static) =
596{
597 .function = punt_socket_rx,.name = "punt-socket-rx",.type =
598 VLIB_NODE_TYPE_INPUT,.state = VLIB_NODE_STATE_INTERRUPT,.vector_size =
599 1,.n_errors = PUNT_N_ERROR,.error_strings =
600 punt_error_strings,.n_next_nodes = PUNT_SOCKET_RX_N_NEXT,.next_nodes =
601 {
602[PUNT_SOCKET_RX_NEXT_INTERFACE_OUTPUT] = "interface-output",
603 [PUNT_SOCKET_RX_NEXT_IP4_LOOKUP] = "ip4-lookup",
604 [PUNT_SOCKET_RX_NEXT_IP6_LOOKUP] = "ip6-lookup",},.format_trace =
605 format_punt_trace,};
606
607static clib_error_t *
Damjan Marion56dd5432017-09-08 19:52:02 +0200608punt_socket_read_ready (clib_file_t * uf)
Ole Troanf7a55ad2017-05-16 14:59:29 +0200609{
610 vlib_main_t *vm = vlib_get_main ();
611 punt_main_t *pm = &punt_main;
612
613 /** Schedule the rx node */
614 vlib_node_set_interrupt_pending (vm, punt_socket_rx_node.index);
615 vec_add1 (pm->ready_fds, uf->file_descriptor);
616
617 return 0;
618}
619
620clib_error_t *
621vnet_punt_socket_add (vlib_main_t * vm, u32 header_version,
622 bool is_ip4, u8 protocol, u16 port,
623 char *client_pathname)
624{
625 punt_main_t *pm = &punt_main;
626
627 if (!pm->is_configured)
628 return clib_error_return (0, "socket is not configured");
629
630 if (header_version != PUNT_PACKETDESC_VERSION)
631 return clib_error_return (0, "Invalid packet descriptor version");
632
633 /* For now we only support UDP punt */
634 if (protocol != IP_PROTOCOL_UDP)
635 return clib_error_return (0,
636 "only UDP protocol (%d) is supported, got %d",
637 IP_PROTOCOL_UDP, protocol);
638
639 if (port == (u16) ~ 0)
640 return clib_error_return (0, "UDP port number required");
641
642 /* Register client */
643 punt_socket_register (is_ip4, protocol, port, client_pathname);
644
645 u32 node_index = is_ip4 ? udp4_punt_socket_node.index :
646 udp6_punt_socket_node.index;
647
648 udp_register_dst_port (vm, port, node_index, is_ip4);
649
650 return 0;
651}
652
653clib_error_t *
654vnet_punt_socket_del (vlib_main_t * vm, bool is_ip4, u8 l4_protocol, u16 port)
655{
656 punt_main_t *pm = &punt_main;
657
658 if (!pm->is_configured)
659 return clib_error_return (0, "socket is not configured");
660
661 punt_socket_unregister (is_ip4, l4_protocol, port);
662 udp_unregister_dst_port (vm, port, is_ip4);
663
664 return 0;
665}
666
Alexander Popovsky (apopovsk)4a7e58b2016-10-05 22:31:23 -0700667/**
668 * @brief Request IP traffic punt to the local TCP/IP stack.
669 *
670 * @em Note
Pierre Pfister7fe51f32017-09-20 08:48:36 +0200671 * - UDP and TCP are the only protocols supported in the current implementation
Alexander Popovsky (apopovsk)4a7e58b2016-10-05 22:31:23 -0700672 *
673 * @param vm vlib_main_t corresponding to the current thread
674 * @param ipv IP protcol version.
675 * 4 - IPv4, 6 - IPv6, ~0 for both IPv6 and IPv4
676 * @param protocol 8-bits L4 protocol value
Pierre Pfister7fe51f32017-09-20 08:48:36 +0200677 * UDP is 17
678 * TCP is 1
679 * @param port 16-bits L4 (TCP/IP) port number when applicable (UDP only)
Alexander Popovsky (apopovsk)4a7e58b2016-10-05 22:31:23 -0700680 *
681 * @returns 0 on success, non-zero value otherwise
682 */
683clib_error_t *
684vnet_punt_add_del (vlib_main_t * vm, u8 ipv, u8 protocol, u16 port,
Ole Troanf7a55ad2017-05-16 14:59:29 +0200685 bool is_add)
Alexander Popovsky (apopovsk)4a7e58b2016-10-05 22:31:23 -0700686{
Pierre Pfister7fe51f32017-09-20 08:48:36 +0200687
Alexander Popovsky (apopovsk)740bcdb2016-11-15 15:36:23 -0800688 /* For now we only support UDP punt */
Pierre Pfister7fe51f32017-09-20 08:48:36 +0200689 if (protocol != IP_PROTOCOL_UDP && protocol != IP_PROTOCOL_TCP)
Alexander Popovsky (apopovsk)740bcdb2016-11-15 15:36:23 -0800690 return clib_error_return (0,
Pierre Pfister7fe51f32017-09-20 08:48:36 +0200691 "only UDP (%d) and TCP (%d) protocols are supported, got %d",
692 IP_PROTOCOL_UDP, IP_PROTOCOL_TCP, protocol);
Alexander Popovsky (apopovsk)4a7e58b2016-10-05 22:31:23 -0700693
Alexander Popovsky (apopovsk)740bcdb2016-11-15 15:36:23 -0800694 if (ipv != (u8) ~ 0 && ipv != 4 && ipv != 6)
695 return clib_error_return (0, "IP version must be 4 or 6, got %d", ipv);
Alexander Popovsky (apopovsk)4a7e58b2016-10-05 22:31:23 -0700696
Alexander Popovsky (apopovsk)740bcdb2016-11-15 15:36:23 -0800697 if (port == (u16) ~ 0)
Alexander Popovsky (apopovsk)4a7e58b2016-10-05 22:31:23 -0700698 {
Pierre Pfister7fe51f32017-09-20 08:48:36 +0200699 if ((ipv == 4) || (ipv == (u8) ~ 0))
700 {
701 if (protocol == IP_PROTOCOL_UDP)
702 udp_punt_unknown (vm, 1, is_add);
703 else if (protocol == IP_PROTOCOL_TCP)
704 tcp_punt_unknown (vm, 1, is_add);
705 }
Alexander Popovsky (apopovsk)740bcdb2016-11-15 15:36:23 -0800706
Pierre Pfister7fe51f32017-09-20 08:48:36 +0200707 if ((ipv == 6) || (ipv == (u8) ~ 0))
708 {
709 if (protocol == IP_PROTOCOL_UDP)
710 udp_punt_unknown (vm, 0, is_add);
711 else if (protocol == IP_PROTOCOL_TCP)
712 tcp_punt_unknown (vm, 0, is_add);
713 }
Alexander Popovsky (apopovsk)740bcdb2016-11-15 15:36:23 -0800714
715 return 0;
716 }
717
718 else if (is_add)
719 {
Pierre Pfister7fe51f32017-09-20 08:48:36 +0200720 if (protocol == IP_PROTOCOL_TCP)
721 return clib_error_return (0, "punt TCP ports is not supported yet");
722
Alexander Popovsky (apopovsk)740bcdb2016-11-15 15:36:23 -0800723 if (ipv == 4 || ipv == (u8) ~ 0)
Alexander Popovsky (apopovsk)4a7e58b2016-10-05 22:31:23 -0700724 udp_register_dst_port (vm, port, udp4_punt_node.index, 1);
Alexander Popovsky (apopovsk)740bcdb2016-11-15 15:36:23 -0800725
726 if (ipv == 6 || ipv == (u8) ~ 0)
Alexander Popovsky (apopovsk)4a7e58b2016-10-05 22:31:23 -0700727 udp_register_dst_port (vm, port, udp6_punt_node.index, 0);
Alexander Popovsky (apopovsk)740bcdb2016-11-15 15:36:23 -0800728
729 return 0;
Alexander Popovsky (apopovsk)4a7e58b2016-10-05 22:31:23 -0700730 }
731 else
Alexander Popovsky (apopovsk)740bcdb2016-11-15 15:36:23 -0800732 return clib_error_return (0, "punt delete is not supported yet");
Alexander Popovsky (apopovsk)4a7e58b2016-10-05 22:31:23 -0700733}
734
735static clib_error_t *
Pierre Pfister7fe51f32017-09-20 08:48:36 +0200736punt_cli (vlib_main_t * vm,
737 unformat_input_t * input, vlib_cli_command_t * cmd)
Alexander Popovsky (apopovsk)4a7e58b2016-10-05 22:31:23 -0700738{
Pierre Pfister7fe51f32017-09-20 08:48:36 +0200739 u32 port;
Ole Troanf7a55ad2017-05-16 14:59:29 +0200740 bool is_add = true;
Pierre Pfister7fe51f32017-09-20 08:48:36 +0200741 u32 protocol = ~0;
Alexander Popovsky (apopovsk)4a7e58b2016-10-05 22:31:23 -0700742 clib_error_t *error;
743
744 while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
745 {
746 if (unformat (input, "del"))
Ole Troanf7a55ad2017-05-16 14:59:29 +0200747 is_add = false;
Pierre Pfister7fe51f32017-09-20 08:48:36 +0200748 else if (unformat (input, "all"))
Alexander Popovsky (apopovsk)740bcdb2016-11-15 15:36:23 -0800749 {
750 /* punt both IPv6 and IPv4 when used in CLI */
Pierre Pfister7fe51f32017-09-20 08:48:36 +0200751 error = vnet_punt_add_del (vm, ~0, protocol, ~0, is_add);
Alexander Popovsky (apopovsk)740bcdb2016-11-15 15:36:23 -0800752 if (error)
753 clib_error_report (error);
754 }
Pierre Pfister7fe51f32017-09-20 08:48:36 +0200755 else if (unformat (input, "%d", &port))
Alexander Popovsky (apopovsk)4a7e58b2016-10-05 22:31:23 -0700756 {
757 /* punt both IPv6 and IPv4 when used in CLI */
Pierre Pfister7fe51f32017-09-20 08:48:36 +0200758 error = vnet_punt_add_del (vm, ~0, protocol, port, is_add);
Alexander Popovsky (apopovsk)4a7e58b2016-10-05 22:31:23 -0700759 if (error)
760 clib_error_report (error);
761 }
Pierre Pfister7fe51f32017-09-20 08:48:36 +0200762 else if (unformat (input, "udp"))
763 protocol = IP_PROTOCOL_UDP;
764 else if (unformat (input, "tcp"))
765 protocol = IP_PROTOCOL_TCP;
Alexander Popovsky (apopovsk)4a7e58b2016-10-05 22:31:23 -0700766 }
767
768 return 0;
769}
770
/*?
 * The set of '<em>set punt</em>' commands allows specific IP traffic to
 * be punted to the host TCP/IP stack
 *
 * @em Note
 * - Individual ports can only be punted for UDP; for TCP only
 *   '<em>all</em>' is accepted
 * - All TCP traffic is currently punted to the host by default
 *
 * @cliexpar
 * @parblock
 * Example of how to request NTP traffic (UDP port 123) to be punted
 * @cliexcmd{set punt udp 123}
 *
 * Example of how to request all 'unknown' UDP traffic to be punted
 * @cliexcmd{set punt udp all}
 *
 * Example of how to stop all 'unknown' UDP traffic from being punted
 * @cliexcmd{set punt udp del all}
 * @endparblock
?*/
791/* *INDENT-OFF* */
Pierre Pfister7fe51f32017-09-20 08:48:36 +0200792VLIB_CLI_COMMAND (punt_command, static) = {
793 .path = "set punt",
794 .short_help = "set punt [udp|tcp] [del] <all | port-num1 [port-num2 ...]>",
795 .function = punt_cli,
Alexander Popovsky (apopovsk)4a7e58b2016-10-05 22:31:23 -0700796};
797/* *INDENT-ON* */
798
Ole Troanf7a55ad2017-05-16 14:59:29 +0200799clib_error_t *
800punt_init (vlib_main_t * vm)
801{
802 punt_main_t *pm = &punt_main;
803
804 pm->clients_by_dst_port6 = sparse_vec_new
805 (sizeof (pm->clients_by_dst_port6[0]),
806 BITS (((udp_header_t *) 0)->dst_port));
807 pm->clients_by_dst_port4 = sparse_vec_new
808 (sizeof (pm->clients_by_dst_port4[0]),
809 BITS (((udp_header_t *) 0)->dst_port));
810
811 pm->is_configured = false;
812 pm->interface_output_node = vlib_get_node_by_name (vm,
813 (u8 *)
814 "interface-output");
815 return 0;
816}
817
818VLIB_INIT_FUNCTION (punt_init);
819
820static clib_error_t *
821punt_config (vlib_main_t * vm, unformat_input_t * input)
822{
823 punt_main_t *pm = &punt_main;
824 char *socket_path = 0;
825
826 while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
827 {
828 if (unformat (input, "socket %s", &socket_path))
829 strncpy (pm->sun_path, socket_path, 108 - 1);
830 else
831 return clib_error_return (0, "unknown input `%U'",
832 format_unformat_error, input);
833 }
834
835 if (socket_path == 0)
836 return 0;
837
838 /* UNIX domain socket */
839 struct sockaddr_un addr;
840 if ((pm->socket_fd = socket (AF_UNIX, SOCK_DGRAM | SOCK_NONBLOCK, 0)) == -1)
841 {
842 return clib_error_return (0, "socket error");
843 }
844
845 memset (&addr, 0, sizeof (addr));
846 addr.sun_family = AF_UNIX;
847 if (*socket_path == '\0')
848 {
849 *addr.sun_path = '\0';
850 strncpy (addr.sun_path + 1, socket_path + 1,
851 sizeof (addr.sun_path) - 2);
852 }
853 else
854 {
855 strncpy (addr.sun_path, socket_path, sizeof (addr.sun_path) - 1);
856 unlink (socket_path);
857 }
858
859 if (bind (pm->socket_fd, (struct sockaddr *) &addr, sizeof (addr)) == -1)
860 {
861 return clib_error_return (0, "bind error");
862 }
863
864 /* Register socket */
Damjan Marion56dd5432017-09-08 19:52:02 +0200865 clib_file_main_t *fm = &file_main;
866 clib_file_t template = { 0 };
Ole Troanf7a55ad2017-05-16 14:59:29 +0200867 template.read_function = punt_socket_read_ready;
868 template.file_descriptor = pm->socket_fd;
Damjan Marion56dd5432017-09-08 19:52:02 +0200869 pm->clib_file_index = clib_file_add (fm, &template);
Ole Troanf7a55ad2017-05-16 14:59:29 +0200870
871 pm->is_configured = true;
872
873 return 0;
874}
875
876VLIB_CONFIG_FUNCTION (punt_config, "punt");
877
Alexander Popovsky (apopovsk)4a7e58b2016-10-05 22:31:23 -0700878/*
879 * fd.io coding-style-patch-verification: ON
880 *
881 * Local Variables:
882 * eval: (c-set-style "gnu")
883 * End:
884 */