blob: bd4e75710f5c0ee9ff69d92f4d4e27c8612d0940 [file] [log] [blame]
/*
 * Copyright (c) 2016-2019 Cisco and/or its affiliates.
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at:
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
15
Florin Coras7fb0fe12018-04-09 09:24:52 -070016#include <vlibmemory/api.h>
Dave Barach68b0fb02017-02-28 15:15:56 -050017#include <vlib/vlib.h>
Dave Barach68b0fb02017-02-28 15:15:56 -050018
Dave Barach68b0fb02017-02-28 15:15:56 -050019#include <vppinfra/hash.h>
20#include <vppinfra/error.h>
21#include <vppinfra/elog.h>
22
Florin Coras7fb0fe12018-04-09 09:24:52 -070023#include <vnet/vnet.h>
24#include <vnet/pg/pg.h>
25#include <vnet/ip/ip.h>
26#include <vnet/udp/udp.h>
Dave Barach68b0fb02017-02-28 15:15:56 -050027#include <vnet/udp/udp_packet.h>
Florin Coras7fb0fe12018-04-09 09:24:52 -070028#include <vnet/session/session.h>
Dave Barach68b0fb02017-02-28 15:15:56 -050029
Florin Coras3cbc04b2017-10-02 00:18:51 -070030static char *udp_error_strings[] = {
31#define udp_error(n,s) s,
32#include "udp_error.def"
33#undef udp_error
34};
Dave Barach68b0fb02017-02-28 15:15:56 -050035
36typedef struct
37{
Florin Coras3cbc04b2017-10-02 00:18:51 -070038 u32 connection;
Dave Barach68b0fb02017-02-28 15:15:56 -050039 u32 disposition;
40 u32 thread_index;
Florin Coras3cbc04b2017-10-02 00:18:51 -070041} udp_input_trace_t;
Dave Barach68b0fb02017-02-28 15:15:56 -050042
43/* packet trace format function */
44static u8 *
Florin Coras3cbc04b2017-10-02 00:18:51 -070045format_udp_input_trace (u8 * s, va_list * args)
Dave Barach68b0fb02017-02-28 15:15:56 -050046{
47 CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *);
48 CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *);
Florin Coras3cbc04b2017-10-02 00:18:51 -070049 udp_input_trace_t *t = va_arg (*args, udp_input_trace_t *);
Dave Barach68b0fb02017-02-28 15:15:56 -050050
Florin Coras3cbc04b2017-10-02 00:18:51 -070051 s = format (s, "UDP_INPUT: connection %d, disposition %d, thread %d",
52 t->connection, t->disposition, t->thread_index);
Dave Barach68b0fb02017-02-28 15:15:56 -050053 return s;
54}
55
/* X-macro list of the udp input nodes' next nodes: _ (symbol, node name) */
#define foreach_udp_input_next _ (DROP, "error-drop")
58
Dave Barach68b0fb02017-02-28 15:15:56 -050059typedef enum
60{
Florin Coras3cbc04b2017-10-02 00:18:51 -070061#define _(s, n) UDP_INPUT_NEXT_##s,
62 foreach_udp_input_next
Dave Barach68b0fb02017-02-28 15:15:56 -050063#undef _
Florin Coras3cbc04b2017-10-02 00:18:51 -070064 UDP_INPUT_N_NEXT,
65} udp_input_next_t;
Dave Barach68b0fb02017-02-28 15:15:56 -050066
Florin Coras3cbc04b2017-10-02 00:18:51 -070067always_inline void
68udp_input_inc_counter (vlib_main_t * vm, u8 is_ip4, u8 evt, u8 val)
69{
70 if (PREDICT_TRUE (!val))
71 return;
72
73 if (is_ip4)
74 vlib_node_increment_counter (vm, udp4_input_node.index, evt, val);
75 else
76 vlib_node_increment_counter (vm, udp6_input_node.index, evt, val);
77}
78
79always_inline uword
80udp46_input_inline (vlib_main_t * vm, vlib_node_runtime_t * node,
81 vlib_frame_t * frame, u8 is_ip4)
Dave Barach68b0fb02017-02-28 15:15:56 -050082{
Aloys Augustin8fadb652019-09-24 18:57:50 +020083 u32 n_left_from, *from;
84 u32 errors, *first_buffer;
Damjan Marion586afd72017-04-05 19:18:20 +020085 u32 my_thread_index = vm->thread_index;
Dave Barach68b0fb02017-02-28 15:15:56 -050086
Aloys Augustin8fadb652019-09-24 18:57:50 +020087 from = first_buffer = vlib_frame_vector_args (frame);
Dave Barach68b0fb02017-02-28 15:15:56 -050088 n_left_from = frame->n_vectors;
Dave Barach68b0fb02017-02-28 15:15:56 -050089
90 while (n_left_from > 0)
91 {
Aloys Augustin8fadb652019-09-24 18:57:50 +020092 u32 bi0, fib_index0;
93 vlib_buffer_t *b0;
94 u32 error0 = UDP_ERROR_ENQUEUED;
95 udp_header_t *udp0;
96 ip4_header_t *ip40;
97 ip6_header_t *ip60;
98 u8 *data0;
99 session_t *s0;
100 udp_connection_t *uc0, *child0, *new_uc0;
101 transport_connection_t *tc0;
102 int wrote0;
103 void *rmt_addr, *lcl_addr;
104 session_dgram_hdr_t hdr0;
105 u8 queue_event = 1;
Dave Barach68b0fb02017-02-28 15:15:56 -0500106
Aloys Augustin8fadb652019-09-24 18:57:50 +0200107 /* speculatively enqueue b0 to the current next frame */
108 bi0 = from[0];
109 from += 1;
110 n_left_from -= 1;
Dave Barach68b0fb02017-02-28 15:15:56 -0500111
Aloys Augustin8fadb652019-09-24 18:57:50 +0200112 b0 = vlib_get_buffer (vm, bi0);
113
114 /* udp_local hands us a pointer to the udp data */
115 data0 = vlib_buffer_get_current (b0);
116 udp0 = (udp_header_t *) (data0 - sizeof (*udp0));
117 fib_index0 = vnet_buffer (b0)->ip.fib_index;
118
119 if (is_ip4)
Dave Barach68b0fb02017-02-28 15:15:56 -0500120 {
Aloys Augustin8fadb652019-09-24 18:57:50 +0200121 /* TODO: must fix once udp_local does ip options correctly */
122 ip40 = (ip4_header_t *) (((u8 *) udp0) - sizeof (*ip40));
123 s0 = session_lookup_safe4 (fib_index0, &ip40->dst_address,
124 &ip40->src_address, udp0->dst_port,
125 udp0->src_port, TRANSPORT_PROTO_UDP);
126 lcl_addr = &ip40->dst_address;
127 rmt_addr = &ip40->src_address;
Dave Barach68b0fb02017-02-28 15:15:56 -0500128
Aloys Augustin8fadb652019-09-24 18:57:50 +0200129 }
130 else
131 {
132 ip60 = (ip6_header_t *) (((u8 *) udp0) - sizeof (*ip60));
133 s0 = session_lookup_safe6 (fib_index0, &ip60->dst_address,
134 &ip60->src_address, udp0->dst_port,
135 udp0->src_port, TRANSPORT_PROTO_UDP);
136 lcl_addr = &ip60->dst_address;
137 rmt_addr = &ip60->src_address;
Dave Barach68b0fb02017-02-28 15:15:56 -0500138 }
139
Aloys Augustin8fadb652019-09-24 18:57:50 +0200140 if (PREDICT_FALSE (!s0))
141 {
142 error0 = UDP_ERROR_NO_LISTENER;
143 goto trace0;
144 }
145
146 if (s0->session_state == SESSION_STATE_OPENED)
147 {
148 /* TODO optimization: move cl session to right thread
149 * However, since such a move would affect the session handle,
150 * which we pass 'raw' to the app, we'd also have notify the
151 * app of the change or change the way we pass handles to apps.
152 */
153 tc0 = session_get_transport (s0);
154 uc0 = udp_get_connection_from_transport (tc0);
155 if (uc0->flags & UDP_CONN_F_CONNECTED)
156 {
157 if (s0->thread_index != vlib_get_thread_index ())
158 {
159 /*
160 * Clone the transport. It will be cleaned up with the
161 * session once we notify the session layer.
162 */
163 new_uc0 =
164 udp_connection_clone_safe (s0->connection_index,
165 s0->thread_index);
166 ASSERT (s0->session_index == new_uc0->c_s_index);
167
168 /*
169 * Drop the 'lock' on pool resize
170 */
171 session_pool_remove_peeker (s0->thread_index);
172 session_dgram_connect_notify (&new_uc0->connection,
173 s0->thread_index, &s0);
174 tc0 = &new_uc0->connection;
175 uc0 = new_uc0;
176 queue_event = 0;
177 }
178 else
179 s0->session_state = SESSION_STATE_READY;
180 }
181 }
182 else if (s0->session_state == SESSION_STATE_READY)
183 {
184 tc0 = session_get_transport (s0);
185 uc0 = udp_get_connection_from_transport (tc0);
186 }
187 else if (s0->session_state == SESSION_STATE_LISTENING)
188 {
189 tc0 = listen_session_get_transport (s0);
190 uc0 = udp_get_connection_from_transport (tc0);
191 if (uc0->flags & UDP_CONN_F_CONNECTED)
192 {
193 child0 = udp_connection_alloc (my_thread_index);
194 if (is_ip4)
195 {
196 ip_set (&child0->c_lcl_ip, &ip40->dst_address, 1);
197 ip_set (&child0->c_rmt_ip, &ip40->src_address, 1);
198 }
199 else
200 {
201 ip_set (&child0->c_lcl_ip, &ip60->dst_address, 0);
202 ip_set (&child0->c_rmt_ip, &ip60->src_address, 0);
203 }
204 child0->c_lcl_port = udp0->dst_port;
205 child0->c_rmt_port = udp0->src_port;
206 child0->c_is_ip4 = is_ip4;
207 child0->c_fib_index = tc0->fib_index;
208 child0->flags |= UDP_CONN_F_CONNECTED;
209
210 if (session_stream_accept (&child0->connection,
211 tc0->s_index, tc0->thread_index, 1))
212 {
213 error0 = UDP_ERROR_CREATE_SESSION;
214 goto trace0;
215 }
216 s0 = session_get (child0->c_s_index, child0->c_thread_index);
217 s0->session_state = SESSION_STATE_READY;
218 tc0 = &child0->connection;
219 uc0 = udp_get_connection_from_transport (tc0);
220 error0 = UDP_ERROR_LISTENER;
221 }
222 }
223 else
224 {
225 error0 = UDP_ERROR_NOT_READY;
226 goto trace0;
227 }
228
229
230 if (svm_fifo_max_enqueue_prod (s0->rx_fifo)
231 < b0->current_length + sizeof (session_dgram_hdr_t))
232 {
233 error0 = UDP_ERROR_FIFO_FULL;
234 goto trace0;
235 }
236 hdr0.data_length = b0->current_length;
237 hdr0.data_offset = 0;
238 ip_set (&hdr0.lcl_ip, lcl_addr, is_ip4);
239 ip_set (&hdr0.rmt_ip, rmt_addr, is_ip4);
240 hdr0.lcl_port = udp0->dst_port;
241 hdr0.rmt_port = udp0->src_port;
242 hdr0.is_ip4 = is_ip4;
243
244 clib_spinlock_lock (&uc0->rx_lock);
245 /* If session is owned by another thread and rx event needed,
246 * enqueue event now while we still have the peeker lock */
247 if (s0->thread_index != my_thread_index)
248 {
249 wrote0 = session_enqueue_dgram_connection (s0, &hdr0, b0,
250 TRANSPORT_PROTO_UDP,
251 /* queue event */ 0);
252 if (queue_event && !svm_fifo_has_event (s0->rx_fifo))
253 session_enqueue_notify (s0);
254 }
255 else
256 {
257 wrote0 = session_enqueue_dgram_connection (s0, &hdr0, b0,
258 TRANSPORT_PROTO_UDP,
259 queue_event);
260 }
261 clib_spinlock_unlock (&uc0->rx_lock);
262 ASSERT (wrote0 > 0);
263
264 if (s0->session_state != SESSION_STATE_LISTENING)
265 session_pool_remove_peeker (s0->thread_index);
266
267 trace0:
268
269 b0->error = node->errors[error0];
270
271 if (PREDICT_FALSE ((node->flags & VLIB_NODE_FLAG_TRACE)
272 && (b0->flags & VLIB_BUFFER_IS_TRACED)))
273 {
274 udp_input_trace_t *t = vlib_add_trace (vm, node, b0,
275 sizeof (*t));
276
277 t->connection = s0 ? s0->connection_index : ~0;
278 t->disposition = error0;
279 t->thread_index = my_thread_index;
280 }
Dave Barach68b0fb02017-02-28 15:15:56 -0500281 }
282
Aloys Augustin8fadb652019-09-24 18:57:50 +0200283 vlib_buffer_free (vm, first_buffer, frame->n_vectors);
Florin Coras9cbf6812019-08-06 18:28:49 -0700284 errors = session_main_flush_enqueue_events (TRANSPORT_PROTO_UDP,
285 my_thread_index);
Florin Coras3cbc04b2017-10-02 00:18:51 -0700286 udp_input_inc_counter (vm, is_ip4, UDP_ERROR_EVENT_FIFO_FULL, errors);
Dave Barach68b0fb02017-02-28 15:15:56 -0500287 return frame->n_vectors;
288}
289
Florin Coras3cbc04b2017-10-02 00:18:51 -0700290
291static uword
292udp4_input (vlib_main_t * vm, vlib_node_runtime_t * node,
293 vlib_frame_t * frame)
Dave Barach68b0fb02017-02-28 15:15:56 -0500294{
Florin Coras3cbc04b2017-10-02 00:18:51 -0700295 return udp46_input_inline (vm, node, frame, 1);
296}
297
298/* *INDENT-OFF* */
299VLIB_REGISTER_NODE (udp4_input_node) =
300{
301 .function = udp4_input,
302 .name = "udp4-input",
303 .vector_size = sizeof (u32),
304 .format_trace = format_udp_input_trace,
305 .type = VLIB_NODE_TYPE_INTERNAL,
306 .n_errors = ARRAY_LEN (udp_error_strings),
307 .error_strings = udp_error_strings,
308 .n_next_nodes = UDP_INPUT_N_NEXT,
309 .next_nodes = {
310#define _(s, n) [UDP_INPUT_NEXT_##s] = n,
311 foreach_udp_input_next
312#undef _
313 },
314};
315/* *INDENT-ON* */
316
317static uword
318udp6_input (vlib_main_t * vm, vlib_node_runtime_t * node,
319 vlib_frame_t * frame)
320{
321 return udp46_input_inline (vm, node, frame, 0);
322}
323
324/* *INDENT-OFF* */
325VLIB_REGISTER_NODE (udp6_input_node) =
326{
327 .function = udp6_input,
328 .name = "udp6-input",
329 .vector_size = sizeof (u32),
330 .format_trace = format_udp_input_trace,
331 .type = VLIB_NODE_TYPE_INTERNAL,
332 .n_errors = ARRAY_LEN (udp_error_strings),
333 .error_strings = udp_error_strings,
334 .n_next_nodes = UDP_INPUT_N_NEXT,
335 .next_nodes = {
336#define _(s, n) [UDP_INPUT_NEXT_##s] = n,
337 foreach_udp_input_next
338#undef _
339 },
340};
341/* *INDENT-ON* */
Dave Barach68b0fb02017-02-28 15:15:56 -0500342
/*
 * fd.io coding-style-patch-verification: ON
 *
 * Local Variables:
 * eval: (c-set-style "gnu")
 * End:
 */