/*
 * Copyright (c) 2015 Cisco and/or its affiliates.
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at:
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
/*
 * ip/ip4_input.c: IP v4 input node
 *
 * Copyright (c) 2008 Eliot Dresselhaus
 *
 * Permission is hereby granted, free of charge, to any person obtaining
 * a copy of this software and associated documentation files (the
 * "Software"), to deal in the Software without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sublicense, and/or sell copies of the Software, and to
 * permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 *
 * The above copyright notice and this permission notice shall be
 * included in all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
 * LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
 * OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
 * WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 */
39
Neale Ranns4c7c8e52017-10-21 09:37:55 -070040#include <vnet/ip/ip4_input.h>
Ed Warnickecb9cada2015-12-08 15:45:58 -070041#include <vnet/ethernet/ethernet.h>
42#include <vnet/ppp/ppp.h>
43#include <vnet/hdlc/hdlc.h>
44
Dave Barachd7cb1b52016-12-09 09:52:16 -050045typedef struct
46{
Ed Warnickecb9cada2015-12-08 15:45:58 -070047 u8 packet_data[64];
48} ip4_input_trace_t;
49
Damjan Marion812b32d2018-05-28 21:26:47 +020050#ifndef CLIB_MARCH_VARIANT
Dave Barachd7cb1b52016-12-09 09:52:16 -050051static u8 *
52format_ip4_input_trace (u8 * s, va_list * va)
Ed Warnickecb9cada2015-12-08 15:45:58 -070053{
54 CLIB_UNUSED (vlib_main_t * vm) = va_arg (*va, vlib_main_t *);
55 CLIB_UNUSED (vlib_node_t * node) = va_arg (*va, vlib_node_t *);
Dave Barachd7cb1b52016-12-09 09:52:16 -050056 ip4_input_trace_t *t = va_arg (*va, ip4_input_trace_t *);
Ed Warnickecb9cada2015-12-08 15:45:58 -070057
58 s = format (s, "%U",
Dave Barachd7cb1b52016-12-09 09:52:16 -050059 format_ip4_header, t->packet_data, sizeof (t->packet_data));
Ed Warnickecb9cada2015-12-08 15:45:58 -070060
61 return s;
62}
Damjan Marion3ade6b62018-05-26 18:53:34 +020063#endif
64
65static_always_inline u32
66ip4_input_set_next (u32 sw_if_index, vlib_buffer_t * b, int arc_enabled)
67{
68 ip4_main_t *im = &ip4_main;
69 ip_lookup_main_t *lm = &im->lookup_main;
70 u32 next;
71 u8 arc;
72
73 ip4_header_t *ip = vlib_buffer_get_current (b);
74
75 if (PREDICT_FALSE (ip4_address_is_multicast (&ip->dst_address)))
76 {
77 next = IP4_INPUT_NEXT_LOOKUP_MULTICAST;
78 arc = lm->mcast_feature_arc_index;
79 }
80 else
81 {
82 next = IP4_INPUT_NEXT_LOOKUP;
83 arc = lm->ucast_feature_arc_index;
84 }
85
86 if (arc_enabled)
87 vnet_feature_arc_start (arc, sw_if_index, &next, b);
88
89 return next;
90}
91
92static_always_inline void
Damjan Marion067cd622018-07-11 12:47:43 +020093ip4_input_check_sw_if_index (vlib_main_t * vm,
94 vlib_simple_counter_main_t * cm, u32 sw_if_index,
Damjan Marion3ade6b62018-05-26 18:53:34 +020095 u32 * last_sw_if_index, u32 * cnt,
96 int *arc_enabled)
97{
98 ip4_main_t *im = &ip4_main;
99 ip_lookup_main_t *lm = &im->lookup_main;
100 u32 thread_index;
101 if (*last_sw_if_index == sw_if_index)
102 {
103 (*cnt)++;
104 return;
105 }
106
Damjan Marion067cd622018-07-11 12:47:43 +0200107 thread_index = vm->thread_index;
Damjan Marion3ade6b62018-05-26 18:53:34 +0200108 if (*cnt)
109 vlib_increment_simple_counter (cm, thread_index, *last_sw_if_index, *cnt);
110 *cnt = 1;
111 *last_sw_if_index = sw_if_index;
112
113 if (vnet_have_features (lm->ucast_feature_arc_index, sw_if_index) ||
114 vnet_have_features (lm->mcast_feature_arc_index, sw_if_index))
115 *arc_enabled = 1;
116 else
117 *arc_enabled = 0;
118}
Ed Warnickecb9cada2015-12-08 15:45:58 -0700119
Ed Warnickecb9cada2015-12-08 15:45:58 -0700120/* Validate IP v4 packets and pass them either to forwarding code
121 or drop/punt exception packets. */
122always_inline uword
123ip4_input_inline (vlib_main_t * vm,
124 vlib_node_runtime_t * node,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500125 vlib_frame_t * frame, int verify_checksum)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700126{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500127 vnet_main_t *vnm = vnet_get_main ();
Damjan Marion3ade6b62018-05-26 18:53:34 +0200128 u32 n_left_from, *from;
Damjan Marion067cd622018-07-11 12:47:43 +0200129 u32 thread_index = vm->thread_index;
Dave Barachd7cb1b52016-12-09 09:52:16 -0500130 vlib_node_runtime_t *error_node =
131 vlib_node_get_runtime (vm, ip4_input_node.index);
132 vlib_simple_counter_main_t *cm;
Damjan Marion3ade6b62018-05-26 18:53:34 +0200133 vlib_buffer_t *bufs[VLIB_FRAME_SIZE], **b;
134 ip4_header_t *ip[4];
135 u16 nexts[VLIB_FRAME_SIZE], *next;
136 u32 sw_if_index[4];
137 u32 last_sw_if_index = ~0;
138 u32 cnt = 0;
139 int arc_enabled = 0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700140
141 from = vlib_frame_vector_args (frame);
142 n_left_from = frame->n_vectors;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700143
144 if (node->flags & VLIB_NODE_FLAG_TRACE)
145 vlib_trace_frame_buffers_only (vm, node, from, frame->n_vectors,
146 /* stride */ 1,
147 sizeof (ip4_input_trace_t));
148
149 cm = vec_elt_at_index (vnm->interface_main.sw_if_counters,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500150 VNET_INTERFACE_COUNTER_IP4);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700151
Damjan Marion3ade6b62018-05-26 18:53:34 +0200152 vlib_get_buffers (vm, from, bufs, n_left_from);
153 b = bufs;
154 next = nexts;
155 while (n_left_from >= 4)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700156 {
Damjan Marion3ade6b62018-05-26 18:53:34 +0200157 u32 x = 0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700158
Damjan Marion3ade6b62018-05-26 18:53:34 +0200159 /* Prefetch next iteration. */
160 if (n_left_from >= 12)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700161 {
Damjan Marion3ade6b62018-05-26 18:53:34 +0200162 vlib_prefetch_buffer_header (b[8], LOAD);
163 vlib_prefetch_buffer_header (b[9], LOAD);
164 vlib_prefetch_buffer_header (b[10], LOAD);
165 vlib_prefetch_buffer_header (b[11], LOAD);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700166
Damjan Marion3ade6b62018-05-26 18:53:34 +0200167 CLIB_PREFETCH (b[4]->data, sizeof (ip4_header_t), LOAD);
168 CLIB_PREFETCH (b[5]->data, sizeof (ip4_header_t), LOAD);
169 CLIB_PREFETCH (b[6]->data, sizeof (ip4_header_t), LOAD);
170 CLIB_PREFETCH (b[7]->data, sizeof (ip4_header_t), LOAD);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700171 }
172
Damjan Marion3ade6b62018-05-26 18:53:34 +0200173 vnet_buffer (b[0])->ip.adj_index[VLIB_RX] = ~0;
174 vnet_buffer (b[1])->ip.adj_index[VLIB_RX] = ~0;
175 vnet_buffer (b[2])->ip.adj_index[VLIB_RX] = ~0;
176 vnet_buffer (b[3])->ip.adj_index[VLIB_RX] = ~0;
177
178 sw_if_index[0] = vnet_buffer (b[0])->sw_if_index[VLIB_RX];
179 sw_if_index[1] = vnet_buffer (b[1])->sw_if_index[VLIB_RX];
180 sw_if_index[2] = vnet_buffer (b[2])->sw_if_index[VLIB_RX];
181 sw_if_index[3] = vnet_buffer (b[3])->sw_if_index[VLIB_RX];
182
183 x |= sw_if_index[0] ^ last_sw_if_index;
184 x |= sw_if_index[1] ^ last_sw_if_index;
185 x |= sw_if_index[2] ^ last_sw_if_index;
186 x |= sw_if_index[3] ^ last_sw_if_index;
187
188 if (PREDICT_TRUE (x == 0))
189 {
190 /* we deal with 4 more packets sharing the same sw_if_index
191 with the previous one, so we can optimize */
192 cnt += 4;
193 if (arc_enabled)
194 {
195 next[0] = ip4_input_set_next (sw_if_index[0], b[0], 1);
196 next[1] = ip4_input_set_next (sw_if_index[1], b[1], 1);
197 next[2] = ip4_input_set_next (sw_if_index[2], b[2], 1);
198 next[3] = ip4_input_set_next (sw_if_index[3], b[3], 1);
199 }
200 else
201 {
202 next[0] = ip4_input_set_next (sw_if_index[0], b[0], 0);
203 next[1] = ip4_input_set_next (sw_if_index[1], b[1], 0);
204 next[2] = ip4_input_set_next (sw_if_index[2], b[2], 0);
205 next[3] = ip4_input_set_next (sw_if_index[3], b[3], 0);
206 }
207 }
208 else
209 {
Damjan Marion067cd622018-07-11 12:47:43 +0200210 ip4_input_check_sw_if_index (vm, cm, sw_if_index[0],
211 &last_sw_if_index, &cnt, &arc_enabled);
212 ip4_input_check_sw_if_index (vm, cm, sw_if_index[1],
213 &last_sw_if_index, &cnt, &arc_enabled);
214 ip4_input_check_sw_if_index (vm, cm, sw_if_index[2],
215 &last_sw_if_index, &cnt, &arc_enabled);
216 ip4_input_check_sw_if_index (vm, cm, sw_if_index[3],
217 &last_sw_if_index, &cnt, &arc_enabled);
Damjan Marion3ade6b62018-05-26 18:53:34 +0200218
219 next[0] = ip4_input_set_next (sw_if_index[0], b[0], 1);
220 next[1] = ip4_input_set_next (sw_if_index[1], b[1], 1);
221 next[2] = ip4_input_set_next (sw_if_index[2], b[2], 1);
222 next[3] = ip4_input_set_next (sw_if_index[3], b[3], 1);
223 }
224
225 ip[0] = vlib_buffer_get_current (b[0]);
226 ip[1] = vlib_buffer_get_current (b[1]);
227 ip[2] = vlib_buffer_get_current (b[2]);
228 ip[3] = vlib_buffer_get_current (b[3]);
229
230 ip4_input_check_x4 (vm, error_node, b, ip, next, verify_checksum);
231
232 /* next */
233 b += 4;
234 next += 4;
235 n_left_from -= 4;
236 }
237 while (n_left_from)
238 {
239 u32 next0;
240 vnet_buffer (b[0])->ip.adj_index[VLIB_RX] = ~0;
241 sw_if_index[0] = vnet_buffer (b[0])->sw_if_index[VLIB_RX];
Damjan Marion067cd622018-07-11 12:47:43 +0200242 ip4_input_check_sw_if_index (vm, cm, sw_if_index[0], &last_sw_if_index,
Damjan Marion3ade6b62018-05-26 18:53:34 +0200243 &cnt, &arc_enabled);
244 next0 = ip4_input_set_next (sw_if_index[0], b[0], arc_enabled);
245 ip[0] = vlib_buffer_get_current (b[0]);
246 ip4_input_check_x1 (vm, error_node, b[0], ip[0], &next0,
247 verify_checksum);
248 next[0] = next0;
249
250 /* next */
251 b += 1;
252 next += 1;
253 n_left_from -= 1;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700254 }
255
Damjan Marion3ade6b62018-05-26 18:53:34 +0200256 vlib_increment_simple_counter (cm, thread_index, last_sw_if_index, cnt);
257 vlib_buffer_enqueue_to_next (vm, node, from, nexts, frame->n_vectors);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700258 return frame->n_vectors;
259}
260
Dave Barach132d51d2016-07-07 10:10:17 -0400261/** \brief IPv4 input node.
262 @node ip4-input
263
264 This is the IPv4 input node: validates ip4 header checksums,
265 verifies ip header lengths, discards pkts with expired TTLs,
266 and sends pkts to the set of ip feature nodes configured on
267 the rx interface.
268
269 @param vm vlib_main_t corresponding to the current thread
270 @param node vlib_node_runtime_t
271 @param frame vlib_frame_t whose contents should be dispatched
272
273 @par Graph mechanics: buffer metadata, next index usage
274
275 @em Uses:
Dave Barachd7cb1b52016-12-09 09:52:16 -0500276 - vnet_feature_config_main_t cm corresponding to each pkt's dst address unicast /
Dave Barach132d51d2016-07-07 10:10:17 -0400277 multicast status.
278 - <code>b->current_config_index</code> corresponding to each pkt's
Dave Barachd7cb1b52016-12-09 09:52:16 -0500279 rx sw_if_index.
Dave Barach132d51d2016-07-07 10:10:17 -0400280 - This sets the per-packet graph trajectory, ensuring that
281 each packet visits the per-interface features in order.
282
283 - <code>vnet_buffer(b)->sw_if_index[VLIB_RX]</code>
284 - Indicates the @c sw_if_index value of the interface that the
285 packet was received on.
286
287 @em Sets:
288 - <code>vnet_buffer(b)->ip.adj_index[VLIB_TX]</code>
289 - The lookup result adjacency index.
290
291 <em>Next Indices:</em>
292 - Dispatches pkts to the (first) feature node:
293 <code> vnet_get_config_data (... &next0 ...); </code>
Dave Barachd7cb1b52016-12-09 09:52:16 -0500294 or @c error-drop
Dave Barach132d51d2016-07-07 10:10:17 -0400295*/
Damjan Marion812b32d2018-05-28 21:26:47 +0200296VLIB_NODE_FN (ip4_input_node) (vlib_main_t * vm, vlib_node_runtime_t * node,
Damjan Marion3ade6b62018-05-26 18:53:34 +0200297 vlib_frame_t * frame)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700298{
299 return ip4_input_inline (vm, node, frame, /* verify_checksum */ 1);
300}
301
Damjan Marion812b32d2018-05-28 21:26:47 +0200302VLIB_NODE_FN (ip4_input_no_checksum_node) (vlib_main_t * vm,
Damjan Marion3ade6b62018-05-26 18:53:34 +0200303 vlib_node_runtime_t * node,
304 vlib_frame_t * frame)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700305{
306 return ip4_input_inline (vm, node, frame, /* verify_checksum */ 0);
307}
308
Damjan Marion812b32d2018-05-28 21:26:47 +0200309#ifndef CLIB_MARCH_VARIANT
Neale Ranns4c7c8e52017-10-21 09:37:55 -0700310char *ip4_error_strings[] = {
Ed Warnickecb9cada2015-12-08 15:45:58 -0700311#define _(sym,string) string,
312 foreach_ip4_error
313#undef _
314};
315
Dave Barachd7cb1b52016-12-09 09:52:16 -0500316/* *INDENT-OFF* */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700317VLIB_REGISTER_NODE (ip4_input_node) = {
Ed Warnickecb9cada2015-12-08 15:45:58 -0700318 .name = "ip4-input",
319 .vector_size = sizeof (u32),
320
321 .n_errors = IP4_N_ERROR,
322 .error_strings = ip4_error_strings,
323
324 .n_next_nodes = IP4_INPUT_N_NEXT,
325 .next_nodes = {
326 [IP4_INPUT_NEXT_DROP] = "error-drop",
327 [IP4_INPUT_NEXT_PUNT] = "error-punt",
Neale Rannsc667ffd2018-06-27 18:59:03 -0700328 [IP4_INPUT_NEXT_OPTIONS] = "ip4-options",
Ed Warnickecb9cada2015-12-08 15:45:58 -0700329 [IP4_INPUT_NEXT_LOOKUP] = "ip4-lookup",
Neale Ranns32e1c012016-11-22 17:07:28 +0000330 [IP4_INPUT_NEXT_LOOKUP_MULTICAST] = "ip4-mfib-forward-lookup",
Ole Troan92eade12016-01-13 20:17:08 +0100331 [IP4_INPUT_NEXT_ICMP_ERROR] = "ip4-icmp-error",
Klement Sekera75e7d132017-09-20 08:26:30 +0200332 [IP4_INPUT_NEXT_REASSEMBLY] = "ip4-reassembly",
Ed Warnickecb9cada2015-12-08 15:45:58 -0700333 },
334
335 .format_buffer = format_ip4_header,
336 .format_trace = format_ip4_input_trace,
337};
338
Damjan Marion812b32d2018-05-28 21:26:47 +0200339VLIB_REGISTER_NODE (ip4_input_no_checksum_node) = {
Ed Warnickecb9cada2015-12-08 15:45:58 -0700340 .name = "ip4-input-no-checksum",
341 .vector_size = sizeof (u32),
342
Neale Ranns8a03e4f2018-07-17 07:15:05 -0700343 .sibling_of = "ip4-input",
Ed Warnickecb9cada2015-12-08 15:45:58 -0700344 .format_buffer = format_ip4_header,
345 .format_trace = format_ip4_input_trace,
346};
Dave Barachd7cb1b52016-12-09 09:52:16 -0500347/* *INDENT-ON* */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700348
Dave Barachd7cb1b52016-12-09 09:52:16 -0500349static clib_error_t *
350ip4_init (vlib_main_t * vm)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700351{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500352 clib_error_t *error;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700353
Dave Barachd7cb1b52016-12-09 09:52:16 -0500354 ethernet_register_input_type (vm, ETHERNET_TYPE_IP4, ip4_input_node.index);
355 ppp_register_input_protocol (vm, PPP_PROTOCOL_ip4, ip4_input_node.index);
356 hdlc_register_input_protocol (vm, HDLC_PROTOCOL_ip4, ip4_input_node.index);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700357
358 {
Dave Barachd7cb1b52016-12-09 09:52:16 -0500359 pg_node_t *pn;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700360 pn = pg_get_node (ip4_input_node.index);
361 pn->unformat_edit = unformat_pg_ip4_header;
362 pn = pg_get_node (ip4_input_no_checksum_node.index);
363 pn->unformat_edit = unformat_pg_ip4_header;
364 }
365
366 if ((error = vlib_call_init_function (vm, ip4_cli_init)))
367 return error;
368
369 if ((error = vlib_call_init_function (vm, ip4_source_check_init)))
370 return error;
371
Dave Barachd7cb1b52016-12-09 09:52:16 -0500372 if ((error = vlib_call_init_function
Dave Barach6f9bca22016-04-30 10:25:32 -0400373 (vm, ip4_source_and_port_range_check_init)))
374 return error;
375
Ed Warnickecb9cada2015-12-08 15:45:58 -0700376 /* Set flow hash to something non-zero. */
377 ip4_main.flow_hash_seed = 0xdeadbeef;
378
379 /* Default TTL for packets we generate. */
380 ip4_main.host_config.ttl = 64;
381
382 return error;
383}
384
385VLIB_INIT_FUNCTION (ip4_init);
Dave Barach49433ad2018-08-08 17:59:03 -0400386
387static clib_error_t *
388ip4_main_loop_enter (vlib_main_t * vm)
389{
390 ip4_main_t *im = &ip4_main;
391 vlib_thread_main_t *tm = &vlib_thread_main;
392 u32 n_vlib_mains = tm->n_vlib_mains;
393 int i;
394
395
396 vec_validate (im->arp_throttle_bitmaps, n_vlib_mains);
397 vec_validate (im->arp_throttle_seeds, n_vlib_mains);
398 vec_validate (im->arp_throttle_last_seed_change_time, n_vlib_mains);
399
400 for (i = 0; i < n_vlib_mains; i++)
401 vec_validate (im->arp_throttle_bitmaps[i],
402 (ARP_THROTTLE_BITS / BITS (uword)) - 1);
403 return 0;
404}
405
406VLIB_MAIN_LOOP_ENTER_FUNCTION (ip4_main_loop_enter);
407
Damjan Marion3ade6b62018-05-26 18:53:34 +0200408#endif

/*
 * fd.io coding-style-patch-verification: ON
 *
 * Local Variables:
 * eval: (c-set-style "gnu")
 * End:
 */