blob: b9875d72b8e9fa5c6ed7a7f16cc3bb1917560739 [file] [log] [blame]
Ed Warnickecb9cada2015-12-08 15:45:58 -07001/*
2 * Copyright (c) 2015 Cisco and/or its affiliates.
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at:
6 *
7 * http://www.apache.org/licenses/LICENSE-2.0
8 *
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
14 */
15/*
16 * ip/ip4_forward.c: IP v4 forwarding
17 *
18 * Copyright (c) 2008 Eliot Dresselhaus
19 *
20 * Permission is hereby granted, free of charge, to any person obtaining
21 * a copy of this software and associated documentation files (the
22 * "Software"), to deal in the Software without restriction, including
23 * without limitation the rights to use, copy, modify, merge, publish,
24 * distribute, sublicense, and/or sell copies of the Software, and to
25 * permit persons to whom the Software is furnished to do so, subject to
26 * the following conditions:
27 *
28 * The above copyright notice and this permission notice shall be
29 * included in all copies or substantial portions of the Software.
30 *
31 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
32 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
33 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
34 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
35 * LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
36 * OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
37 * WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
38 */
39
40#include <vnet/vnet.h>
41#include <vnet/ip/ip.h>
Neale Ranns0bfe5d82016-08-25 15:29:12 +010042#include <vnet/ethernet/ethernet.h> /* for ethernet_header_t */
43#include <vnet/ethernet/arp_packet.h> /* for ethernet_arp_header_t */
Ed Warnickecb9cada2015-12-08 15:45:58 -070044#include <vnet/ppp/ppp.h>
Neale Ranns0bfe5d82016-08-25 15:29:12 +010045#include <vnet/srp/srp.h> /* for srp_hw_interface_class */
Dave Barachd7cb1b52016-12-09 09:52:16 -050046#include <vnet/api_errno.h> /* for API error numbers */
47#include <vnet/fib/fib_table.h> /* for FIB table and entry creation */
48#include <vnet/fib/fib_entry.h> /* for FIB table and entry creation */
49#include <vnet/fib/fib_urpf_list.h> /* for FIB uRPF check */
Neale Ranns0bfe5d82016-08-25 15:29:12 +010050#include <vnet/fib/ip4_fib.h>
51#include <vnet/dpo/load_balance.h>
Neale Rannsf12a83f2017-04-18 09:09:40 -070052#include <vnet/dpo/load_balance_map.h>
Neale Ranns0bfe5d82016-08-25 15:29:12 +010053#include <vnet/dpo/classify_dpo.h>
Neale Ranns32e1c012016-11-22 17:07:28 +000054#include <vnet/mfib/mfib_table.h> /* for mFIB table and entry creation */
Ed Warnickecb9cada2015-12-08 15:45:58 -070055
Vijayabhaskar Katamreddyacbde662018-01-23 13:39:40 -080056#include <vnet/ip/ip4_forward.h>
Ed Warnickecb9cada2015-12-08 15:45:58 -070057
/** @brief IPv4 lookup node.
    @node ip4-lookup

    This is the main IPv4 lookup dispatch node.

    @param vm vlib_main_t corresponding to the current thread
    @param node vlib_node_runtime_t
    @param frame vlib_frame_t whose contents should be dispatched

    @par Graph mechanics: buffer metadata, next index usage

    @em Uses:
    - <code>vnet_buffer(b)->sw_if_index[VLIB_RX]</code>
        - Indicates the @c sw_if_index value of the interface that the
          packet was received on.
    - <code>vnet_buffer(b)->sw_if_index[VLIB_TX]</code>
        - When the value is @c ~0 then the node performs a longest prefix
          match (LPM) for the packet destination address in the FIB attached
          to the receive interface.
        - Otherwise perform LPM for the packet destination address in the
          indicated FIB. In this case <code>[VLIB_TX]</code> is a FIB index
          value (0, 1, ...) and not a VRF id.

    @em Sets:
    - <code>vnet_buffer(b)->ip.adj_index[VLIB_TX]</code>
        - The lookup result adjacency index.

    <em>Next Index:</em>
    - Dispatches the packet to the node index found in
      ip_adjacency_t @c adj->lookup_next_index
      (where @c adj is the lookup result adjacency).
*/
Ed Warnickecb9cada2015-12-08 15:45:58 -070090static uword
91ip4_lookup (vlib_main_t * vm,
Dave Barachd7cb1b52016-12-09 09:52:16 -050092 vlib_node_runtime_t * node, vlib_frame_t * frame)
Ed Warnickecb9cada2015-12-08 15:45:58 -070093{
Damjan Marionaca64c92016-04-13 09:48:56 +020094 return ip4_lookup_inline (vm, node, frame,
Dave Barachd7cb1b52016-12-09 09:52:16 -050095 /* lookup_for_responses_to_locally_received_packets */
96 0);
Ed Warnickecb9cada2015-12-08 15:45:58 -070097
98}
99
Dave Barachd7cb1b52016-12-09 09:52:16 -0500100static u8 *format_ip4_lookup_trace (u8 * s, va_list * args);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100101
Neale Rannsf8686322017-11-29 02:39:53 -0800102/* *INDENT-OFF* */
Dave Barachd7cb1b52016-12-09 09:52:16 -0500103VLIB_REGISTER_NODE (ip4_lookup_node) =
104{
Neale Rannsf8686322017-11-29 02:39:53 -0800105 .function = ip4_lookup,
106 .name = "ip4-lookup",
107 .vector_size = sizeof (u32),
108 .format_trace = format_ip4_lookup_trace,
109 .n_next_nodes = IP_LOOKUP_N_NEXT,
110 .next_nodes = IP4_LOOKUP_NEXT_NODES,
111};
112/* *INDENT-ON* */
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100113
Dave Barachd7cb1b52016-12-09 09:52:16 -0500114VLIB_NODE_FUNCTION_MULTIARCH (ip4_lookup_node, ip4_lookup);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100115
116always_inline uword
117ip4_load_balance (vlib_main_t * vm,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500118 vlib_node_runtime_t * node, vlib_frame_t * frame)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700119{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500120 vlib_combined_counter_main_t *cm = &load_balance_main.lbm_via_counters;
121 u32 n_left_from, n_left_to_next, *from, *to_next;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100122 ip_lookup_next_t next;
Damjan Marion586afd72017-04-05 19:18:20 +0200123 u32 thread_index = vlib_get_thread_index ();
Ed Warnickecb9cada2015-12-08 15:45:58 -0700124
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100125 from = vlib_frame_vector_args (frame);
126 n_left_from = frame->n_vectors;
127 next = node->cached_next_index;
128
129 if (node->flags & VLIB_NODE_FLAG_TRACE)
Dave Barachd7cb1b52016-12-09 09:52:16 -0500130 ip4_forward_next_trace (vm, node, frame, VLIB_TX);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100131
132 while (n_left_from > 0)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700133 {
Dave Barachd7cb1b52016-12-09 09:52:16 -0500134 vlib_get_next_frame (vm, node, next, to_next, n_left_to_next);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100135
Dave Barach75fc8542016-10-11 16:16:02 -0400136
Neale Ranns2be95c12016-11-19 13:50:04 +0000137 while (n_left_from >= 4 && n_left_to_next >= 2)
Dave Barachd7cb1b52016-12-09 09:52:16 -0500138 {
139 ip_lookup_next_t next0, next1;
Neale Ranns2be95c12016-11-19 13:50:04 +0000140 const load_balance_t *lb0, *lb1;
Dave Barachd7cb1b52016-12-09 09:52:16 -0500141 vlib_buffer_t *p0, *p1;
Neale Ranns2be95c12016-11-19 13:50:04 +0000142 u32 pi0, lbi0, hc0, pi1, lbi1, hc1;
143 const ip4_header_t *ip0, *ip1;
144 const dpo_id_t *dpo0, *dpo1;
145
Dave Barachd7cb1b52016-12-09 09:52:16 -0500146 /* Prefetch next iteration. */
147 {
148 vlib_buffer_t *p2, *p3;
Neale Ranns2be95c12016-11-19 13:50:04 +0000149
150 p2 = vlib_get_buffer (vm, from[2]);
151 p3 = vlib_get_buffer (vm, from[3]);
152
153 vlib_prefetch_buffer_header (p2, STORE);
154 vlib_prefetch_buffer_header (p3, STORE);
155
156 CLIB_PREFETCH (p2->data, sizeof (ip0[0]), STORE);
157 CLIB_PREFETCH (p3->data, sizeof (ip0[0]), STORE);
Dave Barachd7cb1b52016-12-09 09:52:16 -0500158 }
Neale Ranns2be95c12016-11-19 13:50:04 +0000159
160 pi0 = to_next[0] = from[0];
161 pi1 = to_next[1] = from[1];
162
163 from += 2;
164 n_left_from -= 2;
165 to_next += 2;
166 n_left_to_next -= 2;
167
168 p0 = vlib_get_buffer (vm, pi0);
169 p1 = vlib_get_buffer (vm, pi1);
170
171 ip0 = vlib_buffer_get_current (p0);
172 ip1 = vlib_buffer_get_current (p1);
173 lbi0 = vnet_buffer (p0)->ip.adj_index[VLIB_TX];
174 lbi1 = vnet_buffer (p1)->ip.adj_index[VLIB_TX];
175
Dave Barachd7cb1b52016-12-09 09:52:16 -0500176 lb0 = load_balance_get (lbi0);
177 lb1 = load_balance_get (lbi1);
Neale Ranns2be95c12016-11-19 13:50:04 +0000178
Dave Barachd7cb1b52016-12-09 09:52:16 -0500179 /*
180 * this node is for via FIBs we can re-use the hash value from the
181 * to node if present.
182 * We don't want to use the same hash value at each level in the recursion
183 * graph as that would lead to polarisation
184 */
AkshayaNadahalli153b8712017-03-06 18:22:29 +0000185 hc0 = hc1 = 0;
Neale Ranns2be95c12016-11-19 13:50:04 +0000186
Dave Barachd7cb1b52016-12-09 09:52:16 -0500187 if (PREDICT_FALSE (lb0->lb_n_buckets > 1))
188 {
189 if (PREDICT_TRUE (vnet_buffer (p0)->ip.flow_hash))
190 {
191 hc0 = vnet_buffer (p0)->ip.flow_hash =
192 vnet_buffer (p0)->ip.flow_hash >> 1;
193 }
194 else
195 {
196 hc0 = vnet_buffer (p0)->ip.flow_hash =
AkshayaNadahalli153b8712017-03-06 18:22:29 +0000197 ip4_compute_flow_hash (ip0, lb0->lb_hash_config);
Dave Barachd7cb1b52016-12-09 09:52:16 -0500198 }
Neale Rannsf12a83f2017-04-18 09:09:40 -0700199 dpo0 = load_balance_get_fwd_bucket
200 (lb0, (hc0 & (lb0->lb_n_buckets_minus_1)));
201 }
202 else
203 {
204 dpo0 = load_balance_get_bucket_i (lb0, 0);
Dave Barachd7cb1b52016-12-09 09:52:16 -0500205 }
206 if (PREDICT_FALSE (lb1->lb_n_buckets > 1))
207 {
208 if (PREDICT_TRUE (vnet_buffer (p1)->ip.flow_hash))
209 {
210 hc1 = vnet_buffer (p1)->ip.flow_hash =
211 vnet_buffer (p1)->ip.flow_hash >> 1;
212 }
213 else
214 {
215 hc1 = vnet_buffer (p1)->ip.flow_hash =
AkshayaNadahalli153b8712017-03-06 18:22:29 +0000216 ip4_compute_flow_hash (ip1, lb1->lb_hash_config);
Dave Barachd7cb1b52016-12-09 09:52:16 -0500217 }
Neale Rannsf12a83f2017-04-18 09:09:40 -0700218 dpo1 = load_balance_get_fwd_bucket
219 (lb1, (hc1 & (lb1->lb_n_buckets_minus_1)));
Dave Barachd7cb1b52016-12-09 09:52:16 -0500220 }
Neale Rannsf12a83f2017-04-18 09:09:40 -0700221 else
222 {
223 dpo1 = load_balance_get_bucket_i (lb1, 0);
224 }
Neale Ranns2be95c12016-11-19 13:50:04 +0000225
226 next0 = dpo0->dpoi_next_node;
227 next1 = dpo1->dpoi_next_node;
228
229 vnet_buffer (p0)->ip.adj_index[VLIB_TX] = dpo0->dpoi_index;
230 vnet_buffer (p1)->ip.adj_index[VLIB_TX] = dpo1->dpoi_index;
231
232 vlib_increment_combined_counter
Damjan Marion586afd72017-04-05 19:18:20 +0200233 (cm, thread_index, lbi0, 1, vlib_buffer_length_in_chain (vm, p0));
Neale Ranns2be95c12016-11-19 13:50:04 +0000234 vlib_increment_combined_counter
Damjan Marion586afd72017-04-05 19:18:20 +0200235 (cm, thread_index, lbi1, 1, vlib_buffer_length_in_chain (vm, p1));
Neale Ranns2be95c12016-11-19 13:50:04 +0000236
237 vlib_validate_buffer_enqueue_x2 (vm, node, next,
238 to_next, n_left_to_next,
239 pi0, pi1, next0, next1);
Dave Barachd7cb1b52016-12-09 09:52:16 -0500240 }
Neale Ranns2be95c12016-11-19 13:50:04 +0000241
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100242 while (n_left_from > 0 && n_left_to_next > 0)
243 {
244 ip_lookup_next_t next0;
245 const load_balance_t *lb0;
Dave Barachd7cb1b52016-12-09 09:52:16 -0500246 vlib_buffer_t *p0;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100247 u32 pi0, lbi0, hc0;
248 const ip4_header_t *ip0;
249 const dpo_id_t *dpo0;
250
251 pi0 = from[0];
252 to_next[0] = pi0;
Neale Ranns2be95c12016-11-19 13:50:04 +0000253 from += 1;
254 to_next += 1;
255 n_left_to_next -= 1;
256 n_left_from -= 1;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100257
258 p0 = vlib_get_buffer (vm, pi0);
259
260 ip0 = vlib_buffer_get_current (p0);
261 lbi0 = vnet_buffer (p0)->ip.adj_index[VLIB_TX];
262
Dave Barachd7cb1b52016-12-09 09:52:16 -0500263 lb0 = load_balance_get (lbi0);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100264
AkshayaNadahalli153b8712017-03-06 18:22:29 +0000265 hc0 = 0;
Dave Barachd7cb1b52016-12-09 09:52:16 -0500266 if (PREDICT_FALSE (lb0->lb_n_buckets > 1))
267 {
268 if (PREDICT_TRUE (vnet_buffer (p0)->ip.flow_hash))
269 {
270 hc0 = vnet_buffer (p0)->ip.flow_hash =
271 vnet_buffer (p0)->ip.flow_hash >> 1;
272 }
273 else
274 {
275 hc0 = vnet_buffer (p0)->ip.flow_hash =
AkshayaNadahalli153b8712017-03-06 18:22:29 +0000276 ip4_compute_flow_hash (ip0, lb0->lb_hash_config);
Dave Barachd7cb1b52016-12-09 09:52:16 -0500277 }
Neale Rannsf12a83f2017-04-18 09:09:40 -0700278 dpo0 = load_balance_get_fwd_bucket
279 (lb0, (hc0 & (lb0->lb_n_buckets_minus_1)));
Dave Barachd7cb1b52016-12-09 09:52:16 -0500280 }
Neale Rannsf12a83f2017-04-18 09:09:40 -0700281 else
282 {
283 dpo0 = load_balance_get_bucket_i (lb0, 0);
284 }
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100285
286 next0 = dpo0->dpoi_next_node;
287 vnet_buffer (p0)->ip.adj_index[VLIB_TX] = dpo0->dpoi_index;
288
Dave Barach75fc8542016-10-11 16:16:02 -0400289 vlib_increment_combined_counter
Damjan Marion586afd72017-04-05 19:18:20 +0200290 (cm, thread_index, lbi0, 1, vlib_buffer_length_in_chain (vm, p0));
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100291
Neale Ranns2be95c12016-11-19 13:50:04 +0000292 vlib_validate_buffer_enqueue_x1 (vm, node, next,
293 to_next, n_left_to_next,
294 pi0, next0);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100295 }
296
297 vlib_put_next_frame (vm, node, next, n_left_to_next);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700298 }
299
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100300 return frame->n_vectors;
301}
302
Neale Rannsf8686322017-11-29 02:39:53 -0800303/* *INDENT-OFF* */
Dave Barachd7cb1b52016-12-09 09:52:16 -0500304VLIB_REGISTER_NODE (ip4_load_balance_node) =
305{
Neale Rannsf8686322017-11-29 02:39:53 -0800306 .function = ip4_load_balance,
307 .name = "ip4-load-balance",
308 .vector_size = sizeof (u32),
309 .sibling_of = "ip4-lookup",
310 .format_trace =
311 format_ip4_lookup_trace,
312};
313/* *INDENT-ON* */
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100314
Dave Barachd7cb1b52016-12-09 09:52:16 -0500315VLIB_NODE_FUNCTION_MULTIARCH (ip4_load_balance_node, ip4_load_balance);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100316
317/* get first interface address */
318ip4_address_t *
319ip4_interface_first_address (ip4_main_t * im, u32 sw_if_index,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500320 ip_interface_address_t ** result_ia)
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100321{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500322 ip_lookup_main_t *lm = &im->lookup_main;
323 ip_interface_address_t *ia = 0;
324 ip4_address_t *result = 0;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100325
Neale Ranns32e1c012016-11-22 17:07:28 +0000326 /* *INDENT-OFF* */
327 foreach_ip_interface_address
328 (lm, ia, sw_if_index,
329 1 /* honor unnumbered */ ,
330 ({
331 ip4_address_t * a =
332 ip_interface_address_get_address (lm, ia);
333 result = a;
334 break;
335 }));
336 /* *INDENT-OFF* */
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100337 if (result_ia)
338 *result_ia = result ? ia : 0;
339 return result;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700340}
341
342static void
343ip4_add_interface_routes (u32 sw_if_index,
344 ip4_main_t * im, u32 fib_index,
345 ip_interface_address_t * a)
346{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500347 ip_lookup_main_t *lm = &im->lookup_main;
348 ip4_address_t *address = ip_interface_address_get_address (lm, a);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100349 fib_prefix_t pfx = {
Dave Barachd7cb1b52016-12-09 09:52:16 -0500350 .fp_len = a->address_length,
351 .fp_proto = FIB_PROTOCOL_IP4,
352 .fp_addr.ip4 = *address,
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100353 };
Ed Warnickecb9cada2015-12-08 15:45:58 -0700354
Neale Ranns9a69a602017-03-26 10:56:33 -0700355 if (pfx.fp_len <= 30)
Dave Barachd7cb1b52016-12-09 09:52:16 -0500356 {
Neale Ranns9a69a602017-03-26 10:56:33 -0700357 /* a /30 or shorter - add a glean for the network address */
Neale Ranns7a272742017-05-30 02:08:14 -0700358 fib_table_entry_update_one_path (fib_index, &pfx,
359 FIB_SOURCE_INTERFACE,
360 (FIB_ENTRY_FLAG_CONNECTED |
361 FIB_ENTRY_FLAG_ATTACHED),
Neale Rannsda78f952017-05-24 09:15:43 -0700362 DPO_PROTO_IP4,
Neale Ranns7a272742017-05-30 02:08:14 -0700363 /* No next-hop address */
364 NULL,
365 sw_if_index,
366 // invalid FIB index
367 ~0,
368 1,
369 // no out-label stack
370 NULL,
371 FIB_ROUTE_PATH_FLAG_NONE);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100372
Neale Ranns9a69a602017-03-26 10:56:33 -0700373 /* Add the two broadcast addresses as drop */
374 fib_prefix_t net_pfx = {
375 .fp_len = 32,
376 .fp_proto = FIB_PROTOCOL_IP4,
377 .fp_addr.ip4.as_u32 = address->as_u32 & im->fib_masks[pfx.fp_len],
378 };
379 if (net_pfx.fp_addr.ip4.as_u32 != pfx.fp_addr.ip4.as_u32)
380 fib_table_entry_special_add(fib_index,
381 &net_pfx,
382 FIB_SOURCE_INTERFACE,
383 (FIB_ENTRY_FLAG_DROP |
Neale Rannsa0558302017-04-13 00:44:52 -0700384 FIB_ENTRY_FLAG_LOOSE_URPF_EXEMPT));
Neale Ranns9a69a602017-03-26 10:56:33 -0700385 net_pfx.fp_addr.ip4.as_u32 |= ~im->fib_masks[pfx.fp_len];
386 if (net_pfx.fp_addr.ip4.as_u32 != pfx.fp_addr.ip4.as_u32)
387 fib_table_entry_special_add(fib_index,
388 &net_pfx,
389 FIB_SOURCE_INTERFACE,
390 (FIB_ENTRY_FLAG_DROP |
Neale Rannsa0558302017-04-13 00:44:52 -0700391 FIB_ENTRY_FLAG_LOOSE_URPF_EXEMPT));
Neale Ranns9a69a602017-03-26 10:56:33 -0700392 }
393 else if (pfx.fp_len == 31)
394 {
395 u32 mask = clib_host_to_net_u32(1);
396 fib_prefix_t net_pfx = pfx;
397
398 net_pfx.fp_len = 32;
399 net_pfx.fp_addr.ip4.as_u32 ^= mask;
400
401 /* a /31 - add the other end as an attached host */
402 fib_table_entry_update_one_path (fib_index, &net_pfx,
403 FIB_SOURCE_INTERFACE,
404 (FIB_ENTRY_FLAG_ATTACHED),
Neale Rannsda78f952017-05-24 09:15:43 -0700405 DPO_PROTO_IP4,
Neale Ranns9a69a602017-03-26 10:56:33 -0700406 &net_pfx.fp_addr,
407 sw_if_index,
408 // invalid FIB index
409 ~0,
410 1,
411 NULL,
412 FIB_ROUTE_PATH_FLAG_NONE);
413 }
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100414 pfx.fp_len = 32;
415
416 if (sw_if_index < vec_len (lm->classify_table_index_by_sw_if_index))
Dave Barachd7cb1b52016-12-09 09:52:16 -0500417 {
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100418 u32 classify_table_index =
Dave Barachd7cb1b52016-12-09 09:52:16 -0500419 lm->classify_table_index_by_sw_if_index[sw_if_index];
420 if (classify_table_index != (u32) ~ 0)
421 {
422 dpo_id_t dpo = DPO_INVALID;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100423
Dave Barachd7cb1b52016-12-09 09:52:16 -0500424 dpo_set (&dpo,
425 DPO_CLASSIFY,
426 DPO_PROTO_IP4,
427 classify_dpo_create (DPO_PROTO_IP4, classify_table_index));
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100428
Dave Barachd7cb1b52016-12-09 09:52:16 -0500429 fib_table_entry_special_dpo_add (fib_index,
430 &pfx,
431 FIB_SOURCE_CLASSIFY,
432 FIB_ENTRY_FLAG_NONE, &dpo);
433 dpo_reset (&dpo);
434 }
435 }
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100436
Neale Ranns32e1c012016-11-22 17:07:28 +0000437 fib_table_entry_update_one_path (fib_index, &pfx,
438 FIB_SOURCE_INTERFACE,
439 (FIB_ENTRY_FLAG_CONNECTED |
440 FIB_ENTRY_FLAG_LOCAL),
Neale Rannsda78f952017-05-24 09:15:43 -0700441 DPO_PROTO_IP4,
Neale Ranns32e1c012016-11-22 17:07:28 +0000442 &pfx.fp_addr,
443 sw_if_index,
444 // invalid FIB index
445 ~0,
446 1, NULL,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500447 FIB_ROUTE_PATH_FLAG_NONE);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700448}
449
450static void
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100451ip4_del_interface_routes (ip4_main_t * im,
452 u32 fib_index,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500453 ip4_address_t * address, u32 address_length)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700454{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500455 fib_prefix_t pfx = {
456 .fp_len = address_length,
457 .fp_proto = FIB_PROTOCOL_IP4,
458 .fp_addr.ip4 = *address,
459 };
Ed Warnickecb9cada2015-12-08 15:45:58 -0700460
Neale Ranns9a69a602017-03-26 10:56:33 -0700461 if (pfx.fp_len <= 30)
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100462 {
Neale Ranns9a69a602017-03-26 10:56:33 -0700463 fib_prefix_t net_pfx = {
464 .fp_len = 32,
465 .fp_proto = FIB_PROTOCOL_IP4,
466 .fp_addr.ip4.as_u32 = address->as_u32 & im->fib_masks[pfx.fp_len],
467 };
468 if (net_pfx.fp_addr.ip4.as_u32 != pfx.fp_addr.ip4.as_u32)
469 fib_table_entry_special_remove(fib_index,
470 &net_pfx,
471 FIB_SOURCE_INTERFACE);
472 net_pfx.fp_addr.ip4.as_u32 |= ~im->fib_masks[pfx.fp_len];
473 if (net_pfx.fp_addr.ip4.as_u32 != pfx.fp_addr.ip4.as_u32)
474 fib_table_entry_special_remove(fib_index,
475 &net_pfx,
476 FIB_SOURCE_INTERFACE);
Dave Barachd7cb1b52016-12-09 09:52:16 -0500477 fib_table_entry_delete (fib_index, &pfx, FIB_SOURCE_INTERFACE);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100478 }
Neale Ranns9a69a602017-03-26 10:56:33 -0700479 else if (pfx.fp_len == 31)
480 {
481 u32 mask = clib_host_to_net_u32(1);
482 fib_prefix_t net_pfx = pfx;
483
484 net_pfx.fp_len = 32;
485 net_pfx.fp_addr.ip4.as_u32 ^= mask;
486
487 fib_table_entry_delete (fib_index, &net_pfx, FIB_SOURCE_INTERFACE);
488 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700489
Dave Barachd7cb1b52016-12-09 09:52:16 -0500490 pfx.fp_len = 32;
491 fib_table_entry_delete (fib_index, &pfx, FIB_SOURCE_INTERFACE);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700492}
493
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100494void
Dave Barachd7cb1b52016-12-09 09:52:16 -0500495ip4_sw_interface_enable_disable (u32 sw_if_index, u32 is_enable)
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100496{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500497 ip4_main_t *im = &ip4_main;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700498
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100499 vec_validate_init_empty (im->ip_enabled_by_sw_if_index, sw_if_index, 0);
500
501 /*
502 * enable/disable only on the 1<->0 transition
503 */
504 if (is_enable)
505 {
506 if (1 != ++im->ip_enabled_by_sw_if_index[sw_if_index])
Dave Barachd7cb1b52016-12-09 09:52:16 -0500507 return;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100508 }
509 else
510 {
Dave Barachd7cb1b52016-12-09 09:52:16 -0500511 ASSERT (im->ip_enabled_by_sw_if_index[sw_if_index] > 0);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100512 if (0 != --im->ip_enabled_by_sw_if_index[sw_if_index])
Dave Barachd7cb1b52016-12-09 09:52:16 -0500513 return;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100514 }
Neale Ranns8269d3d2018-01-30 09:02:20 -0800515 vnet_feature_enable_disable ("ip4-unicast", "ip4-not-enabled", sw_if_index,
Damjan Marion4d489932016-12-09 03:21:27 -0800516 !is_enable, 0, 0);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100517
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100518
Neale Ranns8269d3d2018-01-30 09:02:20 -0800519 vnet_feature_enable_disable ("ip4-multicast", "ip4-not-enabled",
Neale Ranns180279b2017-03-16 15:49:09 -0400520 sw_if_index, !is_enable, 0, 0);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100521}
Ed Warnickecb9cada2015-12-08 15:45:58 -0700522
Ed Warnickecb9cada2015-12-08 15:45:58 -0700523static clib_error_t *
524ip4_add_del_interface_address_internal (vlib_main_t * vm,
525 u32 sw_if_index,
526 ip4_address_t * address,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500527 u32 address_length, u32 is_del)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700528{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500529 vnet_main_t *vnm = vnet_get_main ();
530 ip4_main_t *im = &ip4_main;
531 ip_lookup_main_t *lm = &im->lookup_main;
532 clib_error_t *error = 0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700533 u32 if_address_index, elts_before;
Dave Barachd7cb1b52016-12-09 09:52:16 -0500534 ip4_address_fib_t ip4_af, *addr_fib = 0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700535
Pavel Kotucek57808982017-08-02 08:20:19 +0200536 /* local0 interface doesn't support IP addressing */
537 if (sw_if_index == 0)
538 {
539 return
540 clib_error_create ("local0 interface doesn't support IP addressing");
541 }
542
Ed Warnickecb9cada2015-12-08 15:45:58 -0700543 vec_validate (im->fib_index_by_sw_if_index, sw_if_index);
544 ip4_addr_fib_init (&ip4_af, address,
545 vec_elt (im->fib_index_by_sw_if_index, sw_if_index));
546 vec_add1 (addr_fib, ip4_af);
547
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100548 /* FIXME-LATER
549 * there is no support for adj-fib handling in the presence of overlapping
550 * subnets on interfaces. Easy fix - disallow overlapping subnets, like
551 * most routers do.
552 */
Neale Ranns32e1c012016-11-22 17:07:28 +0000553 /* *INDENT-OFF* */
Dave Barachd7cb1b52016-12-09 09:52:16 -0500554 if (!is_del)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700555 {
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100556 /* When adding an address check that it does not conflict
Dave Barachd7cb1b52016-12-09 09:52:16 -0500557 with an existing address. */
558 ip_interface_address_t *ia;
Neale Ranns32e1c012016-11-22 17:07:28 +0000559 foreach_ip_interface_address
560 (&im->lookup_main, ia, sw_if_index,
561 0 /* honor unnumbered */ ,
562 ({
563 ip4_address_t * x =
564 ip_interface_address_get_address
565 (&im->lookup_main, ia);
566 if (ip4_destination_matches_route
567 (im, address, x, ia->address_length) ||
568 ip4_destination_matches_route (im,
569 x,
570 address,
571 address_length))
572 return
573 clib_error_create
574 ("failed to add %U which conflicts with %U for interface %U",
575 format_ip4_address_and_length, address,
576 address_length,
577 format_ip4_address_and_length, x,
578 ia->address_length,
579 format_vnet_sw_if_index_name, vnm,
580 sw_if_index);
581 }));
Ed Warnickecb9cada2015-12-08 15:45:58 -0700582 }
Neale Ranns32e1c012016-11-22 17:07:28 +0000583 /* *INDENT-ON* */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700584
Ed Warnickecb9cada2015-12-08 15:45:58 -0700585 elts_before = pool_elts (lm->if_address_pool);
586
587 error = ip_interface_address_add_del
Dave Barachd7cb1b52016-12-09 09:52:16 -0500588 (lm, sw_if_index, addr_fib, address_length, is_del, &if_address_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700589 if (error)
590 goto done;
Dave Barach75fc8542016-10-11 16:16:02 -0400591
Dave Barachd7cb1b52016-12-09 09:52:16 -0500592 ip4_sw_interface_enable_disable (sw_if_index, !is_del);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100593
594 if (is_del)
Dave Barachd7cb1b52016-12-09 09:52:16 -0500595 ip4_del_interface_routes (im, ip4_af.fib_index, address, address_length);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100596 else
Dave Barachd7cb1b52016-12-09 09:52:16 -0500597 ip4_add_interface_routes (sw_if_index,
598 im, ip4_af.fib_index,
599 pool_elt_at_index
600 (lm->if_address_pool, if_address_index));
Ed Warnickecb9cada2015-12-08 15:45:58 -0700601
602 /* If pool did not grow/shrink: add duplicate address. */
603 if (elts_before != pool_elts (lm->if_address_pool))
604 {
Dave Barachd7cb1b52016-12-09 09:52:16 -0500605 ip4_add_del_interface_address_callback_t *cb;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700606 vec_foreach (cb, im->add_del_interface_address_callbacks)
607 cb->function (im, cb->function_opaque, sw_if_index,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500608 address, address_length, if_address_index, is_del);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700609 }
610
Dave Barachd7cb1b52016-12-09 09:52:16 -0500611done:
Ed Warnickecb9cada2015-12-08 15:45:58 -0700612 vec_free (addr_fib);
613 return error;
614}
615
616clib_error_t *
Neale Ranns32e1c012016-11-22 17:07:28 +0000617ip4_add_del_interface_address (vlib_main_t * vm,
618 u32 sw_if_index,
619 ip4_address_t * address,
620 u32 address_length, u32 is_del)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700621{
622 return ip4_add_del_interface_address_internal
Dave Barachd7cb1b52016-12-09 09:52:16 -0500623 (vm, sw_if_index, address, address_length, is_del);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700624}
625
Dave Barachd6534602016-06-14 18:38:02 -0400626/* Built-in ip4 unicast rx feature path definition */
Dave Barachd7cb1b52016-12-09 09:52:16 -0500627/* *INDENT-OFF* */
Damjan Marion8b3191e2016-11-09 19:54:20 +0100628VNET_FEATURE_ARC_INIT (ip4_unicast, static) =
629{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500630 .arc_name = "ip4-unicast",
Damjan Marion892e0762016-12-09 18:52:05 +0100631 .start_nodes = VNET_FEATURES ("ip4-input", "ip4-input-no-checksum"),
632 .arc_index_ptr = &ip4_main.lookup_main.ucast_feature_arc_index,
633};
Damjan Marion8b3191e2016-11-09 19:54:20 +0100634
Dave Barachd7cb1b52016-12-09 09:52:16 -0500635VNET_FEATURE_INIT (ip4_flow_classify, static) =
636{
Damjan Marion8b3191e2016-11-09 19:54:20 +0100637 .arc_name = "ip4-unicast",
Juraj Sloboda506b2452016-08-07 23:45:24 -0700638 .node_name = "ip4-flow-classify",
Damjan Marion8b3191e2016-11-09 19:54:20 +0100639 .runs_before = VNET_FEATURES ("ip4-inacl"),
Juraj Sloboda506b2452016-08-07 23:45:24 -0700640};
641
Dave Barachd7cb1b52016-12-09 09:52:16 -0500642VNET_FEATURE_INIT (ip4_inacl, static) =
643{
Damjan Marion8b3191e2016-11-09 19:54:20 +0100644 .arc_name = "ip4-unicast",
Dave Barach75fc8542016-10-11 16:16:02 -0400645 .node_name = "ip4-inacl",
Damjan Marion8b3191e2016-11-09 19:54:20 +0100646 .runs_before = VNET_FEATURES ("ip4-source-check-via-rx"),
Dave Barachd6534602016-06-14 18:38:02 -0400647};
648
Dave Barachd7cb1b52016-12-09 09:52:16 -0500649VNET_FEATURE_INIT (ip4_source_check_1, static) =
650{
Damjan Marion8b3191e2016-11-09 19:54:20 +0100651 .arc_name = "ip4-unicast",
Dave Barachd6534602016-06-14 18:38:02 -0400652 .node_name = "ip4-source-check-via-rx",
Damjan Marion8b3191e2016-11-09 19:54:20 +0100653 .runs_before = VNET_FEATURES ("ip4-source-check-via-any"),
Dave Barachd6534602016-06-14 18:38:02 -0400654};
655
Dave Barachd7cb1b52016-12-09 09:52:16 -0500656VNET_FEATURE_INIT (ip4_source_check_2, static) =
657{
Damjan Marion8b3191e2016-11-09 19:54:20 +0100658 .arc_name = "ip4-unicast",
Dave Barachd6534602016-06-14 18:38:02 -0400659 .node_name = "ip4-source-check-via-any",
Damjan Marion8b3191e2016-11-09 19:54:20 +0100660 .runs_before = VNET_FEATURES ("ip4-policer-classify"),
Dave Barachd6534602016-06-14 18:38:02 -0400661};
662
Dave Barachd7cb1b52016-12-09 09:52:16 -0500663VNET_FEATURE_INIT (ip4_source_and_port_range_check_rx, static) =
664{
Damjan Marion8b3191e2016-11-09 19:54:20 +0100665 .arc_name = "ip4-unicast",
Dave Barach5331c722016-08-17 11:54:30 -0400666 .node_name = "ip4-source-and-port-range-check-rx",
Damjan Marion8b3191e2016-11-09 19:54:20 +0100667 .runs_before = VNET_FEATURES ("ip4-policer-classify"),
Dave Barach6f9bca22016-04-30 10:25:32 -0400668};
669
Dave Barachd7cb1b52016-12-09 09:52:16 -0500670VNET_FEATURE_INIT (ip4_policer_classify, static) =
671{
Damjan Marion8b3191e2016-11-09 19:54:20 +0100672 .arc_name = "ip4-unicast",
Matus Fabian70e6a8d2016-06-20 08:10:42 -0700673 .node_name = "ip4-policer-classify",
Damjan Marion8b3191e2016-11-09 19:54:20 +0100674 .runs_before = VNET_FEATURES ("ipsec-input-ip4"),
Matus Fabian70e6a8d2016-06-20 08:10:42 -0700675};
676
Dave Barachd7cb1b52016-12-09 09:52:16 -0500677VNET_FEATURE_INIT (ip4_ipsec, static) =
678{
Damjan Marion8b3191e2016-11-09 19:54:20 +0100679 .arc_name = "ip4-unicast",
Dave Barachd6534602016-06-14 18:38:02 -0400680 .node_name = "ipsec-input-ip4",
Damjan Marion8b3191e2016-11-09 19:54:20 +0100681 .runs_before = VNET_FEATURES ("vpath-input-ip4"),
Dave Barachd6534602016-06-14 18:38:02 -0400682};
683
Dave Barachd7cb1b52016-12-09 09:52:16 -0500684VNET_FEATURE_INIT (ip4_vpath, static) =
685{
Damjan Marion8b3191e2016-11-09 19:54:20 +0100686 .arc_name = "ip4-unicast",
Dave Barachd6534602016-06-14 18:38:02 -0400687 .node_name = "vpath-input-ip4",
John Lo37682e12016-11-30 12:51:39 -0500688 .runs_before = VNET_FEATURES ("ip4-vxlan-bypass"),
689};
690
Dave Barachd7cb1b52016-12-09 09:52:16 -0500691VNET_FEATURE_INIT (ip4_vxlan_bypass, static) =
692{
John Lo37682e12016-11-30 12:51:39 -0500693 .arc_name = "ip4-unicast",
694 .node_name = "ip4-vxlan-bypass",
Damjan Marion8b3191e2016-11-09 19:54:20 +0100695 .runs_before = VNET_FEATURES ("ip4-lookup"),
Dave Barachd6534602016-06-14 18:38:02 -0400696};
697
Neale Ranns8269d3d2018-01-30 09:02:20 -0800698VNET_FEATURE_INIT (ip4_not_enabled, static) =
Dave Barachd7cb1b52016-12-09 09:52:16 -0500699{
Damjan Marion8b3191e2016-11-09 19:54:20 +0100700 .arc_name = "ip4-unicast",
Neale Ranns8269d3d2018-01-30 09:02:20 -0800701 .node_name = "ip4-not-enabled",
Neale Ranns180279b2017-03-16 15:49:09 -0400702 .runs_before = VNET_FEATURES ("ip4-lookup"),
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100703};
704
Neale Ranns180279b2017-03-16 15:49:09 -0400705VNET_FEATURE_INIT (ip4_lookup, static) =
706{
707 .arc_name = "ip4-unicast",
708 .node_name = "ip4-lookup",
709 .runs_before = 0, /* not before any other features */
710};
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100711
Dave Barachd6534602016-06-14 18:38:02 -0400712/* Built-in ip4 multicast rx feature path definition */
Damjan Marion8b3191e2016-11-09 19:54:20 +0100713VNET_FEATURE_ARC_INIT (ip4_multicast, static) =
714{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500715 .arc_name = "ip4-multicast",
Damjan Marion8b3191e2016-11-09 19:54:20 +0100716 .start_nodes = VNET_FEATURES ("ip4-input", "ip4-input-no-checksum"),
717 .arc_index_ptr = &ip4_main.lookup_main.mcast_feature_arc_index,
718};
719
Dave Barachd7cb1b52016-12-09 09:52:16 -0500720VNET_FEATURE_INIT (ip4_vpath_mc, static) =
721{
Damjan Marion8b3191e2016-11-09 19:54:20 +0100722 .arc_name = "ip4-multicast",
Dave Barachd6534602016-06-14 18:38:02 -0400723 .node_name = "vpath-input-ip4",
Neale Ranns32e1c012016-11-22 17:07:28 +0000724 .runs_before = VNET_FEATURES ("ip4-mfib-forward-lookup"),
Dave Barachd6534602016-06-14 18:38:02 -0400725};
726
Neale Ranns8269d3d2018-01-30 09:02:20 -0800727VNET_FEATURE_INIT (ip4_mc_not_enabled, static) =
Dave Barachd7cb1b52016-12-09 09:52:16 -0500728{
Damjan Marion8b3191e2016-11-09 19:54:20 +0100729 .arc_name = "ip4-multicast",
Neale Ranns8269d3d2018-01-30 09:02:20 -0800730 .node_name = "ip4-not-enabled",
Neale Ranns180279b2017-03-16 15:49:09 -0400731 .runs_before = VNET_FEATURES ("ip4-mfib-forward-lookup"),
732};
733
734VNET_FEATURE_INIT (ip4_lookup_mc, static) =
735{
736 .arc_name = "ip4-multicast",
737 .node_name = "ip4-mfib-forward-lookup",
Dave Barachd7cb1b52016-12-09 09:52:16 -0500738 .runs_before = 0, /* last feature */
Neale Ranns5e575b12016-10-03 09:40:25 +0100739};
Dave Barach5331c722016-08-17 11:54:30 -0400740
741/* Source and port-range check ip4 tx feature path definition */
Damjan Marion8b3191e2016-11-09 19:54:20 +0100742VNET_FEATURE_ARC_INIT (ip4_output, static) =
743{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500744 .arc_name = "ip4-output",
Neale Rannsf068c3e2018-01-03 04:18:48 -0800745 .start_nodes = VNET_FEATURES ("ip4-rewrite", "ip4-midchain", "ip4-dvr-dpo"),
Damjan Marion8b3191e2016-11-09 19:54:20 +0100746 .arc_index_ptr = &ip4_main.lookup_main.output_feature_arc_index,
747};
Dave Barach5331c722016-08-17 11:54:30 -0400748
Dave Barachd7cb1b52016-12-09 09:52:16 -0500749VNET_FEATURE_INIT (ip4_source_and_port_range_check_tx, static) =
750{
Damjan Marion8b3191e2016-11-09 19:54:20 +0100751 .arc_name = "ip4-output",
752 .node_name = "ip4-source-and-port-range-check-tx",
Andrew Yourtchenko815d7d52018-02-07 11:37:02 +0100753 .runs_before = VNET_FEATURES ("ip4-outacl"),
754};
755
756VNET_FEATURE_INIT (ip4_outacl, static) =
757{
758 .arc_name = "ip4-output",
759 .node_name = "ip4-outacl",
Matus Fabian08a6f012016-11-15 06:08:51 -0800760 .runs_before = VNET_FEATURES ("ipsec-output-ip4"),
761};
762
Dave Barachd7cb1b52016-12-09 09:52:16 -0500763VNET_FEATURE_INIT (ip4_ipsec_output, static) =
764{
Matus Fabian08a6f012016-11-15 06:08:51 -0800765 .arc_name = "ip4-output",
766 .node_name = "ipsec-output-ip4",
Damjan Marion8b3191e2016-11-09 19:54:20 +0100767 .runs_before = VNET_FEATURES ("interface-output"),
Dave Barach5331c722016-08-17 11:54:30 -0400768};
769
770/* Built-in ip4 tx feature path definition */
Dave Barachd7cb1b52016-12-09 09:52:16 -0500771VNET_FEATURE_INIT (ip4_interface_output, static) =
772{
Damjan Marion8b3191e2016-11-09 19:54:20 +0100773 .arc_name = "ip4-output",
Dave Barach5331c722016-08-17 11:54:30 -0400774 .node_name = "interface-output",
Dave Barachd7cb1b52016-12-09 09:52:16 -0500775 .runs_before = 0, /* not before any other features */
Dave Barach5331c722016-08-17 11:54:30 -0400776};
Dave Barachd7cb1b52016-12-09 09:52:16 -0500777/* *INDENT-ON* */
Dave Barachd6534602016-06-14 18:38:02 -0400778
Ed Warnickecb9cada2015-12-08 15:45:58 -0700779static clib_error_t *
Dave Barachd7cb1b52016-12-09 09:52:16 -0500780ip4_sw_interface_add_del (vnet_main_t * vnm, u32 sw_if_index, u32 is_add)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700781{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500782 ip4_main_t *im = &ip4_main;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700783
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100784 /* Fill in lookup tables with default table (0). */
785 vec_validate (im->fib_index_by_sw_if_index, sw_if_index);
Neale Ranns32e1c012016-11-22 17:07:28 +0000786 vec_validate (im->mfib_index_by_sw_if_index, sw_if_index);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100787
Pavel Kotucek9f5a2b62017-06-14 13:56:55 +0200788 if (!is_add)
789 {
790 ip4_main_t *im4 = &ip4_main;
791 ip_lookup_main_t *lm4 = &im4->lookup_main;
792 ip_interface_address_t *ia = 0;
793 ip4_address_t *address;
794 vlib_main_t *vm = vlib_get_main ();
795
796 /* *INDENT-OFF* */
797 foreach_ip_interface_address (lm4, ia, sw_if_index, 1 /* honor unnumbered */,
798 ({
799 address = ip_interface_address_get_address (lm4, ia);
800 ip4_add_del_interface_address(vm, sw_if_index, address, ia->address_length, 1);
801 }));
802 /* *INDENT-ON* */
803 }
804
Neale Ranns8269d3d2018-01-30 09:02:20 -0800805 vnet_feature_enable_disable ("ip4-unicast", "ip4-not-enabled", sw_if_index,
Damjan Marion8b3191e2016-11-09 19:54:20 +0100806 is_add, 0, 0);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700807
Neale Ranns8269d3d2018-01-30 09:02:20 -0800808 vnet_feature_enable_disable ("ip4-multicast", "ip4-not-enabled",
809 sw_if_index, is_add, 0, 0);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700810
Ed Warnickecb9cada2015-12-08 15:45:58 -0700811 return /* no error */ 0;
812}
813
814VNET_SW_INTERFACE_ADD_DEL_FUNCTION (ip4_sw_interface_add_del);
815
Ed Warnickecb9cada2015-12-08 15:45:58 -0700816/* Global IP4 main. */
817ip4_main_t ip4_main;
818
819clib_error_t *
820ip4_lookup_init (vlib_main_t * vm)
821{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500822 ip4_main_t *im = &ip4_main;
823 clib_error_t *error;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700824 uword i;
825
Damjan Marion8b3191e2016-11-09 19:54:20 +0100826 if ((error = vlib_call_init_function (vm, vnet_feature_init)))
827 return error;
Neale Ranns1ec36522017-11-29 05:20:37 -0800828 if ((error = vlib_call_init_function (vm, ip4_mtrie_module_init)))
829 return (error);
830 if ((error = vlib_call_init_function (vm, fib_module_init)))
831 return error;
832 if ((error = vlib_call_init_function (vm, mfib_module_init)))
833 return error;
Damjan Marion8b3191e2016-11-09 19:54:20 +0100834
Ed Warnickecb9cada2015-12-08 15:45:58 -0700835 for (i = 0; i < ARRAY_LEN (im->fib_masks); i++)
836 {
837 u32 m;
838
839 if (i < 32)
840 m = pow2_mask (i) << (32 - i);
Dave Barach75fc8542016-10-11 16:16:02 -0400841 else
Ed Warnickecb9cada2015-12-08 15:45:58 -0700842 m = ~0;
843 im->fib_masks[i] = clib_host_to_net_u32 (m);
844 }
845
Ed Warnickecb9cada2015-12-08 15:45:58 -0700846 ip_lookup_init (&im->lookup_main, /* is_ip6 */ 0);
847
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100848 /* Create FIB with index 0 and table id of 0. */
Neale Ranns15002542017-09-10 04:39:11 -0700849 fib_table_find_or_create_and_lock (FIB_PROTOCOL_IP4, 0,
850 FIB_SOURCE_DEFAULT_ROUTE);
851 mfib_table_find_or_create_and_lock (FIB_PROTOCOL_IP4, 0,
852 MFIB_SOURCE_DEFAULT_ROUTE);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100853
Ed Warnickecb9cada2015-12-08 15:45:58 -0700854 {
Dave Barachd7cb1b52016-12-09 09:52:16 -0500855 pg_node_t *pn;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700856 pn = pg_get_node (ip4_lookup_node.index);
857 pn->unformat_edit = unformat_pg_ip4_header;
858 }
859
860 {
861 ethernet_arp_header_t h;
862
863 memset (&h, 0, sizeof (h));
864
865 /* Set target ethernet address to all zeros. */
Dave Barachd7cb1b52016-12-09 09:52:16 -0500866 memset (h.ip4_over_ethernet[1].ethernet, 0,
867 sizeof (h.ip4_over_ethernet[1].ethernet));
Ed Warnickecb9cada2015-12-08 15:45:58 -0700868
869#define _16(f,v) h.f = clib_host_to_net_u16 (v);
870#define _8(f,v) h.f = v;
871 _16 (l2_type, ETHERNET_ARP_HARDWARE_TYPE_ethernet);
872 _16 (l3_type, ETHERNET_TYPE_IP4);
873 _8 (n_l2_address_bytes, 6);
874 _8 (n_l3_address_bytes, 4);
875 _16 (opcode, ETHERNET_ARP_OPCODE_request);
876#undef _16
877#undef _8
878
Dave Barachd7cb1b52016-12-09 09:52:16 -0500879 vlib_packet_template_init (vm, &im->ip4_arp_request_packet_template,
Ed Warnickecb9cada2015-12-08 15:45:58 -0700880 /* data */ &h,
881 sizeof (h),
882 /* alloc chunk size */ 8,
883 "ip4 arp");
884 }
885
Dave Barach203c6322016-06-26 10:29:03 -0400886 return error;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700887}
888
889VLIB_INIT_FUNCTION (ip4_lookup_init);
890
Dave Barachd7cb1b52016-12-09 09:52:16 -0500891typedef struct
892{
Ed Warnickecb9cada2015-12-08 15:45:58 -0700893 /* Adjacency taken. */
Vengada Govindanf1544482016-09-28 02:45:57 -0700894 u32 dpo_index;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700895 u32 flow_hash;
896 u32 fib_index;
897
898 /* Packet data, possibly *after* rewrite. */
Dave Barachd7cb1b52016-12-09 09:52:16 -0500899 u8 packet_data[64 - 1 * sizeof (u32)];
900}
901ip4_forward_next_trace_t;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700902
Dave Barachd7cb1b52016-12-09 09:52:16 -0500903u8 *
904format_ip4_forward_next_trace (u8 * s, va_list * args)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700905{
906 CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *);
907 CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *);
Dave Barachd7cb1b52016-12-09 09:52:16 -0500908 ip4_forward_next_trace_t *t = va_arg (*args, ip4_forward_next_trace_t *);
Christophe Fontained3c008d2017-10-02 18:10:54 +0200909 u32 indent = format_get_indent (s);
Pierre Pfistera38c3df2016-06-13 10:28:09 +0100910 s = format (s, "%U%U",
John Loac8146c2016-09-27 17:44:02 -0400911 format_white_space, indent,
912 format_ip4_header, t->packet_data, sizeof (t->packet_data));
Pierre Pfistera38c3df2016-06-13 10:28:09 +0100913 return s;
914}
915
Dave Barachd7cb1b52016-12-09 09:52:16 -0500916static u8 *
917format_ip4_lookup_trace (u8 * s, va_list * args)
Pierre Pfistera38c3df2016-06-13 10:28:09 +0100918{
919 CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *);
920 CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *);
Dave Barachd7cb1b52016-12-09 09:52:16 -0500921 ip4_forward_next_trace_t *t = va_arg (*args, ip4_forward_next_trace_t *);
Christophe Fontained3c008d2017-10-02 18:10:54 +0200922 u32 indent = format_get_indent (s);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700923
John Loac8146c2016-09-27 17:44:02 -0400924 s = format (s, "fib %d dpo-idx %d flow hash: 0x%08x",
Dave Barachd7cb1b52016-12-09 09:52:16 -0500925 t->fib_index, t->dpo_index, t->flow_hash);
Pierre Pfistera38c3df2016-06-13 10:28:09 +0100926 s = format (s, "\n%U%U",
Dave Barachd7cb1b52016-12-09 09:52:16 -0500927 format_white_space, indent,
928 format_ip4_header, t->packet_data, sizeof (t->packet_data));
Pierre Pfistera38c3df2016-06-13 10:28:09 +0100929 return s;
930}
Ed Warnickecb9cada2015-12-08 15:45:58 -0700931
Dave Barachd7cb1b52016-12-09 09:52:16 -0500932static u8 *
933format_ip4_rewrite_trace (u8 * s, va_list * args)
Pierre Pfistera38c3df2016-06-13 10:28:09 +0100934{
935 CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *);
936 CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *);
Dave Barachd7cb1b52016-12-09 09:52:16 -0500937 ip4_forward_next_trace_t *t = va_arg (*args, ip4_forward_next_trace_t *);
Christophe Fontained3c008d2017-10-02 18:10:54 +0200938 u32 indent = format_get_indent (s);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700939
Vengada Govindanf1544482016-09-28 02:45:57 -0700940 s = format (s, "tx_sw_if_index %d dpo-idx %d : %U flow hash: 0x%08x",
Dave Barachd7cb1b52016-12-09 09:52:16 -0500941 t->fib_index, t->dpo_index, format_ip_adjacency,
942 t->dpo_index, FORMAT_IP_ADJACENCY_NONE, t->flow_hash);
Pierre Pfistera38c3df2016-06-13 10:28:09 +0100943 s = format (s, "\n%U%U",
Dave Barachd7cb1b52016-12-09 09:52:16 -0500944 format_white_space, indent,
945 format_ip_adjacency_packet_data,
Neale Rannsb069a692017-03-15 12:34:25 -0400946 t->dpo_index, t->packet_data, sizeof (t->packet_data));
Ed Warnickecb9cada2015-12-08 15:45:58 -0700947 return s;
948}
949
950/* Common trace function for all ip4-forward next nodes. */
951void
952ip4_forward_next_trace (vlib_main_t * vm,
953 vlib_node_runtime_t * node,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500954 vlib_frame_t * frame, vlib_rx_or_tx_t which_adj_index)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700955{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500956 u32 *from, n_left;
957 ip4_main_t *im = &ip4_main;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700958
959 n_left = frame->n_vectors;
960 from = vlib_frame_vector_args (frame);
Dave Barach75fc8542016-10-11 16:16:02 -0400961
Ed Warnickecb9cada2015-12-08 15:45:58 -0700962 while (n_left >= 4)
963 {
964 u32 bi0, bi1;
Dave Barachd7cb1b52016-12-09 09:52:16 -0500965 vlib_buffer_t *b0, *b1;
966 ip4_forward_next_trace_t *t0, *t1;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700967
968 /* Prefetch next iteration. */
969 vlib_prefetch_buffer_with_index (vm, from[2], LOAD);
970 vlib_prefetch_buffer_with_index (vm, from[3], LOAD);
971
972 bi0 = from[0];
973 bi1 = from[1];
974
975 b0 = vlib_get_buffer (vm, bi0);
976 b1 = vlib_get_buffer (vm, bi1);
977
978 if (b0->flags & VLIB_BUFFER_IS_TRACED)
979 {
980 t0 = vlib_add_trace (vm, node, b0, sizeof (t0[0]));
Vengada Govindanf1544482016-09-28 02:45:57 -0700981 t0->dpo_index = vnet_buffer (b0)->ip.adj_index[which_adj_index];
Ed Warnickecb9cada2015-12-08 15:45:58 -0700982 t0->flow_hash = vnet_buffer (b0)->ip.flow_hash;
Dave Barachd7cb1b52016-12-09 09:52:16 -0500983 t0->fib_index =
984 (vnet_buffer (b0)->sw_if_index[VLIB_TX] !=
985 (u32) ~ 0) ? vnet_buffer (b0)->sw_if_index[VLIB_TX] :
986 vec_elt (im->fib_index_by_sw_if_index,
987 vnet_buffer (b0)->sw_if_index[VLIB_RX]);
Pierre Pfister0febaf12016-06-08 12:23:21 +0100988
Damjan Marionf1213b82016-03-13 02:22:06 +0100989 clib_memcpy (t0->packet_data,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500990 vlib_buffer_get_current (b0),
991 sizeof (t0->packet_data));
Ed Warnickecb9cada2015-12-08 15:45:58 -0700992 }
993 if (b1->flags & VLIB_BUFFER_IS_TRACED)
994 {
995 t1 = vlib_add_trace (vm, node, b1, sizeof (t1[0]));
Vengada Govindanf1544482016-09-28 02:45:57 -0700996 t1->dpo_index = vnet_buffer (b1)->ip.adj_index[which_adj_index];
Ed Warnickecb9cada2015-12-08 15:45:58 -0700997 t1->flow_hash = vnet_buffer (b1)->ip.flow_hash;
Dave Barachd7cb1b52016-12-09 09:52:16 -0500998 t1->fib_index =
999 (vnet_buffer (b1)->sw_if_index[VLIB_TX] !=
1000 (u32) ~ 0) ? vnet_buffer (b1)->sw_if_index[VLIB_TX] :
1001 vec_elt (im->fib_index_by_sw_if_index,
1002 vnet_buffer (b1)->sw_if_index[VLIB_RX]);
1003 clib_memcpy (t1->packet_data, vlib_buffer_get_current (b1),
1004 sizeof (t1->packet_data));
Ed Warnickecb9cada2015-12-08 15:45:58 -07001005 }
1006 from += 2;
1007 n_left -= 2;
1008 }
1009
1010 while (n_left >= 1)
1011 {
1012 u32 bi0;
Dave Barachd7cb1b52016-12-09 09:52:16 -05001013 vlib_buffer_t *b0;
1014 ip4_forward_next_trace_t *t0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001015
1016 bi0 = from[0];
1017
1018 b0 = vlib_get_buffer (vm, bi0);
1019
1020 if (b0->flags & VLIB_BUFFER_IS_TRACED)
1021 {
1022 t0 = vlib_add_trace (vm, node, b0, sizeof (t0[0]));
Vengada Govindanf1544482016-09-28 02:45:57 -07001023 t0->dpo_index = vnet_buffer (b0)->ip.adj_index[which_adj_index];
Ed Warnickecb9cada2015-12-08 15:45:58 -07001024 t0->flow_hash = vnet_buffer (b0)->ip.flow_hash;
Dave Barachd7cb1b52016-12-09 09:52:16 -05001025 t0->fib_index =
1026 (vnet_buffer (b0)->sw_if_index[VLIB_TX] !=
1027 (u32) ~ 0) ? vnet_buffer (b0)->sw_if_index[VLIB_TX] :
1028 vec_elt (im->fib_index_by_sw_if_index,
1029 vnet_buffer (b0)->sw_if_index[VLIB_RX]);
1030 clib_memcpy (t0->packet_data, vlib_buffer_get_current (b0),
1031 sizeof (t0->packet_data));
Ed Warnickecb9cada2015-12-08 15:45:58 -07001032 }
1033 from += 1;
1034 n_left -= 1;
1035 }
1036}
1037
Ed Warnickecb9cada2015-12-08 15:45:58 -07001038/* Compute TCP/UDP/ICMP4 checksum in software. */
1039u16
1040ip4_tcp_udp_compute_checksum (vlib_main_t * vm, vlib_buffer_t * p0,
1041 ip4_header_t * ip0)
1042{
1043 ip_csum_t sum0;
1044 u32 ip_header_length, payload_length_host_byte_order;
Florin Corasb2215d62017-08-01 16:56:58 -07001045 u32 n_this_buffer, n_bytes_left, n_ip_bytes_this_buffer;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001046 u16 sum16;
Dave Barachd7cb1b52016-12-09 09:52:16 -05001047 void *data_this_buffer;
Dave Barach75fc8542016-10-11 16:16:02 -04001048
Ed Warnickecb9cada2015-12-08 15:45:58 -07001049 /* Initialize checksum with ip header. */
1050 ip_header_length = ip4_header_bytes (ip0);
Dave Barachd7cb1b52016-12-09 09:52:16 -05001051 payload_length_host_byte_order =
1052 clib_net_to_host_u16 (ip0->length) - ip_header_length;
1053 sum0 =
1054 clib_host_to_net_u32 (payload_length_host_byte_order +
1055 (ip0->protocol << 16));
Ed Warnickecb9cada2015-12-08 15:45:58 -07001056
1057 if (BITS (uword) == 32)
1058 {
Dave Barachd7cb1b52016-12-09 09:52:16 -05001059 sum0 =
1060 ip_csum_with_carry (sum0,
1061 clib_mem_unaligned (&ip0->src_address, u32));
1062 sum0 =
1063 ip_csum_with_carry (sum0,
1064 clib_mem_unaligned (&ip0->dst_address, u32));
Ed Warnickecb9cada2015-12-08 15:45:58 -07001065 }
1066 else
Dave Barachd7cb1b52016-12-09 09:52:16 -05001067 sum0 =
1068 ip_csum_with_carry (sum0, clib_mem_unaligned (&ip0->src_address, u64));
Ed Warnickecb9cada2015-12-08 15:45:58 -07001069
1070 n_bytes_left = n_this_buffer = payload_length_host_byte_order;
1071 data_this_buffer = (void *) ip0 + ip_header_length;
Neale Rannsd91c1db2017-07-31 02:30:50 -07001072 n_ip_bytes_this_buffer =
1073 p0->current_length - (((u8 *) ip0 - p0->data) - p0->current_data);
Florin Corasb2215d62017-08-01 16:56:58 -07001074 if (n_this_buffer + ip_header_length > n_ip_bytes_this_buffer)
1075 {
1076 n_this_buffer = n_ip_bytes_this_buffer > ip_header_length ?
Neale Rannsd91c1db2017-07-31 02:30:50 -07001077 n_ip_bytes_this_buffer - ip_header_length : 0;
Florin Corasb2215d62017-08-01 16:56:58 -07001078 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07001079 while (1)
1080 {
1081 sum0 = ip_incremental_checksum (sum0, data_this_buffer, n_this_buffer);
1082 n_bytes_left -= n_this_buffer;
1083 if (n_bytes_left == 0)
1084 break;
1085
1086 ASSERT (p0->flags & VLIB_BUFFER_NEXT_PRESENT);
1087 p0 = vlib_get_buffer (vm, p0->next_buffer);
1088 data_this_buffer = vlib_buffer_get_current (p0);
1089 n_this_buffer = p0->current_length;
1090 }
1091
Dave Barachd7cb1b52016-12-09 09:52:16 -05001092 sum16 = ~ip_csum_fold (sum0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001093
1094 return sum16;
1095}
1096
John Lo37682e12016-11-30 12:51:39 -05001097u32
Ed Warnickecb9cada2015-12-08 15:45:58 -07001098ip4_tcp_udp_validate_checksum (vlib_main_t * vm, vlib_buffer_t * p0)
1099{
Dave Barachd7cb1b52016-12-09 09:52:16 -05001100 ip4_header_t *ip0 = vlib_buffer_get_current (p0);
1101 udp_header_t *udp0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001102 u16 sum16;
1103
1104 ASSERT (ip0->protocol == IP_PROTOCOL_TCP
1105 || ip0->protocol == IP_PROTOCOL_UDP);
1106
1107 udp0 = (void *) (ip0 + 1);
1108 if (ip0->protocol == IP_PROTOCOL_UDP && udp0->checksum == 0)
1109 {
Damjan Marion213b5aa2017-07-13 21:19:27 +02001110 p0->flags |= (VNET_BUFFER_F_L4_CHECKSUM_COMPUTED
1111 | VNET_BUFFER_F_L4_CHECKSUM_CORRECT);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001112 return p0->flags;
1113 }
1114
1115 sum16 = ip4_tcp_udp_compute_checksum (vm, p0, ip0);
1116
Damjan Marion213b5aa2017-07-13 21:19:27 +02001117 p0->flags |= (VNET_BUFFER_F_L4_CHECKSUM_COMPUTED
1118 | ((sum16 == 0) << VNET_BUFFER_F_LOG2_L4_CHECKSUM_CORRECT));
Ed Warnickecb9cada2015-12-08 15:45:58 -07001119
1120 return p0->flags;
1121}
1122
Dave Barach68b0fb02017-02-28 15:15:56 -05001123/* *INDENT-OFF* */
1124VNET_FEATURE_ARC_INIT (ip4_local) =
1125{
1126 .arc_name = "ip4-local",
1127 .start_nodes = VNET_FEATURES ("ip4-local"),
1128};
1129/* *INDENT-ON* */
1130
Florin Coras20a14b92017-08-15 22:47:22 -07001131static inline void
1132ip4_local_validate_l4 (vlib_main_t * vm, vlib_buffer_t * p, ip4_header_t * ip,
1133 u8 is_udp, u8 * error, u8 * good_tcp_udp)
1134{
1135 u32 flags0;
1136 flags0 = ip4_tcp_udp_validate_checksum (vm, p);
1137 *good_tcp_udp = (flags0 & VNET_BUFFER_F_L4_CHECKSUM_CORRECT) != 0;
1138 if (is_udp)
1139 {
1140 udp_header_t *udp;
1141 u32 ip_len, udp_len;
1142 i32 len_diff;
1143 udp = ip4_next_header (ip);
1144 /* Verify UDP length. */
1145 ip_len = clib_net_to_host_u16 (ip->length);
1146 udp_len = clib_net_to_host_u16 (udp->length);
1147
1148 len_diff = ip_len - udp_len;
1149 *good_tcp_udp &= len_diff >= 0;
1150 *error = len_diff < 0 ? IP4_ERROR_UDP_LENGTH : *error;
1151 }
1152}
1153
/*
 * True when a software L4 checksum validation is still required: the
 * packet is TCP/UDP and none of the "checksum already computed" or
 * "checksum offloaded (TCP/UDP)" bits is set in flags.
 * Both arguments are parenthesised and flags is evaluated once, so
 * compound expressions can be passed safely.
 */
#define ip4_local_do_l4_check(is_tcp_udp, flags)			\
    ((is_tcp_udp)							\
     && !((flags) & (VNET_BUFFER_F_L4_CHECKSUM_COMPUTED		\
		     | VNET_BUFFER_F_OFFLOAD_TCP_CKSUM			\
		     | VNET_BUFFER_F_OFFLOAD_UDP_CKSUM)))
Florin Coras20a14b92017-08-15 22:47:22 -07001158
Dave Barach68b0fb02017-02-28 15:15:56 -05001159static inline uword
1160ip4_local_inline (vlib_main_t * vm,
1161 vlib_node_runtime_t * node,
1162 vlib_frame_t * frame, int head_of_feature_arc)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001163{
Dave Barachd7cb1b52016-12-09 09:52:16 -05001164 ip4_main_t *im = &ip4_main;
1165 ip_lookup_main_t *lm = &im->lookup_main;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001166 ip_local_next_t next_index;
Dave Barachd7cb1b52016-12-09 09:52:16 -05001167 u32 *from, *to_next, n_left_from, n_left_to_next;
1168 vlib_node_runtime_t *error_node =
1169 vlib_node_get_runtime (vm, ip4_input_node.index);
Dave Barach68b0fb02017-02-28 15:15:56 -05001170 u8 arc_index = vnet_feat_arc_ip4_local.feature_arc_index;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001171
1172 from = vlib_frame_vector_args (frame);
1173 n_left_from = frame->n_vectors;
1174 next_index = node->cached_next_index;
Dave Barach75fc8542016-10-11 16:16:02 -04001175
Ed Warnickecb9cada2015-12-08 15:45:58 -07001176 if (node->flags & VLIB_NODE_FLAG_TRACE)
1177 ip4_forward_next_trace (vm, node, frame, VLIB_TX);
1178
1179 while (n_left_from > 0)
1180 {
1181 vlib_get_next_frame (vm, node, next_index, to_next, n_left_to_next);
1182
1183 while (n_left_from >= 4 && n_left_to_next >= 2)
Dave Barachd7cb1b52016-12-09 09:52:16 -05001184 {
1185 vlib_buffer_t *p0, *p1;
1186 ip4_header_t *ip0, *ip1;
Dave Barachd7cb1b52016-12-09 09:52:16 -05001187 ip4_fib_mtrie_t *mtrie0, *mtrie1;
1188 ip4_fib_mtrie_leaf_t leaf0, leaf1;
1189 const dpo_id_t *dpo0, *dpo1;
1190 const load_balance_t *lb0, *lb1;
Florin Coras20a14b92017-08-15 22:47:22 -07001191 u32 pi0, next0, fib_index0, lbi0;
1192 u32 pi1, next1, fib_index1, lbi1;
Dave Barachd7cb1b52016-12-09 09:52:16 -05001193 u8 error0, is_udp0, is_tcp_udp0, good_tcp_udp0, proto0;
1194 u8 error1, is_udp1, is_tcp_udp1, good_tcp_udp1, proto1;
Dave Barach68b0fb02017-02-28 15:15:56 -05001195 u32 sw_if_index0, sw_if_index1;
Dave Barach75fc8542016-10-11 16:16:02 -04001196
Dave Barachd7cb1b52016-12-09 09:52:16 -05001197 pi0 = to_next[0] = from[0];
1198 pi1 = to_next[1] = from[1];
1199 from += 2;
1200 n_left_from -= 2;
1201 to_next += 2;
1202 n_left_to_next -= 2;
Dave Barach75fc8542016-10-11 16:16:02 -04001203
Dave Barach68b0fb02017-02-28 15:15:56 -05001204 next0 = next1 = IP_LOCAL_NEXT_DROP;
Florin Coras20a14b92017-08-15 22:47:22 -07001205 error0 = error1 = IP4_ERROR_UNKNOWN_PROTOCOL;
Dave Barach68b0fb02017-02-28 15:15:56 -05001206
Ed Warnickecb9cada2015-12-08 15:45:58 -07001207 p0 = vlib_get_buffer (vm, pi0);
1208 p1 = vlib_get_buffer (vm, pi1);
1209
1210 ip0 = vlib_buffer_get_current (p0);
1211 ip1 = vlib_buffer_get_current (p1);
1212
Damjan Marion072401e2017-07-13 18:53:27 +02001213 vnet_buffer (p0)->l3_hdr_offset = p0->current_data;
1214 vnet_buffer (p1)->l3_hdr_offset = p1->current_data;
Klement Sekera0e3c0de2016-09-29 14:43:44 +02001215
Dave Barach68b0fb02017-02-28 15:15:56 -05001216 sw_if_index0 = vnet_buffer (p0)->sw_if_index[VLIB_RX];
1217 sw_if_index1 = vnet_buffer (p1)->sw_if_index[VLIB_RX];
1218
Florin Coras20a14b92017-08-15 22:47:22 -07001219 /* Treat IP frag packets as "experimental" protocol for now
1220 until support of IP frag reassembly is implemented */
Klement Sekera75e7d132017-09-20 08:26:30 +02001221 proto0 =
1222 ip4_is_fragment (ip0) ? IP_PROTOCOL_VPP_FRAGMENTATION :
1223 ip0->protocol;
1224 proto1 =
1225 ip4_is_fragment (ip1) ? IP_PROTOCOL_VPP_FRAGMENTATION :
1226 ip1->protocol;
Florin Coras20a14b92017-08-15 22:47:22 -07001227
1228 if (head_of_feature_arc == 0)
1229 goto skip_checks;
1230
1231 is_udp0 = proto0 == IP_PROTOCOL_UDP;
1232 is_udp1 = proto1 == IP_PROTOCOL_UDP;
1233 is_tcp_udp0 = is_udp0 || proto0 == IP_PROTOCOL_TCP;
1234 is_tcp_udp1 = is_udp1 || proto1 == IP_PROTOCOL_TCP;
1235
1236 good_tcp_udp0 =
Jakub Grajciar96be8e82017-10-30 14:56:17 +01001237 (p0->flags & VNET_BUFFER_F_L4_CHECKSUM_CORRECT
Jakub Grajciar2eeeb4b2017-11-07 14:39:10 +01001238 || (p0->flags & VNET_BUFFER_F_OFFLOAD_TCP_CKSUM
1239 || p0->flags & VNET_BUFFER_F_OFFLOAD_UDP_CKSUM)) != 0;
Jakub Grajciar96be8e82017-10-30 14:56:17 +01001240 good_tcp_udp1 = (p1->flags & VNET_BUFFER_F_L4_CHECKSUM_CORRECT
Jakub Grajciar2eeeb4b2017-11-07 14:39:10 +01001241 || (p1->flags & VNET_BUFFER_F_OFFLOAD_TCP_CKSUM
1242 || p1->flags &
1243 VNET_BUFFER_F_OFFLOAD_UDP_CKSUM)) != 0;
Florin Coras20a14b92017-08-15 22:47:22 -07001244
1245 if (PREDICT_FALSE (ip4_local_do_l4_check (is_tcp_udp0, p0->flags)
1246 || ip4_local_do_l4_check (is_tcp_udp1,
1247 p1->flags)))
1248 {
1249 if (is_tcp_udp0)
1250 ip4_local_validate_l4 (vm, p0, ip0, is_udp0, &error0,
1251 &good_tcp_udp0);
1252 if (is_tcp_udp1)
1253 ip4_local_validate_l4 (vm, p1, ip1, is_udp1, &error1,
1254 &good_tcp_udp1);
1255 }
1256
1257 ASSERT (IP4_ERROR_TCP_CHECKSUM + 1 == IP4_ERROR_UDP_CHECKSUM);
1258 error0 = (is_tcp_udp0 && !good_tcp_udp0
1259 ? IP4_ERROR_TCP_CHECKSUM + is_udp0 : error0);
1260 error1 = (is_tcp_udp1 && !good_tcp_udp1
1261 ? IP4_ERROR_TCP_CHECKSUM + is_udp1 : error1);
Dave Barach68b0fb02017-02-28 15:15:56 -05001262
1263 fib_index0 = vec_elt (im->fib_index_by_sw_if_index, sw_if_index0);
Neale Ranns32e1c012016-11-22 17:07:28 +00001264 fib_index0 =
1265 (vnet_buffer (p0)->sw_if_index[VLIB_TX] ==
1266 (u32) ~ 0) ? fib_index0 : vnet_buffer (p0)->sw_if_index[VLIB_TX];
Neale Rannscb630ff2016-12-14 13:31:29 +01001267
Dave Barach68b0fb02017-02-28 15:15:56 -05001268 fib_index1 = vec_elt (im->fib_index_by_sw_if_index, sw_if_index1);
Neale Ranns32e1c012016-11-22 17:07:28 +00001269 fib_index1 =
1270 (vnet_buffer (p1)->sw_if_index[VLIB_TX] ==
1271 (u32) ~ 0) ? fib_index1 : vnet_buffer (p1)->sw_if_index[VLIB_TX];
Ed Warnickecb9cada2015-12-08 15:45:58 -07001272
Florin Corascea194d2017-10-02 00:18:51 -07001273 /* TODO maybe move to lookup? */
1274 vnet_buffer (p0)->ip.fib_index = fib_index0;
1275 vnet_buffer (p1)->ip.fib_index = fib_index1;
1276
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001277 mtrie0 = &ip4_fib_get (fib_index0)->mtrie;
1278 mtrie1 = &ip4_fib_get (fib_index1)->mtrie;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001279
Neale Ranns04a75e32017-03-23 06:46:01 -07001280 leaf0 = ip4_fib_mtrie_lookup_step_one (mtrie0, &ip0->src_address);
1281 leaf1 = ip4_fib_mtrie_lookup_step_one (mtrie1, &ip1->src_address);
Florin Coras20a14b92017-08-15 22:47:22 -07001282 leaf0 = ip4_fib_mtrie_lookup_step (mtrie0, leaf0, &ip0->src_address,
1283 2);
1284 leaf1 = ip4_fib_mtrie_lookup_step (mtrie1, leaf1, &ip1->src_address,
1285 2);
1286 leaf0 = ip4_fib_mtrie_lookup_step (mtrie0, leaf0, &ip0->src_address,
1287 3);
1288 leaf1 = ip4_fib_mtrie_lookup_step (mtrie1, leaf1, &ip1->src_address,
1289 3);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001290
Dave Barachd7cb1b52016-12-09 09:52:16 -05001291 vnet_buffer (p0)->ip.adj_index[VLIB_RX] = lbi0 =
1292 ip4_fib_mtrie_leaf_get_adj_index (leaf0);
1293 vnet_buffer (p0)->ip.adj_index[VLIB_TX] = lbi0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001294
Dave Barachd7cb1b52016-12-09 09:52:16 -05001295 vnet_buffer (p1)->ip.adj_index[VLIB_RX] = lbi1 =
1296 ip4_fib_mtrie_leaf_get_adj_index (leaf1);
1297 vnet_buffer (p1)->ip.adj_index[VLIB_TX] = lbi1;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001298
Dave Barachd7cb1b52016-12-09 09:52:16 -05001299 lb0 = load_balance_get (lbi0);
1300 lb1 = load_balance_get (lbi1);
1301 dpo0 = load_balance_get_bucket_i (lb0, 0);
1302 dpo1 = load_balance_get_bucket_i (lb1, 0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001303
Dave Barach75fc8542016-10-11 16:16:02 -04001304 /*
Dave Barachd7cb1b52016-12-09 09:52:16 -05001305 * Must have a route to source otherwise we drop the packet.
1306 * ip4 broadcasts are accepted, e.g. to make dhcp client work
Neale Ranns3ee44042016-10-03 13:05:48 +01001307 *
1308 * The checks are:
1309 * - the source is a recieve => it's from us => bogus, do this
1310 * first since it sets a different error code.
1311 * - uRPF check for any route to source - accept if passes.
1312 * - allow packets destined to the broadcast address from unknown sources
Dave Barachd7cb1b52016-12-09 09:52:16 -05001313 */
Matus Fabian87da4762017-10-04 08:03:56 -07001314 if (p0->flags & VNET_BUFFER_F_IS_NATED)
1315 goto skip_check0;
1316
Neale Ranns3ee44042016-10-03 13:05:48 +01001317 error0 = ((error0 == IP4_ERROR_UNKNOWN_PROTOCOL &&
Dave Barachd7cb1b52016-12-09 09:52:16 -05001318 dpo0->dpoi_type == DPO_RECEIVE) ?
1319 IP4_ERROR_SPOOFED_LOCAL_PACKETS : error0);
1320 error0 = ((error0 == IP4_ERROR_UNKNOWN_PROTOCOL &&
1321 !fib_urpf_check_size (lb0->lb_urpf) &&
Neale Ranns3ee44042016-10-03 13:05:48 +01001322 ip0->dst_address.as_u32 != 0xFFFFFFFF)
Dave Barachd7cb1b52016-12-09 09:52:16 -05001323 ? IP4_ERROR_SRC_LOOKUP_MISS : error0);
Matus Fabian87da4762017-10-04 08:03:56 -07001324
1325 skip_check0:
1326 if (p1->flags & VNET_BUFFER_F_IS_NATED)
1327 goto skip_checks;
1328
Neale Ranns3ee44042016-10-03 13:05:48 +01001329 error1 = ((error1 == IP4_ERROR_UNKNOWN_PROTOCOL &&
Dave Barachd7cb1b52016-12-09 09:52:16 -05001330 dpo1->dpoi_type == DPO_RECEIVE) ?
1331 IP4_ERROR_SPOOFED_LOCAL_PACKETS : error1);
1332 error1 = ((error1 == IP4_ERROR_UNKNOWN_PROTOCOL &&
1333 !fib_urpf_check_size (lb1->lb_urpf) &&
Neale Ranns3ee44042016-10-03 13:05:48 +01001334 ip1->dst_address.as_u32 != 0xFFFFFFFF)
Dave Barachd7cb1b52016-12-09 09:52:16 -05001335 ? IP4_ERROR_SRC_LOOKUP_MISS : error1);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001336
Florin Corasa0b34a72017-03-07 01:20:52 -08001337 skip_checks:
1338
Ed Warnickecb9cada2015-12-08 15:45:58 -07001339 next0 = lm->local_next_by_ip_protocol[proto0];
1340 next1 = lm->local_next_by_ip_protocol[proto1];
1341
Dave Barachd7cb1b52016-12-09 09:52:16 -05001342 next0 =
1343 error0 != IP4_ERROR_UNKNOWN_PROTOCOL ? IP_LOCAL_NEXT_DROP : next0;
1344 next1 =
1345 error1 != IP4_ERROR_UNKNOWN_PROTOCOL ? IP_LOCAL_NEXT_DROP : next1;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001346
1347 p0->error = error0 ? error_node->errors[error0] : 0;
1348 p1->error = error1 ? error_node->errors[error1] : 0;
1349
Dave Barach68b0fb02017-02-28 15:15:56 -05001350 if (head_of_feature_arc)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001351 {
Dave Barach68b0fb02017-02-28 15:15:56 -05001352 if (PREDICT_TRUE (error0 == (u8) IP4_ERROR_UNKNOWN_PROTOCOL))
1353 vnet_feature_arc_start (arc_index, sw_if_index0, &next0, p0);
1354 if (PREDICT_TRUE (error1 == (u8) IP4_ERROR_UNKNOWN_PROTOCOL))
1355 vnet_feature_arc_start (arc_index, sw_if_index1, &next1, p1);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001356 }
Dave Barach68b0fb02017-02-28 15:15:56 -05001357
1358 vlib_validate_buffer_enqueue_x2 (vm, node, next_index, to_next,
1359 n_left_to_next, pi0, pi1,
1360 next0, next1);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001361 }
1362
1363 while (n_left_from > 0 && n_left_to_next > 0)
1364 {
Dave Barachd7cb1b52016-12-09 09:52:16 -05001365 vlib_buffer_t *p0;
1366 ip4_header_t *ip0;
Dave Barachd7cb1b52016-12-09 09:52:16 -05001367 ip4_fib_mtrie_t *mtrie0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001368 ip4_fib_mtrie_leaf_t leaf0;
Florin Coras20a14b92017-08-15 22:47:22 -07001369 u32 pi0, next0, fib_index0, lbi0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001370 u8 error0, is_udp0, is_tcp_udp0, good_tcp_udp0, proto0;
Dave Barachd7cb1b52016-12-09 09:52:16 -05001371 load_balance_t *lb0;
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001372 const dpo_id_t *dpo0;
Dave Barach68b0fb02017-02-28 15:15:56 -05001373 u32 sw_if_index0;
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001374
Ed Warnickecb9cada2015-12-08 15:45:58 -07001375 pi0 = to_next[0] = from[0];
1376 from += 1;
1377 n_left_from -= 1;
1378 to_next += 1;
1379 n_left_to_next -= 1;
Dave Barach75fc8542016-10-11 16:16:02 -04001380
Dave Barach68b0fb02017-02-28 15:15:56 -05001381 next0 = IP_LOCAL_NEXT_DROP;
Florin Coras20a14b92017-08-15 22:47:22 -07001382 error0 = IP4_ERROR_UNKNOWN_PROTOCOL;
Dave Barach68b0fb02017-02-28 15:15:56 -05001383
Ed Warnickecb9cada2015-12-08 15:45:58 -07001384 p0 = vlib_get_buffer (vm, pi0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001385 ip0 = vlib_buffer_get_current (p0);
Damjan Marion072401e2017-07-13 18:53:27 +02001386 vnet_buffer (p0)->l3_hdr_offset = p0->current_data;
Dave Barach68b0fb02017-02-28 15:15:56 -05001387 sw_if_index0 = vnet_buffer (p0)->sw_if_index[VLIB_RX];
1388
John Lo3419d0b2016-06-02 09:28:37 -04001389 /* Treat IP frag packets as "experimental" protocol for now
1390 until support of IP frag reassembly is implemented */
Klement Sekera75e7d132017-09-20 08:26:30 +02001391 proto0 =
1392 ip4_is_fragment (ip0) ? IP_PROTOCOL_VPP_FRAGMENTATION :
1393 ip0->protocol;
Dave Barach68b0fb02017-02-28 15:15:56 -05001394
Matus Fabian87da4762017-10-04 08:03:56 -07001395 if (head_of_feature_arc == 0 || p0->flags & VNET_BUFFER_F_IS_NATED)
Florin Coras20a14b92017-08-15 22:47:22 -07001396 goto skip_check;
Dave Barach68b0fb02017-02-28 15:15:56 -05001397
Ed Warnickecb9cada2015-12-08 15:45:58 -07001398 is_udp0 = proto0 == IP_PROTOCOL_UDP;
1399 is_tcp_udp0 = is_udp0 || proto0 == IP_PROTOCOL_TCP;
Jakub Grajciar96be8e82017-10-30 14:56:17 +01001400
Florin Coras20a14b92017-08-15 22:47:22 -07001401 good_tcp_udp0 =
Jakub Grajciar96be8e82017-10-30 14:56:17 +01001402 (p0->flags & VNET_BUFFER_F_L4_CHECKSUM_CORRECT
Jakub Grajciar2eeeb4b2017-11-07 14:39:10 +01001403 || (p0->flags & VNET_BUFFER_F_OFFLOAD_TCP_CKSUM
1404 || p0->flags & VNET_BUFFER_F_OFFLOAD_UDP_CKSUM)) != 0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001405
Florin Coras20a14b92017-08-15 22:47:22 -07001406 if (PREDICT_FALSE (ip4_local_do_l4_check (is_tcp_udp0, p0->flags)))
Ed Warnickecb9cada2015-12-08 15:45:58 -07001407 {
Florin Coras20a14b92017-08-15 22:47:22 -07001408 ip4_local_validate_l4 (vm, p0, ip0, is_udp0, &error0,
1409 &good_tcp_udp0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001410 }
1411
Ed Warnickecb9cada2015-12-08 15:45:58 -07001412 ASSERT (IP4_ERROR_TCP_CHECKSUM + 1 == IP4_ERROR_UDP_CHECKSUM);
Dave Barachd7cb1b52016-12-09 09:52:16 -05001413 error0 = (is_tcp_udp0 && !good_tcp_udp0
1414 ? IP4_ERROR_TCP_CHECKSUM + is_udp0 : error0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001415
Florin Coras20a14b92017-08-15 22:47:22 -07001416 fib_index0 = vec_elt (im->fib_index_by_sw_if_index, sw_if_index0);
1417 fib_index0 =
1418 (vnet_buffer (p0)->sw_if_index[VLIB_TX] ==
1419 (u32) ~ 0) ? fib_index0 : vnet_buffer (p0)->sw_if_index[VLIB_TX];
Florin Corascea194d2017-10-02 00:18:51 -07001420 vnet_buffer (p0)->ip.fib_index = fib_index0;
Florin Coras20a14b92017-08-15 22:47:22 -07001421 mtrie0 = &ip4_fib_get (fib_index0)->mtrie;
1422 leaf0 = ip4_fib_mtrie_lookup_step_one (mtrie0, &ip0->src_address);
1423 leaf0 = ip4_fib_mtrie_lookup_step (mtrie0, leaf0, &ip0->src_address,
1424 2);
1425 leaf0 = ip4_fib_mtrie_lookup_step (mtrie0, leaf0, &ip0->src_address,
1426 3);
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001427 lbi0 = ip4_fib_mtrie_leaf_get_adj_index (leaf0);
Dave Barachd7cb1b52016-12-09 09:52:16 -05001428 vnet_buffer (p0)->ip.adj_index[VLIB_TX] = lbi0;
Florin Coras20a14b92017-08-15 22:47:22 -07001429 vnet_buffer (p0)->ip.adj_index[VLIB_RX] = lbi0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001430
Dave Barachd7cb1b52016-12-09 09:52:16 -05001431 lb0 = load_balance_get (lbi0);
1432 dpo0 = load_balance_get_bucket_i (lb0, 0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001433
Neale Ranns3ee44042016-10-03 13:05:48 +01001434 error0 = ((error0 == IP4_ERROR_UNKNOWN_PROTOCOL &&
Dave Barachd7cb1b52016-12-09 09:52:16 -05001435 dpo0->dpoi_type == DPO_RECEIVE) ?
1436 IP4_ERROR_SPOOFED_LOCAL_PACKETS : error0);
1437 error0 = ((error0 == IP4_ERROR_UNKNOWN_PROTOCOL &&
1438 !fib_urpf_check_size (lb0->lb_urpf) &&
Neale Ranns3ee44042016-10-03 13:05:48 +01001439 ip0->dst_address.as_u32 != 0xFFFFFFFF)
Dave Barachd7cb1b52016-12-09 09:52:16 -05001440 ? IP4_ERROR_SRC_LOOKUP_MISS : error0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001441
Dave Barach68b0fb02017-02-28 15:15:56 -05001442 skip_check:
Ed Warnickecb9cada2015-12-08 15:45:58 -07001443 next0 = lm->local_next_by_ip_protocol[proto0];
Dave Barachd7cb1b52016-12-09 09:52:16 -05001444 next0 =
1445 error0 != IP4_ERROR_UNKNOWN_PROTOCOL ? IP_LOCAL_NEXT_DROP : next0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001446
Dave Barachd7cb1b52016-12-09 09:52:16 -05001447 p0->error = error0 ? error_node->errors[error0] : 0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001448
Dave Barach68b0fb02017-02-28 15:15:56 -05001449 if (head_of_feature_arc)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001450 {
Dave Barach68b0fb02017-02-28 15:15:56 -05001451 if (PREDICT_TRUE (error0 == (u8) IP4_ERROR_UNKNOWN_PROTOCOL))
1452 vnet_feature_arc_start (arc_index, sw_if_index0, &next0, p0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001453 }
Dave Barach68b0fb02017-02-28 15:15:56 -05001454
1455 vlib_validate_buffer_enqueue_x1 (vm, node, next_index, to_next,
1456 n_left_to_next, pi0, next0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001457 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07001458 vlib_put_next_frame (vm, node, next_index, n_left_to_next);
1459 }
1460
1461 return frame->n_vectors;
1462}
1463
Dave Barach68b0fb02017-02-28 15:15:56 -05001464static uword
1465ip4_local (vlib_main_t * vm, vlib_node_runtime_t * node, vlib_frame_t * frame)
1466{
1467 return ip4_local_inline (vm, node, frame, 1 /* head of feature arc */ );
1468}
1469
1470/* *INDENT-OFF* */
Neale Ranns32e1c012016-11-22 17:07:28 +00001471VLIB_REGISTER_NODE (ip4_local_node) =
Ed Warnickecb9cada2015-12-08 15:45:58 -07001472{
Dave Barach68b0fb02017-02-28 15:15:56 -05001473 .function = ip4_local,
1474 .name = "ip4-local",
1475 .vector_size = sizeof (u32),
1476 .format_trace = format_ip4_forward_next_trace,
1477 .n_next_nodes = IP_LOCAL_N_NEXT,
1478 .next_nodes =
Dave Barachd7cb1b52016-12-09 09:52:16 -05001479 {
Neale Rannsd91c1db2017-07-31 02:30:50 -07001480 [IP_LOCAL_NEXT_DROP] = "ip4-drop",
1481 [IP_LOCAL_NEXT_PUNT] = "ip4-punt",
Dave Barach68b0fb02017-02-28 15:15:56 -05001482 [IP_LOCAL_NEXT_UDP_LOOKUP] = "ip4-udp-lookup",
Florin Coras20a14b92017-08-15 22:47:22 -07001483 [IP_LOCAL_NEXT_ICMP] = "ip4-icmp-input",
Klement Sekera75e7d132017-09-20 08:26:30 +02001484 [IP_LOCAL_NEXT_REASSEMBLY] = "ip4-reassembly",
Florin Coras20a14b92017-08-15 22:47:22 -07001485 },
Dave Barach68b0fb02017-02-28 15:15:56 -05001486};
1487/* *INDENT-ON* */
Dave Barachd7cb1b52016-12-09 09:52:16 -05001488
1489VLIB_NODE_FUNCTION_MULTIARCH (ip4_local_node, ip4_local);
1490
Dave Barach68b0fb02017-02-28 15:15:56 -05001491static uword
1492ip4_local_end_of_arc (vlib_main_t * vm,
1493 vlib_node_runtime_t * node, vlib_frame_t * frame)
1494{
1495 return ip4_local_inline (vm, node, frame, 0 /* head of feature arc */ );
1496}
1497
1498/* *INDENT-OFF* */
1499VLIB_REGISTER_NODE (ip4_local_end_of_arc_node,static) = {
1500 .function = ip4_local_end_of_arc,
1501 .name = "ip4-local-end-of-arc",
1502 .vector_size = sizeof (u32),
1503
1504 .format_trace = format_ip4_forward_next_trace,
1505 .sibling_of = "ip4-local",
1506};
1507
1508VLIB_NODE_FUNCTION_MULTIARCH (ip4_local_end_of_arc_node, ip4_local_end_of_arc)
1509
1510VNET_FEATURE_INIT (ip4_local_end_of_arc, static) = {
1511 .arc_name = "ip4-local",
1512 .node_name = "ip4-local-end-of-arc",
1513 .runs_before = 0, /* not before any other features */
1514};
1515/* *INDENT-ON* */
1516
Dave Barachd7cb1b52016-12-09 09:52:16 -05001517void
1518ip4_register_protocol (u32 protocol, u32 node_index)
1519{
1520 vlib_main_t *vm = vlib_get_main ();
1521 ip4_main_t *im = &ip4_main;
1522 ip_lookup_main_t *lm = &im->lookup_main;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001523
1524 ASSERT (protocol < ARRAY_LEN (lm->local_next_by_ip_protocol));
Dave Barachd7cb1b52016-12-09 09:52:16 -05001525 lm->local_next_by_ip_protocol[protocol] =
1526 vlib_node_add_next (vm, ip4_local_node.index, node_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001527}
1528
1529static clib_error_t *
1530show_ip_local_command_fn (vlib_main_t * vm,
Dave Barachd7cb1b52016-12-09 09:52:16 -05001531 unformat_input_t * input, vlib_cli_command_t * cmd)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001532{
Dave Barachd7cb1b52016-12-09 09:52:16 -05001533 ip4_main_t *im = &ip4_main;
1534 ip_lookup_main_t *lm = &im->lookup_main;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001535 int i;
1536
1537 vlib_cli_output (vm, "Protocols handled by ip4_local");
Dave Barachd7cb1b52016-12-09 09:52:16 -05001538 for (i = 0; i < ARRAY_LEN (lm->local_next_by_ip_protocol); i++)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001539 {
1540 if (lm->local_next_by_ip_protocol[i] != IP_LOCAL_NEXT_PUNT)
Pierre Pfister1bfd3722017-09-18 11:40:32 +02001541 {
1542 u32 node_index = vlib_get_node (vm,
1543 ip4_local_node.index)->
1544 next_nodes[lm->local_next_by_ip_protocol[i]];
1545 vlib_cli_output (vm, "%d: %U", i, format_vlib_node_name, vm,
1546 node_index);
1547 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07001548 }
1549 return 0;
1550}
1551
1552
1553
Billy McFall0683c9c2016-10-13 08:27:31 -04001554/*?
1555 * Display the set of protocols handled by the local IPv4 stack.
1556 *
1557 * @cliexpar
1558 * Example of how to display local protocol table:
1559 * @cliexstart{show ip local}
1560 * Protocols handled by ip4_local
1561 * 1
1562 * 17
1563 * 47
1564 * @cliexend
1565?*/
1566/* *INDENT-OFF* */
Dave Barachd7cb1b52016-12-09 09:52:16 -05001567VLIB_CLI_COMMAND (show_ip_local, static) =
1568{
Ed Warnickecb9cada2015-12-08 15:45:58 -07001569 .path = "show ip local",
1570 .function = show_ip_local_command_fn,
Billy McFall0683c9c2016-10-13 08:27:31 -04001571 .short_help = "show ip local",
Ed Warnickecb9cada2015-12-08 15:45:58 -07001572};
Billy McFall0683c9c2016-10-13 08:27:31 -04001573/* *INDENT-ON* */
Ed Warnickecb9cada2015-12-08 15:45:58 -07001574
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001575always_inline uword
1576ip4_arp_inline (vlib_main_t * vm,
1577 vlib_node_runtime_t * node,
Dave Barachd7cb1b52016-12-09 09:52:16 -05001578 vlib_frame_t * frame, int is_glean)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001579{
Dave Barachd7cb1b52016-12-09 09:52:16 -05001580 vnet_main_t *vnm = vnet_get_main ();
1581 ip4_main_t *im = &ip4_main;
1582 ip_lookup_main_t *lm = &im->lookup_main;
1583 u32 *from, *to_next_drop;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001584 uword n_left_from, n_left_to_next_drop, next_index;
1585 static f64 time_last_seed_change = -1e100;
1586 static u32 hash_seeds[3];
Dave Barach75fc8542016-10-11 16:16:02 -04001587 static uword hash_bitmap[256 / BITS (uword)];
Ed Warnickecb9cada2015-12-08 15:45:58 -07001588 f64 time_now;
1589
1590 if (node->flags & VLIB_NODE_FLAG_TRACE)
1591 ip4_forward_next_trace (vm, node, frame, VLIB_TX);
1592
1593 time_now = vlib_time_now (vm);
1594 if (time_now - time_last_seed_change > 1e-3)
1595 {
1596 uword i;
Dave Barachd7cb1b52016-12-09 09:52:16 -05001597 u32 *r = clib_random_buffer_get_data (&vm->random_buffer,
1598 sizeof (hash_seeds));
Ed Warnickecb9cada2015-12-08 15:45:58 -07001599 for (i = 0; i < ARRAY_LEN (hash_seeds); i++)
1600 hash_seeds[i] = r[i];
1601
1602 /* Mark all hash keys as been no-seen before. */
1603 for (i = 0; i < ARRAY_LEN (hash_bitmap); i++)
1604 hash_bitmap[i] = 0;
1605
1606 time_last_seed_change = time_now;
1607 }
1608
1609 from = vlib_frame_vector_args (frame);
1610 n_left_from = frame->n_vectors;
1611 next_index = node->cached_next_index;
1612 if (next_index == IP4_ARP_NEXT_DROP)
Dave Barachd7cb1b52016-12-09 09:52:16 -05001613 next_index = IP4_ARP_N_NEXT; /* point to first interface */
Ed Warnickecb9cada2015-12-08 15:45:58 -07001614
1615 while (n_left_from > 0)
1616 {
1617 vlib_get_next_frame (vm, node, IP4_ARP_NEXT_DROP,
1618 to_next_drop, n_left_to_next_drop);
1619
1620 while (n_left_from > 0 && n_left_to_next_drop > 0)
1621 {
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001622 u32 pi0, adj_index0, a0, b0, c0, m0, sw_if_index0, drop0;
Dave Barachd7cb1b52016-12-09 09:52:16 -05001623 ip_adjacency_t *adj0;
1624 vlib_buffer_t *p0;
1625 ip4_header_t *ip0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001626 uword bm0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001627
1628 pi0 = from[0];
1629
1630 p0 = vlib_get_buffer (vm, pi0);
1631
1632 adj_index0 = vnet_buffer (p0)->ip.adj_index[VLIB_TX];
Neale Ranns107e7d42017-04-11 09:55:19 -07001633 adj0 = adj_get (adj_index0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001634 ip0 = vlib_buffer_get_current (p0);
1635
Ed Warnickecb9cada2015-12-08 15:45:58 -07001636 a0 = hash_seeds[0];
1637 b0 = hash_seeds[1];
1638 c0 = hash_seeds[2];
1639
1640 sw_if_index0 = adj0->rewrite_header.sw_if_index;
1641 vnet_buffer (p0)->sw_if_index[VLIB_TX] = sw_if_index0;
1642
Dave Barachd7cb1b52016-12-09 09:52:16 -05001643 if (is_glean)
1644 {
Neale Ranns948e00f2016-10-20 13:39:34 +01001645 /*
1646 * this is the Glean case, so we are ARPing for the
1647 * packet's destination
1648 */
Dave Barachd7cb1b52016-12-09 09:52:16 -05001649 a0 ^= ip0->dst_address.data_u32;
1650 }
1651 else
1652 {
1653 a0 ^= adj0->sub_type.nbr.next_hop.ip4.data_u32;
1654 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07001655 b0 ^= sw_if_index0;
1656
Florin Coras2d3dbc42017-09-08 16:22:38 -04001657 hash_v3_mix32 (a0, b0, c0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001658 hash_v3_finalize32 (a0, b0, c0);
1659
1660 c0 &= BITS (hash_bitmap) - 1;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001661 m0 = (uword) 1 << (c0 % BITS (uword));
Florin Coras2d3dbc42017-09-08 16:22:38 -04001662 c0 = c0 / BITS (uword);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001663
1664 bm0 = hash_bitmap[c0];
1665 drop0 = (bm0 & m0) != 0;
1666
1667 /* Mark it as seen. */
1668 hash_bitmap[c0] = bm0 | m0;
1669
1670 from += 1;
1671 n_left_from -= 1;
1672 to_next_drop[0] = pi0;
1673 to_next_drop += 1;
1674 n_left_to_next_drop -= 1;
1675
Dave Barachd7cb1b52016-12-09 09:52:16 -05001676 p0->error =
1677 node->errors[drop0 ? IP4_ARP_ERROR_DROP :
1678 IP4_ARP_ERROR_REQUEST_SENT];
Ed Warnickecb9cada2015-12-08 15:45:58 -07001679
Neale Rannsb80c5362016-10-08 13:03:40 +01001680 /*
1681 * the adj has been updated to a rewrite but the node the DPO that got
1682 * us here hasn't - yet. no big deal. we'll drop while we wait.
1683 */
1684 if (IP_LOOKUP_NEXT_REWRITE == adj0->lookup_next_index)
1685 continue;
1686
Ed Warnickecb9cada2015-12-08 15:45:58 -07001687 if (drop0)
1688 continue;
1689
Dave Barachd7cb1b52016-12-09 09:52:16 -05001690 /*
1691 * Can happen if the control-plane is programming tables
1692 * with traffic flowing; at least that's today's lame excuse.
1693 */
Neale Ranns32e1c012016-11-22 17:07:28 +00001694 if ((is_glean && adj0->lookup_next_index != IP_LOOKUP_NEXT_GLEAN)
1695 || (!is_glean && adj0->lookup_next_index != IP_LOOKUP_NEXT_ARP))
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001696 {
Dave Barachd7cb1b52016-12-09 09:52:16 -05001697 p0->error = node->errors[IP4_ARP_ERROR_NON_ARP_ADJ];
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001698 }
Dave Barachd7cb1b52016-12-09 09:52:16 -05001699 else
1700 /* Send ARP request. */
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001701 {
Dave Barachd7cb1b52016-12-09 09:52:16 -05001702 u32 bi0 = 0;
1703 vlib_buffer_t *b0;
1704 ethernet_arp_header_t *h0;
1705 vnet_hw_interface_t *hw_if0;
1706
1707 h0 =
1708 vlib_packet_template_get_packet (vm,
1709 &im->ip4_arp_request_packet_template,
1710 &bi0);
1711
Florin Corasd172a622017-10-14 11:02:37 -07001712 /* Seems we're out of buffers */
1713 if (PREDICT_FALSE (!h0))
1714 continue;
1715
Dave Barachd7cb1b52016-12-09 09:52:16 -05001716 /* Add rewrite/encap string for ARP packet. */
1717 vnet_rewrite_one_header (adj0[0], h0,
1718 sizeof (ethernet_header_t));
1719
1720 hw_if0 = vnet_get_sup_hw_interface (vnm, sw_if_index0);
1721
1722 /* Src ethernet address in ARP header. */
1723 clib_memcpy (h0->ip4_over_ethernet[0].ethernet,
1724 hw_if0->hw_address,
1725 sizeof (h0->ip4_over_ethernet[0].ethernet));
1726
1727 if (is_glean)
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001728 {
Dave Barachd7cb1b52016-12-09 09:52:16 -05001729 /* The interface's source address is stashed in the Glean Adj */
1730 h0->ip4_over_ethernet[0].ip4 =
1731 adj0->sub_type.glean.receive_addr.ip4;
1732
1733 /* Copy in destination address we are requesting. This is the
1734 * glean case, so it's the packet's destination.*/
1735 h0->ip4_over_ethernet[1].ip4.data_u32 =
1736 ip0->dst_address.data_u32;
1737 }
1738 else
1739 {
1740 /* Src IP address in ARP header. */
1741 if (ip4_src_address_for_packet (lm, sw_if_index0,
1742 &h0->
1743 ip4_over_ethernet[0].ip4))
1744 {
1745 /* No source address available */
1746 p0->error =
1747 node->errors[IP4_ARP_ERROR_NO_SOURCE_ADDRESS];
1748 vlib_buffer_free (vm, &bi0, 1);
1749 continue;
1750 }
1751
1752 /* Copy in destination address we are requesting from the
1753 incomplete adj */
1754 h0->ip4_over_ethernet[1].ip4.data_u32 =
1755 adj0->sub_type.nbr.next_hop.ip4.as_u32;
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001756 }
1757
Dave Barachd7cb1b52016-12-09 09:52:16 -05001758 vlib_buffer_copy_trace_flag (vm, p0, bi0);
1759 b0 = vlib_get_buffer (vm, bi0);
Florin Coras2f9b0c02017-09-11 20:54:15 -04001760 VLIB_BUFFER_TRACE_TRAJECTORY_INIT (b0);
Dave Barachd7cb1b52016-12-09 09:52:16 -05001761 vnet_buffer (b0)->sw_if_index[VLIB_TX] = sw_if_index0;
1762
1763 vlib_buffer_advance (b0, -adj0->rewrite_header.data_bytes);
1764
1765 vlib_set_next_frame_buffer (vm, node,
1766 adj0->rewrite_header.next_index,
1767 bi0);
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001768 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07001769 }
1770
1771 vlib_put_next_frame (vm, node, IP4_ARP_NEXT_DROP, n_left_to_next_drop);
1772 }
1773
1774 return frame->n_vectors;
1775}
1776
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001777static uword
Dave Barachd7cb1b52016-12-09 09:52:16 -05001778ip4_arp (vlib_main_t * vm, vlib_node_runtime_t * node, vlib_frame_t * frame)
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001779{
Dave Barachd7cb1b52016-12-09 09:52:16 -05001780 return (ip4_arp_inline (vm, node, frame, 0));
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001781}
1782
1783static uword
Dave Barachd7cb1b52016-12-09 09:52:16 -05001784ip4_glean (vlib_main_t * vm, vlib_node_runtime_t * node, vlib_frame_t * frame)
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001785{
Dave Barachd7cb1b52016-12-09 09:52:16 -05001786 return (ip4_arp_inline (vm, node, frame, 1));
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001787}
1788
Dave Barachd7cb1b52016-12-09 09:52:16 -05001789static char *ip4_arp_error_strings[] = {
Ed Warnickecb9cada2015-12-08 15:45:58 -07001790 [IP4_ARP_ERROR_DROP] = "address overflow drops",
1791 [IP4_ARP_ERROR_REQUEST_SENT] = "ARP requests sent",
1792 [IP4_ARP_ERROR_NON_ARP_ADJ] = "ARPs to non-ARP adjacencies",
1793 [IP4_ARP_ERROR_REPLICATE_DROP] = "ARP replication completed",
1794 [IP4_ARP_ERROR_REPLICATE_FAIL] = "ARP replication failed",
Pierre Pfisterd076f192016-06-22 12:58:30 +01001795 [IP4_ARP_ERROR_NO_SOURCE_ADDRESS] = "no source address for ARP request",
Ed Warnickecb9cada2015-12-08 15:45:58 -07001796};
1797
Neale Rannsf8686322017-11-29 02:39:53 -08001798/* *INDENT-OFF* */
Dave Barachd7cb1b52016-12-09 09:52:16 -05001799VLIB_REGISTER_NODE (ip4_arp_node) =
1800{
Neale Rannsf8686322017-11-29 02:39:53 -08001801 .function = ip4_arp,
1802 .name = "ip4-arp",
1803 .vector_size = sizeof (u32),
1804 .format_trace = format_ip4_forward_next_trace,
1805 .n_errors = ARRAY_LEN (ip4_arp_error_strings),
1806 .error_strings = ip4_arp_error_strings,
1807 .n_next_nodes = IP4_ARP_N_NEXT,
1808 .next_nodes =
Dave Barachd7cb1b52016-12-09 09:52:16 -05001809 {
Neale Rannsf8686322017-11-29 02:39:53 -08001810 [IP4_ARP_NEXT_DROP] = "error-drop",
1811 },
1812};
Ed Warnickecb9cada2015-12-08 15:45:58 -07001813
Dave Barachd7cb1b52016-12-09 09:52:16 -05001814VLIB_REGISTER_NODE (ip4_glean_node) =
1815{
Neale Rannsf8686322017-11-29 02:39:53 -08001816 .function = ip4_glean,
1817 .name = "ip4-glean",
1818 .vector_size = sizeof (u32),
1819 .format_trace = format_ip4_forward_next_trace,
1820 .n_errors = ARRAY_LEN (ip4_arp_error_strings),
1821 .error_strings = ip4_arp_error_strings,
1822 .n_next_nodes = IP4_ARP_N_NEXT,
1823 .next_nodes = {
1824 [IP4_ARP_NEXT_DROP] = "error-drop",
1825 },
1826};
1827/* *INDENT-ON* */
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001828
Ed Warnickecb9cada2015-12-08 15:45:58 -07001829#define foreach_notrace_ip4_arp_error \
1830_(DROP) \
1831_(REQUEST_SENT) \
1832_(REPLICATE_DROP) \
1833_(REPLICATE_FAIL)
1834
Dave Barachd7cb1b52016-12-09 09:52:16 -05001835clib_error_t *
1836arp_notrace_init (vlib_main_t * vm)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001837{
Dave Barachd7cb1b52016-12-09 09:52:16 -05001838 vlib_node_runtime_t *rt = vlib_node_get_runtime (vm, ip4_arp_node.index);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001839
1840 /* don't trace ARP request packets */
1841#define _(a) \
1842 vnet_pcap_drop_trace_filter_add_del \
1843 (rt->errors[IP4_ARP_ERROR_##a], \
1844 1 /* is_add */);
Dave Barachd7cb1b52016-12-09 09:52:16 -05001845 foreach_notrace_ip4_arp_error;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001846#undef _
1847 return 0;
1848}
1849
Dave Barachd7cb1b52016-12-09 09:52:16 -05001850VLIB_INIT_FUNCTION (arp_notrace_init);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001851
1852
1853/* Send an ARP request to see if given destination is reachable on given interface. */
1854clib_error_t *
1855ip4_probe_neighbor (vlib_main_t * vm, ip4_address_t * dst, u32 sw_if_index)
1856{
Dave Barachd7cb1b52016-12-09 09:52:16 -05001857 vnet_main_t *vnm = vnet_get_main ();
1858 ip4_main_t *im = &ip4_main;
1859 ethernet_arp_header_t *h;
1860 ip4_address_t *src;
1861 ip_interface_address_t *ia;
1862 ip_adjacency_t *adj;
1863 vnet_hw_interface_t *hi;
1864 vnet_sw_interface_t *si;
1865 vlib_buffer_t *b;
Neale Ranns7a272742017-05-30 02:08:14 -07001866 adj_index_t ai;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001867 u32 bi = 0;
1868
1869 si = vnet_get_sw_interface (vnm, sw_if_index);
1870
1871 if (!(si->flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP))
1872 {
1873 return clib_error_return (0, "%U: interface %U down",
Dave Barachd7cb1b52016-12-09 09:52:16 -05001874 format_ip4_address, dst,
1875 format_vnet_sw_if_index_name, vnm,
1876 sw_if_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001877 }
1878
Dave Barachd7cb1b52016-12-09 09:52:16 -05001879 src =
1880 ip4_interface_address_matching_destination (im, dst, sw_if_index, &ia);
1881 if (!src)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001882 {
1883 vnm->api_errno = VNET_API_ERROR_NO_MATCHING_INTERFACE;
Dave Barach75fc8542016-10-11 16:16:02 -04001884 return clib_error_return
Neale Ranns32e1c012016-11-22 17:07:28 +00001885 (0,
1886 "no matching interface address for destination %U (interface %U)",
1887 format_ip4_address, dst, format_vnet_sw_if_index_name, vnm,
1888 sw_if_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001889 }
1890
Neale Ranns7a272742017-05-30 02:08:14 -07001891 h = vlib_packet_template_get_packet (vm,
1892 &im->ip4_arp_request_packet_template,
1893 &bi);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001894
1895 hi = vnet_get_sup_hw_interface (vnm, sw_if_index);
Pavel Kotucek57808982017-08-02 08:20:19 +02001896 if (PREDICT_FALSE (!hi->hw_address))
1897 {
1898 return clib_error_return (0, "%U: interface %U do not support ip probe",
1899 format_ip4_address, dst,
1900 format_vnet_sw_if_index_name, vnm,
1901 sw_if_index);
1902 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07001903
Dave Barachd7cb1b52016-12-09 09:52:16 -05001904 clib_memcpy (h->ip4_over_ethernet[0].ethernet, hi->hw_address,
1905 sizeof (h->ip4_over_ethernet[0].ethernet));
Ed Warnickecb9cada2015-12-08 15:45:58 -07001906
1907 h->ip4_over_ethernet[0].ip4 = src[0];
1908 h->ip4_over_ethernet[1].ip4 = dst[0];
1909
1910 b = vlib_get_buffer (vm, bi);
Dave Barachd7cb1b52016-12-09 09:52:16 -05001911 vnet_buffer (b)->sw_if_index[VLIB_RX] =
1912 vnet_buffer (b)->sw_if_index[VLIB_TX] = sw_if_index;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001913
Dave Barach59b25652017-09-10 15:04:27 -04001914 ip46_address_t nh = {
1915 .ip4 = *dst,
1916 };
1917
1918 ai = adj_nbr_add_or_lock (FIB_PROTOCOL_IP4,
1919 VNET_LINK_IP4, &nh, sw_if_index);
1920 adj = adj_get (ai);
1921
1922 /* Peer has been previously resolved, retrieve glean adj instead */
1923 if (adj->lookup_next_index == IP_LOOKUP_NEXT_REWRITE)
1924 {
1925 adj_unlock (ai);
1926 ai = adj_glean_add_or_lock (FIB_PROTOCOL_IP4, sw_if_index, &nh);
1927 adj = adj_get (ai);
1928 }
1929
Ed Warnickecb9cada2015-12-08 15:45:58 -07001930 /* Add encapsulation string for software interface (e.g. ethernet header). */
1931 vnet_rewrite_one_header (adj[0], h, sizeof (ethernet_header_t));
1932 vlib_buffer_advance (b, -adj->rewrite_header.data_bytes);
1933
1934 {
Dave Barachd7cb1b52016-12-09 09:52:16 -05001935 vlib_frame_t *f = vlib_get_frame_to_node (vm, hi->output_node_index);
1936 u32 *to_next = vlib_frame_vector_args (f);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001937 to_next[0] = bi;
1938 f->n_vectors = 1;
1939 vlib_put_frame_to_node (vm, hi->output_node_index, f);
1940 }
1941
Neale Ranns7a272742017-05-30 02:08:14 -07001942 adj_unlock (ai);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001943 return /* no error */ 0;
1944}
1945
/* Next-node slots used by the ip4 rewrite worker. */
typedef enum
{
  IP4_REWRITE_NEXT_DROP = 0,
  IP4_REWRITE_NEXT_ICMP_ERROR = 1,
} ip4_rewrite_next_t;
1951
1952always_inline uword
1953ip4_rewrite_inline (vlib_main_t * vm,
1954 vlib_node_runtime_t * node,
Neale Ranns9c6a6132017-02-21 05:33:14 -08001955 vlib_frame_t * frame,
1956 int do_counters, int is_midchain, int is_mcast)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001957{
Dave Barachd7cb1b52016-12-09 09:52:16 -05001958 ip_lookup_main_t *lm = &ip4_main.lookup_main;
1959 u32 *from = vlib_frame_vector_args (frame);
1960 u32 n_left_from, n_left_to_next, *to_next, next_index;
1961 vlib_node_runtime_t *error_node =
1962 vlib_node_get_runtime (vm, ip4_input_node.index);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001963
1964 n_left_from = frame->n_vectors;
1965 next_index = node->cached_next_index;
Damjan Marion586afd72017-04-05 19:18:20 +02001966 u32 thread_index = vlib_get_thread_index ();
Dave Barach75fc8542016-10-11 16:16:02 -04001967
Ed Warnickecb9cada2015-12-08 15:45:58 -07001968 while (n_left_from > 0)
1969 {
1970 vlib_get_next_frame (vm, node, next_index, to_next, n_left_to_next);
1971
1972 while (n_left_from >= 4 && n_left_to_next >= 2)
1973 {
Dave Barachd7cb1b52016-12-09 09:52:16 -05001974 ip_adjacency_t *adj0, *adj1;
1975 vlib_buffer_t *p0, *p1;
1976 ip4_header_t *ip0, *ip1;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001977 u32 pi0, rw_len0, next0, error0, checksum0, adj_index0;
1978 u32 pi1, rw_len1, next1, error1, checksum1, adj_index1;
Dave Barachd7cb1b52016-12-09 09:52:16 -05001979 u32 tx_sw_if_index0, tx_sw_if_index1;
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001980
Ed Warnickecb9cada2015-12-08 15:45:58 -07001981 /* Prefetch next iteration. */
1982 {
Dave Barachd7cb1b52016-12-09 09:52:16 -05001983 vlib_buffer_t *p2, *p3;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001984
1985 p2 = vlib_get_buffer (vm, from[2]);
1986 p3 = vlib_get_buffer (vm, from[3]);
1987
1988 vlib_prefetch_buffer_header (p2, STORE);
1989 vlib_prefetch_buffer_header (p3, STORE);
1990
1991 CLIB_PREFETCH (p2->data, sizeof (ip0[0]), STORE);
1992 CLIB_PREFETCH (p3->data, sizeof (ip0[0]), STORE);
1993 }
1994
1995 pi0 = to_next[0] = from[0];
1996 pi1 = to_next[1] = from[1];
1997
1998 from += 2;
1999 n_left_from -= 2;
2000 to_next += 2;
2001 n_left_to_next -= 2;
Dave Barach75fc8542016-10-11 16:16:02 -04002002
Ed Warnickecb9cada2015-12-08 15:45:58 -07002003 p0 = vlib_get_buffer (vm, pi0);
2004 p1 = vlib_get_buffer (vm, pi1);
2005
Neale Rannsf06aea52016-11-29 06:51:37 -08002006 adj_index0 = vnet_buffer (p0)->ip.adj_index[VLIB_TX];
2007 adj_index1 = vnet_buffer (p1)->ip.adj_index[VLIB_TX];
Ed Warnickecb9cada2015-12-08 15:45:58 -07002008
Neale Ranns1bd01092017-03-15 15:41:17 -04002009 /*
2010 * pre-fetch the per-adjacency counters
2011 */
2012 if (do_counters)
2013 {
2014 vlib_prefetch_combined_counter (&adjacency_counters,
Damjan Marion586afd72017-04-05 19:18:20 +02002015 thread_index, adj_index0);
Neale Ranns1bd01092017-03-15 15:41:17 -04002016 vlib_prefetch_combined_counter (&adjacency_counters,
Damjan Marion586afd72017-04-05 19:18:20 +02002017 thread_index, adj_index1);
Neale Ranns1bd01092017-03-15 15:41:17 -04002018 }
2019
Ed Warnickecb9cada2015-12-08 15:45:58 -07002020 ip0 = vlib_buffer_get_current (p0);
2021 ip1 = vlib_buffer_get_current (p1);
2022
2023 error0 = error1 = IP4_ERROR_NONE;
Dave Barachd7cb1b52016-12-09 09:52:16 -05002024 next0 = next1 = IP4_REWRITE_NEXT_DROP;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002025
2026 /* Decrement TTL & update checksum.
2027 Works either endian, so no need for byte swap. */
Damjan Marion213b5aa2017-07-13 21:19:27 +02002028 if (PREDICT_TRUE (!(p0->flags & VNET_BUFFER_F_LOCALLY_ORIGINATED)))
Ed Warnickecb9cada2015-12-08 15:45:58 -07002029 {
Dave Barachd7cb1b52016-12-09 09:52:16 -05002030 i32 ttl0 = ip0->ttl;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002031
2032 /* Input node should have reject packets with ttl 0. */
2033 ASSERT (ip0->ttl > 0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07002034
2035 checksum0 = ip0->checksum + clib_host_to_net_u16 (0x0100);
Ed Warnickecb9cada2015-12-08 15:45:58 -07002036 checksum0 += checksum0 >= 0xffff;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002037
2038 ip0->checksum = checksum0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002039 ttl0 -= 1;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002040 ip0->ttl = ttl0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002041
Dave Barachd7cb1b52016-12-09 09:52:16 -05002042 /*
2043 * If the ttl drops below 1 when forwarding, generate
2044 * an ICMP response.
2045 */
2046 if (PREDICT_FALSE (ttl0 <= 0))
2047 {
2048 error0 = IP4_ERROR_TIME_EXPIRED;
2049 vnet_buffer (p0)->sw_if_index[VLIB_TX] = (u32) ~ 0;
2050 icmp4_error_set_vnet_buffer (p0, ICMP4_time_exceeded,
2051 ICMP4_time_exceeded_ttl_exceeded_in_transit,
2052 0);
2053 next0 = IP4_REWRITE_NEXT_ICMP_ERROR;
2054 }
Neale Rannsf06aea52016-11-29 06:51:37 -08002055
2056 /* Verify checksum. */
Dave Barach2c0a4f42017-06-29 09:30:15 -04002057 ASSERT ((ip0->checksum == ip4_header_checksum (ip0)) ||
Damjan Marionfb3288f2017-07-19 15:07:10 +02002058 (p0->flags & VNET_BUFFER_F_OFFLOAD_IP_CKSUM));
Neale Rannsf06aea52016-11-29 06:51:37 -08002059 }
Dave Barachd7cb1b52016-12-09 09:52:16 -05002060 else
2061 {
Damjan Marion213b5aa2017-07-13 21:19:27 +02002062 p0->flags &= ~VNET_BUFFER_F_LOCALLY_ORIGINATED;
Dave Barachd7cb1b52016-12-09 09:52:16 -05002063 }
Damjan Marion213b5aa2017-07-13 21:19:27 +02002064 if (PREDICT_TRUE (!(p1->flags & VNET_BUFFER_F_LOCALLY_ORIGINATED)))
Neale Rannsf06aea52016-11-29 06:51:37 -08002065 {
2066 i32 ttl1 = ip1->ttl;
2067
2068 /* Input node should have reject packets with ttl 0. */
2069 ASSERT (ip1->ttl > 0);
2070
2071 checksum1 = ip1->checksum + clib_host_to_net_u16 (0x0100);
2072 checksum1 += checksum1 >= 0xffff;
2073
2074 ip1->checksum = checksum1;
2075 ttl1 -= 1;
2076 ip1->ttl = ttl1;
2077
Dave Barachd7cb1b52016-12-09 09:52:16 -05002078 /*
2079 * If the ttl drops below 1 when forwarding, generate
2080 * an ICMP response.
2081 */
2082 if (PREDICT_FALSE (ttl1 <= 0))
2083 {
2084 error1 = IP4_ERROR_TIME_EXPIRED;
2085 vnet_buffer (p1)->sw_if_index[VLIB_TX] = (u32) ~ 0;
2086 icmp4_error_set_vnet_buffer (p1, ICMP4_time_exceeded,
2087 ICMP4_time_exceeded_ttl_exceeded_in_transit,
2088 0);
2089 next1 = IP4_REWRITE_NEXT_ICMP_ERROR;
2090 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07002091
2092 /* Verify checksum. */
Dave Barach2c0a4f42017-06-29 09:30:15 -04002093 ASSERT ((ip1->checksum == ip4_header_checksum (ip1)) ||
Damjan Marionfb3288f2017-07-19 15:07:10 +02002094 (p1->flags & VNET_BUFFER_F_OFFLOAD_IP_CKSUM));
Ed Warnickecb9cada2015-12-08 15:45:58 -07002095 }
Dave Barachd7cb1b52016-12-09 09:52:16 -05002096 else
2097 {
Damjan Marion213b5aa2017-07-13 21:19:27 +02002098 p1->flags &= ~VNET_BUFFER_F_LOCALLY_ORIGINATED;
Dave Barachd7cb1b52016-12-09 09:52:16 -05002099 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07002100
2101 /* Rewrite packet header and updates lengths. */
Neale Ranns107e7d42017-04-11 09:55:19 -07002102 adj0 = adj_get (adj_index0);
2103 adj1 = adj_get (adj_index1);
Dave Barach75fc8542016-10-11 16:16:02 -04002104
Dave Barachd7cb1b52016-12-09 09:52:16 -05002105 /* Worth pipelining. No guarantee that adj0,1 are hot... */
Ed Warnickecb9cada2015-12-08 15:45:58 -07002106 rw_len0 = adj0[0].rewrite_header.data_bytes;
2107 rw_len1 = adj1[0].rewrite_header.data_bytes;
Dave Barachd7cb1b52016-12-09 09:52:16 -05002108 vnet_buffer (p0)->ip.save_rewrite_length = rw_len0;
2109 vnet_buffer (p1)->ip.save_rewrite_length = rw_len1;
Chris Lukef2868fc2016-06-14 16:26:22 -04002110
Dave Barachd7cb1b52016-12-09 09:52:16 -05002111 /* Check MTU of outgoing interface. */
Neale Rannsffd78d12018-02-09 06:05:16 -08002112 if (vlib_buffer_length_in_chain (vm, p0) >
2113 adj0[0].rewrite_header.max_l3_packet_bytes)
2114 {
2115 error0 = IP4_ERROR_MTU_EXCEEDED;
2116 next0 = IP4_REWRITE_NEXT_ICMP_ERROR;
2117 icmp4_error_set_vnet_buffer
2118 (p0, ICMP4_destination_unreachable,
2119 ICMP4_destination_unreachable_fragmentation_needed_and_dont_fragment_set,
2120 0);
2121 }
2122 if (vlib_buffer_length_in_chain (vm, p1) >
2123 adj1[0].rewrite_header.max_l3_packet_bytes)
2124 {
2125 error1 = IP4_ERROR_MTU_EXCEEDED;
2126 next1 = IP4_REWRITE_NEXT_ICMP_ERROR;
2127 icmp4_error_set_vnet_buffer
2128 (p1, ICMP4_destination_unreachable,
2129 ICMP4_destination_unreachable_fragmentation_needed_and_dont_fragment_set,
2130 0);
2131 }
Chris Lukef2868fc2016-06-14 16:26:22 -04002132
Neale Rannscf3561b2017-12-13 01:44:25 -08002133 if (is_mcast)
2134 {
2135 error0 = ((adj0[0].rewrite_header.sw_if_index ==
2136 vnet_buffer (p0)->sw_if_index[VLIB_RX]) ?
2137 IP4_ERROR_SAME_INTERFACE : error0);
2138 error1 = ((adj1[0].rewrite_header.sw_if_index ==
2139 vnet_buffer (p1)->sw_if_index[VLIB_RX]) ?
2140 IP4_ERROR_SAME_INTERFACE : error1);
2141 }
2142
Chun Lief56fae2018-02-07 09:58:28 +08002143 p0->error = error_node->errors[error0];
2144 p1->error = error_node->errors[error1];
Dave Barachd7cb1b52016-12-09 09:52:16 -05002145 /* Don't adjust the buffer for ttl issue; icmp-error node wants
2146 * to see the IP headerr */
2147 if (PREDICT_TRUE (error0 == IP4_ERROR_NONE))
2148 {
Damjan Marion892e0762016-12-09 18:52:05 +01002149 next0 = adj0[0].rewrite_header.next_index;
Dave Barachd7cb1b52016-12-09 09:52:16 -05002150 p0->current_data -= rw_len0;
2151 p0->current_length += rw_len0;
2152 tx_sw_if_index0 = adj0[0].rewrite_header.sw_if_index;
2153 vnet_buffer (p0)->sw_if_index[VLIB_TX] = tx_sw_if_index0;
Dave Barach5331c722016-08-17 11:54:30 -04002154
Neale Rannsb069a692017-03-15 12:34:25 -04002155 if (PREDICT_FALSE
2156 (adj0[0].rewrite_header.flags & VNET_REWRITE_HAS_FEATURES))
2157 vnet_feature_arc_start (lm->output_feature_arc_index,
2158 tx_sw_if_index0, &next0, p0);
Dave Barachd7cb1b52016-12-09 09:52:16 -05002159 }
2160 if (PREDICT_TRUE (error1 == IP4_ERROR_NONE))
2161 {
Damjan Marion892e0762016-12-09 18:52:05 +01002162 next1 = adj1[0].rewrite_header.next_index;
Dave Barachd7cb1b52016-12-09 09:52:16 -05002163 p1->current_data -= rw_len1;
2164 p1->current_length += rw_len1;
Dave Barach5331c722016-08-17 11:54:30 -04002165
Dave Barachd7cb1b52016-12-09 09:52:16 -05002166 tx_sw_if_index1 = adj1[0].rewrite_header.sw_if_index;
2167 vnet_buffer (p1)->sw_if_index[VLIB_TX] = tx_sw_if_index1;
Dave Barach5331c722016-08-17 11:54:30 -04002168
Neale Rannsb069a692017-03-15 12:34:25 -04002169 if (PREDICT_FALSE
2170 (adj1[0].rewrite_header.flags & VNET_REWRITE_HAS_FEATURES))
2171 vnet_feature_arc_start (lm->output_feature_arc_index,
2172 tx_sw_if_index1, &next1, p1);
Dave Barachd7cb1b52016-12-09 09:52:16 -05002173 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07002174
2175 /* Guess we are only writing on simple Ethernet header. */
2176 vnet_rewrite_two_headers (adj0[0], adj1[0],
Dave Barachd7cb1b52016-12-09 09:52:16 -05002177 ip0, ip1, sizeof (ethernet_header_t));
Neale Ranns5e575b12016-10-03 09:40:25 +01002178
Neale Ranns044183f2017-01-24 01:34:25 -08002179 /*
2180 * Bump the per-adjacency counters
2181 */
Neale Ranns9c6a6132017-02-21 05:33:14 -08002182 if (do_counters)
2183 {
2184 vlib_increment_combined_counter
2185 (&adjacency_counters,
Damjan Marion586afd72017-04-05 19:18:20 +02002186 thread_index,
Neale Ranns9c6a6132017-02-21 05:33:14 -08002187 adj_index0, 1,
2188 vlib_buffer_length_in_chain (vm, p0) + rw_len0);
Neale Ranns044183f2017-01-24 01:34:25 -08002189
Neale Ranns9c6a6132017-02-21 05:33:14 -08002190 vlib_increment_combined_counter
2191 (&adjacency_counters,
Damjan Marion586afd72017-04-05 19:18:20 +02002192 thread_index,
Neale Ranns9c6a6132017-02-21 05:33:14 -08002193 adj_index1, 1,
2194 vlib_buffer_length_in_chain (vm, p1) + rw_len1);
2195 }
Neale Ranns044183f2017-01-24 01:34:25 -08002196
Neale Ranns5e575b12016-10-03 09:40:25 +01002197 if (is_midchain)
Dave Barachd7cb1b52016-12-09 09:52:16 -05002198 {
Neale Rannsdb14f5a2018-01-29 10:43:33 -08002199 adj0->sub_type.midchain.fixup_func
2200 (vm, adj0, p0, adj0->sub_type.midchain.fixup_data);
2201 adj1->sub_type.midchain.fixup_func
2202 (vm, adj1, p1, adj0->sub_type.midchain.fixup_data);
Dave Barachd7cb1b52016-12-09 09:52:16 -05002203 }
Neale Ranns32e1c012016-11-22 17:07:28 +00002204 if (is_mcast)
2205 {
2206 /*
2207 * copy bytes from the IP address into the MAC rewrite
2208 */
Neale Ranns2e7fbcc2017-03-15 04:22:25 -07002209 vnet_fixup_one_header (adj0[0], &ip0->dst_address, ip0);
2210 vnet_fixup_one_header (adj1[0], &ip1->dst_address, ip1);
Neale Ranns32e1c012016-11-22 17:07:28 +00002211 }
Dave Barach75fc8542016-10-11 16:16:02 -04002212
Ed Warnickecb9cada2015-12-08 15:45:58 -07002213 vlib_validate_buffer_enqueue_x2 (vm, node, next_index,
2214 to_next, n_left_to_next,
2215 pi0, pi1, next0, next1);
2216 }
2217
2218 while (n_left_from > 0 && n_left_to_next > 0)
2219 {
Dave Barachd7cb1b52016-12-09 09:52:16 -05002220 ip_adjacency_t *adj0;
2221 vlib_buffer_t *p0;
2222 ip4_header_t *ip0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002223 u32 pi0, rw_len0, adj_index0, next0, error0, checksum0;
Dave Barachd7cb1b52016-12-09 09:52:16 -05002224 u32 tx_sw_if_index0;
Neale Ranns0bfe5d82016-08-25 15:29:12 +01002225
Ed Warnickecb9cada2015-12-08 15:45:58 -07002226 pi0 = to_next[0] = from[0];
2227
2228 p0 = vlib_get_buffer (vm, pi0);
2229
Neale Rannsf06aea52016-11-29 06:51:37 -08002230 adj_index0 = vnet_buffer (p0)->ip.adj_index[VLIB_TX];
Ed Warnickecb9cada2015-12-08 15:45:58 -07002231
Neale Ranns107e7d42017-04-11 09:55:19 -07002232 adj0 = adj_get (adj_index0);
Dave Barach75fc8542016-10-11 16:16:02 -04002233
Ed Warnickecb9cada2015-12-08 15:45:58 -07002234 ip0 = vlib_buffer_get_current (p0);
2235
2236 error0 = IP4_ERROR_NONE;
Dave Barachd7cb1b52016-12-09 09:52:16 -05002237 next0 = IP4_REWRITE_NEXT_DROP; /* drop on error */
Ed Warnickecb9cada2015-12-08 15:45:58 -07002238
2239 /* Decrement TTL & update checksum. */
Damjan Marion213b5aa2017-07-13 21:19:27 +02002240 if (PREDICT_TRUE (!(p0->flags & VNET_BUFFER_F_LOCALLY_ORIGINATED)))
Ed Warnickecb9cada2015-12-08 15:45:58 -07002241 {
2242 i32 ttl0 = ip0->ttl;
2243
2244 checksum0 = ip0->checksum + clib_host_to_net_u16 (0x0100);
2245
2246 checksum0 += checksum0 >= 0xffff;
2247
2248 ip0->checksum = checksum0;
2249
2250 ASSERT (ip0->ttl > 0);
2251
2252 ttl0 -= 1;
2253
2254 ip0->ttl = ttl0;
2255
Dave Barach2c0a4f42017-06-29 09:30:15 -04002256 ASSERT ((ip0->checksum == ip4_header_checksum (ip0)) ||
Damjan Marionfb3288f2017-07-19 15:07:10 +02002257 (p0->flags & VNET_BUFFER_F_OFFLOAD_IP_CKSUM));
Ed Warnickecb9cada2015-12-08 15:45:58 -07002258
Dave Barachd7cb1b52016-12-09 09:52:16 -05002259 if (PREDICT_FALSE (ttl0 <= 0))
2260 {
2261 /*
2262 * If the ttl drops below 1 when forwarding, generate
2263 * an ICMP response.
2264 */
2265 error0 = IP4_ERROR_TIME_EXPIRED;
2266 next0 = IP4_REWRITE_NEXT_ICMP_ERROR;
2267 vnet_buffer (p0)->sw_if_index[VLIB_TX] = (u32) ~ 0;
2268 icmp4_error_set_vnet_buffer (p0, ICMP4_time_exceeded,
2269 ICMP4_time_exceeded_ttl_exceeded_in_transit,
2270 0);
2271 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07002272 }
Dave Barachd7cb1b52016-12-09 09:52:16 -05002273 else
2274 {
Damjan Marion213b5aa2017-07-13 21:19:27 +02002275 p0->flags &= ~VNET_BUFFER_F_LOCALLY_ORIGINATED;
Dave Barachd7cb1b52016-12-09 09:52:16 -05002276 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07002277
Neale Ranns1bd01092017-03-15 15:41:17 -04002278 if (do_counters)
2279 vlib_prefetch_combined_counter (&adjacency_counters,
Damjan Marion586afd72017-04-05 19:18:20 +02002280 thread_index, adj_index0);
Neale Ranns044183f2017-01-24 01:34:25 -08002281
Ed Warnickecb9cada2015-12-08 15:45:58 -07002282 /* Guess we are only writing on simple Ethernet header. */
Dave Barachd7cb1b52016-12-09 09:52:16 -05002283 vnet_rewrite_one_header (adj0[0], ip0, sizeof (ethernet_header_t));
Neale Ranns32e1c012016-11-22 17:07:28 +00002284 if (is_mcast)
2285 {
2286 /*
2287 * copy bytes from the IP address into the MAC rewrite
2288 */
Neale Ranns2e7fbcc2017-03-15 04:22:25 -07002289 vnet_fixup_one_header (adj0[0], &ip0->dst_address, ip0);
Neale Ranns32e1c012016-11-22 17:07:28 +00002290 }
Dave Barach75fc8542016-10-11 16:16:02 -04002291
Dave Barachd7cb1b52016-12-09 09:52:16 -05002292 /* Update packet buffer attributes/set output interface. */
2293 rw_len0 = adj0[0].rewrite_header.data_bytes;
2294 vnet_buffer (p0)->ip.save_rewrite_length = rw_len0;
Dave Barach75fc8542016-10-11 16:16:02 -04002295
Neale Ranns1bd01092017-03-15 15:41:17 -04002296 if (do_counters)
2297 vlib_increment_combined_counter
2298 (&adjacency_counters,
Damjan Marion586afd72017-04-05 19:18:20 +02002299 thread_index, adj_index0, 1,
Neale Ranns1bd01092017-03-15 15:41:17 -04002300 vlib_buffer_length_in_chain (vm, p0) + rw_len0);
Dave Barach75fc8542016-10-11 16:16:02 -04002301
Dave Barachd7cb1b52016-12-09 09:52:16 -05002302 /* Check MTU of outgoing interface. */
Neale Rannsffd78d12018-02-09 06:05:16 -08002303 if (vlib_buffer_length_in_chain (vm, p0) >
2304 adj0[0].rewrite_header.max_l3_packet_bytes)
2305 {
2306 error0 = IP4_ERROR_MTU_EXCEEDED;
2307 next0 = IP4_REWRITE_NEXT_ICMP_ERROR;
2308 icmp4_error_set_vnet_buffer
2309 (p0, ICMP4_destination_unreachable,
2310 ICMP4_destination_unreachable_fragmentation_needed_and_dont_fragment_set,
2311 0);
2312 }
Neale Rannscf3561b2017-12-13 01:44:25 -08002313 if (is_mcast)
2314 {
2315 error0 = ((adj0[0].rewrite_header.sw_if_index ==
2316 vnet_buffer (p0)->sw_if_index[VLIB_RX]) ?
2317 IP4_ERROR_SAME_INTERFACE : error0);
2318 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07002319 p0->error = error_node->errors[error0];
Chris Luke816f3e12016-06-14 16:24:47 -04002320
Dave Barachd7cb1b52016-12-09 09:52:16 -05002321 /* Don't adjust the buffer for ttl issue; icmp-error node wants
2322 * to see the IP headerr */
2323 if (PREDICT_TRUE (error0 == IP4_ERROR_NONE))
2324 {
2325 p0->current_data -= rw_len0;
2326 p0->current_length += rw_len0;
2327 tx_sw_if_index0 = adj0[0].rewrite_header.sw_if_index;
Chris Luke816f3e12016-06-14 16:24:47 -04002328
Dave Barachd7cb1b52016-12-09 09:52:16 -05002329 vnet_buffer (p0)->sw_if_index[VLIB_TX] = tx_sw_if_index0;
2330 next0 = adj0[0].rewrite_header.next_index;
Dave Barach5331c722016-08-17 11:54:30 -04002331
Neale Ranns5e575b12016-10-03 09:40:25 +01002332 if (is_midchain)
Dave Barachd7cb1b52016-12-09 09:52:16 -05002333 {
Neale Rannsdb14f5a2018-01-29 10:43:33 -08002334 adj0->sub_type.midchain.fixup_func
2335 (vm, adj0, p0, adj0->sub_type.midchain.fixup_data);
Neale Ranns5e575b12016-10-03 09:40:25 +01002336 }
2337
Neale Rannsb069a692017-03-15 12:34:25 -04002338 if (PREDICT_FALSE
2339 (adj0[0].rewrite_header.flags & VNET_REWRITE_HAS_FEATURES))
2340 vnet_feature_arc_start (lm->output_feature_arc_index,
2341 tx_sw_if_index0, &next0, p0);
Damjan Marion8b3191e2016-11-09 19:54:20 +01002342
Dave Barachd7cb1b52016-12-09 09:52:16 -05002343 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07002344
Ed Warnickecb9cada2015-12-08 15:45:58 -07002345 from += 1;
2346 n_left_from -= 1;
2347 to_next += 1;
2348 n_left_to_next -= 1;
Dave Barach75fc8542016-10-11 16:16:02 -04002349
Ed Warnickecb9cada2015-12-08 15:45:58 -07002350 vlib_validate_buffer_enqueue_x1 (vm, node, next_index,
2351 to_next, n_left_to_next,
2352 pi0, next0);
2353 }
Dave Barach75fc8542016-10-11 16:16:02 -04002354
Ed Warnickecb9cada2015-12-08 15:45:58 -07002355 vlib_put_next_frame (vm, node, next_index, n_left_to_next);
2356 }
2357
2358 /* Need to do trace after rewrites to pick up new packet data. */
2359 if (node->flags & VLIB_NODE_FLAG_TRACE)
Neale Rannsf06aea52016-11-29 06:51:37 -08002360 ip4_forward_next_trace (vm, node, frame, VLIB_TX);
Ed Warnickecb9cada2015-12-08 15:45:58 -07002361
2362 return frame->n_vectors;
2363}
2364
Dave Barach132d51d2016-07-07 10:10:17 -04002365
/** @brief IPv4 rewrite node.
    @node ip4-rewrite

    This is the IPv4 transit-rewrite node: decrement TTL, fix the ipv4
    header checksum, fetch the ip adjacency, check the outbound mtu,
    apply the adjacency rewrite, and send pkts to the adjacency
    rewrite header's next_index.

    @param vm vlib_main_t corresponding to the current thread
    @param node vlib_node_runtime_t
    @param frame vlib_frame_t whose contents should be dispatched

    @par Graph mechanics: buffer metadata, next index usage

    @em Uses:
    - <code>vnet_buffer(b)->ip.adj_index[VLIB_TX]</code>
        - the rewrite adjacency index
    - <code>adj->lookup_next_index</code>
        - Must be IP_LOOKUP_NEXT_REWRITE or IP_LOOKUP_NEXT_ARP, otherwise
          the packet will be dropped.
    - <code>adj->rewrite_header</code>
        - Rewrite string length, rewrite string, next_index

    @em Sets:
    - <code>b->current_data, b->current_length</code>
        - Updated net of applying the rewrite string

    <em>Next Indices:</em>
    - <code> adj->rewrite_header.next_index </code>
      or @c ip4-drop or @c ip4-icmp-error
*/
Ed Warnickecb9cada2015-12-08 15:45:58 -07002397static uword
Neale Rannsf06aea52016-11-29 06:51:37 -08002398ip4_rewrite (vlib_main_t * vm,
Dave Barachd7cb1b52016-12-09 09:52:16 -05002399 vlib_node_runtime_t * node, vlib_frame_t * frame)
Ed Warnickecb9cada2015-12-08 15:45:58 -07002400{
Neale Ranns9c6a6132017-02-21 05:33:14 -08002401 if (adj_are_counters_enabled ())
2402 return ip4_rewrite_inline (vm, node, frame, 1, 0, 0);
2403 else
2404 return ip4_rewrite_inline (vm, node, frame, 0, 0, 0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07002405}
2406
Neale Ranns0bfe5d82016-08-25 15:29:12 +01002407static uword
2408ip4_midchain (vlib_main_t * vm,
Dave Barachd7cb1b52016-12-09 09:52:16 -05002409 vlib_node_runtime_t * node, vlib_frame_t * frame)
Neale Ranns0bfe5d82016-08-25 15:29:12 +01002410{
Neale Ranns9c6a6132017-02-21 05:33:14 -08002411 if (adj_are_counters_enabled ())
2412 return ip4_rewrite_inline (vm, node, frame, 1, 1, 0);
2413 else
2414 return ip4_rewrite_inline (vm, node, frame, 0, 1, 0);
Neale Ranns0bfe5d82016-08-25 15:29:12 +01002415}
2416
Neale Ranns32e1c012016-11-22 17:07:28 +00002417static uword
2418ip4_rewrite_mcast (vlib_main_t * vm,
2419 vlib_node_runtime_t * node, vlib_frame_t * frame)
Dave Barachd7cb1b52016-12-09 09:52:16 -05002420{
Neale Ranns9c6a6132017-02-21 05:33:14 -08002421 if (adj_are_counters_enabled ())
2422 return ip4_rewrite_inline (vm, node, frame, 1, 0, 1);
2423 else
2424 return ip4_rewrite_inline (vm, node, frame, 0, 0, 1);
Neale Ranns32e1c012016-11-22 17:07:28 +00002425}
Ed Warnickecb9cada2015-12-08 15:45:58 -07002426
Neale Ranns0f26c5a2017-03-01 15:12:11 -08002427static uword
2428ip4_mcast_midchain (vlib_main_t * vm,
2429 vlib_node_runtime_t * node, vlib_frame_t * frame)
2430{
2431 if (adj_are_counters_enabled ())
2432 return ip4_rewrite_inline (vm, node, frame, 1, 1, 1);
2433 else
2434 return ip4_rewrite_inline (vm, node, frame, 0, 1, 1);
2435}
2436
Neale Ranns32e1c012016-11-22 17:07:28 +00002437/* *INDENT-OFF* */
2438VLIB_REGISTER_NODE (ip4_rewrite_node) = {
2439 .function = ip4_rewrite,
2440 .name = "ip4-rewrite",
2441 .vector_size = sizeof (u32),
Ed Warnickecb9cada2015-12-08 15:45:58 -07002442
Neale Ranns32e1c012016-11-22 17:07:28 +00002443 .format_trace = format_ip4_rewrite_trace,
Ed Warnickecb9cada2015-12-08 15:45:58 -07002444
Neale Ranns32e1c012016-11-22 17:07:28 +00002445 .n_next_nodes = 2,
2446 .next_nodes = {
Vijayabhaskar Katamreddyce074122017-11-15 13:50:26 -08002447 [IP4_REWRITE_NEXT_DROP] = "ip4-drop",
Neale Ranns32e1c012016-11-22 17:07:28 +00002448 [IP4_REWRITE_NEXT_ICMP_ERROR] = "ip4-icmp-error",
2449 },
2450};
2451VLIB_NODE_FUNCTION_MULTIARCH (ip4_rewrite_node, ip4_rewrite)
2452
2453VLIB_REGISTER_NODE (ip4_rewrite_mcast_node) = {
2454 .function = ip4_rewrite_mcast,
2455 .name = "ip4-rewrite-mcast",
2456 .vector_size = sizeof (u32),
2457
2458 .format_trace = format_ip4_rewrite_trace,
2459 .sibling_of = "ip4-rewrite",
2460};
2461VLIB_NODE_FUNCTION_MULTIARCH (ip4_rewrite_mcast_node, ip4_rewrite_mcast)
2462
Neale Ranns0f26c5a2017-03-01 15:12:11 -08002463VLIB_REGISTER_NODE (ip4_mcast_midchain_node, static) = {
2464 .function = ip4_mcast_midchain,
2465 .name = "ip4-mcast-midchain",
2466 .vector_size = sizeof (u32),
2467
2468 .format_trace = format_ip4_rewrite_trace,
2469 .sibling_of = "ip4-rewrite",
2470};
2471VLIB_NODE_FUNCTION_MULTIARCH (ip4_mcast_midchain_node, ip4_mcast_midchain)
2472
Neale Ranns32e1c012016-11-22 17:07:28 +00002473VLIB_REGISTER_NODE (ip4_midchain_node) = {
2474 .function = ip4_midchain,
2475 .name = "ip4-midchain",
2476 .vector_size = sizeof (u32),
2477 .format_trace = format_ip4_forward_next_trace,
2478 .sibling_of = "ip4-rewrite",
2479};
Dave Barachd7cb1b52016-12-09 09:52:16 -05002480VLIB_NODE_FUNCTION_MULTIARCH (ip4_midchain_node, ip4_midchain);
Neale Ranns32e1c012016-11-22 17:07:28 +00002481/* *INDENT-ON */
Damjan Marion1c80e832016-05-11 23:07:18 +02002482
Dave Barachd7cb1b52016-12-09 09:52:16 -05002483int
2484ip4_lookup_validate (ip4_address_t * a, u32 fib_index0)
2485{
2486 ip4_fib_mtrie_t *mtrie0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002487 ip4_fib_mtrie_leaf_t leaf0;
Neale Ranns0bfe5d82016-08-25 15:29:12 +01002488 u32 lbi0;
Dave Barach75fc8542016-10-11 16:16:02 -04002489
Neale Ranns0bfe5d82016-08-25 15:29:12 +01002490 mtrie0 = &ip4_fib_get (fib_index0)->mtrie;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002491
Neale Ranns04a75e32017-03-23 06:46:01 -07002492 leaf0 = ip4_fib_mtrie_lookup_step_one (mtrie0, a);
Ed Warnickecb9cada2015-12-08 15:45:58 -07002493 leaf0 = ip4_fib_mtrie_lookup_step (mtrie0, leaf0, a, 2);
2494 leaf0 = ip4_fib_mtrie_lookup_step (mtrie0, leaf0, a, 3);
Dave Barach75fc8542016-10-11 16:16:02 -04002495
Neale Ranns0bfe5d82016-08-25 15:29:12 +01002496 lbi0 = ip4_fib_mtrie_leaf_get_adj_index (leaf0);
Dave Barach75fc8542016-10-11 16:16:02 -04002497
Dave Barachd7cb1b52016-12-09 09:52:16 -05002498 return lbi0 == ip4_fib_table_lookup_lb (ip4_fib_get (fib_index0), a);
Ed Warnickecb9cada2015-12-08 15:45:58 -07002499}
Dave Barach75fc8542016-10-11 16:16:02 -04002500
Ed Warnickecb9cada2015-12-08 15:45:58 -07002501static clib_error_t *
2502test_lookup_command_fn (vlib_main_t * vm,
Dave Barachd7cb1b52016-12-09 09:52:16 -05002503 unformat_input_t * input, vlib_cli_command_t * cmd)
Ed Warnickecb9cada2015-12-08 15:45:58 -07002504{
Billy McFall309fe062016-10-14 07:37:33 -04002505 ip4_fib_t *fib;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002506 u32 table_id = 0;
2507 f64 count = 1;
2508 u32 n;
2509 int i;
2510 ip4_address_t ip4_base_address;
2511 u64 errors = 0;
2512
Dave Barachd7cb1b52016-12-09 09:52:16 -05002513 while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
2514 {
Ed Warnickecb9cada2015-12-08 15:45:58 -07002515 if (unformat (input, "table %d", &table_id))
Dave Barachd7cb1b52016-12-09 09:52:16 -05002516 {
2517 /* Make sure the entry exists. */
2518 fib = ip4_fib_get (table_id);
2519 if ((fib) && (fib->index != table_id))
2520 return clib_error_return (0, "<fib-index> %d does not exist",
2521 table_id);
2522 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07002523 else if (unformat (input, "count %f", &count))
2524 ;
2525
2526 else if (unformat (input, "%U",
2527 unformat_ip4_address, &ip4_base_address))
Dave Barachd7cb1b52016-12-09 09:52:16 -05002528 ;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002529 else
Dave Barachd7cb1b52016-12-09 09:52:16 -05002530 return clib_error_return (0, "unknown input `%U'",
2531 format_unformat_error, input);
2532 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07002533
2534 n = count;
2535
2536 for (i = 0; i < n; i++)
2537 {
2538 if (!ip4_lookup_validate (&ip4_base_address, table_id))
Dave Barachd7cb1b52016-12-09 09:52:16 -05002539 errors++;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002540
Dave Barach75fc8542016-10-11 16:16:02 -04002541 ip4_base_address.as_u32 =
Dave Barachd7cb1b52016-12-09 09:52:16 -05002542 clib_host_to_net_u32 (1 +
2543 clib_net_to_host_u32 (ip4_base_address.as_u32));
Ed Warnickecb9cada2015-12-08 15:45:58 -07002544 }
2545
Dave Barach75fc8542016-10-11 16:16:02 -04002546 if (errors)
Ed Warnickecb9cada2015-12-08 15:45:58 -07002547 vlib_cli_output (vm, "%llu errors out of %d lookups\n", errors, n);
2548 else
2549 vlib_cli_output (vm, "No errors in %d lookups\n", n);
2550
2551 return 0;
2552}
2553
/*?
 * Perform a lookup of an IPv4 Address (or range of addresses) in the
 * given FIB table to determine if there is a conflict with the
 * adjacency table. The fib-id can be determined by using the
 * '<em>show ip fib</em>' command. If fib-id is not entered, a default
 * value of 0 is used.
 *
 * @todo This command uses fib-id, other commands use table-id (not
 * just a name, they are different indexes). Would like to change this
 * to table-id for consistency.
 *
 * @cliexpar
 * Example of how to run the test lookup command:
 * @cliexstart{test lookup 172.16.1.1 table 1 count 2}
 * No errors in 2 lookups
 * @cliexend
?*/
2571/* *INDENT-OFF* */
Dave Barachd7cb1b52016-12-09 09:52:16 -05002572VLIB_CLI_COMMAND (lookup_test_command, static) =
2573{
2574 .path = "test lookup",
2575 .short_help = "test lookup <ipv4-addr> [table <fib-id>] [count <nn>]",
2576 .function = test_lookup_command_fn,
Ed Warnickecb9cada2015-12-08 15:45:58 -07002577};
Billy McFall0683c9c2016-10-13 08:27:31 -04002578/* *INDENT-ON* */
Ed Warnickecb9cada2015-12-08 15:45:58 -07002579
Dave Barachd7cb1b52016-12-09 09:52:16 -05002580int
2581vnet_set_ip4_flow_hash (u32 table_id, u32 flow_hash_config)
Ed Warnickecb9cada2015-12-08 15:45:58 -07002582{
Neale Ranns107e7d42017-04-11 09:55:19 -07002583 u32 fib_index;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002584
Neale Ranns107e7d42017-04-11 09:55:19 -07002585 fib_index = fib_table_find (FIB_PROTOCOL_IP4, table_id);
2586
2587 if (~0 == fib_index)
Ed Warnickecb9cada2015-12-08 15:45:58 -07002588 return VNET_API_ERROR_NO_SUCH_FIB;
2589
Neale Ranns227038a2017-04-21 01:07:59 -07002590 fib_table_set_flow_hash_config (fib_index, FIB_PROTOCOL_IP4,
2591 flow_hash_config);
Ed Warnickecb9cada2015-12-08 15:45:58 -07002592
Ed Warnickecb9cada2015-12-08 15:45:58 -07002593 return 0;
2594}
Dave Barach75fc8542016-10-11 16:16:02 -04002595
Ed Warnickecb9cada2015-12-08 15:45:58 -07002596static clib_error_t *
2597set_ip_flow_hash_command_fn (vlib_main_t * vm,
Dave Barachd7cb1b52016-12-09 09:52:16 -05002598 unformat_input_t * input,
2599 vlib_cli_command_t * cmd)
Ed Warnickecb9cada2015-12-08 15:45:58 -07002600{
2601 int matched = 0;
2602 u32 table_id = 0;
2603 u32 flow_hash_config = 0;
2604 int rv;
2605
Dave Barachd7cb1b52016-12-09 09:52:16 -05002606 while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
2607 {
2608 if (unformat (input, "table %d", &table_id))
2609 matched = 1;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002610#define _(a,v) \
2611 else if (unformat (input, #a)) { flow_hash_config |= v; matched=1;}
Dave Barachd7cb1b52016-12-09 09:52:16 -05002612 foreach_flow_hash_bit
Ed Warnickecb9cada2015-12-08 15:45:58 -07002613#undef _
Dave Barachd7cb1b52016-12-09 09:52:16 -05002614 else
2615 break;
2616 }
Dave Barach75fc8542016-10-11 16:16:02 -04002617
Ed Warnickecb9cada2015-12-08 15:45:58 -07002618 if (matched == 0)
2619 return clib_error_return (0, "unknown input `%U'",
Dave Barachd7cb1b52016-12-09 09:52:16 -05002620 format_unformat_error, input);
Dave Barach75fc8542016-10-11 16:16:02 -04002621
Ed Warnickecb9cada2015-12-08 15:45:58 -07002622 rv = vnet_set_ip4_flow_hash (table_id, flow_hash_config);
2623 switch (rv)
2624 {
2625 case 0:
2626 break;
Dave Barach75fc8542016-10-11 16:16:02 -04002627
Ed Warnickecb9cada2015-12-08 15:45:58 -07002628 case VNET_API_ERROR_NO_SUCH_FIB:
2629 return clib_error_return (0, "no such FIB table %d", table_id);
Dave Barach75fc8542016-10-11 16:16:02 -04002630
Ed Warnickecb9cada2015-12-08 15:45:58 -07002631 default:
2632 clib_warning ("BUG: illegal flow hash config 0x%x", flow_hash_config);
2633 break;
2634 }
Dave Barach75fc8542016-10-11 16:16:02 -04002635
Ed Warnickecb9cada2015-12-08 15:45:58 -07002636 return 0;
2637}
Dave Barach75fc8542016-10-11 16:16:02 -04002638
/*?
 * Configure the set of IPv4 fields used by the flow hash.
 *
 * @cliexpar
 * Example of how to set the flow hash on a given table:
 * @cliexcmd{set ip flow-hash table 7 dst sport dport proto}
 * Example of how to display the configured flow hash:
 * @cliexstart{show ip fib}
 * ipv4-VRF:0, fib_index 0, flow hash: src dst sport dport proto
 * 0.0.0.0/0
 *   unicast-ip4-chain
 *   [@0]: dpo-load-balance: [index:0 buckets:1 uRPF:0 to:[0:0]]
 *     [0] [@0]: dpo-drop ip6
 * 0.0.0.0/32
 *   unicast-ip4-chain
 *   [@0]: dpo-load-balance: [index:1 buckets:1 uRPF:1 to:[0:0]]
 *     [0] [@0]: dpo-drop ip6
 * 224.0.0.0/8
 *   unicast-ip4-chain
 *   [@0]: dpo-load-balance: [index:3 buckets:1 uRPF:3 to:[0:0]]
 *     [0] [@0]: dpo-drop ip6
 * 6.0.1.2/32
 *   unicast-ip4-chain
 *   [@0]: dpo-load-balance: [index:30 buckets:1 uRPF:29 to:[0:0]]
 *     [0] [@3]: arp-ipv4: via 6.0.0.1 af_packet0
 * 7.0.0.1/32
 *   unicast-ip4-chain
 *   [@0]: dpo-load-balance: [index:31 buckets:4 uRPF:30 to:[0:0]]
 *     [0] [@3]: arp-ipv4: via 6.0.0.2 af_packet0
 *     [1] [@3]: arp-ipv4: via 6.0.0.2 af_packet0
 *     [2] [@3]: arp-ipv4: via 6.0.0.2 af_packet0
 *     [3] [@3]: arp-ipv4: via 6.0.0.1 af_packet0
 * 240.0.0.0/8
 *   unicast-ip4-chain
 *   [@0]: dpo-load-balance: [index:2 buckets:1 uRPF:2 to:[0:0]]
 *     [0] [@0]: dpo-drop ip6
 * 255.255.255.255/32
 *   unicast-ip4-chain
 *   [@0]: dpo-load-balance: [index:4 buckets:1 uRPF:4 to:[0:0]]
 *     [0] [@0]: dpo-drop ip6
 * ipv4-VRF:7, fib_index 1, flow hash: dst sport dport proto
 * 0.0.0.0/0
 *   unicast-ip4-chain
 *   [@0]: dpo-load-balance: [index:12 buckets:1 uRPF:11 to:[0:0]]
 *     [0] [@0]: dpo-drop ip6
 * 0.0.0.0/32
 *   unicast-ip4-chain
 *   [@0]: dpo-load-balance: [index:13 buckets:1 uRPF:12 to:[0:0]]
 *     [0] [@0]: dpo-drop ip6
 * 172.16.1.0/24
 *   unicast-ip4-chain
 *   [@0]: dpo-load-balance: [index:17 buckets:1 uRPF:16 to:[0:0]]
 *     [0] [@4]: ipv4-glean: af_packet0
 * 172.16.1.1/32
 *   unicast-ip4-chain
 *   [@0]: dpo-load-balance: [index:18 buckets:1 uRPF:17 to:[1:84]]
 *     [0] [@2]: dpo-receive: 172.16.1.1 on af_packet0
 * 172.16.1.2/32
 *   unicast-ip4-chain
 *   [@0]: dpo-load-balance: [index:21 buckets:1 uRPF:20 to:[0:0]]
 *     [0] [@5]: ipv4 via 172.16.1.2 af_packet0: IP4: 02:fe:9e:70:7a:2b -> 26:a5:f6:9c:3a:36
 * 172.16.2.0/24
 *   unicast-ip4-chain
 *   [@0]: dpo-load-balance: [index:19 buckets:1 uRPF:18 to:[0:0]]
 *     [0] [@4]: ipv4-glean: af_packet1
 * 172.16.2.1/32
 *   unicast-ip4-chain
 *   [@0]: dpo-load-balance: [index:20 buckets:1 uRPF:19 to:[0:0]]
 *     [0] [@2]: dpo-receive: 172.16.2.1 on af_packet1
 * 224.0.0.0/8
 *   unicast-ip4-chain
 *   [@0]: dpo-load-balance: [index:15 buckets:1 uRPF:14 to:[0:0]]
 *     [0] [@0]: dpo-drop ip6
 * 240.0.0.0/8
 *   unicast-ip4-chain
 *   [@0]: dpo-load-balance: [index:14 buckets:1 uRPF:13 to:[0:0]]
 *     [0] [@0]: dpo-drop ip6
 * 255.255.255.255/32
 *   unicast-ip4-chain
 *   [@0]: dpo-load-balance: [index:16 buckets:1 uRPF:15 to:[0:0]]
 *     [0] [@0]: dpo-drop ip6
 * @cliexend
?*/
2722/* *INDENT-OFF* */
Dave Barachd7cb1b52016-12-09 09:52:16 -05002723VLIB_CLI_COMMAND (set_ip_flow_hash_command, static) =
2724{
Ed Warnickecb9cada2015-12-08 15:45:58 -07002725 .path = "set ip flow-hash",
Dave Barach75fc8542016-10-11 16:16:02 -04002726 .short_help =
Billy McFall0683c9c2016-10-13 08:27:31 -04002727 "set ip flow-hash table <table-id> [src] [dst] [sport] [dport] [proto] [reverse]",
Ed Warnickecb9cada2015-12-08 15:45:58 -07002728 .function = set_ip_flow_hash_command_fn,
2729};
Billy McFall0683c9c2016-10-13 08:27:31 -04002730/* *INDENT-ON* */
Dave Barach75fc8542016-10-11 16:16:02 -04002731
Dave Barachd7cb1b52016-12-09 09:52:16 -05002732int
2733vnet_set_ip4_classify_intfc (vlib_main_t * vm, u32 sw_if_index,
2734 u32 table_index)
Ed Warnickecb9cada2015-12-08 15:45:58 -07002735{
Dave Barachd7cb1b52016-12-09 09:52:16 -05002736 vnet_main_t *vnm = vnet_get_main ();
2737 vnet_interface_main_t *im = &vnm->interface_main;
2738 ip4_main_t *ipm = &ip4_main;
2739 ip_lookup_main_t *lm = &ipm->lookup_main;
2740 vnet_classify_main_t *cm = &vnet_classify_main;
Neale Rannsdf089a82016-10-02 16:39:06 +01002741 ip4_address_t *if_addr;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002742
2743 if (pool_is_free_index (im->sw_interfaces, sw_if_index))
2744 return VNET_API_ERROR_NO_MATCHING_INTERFACE;
2745
2746 if (table_index != ~0 && pool_is_free_index (cm->tables, table_index))
2747 return VNET_API_ERROR_NO_SUCH_ENTRY;
2748
2749 vec_validate (lm->classify_table_index_by_sw_if_index, sw_if_index);
Dave Barachd7cb1b52016-12-09 09:52:16 -05002750 lm->classify_table_index_by_sw_if_index[sw_if_index] = table_index;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002751
Neale Rannsdf089a82016-10-02 16:39:06 +01002752 if_addr = ip4_interface_first_address (ipm, sw_if_index, NULL);
2753
2754 if (NULL != if_addr)
Dave Barachd7cb1b52016-12-09 09:52:16 -05002755 {
Neale Rannsdf089a82016-10-02 16:39:06 +01002756 fib_prefix_t pfx = {
Dave Barachd7cb1b52016-12-09 09:52:16 -05002757 .fp_len = 32,
2758 .fp_proto = FIB_PROTOCOL_IP4,
2759 .fp_addr.ip4 = *if_addr,
Neale Rannsdf089a82016-10-02 16:39:06 +01002760 };
2761 u32 fib_index;
2762
Dave Barachd7cb1b52016-12-09 09:52:16 -05002763 fib_index = fib_table_get_index_for_sw_if_index (FIB_PROTOCOL_IP4,
2764 sw_if_index);
Neale Rannsdf089a82016-10-02 16:39:06 +01002765
2766
Dave Barachd7cb1b52016-12-09 09:52:16 -05002767 if (table_index != (u32) ~ 0)
2768 {
2769 dpo_id_t dpo = DPO_INVALID;
Neale Rannsdf089a82016-10-02 16:39:06 +01002770
Dave Barachd7cb1b52016-12-09 09:52:16 -05002771 dpo_set (&dpo,
2772 DPO_CLASSIFY,
2773 DPO_PROTO_IP4,
2774 classify_dpo_create (DPO_PROTO_IP4, table_index));
Neale Rannsdf089a82016-10-02 16:39:06 +01002775
Dave Barachd7cb1b52016-12-09 09:52:16 -05002776 fib_table_entry_special_dpo_add (fib_index,
2777 &pfx,
2778 FIB_SOURCE_CLASSIFY,
2779 FIB_ENTRY_FLAG_NONE, &dpo);
2780 dpo_reset (&dpo);
2781 }
Neale Rannsdf089a82016-10-02 16:39:06 +01002782 else
Dave Barachd7cb1b52016-12-09 09:52:16 -05002783 {
2784 fib_table_entry_special_remove (fib_index,
2785 &pfx, FIB_SOURCE_CLASSIFY);
2786 }
2787 }
Neale Rannsdf089a82016-10-02 16:39:06 +01002788
Ed Warnickecb9cada2015-12-08 15:45:58 -07002789 return 0;
2790}
2791
2792static clib_error_t *
2793set_ip_classify_command_fn (vlib_main_t * vm,
Dave Barachd7cb1b52016-12-09 09:52:16 -05002794 unformat_input_t * input,
2795 vlib_cli_command_t * cmd)
Ed Warnickecb9cada2015-12-08 15:45:58 -07002796{
2797 u32 table_index = ~0;
2798 int table_index_set = 0;
2799 u32 sw_if_index = ~0;
2800 int rv;
Dave Barach75fc8542016-10-11 16:16:02 -04002801
Dave Barachd7cb1b52016-12-09 09:52:16 -05002802 while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
2803 {
2804 if (unformat (input, "table-index %d", &table_index))
2805 table_index_set = 1;
2806 else if (unformat (input, "intfc %U", unformat_vnet_sw_interface,
2807 vnet_get_main (), &sw_if_index))
2808 ;
2809 else
2810 break;
2811 }
Dave Barach75fc8542016-10-11 16:16:02 -04002812
Ed Warnickecb9cada2015-12-08 15:45:58 -07002813 if (table_index_set == 0)
2814 return clib_error_return (0, "classify table-index must be specified");
2815
2816 if (sw_if_index == ~0)
2817 return clib_error_return (0, "interface / subif must be specified");
2818
2819 rv = vnet_set_ip4_classify_intfc (vm, sw_if_index, table_index);
2820
2821 switch (rv)
2822 {
2823 case 0:
2824 break;
2825
2826 case VNET_API_ERROR_NO_MATCHING_INTERFACE:
2827 return clib_error_return (0, "No such interface");
2828
2829 case VNET_API_ERROR_NO_SUCH_ENTRY:
2830 return clib_error_return (0, "No such classifier table");
2831 }
2832 return 0;
2833}
2834
/*?
 * Assign a classification table to an interface. The classification
 * table is created using the '<em>classify table</em>' and '<em>classify session</em>'
 * commands. Once the table is created, use this command to filter packets
 * on an interface.
 *
 * @cliexpar
 * Example of how to assign a classification table to an interface:
 * @cliexcmd{set ip classify intfc GigabitEthernet2/0/0 table-index 1}
?*/
2845/* *INDENT-OFF* */
Dave Barachd7cb1b52016-12-09 09:52:16 -05002846VLIB_CLI_COMMAND (set_ip_classify_command, static) =
2847{
Ed Warnickecb9cada2015-12-08 15:45:58 -07002848 .path = "set ip classify",
Dave Barach75fc8542016-10-11 16:16:02 -04002849 .short_help =
Billy McFall0683c9c2016-10-13 08:27:31 -04002850 "set ip classify intfc <interface> table-index <classify-idx>",
Ed Warnickecb9cada2015-12-08 15:45:58 -07002851 .function = set_ip_classify_command_fn,
2852};
Billy McFall0683c9c2016-10-13 08:27:31 -04002853/* *INDENT-ON* */
Dave Barachd7cb1b52016-12-09 09:52:16 -05002854
Neale Ranns1ec36522017-11-29 05:20:37 -08002855static clib_error_t *
2856ip4_config (vlib_main_t * vm, unformat_input_t * input)
2857{
2858 ip4_main_t *im = &ip4_main;
2859 uword heapsize = 0;
2860
2861 while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
2862 {
2863 if (unformat (input, "heap-size %U", unformat_memory_size, &heapsize))
2864 ;
2865 else
2866 return clib_error_return (0,
2867 "invalid heap-size parameter `%U'",
2868 format_unformat_error, input);
2869 }
2870
2871 im->mtrie_heap_size = heapsize;
2872
2873 return 0;
2874}
2875
2876VLIB_EARLY_CONFIG_FUNCTION (ip4_config, "ip");
2877
Dave Barachd7cb1b52016-12-09 09:52:16 -05002878/*
2879 * fd.io coding-style-patch-verification: ON
2880 *
2881 * Local Variables:
2882 * eval: (c-set-style "gnu")
2883 * End:
2884 */