blob: 3ddf6dfa7839ceec0144d7b0464ef943bdc16c71 [file] [log] [blame]
/*
 * Copyright (c) 2015 Cisco and/or its affiliates.
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at:
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
/*
 * ip/ip4_forward.c: IP v4 forwarding
 *
 * Copyright (c) 2008 Eliot Dresselhaus
 *
 * Permission is hereby granted, free of charge, to any person obtaining
 * a copy of this software and associated documentation files (the
 * "Software"), to deal in the Software without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sublicense, and/or sell copies of the Software, and to
 * permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 *
 * The above copyright notice and this permission notice shall be
 * included in all copies or substantial portions of the Software.
 *
 *  THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 *  EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 *  MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
 *  NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
 *  LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
 *  OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
 *  WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 */
39
40#include <vnet/vnet.h>
41#include <vnet/ip/ip.h>
Neale Ranns0bfe5d82016-08-25 15:29:12 +010042#include <vnet/ethernet/ethernet.h> /* for ethernet_header_t */
43#include <vnet/ethernet/arp_packet.h> /* for ethernet_arp_header_t */
Ed Warnickecb9cada2015-12-08 15:45:58 -070044#include <vnet/ppp/ppp.h>
Neale Ranns0bfe5d82016-08-25 15:29:12 +010045#include <vnet/srp/srp.h> /* for srp_hw_interface_class */
Dave Barachd7cb1b52016-12-09 09:52:16 -050046#include <vnet/api_errno.h> /* for API error numbers */
47#include <vnet/fib/fib_table.h> /* for FIB table and entry creation */
48#include <vnet/fib/fib_entry.h> /* for FIB table and entry creation */
49#include <vnet/fib/fib_urpf_list.h> /* for FIB uRPF check */
Neale Ranns0bfe5d82016-08-25 15:29:12 +010050#include <vnet/fib/ip4_fib.h>
51#include <vnet/dpo/load_balance.h>
Neale Rannsf12a83f2017-04-18 09:09:40 -070052#include <vnet/dpo/load_balance_map.h>
Neale Ranns0bfe5d82016-08-25 15:29:12 +010053#include <vnet/dpo/classify_dpo.h>
Neale Ranns32e1c012016-11-22 17:07:28 +000054#include <vnet/mfib/mfib_table.h> /* for mFIB table and entry creation */
Ed Warnickecb9cada2015-12-08 15:45:58 -070055
/**
 * @file
 * @brief IPv4 Forwarding.
 *
 * This file contains the source code for IPv4 forwarding.
 */
62
Ed Warnickecb9cada2015-12-08 15:45:58 -070063always_inline uword
64ip4_lookup_inline (vlib_main_t * vm,
65 vlib_node_runtime_t * node,
66 vlib_frame_t * frame,
Neale Ranns0bfe5d82016-08-25 15:29:12 +010067 int lookup_for_responses_to_locally_received_packets)
Ed Warnickecb9cada2015-12-08 15:45:58 -070068{
Dave Barachd7cb1b52016-12-09 09:52:16 -050069 ip4_main_t *im = &ip4_main;
70 vlib_combined_counter_main_t *cm = &load_balance_main.lbm_to_counters;
71 u32 n_left_from, n_left_to_next, *from, *to_next;
Ed Warnickecb9cada2015-12-08 15:45:58 -070072 ip_lookup_next_t next;
Damjan Marion586afd72017-04-05 19:18:20 +020073 u32 thread_index = vlib_get_thread_index ();
Ed Warnickecb9cada2015-12-08 15:45:58 -070074
75 from = vlib_frame_vector_args (frame);
76 n_left_from = frame->n_vectors;
77 next = node->cached_next_index;
78
79 while (n_left_from > 0)
80 {
Dave Barachd7cb1b52016-12-09 09:52:16 -050081 vlib_get_next_frame (vm, node, next, to_next, n_left_to_next);
Ed Warnickecb9cada2015-12-08 15:45:58 -070082
Dave Barach670909e2016-10-18 15:25:35 -040083 while (n_left_from >= 8 && n_left_to_next >= 4)
Dave Barachd7cb1b52016-12-09 09:52:16 -050084 {
85 vlib_buffer_t *p0, *p1, *p2, *p3;
86 ip4_header_t *ip0, *ip1, *ip2, *ip3;
Dave Barachd7cb1b52016-12-09 09:52:16 -050087 ip_lookup_next_t next0, next1, next2, next3;
88 const load_balance_t *lb0, *lb1, *lb2, *lb3;
89 ip4_fib_mtrie_t *mtrie0, *mtrie1, *mtrie2, *mtrie3;
90 ip4_fib_mtrie_leaf_t leaf0, leaf1, leaf2, leaf3;
91 ip4_address_t *dst_addr0, *dst_addr1, *dst_addr2, *dst_addr3;
Neale Ranns340690e2017-03-22 13:27:53 -070092 u32 pi0, fib_index0, lb_index0;
93 u32 pi1, fib_index1, lb_index1;
94 u32 pi2, fib_index2, lb_index2;
95 u32 pi3, fib_index3, lb_index3;
Dave Barachd7cb1b52016-12-09 09:52:16 -050096 flow_hash_config_t flow_hash_config0, flow_hash_config1;
97 flow_hash_config_t flow_hash_config2, flow_hash_config3;
98 u32 hash_c0, hash_c1, hash_c2, hash_c3;
Dave Barach670909e2016-10-18 15:25:35 -040099 const dpo_id_t *dpo0, *dpo1, *dpo2, *dpo3;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700100
Dave Barachd7cb1b52016-12-09 09:52:16 -0500101 /* Prefetch next iteration. */
102 {
103 vlib_buffer_t *p4, *p5, *p6, *p7;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700104
Dave Barachd7cb1b52016-12-09 09:52:16 -0500105 p4 = vlib_get_buffer (vm, from[4]);
106 p5 = vlib_get_buffer (vm, from[5]);
107 p6 = vlib_get_buffer (vm, from[6]);
108 p7 = vlib_get_buffer (vm, from[7]);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700109
Dave Barachd7cb1b52016-12-09 09:52:16 -0500110 vlib_prefetch_buffer_header (p4, LOAD);
111 vlib_prefetch_buffer_header (p5, LOAD);
112 vlib_prefetch_buffer_header (p6, LOAD);
113 vlib_prefetch_buffer_header (p7, LOAD);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700114
Dave Barachd7cb1b52016-12-09 09:52:16 -0500115 CLIB_PREFETCH (p4->data, sizeof (ip0[0]), LOAD);
116 CLIB_PREFETCH (p5->data, sizeof (ip0[0]), LOAD);
117 CLIB_PREFETCH (p6->data, sizeof (ip0[0]), LOAD);
118 CLIB_PREFETCH (p7->data, sizeof (ip0[0]), LOAD);
119 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700120
Dave Barachd7cb1b52016-12-09 09:52:16 -0500121 pi0 = to_next[0] = from[0];
122 pi1 = to_next[1] = from[1];
123 pi2 = to_next[2] = from[2];
124 pi3 = to_next[3] = from[3];
Dave Barach670909e2016-10-18 15:25:35 -0400125
Dave Barachd7cb1b52016-12-09 09:52:16 -0500126 from += 4;
127 to_next += 4;
128 n_left_to_next -= 4;
129 n_left_from -= 4;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700130
Dave Barachd7cb1b52016-12-09 09:52:16 -0500131 p0 = vlib_get_buffer (vm, pi0);
132 p1 = vlib_get_buffer (vm, pi1);
133 p2 = vlib_get_buffer (vm, pi2);
134 p3 = vlib_get_buffer (vm, pi3);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700135
Dave Barachd7cb1b52016-12-09 09:52:16 -0500136 ip0 = vlib_buffer_get_current (p0);
137 ip1 = vlib_buffer_get_current (p1);
138 ip2 = vlib_buffer_get_current (p2);
139 ip3 = vlib_buffer_get_current (p3);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700140
Dave Barachd7cb1b52016-12-09 09:52:16 -0500141 dst_addr0 = &ip0->dst_address;
142 dst_addr1 = &ip1->dst_address;
143 dst_addr2 = &ip2->dst_address;
144 dst_addr3 = &ip3->dst_address;
Damjan Marionaca64c92016-04-13 09:48:56 +0200145
Dave Barachd7cb1b52016-12-09 09:52:16 -0500146 fib_index0 =
147 vec_elt (im->fib_index_by_sw_if_index,
148 vnet_buffer (p0)->sw_if_index[VLIB_RX]);
149 fib_index1 =
150 vec_elt (im->fib_index_by_sw_if_index,
151 vnet_buffer (p1)->sw_if_index[VLIB_RX]);
152 fib_index2 =
153 vec_elt (im->fib_index_by_sw_if_index,
154 vnet_buffer (p2)->sw_if_index[VLIB_RX]);
155 fib_index3 =
156 vec_elt (im->fib_index_by_sw_if_index,
157 vnet_buffer (p3)->sw_if_index[VLIB_RX]);
158 fib_index0 =
159 (vnet_buffer (p0)->sw_if_index[VLIB_TX] ==
160 (u32) ~ 0) ? fib_index0 : vnet_buffer (p0)->sw_if_index[VLIB_TX];
161 fib_index1 =
162 (vnet_buffer (p1)->sw_if_index[VLIB_TX] ==
163 (u32) ~ 0) ? fib_index1 : vnet_buffer (p1)->sw_if_index[VLIB_TX];
164 fib_index2 =
165 (vnet_buffer (p2)->sw_if_index[VLIB_TX] ==
166 (u32) ~ 0) ? fib_index2 : vnet_buffer (p2)->sw_if_index[VLIB_TX];
167 fib_index3 =
168 (vnet_buffer (p3)->sw_if_index[VLIB_TX] ==
169 (u32) ~ 0) ? fib_index3 : vnet_buffer (p3)->sw_if_index[VLIB_TX];
Ed Warnickecb9cada2015-12-08 15:45:58 -0700170
171
Dave Barachd7cb1b52016-12-09 09:52:16 -0500172 if (!lookup_for_responses_to_locally_received_packets)
173 {
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100174 mtrie0 = &ip4_fib_get (fib_index0)->mtrie;
175 mtrie1 = &ip4_fib_get (fib_index1)->mtrie;
Dave Barach670909e2016-10-18 15:25:35 -0400176 mtrie2 = &ip4_fib_get (fib_index2)->mtrie;
177 mtrie3 = &ip4_fib_get (fib_index3)->mtrie;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700178
Neale Ranns04a75e32017-03-23 06:46:01 -0700179 leaf0 = ip4_fib_mtrie_lookup_step_one (mtrie0, dst_addr0);
180 leaf1 = ip4_fib_mtrie_lookup_step_one (mtrie1, dst_addr1);
181 leaf2 = ip4_fib_mtrie_lookup_step_one (mtrie2, dst_addr2);
182 leaf3 = ip4_fib_mtrie_lookup_step_one (mtrie3, dst_addr3);
Dave Barachd7cb1b52016-12-09 09:52:16 -0500183 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700184
Dave Barachd7cb1b52016-12-09 09:52:16 -0500185 if (!lookup_for_responses_to_locally_received_packets)
186 {
Dave Barachd7cb1b52016-12-09 09:52:16 -0500187 leaf0 = ip4_fib_mtrie_lookup_step (mtrie0, leaf0, dst_addr0, 2);
188 leaf1 = ip4_fib_mtrie_lookup_step (mtrie1, leaf1, dst_addr1, 2);
189 leaf2 = ip4_fib_mtrie_lookup_step (mtrie2, leaf2, dst_addr2, 2);
190 leaf3 = ip4_fib_mtrie_lookup_step (mtrie3, leaf3, dst_addr3, 2);
191 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700192
Dave Barachd7cb1b52016-12-09 09:52:16 -0500193 if (!lookup_for_responses_to_locally_received_packets)
194 {
195 leaf0 = ip4_fib_mtrie_lookup_step (mtrie0, leaf0, dst_addr0, 3);
196 leaf1 = ip4_fib_mtrie_lookup_step (mtrie1, leaf1, dst_addr1, 3);
197 leaf2 = ip4_fib_mtrie_lookup_step (mtrie2, leaf2, dst_addr2, 3);
198 leaf3 = ip4_fib_mtrie_lookup_step (mtrie3, leaf3, dst_addr3, 3);
199 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700200
Dave Barachd7cb1b52016-12-09 09:52:16 -0500201 if (lookup_for_responses_to_locally_received_packets)
202 {
203 lb_index0 = vnet_buffer (p0)->ip.adj_index[VLIB_RX];
204 lb_index1 = vnet_buffer (p1)->ip.adj_index[VLIB_RX];
205 lb_index2 = vnet_buffer (p2)->ip.adj_index[VLIB_RX];
206 lb_index3 = vnet_buffer (p3)->ip.adj_index[VLIB_RX];
207 }
208 else
209 {
Dave Barachd7cb1b52016-12-09 09:52:16 -0500210 lb_index0 = ip4_fib_mtrie_leaf_get_adj_index (leaf0);
211 lb_index1 = ip4_fib_mtrie_leaf_get_adj_index (leaf1);
212 lb_index2 = ip4_fib_mtrie_leaf_get_adj_index (leaf2);
213 lb_index3 = ip4_fib_mtrie_leaf_get_adj_index (leaf3);
214 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700215
Neale Ranns04a75e32017-03-23 06:46:01 -0700216 ASSERT (lb_index0 && lb_index1 && lb_index2 && lb_index3);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100217 lb0 = load_balance_get (lb_index0);
218 lb1 = load_balance_get (lb_index1);
Dave Barach670909e2016-10-18 15:25:35 -0400219 lb2 = load_balance_get (lb_index2);
220 lb3 = load_balance_get (lb_index3);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700221
Neale Rannsf12a83f2017-04-18 09:09:40 -0700222 ASSERT (lb0->lb_n_buckets > 0);
223 ASSERT (is_pow2 (lb0->lb_n_buckets));
224 ASSERT (lb1->lb_n_buckets > 0);
225 ASSERT (is_pow2 (lb1->lb_n_buckets));
226 ASSERT (lb2->lb_n_buckets > 0);
227 ASSERT (is_pow2 (lb2->lb_n_buckets));
228 ASSERT (lb3->lb_n_buckets > 0);
229 ASSERT (is_pow2 (lb3->lb_n_buckets));
230
Dave Barachd7cb1b52016-12-09 09:52:16 -0500231 /* Use flow hash to compute multipath adjacency. */
232 hash_c0 = vnet_buffer (p0)->ip.flow_hash = 0;
233 hash_c1 = vnet_buffer (p1)->ip.flow_hash = 0;
234 hash_c2 = vnet_buffer (p2)->ip.flow_hash = 0;
235 hash_c3 = vnet_buffer (p3)->ip.flow_hash = 0;
236 if (PREDICT_FALSE (lb0->lb_n_buckets > 1))
237 {
238 flow_hash_config0 = lb0->lb_hash_config;
239 hash_c0 = vnet_buffer (p0)->ip.flow_hash =
240 ip4_compute_flow_hash (ip0, flow_hash_config0);
Neale Rannsf12a83f2017-04-18 09:09:40 -0700241 dpo0 =
242 load_balance_get_fwd_bucket (lb0,
243 (hash_c0 &
244 (lb0->lb_n_buckets_minus_1)));
245 }
246 else
247 {
248 dpo0 = load_balance_get_bucket_i (lb0, 0);
Dave Barachd7cb1b52016-12-09 09:52:16 -0500249 }
250 if (PREDICT_FALSE (lb1->lb_n_buckets > 1))
251 {
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100252 flow_hash_config1 = lb1->lb_hash_config;
Dave Barachd7cb1b52016-12-09 09:52:16 -0500253 hash_c1 = vnet_buffer (p1)->ip.flow_hash =
254 ip4_compute_flow_hash (ip1, flow_hash_config1);
Neale Rannsf12a83f2017-04-18 09:09:40 -0700255 dpo1 =
256 load_balance_get_fwd_bucket (lb1,
257 (hash_c1 &
258 (lb1->lb_n_buckets_minus_1)));
259 }
260 else
261 {
262 dpo1 = load_balance_get_bucket_i (lb1, 0);
Dave Barachd7cb1b52016-12-09 09:52:16 -0500263 }
264 if (PREDICT_FALSE (lb2->lb_n_buckets > 1))
265 {
266 flow_hash_config2 = lb2->lb_hash_config;
267 hash_c2 = vnet_buffer (p2)->ip.flow_hash =
268 ip4_compute_flow_hash (ip2, flow_hash_config2);
Neale Rannsf12a83f2017-04-18 09:09:40 -0700269 dpo2 =
270 load_balance_get_fwd_bucket (lb2,
271 (hash_c2 &
272 (lb2->lb_n_buckets_minus_1)));
273 }
274 else
275 {
276 dpo2 = load_balance_get_bucket_i (lb2, 0);
Dave Barachd7cb1b52016-12-09 09:52:16 -0500277 }
278 if (PREDICT_FALSE (lb3->lb_n_buckets > 1))
279 {
Dave Barach670909e2016-10-18 15:25:35 -0400280 flow_hash_config3 = lb3->lb_hash_config;
Dave Barachd7cb1b52016-12-09 09:52:16 -0500281 hash_c3 = vnet_buffer (p3)->ip.flow_hash =
282 ip4_compute_flow_hash (ip3, flow_hash_config3);
Neale Rannsf12a83f2017-04-18 09:09:40 -0700283 dpo3 =
284 load_balance_get_fwd_bucket (lb3,
285 (hash_c3 &
286 (lb3->lb_n_buckets_minus_1)));
Dave Barachd7cb1b52016-12-09 09:52:16 -0500287 }
Neale Rannsf12a83f2017-04-18 09:09:40 -0700288 else
289 {
290 dpo3 = load_balance_get_bucket_i (lb3, 0);
291 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700292
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100293 next0 = dpo0->dpoi_next_node;
294 vnet_buffer (p0)->ip.adj_index[VLIB_TX] = dpo0->dpoi_index;
295 next1 = dpo1->dpoi_next_node;
296 vnet_buffer (p1)->ip.adj_index[VLIB_TX] = dpo1->dpoi_index;
Dave Barach670909e2016-10-18 15:25:35 -0400297 next2 = dpo2->dpoi_next_node;
298 vnet_buffer (p2)->ip.adj_index[VLIB_TX] = dpo2->dpoi_index;
299 next3 = dpo3->dpoi_next_node;
300 vnet_buffer (p3)->ip.adj_index[VLIB_TX] = dpo3->dpoi_index;
Florin Corasdf9d3bc2016-09-05 19:54:17 +0200301
Dave Barachd7cb1b52016-12-09 09:52:16 -0500302 vlib_increment_combined_counter
Damjan Marion586afd72017-04-05 19:18:20 +0200303 (cm, thread_index, lb_index0, 1,
Neale Rannsf12a83f2017-04-18 09:09:40 -0700304 vlib_buffer_length_in_chain (vm, p0));
Dave Barachd7cb1b52016-12-09 09:52:16 -0500305 vlib_increment_combined_counter
Damjan Marion586afd72017-04-05 19:18:20 +0200306 (cm, thread_index, lb_index1, 1,
Neale Rannsf12a83f2017-04-18 09:09:40 -0700307 vlib_buffer_length_in_chain (vm, p1));
Dave Barachd7cb1b52016-12-09 09:52:16 -0500308 vlib_increment_combined_counter
Damjan Marion586afd72017-04-05 19:18:20 +0200309 (cm, thread_index, lb_index2, 1,
Neale Rannsf12a83f2017-04-18 09:09:40 -0700310 vlib_buffer_length_in_chain (vm, p2));
Dave Barachd7cb1b52016-12-09 09:52:16 -0500311 vlib_increment_combined_counter
Damjan Marion586afd72017-04-05 19:18:20 +0200312 (cm, thread_index, lb_index3, 1,
Neale Rannsf12a83f2017-04-18 09:09:40 -0700313 vlib_buffer_length_in_chain (vm, p3));
Ed Warnickecb9cada2015-12-08 15:45:58 -0700314
Dave Barach670909e2016-10-18 15:25:35 -0400315 vlib_validate_buffer_enqueue_x4 (vm, node, next,
316 to_next, n_left_to_next,
317 pi0, pi1, pi2, pi3,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500318 next0, next1, next2, next3);
319 }
Dave Barach75fc8542016-10-11 16:16:02 -0400320
Ed Warnickecb9cada2015-12-08 15:45:58 -0700321 while (n_left_from > 0 && n_left_to_next > 0)
322 {
Dave Barachd7cb1b52016-12-09 09:52:16 -0500323 vlib_buffer_t *p0;
324 ip4_header_t *ip0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700325 ip_lookup_next_t next0;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100326 const load_balance_t *lb0;
Dave Barachd7cb1b52016-12-09 09:52:16 -0500327 ip4_fib_mtrie_t *mtrie0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700328 ip4_fib_mtrie_leaf_t leaf0;
Dave Barachd7cb1b52016-12-09 09:52:16 -0500329 ip4_address_t *dst_addr0;
Neale Ranns340690e2017-03-22 13:27:53 -0700330 u32 pi0, fib_index0, lbi0;
Dave Barachd7cb1b52016-12-09 09:52:16 -0500331 flow_hash_config_t flow_hash_config0;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100332 const dpo_id_t *dpo0;
333 u32 hash_c0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700334
335 pi0 = from[0];
336 to_next[0] = pi0;
337
338 p0 = vlib_get_buffer (vm, pi0);
339
340 ip0 = vlib_buffer_get_current (p0);
341
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100342 dst_addr0 = &ip0->dst_address;
Damjan Marionaca64c92016-04-13 09:48:56 +0200343
Dave Barachd7cb1b52016-12-09 09:52:16 -0500344 fib_index0 =
345 vec_elt (im->fib_index_by_sw_if_index,
346 vnet_buffer (p0)->sw_if_index[VLIB_RX]);
347 fib_index0 =
348 (vnet_buffer (p0)->sw_if_index[VLIB_TX] ==
349 (u32) ~ 0) ? fib_index0 : vnet_buffer (p0)->sw_if_index[VLIB_TX];
Ed Warnickecb9cada2015-12-08 15:45:58 -0700350
Dave Barachd7cb1b52016-12-09 09:52:16 -0500351 if (!lookup_for_responses_to_locally_received_packets)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700352 {
Dave Barachd7cb1b52016-12-09 09:52:16 -0500353 mtrie0 = &ip4_fib_get (fib_index0)->mtrie;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700354
Neale Ranns04a75e32017-03-23 06:46:01 -0700355 leaf0 = ip4_fib_mtrie_lookup_step_one (mtrie0, dst_addr0);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700356 }
357
Dave Barachd7cb1b52016-12-09 09:52:16 -0500358 if (!lookup_for_responses_to_locally_received_packets)
Damjan Marionaca64c92016-04-13 09:48:56 +0200359 leaf0 = ip4_fib_mtrie_lookup_step (mtrie0, leaf0, dst_addr0, 2);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700360
Dave Barachd7cb1b52016-12-09 09:52:16 -0500361 if (!lookup_for_responses_to_locally_received_packets)
Damjan Marionaca64c92016-04-13 09:48:56 +0200362 leaf0 = ip4_fib_mtrie_lookup_step (mtrie0, leaf0, dst_addr0, 3);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700363
364 if (lookup_for_responses_to_locally_received_packets)
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100365 lbi0 = vnet_buffer (p0)->ip.adj_index[VLIB_RX];
Ed Warnickecb9cada2015-12-08 15:45:58 -0700366 else
367 {
368 /* Handle default route. */
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100369 lbi0 = ip4_fib_mtrie_leaf_get_adj_index (leaf0);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700370 }
371
Neale Ranns04a75e32017-03-23 06:46:01 -0700372 ASSERT (lbi0);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100373 lb0 = load_balance_get (lbi0);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700374
Neale Rannsf12a83f2017-04-18 09:09:40 -0700375 ASSERT (lb0->lb_n_buckets > 0);
376 ASSERT (is_pow2 (lb0->lb_n_buckets));
377
Ed Warnickecb9cada2015-12-08 15:45:58 -0700378 /* Use flow hash to compute multipath adjacency. */
Dave Barachd7cb1b52016-12-09 09:52:16 -0500379 hash_c0 = vnet_buffer (p0)->ip.flow_hash = 0;
380 if (PREDICT_FALSE (lb0->lb_n_buckets > 1))
381 {
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100382 flow_hash_config0 = lb0->lb_hash_config;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700383
Dave Barachd7cb1b52016-12-09 09:52:16 -0500384 hash_c0 = vnet_buffer (p0)->ip.flow_hash =
385 ip4_compute_flow_hash (ip0, flow_hash_config0);
Neale Rannsf12a83f2017-04-18 09:09:40 -0700386 dpo0 =
387 load_balance_get_fwd_bucket (lb0,
388 (hash_c0 &
389 (lb0->lb_n_buckets_minus_1)));
Dave Barachd7cb1b52016-12-09 09:52:16 -0500390 }
Neale Rannsf12a83f2017-04-18 09:09:40 -0700391 else
392 {
393 dpo0 = load_balance_get_bucket_i (lb0, 0);
394 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700395
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100396 next0 = dpo0->dpoi_next_node;
397 vnet_buffer (p0)->ip.adj_index[VLIB_TX] = dpo0->dpoi_index;
Florin Corasdf9d3bc2016-09-05 19:54:17 +0200398
Neale Rannsf12a83f2017-04-18 09:09:40 -0700399 vlib_increment_combined_counter (cm, thread_index, lbi0, 1,
400 vlib_buffer_length_in_chain (vm,
401 p0));
Ed Warnickecb9cada2015-12-08 15:45:58 -0700402
403 from += 1;
404 to_next += 1;
405 n_left_to_next -= 1;
406 n_left_from -= 1;
407
408 if (PREDICT_FALSE (next0 != next))
409 {
410 n_left_to_next += 1;
411 vlib_put_next_frame (vm, node, next, n_left_to_next);
412 next = next0;
Dave Barachd7cb1b52016-12-09 09:52:16 -0500413 vlib_get_next_frame (vm, node, next, to_next, n_left_to_next);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700414 to_next[0] = pi0;
415 to_next += 1;
416 n_left_to_next -= 1;
417 }
418 }
419
420 vlib_put_next_frame (vm, node, next, n_left_to_next);
421 }
422
Pierre Pfistera38c3df2016-06-13 10:28:09 +0100423 if (node->flags & VLIB_NODE_FLAG_TRACE)
Dave Barachd7cb1b52016-12-09 09:52:16 -0500424 ip4_forward_next_trace (vm, node, frame, VLIB_TX);
Pierre Pfistera38c3df2016-06-13 10:28:09 +0100425
Ed Warnickecb9cada2015-12-08 15:45:58 -0700426 return frame->n_vectors;
427}
428
Chris Luke8e5b0412016-07-26 13:06:10 -0400429/** @brief IPv4 lookup node.
Dave Barach9770e202016-07-06 10:29:27 -0400430 @node ip4-lookup
431
432 This is the main IPv4 lookup dispatch node.
433
434 @param vm vlib_main_t corresponding to the current thread
435 @param node vlib_node_runtime_t
436 @param frame vlib_frame_t whose contents should be dispatched
437
438 @par Graph mechanics: buffer metadata, next index usage
439
440 @em Uses:
441 - <code>vnet_buffer(b)->sw_if_index[VLIB_RX]</code>
442 - Indicates the @c sw_if_index value of the interface that the
443 packet was received on.
444 - <code>vnet_buffer(b)->sw_if_index[VLIB_TX]</code>
445 - When the value is @c ~0 then the node performs a longest prefix
446 match (LPM) for the packet destination address in the FIB attached
447 to the receive interface.
448 - Otherwise perform LPM for the packet destination address in the
449 indicated FIB. In this case <code>[VLIB_TX]</code> is a FIB index
450 value (0, 1, ...) and not a VRF id.
451
452 @em Sets:
453 - <code>vnet_buffer(b)->ip.adj_index[VLIB_TX]</code>
454 - The lookup result adjacency index.
455
456 <em>Next Index:</em>
457 - Dispatches the packet to the node index found in
458 ip_adjacency_t @c adj->lookup_next_index
459 (where @c adj is the lookup result adjacency).
460*/
Ed Warnickecb9cada2015-12-08 15:45:58 -0700461static uword
462ip4_lookup (vlib_main_t * vm,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500463 vlib_node_runtime_t * node, vlib_frame_t * frame)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700464{
Damjan Marionaca64c92016-04-13 09:48:56 +0200465 return ip4_lookup_inline (vm, node, frame,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500466 /* lookup_for_responses_to_locally_received_packets */
467 0);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700468
469}
470
Dave Barachd7cb1b52016-12-09 09:52:16 -0500471static u8 *format_ip4_lookup_trace (u8 * s, va_list * args);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100472
Neale Rannsf8686322017-11-29 02:39:53 -0800473/* *INDENT-OFF* */
Dave Barachd7cb1b52016-12-09 09:52:16 -0500474VLIB_REGISTER_NODE (ip4_lookup_node) =
475{
Neale Rannsf8686322017-11-29 02:39:53 -0800476 .function = ip4_lookup,
477 .name = "ip4-lookup",
478 .vector_size = sizeof (u32),
479 .format_trace = format_ip4_lookup_trace,
480 .n_next_nodes = IP_LOOKUP_N_NEXT,
481 .next_nodes = IP4_LOOKUP_NEXT_NODES,
482};
483/* *INDENT-ON* */
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100484
Dave Barachd7cb1b52016-12-09 09:52:16 -0500485VLIB_NODE_FUNCTION_MULTIARCH (ip4_lookup_node, ip4_lookup);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100486
487always_inline uword
488ip4_load_balance (vlib_main_t * vm,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500489 vlib_node_runtime_t * node, vlib_frame_t * frame)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700490{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500491 vlib_combined_counter_main_t *cm = &load_balance_main.lbm_via_counters;
492 u32 n_left_from, n_left_to_next, *from, *to_next;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100493 ip_lookup_next_t next;
Damjan Marion586afd72017-04-05 19:18:20 +0200494 u32 thread_index = vlib_get_thread_index ();
Ed Warnickecb9cada2015-12-08 15:45:58 -0700495
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100496 from = vlib_frame_vector_args (frame);
497 n_left_from = frame->n_vectors;
498 next = node->cached_next_index;
499
500 if (node->flags & VLIB_NODE_FLAG_TRACE)
Dave Barachd7cb1b52016-12-09 09:52:16 -0500501 ip4_forward_next_trace (vm, node, frame, VLIB_TX);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100502
503 while (n_left_from > 0)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700504 {
Dave Barachd7cb1b52016-12-09 09:52:16 -0500505 vlib_get_next_frame (vm, node, next, to_next, n_left_to_next);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100506
Dave Barach75fc8542016-10-11 16:16:02 -0400507
Neale Ranns2be95c12016-11-19 13:50:04 +0000508 while (n_left_from >= 4 && n_left_to_next >= 2)
Dave Barachd7cb1b52016-12-09 09:52:16 -0500509 {
510 ip_lookup_next_t next0, next1;
Neale Ranns2be95c12016-11-19 13:50:04 +0000511 const load_balance_t *lb0, *lb1;
Dave Barachd7cb1b52016-12-09 09:52:16 -0500512 vlib_buffer_t *p0, *p1;
Neale Ranns2be95c12016-11-19 13:50:04 +0000513 u32 pi0, lbi0, hc0, pi1, lbi1, hc1;
514 const ip4_header_t *ip0, *ip1;
515 const dpo_id_t *dpo0, *dpo1;
516
Dave Barachd7cb1b52016-12-09 09:52:16 -0500517 /* Prefetch next iteration. */
518 {
519 vlib_buffer_t *p2, *p3;
Neale Ranns2be95c12016-11-19 13:50:04 +0000520
521 p2 = vlib_get_buffer (vm, from[2]);
522 p3 = vlib_get_buffer (vm, from[3]);
523
524 vlib_prefetch_buffer_header (p2, STORE);
525 vlib_prefetch_buffer_header (p3, STORE);
526
527 CLIB_PREFETCH (p2->data, sizeof (ip0[0]), STORE);
528 CLIB_PREFETCH (p3->data, sizeof (ip0[0]), STORE);
Dave Barachd7cb1b52016-12-09 09:52:16 -0500529 }
Neale Ranns2be95c12016-11-19 13:50:04 +0000530
531 pi0 = to_next[0] = from[0];
532 pi1 = to_next[1] = from[1];
533
534 from += 2;
535 n_left_from -= 2;
536 to_next += 2;
537 n_left_to_next -= 2;
538
539 p0 = vlib_get_buffer (vm, pi0);
540 p1 = vlib_get_buffer (vm, pi1);
541
542 ip0 = vlib_buffer_get_current (p0);
543 ip1 = vlib_buffer_get_current (p1);
544 lbi0 = vnet_buffer (p0)->ip.adj_index[VLIB_TX];
545 lbi1 = vnet_buffer (p1)->ip.adj_index[VLIB_TX];
546
Dave Barachd7cb1b52016-12-09 09:52:16 -0500547 lb0 = load_balance_get (lbi0);
548 lb1 = load_balance_get (lbi1);
Neale Ranns2be95c12016-11-19 13:50:04 +0000549
Dave Barachd7cb1b52016-12-09 09:52:16 -0500550 /*
551 * this node is for via FIBs we can re-use the hash value from the
552 * to node if present.
553 * We don't want to use the same hash value at each level in the recursion
554 * graph as that would lead to polarisation
555 */
AkshayaNadahalli153b8712017-03-06 18:22:29 +0000556 hc0 = hc1 = 0;
Neale Ranns2be95c12016-11-19 13:50:04 +0000557
Dave Barachd7cb1b52016-12-09 09:52:16 -0500558 if (PREDICT_FALSE (lb0->lb_n_buckets > 1))
559 {
560 if (PREDICT_TRUE (vnet_buffer (p0)->ip.flow_hash))
561 {
562 hc0 = vnet_buffer (p0)->ip.flow_hash =
563 vnet_buffer (p0)->ip.flow_hash >> 1;
564 }
565 else
566 {
567 hc0 = vnet_buffer (p0)->ip.flow_hash =
AkshayaNadahalli153b8712017-03-06 18:22:29 +0000568 ip4_compute_flow_hash (ip0, lb0->lb_hash_config);
Dave Barachd7cb1b52016-12-09 09:52:16 -0500569 }
Neale Rannsf12a83f2017-04-18 09:09:40 -0700570 dpo0 = load_balance_get_fwd_bucket
571 (lb0, (hc0 & (lb0->lb_n_buckets_minus_1)));
572 }
573 else
574 {
575 dpo0 = load_balance_get_bucket_i (lb0, 0);
Dave Barachd7cb1b52016-12-09 09:52:16 -0500576 }
577 if (PREDICT_FALSE (lb1->lb_n_buckets > 1))
578 {
579 if (PREDICT_TRUE (vnet_buffer (p1)->ip.flow_hash))
580 {
581 hc1 = vnet_buffer (p1)->ip.flow_hash =
582 vnet_buffer (p1)->ip.flow_hash >> 1;
583 }
584 else
585 {
586 hc1 = vnet_buffer (p1)->ip.flow_hash =
AkshayaNadahalli153b8712017-03-06 18:22:29 +0000587 ip4_compute_flow_hash (ip1, lb1->lb_hash_config);
Dave Barachd7cb1b52016-12-09 09:52:16 -0500588 }
Neale Rannsf12a83f2017-04-18 09:09:40 -0700589 dpo1 = load_balance_get_fwd_bucket
590 (lb1, (hc1 & (lb1->lb_n_buckets_minus_1)));
Dave Barachd7cb1b52016-12-09 09:52:16 -0500591 }
Neale Rannsf12a83f2017-04-18 09:09:40 -0700592 else
593 {
594 dpo1 = load_balance_get_bucket_i (lb1, 0);
595 }
Neale Ranns2be95c12016-11-19 13:50:04 +0000596
597 next0 = dpo0->dpoi_next_node;
598 next1 = dpo1->dpoi_next_node;
599
600 vnet_buffer (p0)->ip.adj_index[VLIB_TX] = dpo0->dpoi_index;
601 vnet_buffer (p1)->ip.adj_index[VLIB_TX] = dpo1->dpoi_index;
602
603 vlib_increment_combined_counter
Damjan Marion586afd72017-04-05 19:18:20 +0200604 (cm, thread_index, lbi0, 1, vlib_buffer_length_in_chain (vm, p0));
Neale Ranns2be95c12016-11-19 13:50:04 +0000605 vlib_increment_combined_counter
Damjan Marion586afd72017-04-05 19:18:20 +0200606 (cm, thread_index, lbi1, 1, vlib_buffer_length_in_chain (vm, p1));
Neale Ranns2be95c12016-11-19 13:50:04 +0000607
608 vlib_validate_buffer_enqueue_x2 (vm, node, next,
609 to_next, n_left_to_next,
610 pi0, pi1, next0, next1);
Dave Barachd7cb1b52016-12-09 09:52:16 -0500611 }
Neale Ranns2be95c12016-11-19 13:50:04 +0000612
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100613 while (n_left_from > 0 && n_left_to_next > 0)
614 {
615 ip_lookup_next_t next0;
616 const load_balance_t *lb0;
Dave Barachd7cb1b52016-12-09 09:52:16 -0500617 vlib_buffer_t *p0;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100618 u32 pi0, lbi0, hc0;
619 const ip4_header_t *ip0;
620 const dpo_id_t *dpo0;
621
622 pi0 = from[0];
623 to_next[0] = pi0;
Neale Ranns2be95c12016-11-19 13:50:04 +0000624 from += 1;
625 to_next += 1;
626 n_left_to_next -= 1;
627 n_left_from -= 1;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100628
629 p0 = vlib_get_buffer (vm, pi0);
630
631 ip0 = vlib_buffer_get_current (p0);
632 lbi0 = vnet_buffer (p0)->ip.adj_index[VLIB_TX];
633
Dave Barachd7cb1b52016-12-09 09:52:16 -0500634 lb0 = load_balance_get (lbi0);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100635
AkshayaNadahalli153b8712017-03-06 18:22:29 +0000636 hc0 = 0;
Dave Barachd7cb1b52016-12-09 09:52:16 -0500637 if (PREDICT_FALSE (lb0->lb_n_buckets > 1))
638 {
639 if (PREDICT_TRUE (vnet_buffer (p0)->ip.flow_hash))
640 {
641 hc0 = vnet_buffer (p0)->ip.flow_hash =
642 vnet_buffer (p0)->ip.flow_hash >> 1;
643 }
644 else
645 {
646 hc0 = vnet_buffer (p0)->ip.flow_hash =
AkshayaNadahalli153b8712017-03-06 18:22:29 +0000647 ip4_compute_flow_hash (ip0, lb0->lb_hash_config);
Dave Barachd7cb1b52016-12-09 09:52:16 -0500648 }
Neale Rannsf12a83f2017-04-18 09:09:40 -0700649 dpo0 = load_balance_get_fwd_bucket
650 (lb0, (hc0 & (lb0->lb_n_buckets_minus_1)));
Dave Barachd7cb1b52016-12-09 09:52:16 -0500651 }
Neale Rannsf12a83f2017-04-18 09:09:40 -0700652 else
653 {
654 dpo0 = load_balance_get_bucket_i (lb0, 0);
655 }
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100656
657 next0 = dpo0->dpoi_next_node;
658 vnet_buffer (p0)->ip.adj_index[VLIB_TX] = dpo0->dpoi_index;
659
Dave Barach75fc8542016-10-11 16:16:02 -0400660 vlib_increment_combined_counter
Damjan Marion586afd72017-04-05 19:18:20 +0200661 (cm, thread_index, lbi0, 1, vlib_buffer_length_in_chain (vm, p0));
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100662
Neale Ranns2be95c12016-11-19 13:50:04 +0000663 vlib_validate_buffer_enqueue_x1 (vm, node, next,
664 to_next, n_left_to_next,
665 pi0, next0);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100666 }
667
668 vlib_put_next_frame (vm, node, next, n_left_to_next);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700669 }
670
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100671 return frame->n_vectors;
672}
673
Neale Rannsf8686322017-11-29 02:39:53 -0800674/* *INDENT-OFF* */
Dave Barachd7cb1b52016-12-09 09:52:16 -0500675VLIB_REGISTER_NODE (ip4_load_balance_node) =
676{
Neale Rannsf8686322017-11-29 02:39:53 -0800677 .function = ip4_load_balance,
678 .name = "ip4-load-balance",
679 .vector_size = sizeof (u32),
680 .sibling_of = "ip4-lookup",
681 .format_trace =
682 format_ip4_lookup_trace,
683};
684/* *INDENT-ON* */
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100685
Dave Barachd7cb1b52016-12-09 09:52:16 -0500686VLIB_NODE_FUNCTION_MULTIARCH (ip4_load_balance_node, ip4_load_balance);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100687
688/* get first interface address */
689ip4_address_t *
690ip4_interface_first_address (ip4_main_t * im, u32 sw_if_index,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500691 ip_interface_address_t ** result_ia)
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100692{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500693 ip_lookup_main_t *lm = &im->lookup_main;
694 ip_interface_address_t *ia = 0;
695 ip4_address_t *result = 0;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100696
Neale Ranns32e1c012016-11-22 17:07:28 +0000697 /* *INDENT-OFF* */
698 foreach_ip_interface_address
699 (lm, ia, sw_if_index,
700 1 /* honor unnumbered */ ,
701 ({
702 ip4_address_t * a =
703 ip_interface_address_get_address (lm, ia);
704 result = a;
705 break;
706 }));
707 /* *INDENT-OFF* */
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100708 if (result_ia)
709 *result_ia = result ? ia : 0;
710 return result;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700711}
712
713static void
714ip4_add_interface_routes (u32 sw_if_index,
715 ip4_main_t * im, u32 fib_index,
716 ip_interface_address_t * a)
717{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500718 ip_lookup_main_t *lm = &im->lookup_main;
719 ip4_address_t *address = ip_interface_address_get_address (lm, a);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100720 fib_prefix_t pfx = {
Dave Barachd7cb1b52016-12-09 09:52:16 -0500721 .fp_len = a->address_length,
722 .fp_proto = FIB_PROTOCOL_IP4,
723 .fp_addr.ip4 = *address,
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100724 };
Ed Warnickecb9cada2015-12-08 15:45:58 -0700725
Neale Ranns9a69a602017-03-26 10:56:33 -0700726 if (pfx.fp_len <= 30)
Dave Barachd7cb1b52016-12-09 09:52:16 -0500727 {
Neale Ranns9a69a602017-03-26 10:56:33 -0700728 /* a /30 or shorter - add a glean for the network address */
Neale Ranns7a272742017-05-30 02:08:14 -0700729 fib_table_entry_update_one_path (fib_index, &pfx,
730 FIB_SOURCE_INTERFACE,
731 (FIB_ENTRY_FLAG_CONNECTED |
732 FIB_ENTRY_FLAG_ATTACHED),
Neale Rannsda78f952017-05-24 09:15:43 -0700733 DPO_PROTO_IP4,
Neale Ranns7a272742017-05-30 02:08:14 -0700734 /* No next-hop address */
735 NULL,
736 sw_if_index,
737 // invalid FIB index
738 ~0,
739 1,
740 // no out-label stack
741 NULL,
742 FIB_ROUTE_PATH_FLAG_NONE);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100743
Neale Ranns9a69a602017-03-26 10:56:33 -0700744 /* Add the two broadcast addresses as drop */
745 fib_prefix_t net_pfx = {
746 .fp_len = 32,
747 .fp_proto = FIB_PROTOCOL_IP4,
748 .fp_addr.ip4.as_u32 = address->as_u32 & im->fib_masks[pfx.fp_len],
749 };
750 if (net_pfx.fp_addr.ip4.as_u32 != pfx.fp_addr.ip4.as_u32)
751 fib_table_entry_special_add(fib_index,
752 &net_pfx,
753 FIB_SOURCE_INTERFACE,
754 (FIB_ENTRY_FLAG_DROP |
Neale Rannsa0558302017-04-13 00:44:52 -0700755 FIB_ENTRY_FLAG_LOOSE_URPF_EXEMPT));
Neale Ranns9a69a602017-03-26 10:56:33 -0700756 net_pfx.fp_addr.ip4.as_u32 |= ~im->fib_masks[pfx.fp_len];
757 if (net_pfx.fp_addr.ip4.as_u32 != pfx.fp_addr.ip4.as_u32)
758 fib_table_entry_special_add(fib_index,
759 &net_pfx,
760 FIB_SOURCE_INTERFACE,
761 (FIB_ENTRY_FLAG_DROP |
Neale Rannsa0558302017-04-13 00:44:52 -0700762 FIB_ENTRY_FLAG_LOOSE_URPF_EXEMPT));
Neale Ranns9a69a602017-03-26 10:56:33 -0700763 }
764 else if (pfx.fp_len == 31)
765 {
766 u32 mask = clib_host_to_net_u32(1);
767 fib_prefix_t net_pfx = pfx;
768
769 net_pfx.fp_len = 32;
770 net_pfx.fp_addr.ip4.as_u32 ^= mask;
771
772 /* a /31 - add the other end as an attached host */
773 fib_table_entry_update_one_path (fib_index, &net_pfx,
774 FIB_SOURCE_INTERFACE,
775 (FIB_ENTRY_FLAG_ATTACHED),
Neale Rannsda78f952017-05-24 09:15:43 -0700776 DPO_PROTO_IP4,
Neale Ranns9a69a602017-03-26 10:56:33 -0700777 &net_pfx.fp_addr,
778 sw_if_index,
779 // invalid FIB index
780 ~0,
781 1,
782 NULL,
783 FIB_ROUTE_PATH_FLAG_NONE);
784 }
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100785 pfx.fp_len = 32;
786
787 if (sw_if_index < vec_len (lm->classify_table_index_by_sw_if_index))
Dave Barachd7cb1b52016-12-09 09:52:16 -0500788 {
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100789 u32 classify_table_index =
Dave Barachd7cb1b52016-12-09 09:52:16 -0500790 lm->classify_table_index_by_sw_if_index[sw_if_index];
791 if (classify_table_index != (u32) ~ 0)
792 {
793 dpo_id_t dpo = DPO_INVALID;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100794
Dave Barachd7cb1b52016-12-09 09:52:16 -0500795 dpo_set (&dpo,
796 DPO_CLASSIFY,
797 DPO_PROTO_IP4,
798 classify_dpo_create (DPO_PROTO_IP4, classify_table_index));
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100799
Dave Barachd7cb1b52016-12-09 09:52:16 -0500800 fib_table_entry_special_dpo_add (fib_index,
801 &pfx,
802 FIB_SOURCE_CLASSIFY,
803 FIB_ENTRY_FLAG_NONE, &dpo);
804 dpo_reset (&dpo);
805 }
806 }
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100807
Neale Ranns32e1c012016-11-22 17:07:28 +0000808 fib_table_entry_update_one_path (fib_index, &pfx,
809 FIB_SOURCE_INTERFACE,
810 (FIB_ENTRY_FLAG_CONNECTED |
811 FIB_ENTRY_FLAG_LOCAL),
Neale Rannsda78f952017-05-24 09:15:43 -0700812 DPO_PROTO_IP4,
Neale Ranns32e1c012016-11-22 17:07:28 +0000813 &pfx.fp_addr,
814 sw_if_index,
815 // invalid FIB index
816 ~0,
817 1, NULL,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500818 FIB_ROUTE_PATH_FLAG_NONE);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700819}
820
821static void
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100822ip4_del_interface_routes (ip4_main_t * im,
823 u32 fib_index,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500824 ip4_address_t * address, u32 address_length)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700825{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500826 fib_prefix_t pfx = {
827 .fp_len = address_length,
828 .fp_proto = FIB_PROTOCOL_IP4,
829 .fp_addr.ip4 = *address,
830 };
Ed Warnickecb9cada2015-12-08 15:45:58 -0700831
Neale Ranns9a69a602017-03-26 10:56:33 -0700832 if (pfx.fp_len <= 30)
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100833 {
Neale Ranns9a69a602017-03-26 10:56:33 -0700834 fib_prefix_t net_pfx = {
835 .fp_len = 32,
836 .fp_proto = FIB_PROTOCOL_IP4,
837 .fp_addr.ip4.as_u32 = address->as_u32 & im->fib_masks[pfx.fp_len],
838 };
839 if (net_pfx.fp_addr.ip4.as_u32 != pfx.fp_addr.ip4.as_u32)
840 fib_table_entry_special_remove(fib_index,
841 &net_pfx,
842 FIB_SOURCE_INTERFACE);
843 net_pfx.fp_addr.ip4.as_u32 |= ~im->fib_masks[pfx.fp_len];
844 if (net_pfx.fp_addr.ip4.as_u32 != pfx.fp_addr.ip4.as_u32)
845 fib_table_entry_special_remove(fib_index,
846 &net_pfx,
847 FIB_SOURCE_INTERFACE);
Dave Barachd7cb1b52016-12-09 09:52:16 -0500848 fib_table_entry_delete (fib_index, &pfx, FIB_SOURCE_INTERFACE);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100849 }
Neale Ranns9a69a602017-03-26 10:56:33 -0700850 else if (pfx.fp_len == 31)
851 {
852 u32 mask = clib_host_to_net_u32(1);
853 fib_prefix_t net_pfx = pfx;
854
855 net_pfx.fp_len = 32;
856 net_pfx.fp_addr.ip4.as_u32 ^= mask;
857
858 fib_table_entry_delete (fib_index, &net_pfx, FIB_SOURCE_INTERFACE);
859 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700860
Dave Barachd7cb1b52016-12-09 09:52:16 -0500861 pfx.fp_len = 32;
862 fib_table_entry_delete (fib_index, &pfx, FIB_SOURCE_INTERFACE);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700863}
864
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100865void
Dave Barachd7cb1b52016-12-09 09:52:16 -0500866ip4_sw_interface_enable_disable (u32 sw_if_index, u32 is_enable)
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100867{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500868 ip4_main_t *im = &ip4_main;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700869
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100870 vec_validate_init_empty (im->ip_enabled_by_sw_if_index, sw_if_index, 0);
871
872 /*
873 * enable/disable only on the 1<->0 transition
874 */
875 if (is_enable)
876 {
877 if (1 != ++im->ip_enabled_by_sw_if_index[sw_if_index])
Dave Barachd7cb1b52016-12-09 09:52:16 -0500878 return;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100879 }
880 else
881 {
Dave Barachd7cb1b52016-12-09 09:52:16 -0500882 ASSERT (im->ip_enabled_by_sw_if_index[sw_if_index] > 0);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100883 if (0 != --im->ip_enabled_by_sw_if_index[sw_if_index])
Dave Barachd7cb1b52016-12-09 09:52:16 -0500884 return;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100885 }
Neale Ranns8269d3d2018-01-30 09:02:20 -0800886 vnet_feature_enable_disable ("ip4-unicast", "ip4-not-enabled", sw_if_index,
Damjan Marion4d489932016-12-09 03:21:27 -0800887 !is_enable, 0, 0);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100888
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100889
Neale Ranns8269d3d2018-01-30 09:02:20 -0800890 vnet_feature_enable_disable ("ip4-multicast", "ip4-not-enabled",
Neale Ranns180279b2017-03-16 15:49:09 -0400891 sw_if_index, !is_enable, 0, 0);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100892}
Ed Warnickecb9cada2015-12-08 15:45:58 -0700893
Ed Warnickecb9cada2015-12-08 15:45:58 -0700894static clib_error_t *
895ip4_add_del_interface_address_internal (vlib_main_t * vm,
896 u32 sw_if_index,
897 ip4_address_t * address,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500898 u32 address_length, u32 is_del)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700899{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500900 vnet_main_t *vnm = vnet_get_main ();
901 ip4_main_t *im = &ip4_main;
902 ip_lookup_main_t *lm = &im->lookup_main;
903 clib_error_t *error = 0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700904 u32 if_address_index, elts_before;
Dave Barachd7cb1b52016-12-09 09:52:16 -0500905 ip4_address_fib_t ip4_af, *addr_fib = 0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700906
Pavel Kotucek57808982017-08-02 08:20:19 +0200907 /* local0 interface doesn't support IP addressing */
908 if (sw_if_index == 0)
909 {
910 return
911 clib_error_create ("local0 interface doesn't support IP addressing");
912 }
913
Ed Warnickecb9cada2015-12-08 15:45:58 -0700914 vec_validate (im->fib_index_by_sw_if_index, sw_if_index);
915 ip4_addr_fib_init (&ip4_af, address,
916 vec_elt (im->fib_index_by_sw_if_index, sw_if_index));
917 vec_add1 (addr_fib, ip4_af);
918
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100919 /* FIXME-LATER
920 * there is no support for adj-fib handling in the presence of overlapping
921 * subnets on interfaces. Easy fix - disallow overlapping subnets, like
922 * most routers do.
923 */
Neale Ranns32e1c012016-11-22 17:07:28 +0000924 /* *INDENT-OFF* */
Dave Barachd7cb1b52016-12-09 09:52:16 -0500925 if (!is_del)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700926 {
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100927 /* When adding an address check that it does not conflict
Dave Barachd7cb1b52016-12-09 09:52:16 -0500928 with an existing address. */
929 ip_interface_address_t *ia;
Neale Ranns32e1c012016-11-22 17:07:28 +0000930 foreach_ip_interface_address
931 (&im->lookup_main, ia, sw_if_index,
932 0 /* honor unnumbered */ ,
933 ({
934 ip4_address_t * x =
935 ip_interface_address_get_address
936 (&im->lookup_main, ia);
937 if (ip4_destination_matches_route
938 (im, address, x, ia->address_length) ||
939 ip4_destination_matches_route (im,
940 x,
941 address,
942 address_length))
943 return
944 clib_error_create
945 ("failed to add %U which conflicts with %U for interface %U",
946 format_ip4_address_and_length, address,
947 address_length,
948 format_ip4_address_and_length, x,
949 ia->address_length,
950 format_vnet_sw_if_index_name, vnm,
951 sw_if_index);
952 }));
Ed Warnickecb9cada2015-12-08 15:45:58 -0700953 }
Neale Ranns32e1c012016-11-22 17:07:28 +0000954 /* *INDENT-ON* */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700955
Ed Warnickecb9cada2015-12-08 15:45:58 -0700956 elts_before = pool_elts (lm->if_address_pool);
957
958 error = ip_interface_address_add_del
Dave Barachd7cb1b52016-12-09 09:52:16 -0500959 (lm, sw_if_index, addr_fib, address_length, is_del, &if_address_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700960 if (error)
961 goto done;
Dave Barach75fc8542016-10-11 16:16:02 -0400962
Dave Barachd7cb1b52016-12-09 09:52:16 -0500963 ip4_sw_interface_enable_disable (sw_if_index, !is_del);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100964
965 if (is_del)
Dave Barachd7cb1b52016-12-09 09:52:16 -0500966 ip4_del_interface_routes (im, ip4_af.fib_index, address, address_length);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100967 else
Dave Barachd7cb1b52016-12-09 09:52:16 -0500968 ip4_add_interface_routes (sw_if_index,
969 im, ip4_af.fib_index,
970 pool_elt_at_index
971 (lm->if_address_pool, if_address_index));
Ed Warnickecb9cada2015-12-08 15:45:58 -0700972
973 /* If pool did not grow/shrink: add duplicate address. */
974 if (elts_before != pool_elts (lm->if_address_pool))
975 {
Dave Barachd7cb1b52016-12-09 09:52:16 -0500976 ip4_add_del_interface_address_callback_t *cb;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700977 vec_foreach (cb, im->add_del_interface_address_callbacks)
978 cb->function (im, cb->function_opaque, sw_if_index,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500979 address, address_length, if_address_index, is_del);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700980 }
981
Dave Barachd7cb1b52016-12-09 09:52:16 -0500982done:
Ed Warnickecb9cada2015-12-08 15:45:58 -0700983 vec_free (addr_fib);
984 return error;
985}
986
987clib_error_t *
Neale Ranns32e1c012016-11-22 17:07:28 +0000988ip4_add_del_interface_address (vlib_main_t * vm,
989 u32 sw_if_index,
990 ip4_address_t * address,
991 u32 address_length, u32 is_del)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700992{
993 return ip4_add_del_interface_address_internal
Dave Barachd7cb1b52016-12-09 09:52:16 -0500994 (vm, sw_if_index, address, address_length, is_del);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700995}
996
Dave Barachd6534602016-06-14 18:38:02 -0400997/* Built-in ip4 unicast rx feature path definition */
Dave Barachd7cb1b52016-12-09 09:52:16 -0500998/* *INDENT-OFF* */
Damjan Marion8b3191e2016-11-09 19:54:20 +0100999VNET_FEATURE_ARC_INIT (ip4_unicast, static) =
1000{
Dave Barachd7cb1b52016-12-09 09:52:16 -05001001 .arc_name = "ip4-unicast",
Damjan Marion892e0762016-12-09 18:52:05 +01001002 .start_nodes = VNET_FEATURES ("ip4-input", "ip4-input-no-checksum"),
1003 .arc_index_ptr = &ip4_main.lookup_main.ucast_feature_arc_index,
1004};
Damjan Marion8b3191e2016-11-09 19:54:20 +01001005
Dave Barachd7cb1b52016-12-09 09:52:16 -05001006VNET_FEATURE_INIT (ip4_flow_classify, static) =
1007{
Damjan Marion8b3191e2016-11-09 19:54:20 +01001008 .arc_name = "ip4-unicast",
Juraj Sloboda506b2452016-08-07 23:45:24 -07001009 .node_name = "ip4-flow-classify",
Damjan Marion8b3191e2016-11-09 19:54:20 +01001010 .runs_before = VNET_FEATURES ("ip4-inacl"),
Juraj Sloboda506b2452016-08-07 23:45:24 -07001011};
1012
Dave Barachd7cb1b52016-12-09 09:52:16 -05001013VNET_FEATURE_INIT (ip4_inacl, static) =
1014{
Damjan Marion8b3191e2016-11-09 19:54:20 +01001015 .arc_name = "ip4-unicast",
Dave Barach75fc8542016-10-11 16:16:02 -04001016 .node_name = "ip4-inacl",
Damjan Marion8b3191e2016-11-09 19:54:20 +01001017 .runs_before = VNET_FEATURES ("ip4-source-check-via-rx"),
Dave Barachd6534602016-06-14 18:38:02 -04001018};
1019
Dave Barachd7cb1b52016-12-09 09:52:16 -05001020VNET_FEATURE_INIT (ip4_source_check_1, static) =
1021{
Damjan Marion8b3191e2016-11-09 19:54:20 +01001022 .arc_name = "ip4-unicast",
Dave Barachd6534602016-06-14 18:38:02 -04001023 .node_name = "ip4-source-check-via-rx",
Damjan Marion8b3191e2016-11-09 19:54:20 +01001024 .runs_before = VNET_FEATURES ("ip4-source-check-via-any"),
Dave Barachd6534602016-06-14 18:38:02 -04001025};
1026
Dave Barachd7cb1b52016-12-09 09:52:16 -05001027VNET_FEATURE_INIT (ip4_source_check_2, static) =
1028{
Damjan Marion8b3191e2016-11-09 19:54:20 +01001029 .arc_name = "ip4-unicast",
Dave Barachd6534602016-06-14 18:38:02 -04001030 .node_name = "ip4-source-check-via-any",
Damjan Marion8b3191e2016-11-09 19:54:20 +01001031 .runs_before = VNET_FEATURES ("ip4-policer-classify"),
Dave Barachd6534602016-06-14 18:38:02 -04001032};
1033
Dave Barachd7cb1b52016-12-09 09:52:16 -05001034VNET_FEATURE_INIT (ip4_source_and_port_range_check_rx, static) =
1035{
Damjan Marion8b3191e2016-11-09 19:54:20 +01001036 .arc_name = "ip4-unicast",
Dave Barach5331c722016-08-17 11:54:30 -04001037 .node_name = "ip4-source-and-port-range-check-rx",
Damjan Marion8b3191e2016-11-09 19:54:20 +01001038 .runs_before = VNET_FEATURES ("ip4-policer-classify"),
Dave Barach6f9bca22016-04-30 10:25:32 -04001039};
1040
Dave Barachd7cb1b52016-12-09 09:52:16 -05001041VNET_FEATURE_INIT (ip4_policer_classify, static) =
1042{
Damjan Marion8b3191e2016-11-09 19:54:20 +01001043 .arc_name = "ip4-unicast",
Matus Fabian70e6a8d2016-06-20 08:10:42 -07001044 .node_name = "ip4-policer-classify",
Damjan Marion8b3191e2016-11-09 19:54:20 +01001045 .runs_before = VNET_FEATURES ("ipsec-input-ip4"),
Matus Fabian70e6a8d2016-06-20 08:10:42 -07001046};
1047
Dave Barachd7cb1b52016-12-09 09:52:16 -05001048VNET_FEATURE_INIT (ip4_ipsec, static) =
1049{
Damjan Marion8b3191e2016-11-09 19:54:20 +01001050 .arc_name = "ip4-unicast",
Dave Barachd6534602016-06-14 18:38:02 -04001051 .node_name = "ipsec-input-ip4",
Damjan Marion8b3191e2016-11-09 19:54:20 +01001052 .runs_before = VNET_FEATURES ("vpath-input-ip4"),
Dave Barachd6534602016-06-14 18:38:02 -04001053};
1054
Dave Barachd7cb1b52016-12-09 09:52:16 -05001055VNET_FEATURE_INIT (ip4_vpath, static) =
1056{
Damjan Marion8b3191e2016-11-09 19:54:20 +01001057 .arc_name = "ip4-unicast",
Dave Barachd6534602016-06-14 18:38:02 -04001058 .node_name = "vpath-input-ip4",
John Lo37682e12016-11-30 12:51:39 -05001059 .runs_before = VNET_FEATURES ("ip4-vxlan-bypass"),
1060};
1061
Dave Barachd7cb1b52016-12-09 09:52:16 -05001062VNET_FEATURE_INIT (ip4_vxlan_bypass, static) =
1063{
John Lo37682e12016-11-30 12:51:39 -05001064 .arc_name = "ip4-unicast",
1065 .node_name = "ip4-vxlan-bypass",
Damjan Marion8b3191e2016-11-09 19:54:20 +01001066 .runs_before = VNET_FEATURES ("ip4-lookup"),
Dave Barachd6534602016-06-14 18:38:02 -04001067};
1068
Neale Ranns8269d3d2018-01-30 09:02:20 -08001069VNET_FEATURE_INIT (ip4_not_enabled, static) =
Dave Barachd7cb1b52016-12-09 09:52:16 -05001070{
Damjan Marion8b3191e2016-11-09 19:54:20 +01001071 .arc_name = "ip4-unicast",
Neale Ranns8269d3d2018-01-30 09:02:20 -08001072 .node_name = "ip4-not-enabled",
Neale Ranns180279b2017-03-16 15:49:09 -04001073 .runs_before = VNET_FEATURES ("ip4-lookup"),
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001074};
1075
Neale Ranns180279b2017-03-16 15:49:09 -04001076VNET_FEATURE_INIT (ip4_lookup, static) =
1077{
1078 .arc_name = "ip4-unicast",
1079 .node_name = "ip4-lookup",
1080 .runs_before = 0, /* not before any other features */
1081};
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001082
Dave Barachd6534602016-06-14 18:38:02 -04001083/* Built-in ip4 multicast rx feature path definition */
Damjan Marion8b3191e2016-11-09 19:54:20 +01001084VNET_FEATURE_ARC_INIT (ip4_multicast, static) =
1085{
Dave Barachd7cb1b52016-12-09 09:52:16 -05001086 .arc_name = "ip4-multicast",
Damjan Marion8b3191e2016-11-09 19:54:20 +01001087 .start_nodes = VNET_FEATURES ("ip4-input", "ip4-input-no-checksum"),
1088 .arc_index_ptr = &ip4_main.lookup_main.mcast_feature_arc_index,
1089};
1090
Dave Barachd7cb1b52016-12-09 09:52:16 -05001091VNET_FEATURE_INIT (ip4_vpath_mc, static) =
1092{
Damjan Marion8b3191e2016-11-09 19:54:20 +01001093 .arc_name = "ip4-multicast",
Dave Barachd6534602016-06-14 18:38:02 -04001094 .node_name = "vpath-input-ip4",
Neale Ranns32e1c012016-11-22 17:07:28 +00001095 .runs_before = VNET_FEATURES ("ip4-mfib-forward-lookup"),
Dave Barachd6534602016-06-14 18:38:02 -04001096};
1097
Neale Ranns8269d3d2018-01-30 09:02:20 -08001098VNET_FEATURE_INIT (ip4_mc_not_enabled, static) =
Dave Barachd7cb1b52016-12-09 09:52:16 -05001099{
Damjan Marion8b3191e2016-11-09 19:54:20 +01001100 .arc_name = "ip4-multicast",
Neale Ranns8269d3d2018-01-30 09:02:20 -08001101 .node_name = "ip4-not-enabled",
Neale Ranns180279b2017-03-16 15:49:09 -04001102 .runs_before = VNET_FEATURES ("ip4-mfib-forward-lookup"),
1103};
1104
1105VNET_FEATURE_INIT (ip4_lookup_mc, static) =
1106{
1107 .arc_name = "ip4-multicast",
1108 .node_name = "ip4-mfib-forward-lookup",
Dave Barachd7cb1b52016-12-09 09:52:16 -05001109 .runs_before = 0, /* last feature */
Neale Ranns5e575b12016-10-03 09:40:25 +01001110};
Dave Barach5331c722016-08-17 11:54:30 -04001111
1112/* Source and port-range check ip4 tx feature path definition */
Damjan Marion8b3191e2016-11-09 19:54:20 +01001113VNET_FEATURE_ARC_INIT (ip4_output, static) =
1114{
Dave Barachd7cb1b52016-12-09 09:52:16 -05001115 .arc_name = "ip4-output",
Neale Rannsf068c3e2018-01-03 04:18:48 -08001116 .start_nodes = VNET_FEATURES ("ip4-rewrite", "ip4-midchain", "ip4-dvr-dpo"),
Damjan Marion8b3191e2016-11-09 19:54:20 +01001117 .arc_index_ptr = &ip4_main.lookup_main.output_feature_arc_index,
1118};
Dave Barach5331c722016-08-17 11:54:30 -04001119
Dave Barachd7cb1b52016-12-09 09:52:16 -05001120VNET_FEATURE_INIT (ip4_source_and_port_range_check_tx, static) =
1121{
Damjan Marion8b3191e2016-11-09 19:54:20 +01001122 .arc_name = "ip4-output",
1123 .node_name = "ip4-source-and-port-range-check-tx",
Matus Fabian08a6f012016-11-15 06:08:51 -08001124 .runs_before = VNET_FEATURES ("ipsec-output-ip4"),
1125};
1126
Dave Barachd7cb1b52016-12-09 09:52:16 -05001127VNET_FEATURE_INIT (ip4_ipsec_output, static) =
1128{
Matus Fabian08a6f012016-11-15 06:08:51 -08001129 .arc_name = "ip4-output",
1130 .node_name = "ipsec-output-ip4",
Damjan Marion8b3191e2016-11-09 19:54:20 +01001131 .runs_before = VNET_FEATURES ("interface-output"),
Dave Barach5331c722016-08-17 11:54:30 -04001132};
1133
1134/* Built-in ip4 tx feature path definition */
Dave Barachd7cb1b52016-12-09 09:52:16 -05001135VNET_FEATURE_INIT (ip4_interface_output, static) =
1136{
Damjan Marion8b3191e2016-11-09 19:54:20 +01001137 .arc_name = "ip4-output",
Dave Barach5331c722016-08-17 11:54:30 -04001138 .node_name = "interface-output",
Dave Barachd7cb1b52016-12-09 09:52:16 -05001139 .runs_before = 0, /* not before any other features */
Dave Barach5331c722016-08-17 11:54:30 -04001140};
Dave Barachd7cb1b52016-12-09 09:52:16 -05001141/* *INDENT-ON* */
Dave Barachd6534602016-06-14 18:38:02 -04001142
Ed Warnickecb9cada2015-12-08 15:45:58 -07001143static clib_error_t *
Dave Barachd7cb1b52016-12-09 09:52:16 -05001144ip4_sw_interface_add_del (vnet_main_t * vnm, u32 sw_if_index, u32 is_add)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001145{
Dave Barachd7cb1b52016-12-09 09:52:16 -05001146 ip4_main_t *im = &ip4_main;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001147
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001148 /* Fill in lookup tables with default table (0). */
1149 vec_validate (im->fib_index_by_sw_if_index, sw_if_index);
Neale Ranns32e1c012016-11-22 17:07:28 +00001150 vec_validate (im->mfib_index_by_sw_if_index, sw_if_index);
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001151
Pavel Kotucek9f5a2b62017-06-14 13:56:55 +02001152 if (!is_add)
1153 {
1154 ip4_main_t *im4 = &ip4_main;
1155 ip_lookup_main_t *lm4 = &im4->lookup_main;
1156 ip_interface_address_t *ia = 0;
1157 ip4_address_t *address;
1158 vlib_main_t *vm = vlib_get_main ();
1159
1160 /* *INDENT-OFF* */
1161 foreach_ip_interface_address (lm4, ia, sw_if_index, 1 /* honor unnumbered */,
1162 ({
1163 address = ip_interface_address_get_address (lm4, ia);
1164 ip4_add_del_interface_address(vm, sw_if_index, address, ia->address_length, 1);
1165 }));
1166 /* *INDENT-ON* */
1167 }
1168
Neale Ranns8269d3d2018-01-30 09:02:20 -08001169 vnet_feature_enable_disable ("ip4-unicast", "ip4-not-enabled", sw_if_index,
Damjan Marion8b3191e2016-11-09 19:54:20 +01001170 is_add, 0, 0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001171
Neale Ranns8269d3d2018-01-30 09:02:20 -08001172 vnet_feature_enable_disable ("ip4-multicast", "ip4-not-enabled",
1173 sw_if_index, is_add, 0, 0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001174
Ed Warnickecb9cada2015-12-08 15:45:58 -07001175 return /* no error */ 0;
1176}
1177
1178VNET_SW_INTERFACE_ADD_DEL_FUNCTION (ip4_sw_interface_add_del);
1179
Ed Warnickecb9cada2015-12-08 15:45:58 -07001180/* Global IP4 main. */
1181ip4_main_t ip4_main;
1182
1183clib_error_t *
1184ip4_lookup_init (vlib_main_t * vm)
1185{
Dave Barachd7cb1b52016-12-09 09:52:16 -05001186 ip4_main_t *im = &ip4_main;
1187 clib_error_t *error;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001188 uword i;
1189
Damjan Marion8b3191e2016-11-09 19:54:20 +01001190 if ((error = vlib_call_init_function (vm, vnet_feature_init)))
1191 return error;
Neale Ranns1ec36522017-11-29 05:20:37 -08001192 if ((error = vlib_call_init_function (vm, ip4_mtrie_module_init)))
1193 return (error);
1194 if ((error = vlib_call_init_function (vm, fib_module_init)))
1195 return error;
1196 if ((error = vlib_call_init_function (vm, mfib_module_init)))
1197 return error;
Damjan Marion8b3191e2016-11-09 19:54:20 +01001198
Ed Warnickecb9cada2015-12-08 15:45:58 -07001199 for (i = 0; i < ARRAY_LEN (im->fib_masks); i++)
1200 {
1201 u32 m;
1202
1203 if (i < 32)
1204 m = pow2_mask (i) << (32 - i);
Dave Barach75fc8542016-10-11 16:16:02 -04001205 else
Ed Warnickecb9cada2015-12-08 15:45:58 -07001206 m = ~0;
1207 im->fib_masks[i] = clib_host_to_net_u32 (m);
1208 }
1209
Ed Warnickecb9cada2015-12-08 15:45:58 -07001210 ip_lookup_init (&im->lookup_main, /* is_ip6 */ 0);
1211
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001212 /* Create FIB with index 0 and table id of 0. */
Neale Ranns15002542017-09-10 04:39:11 -07001213 fib_table_find_or_create_and_lock (FIB_PROTOCOL_IP4, 0,
1214 FIB_SOURCE_DEFAULT_ROUTE);
1215 mfib_table_find_or_create_and_lock (FIB_PROTOCOL_IP4, 0,
1216 MFIB_SOURCE_DEFAULT_ROUTE);
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001217
Ed Warnickecb9cada2015-12-08 15:45:58 -07001218 {
Dave Barachd7cb1b52016-12-09 09:52:16 -05001219 pg_node_t *pn;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001220 pn = pg_get_node (ip4_lookup_node.index);
1221 pn->unformat_edit = unformat_pg_ip4_header;
1222 }
1223
1224 {
1225 ethernet_arp_header_t h;
1226
1227 memset (&h, 0, sizeof (h));
1228
1229 /* Set target ethernet address to all zeros. */
Dave Barachd7cb1b52016-12-09 09:52:16 -05001230 memset (h.ip4_over_ethernet[1].ethernet, 0,
1231 sizeof (h.ip4_over_ethernet[1].ethernet));
Ed Warnickecb9cada2015-12-08 15:45:58 -07001232
1233#define _16(f,v) h.f = clib_host_to_net_u16 (v);
1234#define _8(f,v) h.f = v;
1235 _16 (l2_type, ETHERNET_ARP_HARDWARE_TYPE_ethernet);
1236 _16 (l3_type, ETHERNET_TYPE_IP4);
1237 _8 (n_l2_address_bytes, 6);
1238 _8 (n_l3_address_bytes, 4);
1239 _16 (opcode, ETHERNET_ARP_OPCODE_request);
1240#undef _16
1241#undef _8
1242
Dave Barachd7cb1b52016-12-09 09:52:16 -05001243 vlib_packet_template_init (vm, &im->ip4_arp_request_packet_template,
Ed Warnickecb9cada2015-12-08 15:45:58 -07001244 /* data */ &h,
1245 sizeof (h),
1246 /* alloc chunk size */ 8,
1247 "ip4 arp");
1248 }
1249
Dave Barach203c6322016-06-26 10:29:03 -04001250 return error;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001251}
1252
1253VLIB_INIT_FUNCTION (ip4_lookup_init);
1254
Dave Barachd7cb1b52016-12-09 09:52:16 -05001255typedef struct
1256{
Ed Warnickecb9cada2015-12-08 15:45:58 -07001257 /* Adjacency taken. */
Vengada Govindanf1544482016-09-28 02:45:57 -07001258 u32 dpo_index;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001259 u32 flow_hash;
1260 u32 fib_index;
1261
1262 /* Packet data, possibly *after* rewrite. */
Dave Barachd7cb1b52016-12-09 09:52:16 -05001263 u8 packet_data[64 - 1 * sizeof (u32)];
1264}
1265ip4_forward_next_trace_t;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001266
Dave Barachd7cb1b52016-12-09 09:52:16 -05001267u8 *
1268format_ip4_forward_next_trace (u8 * s, va_list * args)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001269{
1270 CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *);
1271 CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *);
Dave Barachd7cb1b52016-12-09 09:52:16 -05001272 ip4_forward_next_trace_t *t = va_arg (*args, ip4_forward_next_trace_t *);
Christophe Fontained3c008d2017-10-02 18:10:54 +02001273 u32 indent = format_get_indent (s);
Pierre Pfistera38c3df2016-06-13 10:28:09 +01001274 s = format (s, "%U%U",
John Loac8146c2016-09-27 17:44:02 -04001275 format_white_space, indent,
1276 format_ip4_header, t->packet_data, sizeof (t->packet_data));
Pierre Pfistera38c3df2016-06-13 10:28:09 +01001277 return s;
1278}
1279
Dave Barachd7cb1b52016-12-09 09:52:16 -05001280static u8 *
1281format_ip4_lookup_trace (u8 * s, va_list * args)
Pierre Pfistera38c3df2016-06-13 10:28:09 +01001282{
1283 CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *);
1284 CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *);
Dave Barachd7cb1b52016-12-09 09:52:16 -05001285 ip4_forward_next_trace_t *t = va_arg (*args, ip4_forward_next_trace_t *);
Christophe Fontained3c008d2017-10-02 18:10:54 +02001286 u32 indent = format_get_indent (s);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001287
John Loac8146c2016-09-27 17:44:02 -04001288 s = format (s, "fib %d dpo-idx %d flow hash: 0x%08x",
Dave Barachd7cb1b52016-12-09 09:52:16 -05001289 t->fib_index, t->dpo_index, t->flow_hash);
Pierre Pfistera38c3df2016-06-13 10:28:09 +01001290 s = format (s, "\n%U%U",
Dave Barachd7cb1b52016-12-09 09:52:16 -05001291 format_white_space, indent,
1292 format_ip4_header, t->packet_data, sizeof (t->packet_data));
Pierre Pfistera38c3df2016-06-13 10:28:09 +01001293 return s;
1294}
Ed Warnickecb9cada2015-12-08 15:45:58 -07001295
Dave Barachd7cb1b52016-12-09 09:52:16 -05001296static u8 *
1297format_ip4_rewrite_trace (u8 * s, va_list * args)
Pierre Pfistera38c3df2016-06-13 10:28:09 +01001298{
1299 CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *);
1300 CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *);
Dave Barachd7cb1b52016-12-09 09:52:16 -05001301 ip4_forward_next_trace_t *t = va_arg (*args, ip4_forward_next_trace_t *);
Christophe Fontained3c008d2017-10-02 18:10:54 +02001302 u32 indent = format_get_indent (s);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001303
Vengada Govindanf1544482016-09-28 02:45:57 -07001304 s = format (s, "tx_sw_if_index %d dpo-idx %d : %U flow hash: 0x%08x",
Dave Barachd7cb1b52016-12-09 09:52:16 -05001305 t->fib_index, t->dpo_index, format_ip_adjacency,
1306 t->dpo_index, FORMAT_IP_ADJACENCY_NONE, t->flow_hash);
Pierre Pfistera38c3df2016-06-13 10:28:09 +01001307 s = format (s, "\n%U%U",
Dave Barachd7cb1b52016-12-09 09:52:16 -05001308 format_white_space, indent,
1309 format_ip_adjacency_packet_data,
Neale Rannsb069a692017-03-15 12:34:25 -04001310 t->dpo_index, t->packet_data, sizeof (t->packet_data));
Ed Warnickecb9cada2015-12-08 15:45:58 -07001311 return s;
1312}
1313
1314/* Common trace function for all ip4-forward next nodes. */
1315void
1316ip4_forward_next_trace (vlib_main_t * vm,
1317 vlib_node_runtime_t * node,
Dave Barachd7cb1b52016-12-09 09:52:16 -05001318 vlib_frame_t * frame, vlib_rx_or_tx_t which_adj_index)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001319{
Dave Barachd7cb1b52016-12-09 09:52:16 -05001320 u32 *from, n_left;
1321 ip4_main_t *im = &ip4_main;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001322
1323 n_left = frame->n_vectors;
1324 from = vlib_frame_vector_args (frame);
Dave Barach75fc8542016-10-11 16:16:02 -04001325
Ed Warnickecb9cada2015-12-08 15:45:58 -07001326 while (n_left >= 4)
1327 {
1328 u32 bi0, bi1;
Dave Barachd7cb1b52016-12-09 09:52:16 -05001329 vlib_buffer_t *b0, *b1;
1330 ip4_forward_next_trace_t *t0, *t1;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001331
1332 /* Prefetch next iteration. */
1333 vlib_prefetch_buffer_with_index (vm, from[2], LOAD);
1334 vlib_prefetch_buffer_with_index (vm, from[3], LOAD);
1335
1336 bi0 = from[0];
1337 bi1 = from[1];
1338
1339 b0 = vlib_get_buffer (vm, bi0);
1340 b1 = vlib_get_buffer (vm, bi1);
1341
1342 if (b0->flags & VLIB_BUFFER_IS_TRACED)
1343 {
1344 t0 = vlib_add_trace (vm, node, b0, sizeof (t0[0]));
Vengada Govindanf1544482016-09-28 02:45:57 -07001345 t0->dpo_index = vnet_buffer (b0)->ip.adj_index[which_adj_index];
Ed Warnickecb9cada2015-12-08 15:45:58 -07001346 t0->flow_hash = vnet_buffer (b0)->ip.flow_hash;
Dave Barachd7cb1b52016-12-09 09:52:16 -05001347 t0->fib_index =
1348 (vnet_buffer (b0)->sw_if_index[VLIB_TX] !=
1349 (u32) ~ 0) ? vnet_buffer (b0)->sw_if_index[VLIB_TX] :
1350 vec_elt (im->fib_index_by_sw_if_index,
1351 vnet_buffer (b0)->sw_if_index[VLIB_RX]);
Pierre Pfister0febaf12016-06-08 12:23:21 +01001352
Damjan Marionf1213b82016-03-13 02:22:06 +01001353 clib_memcpy (t0->packet_data,
Dave Barachd7cb1b52016-12-09 09:52:16 -05001354 vlib_buffer_get_current (b0),
1355 sizeof (t0->packet_data));
Ed Warnickecb9cada2015-12-08 15:45:58 -07001356 }
1357 if (b1->flags & VLIB_BUFFER_IS_TRACED)
1358 {
1359 t1 = vlib_add_trace (vm, node, b1, sizeof (t1[0]));
Vengada Govindanf1544482016-09-28 02:45:57 -07001360 t1->dpo_index = vnet_buffer (b1)->ip.adj_index[which_adj_index];
Ed Warnickecb9cada2015-12-08 15:45:58 -07001361 t1->flow_hash = vnet_buffer (b1)->ip.flow_hash;
Dave Barachd7cb1b52016-12-09 09:52:16 -05001362 t1->fib_index =
1363 (vnet_buffer (b1)->sw_if_index[VLIB_TX] !=
1364 (u32) ~ 0) ? vnet_buffer (b1)->sw_if_index[VLIB_TX] :
1365 vec_elt (im->fib_index_by_sw_if_index,
1366 vnet_buffer (b1)->sw_if_index[VLIB_RX]);
1367 clib_memcpy (t1->packet_data, vlib_buffer_get_current (b1),
1368 sizeof (t1->packet_data));
Ed Warnickecb9cada2015-12-08 15:45:58 -07001369 }
1370 from += 2;
1371 n_left -= 2;
1372 }
1373
1374 while (n_left >= 1)
1375 {
1376 u32 bi0;
Dave Barachd7cb1b52016-12-09 09:52:16 -05001377 vlib_buffer_t *b0;
1378 ip4_forward_next_trace_t *t0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001379
1380 bi0 = from[0];
1381
1382 b0 = vlib_get_buffer (vm, bi0);
1383
1384 if (b0->flags & VLIB_BUFFER_IS_TRACED)
1385 {
1386 t0 = vlib_add_trace (vm, node, b0, sizeof (t0[0]));
Vengada Govindanf1544482016-09-28 02:45:57 -07001387 t0->dpo_index = vnet_buffer (b0)->ip.adj_index[which_adj_index];
Ed Warnickecb9cada2015-12-08 15:45:58 -07001388 t0->flow_hash = vnet_buffer (b0)->ip.flow_hash;
Dave Barachd7cb1b52016-12-09 09:52:16 -05001389 t0->fib_index =
1390 (vnet_buffer (b0)->sw_if_index[VLIB_TX] !=
1391 (u32) ~ 0) ? vnet_buffer (b0)->sw_if_index[VLIB_TX] :
1392 vec_elt (im->fib_index_by_sw_if_index,
1393 vnet_buffer (b0)->sw_if_index[VLIB_RX]);
1394 clib_memcpy (t0->packet_data, vlib_buffer_get_current (b0),
1395 sizeof (t0->packet_data));
Ed Warnickecb9cada2015-12-08 15:45:58 -07001396 }
1397 from += 1;
1398 n_left -= 1;
1399 }
1400}
1401
Ed Warnickecb9cada2015-12-08 15:45:58 -07001402/* Compute TCP/UDP/ICMP4 checksum in software. */
1403u16
1404ip4_tcp_udp_compute_checksum (vlib_main_t * vm, vlib_buffer_t * p0,
1405 ip4_header_t * ip0)
1406{
1407 ip_csum_t sum0;
1408 u32 ip_header_length, payload_length_host_byte_order;
Florin Corasb2215d62017-08-01 16:56:58 -07001409 u32 n_this_buffer, n_bytes_left, n_ip_bytes_this_buffer;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001410 u16 sum16;
Dave Barachd7cb1b52016-12-09 09:52:16 -05001411 void *data_this_buffer;
Dave Barach75fc8542016-10-11 16:16:02 -04001412
Ed Warnickecb9cada2015-12-08 15:45:58 -07001413 /* Initialize checksum with ip header. */
1414 ip_header_length = ip4_header_bytes (ip0);
Dave Barachd7cb1b52016-12-09 09:52:16 -05001415 payload_length_host_byte_order =
1416 clib_net_to_host_u16 (ip0->length) - ip_header_length;
1417 sum0 =
1418 clib_host_to_net_u32 (payload_length_host_byte_order +
1419 (ip0->protocol << 16));
Ed Warnickecb9cada2015-12-08 15:45:58 -07001420
1421 if (BITS (uword) == 32)
1422 {
Dave Barachd7cb1b52016-12-09 09:52:16 -05001423 sum0 =
1424 ip_csum_with_carry (sum0,
1425 clib_mem_unaligned (&ip0->src_address, u32));
1426 sum0 =
1427 ip_csum_with_carry (sum0,
1428 clib_mem_unaligned (&ip0->dst_address, u32));
Ed Warnickecb9cada2015-12-08 15:45:58 -07001429 }
1430 else
Dave Barachd7cb1b52016-12-09 09:52:16 -05001431 sum0 =
1432 ip_csum_with_carry (sum0, clib_mem_unaligned (&ip0->src_address, u64));
Ed Warnickecb9cada2015-12-08 15:45:58 -07001433
1434 n_bytes_left = n_this_buffer = payload_length_host_byte_order;
1435 data_this_buffer = (void *) ip0 + ip_header_length;
Neale Rannsd91c1db2017-07-31 02:30:50 -07001436 n_ip_bytes_this_buffer =
1437 p0->current_length - (((u8 *) ip0 - p0->data) - p0->current_data);
Florin Corasb2215d62017-08-01 16:56:58 -07001438 if (n_this_buffer + ip_header_length > n_ip_bytes_this_buffer)
1439 {
1440 n_this_buffer = n_ip_bytes_this_buffer > ip_header_length ?
Neale Rannsd91c1db2017-07-31 02:30:50 -07001441 n_ip_bytes_this_buffer - ip_header_length : 0;
Florin Corasb2215d62017-08-01 16:56:58 -07001442 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07001443 while (1)
1444 {
1445 sum0 = ip_incremental_checksum (sum0, data_this_buffer, n_this_buffer);
1446 n_bytes_left -= n_this_buffer;
1447 if (n_bytes_left == 0)
1448 break;
1449
1450 ASSERT (p0->flags & VLIB_BUFFER_NEXT_PRESENT);
1451 p0 = vlib_get_buffer (vm, p0->next_buffer);
1452 data_this_buffer = vlib_buffer_get_current (p0);
1453 n_this_buffer = p0->current_length;
1454 }
1455
Dave Barachd7cb1b52016-12-09 09:52:16 -05001456 sum16 = ~ip_csum_fold (sum0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001457
1458 return sum16;
1459}
1460
John Lo37682e12016-11-30 12:51:39 -05001461u32
Ed Warnickecb9cada2015-12-08 15:45:58 -07001462ip4_tcp_udp_validate_checksum (vlib_main_t * vm, vlib_buffer_t * p0)
1463{
Dave Barachd7cb1b52016-12-09 09:52:16 -05001464 ip4_header_t *ip0 = vlib_buffer_get_current (p0);
1465 udp_header_t *udp0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001466 u16 sum16;
1467
1468 ASSERT (ip0->protocol == IP_PROTOCOL_TCP
1469 || ip0->protocol == IP_PROTOCOL_UDP);
1470
1471 udp0 = (void *) (ip0 + 1);
1472 if (ip0->protocol == IP_PROTOCOL_UDP && udp0->checksum == 0)
1473 {
Damjan Marion213b5aa2017-07-13 21:19:27 +02001474 p0->flags |= (VNET_BUFFER_F_L4_CHECKSUM_COMPUTED
1475 | VNET_BUFFER_F_L4_CHECKSUM_CORRECT);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001476 return p0->flags;
1477 }
1478
1479 sum16 = ip4_tcp_udp_compute_checksum (vm, p0, ip0);
1480
Damjan Marion213b5aa2017-07-13 21:19:27 +02001481 p0->flags |= (VNET_BUFFER_F_L4_CHECKSUM_COMPUTED
1482 | ((sum16 == 0) << VNET_BUFFER_F_LOG2_L4_CHECKSUM_CORRECT));
Ed Warnickecb9cada2015-12-08 15:45:58 -07001483
1484 return p0->flags;
1485}
1486
Dave Barach68b0fb02017-02-28 15:15:56 -05001487/* *INDENT-OFF* */
1488VNET_FEATURE_ARC_INIT (ip4_local) =
1489{
1490 .arc_name = "ip4-local",
1491 .start_nodes = VNET_FEATURES ("ip4-local"),
1492};
1493/* *INDENT-ON* */
1494
Florin Coras20a14b92017-08-15 22:47:22 -07001495static inline void
1496ip4_local_validate_l4 (vlib_main_t * vm, vlib_buffer_t * p, ip4_header_t * ip,
1497 u8 is_udp, u8 * error, u8 * good_tcp_udp)
1498{
1499 u32 flags0;
1500 flags0 = ip4_tcp_udp_validate_checksum (vm, p);
1501 *good_tcp_udp = (flags0 & VNET_BUFFER_F_L4_CHECKSUM_CORRECT) != 0;
1502 if (is_udp)
1503 {
1504 udp_header_t *udp;
1505 u32 ip_len, udp_len;
1506 i32 len_diff;
1507 udp = ip4_next_header (ip);
1508 /* Verify UDP length. */
1509 ip_len = clib_net_to_host_u16 (ip->length);
1510 udp_len = clib_net_to_host_u16 (udp->length);
1511
1512 len_diff = ip_len - udp_len;
1513 *good_tcp_udp &= len_diff >= 0;
1514 *error = len_diff < 0 ? IP4_ERROR_UDP_LENGTH : *error;
1515 }
1516}
1517
/*
 * True when a packet needs its L4 checksum validated in software: it is
 * TCP/UDP and none of the "checksum already computed" or "checksum
 * offload" buffer flags is set.  Arguments are fully parenthesized so
 * compound expressions can be passed safely.
 */
#define ip4_local_do_l4_check(is_tcp_udp, flags)                        \
    ((is_tcp_udp) && !(((flags) & VNET_BUFFER_F_L4_CHECKSUM_COMPUTED)   \
                       || ((flags) & VNET_BUFFER_F_OFFLOAD_TCP_CKSUM)   \
                       || ((flags) & VNET_BUFFER_F_OFFLOAD_UDP_CKSUM)))
Florin Coras20a14b92017-08-15 22:47:22 -07001522
Dave Barach68b0fb02017-02-28 15:15:56 -05001523static inline uword
1524ip4_local_inline (vlib_main_t * vm,
1525 vlib_node_runtime_t * node,
1526 vlib_frame_t * frame, int head_of_feature_arc)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001527{
Dave Barachd7cb1b52016-12-09 09:52:16 -05001528 ip4_main_t *im = &ip4_main;
1529 ip_lookup_main_t *lm = &im->lookup_main;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001530 ip_local_next_t next_index;
Dave Barachd7cb1b52016-12-09 09:52:16 -05001531 u32 *from, *to_next, n_left_from, n_left_to_next;
1532 vlib_node_runtime_t *error_node =
1533 vlib_node_get_runtime (vm, ip4_input_node.index);
Dave Barach68b0fb02017-02-28 15:15:56 -05001534 u8 arc_index = vnet_feat_arc_ip4_local.feature_arc_index;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001535
1536 from = vlib_frame_vector_args (frame);
1537 n_left_from = frame->n_vectors;
1538 next_index = node->cached_next_index;
Dave Barach75fc8542016-10-11 16:16:02 -04001539
Ed Warnickecb9cada2015-12-08 15:45:58 -07001540 if (node->flags & VLIB_NODE_FLAG_TRACE)
1541 ip4_forward_next_trace (vm, node, frame, VLIB_TX);
1542
1543 while (n_left_from > 0)
1544 {
1545 vlib_get_next_frame (vm, node, next_index, to_next, n_left_to_next);
1546
1547 while (n_left_from >= 4 && n_left_to_next >= 2)
Dave Barachd7cb1b52016-12-09 09:52:16 -05001548 {
1549 vlib_buffer_t *p0, *p1;
1550 ip4_header_t *ip0, *ip1;
Dave Barachd7cb1b52016-12-09 09:52:16 -05001551 ip4_fib_mtrie_t *mtrie0, *mtrie1;
1552 ip4_fib_mtrie_leaf_t leaf0, leaf1;
1553 const dpo_id_t *dpo0, *dpo1;
1554 const load_balance_t *lb0, *lb1;
Florin Coras20a14b92017-08-15 22:47:22 -07001555 u32 pi0, next0, fib_index0, lbi0;
1556 u32 pi1, next1, fib_index1, lbi1;
Dave Barachd7cb1b52016-12-09 09:52:16 -05001557 u8 error0, is_udp0, is_tcp_udp0, good_tcp_udp0, proto0;
1558 u8 error1, is_udp1, is_tcp_udp1, good_tcp_udp1, proto1;
Dave Barach68b0fb02017-02-28 15:15:56 -05001559 u32 sw_if_index0, sw_if_index1;
Dave Barach75fc8542016-10-11 16:16:02 -04001560
Dave Barachd7cb1b52016-12-09 09:52:16 -05001561 pi0 = to_next[0] = from[0];
1562 pi1 = to_next[1] = from[1];
1563 from += 2;
1564 n_left_from -= 2;
1565 to_next += 2;
1566 n_left_to_next -= 2;
Dave Barach75fc8542016-10-11 16:16:02 -04001567
Dave Barach68b0fb02017-02-28 15:15:56 -05001568 next0 = next1 = IP_LOCAL_NEXT_DROP;
Florin Coras20a14b92017-08-15 22:47:22 -07001569 error0 = error1 = IP4_ERROR_UNKNOWN_PROTOCOL;
Dave Barach68b0fb02017-02-28 15:15:56 -05001570
Ed Warnickecb9cada2015-12-08 15:45:58 -07001571 p0 = vlib_get_buffer (vm, pi0);
1572 p1 = vlib_get_buffer (vm, pi1);
1573
1574 ip0 = vlib_buffer_get_current (p0);
1575 ip1 = vlib_buffer_get_current (p1);
1576
Damjan Marion072401e2017-07-13 18:53:27 +02001577 vnet_buffer (p0)->l3_hdr_offset = p0->current_data;
1578 vnet_buffer (p1)->l3_hdr_offset = p1->current_data;
Klement Sekera0e3c0de2016-09-29 14:43:44 +02001579
Dave Barach68b0fb02017-02-28 15:15:56 -05001580 sw_if_index0 = vnet_buffer (p0)->sw_if_index[VLIB_RX];
1581 sw_if_index1 = vnet_buffer (p1)->sw_if_index[VLIB_RX];
1582
Florin Coras20a14b92017-08-15 22:47:22 -07001583 /* Treat IP frag packets as "experimental" protocol for now
1584 until support of IP frag reassembly is implemented */
1585 proto0 = ip4_is_fragment (ip0) ? 0xfe : ip0->protocol;
1586 proto1 = ip4_is_fragment (ip1) ? 0xfe : ip1->protocol;
1587
1588 if (head_of_feature_arc == 0)
1589 goto skip_checks;
1590
1591 is_udp0 = proto0 == IP_PROTOCOL_UDP;
1592 is_udp1 = proto1 == IP_PROTOCOL_UDP;
1593 is_tcp_udp0 = is_udp0 || proto0 == IP_PROTOCOL_TCP;
1594 is_tcp_udp1 = is_udp1 || proto1 == IP_PROTOCOL_TCP;
1595
1596 good_tcp_udp0 =
Jakub Grajciar96be8e82017-10-30 14:56:17 +01001597 (p0->flags & VNET_BUFFER_F_L4_CHECKSUM_CORRECT
Jakub Grajciar2eeeb4b2017-11-07 14:39:10 +01001598 || (p0->flags & VNET_BUFFER_F_OFFLOAD_TCP_CKSUM
1599 || p0->flags & VNET_BUFFER_F_OFFLOAD_UDP_CKSUM)) != 0;
Jakub Grajciar96be8e82017-10-30 14:56:17 +01001600 good_tcp_udp1 = (p1->flags & VNET_BUFFER_F_L4_CHECKSUM_CORRECT
Jakub Grajciar2eeeb4b2017-11-07 14:39:10 +01001601 || (p1->flags & VNET_BUFFER_F_OFFLOAD_TCP_CKSUM
1602 || p1->flags &
1603 VNET_BUFFER_F_OFFLOAD_UDP_CKSUM)) != 0;
Florin Coras20a14b92017-08-15 22:47:22 -07001604
1605 if (PREDICT_FALSE (ip4_local_do_l4_check (is_tcp_udp0, p0->flags)
1606 || ip4_local_do_l4_check (is_tcp_udp1,
1607 p1->flags)))
1608 {
1609 if (is_tcp_udp0)
1610 ip4_local_validate_l4 (vm, p0, ip0, is_udp0, &error0,
1611 &good_tcp_udp0);
1612 if (is_tcp_udp1)
1613 ip4_local_validate_l4 (vm, p1, ip1, is_udp1, &error1,
1614 &good_tcp_udp1);
1615 }
1616
1617 ASSERT (IP4_ERROR_TCP_CHECKSUM + 1 == IP4_ERROR_UDP_CHECKSUM);
1618 error0 = (is_tcp_udp0 && !good_tcp_udp0
1619 ? IP4_ERROR_TCP_CHECKSUM + is_udp0 : error0);
1620 error1 = (is_tcp_udp1 && !good_tcp_udp1
1621 ? IP4_ERROR_TCP_CHECKSUM + is_udp1 : error1);
Dave Barach68b0fb02017-02-28 15:15:56 -05001622
1623 fib_index0 = vec_elt (im->fib_index_by_sw_if_index, sw_if_index0);
Neale Ranns32e1c012016-11-22 17:07:28 +00001624 fib_index0 =
1625 (vnet_buffer (p0)->sw_if_index[VLIB_TX] ==
1626 (u32) ~ 0) ? fib_index0 : vnet_buffer (p0)->sw_if_index[VLIB_TX];
Neale Rannscb630ff2016-12-14 13:31:29 +01001627
Dave Barach68b0fb02017-02-28 15:15:56 -05001628 fib_index1 = vec_elt (im->fib_index_by_sw_if_index, sw_if_index1);
Neale Ranns32e1c012016-11-22 17:07:28 +00001629 fib_index1 =
1630 (vnet_buffer (p1)->sw_if_index[VLIB_TX] ==
1631 (u32) ~ 0) ? fib_index1 : vnet_buffer (p1)->sw_if_index[VLIB_TX];
Ed Warnickecb9cada2015-12-08 15:45:58 -07001632
Florin Corascea194d2017-10-02 00:18:51 -07001633 /* TODO maybe move to lookup? */
1634 vnet_buffer (p0)->ip.fib_index = fib_index0;
1635 vnet_buffer (p1)->ip.fib_index = fib_index1;
1636
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001637 mtrie0 = &ip4_fib_get (fib_index0)->mtrie;
1638 mtrie1 = &ip4_fib_get (fib_index1)->mtrie;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001639
Neale Ranns04a75e32017-03-23 06:46:01 -07001640 leaf0 = ip4_fib_mtrie_lookup_step_one (mtrie0, &ip0->src_address);
1641 leaf1 = ip4_fib_mtrie_lookup_step_one (mtrie1, &ip1->src_address);
Florin Coras20a14b92017-08-15 22:47:22 -07001642 leaf0 = ip4_fib_mtrie_lookup_step (mtrie0, leaf0, &ip0->src_address,
1643 2);
1644 leaf1 = ip4_fib_mtrie_lookup_step (mtrie1, leaf1, &ip1->src_address,
1645 2);
1646 leaf0 = ip4_fib_mtrie_lookup_step (mtrie0, leaf0, &ip0->src_address,
1647 3);
1648 leaf1 = ip4_fib_mtrie_lookup_step (mtrie1, leaf1, &ip1->src_address,
1649 3);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001650
Dave Barachd7cb1b52016-12-09 09:52:16 -05001651 vnet_buffer (p0)->ip.adj_index[VLIB_RX] = lbi0 =
1652 ip4_fib_mtrie_leaf_get_adj_index (leaf0);
1653 vnet_buffer (p0)->ip.adj_index[VLIB_TX] = lbi0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001654
Dave Barachd7cb1b52016-12-09 09:52:16 -05001655 vnet_buffer (p1)->ip.adj_index[VLIB_RX] = lbi1 =
1656 ip4_fib_mtrie_leaf_get_adj_index (leaf1);
1657 vnet_buffer (p1)->ip.adj_index[VLIB_TX] = lbi1;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001658
Dave Barachd7cb1b52016-12-09 09:52:16 -05001659 lb0 = load_balance_get (lbi0);
1660 lb1 = load_balance_get (lbi1);
1661 dpo0 = load_balance_get_bucket_i (lb0, 0);
1662 dpo1 = load_balance_get_bucket_i (lb1, 0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001663
Dave Barach75fc8542016-10-11 16:16:02 -04001664 /*
Dave Barachd7cb1b52016-12-09 09:52:16 -05001665 * Must have a route to source otherwise we drop the packet.
1666 * ip4 broadcasts are accepted, e.g. to make dhcp client work
Neale Ranns3ee44042016-10-03 13:05:48 +01001667 *
1668 * The checks are:
1669 * - the source is a recieve => it's from us => bogus, do this
1670 * first since it sets a different error code.
1671 * - uRPF check for any route to source - accept if passes.
1672 * - allow packets destined to the broadcast address from unknown sources
Dave Barachd7cb1b52016-12-09 09:52:16 -05001673 */
Matus Fabian87da4762017-10-04 08:03:56 -07001674 if (p0->flags & VNET_BUFFER_F_IS_NATED)
1675 goto skip_check0;
1676
Neale Ranns3ee44042016-10-03 13:05:48 +01001677 error0 = ((error0 == IP4_ERROR_UNKNOWN_PROTOCOL &&
Dave Barachd7cb1b52016-12-09 09:52:16 -05001678 dpo0->dpoi_type == DPO_RECEIVE) ?
1679 IP4_ERROR_SPOOFED_LOCAL_PACKETS : error0);
1680 error0 = ((error0 == IP4_ERROR_UNKNOWN_PROTOCOL &&
1681 !fib_urpf_check_size (lb0->lb_urpf) &&
Neale Ranns3ee44042016-10-03 13:05:48 +01001682 ip0->dst_address.as_u32 != 0xFFFFFFFF)
Dave Barachd7cb1b52016-12-09 09:52:16 -05001683 ? IP4_ERROR_SRC_LOOKUP_MISS : error0);
Matus Fabian87da4762017-10-04 08:03:56 -07001684
1685 skip_check0:
1686 if (p1->flags & VNET_BUFFER_F_IS_NATED)
1687 goto skip_checks;
1688
Neale Ranns3ee44042016-10-03 13:05:48 +01001689 error1 = ((error1 == IP4_ERROR_UNKNOWN_PROTOCOL &&
Dave Barachd7cb1b52016-12-09 09:52:16 -05001690 dpo1->dpoi_type == DPO_RECEIVE) ?
1691 IP4_ERROR_SPOOFED_LOCAL_PACKETS : error1);
1692 error1 = ((error1 == IP4_ERROR_UNKNOWN_PROTOCOL &&
1693 !fib_urpf_check_size (lb1->lb_urpf) &&
Neale Ranns3ee44042016-10-03 13:05:48 +01001694 ip1->dst_address.as_u32 != 0xFFFFFFFF)
Dave Barachd7cb1b52016-12-09 09:52:16 -05001695 ? IP4_ERROR_SRC_LOOKUP_MISS : error1);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001696
Florin Corasa0b34a72017-03-07 01:20:52 -08001697 skip_checks:
1698
Ed Warnickecb9cada2015-12-08 15:45:58 -07001699 next0 = lm->local_next_by_ip_protocol[proto0];
1700 next1 = lm->local_next_by_ip_protocol[proto1];
1701
Dave Barachd7cb1b52016-12-09 09:52:16 -05001702 next0 =
1703 error0 != IP4_ERROR_UNKNOWN_PROTOCOL ? IP_LOCAL_NEXT_DROP : next0;
1704 next1 =
1705 error1 != IP4_ERROR_UNKNOWN_PROTOCOL ? IP_LOCAL_NEXT_DROP : next1;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001706
1707 p0->error = error0 ? error_node->errors[error0] : 0;
1708 p1->error = error1 ? error_node->errors[error1] : 0;
1709
Dave Barach68b0fb02017-02-28 15:15:56 -05001710 if (head_of_feature_arc)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001711 {
Dave Barach68b0fb02017-02-28 15:15:56 -05001712 if (PREDICT_TRUE (error0 == (u8) IP4_ERROR_UNKNOWN_PROTOCOL))
1713 vnet_feature_arc_start (arc_index, sw_if_index0, &next0, p0);
1714 if (PREDICT_TRUE (error1 == (u8) IP4_ERROR_UNKNOWN_PROTOCOL))
1715 vnet_feature_arc_start (arc_index, sw_if_index1, &next1, p1);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001716 }
Dave Barach68b0fb02017-02-28 15:15:56 -05001717
1718 vlib_validate_buffer_enqueue_x2 (vm, node, next_index, to_next,
1719 n_left_to_next, pi0, pi1,
1720 next0, next1);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001721 }
1722
1723 while (n_left_from > 0 && n_left_to_next > 0)
1724 {
Dave Barachd7cb1b52016-12-09 09:52:16 -05001725 vlib_buffer_t *p0;
1726 ip4_header_t *ip0;
Dave Barachd7cb1b52016-12-09 09:52:16 -05001727 ip4_fib_mtrie_t *mtrie0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001728 ip4_fib_mtrie_leaf_t leaf0;
Florin Coras20a14b92017-08-15 22:47:22 -07001729 u32 pi0, next0, fib_index0, lbi0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001730 u8 error0, is_udp0, is_tcp_udp0, good_tcp_udp0, proto0;
Dave Barachd7cb1b52016-12-09 09:52:16 -05001731 load_balance_t *lb0;
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001732 const dpo_id_t *dpo0;
Dave Barach68b0fb02017-02-28 15:15:56 -05001733 u32 sw_if_index0;
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001734
Ed Warnickecb9cada2015-12-08 15:45:58 -07001735 pi0 = to_next[0] = from[0];
1736 from += 1;
1737 n_left_from -= 1;
1738 to_next += 1;
1739 n_left_to_next -= 1;
Dave Barach75fc8542016-10-11 16:16:02 -04001740
Dave Barach68b0fb02017-02-28 15:15:56 -05001741 next0 = IP_LOCAL_NEXT_DROP;
Florin Coras20a14b92017-08-15 22:47:22 -07001742 error0 = IP4_ERROR_UNKNOWN_PROTOCOL;
Dave Barach68b0fb02017-02-28 15:15:56 -05001743
Ed Warnickecb9cada2015-12-08 15:45:58 -07001744 p0 = vlib_get_buffer (vm, pi0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001745 ip0 = vlib_buffer_get_current (p0);
Damjan Marion072401e2017-07-13 18:53:27 +02001746 vnet_buffer (p0)->l3_hdr_offset = p0->current_data;
Dave Barach68b0fb02017-02-28 15:15:56 -05001747 sw_if_index0 = vnet_buffer (p0)->sw_if_index[VLIB_RX];
1748
John Lo3419d0b2016-06-02 09:28:37 -04001749 /* Treat IP frag packets as "experimental" protocol for now
1750 until support of IP frag reassembly is implemented */
Dave Barachd7cb1b52016-12-09 09:52:16 -05001751 proto0 = ip4_is_fragment (ip0) ? 0xfe : ip0->protocol;
Dave Barach68b0fb02017-02-28 15:15:56 -05001752
Matus Fabian87da4762017-10-04 08:03:56 -07001753 if (head_of_feature_arc == 0 || p0->flags & VNET_BUFFER_F_IS_NATED)
Florin Coras20a14b92017-08-15 22:47:22 -07001754 goto skip_check;
Dave Barach68b0fb02017-02-28 15:15:56 -05001755
Ed Warnickecb9cada2015-12-08 15:45:58 -07001756 is_udp0 = proto0 == IP_PROTOCOL_UDP;
1757 is_tcp_udp0 = is_udp0 || proto0 == IP_PROTOCOL_TCP;
Jakub Grajciar96be8e82017-10-30 14:56:17 +01001758
Florin Coras20a14b92017-08-15 22:47:22 -07001759 good_tcp_udp0 =
Jakub Grajciar96be8e82017-10-30 14:56:17 +01001760 (p0->flags & VNET_BUFFER_F_L4_CHECKSUM_CORRECT
Jakub Grajciar2eeeb4b2017-11-07 14:39:10 +01001761 || (p0->flags & VNET_BUFFER_F_OFFLOAD_TCP_CKSUM
1762 || p0->flags & VNET_BUFFER_F_OFFLOAD_UDP_CKSUM)) != 0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001763
Florin Coras20a14b92017-08-15 22:47:22 -07001764 if (PREDICT_FALSE (ip4_local_do_l4_check (is_tcp_udp0, p0->flags)))
Ed Warnickecb9cada2015-12-08 15:45:58 -07001765 {
Florin Coras20a14b92017-08-15 22:47:22 -07001766 ip4_local_validate_l4 (vm, p0, ip0, is_udp0, &error0,
1767 &good_tcp_udp0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001768 }
1769
Ed Warnickecb9cada2015-12-08 15:45:58 -07001770 ASSERT (IP4_ERROR_TCP_CHECKSUM + 1 == IP4_ERROR_UDP_CHECKSUM);
Dave Barachd7cb1b52016-12-09 09:52:16 -05001771 error0 = (is_tcp_udp0 && !good_tcp_udp0
1772 ? IP4_ERROR_TCP_CHECKSUM + is_udp0 : error0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001773
Florin Coras20a14b92017-08-15 22:47:22 -07001774 fib_index0 = vec_elt (im->fib_index_by_sw_if_index, sw_if_index0);
1775 fib_index0 =
1776 (vnet_buffer (p0)->sw_if_index[VLIB_TX] ==
1777 (u32) ~ 0) ? fib_index0 : vnet_buffer (p0)->sw_if_index[VLIB_TX];
Florin Corascea194d2017-10-02 00:18:51 -07001778 vnet_buffer (p0)->ip.fib_index = fib_index0;
Florin Coras20a14b92017-08-15 22:47:22 -07001779 mtrie0 = &ip4_fib_get (fib_index0)->mtrie;
1780 leaf0 = ip4_fib_mtrie_lookup_step_one (mtrie0, &ip0->src_address);
1781 leaf0 = ip4_fib_mtrie_lookup_step (mtrie0, leaf0, &ip0->src_address,
1782 2);
1783 leaf0 = ip4_fib_mtrie_lookup_step (mtrie0, leaf0, &ip0->src_address,
1784 3);
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001785 lbi0 = ip4_fib_mtrie_leaf_get_adj_index (leaf0);
Dave Barachd7cb1b52016-12-09 09:52:16 -05001786 vnet_buffer (p0)->ip.adj_index[VLIB_TX] = lbi0;
Florin Coras20a14b92017-08-15 22:47:22 -07001787 vnet_buffer (p0)->ip.adj_index[VLIB_RX] = lbi0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001788
Dave Barachd7cb1b52016-12-09 09:52:16 -05001789 lb0 = load_balance_get (lbi0);
1790 dpo0 = load_balance_get_bucket_i (lb0, 0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001791
Neale Ranns3ee44042016-10-03 13:05:48 +01001792 error0 = ((error0 == IP4_ERROR_UNKNOWN_PROTOCOL &&
Dave Barachd7cb1b52016-12-09 09:52:16 -05001793 dpo0->dpoi_type == DPO_RECEIVE) ?
1794 IP4_ERROR_SPOOFED_LOCAL_PACKETS : error0);
1795 error0 = ((error0 == IP4_ERROR_UNKNOWN_PROTOCOL &&
1796 !fib_urpf_check_size (lb0->lb_urpf) &&
Neale Ranns3ee44042016-10-03 13:05:48 +01001797 ip0->dst_address.as_u32 != 0xFFFFFFFF)
Dave Barachd7cb1b52016-12-09 09:52:16 -05001798 ? IP4_ERROR_SRC_LOOKUP_MISS : error0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001799
Dave Barach68b0fb02017-02-28 15:15:56 -05001800 skip_check:
Ed Warnickecb9cada2015-12-08 15:45:58 -07001801 next0 = lm->local_next_by_ip_protocol[proto0];
Dave Barachd7cb1b52016-12-09 09:52:16 -05001802 next0 =
1803 error0 != IP4_ERROR_UNKNOWN_PROTOCOL ? IP_LOCAL_NEXT_DROP : next0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001804
Dave Barachd7cb1b52016-12-09 09:52:16 -05001805 p0->error = error0 ? error_node->errors[error0] : 0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001806
Dave Barach68b0fb02017-02-28 15:15:56 -05001807 if (head_of_feature_arc)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001808 {
Dave Barach68b0fb02017-02-28 15:15:56 -05001809 if (PREDICT_TRUE (error0 == (u8) IP4_ERROR_UNKNOWN_PROTOCOL))
1810 vnet_feature_arc_start (arc_index, sw_if_index0, &next0, p0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001811 }
Dave Barach68b0fb02017-02-28 15:15:56 -05001812
1813 vlib_validate_buffer_enqueue_x1 (vm, node, next_index, to_next,
1814 n_left_to_next, pi0, next0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001815 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07001816 vlib_put_next_frame (vm, node, next_index, n_left_to_next);
1817 }
1818
1819 return frame->n_vectors;
1820}
1821
Dave Barach68b0fb02017-02-28 15:15:56 -05001822static uword
1823ip4_local (vlib_main_t * vm, vlib_node_runtime_t * node, vlib_frame_t * frame)
1824{
1825 return ip4_local_inline (vm, node, frame, 1 /* head of feature arc */ );
1826}
1827
1828/* *INDENT-OFF* */
Neale Ranns32e1c012016-11-22 17:07:28 +00001829VLIB_REGISTER_NODE (ip4_local_node) =
Ed Warnickecb9cada2015-12-08 15:45:58 -07001830{
Dave Barach68b0fb02017-02-28 15:15:56 -05001831 .function = ip4_local,
1832 .name = "ip4-local",
1833 .vector_size = sizeof (u32),
1834 .format_trace = format_ip4_forward_next_trace,
1835 .n_next_nodes = IP_LOCAL_N_NEXT,
1836 .next_nodes =
Dave Barachd7cb1b52016-12-09 09:52:16 -05001837 {
Neale Rannsd91c1db2017-07-31 02:30:50 -07001838 [IP_LOCAL_NEXT_DROP] = "ip4-drop",
1839 [IP_LOCAL_NEXT_PUNT] = "ip4-punt",
Dave Barach68b0fb02017-02-28 15:15:56 -05001840 [IP_LOCAL_NEXT_UDP_LOOKUP] = "ip4-udp-lookup",
Florin Coras20a14b92017-08-15 22:47:22 -07001841 [IP_LOCAL_NEXT_ICMP] = "ip4-icmp-input",
1842 },
Dave Barach68b0fb02017-02-28 15:15:56 -05001843};
1844/* *INDENT-ON* */
Dave Barachd7cb1b52016-12-09 09:52:16 -05001845
1846VLIB_NODE_FUNCTION_MULTIARCH (ip4_local_node, ip4_local);
1847
Dave Barach68b0fb02017-02-28 15:15:56 -05001848static uword
1849ip4_local_end_of_arc (vlib_main_t * vm,
1850 vlib_node_runtime_t * node, vlib_frame_t * frame)
1851{
1852 return ip4_local_inline (vm, node, frame, 0 /* head of feature arc */ );
1853}
1854
1855/* *INDENT-OFF* */
1856VLIB_REGISTER_NODE (ip4_local_end_of_arc_node,static) = {
1857 .function = ip4_local_end_of_arc,
1858 .name = "ip4-local-end-of-arc",
1859 .vector_size = sizeof (u32),
1860
1861 .format_trace = format_ip4_forward_next_trace,
1862 .sibling_of = "ip4-local",
1863};
1864
1865VLIB_NODE_FUNCTION_MULTIARCH (ip4_local_end_of_arc_node, ip4_local_end_of_arc)
1866
1867VNET_FEATURE_INIT (ip4_local_end_of_arc, static) = {
1868 .arc_name = "ip4-local",
1869 .node_name = "ip4-local-end-of-arc",
1870 .runs_before = 0, /* not before any other features */
1871};
1872/* *INDENT-ON* */
1873
Dave Barachd7cb1b52016-12-09 09:52:16 -05001874void
1875ip4_register_protocol (u32 protocol, u32 node_index)
1876{
1877 vlib_main_t *vm = vlib_get_main ();
1878 ip4_main_t *im = &ip4_main;
1879 ip_lookup_main_t *lm = &im->lookup_main;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001880
1881 ASSERT (protocol < ARRAY_LEN (lm->local_next_by_ip_protocol));
Dave Barachd7cb1b52016-12-09 09:52:16 -05001882 lm->local_next_by_ip_protocol[protocol] =
1883 vlib_node_add_next (vm, ip4_local_node.index, node_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001884}
1885
1886static clib_error_t *
1887show_ip_local_command_fn (vlib_main_t * vm,
Dave Barachd7cb1b52016-12-09 09:52:16 -05001888 unformat_input_t * input, vlib_cli_command_t * cmd)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001889{
Dave Barachd7cb1b52016-12-09 09:52:16 -05001890 ip4_main_t *im = &ip4_main;
1891 ip_lookup_main_t *lm = &im->lookup_main;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001892 int i;
1893
1894 vlib_cli_output (vm, "Protocols handled by ip4_local");
Dave Barachd7cb1b52016-12-09 09:52:16 -05001895 for (i = 0; i < ARRAY_LEN (lm->local_next_by_ip_protocol); i++)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001896 {
1897 if (lm->local_next_by_ip_protocol[i] != IP_LOCAL_NEXT_PUNT)
Pierre Pfister1bfd3722017-09-18 11:40:32 +02001898 {
1899 u32 node_index = vlib_get_node (vm,
1900 ip4_local_node.index)->
1901 next_nodes[lm->local_next_by_ip_protocol[i]];
1902 vlib_cli_output (vm, "%d: %U", i, format_vlib_node_name, vm,
1903 node_index);
1904 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07001905 }
1906 return 0;
1907}
1908
1909
1910
/*?
 * Display the set of protocols handled by the local IPv4 stack. Each
 * line shows the IP protocol number followed by the name of the graph
 * node that receives packets of that protocol.
 *
 * @cliexpar
 * Example of how to display local protocol table:
 * @cliexstart{show ip local}
 * Protocols handled by ip4_local
 * 1: ip4-icmp-input
 * 17: ip4-udp-lookup
 * 47: gre4-input
 * @cliexend
?*/
1923/* *INDENT-OFF* */
Dave Barachd7cb1b52016-12-09 09:52:16 -05001924VLIB_CLI_COMMAND (show_ip_local, static) =
1925{
Ed Warnickecb9cada2015-12-08 15:45:58 -07001926 .path = "show ip local",
1927 .function = show_ip_local_command_fn,
Billy McFall0683c9c2016-10-13 08:27:31 -04001928 .short_help = "show ip local",
Ed Warnickecb9cada2015-12-08 15:45:58 -07001929};
Billy McFall0683c9c2016-10-13 08:27:31 -04001930/* *INDENT-ON* */
Ed Warnickecb9cada2015-12-08 15:45:58 -07001931
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001932always_inline uword
1933ip4_arp_inline (vlib_main_t * vm,
1934 vlib_node_runtime_t * node,
Dave Barachd7cb1b52016-12-09 09:52:16 -05001935 vlib_frame_t * frame, int is_glean)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001936{
Dave Barachd7cb1b52016-12-09 09:52:16 -05001937 vnet_main_t *vnm = vnet_get_main ();
1938 ip4_main_t *im = &ip4_main;
1939 ip_lookup_main_t *lm = &im->lookup_main;
1940 u32 *from, *to_next_drop;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001941 uword n_left_from, n_left_to_next_drop, next_index;
1942 static f64 time_last_seed_change = -1e100;
1943 static u32 hash_seeds[3];
Dave Barach75fc8542016-10-11 16:16:02 -04001944 static uword hash_bitmap[256 / BITS (uword)];
Ed Warnickecb9cada2015-12-08 15:45:58 -07001945 f64 time_now;
1946
1947 if (node->flags & VLIB_NODE_FLAG_TRACE)
1948 ip4_forward_next_trace (vm, node, frame, VLIB_TX);
1949
1950 time_now = vlib_time_now (vm);
1951 if (time_now - time_last_seed_change > 1e-3)
1952 {
1953 uword i;
Dave Barachd7cb1b52016-12-09 09:52:16 -05001954 u32 *r = clib_random_buffer_get_data (&vm->random_buffer,
1955 sizeof (hash_seeds));
Ed Warnickecb9cada2015-12-08 15:45:58 -07001956 for (i = 0; i < ARRAY_LEN (hash_seeds); i++)
1957 hash_seeds[i] = r[i];
1958
1959 /* Mark all hash keys as been no-seen before. */
1960 for (i = 0; i < ARRAY_LEN (hash_bitmap); i++)
1961 hash_bitmap[i] = 0;
1962
1963 time_last_seed_change = time_now;
1964 }
1965
1966 from = vlib_frame_vector_args (frame);
1967 n_left_from = frame->n_vectors;
1968 next_index = node->cached_next_index;
1969 if (next_index == IP4_ARP_NEXT_DROP)
Dave Barachd7cb1b52016-12-09 09:52:16 -05001970 next_index = IP4_ARP_N_NEXT; /* point to first interface */
Ed Warnickecb9cada2015-12-08 15:45:58 -07001971
1972 while (n_left_from > 0)
1973 {
1974 vlib_get_next_frame (vm, node, IP4_ARP_NEXT_DROP,
1975 to_next_drop, n_left_to_next_drop);
1976
1977 while (n_left_from > 0 && n_left_to_next_drop > 0)
1978 {
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001979 u32 pi0, adj_index0, a0, b0, c0, m0, sw_if_index0, drop0;
Dave Barachd7cb1b52016-12-09 09:52:16 -05001980 ip_adjacency_t *adj0;
1981 vlib_buffer_t *p0;
1982 ip4_header_t *ip0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001983 uword bm0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001984
1985 pi0 = from[0];
1986
1987 p0 = vlib_get_buffer (vm, pi0);
1988
1989 adj_index0 = vnet_buffer (p0)->ip.adj_index[VLIB_TX];
Neale Ranns107e7d42017-04-11 09:55:19 -07001990 adj0 = adj_get (adj_index0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001991 ip0 = vlib_buffer_get_current (p0);
1992
Ed Warnickecb9cada2015-12-08 15:45:58 -07001993 a0 = hash_seeds[0];
1994 b0 = hash_seeds[1];
1995 c0 = hash_seeds[2];
1996
1997 sw_if_index0 = adj0->rewrite_header.sw_if_index;
1998 vnet_buffer (p0)->sw_if_index[VLIB_TX] = sw_if_index0;
1999
Dave Barachd7cb1b52016-12-09 09:52:16 -05002000 if (is_glean)
2001 {
Neale Ranns948e00f2016-10-20 13:39:34 +01002002 /*
2003 * this is the Glean case, so we are ARPing for the
2004 * packet's destination
2005 */
Dave Barachd7cb1b52016-12-09 09:52:16 -05002006 a0 ^= ip0->dst_address.data_u32;
2007 }
2008 else
2009 {
2010 a0 ^= adj0->sub_type.nbr.next_hop.ip4.data_u32;
2011 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07002012 b0 ^= sw_if_index0;
2013
Florin Coras2d3dbc42017-09-08 16:22:38 -04002014 hash_v3_mix32 (a0, b0, c0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07002015 hash_v3_finalize32 (a0, b0, c0);
2016
2017 c0 &= BITS (hash_bitmap) - 1;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002018 m0 = (uword) 1 << (c0 % BITS (uword));
Florin Coras2d3dbc42017-09-08 16:22:38 -04002019 c0 = c0 / BITS (uword);
Ed Warnickecb9cada2015-12-08 15:45:58 -07002020
2021 bm0 = hash_bitmap[c0];
2022 drop0 = (bm0 & m0) != 0;
2023
2024 /* Mark it as seen. */
2025 hash_bitmap[c0] = bm0 | m0;
2026
2027 from += 1;
2028 n_left_from -= 1;
2029 to_next_drop[0] = pi0;
2030 to_next_drop += 1;
2031 n_left_to_next_drop -= 1;
2032
Dave Barachd7cb1b52016-12-09 09:52:16 -05002033 p0->error =
2034 node->errors[drop0 ? IP4_ARP_ERROR_DROP :
2035 IP4_ARP_ERROR_REQUEST_SENT];
Ed Warnickecb9cada2015-12-08 15:45:58 -07002036
Neale Rannsb80c5362016-10-08 13:03:40 +01002037 /*
2038 * the adj has been updated to a rewrite but the node the DPO that got
2039 * us here hasn't - yet. no big deal. we'll drop while we wait.
2040 */
2041 if (IP_LOOKUP_NEXT_REWRITE == adj0->lookup_next_index)
2042 continue;
2043
Ed Warnickecb9cada2015-12-08 15:45:58 -07002044 if (drop0)
2045 continue;
2046
Dave Barachd7cb1b52016-12-09 09:52:16 -05002047 /*
2048 * Can happen if the control-plane is programming tables
2049 * with traffic flowing; at least that's today's lame excuse.
2050 */
Neale Ranns32e1c012016-11-22 17:07:28 +00002051 if ((is_glean && adj0->lookup_next_index != IP_LOOKUP_NEXT_GLEAN)
2052 || (!is_glean && adj0->lookup_next_index != IP_LOOKUP_NEXT_ARP))
Neale Ranns0bfe5d82016-08-25 15:29:12 +01002053 {
Dave Barachd7cb1b52016-12-09 09:52:16 -05002054 p0->error = node->errors[IP4_ARP_ERROR_NON_ARP_ADJ];
Neale Ranns0bfe5d82016-08-25 15:29:12 +01002055 }
Dave Barachd7cb1b52016-12-09 09:52:16 -05002056 else
2057 /* Send ARP request. */
Neale Ranns0bfe5d82016-08-25 15:29:12 +01002058 {
Dave Barachd7cb1b52016-12-09 09:52:16 -05002059 u32 bi0 = 0;
2060 vlib_buffer_t *b0;
2061 ethernet_arp_header_t *h0;
2062 vnet_hw_interface_t *hw_if0;
2063
2064 h0 =
2065 vlib_packet_template_get_packet (vm,
2066 &im->ip4_arp_request_packet_template,
2067 &bi0);
2068
Florin Corasd172a622017-10-14 11:02:37 -07002069 /* Seems we're out of buffers */
2070 if (PREDICT_FALSE (!h0))
2071 continue;
2072
Dave Barachd7cb1b52016-12-09 09:52:16 -05002073 /* Add rewrite/encap string for ARP packet. */
2074 vnet_rewrite_one_header (adj0[0], h0,
2075 sizeof (ethernet_header_t));
2076
2077 hw_if0 = vnet_get_sup_hw_interface (vnm, sw_if_index0);
2078
2079 /* Src ethernet address in ARP header. */
2080 clib_memcpy (h0->ip4_over_ethernet[0].ethernet,
2081 hw_if0->hw_address,
2082 sizeof (h0->ip4_over_ethernet[0].ethernet));
2083
2084 if (is_glean)
Neale Ranns0bfe5d82016-08-25 15:29:12 +01002085 {
Dave Barachd7cb1b52016-12-09 09:52:16 -05002086 /* The interface's source address is stashed in the Glean Adj */
2087 h0->ip4_over_ethernet[0].ip4 =
2088 adj0->sub_type.glean.receive_addr.ip4;
2089
2090 /* Copy in destination address we are requesting. This is the
2091 * glean case, so it's the packet's destination.*/
2092 h0->ip4_over_ethernet[1].ip4.data_u32 =
2093 ip0->dst_address.data_u32;
2094 }
2095 else
2096 {
2097 /* Src IP address in ARP header. */
2098 if (ip4_src_address_for_packet (lm, sw_if_index0,
2099 &h0->
2100 ip4_over_ethernet[0].ip4))
2101 {
2102 /* No source address available */
2103 p0->error =
2104 node->errors[IP4_ARP_ERROR_NO_SOURCE_ADDRESS];
2105 vlib_buffer_free (vm, &bi0, 1);
2106 continue;
2107 }
2108
2109 /* Copy in destination address we are requesting from the
2110 incomplete adj */
2111 h0->ip4_over_ethernet[1].ip4.data_u32 =
2112 adj0->sub_type.nbr.next_hop.ip4.as_u32;
Neale Ranns0bfe5d82016-08-25 15:29:12 +01002113 }
2114
Dave Barachd7cb1b52016-12-09 09:52:16 -05002115 vlib_buffer_copy_trace_flag (vm, p0, bi0);
2116 b0 = vlib_get_buffer (vm, bi0);
Florin Coras2f9b0c02017-09-11 20:54:15 -04002117 VLIB_BUFFER_TRACE_TRAJECTORY_INIT (b0);
Dave Barachd7cb1b52016-12-09 09:52:16 -05002118 vnet_buffer (b0)->sw_if_index[VLIB_TX] = sw_if_index0;
2119
2120 vlib_buffer_advance (b0, -adj0->rewrite_header.data_bytes);
2121
2122 vlib_set_next_frame_buffer (vm, node,
2123 adj0->rewrite_header.next_index,
2124 bi0);
Neale Ranns0bfe5d82016-08-25 15:29:12 +01002125 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07002126 }
2127
2128 vlib_put_next_frame (vm, node, IP4_ARP_NEXT_DROP, n_left_to_next_drop);
2129 }
2130
2131 return frame->n_vectors;
2132}
2133
Neale Ranns0bfe5d82016-08-25 15:29:12 +01002134static uword
Dave Barachd7cb1b52016-12-09 09:52:16 -05002135ip4_arp (vlib_main_t * vm, vlib_node_runtime_t * node, vlib_frame_t * frame)
Neale Ranns0bfe5d82016-08-25 15:29:12 +01002136{
Dave Barachd7cb1b52016-12-09 09:52:16 -05002137 return (ip4_arp_inline (vm, node, frame, 0));
Neale Ranns0bfe5d82016-08-25 15:29:12 +01002138}
2139
2140static uword
Dave Barachd7cb1b52016-12-09 09:52:16 -05002141ip4_glean (vlib_main_t * vm, vlib_node_runtime_t * node, vlib_frame_t * frame)
Neale Ranns0bfe5d82016-08-25 15:29:12 +01002142{
Dave Barachd7cb1b52016-12-09 09:52:16 -05002143 return (ip4_arp_inline (vm, node, frame, 1));
Neale Ranns0bfe5d82016-08-25 15:29:12 +01002144}
2145
Dave Barachd7cb1b52016-12-09 09:52:16 -05002146static char *ip4_arp_error_strings[] = {
Ed Warnickecb9cada2015-12-08 15:45:58 -07002147 [IP4_ARP_ERROR_DROP] = "address overflow drops",
2148 [IP4_ARP_ERROR_REQUEST_SENT] = "ARP requests sent",
2149 [IP4_ARP_ERROR_NON_ARP_ADJ] = "ARPs to non-ARP adjacencies",
2150 [IP4_ARP_ERROR_REPLICATE_DROP] = "ARP replication completed",
2151 [IP4_ARP_ERROR_REPLICATE_FAIL] = "ARP replication failed",
Pierre Pfisterd076f192016-06-22 12:58:30 +01002152 [IP4_ARP_ERROR_NO_SOURCE_ADDRESS] = "no source address for ARP request",
Ed Warnickecb9cada2015-12-08 15:45:58 -07002153};
2154
Neale Rannsf8686322017-11-29 02:39:53 -08002155/* *INDENT-OFF* */
Dave Barachd7cb1b52016-12-09 09:52:16 -05002156VLIB_REGISTER_NODE (ip4_arp_node) =
2157{
Neale Rannsf8686322017-11-29 02:39:53 -08002158 .function = ip4_arp,
2159 .name = "ip4-arp",
2160 .vector_size = sizeof (u32),
2161 .format_trace = format_ip4_forward_next_trace,
2162 .n_errors = ARRAY_LEN (ip4_arp_error_strings),
2163 .error_strings = ip4_arp_error_strings,
2164 .n_next_nodes = IP4_ARP_N_NEXT,
2165 .next_nodes =
Dave Barachd7cb1b52016-12-09 09:52:16 -05002166 {
Neale Rannsf8686322017-11-29 02:39:53 -08002167 [IP4_ARP_NEXT_DROP] = "error-drop",
2168 },
2169};
Ed Warnickecb9cada2015-12-08 15:45:58 -07002170
Dave Barachd7cb1b52016-12-09 09:52:16 -05002171VLIB_REGISTER_NODE (ip4_glean_node) =
2172{
Neale Rannsf8686322017-11-29 02:39:53 -08002173 .function = ip4_glean,
2174 .name = "ip4-glean",
2175 .vector_size = sizeof (u32),
2176 .format_trace = format_ip4_forward_next_trace,
2177 .n_errors = ARRAY_LEN (ip4_arp_error_strings),
2178 .error_strings = ip4_arp_error_strings,
2179 .n_next_nodes = IP4_ARP_N_NEXT,
2180 .next_nodes = {
2181 [IP4_ARP_NEXT_DROP] = "error-drop",
2182 },
2183};
2184/* *INDENT-ON* */
Neale Ranns0bfe5d82016-08-25 15:29:12 +01002185
Ed Warnickecb9cada2015-12-08 15:45:58 -07002186#define foreach_notrace_ip4_arp_error \
2187_(DROP) \
2188_(REQUEST_SENT) \
2189_(REPLICATE_DROP) \
2190_(REPLICATE_FAIL)
2191
Dave Barachd7cb1b52016-12-09 09:52:16 -05002192clib_error_t *
2193arp_notrace_init (vlib_main_t * vm)
Ed Warnickecb9cada2015-12-08 15:45:58 -07002194{
Dave Barachd7cb1b52016-12-09 09:52:16 -05002195 vlib_node_runtime_t *rt = vlib_node_get_runtime (vm, ip4_arp_node.index);
Ed Warnickecb9cada2015-12-08 15:45:58 -07002196
2197 /* don't trace ARP request packets */
2198#define _(a) \
2199 vnet_pcap_drop_trace_filter_add_del \
2200 (rt->errors[IP4_ARP_ERROR_##a], \
2201 1 /* is_add */);
Dave Barachd7cb1b52016-12-09 09:52:16 -05002202 foreach_notrace_ip4_arp_error;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002203#undef _
2204 return 0;
2205}
2206
Dave Barachd7cb1b52016-12-09 09:52:16 -05002207VLIB_INIT_FUNCTION (arp_notrace_init);
Ed Warnickecb9cada2015-12-08 15:45:58 -07002208
2209
2210/* Send an ARP request to see if given destination is reachable on given interface. */
2211clib_error_t *
2212ip4_probe_neighbor (vlib_main_t * vm, ip4_address_t * dst, u32 sw_if_index)
2213{
Dave Barachd7cb1b52016-12-09 09:52:16 -05002214 vnet_main_t *vnm = vnet_get_main ();
2215 ip4_main_t *im = &ip4_main;
2216 ethernet_arp_header_t *h;
2217 ip4_address_t *src;
2218 ip_interface_address_t *ia;
2219 ip_adjacency_t *adj;
2220 vnet_hw_interface_t *hi;
2221 vnet_sw_interface_t *si;
2222 vlib_buffer_t *b;
Neale Ranns7a272742017-05-30 02:08:14 -07002223 adj_index_t ai;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002224 u32 bi = 0;
2225
2226 si = vnet_get_sw_interface (vnm, sw_if_index);
2227
2228 if (!(si->flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP))
2229 {
2230 return clib_error_return (0, "%U: interface %U down",
Dave Barachd7cb1b52016-12-09 09:52:16 -05002231 format_ip4_address, dst,
2232 format_vnet_sw_if_index_name, vnm,
2233 sw_if_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -07002234 }
2235
Dave Barachd7cb1b52016-12-09 09:52:16 -05002236 src =
2237 ip4_interface_address_matching_destination (im, dst, sw_if_index, &ia);
2238 if (!src)
Ed Warnickecb9cada2015-12-08 15:45:58 -07002239 {
2240 vnm->api_errno = VNET_API_ERROR_NO_MATCHING_INTERFACE;
Dave Barach75fc8542016-10-11 16:16:02 -04002241 return clib_error_return
Neale Ranns32e1c012016-11-22 17:07:28 +00002242 (0,
2243 "no matching interface address for destination %U (interface %U)",
2244 format_ip4_address, dst, format_vnet_sw_if_index_name, vnm,
2245 sw_if_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -07002246 }
2247
Neale Ranns7a272742017-05-30 02:08:14 -07002248 h = vlib_packet_template_get_packet (vm,
2249 &im->ip4_arp_request_packet_template,
2250 &bi);
Ed Warnickecb9cada2015-12-08 15:45:58 -07002251
2252 hi = vnet_get_sup_hw_interface (vnm, sw_if_index);
Pavel Kotucek57808982017-08-02 08:20:19 +02002253 if (PREDICT_FALSE (!hi->hw_address))
2254 {
2255 return clib_error_return (0, "%U: interface %U do not support ip probe",
2256 format_ip4_address, dst,
2257 format_vnet_sw_if_index_name, vnm,
2258 sw_if_index);
2259 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07002260
Dave Barachd7cb1b52016-12-09 09:52:16 -05002261 clib_memcpy (h->ip4_over_ethernet[0].ethernet, hi->hw_address,
2262 sizeof (h->ip4_over_ethernet[0].ethernet));
Ed Warnickecb9cada2015-12-08 15:45:58 -07002263
2264 h->ip4_over_ethernet[0].ip4 = src[0];
2265 h->ip4_over_ethernet[1].ip4 = dst[0];
2266
2267 b = vlib_get_buffer (vm, bi);
Dave Barachd7cb1b52016-12-09 09:52:16 -05002268 vnet_buffer (b)->sw_if_index[VLIB_RX] =
2269 vnet_buffer (b)->sw_if_index[VLIB_TX] = sw_if_index;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002270
Dave Barach59b25652017-09-10 15:04:27 -04002271 ip46_address_t nh = {
2272 .ip4 = *dst,
2273 };
2274
2275 ai = adj_nbr_add_or_lock (FIB_PROTOCOL_IP4,
2276 VNET_LINK_IP4, &nh, sw_if_index);
2277 adj = adj_get (ai);
2278
2279 /* Peer has been previously resolved, retrieve glean adj instead */
2280 if (adj->lookup_next_index == IP_LOOKUP_NEXT_REWRITE)
2281 {
2282 adj_unlock (ai);
2283 ai = adj_glean_add_or_lock (FIB_PROTOCOL_IP4, sw_if_index, &nh);
2284 adj = adj_get (ai);
2285 }
2286
Ed Warnickecb9cada2015-12-08 15:45:58 -07002287 /* Add encapsulation string for software interface (e.g. ethernet header). */
2288 vnet_rewrite_one_header (adj[0], h, sizeof (ethernet_header_t));
2289 vlib_buffer_advance (b, -adj->rewrite_header.data_bytes);
2290
2291 {
Dave Barachd7cb1b52016-12-09 09:52:16 -05002292 vlib_frame_t *f = vlib_get_frame_to_node (vm, hi->output_node_index);
2293 u32 *to_next = vlib_frame_vector_args (f);
Ed Warnickecb9cada2015-12-08 15:45:58 -07002294 to_next[0] = bi;
2295 f->n_vectors = 1;
2296 vlib_put_frame_to_node (vm, hi->output_node_index, f);
2297 }
2298
Neale Ranns7a272742017-05-30 02:08:14 -07002299 adj_unlock (ai);
Ed Warnickecb9cada2015-12-08 15:45:58 -07002300 return /* no error */ 0;
2301}
2302
/* Static next indices used by the ip4 rewrite worker (ip4_rewrite_inline). */
typedef enum
{
  /* Initial next for every packet; kept when an error is detected. */
  IP4_REWRITE_NEXT_DROP = 0,
  /* Chosen when the TTL expires so that an ICMP error can be generated. */
  IP4_REWRITE_NEXT_ICMP_ERROR,
} ip4_rewrite_next_t;
2308
2309always_inline uword
2310ip4_rewrite_inline (vlib_main_t * vm,
2311 vlib_node_runtime_t * node,
Neale Ranns9c6a6132017-02-21 05:33:14 -08002312 vlib_frame_t * frame,
2313 int do_counters, int is_midchain, int is_mcast)
Ed Warnickecb9cada2015-12-08 15:45:58 -07002314{
Dave Barachd7cb1b52016-12-09 09:52:16 -05002315 ip_lookup_main_t *lm = &ip4_main.lookup_main;
2316 u32 *from = vlib_frame_vector_args (frame);
2317 u32 n_left_from, n_left_to_next, *to_next, next_index;
2318 vlib_node_runtime_t *error_node =
2319 vlib_node_get_runtime (vm, ip4_input_node.index);
Ed Warnickecb9cada2015-12-08 15:45:58 -07002320
2321 n_left_from = frame->n_vectors;
2322 next_index = node->cached_next_index;
Damjan Marion586afd72017-04-05 19:18:20 +02002323 u32 thread_index = vlib_get_thread_index ();
Dave Barach75fc8542016-10-11 16:16:02 -04002324
Ed Warnickecb9cada2015-12-08 15:45:58 -07002325 while (n_left_from > 0)
2326 {
2327 vlib_get_next_frame (vm, node, next_index, to_next, n_left_to_next);
2328
2329 while (n_left_from >= 4 && n_left_to_next >= 2)
2330 {
Dave Barachd7cb1b52016-12-09 09:52:16 -05002331 ip_adjacency_t *adj0, *adj1;
2332 vlib_buffer_t *p0, *p1;
2333 ip4_header_t *ip0, *ip1;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002334 u32 pi0, rw_len0, next0, error0, checksum0, adj_index0;
2335 u32 pi1, rw_len1, next1, error1, checksum1, adj_index1;
Dave Barachd7cb1b52016-12-09 09:52:16 -05002336 u32 tx_sw_if_index0, tx_sw_if_index1;
Neale Ranns0bfe5d82016-08-25 15:29:12 +01002337
Ed Warnickecb9cada2015-12-08 15:45:58 -07002338 /* Prefetch next iteration. */
2339 {
Dave Barachd7cb1b52016-12-09 09:52:16 -05002340 vlib_buffer_t *p2, *p3;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002341
2342 p2 = vlib_get_buffer (vm, from[2]);
2343 p3 = vlib_get_buffer (vm, from[3]);
2344
2345 vlib_prefetch_buffer_header (p2, STORE);
2346 vlib_prefetch_buffer_header (p3, STORE);
2347
2348 CLIB_PREFETCH (p2->data, sizeof (ip0[0]), STORE);
2349 CLIB_PREFETCH (p3->data, sizeof (ip0[0]), STORE);
2350 }
2351
2352 pi0 = to_next[0] = from[0];
2353 pi1 = to_next[1] = from[1];
2354
2355 from += 2;
2356 n_left_from -= 2;
2357 to_next += 2;
2358 n_left_to_next -= 2;
Dave Barach75fc8542016-10-11 16:16:02 -04002359
Ed Warnickecb9cada2015-12-08 15:45:58 -07002360 p0 = vlib_get_buffer (vm, pi0);
2361 p1 = vlib_get_buffer (vm, pi1);
2362
Neale Rannsf06aea52016-11-29 06:51:37 -08002363 adj_index0 = vnet_buffer (p0)->ip.adj_index[VLIB_TX];
2364 adj_index1 = vnet_buffer (p1)->ip.adj_index[VLIB_TX];
Ed Warnickecb9cada2015-12-08 15:45:58 -07002365
Neale Ranns1bd01092017-03-15 15:41:17 -04002366 /*
2367 * pre-fetch the per-adjacency counters
2368 */
2369 if (do_counters)
2370 {
2371 vlib_prefetch_combined_counter (&adjacency_counters,
Damjan Marion586afd72017-04-05 19:18:20 +02002372 thread_index, adj_index0);
Neale Ranns1bd01092017-03-15 15:41:17 -04002373 vlib_prefetch_combined_counter (&adjacency_counters,
Damjan Marion586afd72017-04-05 19:18:20 +02002374 thread_index, adj_index1);
Neale Ranns1bd01092017-03-15 15:41:17 -04002375 }
2376
Ed Warnickecb9cada2015-12-08 15:45:58 -07002377 ip0 = vlib_buffer_get_current (p0);
2378 ip1 = vlib_buffer_get_current (p1);
2379
2380 error0 = error1 = IP4_ERROR_NONE;
Dave Barachd7cb1b52016-12-09 09:52:16 -05002381 next0 = next1 = IP4_REWRITE_NEXT_DROP;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002382
2383 /* Decrement TTL & update checksum.
2384 Works either endian, so no need for byte swap. */
Damjan Marion213b5aa2017-07-13 21:19:27 +02002385 if (PREDICT_TRUE (!(p0->flags & VNET_BUFFER_F_LOCALLY_ORIGINATED)))
Ed Warnickecb9cada2015-12-08 15:45:58 -07002386 {
Dave Barachd7cb1b52016-12-09 09:52:16 -05002387 i32 ttl0 = ip0->ttl;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002388
2389 /* Input node should have reject packets with ttl 0. */
2390 ASSERT (ip0->ttl > 0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07002391
2392 checksum0 = ip0->checksum + clib_host_to_net_u16 (0x0100);
Ed Warnickecb9cada2015-12-08 15:45:58 -07002393 checksum0 += checksum0 >= 0xffff;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002394
2395 ip0->checksum = checksum0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002396 ttl0 -= 1;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002397 ip0->ttl = ttl0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002398
Dave Barachd7cb1b52016-12-09 09:52:16 -05002399 /*
2400 * If the ttl drops below 1 when forwarding, generate
2401 * an ICMP response.
2402 */
2403 if (PREDICT_FALSE (ttl0 <= 0))
2404 {
2405 error0 = IP4_ERROR_TIME_EXPIRED;
2406 vnet_buffer (p0)->sw_if_index[VLIB_TX] = (u32) ~ 0;
2407 icmp4_error_set_vnet_buffer (p0, ICMP4_time_exceeded,
2408 ICMP4_time_exceeded_ttl_exceeded_in_transit,
2409 0);
2410 next0 = IP4_REWRITE_NEXT_ICMP_ERROR;
2411 }
Neale Rannsf06aea52016-11-29 06:51:37 -08002412
2413 /* Verify checksum. */
Dave Barach2c0a4f42017-06-29 09:30:15 -04002414 ASSERT ((ip0->checksum == ip4_header_checksum (ip0)) ||
Damjan Marionfb3288f2017-07-19 15:07:10 +02002415 (p0->flags & VNET_BUFFER_F_OFFLOAD_IP_CKSUM));
Neale Rannsf06aea52016-11-29 06:51:37 -08002416 }
Dave Barachd7cb1b52016-12-09 09:52:16 -05002417 else
2418 {
Damjan Marion213b5aa2017-07-13 21:19:27 +02002419 p0->flags &= ~VNET_BUFFER_F_LOCALLY_ORIGINATED;
Dave Barachd7cb1b52016-12-09 09:52:16 -05002420 }
Damjan Marion213b5aa2017-07-13 21:19:27 +02002421 if (PREDICT_TRUE (!(p1->flags & VNET_BUFFER_F_LOCALLY_ORIGINATED)))
Neale Rannsf06aea52016-11-29 06:51:37 -08002422 {
2423 i32 ttl1 = ip1->ttl;
2424
2425 /* Input node should have reject packets with ttl 0. */
2426 ASSERT (ip1->ttl > 0);
2427
2428 checksum1 = ip1->checksum + clib_host_to_net_u16 (0x0100);
2429 checksum1 += checksum1 >= 0xffff;
2430
2431 ip1->checksum = checksum1;
2432 ttl1 -= 1;
2433 ip1->ttl = ttl1;
2434
Dave Barachd7cb1b52016-12-09 09:52:16 -05002435 /*
2436 * If the ttl drops below 1 when forwarding, generate
2437 * an ICMP response.
2438 */
2439 if (PREDICT_FALSE (ttl1 <= 0))
2440 {
2441 error1 = IP4_ERROR_TIME_EXPIRED;
2442 vnet_buffer (p1)->sw_if_index[VLIB_TX] = (u32) ~ 0;
2443 icmp4_error_set_vnet_buffer (p1, ICMP4_time_exceeded,
2444 ICMP4_time_exceeded_ttl_exceeded_in_transit,
2445 0);
2446 next1 = IP4_REWRITE_NEXT_ICMP_ERROR;
2447 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07002448
2449 /* Verify checksum. */
Dave Barach2c0a4f42017-06-29 09:30:15 -04002450 ASSERT ((ip1->checksum == ip4_header_checksum (ip1)) ||
Damjan Marionfb3288f2017-07-19 15:07:10 +02002451 (p1->flags & VNET_BUFFER_F_OFFLOAD_IP_CKSUM));
Ed Warnickecb9cada2015-12-08 15:45:58 -07002452 }
Dave Barachd7cb1b52016-12-09 09:52:16 -05002453 else
2454 {
Damjan Marion213b5aa2017-07-13 21:19:27 +02002455 p1->flags &= ~VNET_BUFFER_F_LOCALLY_ORIGINATED;
Dave Barachd7cb1b52016-12-09 09:52:16 -05002456 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07002457
2458 /* Rewrite packet header and updates lengths. */
Neale Ranns107e7d42017-04-11 09:55:19 -07002459 adj0 = adj_get (adj_index0);
2460 adj1 = adj_get (adj_index1);
Dave Barach75fc8542016-10-11 16:16:02 -04002461
Dave Barachd7cb1b52016-12-09 09:52:16 -05002462 /* Worth pipelining. No guarantee that adj0,1 are hot... */
Ed Warnickecb9cada2015-12-08 15:45:58 -07002463 rw_len0 = adj0[0].rewrite_header.data_bytes;
2464 rw_len1 = adj1[0].rewrite_header.data_bytes;
Dave Barachd7cb1b52016-12-09 09:52:16 -05002465 vnet_buffer (p0)->ip.save_rewrite_length = rw_len0;
2466 vnet_buffer (p1)->ip.save_rewrite_length = rw_len1;
Chris Lukef2868fc2016-06-14 16:26:22 -04002467
Dave Barachd7cb1b52016-12-09 09:52:16 -05002468 /* Check MTU of outgoing interface. */
2469 error0 =
2470 (vlib_buffer_length_in_chain (vm, p0) >
2471 adj0[0].
2472 rewrite_header.max_l3_packet_bytes ? IP4_ERROR_MTU_EXCEEDED :
2473 error0);
2474 error1 =
2475 (vlib_buffer_length_in_chain (vm, p1) >
2476 adj1[0].
2477 rewrite_header.max_l3_packet_bytes ? IP4_ERROR_MTU_EXCEEDED :
2478 error1);
Chris Lukef2868fc2016-06-14 16:26:22 -04002479
Neale Rannscf3561b2017-12-13 01:44:25 -08002480 if (is_mcast)
2481 {
2482 error0 = ((adj0[0].rewrite_header.sw_if_index ==
2483 vnet_buffer (p0)->sw_if_index[VLIB_RX]) ?
2484 IP4_ERROR_SAME_INTERFACE : error0);
2485 error1 = ((adj1[0].rewrite_header.sw_if_index ==
2486 vnet_buffer (p1)->sw_if_index[VLIB_RX]) ?
2487 IP4_ERROR_SAME_INTERFACE : error1);
2488 }
2489
Dave Barachd7cb1b52016-12-09 09:52:16 -05002490 /* Don't adjust the buffer for ttl issue; icmp-error node wants
2491 * to see the IP headerr */
2492 if (PREDICT_TRUE (error0 == IP4_ERROR_NONE))
2493 {
Damjan Marion892e0762016-12-09 18:52:05 +01002494 next0 = adj0[0].rewrite_header.next_index;
Dave Barachd7cb1b52016-12-09 09:52:16 -05002495 p0->current_data -= rw_len0;
2496 p0->current_length += rw_len0;
2497 tx_sw_if_index0 = adj0[0].rewrite_header.sw_if_index;
2498 vnet_buffer (p0)->sw_if_index[VLIB_TX] = tx_sw_if_index0;
Dave Barach5331c722016-08-17 11:54:30 -04002499
Neale Rannsb069a692017-03-15 12:34:25 -04002500 if (PREDICT_FALSE
2501 (adj0[0].rewrite_header.flags & VNET_REWRITE_HAS_FEATURES))
2502 vnet_feature_arc_start (lm->output_feature_arc_index,
2503 tx_sw_if_index0, &next0, p0);
Dave Barachd7cb1b52016-12-09 09:52:16 -05002504 }
2505 if (PREDICT_TRUE (error1 == IP4_ERROR_NONE))
2506 {
Damjan Marion892e0762016-12-09 18:52:05 +01002507 next1 = adj1[0].rewrite_header.next_index;
Dave Barachd7cb1b52016-12-09 09:52:16 -05002508 p1->current_data -= rw_len1;
2509 p1->current_length += rw_len1;
Dave Barach5331c722016-08-17 11:54:30 -04002510
Dave Barachd7cb1b52016-12-09 09:52:16 -05002511 tx_sw_if_index1 = adj1[0].rewrite_header.sw_if_index;
2512 vnet_buffer (p1)->sw_if_index[VLIB_TX] = tx_sw_if_index1;
Dave Barach5331c722016-08-17 11:54:30 -04002513
Neale Rannsb069a692017-03-15 12:34:25 -04002514 if (PREDICT_FALSE
2515 (adj1[0].rewrite_header.flags & VNET_REWRITE_HAS_FEATURES))
2516 vnet_feature_arc_start (lm->output_feature_arc_index,
2517 tx_sw_if_index1, &next1, p1);
Dave Barachd7cb1b52016-12-09 09:52:16 -05002518 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07002519
2520 /* Guess we are only writing on simple Ethernet header. */
2521 vnet_rewrite_two_headers (adj0[0], adj1[0],
Dave Barachd7cb1b52016-12-09 09:52:16 -05002522 ip0, ip1, sizeof (ethernet_header_t));
Neale Ranns5e575b12016-10-03 09:40:25 +01002523
Neale Ranns044183f2017-01-24 01:34:25 -08002524 /*
2525 * Bump the per-adjacency counters
2526 */
Neale Ranns9c6a6132017-02-21 05:33:14 -08002527 if (do_counters)
2528 {
2529 vlib_increment_combined_counter
2530 (&adjacency_counters,
Damjan Marion586afd72017-04-05 19:18:20 +02002531 thread_index,
Neale Ranns9c6a6132017-02-21 05:33:14 -08002532 adj_index0, 1,
2533 vlib_buffer_length_in_chain (vm, p0) + rw_len0);
Neale Ranns044183f2017-01-24 01:34:25 -08002534
Neale Ranns9c6a6132017-02-21 05:33:14 -08002535 vlib_increment_combined_counter
2536 (&adjacency_counters,
Damjan Marion586afd72017-04-05 19:18:20 +02002537 thread_index,
Neale Ranns9c6a6132017-02-21 05:33:14 -08002538 adj_index1, 1,
2539 vlib_buffer_length_in_chain (vm, p1) + rw_len1);
2540 }
Neale Ranns044183f2017-01-24 01:34:25 -08002541
Neale Ranns5e575b12016-10-03 09:40:25 +01002542 if (is_midchain)
Dave Barachd7cb1b52016-12-09 09:52:16 -05002543 {
Neale Rannsdb14f5a2018-01-29 10:43:33 -08002544 adj0->sub_type.midchain.fixup_func
2545 (vm, adj0, p0, adj0->sub_type.midchain.fixup_data);
2546 adj1->sub_type.midchain.fixup_func
2547 (vm, adj1, p1, adj0->sub_type.midchain.fixup_data);
Dave Barachd7cb1b52016-12-09 09:52:16 -05002548 }
Neale Ranns32e1c012016-11-22 17:07:28 +00002549 if (is_mcast)
2550 {
2551 /*
2552 * copy bytes from the IP address into the MAC rewrite
2553 */
Neale Ranns2e7fbcc2017-03-15 04:22:25 -07002554 vnet_fixup_one_header (adj0[0], &ip0->dst_address, ip0);
2555 vnet_fixup_one_header (adj1[0], &ip1->dst_address, ip1);
Neale Ranns32e1c012016-11-22 17:07:28 +00002556 }
Dave Barach75fc8542016-10-11 16:16:02 -04002557
Ed Warnickecb9cada2015-12-08 15:45:58 -07002558 vlib_validate_buffer_enqueue_x2 (vm, node, next_index,
2559 to_next, n_left_to_next,
2560 pi0, pi1, next0, next1);
2561 }
2562
2563 while (n_left_from > 0 && n_left_to_next > 0)
2564 {
Dave Barachd7cb1b52016-12-09 09:52:16 -05002565 ip_adjacency_t *adj0;
2566 vlib_buffer_t *p0;
2567 ip4_header_t *ip0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002568 u32 pi0, rw_len0, adj_index0, next0, error0, checksum0;
Dave Barachd7cb1b52016-12-09 09:52:16 -05002569 u32 tx_sw_if_index0;
Neale Ranns0bfe5d82016-08-25 15:29:12 +01002570
Ed Warnickecb9cada2015-12-08 15:45:58 -07002571 pi0 = to_next[0] = from[0];
2572
2573 p0 = vlib_get_buffer (vm, pi0);
2574
Neale Rannsf06aea52016-11-29 06:51:37 -08002575 adj_index0 = vnet_buffer (p0)->ip.adj_index[VLIB_TX];
Ed Warnickecb9cada2015-12-08 15:45:58 -07002576
Neale Ranns107e7d42017-04-11 09:55:19 -07002577 adj0 = adj_get (adj_index0);
Dave Barach75fc8542016-10-11 16:16:02 -04002578
Ed Warnickecb9cada2015-12-08 15:45:58 -07002579 ip0 = vlib_buffer_get_current (p0);
2580
2581 error0 = IP4_ERROR_NONE;
Dave Barachd7cb1b52016-12-09 09:52:16 -05002582 next0 = IP4_REWRITE_NEXT_DROP; /* drop on error */
Ed Warnickecb9cada2015-12-08 15:45:58 -07002583
2584 /* Decrement TTL & update checksum. */
Damjan Marion213b5aa2017-07-13 21:19:27 +02002585 if (PREDICT_TRUE (!(p0->flags & VNET_BUFFER_F_LOCALLY_ORIGINATED)))
Ed Warnickecb9cada2015-12-08 15:45:58 -07002586 {
2587 i32 ttl0 = ip0->ttl;
2588
2589 checksum0 = ip0->checksum + clib_host_to_net_u16 (0x0100);
2590
2591 checksum0 += checksum0 >= 0xffff;
2592
2593 ip0->checksum = checksum0;
2594
2595 ASSERT (ip0->ttl > 0);
2596
2597 ttl0 -= 1;
2598
2599 ip0->ttl = ttl0;
2600
Dave Barach2c0a4f42017-06-29 09:30:15 -04002601 ASSERT ((ip0->checksum == ip4_header_checksum (ip0)) ||
Damjan Marionfb3288f2017-07-19 15:07:10 +02002602 (p0->flags & VNET_BUFFER_F_OFFLOAD_IP_CKSUM));
Ed Warnickecb9cada2015-12-08 15:45:58 -07002603
Dave Barachd7cb1b52016-12-09 09:52:16 -05002604 if (PREDICT_FALSE (ttl0 <= 0))
2605 {
2606 /*
2607 * If the ttl drops below 1 when forwarding, generate
2608 * an ICMP response.
2609 */
2610 error0 = IP4_ERROR_TIME_EXPIRED;
2611 next0 = IP4_REWRITE_NEXT_ICMP_ERROR;
2612 vnet_buffer (p0)->sw_if_index[VLIB_TX] = (u32) ~ 0;
2613 icmp4_error_set_vnet_buffer (p0, ICMP4_time_exceeded,
2614 ICMP4_time_exceeded_ttl_exceeded_in_transit,
2615 0);
2616 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07002617 }
Dave Barachd7cb1b52016-12-09 09:52:16 -05002618 else
2619 {
Damjan Marion213b5aa2017-07-13 21:19:27 +02002620 p0->flags &= ~VNET_BUFFER_F_LOCALLY_ORIGINATED;
Dave Barachd7cb1b52016-12-09 09:52:16 -05002621 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07002622
Neale Ranns1bd01092017-03-15 15:41:17 -04002623 if (do_counters)
2624 vlib_prefetch_combined_counter (&adjacency_counters,
Damjan Marion586afd72017-04-05 19:18:20 +02002625 thread_index, adj_index0);
Neale Ranns044183f2017-01-24 01:34:25 -08002626
Ed Warnickecb9cada2015-12-08 15:45:58 -07002627 /* Guess we are only writing on simple Ethernet header. */
Dave Barachd7cb1b52016-12-09 09:52:16 -05002628 vnet_rewrite_one_header (adj0[0], ip0, sizeof (ethernet_header_t));
Neale Ranns32e1c012016-11-22 17:07:28 +00002629 if (is_mcast)
2630 {
2631 /*
2632 * copy bytes from the IP address into the MAC rewrite
2633 */
Neale Ranns2e7fbcc2017-03-15 04:22:25 -07002634 vnet_fixup_one_header (adj0[0], &ip0->dst_address, ip0);
Neale Ranns32e1c012016-11-22 17:07:28 +00002635 }
Dave Barach75fc8542016-10-11 16:16:02 -04002636
Dave Barachd7cb1b52016-12-09 09:52:16 -05002637 /* Update packet buffer attributes/set output interface. */
2638 rw_len0 = adj0[0].rewrite_header.data_bytes;
2639 vnet_buffer (p0)->ip.save_rewrite_length = rw_len0;
Dave Barach75fc8542016-10-11 16:16:02 -04002640
Neale Ranns1bd01092017-03-15 15:41:17 -04002641 if (do_counters)
2642 vlib_increment_combined_counter
2643 (&adjacency_counters,
Damjan Marion586afd72017-04-05 19:18:20 +02002644 thread_index, adj_index0, 1,
Neale Ranns1bd01092017-03-15 15:41:17 -04002645 vlib_buffer_length_in_chain (vm, p0) + rw_len0);
Dave Barach75fc8542016-10-11 16:16:02 -04002646
Dave Barachd7cb1b52016-12-09 09:52:16 -05002647 /* Check MTU of outgoing interface. */
2648 error0 = (vlib_buffer_length_in_chain (vm, p0)
2649 > adj0[0].rewrite_header.max_l3_packet_bytes
2650 ? IP4_ERROR_MTU_EXCEEDED : error0);
Neale Rannscf3561b2017-12-13 01:44:25 -08002651 if (is_mcast)
2652 {
2653 error0 = ((adj0[0].rewrite_header.sw_if_index ==
2654 vnet_buffer (p0)->sw_if_index[VLIB_RX]) ?
2655 IP4_ERROR_SAME_INTERFACE : error0);
2656 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07002657 p0->error = error_node->errors[error0];
Chris Luke816f3e12016-06-14 16:24:47 -04002658
Dave Barachd7cb1b52016-12-09 09:52:16 -05002659 /* Don't adjust the buffer for ttl issue; icmp-error node wants
2660 * to see the IP headerr */
2661 if (PREDICT_TRUE (error0 == IP4_ERROR_NONE))
2662 {
2663 p0->current_data -= rw_len0;
2664 p0->current_length += rw_len0;
2665 tx_sw_if_index0 = adj0[0].rewrite_header.sw_if_index;
Chris Luke816f3e12016-06-14 16:24:47 -04002666
Dave Barachd7cb1b52016-12-09 09:52:16 -05002667 vnet_buffer (p0)->sw_if_index[VLIB_TX] = tx_sw_if_index0;
2668 next0 = adj0[0].rewrite_header.next_index;
Dave Barach5331c722016-08-17 11:54:30 -04002669
Neale Ranns5e575b12016-10-03 09:40:25 +01002670 if (is_midchain)
Dave Barachd7cb1b52016-12-09 09:52:16 -05002671 {
Neale Rannsdb14f5a2018-01-29 10:43:33 -08002672 adj0->sub_type.midchain.fixup_func
2673 (vm, adj0, p0, adj0->sub_type.midchain.fixup_data);
Neale Ranns5e575b12016-10-03 09:40:25 +01002674 }
2675
Neale Rannsb069a692017-03-15 12:34:25 -04002676 if (PREDICT_FALSE
2677 (adj0[0].rewrite_header.flags & VNET_REWRITE_HAS_FEATURES))
2678 vnet_feature_arc_start (lm->output_feature_arc_index,
2679 tx_sw_if_index0, &next0, p0);
Damjan Marion8b3191e2016-11-09 19:54:20 +01002680
Dave Barachd7cb1b52016-12-09 09:52:16 -05002681 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07002682
Ed Warnickecb9cada2015-12-08 15:45:58 -07002683 from += 1;
2684 n_left_from -= 1;
2685 to_next += 1;
2686 n_left_to_next -= 1;
Dave Barach75fc8542016-10-11 16:16:02 -04002687
Ed Warnickecb9cada2015-12-08 15:45:58 -07002688 vlib_validate_buffer_enqueue_x1 (vm, node, next_index,
2689 to_next, n_left_to_next,
2690 pi0, next0);
2691 }
Dave Barach75fc8542016-10-11 16:16:02 -04002692
Ed Warnickecb9cada2015-12-08 15:45:58 -07002693 vlib_put_next_frame (vm, node, next_index, n_left_to_next);
2694 }
2695
2696 /* Need to do trace after rewrites to pick up new packet data. */
2697 if (node->flags & VLIB_NODE_FLAG_TRACE)
Neale Rannsf06aea52016-11-29 06:51:37 -08002698 ip4_forward_next_trace (vm, node, frame, VLIB_TX);
Ed Warnickecb9cada2015-12-08 15:45:58 -07002699
2700 return frame->n_vectors;
2701}
2702
Dave Barach132d51d2016-07-07 10:10:17 -04002703
Neale Rannsf06aea52016-11-29 06:51:37 -08002704/** @brief IPv4 rewrite node.
2705 @node ip4-rewrite
Dave Barach132d51d2016-07-07 10:10:17 -04002706
2707 This is the IPv4 transit-rewrite node: decrement TTL, fix the ipv4
2708 header checksum, fetch the ip adjacency, check the outbound mtu,
2709 apply the adjacency rewrite, and send pkts to the adjacency
2710 rewrite header's rewrite_next_index.
2711
2712 @param vm vlib_main_t corresponding to the current thread
2713 @param node vlib_node_runtime_t
2714 @param frame vlib_frame_t whose contents should be dispatched
2715
2716 @par Graph mechanics: buffer metadata, next index usage
2717
2718 @em Uses:
2719 - <code>vnet_buffer(b)->ip.adj_index[VLIB_TX]</code>
2720 - the rewrite adjacency index
2721 - <code>adj->lookup_next_index</code>
2722 - Must be IP_LOOKUP_NEXT_REWRITE or IP_LOOKUP_NEXT_ARP, otherwise
Dave Barach75fc8542016-10-11 16:16:02 -04002723 the packet will be dropped.
Dave Barach132d51d2016-07-07 10:10:17 -04002724 - <code>adj->rewrite_header</code>
2725 - Rewrite string length, rewrite string, next_index
2726
2727 @em Sets:
2728 - <code>b->current_data, b->current_length</code>
2729 - Updated net of applying the rewrite string
2730
2731 <em>Next Indices:</em>
2732 - <code> adj->rewrite_header.next_index </code>
Vijayabhaskar Katamreddyce074122017-11-15 13:50:26 -08002733 or @c ip4-drop
Dave Barach132d51d2016-07-07 10:10:17 -04002734*/
Ed Warnickecb9cada2015-12-08 15:45:58 -07002735static uword
Neale Rannsf06aea52016-11-29 06:51:37 -08002736ip4_rewrite (vlib_main_t * vm,
Dave Barachd7cb1b52016-12-09 09:52:16 -05002737 vlib_node_runtime_t * node, vlib_frame_t * frame)
Ed Warnickecb9cada2015-12-08 15:45:58 -07002738{
Neale Ranns9c6a6132017-02-21 05:33:14 -08002739 if (adj_are_counters_enabled ())
2740 return ip4_rewrite_inline (vm, node, frame, 1, 0, 0);
2741 else
2742 return ip4_rewrite_inline (vm, node, frame, 0, 0, 0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07002743}
2744
Neale Ranns0bfe5d82016-08-25 15:29:12 +01002745static uword
2746ip4_midchain (vlib_main_t * vm,
Dave Barachd7cb1b52016-12-09 09:52:16 -05002747 vlib_node_runtime_t * node, vlib_frame_t * frame)
Neale Ranns0bfe5d82016-08-25 15:29:12 +01002748{
Neale Ranns9c6a6132017-02-21 05:33:14 -08002749 if (adj_are_counters_enabled ())
2750 return ip4_rewrite_inline (vm, node, frame, 1, 1, 0);
2751 else
2752 return ip4_rewrite_inline (vm, node, frame, 0, 1, 0);
Neale Ranns0bfe5d82016-08-25 15:29:12 +01002753}
2754
Neale Ranns32e1c012016-11-22 17:07:28 +00002755static uword
2756ip4_rewrite_mcast (vlib_main_t * vm,
2757 vlib_node_runtime_t * node, vlib_frame_t * frame)
Dave Barachd7cb1b52016-12-09 09:52:16 -05002758{
Neale Ranns9c6a6132017-02-21 05:33:14 -08002759 if (adj_are_counters_enabled ())
2760 return ip4_rewrite_inline (vm, node, frame, 1, 0, 1);
2761 else
2762 return ip4_rewrite_inline (vm, node, frame, 0, 0, 1);
Neale Ranns32e1c012016-11-22 17:07:28 +00002763}
Ed Warnickecb9cada2015-12-08 15:45:58 -07002764
Neale Ranns0f26c5a2017-03-01 15:12:11 -08002765static uword
2766ip4_mcast_midchain (vlib_main_t * vm,
2767 vlib_node_runtime_t * node, vlib_frame_t * frame)
2768{
2769 if (adj_are_counters_enabled ())
2770 return ip4_rewrite_inline (vm, node, frame, 1, 1, 1);
2771 else
2772 return ip4_rewrite_inline (vm, node, frame, 0, 1, 1);
2773}
2774
Neale Ranns32e1c012016-11-22 17:07:28 +00002775/* *INDENT-OFF* */
2776VLIB_REGISTER_NODE (ip4_rewrite_node) = {
2777 .function = ip4_rewrite,
2778 .name = "ip4-rewrite",
2779 .vector_size = sizeof (u32),
Ed Warnickecb9cada2015-12-08 15:45:58 -07002780
Neale Ranns32e1c012016-11-22 17:07:28 +00002781 .format_trace = format_ip4_rewrite_trace,
Ed Warnickecb9cada2015-12-08 15:45:58 -07002782
Neale Ranns32e1c012016-11-22 17:07:28 +00002783 .n_next_nodes = 2,
2784 .next_nodes = {
Vijayabhaskar Katamreddyce074122017-11-15 13:50:26 -08002785 [IP4_REWRITE_NEXT_DROP] = "ip4-drop",
Neale Ranns32e1c012016-11-22 17:07:28 +00002786 [IP4_REWRITE_NEXT_ICMP_ERROR] = "ip4-icmp-error",
2787 },
2788};
2789VLIB_NODE_FUNCTION_MULTIARCH (ip4_rewrite_node, ip4_rewrite)
2790
2791VLIB_REGISTER_NODE (ip4_rewrite_mcast_node) = {
2792 .function = ip4_rewrite_mcast,
2793 .name = "ip4-rewrite-mcast",
2794 .vector_size = sizeof (u32),
2795
2796 .format_trace = format_ip4_rewrite_trace,
2797 .sibling_of = "ip4-rewrite",
2798};
2799VLIB_NODE_FUNCTION_MULTIARCH (ip4_rewrite_mcast_node, ip4_rewrite_mcast)
2800
Neale Ranns0f26c5a2017-03-01 15:12:11 -08002801VLIB_REGISTER_NODE (ip4_mcast_midchain_node, static) = {
2802 .function = ip4_mcast_midchain,
2803 .name = "ip4-mcast-midchain",
2804 .vector_size = sizeof (u32),
2805
2806 .format_trace = format_ip4_rewrite_trace,
2807 .sibling_of = "ip4-rewrite",
2808};
2809VLIB_NODE_FUNCTION_MULTIARCH (ip4_mcast_midchain_node, ip4_mcast_midchain)
2810
Neale Ranns32e1c012016-11-22 17:07:28 +00002811VLIB_REGISTER_NODE (ip4_midchain_node) = {
2812 .function = ip4_midchain,
2813 .name = "ip4-midchain",
2814 .vector_size = sizeof (u32),
2815 .format_trace = format_ip4_forward_next_trace,
2816 .sibling_of = "ip4-rewrite",
2817};
Dave Barachd7cb1b52016-12-09 09:52:16 -05002818VLIB_NODE_FUNCTION_MULTIARCH (ip4_midchain_node, ip4_midchain);
Neale Ranns32e1c012016-11-22 17:07:28 +00002819/* *INDENT-ON */
Damjan Marion1c80e832016-05-11 23:07:18 +02002820
Dave Barachd7cb1b52016-12-09 09:52:16 -05002821int
2822ip4_lookup_validate (ip4_address_t * a, u32 fib_index0)
2823{
2824 ip4_fib_mtrie_t *mtrie0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002825 ip4_fib_mtrie_leaf_t leaf0;
Neale Ranns0bfe5d82016-08-25 15:29:12 +01002826 u32 lbi0;
Dave Barach75fc8542016-10-11 16:16:02 -04002827
Neale Ranns0bfe5d82016-08-25 15:29:12 +01002828 mtrie0 = &ip4_fib_get (fib_index0)->mtrie;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002829
Neale Ranns04a75e32017-03-23 06:46:01 -07002830 leaf0 = ip4_fib_mtrie_lookup_step_one (mtrie0, a);
Ed Warnickecb9cada2015-12-08 15:45:58 -07002831 leaf0 = ip4_fib_mtrie_lookup_step (mtrie0, leaf0, a, 2);
2832 leaf0 = ip4_fib_mtrie_lookup_step (mtrie0, leaf0, a, 3);
Dave Barach75fc8542016-10-11 16:16:02 -04002833
Neale Ranns0bfe5d82016-08-25 15:29:12 +01002834 lbi0 = ip4_fib_mtrie_leaf_get_adj_index (leaf0);
Dave Barach75fc8542016-10-11 16:16:02 -04002835
Dave Barachd7cb1b52016-12-09 09:52:16 -05002836 return lbi0 == ip4_fib_table_lookup_lb (ip4_fib_get (fib_index0), a);
Ed Warnickecb9cada2015-12-08 15:45:58 -07002837}
Dave Barach75fc8542016-10-11 16:16:02 -04002838
Ed Warnickecb9cada2015-12-08 15:45:58 -07002839static clib_error_t *
2840test_lookup_command_fn (vlib_main_t * vm,
Dave Barachd7cb1b52016-12-09 09:52:16 -05002841 unformat_input_t * input, vlib_cli_command_t * cmd)
Ed Warnickecb9cada2015-12-08 15:45:58 -07002842{
Billy McFall309fe062016-10-14 07:37:33 -04002843 ip4_fib_t *fib;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002844 u32 table_id = 0;
2845 f64 count = 1;
2846 u32 n;
2847 int i;
2848 ip4_address_t ip4_base_address;
2849 u64 errors = 0;
2850
Dave Barachd7cb1b52016-12-09 09:52:16 -05002851 while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
2852 {
Ed Warnickecb9cada2015-12-08 15:45:58 -07002853 if (unformat (input, "table %d", &table_id))
Dave Barachd7cb1b52016-12-09 09:52:16 -05002854 {
2855 /* Make sure the entry exists. */
2856 fib = ip4_fib_get (table_id);
2857 if ((fib) && (fib->index != table_id))
2858 return clib_error_return (0, "<fib-index> %d does not exist",
2859 table_id);
2860 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07002861 else if (unformat (input, "count %f", &count))
2862 ;
2863
2864 else if (unformat (input, "%U",
2865 unformat_ip4_address, &ip4_base_address))
Dave Barachd7cb1b52016-12-09 09:52:16 -05002866 ;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002867 else
Dave Barachd7cb1b52016-12-09 09:52:16 -05002868 return clib_error_return (0, "unknown input `%U'",
2869 format_unformat_error, input);
2870 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07002871
2872 n = count;
2873
2874 for (i = 0; i < n; i++)
2875 {
2876 if (!ip4_lookup_validate (&ip4_base_address, table_id))
Dave Barachd7cb1b52016-12-09 09:52:16 -05002877 errors++;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002878
Dave Barach75fc8542016-10-11 16:16:02 -04002879 ip4_base_address.as_u32 =
Dave Barachd7cb1b52016-12-09 09:52:16 -05002880 clib_host_to_net_u32 (1 +
2881 clib_net_to_host_u32 (ip4_base_address.as_u32));
Ed Warnickecb9cada2015-12-08 15:45:58 -07002882 }
2883
Dave Barach75fc8542016-10-11 16:16:02 -04002884 if (errors)
Ed Warnickecb9cada2015-12-08 15:45:58 -07002885 vlib_cli_output (vm, "%llu errors out of %d lookups\n", errors, n);
2886 else
2887 vlib_cli_output (vm, "No errors in %d lookups\n", n);
2888
2889 return 0;
2890}
2891
Billy McFall0683c9c2016-10-13 08:27:31 -04002892/*?
2893 * Perform a lookup of an IPv4 Address (or range of addresses) in the
2894 * given FIB table to determine if there is a conflict with the
2895 * adjacency table. The fib-id can be determined by using the
2896 * '<em>show ip fib</em>' command. If fib-id is not entered, default value
2897 * of 0 is used.
2898 *
2899 * @todo This command uses fib-id, other commands use table-id (not
2900 * just a name, they are different indexes). Would like to change this
2901 * to table-id for consistency.
2902 *
2903 * @cliexpar
2904 * Example of how to run the test lookup command:
2905 * @cliexstart{test lookup 172.16.1.1 table 1 count 2}
2906 * No errors in 2 lookups
2907 * @cliexend
2908?*/
2909/* *INDENT-OFF* */
Dave Barachd7cb1b52016-12-09 09:52:16 -05002910VLIB_CLI_COMMAND (lookup_test_command, static) =
2911{
2912 .path = "test lookup",
2913 .short_help = "test lookup <ipv4-addr> [table <fib-id>] [count <nn>]",
2914 .function = test_lookup_command_fn,
Ed Warnickecb9cada2015-12-08 15:45:58 -07002915};
Billy McFall0683c9c2016-10-13 08:27:31 -04002916/* *INDENT-ON* */
Ed Warnickecb9cada2015-12-08 15:45:58 -07002917
Dave Barachd7cb1b52016-12-09 09:52:16 -05002918int
2919vnet_set_ip4_flow_hash (u32 table_id, u32 flow_hash_config)
Ed Warnickecb9cada2015-12-08 15:45:58 -07002920{
Neale Ranns107e7d42017-04-11 09:55:19 -07002921 u32 fib_index;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002922
Neale Ranns107e7d42017-04-11 09:55:19 -07002923 fib_index = fib_table_find (FIB_PROTOCOL_IP4, table_id);
2924
2925 if (~0 == fib_index)
Ed Warnickecb9cada2015-12-08 15:45:58 -07002926 return VNET_API_ERROR_NO_SUCH_FIB;
2927
Neale Ranns227038a2017-04-21 01:07:59 -07002928 fib_table_set_flow_hash_config (fib_index, FIB_PROTOCOL_IP4,
2929 flow_hash_config);
Ed Warnickecb9cada2015-12-08 15:45:58 -07002930
Ed Warnickecb9cada2015-12-08 15:45:58 -07002931 return 0;
2932}
Dave Barach75fc8542016-10-11 16:16:02 -04002933
Ed Warnickecb9cada2015-12-08 15:45:58 -07002934static clib_error_t *
2935set_ip_flow_hash_command_fn (vlib_main_t * vm,
Dave Barachd7cb1b52016-12-09 09:52:16 -05002936 unformat_input_t * input,
2937 vlib_cli_command_t * cmd)
Ed Warnickecb9cada2015-12-08 15:45:58 -07002938{
2939 int matched = 0;
2940 u32 table_id = 0;
2941 u32 flow_hash_config = 0;
2942 int rv;
2943
Dave Barachd7cb1b52016-12-09 09:52:16 -05002944 while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
2945 {
2946 if (unformat (input, "table %d", &table_id))
2947 matched = 1;
Ed Warnickecb9cada2015-12-08 15:45:58 -07002948#define _(a,v) \
2949 else if (unformat (input, #a)) { flow_hash_config |= v; matched=1;}
Dave Barachd7cb1b52016-12-09 09:52:16 -05002950 foreach_flow_hash_bit
Ed Warnickecb9cada2015-12-08 15:45:58 -07002951#undef _
Dave Barachd7cb1b52016-12-09 09:52:16 -05002952 else
2953 break;
2954 }
Dave Barach75fc8542016-10-11 16:16:02 -04002955
Ed Warnickecb9cada2015-12-08 15:45:58 -07002956 if (matched == 0)
2957 return clib_error_return (0, "unknown input `%U'",
Dave Barachd7cb1b52016-12-09 09:52:16 -05002958 format_unformat_error, input);
Dave Barach75fc8542016-10-11 16:16:02 -04002959
Ed Warnickecb9cada2015-12-08 15:45:58 -07002960 rv = vnet_set_ip4_flow_hash (table_id, flow_hash_config);
2961 switch (rv)
2962 {
2963 case 0:
2964 break;
Dave Barach75fc8542016-10-11 16:16:02 -04002965
Ed Warnickecb9cada2015-12-08 15:45:58 -07002966 case VNET_API_ERROR_NO_SUCH_FIB:
2967 return clib_error_return (0, "no such FIB table %d", table_id);
Dave Barach75fc8542016-10-11 16:16:02 -04002968
Ed Warnickecb9cada2015-12-08 15:45:58 -07002969 default:
2970 clib_warning ("BUG: illegal flow hash config 0x%x", flow_hash_config);
2971 break;
2972 }
Dave Barach75fc8542016-10-11 16:16:02 -04002973
Ed Warnickecb9cada2015-12-08 15:45:58 -07002974 return 0;
2975}
Dave Barach75fc8542016-10-11 16:16:02 -04002976
Billy McFall0683c9c2016-10-13 08:27:31 -04002977/*?
2978 * Configure the set of IPv4 fields used by the flow hash.
2979 *
2980 * @cliexpar
2981 * Example of how to set the flow hash on a given table:
2982 * @cliexcmd{set ip flow-hash table 7 dst sport dport proto}
 * Example of how to display the configured flow hash:
2984 * @cliexstart{show ip fib}
Billy McFallebb9a6a2016-10-17 11:35:32 -04002985 * ipv4-VRF:0, fib_index 0, flow hash: src dst sport dport proto
2986 * 0.0.0.0/0
2987 * unicast-ip4-chain
2988 * [@0]: dpo-load-balance: [index:0 buckets:1 uRPF:0 to:[0:0]]
2989 * [0] [@0]: dpo-drop ip6
2990 * 0.0.0.0/32
2991 * unicast-ip4-chain
2992 * [@0]: dpo-load-balance: [index:1 buckets:1 uRPF:1 to:[0:0]]
2993 * [0] [@0]: dpo-drop ip6
2994 * 224.0.0.0/8
2995 * unicast-ip4-chain
2996 * [@0]: dpo-load-balance: [index:3 buckets:1 uRPF:3 to:[0:0]]
2997 * [0] [@0]: dpo-drop ip6
2998 * 6.0.1.2/32
2999 * unicast-ip4-chain
3000 * [@0]: dpo-load-balance: [index:30 buckets:1 uRPF:29 to:[0:0]]
3001 * [0] [@3]: arp-ipv4: via 6.0.0.1 af_packet0
3002 * 7.0.0.1/32
3003 * unicast-ip4-chain
3004 * [@0]: dpo-load-balance: [index:31 buckets:4 uRPF:30 to:[0:0]]
3005 * [0] [@3]: arp-ipv4: via 6.0.0.2 af_packet0
3006 * [1] [@3]: arp-ipv4: via 6.0.0.2 af_packet0
3007 * [2] [@3]: arp-ipv4: via 6.0.0.2 af_packet0
3008 * [3] [@3]: arp-ipv4: via 6.0.0.1 af_packet0
3009 * 240.0.0.0/8
3010 * unicast-ip4-chain
3011 * [@0]: dpo-load-balance: [index:2 buckets:1 uRPF:2 to:[0:0]]
3012 * [0] [@0]: dpo-drop ip6
3013 * 255.255.255.255/32
3014 * unicast-ip4-chain
3015 * [@0]: dpo-load-balance: [index:4 buckets:1 uRPF:4 to:[0:0]]
3016 * [0] [@0]: dpo-drop ip6
3017 * ipv4-VRF:7, fib_index 1, flow hash: dst sport dport proto
3018 * 0.0.0.0/0
3019 * unicast-ip4-chain
3020 * [@0]: dpo-load-balance: [index:12 buckets:1 uRPF:11 to:[0:0]]
3021 * [0] [@0]: dpo-drop ip6
3022 * 0.0.0.0/32
3023 * unicast-ip4-chain
3024 * [@0]: dpo-load-balance: [index:13 buckets:1 uRPF:12 to:[0:0]]
3025 * [0] [@0]: dpo-drop ip6
3026 * 172.16.1.0/24
3027 * unicast-ip4-chain
3028 * [@0]: dpo-load-balance: [index:17 buckets:1 uRPF:16 to:[0:0]]
3029 * [0] [@4]: ipv4-glean: af_packet0
3030 * 172.16.1.1/32
3031 * unicast-ip4-chain
3032 * [@0]: dpo-load-balance: [index:18 buckets:1 uRPF:17 to:[1:84]]
3033 * [0] [@2]: dpo-receive: 172.16.1.1 on af_packet0
3034 * 172.16.1.2/32
3035 * unicast-ip4-chain
3036 * [@0]: dpo-load-balance: [index:21 buckets:1 uRPF:20 to:[0:0]]
3037 * [0] [@5]: ipv4 via 172.16.1.2 af_packet0: IP4: 02:fe:9e:70:7a:2b -> 26:a5:f6:9c:3a:36
3038 * 172.16.2.0/24
3039 * unicast-ip4-chain
3040 * [@0]: dpo-load-balance: [index:19 buckets:1 uRPF:18 to:[0:0]]
3041 * [0] [@4]: ipv4-glean: af_packet1
3042 * 172.16.2.1/32
3043 * unicast-ip4-chain
3044 * [@0]: dpo-load-balance: [index:20 buckets:1 uRPF:19 to:[0:0]]
3045 * [0] [@2]: dpo-receive: 172.16.2.1 on af_packet1
3046 * 224.0.0.0/8
3047 * unicast-ip4-chain
3048 * [@0]: dpo-load-balance: [index:15 buckets:1 uRPF:14 to:[0:0]]
3049 * [0] [@0]: dpo-drop ip6
3050 * 240.0.0.0/8
3051 * unicast-ip4-chain
3052 * [@0]: dpo-load-balance: [index:14 buckets:1 uRPF:13 to:[0:0]]
3053 * [0] [@0]: dpo-drop ip6
3054 * 255.255.255.255/32
3055 * unicast-ip4-chain
3056 * [@0]: dpo-load-balance: [index:16 buckets:1 uRPF:15 to:[0:0]]
3057 * [0] [@0]: dpo-drop ip6
Billy McFall0683c9c2016-10-13 08:27:31 -04003058 * @cliexend
3059?*/
3060/* *INDENT-OFF* */
Dave Barachd7cb1b52016-12-09 09:52:16 -05003061VLIB_CLI_COMMAND (set_ip_flow_hash_command, static) =
3062{
Ed Warnickecb9cada2015-12-08 15:45:58 -07003063 .path = "set ip flow-hash",
Dave Barach75fc8542016-10-11 16:16:02 -04003064 .short_help =
Billy McFall0683c9c2016-10-13 08:27:31 -04003065 "set ip flow-hash table <table-id> [src] [dst] [sport] [dport] [proto] [reverse]",
Ed Warnickecb9cada2015-12-08 15:45:58 -07003066 .function = set_ip_flow_hash_command_fn,
3067};
Billy McFall0683c9c2016-10-13 08:27:31 -04003068/* *INDENT-ON* */
Dave Barach75fc8542016-10-11 16:16:02 -04003069
Dave Barachd7cb1b52016-12-09 09:52:16 -05003070int
3071vnet_set_ip4_classify_intfc (vlib_main_t * vm, u32 sw_if_index,
3072 u32 table_index)
Ed Warnickecb9cada2015-12-08 15:45:58 -07003073{
Dave Barachd7cb1b52016-12-09 09:52:16 -05003074 vnet_main_t *vnm = vnet_get_main ();
3075 vnet_interface_main_t *im = &vnm->interface_main;
3076 ip4_main_t *ipm = &ip4_main;
3077 ip_lookup_main_t *lm = &ipm->lookup_main;
3078 vnet_classify_main_t *cm = &vnet_classify_main;
Neale Rannsdf089a82016-10-02 16:39:06 +01003079 ip4_address_t *if_addr;
Ed Warnickecb9cada2015-12-08 15:45:58 -07003080
3081 if (pool_is_free_index (im->sw_interfaces, sw_if_index))
3082 return VNET_API_ERROR_NO_MATCHING_INTERFACE;
3083
3084 if (table_index != ~0 && pool_is_free_index (cm->tables, table_index))
3085 return VNET_API_ERROR_NO_SUCH_ENTRY;
3086
3087 vec_validate (lm->classify_table_index_by_sw_if_index, sw_if_index);
Dave Barachd7cb1b52016-12-09 09:52:16 -05003088 lm->classify_table_index_by_sw_if_index[sw_if_index] = table_index;
Ed Warnickecb9cada2015-12-08 15:45:58 -07003089
Neale Rannsdf089a82016-10-02 16:39:06 +01003090 if_addr = ip4_interface_first_address (ipm, sw_if_index, NULL);
3091
3092 if (NULL != if_addr)
Dave Barachd7cb1b52016-12-09 09:52:16 -05003093 {
Neale Rannsdf089a82016-10-02 16:39:06 +01003094 fib_prefix_t pfx = {
Dave Barachd7cb1b52016-12-09 09:52:16 -05003095 .fp_len = 32,
3096 .fp_proto = FIB_PROTOCOL_IP4,
3097 .fp_addr.ip4 = *if_addr,
Neale Rannsdf089a82016-10-02 16:39:06 +01003098 };
3099 u32 fib_index;
3100
Dave Barachd7cb1b52016-12-09 09:52:16 -05003101 fib_index = fib_table_get_index_for_sw_if_index (FIB_PROTOCOL_IP4,
3102 sw_if_index);
Neale Rannsdf089a82016-10-02 16:39:06 +01003103
3104
Dave Barachd7cb1b52016-12-09 09:52:16 -05003105 if (table_index != (u32) ~ 0)
3106 {
3107 dpo_id_t dpo = DPO_INVALID;
Neale Rannsdf089a82016-10-02 16:39:06 +01003108
Dave Barachd7cb1b52016-12-09 09:52:16 -05003109 dpo_set (&dpo,
3110 DPO_CLASSIFY,
3111 DPO_PROTO_IP4,
3112 classify_dpo_create (DPO_PROTO_IP4, table_index));
Neale Rannsdf089a82016-10-02 16:39:06 +01003113
Dave Barachd7cb1b52016-12-09 09:52:16 -05003114 fib_table_entry_special_dpo_add (fib_index,
3115 &pfx,
3116 FIB_SOURCE_CLASSIFY,
3117 FIB_ENTRY_FLAG_NONE, &dpo);
3118 dpo_reset (&dpo);
3119 }
Neale Rannsdf089a82016-10-02 16:39:06 +01003120 else
Dave Barachd7cb1b52016-12-09 09:52:16 -05003121 {
3122 fib_table_entry_special_remove (fib_index,
3123 &pfx, FIB_SOURCE_CLASSIFY);
3124 }
3125 }
Neale Rannsdf089a82016-10-02 16:39:06 +01003126
Ed Warnickecb9cada2015-12-08 15:45:58 -07003127 return 0;
3128}
3129
3130static clib_error_t *
3131set_ip_classify_command_fn (vlib_main_t * vm,
Dave Barachd7cb1b52016-12-09 09:52:16 -05003132 unformat_input_t * input,
3133 vlib_cli_command_t * cmd)
Ed Warnickecb9cada2015-12-08 15:45:58 -07003134{
3135 u32 table_index = ~0;
3136 int table_index_set = 0;
3137 u32 sw_if_index = ~0;
3138 int rv;
Dave Barach75fc8542016-10-11 16:16:02 -04003139
Dave Barachd7cb1b52016-12-09 09:52:16 -05003140 while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
3141 {
3142 if (unformat (input, "table-index %d", &table_index))
3143 table_index_set = 1;
3144 else if (unformat (input, "intfc %U", unformat_vnet_sw_interface,
3145 vnet_get_main (), &sw_if_index))
3146 ;
3147 else
3148 break;
3149 }
Dave Barach75fc8542016-10-11 16:16:02 -04003150
Ed Warnickecb9cada2015-12-08 15:45:58 -07003151 if (table_index_set == 0)
3152 return clib_error_return (0, "classify table-index must be specified");
3153
3154 if (sw_if_index == ~0)
3155 return clib_error_return (0, "interface / subif must be specified");
3156
3157 rv = vnet_set_ip4_classify_intfc (vm, sw_if_index, table_index);
3158
3159 switch (rv)
3160 {
3161 case 0:
3162 break;
3163
3164 case VNET_API_ERROR_NO_MATCHING_INTERFACE:
3165 return clib_error_return (0, "No such interface");
3166
3167 case VNET_API_ERROR_NO_SUCH_ENTRY:
3168 return clib_error_return (0, "No such classifier table");
3169 }
3170 return 0;
3171}
3172
Billy McFall0683c9c2016-10-13 08:27:31 -04003173/*?
3174 * Assign a classification table to an interface. The classification
3175 * table is created using the '<em>classify table</em>' and '<em>classify session</em>'
 * commands. Once the table is created, use this command to filter packets
3177 * on an interface.
3178 *
3179 * @cliexpar
3180 * Example of how to assign a classification table to an interface:
3181 * @cliexcmd{set ip classify intfc GigabitEthernet2/0/0 table-index 1}
3182?*/
3183/* *INDENT-OFF* */
Dave Barachd7cb1b52016-12-09 09:52:16 -05003184VLIB_CLI_COMMAND (set_ip_classify_command, static) =
3185{
Ed Warnickecb9cada2015-12-08 15:45:58 -07003186 .path = "set ip classify",
Dave Barach75fc8542016-10-11 16:16:02 -04003187 .short_help =
Billy McFall0683c9c2016-10-13 08:27:31 -04003188 "set ip classify intfc <interface> table-index <classify-idx>",
Ed Warnickecb9cada2015-12-08 15:45:58 -07003189 .function = set_ip_classify_command_fn,
3190};
Billy McFall0683c9c2016-10-13 08:27:31 -04003191/* *INDENT-ON* */
Dave Barachd7cb1b52016-12-09 09:52:16 -05003192
Neale Ranns1ec36522017-11-29 05:20:37 -08003193static clib_error_t *
3194ip4_config (vlib_main_t * vm, unformat_input_t * input)
3195{
3196 ip4_main_t *im = &ip4_main;
3197 uword heapsize = 0;
3198
3199 while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
3200 {
3201 if (unformat (input, "heap-size %U", unformat_memory_size, &heapsize))
3202 ;
3203 else
3204 return clib_error_return (0,
3205 "invalid heap-size parameter `%U'",
3206 format_unformat_error, input);
3207 }
3208
3209 im->mtrie_heap_size = heapsize;
3210
3211 return 0;
3212}
3213
3214VLIB_EARLY_CONFIG_FUNCTION (ip4_config, "ip");
3215
Dave Barachd7cb1b52016-12-09 09:52:16 -05003216/*
3217 * fd.io coding-style-patch-verification: ON
3218 *
3219 * Local Variables:
3220 * eval: (c-set-style "gnu")
3221 * End:
3222 */