/*
 * Copyright (c) 2016 Cisco and/or its affiliates.
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at:
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
15
16#include <vnet/adj/adj_nbr.h>
17#include <vnet/adj/adj_internal.h>
18#include <vnet/ethernet/arp_packet.h>
19#include <vnet/fib/fib_walk.h>
20
21/*
22 * Vector Hash tables of neighbour (traditional) adjacencies
23 * Key: interface(for the vector index), address (and its proto),
24 * link-type/ether-type.
25 */
Neale Ranns20aec3d2020-05-25 09:09:36 +000026static uword **adj_nbr_tables[FIB_PROTOCOL_IP_MAX];
Neale Ranns0bfe5d82016-08-25 15:29:12 +010027
Neale Ranns20aec3d2020-05-25 09:09:36 +000028typedef struct adj_nbr_key_t_
29{
30 ip46_address_t ank_ip;
31 u64 ank_linkt;
32} adj_nbr_key_t;
Neale Ranns0bfe5d82016-08-25 15:29:12 +010033
/*
 * Fill the hash key _key (an adj_nbr_key_t lvalue) from the link-type
 * _lt and the next-hop address pointer _nh.
 * Wrapped in do/while(0) so the macro behaves as a single statement,
 * and every argument is parenthesised where it is used.
 */
#define ADJ_NBR_SET_KEY(_key, _lt, _nh)                 \
do {                                                    \
    ip46_address_copy(&(_key).ank_ip, (_nh));           \
    (_key).ank_linkt = (_lt);                           \
} while (0)
39
/*
 * True when the interface index _itf is within the protocol's table
 * vector and a hash table has been created for that interface.
 */
#define ADJ_NBR_ITF_OK(_proto, _itf)                    \
    ((vec_len(adj_nbr_tables[_proto]) > (_itf)) &&      \
     (adj_nbr_tables[_proto][(_itf)] != NULL))
Neale Ranns0bfe5d82016-08-25 15:29:12 +010043
/*
 * Validate a next-hop protocol before it is used to index
 * adj_nbr_tables. Asserts that the value is below FIB_PROTOCOL_IP_MAX;
 * additionally, if the value is out of range, logs a warning and
 * returns 'err' from the calling function (pass an empty 'err' in a
 * void function).
 * The argument is copied into a local first so it is evaluated exactly
 * once, whatever expression the caller passes.
 */
#define ADJ_NBR_ASSERT_NH_PROTO(nh_proto, err)          \
  do {                                                  \
    const fib_protocol_t nh_proto__ = (nh_proto);       \
    ASSERT (nh_proto__ < FIB_PROTOCOL_IP_MAX);          \
    if (nh_proto__ >= FIB_PROTOCOL_IP_MAX)              \
      {                                                 \
        clib_warning ("BUG: protocol %d > %d\n",        \
                      (int)nh_proto__,                  \
                      FIB_PROTOCOL_IP_MAX);             \
        return err;                                     \
      }                                                 \
  } while (0)
56
Neale Ranns0bfe5d82016-08-25 15:29:12 +010057static void
58adj_nbr_insert (fib_protocol_t nh_proto,
Neale Ranns924d03a2016-10-19 08:25:46 +010059 vnet_link_t link_type,
Neale Ranns0bfe5d82016-08-25 15:29:12 +010060 const ip46_address_t *nh_addr,
61 u32 sw_if_index,
62 adj_index_t adj_index)
63{
Neale Ranns20aec3d2020-05-25 09:09:36 +000064 adj_nbr_key_t kv;
Neale Ranns0bfe5d82016-08-25 15:29:12 +010065
Benoît Gannefaec38f2020-08-13 11:16:56 +020066 ADJ_NBR_ASSERT_NH_PROTO (nh_proto,);
67
Neale Ranns0bfe5d82016-08-25 15:29:12 +010068 if (sw_if_index >= vec_len(adj_nbr_tables[nh_proto]))
69 {
70 vec_validate(adj_nbr_tables[nh_proto], sw_if_index);
71 }
72 if (NULL == adj_nbr_tables[nh_proto][sw_if_index])
73 {
74 adj_nbr_tables[nh_proto][sw_if_index] =
Neale Ranns20aec3d2020-05-25 09:09:36 +000075 hash_create_mem(0, sizeof(adj_nbr_key_t), sizeof(adj_index_t));
Neale Ranns0bfe5d82016-08-25 15:29:12 +010076 }
77
78 ADJ_NBR_SET_KEY(kv, link_type, nh_addr);
Neale Ranns0bfe5d82016-08-25 15:29:12 +010079
Neale Ranns20aec3d2020-05-25 09:09:36 +000080 hash_set_mem_alloc (&adj_nbr_tables[nh_proto][sw_if_index],
81 &kv, adj_index);
Neale Ranns0bfe5d82016-08-25 15:29:12 +010082}
83
84void
Neale Ranns177bbdc2016-11-15 09:46:51 +000085adj_nbr_remove (adj_index_t ai,
86 fib_protocol_t nh_proto,
Neale Ranns924d03a2016-10-19 08:25:46 +010087 vnet_link_t link_type,
Neale Ranns0bfe5d82016-08-25 15:29:12 +010088 const ip46_address_t *nh_addr,
89 u32 sw_if_index)
90{
Neale Ranns20aec3d2020-05-25 09:09:36 +000091 adj_nbr_key_t kv;
Neale Ranns0bfe5d82016-08-25 15:29:12 +010092
Benoît Gannefaec38f2020-08-13 11:16:56 +020093 ADJ_NBR_ASSERT_NH_PROTO (nh_proto,);
94
Neale Ranns0bfe5d82016-08-25 15:29:12 +010095 if (!ADJ_NBR_ITF_OK(nh_proto, sw_if_index))
96 return;
97
98 ADJ_NBR_SET_KEY(kv, link_type, nh_addr);
99
Neale Ranns20aec3d2020-05-25 09:09:36 +0000100 hash_unset_mem_free(&adj_nbr_tables[nh_proto][sw_if_index], &kv);
101
102 if (0 == hash_elts(adj_nbr_tables[nh_proto][sw_if_index]))
103 {
104 hash_free(adj_nbr_tables[nh_proto][sw_if_index]);
105 }
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100106}
107
Florin Corasf9d05682018-04-26 08:26:52 -0700108adj_index_t
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100109adj_nbr_find (fib_protocol_t nh_proto,
Neale Ranns924d03a2016-10-19 08:25:46 +0100110 vnet_link_t link_type,
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100111 const ip46_address_t *nh_addr,
112 u32 sw_if_index)
113{
Neale Ranns20aec3d2020-05-25 09:09:36 +0000114 adj_nbr_key_t kv;
115 uword *p;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100116
Benoît Gannefaec38f2020-08-13 11:16:56 +0200117 ADJ_NBR_ASSERT_NH_PROTO (nh_proto, ADJ_INDEX_INVALID);
118
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100119 ADJ_NBR_SET_KEY(kv, link_type, nh_addr);
120
121 if (!ADJ_NBR_ITF_OK(nh_proto, sw_if_index))
122 return (ADJ_INDEX_INVALID);
123
Neale Ranns20aec3d2020-05-25 09:09:36 +0000124 p = hash_get_mem(adj_nbr_tables[nh_proto][sw_if_index], &kv);
125
126 if (p)
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100127 {
Neale Ranns20aec3d2020-05-25 09:09:36 +0000128 return (p[0]);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100129 }
Neale Ranns20aec3d2020-05-25 09:09:36 +0000130 return (ADJ_INDEX_INVALID);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100131}
132
Neale Rannsb80c5362016-10-08 13:03:40 +0100133static inline u32
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100134adj_get_nd_node (fib_protocol_t proto)
135{
136 switch (proto) {
137 case FIB_PROTOCOL_IP4:
Neale Rannsb80c5362016-10-08 13:03:40 +0100138 return (ip4_arp_node.index);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100139 case FIB_PROTOCOL_IP6:
Neale Rannsb80c5362016-10-08 13:03:40 +0100140 return (ip6_discover_neighbor_node.index);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100141 case FIB_PROTOCOL_MPLS:
142 break;
143 }
144 ASSERT(0);
Neale Rannsb80c5362016-10-08 13:03:40 +0100145 return (ip4_arp_node.index);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100146}
147
AkshayaNadahalli17f5f602017-03-27 14:47:41 +0530148/**
149 * @brief Check and set feature flags if o/p interface has any o/p features.
150 */
151static void
152adj_nbr_evaluate_feature (adj_index_t ai)
153{
154 ip_adjacency_t *adj;
155 vnet_feature_main_t *fm = &feature_main;
156 i16 feature_count;
157 u8 arc_index;
158 u32 sw_if_index;
159
160 adj = adj_get(ai);
161
162 switch (adj->ia_link)
163 {
164 case VNET_LINK_IP4:
165 arc_index = ip4_main.lookup_main.output_feature_arc_index;
166 break;
167 case VNET_LINK_IP6:
168 arc_index = ip6_main.lookup_main.output_feature_arc_index;
169 break;
170 case VNET_LINK_MPLS:
171 arc_index = mpls_main.output_feature_arc_index;
172 break;
173 default:
174 return;
175 }
176
177 sw_if_index = adj->rewrite_header.sw_if_index;
AkshayaNadahalli98ab0912017-03-27 17:21:05 +0000178 if (vec_len(fm->feature_count_by_sw_if_index[arc_index]) > sw_if_index)
179 {
180 feature_count = fm->feature_count_by_sw_if_index[arc_index][sw_if_index];
181 if (feature_count > 0)
Neale Ranns4ec36c52020-03-31 09:21:29 -0400182 {
183 vnet_feature_config_main_t *cm;
AkshayaNadahalli17f5f602017-03-27 14:47:41 +0530184
Neale Ranns4ec36c52020-03-31 09:21:29 -0400185 adj->rewrite_header.flags |= VNET_REWRITE_HAS_FEATURES;
186 cm = &fm->feature_config_mains[arc_index];
187
188 adj->ia_cfg_index = vec_elt (cm->config_index_by_sw_if_index,
189 sw_if_index);
190 }
191 }
AkshayaNadahalli17f5f602017-03-27 14:47:41 +0530192 return;
193}
194
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100195static ip_adjacency_t*
196adj_nbr_alloc (fib_protocol_t nh_proto,
Neale Ranns924d03a2016-10-19 08:25:46 +0100197 vnet_link_t link_type,
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100198 const ip46_address_t *nh_addr,
199 u32 sw_if_index)
200{
201 ip_adjacency_t *adj;
202
203 adj = adj_alloc(nh_proto);
204
205 adj_nbr_insert(nh_proto, link_type, nh_addr,
206 sw_if_index,
Neale Ranns6c3ebcc2016-10-02 21:20:15 +0100207 adj_get_index(adj));
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100208
209 /*
210 * since we just added the ADJ we have no rewrite string for it,
211 * so its for ARP
212 */
213 adj->lookup_next_index = IP_LOOKUP_NEXT_ARP;
214 adj->sub_type.nbr.next_hop = *nh_addr;
215 adj->ia_link = link_type;
216 adj->ia_nh_proto = nh_proto;
Neale Rannsb80c5362016-10-08 13:03:40 +0100217 adj->rewrite_header.sw_if_index = sw_if_index;
Neale Ranns1bce5a92018-10-30 06:34:25 -0700218 vnet_rewrite_update_mtu(vnet_get_main(), adj->ia_link,
219 &adj->rewrite_header);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100220
AkshayaNadahalli17f5f602017-03-27 14:47:41 +0530221 adj_nbr_evaluate_feature (adj_get_index(adj));
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100222 return (adj);
223}
224
Neale Ranns8f5fef22020-12-21 08:29:34 +0000225void
226adj_nbr_set_mtu (adj_index_t adj_index, u16 mtu)
227{
228 ip_adjacency_t *adj;
229
230 ASSERT(ADJ_INDEX_INVALID != adj_index);
231
232 adj = adj_get(adj_index);
233
234 if (0 == mtu)
235 vnet_rewrite_update_mtu(vnet_get_main(), adj->ia_link,
236 &adj->rewrite_header);
237 else
238 {
239 vnet_rewrite_update_mtu(vnet_get_main(), adj->ia_link,
240 &adj->rewrite_header);
241 adj->rewrite_header.max_l3_packet_bytes =
242 clib_min (adj->rewrite_header.max_l3_packet_bytes, mtu);
243 }
244}
245
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100246/*
Neale Ranns32e1c012016-11-22 17:07:28 +0000247 * adj_nbr_add_or_lock
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100248 *
249 * Add an adjacency for the neighbour requested.
250 *
251 * The key for an adj is:
252 * - the Next-hops protocol (i.e. v4 or v6)
253 * - the address of the next-hop
254 * - the interface the next-hop is reachable through
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100255 */
256adj_index_t
257adj_nbr_add_or_lock (fib_protocol_t nh_proto,
Neale Ranns924d03a2016-10-19 08:25:46 +0100258 vnet_link_t link_type,
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100259 const ip46_address_t *nh_addr,
260 u32 sw_if_index)
261{
262 adj_index_t adj_index;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100263
264 adj_index = adj_nbr_find(nh_proto, link_type, nh_addr, sw_if_index);
265
266 if (ADJ_INDEX_INVALID == adj_index)
267 {
Neale Ranns77cfc012019-12-15 22:26:37 +0000268 ip_adjacency_t *adj;
Neale Rannsb80c5362016-10-08 13:03:40 +0100269 vnet_main_t *vnm;
270
271 vnm = vnet_get_main();
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100272 adj = adj_nbr_alloc(nh_proto, link_type, nh_addr, sw_if_index);
Neale Rannsb80c5362016-10-08 13:03:40 +0100273 adj_index = adj_get_index(adj);
274 adj_lock(adj_index);
275
Neale Ranns1855b8e2018-07-11 10:31:26 -0700276 if (ip46_address_is_equal(&ADJ_BCAST_ADDR, nh_addr))
277 {
278 adj->lookup_next_index = IP_LOOKUP_NEXT_BCAST;
279 }
280
Ole Troand7231612018-06-07 10:17:57 +0200281 vnet_rewrite_init(vnm, sw_if_index, link_type,
Neale Rannsb80c5362016-10-08 13:03:40 +0100282 adj_get_nd_node(nh_proto),
283 vnet_tx_node_index_for_sw_interface(vnm, sw_if_index),
284 &adj->rewrite_header);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100285
286 /*
Neale Rannsb80c5362016-10-08 13:03:40 +0100287 * we need a rewrite where the destination IP address is converted
288 * to the appropriate link-layer address. This is interface specific.
289 * So ask the interface to do it.
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100290 */
Neale Rannsb80c5362016-10-08 13:03:40 +0100291 vnet_update_adjacency_for_sw_interface(vnm, sw_if_index, adj_index);
Neale Ranns8f5fef22020-12-21 08:29:34 +0000292 adj_delegate_adj_created(adj_get(adj_index));
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100293 }
294 else
295 {
Neale Rannsb80c5362016-10-08 13:03:40 +0100296 adj_lock(adj_index);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100297 }
298
Neale Rannsb80c5362016-10-08 13:03:40 +0100299 return (adj_index);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100300}
301
302adj_index_t
303adj_nbr_add_or_lock_w_rewrite (fib_protocol_t nh_proto,
Neale Ranns924d03a2016-10-19 08:25:46 +0100304 vnet_link_t link_type,
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100305 const ip46_address_t *nh_addr,
306 u32 sw_if_index,
307 u8 *rewrite)
308{
309 adj_index_t adj_index;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100310
311 adj_index = adj_nbr_find(nh_proto, link_type, nh_addr, sw_if_index);
312
313 if (ADJ_INDEX_INVALID == adj_index)
314 {
Neale Ranns13a08cc2018-11-07 09:25:54 -0800315 ip_adjacency_t *adj;
316
317 adj = adj_nbr_alloc(nh_proto, link_type, nh_addr, sw_if_index);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100318 adj->rewrite_header.sw_if_index = sw_if_index;
Neale Ranns13a08cc2018-11-07 09:25:54 -0800319 adj_index = adj_get_index(adj);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100320 }
321
Neale Ranns13a08cc2018-11-07 09:25:54 -0800322 adj_lock(adj_index);
323 adj_nbr_update_rewrite(adj_index,
Neale Rannsb80c5362016-10-08 13:03:40 +0100324 ADJ_NBR_REWRITE_FLAG_COMPLETE,
325 rewrite);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100326
Neale Ranns77cfc012019-12-15 22:26:37 +0000327 adj_delegate_adj_created(adj_get(adj_index));
328
Neale Ranns13a08cc2018-11-07 09:25:54 -0800329 return (adj_index);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100330}
331
332/**
333 * adj_nbr_update_rewrite
334 *
335 * Update the adjacency's rewrite string. A NULL string implies the
Jim Thompsonf324dec2019-04-08 03:22:21 -0500336 * rewrite is reset (i.e. when ARP/ND entry is gone).
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100337 * NB: the adj being updated may be handling traffic in the DP.
338 */
339void
340adj_nbr_update_rewrite (adj_index_t adj_index,
Neale Rannsb80c5362016-10-08 13:03:40 +0100341 adj_nbr_rewrite_flag_t flags,
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100342 u8 *rewrite)
343{
344 ip_adjacency_t *adj;
345
346 ASSERT(ADJ_INDEX_INVALID != adj_index);
347
348 adj = adj_get(adj_index);
Neale Rannsb80c5362016-10-08 13:03:40 +0100349
350 if (flags & ADJ_NBR_REWRITE_FLAG_COMPLETE)
351 {
352 /*
353 * update the adj's rewrite string and build the arc
354 * from the rewrite node to the interface's TX node
355 */
356 adj_nbr_update_rewrite_internal(adj, IP_LOOKUP_NEXT_REWRITE,
357 adj_get_rewrite_node(adj->ia_link),
358 vnet_tx_node_index_for_sw_interface(
359 vnet_get_main(),
360 adj->rewrite_header.sw_if_index),
361 rewrite);
362 }
363 else
364 {
365 adj_nbr_update_rewrite_internal(adj, IP_LOOKUP_NEXT_ARP,
366 adj_get_nd_node(adj->ia_nh_proto),
367 vnet_tx_node_index_for_sw_interface(
368 vnet_get_main(),
369 adj->rewrite_header.sw_if_index),
370 rewrite);
371 }
Neale Rannsb80c5362016-10-08 13:03:40 +0100372}
373
374/**
375 * adj_nbr_update_rewrite_internal
376 *
377 * Update the adjacency's rewrite string. A NULL string implies the
Jim Thompsonf324dec2019-04-08 03:22:21 -0500378 * rewrite is reset (i.e. when ARP/ND entry is gone).
Neale Rannsb80c5362016-10-08 13:03:40 +0100379 * NB: the adj being updated may be handling traffic in the DP.
380 */
381void
382adj_nbr_update_rewrite_internal (ip_adjacency_t *adj,
Neale Rannsfa5d1982017-02-20 14:19:51 -0800383 ip_lookup_next_t adj_next_index,
Neale Rannsb80c5362016-10-08 13:03:40 +0100384 u32 this_node,
385 u32 next_node,
386 u8 *rewrite)
387{
Neale Ranns19c68d22016-12-07 15:38:14 +0000388 ip_adjacency_t *walk_adj;
Neale Ranns66300f62020-01-12 21:16:55 +0000389 adj_index_t walk_ai, ai;
Neale Rannsad95b5d2016-11-10 20:35:14 +0000390 vlib_main_t * vm;
391 u32 old_next;
Neale Ranns19c68d22016-12-07 15:38:14 +0000392 int do_walk;
Neale Rannsad95b5d2016-11-10 20:35:14 +0000393
394 vm = vlib_get_main();
395 old_next = adj->lookup_next_index;
396
Neale Ranns66300f62020-01-12 21:16:55 +0000397 ai = walk_ai = adj_get_index(adj);
Neale Rannsad95b5d2016-11-10 20:35:14 +0000398 if (VNET_LINK_MPLS == adj->ia_link)
399 {
400 /*
401 * The link type MPLS has no children in the control plane graph, it only
Paul Vinciguerra8feeaff2019-03-27 11:25:48 -0700402 * has children in the data-plane graph. The backwalk is up the former.
Neale Rannsad95b5d2016-11-10 20:35:14 +0000403 * So we need to walk from its IP cousin.
404 */
405 walk_ai = adj_nbr_find(adj->ia_nh_proto,
406 fib_proto_to_link(adj->ia_nh_proto),
407 &adj->sub_type.nbr.next_hop,
408 adj->rewrite_header.sw_if_index);
409 }
Neale Rannsb80c5362016-10-08 13:03:40 +0100410
411 /*
Neale Ranns19c68d22016-12-07 15:38:14 +0000412 * Don't call the walk re-entrantly
413 */
414 if (ADJ_INDEX_INVALID != walk_ai)
415 {
416 walk_adj = adj_get(walk_ai);
Neale Rannsfa5d1982017-02-20 14:19:51 -0800417 if (ADJ_FLAG_SYNC_WALK_ACTIVE & walk_adj->ia_flags)
Neale Ranns19c68d22016-12-07 15:38:14 +0000418 {
419 do_walk = 0;
420 }
421 else
422 {
423 /*
424 * Prevent re-entrant walk of the same adj
425 */
Neale Rannsfa5d1982017-02-20 14:19:51 -0800426 walk_adj->ia_flags |= ADJ_FLAG_SYNC_WALK_ACTIVE;
Neale Ranns19c68d22016-12-07 15:38:14 +0000427 do_walk = 1;
428 }
429 }
430 else
431 {
432 do_walk = 0;
433 }
434
435 /*
436 * lock the adjacencies that are affected by updates this walk will provoke.
437 * Since the aim of the walk is to update children to link to a different
438 * DPO, this adj will no longer be in use and its lock count will drop to 0.
Paul Vinciguerra8feeaff2019-03-27 11:25:48 -0700439 * We don't want it to be deleted as part of this endeavour.
Neale Ranns19c68d22016-12-07 15:38:14 +0000440 */
Neale Ranns66300f62020-01-12 21:16:55 +0000441 adj_lock(ai);
Neale Ranns19c68d22016-12-07 15:38:14 +0000442 adj_lock(walk_ai);
443
444 /*
Neale Rannsb80c5362016-10-08 13:03:40 +0100445 * Updating a rewrite string is not atomic;
446 * - the rewrite string is too long to write in one instruction
447 * - when swapping from incomplete to complete, we also need to update
Neale Rannsad95b5d2016-11-10 20:35:14 +0000448 * the VLIB graph next-index of the adj.
Neale Rannsb80c5362016-10-08 13:03:40 +0100449 * ideally we would only want to suspend forwarding via this adj whilst we
450 * do this, but we do not have that level of granularity - it's suspend all
451 * worker threads or nothing.
Paul Vinciguerra8feeaff2019-03-27 11:25:48 -0700452 * The other choices are:
Neale Rannsb80c5362016-10-08 13:03:40 +0100453 * - to mark the adj down and back walk so child load-balances drop this adj
454 * from the set.
455 * - update the next_node index of this adj to point to error-drop
456 * both of which will mean for MAC change we will drop for this adj
Neale Rannsad95b5d2016-11-10 20:35:14 +0000457 * which is not acceptable. However, when the adj changes type (from
458 * complete to incomplete and vice-versa) the child DPOs, which have the
459 * VLIB graph next node index, will be sending packets to the wrong graph
460 * node. So from the options above, updating the next_node of the adj to
461 * be drop will work, but it relies on each graph node v4/v6/mpls, rewrite/
462 * arp/midchain always be valid w.r.t. a mis-match of adj type and node type
Paul Vinciguerra8feeaff2019-03-27 11:25:48 -0700463 * (i.e. a rewrite adj in the arp node). This is not enforceable. Getting it
Neale Rannsad95b5d2016-11-10 20:35:14 +0000464 * wrong will lead to hard to find bugs since its a race condition. So we
465 * choose the more reliable method of updating the children to use the drop,
466 * then switching adj's type, then updating the children again. Did I mention
467 * that this doesn't happen often...
468 * So we need to distinguish between the two cases:
469 * 1 - mac change
470 * 2 - adj type change
471 */
Neale Ranns19c68d22016-12-07 15:38:14 +0000472 if (do_walk &&
473 old_next != adj_next_index &&
Neale Rannsad95b5d2016-11-10 20:35:14 +0000474 ADJ_INDEX_INVALID != walk_ai)
475 {
476 /*
477 * the adj is changing type. we need to fix all children so that they
478 * stack momentarily on a drop, while the adj changes. If we don't do
479 * this the children will send packets to a VLIB graph node that does
480 * not correspond to the adj's type - and it goes downhill from there.
481 */
482 fib_node_back_walk_ctx_t bw_ctx = {
483 .fnbw_reason = FIB_NODE_BW_REASON_FLAG_ADJ_DOWN,
484 /*
Paul Vinciguerra8feeaff2019-03-27 11:25:48 -0700485 * force this walk to be synchronous. if we don't and a node in the graph
Neale Rannsad95b5d2016-11-10 20:35:14 +0000486 * (a heavily shared path-list) chooses to back-ground the walk (make it
487 * async) then it will pause and we will do the adj update below, before
488 * all the children are updated. not good.
489 */
490 .fnbw_flags = FIB_NODE_BW_FLAG_FORCE_SYNC,
491 };
492
493 fib_walk_sync(FIB_NODE_TYPE_ADJ, walk_ai, &bw_ctx);
Steven Luong3d5f6222020-01-30 09:11:18 -0800494 /*
495 * fib_walk_sync may allocate a new adjacency and potentially cuase a
496 * realloc for adj_pool. When that happens, adj pointer is no longer
497 * valid here. We refresh the adj pointer accordingly.
498 */
499 adj = adj_get (ai);
Neale Rannsad95b5d2016-11-10 20:35:14 +0000500 }
501
502 /*
503 * If we are just updating the MAC string of the adj (which we also can't
504 * do atomically), then we need to stop packets switching through the adj.
505 * We can't do that on a per-adj basis, so it's all the packets.
506 * If we are updating the type, and we walked back to the children above,
507 * then this barrier serves to flush the queues/frames.
Neale Rannsb80c5362016-10-08 13:03:40 +0100508 */
509 vlib_worker_thread_barrier_sync(vm);
510
511 adj->lookup_next_index = adj_next_index;
Neale Rannscbe25aa2019-09-30 10:53:31 +0000512 adj->ia_node_index = this_node;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100513
514 if (NULL != rewrite)
515 {
516 /*
517 * new rewrite provided.
Neale Rannsb80c5362016-10-08 13:03:40 +0100518 * fill in the adj's rewrite string, and build the VLIB graph arc.
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100519 */
Neale Rannsb80c5362016-10-08 13:03:40 +0100520 vnet_rewrite_set_data_internal(&adj->rewrite_header,
521 sizeof(adj->rewrite_data),
522 rewrite,
523 vec_len(rewrite));
Neale Rannsb80c5362016-10-08 13:03:40 +0100524 vec_free(rewrite);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100525 }
526 else
527 {
Neale Rannsb80c5362016-10-08 13:03:40 +0100528 vnet_rewrite_clear_data_internal(&adj->rewrite_header,
529 sizeof(adj->rewrite_data));
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100530 }
Neale Rannsad95b5d2016-11-10 20:35:14 +0000531 adj->rewrite_header.next_index = vlib_node_add_next(vlib_get_main(),
532 this_node,
533 next_node);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100534
535 /*
Paul Vinciguerra8feeaff2019-03-27 11:25:48 -0700536 * done with the rewrite update - let the workers loose.
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100537 */
Neale Rannsb80c5362016-10-08 13:03:40 +0100538 vlib_worker_thread_barrier_release(vm);
Neale Rannsad95b5d2016-11-10 20:35:14 +0000539
Neale Ranns19c68d22016-12-07 15:38:14 +0000540 if (do_walk &&
541 (old_next != adj->lookup_next_index) &&
542 (ADJ_INDEX_INVALID != walk_ai))
Neale Rannsad95b5d2016-11-10 20:35:14 +0000543 {
544 /*
545 * backwalk to the children so they can stack on the now updated
546 * adjacency
547 */
548 fib_node_back_walk_ctx_t bw_ctx = {
549 .fnbw_reason = FIB_NODE_BW_REASON_FLAG_ADJ_UPDATE,
550 };
551
552 fib_walk_sync(FIB_NODE_TYPE_ADJ, walk_ai, &bw_ctx);
553 }
Neale Ranns19c68d22016-12-07 15:38:14 +0000554 /*
555 * Prevent re-entrant walk of the same adj
556 */
557 if (do_walk)
558 {
Neale Ranns37157d52020-01-23 22:46:06 +0000559 walk_adj = adj_get(walk_ai);
Neale Rannsfa5d1982017-02-20 14:19:51 -0800560 walk_adj->ia_flags &= ~ADJ_FLAG_SYNC_WALK_ACTIVE;
Neale Ranns19c68d22016-12-07 15:38:14 +0000561 }
562
Neale Ranns4ec36c52020-03-31 09:21:29 -0400563 adj_delegate_adj_modified(adj);
Neale Ranns66300f62020-01-12 21:16:55 +0000564 adj_unlock(ai);
Neale Ranns19c68d22016-12-07 15:38:14 +0000565 adj_unlock(walk_ai);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100566}
567
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100568u32
569adj_nbr_db_size (void)
570{
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100571 fib_protocol_t proto;
572 u32 sw_if_index = 0;
Neale Ranns20aec3d2020-05-25 09:09:36 +0000573 u64 count = 0;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100574
575 for (proto = FIB_PROTOCOL_IP4; proto <= FIB_PROTOCOL_IP6; proto++)
576 {
577 vec_foreach_index(sw_if_index, adj_nbr_tables[proto])
578 {
579 if (NULL != adj_nbr_tables[proto][sw_if_index])
580 {
Neale Ranns20aec3d2020-05-25 09:09:36 +0000581 count += hash_elts(adj_nbr_tables[proto][sw_if_index]);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100582 }
583 }
584 }
Neale Ranns20aec3d2020-05-25 09:09:36 +0000585 return (count);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100586}
587
588/**
Neale Ranns20aec3d2020-05-25 09:09:36 +0000589 * @brief Walk all adjacencies on a link for a given next-hop protocol
Neale Rannsb80c5362016-10-08 13:03:40 +0100590 */
Neale Rannsb80c5362016-10-08 13:03:40 +0100591void
592adj_nbr_walk (u32 sw_if_index,
593 fib_protocol_t adj_nh_proto,
594 adj_walk_cb_t cb,
595 void *ctx)
596{
Neale Ranns22391fa2020-05-29 10:19:41 -0400597 adj_index_t ai, *ais, *aip;
Neale Ranns20aec3d2020-05-25 09:09:36 +0000598 adj_nbr_key_t *key;
Neale Ranns20aec3d2020-05-25 09:09:36 +0000599
Benoît Gannefaec38f2020-08-13 11:16:56 +0200600 ADJ_NBR_ASSERT_NH_PROTO (adj_nh_proto,);
601
Neale Rannsb80c5362016-10-08 13:03:40 +0100602 if (!ADJ_NBR_ITF_OK(adj_nh_proto, sw_if_index))
603 return;
604
Neale Ranns22391fa2020-05-29 10:19:41 -0400605 ais = NULL;
606
607 /* elements may be removed from the table during the walk, so
608 * collect the set first then process them */
609 hash_foreach_mem (key, ai, adj_nbr_tables[adj_nh_proto][sw_if_index],
610 ({
611 vec_add1(ais, ai);
612 }));
613
614 vec_foreach(aip, ais)
Neale Ranns20aec3d2020-05-25 09:09:36 +0000615 {
Neale Ranns22391fa2020-05-29 10:19:41 -0400616 /* An adj may be deleted during the walk so check first */
617 if (!pool_is_free_index(adj_pool, *aip))
618 cb(*aip, ctx);
Neale Ranns20aec3d2020-05-25 09:09:36 +0000619 }
Neale Ranns22391fa2020-05-29 10:19:41 -0400620 vec_free(ais);
Neale Rannsb80c5362016-10-08 13:03:40 +0100621}
622
623/**
Neale Rannsb80c5362016-10-08 13:03:40 +0100624 * @brief Walk adjacencies on a link with a given v4 next-hop.
625 * that is visit the adjacencies with different link types.
626 */
627void
628adj_nbr_walk_nh4 (u32 sw_if_index,
629 const ip4_address_t *addr,
630 adj_walk_cb_t cb,
631 void *ctx)
632{
633 if (!ADJ_NBR_ITF_OK(FIB_PROTOCOL_IP4, sw_if_index))
634 return;
635
636 ip46_address_t nh = {
637 .ip4 = *addr,
638 };
Neale Ranns580bba72018-04-23 05:31:19 -0700639 vnet_link_t linkt;
640 adj_index_t ai;
Neale Rannsb80c5362016-10-08 13:03:40 +0100641
Neale Ranns580bba72018-04-23 05:31:19 -0700642 FOR_EACH_VNET_LINK(linkt)
643 {
644 ai = adj_nbr_find (FIB_PROTOCOL_IP4, linkt, &nh, sw_if_index);
Neale Rannsb80c5362016-10-08 13:03:40 +0100645
Neale Ranns580bba72018-04-23 05:31:19 -0700646 if (INDEX_INVALID != ai)
647 cb(ai, ctx);
648 }
Neale Rannsb80c5362016-10-08 13:03:40 +0100649}
650
651/**
652 * @brief Walk adjacencies on a link with a given v6 next-hop.
653 * that is visit the adjacencies with different link types.
654 */
655void
656adj_nbr_walk_nh6 (u32 sw_if_index,
657 const ip6_address_t *addr,
658 adj_walk_cb_t cb,
659 void *ctx)
660{
661 if (!ADJ_NBR_ITF_OK(FIB_PROTOCOL_IP6, sw_if_index))
662 return;
663
664 ip46_address_t nh = {
665 .ip6 = *addr,
666 };
Neale Ranns580bba72018-04-23 05:31:19 -0700667 vnet_link_t linkt;
668 adj_index_t ai;
Neale Rannsb80c5362016-10-08 13:03:40 +0100669
Neale Ranns580bba72018-04-23 05:31:19 -0700670 FOR_EACH_VNET_LINK(linkt)
671 {
672 ai = adj_nbr_find (FIB_PROTOCOL_IP6, linkt, &nh, sw_if_index);
Neale Rannsb80c5362016-10-08 13:03:40 +0100673
Neale Ranns580bba72018-04-23 05:31:19 -0700674 if (INDEX_INVALID != ai)
675 cb(ai, ctx);
676 }
Neale Rannsb80c5362016-10-08 13:03:40 +0100677}
678
679/**
680 * @brief Walk adjacencies on a link with a given next-hop.
681 * that is visit the adjacencies with different link types.
682 */
683void
684adj_nbr_walk_nh (u32 sw_if_index,
685 fib_protocol_t adj_nh_proto,
686 const ip46_address_t *nh,
687 adj_walk_cb_t cb,
688 void *ctx)
689{
Benoît Gannefaec38f2020-08-13 11:16:56 +0200690 ADJ_NBR_ASSERT_NH_PROTO (adj_nh_proto,);
691
Neale Rannsb80c5362016-10-08 13:03:40 +0100692 if (!ADJ_NBR_ITF_OK(adj_nh_proto, sw_if_index))
693 return;
694
Neale Rannscbe25aa2019-09-30 10:53:31 +0000695 switch (adj_nh_proto)
Neale Ranns580bba72018-04-23 05:31:19 -0700696 {
Neale Rannscbe25aa2019-09-30 10:53:31 +0000697 case FIB_PROTOCOL_IP4:
698 adj_nbr_walk_nh4(sw_if_index, &nh->ip4, cb, ctx);
699 break;
700 case FIB_PROTOCOL_IP6:
701 adj_nbr_walk_nh6(sw_if_index, &nh->ip6, cb, ctx);
702 break;
703 case FIB_PROTOCOL_MPLS:
704 ASSERT(0);
705 break;
Neale Ranns580bba72018-04-23 05:31:19 -0700706 }
Neale Rannsb80c5362016-10-08 13:03:40 +0100707}
708
/**
 * Flags describing the interface's state, carried through the
 * interface state-change walks
 */
typedef enum adj_nbr_interface_flags_t_
{
    /** set when the interface has come up; clear when it has gone down */
    ADJ_NBR_INTERFACE_UP = (1 << 0),
} adj_nbr_interface_flags_t;
716
717/**
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100718 * Context for the state change walk of the DB
719 */
720typedef struct adj_nbr_interface_state_change_ctx_t_
721{
722 /**
Neale Ranns8b37b872016-11-21 12:25:22 +0000723 * Flags on the interface
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100724 */
Neale Ranns8b37b872016-11-21 12:25:22 +0000725 adj_nbr_interface_flags_t flags;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100726} adj_nbr_interface_state_change_ctx_t;
727
Neale Rannsb80c5362016-10-08 13:03:40 +0100728static adj_walk_rc_t
729adj_nbr_interface_state_change_one (adj_index_t ai,
Neale Ranns8b37b872016-11-21 12:25:22 +0000730 void *arg)
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100731{
732 /*
733 * Back walk the graph to inform the forwarding entries
Neale Ranns8b37b872016-11-21 12:25:22 +0000734 * that this interface state has changed. Do this synchronously
735 * since this is the walk that provides convergence
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100736 */
737 adj_nbr_interface_state_change_ctx_t *ctx = arg;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100738 fib_node_back_walk_ctx_t bw_ctx = {
Neale Ranns8b37b872016-11-21 12:25:22 +0000739 .fnbw_reason = ((ctx->flags & ADJ_NBR_INTERFACE_UP) ?
740 FIB_NODE_BW_REASON_FLAG_INTERFACE_UP :
741 FIB_NODE_BW_REASON_FLAG_INTERFACE_DOWN),
742 /*
743 * the force sync applies only as far as the first fib_entry.
744 * And it's the fib_entry's we need to converge away from
745 * the adjacencies on the now down link
746 */
747 .fnbw_flags = (!(ctx->flags & ADJ_NBR_INTERFACE_UP) ?
748 FIB_NODE_BW_FLAG_FORCE_SYNC :
Neale Ranns30d53642018-08-27 07:29:15 -0700749 FIB_NODE_BW_FLAG_NONE),
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100750 };
Neale Ranns30d53642018-08-27 07:29:15 -0700751 ip_adjacency_t *adj;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100752
Benoît Ganne9f10edb2021-06-08 16:25:14 +0200753 adj_lock (ai);
754
Neale Ranns30d53642018-08-27 07:29:15 -0700755 adj = adj_get(ai);
756
757 adj->ia_flags |= ADJ_FLAG_SYNC_WALK_ACTIVE;
Neale Rannsb80c5362016-10-08 13:03:40 +0100758 fib_walk_sync(FIB_NODE_TYPE_ADJ, ai, &bw_ctx);
Neale Ranns30d53642018-08-27 07:29:15 -0700759 adj->ia_flags &= ~ADJ_FLAG_SYNC_WALK_ACTIVE;
Neale Rannsb80c5362016-10-08 13:03:40 +0100760
Benoît Ganne9f10edb2021-06-08 16:25:14 +0200761 adj_unlock (ai);
Neale Rannsb80c5362016-10-08 13:03:40 +0100762 return (ADJ_WALK_RC_CONTINUE);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100763}
764
Neale Ranns8b37b872016-11-21 12:25:22 +0000765/**
766 * @brief Registered function for SW interface state changes
767 */
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100768static clib_error_t *
Neale Ranns8b37b872016-11-21 12:25:22 +0000769adj_nbr_sw_interface_state_change (vnet_main_t * vnm,
770 u32 sw_if_index,
771 u32 flags)
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100772{
773 fib_protocol_t proto;
774
775 /*
776 * walk each adj on the interface and trigger a walk from that adj
777 */
778 for (proto = FIB_PROTOCOL_IP4; proto <= FIB_PROTOCOL_IP6; proto++)
779 {
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100780 adj_nbr_interface_state_change_ctx_t ctx = {
Neale Ranns8b37b872016-11-21 12:25:22 +0000781 .flags = ((flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP) ?
782 ADJ_NBR_INTERFACE_UP :
783 0),
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100784 };
785
Neale Rannsb80c5362016-10-08 13:03:40 +0100786 adj_nbr_walk(sw_if_index, proto,
787 adj_nbr_interface_state_change_one,
788 &ctx);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100789 }
790
791 return (NULL);
792}
793
Neale Ranns8b37b872016-11-21 12:25:22 +0000794VNET_SW_INTERFACE_ADMIN_UP_DOWN_FUNCTION_PRIO(
795 adj_nbr_sw_interface_state_change,
796 VNET_ITF_FUNC_PRIORITY_HIGH);
797
798/**
799 * @brief Invoked on each SW interface of a HW interface when the
800 * HW interface state changes
801 */
Neale Ranns0053de62018-05-22 08:40:52 -0700802static walk_rc_t
Neale Ranns8b37b872016-11-21 12:25:22 +0000803adj_nbr_hw_sw_interface_state_change (vnet_main_t * vnm,
804 u32 sw_if_index,
805 void *arg)
806{
807 adj_nbr_interface_state_change_ctx_t *ctx = arg;
808 fib_protocol_t proto;
809
810 /*
811 * walk each adj on the interface and trigger a walk from that adj
812 */
813 for (proto = FIB_PROTOCOL_IP4; proto <= FIB_PROTOCOL_IP6; proto++)
814 {
815 adj_nbr_walk(sw_if_index, proto,
816 adj_nbr_interface_state_change_one,
817 ctx);
818 }
Neale Ranns0053de62018-05-22 08:40:52 -0700819 return (WALK_CONTINUE);
Neale Ranns8b37b872016-11-21 12:25:22 +0000820}
821
822/**
823 * @brief Registered callback for HW interface state changes
824 */
825static clib_error_t *
826adj_nbr_hw_interface_state_change (vnet_main_t * vnm,
827 u32 hw_if_index,
828 u32 flags)
829{
830 /*
831 * walk SW interface on the HW
832 */
833 adj_nbr_interface_state_change_ctx_t ctx = {
834 .flags = ((flags & VNET_HW_INTERFACE_FLAG_LINK_UP) ?
835 ADJ_NBR_INTERFACE_UP :
836 0),
837 };
838
839 vnet_hw_interface_walk_sw(vnm, hw_if_index,
840 adj_nbr_hw_sw_interface_state_change,
841 &ctx);
842
843 return (NULL);
844}
845
846VNET_HW_INTERFACE_LINK_UP_DOWN_FUNCTION_PRIO(
847 adj_nbr_hw_interface_state_change,
848 VNET_ITF_FUNC_PRIORITY_HIGH);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100849
Neale Rannsb80c5362016-10-08 13:03:40 +0100850static adj_walk_rc_t
851adj_nbr_interface_delete_one (adj_index_t ai,
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100852 void *arg)
853{
854 /*
855 * Back walk the graph to inform the forwarding entries
856 * that this interface has been deleted.
857 */
858 fib_node_back_walk_ctx_t bw_ctx = {
859 .fnbw_reason = FIB_NODE_BW_REASON_FLAG_INTERFACE_DELETE,
860 };
Neale Ranns30d53642018-08-27 07:29:15 -0700861 ip_adjacency_t *adj;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100862
Benoît Ganne73911562019-10-16 15:08:37 +0200863 adj_lock(ai);
864
Neale Ranns30d53642018-08-27 07:29:15 -0700865 adj = adj_get(ai);
866
867 adj->ia_flags |= ADJ_FLAG_SYNC_WALK_ACTIVE;
Neale Rannsb80c5362016-10-08 13:03:40 +0100868 fib_walk_sync(FIB_NODE_TYPE_ADJ, ai, &bw_ctx);
Neale Ranns30d53642018-08-27 07:29:15 -0700869 adj->ia_flags &= ~ADJ_FLAG_SYNC_WALK_ACTIVE;
Neale Rannsb80c5362016-10-08 13:03:40 +0100870
Benoît Ganne73911562019-10-16 15:08:37 +0200871 adj_unlock(ai);
Neale Rannsb80c5362016-10-08 13:03:40 +0100872 return (ADJ_WALK_RC_CONTINUE);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100873}
874
875/**
876 * adj_nbr_interface_add_del
877 *
878 * Registered to receive interface Add and delete notifications
879 */
880static clib_error_t *
881adj_nbr_interface_add_del (vnet_main_t * vnm,
882 u32 sw_if_index,
883 u32 is_add)
884{
885 fib_protocol_t proto;
886
887 if (is_add)
888 {
889 /*
890 * not interested in interface additions. we will not back walk
891 * to resolve paths through newly added interfaces. Why? The control
892 * plane should have the brains to add interfaces first, then routes.
893 * So the case where there are paths with a interface that matches
894 * one just created is the case where the path resolved through an
895 * interface that was deleted, and still has not been removed. The
896 * new interface added, is NO GUARANTEE that the interface being
897 * added now, even though it may have the same sw_if_index, is the
898 * same interface that the path needs. So tough!
899 * If the control plane wants these routes to resolve it needs to
900 * remove and add them again.
901 */
902 return (NULL);
903 }
904
905 for (proto = FIB_PROTOCOL_IP4; proto <= FIB_PROTOCOL_IP6; proto++)
906 {
Neale Rannsb80c5362016-10-08 13:03:40 +0100907 adj_nbr_walk(sw_if_index, proto,
908 adj_nbr_interface_delete_one,
909 NULL);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100910 }
911
912 return (NULL);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100913}
914
915VNET_SW_INTERFACE_ADD_DEL_FUNCTION(adj_nbr_interface_add_del);
916
917
Neale Rannsb80c5362016-10-08 13:03:40 +0100918static adj_walk_rc_t
Neale Rannsea8adf72021-08-13 08:10:59 +0000919adj_nbr_ethernet_mac_change_one (adj_index_t ai,
920 void *arg)
921{
922 vnet_update_adjacency_for_sw_interface(vnet_get_main(),
923 adj_get_sw_if_index(ai),
924 ai);
925
926 return (ADJ_WALK_RC_CONTINUE);
927}
928
929/**
930 * Callback function invoked when an interface's MAC Address changes
931 */
932static void
933adj_nbr_ethernet_change_mac (ethernet_main_t * em,
934 u32 sw_if_index, uword opaque)
935{
936 fib_protocol_t proto;
937
938 FOR_EACH_FIB_IP_PROTOCOL(proto)
939 {
940 adj_nbr_walk(sw_if_index, proto,
941 adj_nbr_ethernet_mac_change_one,
942 NULL);
943 }
944}
945
946static adj_walk_rc_t
Neale Rannsb80c5362016-10-08 13:03:40 +0100947adj_nbr_show_one (adj_index_t ai,
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100948 void *arg)
949{
950 vlib_cli_output (arg, "[@%d] %U",
Neale Rannsb80c5362016-10-08 13:03:40 +0100951 ai,
952 format_ip_adjacency, ai,
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100953 FORMAT_IP_ADJACENCY_NONE);
Neale Rannsb80c5362016-10-08 13:03:40 +0100954
955 return (ADJ_WALK_RC_CONTINUE);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100956}
957
958static clib_error_t *
959adj_nbr_show (vlib_main_t * vm,
960 unformat_input_t * input,
961 vlib_cli_command_t * cmd)
962{
963 adj_index_t ai = ADJ_INDEX_INVALID;
Neale Ranns14053c92019-12-29 23:55:18 +0000964 ip46_address_t nh = ip46_address_initializer;
Neale Rannsb80c5362016-10-08 13:03:40 +0100965 u32 sw_if_index = ~0;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100966
967 while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
968 {
Neale Ranns14053c92019-12-29 23:55:18 +0000969 if (unformat (input, "%U",
970 unformat_vnet_sw_interface, vnet_get_main(),
971 &sw_if_index))
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100972 ;
Neale Rannsb80c5362016-10-08 13:03:40 +0100973 else if (unformat (input, "%U",
Neale Ranns14053c92019-12-29 23:55:18 +0000974 unformat_ip46_address, &nh, IP46_TYPE_ANY))
975 ;
976 else if (unformat (input, "%d", &ai))
Neale Rannsb80c5362016-10-08 13:03:40 +0100977 ;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100978 else
979 break;
980 }
981
982 if (ADJ_INDEX_INVALID != ai)
983 {
984 vlib_cli_output (vm, "[@%d] %U",
985 ai,
Neale Rannsb80c5362016-10-08 13:03:40 +0100986 format_ip_adjacency, ai,
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100987 FORMAT_IP_ADJACENCY_DETAIL);
988 }
Neale Rannsb80c5362016-10-08 13:03:40 +0100989 else if (~0 != sw_if_index)
990 {
991 fib_protocol_t proto;
992
Neale Ranns14053c92019-12-29 23:55:18 +0000993 if (ip46_address_is_zero(&nh))
994 {
995 for (proto = FIB_PROTOCOL_IP4; proto <= FIB_PROTOCOL_IP6; proto++)
996 {
997 adj_nbr_walk(sw_if_index, proto,
998 adj_nbr_show_one,
999 vm);
1000 }
1001 }
1002 else
1003 {
1004 proto = (ip46_address_is_ip4(&nh) ?
1005 FIB_PROTOCOL_IP4 :
1006 FIB_PROTOCOL_IP6);
1007 adj_nbr_walk_nh(sw_if_index, proto, &nh,
1008 adj_nbr_show_one,
1009 vm);
1010 }
Neale Rannsb80c5362016-10-08 13:03:40 +01001011 }
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001012 else
1013 {
1014 fib_protocol_t proto;
1015
1016 for (proto = FIB_PROTOCOL_IP4; proto <= FIB_PROTOCOL_IP6; proto++)
1017 {
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001018 vec_foreach_index(sw_if_index, adj_nbr_tables[proto])
1019 {
Neale Rannsb80c5362016-10-08 13:03:40 +01001020 adj_nbr_walk(sw_if_index, proto,
1021 adj_nbr_show_one,
1022 vm);
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001023 }
1024 }
1025 }
1026
1027 return 0;
1028}
1029
Neale Rannsb80c5362016-10-08 13:03:40 +01001030/*?
1031 * Show all neighbour adjacencies.
1032 * @cliexpar
1033 * @cliexstart{sh adj nbr}
1034 * [@2] ipv4 via 1.0.0.2 loop0: IP4: 00:00:22:aa:bb:cc -> 00:00:11:aa:bb:cc
1035 * [@3] mpls via 1.0.0.2 loop0: MPLS_UNICAST: 00:00:22:aa:bb:cc -> 00:00:11:aa:bb:cc
1036 * [@4] ipv4 via 1.0.0.3 loop0: IP4: 00:00:22:aa:bb:cc -> 00:00:11:aa:bb:cc
1037 * [@5] mpls via 1.0.0.3 loop0: MPLS_UNICAST: 00:00:22:aa:bb:cc -> 00:00:11:aa:bb:cc
1038 * @cliexend
1039 ?*/
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001040VLIB_CLI_COMMAND (ip4_show_fib_command, static) = {
1041 .path = "show adj nbr",
Neale Rannsb80c5362016-10-08 13:03:40 +01001042 .short_help = "show adj nbr [<adj_index>] [interface]",
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001043 .function = adj_nbr_show,
1044};
1045
1046u8*
1047format_adj_nbr_incomplete (u8* s, va_list *ap)
1048{
Billy McFallcfcf1e22016-10-14 09:51:49 -04001049 index_t index = va_arg(*ap, index_t);
1050 CLIB_UNUSED(u32 indent) = va_arg(*ap, u32);
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001051 vnet_main_t * vnm = vnet_get_main();
1052 ip_adjacency_t * adj = adj_get(index);
1053
Neale Ranns924d03a2016-10-19 08:25:46 +01001054 s = format (s, "arp-%U", format_vnet_link, adj->ia_link);
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001055 s = format (s, ": via %U",
Neale Rannsb80c5362016-10-08 13:03:40 +01001056 format_ip46_address, &adj->sub_type.nbr.next_hop,
1057 adj_proto_to_46(adj->ia_nh_proto));
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001058 s = format (s, " %U",
Steven70488ab2018-03-28 17:59:00 -07001059 format_vnet_sw_if_index_name,
1060 vnm, adj->rewrite_header.sw_if_index);
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001061
1062 return (s);
1063}
1064
1065u8*
1066format_adj_nbr (u8* s, va_list *ap)
1067{
Billy McFallcfcf1e22016-10-14 09:51:49 -04001068 index_t index = va_arg(*ap, index_t);
1069 CLIB_UNUSED(u32 indent) = va_arg(*ap, u32);
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001070 ip_adjacency_t * adj = adj_get(index);
1071
Neale Ranns924d03a2016-10-19 08:25:46 +01001072 s = format (s, "%U", format_vnet_link, adj->ia_link);
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001073 s = format (s, " via %U ",
Neale Rannsb80c5362016-10-08 13:03:40 +01001074 format_ip46_address, &adj->sub_type.nbr.next_hop,
1075 adj_proto_to_46(adj->ia_nh_proto));
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001076 s = format (s, "%U",
1077 format_vnet_rewrite,
Neale Rannsb069a692017-03-15 12:34:25 -04001078 &adj->rewrite_header, sizeof (adj->rewrite_data), 0);
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001079
1080 return (s);
1081}
1082
1083static void
1084adj_dpo_lock (dpo_id_t *dpo)
1085{
1086 adj_lock(dpo->dpoi_index);
1087}
1088static void
1089adj_dpo_unlock (dpo_id_t *dpo)
1090{
1091 adj_unlock(dpo->dpoi_index);
1092}
1093
Neale Ranns6c3ebcc2016-10-02 21:20:15 +01001094static void
1095adj_mem_show (void)
1096{
1097 fib_show_memory_usage("Adjacency",
1098 pool_elts(adj_pool),
1099 pool_len(adj_pool),
1100 sizeof(ip_adjacency_t));
1101}
1102
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001103const static dpo_vft_t adj_nbr_dpo_vft = {
1104 .dv_lock = adj_dpo_lock,
1105 .dv_unlock = adj_dpo_unlock,
1106 .dv_format = format_adj_nbr,
Neale Ranns6c3ebcc2016-10-02 21:20:15 +01001107 .dv_mem_show = adj_mem_show,
Andrew Yourtchenko5f3fcb92017-10-25 05:50:37 -07001108 .dv_get_urpf = adj_dpo_get_urpf,
Neale Ranns8f5fef22020-12-21 08:29:34 +00001109 .dv_get_mtu = adj_dpo_get_mtu,
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001110};
1111const static dpo_vft_t adj_nbr_incompl_dpo_vft = {
1112 .dv_lock = adj_dpo_lock,
1113 .dv_unlock = adj_dpo_unlock,
1114 .dv_format = format_adj_nbr_incomplete,
Andrew Yourtchenko5f3fcb92017-10-25 05:50:37 -07001115 .dv_get_urpf = adj_dpo_get_urpf,
Neale Ranns8f5fef22020-12-21 08:29:34 +00001116 .dv_get_mtu = adj_dpo_get_mtu,
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001117};
1118
1119/**
1120 * @brief The per-protocol VLIB graph nodes that are assigned to an adjacency
1121 * object.
1122 *
1123 * this means that these graph nodes are ones from which a nbr is the
1124 * parent object in the DPO-graph.
1125 */
1126const static char* const nbr_ip4_nodes[] =
1127{
Neale Rannsf06aea52016-11-29 06:51:37 -08001128 "ip4-rewrite",
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001129 NULL,
1130};
1131const static char* const nbr_ip6_nodes[] =
1132{
1133 "ip6-rewrite",
1134 NULL,
1135};
1136const static char* const nbr_mpls_nodes[] =
1137{
1138 "mpls-output",
1139 NULL,
1140};
Neale Ranns5e575b12016-10-03 09:40:25 +01001141const static char* const nbr_ethernet_nodes[] =
1142{
1143 "adj-l2-rewrite",
1144 NULL,
1145};
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001146const static char* const * const nbr_nodes[DPO_PROTO_NUM] =
1147{
1148 [DPO_PROTO_IP4] = nbr_ip4_nodes,
1149 [DPO_PROTO_IP6] = nbr_ip6_nodes,
1150 [DPO_PROTO_MPLS] = nbr_mpls_nodes,
Neale Ranns5e575b12016-10-03 09:40:25 +01001151 [DPO_PROTO_ETHERNET] = nbr_ethernet_nodes,
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001152};
1153
1154const static char* const nbr_incomplete_ip4_nodes[] =
1155{
1156 "ip4-arp",
1157 NULL,
1158};
1159const static char* const nbr_incomplete_ip6_nodes[] =
1160{
1161 "ip6-discover-neighbor",
1162 NULL,
1163};
1164const static char* const nbr_incomplete_mpls_nodes[] =
1165{
1166 "mpls-adj-incomplete",
1167 NULL,
1168};
1169
1170const static char* const * const nbr_incomplete_nodes[DPO_PROTO_NUM] =
1171{
1172 [DPO_PROTO_IP4] = nbr_incomplete_ip4_nodes,
1173 [DPO_PROTO_IP6] = nbr_incomplete_ip6_nodes,
1174 [DPO_PROTO_MPLS] = nbr_incomplete_mpls_nodes,
1175};
1176
1177void
1178adj_nbr_module_init (void)
1179{
1180 dpo_register(DPO_ADJACENCY,
1181 &adj_nbr_dpo_vft,
1182 nbr_nodes);
1183 dpo_register(DPO_ADJACENCY_INCOMPLETE,
1184 &adj_nbr_incompl_dpo_vft,
1185 nbr_incomplete_nodes);
Neale Rannsea8adf72021-08-13 08:10:59 +00001186
1187 ethernet_address_change_ctx_t ctx = {
1188 .function = adj_nbr_ethernet_change_mac,
1189 .function_opaque = 0,
1190 };
1191 vec_add1 (ethernet_main.address_change_callbacks, ctx);
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001192}