blob: 8c96a25cc5d5fbda4ccf5b4b142d3decfaf4b230 [file] [log] [blame]
Neale Ranns0bfe5d82016-08-25 15:29:12 +01001/*
2 * Copyright (c) 2016 Cisco and/or its affiliates.
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at:
6 *
7 * http://www.apache.org/licenses/LICENSE-2.0
8 *
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
14 */
15/**
16 * @file
17 * @brief Common utility functions for IPv4, IPv6 and L2 LISP-GPE adjacencys.
18 *
19 */
20
Neale Rannsb80c5362016-10-08 13:03:40 +010021#include <vnet/dpo/load_balance.h>
22#include <vnet/lisp-cp/lisp_types.h>
Neale Ranns0bfe5d82016-08-25 15:29:12 +010023#include <vnet/lisp-gpe/lisp_gpe_sub_interface.h>
24#include <vnet/lisp-gpe/lisp_gpe_adjacency.h>
25#include <vnet/lisp-gpe/lisp_gpe_tunnel.h>
26#include <vnet/fib/fib_entry.h>
27#include <vnet/adj/adj_midchain.h>
28
29/**
30 * Memory pool of all adjacencies
31 */
32static lisp_gpe_adjacency_t *lisp_adj_pool;
33
34/**
35 * Hash table of all adjacencies. key:{nh, itf}
36 * We never have an all zeros address since the interfaces are multi-access,
37 * therefore there is no ambiguity between a v4 and v6 next-hop, so we don't
38 * need to add the protocol to the key.
39 */
40static
41BVT (clib_bihash)
42 lisp_adj_db;
43
44#define LISP_ADJ_SET_KEY(_key, _itf, _nh) \
45{ \
46 _key.key[0] = (_nh)->ip.v6.as_u64[0]; \
47 _key.key[1] = (_nh)->ip.v6.as_u64[1]; \
48 _key.key[2] = (_itf); \
49}
50
51 static index_t lisp_adj_find (const ip_address_t * addr, u32 sw_if_index)
52{
53 BVT (clib_bihash_kv) kv;
54
55 LISP_ADJ_SET_KEY (kv, sw_if_index, addr);
56
57 if (BV (clib_bihash_search) (&lisp_adj_db, &kv, &kv) < 0)
58 {
59 return (INDEX_INVALID);
60 }
61 else
62 {
63 return (kv.value);
64 }
65}
66
67static void
68lisp_adj_insert (const ip_address_t * addr, u32 sw_if_index, index_t ai)
69{
70 BVT (clib_bihash_kv) kv;
71
72 LISP_ADJ_SET_KEY (kv, sw_if_index, addr);
73 kv.value = ai;
74
75 BV (clib_bihash_add_del) (&lisp_adj_db, &kv, 1);
76}
77
78static void
79lisp_adj_remove (const ip_address_t * addr, u32 sw_if_index)
80{
81 BVT (clib_bihash_kv) kv;
82
83 LISP_ADJ_SET_KEY (kv, sw_if_index, addr);
84
85 BV (clib_bihash_add_del) (&lisp_adj_db, &kv, 0);
86}
87
88static lisp_gpe_adjacency_t *
89lisp_gpe_adjacency_get_i (index_t lai)
90{
91 return (pool_elt_at_index (lisp_adj_pool, lai));
92}
93
94fib_forward_chain_type_t
95lisp_gpe_adj_get_fib_chain_type (const lisp_gpe_adjacency_t * ladj)
96{
97 switch (ip_addr_version (&ladj->remote_rloc))
98 {
99 case IP4:
100 return (FIB_FORW_CHAIN_TYPE_UNICAST_IP4);
101 case IP6:
102 return (FIB_FORW_CHAIN_TYPE_UNICAST_IP6);
103 default:
104 ASSERT (0);
105 break;
106 }
107 return (FIB_FORW_CHAIN_TYPE_UNICAST_IP4);
108}
109
Neale Rannsb80c5362016-10-08 13:03:40 +0100110static void
111ip46_address_to_ip_address (const ip46_address_t * a, ip_address_t * b)
112{
113 if (ip46_address_is_ip4 (a))
114 {
115 memset (b, 0, sizeof (*b));
116 ip_address_set (b, &a->ip4, IP4);
117 }
118 else
119 {
120 ip_address_set (b, &a->ip6, IP6);
121 }
122}
123
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100124/**
125 * @brief Stack the tunnel's midchain on the IP forwarding chain of the via
126 */
127static void
Neale Rannsb80c5362016-10-08 13:03:40 +0100128lisp_gpe_adj_stack_one (lisp_gpe_adjacency_t * ladj, adj_index_t ai)
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100129{
Neale Ranns5e575b12016-10-03 09:40:25 +0100130 const lisp_gpe_tunnel_t *lgt;
Neale Ranns948e00f2016-10-20 13:39:34 +0100131 dpo_id_t tmp = DPO_INVALID;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100132
133 lgt = lisp_gpe_tunnel_get (ladj->tunnel_index);
134 fib_entry_contribute_forwarding (lgt->fib_entry_index,
135 lisp_gpe_adj_get_fib_chain_type (ladj),
136 &tmp);
137
Neale Rannsb80c5362016-10-08 13:03:40 +0100138 if (DPO_LOAD_BALANCE == tmp.dpoi_type)
139 {
140 /*
141 * post LISP rewrite we will load-balance. However, the LISP encap
142 * is always the same for this adjacency/tunnel and hence the IP/UDP src,dst
143 * hash is always the same result too. So we do that hash now and
144 * stack on the choice.
145 * If the choice is an incomplete adj then we will need a poke when
146 * it becomes complete. This happens since the adj update walk propagates
147 * as far a recursive paths.
148 */
149 const dpo_id_t *choice;
150 load_balance_t *lb;
151 int hash;
152
153 lb = load_balance_get (tmp.dpoi_index);
154
155 if (IP4 == ip_addr_version (&ladj->remote_rloc))
156 {
157 hash = ip4_compute_flow_hash ((ip4_header_t *) adj_get_rewrite (ai),
158 lb->lb_hash_config);
159 }
160 else
161 {
162 hash = ip6_compute_flow_hash ((ip6_header_t *) adj_get_rewrite (ai),
163 lb->lb_hash_config);
164 }
165
166 choice =
167 load_balance_get_bucket_i (lb, hash & lb->lb_n_buckets_minus_1);
168 dpo_copy (&tmp, choice);
169 }
170
171 adj_nbr_midchain_stack (ai, &tmp);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100172 dpo_reset (&tmp);
173}
174
Neale Rannsb80c5362016-10-08 13:03:40 +0100175/**
176 * @brief Call back when restacking all adjacencies on a GRE interface
177 */
178static adj_walk_rc_t
179lisp_gpe_adj_walk_cb (adj_index_t ai, void *ctx)
180{
181 lisp_gpe_adjacency_t *ladj = ctx;
182
183 lisp_gpe_adj_stack_one (ladj, ai);
184
185 return (ADJ_WALK_RC_CONTINUE);
186}
187
188static void
189lisp_gpe_adj_stack (lisp_gpe_adjacency_t * ladj)
190{
191 fib_protocol_t nh_proto;
192 ip46_address_t nh;
193
194 ip_address_to_46 (&ladj->remote_rloc, &nh, &nh_proto);
195
196 /*
197 * walk all the adjacencies on th lisp interface and restack them
198 */
199 adj_nbr_walk_nh (ladj->sw_if_index,
200 nh_proto, &nh, lisp_gpe_adj_walk_cb, ladj);
201}
202
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100203static lisp_gpe_next_protocol_e
Neale Ranns924d03a2016-10-19 08:25:46 +0100204lisp_gpe_adj_proto_from_vnet_link_type (vnet_link_t linkt)
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100205{
206 switch (linkt)
207 {
Neale Ranns924d03a2016-10-19 08:25:46 +0100208 case VNET_LINK_IP4:
Neale Ranns5e575b12016-10-03 09:40:25 +0100209 return (LISP_GPE_NEXT_PROTO_IP4);
Neale Ranns924d03a2016-10-19 08:25:46 +0100210 case VNET_LINK_IP6:
Neale Ranns5e575b12016-10-03 09:40:25 +0100211 return (LISP_GPE_NEXT_PROTO_IP6);
Neale Ranns924d03a2016-10-19 08:25:46 +0100212 case VNET_LINK_ETHERNET:
Neale Ranns5e575b12016-10-03 09:40:25 +0100213 return (LISP_GPE_NEXT_PROTO_ETHERNET);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100214 default:
215 ASSERT (0);
216 }
Neale Ranns5e575b12016-10-03 09:40:25 +0100217 return (LISP_GPE_NEXT_PROTO_IP4);
218}
219
220#define is_v4_packet(_h) ((*(u8*) _h) & 0xF0) == 0x40
221
222static void
223lisp_gpe_fixup (vlib_main_t * vm, ip_adjacency_t * adj, vlib_buffer_t * b)
224{
225 /* Fixup the checksum and len fields in the LISP tunnel encap
226 * that was applied at the midchain node */
227 ip_udp_fixup_one (vm, b, is_v4_packet (vlib_buffer_get_current (b)));
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100228}
229
Neale Rannsb80c5362016-10-08 13:03:40 +0100230/**
231 * @brief The LISP-GPE interface registered function to update, i.e.
232 * provide an rewrite string for, an adjacency.
233 */
234void
235lisp_gpe_update_adjacency (vnet_main_t * vnm, u32 sw_if_index, adj_index_t ai)
236{
237 const lisp_gpe_tunnel_t *lgt;
238 lisp_gpe_adjacency_t *ladj;
239 ip_adjacency_t *adj;
240 ip_address_t rloc;
241 vnet_link_t linkt;
242 index_t lai;
243
244 adj = adj_get (ai);
245 ip46_address_to_ip_address (&adj->sub_type.nbr.next_hop, &rloc);
246
247 /*
248 * find an existing or create a new adj
249 */
250 lai = lisp_adj_find (&rloc, sw_if_index);
251
252 ASSERT (INDEX_INVALID != lai);
253
254 ladj = pool_elt_at_index (lisp_adj_pool, lai);
255 lgt = lisp_gpe_tunnel_get (ladj->tunnel_index);
256 linkt = adj_get_link_type (ai);
257
258 adj_nbr_midchain_update_rewrite
259 (ai, lisp_gpe_fixup,
260 (VNET_LINK_ETHERNET == linkt ?
261 ADJ_MIDCHAIN_FLAG_NO_COUNT :
262 ADJ_MIDCHAIN_FLAG_NONE),
263 lisp_gpe_tunnel_build_rewrite
Neale Ranns924d03a2016-10-19 08:25:46 +0100264 (lgt, ladj, lisp_gpe_adj_proto_from_vnet_link_type (linkt)));
Neale Rannsb80c5362016-10-08 13:03:40 +0100265
266 lisp_gpe_adj_stack_one (ladj, ai);
267}
268
269u8 *
270lisp_gpe_build_rewrite (vnet_main_t * vnm,
271 u32 sw_if_index,
272 vnet_link_t link_type, const void *dst_address)
273{
274 ASSERT (0);
275 return (NULL);
276}
277
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100278index_t
279lisp_gpe_adjacency_find_or_create_and_lock (const locator_pair_t * pair,
280 u32 overlay_table_id, u32 vni)
281{
Neale Rannsb80c5362016-10-08 13:03:40 +0100282 const lisp_gpe_sub_interface_t *l3s;
Neale Ranns5e575b12016-10-03 09:40:25 +0100283 const lisp_gpe_tunnel_t *lgt;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100284 lisp_gpe_adjacency_t *ladj;
285 index_t lai, l3si;
286
287 /*
288 * first find the L3 sub-interface that corresponds to the loacl-rloc and vni
289 */
290 l3si = lisp_gpe_sub_interface_find_or_create_and_lock (&pair->lcl_loc,
291 overlay_table_id,
292 vni);
Neale Rannsb80c5362016-10-08 13:03:40 +0100293 l3s = lisp_gpe_sub_interface_get (l3si);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100294
295 /*
296 * find an existing or create a new adj
297 */
Neale Rannsb80c5362016-10-08 13:03:40 +0100298 lai = lisp_adj_find (&pair->rmt_loc, l3s->sw_if_index);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100299
300 if (INDEX_INVALID == lai)
301 {
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100302
303 pool_get (lisp_adj_pool, ladj);
304 memset (ladj, 0, sizeof (*ladj));
305 lai = (ladj - lisp_adj_pool);
306
Neale Rannsb80c5362016-10-08 13:03:40 +0100307 ip_address_copy (&ladj->remote_rloc, &pair->rmt_loc);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100308 ladj->vni = vni;
309 /* transfer the lock to the adj */
310 ladj->lisp_l3_sub_index = l3si;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100311 ladj->sw_if_index = l3s->sw_if_index;
312
313 /* if vni is non-default */
314 if (ladj->vni)
315 ladj->flags = LISP_GPE_FLAGS_I;
316
317 /* work in lisp-gpe not legacy mode */
318 ladj->flags |= LISP_GPE_FLAGS_P;
319
320 /*
321 * find the tunnel that will provide the underlying transport
322 * and hence the rewrite.
323 * The RLOC FIB index is default table - always.
324 */
325 ladj->tunnel_index = lisp_gpe_tunnel_find_or_create_and_lock (pair, 0);
326
327 lgt = lisp_gpe_tunnel_get (ladj->tunnel_index);
328
329 /*
330 * become of child of the RLOC FIB entry so we are updated when
331 * its reachability changes, allowing us to re-stack the midcahins
332 */
333 ladj->fib_entry_child_index = fib_entry_child_add (lgt->fib_entry_index,
334 FIB_NODE_TYPE_LISP_ADJ,
335 lai);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100336
Neale Rannsb80c5362016-10-08 13:03:40 +0100337 lisp_adj_insert (&ladj->remote_rloc, ladj->sw_if_index, lai);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100338 }
339 else
340 {
341 /* unlock the interface from the find. */
342 lisp_gpe_sub_interface_unlock (l3si);
343 ladj = lisp_gpe_adjacency_get_i (lai);
344 }
345
346 ladj->locks++;
347
348 return (lai);
349}
350
351/**
352 * @brief Get a pointer to a tunnel from a pointer to a FIB node
353 */
354static lisp_gpe_adjacency_t *
355lisp_gpe_adjacency_from_fib_node (const fib_node_t * node)
356{
357 return ((lisp_gpe_adjacency_t *)
358 ((char *) node -
359 STRUCT_OFFSET_OF (lisp_gpe_adjacency_t, fib_node)));
360}
361
362static void
363lisp_gpe_adjacency_last_lock_gone (lisp_gpe_adjacency_t * ladj)
364{
Neale Rannsb80c5362016-10-08 13:03:40 +0100365 const lisp_gpe_tunnel_t *lgt;
366
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100367 /*
368 * no children so we are not counting locks. no-op.
369 * at least not counting
370 */
Neale Rannsb80c5362016-10-08 13:03:40 +0100371 lisp_adj_remove (&ladj->remote_rloc, ladj->sw_if_index);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100372
373 /*
374 * unlock the resources this adj holds
375 */
Neale Rannsb80c5362016-10-08 13:03:40 +0100376 lgt = lisp_gpe_tunnel_get (ladj->tunnel_index);
377
378 fib_entry_child_remove (lgt->fib_entry_index, ladj->fib_entry_child_index);
379
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100380 lisp_gpe_tunnel_unlock (ladj->tunnel_index);
381 lisp_gpe_sub_interface_unlock (ladj->lisp_l3_sub_index);
382
383 pool_put (lisp_adj_pool, ladj);
384}
385
386void
387lisp_gpe_adjacency_unlock (index_t lai)
388{
389 lisp_gpe_adjacency_t *ladj;
390
391 ladj = lisp_gpe_adjacency_get_i (lai);
392
393 ladj->locks--;
394
395 if (0 == ladj->locks)
396 {
397 lisp_gpe_adjacency_last_lock_gone (ladj);
398 }
399}
400
401const lisp_gpe_adjacency_t *
402lisp_gpe_adjacency_get (index_t lai)
403{
404 return (lisp_gpe_adjacency_get_i (lai));
405}
406
407
408/**
409 * @brief LISP GPE tunnel back walk
410 *
411 * The FIB entry through which this tunnel resolves has been updated.
412 * re-stack the midchain on the new forwarding.
413 */
414static fib_node_back_walk_rc_t
415lisp_gpe_adjacency_back_walk (fib_node_t * node,
416 fib_node_back_walk_ctx_t * ctx)
417{
418 lisp_gpe_adj_stack (lisp_gpe_adjacency_from_fib_node (node));
419
420 return (FIB_NODE_BACK_WALK_CONTINUE);
421}
422
423static fib_node_t *
424lisp_gpe_adjacency_get_fib_node (fib_node_index_t index)
425{
426 lisp_gpe_adjacency_t *ladj;
427
428 ladj = pool_elt_at_index (lisp_adj_pool, index);
429 return (&ladj->fib_node);
430}
431
432static void
433lisp_gpe_adjacency_last_fib_lock_gone (fib_node_t * node)
434{
435 lisp_gpe_adjacency_last_lock_gone (lisp_gpe_adjacency_from_fib_node (node));
436}
437
438const static fib_node_vft_t lisp_gpe_tuennel_vft = {
439 .fnv_get = lisp_gpe_adjacency_get_fib_node,
440 .fnv_back_walk = lisp_gpe_adjacency_back_walk,
441 .fnv_last_lock = lisp_gpe_adjacency_last_fib_lock_gone,
442};
443
444u8 *
445format_lisp_gpe_adjacency (u8 * s, va_list * args)
446{
447 lisp_gpe_adjacency_t *ladj = va_arg (*args, lisp_gpe_adjacency_t *);
448 lisp_gpe_adjacency_format_flags_t flags =
Billy McFallcfcf1e22016-10-14 09:51:49 -0400449 va_arg (*args, lisp_gpe_adjacency_format_flags_t);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100450
451 if (flags & LISP_GPE_ADJ_FORMAT_FLAG_DETAIL)
452 {
453 s =
454 format (s, "index %d locks:%d\n", ladj - lisp_adj_pool, ladj->locks);
455 }
456
457 s = format (s, " vni: %d,", ladj->vni);
458 s = format (s, " remote-RLOC: %U,", format_ip_address, &ladj->remote_rloc);
459
460 if (flags & LISP_GPE_ADJ_FORMAT_FLAG_DETAIL)
461 {
462 s = format (s, " %U\n",
463 format_lisp_gpe_sub_interface,
464 lisp_gpe_sub_interface_get (ladj->lisp_l3_sub_index));
465 s = format (s, " %U\n",
466 format_lisp_gpe_tunnel,
467 lisp_gpe_tunnel_get (ladj->tunnel_index));
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100468 }
469 else
470 {
471 s = format (s, " LISP L3 sub-interface index: %d,",
472 ladj->lisp_l3_sub_index);
473 s = format (s, " LISP tunnel index: %d", ladj->tunnel_index);
474 }
475
476
477 return (s);
478}
479
480static clib_error_t *
481lisp_gpe_adjacency_show (vlib_main_t * vm,
482 unformat_input_t * input, vlib_cli_command_t * cmd)
483{
484 lisp_gpe_adjacency_t *ladj;
485 index_t index;
486
487 if (pool_elts (lisp_adj_pool) == 0)
488 vlib_cli_output (vm, "No lisp-gpe Adjacencies");
489
490 if (unformat (input, "%d", &index))
491 {
492 ladj = lisp_gpe_adjacency_get_i (index);
493 vlib_cli_output (vm, "%U", format_lisp_gpe_adjacency, ladj,
494 LISP_GPE_ADJ_FORMAT_FLAG_DETAIL);
495 }
496 else
497 {
498 /* *INDENT-OFF* */
499 pool_foreach (ladj, lisp_adj_pool,
500 ({
501 vlib_cli_output (vm, "[%d] %U\n",
502 ladj - lisp_adj_pool,
503 format_lisp_gpe_adjacency, ladj,
504 LISP_GPE_ADJ_FORMAT_FLAG_NONE);
505 }));
506 /* *INDENT-ON* */
507 }
508
509 return 0;
510}
511
512/* *INDENT-OFF* */
513VLIB_CLI_COMMAND (show_lisp_gpe_tunnel_command, static) =
514{
515 .path = "show lisp gpe adjacency",
516 .function = lisp_gpe_adjacency_show,
517};
518/* *INDENT-ON* */
519
520#define LISP_ADJ_NBR_DEFAULT_HASH_NUM_BUCKETS (256)
521#define LISP_ADJ_NBR_DEFAULT_HASH_MEMORY_SIZE (1<<20)
522
523static clib_error_t *
524lisp_gpe_adj_module_init (vlib_main_t * vm)
525{
526 BV (clib_bihash_init) (&lisp_adj_db,
527 "Adjacency Neighbour table",
528 LISP_ADJ_NBR_DEFAULT_HASH_NUM_BUCKETS,
529 LISP_ADJ_NBR_DEFAULT_HASH_MEMORY_SIZE);
530
531 fib_node_register_type (FIB_NODE_TYPE_LISP_ADJ, &lisp_gpe_tuennel_vft);
532 return (NULL);
533}
534
535VLIB_INIT_FUNCTION (lisp_gpe_adj_module_init)
536/*
537 * fd.io coding-style-patch-verification: ON
538 *
539 * Local Variables:
540 * eval: (c-set-style "gnu")
541 * End:
542 */