/*
 * Copyright (c) 2015 Cisco and/or its affiliates.
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at:
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
#ifndef included_vnet_vxlan_h
#define included_vnet_vxlan_h

#include <vppinfra/error.h>
#include <vppinfra/hash.h>
#include <vppinfra/bihash_16_8.h>
#include <vppinfra/bihash_24_8.h>
#include <vnet/vnet.h>
#include <vnet/ip/ip.h>
#include <vnet/ip/vtep.h>
#include <vnet/l2/l2_input.h>
#include <vnet/l2/l2_output.h>
#include <vnet/l2/l2_bd.h>
#include <vnet/ethernet/ethernet.h>
#include <vnet/vxlan/vxlan_packet.h>
#include <vnet/ip/ip4_packet.h>
#include <vnet/ip/ip6_packet.h>
#include <vnet/udp/udp_packet.h>
#include <vnet/dpo/dpo.h>
#include <vnet/adj/adj_types.h>

Eyal Bari0fa56782018-06-04 12:25:05 +030036/* *INDENT-OFF* */
Ed Warnickecb9cada2015-12-08 15:45:58 -070037typedef CLIB_PACKED (struct {
Eyal Bari0fa56782018-06-04 12:25:05 +030038 ip4_header_t ip4; /* 20 bytes */
39 udp_header_t udp; /* 8 bytes */
40 vxlan_header_t vxlan; /* 8 bytes */
Ed Warnickecb9cada2015-12-08 15:45:58 -070041}) ip4_vxlan_header_t;
42
Chris Luke99cb3352016-04-26 10:49:53 -040043typedef CLIB_PACKED (struct {
Eyal Bari0fa56782018-06-04 12:25:05 +030044 ip6_header_t ip6; /* 40 bytes */
45 udp_header_t udp; /* 8 bytes */
46 vxlan_header_t vxlan; /* 8 bytes */
Chris Luke99cb3352016-04-26 10:49:53 -040047}) ip6_vxlan_header_t;
Eyal Baridd47eca2018-07-08 08:15:56 +030048/* *INDENT-ON* */
Chris Luke99cb3352016-04-26 10:49:53 -040049
Eyal Baridd47eca2018-07-08 08:15:56 +030050/*
51* Key fields: remote ip, vni on incoming VXLAN packet
52* all fields in NET byte order
53*/
54typedef clib_bihash_kv_16_8_t vxlan4_tunnel_key_t;
Chris Luke99cb3352016-04-26 10:49:53 -040055
Eyal Bari0fa56782018-06-04 12:25:05 +030056/*
57* Key fields: remote ip, vni and fib index on incoming VXLAN packet
58* ip, vni fields in NET byte order
59* fib index field in host byte order
60*/
Eyal Baridd47eca2018-07-08 08:15:56 +030061typedef clib_bihash_kv_24_8_t vxlan6_tunnel_key_t;
Ed Warnickecb9cada2015-12-08 15:45:58 -070062
Eyal Bariefd9cf32018-10-02 12:23:06 +030063typedef union
64{
65 struct
66 {
67 u32 sw_if_index; /* unicast - input interface / mcast - stats interface */
68 union
69 {
70 struct /* unicast action */
71 {
72 u16 next_index;
73 u8 error;
74 };
75 ip4_address_t local_ip; /* used as dst ip for mcast pkts to assign them to unicast tunnel */
76 };
77 };
78 u64 as_u64;
79} vxlan_decap_info_t;
80
Eyal Bari0fa56782018-06-04 12:25:05 +030081typedef struct
82{
Dave Baracheb987d32018-05-03 08:26:39 -040083 /* Required for pool_get_aligned */
Eyal Bari0fa56782018-06-04 12:25:05 +030084 CLIB_CACHE_LINE_ALIGN_MARK (cacheline0);
Dave Baracheb987d32018-05-03 08:26:39 -040085
John Loc42912d2016-11-07 18:30:47 -050086 /* FIB DPO for IP forwarding of VXLAN encap packet */
Eyal Bari0fa56782018-06-04 12:25:05 +030087 dpo_id_t next_dpo;
John Loc42912d2016-11-07 18:30:47 -050088
Ed Warnickecb9cada2015-12-08 15:45:58 -070089 /* vxlan VNI in HOST byte order */
90 u32 vni;
91
John Loc42912d2016-11-07 18:30:47 -050092 /* tunnel src and dst addresses */
93 ip46_address_t src;
94 ip46_address_t dst;
Chris Luke99cb3352016-04-26 10:49:53 -040095
Artem Glazychev839dcc02020-12-01 02:39:21 +070096 /* udp-ports */
97 u16 src_port;
98 u16 dst_port;
99
John Lo56912c82016-12-08 16:10:02 -0500100 /* mcast packet output intfc index (used only if dst is mcast) */
Eyal Baric5b13602016-11-24 19:42:43 +0200101 u32 mcast_sw_if_index;
John Lo56912c82016-12-08 16:10:02 -0500102
Hongjun Nibeb4bf72016-11-25 00:03:46 +0800103 /* decap next index */
Eyal Baria5679e82018-08-26 15:20:07 +0300104 u16 decap_next_index;
Eyal Baric5b13602016-11-24 19:42:43 +0200105
John Loc42912d2016-11-07 18:30:47 -0500106 /* The FIB index for src/dst addresses */
107 u32 encap_fib_index;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700108
John Loc42912d2016-11-07 18:30:47 -0500109 /* vnet intfc index */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700110 u32 sw_if_index;
John Loc42912d2016-11-07 18:30:47 -0500111 u32 hw_if_index;
Chris Luke99cb3352016-04-26 10:49:53 -0400112
John Loc42912d2016-11-07 18:30:47 -0500113 /**
114 * Linkage into the FIB object graph
115 */
116 fib_node_t node;
Chris Luke99cb3352016-04-26 10:49:53 -0400117
Eyal Baric5b13602016-11-24 19:42:43 +0200118 /*
119 * The FIB entry for (depending on VXLAN tunnel is unicast or mcast)
120 * sending unicast VXLAN encap packets or receiving mcast VXLAN packets
121 */
John Loc42912d2016-11-07 18:30:47 -0500122 fib_node_index_t fib_entry_index;
Eyal Baric5b13602016-11-24 19:42:43 +0200123 adj_index_t mcast_adj_index;
John Loc42912d2016-11-07 18:30:47 -0500124
125 /**
Paul Vinciguerrabdc0e6b2018-09-22 05:32:50 -0700126 * The tunnel is a child of the FIB entry for its destination. This is
John Loc42912d2016-11-07 18:30:47 -0500127 * so it receives updates when the forwarding information for that entry
128 * changes.
129 * The tunnels sibling index on the FIB entry's dependency list.
130 */
131 u32 sibling_index;
Jon Loeliger3d460bd2018-02-01 16:36:12 -0600132
Eyal Bari0fa56782018-06-04 12:25:05 +0300133 u32 flow_index; /* infra flow index */
134 u32 dev_instance; /* Real device instance in tunnel vector */
135 u32 user_instance; /* Instance name being shown to user */
eyal bari82e21d72018-04-26 13:14:55 +0300136
Steven Luongb8de7d42021-12-13 11:26:30 -0800137 VNET_DECLARE_REWRITE;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700138} vxlan_tunnel_t;
139
/*
 * X-macro list of the next nodes reachable from VXLAN input:
 * _(enum suffix, graph node name).
 */
#define foreach_vxlan_input_next        \
_(DROP, "error-drop")                   \
_(L2_INPUT, "l2-input")

/*
 * Next-node indices generated from foreach_vxlan_input_next, in list order
 * starting at 0.  VXLAN_INPUT_N_NEXT is the number of entries.
 */
typedef enum
{
#define _(s,n) VXLAN_INPUT_NEXT_##s,
  foreach_vxlan_input_next
#undef _
  VXLAN_INPUT_N_NEXT,
} vxlan_input_next_t;

Eyal Bari0fa56782018-06-04 12:25:05 +0300152typedef enum
153{
Ed Warnickecb9cada2015-12-08 15:45:58 -0700154#define vxlan_error(n,s) VXLAN_ERROR_##n,
155#include <vnet/vxlan/vxlan_error.def>
156#undef vxlan_error
157 VXLAN_N_ERROR,
158} vxlan_input_error_t;
159
Eyal Bari0fa56782018-06-04 12:25:05 +0300160typedef struct
161{
Ed Warnickecb9cada2015-12-08 15:45:58 -0700162 /* vector of encap tunnel instances */
Eyal Bari0fa56782018-06-04 12:25:05 +0300163 vxlan_tunnel_t *tunnels;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700164
165 /* lookup tunnel by key */
Artem Glazychev839dcc02020-12-01 02:39:21 +0700166 clib_bihash_16_8_t
167 vxlan4_tunnel_by_key; /* keyed on ipv4.dst + src_port + fib + vni */
168 clib_bihash_24_8_t
169 vxlan6_tunnel_by_key; /* keyed on ipv6.dst + src_port + fib + vni */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700170
Eyal Barifff67c82016-12-21 12:45:47 +0200171 /* local VTEP IPs ref count used by vxlan-bypass node to check if
172 received VXLAN packet DIP matches any local VTEP address */
Nick Zavaritsky27518c22020-02-27 15:54:58 +0000173 vtep_table_t vtep_table;
John Lo37682e12016-11-30 12:51:39 -0500174
Eyal Bari0ded8512017-01-19 17:01:09 +0200175 /* mcast shared info */
Eyal Bari0fa56782018-06-04 12:25:05 +0300176 uword *mcast_shared; /* keyed on mcast ip46 addr */
Eyal Barifff67c82016-12-21 12:45:47 +0200177
Dave Wallace60231f32015-12-17 21:04:30 -0500178 /* Mapping from sw_if_index to tunnel index */
Eyal Bari0fa56782018-06-04 12:25:05 +0300179 u32 *tunnel_index_by_sw_if_index;
Dave Wallace60231f32015-12-17 21:04:30 -0500180
Jon Loeligere3034cd2019-01-03 12:56:02 -0600181 /* graph node state */
182 uword *bm_ip4_bypass_enabled_by_sw_if;
183 uword *bm_ip6_bypass_enabled_by_sw_if;
184
Ed Warnickecb9cada2015-12-08 15:45:58 -0700185 /* convenience */
Eyal Bari0fa56782018-06-04 12:25:05 +0300186 vlib_main_t *vlib_main;
187 vnet_main_t *vnet_main;
Jon Loeliger3d460bd2018-02-01 16:36:12 -0600188
189 /* Record used instances */
190 uword *instance_used;
eyal bariaf86a482018-04-17 11:20:27 +0300191 u32 flow_id_start;
Junfeng Wang290526e2021-03-09 16:44:57 +0800192
193 /* cache for last 8 vxlan tunnel */
Junfeng Wang290526e2021-03-09 16:44:57 +0800194 vtep4_cache_t vtep4_u512;
Junfeng Wang290526e2021-03-09 16:44:57 +0800195
Ed Warnickecb9cada2015-12-08 15:45:58 -0700196} vxlan_main_t;
197
Dave Wallace71612d62017-10-24 01:32:41 -0400198extern vxlan_main_t vxlan_main;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700199
Chris Luke99cb3352016-04-26 10:49:53 -0400200extern vlib_node_registration_t vxlan4_input_node;
201extern vlib_node_registration_t vxlan6_input_node;
John Loc42912d2016-11-07 18:30:47 -0500202extern vlib_node_registration_t vxlan4_encap_node;
203extern vlib_node_registration_t vxlan6_encap_node;
eyal bariaf86a482018-04-17 11:20:27 +0300204extern vlib_node_registration_t vxlan4_flow_input_node;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700205
Eyal Bari0fa56782018-06-04 12:25:05 +0300206u8 *format_vxlan_encap_trace (u8 * s, va_list * args);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700207
Eyal Bari0fa56782018-06-04 12:25:05 +0300208typedef struct
209{
Ed Warnickecb9cada2015-12-08 15:45:58 -0700210 u8 is_add;
Chris Luke99cb3352016-04-26 10:49:53 -0400211
212 /* we normally use is_ip4, but since this adds to the
Paul Vinciguerrabdc0e6b2018-09-22 05:32:50 -0700213 * structure, this seems less of a breaking change */
Chris Luke99cb3352016-04-26 10:49:53 -0400214 u8 is_ip6;
Nathan Skrzypczak3e384222021-04-21 19:56:34 +0200215 u8 is_l3;
Jon Loeliger3d460bd2018-02-01 16:36:12 -0600216 u32 instance;
Chris Luke99cb3352016-04-26 10:49:53 -0400217 ip46_address_t src, dst;
Eyal Baric5b13602016-11-24 19:42:43 +0200218 u32 mcast_sw_if_index;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700219 u32 encap_fib_index;
220 u32 decap_next_index;
221 u32 vni;
Artem Glazychev839dcc02020-12-01 02:39:21 +0700222 u16 src_port;
223 u16 dst_port;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700224} vnet_vxlan_add_del_tunnel_args_t;
225
Eyal Bari0fa56782018-06-04 12:25:05 +0300226int vnet_vxlan_add_del_tunnel
227 (vnet_vxlan_add_del_tunnel_args_t * a, u32 * sw_if_indexp);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700228
Eyal Bari0fa56782018-06-04 12:25:05 +0300229void vnet_int_vxlan_bypass_mode (u32 sw_if_index, u8 is_ip6, u8 is_enable);
eyal bariaf86a482018-04-17 11:20:27 +0300230
Eyal Bari0fa56782018-06-04 12:25:05 +0300231int vnet_vxlan_add_del_rx_flow (u32 hw_if_index, u32 t_imdex, int is_add);
eyal bariaf86a482018-04-17 11:20:27 +0300232
233u32 vnet_vxlan_get_tunnel_index (u32 sw_if_index);
#endif /* included_vnet_vxlan_h */

/*
 * fd.io coding-style-patch-verification: ON
 *
 * Local Variables:
 * eval: (c-set-style "gnu")
 * End:
 */