/*
 * Copyright (c) 2015 Cisco and/or its affiliates.
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at:
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
| 15 | #ifndef included_vnet_vxlan_h |
| 16 | #define included_vnet_vxlan_h |
| 17 | |
| 18 | #include <vppinfra/error.h> |
| 19 | #include <vppinfra/hash.h> |
Eyal Bari | dd47eca | 2018-07-08 08:15:56 +0300 | [diff] [blame] | 20 | #include <vppinfra/bihash_16_8.h> |
Eyal Bari | 0fa5678 | 2018-06-04 12:25:05 +0300 | [diff] [blame] | 21 | #include <vppinfra/bihash_24_8.h> |
Ed Warnicke | cb9cada | 2015-12-08 15:45:58 -0700 | [diff] [blame] | 22 | #include <vnet/vnet.h> |
| 23 | #include <vnet/ip/ip.h> |
Nick Zavaritsky | 27518c2 | 2020-02-27 15:54:58 +0000 | [diff] [blame] | 24 | #include <vnet/ip/vtep.h> |
Ed Warnicke | cb9cada | 2015-12-08 15:45:58 -0700 | [diff] [blame] | 25 | #include <vnet/l2/l2_input.h> |
John Lo | 3ef822e | 2016-06-07 09:14:07 -0400 | [diff] [blame] | 26 | #include <vnet/l2/l2_output.h> |
Ed Warnicke | cb9cada | 2015-12-08 15:45:58 -0700 | [diff] [blame] | 27 | #include <vnet/l2/l2_bd.h> |
| 28 | #include <vnet/ethernet/ethernet.h> |
| 29 | #include <vnet/vxlan/vxlan_packet.h> |
| 30 | #include <vnet/ip/ip4_packet.h> |
Chris Luke | 99cb335 | 2016-04-26 10:49:53 -0400 | [diff] [blame] | 31 | #include <vnet/ip/ip6_packet.h> |
Florin Coras | b040f98 | 2020-10-20 14:59:43 -0700 | [diff] [blame] | 32 | #include <vnet/udp/udp_packet.h> |
John Lo | c42912d | 2016-11-07 18:30:47 -0500 | [diff] [blame] | 33 | #include <vnet/dpo/dpo.h> |
Eyal Bari | c5b1360 | 2016-11-24 19:42:43 +0200 | [diff] [blame] | 34 | #include <vnet/adj/adj_types.h> |
Ed Warnicke | cb9cada | 2015-12-08 15:45:58 -0700 | [diff] [blame] | 35 | |
/* *INDENT-OFF* */
/*
 * Header stack of a VXLAN packet carried over IPv4: the IPv4 header,
 * followed by the UDP header, followed by the VXLAN header.
 * Declared through CLIB_PACKED (presumably so that no padding is inserted
 * between the members -- confirm against the macro definition).
 */
typedef CLIB_PACKED (struct {
  ip4_header_t ip4;      /* 20 bytes */
  udp_header_t udp;      /* 8 bytes */
  vxlan_header_t vxlan;  /* 8 bytes */
}) ip4_vxlan_header_t;
| 42 | |
/*
 * Header stack of a VXLAN packet carried over IPv6: the IPv6 header,
 * followed by the UDP header, followed by the VXLAN header.
 * Declared through CLIB_PACKED (presumably so that no padding is inserted
 * between the members -- confirm against the macro definition).
 */
typedef CLIB_PACKED (struct {
  ip6_header_t ip6;      /* 40 bytes */
  udp_header_t udp;      /* 8 bytes */
  vxlan_header_t vxlan;  /* 8 bytes */
}) ip6_vxlan_header_t;
/* *INDENT-ON* */
Chris Luke | 99cb335 | 2016-04-26 10:49:53 -0400 | [diff] [blame] | 49 | |
/*
 * Lookup key type for IPv4 VXLAN tunnels; an alias of the 16_8 bihash
 * key/value pair type.
 *
 * Key fields: remote ip, vni on incoming VXLAN packet
 * all fields in NET byte order
 *
 * NOTE(review): the comment on vxlan4_tunnel_by_key in vxlan_main_t lists
 * the key as ipv4.dst + src_port + fib + vni -- confirm which description
 * matches the code that fills the key.
 */
typedef clib_bihash_kv_16_8_t vxlan4_tunnel_key_t;
Chris Luke | 99cb335 | 2016-04-26 10:49:53 -0400 | [diff] [blame] | 55 | |
/*
 * Lookup key type for IPv6 VXLAN tunnels; an alias of the 24_8 bihash
 * key/value pair type.
 *
 * Key fields: remote ip, vni and fib index on incoming VXLAN packet
 * ip, vni fields in NET byte order
 * fib index field in host byte order
 *
 * NOTE(review): the comment on vxlan6_tunnel_by_key in vxlan_main_t also
 * mentions src_port as part of the key -- confirm against the code that
 * fills the key.
 */
typedef clib_bihash_kv_24_8_t vxlan6_tunnel_key_t;
Ed Warnicke | cb9cada | 2015-12-08 15:45:58 -0700 | [diff] [blame] | 62 | |
/*
 * Decap information for a tunnel, readable either field by field or as a
 * single 64-bit word through as_u64.
 *
 * The inner anonymous union overlays the unicast fields (next_index, error)
 * with the multicast field (local_ip); only one of the two views is
 * meaningful for a given entry.
 *
 * NOTE(review): presumably stored as the 8-byte value of the tunnel lookup
 * tables -- confirm against the users of this type.
 */
typedef union
{
  struct
  {
    u32 sw_if_index;  /* unicast - input interface / mcast - stats interface */
    union
    {
      struct          /* unicast action */
      {
        u16 next_index;
        u8 error;
      };
      ip4_address_t local_ip;  /* used as dst ip for mcast pkts to assign them to unicast tunnel */
    };
  };
  u64 as_u64;  /* whole record viewed as one 64-bit value */
} vxlan_decap_info_t;
| 80 | |
/*
 * State kept for one VXLAN tunnel.
 *
 * The member order defines the in-memory layout of the tunnel elements;
 * do not reorder members without checking the code that depends on the
 * layout.
 */
typedef struct
{
  /* Required for pool_get_aligned */
  CLIB_CACHE_LINE_ALIGN_MARK (cacheline0);

  /* FIB DPO for IP forwarding of VXLAN encap packet */
  dpo_id_t next_dpo;

  /* vxlan VNI in HOST byte order */
  u32 vni;

  /* tunnel src and dst addresses */
  ip46_address_t src;
  ip46_address_t dst;

  /* udp-ports */
  u16 src_port;
  u16 dst_port;

  /* mcast packet output intfc index (used only if dst is mcast) */
  u32 mcast_sw_if_index;

  /* decap next index */
  u16 decap_next_index;

  /* The FIB index for src/dst addresses */
  u32 encap_fib_index;

  /* vnet intfc index */
  u32 sw_if_index;
  u32 hw_if_index;

  /**
   * Linkage into the FIB object graph
   */
  fib_node_t node;

  /*
   * The FIB entry for (depending on VXLAN tunnel is unicast or mcast)
   * sending unicast VXLAN encap packets or receiving mcast VXLAN packets
   */
  fib_node_index_t fib_entry_index;
  adj_index_t mcast_adj_index;

  /**
   * The tunnel is a child of the FIB entry for its destination. This is
   * so it receives updates when the forwarding information for that entry
   * changes.
   * The tunnel's sibling index on the FIB entry's dependency list.
   */
  u32 sibling_index;

  u32 flow_index;     /* infra flow index */
  u32 dev_instance;   /* Real device instance in tunnel vector */
  u32 user_instance;  /* Instance name being shown to user */

  /*
   * Storage declared by VNET_DECLARE_REWRITE.
   * NOTE(review): presumably the pre-built encap header rewrite for this
   * tunnel -- confirm against the macro definition and the encap code.
   */
  VNET_DECLARE_REWRITE;
} vxlan_tunnel_t;
| 139 | |
/*
 * X-macro list used to generate vxlan_input_next_t.
 * Each entry is _(symbol suffix, string); the string is presumably the
 * name of the corresponding next graph node -- confirm at the node
 * registration.  The order of the entries fixes the enum values.
 */
#define foreach_vxlan_input_next        \
_(DROP, "error-drop")                   \
_(L2_INPUT, "l2-input")
Ed Warnicke | cb9cada | 2015-12-08 15:45:58 -0700 | [diff] [blame] | 143 | |
/*
 * Next indices generated from foreach_vxlan_input_next: one
 * VXLAN_INPUT_NEXT_<symbol> enumerator per list entry, in list order,
 * followed by VXLAN_INPUT_N_NEXT, which therefore equals the number of
 * entries in the list.
 */
typedef enum
{
#define _(s,n) VXLAN_INPUT_NEXT_##s,
  foreach_vxlan_input_next
#undef _
    VXLAN_INPUT_N_NEXT,
} vxlan_input_next_t;
| 151 | |
/*
 * Error codes generated from vxlan_error.def: every vxlan_error (n, s)
 * entry in that file becomes an enumerator VXLAN_ERROR_<n>, in file order.
 * VXLAN_N_ERROR comes last and therefore equals the number of entries.
 */
typedef enum
{
#define vxlan_error(n,s) VXLAN_ERROR_##n,
#include <vnet/vxlan/vxlan_error.def>
#undef vxlan_error
  VXLAN_N_ERROR,
} vxlan_input_error_t;
| 159 | |
/*
 * Module-wide VXLAN state; a single instance is declared as vxlan_main.
 */
typedef struct
{
  /* vector of encap tunnel instances */
  vxlan_tunnel_t *tunnels;

  /* lookup tunnel by key */
  clib_bihash_16_8_t
    vxlan4_tunnel_by_key;  /* keyed on ipv4.dst + src_port + fib + vni */
  clib_bihash_24_8_t
    vxlan6_tunnel_by_key;  /* keyed on ipv6.dst + src_port + fib + vni */

  /* local VTEP IPs ref count used by vxlan-bypass node to check if
     received VXLAN packet DIP matches any local VTEP address */
  vtep_table_t vtep_table;

  /* mcast shared info */
  uword *mcast_shared;  /* keyed on mcast ip46 addr */

  /* Mapping from sw_if_index to tunnel index */
  u32 *tunnel_index_by_sw_if_index;

  /* graph node state */
  /* NOTE(review): the bm_ prefix suggests per-sw_if_index bitmaps of
     interfaces with ip4/ip6 bypass enabled -- confirm at the users */
  uword *bm_ip4_bypass_enabled_by_sw_if;
  uword *bm_ip6_bypass_enabled_by_sw_if;

  /* convenience */
  vlib_main_t *vlib_main;
  vnet_main_t *vnet_main;

  /* Record used instances */
  uword *instance_used;
  u32 flow_id_start;

  /* cache for the last 8 vxlan tunnels */
  vtep4_cache_t vtep4_u512;

} vxlan_main_t;
| 197 | |
/* The VXLAN module state; declared here, defined in another translation unit. */
extern vxlan_main_t vxlan_main;
Ed Warnicke | cb9cada | 2015-12-08 15:45:58 -0700 | [diff] [blame] | 199 | |
/* Node registrations of the VXLAN input, encap and flow-input nodes;
   declared here, defined in other translation units. */
extern vlib_node_registration_t vxlan4_input_node;
extern vlib_node_registration_t vxlan6_input_node;
extern vlib_node_registration_t vxlan4_encap_node;
extern vlib_node_registration_t vxlan6_encap_node;
extern vlib_node_registration_t vxlan4_flow_input_node;
Ed Warnicke | cb9cada | 2015-12-08 15:45:58 -0700 | [diff] [blame] | 205 | |
/*
 * Formatter for VXLAN encap trace records.
 * NOTE(review): presumably follows the usual format-function convention
 * (appends to the vector s using the arguments in args and returns the
 * resulting vector) -- confirm against the definition.
 */
u8 *format_vxlan_encap_trace (u8 * s, va_list * args);
Ed Warnicke | cb9cada | 2015-12-08 15:45:58 -0700 | [diff] [blame] | 207 | |
/*
 * Argument block passed to vnet_vxlan_add_del_tunnel ().
 */
typedef struct
{
  /* NOTE(review): presumably non-zero to add the tunnel, zero to delete
     it -- confirm in vnet_vxlan_add_del_tunnel () */
  u8 is_add;

  /* we normally use is_ip4, but since this adds to the
   * structure, this seems less of a breaking change */
  u8 is_ip6;
  u8 is_l3;
  u32 instance;
  ip46_address_t src, dst;
  u32 mcast_sw_if_index;
  u32 encap_fib_index;
  /* NOTE(review): u32 here, while vxlan_tunnel_t stores decap_next_index
     as u16 -- confirm the narrowing is checked where the value is copied */
  u32 decap_next_index;
  u32 vni;
  u16 src_port;
  u16 dst_port;
} vnet_vxlan_add_del_tunnel_args_t;
| 225 | |
/*
 * Add or delete a VXLAN tunnel described by the argument block a.
 * NOTE(review): sw_if_indexp presumably receives the sw_if_index of the
 * affected tunnel interface, and the int result is presumably 0 on success
 * or an error code -- confirm against the definition.
 */
int vnet_vxlan_add_del_tunnel
  (vnet_vxlan_add_del_tunnel_args_t * a, u32 * sw_if_indexp);
Ed Warnicke | cb9cada | 2015-12-08 15:45:58 -0700 | [diff] [blame] | 228 | |
/*
 * Set the VXLAN bypass mode of interface sw_if_index.
 * NOTE(review): is_ip6 presumably selects the IPv6 (non-zero) or IPv4
 * (zero) bypass path and is_enable turns it on or off -- confirm against
 * the definition.
 */
void vnet_int_vxlan_bypass_mode (u32 sw_if_index, u8 is_ip6, u8 is_enable);
eyal bari | af86a48 | 2018-04-17 11:20:27 +0300 | [diff] [blame] | 230 | |
Eyal Bari | 0fa5678 | 2018-06-04 12:25:05 +0300 | [diff] [blame] | 231 | int vnet_vxlan_add_del_rx_flow (u32 hw_if_index, u32 t_imdex, int is_add); |
eyal bari | af86a48 | 2018-04-17 11:20:27 +0300 | [diff] [blame] | 232 | |
/*
 * Return the tunnel index associated with interface sw_if_index.
 * NOTE(review): the value returned for an interface that is not a VXLAN
 * tunnel is not visible from this header -- confirm against the
 * definition.
 */
u32 vnet_vxlan_get_tunnel_index (u32 sw_if_index);
Ed Warnicke | cb9cada | 2015-12-08 15:45:58 -0700 | [diff] [blame] | 234 | #endif /* included_vnet_vxlan_h */ |
Jon Loeliger | 3d460bd | 2018-02-01 16:36:12 -0600 | [diff] [blame] | 235 | |
/*
 * fd.io coding-style-patch-verification: ON
 *
 * Local Variables:
 * eval: (c-set-style "gnu")
 * End:
 */