blob: decb840b390c01258d4ec6de1f17825c88fb42c9 [file] [log] [blame]
/*
 * Copyright (c) 2015 Cisco and/or its affiliates.
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at:
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
/*
 * ip/ip4.h: ip4 main include file
 *
 * Copyright (c) 2008 Eliot Dresselhaus
 *
 * Permission is hereby granted, free of charge, to any person obtaining
 * a copy of this software and associated documentation files (the
 * "Software"), to deal in the Software without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sublicense, and/or sell copies of the Software, and to
 * permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 *
 * The above copyright notice and this permission notice shall be
 * included in all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
 * LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
 * OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
 * WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 */
39
40#ifndef included_ip_ip4_h
41#define included_ip_ip4_h
42
Ed Warnickecb9cada2015-12-08 15:45:58 -070043#include <vnet/ip/ip4_packet.h>
44#include <vnet/ip/lookup.h>
Dave Barach2c0a4f42017-06-29 09:30:15 -040045#include <vnet/buffer.h>
Damjan Marion22311502016-10-28 20:30:15 +020046#include <vnet/feature/feature.h>
Ed Warnickecb9cada2015-12-08 15:45:58 -070047
Neale Ranns32e1c012016-11-22 17:07:28 +000048typedef struct ip4_mfib_t
49{
50 /* Hash table for each prefix length mapping. */
51 uword *fib_entry_by_dst_address[65];
52
53 /* Table ID (hash key) for this FIB. */
54 u32 table_id;
55
56 /* Index into FIB vector. */
57 u32 index;
58} ip4_mfib_t;
59
Ed Warnickecb9cada2015-12-08 15:45:58 -070060struct ip4_main_t;
61
Ed Warnickecb9cada2015-12-08 15:45:58 -070062typedef void (ip4_add_del_interface_address_function_t)
63 (struct ip4_main_t * im,
64 uword opaque,
65 u32 sw_if_index,
66 ip4_address_t * address,
Dave Barachd7cb1b52016-12-09 09:52:16 -050067 u32 address_length, u32 if_address_index, u32 is_del);
Ed Warnickecb9cada2015-12-08 15:45:58 -070068
Dave Barachd7cb1b52016-12-09 09:52:16 -050069typedef struct
70{
71 ip4_add_del_interface_address_function_t *function;
Ed Warnickecb9cada2015-12-08 15:45:58 -070072 uword function_opaque;
73} ip4_add_del_interface_address_callback_t;
74
Neale Ranns15002542017-09-10 04:39:11 -070075typedef void (ip4_table_bind_function_t)
76 (struct ip4_main_t * im,
77 uword opaque, u32 sw_if_index, u32 new_fib_index, u32 old_fib_index);
78
79typedef struct
80{
81 ip4_table_bind_function_t *function;
82 uword function_opaque;
83} ip4_table_bind_callback_t;
84
Dave Barach6f9bca22016-04-30 10:25:32 -040085/**
86 * @brief IPv4 main type.
87 *
88 * State of IPv4 VPP processing including:
89 * - FIBs
90 * - Feature indices used in feature topological sort
91 * - Feature node run time references
92 */
93
Dave Barachd7cb1b52016-12-09 09:52:16 -050094typedef struct ip4_main_t
95{
Ed Warnickecb9cada2015-12-08 15:45:58 -070096 ip_lookup_main_t lookup_main;
97
Dave Barach6f9bca22016-04-30 10:25:32 -040098 /** Vector of FIBs. */
Dave Barachd7cb1b52016-12-09 09:52:16 -050099 struct fib_table_t_ *fibs;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700100
Neale Rannsa3af3372017-03-28 03:49:52 -0700101 /** Vector of MTries. */
102 struct ip4_fib_t_ *v4_fibs;
103
Neale Ranns32e1c012016-11-22 17:07:28 +0000104 /** Vector of MFIBs. */
105 struct mfib_table_t_ *mfibs;
106
Ed Warnickecb9cada2015-12-08 15:45:58 -0700107 u32 fib_masks[33];
108
Dave Barach6f9bca22016-04-30 10:25:32 -0400109 /** Table index indexed by software interface. */
Dave Barachd7cb1b52016-12-09 09:52:16 -0500110 u32 *fib_index_by_sw_if_index;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700111
Neale Ranns32e1c012016-11-22 17:07:28 +0000112 /** Table index indexed by software interface. */
113 u32 *mfib_index_by_sw_if_index;
114
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100115 /* IP4 enabled count by software interface */
Dave Barachd7cb1b52016-12-09 09:52:16 -0500116 u8 *ip_enabled_by_sw_if_index;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100117
Dave Barach6f9bca22016-04-30 10:25:32 -0400118 /** Hash table mapping table id to fib index.
Ed Warnickecb9cada2015-12-08 15:45:58 -0700119 ID space is not necessarily dense; index space is dense. */
Dave Barachd7cb1b52016-12-09 09:52:16 -0500120 uword *fib_index_by_table_id;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700121
Neale Ranns32e1c012016-11-22 17:07:28 +0000122 /** Hash table mapping table id to multicast fib index.
123 ID space is not necessarily dense; index space is dense. */
124 uword *mfib_index_by_table_id;
125
Dave Barach6f9bca22016-04-30 10:25:32 -0400126 /** Functions to call when interface address changes. */
Dave Barachd7cb1b52016-12-09 09:52:16 -0500127 ip4_add_del_interface_address_callback_t
128 * add_del_interface_address_callbacks;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700129
Neale Ranns15002542017-09-10 04:39:11 -0700130 /** Functions to call when interface to table biding changes. */
131 ip4_table_bind_callback_t *table_bind_callbacks;
132
Dave Barach6f9bca22016-04-30 10:25:32 -0400133 /** Template used to generate IP4 ARP packets. */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700134 vlib_packet_template_t ip4_arp_request_packet_template;
135
Dave Barach6f9bca22016-04-30 10:25:32 -0400136 /** Seed for Jenkins hash used to compute ip4 flow hash. */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700137 u32 flow_hash_seed;
138
Dave Barach6f9bca22016-04-30 10:25:32 -0400139 /** @brief Template information for VPP generated packets */
Dave Barachd7cb1b52016-12-09 09:52:16 -0500140 struct
141 {
Dave Barach6f9bca22016-04-30 10:25:32 -0400142 /** TTL to use for host generated packets. */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700143 u8 ttl;
144
Dave Barach6f9bca22016-04-30 10:25:32 -0400145 /** TOS byte to use for host generated packets. */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700146 u8 tos;
147
148 u8 pad[2];
149 } host_config;
150} ip4_main_t;
151
Dave Barach6f9bca22016-04-30 10:25:32 -0400152/** Global ip4 main structure. */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700153extern ip4_main_t ip4_main;
154
Keith Burns (alagalah)79b5f632016-08-02 05:40:20 -0700155/** Global ip4 input node. Errors get attached to ip4 input node. */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700156extern vlib_node_registration_t ip4_input_node;
157extern vlib_node_registration_t ip4_lookup_node;
Neale Ranns32e1c012016-11-22 17:07:28 +0000158extern vlib_node_registration_t ip4_local_node;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700159extern vlib_node_registration_t ip4_rewrite_node;
Neale Ranns32e1c012016-11-22 17:07:28 +0000160extern vlib_node_registration_t ip4_rewrite_mcast_node;
Pierre Pfister0febaf12016-06-08 12:23:21 +0100161extern vlib_node_registration_t ip4_rewrite_local_node;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700162extern vlib_node_registration_t ip4_arp_node;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100163extern vlib_node_registration_t ip4_glean_node;
164extern vlib_node_registration_t ip4_midchain_node;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700165
166always_inline uword
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100167ip4_destination_matches_route (const ip4_main_t * im,
168 const ip4_address_t * key,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500169 const ip4_address_t * dest, uword dest_length)
170{
171 return 0 == ((key->data_u32 ^ dest->data_u32) & im->fib_masks[dest_length]);
172}
Ed Warnickecb9cada2015-12-08 15:45:58 -0700173
174always_inline uword
175ip4_destination_matches_interface (ip4_main_t * im,
176 ip4_address_t * key,
177 ip_interface_address_t * ia)
178{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500179 ip4_address_t *a = ip_interface_address_get_address (&im->lookup_main, ia);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700180 return ip4_destination_matches_route (im, key, a, ia->address_length);
181}
182
183/* As above but allows for unaligned destinations (e.g. works right from IP header of packet). */
184always_inline uword
185ip4_unaligned_destination_matches_route (ip4_main_t * im,
186 ip4_address_t * key,
187 ip4_address_t * dest,
188 uword dest_length)
Dave Barachd7cb1b52016-12-09 09:52:16 -0500189{
190 return 0 ==
191 ((clib_mem_unaligned (&key->data_u32, u32) ^ dest->
192 data_u32) & im->fib_masks[dest_length]);
193}
Ed Warnickecb9cada2015-12-08 15:45:58 -0700194
Pierre Pfisterd076f192016-06-22 12:58:30 +0100195always_inline int
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100196ip4_src_address_for_packet (ip_lookup_main_t * lm,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500197 u32 sw_if_index, ip4_address_t * src)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700198{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500199 u32 if_add_index = lm->if_address_pool_index_by_sw_if_index[sw_if_index];
200 if (PREDICT_TRUE (if_add_index != ~0))
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100201 {
Dave Barachd7cb1b52016-12-09 09:52:16 -0500202 ip_interface_address_t *if_add =
203 pool_elt_at_index (lm->if_address_pool, if_add_index);
204 ip4_address_t *if_ip = ip_interface_address_get_address (lm, if_add);
205 *src = *if_ip;
206 return 0;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100207 }
Dave Barachd7cb1b52016-12-09 09:52:16 -0500208 else
209 {
Dave Barachd7cb1b52016-12-09 09:52:16 -0500210 src->as_u32 = 0;
211 }
212 return (!0);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700213}
214
215/* Find interface address which matches destination. */
216always_inline ip4_address_t *
Dave Barachd7cb1b52016-12-09 09:52:16 -0500217ip4_interface_address_matching_destination (ip4_main_t * im,
218 ip4_address_t * dst,
219 u32 sw_if_index,
220 ip_interface_address_t **
221 result_ia)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700222{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500223 ip_lookup_main_t *lm = &im->lookup_main;
224 ip_interface_address_t *ia;
225 ip4_address_t *result = 0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700226
Dave Barachd7cb1b52016-12-09 09:52:16 -0500227 /* *INDENT-OFF* */
Dave Barach75fc8542016-10-11 16:16:02 -0400228 foreach_ip_interface_address (lm, ia, sw_if_index,
Ed Warnickecb9cada2015-12-08 15:45:58 -0700229 1 /* honor unnumbered */,
230 ({
231 ip4_address_t * a = ip_interface_address_get_address (lm, ia);
232 if (ip4_destination_matches_route (im, dst, a, ia->address_length))
233 {
234 result = a;
235 break;
236 }
237 }));
Dave Barachd7cb1b52016-12-09 09:52:16 -0500238 /* *INDENT-ON* */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700239 if (result_ia)
240 *result_ia = result ? ia : 0;
241 return result;
242}
243
Dave Barachd7cb1b52016-12-09 09:52:16 -0500244ip4_address_t *ip4_interface_first_address (ip4_main_t * im, u32 sw_if_index,
245 ip_interface_address_t **
246 result_ia);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100247
Dave Barachd7cb1b52016-12-09 09:52:16 -0500248clib_error_t *ip4_add_del_interface_address (vlib_main_t * vm,
249 u32 sw_if_index,
250 ip4_address_t * address,
251 u32 address_length, u32 is_del);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700252
Dave Barachd7cb1b52016-12-09 09:52:16 -0500253void ip4_sw_interface_enable_disable (u32 sw_if_index, u32 is_enable);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700254
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100255int ip4_address_compare (ip4_address_t * a1, ip4_address_t * a2);
Dave Barach203c6322016-06-26 10:29:03 -0400256
Ed Warnickecb9cada2015-12-08 15:45:58 -0700257/* Send an ARP request to see if given destination is reachable on given interface. */
Dave Barachd7cb1b52016-12-09 09:52:16 -0500258clib_error_t *ip4_probe_neighbor (vlib_main_t * vm, ip4_address_t * dst,
259 u32 sw_if_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700260
Dave Barachd7cb1b52016-12-09 09:52:16 -0500261clib_error_t *ip4_set_arp_limit (u32 arp_limit);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700262
263uword
Ed Warnickecb9cada2015-12-08 15:45:58 -0700264ip4_udp_register_listener (vlib_main_t * vm,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500265 u16 dst_port, u32 next_node_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700266
Dave Barach75fc8542016-10-11 16:16:02 -0400267void
Dave Barachd7cb1b52016-12-09 09:52:16 -0500268ip4_icmp_register_type (vlib_main_t * vm, icmp4_type_t type, u32 node_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700269
Dave Barachd7cb1b52016-12-09 09:52:16 -0500270u16 ip4_tcp_udp_compute_checksum (vlib_main_t * vm, vlib_buffer_t * p0,
271 ip4_header_t * ip0);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700272
273void ip4_register_protocol (u32 protocol, u32 node_index);
274
275serialize_function_t serialize_vnet_ip4_main, unserialize_vnet_ip4_main;
276
Dave Barachd7cb1b52016-12-09 09:52:16 -0500277int vnet_set_ip4_flow_hash (u32 table_id,
278 flow_hash_config_t flow_hash_config);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700279
Dave Barach75fc8542016-10-11 16:16:02 -0400280int vnet_set_ip4_classify_intfc (vlib_main_t * vm, u32 sw_if_index,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500281 u32 table_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700282
283/* Compute flow hash. We'll use it to select which adjacency to use for this
284 flow. And other things. */
285always_inline u32
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100286ip4_compute_flow_hash (const ip4_header_t * ip,
287 flow_hash_config_t flow_hash_config)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700288{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500289 tcp_header_t *tcp = (void *) (ip + 1);
290 u32 a, b, c, t1, t2;
291 uword is_tcp_udp = (ip->protocol == IP_PROTOCOL_TCP
292 || ip->protocol == IP_PROTOCOL_UDP);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700293
Dave Barachd7cb1b52016-12-09 09:52:16 -0500294 t1 = (flow_hash_config & IP_FLOW_HASH_SRC_ADDR)
295 ? ip->src_address.data_u32 : 0;
296 t2 = (flow_hash_config & IP_FLOW_HASH_DST_ADDR)
297 ? ip->dst_address.data_u32 : 0;
Dave Barach75fc8542016-10-11 16:16:02 -0400298
Dave Barachd7cb1b52016-12-09 09:52:16 -0500299 a = (flow_hash_config & IP_FLOW_HASH_REVERSE_SRC_DST) ? t2 : t1;
300 b = (flow_hash_config & IP_FLOW_HASH_REVERSE_SRC_DST) ? t1 : t2;
301 b ^= (flow_hash_config & IP_FLOW_HASH_PROTO) ? ip->protocol : 0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700302
Dave Barach68b0fb02017-02-28 15:15:56 -0500303 t1 = is_tcp_udp ? tcp->src : 0;
304 t2 = is_tcp_udp ? tcp->dst : 0;
Dave Barach75fc8542016-10-11 16:16:02 -0400305
Dave Barachd7cb1b52016-12-09 09:52:16 -0500306 t1 = (flow_hash_config & IP_FLOW_HASH_SRC_PORT) ? t1 : 0;
307 t2 = (flow_hash_config & IP_FLOW_HASH_DST_PORT) ? t2 : 0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700308
Dave Barachd7cb1b52016-12-09 09:52:16 -0500309 c = (flow_hash_config & IP_FLOW_HASH_REVERSE_SRC_DST) ?
310 (t1 << 16) | t2 : (t2 << 16) | t1;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700311
Dave Barachd7cb1b52016-12-09 09:52:16 -0500312 hash_v3_mix32 (a, b, c);
313 hash_v3_finalize32 (a, b, c);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700314
Dave Barachd7cb1b52016-12-09 09:52:16 -0500315 return c;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700316}
317
John Lo37682e12016-11-30 12:51:39 -0500318void
319ip4_forward_next_trace (vlib_main_t * vm,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500320 vlib_node_runtime_t * node,
321 vlib_frame_t * frame,
322 vlib_rx_or_tx_t which_adj_index);
John Lo37682e12016-11-30 12:51:39 -0500323
Dave Barachd7cb1b52016-12-09 09:52:16 -0500324u8 *format_ip4_forward_next_trace (u8 * s, va_list * args);
John Lo37682e12016-11-30 12:51:39 -0500325
326u32 ip4_tcp_udp_validate_checksum (vlib_main_t * vm, vlib_buffer_t * p0);
327
Dave Barach68b0fb02017-02-28 15:15:56 -0500328#define IP_DF 0x4000 /* don't fragment */
329
330/**
331 * Push IPv4 header to buffer
332 *
333 * This does not support fragmentation.
334 *
335 * @param vm - vlib_main
336 * @param b - buffer to write the header to
337 * @param src - source IP
338 * @param dst - destination IP
339 * @param prot - payload proto
340 *
341 * @return - pointer to start of IP header
342 */
343always_inline void *
344vlib_buffer_push_ip4 (vlib_main_t * vm, vlib_buffer_t * b,
Florin Corasfdbc3822017-07-27 00:34:12 -0700345 ip4_address_t * src, ip4_address_t * dst, int proto,
346 u8 csum_offload)
Dave Barach68b0fb02017-02-28 15:15:56 -0500347{
348 ip4_header_t *ih;
349
350 /* make some room */
351 ih = vlib_buffer_push_uninit (b, sizeof (ip4_header_t));
352
353 ih->ip_version_and_header_length = 0x45;
354 ih->tos = 0;
355 ih->length = clib_host_to_net_u16 (vlib_buffer_length_in_chain (vm, b));
356
357 /* No fragments */
358 ih->flags_and_fragment_offset = clib_host_to_net_u16 (IP_DF);
359 ih->ttl = 255;
360 ih->protocol = proto;
361 ih->src_address.as_u32 = src->as_u32;
362 ih->dst_address.as_u32 = dst->as_u32;
363
Dave Barachc4423222017-07-19 08:48:09 -0400364 /* Offload ip4 header checksum generation */
Florin Corasfdbc3822017-07-27 00:34:12 -0700365 if (csum_offload)
Dave Barachc4423222017-07-19 08:48:09 -0400366 {
367 ih->checksum = 0;
368 b->flags |= VNET_BUFFER_F_OFFLOAD_IP_CKSUM | VNET_BUFFER_F_IS_IP4;
369 vnet_buffer (b)->l3_hdr_offset = (u8 *) ih - b->data;
Dave Barachac0c96b2017-08-02 09:19:32 -0400370 vnet_buffer (b)->l4_hdr_offset = vnet_buffer (b)->l3_hdr_offset +
371 sizeof (*ih);
Dave Barachc4423222017-07-19 08:48:09 -0400372 }
373 else
374 ih->checksum = ip4_header_checksum (ih);
375
Dave Barach68b0fb02017-02-28 15:15:56 -0500376 return ih;
377}
Ed Warnickecb9cada2015-12-08 15:45:58 -0700378#endif /* included_ip_ip4_h */
Dave Barachd7cb1b52016-12-09 09:52:16 -0500379
/*
 * fd.io coding-style-patch-verification: ON
 *
 * Local Variables:
 * eval: (c-set-style "gnu")
 * End:
 */