/*
 * Copyright (c) 2015 Cisco and/or its affiliates.
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at:
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
/*
 * ip/ip4.h: ip4 main include file
 *
 * Copyright (c) 2008 Eliot Dresselhaus
 *
 * Permission is hereby granted, free of charge, to any person obtaining
 * a copy of this software and associated documentation files (the
 * "Software"), to deal in the Software without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sublicense, and/or sell copies of the Software, and to
 * permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 *
 * The above copyright notice and this permission notice shall be
 * included in all copies or substantial portions of the Software.
 *
 *  THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 *  EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 *  MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
 *  NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
 *  LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
 *  OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
 *  WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 */

40#ifndef included_ip_ip4_h
41#define included_ip_ip4_h
42
Ed Warnickecb9cada2015-12-08 15:45:58 -070043#include <vnet/ip/ip4_packet.h>
44#include <vnet/ip/lookup.h>
Dave Barach2c0a4f42017-06-29 09:30:15 -040045#include <vnet/buffer.h>
Damjan Marion22311502016-10-28 20:30:15 +020046#include <vnet/feature/feature.h>
Pierre Pfister1bfd3722017-09-18 11:40:32 +020047#include <vnet/ip/icmp46_packet.h>
Ed Warnickecb9cada2015-12-08 15:45:58 -070048
Neale Ranns32e1c012016-11-22 17:07:28 +000049typedef struct ip4_mfib_t
50{
51 /* Hash table for each prefix length mapping. */
52 uword *fib_entry_by_dst_address[65];
53
54 /* Table ID (hash key) for this FIB. */
55 u32 table_id;
56
57 /* Index into FIB vector. */
58 u32 index;
59} ip4_mfib_t;
60
Ed Warnickecb9cada2015-12-08 15:45:58 -070061struct ip4_main_t;
62
Ed Warnickecb9cada2015-12-08 15:45:58 -070063typedef void (ip4_add_del_interface_address_function_t)
64 (struct ip4_main_t * im,
65 uword opaque,
66 u32 sw_if_index,
67 ip4_address_t * address,
Dave Barachd7cb1b52016-12-09 09:52:16 -050068 u32 address_length, u32 if_address_index, u32 is_del);
Ed Warnickecb9cada2015-12-08 15:45:58 -070069
Dave Barachd7cb1b52016-12-09 09:52:16 -050070typedef struct
71{
72 ip4_add_del_interface_address_function_t *function;
Ed Warnickecb9cada2015-12-08 15:45:58 -070073 uword function_opaque;
74} ip4_add_del_interface_address_callback_t;
75
Neale Ranns15002542017-09-10 04:39:11 -070076typedef void (ip4_table_bind_function_t)
77 (struct ip4_main_t * im,
78 uword opaque, u32 sw_if_index, u32 new_fib_index, u32 old_fib_index);
79
80typedef struct
81{
82 ip4_table_bind_function_t *function;
83 uword function_opaque;
84} ip4_table_bind_callback_t;
85
Dave Barach6f9bca22016-04-30 10:25:32 -040086/**
87 * @brief IPv4 main type.
88 *
89 * State of IPv4 VPP processing including:
90 * - FIBs
91 * - Feature indices used in feature topological sort
92 * - Feature node run time references
93 */
94
Dave Barachd7cb1b52016-12-09 09:52:16 -050095typedef struct ip4_main_t
96{
Ed Warnickecb9cada2015-12-08 15:45:58 -070097 ip_lookup_main_t lookup_main;
98
Dave Barach6f9bca22016-04-30 10:25:32 -040099 /** Vector of FIBs. */
Dave Barachd7cb1b52016-12-09 09:52:16 -0500100 struct fib_table_t_ *fibs;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700101
Neale Rannsa3af3372017-03-28 03:49:52 -0700102 /** Vector of MTries. */
103 struct ip4_fib_t_ *v4_fibs;
104
Neale Ranns32e1c012016-11-22 17:07:28 +0000105 /** Vector of MFIBs. */
106 struct mfib_table_t_ *mfibs;
107
Ed Warnickecb9cada2015-12-08 15:45:58 -0700108 u32 fib_masks[33];
109
Dave Barach6f9bca22016-04-30 10:25:32 -0400110 /** Table index indexed by software interface. */
Dave Barachd7cb1b52016-12-09 09:52:16 -0500111 u32 *fib_index_by_sw_if_index;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700112
Neale Ranns32e1c012016-11-22 17:07:28 +0000113 /** Table index indexed by software interface. */
114 u32 *mfib_index_by_sw_if_index;
115
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100116 /* IP4 enabled count by software interface */
Dave Barachd7cb1b52016-12-09 09:52:16 -0500117 u8 *ip_enabled_by_sw_if_index;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100118
Dave Barach6f9bca22016-04-30 10:25:32 -0400119 /** Hash table mapping table id to fib index.
Ed Warnickecb9cada2015-12-08 15:45:58 -0700120 ID space is not necessarily dense; index space is dense. */
Dave Barachd7cb1b52016-12-09 09:52:16 -0500121 uword *fib_index_by_table_id;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700122
Neale Ranns32e1c012016-11-22 17:07:28 +0000123 /** Hash table mapping table id to multicast fib index.
124 ID space is not necessarily dense; index space is dense. */
125 uword *mfib_index_by_table_id;
126
Dave Barach6f9bca22016-04-30 10:25:32 -0400127 /** Functions to call when interface address changes. */
Dave Barachd7cb1b52016-12-09 09:52:16 -0500128 ip4_add_del_interface_address_callback_t
129 * add_del_interface_address_callbacks;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700130
Neale Ranns15002542017-09-10 04:39:11 -0700131 /** Functions to call when interface to table biding changes. */
132 ip4_table_bind_callback_t *table_bind_callbacks;
133
Dave Barach6f9bca22016-04-30 10:25:32 -0400134 /** Template used to generate IP4 ARP packets. */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700135 vlib_packet_template_t ip4_arp_request_packet_template;
136
Dave Barach6f9bca22016-04-30 10:25:32 -0400137 /** Seed for Jenkins hash used to compute ip4 flow hash. */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700138 u32 flow_hash_seed;
139
Dave Barach6f9bca22016-04-30 10:25:32 -0400140 /** @brief Template information for VPP generated packets */
Dave Barachd7cb1b52016-12-09 09:52:16 -0500141 struct
142 {
Dave Barach6f9bca22016-04-30 10:25:32 -0400143 /** TTL to use for host generated packets. */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700144 u8 ttl;
145
Dave Barach6f9bca22016-04-30 10:25:32 -0400146 /** TOS byte to use for host generated packets. */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700147 u8 tos;
148
149 u8 pad[2];
150 } host_config;
Neale Ranns1ec36522017-11-29 05:20:37 -0800151
152 /** Heapsize for the Mtries */
153 uword mtrie_heap_size;
154
155 /** The memory heap for the mtries */
156 void *mtrie_mheap;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700157} ip4_main_t;
158
Dave Barach6f9bca22016-04-30 10:25:32 -0400159/** Global ip4 main structure. */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700160extern ip4_main_t ip4_main;
161
Keith Burns (alagalah)79b5f632016-08-02 05:40:20 -0700162/** Global ip4 input node. Errors get attached to ip4 input node. */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700163extern vlib_node_registration_t ip4_input_node;
164extern vlib_node_registration_t ip4_lookup_node;
Neale Ranns32e1c012016-11-22 17:07:28 +0000165extern vlib_node_registration_t ip4_local_node;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700166extern vlib_node_registration_t ip4_rewrite_node;
Neale Ranns32e1c012016-11-22 17:07:28 +0000167extern vlib_node_registration_t ip4_rewrite_mcast_node;
Pierre Pfister0febaf12016-06-08 12:23:21 +0100168extern vlib_node_registration_t ip4_rewrite_local_node;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700169extern vlib_node_registration_t ip4_arp_node;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100170extern vlib_node_registration_t ip4_glean_node;
171extern vlib_node_registration_t ip4_midchain_node;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700172
173always_inline uword
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100174ip4_destination_matches_route (const ip4_main_t * im,
175 const ip4_address_t * key,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500176 const ip4_address_t * dest, uword dest_length)
177{
178 return 0 == ((key->data_u32 ^ dest->data_u32) & im->fib_masks[dest_length]);
179}
Ed Warnickecb9cada2015-12-08 15:45:58 -0700180
181always_inline uword
182ip4_destination_matches_interface (ip4_main_t * im,
183 ip4_address_t * key,
184 ip_interface_address_t * ia)
185{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500186 ip4_address_t *a = ip_interface_address_get_address (&im->lookup_main, ia);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700187 return ip4_destination_matches_route (im, key, a, ia->address_length);
188}
189
Pierre Pfisterd076f192016-06-22 12:58:30 +0100190always_inline int
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100191ip4_src_address_for_packet (ip_lookup_main_t * lm,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500192 u32 sw_if_index, ip4_address_t * src)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700193{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500194 u32 if_add_index = lm->if_address_pool_index_by_sw_if_index[sw_if_index];
195 if (PREDICT_TRUE (if_add_index != ~0))
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100196 {
Dave Barachd7cb1b52016-12-09 09:52:16 -0500197 ip_interface_address_t *if_add =
198 pool_elt_at_index (lm->if_address_pool, if_add_index);
199 ip4_address_t *if_ip = ip_interface_address_get_address (lm, if_add);
200 *src = *if_ip;
201 return 0;
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100202 }
Dave Barachd7cb1b52016-12-09 09:52:16 -0500203 else
204 {
Dave Barachd7cb1b52016-12-09 09:52:16 -0500205 src->as_u32 = 0;
206 }
207 return (!0);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700208}
209
210/* Find interface address which matches destination. */
211always_inline ip4_address_t *
Dave Barachd7cb1b52016-12-09 09:52:16 -0500212ip4_interface_address_matching_destination (ip4_main_t * im,
213 ip4_address_t * dst,
214 u32 sw_if_index,
215 ip_interface_address_t **
216 result_ia)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700217{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500218 ip_lookup_main_t *lm = &im->lookup_main;
219 ip_interface_address_t *ia;
220 ip4_address_t *result = 0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700221
Dave Barachd7cb1b52016-12-09 09:52:16 -0500222 /* *INDENT-OFF* */
Dave Barach75fc8542016-10-11 16:16:02 -0400223 foreach_ip_interface_address (lm, ia, sw_if_index,
Ed Warnickecb9cada2015-12-08 15:45:58 -0700224 1 /* honor unnumbered */,
225 ({
226 ip4_address_t * a = ip_interface_address_get_address (lm, ia);
227 if (ip4_destination_matches_route (im, dst, a, ia->address_length))
228 {
229 result = a;
230 break;
231 }
232 }));
Dave Barachd7cb1b52016-12-09 09:52:16 -0500233 /* *INDENT-ON* */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700234 if (result_ia)
235 *result_ia = result ? ia : 0;
236 return result;
237}
238
Dave Barachd7cb1b52016-12-09 09:52:16 -0500239ip4_address_t *ip4_interface_first_address (ip4_main_t * im, u32 sw_if_index,
240 ip_interface_address_t **
241 result_ia);
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100242
Dave Barachd7cb1b52016-12-09 09:52:16 -0500243clib_error_t *ip4_add_del_interface_address (vlib_main_t * vm,
244 u32 sw_if_index,
245 ip4_address_t * address,
246 u32 address_length, u32 is_del);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700247
Dave Barachd7cb1b52016-12-09 09:52:16 -0500248void ip4_sw_interface_enable_disable (u32 sw_if_index, u32 is_enable);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700249
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100250int ip4_address_compare (ip4_address_t * a1, ip4_address_t * a2);
Dave Barach203c6322016-06-26 10:29:03 -0400251
Ed Warnickecb9cada2015-12-08 15:45:58 -0700252/* Send an ARP request to see if given destination is reachable on given interface. */
Dave Barachd7cb1b52016-12-09 09:52:16 -0500253clib_error_t *ip4_probe_neighbor (vlib_main_t * vm, ip4_address_t * dst,
John Lo86376342018-06-11 20:14:49 -0400254 u32 sw_if_index, u8 refresh);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700255
Dave Barachd7cb1b52016-12-09 09:52:16 -0500256clib_error_t *ip4_set_arp_limit (u32 arp_limit);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700257
258uword
Ed Warnickecb9cada2015-12-08 15:45:58 -0700259ip4_udp_register_listener (vlib_main_t * vm,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500260 u16 dst_port, u32 next_node_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700261
Dave Barach75fc8542016-10-11 16:16:02 -0400262void
Dave Barachd7cb1b52016-12-09 09:52:16 -0500263ip4_icmp_register_type (vlib_main_t * vm, icmp4_type_t type, u32 node_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700264
Dave Barachd7cb1b52016-12-09 09:52:16 -0500265u16 ip4_tcp_udp_compute_checksum (vlib_main_t * vm, vlib_buffer_t * p0,
266 ip4_header_t * ip0);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700267
268void ip4_register_protocol (u32 protocol, u32 node_index);
269
270serialize_function_t serialize_vnet_ip4_main, unserialize_vnet_ip4_main;
271
Dave Barachd7cb1b52016-12-09 09:52:16 -0500272int vnet_set_ip4_flow_hash (u32 table_id,
273 flow_hash_config_t flow_hash_config);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700274
Dave Barach75fc8542016-10-11 16:16:02 -0400275int vnet_set_ip4_classify_intfc (vlib_main_t * vm, u32 sw_if_index,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500276 u32 table_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700277
Neale Rannsd91c1db2017-07-31 02:30:50 -0700278void ip4_punt_policer_add_del (u8 is_add, u32 policer_index);
279
280void ip4_punt_redirect_add (u32 rx_sw_if_index,
281 u32 tx_sw_if_index, ip46_address_t * nh);
282void ip4_punt_redirect_del (u32 rx_sw_if_index);
283
Ed Warnickecb9cada2015-12-08 15:45:58 -0700284/* Compute flow hash. We'll use it to select which adjacency to use for this
285 flow. And other things. */
286always_inline u32
Neale Ranns0bfe5d82016-08-25 15:29:12 +0100287ip4_compute_flow_hash (const ip4_header_t * ip,
288 flow_hash_config_t flow_hash_config)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700289{
Dave Barachd7cb1b52016-12-09 09:52:16 -0500290 tcp_header_t *tcp = (void *) (ip + 1);
291 u32 a, b, c, t1, t2;
292 uword is_tcp_udp = (ip->protocol == IP_PROTOCOL_TCP
293 || ip->protocol == IP_PROTOCOL_UDP);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700294
Dave Barachd7cb1b52016-12-09 09:52:16 -0500295 t1 = (flow_hash_config & IP_FLOW_HASH_SRC_ADDR)
296 ? ip->src_address.data_u32 : 0;
297 t2 = (flow_hash_config & IP_FLOW_HASH_DST_ADDR)
298 ? ip->dst_address.data_u32 : 0;
Dave Barach75fc8542016-10-11 16:16:02 -0400299
Dave Barachd7cb1b52016-12-09 09:52:16 -0500300 a = (flow_hash_config & IP_FLOW_HASH_REVERSE_SRC_DST) ? t2 : t1;
301 b = (flow_hash_config & IP_FLOW_HASH_REVERSE_SRC_DST) ? t1 : t2;
302 b ^= (flow_hash_config & IP_FLOW_HASH_PROTO) ? ip->protocol : 0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700303
Dave Barach68b0fb02017-02-28 15:15:56 -0500304 t1 = is_tcp_udp ? tcp->src : 0;
305 t2 = is_tcp_udp ? tcp->dst : 0;
Dave Barach75fc8542016-10-11 16:16:02 -0400306
Dave Barachd7cb1b52016-12-09 09:52:16 -0500307 t1 = (flow_hash_config & IP_FLOW_HASH_SRC_PORT) ? t1 : 0;
308 t2 = (flow_hash_config & IP_FLOW_HASH_DST_PORT) ? t2 : 0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700309
Dave Barachd7cb1b52016-12-09 09:52:16 -0500310 c = (flow_hash_config & IP_FLOW_HASH_REVERSE_SRC_DST) ?
311 (t1 << 16) | t2 : (t2 << 16) | t1;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700312
Dave Barachd7cb1b52016-12-09 09:52:16 -0500313 hash_v3_mix32 (a, b, c);
314 hash_v3_finalize32 (a, b, c);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700315
Dave Barachd7cb1b52016-12-09 09:52:16 -0500316 return c;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700317}
318
John Lo37682e12016-11-30 12:51:39 -0500319void
320ip4_forward_next_trace (vlib_main_t * vm,
Dave Barachd7cb1b52016-12-09 09:52:16 -0500321 vlib_node_runtime_t * node,
322 vlib_frame_t * frame,
323 vlib_rx_or_tx_t which_adj_index);
John Lo37682e12016-11-30 12:51:39 -0500324
Dave Barachd7cb1b52016-12-09 09:52:16 -0500325u8 *format_ip4_forward_next_trace (u8 * s, va_list * args);
John Lo37682e12016-11-30 12:51:39 -0500326
327u32 ip4_tcp_udp_validate_checksum (vlib_main_t * vm, vlib_buffer_t * p0);
328
Dave Barach68b0fb02017-02-28 15:15:56 -0500329#define IP_DF 0x4000 /* don't fragment */
330
331/**
332 * Push IPv4 header to buffer
333 *
334 * This does not support fragmentation.
335 *
336 * @param vm - vlib_main
337 * @param b - buffer to write the header to
338 * @param src - source IP
339 * @param dst - destination IP
340 * @param prot - payload proto
341 *
342 * @return - pointer to start of IP header
343 */
344always_inline void *
345vlib_buffer_push_ip4 (vlib_main_t * vm, vlib_buffer_t * b,
Florin Corasfdbc3822017-07-27 00:34:12 -0700346 ip4_address_t * src, ip4_address_t * dst, int proto,
347 u8 csum_offload)
Dave Barach68b0fb02017-02-28 15:15:56 -0500348{
349 ip4_header_t *ih;
350
351 /* make some room */
352 ih = vlib_buffer_push_uninit (b, sizeof (ip4_header_t));
353
354 ih->ip_version_and_header_length = 0x45;
355 ih->tos = 0;
356 ih->length = clib_host_to_net_u16 (vlib_buffer_length_in_chain (vm, b));
357
358 /* No fragments */
359 ih->flags_and_fragment_offset = clib_host_to_net_u16 (IP_DF);
360 ih->ttl = 255;
361 ih->protocol = proto;
362 ih->src_address.as_u32 = src->as_u32;
363 ih->dst_address.as_u32 = dst->as_u32;
364
Dave Barachc4423222017-07-19 08:48:09 -0400365 /* Offload ip4 header checksum generation */
Florin Corasfdbc3822017-07-27 00:34:12 -0700366 if (csum_offload)
Dave Barachc4423222017-07-19 08:48:09 -0400367 {
368 ih->checksum = 0;
369 b->flags |= VNET_BUFFER_F_OFFLOAD_IP_CKSUM | VNET_BUFFER_F_IS_IP4;
370 vnet_buffer (b)->l3_hdr_offset = (u8 *) ih - b->data;
Dave Barachac0c96b2017-08-02 09:19:32 -0400371 vnet_buffer (b)->l4_hdr_offset = vnet_buffer (b)->l3_hdr_offset +
372 sizeof (*ih);
Dave Barachc4423222017-07-19 08:48:09 -0400373 }
374 else
375 ih->checksum = ip4_header_checksum (ih);
376
Dave Barach68b0fb02017-02-28 15:15:56 -0500377 return ih;
378}
#endif /* included_ip_ip4_h */

/*
 * fd.io coding-style-patch-verification: ON
 *
 * Local Variables:
 * eval: (c-set-style "gnu")
 * End:
 */