/* blob: d3812f1ec9ac1e006a323600e4c304f664ef3b54 */
/*
 * sfe_ipv6.h
 *	Shortcut forwarding engine header file for IPv6.
 *
 * Copyright (c) 2015-2016, 2019-2020, The Linux Foundation. All rights reserved.
 * Copyright (c) 2021 Qualcomm Innovation Center, Inc. All rights reserved.
 *
 * Permission to use, copy, modify, and/or distribute this software for any
 * purpose with or without fee is hereby granted, provided that the above
 * copyright notice and this permission notice appear in all copies.
 *
 * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
 * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
 * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
 * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
 * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
 * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
 * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
 */

/*
 * NOTE(review): presumably the size, in bytes, of one message buffer used by
 * the debug character device; not referenced in this header - confirm
 * against its users.
 */
#define CHAR_DEV_MSG_SIZE 768

/*
 * SFE_IPV6_DSCP_MASK is ANDed (after htons()) with the first 16 bits of the
 * IPv6 header in sfe_ipv6_change_dsfield(). 0xf03f keeps bits 15-12 and
 * bits 5-0 and clears bits 11-6, i.e. the six DSCP bits of the traffic class.
 *
 * NOTE(review): SFE_IPV6_DSCP_SHIFT is not used in this header; presumably
 * it is the shift that places a 6-bit DSCP above the two ECN bits of the
 * traffic class byte - confirm against its users.
 */
#define SFE_IPV6_DSCP_MASK 0xf03f
#define SFE_IPV6_DSCP_SHIFT 2

/*
 * NOTE(review): presumably the mask selecting the 13-bit fragment offset
 * from the 16-bit offset/flags field of the IPv6 fragment header - confirm.
 */
#define SFE_IPV6_FRAG_OFFSET 0xfff8

28/*
29 * generic IPv6 extension header
30 */
31struct sfe_ipv6_ext_hdr {
32 __u8 next_hdr;
33 __u8 hdr_len;
34 __u8 padding[6];
Ratheesh Kannoth741f7992021-10-20 07:39:52 +053035};
Ratheesh Kannoth24fb1db2021-10-20 07:28:06 +053036
/*
 * Specifies the lower bound on ACK numbers carried in the TCP header.
 */
#define SFE_IPV6_TCP_MAX_ACK_WINDOW 65520

42/*
43 * IPv6 TCP connection match additional data.
44 */
45struct sfe_ipv6_tcp_connection_match {
46 u8 win_scale; /* Window scale */
47 u32 max_win; /* Maximum window size seen */
48 u32 end; /* Sequence number of the next byte to send (seq + segment length) */
49 u32 max_end; /* Sequence number of the last byte to ack */
50};
51
/*
 * Bit flags for IPv6 connection matching entry.
 *
 * Each flag occupies one distinct bit (bits 0-6).
 */
#define SFE_IPV6_CONNECTION_MATCH_FLAG_XLATE_SRC (1<<0)
					/* Perform source translation */
#define SFE_IPV6_CONNECTION_MATCH_FLAG_XLATE_DEST (1<<1)
					/* Perform destination translation */
#define SFE_IPV6_CONNECTION_MATCH_FLAG_NO_SEQ_CHECK (1<<2)
					/* Ignore TCP sequence numbers */
#define SFE_IPV6_CONNECTION_MATCH_FLAG_WRITE_FAST_ETH_HDR (1<<3)
					/* Fast Ethernet header write */
#define SFE_IPV6_CONNECTION_MATCH_FLAG_WRITE_L2_HDR (1<<4)
					/* L2 header write */
#define SFE_IPV6_CONNECTION_MATCH_FLAG_PRIORITY_REMARK (1<<5)
					/* Remark priority of SKB */
#define SFE_IPV6_CONNECTION_MATCH_FLAG_DSCP_REMARK (1<<6)
					/* Remark DSCP of packet */

70/*
71 * IPv6 connection matching structure.
72 */
73struct sfe_ipv6_connection_match {
74 /*
75 * References to other objects.
76 */
Ratheesh Kannotha212fc52021-10-20 07:50:32 +053077 struct hlist_node hnode;
Ratheesh Kannoth24fb1db2021-10-20 07:28:06 +053078 struct sfe_ipv6_connection *connection;
79 struct sfe_ipv6_connection_match *counter_match;
80 /* Matches the flow in the opposite direction as the one in connection */
Ratheesh Kannoth24fb1db2021-10-20 07:28:06 +053081 /*
82 * Characteristics that identify flows that match this rule.
83 */
84 struct net_device *match_dev; /* Network device */
85 u8 match_protocol; /* Protocol */
86 struct sfe_ipv6_addr match_src_ip[1]; /* Source IP address */
87 struct sfe_ipv6_addr match_dest_ip[1]; /* Destination IP address */
88 __be16 match_src_port; /* Source port/connection ident */
89 __be16 match_dest_port; /* Destination port/connection ident */
90
91 /*
92 * Control the operations of the match.
93 */
94 u32 flags; /* Bit flags */
95#ifdef CONFIG_NF_FLOW_COOKIE
96 u32 flow_cookie; /* used flow cookie, for debug */
97#endif
98#ifdef CONFIG_XFRM
99 u32 flow_accel; /* The flow accelerated or not */
100#endif
101
102 /*
103 * Connection state that we track once we match.
104 */
105 union { /* Protocol-specific state */
106 struct sfe_ipv6_tcp_connection_match tcp;
107 } protocol_state;
108 /*
109 * Stats recorded in a sync period. These stats will be added to
110 * rx_packet_count64/rx_byte_count64 after a sync period.
111 */
Ratheesh Kannotha212fc52021-10-20 07:50:32 +0530112 atomic_t rx_packet_count;
113 atomic_t rx_byte_count;
Ratheesh Kannoth24fb1db2021-10-20 07:28:06 +0530114
115 /*
116 * Packet translation information.
117 */
118 struct sfe_ipv6_addr xlate_src_ip[1]; /* Address after source translation */
119 __be16 xlate_src_port; /* Port/connection ident after source translation */
120 u16 xlate_src_csum_adjustment;
121 /* Transport layer checksum adjustment after source translation */
122 struct sfe_ipv6_addr xlate_dest_ip[1]; /* Address after destination translation */
123 __be16 xlate_dest_port; /* Port/connection ident after destination translation */
124 u16 xlate_dest_csum_adjustment;
125 /* Transport layer checksum adjustment after destination translation */
126
127 /*
128 * QoS information
129 */
130 u32 priority;
131 u32 dscp;
132
133 /*
134 * Packet transmit information.
135 */
136 struct net_device *xmit_dev; /* Network device on which to transmit */
137 unsigned short int xmit_dev_mtu;
138 /* Interface MTU */
139 u16 xmit_dest_mac[ETH_ALEN / 2];
140 /* Destination MAC address to use when forwarding */
141 u16 xmit_src_mac[ETH_ALEN / 2];
142 /* Source MAC address to use when forwarding */
143
144 /*
145 * Summary stats.
146 */
147 u64 rx_packet_count64;
148 u64 rx_byte_count64;
149};
150
151/*
152 * Per-connection data structure.
153 */
154struct sfe_ipv6_connection {
155 struct sfe_ipv6_connection *next;
156 /* Pointer to the next entry in a hash chain */
157 struct sfe_ipv6_connection *prev;
158 /* Pointer to the previous entry in a hash chain */
159 int protocol; /* IP protocol number */
160 struct sfe_ipv6_addr src_ip[1]; /* Src IP addr pre-translation */
161 struct sfe_ipv6_addr src_ip_xlate[1]; /* Src IP addr post-translation */
162 struct sfe_ipv6_addr dest_ip[1]; /* Dest IP addr pre-translation */
163 struct sfe_ipv6_addr dest_ip_xlate[1]; /* Dest IP addr post-translation */
164 __be16 src_port; /* Src port pre-translation */
165 __be16 src_port_xlate; /* Src port post-translation */
166 __be16 dest_port; /* Dest port pre-translation */
167 __be16 dest_port_xlate; /* Dest port post-translation */
168 struct sfe_ipv6_connection_match *original_match;
169 /* Original direction matching structure */
170 struct net_device *original_dev;
171 /* Original direction source device */
172 struct sfe_ipv6_connection_match *reply_match;
173 /* Reply direction matching structure */
174 struct net_device *reply_dev; /* Reply direction source device */
175 u64 last_sync_jiffies; /* Jiffies count for the last sync */
176 struct sfe_ipv6_connection *all_connections_next;
177 /* Pointer to the next entry in the list of all connections */
178 struct sfe_ipv6_connection *all_connections_prev;
179 /* Pointer to the previous entry in the list of all connections */
Ratheesh Kannotha212fc52021-10-20 07:50:32 +0530180 bool removed; /* Indicates the connection is removed */
181 struct rcu_head rcu; /* delay rcu free */
Ratheesh Kannoth24fb1db2021-10-20 07:28:06 +0530182 u32 mark; /* mark for outgoing packet */
183 u32 debug_read_seq; /* sequence number for debug dump */
184};
185
/*
 * IPv6 connections and hash table size information.
 *
 * The size is 1 << SHIFT (4096 buckets) and the mask is size - 1 (0xfff),
 * so a hash value ANDed with the mask is always a valid table index.
 */
#define SFE_IPV6_CONNECTION_HASH_SHIFT 12
#define SFE_IPV6_CONNECTION_HASH_SIZE (1 << SFE_IPV6_CONNECTION_HASH_SHIFT)
#define SFE_IPV6_CONNECTION_HASH_MASK (SFE_IPV6_CONNECTION_HASH_SIZE - 1)

/*
 * Exception event identifiers.
 *
 * Values start at 0 and are consecutive, so SFE_IPV6_EXCEPTION_EVENT_LAST
 * equals the number of events; it sizes the exception_events64[] array in
 * struct sfe_ipv6_stats. New events must be added before
 * SFE_IPV6_EXCEPTION_EVENT_LAST.
 */
enum sfe_ipv6_exception_events {
	SFE_IPV6_EXCEPTION_EVENT_UDP_HEADER_INCOMPLETE,
	SFE_IPV6_EXCEPTION_EVENT_UDP_NO_CONNECTION,
	SFE_IPV6_EXCEPTION_EVENT_UDP_IP_OPTIONS_OR_INITIAL_FRAGMENT,
	SFE_IPV6_EXCEPTION_EVENT_UDP_SMALL_TTL,
	SFE_IPV6_EXCEPTION_EVENT_UDP_NEEDS_FRAGMENTATION,
	SFE_IPV6_EXCEPTION_EVENT_TCP_HEADER_INCOMPLETE,
	SFE_IPV6_EXCEPTION_EVENT_TCP_NO_CONNECTION_SLOW_FLAGS,
	SFE_IPV6_EXCEPTION_EVENT_TCP_NO_CONNECTION_FAST_FLAGS,
	SFE_IPV6_EXCEPTION_EVENT_TCP_IP_OPTIONS_OR_INITIAL_FRAGMENT,
	SFE_IPV6_EXCEPTION_EVENT_TCP_SMALL_TTL,
	SFE_IPV6_EXCEPTION_EVENT_TCP_NEEDS_FRAGMENTATION,
	SFE_IPV6_EXCEPTION_EVENT_TCP_FLAGS,
	SFE_IPV6_EXCEPTION_EVENT_TCP_SEQ_EXCEEDS_RIGHT_EDGE,
	SFE_IPV6_EXCEPTION_EVENT_TCP_SMALL_DATA_OFFS,
	SFE_IPV6_EXCEPTION_EVENT_TCP_BAD_SACK,
	SFE_IPV6_EXCEPTION_EVENT_TCP_BIG_DATA_OFFS,
	SFE_IPV6_EXCEPTION_EVENT_TCP_SEQ_BEFORE_LEFT_EDGE,
	SFE_IPV6_EXCEPTION_EVENT_TCP_ACK_EXCEEDS_RIGHT_EDGE,
	SFE_IPV6_EXCEPTION_EVENT_TCP_ACK_BEFORE_LEFT_EDGE,
	SFE_IPV6_EXCEPTION_EVENT_ICMP_HEADER_INCOMPLETE,
	SFE_IPV6_EXCEPTION_EVENT_ICMP_UNHANDLED_TYPE,
	SFE_IPV6_EXCEPTION_EVENT_ICMP_IPV6_HEADER_INCOMPLETE,
	SFE_IPV6_EXCEPTION_EVENT_ICMP_IPV6_NON_V6,
	SFE_IPV6_EXCEPTION_EVENT_ICMP_IPV6_IP_OPTIONS_INCOMPLETE,
	SFE_IPV6_EXCEPTION_EVENT_ICMP_IPV6_UDP_HEADER_INCOMPLETE,
	SFE_IPV6_EXCEPTION_EVENT_ICMP_IPV6_TCP_HEADER_INCOMPLETE,
	SFE_IPV6_EXCEPTION_EVENT_ICMP_IPV6_UNHANDLED_PROTOCOL,
	SFE_IPV6_EXCEPTION_EVENT_ICMP_NO_CONNECTION,
	SFE_IPV6_EXCEPTION_EVENT_ICMP_FLUSHED_CONNECTION,
	SFE_IPV6_EXCEPTION_EVENT_HEADER_INCOMPLETE,
	SFE_IPV6_EXCEPTION_EVENT_BAD_TOTAL_LENGTH,
	SFE_IPV6_EXCEPTION_EVENT_NON_V6,
	SFE_IPV6_EXCEPTION_EVENT_NON_INITIAL_FRAGMENT,
	SFE_IPV6_EXCEPTION_EVENT_DATAGRAM_INCOMPLETE,
	SFE_IPV6_EXCEPTION_EVENT_IP_OPTIONS_INCOMPLETE,
	SFE_IPV6_EXCEPTION_EVENT_UNHANDLED_PROTOCOL,
	SFE_IPV6_EXCEPTION_EVENT_FLOW_COOKIE_ADD_FAIL,
	SFE_IPV6_EXCEPTION_EVENT_LAST
};

234/*
Ratheesh Kannoth1ed95462021-10-20 07:57:45 +0530235 * Per CPU stats
236 */
237struct sfe_ipv6_stats {
238 /*
239 * Stats recorded in a sync period. These stats will be added to
240 * connection_xxx64 after a sync period.
241 */
242 u64 connection_create_requests64;
243 /* Number of IPv6 connection create requests */
244 u64 connection_create_collisions64;
245 /* Number of IPv6 connection create requests that collided with existing hash table entries */
Ratheesh Kannoth89302a72021-10-20 08:10:37 +0530246 u64 connection_create_failures64;
247 /* Number of IPv6 connection create requests failures. */
248
Ratheesh Kannoth1ed95462021-10-20 07:57:45 +0530249 u64 connection_destroy_requests64;
250 /* Number of IPv6 connection destroy requests */
251 u64 connection_destroy_misses64;
252 /* Number of IPv6 connection destroy requests that missed our hash table */
253 u64 connection_match_hash_hits64;
254 /* Number of IPv6 connection match hash hits */
255 u64 connection_match_hash_reorders64;
256 /* Number of IPv6 connection match hash reorders */
257 u64 connection_flushes64; /* Number of IPv6 connection flushes */
258 u64 packets_forwarded64; /* Number of IPv6 packets forwarded */
259 u64 packets_not_forwarded64; /* Number of IPv6 packets not forwarded */
260 u64 exception_events64[SFE_IPV6_EXCEPTION_EVENT_LAST];
261};
262
263/*
Ratheesh Kannoth24fb1db2021-10-20 07:28:06 +0530264 * Per-module structure.
265 */
266struct sfe_ipv6 {
267 spinlock_t lock; /* Lock for SMP correctness */
Ratheesh Kannoth24fb1db2021-10-20 07:28:06 +0530268 struct sfe_ipv6_connection *all_connections_head;
269 /* Head of the list of all connections */
270 struct sfe_ipv6_connection *all_connections_tail;
271 /* Tail of the list of all connections */
272 unsigned int num_connections; /* Number of connections */
Ken Zhu137722d2021-09-23 17:57:36 -0700273 struct delayed_work sync_dwork; /* Work to sync the statistics */
274 unsigned int work_cpu; /* The core to run stats sync on */
275
Ratheesh Kannoth24fb1db2021-10-20 07:28:06 +0530276 sfe_sync_rule_callback_t __rcu sync_rule_callback;
277 /* Callback function registered by a connection manager for stats syncing */
278 struct sfe_ipv6_connection *conn_hash[SFE_IPV6_CONNECTION_HASH_SIZE];
279 /* Connection hash table */
Ratheesh Kannotha212fc52021-10-20 07:50:32 +0530280 struct hlist_head hlist_conn_match_hash_head[SFE_IPV6_CONNECTION_HASH_SIZE];
Ratheesh Kannoth24fb1db2021-10-20 07:28:06 +0530281#ifdef CONFIG_NF_FLOW_COOKIE
282 struct sfe_ipv6_flow_cookie_entry sfe_flow_cookie_table[SFE_FLOW_COOKIE_SIZE];
283 /* flow cookie table*/
284 sfe_ipv6_flow_cookie_set_func_t flow_cookie_set_func;
285 /* function used to configure flow cookie in hardware*/
286 int flow_cookie_enable;
287 /* Enable/disable flow cookie at runtime */
288#endif
289
Ratheesh Kannoth1ed95462021-10-20 07:57:45 +0530290 struct sfe_ipv6_stats __percpu *stats_pcpu;
291 /* Common SFE counters. */
Ratheesh Kannoth24fb1db2021-10-20 07:28:06 +0530292
Ken Zhu32b95392021-09-03 13:52:04 -0700293 struct sfe_ipv6_connection *wc_next;
294 /* The next walk point in the all connection list*/
295
Ratheesh Kannoth24fb1db2021-10-20 07:28:06 +0530296 /*
297 * Control state.
298 */
Ratheesh Kannoth6307bec2021-11-25 08:26:39 +0530299 struct kobject *sys_ipv6; /* sysfs linkage */
Ratheesh Kannoth24fb1db2021-10-20 07:28:06 +0530300 int debug_dev; /* Major number of the debug char device */
301 u32 debug_read_seq; /* sequence number for debug dump */
302};
303
/*
 * Enumeration of the XML output.
 *
 * Values are consecutive from 0; they are stored in
 * struct sfe_ipv6_debug_xml_write_state as the state of the XML output
 * state machine.
 */
enum sfe_ipv6_debug_xml_states {
	SFE_IPV6_DEBUG_XML_STATE_START,
	SFE_IPV6_DEBUG_XML_STATE_CONNECTIONS_START,
	SFE_IPV6_DEBUG_XML_STATE_CONNECTIONS_CONNECTION,
	SFE_IPV6_DEBUG_XML_STATE_CONNECTIONS_END,
	SFE_IPV6_DEBUG_XML_STATE_EXCEPTIONS_START,
	SFE_IPV6_DEBUG_XML_STATE_EXCEPTIONS_EXCEPTION,
	SFE_IPV6_DEBUG_XML_STATE_EXCEPTIONS_END,
	SFE_IPV6_DEBUG_XML_STATE_STATS,
	SFE_IPV6_DEBUG_XML_STATE_END,
	SFE_IPV6_DEBUG_XML_STATE_DONE
};

320/*
321 * XML write state.
322 */
323struct sfe_ipv6_debug_xml_write_state {
324 enum sfe_ipv6_debug_xml_states state;
325 /* XML output file state machine state */
326 int iter_exception; /* Next exception iterator */
327};
328
/*
 * Signature of one XML write method.
 *
 * Takes the engine state (si), two character buffers (buffer, msg), in/out
 * length and total_read counters and the XML write state (ws); returns bool.
 * NOTE(review): the meaning of the return value and of each buffer is
 * defined by the implementations, which are not visible in this header.
 */
typedef bool (*sfe_ipv6_debug_xml_write_method_t)(struct sfe_ipv6 *si, char *buffer, char *msg, size_t *length,
						  int *total_read, struct sfe_ipv6_debug_xml_write_state *ws);

Ratheesh Kannoth6307bec2021-11-25 08:26:39 +0530332/*
333 * sfe_ipv6_is_ext_hdr()
334 * check if we recognize ipv6 extension header
335 */
336static inline bool sfe_ipv6_is_ext_hdr(u8 hdr)
337{
338 return (hdr == NEXTHDR_HOP) ||
339 (hdr == NEXTHDR_ROUTING) ||
340 (hdr == NEXTHDR_FRAGMENT) ||
341 (hdr == NEXTHDR_AUTH) ||
342 (hdr == NEXTHDR_DEST) ||
343 (hdr == NEXTHDR_MOBILITY);
344}
345
346/*
347 * sfe_ipv6_change_dsfield()
348 * change dscp field in IPv6 packet
349 */
350static inline void sfe_ipv6_change_dsfield(struct ipv6hdr *iph, u8 dscp)
351{
352 __be16 *p = (__be16 *)iph;
353
354 *p = ((*p & htons(SFE_IPV6_DSCP_MASK)) | htons((u16)dscp << 4));
355}
356
357void sfe_ipv6_exception_stats_inc(struct sfe_ipv6 *si, enum sfe_ipv6_exception_events reason);
358
359struct sfe_ipv6_connection_match *
360sfe_ipv6_find_connection_match_rcu(struct sfe_ipv6 *si, struct net_device *dev, u8 protocol,
361 struct sfe_ipv6_addr *src_ip, __be16 src_port,
362 struct sfe_ipv6_addr *dest_ip, __be16 dest_port);
363
364bool sfe_ipv6_remove_connection(struct sfe_ipv6 *si, struct sfe_ipv6_connection *c);
365
366void sfe_ipv6_flush_connection(struct sfe_ipv6 *si,
367 struct sfe_ipv6_connection *c,
368 sfe_sync_reason_t reason);
369
Ratheesh Kannoth24fb1db2021-10-20 07:28:06 +0530370void sfe_ipv6_exit(void);
371int sfe_ipv6_init(void);