blob: 955010a34b3a0f3b976214125be0c816251e4c26 [file] [log] [blame]
/*
* Copyright (c) 2017 SUSE LLC.
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at:
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include <sctp/sctp.h>
#include <sctp/sctp_debug.h>
#include <vppinfra/random.h>
#include <openssl/hmac.h>
/**
 * Hand the pending SCTP output frame (if any) for @a thread_index to the
 * sctp4-output or sctp6-output node and forget about it.
 *
 * @param vm            vlib main used to enqueue the frame
 * @param thread_index  index of the thread whose pending frame is flushed
 * @param is_ip4        non-zero selects the IPv4 frame/node, zero the IPv6 one
 */
void
sctp_flush_frame_to_output (vlib_main_t * vm, u8 thread_index, u8 is_ip4)
{
  /* tx_frames is indexed by !is_ip4: slot 0 is IPv4, slot 1 is IPv6 */
  const u8 af_slot = !is_ip4;
  u32 output_node_index;

  /* Nothing was queued since the last flush */
  if (!sctp_main.tx_frames[af_slot][thread_index])
    return;

  if (is_ip4)
    output_node_index = sctp4_output_node.index;
  else
    output_node_index = sctp6_output_node.index;

  vlib_put_frame_to_node (vm, output_node_index,
                          sctp_main.tx_frames[af_slot][thread_index]);
  sctp_main.tx_frames[af_slot][thread_index] = 0;
}
/**
 * Hand the pending ip-lookup frame (if any) for @a thread_index to the
 * ip4-lookup or ip6-lookup node and forget about it.
 *
 * @param vm            vlib main used to enqueue the frame
 * @param thread_index  index of the thread whose pending frame is flushed
 * @param is_ip4        non-zero selects the IPv4 frame/node, zero the IPv6 one
 */
always_inline void
sctp_flush_frame_to_ip_lookup (vlib_main_t * vm, u8 thread_index, u8 is_ip4)
{
  /* ip_lookup_tx_frames is indexed by !is_ip4: slot 0 is IPv4, slot 1 IPv6 */
  const u8 af_slot = !is_ip4;
  u32 lookup_node_index;

  /* Nothing was queued since the last flush */
  if (!sctp_main.ip_lookup_tx_frames[af_slot][thread_index])
    return;

  if (is_ip4)
    lookup_node_index = ip4_lookup_node.index;
  else
    lookup_node_index = ip6_lookup_node.index;

  vlib_put_frame_to_node (vm, lookup_node_index,
                          sctp_main.ip_lookup_tx_frames[af_slot]
                          [thread_index]);
  sctp_main.ip_lookup_tx_frames[af_slot][thread_index] = 0;
}
/**
 * Flush every pending tx frame owned by @a thread_index: first the SCTP
 * output frames (IPv4 then IPv6), then the ip-lookup frames (IPv4 then IPv6).
 *
 * @param thread_index  index of the thread whose frames are flushed
 */
void
sctp_flush_frames_to_output (u8 thread_index)
{
  /* Address families in the order they are flushed: IPv4 first */
  static const u8 is_ip4_order[2] = { 1, 0 };
  vlib_main_t *vm = vlib_get_main ();
  u32 i;

  for (i = 0; i < 2; i++)
    sctp_flush_frame_to_output (vm, thread_index, is_ip4_order[i]);

  for (i = 0; i < 2; i++)
    sctp_flush_frame_to_ip_lookup (vm, thread_index, is_ip4_order[i]);
}
/**
 * Compute the checksum of the payload carried behind an IPv4 header,
 * seeded with the payload length, the protocol number and the addresses,
 * and walking the buffer chain when the payload spans several buffers.
 *
 * NOTE(review): this is an IP-style carry checksum; RFC 4960 specifies
 * CRC32c for SCTP - confirm this is what the output path expects.
 *
 * @param vm   vlib main, used to resolve chained buffers
 * @param p0   first buffer of the packet
 * @param ip0  IPv4 header located inside @a p0
 * @return the accumulated checksum
 */
u32
ip4_sctp_compute_checksum (vlib_main_t * vm, vlib_buffer_t * p0,
                           ip4_header_t * ip0)
{
  ip_csum_t sum;
  u32 hdr_bytes, payload_bytes;
  u32 chunk_bytes, remaining_bytes, ip_bytes_in_first_buffer;
  void *chunk;

  hdr_bytes = ip4_header_bytes (ip0);
  payload_bytes = clib_net_to_host_u16 (ip0->length) - hdr_bytes;

  /* Seed with payload length and protocol */
  sum = clib_host_to_net_u32 (payload_bytes + (ip0->protocol << 16));

  if (BITS (uword) != 32)
    {
      /* One 64-bit read starting at src_address (given the IPv4 header
       * layout this also spans dst_address) */
      sum = ip_csum_with_carry (sum,
                                clib_mem_unaligned (&ip0->src_address, u64));
    }
  else
    {
      sum = ip_csum_with_carry (sum,
                                clib_mem_unaligned (&ip0->src_address, u32));
      sum = ip_csum_with_carry (sum,
                                clib_mem_unaligned (&ip0->dst_address, u32));
    }

  chunk = (void *) ip0 + hdr_bytes;
  remaining_bytes = payload_bytes;
  chunk_bytes = payload_bytes;

  /* Bytes of this buffer that lie at or after the IP header */
  ip_bytes_in_first_buffer =
    p0->current_length - (((u8 *) ip0 - p0->data) - p0->current_data);

  /* Clamp the first pass to what the first buffer really holds */
  if (chunk_bytes + hdr_bytes > ip_bytes_in_first_buffer)
    {
      if (ip_bytes_in_first_buffer > hdr_bytes)
        chunk_bytes = ip_bytes_in_first_buffer - hdr_bytes;
      else
        chunk_bytes = 0;
    }

  for (;;)
    {
      sum = ip_incremental_checksum (sum, chunk, chunk_bytes);
      remaining_bytes -= chunk_bytes;
      if (remaining_bytes == 0)
        break;

      /* More payload is expected, so the chain must continue */
      ASSERT (p0->flags & VLIB_BUFFER_NEXT_PRESENT);
      p0 = vlib_get_buffer (vm, p0->next_buffer);
      chunk = vlib_buffer_get_current (p0);
      chunk_bytes = p0->current_length;
    }

  return sum;
}
/**
 * Compute the checksum of the payload carried behind an IPv6 header,
 * seeded with the payload length, the protocol number and both addresses.
 * A hop-by-hop extension header directly after the IPv6 header is skipped.
 *
 * NOTE(review): this is an IP-style carry checksum; RFC 4960 specifies
 * CRC32c for SCTP - confirm this is what the output path expects.
 *
 * @param vm             vlib main, used to resolve chained buffers
 * @param p0             first buffer of the packet
 * @param ip0            IPv6 header of the packet
 * @param bogus_lengthp  out: set to 1 when the buffer chain ends before the
 *                       advertised payload length is consumed, 0 otherwise
 * @return the accumulated checksum, or 0xfefe when *bogus_lengthp is set
 */
u32
ip6_sctp_compute_checksum (vlib_main_t * vm, vlib_buffer_t * p0,
                           ip6_header_t * ip0, int *bogus_lengthp)
{
  ip_csum_t sum;
  u16 payload_bytes;
  u32 word, chunk_bytes, remaining_bytes;
  u32 hdr_bytes = sizeof (ip0[0]);
  void *chunk;

  ASSERT (bogus_lengthp);
  *bogus_lengthp = 0;

  /* Seed with payload length and protocol */
  sum = ip0->payload_length + clib_host_to_net_u16 (ip0->protocol);
  payload_bytes = clib_net_to_host_u16 (ip0->payload_length);
  chunk = (void *) (ip0 + 1);

  /* Fold in source and destination addresses, one machine word at a time */
  for (word = 0; word < ARRAY_LEN (ip0->src_address.as_uword); word++)
    {
      sum =
        ip_csum_with_carry (sum,
                            clib_mem_unaligned (&ip0->src_address.as_uword
                                                [word], uword));
      sum =
        ip_csum_with_carry (sum,
                            clib_mem_unaligned (&ip0->dst_address.as_uword
                                                [word], uword));
    }

  /* Step over a hop-by-hop extension header sitting before the payload */
  if (PREDICT_FALSE (ip0->protocol == IP_PROTOCOL_IP6_HOP_BY_HOP_OPTIONS))
    {
      ip6_hop_by_hop_ext_t *hbh = (ip6_hop_by_hop_ext_t *) chunk;
      u32 hbh_bytes;

      /* The header following the extension is expected to be SCTP */
      ASSERT ((hbh->next_hdr == IP_PROTOCOL_SCTP));

      hbh_bytes = 8 * (1 + hbh->n_data_u64s);
      chunk = (void *) ((u8 *) chunk + hbh_bytes);
      payload_bytes -= hbh_bytes;
      hdr_bytes += hbh_bytes;
    }

  remaining_bytes = chunk_bytes = payload_bytes;

  /* Clamp the first pass to what the first buffer really holds */
  if (p0 && chunk_bytes + hdr_bytes > p0->current_length)
    {
      if (p0->current_length > hdr_bytes)
        chunk_bytes = p0->current_length - hdr_bytes;
      else
        chunk_bytes = 0;
    }

  for (;;)
    {
      sum = ip_incremental_checksum (sum, chunk, chunk_bytes);
      remaining_bytes -= chunk_bytes;
      if (remaining_bytes == 0)
        break;

      /* Payload length claims more data than the chain provides */
      if (!(p0->flags & VLIB_BUFFER_NEXT_PRESENT))
        {
          *bogus_lengthp = 1;
          return 0xfefe;
        }

      p0 = vlib_get_buffer (vm, p0->next_buffer);
      chunk = vlib_buffer_get_current (p0);
      chunk_bytes = p0->current_length;
    }

  return sum;
}
/**
 * Prepend an IPv4 or IPv6 header (chosen from the sub-connection) to the
 * SCTP packet in @a b and store the computed checksum in the SCTP header.
 *
 * @param tm             SCTP main (not used by this function)
 * @param sctp_sub_conn  sub-connection providing local/remote addresses
 * @param b              buffer whose current data is the SCTP header
 */
void
sctp_push_ip_hdr (sctp_main_t * tm, sctp_sub_connection_t * sctp_sub_conn,
                  vlib_buffer_t * b)
{
  /* Capture the SCTP header before the IP header is pushed in front of it */
  sctp_header_t *th = vlib_buffer_get_current (b);
  vlib_main_t *vm = vlib_get_main ();

  if (!sctp_sub_conn->c_is_ip4)
    {
      ip6_header_t *ip6;
      int bogus = ~0;

      ip6 = vlib_buffer_push_ip6 (vm, b, &sctp_sub_conn->c_lcl_ip6,
                                  &sctp_sub_conn->c_rmt_ip6,
                                  IP_PROTOCOL_SCTP);
      th->checksum = ip6_sctp_compute_checksum (vm, b, ip6, &bogus);
      ASSERT (!bogus);
      return;
    }

  ip4_header_t *ip4;

  ip4 = vlib_buffer_push_ip4 (vm, b, &sctp_sub_conn->c_lcl_ip4,
                              &sctp_sub_conn->c_rmt_ip4, IP_PROTOCOL_SCTP, 1);
  th->checksum = ip4_sctp_compute_checksum (vm, b, ip4);
}
/**
 * Reset a buffer so it can carry a freshly built packet: release a chained
 * buffer if present, clear the upper flag bits, rewind data/length and reset
 * the SCTP opaque fields.
 *
 * @param vm  vlib main used to free the chained buffer
 * @param b   buffer to recycle
 * @return the value of vlib_buffer_make_headroom() for TRANSPORT_MAX_HDRS_LEN
 */
always_inline void *
sctp_reuse_buffer (vlib_main_t * vm, vlib_buffer_t * b)
{
  /* Must happen before NEXT_PRESENT is masked out below */
  if ((b->flags & VLIB_BUFFER_NEXT_PRESENT) != 0)
    vlib_buffer_free_one (vm, b->next_buffer);

  /* Keep only the flag bits below VLIB_BUFFER_NEXT_PRESENT */
  b->flags &= VLIB_BUFFER_NEXT_PRESENT - 1;

  b->total_length_not_including_first_buffer = 0;
  b->current_length = 0;
  b->current_data = 0;

  sctp_buffer_opaque (b)->sctp.subconn_idx = MAX_SCTP_CONNECTIONS;
  sctp_buffer_opaque (b)->sctp.flags = 0;

  /* Reserve room in front of the payload for the headers */
  return vlib_buffer_make_headroom (b, TRANSPORT_MAX_HDRS_LEN);
}
/**
 * Prepare a newly obtained, unchained buffer for a locally built packet.
 *
 * @param vm  vlib main (not used by this function)
 * @param b   buffer to initialise; must not have a chained next buffer
 * @return the value of vlib_buffer_make_headroom() for TRANSPORT_MAX_HDRS_LEN
 */
always_inline void *
sctp_init_buffer (vlib_main_t * vm, vlib_buffer_t * b)
{
  ASSERT ((b->flags & VLIB_BUFFER_NEXT_PRESENT) == 0);

  b->total_length_not_including_first_buffer = 0;
  b->flags |= VNET_BUFFER_F_LOCALLY_ORIGINATED;

  sctp_buffer_opaque (b)->sctp.subconn_idx = MAX_SCTP_CONNECTIONS;
  sctp_buffer_opaque (b)->sctp.flags = 0;

  VLIB_BUFFER_TRACE_TRAJECTORY_INIT (b);

  /* Reserve room in front of the payload for the headers */
  return vlib_buffer_make_headroom (b, TRANSPORT_MAX_HDRS_LEN);
}
/**
 * Top up the per-thread cache of tx buffer indices.
 *
 * @param tm              SCTP main holding the per-thread caches
 * @param thread_index    thread whose cache is refilled
 * @param n_free_buffers  number of buffers to request
 * @return 0 when the cache holds at least one buffer afterwards,
 *         -1 when it is still empty
 */
always_inline int
sctp_alloc_tx_buffers (sctp_main_t * tm, u8 thread_index, u32 n_free_buffers)
{
  vlib_main_t *vm = vlib_get_main ();
  u32 n_cached = vec_len (tm->tx_buffers[thread_index]);
  u32 n_got;

  /* Grow the vector so the new indices can be written in place */
  vec_validate (tm->tx_buffers[thread_index], n_cached + n_free_buffers - 1);

  n_got =
    vlib_buffer_alloc (vm, &tm->tx_buffers[thread_index][n_cached],
                       n_free_buffers);

  /* Trim the vector back to what was really obtained */
  _vec_len (tm->tx_buffers[thread_index]) = n_cached + n_got;

  if (vec_len (tm->tx_buffers[thread_index]) != 0)
    return 0;

  /* buffer shortage, report failure */
  clib_warning ("out of buffers");
  return -1;
}
/**
 * Pop one buffer index from the calling thread's tx buffer cache,
 * refilling the cache with VLIB_FRAME_SIZE buffers when it is empty.
 *
 * @param tm    SCTP main holding the per-thread caches
 * @param bidx  out: the buffer index taken from the cache
 * @return 0 on success, -1 when the cache could not be refilled
 */
always_inline int
sctp_get_free_buffer_index (sctp_main_t * tm, u32 * bidx)
{
  u32 thread_index = vlib_get_thread_index ();
  u32 *cache;
  u32 last;

  if (PREDICT_FALSE (vec_len (tm->tx_buffers[thread_index]) == 0)
      && sctp_alloc_tx_buffers (tm, thread_index, VLIB_FRAME_SIZE))
    return -1;

  /* Take the last entry and shrink the vector by one */
  cache = tm->tx_buffers[thread_index];
  last = vec_len (cache) - 1;
  *bidx = cache[last];
  _vec_len (cache) = last;

  return 0;
}
/**
 * Append buffer @a bi to the calling thread's pending frame for the
 * sctp4-output / sctp6-output node, creating the frame on demand, and hand
 * the frame over when asked to flush or when it is full.
 *
 * @param vm      vlib main
 * @param b       buffer being enqueued
 * @param bi      index of @a b
 * @param is_ip4  non-zero for IPv4, zero for IPv6
 * @param flush   non-zero forces the frame to be handed over immediately
 */
always_inline void
sctp_enqueue_to_output_i (vlib_main_t * vm, vlib_buffer_t * b, u32 bi,
                          u8 is_ip4, u8 flush)
{
  sctp_main_t *sm = vnet_get_sctp_main ();
  u32 thread_index = vlib_get_thread_index ();
  /* tx_frames is indexed by !is_ip4: slot 0 is IPv4, slot 1 is IPv6 */
  const u8 af_slot = !is_ip4;
  u32 *slots, output_node_index;
  vlib_frame_t *frame;

  b->flags |= VNET_BUFFER_F_LOCALLY_ORIGINATED;
  b->error = 0;

  /* Pick the output node for this address family */
  if (is_ip4)
    output_node_index = sctp4_output_node.index;
  else
    output_node_index = sctp6_output_node.index;

  sctp_trajectory_add_start (b, 2);

  /* Reuse the pending frame, or start a new one */
  frame = sm->tx_frames[af_slot][thread_index];
  if (!frame)
    {
      frame = vlib_get_frame_to_node (vm, output_node_index);
      ASSERT (frame);
      sm->tx_frames[af_slot][thread_index] = frame;
    }

  slots = vlib_frame_vector_args (frame);
  slots[frame->n_vectors] = bi;
  frame->n_vectors += 1;

  /* Keep accumulating unless a flush was requested or the frame is full */
  if (!flush && frame->n_vectors != VLIB_FRAME_SIZE)
    return;

  vlib_put_frame_to_node (vm, output_node_index, frame);
  sm->tx_frames[af_slot][thread_index] = 0;
}
/**
 * Enqueue buffer @a bi to the SCTP output node and flush the frame
 * right away.
 *
 * @param vm      vlib main
 * @param b       buffer being enqueued
 * @param bi      index of @a b
 * @param is_ip4  non-zero for IPv4, zero for IPv6
 */
always_inline void
sctp_enqueue_to_output_now (vlib_main_t * vm, vlib_buffer_t * b, u32 bi,
                            u8 is_ip4)
{
  const u8 flush_now = 1;

  sctp_enqueue_to_output_i (vm, b, bi, is_ip4, flush_now);
}
/**
 * Append buffer @a bi to the calling thread's pending frame for the
 * ip4-lookup / ip6-lookup node, creating the frame on demand, and hand the
 * frame over when asked to flush or when it is full.
 *
 * @param vm         vlib main
 * @param b          buffer being enqueued
 * @param bi         index of @a b
 * @param is_ip4     non-zero for IPv4, zero for IPv6
 * @param fib_index  value stored in the buffer's sw_if_index[VLIB_TX]
 * @param flush      non-zero forces the frame to be handed over immediately
 */
always_inline void
sctp_enqueue_to_ip_lookup_i (vlib_main_t * vm, vlib_buffer_t * b, u32 bi,
                             u8 is_ip4, u32 fib_index, u8 flush)
{
  sctp_main_t *sm = vnet_get_sctp_main ();
  u32 thread_index = vlib_get_thread_index ();
  /* ip_lookup_tx_frames is indexed by !is_ip4: slot 0 is IPv4, slot 1 IPv6 */
  const u8 af_slot = !is_ip4;
  u32 *slots, lookup_node_index;
  vlib_frame_t *frame;

  b->flags |= VNET_BUFFER_F_LOCALLY_ORIGINATED;
  b->error = 0;

  vnet_buffer (b)->sw_if_index[VLIB_RX] = 0;
  vnet_buffer (b)->sw_if_index[VLIB_TX] = fib_index;

  /* Pick the lookup node for this address family */
  if (is_ip4)
    lookup_node_index = ip4_lookup_node.index;
  else
    lookup_node_index = ip6_lookup_node.index;

  /* Record the start of the trajectory when tracing is compiled in */
  if (VLIB_BUFFER_TRACE_TRAJECTORY > 0)
    {
      b->pre_data[0] = 2;
      b->pre_data[1] = lookup_node_index;
    }

  /* Reuse the pending frame, or start a new one */
  frame = sm->ip_lookup_tx_frames[af_slot][thread_index];
  if (!frame)
    {
      frame = vlib_get_frame_to_node (vm, lookup_node_index);
      ASSERT (frame);
      sm->ip_lookup_tx_frames[af_slot][thread_index] = frame;
    }

  slots = vlib_frame_vector_args (frame);
  slots[frame->n_vectors] = bi;
  frame->n_vectors += 1;

  /* Keep accumulating unless a flush was requested or the frame is full */
  if (!flush && frame->n_vectors != VLIB_FRAME_SIZE)
    return;

  vlib_put_frame_to_node (vm, lookup_node_index, frame);
  sm->ip_lookup_tx_frames[af_slot][thread_index] = 0;
}
/**
 * Enqueue buffer @a bi to ip-lookup without forcing a flush. When called on
 * thread 0 while worker threads exist, the session layer's main-thread
 * frames are flushed afterwards.
 *
 * @param vm         vlib main
 * @param b          buffer being enqueued
 * @param bi         index of @a b
 * @param is_ip4     non-zero for IPv4, zero for IPv6
 * @param fib_index  value stored in the buffer's sw_if_index[VLIB_TX]
 */
always_inline void
sctp_enqueue_to_ip_lookup (vlib_main_t * vm, vlib_buffer_t * b, u32 bi,
                           u8 is_ip4, u32 fib_index)
{
  const u8 no_flush = 0;

  sctp_enqueue_to_ip_lookup_i (vm, b, bi, is_ip4, fib_index, no_flush);

  if (vm->thread_index != 0)
    return;
  if (!vlib_num_workers ())
    return;

  session_flush_frames_main_thread (vm);
}
/**
 * Convert buffer to INIT
 *
 * Pushes an INIT chunk followed by one address parameter (IPv4 or IPv6,
 * depending on the sub-connection) onto @a b, fills in the common header
 * and the INIT fields, and records the generated initiate tag as the
 * connection's local tag.
 *
 * @param sctp_conn  connection the INIT is built for
 * @param idx        index of the sub-connection to use
 * @param b          buffer receiving the chunk
 */
void
sctp_prepare_init_chunk (sctp_connection_t * sctp_conn, u8 idx,
                         vlib_buffer_t * b)
{
  u32 random_seed = random_default_seed ();
  u16 alloc_bytes = sizeof (sctp_init_chunk_t);
  sctp_sub_connection_t *sub_conn = &sctp_conn->sub_conn[idx];
  sctp_ipv4_addr_param_t *ip4_param = 0;
  sctp_ipv6_addr_param_t *ip6_param = 0;

  /* Room for the single address parameter that follows the fixed part */
  if (sub_conn->c_is_ip4)
    alloc_bytes += sizeof (sctp_ipv4_addr_param_t);
  else
    alloc_bytes += sizeof (sctp_ipv6_addr_param_t);

  /* As per RFC 4960 the chunk_length value does NOT contemplate
   * the size of the first header (see sctp_header_t) and any padding
   */
  u16 chunk_len = alloc_bytes - sizeof (sctp_header_t);

  alloc_bytes += vnet_sctp_calculate_padding (alloc_bytes);

  sctp_init_chunk_t *init_chunk = vlib_buffer_push_uninit (b, alloc_bytes);

  /* Byte offset of the first optional parameter: right after the fixed
   * part of the chunk (size of the structure, not of the pointer). */
  u16 pointer_offset = sizeof (sctp_init_chunk_t);

  /* The offset is in bytes, so the arithmetic must be done on a char
   * pointer before casting to the parameter type.
   * NOTE(review): only the address is written here; param_hdr type/length
   * of the parameter are left as pushed (uninitialised) - confirm whether
   * they should be filled in as done for the INIT_ACK address parameters. */
  if (sub_conn->c_is_ip4)
    {
      ip4_param =
        (sctp_ipv4_addr_param_t *) ((char *) init_chunk + pointer_offset);
      ip4_param->address.as_u32 = sub_conn->c_lcl_ip.ip4.as_u32;
      pointer_offset += sizeof (sctp_ipv4_addr_param_t);
    }
  else
    {
      ip6_param =
        (sctp_ipv6_addr_param_t *) ((char *) init_chunk + pointer_offset);
      ip6_param->address.as_u64[0] = sub_conn->c_lcl_ip.ip6.as_u64[0];
      ip6_param->address.as_u64[1] = sub_conn->c_lcl_ip.ip6.as_u64[1];
      pointer_offset += sizeof (sctp_ipv6_addr_param_t);
    }

  init_chunk->sctp_hdr.src_port = sub_conn->c_lcl_port;	/* No need of host_to_net conversion, already in net-byte order */
  init_chunk->sctp_hdr.dst_port = sub_conn->c_rmt_port;	/* No need of host_to_net conversion, already in net-byte order */
  init_chunk->sctp_hdr.checksum = 0;
  /* The sender of an INIT must set the VERIFICATION_TAG to 0 as per RFC 4960 Section 8.5.1 */
  init_chunk->sctp_hdr.verification_tag = 0x0;

  vnet_sctp_set_chunk_type (&init_chunk->chunk_hdr, INIT);
  vnet_sctp_set_chunk_length (&init_chunk->chunk_hdr, chunk_len);
  vnet_sctp_common_hdr_params_host_to_net (&init_chunk->chunk_hdr);

  sctp_init_cwnd (sctp_conn);

  init_chunk->a_rwnd = clib_host_to_net_u32 (sctp_conn->sub_conn[idx].cwnd);
  init_chunk->initiate_tag = clib_host_to_net_u32 (random_u32 (&random_seed));
  init_chunk->inboud_streams_count =
    clib_host_to_net_u16 (INBOUND_STREAMS_COUNT);
  init_chunk->outbound_streams_count =
    clib_host_to_net_u16 (OUTBOUND_STREAMS_COUNT);

  init_chunk->initial_tsn =
    clib_host_to_net_u32 (sctp_conn->local_initial_tsn);
  SCTP_CONN_TRACKING_DBG ("sctp_conn->local_initial_tsn = %u",
                          sctp_conn->local_initial_tsn);

  /* Remember the tag we advertised (kept in network byte order) */
  sctp_conn->local_tag = init_chunk->initiate_tag;

  sctp_buffer_opaque (b)->sctp.connection_index = sub_conn->c_c_index;
  sctp_buffer_opaque (b)->sctp.subconn_idx = idx;

  SCTP_DBG_STATE_MACHINE ("CONN_INDEX = %u, CURR_CONN_STATE = %u (%s), "
                          "CHUNK_TYPE = %s, "
                          "SRC_PORT = %u, DST_PORT = %u",
                          sub_conn->connection.c_index,
                          sctp_conn->state,
                          sctp_state_to_string (sctp_conn->state),
                          sctp_chunk_to_string (INIT),
                          init_chunk->sctp_hdr.src_port,
                          init_chunk->sctp_hdr.dst_port);
}
/**
 * Compute an HMAC-SHA1 and store it in the state cookie's mac field.
 *
 * The HMAC key is the cookie's creation_time field; the authenticated data
 * is the value of the @a sctp_conn pointer itself (sizeof of a pointer).
 * NOTE(review): hashing the pointer value rather than connection contents
 * looks unintended - confirm before relying on this MAC for validation.
 *
 * On OpenSSL >= 1.1.0 the heap-allocated HMAC context is released before
 * returning; if it cannot be allocated a warning is logged and the mac field
 * is left untouched.
 *
 * @param sctp_conn     connection the cookie belongs to
 * @param state_cookie  cookie whose mac field is filled in
 */
void
sctp_compute_mac (sctp_connection_t * sctp_conn,
                  sctp_state_cookie_param_t * state_cookie)
{
#if OPENSSL_VERSION_NUMBER >= 0x10100000L
  HMAC_CTX *ctx;
#else
  HMAC_CTX ctx;
#endif
  unsigned int len = 0;
  const EVP_MD *md = EVP_sha1 ();
#if OPENSSL_VERSION_NUMBER >= 0x10100000L
  ctx = HMAC_CTX_new ();
  if (ctx == NULL)
    {
      /* Using a NULL context below would crash */
      clib_warning ("HMAC_CTX_new failed");
      return;
    }
  HMAC_Init_ex (ctx, &state_cookie->creation_time,
                sizeof (state_cookie->creation_time), md, NULL);
  HMAC_Update (ctx, (const unsigned char *) &sctp_conn, sizeof (sctp_conn));
  HMAC_Final (ctx, state_cookie->mac, &len);
  /* Contexts from HMAC_CTX_new() are heap allocated and must be freed */
  HMAC_CTX_free (ctx);
#else
  HMAC_CTX_init (&ctx);
  HMAC_Init_ex (&ctx, &state_cookie->creation_time,
                sizeof (state_cookie->creation_time), md, NULL);
  HMAC_Update (&ctx, (const unsigned char *) &sctp_conn, sizeof (sctp_conn));
  HMAC_Final (&ctx, state_cookie->mac, &len);
  HMAC_CTX_cleanup (&ctx);
#endif
  ENDIANESS_SWAP (state_cookie->mac);
}
/**
 * Convert buffer to COOKIE_ACK
 *
 * Recycles @a b and pushes a COOKIE_ACK chunk addressed to the peer of
 * sub-connection @a idx.
 *
 * @param sctp_conn  connection the chunk is built for
 * @param idx        index of the sub-connection to use
 * @param b          buffer to recycle and fill
 */
void
sctp_prepare_cookie_ack_chunk (sctp_connection_t * sctp_conn, u8 idx,
                               vlib_buffer_t * b)
{
  vlib_main_t *vm = vlib_get_main ();
  u16 wire_bytes, chunk_len;
  sctp_cookie_ack_chunk_t *ack;

  sctp_reuse_buffer (vm, b);

  wire_bytes = sizeof (sctp_cookie_ack_chunk_t);

  /* RFC 4960: the chunk length excludes the common SCTP header and any
   * trailing padding, so capture it before padding is added */
  chunk_len = wire_bytes - sizeof (sctp_header_t);
  wire_bytes += vnet_sctp_calculate_padding (wire_bytes);

  ack = vlib_buffer_push_uninit (b, wire_bytes);

  /* Common header */
  ack->sctp_hdr.src_port = sctp_conn->sub_conn[idx].connection.lcl_port;
  ack->sctp_hdr.dst_port = sctp_conn->sub_conn[idx].connection.rmt_port;
  ack->sctp_hdr.verification_tag = sctp_conn->remote_tag;
  ack->sctp_hdr.checksum = 0;

  /* Chunk header */
  vnet_sctp_set_chunk_type (&ack->chunk_hdr, COOKIE_ACK);
  vnet_sctp_set_chunk_length (&ack->chunk_hdr, chunk_len);

  sctp_buffer_opaque (b)->sctp.subconn_idx = idx;
  sctp_buffer_opaque (b)->sctp.connection_index =
    sctp_conn->sub_conn[idx].connection.c_index;
}
/**
 * Convert buffer to COOKIE_ECHO
 *
 * Pushes a COOKIE_ECHO chunk carrying a copy of the connection's stored
 * cookie parameter onto @a b.
 *
 * @param sctp_conn     connection the chunk is built for
 * @param idx           index of the sub-connection to use
 * @param b             buffer receiving the chunk
 * @param reuse_buffer  non-zero recycles @a b first (sctp_reuse_buffer)
 */
void
sctp_prepare_cookie_echo_chunk (sctp_connection_t * sctp_conn, u8 idx,
                                vlib_buffer_t * b, u8 reuse_buffer)
{
  vlib_main_t *vm = vlib_get_main ();
  u16 wire_bytes, chunk_len;
  sctp_cookie_echo_chunk_t *echo;

  if (reuse_buffer)
    sctp_reuse_buffer (vm, b);

  /* The size of the message is given by sctp_cookie_echo_chunk_t */
  wire_bytes = sizeof (sctp_cookie_echo_chunk_t);

  /* RFC 4960: the chunk length excludes the common SCTP header and any
   * trailing padding, so capture it before padding is added */
  chunk_len = wire_bytes - sizeof (sctp_header_t);
  wire_bytes += vnet_sctp_calculate_padding (wire_bytes);

  echo = vlib_buffer_push_uninit (b, wire_bytes);

  /* Common header */
  echo->sctp_hdr.src_port = sctp_conn->sub_conn[idx].connection.lcl_port;
  echo->sctp_hdr.dst_port = sctp_conn->sub_conn[idx].connection.rmt_port;
  echo->sctp_hdr.verification_tag = sctp_conn->remote_tag;
  echo->sctp_hdr.checksum = 0;

  /* Chunk header */
  vnet_sctp_set_chunk_type (&echo->chunk_hdr, COOKIE_ECHO);
  vnet_sctp_set_chunk_length (&echo->chunk_hdr, chunk_len);

  /* Echo back the cookie stored on the connection */
  clib_memcpy_fast (&(echo->cookie), &sctp_conn->cookie_param,
                    sizeof (sctp_state_cookie_param_t));

  sctp_buffer_opaque (b)->sctp.subconn_idx = idx;
  sctp_buffer_opaque (b)->sctp.connection_index =
    sctp_conn->sub_conn[idx].connection.c_index;
}
/**
 * Send COOKIE_ECHO
 *
 * Builds a COOKIE_ECHO on a fresh buffer and sends it on the primary path,
 * then arms the T1_INIT timer, updates the connection state and records the
 * send time for RTT measurement.
 *
 * If the INIT retransmission budget is exhausted the connection is reported
 * as failed, its timers are reset, it is cleaned up, and nothing is sent.
 *
 * @param sctp_conn  connection to send the COOKIE_ECHO for
 */
void
sctp_send_cookie_echo (sctp_connection_t * sctp_conn)
{
  vlib_buffer_t *b;
  u32 bi;
  sctp_main_t *tm = vnet_get_sctp_main ();
  vlib_main_t *vm = vlib_get_main ();

  if (PREDICT_FALSE (sctp_conn->init_retransmit_err > SCTP_MAX_INIT_RETRANS))
    {
      clib_warning ("Reached MAX_INIT_RETRANS times. Aborting connection.");

      session_stream_connect_notify (&sctp_conn->sub_conn
                                     [SCTP_PRIMARY_PATH_IDX].connection, 1);

      sctp_connection_timers_reset (sctp_conn);

      sctp_connection_cleanup (sctp_conn);

      /* The connection has just been cleaned up: do not build a chunk for
       * it, re-arm its timer or touch its state any further. */
      return;
    }

  /* No buffer available: silently give up for this attempt */
  if (PREDICT_FALSE (sctp_get_free_buffer_index (tm, &bi)))
    return;

  b = vlib_get_buffer (vm, bi);
  u8 idx = SCTP_PRIMARY_PATH_IDX;

  sctp_init_buffer (vm, b);
  sctp_prepare_cookie_echo_chunk (sctp_conn, idx, b, 0);
  sctp_enqueue_to_output_now (vm, b, bi, sctp_conn->sub_conn[idx].c_is_ip4);

  /* Start the T1_INIT timer */
  sctp_timer_set (sctp_conn, idx, SCTP_TIMER_T1_INIT,
                  sctp_conn->sub_conn[idx].RTO);

  /* Change state to COOKIE_WAIT */
  sctp_conn->state = SCTP_STATE_COOKIE_WAIT;

  /* Measure RTT with this */
  sctp_conn->sub_conn[idx].rtt_ts = sctp_time_now ();
}
/**
 * Convert buffer to ERROR
 *
 * Recycles @a b and pushes an OPERATION_ERROR chunk carrying a single error
 * cause whose type is @a err_cause.
 *
 * @param sctp_conn  connection the chunk is built for
 * @param idx        index of the sub-connection to use
 * @param b          buffer to recycle and fill
 * @param err_cause  error cause code placed in the first cause entry
 */
void
sctp_prepare_operation_error (sctp_connection_t * sctp_conn, u8 idx,
                              vlib_buffer_t * b, u8 err_cause)
{
  vlib_main_t *vm = vlib_get_main ();
  u16 wire_bytes, chunk_len;
  sctp_operation_error_t *err_chunk;

  sctp_reuse_buffer (vm, b);

  /* Fixed part of the chunk plus one error cause entry */
  wire_bytes =
    sizeof (sctp_operation_error_t) + sizeof (sctp_err_cause_param_t);

  /* RFC 4960: the chunk length excludes the common SCTP header and any
   * trailing padding, so capture it before padding is added */
  chunk_len = wire_bytes - sizeof (sctp_header_t);
  wire_bytes += vnet_sctp_calculate_padding (wire_bytes);

  err_chunk = vlib_buffer_push_uninit (b, wire_bytes);

  /* Common header; src_port & dst_port are already in network byte-order */
  err_chunk->sctp_hdr.src_port = sctp_conn->sub_conn[idx].connection.lcl_port;
  err_chunk->sctp_hdr.dst_port = sctp_conn->sub_conn[idx].connection.rmt_port;
  /* The verification tag of this chunk is the connection's local tag */
  err_chunk->sctp_hdr.verification_tag = sctp_conn->local_tag;
  err_chunk->sctp_hdr.checksum = 0;

  /* First (and only) error cause: the length covers just the type and
   * length fields of the cause header */
  err_chunk->err_causes[0].param_hdr.type = clib_host_to_net_u16 (err_cause);
  err_chunk->err_causes[0].param_hdr.length =
    clib_host_to_net_u16 (sizeof (err_chunk->err_causes[0].param_hdr.type) +
                          sizeof (err_chunk->err_causes[0].param_hdr.length));

  /* Chunk header */
  vnet_sctp_set_chunk_type (&err_chunk->chunk_hdr, OPERATION_ERROR);
  vnet_sctp_set_chunk_length (&err_chunk->chunk_hdr, chunk_len);

  sctp_buffer_opaque (b)->sctp.subconn_idx = idx;
  sctp_buffer_opaque (b)->sctp.connection_index =
    sctp_conn->sub_conn[idx].connection.c_index;
}
/**
 * Convert buffer to ABORT
 *
 * Recycles @a b and pushes an ABORT chunk for sub-connection @a idx.
 *
 * @param sctp_conn  connection the chunk is built for
 * @param idx        index of the sub-connection to use
 * @param b          buffer to recycle and fill
 * @param ip4_addr   not used by this function
 * @param ip6_addr   not used by this function
 */
void
sctp_prepare_abort_for_collision (sctp_connection_t * sctp_conn, u8 idx,
                                  vlib_buffer_t * b, ip4_address_t * ip4_addr,
                                  ip6_address_t * ip6_addr)
{
  vlib_main_t *vm = vlib_get_main ();
  u16 wire_bytes, chunk_len;
  sctp_abort_chunk_t *abort_chunk;

  sctp_reuse_buffer (vm, b);

  /* The size of the message is given by sctp_abort_chunk_t */
  wire_bytes = sizeof (sctp_abort_chunk_t);

  /* RFC 4960: the chunk length excludes the common SCTP header and any
   * trailing padding, so capture it before padding is added */
  chunk_len = wire_bytes - sizeof (sctp_header_t);
  wire_bytes += vnet_sctp_calculate_padding (wire_bytes);

  abort_chunk = vlib_buffer_push_uninit (b, wire_bytes);

  /* Common header; src_port & dst_port are already in network byte-order */
  abort_chunk->sctp_hdr.src_port =
    sctp_conn->sub_conn[idx].connection.lcl_port;
  abort_chunk->sctp_hdr.dst_port =
    sctp_conn->sub_conn[idx].connection.rmt_port;
  /* As per RFC4960 Section 5.2.2: copy the INITIATE_TAG into the VERIFICATION_TAG of the ABORT chunk */
  abort_chunk->sctp_hdr.verification_tag = sctp_conn->local_tag;
  abort_chunk->sctp_hdr.checksum = 0;

  /* Chunk header */
  vnet_sctp_set_chunk_type (&abort_chunk->chunk_hdr, ABORT);
  vnet_sctp_set_chunk_length (&abort_chunk->chunk_hdr, chunk_len);

  sctp_buffer_opaque (b)->sctp.subconn_idx = idx;
  sctp_buffer_opaque (b)->sctp.connection_index =
    sctp_conn->sub_conn[idx].connection.c_index;
}
/**
 * Convert buffer to INIT-ACK (collision case)
 *
 * Recycles @a b and pushes an INIT_ACK made of, in this order: the fixed
 * INIT_ACK part, a State Cookie parameter, an IPv4 address parameter when
 * @a ip4_addr is non-NULL, an IPv6 address parameter when @a ip6_addr is
 * non-NULL, and one parameter holding the sub-connection's local address.
 * The initiate tag is the connection's existing local tag.
 *
 * @param sctp_conn  connection the chunk is built for
 * @param idx        index of the sub-connection to use
 * @param b          buffer to recycle and fill
 * @param ip4_addr   optional IPv4 address to advertise, or NULL
 * @param ip6_addr   optional IPv6 address to advertise, or NULL
 */
void
sctp_prepare_initack_chunk_for_collision (sctp_connection_t * sctp_conn,
                                          u8 idx, vlib_buffer_t * b,
                                          ip4_address_t * ip4_addr,
                                          ip6_address_t * ip6_addr)
{
  vlib_main_t *vm = vlib_get_main ();
  sctp_ipv4_addr_param_t *ip4_param = 0;
  sctp_ipv6_addr_param_t *ip6_param = 0;

  sctp_reuse_buffer (vm, b);

  /* The minimum size of the message is given by the sctp_init_ack_chunk_t */
  u16 alloc_bytes =
    sizeof (sctp_init_ack_chunk_t) + sizeof (sctp_state_cookie_param_t);

  if (PREDICT_TRUE (ip4_addr != NULL))
    {
      /* Create room for variable-length fields in the INIT_ACK chunk */
      alloc_bytes += SCTP_IPV4_ADDRESS_TYPE_LENGTH;
    }
  if (PREDICT_TRUE (ip6_addr != NULL))
    {
      /* Create room for variable-length fields in the INIT_ACK chunk */
      alloc_bytes += SCTP_IPV6_ADDRESS_TYPE_LENGTH;
    }

  /* Room for the local address parameter */
  if (sctp_conn->sub_conn[idx].connection.is_ip4)
    alloc_bytes += sizeof (sctp_ipv4_addr_param_t);
  else
    alloc_bytes += sizeof (sctp_ipv6_addr_param_t);

  /* As per RFC 4960 the chunk_length value does NOT contemplate
   * the size of the first header (see sctp_header_t) and any padding
   */
  u16 chunk_len = alloc_bytes - sizeof (sctp_header_t);

  alloc_bytes += vnet_sctp_calculate_padding (alloc_bytes);

  sctp_init_ack_chunk_t *init_ack_chunk =
    vlib_buffer_push_uninit (b, alloc_bytes);

  /* pointer_offset is a BYTE offset from the start of the chunk; every
   * parameter pointer below is therefore derived through a char pointer. */
  u16 pointer_offset = sizeof (sctp_init_ack_chunk_t);

  /* Create State Cookie parameter */
  sctp_state_cookie_param_t *state_cookie_param =
    (sctp_state_cookie_param_t *) ((char *) init_ack_chunk + pointer_offset);

  state_cookie_param->param_hdr.type =
    clib_host_to_net_u16 (SCTP_STATE_COOKIE_TYPE);
  state_cookie_param->param_hdr.length =
    clib_host_to_net_u16 (sizeof (sctp_state_cookie_param_t));
  state_cookie_param->creation_time = clib_host_to_net_u64 (sctp_time_now ());
  state_cookie_param->cookie_lifespan =
    clib_host_to_net_u32 (SCTP_VALID_COOKIE_LIFE);

  sctp_compute_mac (sctp_conn, state_cookie_param);

  pointer_offset += sizeof (sctp_state_cookie_param_t);

  if (PREDICT_TRUE (ip4_addr != NULL))
    {
      sctp_ipv4_addr_param_t *ipv4_addr =
        (sctp_ipv4_addr_param_t *) ((char *) init_ack_chunk + pointer_offset);

      ipv4_addr->param_hdr.type =
        clib_host_to_net_u16 (SCTP_IPV4_ADDRESS_TYPE);
      ipv4_addr->param_hdr.length =
        clib_host_to_net_u16 (SCTP_IPV4_ADDRESS_TYPE_LENGTH);
      ipv4_addr->address.as_u32 = ip4_addr->as_u32;

      pointer_offset += SCTP_IPV4_ADDRESS_TYPE_LENGTH;
    }
  if (PREDICT_TRUE (ip6_addr != NULL))
    {
      sctp_ipv6_addr_param_t *ipv6_addr =
        (sctp_ipv6_addr_param_t *) ((char *) init_ack_chunk + pointer_offset);

      ipv6_addr->param_hdr.type =
        clib_host_to_net_u16 (SCTP_IPV6_ADDRESS_TYPE);
      ipv6_addr->param_hdr.length =
        clib_host_to_net_u16 (SCTP_IPV6_ADDRESS_TYPE_LENGTH);
      ipv6_addr->address.as_u64[0] = ip6_addr->as_u64[0];
      ipv6_addr->address.as_u64[1] = ip6_addr->as_u64[1];

      pointer_offset += SCTP_IPV6_ADDRESS_TYPE_LENGTH;
    }

  /* Local address of the sub-connection.
   * NOTE(review): only the address is written; param_hdr type/length of
   * this parameter are left as pushed (uninitialised) - confirm. */
  if (sctp_conn->sub_conn[idx].connection.is_ip4)
    {
      ip4_param =
        (sctp_ipv4_addr_param_t *) ((char *) init_ack_chunk + pointer_offset);
      ip4_param->address.as_u32 =
        sctp_conn->sub_conn[idx].connection.lcl_ip.ip4.as_u32;

      pointer_offset += sizeof (sctp_ipv4_addr_param_t);
    }
  else
    {
      ip6_param =
        (sctp_ipv6_addr_param_t *) ((char *) init_ack_chunk + pointer_offset);
      ip6_param->address.as_u64[0] =
        sctp_conn->sub_conn[idx].connection.lcl_ip.ip6.as_u64[0];
      ip6_param->address.as_u64[1] =
        sctp_conn->sub_conn[idx].connection.lcl_ip.ip6.as_u64[1];

      pointer_offset += sizeof (sctp_ipv6_addr_param_t);
    }

  /* src_port & dst_port are already in network byte-order */
  init_ack_chunk->sctp_hdr.checksum = 0;
  init_ack_chunk->sctp_hdr.src_port =
    sctp_conn->sub_conn[idx].connection.lcl_port;
  init_ack_chunk->sctp_hdr.dst_port =
    sctp_conn->sub_conn[idx].connection.rmt_port;
  /* the sctp_conn->verification_tag is already in network byte-order (being a copy of the init_tag coming with the INIT chunk) */
  init_ack_chunk->sctp_hdr.verification_tag = sctp_conn->remote_tag;
  init_ack_chunk->initial_tsn =
    clib_host_to_net_u32 (sctp_conn->local_initial_tsn);
  SCTP_CONN_TRACKING_DBG ("init_ack_chunk->initial_tsn = %u",
                          init_ack_chunk->initial_tsn);

  vnet_sctp_set_chunk_type (&init_ack_chunk->chunk_hdr, INIT_ACK);
  vnet_sctp_set_chunk_length (&init_ack_chunk->chunk_hdr, chunk_len);

  /* Collision: keep using the tag already assigned to this connection */
  init_ack_chunk->initiate_tag = sctp_conn->local_tag;

  init_ack_chunk->a_rwnd =
    clib_host_to_net_u32 (sctp_conn->sub_conn[idx].cwnd);
  init_ack_chunk->inboud_streams_count =
    clib_host_to_net_u16 (INBOUND_STREAMS_COUNT);
  init_ack_chunk->outbound_streams_count =
    clib_host_to_net_u16 (OUTBOUND_STREAMS_COUNT);

  sctp_buffer_opaque (b)->sctp.connection_index =
    sctp_conn->sub_conn[idx].connection.c_index;
  sctp_buffer_opaque (b)->sctp.subconn_idx = idx;
}
/**
 * Convert buffer to INIT-ACK
 *
 * Recycles @a b and pushes an INIT_ACK made of, in this order: the fixed
 * INIT_ACK part, a State Cookie parameter, an optional IPv4 address
 * parameter, an optional IPv6 address parameter, and one parameter holding
 * the sub-connection's local address. A new random initiate tag is generated
 * and stored as the connection's local tag.
 *
 * An optional address parameter is emitted only when its add flag is 1 AND
 * its address pointer is non-NULL; the same predicate drives both the space
 * reservation and the write, so the chunk never outgrows its allocation.
 *
 * @param sctp_conn  connection the chunk is built for
 * @param idx        index of the sub-connection to use
 * @param b          buffer to recycle and fill
 * @param ip4_addr   IPv4 address to advertise (used when @a add_ip4 is 1)
 * @param add_ip4    1 to include the IPv4 address parameter
 * @param ip6_addr   IPv6 address to advertise (used when @a add_ip6 is 1)
 * @param add_ip6    1 to include the IPv6 address parameter
 */
void
sctp_prepare_initack_chunk (sctp_connection_t * sctp_conn, u8 idx,
                            vlib_buffer_t * b, ip4_address_t * ip4_addr,
                            u8 add_ip4, ip6_address_t * ip6_addr, u8 add_ip6)
{
  vlib_main_t *vm = vlib_get_main ();
  sctp_ipv4_addr_param_t *ip4_param = 0;
  sctp_ipv6_addr_param_t *ip6_param = 0;
  u32 random_seed = random_default_seed ();
  /* Single source of truth for "is this optional parameter present" */
  const u8 emit_ip4 = (add_ip4 == 1) && (ip4_addr != NULL);
  const u8 emit_ip6 = (add_ip6 == 1) && (ip6_addr != NULL);

  sctp_reuse_buffer (vm, b);

  /* The minimum size of the message is given by the sctp_init_ack_chunk_t */
  u16 alloc_bytes =
    sizeof (sctp_init_ack_chunk_t) + sizeof (sctp_state_cookie_param_t);

  if (PREDICT_FALSE (emit_ip4))
    {
      /* Create room for variable-length fields in the INIT_ACK chunk */
      alloc_bytes += SCTP_IPV4_ADDRESS_TYPE_LENGTH;
    }
  if (PREDICT_FALSE (emit_ip6))
    {
      /* Create room for variable-length fields in the INIT_ACK chunk */
      alloc_bytes += SCTP_IPV6_ADDRESS_TYPE_LENGTH;
    }

  /* Room for the local address parameter */
  if (sctp_conn->sub_conn[idx].connection.is_ip4)
    alloc_bytes += sizeof (sctp_ipv4_addr_param_t);
  else
    alloc_bytes += sizeof (sctp_ipv6_addr_param_t);

  /* As per RFC 4960 the chunk_length value does NOT contemplate
   * the size of the first header (see sctp_header_t) and any padding
   */
  u16 chunk_len = alloc_bytes - sizeof (sctp_header_t);

  alloc_bytes += vnet_sctp_calculate_padding (alloc_bytes);

  sctp_init_ack_chunk_t *init_ack_chunk =
    vlib_buffer_push_uninit (b, alloc_bytes);

  /* pointer_offset is a BYTE offset from the start of the chunk; every
   * parameter pointer below is therefore derived through a char pointer. */
  u16 pointer_offset = sizeof (sctp_init_ack_chunk_t);

  /* Create State Cookie parameter */
  sctp_state_cookie_param_t *state_cookie_param =
    (sctp_state_cookie_param_t *) ((char *) init_ack_chunk + pointer_offset);

  state_cookie_param->param_hdr.type =
    clib_host_to_net_u16 (SCTP_STATE_COOKIE_TYPE);
  state_cookie_param->param_hdr.length =
    clib_host_to_net_u16 (sizeof (sctp_state_cookie_param_t));
  state_cookie_param->creation_time = clib_host_to_net_u64 (sctp_time_now ());
  state_cookie_param->cookie_lifespan =
    clib_host_to_net_u32 (SCTP_VALID_COOKIE_LIFE);

  sctp_compute_mac (sctp_conn, state_cookie_param);

  pointer_offset += sizeof (sctp_state_cookie_param_t);

  if (PREDICT_FALSE (emit_ip4))
    {
      sctp_ipv4_addr_param_t *ipv4_addr =
        (sctp_ipv4_addr_param_t *) ((char *) init_ack_chunk + pointer_offset);

      ipv4_addr->param_hdr.type =
        clib_host_to_net_u16 (SCTP_IPV4_ADDRESS_TYPE);
      ipv4_addr->param_hdr.length =
        clib_host_to_net_u16 (SCTP_IPV4_ADDRESS_TYPE_LENGTH);
      ipv4_addr->address.as_u32 = ip4_addr->as_u32;

      pointer_offset += SCTP_IPV4_ADDRESS_TYPE_LENGTH;
    }
  if (PREDICT_FALSE (emit_ip6))
    {
      sctp_ipv6_addr_param_t *ipv6_addr =
        (sctp_ipv6_addr_param_t *) ((char *) init_ack_chunk + pointer_offset);

      ipv6_addr->param_hdr.type =
        clib_host_to_net_u16 (SCTP_IPV6_ADDRESS_TYPE);
      ipv6_addr->param_hdr.length =
        clib_host_to_net_u16 (SCTP_IPV6_ADDRESS_TYPE_LENGTH);
      ipv6_addr->address.as_u64[0] = ip6_addr->as_u64[0];
      ipv6_addr->address.as_u64[1] = ip6_addr->as_u64[1];

      pointer_offset += SCTP_IPV6_ADDRESS_TYPE_LENGTH;
    }

  /* Local address of the sub-connection.
   * NOTE(review): only the address is written; param_hdr type/length of
   * this parameter are left as pushed (uninitialised) - confirm. */
  if (sctp_conn->sub_conn[idx].connection.is_ip4)
    {
      ip4_param =
        (sctp_ipv4_addr_param_t *) ((char *) init_ack_chunk + pointer_offset);
      ip4_param->address.as_u32 =
        sctp_conn->sub_conn[idx].connection.lcl_ip.ip4.as_u32;

      pointer_offset += sizeof (sctp_ipv4_addr_param_t);
    }
  else
    {
      ip6_param =
        (sctp_ipv6_addr_param_t *) ((char *) init_ack_chunk + pointer_offset);
      ip6_param->address.as_u64[0] =
        sctp_conn->sub_conn[idx].connection.lcl_ip.ip6.as_u64[0];
      ip6_param->address.as_u64[1] =
        sctp_conn->sub_conn[idx].connection.lcl_ip.ip6.as_u64[1];

      pointer_offset += sizeof (sctp_ipv6_addr_param_t);
    }

  /* src_port & dst_port are already in network byte-order */
  init_ack_chunk->sctp_hdr.checksum = 0;
  init_ack_chunk->sctp_hdr.src_port =
    sctp_conn->sub_conn[idx].connection.lcl_port;
  init_ack_chunk->sctp_hdr.dst_port =
    sctp_conn->sub_conn[idx].connection.rmt_port;
  /* the sctp_conn->verification_tag is already in network byte-order (being a copy of the init_tag coming with the INIT chunk) */
  init_ack_chunk->sctp_hdr.verification_tag = sctp_conn->remote_tag;
  init_ack_chunk->initial_tsn =
    clib_host_to_net_u32 (sctp_conn->local_initial_tsn);
  SCTP_CONN_TRACKING_DBG ("init_ack_chunk->initial_tsn = %u",
                          init_ack_chunk->initial_tsn);

  vnet_sctp_set_chunk_type (&init_ack_chunk->chunk_hdr, INIT_ACK);
  vnet_sctp_set_chunk_length (&init_ack_chunk->chunk_hdr, chunk_len);

  init_ack_chunk->initiate_tag =
    clib_host_to_net_u32 (random_u32 (&random_seed));

  init_ack_chunk->a_rwnd =
    clib_host_to_net_u32 (sctp_conn->sub_conn[idx].cwnd);
  init_ack_chunk->inboud_streams_count =
    clib_host_to_net_u16 (INBOUND_STREAMS_COUNT);
  init_ack_chunk->outbound_streams_count =
    clib_host_to_net_u16 (OUTBOUND_STREAMS_COUNT);

  /* Remember the tag we advertised (kept in network byte order) */
  sctp_conn->local_tag = init_ack_chunk->initiate_tag;

  sctp_buffer_opaque (b)->sctp.connection_index =
    sctp_conn->sub_conn[idx].connection.c_index;
  sctp_buffer_opaque (b)->sctp.subconn_idx = idx;
}
/**
 * Convert buffer to SHUTDOWN
 *
 * Pushes a SHUTDOWN chunk onto @a b; the cumulative TSN ack field is set
 * from the connection's last received TSN.
 *
 * @param sctp_conn  connection the chunk is built for
 * @param idx        index of the sub-connection to use
 * @param b          buffer receiving the chunk (not recycled here)
 */
void
sctp_prepare_shutdown_chunk (sctp_connection_t * sctp_conn, u8 idx,
                             vlib_buffer_t * b)
{
  u16 wire_bytes, chunk_len;
  sctp_shutdown_association_chunk_t *shutdown;

  wire_bytes = sizeof (sctp_shutdown_association_chunk_t);

  /* RFC 4960: the chunk length excludes the common SCTP header and any
   * trailing padding, so capture it before padding is added */
  chunk_len = wire_bytes - sizeof (sctp_header_t);
  wire_bytes += vnet_sctp_calculate_padding (wire_bytes);

  shutdown = vlib_buffer_push_uninit (b, wire_bytes);

  /* Common header; ports need no host_to_net conversion, they are
   * already in net-byte order */
  shutdown->sctp_hdr.src_port = sctp_conn->sub_conn[idx].connection.lcl_port;
  shutdown->sctp_hdr.dst_port = sctp_conn->sub_conn[idx].connection.rmt_port;
  shutdown->sctp_hdr.verification_tag = sctp_conn->remote_tag;
  shutdown->sctp_hdr.checksum = 0;

  /* Chunk header */
  vnet_sctp_set_chunk_type (&shutdown->chunk_hdr, SHUTDOWN);
  vnet_sctp_set_chunk_length (&shutdown->chunk_hdr, chunk_len);

  shutdown->cumulative_tsn_ack = sctp_conn->last_rcvd_tsn;

  sctp_buffer_opaque (b)->sctp.subconn_idx = idx;
  sctp_buffer_opaque (b)->sctp.connection_index =
    sctp_conn->sub_conn[idx].connection.c_index;
}
/**
 * Send SHUTDOWN
 *
 * Builds a SHUTDOWN chunk on a fresh buffer and sends it on the primary
 * path. Nothing is sent while data chunks are still outstanding, or when no
 * buffer can be obtained.
 *
 * @param sctp_conn  connection to shut down
 */
void
sctp_send_shutdown (sctp_connection_t * sctp_conn)
{
  sctp_main_t *tm = vnet_get_sctp_main ();
  vlib_main_t *vm = vlib_get_main ();
  vlib_buffer_t *b;
  u32 bi;
  u8 idx;

  /* Outstanding data must be dealt with before shutting down */
  if (sctp_check_outstanding_data_chunks (sctp_conn) > 0)
    return;

  if (PREDICT_FALSE (sctp_get_free_buffer_index (tm, &bi)))
    return;

  idx = SCTP_PRIMARY_PATH_IDX;
  b = vlib_get_buffer (vm, bi);

  sctp_init_buffer (vm, b);
  sctp_prepare_shutdown_chunk (sctp_conn, idx, b);

  sctp_enqueue_to_output_now (vm, b, bi,
                              sctp_conn->sub_conn[idx].connection.is_ip4);
}
/**
 * Convert buffer to SHUTDOWN_ACK
 *
 * Pushes a SHUTDOWN_ACK chunk onto @a b. The chunk is sized from
 * sctp_shutdown_ack_chunk_t (the structure actually written), and, as for
 * every other chunk built in this file, the chunk length is taken before
 * padding is added.
 *
 * @param sctp_conn  connection the chunk is built for
 * @param idx        index of the sub-connection to use
 * @param b          buffer receiving the chunk (not recycled here)
 */
void
sctp_prepare_shutdown_ack_chunk (sctp_connection_t * sctp_conn, u8 idx,
                                 vlib_buffer_t * b)
{
  u16 alloc_bytes = sizeof (sctp_shutdown_ack_chunk_t);

  /* As per RFC 4960 the chunk_length value does NOT contemplate
   * the size of the first header (see sctp_header_t) and any padding
   */
  u16 chunk_len = alloc_bytes - sizeof (sctp_header_t);

  alloc_bytes += vnet_sctp_calculate_padding (alloc_bytes);

  sctp_shutdown_ack_chunk_t *shutdown_ack_chunk =
    vlib_buffer_push_uninit (b, alloc_bytes);

  shutdown_ack_chunk->sctp_hdr.checksum = 0;
  /* No need of host_to_net conversion, already in net-byte order */
  shutdown_ack_chunk->sctp_hdr.src_port =
    sctp_conn->sub_conn[idx].connection.lcl_port;
  shutdown_ack_chunk->sctp_hdr.dst_port =
    sctp_conn->sub_conn[idx].connection.rmt_port;
  shutdown_ack_chunk->sctp_hdr.verification_tag = sctp_conn->remote_tag;

  vnet_sctp_set_chunk_type (&shutdown_ack_chunk->chunk_hdr, SHUTDOWN_ACK);
  vnet_sctp_set_chunk_length (&shutdown_ack_chunk->chunk_hdr, chunk_len);

  sctp_buffer_opaque (b)->sctp.connection_index =
    sctp_conn->sub_conn[idx].connection.c_index;
  sctp_buffer_opaque (b)->sctp.subconn_idx = idx;
}
/*
 * Send SHUTDOWN_ACK
 *
 * Recycles the supplied buffer and rewrites it as a SHUTDOWN_ACK chunk.
 * The buffer is left untouched when
 * sctp_check_outstanding_data_chunks() reports a value greater than zero.
 *
 * @param sctp_conn connection the SHUTDOWN_ACK belongs to
 * @param idx       sub-connection index used to build the chunk
 * @param b         buffer to be reused for the chunk
 */
void
sctp_send_shutdown_ack (sctp_connection_t * sctp_conn, u8 idx,
			vlib_buffer_t * b)
{
  vlib_main_t *vm = vlib_get_main ();

  if (!(sctp_check_outstanding_data_chunks (sctp_conn) > 0))
    {
      sctp_reuse_buffer (vm, b);
      sctp_prepare_shutdown_ack_chunk (sctp_conn, idx, b);
    }
}
/**
 * Convert buffer to SACK
 *
 * Recycles the buffer, reserves room for a selective-ack chunk and fills
 * in the SCTP common header, the chunk header and the cumulative TSN ack
 * (taken from next_tsn_expected). Also clears the connection's ack_state
 * and stores the connection / sub-connection indices in the buffer
 * opaque data.
 *
 * @param sctp_conn connection the SACK is generated for
 * @param idx       index of the sub-connection supplying ports and c_index
 * @param b         buffer to be reused for the chunk
 */
void
sctp_prepare_sack_chunk (sctp_connection_t * sctp_conn, u8 idx,
			 vlib_buffer_t * b)
{
  vlib_main_t *vm = vlib_get_main ();
  sctp_selective_ack_chunk_t *sack;
  u16 wire_bytes = sizeof (sctp_selective_ack_chunk_t);
  /* RFC 4960: the chunk length field excludes the leading common header
   * (sctp_header_t) as well as any trailing padding, so it is derived
   * before the padding is accounted for.
   */
  const u16 length_field = wire_bytes - sizeof (sctp_header_t);

  sctp_reuse_buffer (vm, b);

  wire_bytes += vnet_sctp_calculate_padding (wire_bytes);
  sack = vlib_buffer_push_uninit (b, wire_bytes);

  /* Common header */
  sack->sctp_hdr.src_port = sctp_conn->sub_conn[idx].connection.lcl_port;
  sack->sctp_hdr.dst_port = sctp_conn->sub_conn[idx].connection.rmt_port;
  sack->sctp_hdr.verification_tag = sctp_conn->remote_tag;
  sack->sctp_hdr.checksum = 0;

  /* Chunk header and body */
  vnet_sctp_set_chunk_type (&sack->chunk_hdr, SACK);
  vnet_sctp_set_chunk_length (&sack->chunk_hdr, length_field);
  sack->cumulative_tsn_ack = sctp_conn->next_tsn_expected;

  sctp_conn->ack_state = 0;

  sctp_buffer_opaque (b)->sctp.subconn_idx = idx;
  sctp_buffer_opaque (b)->sctp.connection_index =
    sctp_conn->sub_conn[idx].connection.c_index;
}
/**
 * Convert buffer to HEARTBEAT_ACK
 *
 * Recycles the buffer, reserves room for a heartbeat-ack chunk and fills
 * in the SCTP common header, the heartbeat-info parameter header and the
 * chunk header. The connection / sub-connection indices are stored in
 * the buffer opaque data.
 *
 * @param sctp_conn connection the HEARTBEAT_ACK is generated for
 * @param idx       index of the sub-connection supplying ports and c_index
 * @param b         buffer to be reused for the chunk
 */
void
sctp_prepare_heartbeat_ack_chunk (sctp_connection_t * sctp_conn, u8 idx,
				  vlib_buffer_t * b)
{
  vlib_main_t *vm = vlib_get_main ();
  sctp_hb_ack_chunk_t *ack;
  u16 wire_bytes = sizeof (sctp_hb_ack_chunk_t);
  u16 length_field;

  sctp_reuse_buffer (vm, b);

  /* RFC 4960: the chunk length field excludes the leading common header
   * (sctp_header_t) as well as any trailing padding.
   */
  length_field = wire_bytes - sizeof (sctp_header_t);
  wire_bytes += vnet_sctp_calculate_padding (wire_bytes);

  ack = vlib_buffer_push_uninit (b, wire_bytes);

  /* Ports are stored in network byte order already; copy them verbatim */
  ack->sctp_hdr.src_port = sctp_conn->sub_conn[idx].connection.lcl_port;
  ack->sctp_hdr.dst_port = sctp_conn->sub_conn[idx].connection.rmt_port;
  ack->sctp_hdr.verification_tag = sctp_conn->remote_tag;
  ack->sctp_hdr.checksum = 0;

  /* Heartbeat-info parameter header: type 1, length of the info field */
  ack->hb_info.param_hdr.type = clib_host_to_net_u16 (1);
  ack->hb_info.param_hdr.length =
    clib_host_to_net_u16 (sizeof (ack->hb_info.hb_info));

  vnet_sctp_set_chunk_type (&ack->chunk_hdr, HEARTBEAT_ACK);
  vnet_sctp_set_chunk_length (&ack->chunk_hdr, length_field);

  sctp_buffer_opaque (b)->sctp.subconn_idx = idx;
  sctp_buffer_opaque (b)->sctp.connection_index =
    sctp_conn->sub_conn[idx].connection.c_index;
}
/**
 * Convert buffer to HEARTBEAT
 *
 * Reserves room in the buffer for a heartbeat-request chunk and fills in
 * the SCTP common header, the heartbeat-info parameter header and the
 * chunk header. The connection / sub-connection indices are stored in
 * the buffer opaque data.
 *
 * @param sctp_conn connection the HEARTBEAT is generated for
 * @param idx       index of the sub-connection supplying ports and c_index
 * @param b         buffer that receives the chunk
 */
void
sctp_prepare_heartbeat_chunk (sctp_connection_t * sctp_conn, u8 idx,
			      vlib_buffer_t * b)
{
  sctp_hb_req_chunk_t *req;
  u16 wire_bytes = sizeof (sctp_hb_req_chunk_t);
  /* RFC 4960: the chunk length field excludes the leading common header
   * (sctp_header_t) as well as any trailing padding.
   */
  const u16 length_field = wire_bytes - sizeof (sctp_header_t);

  wire_bytes += vnet_sctp_calculate_padding (wire_bytes);
  req = vlib_buffer_push_uninit (b, wire_bytes);

  /* Ports are stored in network byte order already; copy them verbatim */
  req->sctp_hdr.src_port = sctp_conn->sub_conn[idx].connection.lcl_port;
  req->sctp_hdr.dst_port = sctp_conn->sub_conn[idx].connection.rmt_port;
  req->sctp_hdr.verification_tag = sctp_conn->remote_tag;
  req->sctp_hdr.checksum = 0;

  /* Heartbeat-info parameter header: type 1, length of the info field */
  req->hb_info.param_hdr.type = clib_host_to_net_u16 (1);
  req->hb_info.param_hdr.length =
    clib_host_to_net_u16 (sizeof (req->hb_info.hb_info));

  vnet_sctp_set_chunk_type (&req->chunk_hdr, HEARTBEAT);
  vnet_sctp_set_chunk_length (&req->chunk_hdr, length_field);

  sctp_buffer_opaque (b)->sctp.subconn_idx = idx;
  sctp_buffer_opaque (b)->sctp.connection_index =
    sctp_conn->sub_conn[idx].connection.c_index;
}
/**
 * Send HEARTBEAT on every eligible sub-connection
 *
 * Walks all MAX_SCTP_CONNECTIONS sub-connection slots. A slot is skipped
 * when its state is SCTP_SUBCONN_STATE_DOWN or when the current time is
 * not later than last_seen + SCTP_HB_INTERVAL. For each remaining slot a
 * HEARTBEAT chunk is built in a new buffer, enqueued to output, and the
 * slot's unacknowledged_hb counter is incremented.
 *
 * The walk stops as soon as no free buffer index can be obtained.
 *
 * @param sctp_conn connection whose sub-connections are probed
 */
void
sctp_send_heartbeat (sctp_connection_t * sctp_conn)
{
  sctp_main_t *sm = vnet_get_sctp_main ();
  vlib_main_t *vm = vlib_get_main ();
  u64 now = sctp_time_now ();
  u8 path;

  for (path = 0; path < MAX_SCTP_CONNECTIONS; path++)
    {
      vlib_buffer_t *hb_buf;
      u32 hb_bi;

      if (sctp_conn->sub_conn[path].state == SCTP_SUBCONN_STATE_DOWN)
	continue;

      /* Heartbeat interval has not elapsed on this path yet */
      if (!(now > (sctp_conn->sub_conn[path].last_seen + SCTP_HB_INTERVAL)))
	continue;

      if (PREDICT_FALSE (sctp_get_free_buffer_index (sm, &hb_bi)))
	return;

      hb_buf = vlib_get_buffer (vm, hb_bi);
      sctp_init_buffer (vm, hb_buf);
      sctp_prepare_heartbeat_chunk (sctp_conn, path, hb_buf);
      sctp_enqueue_to_output_now (vm, hb_buf, hb_bi,
				  sctp_conn->sub_conn[path].
				  connection.is_ip4);

      sctp_conn->sub_conn[path].unacknowledged_hb += 1;
    }
}
/**
 * Convert buffer to SHUTDOWN_COMPLETE
 *
 * Reserves room in the buffer for the SCTP common header followed by a
 * SHUTDOWN_COMPLETE chunk header, fills both in and records the
 * connection and sub-connection indices in the buffer opaque data.
 *
 * @param sctp_conn connection the chunk is sent on
 * @param idx       index of the sub-connection supplying ports and c_index
 * @param b         buffer that receives the chunk
 */
void
sctp_prepare_shutdown_complete_chunk (sctp_connection_t * sctp_conn, u8 idx,
				      vlib_buffer_t * b)
{
  /* Size the allocation from the type that is actually written through.
   * RFC 4960 section 3.3.13 defines SHUTDOWN COMPLETE as a chunk header
   * only (chunk length 4), so the SHUTDOWN layout must not be used here.
   */
  u16 alloc_bytes = sizeof (sctp_shutdown_complete_chunk_t);
  /* As per RFC 4960 the chunk_length value does NOT contemplate
   * the size of the first header (see sctp_header_t) and any padding
   */
  u16 chunk_len = alloc_bytes - sizeof (sctp_header_t);
  alloc_bytes += vnet_sctp_calculate_padding (alloc_bytes);

  sctp_shutdown_complete_chunk_t *shutdown_complete =
    vlib_buffer_push_uninit (b, alloc_bytes);

  shutdown_complete->sctp_hdr.checksum = 0;
  /* No need of host_to_net conversion, already in net-byte order */
  shutdown_complete->sctp_hdr.src_port =
    sctp_conn->sub_conn[idx].connection.lcl_port;
  shutdown_complete->sctp_hdr.dst_port =
    sctp_conn->sub_conn[idx].connection.rmt_port;
  shutdown_complete->sctp_hdr.verification_tag = sctp_conn->remote_tag;

  vnet_sctp_set_chunk_type (&shutdown_complete->chunk_hdr, SHUTDOWN_COMPLETE);
  vnet_sctp_set_chunk_length (&shutdown_complete->chunk_hdr, chunk_len);

  sctp_buffer_opaque (b)->sctp.connection_index =
    sctp_conn->sub_conn[idx].connection.c_index;
  sctp_buffer_opaque (b)->sctp.subconn_idx = idx;
}
/**
 * Send SHUTDOWN_COMPLETE
 *
 * Recycles the supplied buffer and rewrites it as a SHUTDOWN_COMPLETE
 * chunk. The buffer is left untouched when
 * sctp_check_outstanding_data_chunks() reports a value greater than zero.
 *
 * @param sctp_conn connection the SHUTDOWN_COMPLETE belongs to
 * @param idx       sub-connection index used to build the chunk
 * @param b0        buffer to be reused for the chunk
 */
void
sctp_send_shutdown_complete (sctp_connection_t * sctp_conn, u8 idx,
			     vlib_buffer_t * b0)
{
  vlib_main_t *vm = vlib_get_main ();

  if (!(sctp_check_outstanding_data_chunks (sctp_conn) > 0))
    {
      sctp_reuse_buffer (vm, b0);
      sctp_prepare_shutdown_complete_chunk (sctp_conn, idx, b0);
    }
}
/*
 * Send INIT
 *
 * When init_retransmit_err exceeds SCTP_MAX_INIT_RETRANS the connect
 * attempt is reported as failed to the session layer, the connection
 * timers are reset and the connection is cleaned up.
 *
 * Otherwise an INIT chunk is built on the primary sub-connection, an IP
 * header is pushed and the buffer is handed to ip-lookup. The T1_INIT
 * timer is then armed with the sub-connection RTO, the connection moves
 * to COOKIE_WAIT and the send time is stored in rtt_ts.
 *
 * Returns silently when no free buffer index can be obtained.
 *
 * @param sctp_conn connection to initiate
 */
void
sctp_send_init (sctp_connection_t * sctp_conn)
{
  const u8 path = SCTP_PRIMARY_PATH_IDX;
  sctp_main_t *sm = vnet_get_sctp_main ();
  vlib_main_t *vm = vlib_get_main ();
  vlib_buffer_t *init_buf;
  u32 init_bi;

  if (PREDICT_FALSE (sctp_conn->init_retransmit_err > SCTP_MAX_INIT_RETRANS))
    {
      clib_warning ("Reached MAX_INIT_RETRANS times. Aborting connection.");
      session_stream_connect_notify (&sctp_conn->sub_conn[path].connection,
				     1);
      sctp_connection_timers_reset (sctp_conn);
      sctp_connection_cleanup (sctp_conn);
      return;
    }

  if (PREDICT_FALSE (sctp_get_free_buffer_index (sm, &init_bi)))
    return;

  init_buf = vlib_get_buffer (vm, init_bi);
  sctp_init_buffer (vm, init_buf);
  sctp_prepare_init_chunk (sctp_conn, path, init_buf);
  sctp_push_ip_hdr (sm, &sctp_conn->sub_conn[path], init_buf);
  sctp_enqueue_to_ip_lookup (vm, init_buf, init_bi,
			     sctp_conn->sub_conn[path].c_is_ip4,
			     sctp_conn->sub_conn[path].c_fib_index);

  /* Arm T1_INIT using the current RTO of the primary path */
  sctp_timer_set (sctp_conn, path, SCTP_TIMER_T1_INIT,
		  sctp_conn->sub_conn[path].RTO);

  /* INIT is on its way: wait for the peer's answer */
  sctp_conn->state = SCTP_STATE_COOKIE_WAIT;

  /* Timestamp used to measure the RTT of this exchange */
  sctp_conn->sub_conn[path].rtt_ts = sctp_time_now ();
}
/**
 * Push SCTP header and update connection variables
 *
 * Zero-pads the payload already present in the buffer, prepends the SCTP
 * common header plus a DATA chunk header on the sub-connection chosen by
 * sctp_data_subconn_select(), then advances the sender state (next_tsn,
 * last_unacked_tsn, cwnd, partially_acked_bytes, last_data_ts) and
 * records the connection / sub-connection indices in the buffer opaque
 * data.
 *
 * @param sctp_conn  connection the data is sent on
 * @param b          buffer holding the payload; the headers are pushed
 *                   in front of it
 * @param next_state currently unused
 */
static void
sctp_push_hdr_i (sctp_connection_t * sctp_conn, vlib_buffer_t * b,
		 sctp_state_t next_state)
{
  u16 data_len = b->current_length;
  if (b->flags & VLIB_BUFFER_TOTAL_LENGTH_VALID)
    data_len += b->total_length_not_including_first_buffer;

  ASSERT (!b->total_length_not_including_first_buffer
	  || (b->flags & VLIB_BUFFER_NEXT_PRESENT)
	  || !(b->flags & VLIB_BUFFER_TOTAL_LENGTH_VALID));

  SCTP_ADV_DBG_OUTPUT ("b->current_length = %u, "
		       "b->current_data = %p "
		       "data_len = %u",
		       b->current_length, b->current_data, data_len);

  /* Padding is appended (and zeroed) but deliberately left out of
   * data_len, so it is not counted in the chunk length below.
   */
  u16 data_padding = vnet_sctp_calculate_padding (b->current_length);
  if (data_padding > 0)
    {
      u8 *p_tail = vlib_buffer_put_uninit (b, data_padding);
      clib_memset_u8 (p_tail, 0, data_padding);
    }

  u16 bytes_to_add = sizeof (sctp_payload_data_chunk_t);
  /* Chunk length = payload + DATA chunk header, without the common header */
  u16 chunk_length = data_len + bytes_to_add - sizeof (sctp_header_t);

  sctp_payload_data_chunk_t *data_chunk =
    vlib_buffer_push_uninit (b, bytes_to_add);

  u8 idx = sctp_data_subconn_select (sctp_conn);
  SCTP_DBG_OUTPUT
    ("SCTP_CONN = %p, IDX = %u, S_INDEX = %u, C_INDEX = %u, sctp_conn->[...].LCL_PORT = %u, sctp_conn->[...].RMT_PORT = %u",
     sctp_conn, idx, sctp_conn->sub_conn[idx].connection.s_index,
     sctp_conn->sub_conn[idx].connection.c_index,
     sctp_conn->sub_conn[idx].connection.lcl_port,
     sctp_conn->sub_conn[idx].connection.rmt_port);

  data_chunk->sctp_hdr.checksum = 0;
  data_chunk->sctp_hdr.src_port =
    sctp_conn->sub_conn[idx].connection.lcl_port;
  data_chunk->sctp_hdr.dst_port =
    sctp_conn->sub_conn[idx].connection.rmt_port;
  data_chunk->sctp_hdr.verification_tag = sctp_conn->remote_tag;

  data_chunk->tsn = clib_host_to_net_u32 (sctp_conn->next_tsn);
  data_chunk->stream_id = clib_host_to_net_u16 (0);
  data_chunk->stream_seq = clib_host_to_net_u16 (0);

  vnet_sctp_set_chunk_type (&data_chunk->chunk_hdr, DATA);
  vnet_sctp_set_chunk_length (&data_chunk->chunk_hdr, chunk_length);

  vnet_sctp_set_bbit (&data_chunk->chunk_hdr);
  vnet_sctp_set_ebit (&data_chunk->chunk_hdr);

  SCTP_ADV_DBG_OUTPUT ("POINTER_WITH_DATA = %p, DATA_OFFSET = %u",
		       b->data, b->current_data);

  /* First chunk sent since the sub-connection last left AWAITING_SACK:
   * remember where the unacknowledged range starts.
   */
  if (sctp_conn->sub_conn[idx].state != SCTP_SUBCONN_AWAITING_SACK)
    {
      sctp_conn->sub_conn[idx].state = SCTP_SUBCONN_AWAITING_SACK;
      sctp_conn->last_unacked_tsn = sctp_conn->next_tsn;
    }

  sctp_conn->next_tsn += data_len;

  u32 inflight = sctp_conn->next_tsn - sctp_conn->last_unacked_tsn;
  /* Section 7.2.2; point (3) */
  if (sctp_conn->sub_conn[idx].partially_acked_bytes >=
      sctp_conn->sub_conn[idx].cwnd
      && inflight >= sctp_conn->sub_conn[idx].cwnd)
    {
      /* Subtract the cwnd that was just tested BEFORE growing it. The
       * guard only guarantees partially_acked_bytes >= old cwnd, so
       * subtracting the enlarged cwnd could take the counter below zero.
       */
      sctp_conn->sub_conn[idx].partially_acked_bytes -=
	sctp_conn->sub_conn[idx].cwnd;
      sctp_conn->sub_conn[idx].cwnd += sctp_conn->sub_conn[idx].PMTU;
    }

  sctp_conn->sub_conn[idx].last_data_ts = sctp_time_now ();

  sctp_buffer_opaque (b)->sctp.connection_index =
    sctp_conn->sub_conn[idx].connection.c_index;

  sctp_buffer_opaque (b)->sctp.subconn_idx = idx;
}
/**
 * Push the SCTP DATA header onto a buffer for a transport connection
 *
 * Resolves the SCTP connection behind the transport connection, lets
 * sctp_push_hdr_i() prepend the headers, and adds a trajectory start
 * mark to the buffer.
 *
 * @param trans_conn transport connection the buffer is sent on
 * @param b          buffer holding the payload
 * @return always 0
 */
u32
sctp_push_header (transport_connection_t * trans_conn, vlib_buffer_t * b)
{
  sctp_connection_t *owner = sctp_get_connection_from_transport (trans_conn);

  SCTP_DBG_OUTPUT ("TRANS_CONN = %p, SCTP_CONN = %p, "
		   "S_INDEX = %u, C_INDEX = %u,"
		   "trans_conn->LCL_PORT = %u, trans_conn->RMT_PORT = %u",
		   trans_conn, owner,
		   trans_conn->s_index, trans_conn->c_index,
		   trans_conn->lcl_port, trans_conn->rmt_port);

  sctp_push_hdr_i (owner, b, SCTP_STATE_ESTABLISHED);
  sctp_trajectory_add_start (b, 3);

  return 0;
}
/**
 * Build a DATA chunk from bytes still held in the tx fifo
 *
 * Peeks up to max_deq_bytes (further limited by the sub-connection cwnd
 * and by what the transport reports as dequeueable past @c offset) into
 * a new buffer and pushes the SCTP headers onto it.
 *
 * @param sctp_conn     connection to retransmit on; asserted to be in
 *                      state ESTABLISHED or later
 * @param idx           sub-connection index
 * @param offset        byte offset into the tx fifo to start peeking at
 * @param max_deq_bytes upper bound on bytes to peek; asserted non-zero
 * @param b             out: buffer that was obtained. Left unwritten
 *                      when nothing is available past @c offset or no
 *                      buffer index could be obtained
 * @return number of payload bytes placed in the buffer. 0 when nothing
 *         was available, no buffer could be obtained, or the segment
 *         does not fit in a single buffer (in that last case *b is
 *         still set but carries no data or header)
 */
u32
sctp_prepare_data_retransmit (sctp_connection_t * sctp_conn,
			      u8 idx,
			      u32 offset,
			      u32 max_deq_bytes, vlib_buffer_t ** b)
{
  sctp_main_t *sm = vnet_get_sctp_main ();
  vlib_main_t *vm = vlib_get_main ();
  u32 buf_index, tx_avail, seg_size;
  int n_peeked = 0;
  u8 *payload;

  ASSERT (sctp_conn->state >= SCTP_STATE_ESTABLISHED);
  ASSERT (max_deq_bytes != 0);

  /*
   * Make sure we can retransmit something
   */
  tx_avail = transport_max_tx_dequeue (&sctp_conn->sub_conn[idx].connection);
  ASSERT (tx_avail >= offset);
  tx_avail -= offset;
  if (tx_avail == 0)
    return 0;

  /* Clamp the request to cwnd first, then to what is actually there */
  max_deq_bytes = clib_min (sctp_conn->sub_conn[idx].cwnd, max_deq_bytes);
  max_deq_bytes = clib_min (tx_avail, max_deq_bytes);
  seg_size = max_deq_bytes;

  /*
   * Allocate and fill in buffer(s)
   */
  if (PREDICT_FALSE (sctp_get_free_buffer_index (sm, &buf_index)))
    return 0;

  *b = vlib_get_buffer (vm, buf_index);
  payload = sctp_init_buffer (vm, *b);

  /* Only the single-buffer case is handled; anything larger yields 0 */
  if (PREDICT_FALSE (seg_size > sm->bytes_per_buffer))
    return n_peeked;

  n_peeked =
    session_tx_fifo_peek_bytes (&sctp_conn->sub_conn[idx].connection,
				payload, offset, max_deq_bytes);
  ASSERT (n_peeked == max_deq_bytes);
  (*b)->current_length = n_peeked;
  sctp_push_hdr_i (sctp_conn, *b, sctp_conn->state);

  return n_peeked;
}
/**
 * Retransmit data on the sub-connection picked for data transfer
 *
 * Asks sctp_prepare_data_retransmit() for a buffer filled with up to
 * cwnd bytes from the start of the tx fifo and enqueues it to output.
 *
 * Nothing is done when the connection has not reached
 * SCTP_STATE_ESTABLISHED, or when no buffer was produced.
 *
 * @param sctp_conn connection to retransmit on
 */
void
sctp_data_retransmit (sctp_connection_t * sctp_conn)
{
  vlib_main_t *vm = vlib_get_main ();
  vlib_buffer_t *b = 0;
  u32 bi, n_bytes = 0;
  u8 idx = sctp_data_subconn_select (sctp_conn);

  SCTP_DBG_OUTPUT
    ("SCTP_CONN = %p, IDX = %u, S_INDEX = %u, C_INDEX = %u, sctp_conn->[...].LCL_PORT = %u, sctp_conn->[...].RMT_PORT = %u",
     sctp_conn, idx, sctp_conn->sub_conn[idx].connection.s_index,
     sctp_conn->sub_conn[idx].connection.c_index,
     sctp_conn->sub_conn[idx].connection.lcl_port,
     sctp_conn->sub_conn[idx].connection.rmt_port);

  /* sctp_prepare_data_retransmit() asserts state >= ESTABLISHED, so bail
   * out for earlier states rather than for established ones.
   */
  if (sctp_conn->state < SCTP_STATE_ESTABLISHED)
    {
      return;
    }

  n_bytes =
    sctp_prepare_data_retransmit (sctp_conn, idx, 0,
				  sctp_conn->sub_conn[idx].cwnd, &b);

  /* The callee leaves b untouched when there is nothing to send or no
   * buffer could be obtained; there is nothing to enqueue in that case.
   */
  if (b == 0)
    return;

  if (n_bytes > 0)
    {
      SCTP_DBG_OUTPUT ("We have data (%u bytes) to retransmit", n_bytes);
    }

  /* NOTE(review): b can be non-NULL with n_bytes == 0 when the segment
   * does not fit in one buffer; it is still enqueued here, as before,
   * so that the buffer is not leaked - confirm this is intended.
   */
  bi = vlib_get_buffer_index (vm, b);

  sctp_enqueue_to_output_now (vm, b, bi,
			      sctp_conn->sub_conn[idx].connection.is_ip4);
}
#if SCTP_DEBUG_STATE_MACHINE
/**
 * Check an outgoing chunk type against the connection state
 *
 * Each handled state has a list of chunk types that may be sent in it.
 *
 * @param sctp_conn  connection whose state is inspected
 * @param chunk_type type of the chunk about to be sent
 * @return 1 when chunk_type is not in the list for the current state,
 *         0 when it is, or when the state has no list here
 */
always_inline u8
sctp_validate_output_state_machine (sctp_connection_t * sctp_conn,
				    u8 chunk_type)
{
  switch (sctp_conn->state)
    {
    case SCTP_STATE_CLOSED:
      return !(chunk_type == INIT || chunk_type == INIT_ACK);

    case SCTP_STATE_ESTABLISHED:
      return !(chunk_type == DATA || chunk_type == HEARTBEAT ||
	       chunk_type == HEARTBEAT_ACK || chunk_type == SACK ||
	       chunk_type == COOKIE_ACK || chunk_type == SHUTDOWN);

    case SCTP_STATE_COOKIE_WAIT:
      return !(chunk_type == COOKIE_ECHO);

    case SCTP_STATE_SHUTDOWN_SENT:
      return !(chunk_type == SHUTDOWN_COMPLETE);

    case SCTP_STATE_SHUTDOWN_RECEIVED:
      return !(chunk_type == SHUTDOWN_ACK);

    default:
      /* States without a list accept every chunk type */
      break;
    }

  return 0;
}
#endif
/*
* fd.io coding-style-patch-verification: ON
*
* Local Variables:
* eval: (c-set-style "gnu")
* End:
*/