blob: db4fafa9a140e03fd886465a21664552c363f284 [file] [log] [blame]
/*
* Copyright (c) 2015 Cisco and/or its affiliates.
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at:
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "ssvm_eth.h"
ssvm_eth_main_t ssvm_eth_main;
#define foreach_ssvm_eth_tx_func_error \
_(RING_FULL, "Tx packet drops (ring full)") \
_(NO_BUFFERS, "Tx packet drops (no buffers)") \
_(ADMIN_DOWN, "Tx packet drops (admin down)")
typedef enum
{
#define _(f,s) SSVM_ETH_TX_ERROR_##f,
foreach_ssvm_eth_tx_func_error
#undef _
SSVM_ETH_TX_N_ERROR,
} ssvm_eth_tx_func_error_t;
static u32 ssvm_eth_flag_change (vnet_main_t * vnm,
vnet_hw_interface_t * hi, u32 flags);
int
ssvm_eth_create (ssvm_eth_main_t * em, u8 * name, int is_master)
{
ssvm_private_t *intfc;
void *oldheap;
clib_error_t *e;
unix_shared_memory_queue_t *q;
ssvm_shared_header_t *sh;
ssvm_eth_queue_elt_t *elts;
u32 *elt_indices;
u8 enet_addr[6];
int i, rv;
vec_add2 (em->intfcs, intfc, 1);
intfc->ssvm_size = em->segment_size;
intfc->i_am_master = 1;
intfc->name = name;
intfc->my_pid = getpid ();
if (is_master == 0)
{
rv = ssvm_slave_init (intfc, 20 /* timeout in seconds */ );
if (rv < 0)
return rv;
goto create_vnet_interface;
}
intfc->requested_va = em->next_base_va;
em->next_base_va += em->segment_size;
rv = ssvm_master_init (intfc, intfc - em->intfcs /* master index */ );
if (rv < 0)
return rv;
/* OK, segment created, set up queues and so forth. */
sh = intfc->sh;
oldheap = ssvm_push_heap (sh);
q = unix_shared_memory_queue_init (em->queue_elts, sizeof (u32),
0 /* consumer pid not interesting */ ,
0 /* signal not sent */ );
sh->opaque[TO_MASTER_Q_INDEX] = (void *) q;
q = unix_shared_memory_queue_init (em->queue_elts, sizeof (u32),
0 /* consumer pid not interesting */ ,
0 /* signal not sent */ );
sh->opaque[TO_SLAVE_Q_INDEX] = (void *) q;
/*
* Preallocate the requested number of buffer chunks
* There must be a better way to do this, etc.
* Add some slop to avoid pool reallocation, which will not go well
*/
elts = 0;
elt_indices = 0;
vec_validate_aligned (elts, em->nbuffers - 1, CLIB_CACHE_LINE_BYTES);
vec_validate_aligned (elt_indices, em->nbuffers - 1, CLIB_CACHE_LINE_BYTES);
for (i = 0; i < em->nbuffers; i++)
elt_indices[i] = i;
sh->opaque[CHUNK_POOL_INDEX] = (void *) elts;
sh->opaque[CHUNK_POOL_FREELIST_INDEX] = (void *) elt_indices;
sh->opaque[CHUNK_POOL_NFREE] = (void *) (uword) em->nbuffers;
ssvm_pop_heap (oldheap);
create_vnet_interface:
sh = intfc->sh;
memset (enet_addr, 0, sizeof (enet_addr));
enet_addr[0] = 2;
enet_addr[1] = 0xFE;
enet_addr[2] = is_master;
enet_addr[5] = sh->master_index;
e = ethernet_register_interface
(em->vnet_main, ssvm_eth_device_class.index, intfc - em->intfcs,
/* ethernet address */ enet_addr,
&intfc->vlib_hw_if_index, ssvm_eth_flag_change);
if (e)
{
clib_error_report (e);
/* $$$$ unmap offending region? */
return VNET_API_ERROR_INVALID_INTERFACE;
}
/* Declare link up */
vnet_hw_interface_set_flags (em->vnet_main, intfc->vlib_hw_if_index,
VNET_HW_INTERFACE_FLAG_LINK_UP);
/* Let the games begin... */
if (is_master)
sh->ready = 1;
return 0;
}
static clib_error_t *
ssvm_config (vlib_main_t * vm, unformat_input_t * input)
{
u8 *name;
int is_master = 1;
int i, rv;
ssvm_eth_main_t *em = &ssvm_eth_main;
while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
{
if (unformat (input, "base-va %llx", &em->next_base_va))
;
else if (unformat (input, "segment-size %lld", &em->segment_size))
em->segment_size = 1ULL << (max_log2 (em->segment_size));
else if (unformat (input, "nbuffers %lld", &em->nbuffers))
;
else if (unformat (input, "queue-elts %lld", &em->queue_elts))
;
else if (unformat (input, "slave"))
is_master = 0;
else if (unformat (input, "%s", &name))
vec_add1 (em->names, name);
else
break;
}
/* No configured instances, we're done... */
if (vec_len (em->names) == 0)
return 0;
for (i = 0; i < vec_len (em->names); i++)
{
rv = ssvm_eth_create (em, em->names[i], is_master);
if (rv < 0)
return clib_error_return (0, "ssvm_eth_create '%s' failed, error %d",
em->names[i], rv);
}
vlib_node_set_state (vm, ssvm_eth_input_node.index,
VLIB_NODE_STATE_POLLING);
return 0;
}
VLIB_CONFIG_FUNCTION (ssvm_config, "ssvm_eth");
static clib_error_t *
ssvm_eth_init (vlib_main_t * vm)
{
ssvm_eth_main_t *em = &ssvm_eth_main;
if (((sizeof (ssvm_eth_queue_elt_t) / CLIB_CACHE_LINE_BYTES)
* CLIB_CACHE_LINE_BYTES) != sizeof (ssvm_eth_queue_elt_t))
clib_warning ("ssvm_eth_queue_elt_t size %d not a multiple of %d",
sizeof (ssvm_eth_queue_elt_t), CLIB_CACHE_LINE_BYTES);
em->vlib_main = vm;
em->vnet_main = vnet_get_main ();
em->elog_main = &vm->elog_main;
/* default config param values... */
em->next_base_va = 0x600000000ULL;
/*
* Allocate 2 full superframes in each dir (256 x 2 x 2 x 2048 bytes),
* 2mb; double that so we have plenty of space... 4mb
*/
em->segment_size = 8 << 20;
em->nbuffers = 1024;
em->queue_elts = 512;
return 0;
}
VLIB_INIT_FUNCTION (ssvm_eth_init);
static char *ssvm_eth_tx_func_error_strings[] = {
#define _(n,s) s,
foreach_ssvm_eth_tx_func_error
#undef _
};
static u8 *
format_ssvm_eth_device_name (u8 * s, va_list * args)
{
u32 i = va_arg (*args, u32);
s = format (s, "ssvmEthernet%d", i);
return s;
}
static u8 *
format_ssvm_eth_device (u8 * s, va_list * args)
{
s = format (s, "SSVM Ethernet");
return s;
}
static u8 *
format_ssvm_eth_tx_trace (u8 * s, va_list * args)
{
s = format (s, "Unimplemented...");
return s;
}
static uword
ssvm_eth_interface_tx (vlib_main_t * vm,
vlib_node_runtime_t * node, vlib_frame_t * f)
{
ssvm_eth_main_t *em = &ssvm_eth_main;
vnet_interface_output_runtime_t *rd = (void *) node->runtime_data;
ssvm_private_t *intfc = vec_elt_at_index (em->intfcs, rd->dev_instance);
ssvm_shared_header_t *sh = intfc->sh;
unix_shared_memory_queue_t *q;
u32 *from;
u32 n_left;
ssvm_eth_queue_elt_t *elts, *elt, *prev_elt;
u32 my_pid = intfc->my_pid;
vlib_buffer_t *b0;
u32 bi0;
u32 size_this_buffer;
u32 chunks_this_buffer;
u8 i_am_master = intfc->i_am_master;
u32 elt_index;
int is_ring_full, interface_down;
int i;
volatile u32 *queue_lock;
u32 n_to_alloc = VLIB_FRAME_SIZE;
u32 n_allocated, n_present_in_cache, n_available;
u32 *elt_indices;
if (i_am_master)
q = (unix_shared_memory_queue_t *) sh->opaque[TO_SLAVE_Q_INDEX];
else
q = (unix_shared_memory_queue_t *) sh->opaque[TO_MASTER_Q_INDEX];
queue_lock = (u32 *) q;
from = vlib_frame_vector_args (f);
n_left = f->n_vectors;
is_ring_full = 0;
interface_down = 0;
n_present_in_cache = vec_len (em->chunk_cache);
/* admin / link up/down check */
if (sh->opaque[MASTER_ADMIN_STATE_INDEX] == 0 ||
sh->opaque[SLAVE_ADMIN_STATE_INDEX] == 0)
{
interface_down = 1;
goto out;
}
ssvm_lock (sh, my_pid, 1);
elts = (ssvm_eth_queue_elt_t *) (sh->opaque[CHUNK_POOL_INDEX]);
elt_indices = (u32 *) (sh->opaque[CHUNK_POOL_FREELIST_INDEX]);
n_available = (u32) pointer_to_uword (sh->opaque[CHUNK_POOL_NFREE]);
if (n_present_in_cache < n_left * 2)
{
vec_validate (em->chunk_cache, n_to_alloc + n_present_in_cache - 1);
n_allocated = n_to_alloc < n_available ? n_to_alloc : n_available;
if (PREDICT_TRUE (n_allocated > 0))
{
clib_memcpy (&em->chunk_cache[n_present_in_cache],
&elt_indices[n_available - n_allocated],
sizeof (u32) * n_allocated);
}
n_present_in_cache += n_allocated;
n_available -= n_allocated;
sh->opaque[CHUNK_POOL_NFREE] = uword_to_pointer (n_available, void *);
_vec_len (em->chunk_cache) = n_present_in_cache;
}
ssvm_unlock (sh);
while (n_left)
{
bi0 = from[0];
b0 = vlib_get_buffer (vm, bi0);
size_this_buffer = vlib_buffer_length_in_chain (vm, b0);
chunks_this_buffer = (size_this_buffer + (SSVM_BUFFER_SIZE - 1))
/ SSVM_BUFFER_SIZE;
/* If we're not going to be able to enqueue the buffer, tail drop. */
if (q->cursize >= q->maxsize)
{
is_ring_full = 1;
break;
}
prev_elt = 0;
elt_index = ~0;
for (i = 0; i < chunks_this_buffer; i++)
{
if (PREDICT_FALSE (n_present_in_cache == 0))
goto out;
elt_index = em->chunk_cache[--n_present_in_cache];
elt = elts + elt_index;
elt->type = SSVM_PACKET_TYPE;
elt->flags = 0;
elt->total_length_not_including_first_buffer =
b0->total_length_not_including_first_buffer;
elt->length_this_buffer = b0->current_length;
elt->current_data_hint = b0->current_data;
elt->owner = !i_am_master;
elt->tag = 1;
clib_memcpy (elt->data, b0->data + b0->current_data,
b0->current_length);
if (PREDICT_FALSE (prev_elt != 0))
prev_elt->next_index = elt - elts;
if (PREDICT_FALSE (i < (chunks_this_buffer - 1)))
{
elt->flags = SSVM_BUFFER_NEXT_PRESENT;
ASSERT (b0->flags & VLIB_BUFFER_NEXT_PRESENT);
b0 = vlib_get_buffer (vm, b0->next_buffer);
}
prev_elt = elt;
}
while (__sync_lock_test_and_set (queue_lock, 1))
;
unix_shared_memory_queue_add_raw (q, (u8 *) & elt_index);
CLIB_MEMORY_BARRIER ();
*queue_lock = 0;
from++;
n_left--;
}
out:
if (PREDICT_FALSE (n_left))
{
if (is_ring_full)
vlib_error_count (vm, node->node_index, SSVM_ETH_TX_ERROR_RING_FULL,
n_left);
else if (interface_down)
vlib_error_count (vm, node->node_index, SSVM_ETH_TX_ERROR_ADMIN_DOWN,
n_left);
else
vlib_error_count (vm, node->node_index, SSVM_ETH_TX_ERROR_NO_BUFFERS,
n_left);
vlib_buffer_free (vm, from, n_left);
}
else
vlib_buffer_free (vm, vlib_frame_vector_args (f), f->n_vectors);
if (PREDICT_TRUE (vec_len (em->chunk_cache)))
_vec_len (em->chunk_cache) = n_present_in_cache;
return f->n_vectors;
}
static void
ssvm_eth_clear_hw_interface_counters (u32 instance)
{
/* Nothing for now */
}
static clib_error_t *
ssvm_eth_interface_admin_up_down (vnet_main_t * vnm, u32 hw_if_index,
u32 flags)
{
vnet_hw_interface_t *hif = vnet_get_hw_interface (vnm, hw_if_index);
uword is_up = (flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP) != 0;
ssvm_eth_main_t *em = &ssvm_eth_main;
ssvm_private_t *intfc = vec_elt_at_index (em->intfcs, hif->dev_instance);
ssvm_shared_header_t *sh;
/* publish link-state in shared-memory, to discourage buffer-wasting */
sh = intfc->sh;
if (intfc->i_am_master)
sh->opaque[MASTER_ADMIN_STATE_INDEX] = (void *) is_up;
else
sh->opaque[SLAVE_ADMIN_STATE_INDEX] = (void *) is_up;
return 0;
}
static clib_error_t *
ssvm_eth_subif_add_del_function (vnet_main_t * vnm,
u32 hw_if_index,
struct vnet_sw_interface_t *st, int is_add)
{
/* Nothing for now */
return 0;
}
/*
* Dynamically redirect all pkts from a specific interface
* to the specified node
*/
static void
ssvm_eth_set_interface_next_node (vnet_main_t * vnm, u32 hw_if_index,
u32 node_index)
{
ssvm_eth_main_t *em = &ssvm_eth_main;
vnet_hw_interface_t *hw = vnet_get_hw_interface (vnm, hw_if_index);
ssvm_private_t *intfc = pool_elt_at_index (em->intfcs, hw->dev_instance);
/* Shut off redirection */
if (node_index == ~0)
{
intfc->per_interface_next_index = node_index;
return;
}
intfc->per_interface_next_index =
vlib_node_add_next (em->vlib_main, ssvm_eth_input_node.index, node_index);
}
static u32
ssvm_eth_flag_change (vnet_main_t * vnm, vnet_hw_interface_t * hi, u32 flags)
{
/* nothing for now */
return 0;
}
/* *INDENT-OFF* */
VNET_DEVICE_CLASS (ssvm_eth_device_class) = {
.name = "ssvm-eth",
.tx_function = ssvm_eth_interface_tx,
.tx_function_n_errors = SSVM_ETH_TX_N_ERROR,
.tx_function_error_strings = ssvm_eth_tx_func_error_strings,
.format_device_name = format_ssvm_eth_device_name,
.format_device = format_ssvm_eth_device,
.format_tx_trace = format_ssvm_eth_tx_trace,
.clear_counters = ssvm_eth_clear_hw_interface_counters,
.admin_up_down_function = ssvm_eth_interface_admin_up_down,
.subif_add_del_function = ssvm_eth_subif_add_del_function,
.rx_redirect_to_node = ssvm_eth_set_interface_next_node,
};
VLIB_DEVICE_TX_FUNCTION_MULTIARCH (ssvm_eth_device_class,
ssvm_eth_interface_tx)
/* *INDENT-ON* */
/*
* fd.io coding-style-patch-verification: ON
*
* Local Variables:
* eval: (c-set-style "gnu")
* End:
*/