blob: aad9701080e0941d17505c7d56b2859ff576a26f [file] [log] [blame]
/*
* Copyright (c) 2015 Cisco and/or its affiliates.
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at:
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
/*
* buffer.h: VLIB buffers
*
* Copyright (c) 2008 Eliot Dresselhaus
*
* Permission is hereby granted, free of charge, to any person obtaining
* a copy of this software and associated documentation files (the
* "Software"), to deal in the Software without restriction, including
* without limitation the rights to use, copy, modify, merge, publish,
* distribute, sublicense, and/or sell copies of the Software, and to
* permit persons to whom the Software is furnished to do so, subject to
* the following conditions:
*
* The above copyright notice and this permission notice shall be
* included in all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
* NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
* LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
* OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
* WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
*/
#ifndef included_vlib_buffer_h
#define included_vlib_buffer_h
#include <vppinfra/types.h>
#include <vppinfra/cache.h>
#include <vppinfra/serialize.h>
#include <vppinfra/vector.h>
#include <vppinfra/lock.h>
#include <vlib/error.h> /* for vlib_error_t */
#include <vlib/config.h> /* for VLIB_BUFFER_PRE_DATA_SIZE */
#define VLIB_BUFFER_DEFAULT_DATA_SIZE (2048)
/* Minimum buffer chain segment size. Does not apply to last buffer in chain.
Dataplane code can safely asume that specified amount of data is not split
into 2 chained buffers */
#define VLIB_BUFFER_MIN_CHAIN_SEG_SIZE (128)
/* Amount of head buffer data copied to each replica head buffer */
#define VLIB_BUFFER_CLONE_HEAD_SIZE (256)
/** \file
vlib buffer structure definition and a few select
access methods. This structure and the buffer allocation
mechanism should perhaps live in vnet, but it would take a lot
of typing to make it so.
*/
/**
* Buffer Flags
*/
#define foreach_vlib_buffer_flag \
_( 0, IS_TRACED, 0) \
_( 1, NEXT_PRESENT, "next-present") \
_( 2, TOTAL_LENGTH_VALID, 0) \
_( 3, EXT_HDR_VALID, "ext-hdr-valid")
/* NOTE: only buffer generic flags should be defined here, please consider
using user flags. i.e. src/vnet/buffer.h */
enum
{
#define _(bit, name, v) VLIB_BUFFER_##name = (1 << (bit)),
foreach_vlib_buffer_flag
#undef _
};
enum
{
#define _(bit, name, v) VLIB_BUFFER_LOG2_##name = (bit),
foreach_vlib_buffer_flag
#undef _
};
/* User defined buffer flags. */
#define LOG2_VLIB_BUFFER_FLAG_USER(n) (32 - (n))
#define VLIB_BUFFER_FLAG_USER(n) (1 << LOG2_VLIB_BUFFER_FLAG_USER(n))
#define VLIB_BUFFER_FLAGS_ALL (0x0f)
/** \brief Compile time buffer trajectory tracing option
Turn this on if you run into "bad monkey" contexts,
and you want to know exactly which nodes they've visited...
See vlib/main.c...
*/
#ifndef VLIB_BUFFER_TRACE_TRAJECTORY
#define VLIB_BUFFER_TRACE_TRAJECTORY 0
#endif /* VLIB_BUFFER_TRACE_TRAJECTORY */
#define vlib_buffer_template_fields \
/** signed offset in data[], pre_data[] that we are currently \
* processing. If negative current header points into predata area. */ \
i16 current_data; \
\
/** Nbytes between current data and the end of this buffer. */ \
u16 current_length; \
/** buffer flags: \
<br> VLIB_BUFFER_FREE_LIST_INDEX_MASK: bits used to store free list \
index, <br> VLIB_BUFFER_IS_TRACED: trace this buffer. <br> \
VLIB_BUFFER_NEXT_PRESENT: this is a multi-chunk buffer. <br> \
VLIB_BUFFER_TOTAL_LENGTH_VALID: as it says <br> \
VLIB_BUFFER_EXT_HDR_VALID: buffer contains valid external buffer manager \
header, set to avoid adding it to a flow report <br> \
VLIB_BUFFER_FLAG_USER(n): user-defined bit N \
*/ \
u32 flags; \
\
/** Generic flow identifier */ \
u32 flow_id; \
\
/** Reference count for this buffer. */ \
volatile u8 ref_count; \
\
/** index of buffer pool this buffer belongs. */ \
u8 buffer_pool_index; \
\
/** Error code for buffers to be enqueued to error handler. */ \
vlib_error_t error; \
\
/** Next buffer for this linked-list of buffers. Only valid if \
* VLIB_BUFFER_NEXT_PRESENT flag is set. */ \
u32 next_buffer; \
\
/** The following fields can be in a union because once a packet enters \
* the punt path, it is no longer on a feature arc */ \
union \
{ \
/** Used by feature subgraph arcs to visit enabled feature nodes */ \
u32 current_config_index; \
/* the reason the packet once punted */ \
u32 punt_reason; \
}; \
\
/** Opaque data used by sub-graphs for their own purposes. */ \
u32 opaque[10];
typedef struct
{
CLIB_ALIGN_MARK (align_mark, 64);
vlib_buffer_template_fields
} vlib_buffer_template_t;
STATIC_ASSERT_SIZEOF (vlib_buffer_template_t, 64);
/** VLIB buffer representation. */
typedef union
{
CLIB_CACHE_LINE_ALIGN_MARK (cacheline0);
struct
{
union
{
struct
{
vlib_buffer_template_fields
};
vlib_buffer_template_t template;
};
/* Data above is initialized or zeroed on alloc, data bellow is not
* and it is app responsibility to ensure data is valid */
/** start of 2nd half (2nd cacheline on systems where cacheline size is 64) */
CLIB_ALIGN_MARK (second_half, 64);
/** Specifies trace buffer handle if VLIB_PACKET_IS_TRACED flag is
* set. */
u32 trace_handle;
/** Only valid for first buffer in chain. Current length plus total length
* given here give total number of bytes in buffer chain. */
u32 total_length_not_including_first_buffer;
/**< More opaque data, see ../vnet/vnet/buffer.h */
u32 opaque2[14];
#if VLIB_BUFFER_TRACE_TRAJECTORY > 0
/** trace trajectory data - we use a specific cacheline for that in the
* buffer when it is compiled-in */
#define VLIB_BUFFER_TRACE_TRAJECTORY_MAX 31
#define VLIB_BUFFER_TRACE_TRAJECTORY_SZ 64
#define VLIB_BUFFER_TRACE_TRAJECTORY_INIT(b) (b)->trajectory_nb = 0
CLIB_ALIGN_MARK (trajectory, 64);
u16 trajectory_nb;
u16 trajectory_trace[VLIB_BUFFER_TRACE_TRAJECTORY_MAX];
#else /* VLIB_BUFFER_TRACE_TRAJECTORY */
#define VLIB_BUFFER_TRACE_TRAJECTORY_SZ 0
#define VLIB_BUFFER_TRACE_TRAJECTORY_INIT(b)
#endif /* VLIB_BUFFER_TRACE_TRAJECTORY */
/** start of buffer headroom */
CLIB_ALIGN_MARK (headroom, 64);
/** Space for inserting data before buffer start. Packet rewrite string
* will be rewritten backwards and may extend back before
* buffer->data[0]. Must come directly before packet data. */
u8 pre_data[VLIB_BUFFER_PRE_DATA_SIZE];
/** Packet data */
u8 data[];
};
#ifdef CLIB_HAVE_VEC128
u8x16 as_u8x16[4];
#endif
#ifdef CLIB_HAVE_VEC256
u8x32 as_u8x32[2];
#endif
#ifdef CLIB_HAVE_VEC512
u8x64 as_u8x64[1];
#endif
} vlib_buffer_t;
STATIC_ASSERT_SIZEOF (vlib_buffer_t, 128 + VLIB_BUFFER_TRACE_TRAJECTORY_SZ +
VLIB_BUFFER_PRE_DATA_SIZE);
STATIC_ASSERT (VLIB_BUFFER_PRE_DATA_SIZE % CLIB_CACHE_LINE_BYTES == 0,
"VLIB_BUFFER_PRE_DATA_SIZE must be divisible by cache line size");
#define VLIB_BUFFER_HDR_SIZE (sizeof(vlib_buffer_t) - VLIB_BUFFER_PRE_DATA_SIZE)
#define VLIB_BUFFER_INVALID_INDEX 0xffffffff
/** \brief Prefetch buffer metadata.
The first 64 bytes of buffer contains most header information
@param b - (vlib_buffer_t *) pointer to the buffer
@param type - LOAD, STORE. In most cases, STORE is the right answer
*/
#define vlib_prefetch_buffer_header(b,type) CLIB_PREFETCH (b, 64, type)
#define vlib_prefetch_buffer_data(b,type) \
CLIB_PREFETCH (vlib_buffer_get_current(b), CLIB_CACHE_LINE_BYTES, type)
always_inline void
vlib_buffer_struct_is_sane (vlib_buffer_t * b)
{
ASSERT (sizeof (b[0]) % 64 == 0);
/* Rewrite data must be before and contiguous with packet data. */
ASSERT (b->pre_data + VLIB_BUFFER_PRE_DATA_SIZE == b->data);
}
always_inline uword
vlib_buffer_get_va (vlib_buffer_t * b)
{
return pointer_to_uword (b->data);
}
/** \brief Get pointer to current data to process
@param b - (vlib_buffer_t *) pointer to the buffer
@return - (void *) (b->data + b->current_data)
*/
always_inline void *
vlib_buffer_get_current (vlib_buffer_t * b)
{
/* Check bounds. */
ASSERT ((signed) b->current_data >= (signed) -VLIB_BUFFER_PRE_DATA_SIZE);
return b->data + b->current_data;
}
always_inline uword
vlib_buffer_get_current_va (vlib_buffer_t * b)
{
return vlib_buffer_get_va (b) + b->current_data;
}
/** \brief Advance current data pointer by the supplied (signed!) amount
@param b - (vlib_buffer_t *) pointer to the buffer
@param l - (word) signed increment
*/
always_inline void
vlib_buffer_advance (vlib_buffer_t * b, word l)
{
ASSERT (b->current_length >= l);
b->current_data += l;
b->current_length -= l;
ASSERT ((b->flags & VLIB_BUFFER_NEXT_PRESENT) == 0 ||
b->current_length >= VLIB_BUFFER_MIN_CHAIN_SEG_SIZE);
}
/** \brief Check if there is enough space in buffer to advance
@param b - (vlib_buffer_t *) pointer to the buffer
@param l - (word) size to check
@return - 0 if there is less space than 'l' in buffer
*/
always_inline u8
vlib_buffer_has_space (vlib_buffer_t * b, word l)
{
return b->current_length >= l;
}
/** \brief Reset current header & length to state they were in when
packet was received.
@param b - (vlib_buffer_t *) pointer to the buffer
*/
always_inline void
vlib_buffer_reset (vlib_buffer_t * b)
{
b->current_length += clib_max (b->current_data, 0);
b->current_data = 0;
}
/** \brief Get pointer to buffer's opaque data array
@param b - (vlib_buffer_t *) pointer to the buffer
@return - (void *) b->opaque
*/
always_inline void *
vlib_get_buffer_opaque (vlib_buffer_t * b)
{
return (void *) b->opaque;
}
/** \brief Get pointer to buffer's opaque2 data array
@param b - (vlib_buffer_t *) pointer to the buffer
@return - (void *) b->opaque2
*/
always_inline void *
vlib_get_buffer_opaque2 (vlib_buffer_t * b)
{
return (void *) b->opaque2;
}
/** \brief Get pointer to the end of buffer's data
* @param b pointer to the buffer
* @return pointer to tail of packet's data
*/
always_inline u8 *
vlib_buffer_get_tail (vlib_buffer_t * b)
{
return b->data + b->current_data + b->current_length;
}
/** \brief Append uninitialized data to buffer
* @param b pointer to the buffer
* @param size number of uninitialized bytes
* @return pointer to beginning of uninitialized data
*/
always_inline void *
vlib_buffer_put_uninit (vlib_buffer_t * b, u16 size)
{
void *p = vlib_buffer_get_tail (b);
/* XXX make sure there's enough space */
b->current_length += size;
return p;
}
/** \brief Prepend uninitialized data to buffer
* @param b pointer to the buffer
* @param size number of uninitialized bytes
* @return pointer to beginning of uninitialized data
*/
always_inline void *
vlib_buffer_push_uninit (vlib_buffer_t * b, u8 size)
{
ASSERT (b->current_data + VLIB_BUFFER_PRE_DATA_SIZE >= size);
b->current_data -= size;
b->current_length += size;
return vlib_buffer_get_current (b);
}
/** \brief Make head room, typically for packet headers
* @param b pointer to the buffer
* @param size number of head room bytes
* @return pointer to start of buffer (current data)
*/
always_inline void *
vlib_buffer_make_headroom (vlib_buffer_t * b, u8 size)
{
b->current_data += size;
return vlib_buffer_get_current (b);
}
/** \brief Construct a trace handle from thread and pool index
* @param thread Thread id
* @param pool_index Pool index
* @return trace handle
*/
always_inline u32
vlib_buffer_make_trace_handle (u32 thread, u32 pool_index)
{
u32 rv;
ASSERT (thread < 0xff);
ASSERT (pool_index < 0x00FFFFFF);
rv = (thread << 24) | (pool_index & 0x00FFFFFF);
return rv;
}
/** \brief Extract the thread id from a trace handle
* @param trace_handle the trace handle
* @return the thread id
*/
always_inline u32
vlib_buffer_get_trace_thread (vlib_buffer_t * b)
{
u32 trace_handle = b->trace_handle;
return trace_handle >> 24;
}
/** \brief Extract the trace (pool) index from a trace handle
* @param trace_handle the trace handle
* @return the trace index
*/
always_inline u32
vlib_buffer_get_trace_index (vlib_buffer_t * b)
{
u32 trace_handle = b->trace_handle;
return trace_handle & 0x00FFFFFF;
}
/** \brief Retrieve bytes from buffer head
* @param b pointer to the buffer
* @param size number of bytes to pull
* @return pointer to start of buffer (current data)
*/
always_inline void *
vlib_buffer_pull (vlib_buffer_t * b, u8 size)
{
if (b->current_length + VLIB_BUFFER_PRE_DATA_SIZE < size)
return 0;
void *data = vlib_buffer_get_current (b);
vlib_buffer_advance (b, size);
return data;
}
/* Forward declaration. */
struct vlib_main_t;
#define VLIB_BUFFER_POOL_PER_THREAD_CACHE_SZ 512
typedef struct
{
CLIB_CACHE_LINE_ALIGN_MARK (cacheline0);
u32 cached_buffers[VLIB_BUFFER_POOL_PER_THREAD_CACHE_SZ];
u32 n_cached;
} vlib_buffer_pool_thread_t;
typedef struct
{
CLIB_CACHE_LINE_ALIGN_MARK (cacheline0);
uword start;
uword size;
u8 log2_page_size;
u8 index;
u8 numa_node;
u32 physmem_map_index;
u32 data_size;
u32 alloc_size;
u32 n_buffers;
u32 n_avail;
u32 *buffers;
u8 *name;
clib_spinlock_t lock;
/* per-thread data */
vlib_buffer_pool_thread_t *threads;
/* buffer metadata template */
vlib_buffer_template_t buffer_template;
} vlib_buffer_pool_t;
#define VLIB_BUFFER_MAX_NUMA_NODES 32
typedef u32 (vlib_buffer_alloc_free_callback_t) (struct vlib_main_t *vm,
u8 buffer_pool_index,
u32 *buffers, u32 n_buffers);
typedef struct
{
CLIB_CACHE_LINE_ALIGN_MARK (cacheline0);
/* Virtual memory address and size of buffer memory, used for calculating
buffer index */
uword buffer_mem_start;
uword buffer_mem_size;
vlib_buffer_pool_t *buffer_pools;
vlib_buffer_alloc_free_callback_t *alloc_callback_fn;
vlib_buffer_alloc_free_callback_t *free_callback_fn;
u8 default_buffer_pool_index_for_numa[VLIB_BUFFER_MAX_NUMA_NODES];
/* config */
u32 default_buffers_per_numa;
u32 buffers_per_numa[VLIB_BUFFER_MAX_NUMA_NODES];
u16 ext_hdr_size;
u32 default_data_size;
clib_mem_page_sz_t log2_page_size;
/* Hash table mapping buffer index into number
0 => allocated but free, 1 => allocated and not-free.
If buffer index is not in hash table then this buffer
has never been allocated. */
uword *buffer_known_hash;
clib_spinlock_t buffer_known_hash_lockp;
/* logging */
vlib_log_class_t log_default;
} vlib_buffer_main_t;
clib_error_t *vlib_buffer_main_init (struct vlib_main_t *vm);
format_function_t format_vlib_buffer_pool_all;
int vlib_buffer_set_alloc_free_callback (
struct vlib_main_t *vm, vlib_buffer_alloc_free_callback_t *alloc_callback_fn,
vlib_buffer_alloc_free_callback_t *free_callback_fn);
extern u16 __vlib_buffer_external_hdr_size;
#define VLIB_BUFFER_SET_EXT_HDR_SIZE(x) \
static void __clib_constructor \
vnet_buffer_set_ext_hdr_size() \
{ \
if (__vlib_buffer_external_hdr_size) \
clib_error ("buffer external header space already set"); \
__vlib_buffer_external_hdr_size = CLIB_CACHE_LINE_ROUND (x); \
}
#endif /* included_vlib_buffer_h */
/*
* fd.io coding-style-patch-verification: ON
*
* Local Variables:
* eval: (c-set-style "gnu")
* End:
*/