blob: 06c4afdc79b18138236c7d7fa76cf19fc95433c4 [file] [log] [blame]
/*
Copyright (c) 2017 Cisco and/or its affiliates.
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at:
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
/*
* cuckoo hash implementation based on paper
* 'Algorithmic Improvements for Fast Concurrent Cuckoo Hashing'
* by Xiaozhou Li, David G. Andersen, Michael Kaminsky, Michael J. Freedman
* and their libcuckoo implementation (https://github.com/efficient/libcuckoo)
*/
/*
* Note: to instantiate the template multiple times in a single file,
* #undef __included_cuckoo_template_h__...
*/
#ifndef __included_cuckoo_template_h__
#define __included_cuckoo_template_h__
#include <vppinfra/heap.h>
#include <vppinfra/format.h>
#include <vppinfra/pool.h>
#include <vppinfra/lock.h>
#include <vppinfra/error.h>
#include <vppinfra/hash.h>
#include <vppinfra/cache.h>
#ifndef CLIB_CUCKOO_TYPE
#error CLIB_CUCKOO_TYPE not defined
#endif
#ifndef CLIB_CUCKOO_BFS_MAX_STEPS
#error CLIB_CUCKOO_BFS_MAX_STEPS not defined
#endif
#ifndef CLIB_CUCKOO_KVP_PER_BUCKET
#error CLIB_CUCKOO_KVP_PER_BUCKET not defined
#endif
#ifndef CLIB_CUCKOO_LOG2_KVP_PER_BUCKET
#error CLIB_CUCKOO_LOG2_KVP_PER_BUCKET not defined
#endif
#ifndef CLIB_CUCKOO_BFS_MAX_PATH_LENGTH
#error CLIB_CUCKOO_BFS_MAX_PATH_LENGTH not defined
#endif
STATIC_ASSERT (CLIB_CUCKOO_KVP_PER_BUCKET ==
(1 << CLIB_CUCKOO_LOG2_KVP_PER_BUCKET),
"CLIB_CUCKOO_KVP_PER_BUCKET != (1 << CLIB_CUCKOO_LOG2_KVP_PER_BUCKET");
#define _cv(a, b) a##b
#define __cv(a, b) _cv (a, b)
#define CV(a) __cv (a, CLIB_CUCKOO_TYPE)
#define _cvt(a, b) a##b##_t
#define __cvt(a, b) _cvt (a, b)
#define CVT(a) __cvt (a, CLIB_CUCKOO_TYPE)
typedef u64 clib_cuckoo_bucket_aux_t;
#define CLIB_CUCKOO_USE_COUNT_BIT_WIDTH (1 + CLIB_CUCKOO_LOG2_KVP_PER_BUCKET)
always_inline u64
clib_cuckoo_bucket_aux_get_version (clib_cuckoo_bucket_aux_t aux)
{
return aux >> (1 + CLIB_CUCKOO_USE_COUNT_BIT_WIDTH);
}
always_inline int
clib_cuckoo_bucket_aux_get_use_count (clib_cuckoo_bucket_aux_t aux)
{
u64 use_count_mask = (1 << CLIB_CUCKOO_USE_COUNT_BIT_WIDTH) - 1;
return (aux >> 1) & use_count_mask;
}
always_inline int
clib_cuckoo_bucket_aux_get_writer_flag (clib_cuckoo_bucket_aux_t aux)
{
return aux & 1;
}
always_inline clib_cuckoo_bucket_aux_t
clib_cuckoo_bucket_aux_pack (u64 version, int use_count, int writer_flag)
{
return (version << (1 + CLIB_CUCKOO_USE_COUNT_BIT_WIDTH)) +
(use_count << 1) + writer_flag;
}
always_inline clib_cuckoo_bucket_aux_t
clib_cuckoo_bucket_aux_set_version (clib_cuckoo_bucket_aux_t aux, u64 version)
{
int use_count = clib_cuckoo_bucket_aux_get_use_count (aux);
int writer_flag = clib_cuckoo_bucket_aux_get_writer_flag (aux);
return clib_cuckoo_bucket_aux_pack (version, use_count, writer_flag);
}
always_inline clib_cuckoo_bucket_aux_t
clib_cuckoo_bucket_aux_set_use_count (clib_cuckoo_bucket_aux_t aux,
int use_count)
{
u64 version = clib_cuckoo_bucket_aux_get_version (aux);
int writer_flag = clib_cuckoo_bucket_aux_get_writer_flag (aux);
return clib_cuckoo_bucket_aux_pack (version, use_count, writer_flag);
}
always_inline clib_cuckoo_bucket_aux_t
clib_cuckoo_bucket_aux_set_writer_flag (clib_cuckoo_bucket_aux_t aux,
int writer_flag)
{
u64 version = clib_cuckoo_bucket_aux_get_version (aux);
int use_count = clib_cuckoo_bucket_aux_get_use_count (aux);
return clib_cuckoo_bucket_aux_pack (version, use_count, writer_flag);
}
#define PATH_BITS_REQ \
(CLIB_CUCKOO_BFS_MAX_PATH_LENGTH * CLIB_CUCKOO_LOG2_KVP_PER_BUCKET)
#if PATH_BITS_REQ <= 8
typedef u8 path_data_t;
#elif PATH_BITS_REQ <= 16
typedef u16 path_data_t;
#elif PATH_BITS_REQ <= 32
typedef u32 path_data_t;
#elif PATH_BITS_REQ <= 64
typedef u64 path_data_t;
#else
#error no suitable datatype for path storage...
#endif
typedef struct
{
/** bucket where this path begins */
u64 start;
/** bucket at end of path */
u64 bucket;
/** length of the path */
u8 length;
/** holds compressed offsets in buckets along path */
path_data_t data;
} clib_cuckoo_path_t;
typedef struct
{
CLIB_CACHE_LINE_ALIGN_MARK (cacheline0);
/** reduced hashes corresponding to elements */
u8 reduced_hashes[CLIB_CUCKOO_KVP_PER_BUCKET];
/** auxiliary data - version, writer flag and used count */
volatile clib_cuckoo_bucket_aux_t aux;
/** cuckoo elements in this bucket */
CVT (clib_cuckoo_kv) elts[CLIB_CUCKOO_KVP_PER_BUCKET];
} CVT (clib_cuckoo_bucket);
#define clib_cuckoo_bucket_foreach_idx(var) \
for (var = 0; var < CLIB_CUCKOO_KVP_PER_BUCKET; var++)
#if CLIB_CUCKOO_OPTIMIZE_UNROLL
#if CLIB_CUCKOO_KVP_PER_BUCKET == 2
#define clib_cuckoo_bucket_foreach_idx_unrolled(var, body) \
do \
{ \
var = 0; \
body; \
var = 1; \
body; \
} \
while (0);
#elif CLIB_CUCKOO_KVP_PER_BUCKET == 4
#define clib_cuckoo_bucket_foreach_idx_unrolled(var, body) \
do \
{ \
var = 0; \
body; \
var = 1; \
body; \
var = 2; \
body; \
var = 3; \
body; \
} \
while (0);
#elif CLIB_CUCKOO_KVP_PER_BUCKET == 8
#define clib_cuckoo_bucket_foreach_idx_unrolled(var, body) \
do \
{ \
var = 0; \
body; \
var = 1; \
body; \
var = 2; \
body; \
var = 3; \
body; \
var = 4; \
body; \
var = 5; \
body; \
var = 6; \
body; \
var = 7; \
body; \
} \
while (0);
#else
#define clib_cuckoo_bucket_foreach_idx_unrolled(var, body) \
clib_cuckoo_bucket_foreach_idx (var) \
{ \
body; \
}
#endif
#else /* CLIB_CUCKOO_OPTIMIZE_UNROLL */
#define clib_cuckoo_bucket_foreach_idx_unrolled(var, body) \
clib_cuckoo_bucket_foreach_idx (var) \
{ \
body; \
}
#endif /* CLIB_CUCKOO_OPTIMIZE_UNROLL */
#define clib_cuckoo_bucket_foreach_elt_index(var, bucket) \
for (var = 0; var < CLIB_CUCKOO_KVP_PER_BUCKET; ++i)
#define clib_cuckoo_foreach_bucket(var, h, body) \
do \
{ \
CVT (clib_cuckoo_bucket) *__buckets = h->buckets; \
vec_foreach (var, __buckets) \
{ \
body; \
} \
} \
while (0)
typedef struct CV (clib_cuckoo)
{
/** vector of elements containing key-value pairs and auxiliary data */
CVT (clib_cuckoo_bucket) * volatile buckets;
/** garbage to be freed once its safe to do so .. */
CVT (clib_cuckoo_bucket) * *to_be_freed;
/** hash table name */
const char *name;
/** pool of cuckoo paths (reused when doing bfd search) */
clib_cuckoo_path_t *paths;
/**
* vector used as queue when doing cuckoo path searches - holds offsets
* in paths pool
*/
uword *bfs_search_queue;
/**
* writer lock - whether this lock is taken or not has zero effect on
* readers
*/
clib_spinlock_t writer_lock;
/** caller context passed to callback with garbage notification */
void *garbage_ctx;
/**
* garbage notify function - called when some garbage needs to be collected
* in main thread while other threads are stopped
*/
void (*garbage_callback) (struct CV (clib_cuckoo) * h, void *garbage_ctx);
#if CLIB_CUCKOO_DEBUG_COUNTERS
u64 steps_exceeded;
u64 bfs_queue_emptied;
u64 fast_adds;
u64 slow_adds;
u64 rehashes;
#endif
} CVT (clib_cuckoo);
void CV (clib_cuckoo_init) (CVT (clib_cuckoo) * h, const char *name,
uword nbuckets,
void (*garbage_callback) (CVT (clib_cuckoo) *,
void *),
void *garbage_ctx);
void CV (clib_cuckoo_garbage_collect) (CVT (clib_cuckoo) * h);
void CV (clib_cuckoo_free) (CVT (clib_cuckoo) * h);
int CV (clib_cuckoo_add_del) (CVT (clib_cuckoo) * h,
CVT (clib_cuckoo_kv) * add_v, int is_add,
int dont_overwrite);
int CV (clib_cuckoo_search) (CVT (clib_cuckoo) * h,
CVT (clib_cuckoo_kv) * search_v,
CVT (clib_cuckoo_kv) * return_v);
void CV (clib_cuckoo_foreach_key_value_pair) (CVT (clib_cuckoo) * h,
void *callback, void *arg);
float CV (clib_cuckoo_calc_load) (CVT (clib_cuckoo) * h);
format_function_t CV (format_cuckoo);
format_function_t CV (format_cuckoo_kvp);
always_inline u8
clib_cuckoo_reduce_hash (u64 hash)
{
u32 v32 = ((u32) hash) ^ ((u32) (hash >> 32));
u16 v16 = ((u16) v32) ^ ((u16) (v32 >> 16));
u8 v8 = ((u8) v16) ^ ((u8) (v16 >> 8));
return v8;
}
always_inline u64
clib_cuckoo_get_other_bucket (u64 nbuckets, u64 bucket, u8 reduced_hash)
{
u64 mask = (nbuckets - 1);
return (bucket ^ ((reduced_hash + 1) * 0xc6a4a7935bd1e995)) & mask;
}
always_inline clib_cuckoo_lookup_info_t
CV (clib_cuckoo_calc_lookup) (CVT (clib_cuckoo_bucket) * buckets, u64 hash)
{
clib_cuckoo_lookup_info_t lookup;
u64 nbuckets = vec_len (buckets);
u64 mask = (nbuckets - 1);
lookup.bucket1 = hash & mask;
#if CLIB_CUCKOO_OPTIMIZE_PREFETCH
CLIB_PREFETCH (vec_elt_at_index (buckets, lookup.bucket1),
sizeof (*buckets), LOAD);
#endif
u8 reduced_hash = clib_cuckoo_reduce_hash (hash);
lookup.bucket2 =
clib_cuckoo_get_other_bucket (nbuckets, lookup.bucket1, reduced_hash);
#if CLIB_CUCKOO_OPTIMIZE_PREFETCH
CLIB_PREFETCH (vec_elt_at_index (buckets, lookup.bucket2),
sizeof (*buckets), LOAD);
#endif
lookup.reduced_hash = reduced_hash;
ASSERT (lookup.bucket1 < nbuckets);
ASSERT (lookup.bucket2 < nbuckets);
return lookup;
}
/**
* search for key within bucket
*/
always_inline int CV (clib_cuckoo_bucket_search) (CVT (clib_cuckoo_bucket) *
b,
CVT (clib_cuckoo_kv) * kvp,
u8 reduced_hash)
{
clib_cuckoo_bucket_aux_t bucket_aux;
u8 writer_flag;
do
{
bucket_aux = b->aux;
writer_flag = clib_cuckoo_bucket_aux_get_writer_flag (bucket_aux);
}
while (PREDICT_FALSE (writer_flag)); /* loop while writer flag is set */
int i;
#if CLIB_CUCKOO_OPTIMIZE_USE_COUNT_LIMITS_SEARCH
const int use_count = clib_cuckoo_bucket_aux_get_use_count (bucket_aux);
#endif
/* *INDENT-OFF* */
clib_cuckoo_bucket_foreach_idx_unrolled (i, {
#if CLIB_CUCKOO_OPTIMIZE_USE_COUNT_LIMITS_SEARCH
if (i > use_count)
{
break;
}
#endif
if (
#if CLIB_CUCKOO_OPTIMIZE_CMP_REDUCED_HASH
reduced_hash == b->reduced_hashes[i] &&
#endif
0 == memcmp (&kvp->key, &b->elts[i].key, sizeof (kvp->key)))
{
kvp->value = b->elts[i].value;
clib_cuckoo_bucket_aux_t bucket_aux2 = b->aux;
if (PREDICT_TRUE (clib_cuckoo_bucket_aux_get_version (bucket_aux) ==
clib_cuckoo_bucket_aux_get_version (bucket_aux2)))
{
/* yay, fresh data */
return CLIB_CUCKOO_ERROR_SUCCESS;
}
else
{
/* oops, modification detected */
return CLIB_CUCKOO_ERROR_AGAIN;
}
}
});
/* *INDENT-ON* */
return CLIB_CUCKOO_ERROR_NOT_FOUND;
}
always_inline int CV (clib_cuckoo_search_inline) (CVT (clib_cuckoo) * h,
CVT (clib_cuckoo_kv) * kvp)
{
clib_cuckoo_lookup_info_t lookup;
int rv;
u64 hash = CV (clib_cuckoo_hash) (kvp);
CVT (clib_cuckoo_bucket) * buckets;
again:
buckets = h->buckets;
lookup = CV (clib_cuckoo_calc_lookup) (buckets, hash);
do
{
rv =
CV (clib_cuckoo_bucket_search) (vec_elt_at_index
(buckets, lookup.bucket1), kvp,
lookup.reduced_hash);
}
while (PREDICT_FALSE (CLIB_CUCKOO_ERROR_AGAIN == rv));
if (CLIB_CUCKOO_ERROR_SUCCESS == rv)
{
return CLIB_CUCKOO_ERROR_SUCCESS;
}
rv =
CV (clib_cuckoo_bucket_search) (vec_elt_at_index
(buckets, lookup.bucket2), kvp,
lookup.reduced_hash);
if (PREDICT_FALSE (CLIB_CUCKOO_ERROR_AGAIN == rv))
{
/*
* change to 2nd bucket could bump the item to 1st bucket and the bucket
* indexes might not even be valid anymore - restart the search
*/
goto again;
}
return rv;
}
#endif /* __included_cuckoo_template_h__ */
/** @endcond */
/*
* fd.io coding-style-patch-verification: ON
*
* Local Variables:
* eval: (c-set-style "gnu")
* End:
*/