blob: 11e3ac448f83d4ecb13674afd9656f990347a773 [file] [log] [blame]
Ed Warnickecb9cada2015-12-08 15:45:58 -07001/*
2 * Copyright (c) 2015 Cisco and/or its affiliates.
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at:
6 *
7 * http://www.apache.org/licenses/LICENSE-2.0
8 *
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
14 */
15
Chris Luke16bcf7d2016-09-01 14:31:46 -040016/** @cond DOCUMENTATION_IS_IN_BIHASH_DOC_H */
Dave Barachdd3a57f2016-07-27 16:58:51 -040017
Dave Barach97f5af02018-02-22 09:48:45 -050018static inline void *BV (alloc_aligned) (BVT (clib_bihash) * h, uword nbytes)
19{
20 uword rv;
21
22 /* Round to an even number of cache lines */
23 nbytes += CLIB_CACHE_LINE_BYTES - 1;
24 nbytes &= ~(CLIB_CACHE_LINE_BYTES - 1);
25
Dave Barach9466c452018-08-24 17:21:14 -040026 rv = alloc_arena_next (h);
27 alloc_arena_next (h) += nbytes;
Dave Barach97f5af02018-02-22 09:48:45 -050028
Andreas Schultzb4b525e2019-07-19 11:14:50 +020029 if (alloc_arena_next (h) > alloc_arena_size (h))
Dave Barach97f5af02018-02-22 09:48:45 -050030 os_out_of_memory ();
31
Dave Barachffb14b92018-09-11 17:20:23 -040032 return (void *) (uword) (rv + alloc_arena (h));
Dave Barach97f5af02018-02-22 09:48:45 -050033}
34
Dave Barach32dcd3b2019-07-08 12:25:38 -040035void BV (clib_bihash_instantiate) (BVT (clib_bihash) * h)
36{
37 uword bucket_size;
38
39 alloc_arena (h) = (uword) clib_mem_vm_alloc (h->memory_size);
40 alloc_arena_next (h) = 0;
41 alloc_arena_size (h) = h->memory_size;
42
43 bucket_size = h->nbuckets * sizeof (h->buckets[0]);
44 h->buckets = BV (alloc_aligned) (h, bucket_size);
45
46 h->alloc_lock = BV (alloc_aligned) (h, CLIB_CACHE_LINE_BYTES);
47 h->alloc_lock[0] = 0;
48}
Dave Barach97f5af02018-02-22 09:48:45 -050049
Dave Barachc3799992016-08-15 11:12:27 -040050void BV (clib_bihash_init)
51 (BVT (clib_bihash) * h, char *name, u32 nbuckets, uword memory_size)
Ed Warnickecb9cada2015-12-08 15:45:58 -070052{
Dave Barach32dcd3b2019-07-08 12:25:38 -040053 int i;
54 void *oldheap;
Ed Warnickecb9cada2015-12-08 15:45:58 -070055 nbuckets = 1 << (max_log2 (nbuckets));
56
Dave Barachc3799992016-08-15 11:12:27 -040057 h->name = (u8 *) name;
Ed Warnickecb9cada2015-12-08 15:45:58 -070058 h->nbuckets = nbuckets;
59 h->log2_nbuckets = max_log2 (nbuckets);
Dave Barach32dcd3b2019-07-08 12:25:38 -040060 h->memory_size = memory_size;
61 alloc_arena (h) = 0;
Ed Warnickecb9cada2015-12-08 15:45:58 -070062
Dave Barach508498f2018-07-19 12:11:16 -040063 /*
64 * Make sure the requested size is rational. The max table
65 * size without playing the alignment card is 64 Gbytes.
66 * If someone starts complaining that's not enough, we can shift
67 * the offset by CLIB_LOG2_CACHE_LINE_BYTES...
68 */
69 ASSERT (memory_size < (1ULL << BIHASH_BUCKET_OFFSET_BITS));
Vijayabhaskar Katamreddyfb8e61c2017-12-14 13:20:50 -080070 h->fmt_fn = NULL;
Dave Barach32dcd3b2019-07-08 12:25:38 -040071
72 /* Add this hash table to the list */
73 for (i = 0; i < vec_len (clib_all_bihashes); i++)
74 if (clib_all_bihashes[i] == h)
75 return;
76
77 /* Unfortunately, the heap push/pop is required.... */
78 oldheap = clib_all_bihash_set_heap ();
79 vec_add1 (clib_all_bihashes, (void *) h);
80 clib_mem_set_heap (oldheap);
81
82#if BIHASH_INSTANTIATE_IMMEDIATELY
83 BV (clib_bihash_instantiate) (h);
84#endif
Vijayabhaskar Katamreddyfb8e61c2017-12-14 13:20:50 -080085}
86
Dave Barach9466c452018-08-24 17:21:14 -040087#if BIHASH_32_64_SVM
88#if !defined (MFD_ALLOW_SEALING)
89#define MFD_ALLOW_SEALING 0x0002U
90#endif
91
92void BV (clib_bihash_master_init_svm)
Dave Barachffb14b92018-09-11 17:20:23 -040093 (BVT (clib_bihash) * h, char *name, u32 nbuckets, u64 memory_size)
Dave Barach9466c452018-08-24 17:21:14 -040094{
95 uword bucket_size;
96 u8 *mmap_addr;
97 vec_header_t *freelist_vh;
98 int fd;
99
Dave Barachffb14b92018-09-11 17:20:23 -0400100 ASSERT (memory_size < (1ULL << 32));
Dave Barach9466c452018-08-24 17:21:14 -0400101 /* Set up for memfd sharing */
102 if ((fd = memfd_create (name, MFD_ALLOW_SEALING)) == -1)
103 {
104 clib_unix_warning ("memfd_create");
105 return;
106 }
107
108 if (ftruncate (fd, memory_size) < 0)
109 {
110 clib_unix_warning ("ftruncate");
111 return;
112 }
113
114 /* Not mission-critical, complain and continue */
115 if ((fcntl (fd, F_ADD_SEALS, F_SEAL_SHRINK)) == -1)
116 clib_unix_warning ("fcntl (F_ADD_SEALS)");
117
Dave Barachffb14b92018-09-11 17:20:23 -0400118 mmap_addr = mmap (0, memory_size,
119 PROT_READ | PROT_WRITE, MAP_SHARED, fd, 0 /* offset */ );
Dave Barach9466c452018-08-24 17:21:14 -0400120
121 if (mmap_addr == MAP_FAILED)
122 {
123 clib_unix_warning ("mmap failed");
124 ASSERT (0);
125 }
126
127 h->sh = (void *) mmap_addr;
128 h->memfd = fd;
129 nbuckets = 1 << (max_log2 (nbuckets));
130
131 h->name = (u8 *) name;
132 h->sh->nbuckets = h->nbuckets = nbuckets;
133 h->log2_nbuckets = max_log2 (nbuckets);
134
135 alloc_arena (h) = (u64) (uword) mmap_addr;
Dave Barachffb14b92018-09-11 17:20:23 -0400136 alloc_arena_next (h) = CLIB_CACHE_LINE_BYTES;
Dave Barach9466c452018-08-24 17:21:14 -0400137 alloc_arena_size (h) = memory_size;
138
139 bucket_size = nbuckets * sizeof (h->buckets[0]);
140 h->buckets = BV (alloc_aligned) (h, bucket_size);
Dave Barachffb14b92018-09-11 17:20:23 -0400141 h->sh->buckets_as_u64 = (u64) BV (clib_bihash_get_offset) (h, h->buckets);
Dave Barach9466c452018-08-24 17:21:14 -0400142
143 h->alloc_lock = BV (alloc_aligned) (h, CLIB_CACHE_LINE_BYTES);
144 h->alloc_lock[0] = 0;
145
Dave Barachffb14b92018-09-11 17:20:23 -0400146 h->sh->alloc_lock_as_u64 =
147 (u64) BV (clib_bihash_get_offset) (h, (void *) h->alloc_lock);
148 freelist_vh =
149 BV (alloc_aligned) (h,
150 sizeof (vec_header_t) +
151 BIHASH_FREELIST_LENGTH * sizeof (u64));
Dave Barach9466c452018-08-24 17:21:14 -0400152 freelist_vh->len = BIHASH_FREELIST_LENGTH;
153 freelist_vh->dlmalloc_header_offset = 0xDEADBEEF;
Dave Barachffb14b92018-09-11 17:20:23 -0400154 h->sh->freelists_as_u64 =
155 (u64) BV (clib_bihash_get_offset) (h, freelist_vh->vector_data);
156 h->freelists = (void *) (freelist_vh->vector_data);
Dave Barach9466c452018-08-24 17:21:14 -0400157
158 h->fmt_fn = NULL;
159}
160
161void BV (clib_bihash_slave_init_svm)
162 (BVT (clib_bihash) * h, char *name, int fd)
163{
164 u8 *mmap_addr;
Dave Barachffb14b92018-09-11 17:20:23 -0400165 u64 memory_size;
Dave Barach9466c452018-08-24 17:21:14 -0400166 BVT (clib_bihash_shared_header) * sh;
167
Dave Barachffb14b92018-09-11 17:20:23 -0400168 /* Trial mapping, to learn the segment size */
Dave Barach9466c452018-08-24 17:21:14 -0400169 mmap_addr = mmap (0, 4096, PROT_READ, MAP_SHARED, fd, 0 /* offset */ );
170 if (mmap_addr == MAP_FAILED)
171 {
172 clib_unix_warning ("trial mmap failed");
173 ASSERT (0);
174 }
175
176 sh = (BVT (clib_bihash_shared_header) *) mmap_addr;
177
Dave Barach9466c452018-08-24 17:21:14 -0400178 memory_size = sh->alloc_arena_size;
179
180 munmap (mmap_addr, 4096);
181
Dave Barachffb14b92018-09-11 17:20:23 -0400182 /* Actual mapping, at the required size */
183 mmap_addr = mmap (0, memory_size,
184 PROT_READ | PROT_WRITE, MAP_SHARED, fd, 0 /* offset */ );
Dave Barach9466c452018-08-24 17:21:14 -0400185
186 if (mmap_addr == MAP_FAILED)
187 {
188 clib_unix_warning ("mmap failed");
189 ASSERT (0);
190 }
191
192 (void) close (fd);
193
194 h->sh = (void *) mmap_addr;
Dave Barachffb14b92018-09-11 17:20:23 -0400195 alloc_arena (h) = (u64) (uword) mmap_addr;
Dave Barach9466c452018-08-24 17:21:14 -0400196 h->memfd = -1;
197
198 h->name = (u8 *) name;
Dave Barachffb14b92018-09-11 17:20:23 -0400199 h->buckets = BV (clib_bihash_get_value) (h, h->sh->buckets_as_u64);
Dave Barach9466c452018-08-24 17:21:14 -0400200 h->nbuckets = h->sh->nbuckets;
201 h->log2_nbuckets = max_log2 (h->nbuckets);
202
Dave Barachffb14b92018-09-11 17:20:23 -0400203 h->alloc_lock = BV (clib_bihash_get_value) (h, h->sh->alloc_lock_as_u64);
204 h->freelists = BV (clib_bihash_get_value) (h, h->sh->freelists_as_u64);
Dave Barach9466c452018-08-24 17:21:14 -0400205 h->fmt_fn = NULL;
206}
207#endif /* BIHASH_32_64_SVM */
208
Vijayabhaskar Katamreddyfb8e61c2017-12-14 13:20:50 -0800209void BV (clib_bihash_set_kvp_format_fn) (BVT (clib_bihash) * h,
210 format_function_t * fmt_fn)
211{
212 h->fmt_fn = fmt_fn;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700213}
214
Dave Barachc3799992016-08-15 11:12:27 -0400215void BV (clib_bihash_free) (BVT (clib_bihash) * h)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700216{
Dave Barach32dcd3b2019-07-08 12:25:38 -0400217 int i;
218
219 if (PREDICT_FALSE (alloc_arena (h) == 0))
220 goto never_initialized;
221
Dave Barach97f5af02018-02-22 09:48:45 -0500222 vec_free (h->working_copies);
Vijayabhaskar Katamreddy72739a62019-05-07 13:27:32 -0700223 vec_free (h->working_copy_lengths);
Dave Barach9466c452018-08-24 17:21:14 -0400224#if BIHASH_32_64_SVM == 0
Dave Barach97f5af02018-02-22 09:48:45 -0500225 vec_free (h->freelists);
Dave Barach9466c452018-08-24 17:21:14 -0400226#else
227 if (h->memfd > 0)
228 (void) close (h->memfd);
229#endif
230 clib_mem_vm_free ((void *) (uword) (alloc_arena (h)), alloc_arena_size (h));
Dave Barach32dcd3b2019-07-08 12:25:38 -0400231never_initialized:
Dave Barachb7b92992018-10-17 10:38:51 -0400232 clib_memset (h, 0, sizeof (*h));
Dave Barach32dcd3b2019-07-08 12:25:38 -0400233 for (i = 0; i < vec_len (clib_all_bihashes); i++)
234 {
235 if ((void *) h == clib_all_bihashes[i])
236 {
237 vec_delete (clib_all_bihashes, 1, i);
238 return;
239 }
240 }
241 clib_warning ("Couldn't find hash table %llx on clib_all_bihashes...",
242 (u64) h);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700243}
244
Dave Barachc3799992016-08-15 11:12:27 -0400245static
246BVT (clib_bihash_value) *
247BV (value_alloc) (BVT (clib_bihash) * h, u32 log2_pages)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700248{
Dave Barachc3799992016-08-15 11:12:27 -0400249 BVT (clib_bihash_value) * rv = 0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700250
Dave Barach508498f2018-07-19 12:11:16 -0400251 ASSERT (h->alloc_lock[0]);
Dave Barach9466c452018-08-24 17:21:14 -0400252
253#if BIHASH_32_64_SVM
254 ASSERT (log2_pages < vec_len (h->freelists));
255#endif
256
Dave Barachc3799992016-08-15 11:12:27 -0400257 if (log2_pages >= vec_len (h->freelists) || h->freelists[log2_pages] == 0)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700258 {
Dave Barach97f5af02018-02-22 09:48:45 -0500259 vec_validate_init_empty (h->freelists, log2_pages, 0);
260 rv = BV (alloc_aligned) (h, (sizeof (*rv) * (1 << log2_pages)));
Dave Barachc3799992016-08-15 11:12:27 -0400261 goto initialize;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700262 }
Dave Barachffb14b92018-09-11 17:20:23 -0400263 rv = BV (clib_bihash_get_value) (h, (uword) h->freelists[log2_pages]);
Dave Barach9466c452018-08-24 17:21:14 -0400264 h->freelists[log2_pages] = rv->next_free_as_u64;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700265
Dave Barachc3799992016-08-15 11:12:27 -0400266initialize:
267 ASSERT (rv);
Dave Barachc3799992016-08-15 11:12:27 -0400268 /*
269 * Latest gcc complains that the length arg is zero
270 * if we replace (1<<log2_pages) with vec_len(rv).
271 * No clue.
272 */
Dave Barachb7b92992018-10-17 10:38:51 -0400273 clib_memset (rv, 0xff, sizeof (*rv) * (1 << log2_pages));
Dave Barachc3799992016-08-15 11:12:27 -0400274 return rv;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700275}
276
277static void
Dave Barachba7ddfe2017-05-17 20:20:50 -0400278BV (value_free) (BVT (clib_bihash) * h, BVT (clib_bihash_value) * v,
279 u32 log2_pages)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700280{
Dave Barach508498f2018-07-19 12:11:16 -0400281 ASSERT (h->alloc_lock[0]);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700282
Dave Barachc3799992016-08-15 11:12:27 -0400283 ASSERT (vec_len (h->freelists) > log2_pages);
284
Dave Barach508498f2018-07-19 12:11:16 -0400285 if (CLIB_DEBUG > 0)
Dave Barachb7b92992018-10-17 10:38:51 -0400286 clib_memset (v, 0xFE, sizeof (*v) * (1 << log2_pages));
Dave Barach508498f2018-07-19 12:11:16 -0400287
Dave Barach9466c452018-08-24 17:21:14 -0400288 v->next_free_as_u64 = (u64) h->freelists[log2_pages];
Dave Barachffb14b92018-09-11 17:20:23 -0400289 h->freelists[log2_pages] = (u64) BV (clib_bihash_get_offset) (h, v);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700290}
291
292static inline void
Dave Barach908a5ea2017-07-14 12:42:21 -0400293BV (make_working_copy) (BVT (clib_bihash) * h, BVT (clib_bihash_bucket) * b)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700294{
Dave Barachc3799992016-08-15 11:12:27 -0400295 BVT (clib_bihash_value) * v;
Dave Barach908a5ea2017-07-14 12:42:21 -0400296 BVT (clib_bihash_bucket) working_bucket __attribute__ ((aligned (8)));
Dave Barachc3799992016-08-15 11:12:27 -0400297 BVT (clib_bihash_value) * working_copy;
Damjan Marionf55f9b82017-05-10 21:06:28 +0200298 u32 thread_index = os_get_thread_index ();
Dave Barachba7ddfe2017-05-17 20:20:50 -0400299 int log2_working_copy_length;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700300
Dave Barach508498f2018-07-19 12:11:16 -0400301 ASSERT (h->alloc_lock[0]);
302
Damjan Marionf55f9b82017-05-10 21:06:28 +0200303 if (thread_index >= vec_len (h->working_copies))
Ed Warnickecb9cada2015-12-08 15:45:58 -0700304 {
Damjan Marionf55f9b82017-05-10 21:06:28 +0200305 vec_validate (h->working_copies, thread_index);
Steve Shin871cdec2017-06-02 10:09:02 -0700306 vec_validate_init_empty (h->working_copy_lengths, thread_index, ~0);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700307 }
308
Dave Barachc3799992016-08-15 11:12:27 -0400309 /*
Ed Warnickecb9cada2015-12-08 15:45:58 -0700310 * working_copies are per-cpu so that near-simultaneous
311 * updates from multiple threads will not result in sporadic, spurious
Dave Barachc3799992016-08-15 11:12:27 -0400312 * lookup failures.
Ed Warnickecb9cada2015-12-08 15:45:58 -0700313 */
Damjan Marionf55f9b82017-05-10 21:06:28 +0200314 working_copy = h->working_copies[thread_index];
Dave Barachba7ddfe2017-05-17 20:20:50 -0400315 log2_working_copy_length = h->working_copy_lengths[thread_index];
Ed Warnickecb9cada2015-12-08 15:45:58 -0700316
317 h->saved_bucket.as_u64 = b->as_u64;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700318
Dave Barachba7ddfe2017-05-17 20:20:50 -0400319 if (b->log2_pages > log2_working_copy_length)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700320 {
Dave Barach97f5af02018-02-22 09:48:45 -0500321 /*
322 * It's not worth the bookkeeping to free working copies
323 * if (working_copy)
324 * clib_mem_free (working_copy);
325 */
326 working_copy = BV (alloc_aligned)
327 (h, sizeof (working_copy[0]) * (1 << b->log2_pages));
Dave Barachba7ddfe2017-05-17 20:20:50 -0400328 h->working_copy_lengths[thread_index] = b->log2_pages;
Damjan Marionf55f9b82017-05-10 21:06:28 +0200329 h->working_copies[thread_index] = working_copy;
Dave Barach2ce28d62019-05-03 12:58:01 -0400330
331 BV (clib_bihash_increment_stat) (h, BIHASH_STAT_working_copy_lost,
332 1ULL << b->log2_pages);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700333 }
334
Dave Barachc3799992016-08-15 11:12:27 -0400335 v = BV (clib_bihash_get_value) (h, b->offset);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700336
Dave Barach178cf492018-11-13 16:34:13 -0500337 clib_memcpy_fast (working_copy, v, sizeof (*v) * (1 << b->log2_pages));
Ed Warnickecb9cada2015-12-08 15:45:58 -0700338 working_bucket.as_u64 = b->as_u64;
Dave Barachc3799992016-08-15 11:12:27 -0400339 working_bucket.offset = BV (clib_bihash_get_offset) (h, working_copy);
340 CLIB_MEMORY_BARRIER ();
Ed Warnickecb9cada2015-12-08 15:45:58 -0700341 b->as_u64 = working_bucket.as_u64;
Damjan Marionf55f9b82017-05-10 21:06:28 +0200342 h->working_copies[thread_index] = working_copy;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700343}
344
Dave Barachc3799992016-08-15 11:12:27 -0400345static
346BVT (clib_bihash_value) *
347BV (split_and_rehash)
348 (BVT (clib_bihash) * h,
Dave Barachba7ddfe2017-05-17 20:20:50 -0400349 BVT (clib_bihash_value) * old_values, u32 old_log2_pages,
350 u32 new_log2_pages)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700351{
Dave Barach5e6b9582016-12-12 15:37:29 -0500352 BVT (clib_bihash_value) * new_values, *new_v;
Dave Barachba7ddfe2017-05-17 20:20:50 -0400353 int i, j, length_in_kvs;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700354
Dave Barach508498f2018-07-19 12:11:16 -0400355 ASSERT (h->alloc_lock[0]);
356
Dave Barachc3799992016-08-15 11:12:27 -0400357 new_values = BV (value_alloc) (h, new_log2_pages);
Dave Barachba7ddfe2017-05-17 20:20:50 -0400358 length_in_kvs = (1 << old_log2_pages) * BIHASH_KVP_PER_PAGE;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700359
Dave Barachba7ddfe2017-05-17 20:20:50 -0400360 for (i = 0; i < length_in_kvs; i++)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700361 {
362 u64 new_hash;
Dave Barachc3799992016-08-15 11:12:27 -0400363
Dave Barach5e6b9582016-12-12 15:37:29 -0500364 /* Entry not in use? Forget it */
365 if (BV (clib_bihash_is_free) (&(old_values->kvp[i])))
366 continue;
367
368 /* rehash the item onto its new home-page */
369 new_hash = BV (clib_bihash_hash) (&(old_values->kvp[i]));
370 new_hash >>= h->log2_nbuckets;
371 new_hash &= (1 << new_log2_pages) - 1;
372 new_v = &new_values[new_hash];
373
374 /* Across the new home-page */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700375 for (j = 0; j < BIHASH_KVP_PER_PAGE; j++)
Dave Barachc3799992016-08-15 11:12:27 -0400376 {
Dave Barach5e6b9582016-12-12 15:37:29 -0500377 /* Empty slot */
378 if (BV (clib_bihash_is_free) (&(new_v->kvp[j])))
Dave Barachc3799992016-08-15 11:12:27 -0400379 {
Dave Barach178cf492018-11-13 16:34:13 -0500380 clib_memcpy_fast (&(new_v->kvp[j]), &(old_values->kvp[i]),
381 sizeof (new_v->kvp[j]));
Dave Barach5e6b9582016-12-12 15:37:29 -0500382 goto doublebreak;
Dave Barachc3799992016-08-15 11:12:27 -0400383 }
Dave Barachc3799992016-08-15 11:12:27 -0400384 }
Dave Barach5e6b9582016-12-12 15:37:29 -0500385 /* Crap. Tell caller to try again */
Dave Barachba7ddfe2017-05-17 20:20:50 -0400386 BV (value_free) (h, new_values, new_log2_pages);
Dave Barach5e6b9582016-12-12 15:37:29 -0500387 return 0;
388 doublebreak:;
389 }
Dave Barachba7ddfe2017-05-17 20:20:50 -0400390
Dave Barach5e6b9582016-12-12 15:37:29 -0500391 return new_values;
392}
393
394static
395BVT (clib_bihash_value) *
396BV (split_and_rehash_linear)
397 (BVT (clib_bihash) * h,
Dave Barachba7ddfe2017-05-17 20:20:50 -0400398 BVT (clib_bihash_value) * old_values, u32 old_log2_pages,
399 u32 new_log2_pages)
Dave Barach5e6b9582016-12-12 15:37:29 -0500400{
401 BVT (clib_bihash_value) * new_values;
Dave Barachba7ddfe2017-05-17 20:20:50 -0400402 int i, j, new_length, old_length;
Dave Barach5e6b9582016-12-12 15:37:29 -0500403
Dave Barach508498f2018-07-19 12:11:16 -0400404 ASSERT (h->alloc_lock[0]);
405
Dave Barach5e6b9582016-12-12 15:37:29 -0500406 new_values = BV (value_alloc) (h, new_log2_pages);
407 new_length = (1 << new_log2_pages) * BIHASH_KVP_PER_PAGE;
Dave Barachba7ddfe2017-05-17 20:20:50 -0400408 old_length = (1 << old_log2_pages) * BIHASH_KVP_PER_PAGE;
Dave Barach5e6b9582016-12-12 15:37:29 -0500409
410 j = 0;
411 /* Across the old value array */
Dave Barachba7ddfe2017-05-17 20:20:50 -0400412 for (i = 0; i < old_length; i++)
Dave Barach5e6b9582016-12-12 15:37:29 -0500413 {
414 /* Find a free slot in the new linear scan bucket */
415 for (; j < new_length; j++)
416 {
Dave Barach8f544962017-01-18 10:23:22 -0500417 /* Old value not in use? Forget it. */
Dave Barach5e6b9582016-12-12 15:37:29 -0500418 if (BV (clib_bihash_is_free) (&(old_values->kvp[i])))
419 goto doublebreak;
420
421 /* New value should never be in use */
422 if (BV (clib_bihash_is_free) (&(new_values->kvp[j])))
423 {
424 /* Copy the old value and move along */
Dave Barach178cf492018-11-13 16:34:13 -0500425 clib_memcpy_fast (&(new_values->kvp[j]), &(old_values->kvp[i]),
426 sizeof (new_values->kvp[j]));
Dave Barach5e6b9582016-12-12 15:37:29 -0500427 j++;
428 goto doublebreak;
429 }
Dave Barach5e6b9582016-12-12 15:37:29 -0500430 }
Dave Barach8f544962017-01-18 10:23:22 -0500431 /* This should never happen... */
432 clib_warning ("BUG: linear rehash failed!");
Dave Barachba7ddfe2017-05-17 20:20:50 -0400433 BV (value_free) (h, new_values, new_log2_pages);
Dave Barach8f544962017-01-18 10:23:22 -0500434 return 0;
435
Dave Barach5e6b9582016-12-12 15:37:29 -0500436 doublebreak:;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700437 }
438 return new_values;
439}
440
Matus Fabian828d27e2018-08-21 03:15:50 -0700441static inline int BV (clib_bihash_add_del_inline)
442 (BVT (clib_bihash) * h, BVT (clib_bihash_kv) * add_v, int is_add,
443 int (*is_stale_cb) (BVT (clib_bihash_kv) *, void *), void *arg)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700444{
445 u32 bucket_index;
Dave Barach908a5ea2017-07-14 12:42:21 -0400446 BVT (clib_bihash_bucket) * b, tmp_b;
Dave Barachc3799992016-08-15 11:12:27 -0400447 BVT (clib_bihash_value) * v, *new_v, *save_new_v, *working_copy;
Dave Barach5e6b9582016-12-12 15:37:29 -0500448 int i, limit;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700449 u64 hash, new_hash;
Dave Barachba7ddfe2017-05-17 20:20:50 -0400450 u32 new_log2_pages, old_log2_pages;
Damjan Marionf55f9b82017-05-10 21:06:28 +0200451 u32 thread_index = os_get_thread_index ();
Dave Barach5e6b9582016-12-12 15:37:29 -0500452 int mark_bucket_linear;
453 int resplit_once;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700454
Dave Barach32dcd3b2019-07-08 12:25:38 -0400455 /* Create the table (is_add=1), or flunk the request now (is_add=0) */
456 if (PREDICT_FALSE (alloc_arena (h) == 0))
457 {
458 if (is_add == 0)
459 return (-1);
460 BV (clib_bihash_instantiate) (h);
461 }
462
Dave Barachc3799992016-08-15 11:12:27 -0400463 hash = BV (clib_bihash_hash) (add_v);
464
465 bucket_index = hash & (h->nbuckets - 1);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700466 b = &h->buckets[bucket_index];
467
468 hash >>= h->log2_nbuckets;
469
Dave Barach508498f2018-07-19 12:11:16 -0400470 BV (clib_bihash_lock_bucket) (b);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700471
472 /* First elt in the bucket? */
Damjan Marion882fcfe2018-07-17 23:01:49 +0200473 if (BV (clib_bihash_bucket_is_empty) (b))
Ed Warnickecb9cada2015-12-08 15:45:58 -0700474 {
475 if (is_add == 0)
Dave Barachc3799992016-08-15 11:12:27 -0400476 {
Dave Barach508498f2018-07-19 12:11:16 -0400477 BV (clib_bihash_unlock_bucket) (b);
478 return (-1);
Dave Barachc3799992016-08-15 11:12:27 -0400479 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700480
Dave Barach508498f2018-07-19 12:11:16 -0400481 BV (clib_bihash_alloc_lock) (h);
Dave Barachc3799992016-08-15 11:12:27 -0400482 v = BV (value_alloc) (h, 0);
Dave Barach508498f2018-07-19 12:11:16 -0400483 BV (clib_bihash_alloc_unlock) (h);
Dave Barachba7ddfe2017-05-17 20:20:50 -0400484
Dave Barachc3799992016-08-15 11:12:27 -0400485 *v->kvp = *add_v;
Dave Barach508498f2018-07-19 12:11:16 -0400486 tmp_b.as_u64 = 0; /* clears bucket lock */
Dave Barachc3799992016-08-15 11:12:27 -0400487 tmp_b.offset = BV (clib_bihash_get_offset) (h, v);
Dave Barache7d212f2018-02-07 13:14:06 -0500488 tmp_b.refcnt = 1;
Dave Barach508498f2018-07-19 12:11:16 -0400489 CLIB_MEMORY_BARRIER ();
Ed Warnickecb9cada2015-12-08 15:45:58 -0700490
Tom Seidenberg97f8ae92019-03-15 10:15:26 -0400491 b->as_u64 = tmp_b.as_u64; /* unlocks the bucket */
Dave Barach2ce28d62019-05-03 12:58:01 -0400492 BV (clib_bihash_increment_stat) (h, BIHASH_STAT_alloc_add, 1);
493
Dave Barach508498f2018-07-19 12:11:16 -0400494 return (0);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700495 }
496
Dave Barach508498f2018-07-19 12:11:16 -0400497 /* WARNING: we're still looking at the live copy... */
Dave Barach5e6b9582016-12-12 15:37:29 -0500498 limit = BIHASH_KVP_PER_PAGE;
Dave Barach508498f2018-07-19 12:11:16 -0400499 v = BV (clib_bihash_get_value) (h, b->offset);
500
Dave Barach5e6b9582016-12-12 15:37:29 -0500501 v += (b->linear_search == 0) ? hash & ((1 << b->log2_pages) - 1) : 0;
502 if (b->linear_search)
503 limit <<= b->log2_pages;
Dave Barachc3799992016-08-15 11:12:27 -0400504
Ed Warnickecb9cada2015-12-08 15:45:58 -0700505 if (is_add)
506 {
Dave Barachc3799992016-08-15 11:12:27 -0400507 /*
Dave Barach508498f2018-07-19 12:11:16 -0400508 * Because reader threads are looking at live data,
509 * we have to be extra careful. Readers do NOT hold the
510 * bucket lock. We need to be SLOWER than a search, past the
511 * point where readers CHECK the bucket lock.
512 */
513
514 /*
Ed Warnickecb9cada2015-12-08 15:45:58 -0700515 * For obvious (in hindsight) reasons, see if we're supposed to
516 * replace an existing key, then look for an empty slot.
517 */
Dave Barach5e6b9582016-12-12 15:37:29 -0500518 for (i = 0; i < limit; i++)
Dave Barachc3799992016-08-15 11:12:27 -0400519 {
Dave Baracha11bf452019-04-17 17:27:31 -0400520 if (BV (clib_bihash_key_compare) (v->kvp[i].key, add_v->key))
Dave Barachc3799992016-08-15 11:12:27 -0400521 {
Dave Barach9e4946b2019-07-08 14:47:44 -0400522 /* Add but do not overwrite? */
523 if (is_add == 2)
524 {
525 BV (clib_bihash_unlock_bucket) (b);
526 return (-2);
527 }
528
Dave Barach508498f2018-07-19 12:11:16 -0400529 CLIB_MEMORY_BARRIER (); /* Add a delay */
Dave Barach178cf492018-11-13 16:34:13 -0500530 clib_memcpy_fast (&(v->kvp[i]), add_v, sizeof (*add_v));
Dave Barach508498f2018-07-19 12:11:16 -0400531 BV (clib_bihash_unlock_bucket) (b);
Dave Barach2ce28d62019-05-03 12:58:01 -0400532 BV (clib_bihash_increment_stat) (h, BIHASH_STAT_replace, 1);
Dave Barach508498f2018-07-19 12:11:16 -0400533 return (0);
Dave Barachc3799992016-08-15 11:12:27 -0400534 }
535 }
Dave Barach508498f2018-07-19 12:11:16 -0400536 /*
537 * Look for an empty slot. If found, use it
538 */
Dave Barach5e6b9582016-12-12 15:37:29 -0500539 for (i = 0; i < limit; i++)
Dave Barachc3799992016-08-15 11:12:27 -0400540 {
541 if (BV (clib_bihash_is_free) (&(v->kvp[i])))
542 {
Dave Barach508498f2018-07-19 12:11:16 -0400543 /*
544 * Copy the value first, so that if a reader manages
545 * to match the new key, the value will be right...
546 */
Dave Barach178cf492018-11-13 16:34:13 -0500547 clib_memcpy_fast (&(v->kvp[i].value),
548 &add_v->value, sizeof (add_v->value));
Dave Barach508498f2018-07-19 12:11:16 -0400549 CLIB_MEMORY_BARRIER (); /* Make sure the value has settled */
Dave Barach178cf492018-11-13 16:34:13 -0500550 clib_memcpy_fast (&(v->kvp[i]), &add_v->key,
551 sizeof (add_v->key));
Dave Barache7d212f2018-02-07 13:14:06 -0500552 b->refcnt++;
Dave Barach9466c452018-08-24 17:21:14 -0400553 ASSERT (b->refcnt > 0);
Dave Barach508498f2018-07-19 12:11:16 -0400554 BV (clib_bihash_unlock_bucket) (b);
Dave Barach2ce28d62019-05-03 12:58:01 -0400555 BV (clib_bihash_increment_stat) (h, BIHASH_STAT_add, 1);
Dave Barach508498f2018-07-19 12:11:16 -0400556 return (0);
Dave Barachc3799992016-08-15 11:12:27 -0400557 }
558 }
Matus Fabian828d27e2018-08-21 03:15:50 -0700559 /* look for stale data to overwrite */
560 if (is_stale_cb)
561 {
562 for (i = 0; i < limit; i++)
563 {
564 if (is_stale_cb (&(v->kvp[i]), arg))
565 {
566 CLIB_MEMORY_BARRIER ();
Dave Barach178cf492018-11-13 16:34:13 -0500567 clib_memcpy_fast (&(v->kvp[i]), add_v, sizeof (*add_v));
Matus Fabian828d27e2018-08-21 03:15:50 -0700568 BV (clib_bihash_unlock_bucket) (b);
Dave Barach2ce28d62019-05-03 12:58:01 -0400569 BV (clib_bihash_increment_stat) (h, BIHASH_STAT_replace, 1);
Matus Fabian828d27e2018-08-21 03:15:50 -0700570 return (0);
571 }
572 }
573 }
Dave Barach508498f2018-07-19 12:11:16 -0400574 /* Out of space in this bucket, split the bucket... */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700575 }
Dave Barach508498f2018-07-19 12:11:16 -0400576 else /* delete case */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700577 {
Dave Barach5e6b9582016-12-12 15:37:29 -0500578 for (i = 0; i < limit; i++)
Dave Barachc3799992016-08-15 11:12:27 -0400579 {
Dave Barach508498f2018-07-19 12:11:16 -0400580 /* Found the key? Kill it... */
Dave Baracha11bf452019-04-17 17:27:31 -0400581 if (BV (clib_bihash_key_compare) (v->kvp[i].key, add_v->key))
Dave Barachc3799992016-08-15 11:12:27 -0400582 {
Dave Barachb7b92992018-10-17 10:38:51 -0400583 clib_memset (&(v->kvp[i]), 0xff, sizeof (*(add_v)));
Dave Barach508498f2018-07-19 12:11:16 -0400584 /* Is the bucket empty? */
585 if (PREDICT_TRUE (b->refcnt > 1))
Dave Barache7d212f2018-02-07 13:14:06 -0500586 {
Dave Barach508498f2018-07-19 12:11:16 -0400587 b->refcnt--;
588 BV (clib_bihash_unlock_bucket) (b);
Dave Barach2ce28d62019-05-03 12:58:01 -0400589 BV (clib_bihash_increment_stat) (h, BIHASH_STAT_del, 1);
Dave Barach508498f2018-07-19 12:11:16 -0400590 return (0);
Dave Barache7d212f2018-02-07 13:14:06 -0500591 }
Dave Barach508498f2018-07-19 12:11:16 -0400592 else /* yes, free it */
Dave Barache7d212f2018-02-07 13:14:06 -0500593 {
Dave Barach508498f2018-07-19 12:11:16 -0400594 /* Save old bucket value, need log2_pages to free it */
595 tmp_b.as_u64 = b->as_u64;
596 CLIB_MEMORY_BARRIER ();
597
598 /* Kill and unlock the bucket */
599 b->as_u64 = 0;
600
601 /* And free the backing storage */
602 BV (clib_bihash_alloc_lock) (h);
603 /* Note: v currently points into the middle of the bucket */
604 v = BV (clib_bihash_get_value) (h, tmp_b.offset);
605 BV (value_free) (h, v, tmp_b.log2_pages);
606 BV (clib_bihash_alloc_unlock) (h);
Dave Barach2ce28d62019-05-03 12:58:01 -0400607 BV (clib_bihash_increment_stat) (h, BIHASH_STAT_del_free,
608 1);
Dave Barach508498f2018-07-19 12:11:16 -0400609 return (0);
Dave Barache7d212f2018-02-07 13:14:06 -0500610 }
Dave Barachc3799992016-08-15 11:12:27 -0400611 }
612 }
Dave Barach508498f2018-07-19 12:11:16 -0400613 /* Not found... */
614 BV (clib_bihash_unlock_bucket) (b);
615 return (-3);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700616 }
617
Dave Barach508498f2018-07-19 12:11:16 -0400618 /* Move readers to a (locked) temp copy of the bucket */
619 BV (clib_bihash_alloc_lock) (h);
620 BV (make_working_copy) (h, b);
621
622 v = BV (clib_bihash_get_value) (h, h->saved_bucket.offset);
623
Dave Barachba7ddfe2017-05-17 20:20:50 -0400624 old_log2_pages = h->saved_bucket.log2_pages;
625 new_log2_pages = old_log2_pages + 1;
Dave Barach5e6b9582016-12-12 15:37:29 -0500626 mark_bucket_linear = 0;
Dave Barach2ce28d62019-05-03 12:58:01 -0400627 BV (clib_bihash_increment_stat) (h, BIHASH_STAT_split_add, 1);
628 BV (clib_bihash_increment_stat) (h, BIHASH_STAT_splits, old_log2_pages);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700629
Damjan Marionf55f9b82017-05-10 21:06:28 +0200630 working_copy = h->working_copies[thread_index];
Dave Barach5e6b9582016-12-12 15:37:29 -0500631 resplit_once = 0;
Dave Barach2ce28d62019-05-03 12:58:01 -0400632 BV (clib_bihash_increment_stat) (h, BIHASH_STAT_splits, 1);
Dave Barach5e6b9582016-12-12 15:37:29 -0500633
Dave Barachba7ddfe2017-05-17 20:20:50 -0400634 new_v = BV (split_and_rehash) (h, working_copy, old_log2_pages,
635 new_log2_pages);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700636 if (new_v == 0)
637 {
Dave Barach5e6b9582016-12-12 15:37:29 -0500638 try_resplit:
639 resplit_once = 1;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700640 new_log2_pages++;
Dave Barach5e6b9582016-12-12 15:37:29 -0500641 /* Try re-splitting. If that fails, fall back to linear search */
Dave Barachba7ddfe2017-05-17 20:20:50 -0400642 new_v = BV (split_and_rehash) (h, working_copy, old_log2_pages,
643 new_log2_pages);
Dave Barach5e6b9582016-12-12 15:37:29 -0500644 if (new_v == 0)
645 {
646 mark_linear:
647 new_log2_pages--;
648 /* pinned collisions, use linear search */
649 new_v =
Dave Barachba7ddfe2017-05-17 20:20:50 -0400650 BV (split_and_rehash_linear) (h, working_copy, old_log2_pages,
651 new_log2_pages);
Dave Barach5e6b9582016-12-12 15:37:29 -0500652 mark_bucket_linear = 1;
Dave Barach2ce28d62019-05-03 12:58:01 -0400653 BV (clib_bihash_increment_stat) (h, BIHASH_STAT_linear, 1);
Dave Barach5e6b9582016-12-12 15:37:29 -0500654 }
Dave Barach2ce28d62019-05-03 12:58:01 -0400655 BV (clib_bihash_increment_stat) (h, BIHASH_STAT_resplit, 1);
656 BV (clib_bihash_increment_stat) (h, BIHASH_STAT_splits,
657 old_log2_pages + 1);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700658 }
659
660 /* Try to add the new entry */
661 save_new_v = new_v;
Dave Barachc3799992016-08-15 11:12:27 -0400662 new_hash = BV (clib_bihash_hash) (add_v);
Dave Barach5e6b9582016-12-12 15:37:29 -0500663 limit = BIHASH_KVP_PER_PAGE;
664 if (mark_bucket_linear)
665 limit <<= new_log2_pages;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700666 new_hash >>= h->log2_nbuckets;
Dave Barach5e6b9582016-12-12 15:37:29 -0500667 new_hash &= (1 << new_log2_pages) - 1;
668 new_v += mark_bucket_linear ? 0 : new_hash;
Dave Barachc3799992016-08-15 11:12:27 -0400669
Dave Barach5e6b9582016-12-12 15:37:29 -0500670 for (i = 0; i < limit; i++)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700671 {
Dave Barachc3799992016-08-15 11:12:27 -0400672 if (BV (clib_bihash_is_free) (&(new_v->kvp[i])))
673 {
Dave Barach178cf492018-11-13 16:34:13 -0500674 clib_memcpy_fast (&(new_v->kvp[i]), add_v, sizeof (*add_v));
Dave Barachc3799992016-08-15 11:12:27 -0400675 goto expand_ok;
676 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700677 }
Dave Barachba7ddfe2017-05-17 20:20:50 -0400678
Ed Warnickecb9cada2015-12-08 15:45:58 -0700679 /* Crap. Try again */
Dave Barachba7ddfe2017-05-17 20:20:50 -0400680 BV (value_free) (h, save_new_v, new_log2_pages);
Dave Barach5e6b9582016-12-12 15:37:29 -0500681 /*
682 * If we've already doubled the size of the bucket once,
683 * fall back to linear search now.
684 */
685 if (resplit_once)
686 goto mark_linear;
687 else
688 goto try_resplit;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700689
Dave Barachc3799992016-08-15 11:12:27 -0400690expand_ok:
Dave Barach5e6b9582016-12-12 15:37:29 -0500691 tmp_b.log2_pages = new_log2_pages;
Dave Barachc3799992016-08-15 11:12:27 -0400692 tmp_b.offset = BV (clib_bihash_get_offset) (h, save_new_v);
Dave Barach5e6b9582016-12-12 15:37:29 -0500693 tmp_b.linear_search = mark_bucket_linear;
Dave Barache7d212f2018-02-07 13:14:06 -0500694 tmp_b.refcnt = h->saved_bucket.refcnt + 1;
Dave Barach9466c452018-08-24 17:21:14 -0400695 ASSERT (tmp_b.refcnt > 0);
Dave Barach508498f2018-07-19 12:11:16 -0400696 tmp_b.lock = 0;
Dave Barachc3799992016-08-15 11:12:27 -0400697 CLIB_MEMORY_BARRIER ();
Ed Warnickecb9cada2015-12-08 15:45:58 -0700698 b->as_u64 = tmp_b.as_u64;
Andrew Yourtchenkodf32bc42018-09-20 15:36:51 +0200699 /* free the old bucket */
700 v = BV (clib_bihash_get_value) (h, h->saved_bucket.offset);
701 BV (value_free) (h, v, h->saved_bucket.log2_pages);
Dave Barach508498f2018-07-19 12:11:16 -0400702 BV (clib_bihash_alloc_unlock) (h);
703 return (0);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700704}
705
Matus Fabian828d27e2018-08-21 03:15:50 -0700706int BV (clib_bihash_add_del)
707 (BVT (clib_bihash) * h, BVT (clib_bihash_kv) * add_v, int is_add)
708{
709 return BV (clib_bihash_add_del_inline) (h, add_v, is_add, 0, 0);
710}
711
712int BV (clib_bihash_add_or_overwrite_stale)
713 (BVT (clib_bihash) * h, BVT (clib_bihash_kv) * add_v,
714 int (*stale_callback) (BVT (clib_bihash_kv) *, void *), void *arg)
715{
716 return BV (clib_bihash_add_del_inline) (h, add_v, 1, stale_callback, arg);
717}
718
Dave Barachc3799992016-08-15 11:12:27 -0400719int BV (clib_bihash_search)
Dave Barach908a5ea2017-07-14 12:42:21 -0400720 (BVT (clib_bihash) * h,
Dave Barachc3799992016-08-15 11:12:27 -0400721 BVT (clib_bihash_kv) * search_key, BVT (clib_bihash_kv) * valuep)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700722{
723 u64 hash;
724 u32 bucket_index;
Dave Barachc3799992016-08-15 11:12:27 -0400725 BVT (clib_bihash_value) * v;
Dave Barach908a5ea2017-07-14 12:42:21 -0400726 BVT (clib_bihash_bucket) * b;
Dave Barach5e6b9582016-12-12 15:37:29 -0500727 int i, limit;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700728
Dave Barachc3799992016-08-15 11:12:27 -0400729 ASSERT (valuep);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700730
Dave Barach32dcd3b2019-07-08 12:25:38 -0400731 if (PREDICT_FALSE (alloc_arena (h) == 0))
732 return -1;
733
Dave Barachc3799992016-08-15 11:12:27 -0400734 hash = BV (clib_bihash_hash) (search_key);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700735
Dave Barachc3799992016-08-15 11:12:27 -0400736 bucket_index = hash & (h->nbuckets - 1);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700737 b = &h->buckets[bucket_index];
738
Damjan Marion882fcfe2018-07-17 23:01:49 +0200739 if (BV (clib_bihash_bucket_is_empty) (b))
Ed Warnickecb9cada2015-12-08 15:45:58 -0700740 return -1;
741
Dave Barach508498f2018-07-19 12:11:16 -0400742 if (PREDICT_FALSE (b->lock))
Dave Barach908a5ea2017-07-14 12:42:21 -0400743 {
Dave Barach508498f2018-07-19 12:11:16 -0400744 volatile BVT (clib_bihash_bucket) * bv = b;
745 while (bv->lock)
Damjan Marion2a03efe2018-07-20 21:48:59 +0200746 CLIB_PAUSE ();
Dave Barach908a5ea2017-07-14 12:42:21 -0400747 }
748
Ed Warnickecb9cada2015-12-08 15:45:58 -0700749 hash >>= h->log2_nbuckets;
750
Dave Barachc3799992016-08-15 11:12:27 -0400751 v = BV (clib_bihash_get_value) (h, b->offset);
Dave Barach5e6b9582016-12-12 15:37:29 -0500752 limit = BIHASH_KVP_PER_PAGE;
753 v += (b->linear_search == 0) ? hash & ((1 << b->log2_pages) - 1) : 0;
754 if (PREDICT_FALSE (b->linear_search))
755 limit <<= b->log2_pages;
Dave Barachc3799992016-08-15 11:12:27 -0400756
Dave Barach5e6b9582016-12-12 15:37:29 -0500757 for (i = 0; i < limit; i++)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700758 {
Dave Barachc3799992016-08-15 11:12:27 -0400759 if (BV (clib_bihash_key_compare) (v->kvp[i].key, search_key->key))
760 {
761 *valuep = v->kvp[i];
762 return 0;
763 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700764 }
765 return -1;
766}
767
Dave Barachc3799992016-08-15 11:12:27 -0400768u8 *BV (format_bihash) (u8 * s, va_list * args)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700769{
Dave Barachc3799992016-08-15 11:12:27 -0400770 BVT (clib_bihash) * h = va_arg (*args, BVT (clib_bihash) *);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700771 int verbose = va_arg (*args, int);
Dave Barach908a5ea2017-07-14 12:42:21 -0400772 BVT (clib_bihash_bucket) * b;
Dave Barachc3799992016-08-15 11:12:27 -0400773 BVT (clib_bihash_value) * v;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700774 int i, j, k;
775 u64 active_elements = 0;
Dave Barache7d212f2018-02-07 13:14:06 -0500776 u64 active_buckets = 0;
777 u64 linear_buckets = 0;
Dave Barach97f5af02018-02-22 09:48:45 -0500778 u64 used_bytes;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700779
780 s = format (s, "Hash table %s\n", h->name ? h->name : (u8 *) "(unnamed)");
Dave Barachc3799992016-08-15 11:12:27 -0400781
Dave Barach32dcd3b2019-07-08 12:25:38 -0400782 if (PREDICT_FALSE (alloc_arena (h) == 0))
783 return format (s, "[empty, uninitialized]");
784
Ed Warnickecb9cada2015-12-08 15:45:58 -0700785 for (i = 0; i < h->nbuckets; i++)
786 {
Dave Barachc3799992016-08-15 11:12:27 -0400787 b = &h->buckets[i];
Damjan Marion882fcfe2018-07-17 23:01:49 +0200788 if (BV (clib_bihash_bucket_is_empty) (b))
Dave Barachc3799992016-08-15 11:12:27 -0400789 {
790 if (verbose > 1)
791 s = format (s, "[%d]: empty\n", i);
792 continue;
793 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700794
Dave Barache7d212f2018-02-07 13:14:06 -0500795 active_buckets++;
796
797 if (b->linear_search)
798 linear_buckets++;
799
Ed Warnickecb9cada2015-12-08 15:45:58 -0700800 if (verbose)
Dave Barachc3799992016-08-15 11:12:27 -0400801 {
Dave Barach9466c452018-08-24 17:21:14 -0400802 s = format (s, "[%d]: heap offset %lld, len %d, linear %d\n", i,
Dave Barach5e6b9582016-12-12 15:37:29 -0500803 b->offset, (1 << b->log2_pages), b->linear_search);
Dave Barachc3799992016-08-15 11:12:27 -0400804 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700805
Dave Barachc3799992016-08-15 11:12:27 -0400806 v = BV (clib_bihash_get_value) (h, b->offset);
807 for (j = 0; j < (1 << b->log2_pages); j++)
808 {
809 for (k = 0; k < BIHASH_KVP_PER_PAGE; k++)
810 {
811 if (BV (clib_bihash_is_free) (&v->kvp[k]))
812 {
813 if (verbose > 1)
814 s = format (s, " %d: empty\n",
815 j * BIHASH_KVP_PER_PAGE + k);
816 continue;
817 }
818 if (verbose)
819 {
Vijayabhaskar Katamreddyfb8e61c2017-12-14 13:20:50 -0800820 if (h->fmt_fn)
821 {
822 s = format (s, " %d: %U\n",
823 j * BIHASH_KVP_PER_PAGE + k,
Vijayabhaskar Katamreddy72739a62019-05-07 13:27:32 -0700824 h->fmt_fn, &(v->kvp[k]), verbose);
Vijayabhaskar Katamreddyfb8e61c2017-12-14 13:20:50 -0800825 }
826 else
827 {
828 s = format (s, " %d: %U\n",
829 j * BIHASH_KVP_PER_PAGE + k,
830 BV (format_bihash_kvp), &(v->kvp[k]));
831 }
Dave Barachc3799992016-08-15 11:12:27 -0400832 }
833 active_elements++;
834 }
835 v++;
836 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700837 }
838
Dave Barache7d212f2018-02-07 13:14:06 -0500839 s = format (s, " %lld active elements %lld active buckets\n",
840 active_elements, active_buckets);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700841 s = format (s, " %d free lists\n", vec_len (h->freelists));
Dave Barache7d212f2018-02-07 13:14:06 -0500842
843 for (i = 0; i < vec_len (h->freelists); i++)
844 {
845 u32 nfree = 0;
846 BVT (clib_bihash_value) * free_elt;
Dave Barachffb14b92018-09-11 17:20:23 -0400847 u64 free_elt_as_u64 = h->freelists[i];
Dave Barache7d212f2018-02-07 13:14:06 -0500848
Dave Barachffb14b92018-09-11 17:20:23 -0400849 while (free_elt_as_u64)
Dave Barache7d212f2018-02-07 13:14:06 -0500850 {
Dave Barachffb14b92018-09-11 17:20:23 -0400851 free_elt = BV (clib_bihash_get_value) (h, free_elt_as_u64);
Dave Barache7d212f2018-02-07 13:14:06 -0500852 nfree++;
Dave Barachffb14b92018-09-11 17:20:23 -0400853 free_elt_as_u64 = free_elt->next_free_as_u64;
Dave Barache7d212f2018-02-07 13:14:06 -0500854 }
855
Dave Barach9466c452018-08-24 17:21:14 -0400856 if (nfree || verbose)
857 s = format (s, " [len %d] %u free elts\n", 1 << i, nfree);
Dave Barache7d212f2018-02-07 13:14:06 -0500858 }
859
860 s = format (s, " %lld linear search buckets\n", linear_buckets);
Dave Barachffb14b92018-09-11 17:20:23 -0400861 used_bytes = alloc_arena_next (h);
Dave Barach97f5af02018-02-22 09:48:45 -0500862 s = format (s,
863 " arena: base %llx, next %llx\n"
864 " used %lld b (%lld Mbytes) of %lld b (%lld Mbytes)\n",
Dave Barach9466c452018-08-24 17:21:14 -0400865 alloc_arena (h), alloc_arena_next (h),
Dave Barach97f5af02018-02-22 09:48:45 -0500866 used_bytes, used_bytes >> 20,
Dave Barach9466c452018-08-24 17:21:14 -0400867 alloc_arena_size (h), alloc_arena_size (h) >> 20);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700868 return s;
869}
870
Dave Barachc3799992016-08-15 11:12:27 -0400871void BV (clib_bihash_foreach_key_value_pair)
872 (BVT (clib_bihash) * h, void *callback, void *arg)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700873{
874 int i, j, k;
Dave Barach908a5ea2017-07-14 12:42:21 -0400875 BVT (clib_bihash_bucket) * b;
Dave Barachc3799992016-08-15 11:12:27 -0400876 BVT (clib_bihash_value) * v;
877 void (*fp) (BVT (clib_bihash_kv) *, void *) = callback;
878
Dave Barach32dcd3b2019-07-08 12:25:38 -0400879 if (PREDICT_FALSE (alloc_arena (h) == 0))
880 return;
881
Ed Warnickecb9cada2015-12-08 15:45:58 -0700882 for (i = 0; i < h->nbuckets; i++)
883 {
Dave Barachc3799992016-08-15 11:12:27 -0400884 b = &h->buckets[i];
Damjan Marion882fcfe2018-07-17 23:01:49 +0200885 if (BV (clib_bihash_bucket_is_empty) (b))
Dave Barachc3799992016-08-15 11:12:27 -0400886 continue;
887
888 v = BV (clib_bihash_get_value) (h, b->offset);
889 for (j = 0; j < (1 << b->log2_pages); j++)
890 {
891 for (k = 0; k < BIHASH_KVP_PER_PAGE; k++)
892 {
893 if (BV (clib_bihash_is_free) (&v->kvp[k]))
894 continue;
895
896 (*fp) (&v->kvp[k], arg);
Dave Barachca45ee72018-08-06 08:43:47 -0400897 /*
898 * In case the callback deletes the last entry in the bucket...
899 */
900 if (BV (clib_bihash_bucket_is_empty) (b))
901 goto doublebreak;
Dave Barachc3799992016-08-15 11:12:27 -0400902 }
903 v++;
904 }
Dave Barachca45ee72018-08-06 08:43:47 -0400905 doublebreak:
906 ;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700907 }
908}
Dave Barachdd3a57f2016-07-27 16:58:51 -0400909
/** @endcond */
Dave Barachc3799992016-08-15 11:12:27 -0400911
/*
 * fd.io coding-style-patch-verification: ON
 *
 * Local Variables:
 * eval: (c-set-style "gnu")
 * End:
 */