blob: bf6be83b2e06ea5db717394074ad2328cee25dbb [file] [log] [blame]
/*
 * Copyright (c) 2015 Cisco and/or its affiliates.
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at:
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
15
/** @cond DOCUMENTATION_IS_IN_BIHASH_DOC_H */
Dave Barachdd3a57f2016-07-27 16:58:51 -040017
Dave Barach97f5af02018-02-22 09:48:45 -050018static inline void *BV (alloc_aligned) (BVT (clib_bihash) * h, uword nbytes)
19{
20 uword rv;
21
22 /* Round to an even number of cache lines */
23 nbytes += CLIB_CACHE_LINE_BYTES - 1;
24 nbytes &= ~(CLIB_CACHE_LINE_BYTES - 1);
25
Dave Barach9466c452018-08-24 17:21:14 -040026 rv = alloc_arena_next (h);
27 alloc_arena_next (h) += nbytes;
Dave Barach97f5af02018-02-22 09:48:45 -050028
Andrew Yourtchenkoa7132542018-09-19 15:50:55 +020029 if (rv >= alloc_arena_size (h))
Dave Barach97f5af02018-02-22 09:48:45 -050030 os_out_of_memory ();
31
Dave Barachffb14b92018-09-11 17:20:23 -040032 return (void *) (uword) (rv + alloc_arena (h));
Dave Barach97f5af02018-02-22 09:48:45 -050033}
34
Dave Barach32dcd3b2019-07-08 12:25:38 -040035void BV (clib_bihash_instantiate) (BVT (clib_bihash) * h)
36{
37 uword bucket_size;
38
39 alloc_arena (h) = (uword) clib_mem_vm_alloc (h->memory_size);
40 alloc_arena_next (h) = 0;
41 alloc_arena_size (h) = h->memory_size;
42
43 bucket_size = h->nbuckets * sizeof (h->buckets[0]);
44 h->buckets = BV (alloc_aligned) (h, bucket_size);
45
46 h->alloc_lock = BV (alloc_aligned) (h, CLIB_CACHE_LINE_BYTES);
47 h->alloc_lock[0] = 0;
48}
Dave Barach97f5af02018-02-22 09:48:45 -050049
Dave Barachc3799992016-08-15 11:12:27 -040050void BV (clib_bihash_init)
51 (BVT (clib_bihash) * h, char *name, u32 nbuckets, uword memory_size)
Ed Warnickecb9cada2015-12-08 15:45:58 -070052{
Dave Barach32dcd3b2019-07-08 12:25:38 -040053 int i;
54 void *oldheap;
Ed Warnickecb9cada2015-12-08 15:45:58 -070055 nbuckets = 1 << (max_log2 (nbuckets));
56
Dave Barachc3799992016-08-15 11:12:27 -040057 h->name = (u8 *) name;
Ed Warnickecb9cada2015-12-08 15:45:58 -070058 h->nbuckets = nbuckets;
59 h->log2_nbuckets = max_log2 (nbuckets);
Dave Barach32dcd3b2019-07-08 12:25:38 -040060 h->memory_size = memory_size;
61 alloc_arena (h) = 0;
Ed Warnickecb9cada2015-12-08 15:45:58 -070062
Dave Barach508498f2018-07-19 12:11:16 -040063 /*
64 * Make sure the requested size is rational. The max table
65 * size without playing the alignment card is 64 Gbytes.
66 * If someone starts complaining that's not enough, we can shift
67 * the offset by CLIB_LOG2_CACHE_LINE_BYTES...
68 */
69 ASSERT (memory_size < (1ULL << BIHASH_BUCKET_OFFSET_BITS));
Vijayabhaskar Katamreddyfb8e61c2017-12-14 13:20:50 -080070 h->fmt_fn = NULL;
Dave Barach32dcd3b2019-07-08 12:25:38 -040071
72 /* Add this hash table to the list */
73 for (i = 0; i < vec_len (clib_all_bihashes); i++)
74 if (clib_all_bihashes[i] == h)
75 return;
76
77 /* Unfortunately, the heap push/pop is required.... */
78 oldheap = clib_all_bihash_set_heap ();
79 vec_add1 (clib_all_bihashes, (void *) h);
80 clib_mem_set_heap (oldheap);
81
82#if BIHASH_INSTANTIATE_IMMEDIATELY
83 BV (clib_bihash_instantiate) (h);
84#endif
Vijayabhaskar Katamreddyfb8e61c2017-12-14 13:20:50 -080085}
86
Dave Barach9466c452018-08-24 17:21:14 -040087#if BIHASH_32_64_SVM
88#if !defined (MFD_ALLOW_SEALING)
89#define MFD_ALLOW_SEALING 0x0002U
90#endif
91
92void BV (clib_bihash_master_init_svm)
Dave Barachffb14b92018-09-11 17:20:23 -040093 (BVT (clib_bihash) * h, char *name, u32 nbuckets, u64 memory_size)
Dave Barach9466c452018-08-24 17:21:14 -040094{
95 uword bucket_size;
96 u8 *mmap_addr;
97 vec_header_t *freelist_vh;
98 int fd;
99
Dave Barachffb14b92018-09-11 17:20:23 -0400100 ASSERT (memory_size < (1ULL << 32));
Dave Barach9466c452018-08-24 17:21:14 -0400101 /* Set up for memfd sharing */
102 if ((fd = memfd_create (name, MFD_ALLOW_SEALING)) == -1)
103 {
104 clib_unix_warning ("memfd_create");
105 return;
106 }
107
108 if (ftruncate (fd, memory_size) < 0)
109 {
110 clib_unix_warning ("ftruncate");
111 return;
112 }
113
114 /* Not mission-critical, complain and continue */
115 if ((fcntl (fd, F_ADD_SEALS, F_SEAL_SHRINK)) == -1)
116 clib_unix_warning ("fcntl (F_ADD_SEALS)");
117
Dave Barachffb14b92018-09-11 17:20:23 -0400118 mmap_addr = mmap (0, memory_size,
119 PROT_READ | PROT_WRITE, MAP_SHARED, fd, 0 /* offset */ );
Dave Barach9466c452018-08-24 17:21:14 -0400120
121 if (mmap_addr == MAP_FAILED)
122 {
123 clib_unix_warning ("mmap failed");
124 ASSERT (0);
125 }
126
127 h->sh = (void *) mmap_addr;
128 h->memfd = fd;
129 nbuckets = 1 << (max_log2 (nbuckets));
130
131 h->name = (u8 *) name;
132 h->sh->nbuckets = h->nbuckets = nbuckets;
133 h->log2_nbuckets = max_log2 (nbuckets);
134
135 alloc_arena (h) = (u64) (uword) mmap_addr;
Dave Barachffb14b92018-09-11 17:20:23 -0400136 alloc_arena_next (h) = CLIB_CACHE_LINE_BYTES;
Dave Barach9466c452018-08-24 17:21:14 -0400137 alloc_arena_size (h) = memory_size;
138
139 bucket_size = nbuckets * sizeof (h->buckets[0]);
140 h->buckets = BV (alloc_aligned) (h, bucket_size);
Dave Barachffb14b92018-09-11 17:20:23 -0400141 h->sh->buckets_as_u64 = (u64) BV (clib_bihash_get_offset) (h, h->buckets);
Dave Barach9466c452018-08-24 17:21:14 -0400142
143 h->alloc_lock = BV (alloc_aligned) (h, CLIB_CACHE_LINE_BYTES);
144 h->alloc_lock[0] = 0;
145
Dave Barachffb14b92018-09-11 17:20:23 -0400146 h->sh->alloc_lock_as_u64 =
147 (u64) BV (clib_bihash_get_offset) (h, (void *) h->alloc_lock);
148 freelist_vh =
149 BV (alloc_aligned) (h,
150 sizeof (vec_header_t) +
151 BIHASH_FREELIST_LENGTH * sizeof (u64));
Dave Barach9466c452018-08-24 17:21:14 -0400152 freelist_vh->len = BIHASH_FREELIST_LENGTH;
153 freelist_vh->dlmalloc_header_offset = 0xDEADBEEF;
Dave Barachffb14b92018-09-11 17:20:23 -0400154 h->sh->freelists_as_u64 =
155 (u64) BV (clib_bihash_get_offset) (h, freelist_vh->vector_data);
156 h->freelists = (void *) (freelist_vh->vector_data);
Dave Barach9466c452018-08-24 17:21:14 -0400157
158 h->fmt_fn = NULL;
159}
160
161void BV (clib_bihash_slave_init_svm)
162 (BVT (clib_bihash) * h, char *name, int fd)
163{
164 u8 *mmap_addr;
Dave Barachffb14b92018-09-11 17:20:23 -0400165 u64 memory_size;
Dave Barach9466c452018-08-24 17:21:14 -0400166 BVT (clib_bihash_shared_header) * sh;
167
Dave Barachffb14b92018-09-11 17:20:23 -0400168 /* Trial mapping, to learn the segment size */
Dave Barach9466c452018-08-24 17:21:14 -0400169 mmap_addr = mmap (0, 4096, PROT_READ, MAP_SHARED, fd, 0 /* offset */ );
170 if (mmap_addr == MAP_FAILED)
171 {
172 clib_unix_warning ("trial mmap failed");
173 ASSERT (0);
174 }
175
176 sh = (BVT (clib_bihash_shared_header) *) mmap_addr;
177
Dave Barach9466c452018-08-24 17:21:14 -0400178 memory_size = sh->alloc_arena_size;
179
180 munmap (mmap_addr, 4096);
181
Dave Barachffb14b92018-09-11 17:20:23 -0400182 /* Actual mapping, at the required size */
183 mmap_addr = mmap (0, memory_size,
184 PROT_READ | PROT_WRITE, MAP_SHARED, fd, 0 /* offset */ );
Dave Barach9466c452018-08-24 17:21:14 -0400185
186 if (mmap_addr == MAP_FAILED)
187 {
188 clib_unix_warning ("mmap failed");
189 ASSERT (0);
190 }
191
192 (void) close (fd);
193
194 h->sh = (void *) mmap_addr;
Dave Barachffb14b92018-09-11 17:20:23 -0400195 alloc_arena (h) = (u64) (uword) mmap_addr;
Dave Barach9466c452018-08-24 17:21:14 -0400196 h->memfd = -1;
197
198 h->name = (u8 *) name;
Dave Barachffb14b92018-09-11 17:20:23 -0400199 h->buckets = BV (clib_bihash_get_value) (h, h->sh->buckets_as_u64);
Dave Barach9466c452018-08-24 17:21:14 -0400200 h->nbuckets = h->sh->nbuckets;
201 h->log2_nbuckets = max_log2 (h->nbuckets);
202
Dave Barachffb14b92018-09-11 17:20:23 -0400203 h->alloc_lock = BV (clib_bihash_get_value) (h, h->sh->alloc_lock_as_u64);
204 h->freelists = BV (clib_bihash_get_value) (h, h->sh->freelists_as_u64);
Dave Barach9466c452018-08-24 17:21:14 -0400205 h->fmt_fn = NULL;
206}
207#endif /* BIHASH_32_64_SVM */
208
Vijayabhaskar Katamreddyfb8e61c2017-12-14 13:20:50 -0800209void BV (clib_bihash_set_kvp_format_fn) (BVT (clib_bihash) * h,
210 format_function_t * fmt_fn)
211{
212 h->fmt_fn = fmt_fn;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700213}
214
Dave Barachc3799992016-08-15 11:12:27 -0400215void BV (clib_bihash_free) (BVT (clib_bihash) * h)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700216{
Dave Barach32dcd3b2019-07-08 12:25:38 -0400217 int i;
218
219 if (PREDICT_FALSE (alloc_arena (h) == 0))
220 goto never_initialized;
221
Dave Barach97f5af02018-02-22 09:48:45 -0500222 vec_free (h->working_copies);
Vijayabhaskar Katamreddy72739a62019-05-07 13:27:32 -0700223 vec_free (h->working_copy_lengths);
Dave Barach9466c452018-08-24 17:21:14 -0400224#if BIHASH_32_64_SVM == 0
Dave Barach97f5af02018-02-22 09:48:45 -0500225 vec_free (h->freelists);
Dave Barach9466c452018-08-24 17:21:14 -0400226#else
227 if (h->memfd > 0)
228 (void) close (h->memfd);
229#endif
230 clib_mem_vm_free ((void *) (uword) (alloc_arena (h)), alloc_arena_size (h));
Dave Barach32dcd3b2019-07-08 12:25:38 -0400231never_initialized:
Dave Barachb7b92992018-10-17 10:38:51 -0400232 clib_memset (h, 0, sizeof (*h));
Dave Barach32dcd3b2019-07-08 12:25:38 -0400233 for (i = 0; i < vec_len (clib_all_bihashes); i++)
234 {
235 if ((void *) h == clib_all_bihashes[i])
236 {
237 vec_delete (clib_all_bihashes, 1, i);
238 return;
239 }
240 }
241 clib_warning ("Couldn't find hash table %llx on clib_all_bihashes...",
242 (u64) h);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700243}
244
Dave Barachc3799992016-08-15 11:12:27 -0400245static
246BVT (clib_bihash_value) *
247BV (value_alloc) (BVT (clib_bihash) * h, u32 log2_pages)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700248{
Dave Barachc3799992016-08-15 11:12:27 -0400249 BVT (clib_bihash_value) * rv = 0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700250
Dave Barach508498f2018-07-19 12:11:16 -0400251 ASSERT (h->alloc_lock[0]);
Dave Barach9466c452018-08-24 17:21:14 -0400252
253#if BIHASH_32_64_SVM
254 ASSERT (log2_pages < vec_len (h->freelists));
255#endif
256
Dave Barachc3799992016-08-15 11:12:27 -0400257 if (log2_pages >= vec_len (h->freelists) || h->freelists[log2_pages] == 0)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700258 {
Dave Barach97f5af02018-02-22 09:48:45 -0500259 vec_validate_init_empty (h->freelists, log2_pages, 0);
260 rv = BV (alloc_aligned) (h, (sizeof (*rv) * (1 << log2_pages)));
Dave Barachc3799992016-08-15 11:12:27 -0400261 goto initialize;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700262 }
Dave Barachffb14b92018-09-11 17:20:23 -0400263 rv = BV (clib_bihash_get_value) (h, (uword) h->freelists[log2_pages]);
Dave Barach9466c452018-08-24 17:21:14 -0400264 h->freelists[log2_pages] = rv->next_free_as_u64;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700265
Dave Barachc3799992016-08-15 11:12:27 -0400266initialize:
267 ASSERT (rv);
Dave Barachc3799992016-08-15 11:12:27 -0400268 /*
269 * Latest gcc complains that the length arg is zero
270 * if we replace (1<<log2_pages) with vec_len(rv).
271 * No clue.
272 */
Dave Barachb7b92992018-10-17 10:38:51 -0400273 clib_memset (rv, 0xff, sizeof (*rv) * (1 << log2_pages));
Dave Barachc3799992016-08-15 11:12:27 -0400274 return rv;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700275}
276
277static void
Dave Barachba7ddfe2017-05-17 20:20:50 -0400278BV (value_free) (BVT (clib_bihash) * h, BVT (clib_bihash_value) * v,
279 u32 log2_pages)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700280{
Dave Barach508498f2018-07-19 12:11:16 -0400281 ASSERT (h->alloc_lock[0]);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700282
Dave Barachc3799992016-08-15 11:12:27 -0400283 ASSERT (vec_len (h->freelists) > log2_pages);
284
Dave Barach508498f2018-07-19 12:11:16 -0400285 if (CLIB_DEBUG > 0)
Dave Barachb7b92992018-10-17 10:38:51 -0400286 clib_memset (v, 0xFE, sizeof (*v) * (1 << log2_pages));
Dave Barach508498f2018-07-19 12:11:16 -0400287
Dave Barach9466c452018-08-24 17:21:14 -0400288 v->next_free_as_u64 = (u64) h->freelists[log2_pages];
Dave Barachffb14b92018-09-11 17:20:23 -0400289 h->freelists[log2_pages] = (u64) BV (clib_bihash_get_offset) (h, v);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700290}
291
292static inline void
Dave Barach908a5ea2017-07-14 12:42:21 -0400293BV (make_working_copy) (BVT (clib_bihash) * h, BVT (clib_bihash_bucket) * b)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700294{
Dave Barachc3799992016-08-15 11:12:27 -0400295 BVT (clib_bihash_value) * v;
Dave Barach908a5ea2017-07-14 12:42:21 -0400296 BVT (clib_bihash_bucket) working_bucket __attribute__ ((aligned (8)));
Dave Barachc3799992016-08-15 11:12:27 -0400297 BVT (clib_bihash_value) * working_copy;
Damjan Marionf55f9b82017-05-10 21:06:28 +0200298 u32 thread_index = os_get_thread_index ();
Dave Barachba7ddfe2017-05-17 20:20:50 -0400299 int log2_working_copy_length;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700300
Dave Barach508498f2018-07-19 12:11:16 -0400301 ASSERT (h->alloc_lock[0]);
302
Damjan Marionf55f9b82017-05-10 21:06:28 +0200303 if (thread_index >= vec_len (h->working_copies))
Ed Warnickecb9cada2015-12-08 15:45:58 -0700304 {
Damjan Marionf55f9b82017-05-10 21:06:28 +0200305 vec_validate (h->working_copies, thread_index);
Steve Shin871cdec2017-06-02 10:09:02 -0700306 vec_validate_init_empty (h->working_copy_lengths, thread_index, ~0);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700307 }
308
Dave Barachc3799992016-08-15 11:12:27 -0400309 /*
Ed Warnickecb9cada2015-12-08 15:45:58 -0700310 * working_copies are per-cpu so that near-simultaneous
311 * updates from multiple threads will not result in sporadic, spurious
Dave Barachc3799992016-08-15 11:12:27 -0400312 * lookup failures.
Ed Warnickecb9cada2015-12-08 15:45:58 -0700313 */
Damjan Marionf55f9b82017-05-10 21:06:28 +0200314 working_copy = h->working_copies[thread_index];
Dave Barachba7ddfe2017-05-17 20:20:50 -0400315 log2_working_copy_length = h->working_copy_lengths[thread_index];
Ed Warnickecb9cada2015-12-08 15:45:58 -0700316
317 h->saved_bucket.as_u64 = b->as_u64;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700318
Dave Barachba7ddfe2017-05-17 20:20:50 -0400319 if (b->log2_pages > log2_working_copy_length)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700320 {
Dave Barach97f5af02018-02-22 09:48:45 -0500321 /*
322 * It's not worth the bookkeeping to free working copies
323 * if (working_copy)
324 * clib_mem_free (working_copy);
325 */
326 working_copy = BV (alloc_aligned)
327 (h, sizeof (working_copy[0]) * (1 << b->log2_pages));
Dave Barachba7ddfe2017-05-17 20:20:50 -0400328 h->working_copy_lengths[thread_index] = b->log2_pages;
Damjan Marionf55f9b82017-05-10 21:06:28 +0200329 h->working_copies[thread_index] = working_copy;
Dave Barach2ce28d62019-05-03 12:58:01 -0400330
331 BV (clib_bihash_increment_stat) (h, BIHASH_STAT_working_copy_lost,
332 1ULL << b->log2_pages);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700333 }
334
Dave Barachc3799992016-08-15 11:12:27 -0400335 v = BV (clib_bihash_get_value) (h, b->offset);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700336
Dave Barach178cf492018-11-13 16:34:13 -0500337 clib_memcpy_fast (working_copy, v, sizeof (*v) * (1 << b->log2_pages));
Ed Warnickecb9cada2015-12-08 15:45:58 -0700338 working_bucket.as_u64 = b->as_u64;
Dave Barachc3799992016-08-15 11:12:27 -0400339 working_bucket.offset = BV (clib_bihash_get_offset) (h, working_copy);
340 CLIB_MEMORY_BARRIER ();
Ed Warnickecb9cada2015-12-08 15:45:58 -0700341 b->as_u64 = working_bucket.as_u64;
Damjan Marionf55f9b82017-05-10 21:06:28 +0200342 h->working_copies[thread_index] = working_copy;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700343}
344
Dave Barachc3799992016-08-15 11:12:27 -0400345static
346BVT (clib_bihash_value) *
347BV (split_and_rehash)
348 (BVT (clib_bihash) * h,
Dave Barachba7ddfe2017-05-17 20:20:50 -0400349 BVT (clib_bihash_value) * old_values, u32 old_log2_pages,
350 u32 new_log2_pages)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700351{
Dave Barach5e6b9582016-12-12 15:37:29 -0500352 BVT (clib_bihash_value) * new_values, *new_v;
Dave Barachba7ddfe2017-05-17 20:20:50 -0400353 int i, j, length_in_kvs;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700354
Dave Barach508498f2018-07-19 12:11:16 -0400355 ASSERT (h->alloc_lock[0]);
356
Dave Barachc3799992016-08-15 11:12:27 -0400357 new_values = BV (value_alloc) (h, new_log2_pages);
Dave Barachba7ddfe2017-05-17 20:20:50 -0400358 length_in_kvs = (1 << old_log2_pages) * BIHASH_KVP_PER_PAGE;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700359
Dave Barachba7ddfe2017-05-17 20:20:50 -0400360 for (i = 0; i < length_in_kvs; i++)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700361 {
362 u64 new_hash;
Dave Barachc3799992016-08-15 11:12:27 -0400363
Dave Barach5e6b9582016-12-12 15:37:29 -0500364 /* Entry not in use? Forget it */
365 if (BV (clib_bihash_is_free) (&(old_values->kvp[i])))
366 continue;
367
368 /* rehash the item onto its new home-page */
369 new_hash = BV (clib_bihash_hash) (&(old_values->kvp[i]));
370 new_hash >>= h->log2_nbuckets;
371 new_hash &= (1 << new_log2_pages) - 1;
372 new_v = &new_values[new_hash];
373
374 /* Across the new home-page */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700375 for (j = 0; j < BIHASH_KVP_PER_PAGE; j++)
Dave Barachc3799992016-08-15 11:12:27 -0400376 {
Dave Barach5e6b9582016-12-12 15:37:29 -0500377 /* Empty slot */
378 if (BV (clib_bihash_is_free) (&(new_v->kvp[j])))
Dave Barachc3799992016-08-15 11:12:27 -0400379 {
Dave Barach178cf492018-11-13 16:34:13 -0500380 clib_memcpy_fast (&(new_v->kvp[j]), &(old_values->kvp[i]),
381 sizeof (new_v->kvp[j]));
Dave Barach5e6b9582016-12-12 15:37:29 -0500382 goto doublebreak;
Dave Barachc3799992016-08-15 11:12:27 -0400383 }
Dave Barachc3799992016-08-15 11:12:27 -0400384 }
Dave Barach5e6b9582016-12-12 15:37:29 -0500385 /* Crap. Tell caller to try again */
Dave Barachba7ddfe2017-05-17 20:20:50 -0400386 BV (value_free) (h, new_values, new_log2_pages);
Dave Barach5e6b9582016-12-12 15:37:29 -0500387 return 0;
388 doublebreak:;
389 }
Dave Barachba7ddfe2017-05-17 20:20:50 -0400390
Dave Barach5e6b9582016-12-12 15:37:29 -0500391 return new_values;
392}
393
394static
395BVT (clib_bihash_value) *
396BV (split_and_rehash_linear)
397 (BVT (clib_bihash) * h,
Dave Barachba7ddfe2017-05-17 20:20:50 -0400398 BVT (clib_bihash_value) * old_values, u32 old_log2_pages,
399 u32 new_log2_pages)
Dave Barach5e6b9582016-12-12 15:37:29 -0500400{
401 BVT (clib_bihash_value) * new_values;
Dave Barachba7ddfe2017-05-17 20:20:50 -0400402 int i, j, new_length, old_length;
Dave Barach5e6b9582016-12-12 15:37:29 -0500403
Dave Barach508498f2018-07-19 12:11:16 -0400404 ASSERT (h->alloc_lock[0]);
405
Dave Barach5e6b9582016-12-12 15:37:29 -0500406 new_values = BV (value_alloc) (h, new_log2_pages);
407 new_length = (1 << new_log2_pages) * BIHASH_KVP_PER_PAGE;
Dave Barachba7ddfe2017-05-17 20:20:50 -0400408 old_length = (1 << old_log2_pages) * BIHASH_KVP_PER_PAGE;
Dave Barach5e6b9582016-12-12 15:37:29 -0500409
410 j = 0;
411 /* Across the old value array */
Dave Barachba7ddfe2017-05-17 20:20:50 -0400412 for (i = 0; i < old_length; i++)
Dave Barach5e6b9582016-12-12 15:37:29 -0500413 {
414 /* Find a free slot in the new linear scan bucket */
415 for (; j < new_length; j++)
416 {
Dave Barach8f544962017-01-18 10:23:22 -0500417 /* Old value not in use? Forget it. */
Dave Barach5e6b9582016-12-12 15:37:29 -0500418 if (BV (clib_bihash_is_free) (&(old_values->kvp[i])))
419 goto doublebreak;
420
421 /* New value should never be in use */
422 if (BV (clib_bihash_is_free) (&(new_values->kvp[j])))
423 {
424 /* Copy the old value and move along */
Dave Barach178cf492018-11-13 16:34:13 -0500425 clib_memcpy_fast (&(new_values->kvp[j]), &(old_values->kvp[i]),
426 sizeof (new_values->kvp[j]));
Dave Barach5e6b9582016-12-12 15:37:29 -0500427 j++;
428 goto doublebreak;
429 }
Dave Barach5e6b9582016-12-12 15:37:29 -0500430 }
Dave Barach8f544962017-01-18 10:23:22 -0500431 /* This should never happen... */
432 clib_warning ("BUG: linear rehash failed!");
Dave Barachba7ddfe2017-05-17 20:20:50 -0400433 BV (value_free) (h, new_values, new_log2_pages);
Dave Barach8f544962017-01-18 10:23:22 -0500434 return 0;
435
Dave Barach5e6b9582016-12-12 15:37:29 -0500436 doublebreak:;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700437 }
438 return new_values;
439}
440
Matus Fabian828d27e2018-08-21 03:15:50 -0700441static inline int BV (clib_bihash_add_del_inline)
442 (BVT (clib_bihash) * h, BVT (clib_bihash_kv) * add_v, int is_add,
443 int (*is_stale_cb) (BVT (clib_bihash_kv) *, void *), void *arg)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700444{
445 u32 bucket_index;
Dave Barach908a5ea2017-07-14 12:42:21 -0400446 BVT (clib_bihash_bucket) * b, tmp_b;
Dave Barachc3799992016-08-15 11:12:27 -0400447 BVT (clib_bihash_value) * v, *new_v, *save_new_v, *working_copy;
Dave Barach5e6b9582016-12-12 15:37:29 -0500448 int i, limit;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700449 u64 hash, new_hash;
Dave Barachba7ddfe2017-05-17 20:20:50 -0400450 u32 new_log2_pages, old_log2_pages;
Damjan Marionf55f9b82017-05-10 21:06:28 +0200451 u32 thread_index = os_get_thread_index ();
Dave Barach5e6b9582016-12-12 15:37:29 -0500452 int mark_bucket_linear;
453 int resplit_once;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700454
Dave Barach32dcd3b2019-07-08 12:25:38 -0400455 /* Create the table (is_add=1), or flunk the request now (is_add=0) */
456 if (PREDICT_FALSE (alloc_arena (h) == 0))
457 {
458 if (is_add == 0)
459 return (-1);
460 BV (clib_bihash_instantiate) (h);
461 }
462
Dave Barachc3799992016-08-15 11:12:27 -0400463 hash = BV (clib_bihash_hash) (add_v);
464
465 bucket_index = hash & (h->nbuckets - 1);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700466 b = &h->buckets[bucket_index];
467
468 hash >>= h->log2_nbuckets;
469
Dave Barach508498f2018-07-19 12:11:16 -0400470 BV (clib_bihash_lock_bucket) (b);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700471
472 /* First elt in the bucket? */
Damjan Marion882fcfe2018-07-17 23:01:49 +0200473 if (BV (clib_bihash_bucket_is_empty) (b))
Ed Warnickecb9cada2015-12-08 15:45:58 -0700474 {
475 if (is_add == 0)
Dave Barachc3799992016-08-15 11:12:27 -0400476 {
Dave Barach508498f2018-07-19 12:11:16 -0400477 BV (clib_bihash_unlock_bucket) (b);
478 return (-1);
Dave Barachc3799992016-08-15 11:12:27 -0400479 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700480
Dave Barach508498f2018-07-19 12:11:16 -0400481 BV (clib_bihash_alloc_lock) (h);
Dave Barachc3799992016-08-15 11:12:27 -0400482 v = BV (value_alloc) (h, 0);
Dave Barach508498f2018-07-19 12:11:16 -0400483 BV (clib_bihash_alloc_unlock) (h);
Dave Barachba7ddfe2017-05-17 20:20:50 -0400484
Dave Barachc3799992016-08-15 11:12:27 -0400485 *v->kvp = *add_v;
Dave Barach508498f2018-07-19 12:11:16 -0400486 tmp_b.as_u64 = 0; /* clears bucket lock */
Dave Barachc3799992016-08-15 11:12:27 -0400487 tmp_b.offset = BV (clib_bihash_get_offset) (h, v);
Dave Barache7d212f2018-02-07 13:14:06 -0500488 tmp_b.refcnt = 1;
Dave Barach508498f2018-07-19 12:11:16 -0400489 CLIB_MEMORY_BARRIER ();
Ed Warnickecb9cada2015-12-08 15:45:58 -0700490
Tom Seidenberg97f8ae92019-03-15 10:15:26 -0400491 b->as_u64 = tmp_b.as_u64; /* unlocks the bucket */
Dave Barach2ce28d62019-05-03 12:58:01 -0400492 BV (clib_bihash_increment_stat) (h, BIHASH_STAT_alloc_add, 1);
493
Dave Barach508498f2018-07-19 12:11:16 -0400494 return (0);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700495 }
496
Dave Barach508498f2018-07-19 12:11:16 -0400497 /* WARNING: we're still looking at the live copy... */
Dave Barach5e6b9582016-12-12 15:37:29 -0500498 limit = BIHASH_KVP_PER_PAGE;
Dave Barach508498f2018-07-19 12:11:16 -0400499 v = BV (clib_bihash_get_value) (h, b->offset);
500
Dave Barach5e6b9582016-12-12 15:37:29 -0500501 v += (b->linear_search == 0) ? hash & ((1 << b->log2_pages) - 1) : 0;
502 if (b->linear_search)
503 limit <<= b->log2_pages;
Dave Barachc3799992016-08-15 11:12:27 -0400504
Ed Warnickecb9cada2015-12-08 15:45:58 -0700505 if (is_add)
506 {
Dave Barachc3799992016-08-15 11:12:27 -0400507 /*
Dave Barach508498f2018-07-19 12:11:16 -0400508 * Because reader threads are looking at live data,
509 * we have to be extra careful. Readers do NOT hold the
510 * bucket lock. We need to be SLOWER than a search, past the
511 * point where readers CHECK the bucket lock.
512 */
513
514 /*
Ed Warnickecb9cada2015-12-08 15:45:58 -0700515 * For obvious (in hindsight) reasons, see if we're supposed to
516 * replace an existing key, then look for an empty slot.
517 */
Dave Barach5e6b9582016-12-12 15:37:29 -0500518 for (i = 0; i < limit; i++)
Dave Barachc3799992016-08-15 11:12:27 -0400519 {
Dave Baracha11bf452019-04-17 17:27:31 -0400520 if (BV (clib_bihash_key_compare) (v->kvp[i].key, add_v->key))
Dave Barachc3799992016-08-15 11:12:27 -0400521 {
Dave Barach508498f2018-07-19 12:11:16 -0400522 CLIB_MEMORY_BARRIER (); /* Add a delay */
Dave Barach178cf492018-11-13 16:34:13 -0500523 clib_memcpy_fast (&(v->kvp[i]), add_v, sizeof (*add_v));
Dave Barach508498f2018-07-19 12:11:16 -0400524 BV (clib_bihash_unlock_bucket) (b);
Dave Barach2ce28d62019-05-03 12:58:01 -0400525 BV (clib_bihash_increment_stat) (h, BIHASH_STAT_replace, 1);
Dave Barach508498f2018-07-19 12:11:16 -0400526 return (0);
Dave Barachc3799992016-08-15 11:12:27 -0400527 }
528 }
Dave Barach508498f2018-07-19 12:11:16 -0400529 /*
530 * Look for an empty slot. If found, use it
531 */
Dave Barach5e6b9582016-12-12 15:37:29 -0500532 for (i = 0; i < limit; i++)
Dave Barachc3799992016-08-15 11:12:27 -0400533 {
534 if (BV (clib_bihash_is_free) (&(v->kvp[i])))
535 {
Dave Barach508498f2018-07-19 12:11:16 -0400536 /*
537 * Copy the value first, so that if a reader manages
538 * to match the new key, the value will be right...
539 */
Dave Barach178cf492018-11-13 16:34:13 -0500540 clib_memcpy_fast (&(v->kvp[i].value),
541 &add_v->value, sizeof (add_v->value));
Dave Barach508498f2018-07-19 12:11:16 -0400542 CLIB_MEMORY_BARRIER (); /* Make sure the value has settled */
Dave Barach178cf492018-11-13 16:34:13 -0500543 clib_memcpy_fast (&(v->kvp[i]), &add_v->key,
544 sizeof (add_v->key));
Dave Barache7d212f2018-02-07 13:14:06 -0500545 b->refcnt++;
Dave Barach9466c452018-08-24 17:21:14 -0400546 ASSERT (b->refcnt > 0);
Dave Barach508498f2018-07-19 12:11:16 -0400547 BV (clib_bihash_unlock_bucket) (b);
Dave Barach2ce28d62019-05-03 12:58:01 -0400548 BV (clib_bihash_increment_stat) (h, BIHASH_STAT_add, 1);
Dave Barach508498f2018-07-19 12:11:16 -0400549 return (0);
Dave Barachc3799992016-08-15 11:12:27 -0400550 }
551 }
Matus Fabian828d27e2018-08-21 03:15:50 -0700552 /* look for stale data to overwrite */
553 if (is_stale_cb)
554 {
555 for (i = 0; i < limit; i++)
556 {
557 if (is_stale_cb (&(v->kvp[i]), arg))
558 {
559 CLIB_MEMORY_BARRIER ();
Dave Barach178cf492018-11-13 16:34:13 -0500560 clib_memcpy_fast (&(v->kvp[i]), add_v, sizeof (*add_v));
Matus Fabian828d27e2018-08-21 03:15:50 -0700561 BV (clib_bihash_unlock_bucket) (b);
Dave Barach2ce28d62019-05-03 12:58:01 -0400562 BV (clib_bihash_increment_stat) (h, BIHASH_STAT_replace, 1);
Matus Fabian828d27e2018-08-21 03:15:50 -0700563 return (0);
564 }
565 }
566 }
Dave Barach508498f2018-07-19 12:11:16 -0400567 /* Out of space in this bucket, split the bucket... */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700568 }
Dave Barach508498f2018-07-19 12:11:16 -0400569 else /* delete case */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700570 {
Dave Barach5e6b9582016-12-12 15:37:29 -0500571 for (i = 0; i < limit; i++)
Dave Barachc3799992016-08-15 11:12:27 -0400572 {
Dave Barach508498f2018-07-19 12:11:16 -0400573 /* Found the key? Kill it... */
Dave Baracha11bf452019-04-17 17:27:31 -0400574 if (BV (clib_bihash_key_compare) (v->kvp[i].key, add_v->key))
Dave Barachc3799992016-08-15 11:12:27 -0400575 {
Dave Barachb7b92992018-10-17 10:38:51 -0400576 clib_memset (&(v->kvp[i]), 0xff, sizeof (*(add_v)));
Dave Barach508498f2018-07-19 12:11:16 -0400577 /* Is the bucket empty? */
578 if (PREDICT_TRUE (b->refcnt > 1))
Dave Barache7d212f2018-02-07 13:14:06 -0500579 {
Dave Barach508498f2018-07-19 12:11:16 -0400580 b->refcnt--;
581 BV (clib_bihash_unlock_bucket) (b);
Dave Barach2ce28d62019-05-03 12:58:01 -0400582 BV (clib_bihash_increment_stat) (h, BIHASH_STAT_del, 1);
Dave Barach508498f2018-07-19 12:11:16 -0400583 return (0);
Dave Barache7d212f2018-02-07 13:14:06 -0500584 }
Dave Barach508498f2018-07-19 12:11:16 -0400585 else /* yes, free it */
Dave Barache7d212f2018-02-07 13:14:06 -0500586 {
Dave Barach508498f2018-07-19 12:11:16 -0400587 /* Save old bucket value, need log2_pages to free it */
588 tmp_b.as_u64 = b->as_u64;
589 CLIB_MEMORY_BARRIER ();
590
591 /* Kill and unlock the bucket */
592 b->as_u64 = 0;
593
594 /* And free the backing storage */
595 BV (clib_bihash_alloc_lock) (h);
596 /* Note: v currently points into the middle of the bucket */
597 v = BV (clib_bihash_get_value) (h, tmp_b.offset);
598 BV (value_free) (h, v, tmp_b.log2_pages);
599 BV (clib_bihash_alloc_unlock) (h);
Dave Barach2ce28d62019-05-03 12:58:01 -0400600 BV (clib_bihash_increment_stat) (h, BIHASH_STAT_del_free,
601 1);
Dave Barach508498f2018-07-19 12:11:16 -0400602 return (0);
Dave Barache7d212f2018-02-07 13:14:06 -0500603 }
Dave Barachc3799992016-08-15 11:12:27 -0400604 }
605 }
Dave Barach508498f2018-07-19 12:11:16 -0400606 /* Not found... */
607 BV (clib_bihash_unlock_bucket) (b);
608 return (-3);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700609 }
610
Dave Barach508498f2018-07-19 12:11:16 -0400611 /* Move readers to a (locked) temp copy of the bucket */
612 BV (clib_bihash_alloc_lock) (h);
613 BV (make_working_copy) (h, b);
614
615 v = BV (clib_bihash_get_value) (h, h->saved_bucket.offset);
616
Dave Barachba7ddfe2017-05-17 20:20:50 -0400617 old_log2_pages = h->saved_bucket.log2_pages;
618 new_log2_pages = old_log2_pages + 1;
Dave Barach5e6b9582016-12-12 15:37:29 -0500619 mark_bucket_linear = 0;
Dave Barach2ce28d62019-05-03 12:58:01 -0400620 BV (clib_bihash_increment_stat) (h, BIHASH_STAT_split_add, 1);
621 BV (clib_bihash_increment_stat) (h, BIHASH_STAT_splits, old_log2_pages);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700622
Damjan Marionf55f9b82017-05-10 21:06:28 +0200623 working_copy = h->working_copies[thread_index];
Dave Barach5e6b9582016-12-12 15:37:29 -0500624 resplit_once = 0;
Dave Barach2ce28d62019-05-03 12:58:01 -0400625 BV (clib_bihash_increment_stat) (h, BIHASH_STAT_splits, 1);
Dave Barach5e6b9582016-12-12 15:37:29 -0500626
Dave Barachba7ddfe2017-05-17 20:20:50 -0400627 new_v = BV (split_and_rehash) (h, working_copy, old_log2_pages,
628 new_log2_pages);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700629 if (new_v == 0)
630 {
Dave Barach5e6b9582016-12-12 15:37:29 -0500631 try_resplit:
632 resplit_once = 1;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700633 new_log2_pages++;
Dave Barach5e6b9582016-12-12 15:37:29 -0500634 /* Try re-splitting. If that fails, fall back to linear search */
Dave Barachba7ddfe2017-05-17 20:20:50 -0400635 new_v = BV (split_and_rehash) (h, working_copy, old_log2_pages,
636 new_log2_pages);
Dave Barach5e6b9582016-12-12 15:37:29 -0500637 if (new_v == 0)
638 {
639 mark_linear:
640 new_log2_pages--;
641 /* pinned collisions, use linear search */
642 new_v =
Dave Barachba7ddfe2017-05-17 20:20:50 -0400643 BV (split_and_rehash_linear) (h, working_copy, old_log2_pages,
644 new_log2_pages);
Dave Barach5e6b9582016-12-12 15:37:29 -0500645 mark_bucket_linear = 1;
Dave Barach2ce28d62019-05-03 12:58:01 -0400646 BV (clib_bihash_increment_stat) (h, BIHASH_STAT_linear, 1);
Dave Barach5e6b9582016-12-12 15:37:29 -0500647 }
Dave Barach2ce28d62019-05-03 12:58:01 -0400648 BV (clib_bihash_increment_stat) (h, BIHASH_STAT_resplit, 1);
649 BV (clib_bihash_increment_stat) (h, BIHASH_STAT_splits,
650 old_log2_pages + 1);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700651 }
652
653 /* Try to add the new entry */
654 save_new_v = new_v;
Dave Barachc3799992016-08-15 11:12:27 -0400655 new_hash = BV (clib_bihash_hash) (add_v);
Dave Barach5e6b9582016-12-12 15:37:29 -0500656 limit = BIHASH_KVP_PER_PAGE;
657 if (mark_bucket_linear)
658 limit <<= new_log2_pages;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700659 new_hash >>= h->log2_nbuckets;
Dave Barach5e6b9582016-12-12 15:37:29 -0500660 new_hash &= (1 << new_log2_pages) - 1;
661 new_v += mark_bucket_linear ? 0 : new_hash;
Dave Barachc3799992016-08-15 11:12:27 -0400662
Dave Barach5e6b9582016-12-12 15:37:29 -0500663 for (i = 0; i < limit; i++)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700664 {
Dave Barachc3799992016-08-15 11:12:27 -0400665 if (BV (clib_bihash_is_free) (&(new_v->kvp[i])))
666 {
Dave Barach178cf492018-11-13 16:34:13 -0500667 clib_memcpy_fast (&(new_v->kvp[i]), add_v, sizeof (*add_v));
Dave Barachc3799992016-08-15 11:12:27 -0400668 goto expand_ok;
669 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700670 }
Dave Barachba7ddfe2017-05-17 20:20:50 -0400671
Ed Warnickecb9cada2015-12-08 15:45:58 -0700672 /* Crap. Try again */
Dave Barachba7ddfe2017-05-17 20:20:50 -0400673 BV (value_free) (h, save_new_v, new_log2_pages);
Dave Barach5e6b9582016-12-12 15:37:29 -0500674 /*
675 * If we've already doubled the size of the bucket once,
676 * fall back to linear search now.
677 */
678 if (resplit_once)
679 goto mark_linear;
680 else
681 goto try_resplit;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700682
Dave Barachc3799992016-08-15 11:12:27 -0400683expand_ok:
Dave Barach5e6b9582016-12-12 15:37:29 -0500684 tmp_b.log2_pages = new_log2_pages;
Dave Barachc3799992016-08-15 11:12:27 -0400685 tmp_b.offset = BV (clib_bihash_get_offset) (h, save_new_v);
Dave Barach5e6b9582016-12-12 15:37:29 -0500686 tmp_b.linear_search = mark_bucket_linear;
Dave Barache7d212f2018-02-07 13:14:06 -0500687 tmp_b.refcnt = h->saved_bucket.refcnt + 1;
Dave Barach9466c452018-08-24 17:21:14 -0400688 ASSERT (tmp_b.refcnt > 0);
Dave Barach508498f2018-07-19 12:11:16 -0400689 tmp_b.lock = 0;
Dave Barachc3799992016-08-15 11:12:27 -0400690 CLIB_MEMORY_BARRIER ();
Ed Warnickecb9cada2015-12-08 15:45:58 -0700691 b->as_u64 = tmp_b.as_u64;
Andrew Yourtchenkodf32bc42018-09-20 15:36:51 +0200692 /* free the old bucket */
693 v = BV (clib_bihash_get_value) (h, h->saved_bucket.offset);
694 BV (value_free) (h, v, h->saved_bucket.log2_pages);
Dave Barach508498f2018-07-19 12:11:16 -0400695 BV (clib_bihash_alloc_unlock) (h);
696 return (0);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700697}
698
Matus Fabian828d27e2018-08-21 03:15:50 -0700699int BV (clib_bihash_add_del)
700 (BVT (clib_bihash) * h, BVT (clib_bihash_kv) * add_v, int is_add)
701{
702 return BV (clib_bihash_add_del_inline) (h, add_v, is_add, 0, 0);
703}
704
705int BV (clib_bihash_add_or_overwrite_stale)
706 (BVT (clib_bihash) * h, BVT (clib_bihash_kv) * add_v,
707 int (*stale_callback) (BVT (clib_bihash_kv) *, void *), void *arg)
708{
709 return BV (clib_bihash_add_del_inline) (h, add_v, 1, stale_callback, arg);
710}
711
Dave Barachc3799992016-08-15 11:12:27 -0400712int BV (clib_bihash_search)
Dave Barach908a5ea2017-07-14 12:42:21 -0400713 (BVT (clib_bihash) * h,
Dave Barachc3799992016-08-15 11:12:27 -0400714 BVT (clib_bihash_kv) * search_key, BVT (clib_bihash_kv) * valuep)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700715{
716 u64 hash;
717 u32 bucket_index;
Dave Barachc3799992016-08-15 11:12:27 -0400718 BVT (clib_bihash_value) * v;
Dave Barach908a5ea2017-07-14 12:42:21 -0400719 BVT (clib_bihash_bucket) * b;
Dave Barach5e6b9582016-12-12 15:37:29 -0500720 int i, limit;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700721
Dave Barachc3799992016-08-15 11:12:27 -0400722 ASSERT (valuep);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700723
Dave Barach32dcd3b2019-07-08 12:25:38 -0400724 if (PREDICT_FALSE (alloc_arena (h) == 0))
725 return -1;
726
Dave Barachc3799992016-08-15 11:12:27 -0400727 hash = BV (clib_bihash_hash) (search_key);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700728
Dave Barachc3799992016-08-15 11:12:27 -0400729 bucket_index = hash & (h->nbuckets - 1);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700730 b = &h->buckets[bucket_index];
731
Damjan Marion882fcfe2018-07-17 23:01:49 +0200732 if (BV (clib_bihash_bucket_is_empty) (b))
Ed Warnickecb9cada2015-12-08 15:45:58 -0700733 return -1;
734
Dave Barach508498f2018-07-19 12:11:16 -0400735 if (PREDICT_FALSE (b->lock))
Dave Barach908a5ea2017-07-14 12:42:21 -0400736 {
Dave Barach508498f2018-07-19 12:11:16 -0400737 volatile BVT (clib_bihash_bucket) * bv = b;
738 while (bv->lock)
Damjan Marion2a03efe2018-07-20 21:48:59 +0200739 CLIB_PAUSE ();
Dave Barach908a5ea2017-07-14 12:42:21 -0400740 }
741
Ed Warnickecb9cada2015-12-08 15:45:58 -0700742 hash >>= h->log2_nbuckets;
743
Dave Barachc3799992016-08-15 11:12:27 -0400744 v = BV (clib_bihash_get_value) (h, b->offset);
Dave Barach5e6b9582016-12-12 15:37:29 -0500745 limit = BIHASH_KVP_PER_PAGE;
746 v += (b->linear_search == 0) ? hash & ((1 << b->log2_pages) - 1) : 0;
747 if (PREDICT_FALSE (b->linear_search))
748 limit <<= b->log2_pages;
Dave Barachc3799992016-08-15 11:12:27 -0400749
Dave Barach5e6b9582016-12-12 15:37:29 -0500750 for (i = 0; i < limit; i++)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700751 {
Dave Barachc3799992016-08-15 11:12:27 -0400752 if (BV (clib_bihash_key_compare) (v->kvp[i].key, search_key->key))
753 {
754 *valuep = v->kvp[i];
755 return 0;
756 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700757 }
758 return -1;
759}
760
Dave Barachc3799992016-08-15 11:12:27 -0400761u8 *BV (format_bihash) (u8 * s, va_list * args)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700762{
Dave Barachc3799992016-08-15 11:12:27 -0400763 BVT (clib_bihash) * h = va_arg (*args, BVT (clib_bihash) *);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700764 int verbose = va_arg (*args, int);
Dave Barach908a5ea2017-07-14 12:42:21 -0400765 BVT (clib_bihash_bucket) * b;
Dave Barachc3799992016-08-15 11:12:27 -0400766 BVT (clib_bihash_value) * v;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700767 int i, j, k;
768 u64 active_elements = 0;
Dave Barache7d212f2018-02-07 13:14:06 -0500769 u64 active_buckets = 0;
770 u64 linear_buckets = 0;
Dave Barach97f5af02018-02-22 09:48:45 -0500771 u64 used_bytes;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700772
773 s = format (s, "Hash table %s\n", h->name ? h->name : (u8 *) "(unnamed)");
Dave Barachc3799992016-08-15 11:12:27 -0400774
Dave Barach32dcd3b2019-07-08 12:25:38 -0400775 if (PREDICT_FALSE (alloc_arena (h) == 0))
776 return format (s, "[empty, uninitialized]");
777
Ed Warnickecb9cada2015-12-08 15:45:58 -0700778 for (i = 0; i < h->nbuckets; i++)
779 {
Dave Barachc3799992016-08-15 11:12:27 -0400780 b = &h->buckets[i];
Damjan Marion882fcfe2018-07-17 23:01:49 +0200781 if (BV (clib_bihash_bucket_is_empty) (b))
Dave Barachc3799992016-08-15 11:12:27 -0400782 {
783 if (verbose > 1)
784 s = format (s, "[%d]: empty\n", i);
785 continue;
786 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700787
Dave Barache7d212f2018-02-07 13:14:06 -0500788 active_buckets++;
789
790 if (b->linear_search)
791 linear_buckets++;
792
Ed Warnickecb9cada2015-12-08 15:45:58 -0700793 if (verbose)
Dave Barachc3799992016-08-15 11:12:27 -0400794 {
Dave Barach9466c452018-08-24 17:21:14 -0400795 s = format (s, "[%d]: heap offset %lld, len %d, linear %d\n", i,
Dave Barach5e6b9582016-12-12 15:37:29 -0500796 b->offset, (1 << b->log2_pages), b->linear_search);
Dave Barachc3799992016-08-15 11:12:27 -0400797 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700798
Dave Barachc3799992016-08-15 11:12:27 -0400799 v = BV (clib_bihash_get_value) (h, b->offset);
800 for (j = 0; j < (1 << b->log2_pages); j++)
801 {
802 for (k = 0; k < BIHASH_KVP_PER_PAGE; k++)
803 {
804 if (BV (clib_bihash_is_free) (&v->kvp[k]))
805 {
806 if (verbose > 1)
807 s = format (s, " %d: empty\n",
808 j * BIHASH_KVP_PER_PAGE + k);
809 continue;
810 }
811 if (verbose)
812 {
Vijayabhaskar Katamreddyfb8e61c2017-12-14 13:20:50 -0800813 if (h->fmt_fn)
814 {
815 s = format (s, " %d: %U\n",
816 j * BIHASH_KVP_PER_PAGE + k,
Vijayabhaskar Katamreddy72739a62019-05-07 13:27:32 -0700817 h->fmt_fn, &(v->kvp[k]), verbose);
Vijayabhaskar Katamreddyfb8e61c2017-12-14 13:20:50 -0800818 }
819 else
820 {
821 s = format (s, " %d: %U\n",
822 j * BIHASH_KVP_PER_PAGE + k,
823 BV (format_bihash_kvp), &(v->kvp[k]));
824 }
Dave Barachc3799992016-08-15 11:12:27 -0400825 }
826 active_elements++;
827 }
828 v++;
829 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700830 }
831
Dave Barache7d212f2018-02-07 13:14:06 -0500832 s = format (s, " %lld active elements %lld active buckets\n",
833 active_elements, active_buckets);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700834 s = format (s, " %d free lists\n", vec_len (h->freelists));
Dave Barache7d212f2018-02-07 13:14:06 -0500835
836 for (i = 0; i < vec_len (h->freelists); i++)
837 {
838 u32 nfree = 0;
839 BVT (clib_bihash_value) * free_elt;
Dave Barachffb14b92018-09-11 17:20:23 -0400840 u64 free_elt_as_u64 = h->freelists[i];
Dave Barache7d212f2018-02-07 13:14:06 -0500841
Dave Barachffb14b92018-09-11 17:20:23 -0400842 while (free_elt_as_u64)
Dave Barache7d212f2018-02-07 13:14:06 -0500843 {
Dave Barachffb14b92018-09-11 17:20:23 -0400844 free_elt = BV (clib_bihash_get_value) (h, free_elt_as_u64);
Dave Barache7d212f2018-02-07 13:14:06 -0500845 nfree++;
Dave Barachffb14b92018-09-11 17:20:23 -0400846 free_elt_as_u64 = free_elt->next_free_as_u64;
Dave Barache7d212f2018-02-07 13:14:06 -0500847 }
848
Dave Barach9466c452018-08-24 17:21:14 -0400849 if (nfree || verbose)
850 s = format (s, " [len %d] %u free elts\n", 1 << i, nfree);
Dave Barache7d212f2018-02-07 13:14:06 -0500851 }
852
853 s = format (s, " %lld linear search buckets\n", linear_buckets);
Dave Barachffb14b92018-09-11 17:20:23 -0400854 used_bytes = alloc_arena_next (h);
Dave Barach97f5af02018-02-22 09:48:45 -0500855 s = format (s,
856 " arena: base %llx, next %llx\n"
857 " used %lld b (%lld Mbytes) of %lld b (%lld Mbytes)\n",
Dave Barach9466c452018-08-24 17:21:14 -0400858 alloc_arena (h), alloc_arena_next (h),
Dave Barach97f5af02018-02-22 09:48:45 -0500859 used_bytes, used_bytes >> 20,
Dave Barach9466c452018-08-24 17:21:14 -0400860 alloc_arena_size (h), alloc_arena_size (h) >> 20);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700861 return s;
862}
863
Dave Barachc3799992016-08-15 11:12:27 -0400864void BV (clib_bihash_foreach_key_value_pair)
865 (BVT (clib_bihash) * h, void *callback, void *arg)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700866{
867 int i, j, k;
Dave Barach908a5ea2017-07-14 12:42:21 -0400868 BVT (clib_bihash_bucket) * b;
Dave Barachc3799992016-08-15 11:12:27 -0400869 BVT (clib_bihash_value) * v;
870 void (*fp) (BVT (clib_bihash_kv) *, void *) = callback;
871
Dave Barach32dcd3b2019-07-08 12:25:38 -0400872 if (PREDICT_FALSE (alloc_arena (h) == 0))
873 return;
874
Ed Warnickecb9cada2015-12-08 15:45:58 -0700875 for (i = 0; i < h->nbuckets; i++)
876 {
Dave Barachc3799992016-08-15 11:12:27 -0400877 b = &h->buckets[i];
Damjan Marion882fcfe2018-07-17 23:01:49 +0200878 if (BV (clib_bihash_bucket_is_empty) (b))
Dave Barachc3799992016-08-15 11:12:27 -0400879 continue;
880
881 v = BV (clib_bihash_get_value) (h, b->offset);
882 for (j = 0; j < (1 << b->log2_pages); j++)
883 {
884 for (k = 0; k < BIHASH_KVP_PER_PAGE; k++)
885 {
886 if (BV (clib_bihash_is_free) (&v->kvp[k]))
887 continue;
888
889 (*fp) (&v->kvp[k], arg);
Dave Barachca45ee72018-08-06 08:43:47 -0400890 /*
891 * In case the callback deletes the last entry in the bucket...
892 */
893 if (BV (clib_bihash_bucket_is_empty) (b))
894 goto doublebreak;
Dave Barachc3799992016-08-15 11:12:27 -0400895 }
896 v++;
897 }
Dave Barachca45ee72018-08-06 08:43:47 -0400898 doublebreak:
899 ;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700900 }
901}
Dave Barachdd3a57f2016-07-27 16:58:51 -0400902
Chris Luke16bcf7d2016-09-01 14:31:46 -0400903/** @endcond */
Dave Barachc3799992016-08-15 11:12:27 -0400904
905/*
906 * fd.io coding-style-patch-verification: ON
907 *
908 * Local Variables:
909 * eval: (c-set-style "gnu")
910 * End:
911 */