blob: 18a87b300446ec5a79c9346536f7e9d7902dd233 [file] [log] [blame]
Florin Corase86a8ed2018-01-05 03:20:25 -08001/*
2 *------------------------------------------------------------------
3 * Copyright (c) 2018 Cisco and/or its affiliates.
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at:
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 *------------------------------------------------------------------
16 */
17#include <signal.h>
18
19#include <vlib/vlib.h>
20#include <vlibapi/api.h>
21#include <vlibmemory/api.h>
22#include <vlibmemory/memory_api.h>
23
24#include <vlibmemory/vl_memory_msg_enum.h> /* enumerate all vlib messages */
25
26#define vl_typedefs /* define message structures */
27#include <vlibmemory/vl_memory_api_h.h>
28#undef vl_typedefs
29
30/* instantiate all the print functions we know about */
31#define vl_print(handle, ...) vlib_cli_output (handle, __VA_ARGS__)
32#define vl_printfun
33#include <vlibmemory/vl_memory_api_h.h>
34#undef vl_printfun
35
36/* instantiate all the endian swap functions we know about */
37#define vl_endianfun
38#include <vlibmemory/vl_memory_api_h.h>
39#undef vl_endianfun
40
41static inline void *
42vl_api_memclnt_create_t_print (vl_api_memclnt_create_t * a, void *handle)
43{
44 vl_print (handle, "vl_api_memclnt_create_t:\n");
45 vl_print (handle, "name: %s\n", a->name);
46 vl_print (handle, "input_queue: 0x%wx\n", a->input_queue);
47 vl_print (handle, "context: %u\n", (unsigned) a->context);
48 vl_print (handle, "ctx_quota: %ld\n", (long) a->ctx_quota);
49 return handle;
50}
51
52static inline void *
53vl_api_memclnt_delete_t_print (vl_api_memclnt_delete_t * a, void *handle)
54{
55 vl_print (handle, "vl_api_memclnt_delete_t:\n");
56 vl_print (handle, "index: %u\n", (unsigned) a->index);
57 vl_print (handle, "handle: 0x%wx\n", a->handle);
58 return handle;
59}
60
61volatile int **vl_api_queue_cursizes;
62
63static void
64memclnt_queue_callback (vlib_main_t * vm)
65{
66 int i;
Dave Barach39d69112019-11-27 11:42:13 -050067 api_main_t *am = vlibapi_get_main ();
Florin Corase86a8ed2018-01-05 03:20:25 -080068
69 if (PREDICT_FALSE (vec_len (vl_api_queue_cursizes) !=
70 1 + vec_len (am->vlib_private_rps)))
71 {
72 vl_shmem_hdr_t *shmem_hdr = am->shmem_hdr;
73 svm_queue_t *q;
74
75 if (shmem_hdr == 0)
76 return;
77
78 q = shmem_hdr->vl_input_queue;
79 if (q == 0)
80 return;
81
82 vec_add1 (vl_api_queue_cursizes, &q->cursize);
83
84 for (i = 0; i < vec_len (am->vlib_private_rps); i++)
85 {
86 svm_region_t *vlib_rp = am->vlib_private_rps[i];
87
88 shmem_hdr = (void *) vlib_rp->user_ctx;
89 q = shmem_hdr->vl_input_queue;
90 vec_add1 (vl_api_queue_cursizes, &q->cursize);
91 }
92 }
93
94 for (i = 0; i < vec_len (vl_api_queue_cursizes); i++)
95 {
96 if (*vl_api_queue_cursizes[i])
97 {
98 vm->queue_signal_pending = 1;
99 vm->api_queue_nonempty = 1;
100 vlib_process_signal_event (vm, vl_api_clnt_node.index,
101 /* event_type */ QUEUE_SIGNAL_EVENT,
102 /* event_data */ 0);
103 break;
104 }
105 }
Dave Barachf6c68d72018-11-01 08:12:52 -0400106 if (vec_len (vm->pending_rpc_requests))
107 {
108 vm->queue_signal_pending = 1;
109 vm->api_queue_nonempty = 1;
110 vlib_process_signal_event (vm, vl_api_clnt_node.index,
111 /* event_type */ QUEUE_SIGNAL_EVENT,
112 /* event_data */ 0);
113 }
Florin Corase86a8ed2018-01-05 03:20:25 -0800114}
115
116/*
117 * vl_api_memclnt_create_internal
118 */
119u32
120vl_api_memclnt_create_internal (char *name, svm_queue_t * q)
121{
122 vl_api_registration_t **regpp;
123 vl_api_registration_t *regp;
Florin Corase86a8ed2018-01-05 03:20:25 -0800124 void *oldheap;
Dave Barach39d69112019-11-27 11:42:13 -0500125 api_main_t *am = vlibapi_get_main ();
Florin Corase86a8ed2018-01-05 03:20:25 -0800126
127 ASSERT (vlib_get_thread_index () == 0);
128 pool_get (am->vl_clients, regpp);
129
Florin Corase86a8ed2018-01-05 03:20:25 -0800130
Nathan Skrzypczak0aa40132019-11-25 16:29:38 +0100131 oldheap = vl_msg_push_heap ();
Florin Corase86a8ed2018-01-05 03:20:25 -0800132 *regpp = clib_mem_alloc (sizeof (vl_api_registration_t));
133
134 regp = *regpp;
Dave Barachb7b92992018-10-17 10:38:51 -0400135 clib_memset (regp, 0, sizeof (*regp));
Florin Corase86a8ed2018-01-05 03:20:25 -0800136 regp->registration_type = REGISTRATION_TYPE_SHMEM;
137 regp->vl_api_registration_pool_index = regpp - am->vl_clients;
Nathan Skrzypczak0aa40132019-11-25 16:29:38 +0100138 regp->vlib_rp = am->vlib_rp;
Florin Corase86a8ed2018-01-05 03:20:25 -0800139 regp->shmem_hdr = am->shmem_hdr;
140
141 regp->vl_input_queue = q;
142 regp->name = format (0, "%s%c", name, 0);
143
Nathan Skrzypczak0aa40132019-11-25 16:29:38 +0100144 vl_msg_pop_heap (oldheap);
Florin Corase86a8ed2018-01-05 03:20:25 -0800145 return vl_msg_api_handle_from_index_and_epoch
146 (regp->vl_api_registration_pool_index,
147 am->shmem_hdr->application_restarts);
148}
149
150/*
151 * vl_api_memclnt_create_t_handler
152 */
153void
154vl_api_memclnt_create_t_handler (vl_api_memclnt_create_t * mp)
155{
156 vl_api_registration_t **regpp;
157 vl_api_registration_t *regp;
158 vl_api_memclnt_create_reply_t *rp;
Florin Corase86a8ed2018-01-05 03:20:25 -0800159 svm_queue_t *q;
160 int rv = 0;
161 void *oldheap;
Dave Barach39d69112019-11-27 11:42:13 -0500162 api_main_t *am = vlibapi_get_main ();
Florin Corase25c9bf2018-08-06 12:19:29 -0700163 u8 *msg_table;
Florin Corase86a8ed2018-01-05 03:20:25 -0800164
165 /*
166 * This is tortured. Maintain a vlib-address-space private
167 * pool of client registrations. We use the shared-memory virtual
168 * address of client structure as a handle, to allow direct
169 * manipulation of context quota vbls from the client library.
170 *
171 * This scheme causes trouble w/ API message trace replay, since
172 * some random VA from clib_mem_alloc() certainly won't
173 * occur in the Linux sim. The (very) few places
174 * that care need to use the pool index.
175 *
176 * Putting the registration object(s) into a pool in shared memory and
177 * using the pool index as a handle seems like a great idea.
178 * Unfortunately, each and every reference to that pool would need
179 * to be protected by a mutex:
180 *
181 * Client VLIB
182 * ------ ----
183 * convert pool index to
184 * pointer.
185 * <deschedule>
186 * expand pool
187 * <deschedule>
188 * kaboom!
189 */
190
191 pool_get (am->vl_clients, regpp);
192
Nathan Skrzypczak0aa40132019-11-25 16:29:38 +0100193 oldheap = vl_msg_push_heap ();
Florin Corase86a8ed2018-01-05 03:20:25 -0800194 *regpp = clib_mem_alloc (sizeof (vl_api_registration_t));
195
196 regp = *regpp;
Dave Barachb7b92992018-10-17 10:38:51 -0400197 clib_memset (regp, 0, sizeof (*regp));
Florin Corase86a8ed2018-01-05 03:20:25 -0800198 regp->registration_type = REGISTRATION_TYPE_SHMEM;
199 regp->vl_api_registration_pool_index = regpp - am->vl_clients;
Nathan Skrzypczak0aa40132019-11-25 16:29:38 +0100200 regp->vlib_rp = am->vlib_rp;
Florin Corase86a8ed2018-01-05 03:20:25 -0800201 regp->shmem_hdr = am->shmem_hdr;
Florin Corasb384b542018-01-15 01:08:33 -0800202 regp->clib_file_index = am->shmem_hdr->clib_file_index;
Florin Corase86a8ed2018-01-05 03:20:25 -0800203
204 q = regp->vl_input_queue = (svm_queue_t *) (uword) mp->input_queue;
Benoît Ganne9fb6d402019-04-15 15:28:21 +0200205 VL_MSG_API_SVM_QUEUE_UNPOISON (q);
Florin Corase86a8ed2018-01-05 03:20:25 -0800206
Ole Troan7adaa222019-08-27 15:05:27 +0200207 regp->name = format (0, "%s", mp->name);
Florin Corase86a8ed2018-01-05 03:20:25 -0800208 vec_add1 (regp->name, 0);
209
210 if (am->serialized_message_table_in_shmem == 0)
211 am->serialized_message_table_in_shmem =
212 vl_api_serialize_message_table (am, 0);
213
Florin Corase25c9bf2018-08-06 12:19:29 -0700214 if (am->vlib_rp != am->vlib_primary_rp)
215 msg_table = vl_api_serialize_message_table (am, 0);
216 else
217 msg_table = am->serialized_message_table_in_shmem;
218
Nathan Skrzypczak0aa40132019-11-25 16:29:38 +0100219 vl_msg_pop_heap (oldheap);
Florin Corase86a8ed2018-01-05 03:20:25 -0800220
221 rp = vl_msg_api_alloc (sizeof (*rp));
222 rp->_vl_msg_id = ntohs (VL_API_MEMCLNT_CREATE_REPLY);
223 rp->handle = (uword) regp;
224 rp->index = vl_msg_api_handle_from_index_and_epoch
225 (regp->vl_api_registration_pool_index,
226 am->shmem_hdr->application_restarts);
227 rp->context = mp->context;
228 rp->response = ntohl (rv);
Florin Corase25c9bf2018-08-06 12:19:29 -0700229 rp->message_table = pointer_to_uword (msg_table);
Florin Corase86a8ed2018-01-05 03:20:25 -0800230
231 vl_msg_api_send_shmem (q, (u8 *) & rp);
232}
233
Dave Barach38ca6e62020-07-17 17:16:34 -0400234void
Florin Corase86a8ed2018-01-05 03:20:25 -0800235vl_api_call_reaper_functions (u32 client_index)
236{
237 clib_error_t *error = 0;
238 _vl_msg_api_function_list_elt_t *i;
239
Dave Barach39d69112019-11-27 11:42:13 -0500240 i = vlibapi_get_main ()->reaper_function_registrations;
Florin Corase86a8ed2018-01-05 03:20:25 -0800241 while (i)
242 {
243 error = i->f (client_index);
244 if (error)
245 clib_error_report (error);
246 i = i->next_init_function;
247 }
Florin Corase86a8ed2018-01-05 03:20:25 -0800248}
249
250/*
251 * vl_api_memclnt_delete_t_handler
252 */
253void
254vl_api_memclnt_delete_t_handler (vl_api_memclnt_delete_t * mp)
255{
256 vl_api_registration_t **regpp;
257 vl_api_registration_t *regp;
258 vl_api_memclnt_delete_reply_t *rp;
Florin Corase86a8ed2018-01-05 03:20:25 -0800259 void *oldheap;
Dave Barach39d69112019-11-27 11:42:13 -0500260 api_main_t *am = vlibapi_get_main ();
Florin Corase86a8ed2018-01-05 03:20:25 -0800261 u32 handle, client_index, epoch;
262
263 handle = mp->index;
264
Dave Barach38ca6e62020-07-17 17:16:34 -0400265 vl_api_call_reaper_functions (handle);
Florin Corase86a8ed2018-01-05 03:20:25 -0800266
267 epoch = vl_msg_api_handle_get_epoch (handle);
268 client_index = vl_msg_api_handle_get_index (handle);
269
270 if (epoch != (am->shmem_hdr->application_restarts & VL_API_EPOCH_MASK))
271 {
272 clib_warning
273 ("Stale clnt delete index %d old epoch %d cur epoch %d",
274 client_index, epoch,
275 (am->shmem_hdr->application_restarts & VL_API_EPOCH_MASK));
276 return;
277 }
278
Florin Corasb384b542018-01-15 01:08:33 -0800279 regpp = pool_elt_at_index (am->vl_clients, client_index);
Florin Corase86a8ed2018-01-05 03:20:25 -0800280
281 if (!pool_is_free (am->vl_clients, regpp))
282 {
283 int i;
284 regp = *regpp;
Florin Corase86a8ed2018-01-05 03:20:25 -0800285 int private_registration = 0;
286
Florin Coraseaec2a62018-12-04 16:34:05 -0800287 /* Send reply unless client asked us to do the cleanup */
288 if (!mp->do_cleanup)
Florin Corase86a8ed2018-01-05 03:20:25 -0800289 {
Florin Coraseaec2a62018-12-04 16:34:05 -0800290 /*
291 * Note: the API message handling path will set am->vlib_rp
292 * as appropriate for pairwise / private memory segments
293 */
294 rp = vl_msg_api_alloc (sizeof (*rp));
295 rp->_vl_msg_id = ntohs (VL_API_MEMCLNT_DELETE_REPLY);
296 rp->handle = mp->handle;
297 rp->response = 1;
298
299 vl_msg_api_send_shmem (regp->vl_input_queue, (u8 *) & rp);
300 if (client_index != regp->vl_api_registration_pool_index)
301 {
302 clib_warning ("mismatch client_index %d pool_index %d",
303 client_index,
304 regp->vl_api_registration_pool_index);
305 vl_msg_api_free (rp);
306 return;
307 }
Florin Corase86a8ed2018-01-05 03:20:25 -0800308 }
309
Benoît Gannef26b2512019-09-11 16:43:44 +0200310 /* No dangling references, please */
311 *regpp = 0;
312
Florin Corase86a8ed2018-01-05 03:20:25 -0800313 /* For horizontal scaling, add a hash table... */
314 for (i = 0; i < vec_len (am->vlib_private_rps); i++)
315 {
316 /* Is this a pairwise / private API segment? */
Nathan Skrzypczak0aa40132019-11-25 16:29:38 +0100317 if (am->vlib_private_rps[i] == am->vlib_rp)
Florin Corase86a8ed2018-01-05 03:20:25 -0800318 {
319 /* Note: account for the memfd header page */
Nathan Skrzypczak0aa40132019-11-25 16:29:38 +0100320 uword virtual_base = am->vlib_rp->virtual_base - MMAP_PAGESIZE;
321 uword virtual_size = am->vlib_rp->virtual_size + MMAP_PAGESIZE;
Florin Corase86a8ed2018-01-05 03:20:25 -0800322
323 /*
324 * Kill the registration pool element before we make
325 * the index vanish forever
326 */
327 pool_put_index (am->vl_clients,
328 regp->vl_api_registration_pool_index);
329
330 vec_delete (am->vlib_private_rps, 1, i);
331 /* Kill it, accounting for the memfd header page */
332 if (munmap ((void *) virtual_base, virtual_size) < 0)
333 clib_unix_warning ("munmap");
334 /* Reset the queue-length-address cache */
335 vec_reset_length (vl_api_queue_cursizes);
336 private_registration = 1;
337 break;
338 }
339 }
340
Florin Corase86a8ed2018-01-05 03:20:25 -0800341 if (private_registration == 0)
342 {
343 pool_put_index (am->vl_clients,
344 regp->vl_api_registration_pool_index);
Nathan Skrzypczak0aa40132019-11-25 16:29:38 +0100345 oldheap = vl_msg_push_heap ();
Florin Coraseaec2a62018-12-04 16:34:05 -0800346 if (mp->do_cleanup)
347 svm_queue_free (regp->vl_input_queue);
Ole Troan73710c72018-06-04 22:27:49 +0200348 vec_free (regp->name);
Florin Corase86a8ed2018-01-05 03:20:25 -0800349 /* Poison the old registration */
Dave Barachb7b92992018-10-17 10:38:51 -0400350 clib_memset (regp, 0xF1, sizeof (*regp));
Florin Corase86a8ed2018-01-05 03:20:25 -0800351 clib_mem_free (regp);
Nathan Skrzypczak0aa40132019-11-25 16:29:38 +0100352 vl_msg_pop_heap (oldheap);
Florin Corase86a8ed2018-01-05 03:20:25 -0800353 /*
354 * These messages must be freed manually, since they're set up
355 * as "bounce" messages. In the private_registration == 1 case,
356 * we kill the shared-memory segment which contains the message
357 * with munmap.
358 */
359 vl_msg_api_free (mp);
360 }
361 }
362 else
363 {
364 clib_warning ("unknown client ID %d", mp->index);
365 }
366}
367
368/**
369 * client answered a ping, stave off the grim reaper...
370 */
371void
372 vl_api_memclnt_keepalive_reply_t_handler
373 (vl_api_memclnt_keepalive_reply_t * mp)
374{
375 vl_api_registration_t *regp;
376 vlib_main_t *vm = vlib_get_main ();
377
378 regp = vl_api_client_index_to_registration (mp->context);
379 if (regp)
380 {
381 regp->last_heard = vlib_time_now (vm);
382 regp->unanswered_pings = 0;
383 }
384 else
385 clib_warning ("BUG: anonymous memclnt_keepalive_reply");
386}
387
388/**
389 * We can send ourselves these messages if someone uses the
390 * builtin binary api test tool...
391 */
392static void
393vl_api_memclnt_keepalive_t_handler (vl_api_memclnt_keepalive_t * mp)
394{
395 vl_api_memclnt_keepalive_reply_t *rmp;
396 api_main_t *am;
397 vl_shmem_hdr_t *shmem_hdr;
398
Dave Barach39d69112019-11-27 11:42:13 -0500399 am = vlibapi_get_main ();
Florin Corase86a8ed2018-01-05 03:20:25 -0800400 shmem_hdr = am->shmem_hdr;
401
402 rmp = vl_msg_api_alloc_as_if_client (sizeof (*rmp));
Dave Barachb7b92992018-10-17 10:38:51 -0400403 clib_memset (rmp, 0, sizeof (*rmp));
Florin Corase86a8ed2018-01-05 03:20:25 -0800404 rmp->_vl_msg_id = ntohs (VL_API_MEMCLNT_KEEPALIVE_REPLY);
405 rmp->context = mp->context;
406 vl_msg_api_send_shmem (shmem_hdr->vl_input_queue, (u8 *) & rmp);
407}
408
/*
 * Messages handled in this file, as _(ID, name, traced).
 *
 * The third field is stored in the message config's "traced" member by
 * vl_mem_api_init. memclnt_keepalive[_reply] use 0 so that these boring
 * messages do not fill the API trace buffer.
 */
#define foreach_vlib_api_msg                                    \
_(MEMCLNT_CREATE, memclnt_create, 1)                            \
_(MEMCLNT_DELETE, memclnt_delete, 1)                            \
_(MEMCLNT_KEEPALIVE, memclnt_keepalive, 0)                      \
_(MEMCLNT_KEEPALIVE_REPLY, memclnt_keepalive_reply, 0)
Florin Corase86a8ed2018-01-05 03:20:25 -0800419
420/*
421 * memory_api_init
422 */
423int
424vl_mem_api_init (const char *region_name)
425{
426 int rv;
Dave Barach39d69112019-11-27 11:42:13 -0500427 api_main_t *am = vlibapi_get_main ();
Florin Corase86a8ed2018-01-05 03:20:25 -0800428 vl_msg_api_msg_config_t cfg;
429 vl_msg_api_msg_config_t *c = &cfg;
430 vl_shmem_hdr_t *shm;
431 vlib_main_t *vm = vlib_get_main ();
432
Dave Barachb7b92992018-10-17 10:38:51 -0400433 clib_memset (c, 0, sizeof (*c));
Florin Corase86a8ed2018-01-05 03:20:25 -0800434
435 if ((rv = vl_map_shmem (region_name, 1 /* is_vlib */ )) < 0)
436 return rv;
437
Dave Barachc89c7672019-07-19 17:40:18 -0400438#define _(N,n,t) do { \
Florin Corase86a8ed2018-01-05 03:20:25 -0800439 c->id = VL_API_##N; \
440 c->name = #n; \
441 c->handler = vl_api_##n##_t_handler; \
442 c->cleanup = vl_noop_handler; \
443 c->endian = vl_api_##n##_t_endian; \
444 c->print = vl_api_##n##_t_print; \
445 c->size = sizeof(vl_api_##n##_t); \
Dave Barachc89c7672019-07-19 17:40:18 -0400446 c->traced = t; /* trace, so these msgs print */ \
Florin Corase86a8ed2018-01-05 03:20:25 -0800447 c->replay = 0; /* don't replay client create/delete msgs */ \
448 c->message_bounce = 0; /* don't bounce this message */ \
449 vl_msg_api_config(c);} while (0);
450
451 foreach_vlib_api_msg;
452#undef _
453
454 /*
455 * special-case freeing of memclnt_delete messages, so we can
456 * simply munmap pairwise / private API segments...
457 */
458 am->message_bounce[VL_API_MEMCLNT_DELETE] = 1;
459 am->is_mp_safe[VL_API_MEMCLNT_KEEPALIVE_REPLY] = 1;
Dave Barachc898a4f2019-06-14 17:29:55 -0400460 am->is_mp_safe[VL_API_MEMCLNT_KEEPALIVE] = 1;
Florin Corase86a8ed2018-01-05 03:20:25 -0800461
462 vlib_set_queue_signal_callback (vm, memclnt_queue_callback);
463
464 shm = am->shmem_hdr;
465 ASSERT (shm && shm->vl_input_queue);
466
467 /* Make a note so we can always find the primary region easily */
468 am->vlib_primary_rp = am->vlib_rp;
469
470 return 0;
471}
472
Dave Barach1f806582018-06-14 09:18:21 -0400473clib_error_t *
Dave Barach048a4e52018-06-01 18:52:25 -0400474map_api_segment_init (vlib_main_t * vm)
475{
Dave Barach39d69112019-11-27 11:42:13 -0500476 api_main_t *am = vlibapi_get_main ();
Dave Barach048a4e52018-06-01 18:52:25 -0400477 int rv;
478
479 if ((rv = vl_mem_api_init (am->region_name)) < 0)
480 {
481 return clib_error_return (0, "vl_mem_api_init (%s) failed",
482 am->region_name);
483 }
484 return 0;
485}
486
Florin Corase86a8ed2018-01-05 03:20:25 -0800487static void
488send_memclnt_keepalive (vl_api_registration_t * regp, f64 now)
489{
490 vl_api_memclnt_keepalive_t *mp;
Florin Coras8d820852019-11-27 09:15:25 -0800491 svm_queue_t *q;
Dave Barach39d69112019-11-27 11:42:13 -0500492 api_main_t *am = vlibapi_get_main ();
Florin Corase86a8ed2018-01-05 03:20:25 -0800493
494 q = regp->vl_input_queue;
495
496 /*
497 * If the queue head is moving, assume that the client is processing
498 * messages and skip the ping. This heuristic may fail if the queue
499 * is in the same position as last time, net of wrapping; in which
500 * case, the client will receive a keepalive.
501 */
502 if (regp->last_queue_head != q->head)
503 {
504 regp->last_heard = now;
505 regp->unanswered_pings = 0;
506 regp->last_queue_head = q->head;
507 return;
508 }
509
510 /*
511 * push/pop shared memory segment, so this routine
512 * will work with "normal" as well as "private segment"
513 * memory clients..
514 */
515
Florin Coras8d820852019-11-27 09:15:25 -0800516 mp = vl_mem_api_alloc_as_if_client_w_reg (regp, sizeof (*mp));
Dave Barachb7b92992018-10-17 10:38:51 -0400517 clib_memset (mp, 0, sizeof (*mp));
Florin Corase86a8ed2018-01-05 03:20:25 -0800518 mp->_vl_msg_id = clib_host_to_net_u16 (VL_API_MEMCLNT_KEEPALIVE);
519 mp->context = mp->client_index =
520 vl_msg_api_handle_from_index_and_epoch
521 (regp->vl_api_registration_pool_index,
522 am->shmem_hdr->application_restarts);
523
524 regp->unanswered_pings++;
525
526 /* Failure-to-send due to a stuffed queue is absolutely expected */
527 if (svm_queue_add (q, (u8 *) & mp, 1 /* nowait */ ))
Florin Coras8d820852019-11-27 09:15:25 -0800528 vl_msg_api_free_w_region (regp->vlib_rp, mp);
Florin Corase86a8ed2018-01-05 03:20:25 -0800529}
530
Florin Corasb384b542018-01-15 01:08:33 -0800531static void
532vl_mem_send_client_keepalive_w_reg (api_main_t * am, f64 now,
533 vl_api_registration_t ** regpp,
534 u32 ** dead_indices,
535 u32 ** confused_indices)
536{
537 vl_api_registration_t *regp = *regpp;
538 if (regp)
539 {
540 /* If we haven't heard from this client recently... */
541 if (regp->last_heard < (now - 10.0))
542 {
543 if (regp->unanswered_pings == 2)
544 {
545 svm_queue_t *q;
546 q = regp->vl_input_queue;
547 if (kill (q->consumer_pid, 0) >= 0)
548 {
549 clib_warning ("REAPER: lazy binary API client '%s'",
550 regp->name);
551 regp->unanswered_pings = 0;
552 regp->last_heard = now;
553 }
554 else
555 {
556 clib_warning ("REAPER: binary API client '%s' died",
557 regp->name);
558 vec_add1 (*dead_indices, regpp - am->vl_clients);
559 }
560 }
561 else
562 send_memclnt_keepalive (regp, now);
563 }
564 else
565 regp->unanswered_pings = 0;
566 }
567 else
568 {
569 clib_warning ("NULL client registration index %d",
570 regpp - am->vl_clients);
571 vec_add1 (*confused_indices, regpp - am->vl_clients);
572 }
573}
574
Florin Corase86a8ed2018-01-05 03:20:25 -0800575void
576vl_mem_api_dead_client_scan (api_main_t * am, vl_shmem_hdr_t * shm, f64 now)
577{
578 vl_api_registration_t **regpp;
Florin Corase86a8ed2018-01-05 03:20:25 -0800579 static u32 *dead_indices;
580 static u32 *confused_indices;
581
582 vec_reset_length (dead_indices);
583 vec_reset_length (confused_indices);
584
585 /* *INDENT-OFF* */
Florin Corasb384b542018-01-15 01:08:33 -0800586 pool_foreach (regpp, am->vl_clients, ({
587 vl_mem_send_client_keepalive_w_reg (am, now, regpp, &dead_indices,
588 &confused_indices);
Florin Corase86a8ed2018-01-05 03:20:25 -0800589 }));
590 /* *INDENT-ON* */
Florin Corasb384b542018-01-15 01:08:33 -0800591
Florin Corase86a8ed2018-01-05 03:20:25 -0800592 /* This should "never happen," but if it does, fix it... */
593 if (PREDICT_FALSE (vec_len (confused_indices) > 0))
594 {
595 int i;
596 for (i = 0; i < vec_len (confused_indices); i++)
597 {
598 pool_put_index (am->vl_clients, confused_indices[i]);
599 }
600 }
601
602 if (PREDICT_FALSE (vec_len (dead_indices) > 0))
603 {
604 int i;
Florin Corase86a8ed2018-01-05 03:20:25 -0800605 void *oldheap;
606
607 /* Allow the application to clean up its registrations */
608 for (i = 0; i < vec_len (dead_indices); i++)
609 {
610 regpp = pool_elt_at_index (am->vl_clients, dead_indices[i]);
611 if (regpp)
612 {
613 u32 handle;
614
615 handle = vl_msg_api_handle_from_index_and_epoch
616 (dead_indices[i], shm->application_restarts);
Dave Barach38ca6e62020-07-17 17:16:34 -0400617 vl_api_call_reaper_functions (handle);
Florin Corase86a8ed2018-01-05 03:20:25 -0800618 }
619 }
620
Nathan Skrzypczak0aa40132019-11-25 16:29:38 +0100621 oldheap = vl_msg_push_heap ();
Florin Corase86a8ed2018-01-05 03:20:25 -0800622
623 for (i = 0; i < vec_len (dead_indices); i++)
624 {
625 regpp = pool_elt_at_index (am->vl_clients, dead_indices[i]);
626 if (regpp)
627 {
628 /* Is this a pairwise SVM segment? */
Nathan Skrzypczak0aa40132019-11-25 16:29:38 +0100629 if ((*regpp)->vlib_rp != am->vlib_rp)
Florin Corase86a8ed2018-01-05 03:20:25 -0800630 {
631 int i;
632 svm_region_t *dead_rp = (*regpp)->vlib_rp;
633 /* Note: account for the memfd header page */
David Johnsond9818dd2018-12-14 14:53:41 -0500634 uword virtual_base = dead_rp->virtual_base - MMAP_PAGESIZE;
635 uword virtual_size = dead_rp->virtual_size + MMAP_PAGESIZE;
Florin Corase86a8ed2018-01-05 03:20:25 -0800636
637 /* For horizontal scaling, add a hash table... */
638 for (i = 0; i < vec_len (am->vlib_private_rps); i++)
639 if (am->vlib_private_rps[i] == dead_rp)
640 {
641 vec_delete (am->vlib_private_rps, 1, i);
642 goto found;
643 }
Nathan Skrzypczak5ed3fe32019-11-07 16:00:57 +0100644 svm_pop_heap (oldheap);
Florin Corase86a8ed2018-01-05 03:20:25 -0800645 clib_warning ("private rp %llx AWOL", dead_rp);
Nathan Skrzypczak0aa40132019-11-25 16:29:38 +0100646 oldheap = svm_push_data_heap (am->vlib_rp);
Florin Corase86a8ed2018-01-05 03:20:25 -0800647
648 found:
649 /* Kill it, accounting for the memfd header page */
Nathan Skrzypczak5ed3fe32019-11-07 16:00:57 +0100650 svm_pop_heap (oldheap);
Florin Corase86a8ed2018-01-05 03:20:25 -0800651 if (munmap ((void *) virtual_base, virtual_size) < 0)
652 clib_unix_warning ("munmap");
653 /* Reset the queue-length-address cache */
654 vec_reset_length (vl_api_queue_cursizes);
Nathan Skrzypczak0aa40132019-11-25 16:29:38 +0100655 oldheap = svm_push_data_heap (am->vlib_rp);
Florin Corase86a8ed2018-01-05 03:20:25 -0800656 }
657 else
658 {
659 /* Poison the old registration */
Dave Barachb7b92992018-10-17 10:38:51 -0400660 clib_memset (*regpp, 0xF3, sizeof (**regpp));
Florin Corase86a8ed2018-01-05 03:20:25 -0800661 clib_mem_free (*regpp);
662 }
663 /* no dangling references, please */
664 *regpp = 0;
665 }
666 else
667 {
668 svm_pop_heap (oldheap);
669 clib_warning ("Duplicate free, client index %d",
670 regpp - am->vl_clients);
Nathan Skrzypczak0aa40132019-11-25 16:29:38 +0100671 oldheap = svm_push_data_heap (am->vlib_rp);
Florin Corase86a8ed2018-01-05 03:20:25 -0800672 }
673 }
674
675 svm_client_scan_this_region_nolock (am->vlib_rp);
676
Nathan Skrzypczak0aa40132019-11-25 16:29:38 +0100677 vl_msg_pop_heap (oldheap);
Florin Corase86a8ed2018-01-05 03:20:25 -0800678 for (i = 0; i < vec_len (dead_indices); i++)
679 pool_put_index (am->vl_clients, dead_indices[i]);
680 }
681}
682
683static inline int
Florin Coras8d820852019-11-27 09:15:25 -0800684void_mem_api_handle_msg_i (api_main_t * am, svm_region_t * vlib_rp,
685 vlib_main_t * vm, vlib_node_runtime_t * node,
686 u8 is_private)
Florin Corase86a8ed2018-01-05 03:20:25 -0800687{
Florin Coras8d820852019-11-27 09:15:25 -0800688 svm_queue_t *q;
Florin Corase86a8ed2018-01-05 03:20:25 -0800689 uword mp;
Florin Coras8d820852019-11-27 09:15:25 -0800690
691 q = ((vl_shmem_hdr_t *) (void *) vlib_rp->user_ctx)->vl_input_queue;
692
Florin Corase86a8ed2018-01-05 03:20:25 -0800693 if (!svm_queue_sub2 (q, (u8 *) & mp))
694 {
Benoît Ganne9fb6d402019-04-15 15:28:21 +0200695 VL_MSG_API_UNPOISON ((void *) mp);
Florin Coras8d820852019-11-27 09:15:25 -0800696 vl_msg_api_handler_with_vm_node (am, vlib_rp, (void *) mp, vm, node,
697 is_private);
Florin Corase86a8ed2018-01-05 03:20:25 -0800698 return 0;
699 }
700 return -1;
701}
702
703int
704vl_mem_api_handle_msg_main (vlib_main_t * vm, vlib_node_runtime_t * node)
705{
Dave Barach39d69112019-11-27 11:42:13 -0500706 api_main_t *am = vlibapi_get_main ();
Florin Coras8d820852019-11-27 09:15:25 -0800707 return void_mem_api_handle_msg_i (am, am->vlib_rp, vm, node,
708 0 /* is_private */ );
Florin Corase86a8ed2018-01-05 03:20:25 -0800709}
710
711int
Dave Barachf6c68d72018-11-01 08:12:52 -0400712vl_mem_api_handle_rpc (vlib_main_t * vm, vlib_node_runtime_t * node)
713{
Dave Barach39d69112019-11-27 11:42:13 -0500714 api_main_t *am = vlibapi_get_main ();
Dave Barachf6c68d72018-11-01 08:12:52 -0400715 int i;
716 uword *tmp, mp;
717
718 /*
719 * Swap pending and processing vectors, then process the RPCs
720 * Avoid deadlock conditions by construction.
721 */
722 clib_spinlock_lock_if_init (&vm->pending_rpc_lock);
723 tmp = vm->processing_rpc_requests;
724 vec_reset_length (tmp);
725 vm->processing_rpc_requests = vm->pending_rpc_requests;
726 vm->pending_rpc_requests = tmp;
727 clib_spinlock_unlock_if_init (&vm->pending_rpc_lock);
728
Dave Barach1bb981d2019-02-26 17:04:40 -0500729 /*
730 * RPCs are used to reflect function calls to thread 0
731 * when the underlying code is not thread-safe.
732 *
733 * Grabbing the thread barrier across a set of RPCs
734 * greatly increases efficiency, and avoids
735 * running afoul of the barrier sync holddown timer.
736 * The barrier sync code supports recursive locking.
737 *
738 * We really need to rewrite RPC-based code...
739 */
740 if (PREDICT_TRUE (vec_len (vm->processing_rpc_requests)))
Dave Barachf6c68d72018-11-01 08:12:52 -0400741 {
Dave Barach1bb981d2019-02-26 17:04:40 -0500742 vl_msg_api_barrier_sync ();
743 for (i = 0; i < vec_len (vm->processing_rpc_requests); i++)
744 {
745 mp = vm->processing_rpc_requests[i];
Florin Coras8d820852019-11-27 09:15:25 -0800746 vl_msg_api_handler_with_vm_node (am, am->vlib_rp, (void *) mp, vm,
747 node, 0 /* is_private */ );
Dave Barach1bb981d2019-02-26 17:04:40 -0500748 }
749 vl_msg_api_barrier_release ();
Dave Barachf6c68d72018-11-01 08:12:52 -0400750 }
Dave Barach1bb981d2019-02-26 17:04:40 -0500751
Dave Barachf6c68d72018-11-01 08:12:52 -0400752 return 0;
753}
754
755int
Florin Corase86a8ed2018-01-05 03:20:25 -0800756vl_mem_api_handle_msg_private (vlib_main_t * vm, vlib_node_runtime_t * node,
757 u32 reg_index)
758{
Dave Barach39d69112019-11-27 11:42:13 -0500759 api_main_t *am = vlibapi_get_main ();
Florin Coras8d820852019-11-27 09:15:25 -0800760 return void_mem_api_handle_msg_i (am, am->vlib_private_rps[reg_index], vm,
761 node, 1 /* is_private */ );
Florin Corase86a8ed2018-01-05 03:20:25 -0800762}
763
764vl_api_registration_t *
765vl_mem_api_client_index_to_registration (u32 handle)
766{
767 vl_api_registration_t **regpp;
768 vl_api_registration_t *regp;
Dave Barach39d69112019-11-27 11:42:13 -0500769 api_main_t *am = vlibapi_get_main ();
Florin Corasb384b542018-01-15 01:08:33 -0800770 vl_shmem_hdr_t *shmem_hdr;
Florin Corase86a8ed2018-01-05 03:20:25 -0800771 u32 index;
772
773 index = vl_msg_api_handle_get_index (handle);
Florin Corase86a8ed2018-01-05 03:20:25 -0800774 regpp = am->vl_clients + index;
775
776 if (pool_is_free (am->vl_clients, regpp))
777 {
778 vl_msg_api_increment_missing_client_counter ();
779 return 0;
780 }
781 regp = *regpp;
Florin Corasb384b542018-01-15 01:08:33 -0800782
783 shmem_hdr = (vl_shmem_hdr_t *) regp->shmem_hdr;
784 if (!vl_msg_api_handle_is_valid (handle, shmem_hdr->application_restarts))
785 {
786 vl_msg_api_increment_missing_client_counter ();
787 return 0;
788 }
789
Florin Corase86a8ed2018-01-05 03:20:25 -0800790 return (regp);
791}
792
793svm_queue_t *
794vl_api_client_index_to_input_queue (u32 index)
795{
796 vl_api_registration_t *regp;
Dave Barach39d69112019-11-27 11:42:13 -0500797 api_main_t *am = vlibapi_get_main ();
Florin Corase86a8ed2018-01-05 03:20:25 -0800798
799 /* Special case: vlib trying to send itself a message */
800 if (index == (u32) ~ 0)
801 return (am->shmem_hdr->vl_input_queue);
802
803 regp = vl_mem_api_client_index_to_registration (index);
804 if (!regp)
805 return 0;
806 return (regp->vl_input_queue);
807}
808
809static clib_error_t *
810setup_memclnt_exit (vlib_main_t * vm)
811{
812 atexit (vl_unmap_shmem);
813 return 0;
814}
815
816VLIB_INIT_FUNCTION (setup_memclnt_exit);
817
818u8 *
819format_api_message_rings (u8 * s, va_list * args)
820{
821 api_main_t *am = va_arg (*args, api_main_t *);
822 vl_shmem_hdr_t *shmem_hdr = va_arg (*args, vl_shmem_hdr_t *);
823 int main_segment = va_arg (*args, int);
824 ring_alloc_t *ap;
825 int i;
826
827 if (shmem_hdr == 0)
828 return format (s, "%8s %8s %8s %8s %8s\n",
829 "Owner", "Size", "Nitems", "Hits", "Misses");
830
831 ap = shmem_hdr->vl_rings;
832
833 for (i = 0; i < vec_len (shmem_hdr->vl_rings); i++)
834 {
835 s = format (s, "%8s %8d %8d %8d %8d\n",
836 "vlib", ap->size, ap->nitems, ap->hits, ap->misses);
837 ap++;
838 }
839
840 ap = shmem_hdr->client_rings;
841
842 for (i = 0; i < vec_len (shmem_hdr->client_rings); i++)
843 {
844 s = format (s, "%8s %8d %8d %8d %8d\n",
845 "clnt", ap->size, ap->nitems, ap->hits, ap->misses);
846 ap++;
847 }
848
849 if (main_segment)
850 {
851 s = format (s, "%d ring miss fallback allocations\n", am->ring_misses);
852 s = format
853 (s,
854 "%d application restarts, %d reclaimed msgs, %d garbage collects\n",
855 shmem_hdr->application_restarts, shmem_hdr->restart_reclaims,
856 shmem_hdr->garbage_collects);
857 }
858 return s;
859}
860
861static clib_error_t *
862vl_api_ring_command (vlib_main_t * vm,
863 unformat_input_t * input, vlib_cli_command_t * cli_cmd)
864{
865 int i;
866 vl_shmem_hdr_t *shmem_hdr;
Dave Barach39d69112019-11-27 11:42:13 -0500867 api_main_t *am = vlibapi_get_main ();
Florin Corase86a8ed2018-01-05 03:20:25 -0800868
869 /* First, dump the primary region rings.. */
870
871 if (am->vlib_primary_rp == 0 || am->vlib_primary_rp->user_ctx == 0)
872 {
873 vlib_cli_output (vm, "Shared memory segment not initialized...\n");
874 return 0;
875 }
876
877 shmem_hdr = (void *) am->vlib_primary_rp->user_ctx;
878
879 vlib_cli_output (vm, "Main API segment rings:");
880
881 vlib_cli_output (vm, "%U", format_api_message_rings, am,
882 0 /* print header */ , 0 /* notused */ );
883
884 vlib_cli_output (vm, "%U", format_api_message_rings, am,
885 shmem_hdr, 1 /* main segment */ );
886
887 for (i = 0; i < vec_len (am->vlib_private_rps); i++)
888 {
889 svm_region_t *vlib_rp = am->vlib_private_rps[i];
890 shmem_hdr = (void *) vlib_rp->user_ctx;
891 vl_api_registration_t **regpp;
892 vl_api_registration_t *regp = 0;
893
894 /* For horizontal scaling, add a hash table... */
895 /* *INDENT-OFF* */
896 pool_foreach (regpp, am->vl_clients,
897 ({
898 regp = *regpp;
899 if (regp && regp->vlib_rp == vlib_rp)
900 {
901 vlib_cli_output (vm, "%s segment rings:", regp->name);
902 goto found;
903 }
904 }));
905 vlib_cli_output (vm, "regp %llx not found?", regp);
906 continue;
907 /* *INDENT-ON* */
908 found:
909 vlib_cli_output (vm, "%U", format_api_message_rings, am,
910 0 /* print header */ , 0 /* notused */ );
911 vlib_cli_output (vm, "%U", format_api_message_rings, am,
912 shmem_hdr, 0 /* main segment */ );
913 }
914
915 return 0;
916}
917
918/*?
919 * Display binary api message allocation ring statistics
920?*/
921/* *INDENT-OFF* */
922VLIB_CLI_COMMAND (cli_show_api_ring_command, static) =
923{
924 .path = "show api ring-stats",
925 .short_help = "Message ring statistics",
926 .function = vl_api_ring_command,
927};
928/* *INDENT-ON* */
929
930clib_error_t *
931vlibmemory_init (vlib_main_t * vm)
932{
Dave Barach39d69112019-11-27 11:42:13 -0500933 api_main_t *am = vlibapi_get_main ();
Florin Corase86a8ed2018-01-05 03:20:25 -0800934 svm_map_region_args_t _a, *a = &_a;
Dave Barachb2204672018-11-30 16:46:29 -0500935 u8 *remove_path1, *remove_path2;
Dave Barachf8d50682019-05-14 18:01:44 -0400936 void vlibsocket_reference (void);
937
938 vlibsocket_reference ();
Dave Barachb2204672018-11-30 16:46:29 -0500939
940 /*
941 * By popular request / to avoid support fires, remove any old api segment
942 * files Right Here.
943 */
944 if (am->root_path == 0)
945 {
946 remove_path1 = format (0, "/dev/shm/global_vm%c", 0);
947 remove_path2 = format (0, "/dev/shm/vpe-api%c", 0);
948 }
949 else
950 {
951 remove_path1 = format (0, "/dev/shm/%s-global_vm%c", am->root_path, 0);
952 remove_path2 = format (0, "/dev/shm/%s-vpe-api%c", am->root_path, 0);
953 }
954
955 (void) unlink ((char *) remove_path1);
956 (void) unlink ((char *) remove_path2);
957
958 vec_free (remove_path1);
959 vec_free (remove_path2);
Florin Corase86a8ed2018-01-05 03:20:25 -0800960
Dave Barachb7b92992018-10-17 10:38:51 -0400961 clib_memset (a, 0, sizeof (*a));
Florin Corase86a8ed2018-01-05 03:20:25 -0800962 a->root_path = am->root_path;
963 a->name = SVM_GLOBAL_REGION_NAME;
964 a->baseva = (am->global_baseva != 0) ?
Damjan Marionaec8f892018-01-08 16:35:35 +0100965 am->global_baseva : +svm_get_global_region_base_va ();
Florin Corase86a8ed2018-01-05 03:20:25 -0800966 a->size = (am->global_size != 0) ? am->global_size : SVM_GLOBAL_REGION_SIZE;
967 a->flags = SVM_FLAGS_NODATA;
968 a->uid = am->api_uid;
969 a->gid = am->api_gid;
970 a->pvt_heap_size =
971 (am->global_pvt_heap_size !=
972 0) ? am->global_pvt_heap_size : SVM_PVT_MHEAP_SIZE;
973
974 svm_region_init_args (a);
975
Dave Barachf8d50682019-05-14 18:01:44 -0400976 return 0;
Florin Corase86a8ed2018-01-05 03:20:25 -0800977}
978
Florin Corase86a8ed2018-01-05 03:20:25 -0800979void
980vl_set_memory_region_name (const char *name)
981{
Dave Barach39d69112019-11-27 11:42:13 -0500982 api_main_t *am = vlibapi_get_main ();
Florin Corase86a8ed2018-01-05 03:20:25 -0800983 am->region_name = name;
984}
985
986/*
987 * fd.io coding-style-patch-verification: ON
988 *
989 * Local Variables:
990 * eval: (c-set-style "gnu")
991 * End:
992 */