blob: ce834a70aac260e7bc34f61c77b53bc89b57cce4 [file] [log] [blame]
Dave Barach59b25652017-09-10 15:04:27 -04001/*
2 *------------------------------------------------------------------
Ole Troan94495f22018-08-02 11:58:12 +02003 * socket_api.c
Dave Barach59b25652017-09-10 15:04:27 -04004 *
5 * Copyright (c) 2009 Cisco and/or its affiliates.
6 * Licensed under the Apache License, Version 2.0 (the "License");
7 * you may not use this file except in compliance with the License.
8 * You may obtain a copy of the License at:
9 *
10 * http://www.apache.org/licenses/LICENSE-2.0
11 *
12 * Unless required by applicable law or agreed to in writing, software
13 * distributed under the License is distributed on an "AS IS" BASIS,
14 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15 * See the License for the specific language governing permissions and
16 * limitations under the License.
17 *------------------------------------------------------------------
18 */
19
20#include <sys/types.h>
21#include <sys/socket.h>
22#include <netinet/in.h>
23#include <sys/ioctl.h>
Dave Barach59b25652017-09-10 15:04:27 -040024#include <fcntl.h>
25#include <sys/stat.h>
26
Florin Corase86a8ed2018-01-05 03:20:25 -080027#include <vppinfra/byte_order.h>
Florin Coras4d9b9d82018-01-14 12:25:50 -080028#include <svm/ssvm.h>
Dave Barach59b25652017-09-10 15:04:27 -040029#include <vlibmemory/api.h>
30
31#include <vlibmemory/vl_memory_msg_enum.h>
32
33#define vl_typedefs /* define message structures */
34#include <vlibmemory/vl_memory_api_h.h>
35#undef vl_typedefs
36
37/* instantiate all the print functions we know about */
38#define vl_print(handle, ...) vlib_cli_output (handle, __VA_ARGS__)
39#define vl_printfun
40#include <vlibmemory/vl_memory_api_h.h>
41#undef vl_printfun
42
43/* instantiate all the endian swap functions we know about */
44#define vl_endianfun
45#include <vlibmemory/vl_memory_api_h.h>
46#undef vl_endianfun
47
/*
 * File-global socket API state. The code in this file reaches the
 * registration pool, the shared read buffer (input_buffer), the pending
 * process arguments, the current registration pointer and the listen
 * socket through this instance.
 */
socket_main_t socket_main;
49
/*
 * Bit or'ed into a registration pool index to form a socket client handle.
 * The constant is unsigned: shifting a signed 1 into bit 31 is undefined
 * behavior, and all users combine it with u32 values anyway.
 */
#define SOCK_API_REG_HANDLE_BIT (1U << 31)
51
52static u32
53sock_api_registration_handle (vl_api_registration_t * regp)
54{
55 ASSERT (regp->vl_api_registration_pool_index < SOCK_API_REG_HANDLE_BIT);
56 return regp->vl_api_registration_pool_index | SOCK_API_REG_HANDLE_BIT;
57}
58
59static u32
60socket_api_registration_handle_to_index (u32 reg_index)
61{
62 return (reg_index & ~SOCK_API_REG_HANDLE_BIT);
63}
64
65u8
66vl_socket_api_registration_handle_is_valid (u32 reg_handle)
67{
68 return ((reg_handle & SOCK_API_REG_HANDLE_BIT) != 0);
69}
70
Dave Barach59b25652017-09-10 15:04:27 -040071void
Florin Corase86a8ed2018-01-05 03:20:25 -080072vl_sock_api_dump_clients (vlib_main_t * vm, api_main_t * am)
Dave Barach59b25652017-09-10 15:04:27 -040073{
74 vl_api_registration_t *reg;
75 socket_main_t *sm = &socket_main;
Dave Barach59b25652017-09-10 15:04:27 -040076 clib_file_t *f;
77
78 /*
79 * Must have at least one active client, not counting the
80 * REGISTRATION_TYPE_SOCKET_LISTEN bind/accept socket
81 */
82 if (pool_elts (sm->registration_pool) < 2)
83 return;
84
85 vlib_cli_output (vm, "Socket clients");
Florin Coras90a63982017-12-19 04:50:01 -080086 vlib_cli_output (vm, "%20s %8s", "Name", "Fildesc");
Dave Barach59b25652017-09-10 15:04:27 -040087 /* *INDENT-OFF* */
Damjan Marionb2c31b62020-12-13 21:47:40 +010088 pool_foreach (reg, sm->registration_pool)
89 {
Dave Barach59b25652017-09-10 15:04:27 -040090 if (reg->registration_type == REGISTRATION_TYPE_SOCKET_SERVER) {
Florin Corasb384b542018-01-15 01:08:33 -080091 f = vl_api_registration_file (reg);
92 vlib_cli_output (vm, "%20s %8d", reg->name, f->file_descriptor);
Dave Barach59b25652017-09-10 15:04:27 -040093 }
Damjan Marionb2c31b62020-12-13 21:47:40 +010094 }
Dave Barach59b25652017-09-10 15:04:27 -040095/* *INDENT-ON* */
96}
97
Ole Troan94495f22018-08-02 11:58:12 +020098vl_api_registration_t *
Florin Coras2881dec2018-10-02 18:29:25 -070099vl_socket_api_client_handle_to_registration (u32 handle)
Ole Troan94495f22018-08-02 11:58:12 +0200100{
101 socket_main_t *sm = &socket_main;
Florin Coras2881dec2018-10-02 18:29:25 -0700102 u32 index = socket_api_registration_handle_to_index (handle);
103 if (pool_is_free_index (sm->registration_pool, index))
Ole Troan94495f22018-08-02 11:58:12 +0200104 {
105#if DEBUG > 2
Florin Coras2881dec2018-10-02 18:29:25 -0700106 clib_warning ("Invalid index %d\n", index);
Ole Troan94495f22018-08-02 11:58:12 +0200107#endif
108 return 0;
109 }
Florin Coras2881dec2018-10-02 18:29:25 -0700110 return pool_elt_at_index (sm->registration_pool, index);
Ole Troan94495f22018-08-02 11:58:12 +0200111}
112
Dave Barach59b25652017-09-10 15:04:27 -0400113void
114vl_socket_api_send (vl_api_registration_t * rp, u8 * elem)
115{
Dave Barach59b25652017-09-10 15:04:27 -0400116#if CLIB_DEBUG > 1
117 u32 output_length;
118#endif
Florin Coras90a63982017-12-19 04:50:01 -0800119 socket_main_t *sm = &socket_main;
120 u16 msg_id = ntohs (*(u16 *) elem);
Dave Barach39d69112019-11-27 11:42:13 -0500121 api_main_t *am = vlibapi_get_main ();
Florin Coras90a63982017-12-19 04:50:01 -0800122 msgbuf_t *mb = (msgbuf_t *) (elem - offsetof (msgbuf_t, data));
Florin Coras90a63982017-12-19 04:50:01 -0800123 vl_api_registration_t *sock_rp;
Florin Coras8023ad42018-08-02 12:16:03 -0700124 clib_file_main_t *fm = &file_main;
125 clib_error_t *error;
Florin Corasb384b542018-01-15 01:08:33 -0800126 clib_file_t *cf;
Dave Barach59b25652017-09-10 15:04:27 -0400127
Florin Corasb384b542018-01-15 01:08:33 -0800128 cf = vl_api_registration_file (rp);
Dave Barach59b25652017-09-10 15:04:27 -0400129 ASSERT (rp->registration_type > REGISTRATION_TYPE_SHMEM);
130
131 if (msg_id >= vec_len (am->api_trace_cfg))
132 {
133 clib_warning ("id out of range: %d", msg_id);
134 vl_msg_api_free ((void *) elem);
135 return;
136 }
137
Florin Coras90a63982017-12-19 04:50:01 -0800138 sock_rp = pool_elt_at_index (sm->registration_pool,
139 rp->vl_api_registration_pool_index);
140 ASSERT (sock_rp);
141
Dave Barach59b25652017-09-10 15:04:27 -0400142 /* Add the msgbuf_t to the output vector */
Florin Coras8023ad42018-08-02 12:16:03 -0700143 vec_add (sock_rp->output_vector, (u8 *) mb, sizeof (*mb));
144
145 /* Try to send the message and save any error like
146 * we do in the input epoll loop */
147 vec_add (sock_rp->output_vector, elem, ntohl (mb->data_len));
148 error = clib_file_write (cf);
149 unix_save_error (&unix_main, error);
150
151 /* If we didn't finish sending everything, wait for tx space */
152 if (vec_len (sock_rp->output_vector) > 0
153 && !(cf->flags & UNIX_FILE_DATA_AVAILABLE_TO_WRITE))
154 {
155 cf->flags |= UNIX_FILE_DATA_AVAILABLE_TO_WRITE;
156 fm->file_update (cf, UNIX_FILE_UPDATE_MODIFY);
157 }
Dave Barach59b25652017-09-10 15:04:27 -0400158
159#if CLIB_DEBUG > 1
160 output_length = sizeof (*mb) + ntohl (mb->data_len);
161 clib_warning ("wrote %u bytes to fd %d", output_length,
162 cf->file_descriptor);
163#endif
164
165 vl_msg_api_free ((void *) elem);
166}
167
168void
Florin Corase86a8ed2018-01-05 03:20:25 -0800169vl_socket_free_registration_index (u32 pool_index)
Dave Barach59b25652017-09-10 15:04:27 -0400170{
171 int i;
172 vl_api_registration_t *rp;
Dave Barach38ca6e62020-07-17 17:16:34 -0400173 void vl_api_call_reaper_functions (u32 client_index);
174
Dave Barach59b25652017-09-10 15:04:27 -0400175 if (pool_is_free_index (socket_main.registration_pool, pool_index))
176 {
177 clib_warning ("main pool index %d already free", pool_index);
178 return;
179 }
180 rp = pool_elt_at_index (socket_main.registration_pool, pool_index);
181
Dave Barach38ca6e62020-07-17 17:16:34 -0400182 vl_api_call_reaper_functions (pool_index);
183
Dave Barach59b25652017-09-10 15:04:27 -0400184 ASSERT (rp->registration_type != REGISTRATION_TYPE_FREE);
185 for (i = 0; i < vec_len (rp->additional_fds_to_close); i++)
186 if (close (rp->additional_fds_to_close[i]) < 0)
187 clib_unix_warning ("close");
188 vec_free (rp->additional_fds_to_close);
189 vec_free (rp->name);
190 vec_free (rp->unprocessed_input);
191 vec_free (rp->output_vector);
192 rp->registration_type = REGISTRATION_TYPE_FREE;
193 pool_put (socket_main.registration_pool, rp);
194}
195
196void
Florin Coras5224b5c2019-12-06 17:05:08 -0800197vl_socket_process_api_msg (vl_api_registration_t * rp, i8 * input_v)
Dave Barach59b25652017-09-10 15:04:27 -0400198{
199 msgbuf_t *mbp = (msgbuf_t *) input_v;
200
201 u8 *the_msg = (u8 *) (mbp->data);
Dave Barach59b25652017-09-10 15:04:27 -0400202 socket_main.current_rp = rp;
203 vl_msg_api_socket_handler (the_msg);
Dave Barach59b25652017-09-10 15:04:27 -0400204 socket_main.current_rp = 0;
205}
206
Andrew Yourtchenko162b70d2021-03-11 12:54:11 +0000207int
208is_being_removed_reg_index (u32 reg_index)
209{
210 vl_api_registration_t *rp = vl_socket_get_registration (reg_index);
211 ALWAYS_ASSERT (rp != 0);
212 return (rp->is_being_removed);
213}
214
215static void
216socket_cleanup_pending_remove_registration_cb (u32 *preg_index)
217{
218 vl_api_registration_t *rp = vl_socket_get_registration (*preg_index);
219 clib_file_main_t *fm = &file_main;
220 u32 pending_remove_file_index = vl_api_registration_file_index (rp);
221
222 clib_file_t *zf = fm->file_pool + pending_remove_file_index;
223
224 clib_file_del (fm, zf);
225 vl_socket_free_registration_index (rp - socket_main.registration_pool);
226}
227
228static void
229vl_socket_request_remove_reg_index (u32 reg_index)
230{
231 vl_api_registration_t *rp = vl_socket_get_registration (reg_index);
232 ALWAYS_ASSERT (rp != 0);
233 if (rp->is_being_removed)
234 {
235 return;
236 }
237 rp->is_being_removed = 1;
238 vl_api_force_rpc_call_main_thread (
239 socket_cleanup_pending_remove_registration_cb, (void *) &reg_index,
240 sizeof (u32));
241}
242
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200243/*
244 * Read function for API socket.
245 *
246 * Read data from socket, invoke SOCKET_READ_EVENT
247 * for each fully read API message, return 0.
248 * Store incomplete data for next invocation to continue.
249 *
250 * On severe read error, the file is closed.
251 *
252 * As reading is single threaded,
253 * socket_main.input_buffer is used temporarily.
254 * Even its length is modified, but always restored before return.
255 *
256 * Incomplete data is copied into a vector,
257 * pointer saved in registration's unprocessed_input.
258 */
Dave Barach59b25652017-09-10 15:04:27 -0400259clib_error_t *
260vl_socket_read_ready (clib_file_t * uf)
261{
Dave Barach59b25652017-09-10 15:04:27 -0400262 vlib_main_t *vm = vlib_get_main ();
263 vl_api_registration_t *rp;
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200264 /* n is the size of data read to input_buffer */
Dave Barach59b25652017-09-10 15:04:27 -0400265 int n;
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200266 /* msg_buffer vector can point to input_buffer or unprocessed_input */
Dave Barach59b25652017-09-10 15:04:27 -0400267 i8 *msg_buffer = 0;
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200268 /* data_for_process is a vector containing one full message, incl msgbuf_t */
Dave Barach59b25652017-09-10 15:04:27 -0400269 u8 *data_for_process;
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200270 /* msgbuf_len is the size of one message, including sizeof (msgbuf_t) */
271 u32 msgbuf_len;
Dave Barach59b25652017-09-10 15:04:27 -0400272 u32 save_input_buffer_length = vec_len (socket_main.input_buffer);
273 vl_socket_args_for_process_t *a;
Florin Coras5224b5c2019-12-06 17:05:08 -0800274 u32 reg_index = uf->private_data;
Andrew Yourtchenko162b70d2021-03-11 12:54:11 +0000275 if (is_being_removed_reg_index (reg_index))
276 {
277 return 0;
278 }
Dave Barach59b25652017-09-10 15:04:27 -0400279
Florin Coras5224b5c2019-12-06 17:05:08 -0800280 rp = vl_socket_get_registration (reg_index);
Dave Barach59b25652017-09-10 15:04:27 -0400281
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200282 /* Ignore unprocessed_input for now, n describes input_buffer for now. */
Dave Barach59b25652017-09-10 15:04:27 -0400283 n = read (uf->file_descriptor, socket_main.input_buffer,
284 vec_len (socket_main.input_buffer));
285
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200286 if (n <= 0)
Dave Barach59b25652017-09-10 15:04:27 -0400287 {
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200288 if (errno != EAGAIN)
289 {
290 /* Severe error, close the file. */
Andrew Yourtchenko162b70d2021-03-11 12:54:11 +0000291 vl_socket_request_remove_reg_index (reg_index);
Dave Barach59b25652017-09-10 15:04:27 -0400292 }
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200293 /* EAGAIN means we do not close the file, but no data to process anyway. */
Dave Barach59b25652017-09-10 15:04:27 -0400294 return 0;
295 }
296
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200297 /* Fake smaller length teporarily, so input_buffer can be used as msg_buffer. */
Benoît Gannef017b812021-06-22 11:58:27 +0200298 vec_set_len (socket_main.input_buffer, n);
Dave Barach59b25652017-09-10 15:04:27 -0400299
300 /*
301 * Look for bugs here. This code is tricky because
302 * data read from a stream socket does not honor message
303 * boundaries. In the case of a long message (>4K bytes)
304 * we have to do (at least) 2 reads, etc.
305 */
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200306 /* Determine msg_buffer. */
307 if (vec_len (rp->unprocessed_input))
308 {
309 vec_append (rp->unprocessed_input, socket_main.input_buffer);
310 msg_buffer = rp->unprocessed_input;
311 }
312 else
313 {
314 msg_buffer = socket_main.input_buffer;
315 }
316 /* Loop to process any full messages. */
317 ASSERT (vec_len (msg_buffer) > 0);
Dave Barach59b25652017-09-10 15:04:27 -0400318 do
319 {
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200320 /* Here, we are not sure how big a chunk of message we have left. */
321 /* Do we at least know how big the full message will be? */
322 if (vec_len (msg_buffer) <= sizeof (msgbuf_t))
323 /* No, so fragment is not a full message. */
324 goto save_and_split;
Dave Barach59b25652017-09-10 15:04:27 -0400325
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200326 /* Now we know how big the full message will be. */
327 msgbuf_len =
328 ntohl (((msgbuf_t *) msg_buffer)->data_len) + sizeof (msgbuf_t);
Dave Barach59b25652017-09-10 15:04:27 -0400329
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200330 /* But do we have a full message? */
331 if (msgbuf_len > vec_len (msg_buffer))
Dave Barach59b25652017-09-10 15:04:27 -0400332 {
333 save_and_split:
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200334 /* We don't have the entire message yet. */
335 /* If msg_buffer is unprocessed_input, nothing needs to be done. */
Dave Barach59b25652017-09-10 15:04:27 -0400336 if (msg_buffer == socket_main.input_buffer)
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200337 /* But if we were using the input buffer, save the fragment. */
Dave Barach59b25652017-09-10 15:04:27 -0400338 {
339 ASSERT (vec_len (rp->unprocessed_input) == 0);
340 vec_validate (rp->unprocessed_input, vec_len (msg_buffer) - 1);
Dave Barach178cf492018-11-13 16:34:13 -0500341 clib_memcpy_fast (rp->unprocessed_input, msg_buffer,
342 vec_len (msg_buffer));
Benoît Gannef017b812021-06-22 11:58:27 +0200343 vec_set_len (rp->unprocessed_input, vec_len (msg_buffer));
Dave Barach59b25652017-09-10 15:04:27 -0400344 }
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200345 /* No more full messages, restore original input_buffer length. */
Benoît Gannef017b812021-06-22 11:58:27 +0200346 vec_set_len (socket_main.input_buffer, save_input_buffer_length);
Dave Barach59b25652017-09-10 15:04:27 -0400347 return 0;
348 }
349
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200350 /*
351 * We have at least one full message.
352 * But msg_buffer can contain more data, so copy one message data
353 * so we can overwrite its length to what single message has.
354 */
Dave Barach59b25652017-09-10 15:04:27 -0400355 data_for_process = (u8 *) vec_dup (msg_buffer);
Benoît Gannef017b812021-06-22 11:58:27 +0200356 vec_set_len (data_for_process, msgbuf_len);
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200357 /* Everything is ready to signal the SOCKET_READ_EVENT. */
Dave Barach59b25652017-09-10 15:04:27 -0400358 pool_get (socket_main.process_args, a);
Florin Coras5224b5c2019-12-06 17:05:08 -0800359 a->reg_index = reg_index;
Dave Barach59b25652017-09-10 15:04:27 -0400360 a->data = data_for_process;
361
Florin Corase86a8ed2018-01-05 03:20:25 -0800362 vlib_process_signal_event (vm, vl_api_clnt_node.index,
Dave Barach59b25652017-09-10 15:04:27 -0400363 SOCKET_READ_EVENT,
364 a - socket_main.process_args);
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200365 if (vec_len (msg_buffer) > msgbuf_len)
366 /* There are some fragments left. Shrink the msg_buffer to simplify logic. */
367 vec_delete (msg_buffer, msgbuf_len, 0);
Dave Barach59b25652017-09-10 15:04:27 -0400368 else
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200369 /* We are done with msg_buffer. */
Benoît Gannef017b812021-06-22 11:58:27 +0200370 vec_set_len (msg_buffer, 0);
Dave Barach59b25652017-09-10 15:04:27 -0400371 }
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200372 while (vec_len (msg_buffer) > 0);
Dave Barach59b25652017-09-10 15:04:27 -0400373
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200374 /* Restore input_buffer, it could have been msg_buffer. */
Benoît Gannef017b812021-06-22 11:58:27 +0200375 vec_set_len (socket_main.input_buffer, save_input_buffer_length);
Dave Barach59b25652017-09-10 15:04:27 -0400376 return 0;
377}
378
Dave Barach59b25652017-09-10 15:04:27 -0400379clib_error_t *
380vl_socket_write_ready (clib_file_t * uf)
381{
382 clib_file_main_t *fm = &file_main;
383 vl_api_registration_t *rp;
384 int n;
385
Andrew Yourtchenko162b70d2021-03-11 12:54:11 +0000386 u32 reg_index = uf->private_data;
387 if (is_being_removed_reg_index (reg_index))
388 {
389 return 0;
390 }
391
392 rp = pool_elt_at_index (socket_main.registration_pool, reg_index);
Dave Barach59b25652017-09-10 15:04:27 -0400393
394 /* Flush output vector. */
Ole Troan94495f22018-08-02 11:58:12 +0200395 size_t total_bytes = vec_len (rp->output_vector);
396 size_t bytes_to_send, remaining_bytes = total_bytes;
397 void *p = rp->output_vector;
398 while (remaining_bytes > 0)
Dave Barach59b25652017-09-10 15:04:27 -0400399 {
Ole Troan94495f22018-08-02 11:58:12 +0200400 bytes_to_send = remaining_bytes > 4096 ? 4096 : remaining_bytes;
401 n = write (uf->file_descriptor, p, bytes_to_send);
402 if (n < 0)
Florin Coras8023ad42018-08-02 12:16:03 -0700403 {
Ole Troan94495f22018-08-02 11:58:12 +0200404 if (errno == EAGAIN)
405 {
406 break;
407 }
408#if DEBUG > 2
409 clib_warning ("write error, close the file...\n");
410#endif
Andrew Yourtchenko162b70d2021-03-11 12:54:11 +0000411 vl_socket_request_remove_reg_index (reg_index);
Ole Troan94495f22018-08-02 11:58:12 +0200412 return 0;
Florin Coras8023ad42018-08-02 12:16:03 -0700413 }
Ole Troan94495f22018-08-02 11:58:12 +0200414 remaining_bytes -= bytes_to_send;
415 p += bytes_to_send;
416 }
417
418 vec_delete (rp->output_vector, total_bytes - remaining_bytes, 0);
419 if (vec_len (rp->output_vector) <= 0
420 && (uf->flags & UNIX_FILE_DATA_AVAILABLE_TO_WRITE))
421 {
422 uf->flags &= ~UNIX_FILE_DATA_AVAILABLE_TO_WRITE;
423 fm->file_update (uf, UNIX_FILE_UPDATE_MODIFY);
Florin Coras8023ad42018-08-02 12:16:03 -0700424 }
Dave Barach59b25652017-09-10 15:04:27 -0400425
426 return 0;
427}
428
429clib_error_t *
430vl_socket_error_ready (clib_file_t * uf)
431{
Andrew Yourtchenko162b70d2021-03-11 12:54:11 +0000432 u32 reg_index = uf->private_data;
433 vl_socket_request_remove_reg_index (reg_index);
Dave Barach59b25652017-09-10 15:04:27 -0400434 return 0;
435}
436
437void
438socksvr_file_add (clib_file_main_t * fm, int fd)
439{
440 vl_api_registration_t *rp;
441 clib_file_t template = { 0 };
442
443 pool_get (socket_main.registration_pool, rp);
Dave Barachb7b92992018-10-17 10:38:51 -0400444 clib_memset (rp, 0, sizeof (*rp));
Dave Barach59b25652017-09-10 15:04:27 -0400445
446 template.read_function = vl_socket_read_ready;
447 template.write_function = vl_socket_write_ready;
448 template.error_function = vl_socket_error_ready;
449 template.file_descriptor = fd;
Paul Vinciguerra5481ad42020-01-28 14:47:17 -0500450 template.description = format (0, "socksrv");
Dave Barach59b25652017-09-10 15:04:27 -0400451 template.private_data = rp - socket_main.registration_pool;
452
453 rp->registration_type = REGISTRATION_TYPE_SOCKET_SERVER;
454 rp->vl_api_registration_pool_index = rp - socket_main.registration_pool;
455 rp->clib_file_index = clib_file_add (fm, &template);
456}
457
458static clib_error_t *
459socksvr_accept_ready (clib_file_t * uf)
460{
461 clib_file_main_t *fm = &file_main;
462 socket_main_t *sm = &socket_main;
463 clib_socket_t *sock = &sm->socksvr_listen_socket;
464 clib_socket_t client;
465 clib_error_t *error;
466
467 error = clib_socket_accept (sock, &client);
Dave Barach59b25652017-09-10 15:04:27 -0400468 if (error)
469 return error;
470
471 socksvr_file_add (fm, client.fd);
472 return 0;
473}
474
475static clib_error_t *
476socksvr_bogus_write (clib_file_t * uf)
477{
478 clib_warning ("why am I here?");
479 return 0;
480}
481
482/*
483 * vl_api_sockclnt_create_t_handler
484 */
485void
486vl_api_sockclnt_create_t_handler (vl_api_sockclnt_create_t * mp)
487{
488 vl_api_registration_t *regp;
489 vl_api_sockclnt_create_reply_t *rp;
Dave Barach39d69112019-11-27 11:42:13 -0500490 api_main_t *am = vlibapi_get_main ();
Ole Troan94495f22018-08-02 11:58:12 +0200491 hash_pair_t *hp;
Florin Coras90a63982017-12-19 04:50:01 -0800492 int rv = 0;
Ole Troan94495f22018-08-02 11:58:12 +0200493 u32 nmsg = hash_elts (am->msg_index_by_name_and_crc);
494 u32 i = 0;
Dave Barach59b25652017-09-10 15:04:27 -0400495
496 regp = socket_main.current_rp;
497
Filip Tehlar36217e32021-07-23 08:51:10 +0000498 /* client already connected through shared memory? */
499 if (!regp || regp->registration_type != REGISTRATION_TYPE_SOCKET_SERVER)
500 {
501 clib_warning (
502 "unsupported API call: already connected though shared memory?");
503 return;
504 }
Dave Barach59b25652017-09-10 15:04:27 -0400505
Ole Troan7adaa222019-08-27 15:05:27 +0200506 regp->name = format (0, "%s%c", mp->name, 0);
Dave Barach59b25652017-09-10 15:04:27 -0400507
Ole Troan94495f22018-08-02 11:58:12 +0200508 u32 size = sizeof (*rp) + (nmsg * sizeof (vl_api_message_table_entry_t));
Vratko Polakfc4828c2019-07-02 11:07:24 +0200509 rp = vl_msg_api_alloc_zero (size);
Dave Barach59b25652017-09-10 15:04:27 -0400510 rp->_vl_msg_id = htons (VL_API_SOCKCLNT_CREATE_REPLY);
Florin Coras2881dec2018-10-02 18:29:25 -0700511 rp->index = htonl (sock_api_registration_handle (regp));
Dave Barach59b25652017-09-10 15:04:27 -0400512 rp->context = mp->context;
513 rp->response = htonl (rv);
Ole Troan94495f22018-08-02 11:58:12 +0200514 rp->count = htons (nmsg);
Dave Barach59b25652017-09-10 15:04:27 -0400515
Ole Troan94495f22018-08-02 11:58:12 +0200516 /* *INDENT-OFF* */
517 hash_foreach_pair (hp, am->msg_index_by_name_and_crc,
518 ({
519 rp->message_table[i].index = htons(hp->value[0]);
Dave Baracha6ef36b2020-02-11 10:29:13 -0500520 (void) strncpy_s((char *)rp->message_table[i].name,
521 64 /* bytes of space at dst */,
522 (char *)hp->key,
523 64-1 /* chars to copy, without zero byte. */);
Ole Troan94495f22018-08-02 11:58:12 +0200524 i++;
525 }));
526 /* *INDENT-ON* */
Florin Corase86a8ed2018-01-05 03:20:25 -0800527 vl_api_send_msg (regp, (u8 *) rp);
Dave Barach59b25652017-09-10 15:04:27 -0400528}
529
530/*
531 * vl_api_sockclnt_delete_t_handler
532 */
533void
534vl_api_sockclnt_delete_t_handler (vl_api_sockclnt_delete_t * mp)
535{
536 vl_api_registration_t *regp;
537 vl_api_sockclnt_delete_reply_t *rp;
538
Ole Troan94495f22018-08-02 11:58:12 +0200539 regp = vl_api_client_index_to_registration (mp->client_index);
540 if (!regp)
541 return;
542
Ole Troan3c1cf2c2019-01-05 11:27:54 +0100543 u32 reg_index = socket_api_registration_handle_to_index (ntohl (mp->index));
Ole Troan94495f22018-08-02 11:58:12 +0200544 rp = vl_msg_api_alloc (sizeof (*rp));
545 rp->_vl_msg_id = htons (VL_API_SOCKCLNT_DELETE_REPLY);
546 rp->context = mp->context;
547
548 if (!pool_is_free_index (socket_main.registration_pool, reg_index))
Dave Barach59b25652017-09-10 15:04:27 -0400549 {
Dave Barach59b25652017-09-10 15:04:27 -0400550 rp->response = htonl (1);
Florin Corase86a8ed2018-01-05 03:20:25 -0800551 vl_api_send_msg (regp, (u8 *) rp);
Dave Barach59b25652017-09-10 15:04:27 -0400552
Florin Corasb384b542018-01-15 01:08:33 -0800553 vl_api_registration_del_file (regp);
Ole Troan94495f22018-08-02 11:58:12 +0200554 vl_socket_free_registration_index (reg_index);
Dave Barach59b25652017-09-10 15:04:27 -0400555 }
556 else
557 {
Ole Troan94495f22018-08-02 11:58:12 +0200558 clib_warning ("unknown client ID %d", reg_index);
559 rp->response = htonl (-1);
560 vl_api_send_msg (regp, (u8 *) rp);
Dave Barach59b25652017-09-10 15:04:27 -0400561 }
562}
563
Florin Corasb384b542018-01-15 01:08:33 -0800564clib_error_t *
Florin Coras466f2892018-08-03 02:50:43 -0700565vl_sock_api_send_fd_msg (int socket_fd, int fds[], int n_fds)
Dave Barach59b25652017-09-10 15:04:27 -0400566{
567 struct msghdr mh = { 0 };
568 struct iovec iov[1];
Florin Coras99368312018-08-02 10:45:44 -0700569 char ctl[CMSG_SPACE (sizeof (int) * n_fds)];
Florin Coras466f2892018-08-03 02:50:43 -0700570 struct cmsghdr *cmsg;
571 char *msg = "fdmsg";
Dave Barach59b25652017-09-10 15:04:27 -0400572 int rv;
573
574 iov[0].iov_base = msg;
575 iov[0].iov_len = strlen (msg);
576 mh.msg_iov = iov;
577 mh.msg_iovlen = 1;
578
Dave Barachb7b92992018-10-17 10:38:51 -0400579 clib_memset (&ctl, 0, sizeof (ctl));
Dave Barach59b25652017-09-10 15:04:27 -0400580 mh.msg_control = ctl;
581 mh.msg_controllen = sizeof (ctl);
582 cmsg = CMSG_FIRSTHDR (&mh);
Florin Coras466f2892018-08-03 02:50:43 -0700583 cmsg->cmsg_len = CMSG_LEN (sizeof (int) * n_fds);
Dave Barach59b25652017-09-10 15:04:27 -0400584 cmsg->cmsg_level = SOL_SOCKET;
585 cmsg->cmsg_type = SCM_RIGHTS;
Dave Barach178cf492018-11-13 16:34:13 -0500586 clib_memcpy_fast (CMSG_DATA (cmsg), fds, sizeof (int) * n_fds);
Dave Barach59b25652017-09-10 15:04:27 -0400587
Florin Coras587ea452020-08-17 20:46:34 -0700588 while ((rv = sendmsg (socket_fd, &mh, 0)) < 0 && errno == EAGAIN)
589 ;
Dave Barach59b25652017-09-10 15:04:27 -0400590 if (rv < 0)
591 return clib_error_return_unix (0, "sendmsg");
592 return 0;
593}
594
Florin Coras90a63982017-12-19 04:50:01 -0800595vl_api_shm_elem_config_t *
596vl_api_make_shm_config (vl_api_sock_init_shm_t * mp)
597{
598 vl_api_shm_elem_config_t *config = 0, *c;
599 u64 cfg;
600 int i;
601
602 if (!mp->nitems)
603 {
Dave Barach78958722018-05-10 16:44:27 -0400604 vec_validate (config, 6);
Florin Coras90a63982017-12-19 04:50:01 -0800605 config[0].type = VL_API_VLIB_RING;
Florin Coras90a63982017-12-19 04:50:01 -0800606 config[0].size = 256;
Dave Barach78958722018-05-10 16:44:27 -0400607 config[0].count = 32;
608
609 config[1].type = VL_API_VLIB_RING;
Florin Coras90a63982017-12-19 04:50:01 -0800610 config[1].size = 1024;
Dave Barach78958722018-05-10 16:44:27 -0400611 config[1].count = 16;
612
613 config[2].type = VL_API_VLIB_RING;
Florin Coras90a63982017-12-19 04:50:01 -0800614 config[2].size = 4096;
Dave Barach78958722018-05-10 16:44:27 -0400615 config[2].count = 2;
616
617 config[3].type = VL_API_CLIENT_RING;
618 config[3].size = 256;
619 config[3].count = 32;
620
621 config[4].type = VL_API_CLIENT_RING;
622 config[4].size = 1024;
623 config[4].count = 16;
624
625 config[5].type = VL_API_CLIENT_RING;
626 config[5].size = 4096;
627 config[5].count = 2;
628
629 config[6].type = VL_API_QUEUE;
630 config[6].count = 128;
631 config[6].size = sizeof (uword);
Florin Coras90a63982017-12-19 04:50:01 -0800632 }
633 else
634 {
635 vec_validate (config, mp->nitems - 1);
636 for (i = 0; i < mp->nitems; i++)
637 {
638 cfg = mp->configs[i];
639 /* Pretty much a hack but it avoids defining our own api type
640 * in memclnt.api */
641 c = (vl_api_shm_elem_config_t *) & cfg;
642 config[i].type = c->type;
643 config[i].count = c->count;
644 config[i].size = c->size;
645 }
646 }
647 return config;
648}
649
Dave Barach59b25652017-09-10 15:04:27 -0400650/*
Florin Coras90a63982017-12-19 04:50:01 -0800651 * Bootstrap shm api using the socket api
Dave Barach59b25652017-09-10 15:04:27 -0400652 */
653void
Florin Coras90a63982017-12-19 04:50:01 -0800654vl_api_sock_init_shm_t_handler (vl_api_sock_init_shm_t * mp)
Dave Barach59b25652017-09-10 15:04:27 -0400655{
Florin Coras90a63982017-12-19 04:50:01 -0800656 vl_api_sock_init_shm_reply_t *rmp;
Florin Coras4d9b9d82018-01-14 12:25:50 -0800657 ssvm_private_t _memfd_private, *memfd = &_memfd_private;
Dave Barach59b25652017-09-10 15:04:27 -0400658 svm_map_region_args_t _args, *a = &_args;
Florin Coras90a63982017-12-19 04:50:01 -0800659 vl_api_registration_t *regp;
Dave Barach39d69112019-11-27 11:42:13 -0500660 api_main_t *am = vlibapi_get_main ();
Dave Barach59b25652017-09-10 15:04:27 -0400661 svm_region_t *vlib_rp;
Florin Coras90a63982017-12-19 04:50:01 -0800662 clib_file_t *cf;
663 vl_api_shm_elem_config_t *config = 0;
Florin Corasb384b542018-01-15 01:08:33 -0800664 vl_shmem_hdr_t *shmem_hdr;
Florin Coras1f30a592019-05-08 19:57:24 -0700665 int rv, tries = 1000;
Dave Barach59b25652017-09-10 15:04:27 -0400666
667 regp = vl_api_client_index_to_registration (mp->client_index);
Dave Barach59b25652017-09-10 15:04:27 -0400668 if (regp == 0)
669 {
670 clib_warning ("API client disconnected");
671 return;
672 }
Dave Barach59b25652017-09-10 15:04:27 -0400673 if (regp->registration_type != REGISTRATION_TYPE_SOCKET_SERVER)
674 {
wanghanlinec2c4c42021-03-02 17:18:06 +0800675 clib_warning ("Invalid registration");
676 return;
Dave Barach59b25652017-09-10 15:04:27 -0400677 }
678
Florin Coras90a63982017-12-19 04:50:01 -0800679 /*
680 * Set up a memfd segment of the requested size wherein the
681 * shmem data structures will be initialized
682 */
Dave Barachb7b92992018-10-17 10:38:51 -0400683 clib_memset (memfd, 0, sizeof (*memfd));
Florin Coras4d9b9d82018-01-14 12:25:50 -0800684 memfd->ssvm_size = mp->requested_size;
Dave Barach59b25652017-09-10 15:04:27 -0400685 memfd->requested_va = 0ULL;
Florin Coras5220a262020-09-29 18:11:24 -0700686 memfd->is_server = 1;
Dave Barach59b25652017-09-10 15:04:27 -0400687 memfd->name = format (0, "%s%c", regp->name, 0);
688
Florin Coras5220a262020-09-29 18:11:24 -0700689 if ((rv = ssvm_server_init_memfd (memfd)))
Dave Barach59b25652017-09-10 15:04:27 -0400690 goto reply;
691
Benoît Gannedf601ae2020-10-20 14:31:55 +0200692 /* delete the unused heap created in ssvm_server_init_memfd and mark it
693 * accessible again for ASAN */
694 clib_mem_destroy_heap (memfd->sh->heap);
695 CLIB_MEM_UNPOISON ((void *) memfd->sh->ssvm_va, memfd->ssvm_size);
696
Dave Barach59b25652017-09-10 15:04:27 -0400697 /* Remember to close this fd when the socket connection goes away */
698 vec_add1 (regp->additional_fds_to_close, memfd->fd);
699
Florin Coras90a63982017-12-19 04:50:01 -0800700 /*
701 * Create a plausible svm_region in the memfd backed segment
702 */
Dave Barachb7b92992018-10-17 10:38:51 -0400703 clib_memset (a, 0, sizeof (*a));
Florin Coras4d9b9d82018-01-14 12:25:50 -0800704 a->baseva = memfd->sh->ssvm_va + MMAP_PAGESIZE;
705 a->size = memfd->ssvm_size - MMAP_PAGESIZE;
Dave Barach59b25652017-09-10 15:04:27 -0400706 /* $$$$ might want a different config parameter */
707 a->pvt_heap_size = am->api_pvt_heap_size;
708 a->flags = SVM_FLAGS_MHEAP;
709 svm_region_init_mapped_region (a, (svm_region_t *) a->baseva);
710
Dave Barach59b25652017-09-10 15:04:27 -0400711 /*
712 * Part deux, initialize the svm_region_t shared-memory header
713 * api allocation rings, and so on.
714 */
Florin Coras90a63982017-12-19 04:50:01 -0800715 config = vl_api_make_shm_config (mp);
716 vlib_rp = (svm_region_t *) a->baseva;
717 vl_init_shmem (vlib_rp, config, 1 /* is_vlib (dont-care) */ ,
718 1 /* is_private */ );
Florin Corasb384b542018-01-15 01:08:33 -0800719
720 /* Remember who created this. Needs to be post vl_init_shmem */
721 shmem_hdr = (vl_shmem_hdr_t *) vlib_rp->user_ctx;
722 shmem_hdr->clib_file_index = vl_api_registration_file_index (regp);
723
Dave Barach59b25652017-09-10 15:04:27 -0400724 vec_add1 (am->vlib_private_rps, vlib_rp);
Dave Barach59b25652017-09-10 15:04:27 -0400725 memfd->sh->ready = 1;
Florin Coras90a63982017-12-19 04:50:01 -0800726 vec_free (config);
Dave Barach59b25652017-09-10 15:04:27 -0400727
728 /* Recompute the set of input queues to poll in memclnt_process */
729 vec_reset_length (vl_api_queue_cursizes);
730
731reply:
732
Florin Coras90a63982017-12-19 04:50:01 -0800733 rmp = vl_msg_api_alloc (sizeof (*rmp));
734 rmp->_vl_msg_id = htons (VL_API_SOCK_INIT_SHM_REPLY);
735 rmp->context = mp->context;
736 rmp->retval = htonl (rv);
737
Florin Coras8023ad42018-08-02 12:16:03 -0700738 /*
739 * Note: The reply message needs to make it out the back door
740 * before we send the magic fd message. That's taken care of by
741 * the send function.
742 */
743 vl_socket_api_send (regp, (u8 *) rmp);
Florin Coras90a63982017-12-19 04:50:01 -0800744
745 if (rv != 0)
746 return;
747
Florin Coras90a63982017-12-19 04:50:01 -0800748 /* Send the magic "here's your sign (aka fd)" socket message */
Florin Coras8023ad42018-08-02 12:16:03 -0700749 cf = vl_api_registration_file (regp);
wanghanlinec2c4c42021-03-02 17:18:06 +0800750 if (!cf)
751 {
752 clib_warning ("cf removed");
753 return;
754 }
Florin Coras1f30a592019-05-08 19:57:24 -0700755
756 /* Wait for reply to be consumed before sending the fd */
757 while (tries-- > 0)
758 {
759 int bytes;
760 rv = ioctl (cf->file_descriptor, TIOCOUTQ, &bytes);
761 if (rv < 0)
762 {
763 clib_unix_warning ("ioctl returned");
764 break;
765 }
766 if (bytes == 0)
767 break;
768 usleep (1e3);
769 }
770
Florin Coras466f2892018-08-03 02:50:43 -0700771 vl_sock_api_send_fd_msg (cf->file_descriptor, &memfd->fd, 1);
Florin Coras90a63982017-12-19 04:50:01 -0800772}
773
/*
 * X-macro list of the API messages handled by the socket transport.
 *
 * Each entry is _(N, n, t):
 *   N - upper-case message name, pasted onto VL_API_ to form the message id
 *   n - lower-case message name, pasted into vl_api_<n>_t and its helpers
 *   t - value forwarded to vl_msg_api_set_handlers () right after the
 *       message size (presumably the "traced" flag -- confirm against the
 *       vl_msg_api_set_handlers prototype)
 */
#define foreach_vlib_api_msg                                                  \
  _ (SOCKCLNT_CREATE, sockclnt_create, 0)                                     \
  _ (SOCKCLNT_DELETE, sockclnt_delete, 0)                                     \
  _ (SOCK_INIT_SHM, sock_init_shm, 0)
Dave Barach59b25652017-09-10 15:04:27 -0400778
779clib_error_t *
Florin Corase86a8ed2018-01-05 03:20:25 -0800780vl_sock_api_init (vlib_main_t * vm)
Dave Barach59b25652017-09-10 15:04:27 -0400781{
Filip Tehlar36217e32021-07-23 08:51:10 +0000782 api_main_t *am = vlibapi_get_main ();
Dave Barach59b25652017-09-10 15:04:27 -0400783 clib_file_main_t *fm = &file_main;
784 clib_file_t template = { 0 };
785 vl_api_registration_t *rp;
Dave Barach59b25652017-09-10 15:04:27 -0400786 socket_main_t *sm = &socket_main;
787 clib_socket_t *sock = &sm->socksvr_listen_socket;
788 clib_error_t *error;
789
790 /* If not explicitly configured, do not bind/enable, etc. */
791 if (sm->socket_name == 0)
792 return 0;
793
Filip Tehlar36217e32021-07-23 08:51:10 +0000794#define _(N, n, t) \
795 vl_msg_api_set_handlers (VL_API_##N, #n, vl_api_##n##_t_handler, \
796 vl_noop_handler, vl_api_##n##_t_endian, \
797 vl_api_##n##_t_print, sizeof (vl_api_##n##_t), t, \
798 vl_api_##n##_t_print_json, vl_api_##n##_t_tojson, \
799 vl_api_##n##_t_fromjson); \
800 am->api_trace_cfg[VL_API_##N].replay_enable = 0;
Dave Barach59b25652017-09-10 15:04:27 -0400801 foreach_vlib_api_msg;
802#undef _
803
804 vec_resize (sm->input_buffer, 4096);
805
806 sock->config = (char *) sm->socket_name;
Ole Troan4ff09ae2019-04-15 11:27:22 +0200807 sock->flags = CLIB_SOCKET_F_IS_SERVER | CLIB_SOCKET_F_ALLOW_GROUP_WRITE;
Dave Barach59b25652017-09-10 15:04:27 -0400808 error = clib_socket_init (sock);
809 if (error)
810 return error;
811
812 pool_get (sm->registration_pool, rp);
Dave Barachb7b92992018-10-17 10:38:51 -0400813 clib_memset (rp, 0, sizeof (*rp));
Dave Barach59b25652017-09-10 15:04:27 -0400814
815 rp->registration_type = REGISTRATION_TYPE_SOCKET_LISTEN;
816
817 template.read_function = socksvr_accept_ready;
818 template.write_function = socksvr_bogus_write;
819 template.file_descriptor = sock->fd;
Paul Vinciguerra5481ad42020-01-28 14:47:17 -0500820 template.description = format (0, "socksvr %s", sock->config);
Dave Barach59b25652017-09-10 15:04:27 -0400821 template.private_data = rp - sm->registration_pool;
822
823 rp->clib_file_index = clib_file_add (fm, &template);
824 return 0;
825}
826
827static clib_error_t *
828socket_exit (vlib_main_t * vm)
829{
Dave Barach59b25652017-09-10 15:04:27 -0400830 socket_main_t *sm = &socket_main;
831 vl_api_registration_t *rp;
832
833 /* Defensive driving in case something wipes out early */
834 if (sm->registration_pool)
835 {
836 u32 index;
837 /* *INDENT-OFF* */
Damjan Marionb2c31b62020-12-13 21:47:40 +0100838 pool_foreach (rp, sm->registration_pool) {
Florin Corasb384b542018-01-15 01:08:33 -0800839 vl_api_registration_del_file (rp);
840 index = rp->vl_api_registration_pool_index;
841 vl_socket_free_registration_index (index);
Damjan Marionb2c31b62020-12-13 21:47:40 +0100842 }
Dave Barach59b25652017-09-10 15:04:27 -0400843/* *INDENT-ON* */
844 }
845
846 return 0;
847}
848
849VLIB_MAIN_LOOP_EXIT_FUNCTION (socket_exit);
850
851static clib_error_t *
852socksvr_config (vlib_main_t * vm, unformat_input_t * input)
853{
854 socket_main_t *sm = &socket_main;
855
856 while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
857 {
858 if (unformat (input, "socket-name %s", &sm->socket_name))
859 ;
Ole Troan6595ff72019-08-07 13:41:39 +0200860 /* DEPRECATE: default keyword is ignored */
Dave Barach59b25652017-09-10 15:04:27 -0400861 else if (unformat (input, "default"))
Ole Troan6595ff72019-08-07 13:41:39 +0200862 ;
Dave Barach59b25652017-09-10 15:04:27 -0400863 else
864 {
865 return clib_error_return (0, "unknown input '%U'",
866 format_unformat_error, input);
867 }
868 }
Ole Troan6595ff72019-08-07 13:41:39 +0200869
870 if (!vec_len (sm->socket_name))
871 sm->socket_name = format (0, "%s/%s", vlib_unix_get_runtime_dir (),
872 API_SOCKET_FILENAME);
873 vec_terminate_c_string (sm->socket_name);
874
Dave Barach59b25652017-09-10 15:04:27 -0400875 return 0;
876}
877
878VLIB_CONFIG_FUNCTION (socksvr_config, "socksvr");
879
/*
 * Intentionally empty function.
 *
 * NOTE(review): presumably exists so other code can reference a symbol from
 * this object file and force it to be linked in -- confirm against callers.
 *
 * Declared with an explicit (void) parameter list so the definition is a
 * real prototype rather than an old-style, unchecked declarator.
 */
void
vlibsocket_reference (void)
{
}
884
Dave Barach59b25652017-09-10 15:04:27 -0400885/*
886 * fd.io coding-style-patch-verification: ON
887 *
888 * Local Variables:
889 * eval: (c-set-style "gnu")
890 * End:
891 */