blob: d85339b4dff6841a2a80d53f145c30971b1d11ae [file] [log] [blame]
Dave Barach59b25652017-09-10 15:04:27 -04001/*
2 *------------------------------------------------------------------
Ole Troan94495f22018-08-02 11:58:12 +02003 * socket_api.c
Dave Barach59b25652017-09-10 15:04:27 -04004 *
5 * Copyright (c) 2009 Cisco and/or its affiliates.
6 * Licensed under the Apache License, Version 2.0 (the "License");
7 * you may not use this file except in compliance with the License.
8 * You may obtain a copy of the License at:
9 *
10 * http://www.apache.org/licenses/LICENSE-2.0
11 *
12 * Unless required by applicable law or agreed to in writing, software
13 * distributed under the License is distributed on an "AS IS" BASIS,
14 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15 * See the License for the specific language governing permissions and
16 * limitations under the License.
17 *------------------------------------------------------------------
18 */
19
20#include <sys/types.h>
21#include <sys/socket.h>
22#include <netinet/in.h>
23#include <sys/ioctl.h>
Dave Barach59b25652017-09-10 15:04:27 -040024#include <fcntl.h>
25#include <sys/stat.h>
26
Florin Corase86a8ed2018-01-05 03:20:25 -080027#include <vppinfra/byte_order.h>
Florin Coras4d9b9d82018-01-14 12:25:50 -080028#include <svm/ssvm.h>
Dave Barach59b25652017-09-10 15:04:27 -040029#include <vlibmemory/api.h>
30
31#include <vlibmemory/vl_memory_msg_enum.h>
32
33#define vl_typedefs /* define message structures */
34#include <vlibmemory/vl_memory_api_h.h>
35#undef vl_typedefs
36
37/* instantiate all the print functions we know about */
38#define vl_print(handle, ...) vlib_cli_output (handle, __VA_ARGS__)
39#define vl_printfun
40#include <vlibmemory/vl_memory_api_h.h>
41#undef vl_printfun
42
43/* instantiate all the endian swap functions we know about */
44#define vl_endianfun
45#include <vlibmemory/vl_memory_api_h.h>
46#undef vl_endianfun
47
Florin Corase86a8ed2018-01-05 03:20:25 -080048socket_main_t socket_main;
49
/*
 * Marker bit OR-ed into a registration pool index to form the handle
 * handed out to socket API clients.
 * The literal is unsigned on purpose: shifting a signed 1 into bit 31
 * is undefined behaviour in C.
 */
#define SOCK_API_REG_HANDLE_BIT (1U << 31)
51
52static u32
53sock_api_registration_handle (vl_api_registration_t * regp)
54{
55 ASSERT (regp->vl_api_registration_pool_index < SOCK_API_REG_HANDLE_BIT);
56 return regp->vl_api_registration_pool_index | SOCK_API_REG_HANDLE_BIT;
57}
58
59static u32
60socket_api_registration_handle_to_index (u32 reg_index)
61{
62 return (reg_index & ~SOCK_API_REG_HANDLE_BIT);
63}
64
65u8
66vl_socket_api_registration_handle_is_valid (u32 reg_handle)
67{
68 return ((reg_handle & SOCK_API_REG_HANDLE_BIT) != 0);
69}
70
Dave Barach59b25652017-09-10 15:04:27 -040071void
Florin Corase86a8ed2018-01-05 03:20:25 -080072vl_sock_api_dump_clients (vlib_main_t * vm, api_main_t * am)
Dave Barach59b25652017-09-10 15:04:27 -040073{
74 vl_api_registration_t *reg;
75 socket_main_t *sm = &socket_main;
Dave Barach59b25652017-09-10 15:04:27 -040076 clib_file_t *f;
77
78 /*
79 * Must have at least one active client, not counting the
80 * REGISTRATION_TYPE_SOCKET_LISTEN bind/accept socket
81 */
82 if (pool_elts (sm->registration_pool) < 2)
83 return;
84
85 vlib_cli_output (vm, "Socket clients");
Florin Coras90a63982017-12-19 04:50:01 -080086 vlib_cli_output (vm, "%20s %8s", "Name", "Fildesc");
Dave Barach59b25652017-09-10 15:04:27 -040087 /* *INDENT-OFF* */
Damjan Marionb2c31b62020-12-13 21:47:40 +010088 pool_foreach (reg, sm->registration_pool)
89 {
Dave Barach59b25652017-09-10 15:04:27 -040090 if (reg->registration_type == REGISTRATION_TYPE_SOCKET_SERVER) {
Florin Corasb384b542018-01-15 01:08:33 -080091 f = vl_api_registration_file (reg);
92 vlib_cli_output (vm, "%20s %8d", reg->name, f->file_descriptor);
Dave Barach59b25652017-09-10 15:04:27 -040093 }
Damjan Marionb2c31b62020-12-13 21:47:40 +010094 }
Dave Barach59b25652017-09-10 15:04:27 -040095/* *INDENT-ON* */
96}
97
Ole Troan94495f22018-08-02 11:58:12 +020098vl_api_registration_t *
Florin Coras2881dec2018-10-02 18:29:25 -070099vl_socket_api_client_handle_to_registration (u32 handle)
Ole Troan94495f22018-08-02 11:58:12 +0200100{
101 socket_main_t *sm = &socket_main;
Florin Coras2881dec2018-10-02 18:29:25 -0700102 u32 index = socket_api_registration_handle_to_index (handle);
103 if (pool_is_free_index (sm->registration_pool, index))
Ole Troan94495f22018-08-02 11:58:12 +0200104 {
105#if DEBUG > 2
Florin Coras2881dec2018-10-02 18:29:25 -0700106 clib_warning ("Invalid index %d\n", index);
Ole Troan94495f22018-08-02 11:58:12 +0200107#endif
108 return 0;
109 }
Florin Coras2881dec2018-10-02 18:29:25 -0700110 return pool_elt_at_index (sm->registration_pool, index);
Ole Troan94495f22018-08-02 11:58:12 +0200111}
112
Dave Barach59b25652017-09-10 15:04:27 -0400113void
114vl_socket_api_send (vl_api_registration_t * rp, u8 * elem)
115{
Dave Barach59b25652017-09-10 15:04:27 -0400116#if CLIB_DEBUG > 1
117 u32 output_length;
118#endif
Florin Coras90a63982017-12-19 04:50:01 -0800119 socket_main_t *sm = &socket_main;
120 u16 msg_id = ntohs (*(u16 *) elem);
Dave Barach39d69112019-11-27 11:42:13 -0500121 api_main_t *am = vlibapi_get_main ();
Florin Coras90a63982017-12-19 04:50:01 -0800122 msgbuf_t *mb = (msgbuf_t *) (elem - offsetof (msgbuf_t, data));
Florin Coras90a63982017-12-19 04:50:01 -0800123 vl_api_registration_t *sock_rp;
Florin Coras8023ad42018-08-02 12:16:03 -0700124 clib_file_main_t *fm = &file_main;
125 clib_error_t *error;
Florin Corasb384b542018-01-15 01:08:33 -0800126 clib_file_t *cf;
Dave Barach59b25652017-09-10 15:04:27 -0400127
Florin Corasb384b542018-01-15 01:08:33 -0800128 cf = vl_api_registration_file (rp);
Dave Barach59b25652017-09-10 15:04:27 -0400129 ASSERT (rp->registration_type > REGISTRATION_TYPE_SHMEM);
130
131 if (msg_id >= vec_len (am->api_trace_cfg))
132 {
133 clib_warning ("id out of range: %d", msg_id);
134 vl_msg_api_free ((void *) elem);
135 return;
136 }
137
Florin Coras90a63982017-12-19 04:50:01 -0800138 sock_rp = pool_elt_at_index (sm->registration_pool,
139 rp->vl_api_registration_pool_index);
140 ASSERT (sock_rp);
141
Dave Barach59b25652017-09-10 15:04:27 -0400142 /* Add the msgbuf_t to the output vector */
Florin Coras8023ad42018-08-02 12:16:03 -0700143 vec_add (sock_rp->output_vector, (u8 *) mb, sizeof (*mb));
144
145 /* Try to send the message and save any error like
146 * we do in the input epoll loop */
147 vec_add (sock_rp->output_vector, elem, ntohl (mb->data_len));
148 error = clib_file_write (cf);
149 unix_save_error (&unix_main, error);
150
wanghanlinec2c4c42021-03-02 17:18:06 +0800151 /* Make sure cf not removed in clib_file_write */
152 cf = vl_api_registration_file (rp);
153 if (!cf)
154 {
155 clib_warning ("cf removed");
156 vl_msg_api_free ((void *) elem);
157 return;
158 }
159
Florin Coras8023ad42018-08-02 12:16:03 -0700160 /* If we didn't finish sending everything, wait for tx space */
161 if (vec_len (sock_rp->output_vector) > 0
162 && !(cf->flags & UNIX_FILE_DATA_AVAILABLE_TO_WRITE))
163 {
164 cf->flags |= UNIX_FILE_DATA_AVAILABLE_TO_WRITE;
165 fm->file_update (cf, UNIX_FILE_UPDATE_MODIFY);
166 }
Dave Barach59b25652017-09-10 15:04:27 -0400167
168#if CLIB_DEBUG > 1
169 output_length = sizeof (*mb) + ntohl (mb->data_len);
170 clib_warning ("wrote %u bytes to fd %d", output_length,
171 cf->file_descriptor);
172#endif
173
174 vl_msg_api_free ((void *) elem);
175}
176
177void
Florin Corase86a8ed2018-01-05 03:20:25 -0800178vl_socket_free_registration_index (u32 pool_index)
Dave Barach59b25652017-09-10 15:04:27 -0400179{
180 int i;
181 vl_api_registration_t *rp;
Dave Barach38ca6e62020-07-17 17:16:34 -0400182 void vl_api_call_reaper_functions (u32 client_index);
183
Dave Barach59b25652017-09-10 15:04:27 -0400184 if (pool_is_free_index (socket_main.registration_pool, pool_index))
185 {
186 clib_warning ("main pool index %d already free", pool_index);
187 return;
188 }
189 rp = pool_elt_at_index (socket_main.registration_pool, pool_index);
190
Dave Barach38ca6e62020-07-17 17:16:34 -0400191 vl_api_call_reaper_functions (pool_index);
192
Dave Barach59b25652017-09-10 15:04:27 -0400193 ASSERT (rp->registration_type != REGISTRATION_TYPE_FREE);
194 for (i = 0; i < vec_len (rp->additional_fds_to_close); i++)
195 if (close (rp->additional_fds_to_close[i]) < 0)
196 clib_unix_warning ("close");
197 vec_free (rp->additional_fds_to_close);
198 vec_free (rp->name);
199 vec_free (rp->unprocessed_input);
200 vec_free (rp->output_vector);
201 rp->registration_type = REGISTRATION_TYPE_FREE;
202 pool_put (socket_main.registration_pool, rp);
203}
204
205void
Florin Coras5224b5c2019-12-06 17:05:08 -0800206vl_socket_process_api_msg (vl_api_registration_t * rp, i8 * input_v)
Dave Barach59b25652017-09-10 15:04:27 -0400207{
208 msgbuf_t *mbp = (msgbuf_t *) input_v;
209
210 u8 *the_msg = (u8 *) (mbp->data);
Dave Barach59b25652017-09-10 15:04:27 -0400211 socket_main.current_rp = rp;
212 vl_msg_api_socket_handler (the_msg);
Dave Barach59b25652017-09-10 15:04:27 -0400213 socket_main.current_rp = 0;
214}
215
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200216/*
217 * Read function for API socket.
218 *
219 * Read data from socket, invoke SOCKET_READ_EVENT
220 * for each fully read API message, return 0.
221 * Store incomplete data for next invocation to continue.
222 *
223 * On severe read error, the file is closed.
224 *
225 * As reading is single threaded,
226 * socket_main.input_buffer is used temporarily.
227 * Even its length is modified, but always restored before return.
228 *
229 * Incomplete data is copied into a vector,
230 * pointer saved in registration's unprocessed_input.
231 */
Dave Barach59b25652017-09-10 15:04:27 -0400232clib_error_t *
233vl_socket_read_ready (clib_file_t * uf)
234{
235 clib_file_main_t *fm = &file_main;
236 vlib_main_t *vm = vlib_get_main ();
237 vl_api_registration_t *rp;
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200238 /* n is the size of data read to input_buffer */
Dave Barach59b25652017-09-10 15:04:27 -0400239 int n;
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200240 /* msg_buffer vector can point to input_buffer or unprocessed_input */
Dave Barach59b25652017-09-10 15:04:27 -0400241 i8 *msg_buffer = 0;
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200242 /* data_for_process is a vector containing one full message, incl msgbuf_t */
Dave Barach59b25652017-09-10 15:04:27 -0400243 u8 *data_for_process;
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200244 /* msgbuf_len is the size of one message, including sizeof (msgbuf_t) */
245 u32 msgbuf_len;
Dave Barach59b25652017-09-10 15:04:27 -0400246 u32 save_input_buffer_length = vec_len (socket_main.input_buffer);
247 vl_socket_args_for_process_t *a;
Florin Coras5224b5c2019-12-06 17:05:08 -0800248 u32 reg_index = uf->private_data;
Dave Barach59b25652017-09-10 15:04:27 -0400249
Florin Coras5224b5c2019-12-06 17:05:08 -0800250 rp = vl_socket_get_registration (reg_index);
Dave Barach59b25652017-09-10 15:04:27 -0400251
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200252 /* Ignore unprocessed_input for now, n describes input_buffer for now. */
Dave Barach59b25652017-09-10 15:04:27 -0400253 n = read (uf->file_descriptor, socket_main.input_buffer,
254 vec_len (socket_main.input_buffer));
255
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200256 if (n <= 0)
Dave Barach59b25652017-09-10 15:04:27 -0400257 {
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200258 if (errno != EAGAIN)
259 {
260 /* Severe error, close the file. */
261 clib_file_del (fm, uf);
Florin Coras5224b5c2019-12-06 17:05:08 -0800262 vl_socket_free_registration_index (reg_index);
Dave Barach59b25652017-09-10 15:04:27 -0400263 }
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200264 /* EAGAIN means we do not close the file, but no data to process anyway. */
Dave Barach59b25652017-09-10 15:04:27 -0400265 return 0;
266 }
267
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200268 /* Fake smaller length teporarily, so input_buffer can be used as msg_buffer. */
Dave Barach59b25652017-09-10 15:04:27 -0400269 _vec_len (socket_main.input_buffer) = n;
270
271 /*
272 * Look for bugs here. This code is tricky because
273 * data read from a stream socket does not honor message
274 * boundaries. In the case of a long message (>4K bytes)
275 * we have to do (at least) 2 reads, etc.
276 */
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200277 /* Determine msg_buffer. */
278 if (vec_len (rp->unprocessed_input))
279 {
280 vec_append (rp->unprocessed_input, socket_main.input_buffer);
281 msg_buffer = rp->unprocessed_input;
282 }
283 else
284 {
285 msg_buffer = socket_main.input_buffer;
286 }
287 /* Loop to process any full messages. */
288 ASSERT (vec_len (msg_buffer) > 0);
Dave Barach59b25652017-09-10 15:04:27 -0400289 do
290 {
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200291 /* Here, we are not sure how big a chunk of message we have left. */
292 /* Do we at least know how big the full message will be? */
293 if (vec_len (msg_buffer) <= sizeof (msgbuf_t))
294 /* No, so fragment is not a full message. */
295 goto save_and_split;
Dave Barach59b25652017-09-10 15:04:27 -0400296
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200297 /* Now we know how big the full message will be. */
298 msgbuf_len =
299 ntohl (((msgbuf_t *) msg_buffer)->data_len) + sizeof (msgbuf_t);
Dave Barach59b25652017-09-10 15:04:27 -0400300
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200301 /* But do we have a full message? */
302 if (msgbuf_len > vec_len (msg_buffer))
Dave Barach59b25652017-09-10 15:04:27 -0400303 {
304 save_and_split:
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200305 /* We don't have the entire message yet. */
306 /* If msg_buffer is unprocessed_input, nothing needs to be done. */
Dave Barach59b25652017-09-10 15:04:27 -0400307 if (msg_buffer == socket_main.input_buffer)
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200308 /* But if we were using the input buffer, save the fragment. */
Dave Barach59b25652017-09-10 15:04:27 -0400309 {
310 ASSERT (vec_len (rp->unprocessed_input) == 0);
311 vec_validate (rp->unprocessed_input, vec_len (msg_buffer) - 1);
Dave Barach178cf492018-11-13 16:34:13 -0500312 clib_memcpy_fast (rp->unprocessed_input, msg_buffer,
313 vec_len (msg_buffer));
Dave Barach59b25652017-09-10 15:04:27 -0400314 _vec_len (rp->unprocessed_input) = vec_len (msg_buffer);
315 }
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200316 /* No more full messages, restore original input_buffer length. */
Dave Barach59b25652017-09-10 15:04:27 -0400317 _vec_len (socket_main.input_buffer) = save_input_buffer_length;
318 return 0;
319 }
320
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200321 /*
322 * We have at least one full message.
323 * But msg_buffer can contain more data, so copy one message data
324 * so we can overwrite its length to what single message has.
325 */
Dave Barach59b25652017-09-10 15:04:27 -0400326 data_for_process = (u8 *) vec_dup (msg_buffer);
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200327 _vec_len (data_for_process) = msgbuf_len;
328 /* Everything is ready to signal the SOCKET_READ_EVENT. */
Dave Barach59b25652017-09-10 15:04:27 -0400329 pool_get (socket_main.process_args, a);
Florin Coras5224b5c2019-12-06 17:05:08 -0800330 a->reg_index = reg_index;
Dave Barach59b25652017-09-10 15:04:27 -0400331 a->data = data_for_process;
332
Florin Corase86a8ed2018-01-05 03:20:25 -0800333 vlib_process_signal_event (vm, vl_api_clnt_node.index,
Dave Barach59b25652017-09-10 15:04:27 -0400334 SOCKET_READ_EVENT,
335 a - socket_main.process_args);
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200336 if (vec_len (msg_buffer) > msgbuf_len)
337 /* There are some fragments left. Shrink the msg_buffer to simplify logic. */
338 vec_delete (msg_buffer, msgbuf_len, 0);
Dave Barach59b25652017-09-10 15:04:27 -0400339 else
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200340 /* We are done with msg_buffer. */
Dave Barach59b25652017-09-10 15:04:27 -0400341 _vec_len (msg_buffer) = 0;
Dave Barach59b25652017-09-10 15:04:27 -0400342 }
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200343 while (vec_len (msg_buffer) > 0);
Dave Barach59b25652017-09-10 15:04:27 -0400344
Vratko Polak6a6af6e2019-10-07 14:52:53 +0200345 /* Restore input_buffer, it could have been msg_buffer. */
Dave Barach59b25652017-09-10 15:04:27 -0400346 _vec_len (socket_main.input_buffer) = save_input_buffer_length;
Dave Barach59b25652017-09-10 15:04:27 -0400347 return 0;
348}
349
Dave Barach59b25652017-09-10 15:04:27 -0400350clib_error_t *
351vl_socket_write_ready (clib_file_t * uf)
352{
353 clib_file_main_t *fm = &file_main;
354 vl_api_registration_t *rp;
355 int n;
356
357 rp = pool_elt_at_index (socket_main.registration_pool, uf->private_data);
358
359 /* Flush output vector. */
Ole Troan94495f22018-08-02 11:58:12 +0200360 size_t total_bytes = vec_len (rp->output_vector);
361 size_t bytes_to_send, remaining_bytes = total_bytes;
362 void *p = rp->output_vector;
363 while (remaining_bytes > 0)
Dave Barach59b25652017-09-10 15:04:27 -0400364 {
Ole Troan94495f22018-08-02 11:58:12 +0200365 bytes_to_send = remaining_bytes > 4096 ? 4096 : remaining_bytes;
366 n = write (uf->file_descriptor, p, bytes_to_send);
367 if (n < 0)
Florin Coras8023ad42018-08-02 12:16:03 -0700368 {
Ole Troan94495f22018-08-02 11:58:12 +0200369 if (errno == EAGAIN)
370 {
371 break;
372 }
373#if DEBUG > 2
374 clib_warning ("write error, close the file...\n");
375#endif
376 clib_file_del (fm, uf);
377 vl_socket_free_registration_index (rp -
378 socket_main.registration_pool);
379 return 0;
Florin Coras8023ad42018-08-02 12:16:03 -0700380 }
Ole Troan94495f22018-08-02 11:58:12 +0200381 remaining_bytes -= bytes_to_send;
382 p += bytes_to_send;
383 }
384
385 vec_delete (rp->output_vector, total_bytes - remaining_bytes, 0);
386 if (vec_len (rp->output_vector) <= 0
387 && (uf->flags & UNIX_FILE_DATA_AVAILABLE_TO_WRITE))
388 {
389 uf->flags &= ~UNIX_FILE_DATA_AVAILABLE_TO_WRITE;
390 fm->file_update (uf, UNIX_FILE_UPDATE_MODIFY);
Florin Coras8023ad42018-08-02 12:16:03 -0700391 }
Dave Barach59b25652017-09-10 15:04:27 -0400392
393 return 0;
394}
395
396clib_error_t *
397vl_socket_error_ready (clib_file_t * uf)
398{
399 vl_api_registration_t *rp;
400 clib_file_main_t *fm = &file_main;
401
402 rp = pool_elt_at_index (socket_main.registration_pool, uf->private_data);
403 clib_file_del (fm, uf);
Florin Corase86a8ed2018-01-05 03:20:25 -0800404 vl_socket_free_registration_index (rp - socket_main.registration_pool);
Dave Barach59b25652017-09-10 15:04:27 -0400405
406 return 0;
407}
408
409void
410socksvr_file_add (clib_file_main_t * fm, int fd)
411{
412 vl_api_registration_t *rp;
413 clib_file_t template = { 0 };
414
415 pool_get (socket_main.registration_pool, rp);
Dave Barachb7b92992018-10-17 10:38:51 -0400416 clib_memset (rp, 0, sizeof (*rp));
Dave Barach59b25652017-09-10 15:04:27 -0400417
418 template.read_function = vl_socket_read_ready;
419 template.write_function = vl_socket_write_ready;
420 template.error_function = vl_socket_error_ready;
421 template.file_descriptor = fd;
Paul Vinciguerra5481ad42020-01-28 14:47:17 -0500422 template.description = format (0, "socksrv");
Dave Barach59b25652017-09-10 15:04:27 -0400423 template.private_data = rp - socket_main.registration_pool;
424
425 rp->registration_type = REGISTRATION_TYPE_SOCKET_SERVER;
426 rp->vl_api_registration_pool_index = rp - socket_main.registration_pool;
427 rp->clib_file_index = clib_file_add (fm, &template);
428}
429
430static clib_error_t *
431socksvr_accept_ready (clib_file_t * uf)
432{
433 clib_file_main_t *fm = &file_main;
434 socket_main_t *sm = &socket_main;
435 clib_socket_t *sock = &sm->socksvr_listen_socket;
436 clib_socket_t client;
437 clib_error_t *error;
438
439 error = clib_socket_accept (sock, &client);
Dave Barach59b25652017-09-10 15:04:27 -0400440 if (error)
441 return error;
442
443 socksvr_file_add (fm, client.fd);
444 return 0;
445}
446
447static clib_error_t *
448socksvr_bogus_write (clib_file_t * uf)
449{
450 clib_warning ("why am I here?");
451 return 0;
452}
453
454/*
455 * vl_api_sockclnt_create_t_handler
456 */
457void
458vl_api_sockclnt_create_t_handler (vl_api_sockclnt_create_t * mp)
459{
460 vl_api_registration_t *regp;
461 vl_api_sockclnt_create_reply_t *rp;
Dave Barach39d69112019-11-27 11:42:13 -0500462 api_main_t *am = vlibapi_get_main ();
Ole Troan94495f22018-08-02 11:58:12 +0200463 hash_pair_t *hp;
Florin Coras90a63982017-12-19 04:50:01 -0800464 int rv = 0;
Ole Troan94495f22018-08-02 11:58:12 +0200465 u32 nmsg = hash_elts (am->msg_index_by_name_and_crc);
466 u32 i = 0;
Dave Barach59b25652017-09-10 15:04:27 -0400467
468 regp = socket_main.current_rp;
469
470 ASSERT (regp->registration_type == REGISTRATION_TYPE_SOCKET_SERVER);
471
Ole Troan7adaa222019-08-27 15:05:27 +0200472 regp->name = format (0, "%s%c", mp->name, 0);
Dave Barach59b25652017-09-10 15:04:27 -0400473
Ole Troan94495f22018-08-02 11:58:12 +0200474 u32 size = sizeof (*rp) + (nmsg * sizeof (vl_api_message_table_entry_t));
Vratko Polakfc4828c2019-07-02 11:07:24 +0200475 rp = vl_msg_api_alloc_zero (size);
Dave Barach59b25652017-09-10 15:04:27 -0400476 rp->_vl_msg_id = htons (VL_API_SOCKCLNT_CREATE_REPLY);
Florin Coras2881dec2018-10-02 18:29:25 -0700477 rp->index = htonl (sock_api_registration_handle (regp));
Dave Barach59b25652017-09-10 15:04:27 -0400478 rp->context = mp->context;
479 rp->response = htonl (rv);
Ole Troan94495f22018-08-02 11:58:12 +0200480 rp->count = htons (nmsg);
Dave Barach59b25652017-09-10 15:04:27 -0400481
Ole Troan94495f22018-08-02 11:58:12 +0200482 /* *INDENT-OFF* */
483 hash_foreach_pair (hp, am->msg_index_by_name_and_crc,
484 ({
485 rp->message_table[i].index = htons(hp->value[0]);
Dave Baracha6ef36b2020-02-11 10:29:13 -0500486 (void) strncpy_s((char *)rp->message_table[i].name,
487 64 /* bytes of space at dst */,
488 (char *)hp->key,
489 64-1 /* chars to copy, without zero byte. */);
Ole Troan94495f22018-08-02 11:58:12 +0200490 i++;
491 }));
492 /* *INDENT-ON* */
Florin Corase86a8ed2018-01-05 03:20:25 -0800493 vl_api_send_msg (regp, (u8 *) rp);
Dave Barach59b25652017-09-10 15:04:27 -0400494}
495
496/*
497 * vl_api_sockclnt_delete_t_handler
498 */
499void
500vl_api_sockclnt_delete_t_handler (vl_api_sockclnt_delete_t * mp)
501{
502 vl_api_registration_t *regp;
503 vl_api_sockclnt_delete_reply_t *rp;
504
Ole Troan94495f22018-08-02 11:58:12 +0200505 regp = vl_api_client_index_to_registration (mp->client_index);
506 if (!regp)
507 return;
508
Ole Troan3c1cf2c2019-01-05 11:27:54 +0100509 u32 reg_index = socket_api_registration_handle_to_index (ntohl (mp->index));
Ole Troan94495f22018-08-02 11:58:12 +0200510 rp = vl_msg_api_alloc (sizeof (*rp));
511 rp->_vl_msg_id = htons (VL_API_SOCKCLNT_DELETE_REPLY);
512 rp->context = mp->context;
513
514 if (!pool_is_free_index (socket_main.registration_pool, reg_index))
Dave Barach59b25652017-09-10 15:04:27 -0400515 {
Dave Barach59b25652017-09-10 15:04:27 -0400516 rp->response = htonl (1);
Florin Corase86a8ed2018-01-05 03:20:25 -0800517 vl_api_send_msg (regp, (u8 *) rp);
Dave Barach59b25652017-09-10 15:04:27 -0400518
Florin Corasb384b542018-01-15 01:08:33 -0800519 vl_api_registration_del_file (regp);
Ole Troan94495f22018-08-02 11:58:12 +0200520 vl_socket_free_registration_index (reg_index);
Dave Barach59b25652017-09-10 15:04:27 -0400521 }
522 else
523 {
Ole Troan94495f22018-08-02 11:58:12 +0200524 clib_warning ("unknown client ID %d", reg_index);
525 rp->response = htonl (-1);
526 vl_api_send_msg (regp, (u8 *) rp);
Dave Barach59b25652017-09-10 15:04:27 -0400527 }
528}
529
Florin Corasb384b542018-01-15 01:08:33 -0800530clib_error_t *
Florin Coras466f2892018-08-03 02:50:43 -0700531vl_sock_api_send_fd_msg (int socket_fd, int fds[], int n_fds)
Dave Barach59b25652017-09-10 15:04:27 -0400532{
533 struct msghdr mh = { 0 };
534 struct iovec iov[1];
Florin Coras99368312018-08-02 10:45:44 -0700535 char ctl[CMSG_SPACE (sizeof (int) * n_fds)];
Florin Coras466f2892018-08-03 02:50:43 -0700536 struct cmsghdr *cmsg;
537 char *msg = "fdmsg";
Dave Barach59b25652017-09-10 15:04:27 -0400538 int rv;
539
540 iov[0].iov_base = msg;
541 iov[0].iov_len = strlen (msg);
542 mh.msg_iov = iov;
543 mh.msg_iovlen = 1;
544
Dave Barachb7b92992018-10-17 10:38:51 -0400545 clib_memset (&ctl, 0, sizeof (ctl));
Dave Barach59b25652017-09-10 15:04:27 -0400546 mh.msg_control = ctl;
547 mh.msg_controllen = sizeof (ctl);
548 cmsg = CMSG_FIRSTHDR (&mh);
Florin Coras466f2892018-08-03 02:50:43 -0700549 cmsg->cmsg_len = CMSG_LEN (sizeof (int) * n_fds);
Dave Barach59b25652017-09-10 15:04:27 -0400550 cmsg->cmsg_level = SOL_SOCKET;
551 cmsg->cmsg_type = SCM_RIGHTS;
Dave Barach178cf492018-11-13 16:34:13 -0500552 clib_memcpy_fast (CMSG_DATA (cmsg), fds, sizeof (int) * n_fds);
Dave Barach59b25652017-09-10 15:04:27 -0400553
Florin Coras587ea452020-08-17 20:46:34 -0700554 while ((rv = sendmsg (socket_fd, &mh, 0)) < 0 && errno == EAGAIN)
555 ;
Dave Barach59b25652017-09-10 15:04:27 -0400556 if (rv < 0)
557 return clib_error_return_unix (0, "sendmsg");
558 return 0;
559}
560
Florin Coras90a63982017-12-19 04:50:01 -0800561vl_api_shm_elem_config_t *
562vl_api_make_shm_config (vl_api_sock_init_shm_t * mp)
563{
564 vl_api_shm_elem_config_t *config = 0, *c;
565 u64 cfg;
566 int i;
567
568 if (!mp->nitems)
569 {
Dave Barach78958722018-05-10 16:44:27 -0400570 vec_validate (config, 6);
Florin Coras90a63982017-12-19 04:50:01 -0800571 config[0].type = VL_API_VLIB_RING;
Florin Coras90a63982017-12-19 04:50:01 -0800572 config[0].size = 256;
Dave Barach78958722018-05-10 16:44:27 -0400573 config[0].count = 32;
574
575 config[1].type = VL_API_VLIB_RING;
Florin Coras90a63982017-12-19 04:50:01 -0800576 config[1].size = 1024;
Dave Barach78958722018-05-10 16:44:27 -0400577 config[1].count = 16;
578
579 config[2].type = VL_API_VLIB_RING;
Florin Coras90a63982017-12-19 04:50:01 -0800580 config[2].size = 4096;
Dave Barach78958722018-05-10 16:44:27 -0400581 config[2].count = 2;
582
583 config[3].type = VL_API_CLIENT_RING;
584 config[3].size = 256;
585 config[3].count = 32;
586
587 config[4].type = VL_API_CLIENT_RING;
588 config[4].size = 1024;
589 config[4].count = 16;
590
591 config[5].type = VL_API_CLIENT_RING;
592 config[5].size = 4096;
593 config[5].count = 2;
594
595 config[6].type = VL_API_QUEUE;
596 config[6].count = 128;
597 config[6].size = sizeof (uword);
Florin Coras90a63982017-12-19 04:50:01 -0800598 }
599 else
600 {
601 vec_validate (config, mp->nitems - 1);
602 for (i = 0; i < mp->nitems; i++)
603 {
604 cfg = mp->configs[i];
605 /* Pretty much a hack but it avoids defining our own api type
606 * in memclnt.api */
607 c = (vl_api_shm_elem_config_t *) & cfg;
608 config[i].type = c->type;
609 config[i].count = c->count;
610 config[i].size = c->size;
611 }
612 }
613 return config;
614}
615
Dave Barach59b25652017-09-10 15:04:27 -0400616/*
Florin Coras90a63982017-12-19 04:50:01 -0800617 * Bootstrap shm api using the socket api
Dave Barach59b25652017-09-10 15:04:27 -0400618 */
619void
Florin Coras90a63982017-12-19 04:50:01 -0800620vl_api_sock_init_shm_t_handler (vl_api_sock_init_shm_t * mp)
Dave Barach59b25652017-09-10 15:04:27 -0400621{
Florin Coras90a63982017-12-19 04:50:01 -0800622 vl_api_sock_init_shm_reply_t *rmp;
Florin Coras4d9b9d82018-01-14 12:25:50 -0800623 ssvm_private_t _memfd_private, *memfd = &_memfd_private;
Dave Barach59b25652017-09-10 15:04:27 -0400624 svm_map_region_args_t _args, *a = &_args;
Florin Coras90a63982017-12-19 04:50:01 -0800625 vl_api_registration_t *regp;
Dave Barach39d69112019-11-27 11:42:13 -0500626 api_main_t *am = vlibapi_get_main ();
Dave Barach59b25652017-09-10 15:04:27 -0400627 svm_region_t *vlib_rp;
Florin Coras90a63982017-12-19 04:50:01 -0800628 clib_file_t *cf;
629 vl_api_shm_elem_config_t *config = 0;
Florin Corasb384b542018-01-15 01:08:33 -0800630 vl_shmem_hdr_t *shmem_hdr;
Florin Coras1f30a592019-05-08 19:57:24 -0700631 int rv, tries = 1000;
Dave Barach59b25652017-09-10 15:04:27 -0400632
633 regp = vl_api_client_index_to_registration (mp->client_index);
Dave Barach59b25652017-09-10 15:04:27 -0400634 if (regp == 0)
635 {
636 clib_warning ("API client disconnected");
637 return;
638 }
Dave Barach59b25652017-09-10 15:04:27 -0400639 if (regp->registration_type != REGISTRATION_TYPE_SOCKET_SERVER)
640 {
wanghanlinec2c4c42021-03-02 17:18:06 +0800641 clib_warning ("Invalid registration");
642 return;
Dave Barach59b25652017-09-10 15:04:27 -0400643 }
644
Florin Coras90a63982017-12-19 04:50:01 -0800645 /*
646 * Set up a memfd segment of the requested size wherein the
647 * shmem data structures will be initialized
648 */
Dave Barachb7b92992018-10-17 10:38:51 -0400649 clib_memset (memfd, 0, sizeof (*memfd));
Florin Coras4d9b9d82018-01-14 12:25:50 -0800650 memfd->ssvm_size = mp->requested_size;
Dave Barach59b25652017-09-10 15:04:27 -0400651 memfd->requested_va = 0ULL;
Florin Coras5220a262020-09-29 18:11:24 -0700652 memfd->is_server = 1;
Dave Barach59b25652017-09-10 15:04:27 -0400653 memfd->name = format (0, "%s%c", regp->name, 0);
654
Florin Coras5220a262020-09-29 18:11:24 -0700655 if ((rv = ssvm_server_init_memfd (memfd)))
Dave Barach59b25652017-09-10 15:04:27 -0400656 goto reply;
657
Benoît Gannedf601ae2020-10-20 14:31:55 +0200658 /* delete the unused heap created in ssvm_server_init_memfd and mark it
659 * accessible again for ASAN */
660 clib_mem_destroy_heap (memfd->sh->heap);
661 CLIB_MEM_UNPOISON ((void *) memfd->sh->ssvm_va, memfd->ssvm_size);
662
Dave Barach59b25652017-09-10 15:04:27 -0400663 /* Remember to close this fd when the socket connection goes away */
664 vec_add1 (regp->additional_fds_to_close, memfd->fd);
665
Florin Coras90a63982017-12-19 04:50:01 -0800666 /*
667 * Create a plausible svm_region in the memfd backed segment
668 */
Dave Barachb7b92992018-10-17 10:38:51 -0400669 clib_memset (a, 0, sizeof (*a));
Florin Coras4d9b9d82018-01-14 12:25:50 -0800670 a->baseva = memfd->sh->ssvm_va + MMAP_PAGESIZE;
671 a->size = memfd->ssvm_size - MMAP_PAGESIZE;
Dave Barach59b25652017-09-10 15:04:27 -0400672 /* $$$$ might want a different config parameter */
673 a->pvt_heap_size = am->api_pvt_heap_size;
674 a->flags = SVM_FLAGS_MHEAP;
675 svm_region_init_mapped_region (a, (svm_region_t *) a->baseva);
676
Dave Barach59b25652017-09-10 15:04:27 -0400677 /*
678 * Part deux, initialize the svm_region_t shared-memory header
679 * api allocation rings, and so on.
680 */
Florin Coras90a63982017-12-19 04:50:01 -0800681 config = vl_api_make_shm_config (mp);
682 vlib_rp = (svm_region_t *) a->baseva;
683 vl_init_shmem (vlib_rp, config, 1 /* is_vlib (dont-care) */ ,
684 1 /* is_private */ );
Florin Corasb384b542018-01-15 01:08:33 -0800685
686 /* Remember who created this. Needs to be post vl_init_shmem */
687 shmem_hdr = (vl_shmem_hdr_t *) vlib_rp->user_ctx;
688 shmem_hdr->clib_file_index = vl_api_registration_file_index (regp);
689
Dave Barach59b25652017-09-10 15:04:27 -0400690 vec_add1 (am->vlib_private_rps, vlib_rp);
Dave Barach59b25652017-09-10 15:04:27 -0400691 memfd->sh->ready = 1;
Florin Coras90a63982017-12-19 04:50:01 -0800692 vec_free (config);
Dave Barach59b25652017-09-10 15:04:27 -0400693
694 /* Recompute the set of input queues to poll in memclnt_process */
695 vec_reset_length (vl_api_queue_cursizes);
696
697reply:
698
Florin Coras90a63982017-12-19 04:50:01 -0800699 rmp = vl_msg_api_alloc (sizeof (*rmp));
700 rmp->_vl_msg_id = htons (VL_API_SOCK_INIT_SHM_REPLY);
701 rmp->context = mp->context;
702 rmp->retval = htonl (rv);
703
Florin Coras8023ad42018-08-02 12:16:03 -0700704 /*
705 * Note: The reply message needs to make it out the back door
706 * before we send the magic fd message. That's taken care of by
707 * the send function.
708 */
709 vl_socket_api_send (regp, (u8 *) rmp);
Florin Coras90a63982017-12-19 04:50:01 -0800710
711 if (rv != 0)
712 return;
713
Florin Coras90a63982017-12-19 04:50:01 -0800714 /* Send the magic "here's your sign (aka fd)" socket message */
Florin Coras8023ad42018-08-02 12:16:03 -0700715 cf = vl_api_registration_file (regp);
wanghanlinec2c4c42021-03-02 17:18:06 +0800716 if (!cf)
717 {
718 clib_warning ("cf removed");
719 return;
720 }
Florin Coras1f30a592019-05-08 19:57:24 -0700721
722 /* Wait for reply to be consumed before sending the fd */
723 while (tries-- > 0)
724 {
725 int bytes;
726 rv = ioctl (cf->file_descriptor, TIOCOUTQ, &bytes);
727 if (rv < 0)
728 {
729 clib_unix_warning ("ioctl returned");
730 break;
731 }
732 if (bytes == 0)
733 break;
734 usleep (1e3);
735 }
736
Florin Coras466f2892018-08-03 02:50:43 -0700737 vl_sock_api_send_fd_msg (cf->file_descriptor, &memfd->fd, 1);
Florin Coras90a63982017-12-19 04:50:01 -0800738}
739
/*
 * Table of the socket API messages handled in this file.
 *
 * Each row is _(MESSAGE_ID_SUFFIX, handler_stem, t).  The user supplies
 * the definition of _() before expanding the list; vl_sock_api_init()
 * forwards the third field as the final argument of
 * vl_msg_api_set_handlers().
 */
#define foreach_vlib_api_msg                            \
_(SOCKCLNT_CREATE, sockclnt_create, 1)                  \
_(SOCKCLNT_DELETE, sockclnt_delete, 1)                  \
_(SOCK_INIT_SHM, sock_init_shm, 1)
Dave Barach59b25652017-09-10 15:04:27 -0400744
745clib_error_t *
Florin Corase86a8ed2018-01-05 03:20:25 -0800746vl_sock_api_init (vlib_main_t * vm)
Dave Barach59b25652017-09-10 15:04:27 -0400747{
748 clib_file_main_t *fm = &file_main;
749 clib_file_t template = { 0 };
750 vl_api_registration_t *rp;
Dave Barach59b25652017-09-10 15:04:27 -0400751 socket_main_t *sm = &socket_main;
752 clib_socket_t *sock = &sm->socksvr_listen_socket;
753 clib_error_t *error;
754
755 /* If not explicitly configured, do not bind/enable, etc. */
756 if (sm->socket_name == 0)
757 return 0;
758
Ole Troanedfe2c02019-07-30 15:38:13 +0200759#define _(N,n,t) \
Florin Coras90a63982017-12-19 04:50:01 -0800760 vl_msg_api_set_handlers(VL_API_##N, #n, \
761 vl_api_##n##_t_handler, \
762 vl_noop_handler, \
763 vl_api_##n##_t_endian, \
764 vl_api_##n##_t_print, \
Ole Troanedfe2c02019-07-30 15:38:13 +0200765 sizeof(vl_api_##n##_t), t);
Dave Barach59b25652017-09-10 15:04:27 -0400766 foreach_vlib_api_msg;
767#undef _
768
769 vec_resize (sm->input_buffer, 4096);
770
771 sock->config = (char *) sm->socket_name;
Ole Troan4ff09ae2019-04-15 11:27:22 +0200772 sock->flags = CLIB_SOCKET_F_IS_SERVER | CLIB_SOCKET_F_ALLOW_GROUP_WRITE;
Dave Barach59b25652017-09-10 15:04:27 -0400773 error = clib_socket_init (sock);
774 if (error)
775 return error;
776
777 pool_get (sm->registration_pool, rp);
Dave Barachb7b92992018-10-17 10:38:51 -0400778 clib_memset (rp, 0, sizeof (*rp));
Dave Barach59b25652017-09-10 15:04:27 -0400779
780 rp->registration_type = REGISTRATION_TYPE_SOCKET_LISTEN;
781
782 template.read_function = socksvr_accept_ready;
783 template.write_function = socksvr_bogus_write;
784 template.file_descriptor = sock->fd;
Paul Vinciguerra5481ad42020-01-28 14:47:17 -0500785 template.description = format (0, "socksvr %s", sock->config);
Dave Barach59b25652017-09-10 15:04:27 -0400786 template.private_data = rp - sm->registration_pool;
787
788 rp->clib_file_index = clib_file_add (fm, &template);
789 return 0;
790}
791
792static clib_error_t *
793socket_exit (vlib_main_t * vm)
794{
Dave Barach59b25652017-09-10 15:04:27 -0400795 socket_main_t *sm = &socket_main;
796 vl_api_registration_t *rp;
797
798 /* Defensive driving in case something wipes out early */
799 if (sm->registration_pool)
800 {
801 u32 index;
802 /* *INDENT-OFF* */
Damjan Marionb2c31b62020-12-13 21:47:40 +0100803 pool_foreach (rp, sm->registration_pool) {
Florin Corasb384b542018-01-15 01:08:33 -0800804 vl_api_registration_del_file (rp);
805 index = rp->vl_api_registration_pool_index;
806 vl_socket_free_registration_index (index);
Damjan Marionb2c31b62020-12-13 21:47:40 +0100807 }
Dave Barach59b25652017-09-10 15:04:27 -0400808/* *INDENT-ON* */
809 }
810
811 return 0;
812}
813
814VLIB_MAIN_LOOP_EXIT_FUNCTION (socket_exit);
815
816static clib_error_t *
817socksvr_config (vlib_main_t * vm, unformat_input_t * input)
818{
819 socket_main_t *sm = &socket_main;
820
821 while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
822 {
823 if (unformat (input, "socket-name %s", &sm->socket_name))
824 ;
Ole Troan6595ff72019-08-07 13:41:39 +0200825 /* DEPRECATE: default keyword is ignored */
Dave Barach59b25652017-09-10 15:04:27 -0400826 else if (unformat (input, "default"))
Ole Troan6595ff72019-08-07 13:41:39 +0200827 ;
Dave Barach59b25652017-09-10 15:04:27 -0400828 else
829 {
830 return clib_error_return (0, "unknown input '%U'",
831 format_unformat_error, input);
832 }
833 }
Ole Troan6595ff72019-08-07 13:41:39 +0200834
835 if (!vec_len (sm->socket_name))
836 sm->socket_name = format (0, "%s/%s", vlib_unix_get_runtime_dir (),
837 API_SOCKET_FILENAME);
838 vec_terminate_c_string (sm->socket_name);
839
Dave Barach59b25652017-09-10 15:04:27 -0400840 return 0;
841}
842
843VLIB_CONFIG_FUNCTION (socksvr_config, "socksvr");
844
/*
 * Intentionally empty function.
 *
 * NOTE(review): presumably exists only so that other code can reference
 * a symbol from this file and thereby force it to be linked in -- confirm
 * against the callers.
 *
 * Declared with (void) so the definition is a real prototype; an empty
 * parameter list leaves the arguments unspecified before C23.
 */
void
vlibsocket_reference (void)
{
}
849
/*
 * fd.io coding-style-patch-verification: ON
 *
 * Local Variables:
 * eval: (c-set-style "gnu")
 * End:
 */