blob: 566b5a858a33cd6fe6a2e92987365cf3be7f77a4 [file] [log] [blame]
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001/*
Florin Coras5e062572019-03-14 19:07:51 -07002 * Copyright (c) 2016-2019 Cisco and/or its affiliates.
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07003 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at:
6 *
7 * http://www.apache.org/licenses/LICENSE-2.0
8 *
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
14 */
Florin Coras36847942023-02-02 12:56:16 -080015
16#ifdef HAVE_GNU_SOURCE
17#define _GNU_SOURCE
18#endif
19
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -070020#include <unistd.h>
21#include <stdio.h>
22#include <signal.h>
23#include <dlfcn.h>
24#include <pthread.h>
25#include <time.h>
26#include <stdarg.h>
shrinivasan ganapathy1d359632017-10-15 15:46:09 -070027#include <sys/resource.h>
Dave Wallace048b1d62018-01-03 22:24:41 -050028#include <netinet/tcp.h>
Florin Coraseff5f7a2023-02-07 17:36:17 -080029#include <netinet/udp.h>
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -070030
Dave Wallace2a865272018-02-07 21:00:42 -050031#include <vcl/ldp_socket_wrapper.h>
32#include <vcl/ldp.h>
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -070033#include <sys/time.h>
34
Florin Coras7baeb712019-01-04 17:05:43 -080035#include <vcl/vcl_locked.h>
Dave Wallace048b1d62018-01-03 22:24:41 -050036#include <vppinfra/time.h>
37#include <vppinfra/bitmap.h>
Florin Coras30e273b2018-11-27 00:04:59 -080038#include <vppinfra/lock.h>
39#include <vppinfra/pool.h>
40#include <vppinfra/hash.h>
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -070041
42#define HAVE_CONSTRUCTOR_ATTRIBUTE
43#ifdef HAVE_CONSTRUCTOR_ATTRIBUTE
44#define CONSTRUCTOR_ATTRIBUTE \
45 __attribute__ ((constructor))
46#else
47#define CONSTRUCTOR_ATTRIBUTE
48#endif /* HAVE_CONSTRUCTOR_ATTRIBUTE */
49
50#define HAVE_DESTRUCTOR_ATTRIBUTE
51#ifdef HAVE_DESTRUCTOR_ATTRIBUTE
52#define DESTRUCTOR_ATTRIBUTE \
53 __attribute__ ((destructor))
54#else
55#define DESTRUCTOR_ATTRIBUTE
56#endif
57
Florin Corasdfe4cf42018-11-28 22:13:45 -080058#define LDP_MAX_NWORKERS 32
59
Florin Coras36847942023-02-02 12:56:16 -080060#ifdef HAVE_GNU_SOURCE
61#define SOCKADDR_GET_SA(__addr) __addr.__sockaddr__;
62#else
63#define SOCKADDR_GET_SA(__addr) _addr;
64#endif
65
Tianyu Li2073fe42023-02-27 09:14:34 +000066#ifndef UDP_SEGMENT
67#define UDP_SEGMENT 103
68#endif
69
qinyangaf9b7152023-06-27 01:11:53 -070070#ifndef SO_ORIGINAL_DST
71/* from <linux/netfilter_ipv4.h> */
72#define SO_ORIGINAL_DST 80
73#endif
Florin Corasdfe4cf42018-11-28 22:13:45 -080074typedef struct ldp_worker_ctx_
Dave Wallace048b1d62018-01-03 22:24:41 -050075{
Dave Wallace048b1d62018-01-03 22:24:41 -050076 u8 *io_buffer;
77 clib_time_t clib_time;
Florin Corasdfe4cf42018-11-28 22:13:45 -080078
79 /*
80 * Select state
81 */
Dave Wallace048b1d62018-01-03 22:24:41 -050082 clib_bitmap_t *rd_bitmap;
83 clib_bitmap_t *wr_bitmap;
84 clib_bitmap_t *ex_bitmap;
Florin Coras294afe22019-01-07 17:49:17 -080085 clib_bitmap_t *si_rd_bitmap;
86 clib_bitmap_t *si_wr_bitmap;
87 clib_bitmap_t *si_ex_bitmap;
Dave Wallace048b1d62018-01-03 22:24:41 -050088 clib_bitmap_t *libc_rd_bitmap;
89 clib_bitmap_t *libc_wr_bitmap;
90 clib_bitmap_t *libc_ex_bitmap;
Florin Corasdfe4cf42018-11-28 22:13:45 -080091
92 /*
93 * Poll state
94 */
Dave Wallace048b1d62018-01-03 22:24:41 -050095 vcl_poll_t *vcl_poll;
Florin Coras6917b942018-11-13 22:44:54 -080096 struct pollfd *libc_poll;
97 u16 *libc_poll_idxs;
Florin Corasdfe4cf42018-11-28 22:13:45 -080098
99 /*
100 * Epoll state
101 */
Dave Wallace048b1d62018-01-03 22:24:41 -0500102 u8 epoll_wait_vcl;
hanlin4266d4d2020-05-19 17:34:17 +0800103 u8 mq_epfd_added;
Florin Coras99368312018-08-02 10:45:44 -0700104 int vcl_mq_epfd;
Florin Corasdfe4cf42018-11-28 22:13:45 -0800105
106} ldp_worker_ctx_t;
107
Florin Coras294afe22019-01-07 17:49:17 -0800108/* clib_bitmap_t, fd_mask and vcl_si_set are used interchangeably. Make sure
109 * they are the same size */
110STATIC_ASSERT (sizeof (clib_bitmap_t) == sizeof (fd_mask),
111 "ldp bitmap size mismatch");
112STATIC_ASSERT (sizeof (vcl_si_set) == sizeof (fd_mask),
113 "ldp bitmap size mismatch");
114
Florin Corasdfe4cf42018-11-28 22:13:45 -0800115typedef struct
116{
117 ldp_worker_ctx_t *workers;
118 int init;
119 char app_name[LDP_APP_NAME_MAX];
Florin Coras7baeb712019-01-04 17:05:43 -0800120 u32 vlsh_bit_val;
121 u32 vlsh_bit_mask;
Florin Corasdfe4cf42018-11-28 22:13:45 -0800122 u32 debug;
Florin Corasdfe4cf42018-11-28 22:13:45 -0800123
124 /** vcl needs next epoll_create to go to libc_epoll */
125 u8 vcl_needs_real_epoll;
Florin Corasa5a9efd2021-01-05 17:03:29 -0800126
127 /**
128 * crypto state used only for testing
129 */
130 u8 transparent_tls;
131 u32 ckpair_index;
Dave Wallace2a865272018-02-07 21:00:42 -0500132} ldp_main_t;
Florin Corasdfe4cf42018-11-28 22:13:45 -0800133
Dave Wallace2a865272018-02-07 21:00:42 -0500134#define LDP_DEBUG ldp->debug
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700135
Florin Coras99368312018-08-02 10:45:44 -0700136#define LDBG(_lvl, _fmt, _args...) \
137 if (ldp->debug > _lvl) \
hanlin9f3f18f2019-12-30 16:25:20 +0800138 { \
139 int errno_saved = errno; \
Florin Coras585c86a2020-10-16 17:57:36 -0700140 fprintf (stderr, "ldp<%d>: " _fmt "\n", getpid(), ##_args); \
hanlin9f3f18f2019-12-30 16:25:20 +0800141 errno = errno_saved; \
142 }
Florin Coras99368312018-08-02 10:45:44 -0700143
Dave Wallace2a865272018-02-07 21:00:42 -0500144static ldp_main_t ldp_main = {
Florin Coras7baeb712019-01-04 17:05:43 -0800145 .vlsh_bit_val = (1 << LDP_SID_BIT_MIN),
146 .vlsh_bit_mask = (1 << LDP_SID_BIT_MIN) - 1,
Dave Wallace2a865272018-02-07 21:00:42 -0500147 .debug = LDP_DEBUG_INIT,
Yu Ping7b74b072019-05-08 00:40:24 +0800148 .transparent_tls = 0,
Florin Corasa5a9efd2021-01-05 17:03:29 -0800149 .ckpair_index = ~0,
Dave Wallace048b1d62018-01-03 22:24:41 -0500150};
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700151
Dave Wallace2a865272018-02-07 21:00:42 -0500152static ldp_main_t *ldp = &ldp_main;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700153
Florin Corasdfe4cf42018-11-28 22:13:45 -0800154static inline ldp_worker_ctx_t *
155ldp_worker_get_current (void)
156{
157 return (ldp->workers + vppcom_worker_index ());
158}
159
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700160/*
161 * RETURN: 0 on success or -1 on error.
162 * */
Dave Wallace048b1d62018-01-03 22:24:41 -0500163static inline void
Dave Wallace2a865272018-02-07 21:00:42 -0500164ldp_set_app_name (char *app_name)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700165{
Florin Coras729b9c92023-02-28 10:58:08 -0800166 snprintf (ldp->app_name, LDP_APP_NAME_MAX, "%s-ldp-%d", app_name, getpid ());
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700167}
168
Dave Wallace048b1d62018-01-03 22:24:41 -0500169static inline char *
Dave Wallace2a865272018-02-07 21:00:42 -0500170ldp_get_app_name ()
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700171{
Dave Wallace2a865272018-02-07 21:00:42 -0500172 if (ldp->app_name[0] == '\0')
Florin Coras729b9c92023-02-28 10:58:08 -0800173 ldp_set_app_name (program_invocation_short_name);
Dave Wallace048b1d62018-01-03 22:24:41 -0500174
Dave Wallace2a865272018-02-07 21:00:42 -0500175 return ldp->app_name;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700176}
177
Dave Wallace048b1d62018-01-03 22:24:41 -0500178static inline int
Florin Coras7baeb712019-01-04 17:05:43 -0800179ldp_vlsh_to_fd (vls_handle_t vlsh)
Dave Wallace048b1d62018-01-03 22:24:41 -0500180{
Florin Coras7baeb712019-01-04 17:05:43 -0800181 return (vlsh + ldp->vlsh_bit_val);
Dave Wallace048b1d62018-01-03 22:24:41 -0500182}
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700183
Florin Coras7baeb712019-01-04 17:05:43 -0800184static inline vls_handle_t
185ldp_fd_to_vlsh (int fd)
Dave Wallace048b1d62018-01-03 22:24:41 -0500186{
Florin Coras7baeb712019-01-04 17:05:43 -0800187 if (fd < ldp->vlsh_bit_val)
188 return VLS_INVALID_HANDLE;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700189
Florin Coras7baeb712019-01-04 17:05:43 -0800190 return (fd - ldp->vlsh_bit_val);
Dave Wallace048b1d62018-01-03 22:24:41 -0500191}
192
Florin Coras2d9b4272019-03-11 10:14:37 -0700193static void
194ldp_alloc_workers (void)
195{
196 if (ldp->workers)
197 return;
Florin Coras1b75fdb2023-11-28 16:05:29 -0800198 ldp->workers = vec_new (ldp_worker_ctx_t, LDP_MAX_NWORKERS);
Florin Coras2d9b4272019-03-11 10:14:37 -0700199}
200
Florin Corasc6c4e862023-03-09 18:23:05 -0800201static void
202ldp_init_cfg (void)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700203{
Florin Coras99368312018-08-02 10:45:44 -0700204 char *env_var_str = getenv (LDP_ENV_DEBUG);
205 if (env_var_str)
206 {
207 u32 tmp;
208 if (sscanf (env_var_str, "%u", &tmp) != 1)
209 clib_warning ("LDP<%d>: WARNING: Invalid LDP debug level specified in"
210 " the env var " LDP_ENV_DEBUG " (%s)!", getpid (),
211 env_var_str);
212 else
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700213 {
Florin Coras99368312018-08-02 10:45:44 -0700214 ldp->debug = tmp;
Florin Coras05ecfcc2018-12-12 18:19:39 -0800215 LDBG (0, "configured LDP debug level (%u) from env var "
216 LDP_ENV_DEBUG "!", ldp->debug);
Florin Coras99368312018-08-02 10:45:44 -0700217 }
218 }
Dave Wallace048b1d62018-01-03 22:24:41 -0500219
Florin Coras99368312018-08-02 10:45:44 -0700220 env_var_str = getenv (LDP_ENV_APP_NAME);
221 if (env_var_str)
222 {
223 ldp_set_app_name (env_var_str);
Florin Coras05ecfcc2018-12-12 18:19:39 -0800224 LDBG (0, "configured LDP app name (%s) from the env var "
225 LDP_ENV_APP_NAME "!", ldp->app_name);
Florin Coras99368312018-08-02 10:45:44 -0700226 }
Dave Wallace048b1d62018-01-03 22:24:41 -0500227
Florin Coras99368312018-08-02 10:45:44 -0700228 env_var_str = getenv (LDP_ENV_SID_BIT);
229 if (env_var_str)
230 {
231 u32 sb;
232 if (sscanf (env_var_str, "%u", &sb) != 1)
233 {
Florin Coras294afe22019-01-07 17:49:17 -0800234 LDBG (0, "WARNING: Invalid LDP sid bit specified in the env var "
235 LDP_ENV_SID_BIT " (%s)! sid bit value %d (0x%x)", env_var_str,
236 ldp->vlsh_bit_val, ldp->vlsh_bit_val);
Florin Coras99368312018-08-02 10:45:44 -0700237 }
238 else if (sb < LDP_SID_BIT_MIN)
239 {
Florin Coras7baeb712019-01-04 17:05:43 -0800240 ldp->vlsh_bit_val = (1 << LDP_SID_BIT_MIN);
241 ldp->vlsh_bit_mask = ldp->vlsh_bit_val - 1;
Dave Wallace048b1d62018-01-03 22:24:41 -0500242
Florin Coras294afe22019-01-07 17:49:17 -0800243 LDBG (0, "WARNING: LDP sid bit (%u) specified in the env var "
244 LDP_ENV_SID_BIT " (%s) is too small. Using LDP_SID_BIT_MIN"
245 " (%d)! sid bit value %d (0x%x)", sb, env_var_str,
246 LDP_SID_BIT_MIN, ldp->vlsh_bit_val, ldp->vlsh_bit_val);
Florin Coras99368312018-08-02 10:45:44 -0700247 }
248 else if (sb > LDP_SID_BIT_MAX)
249 {
Florin Coras7baeb712019-01-04 17:05:43 -0800250 ldp->vlsh_bit_val = (1 << LDP_SID_BIT_MAX);
251 ldp->vlsh_bit_mask = ldp->vlsh_bit_val - 1;
Dave Wallace048b1d62018-01-03 22:24:41 -0500252
Florin Coras294afe22019-01-07 17:49:17 -0800253 LDBG (0, "WARNING: LDP sid bit (%u) specified in the env var "
254 LDP_ENV_SID_BIT " (%s) is too big. Using LDP_SID_BIT_MAX"
255 " (%d)! sid bit value %d (0x%x)", sb, env_var_str,
256 LDP_SID_BIT_MAX, ldp->vlsh_bit_val, ldp->vlsh_bit_val);
Dave Wallace048b1d62018-01-03 22:24:41 -0500257 }
258 else
259 {
Florin Coras7baeb712019-01-04 17:05:43 -0800260 ldp->vlsh_bit_val = (1 << sb);
261 ldp->vlsh_bit_mask = ldp->vlsh_bit_val - 1;
Florin Coras99368312018-08-02 10:45:44 -0700262
Florin Coras05ecfcc2018-12-12 18:19:39 -0800263 LDBG (0, "configured LDP sid bit (%u) from "
264 LDP_ENV_SID_BIT "! sid bit value %d (0x%x)", sb,
Florin Coras7baeb712019-01-04 17:05:43 -0800265 ldp->vlsh_bit_val, ldp->vlsh_bit_val);
Dave Wallace048b1d62018-01-03 22:24:41 -0500266 }
Florin Coras294afe22019-01-07 17:49:17 -0800267
268 /* Make sure there are enough bits in the fd set for vcl sessions */
269 if (ldp->vlsh_bit_val > FD_SETSIZE / 2)
270 {
wanghanlin1eb8fea2021-10-14 11:10:26 +0800271 /* Only valid for select/pselect, so just WARNING and not exit */
272 LDBG (0,
273 "WARNING: LDP vlsh bit value %d > FD_SETSIZE/2 %d, "
274 "select/pselect not supported now!",
Florin Coras294afe22019-01-07 17:49:17 -0800275 ldp->vlsh_bit_val, FD_SETSIZE / 2);
Florin Coras294afe22019-01-07 17:49:17 -0800276 }
Dave Wallace048b1d62018-01-03 22:24:41 -0500277 }
Yu Ping7b74b072019-05-08 00:40:24 +0800278 env_var_str = getenv (LDP_ENV_TLS_TRANS);
279 if (env_var_str)
280 {
281 ldp->transparent_tls = 1;
282 }
Florin Corasc6c4e862023-03-09 18:23:05 -0800283}
Florin Coras99368312018-08-02 10:45:44 -0700284
Florin Corasc6c4e862023-03-09 18:23:05 -0800285static int
286ldp_init (void)
287{
288 ldp_worker_ctx_t *ldpw;
289 int rv;
290
Gao Feng96600f92023-07-17 22:19:32 +0800291 if (ldp->init)
292 {
293 LDBG (0, "LDP is initialized already");
294 return 0;
295 }
Florin Corasc6c4e862023-03-09 18:23:05 -0800296
297 ldp_init_cfg ();
298 ldp->init = 1;
299 ldp->vcl_needs_real_epoll = 1;
300 rv = vls_app_create (ldp_get_app_name ());
301 if (rv != VPPCOM_OK)
302 {
303 ldp->vcl_needs_real_epoll = 0;
304 if (rv == VPPCOM_EEXIST)
305 return 0;
306 LDBG (2,
307 "\nERROR: ldp_init: vppcom_app_create()"
308 " failed! rv = %d (%s)\n",
309 rv, vppcom_retval_str (rv));
310 ldp->init = 0;
311 return rv;
312 }
313 ldp->vcl_needs_real_epoll = 0;
314 ldp_alloc_workers ();
Florin Corasc6c4e862023-03-09 18:23:05 -0800315
Florin Coras1b75fdb2023-11-28 16:05:29 -0800316 vec_foreach (ldpw, ldp->workers)
Florin Coras4dee8cd2019-01-29 21:28:16 -0800317 clib_memset (&ldpw->clib_time, 0, sizeof (ldpw->clib_time));
Florin Coras4dee8cd2019-01-29 21:28:16 -0800318
Florin Coras05ecfcc2018-12-12 18:19:39 -0800319 LDBG (0, "LDP initialization: done!");
Florin Coras99368312018-08-02 10:45:44 -0700320
321 return 0;
Dave Wallace048b1d62018-01-03 22:24:41 -0500322}
323
Florin Coras5f33d0d2021-06-02 21:22:21 -0700324#define ldp_init_check() \
325 if (PREDICT_FALSE (!ldp->init)) \
326 { \
327 if ((errno = -ldp_init ())) \
328 return -1; \
329 }
330
Dave Wallace048b1d62018-01-03 22:24:41 -0500331int
332close (int fd)
333{
Florin Coras7baeb712019-01-04 17:05:43 -0800334 vls_handle_t vlsh;
335 int rv, epfd;
Dave Wallace048b1d62018-01-03 22:24:41 -0500336
Florin Coras5f33d0d2021-06-02 21:22:21 -0700337 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -0500338
Florin Coras7baeb712019-01-04 17:05:43 -0800339 vlsh = ldp_fd_to_vlsh (fd);
340 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -0500341 {
Florin Coras7baeb712019-01-04 17:05:43 -0800342 epfd = vls_attr (vlsh, VPPCOM_ATTR_GET_LIBC_EPFD, 0, 0);
Dave Wallace048b1d62018-01-03 22:24:41 -0500343 if (epfd > 0)
344 {
Florin Coras06defbc2023-02-28 22:32:31 -0800345 ldp_worker_ctx_t *ldpw = ldp_worker_get_current ();
346 u32 size = sizeof (epfd);
347
Florin Coras7baeb712019-01-04 17:05:43 -0800348 LDBG (0, "fd %d: calling libc_close: epfd %u", fd, epfd);
Dave Wallace048b1d62018-01-03 22:24:41 -0500349
Florin Coras06defbc2023-02-28 22:32:31 -0800350 libc_close (epfd);
351 ldpw->mq_epfd_added = 0;
Dave Wallace048b1d62018-01-03 22:24:41 -0500352
Florin Coras06defbc2023-02-28 22:32:31 -0800353 epfd = 0;
354 (void) vls_attr (vlsh, VPPCOM_ATTR_SET_LIBC_EPFD, &epfd, &size);
Dave Wallace048b1d62018-01-03 22:24:41 -0500355 }
356 else if (PREDICT_FALSE (epfd < 0))
357 {
358 errno = -epfd;
359 rv = -1;
360 goto done;
361 }
362
Florin Coras7baeb712019-01-04 17:05:43 -0800363 LDBG (0, "fd %d: calling vls_close: vlsh %u", fd, vlsh);
Dave Wallace048b1d62018-01-03 22:24:41 -0500364
Florin Coras7baeb712019-01-04 17:05:43 -0800365 rv = vls_close (vlsh);
Dave Wallace048b1d62018-01-03 22:24:41 -0500366 if (rv != VPPCOM_OK)
367 {
368 errno = -rv;
369 rv = -1;
370 }
371 }
372 else
373 {
Florin Coras7baeb712019-01-04 17:05:43 -0800374 LDBG (0, "fd %d: calling libc_close", fd);
Dave Wallace048b1d62018-01-03 22:24:41 -0500375 rv = libc_close (fd);
376 }
377
378done:
Dave Wallace048b1d62018-01-03 22:24:41 -0500379 return rv;
380}
381
382ssize_t
383read (int fd, void *buf, size_t nbytes)
384{
Florin Coras7baeb712019-01-04 17:05:43 -0800385 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -0500386 ssize_t size;
Dave Wallace048b1d62018-01-03 22:24:41 -0500387
Florin Coras5f33d0d2021-06-02 21:22:21 -0700388 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -0500389
Florin Coras7baeb712019-01-04 17:05:43 -0800390 vlsh = ldp_fd_to_vlsh (fd);
391 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -0500392 {
Florin Coras7baeb712019-01-04 17:05:43 -0800393 size = vls_read (vlsh, buf, nbytes);
Dave Wallace048b1d62018-01-03 22:24:41 -0500394 if (size < 0)
395 {
396 errno = -size;
397 size = -1;
398 }
399 }
400 else
401 {
Dave Wallace048b1d62018-01-03 22:24:41 -0500402 size = libc_read (fd, buf, nbytes);
403 }
404
Dave Wallace048b1d62018-01-03 22:24:41 -0500405 return size;
406}
407
408ssize_t
409readv (int fd, const struct iovec * iov, int iovcnt)
410{
Dave Wallace8aaba562018-01-18 17:21:19 -0500411 int rv = 0, i, total = 0;
Florin Coras7baeb712019-01-04 17:05:43 -0800412 vls_handle_t vlsh;
413 ssize_t size = 0;
Dave Wallace048b1d62018-01-03 22:24:41 -0500414
Florin Coras5f33d0d2021-06-02 21:22:21 -0700415 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -0500416
Florin Coras7baeb712019-01-04 17:05:43 -0800417 vlsh = ldp_fd_to_vlsh (fd);
418 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -0500419 {
Florin Coras067f9542020-02-14 05:33:46 +0000420 for (i = 0; i < iovcnt; ++i)
Dave Wallace048b1d62018-01-03 22:24:41 -0500421 {
Florin Coras067f9542020-02-14 05:33:46 +0000422 rv = vls_read (vlsh, iov[i].iov_base, iov[i].iov_len);
423 if (rv <= 0)
424 break;
425 else
Dave Wallace048b1d62018-01-03 22:24:41 -0500426 {
Florin Coras067f9542020-02-14 05:33:46 +0000427 total += rv;
428 if (rv < iov[i].iov_len)
Dave Wallace048b1d62018-01-03 22:24:41 -0500429 break;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700430 }
431 }
Florin Coras067f9542020-02-14 05:33:46 +0000432 if (rv < 0 && total == 0)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700433 {
Dave Wallace048b1d62018-01-03 22:24:41 -0500434 errno = -rv;
435 size = -1;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700436 }
Dave Wallace048b1d62018-01-03 22:24:41 -0500437 else
438 size = total;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700439 }
440 else
441 {
Dave Wallace048b1d62018-01-03 22:24:41 -0500442 size = libc_readv (fd, iov, iovcnt);
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700443 }
444
Dave Wallace048b1d62018-01-03 22:24:41 -0500445 return size;
446}
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700447
Dave Wallace048b1d62018-01-03 22:24:41 -0500448ssize_t
449write (int fd, const void *buf, size_t nbytes)
450{
Florin Coras7baeb712019-01-04 17:05:43 -0800451 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -0500452 ssize_t size = 0;
Dave Wallace048b1d62018-01-03 22:24:41 -0500453
Florin Coras5f33d0d2021-06-02 21:22:21 -0700454 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -0500455
Florin Coras7baeb712019-01-04 17:05:43 -0800456 vlsh = ldp_fd_to_vlsh (fd);
457 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -0500458 {
Florin Coras7baeb712019-01-04 17:05:43 -0800459 size = vls_write_msg (vlsh, (void *) buf, nbytes);
Dave Wallace048b1d62018-01-03 22:24:41 -0500460 if (size < 0)
461 {
462 errno = -size;
463 size = -1;
464 }
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700465 }
466 else
467 {
Dave Wallace048b1d62018-01-03 22:24:41 -0500468 size = libc_write (fd, buf, nbytes);
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700469 }
470
Dave Wallace048b1d62018-01-03 22:24:41 -0500471 return size;
472}
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700473
Dave Wallace048b1d62018-01-03 22:24:41 -0500474ssize_t
475writev (int fd, const struct iovec * iov, int iovcnt)
476{
Dave Wallace048b1d62018-01-03 22:24:41 -0500477 ssize_t size = 0, total = 0;
Florin Coras7baeb712019-01-04 17:05:43 -0800478 vls_handle_t vlsh;
Dave Wallace8aaba562018-01-18 17:21:19 -0500479 int i, rv = 0;
Dave Wallace048b1d62018-01-03 22:24:41 -0500480
Florin Coras5f33d0d2021-06-02 21:22:21 -0700481 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -0500482
Florin Coras7baeb712019-01-04 17:05:43 -0800483 vlsh = ldp_fd_to_vlsh (fd);
484 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -0500485 {
Florin Coraseda1b8c2020-03-23 16:00:35 +0000486 for (i = 0; i < iovcnt; ++i)
Dave Wallace048b1d62018-01-03 22:24:41 -0500487 {
Florin Coraseda1b8c2020-03-23 16:00:35 +0000488 rv = vls_write_msg (vlsh, iov[i].iov_base, iov[i].iov_len);
489 if (rv < 0)
490 break;
491 else
Dave Wallace048b1d62018-01-03 22:24:41 -0500492 {
Florin Coraseda1b8c2020-03-23 16:00:35 +0000493 total += rv;
494 if (rv < iov[i].iov_len)
Dave Wallace048b1d62018-01-03 22:24:41 -0500495 break;
Dave Wallace048b1d62018-01-03 22:24:41 -0500496 }
497 }
Dave Wallace048b1d62018-01-03 22:24:41 -0500498
Florin Coraseda1b8c2020-03-23 16:00:35 +0000499 if (rv < 0 && total == 0)
Dave Wallace048b1d62018-01-03 22:24:41 -0500500 {
501 errno = -rv;
502 size = -1;
503 }
504 else
505 size = total;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700506 }
507 else
508 {
Dave Wallace048b1d62018-01-03 22:24:41 -0500509 size = libc_writev (fd, iov, iovcnt);
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700510 }
511
Dave Wallace048b1d62018-01-03 22:24:41 -0500512 return size;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700513}
514
Florin Coras0ab36f52020-05-26 19:45:45 +0000515static int
516fcntl_internal (int fd, int cmd, va_list ap)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700517{
Florin Coras7baeb712019-01-04 17:05:43 -0800518 vls_handle_t vlsh;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700519 int rv = 0;
Florin Coras7baeb712019-01-04 17:05:43 -0800520
521 vlsh = ldp_fd_to_vlsh (fd);
522 LDBG (0, "fd %u vlsh %d, cmd %u", fd, vlsh, cmd);
523 if (vlsh != VLS_INVALID_HANDLE)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700524 {
Dave Wallace048b1d62018-01-03 22:24:41 -0500525 int flags = va_arg (ap, int);
526 u32 size;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700527
Dave Wallace048b1d62018-01-03 22:24:41 -0500528 size = sizeof (flags);
529 rv = -EOPNOTSUPP;
530 switch (cmd)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700531 {
Dave Wallace048b1d62018-01-03 22:24:41 -0500532 case F_SETFL:
Florin Coras7baeb712019-01-04 17:05:43 -0800533 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_FLAGS, &flags, &size);
Dave Wallace048b1d62018-01-03 22:24:41 -0500534 break;
535
536 case F_GETFL:
Florin Coras7baeb712019-01-04 17:05:43 -0800537 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_FLAGS, &flags, &size);
Dave Wallace048b1d62018-01-03 22:24:41 -0500538 if (rv == VPPCOM_OK)
Florin Coras7baeb712019-01-04 17:05:43 -0800539 rv = flags;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700540 break;
Florin Coras173bae32018-11-16 18:56:28 -0800541 case F_SETFD:
542 /* TODO handle this */
543 LDBG (0, "F_SETFD ignored flags %u", flags);
544 rv = 0;
545 break;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700546 default:
Dave Wallace048b1d62018-01-03 22:24:41 -0500547 rv = -EOPNOTSUPP;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700548 break;
549 }
Dave Wallace048b1d62018-01-03 22:24:41 -0500550 if (rv < 0)
551 {
552 errno = -rv;
553 rv = -1;
554 }
555 }
556 else
557 {
Carl Smithe16707b2019-11-13 14:37:39 +1300558#ifdef HAVE_FCNTL64
559 rv = libc_vfcntl64 (fd, cmd, ap);
560#else
Dave Wallace048b1d62018-01-03 22:24:41 -0500561 rv = libc_vfcntl (fd, cmd, ap);
Carl Smithe16707b2019-11-13 14:37:39 +1300562#endif
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700563 }
564
Florin Coras0ab36f52020-05-26 19:45:45 +0000565 return rv;
566}
567
568int
569fcntl (int fd, int cmd, ...)
570{
571 va_list ap;
572 int rv;
573
Florin Coras5f33d0d2021-06-02 21:22:21 -0700574 ldp_init_check ();
Florin Coras0ab36f52020-05-26 19:45:45 +0000575
576 va_start (ap, cmd);
577 rv = fcntl_internal (fd, cmd, ap);
Dave Wallace048b1d62018-01-03 22:24:41 -0500578 va_end (ap);
579
Dave Wallace048b1d62018-01-03 22:24:41 -0500580 return rv;
581}
582
583int
Florin Corasd7586d52020-04-29 02:19:51 +0000584fcntl64 (int fd, int cmd, ...)
585{
586 va_list ap;
587 int rv;
588
Florin Coras5f33d0d2021-06-02 21:22:21 -0700589 ldp_init_check ();
Florin Coras0ab36f52020-05-26 19:45:45 +0000590
Florin Corasd7586d52020-04-29 02:19:51 +0000591 va_start (ap, cmd);
Florin Coras0ab36f52020-05-26 19:45:45 +0000592 rv = fcntl_internal (fd, cmd, ap);
Florin Corasd7586d52020-04-29 02:19:51 +0000593 va_end (ap);
594 return rv;
595}
596
597int
Dave Wallace048b1d62018-01-03 22:24:41 -0500598ioctl (int fd, unsigned long int cmd, ...)
599{
Florin Coras7baeb712019-01-04 17:05:43 -0800600 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -0500601 va_list ap;
Florin Coras7baeb712019-01-04 17:05:43 -0800602 int rv;
Dave Wallace048b1d62018-01-03 22:24:41 -0500603
Florin Coras5f33d0d2021-06-02 21:22:21 -0700604 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -0500605
606 va_start (ap, cmd);
Dave Wallace048b1d62018-01-03 22:24:41 -0500607
Florin Coras7baeb712019-01-04 17:05:43 -0800608 vlsh = ldp_fd_to_vlsh (fd);
609 if (vlsh != VLS_INVALID_HANDLE)
610 {
Dave Wallace048b1d62018-01-03 22:24:41 -0500611 switch (cmd)
612 {
613 case FIONREAD:
Florin Coras7baeb712019-01-04 17:05:43 -0800614 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_NREAD, 0, 0);
Dave Wallace048b1d62018-01-03 22:24:41 -0500615 break;
616
617 case FIONBIO:
618 {
Florin Coras4a0e08e2023-05-11 11:45:34 -0700619 u32 flags = *(va_arg (ap, int *)) ? O_NONBLOCK : 0;
Dave Wallace048b1d62018-01-03 22:24:41 -0500620 u32 size = sizeof (flags);
621
622 /* TBD: When VPPCOM_ATTR_[GS]ET_FLAGS supports flags other than
623 * non-blocking, the flags should be read here and merged
624 * with O_NONBLOCK.
625 */
Florin Coras7baeb712019-01-04 17:05:43 -0800626 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_FLAGS, &flags, &size);
Dave Wallace048b1d62018-01-03 22:24:41 -0500627 }
628 break;
629
630 default:
631 rv = -EOPNOTSUPP;
632 break;
633 }
634 if (rv < 0)
635 {
636 errno = -rv;
637 rv = -1;
638 }
639 }
640 else
641 {
Dave Wallace048b1d62018-01-03 22:24:41 -0500642 rv = libc_vioctl (fd, cmd, ap);
643 }
644
Dave Wallace048b1d62018-01-03 22:24:41 -0500645 va_end (ap);
646 return rv;
647}
648
Florin Coras294afe22019-01-07 17:49:17 -0800649always_inline void
650ldp_select_init_maps (fd_set * __restrict original,
651 clib_bitmap_t ** resultb, clib_bitmap_t ** libcb,
652 clib_bitmap_t ** vclb, int nfds, u32 minbits,
653 u32 n_bytes, uword * si_bits, uword * libc_bits)
654{
655 uword si_bits_set, libc_bits_set;
656 vls_handle_t vlsh;
657 int fd;
658
659 clib_bitmap_validate (*vclb, minbits);
660 clib_bitmap_validate (*libcb, minbits);
661 clib_bitmap_validate (*resultb, minbits);
662 clib_memcpy_fast (*resultb, original, n_bytes);
663 memset (original, 0, n_bytes);
664
Damjan Marionf0ca1e82020-12-13 23:26:56 +0100665 clib_bitmap_foreach (fd, *resultb) {
Florin Coras294afe22019-01-07 17:49:17 -0800666 if (fd > nfds)
667 break;
668 vlsh = ldp_fd_to_vlsh (fd);
669 if (vlsh == VLS_INVALID_HANDLE)
670 clib_bitmap_set_no_check (*libcb, fd, 1);
671 else
Florin Corascbce80a2020-04-20 01:32:38 +0000672 *vclb = clib_bitmap_set (*vclb, vlsh_to_session_index (vlsh), 1);
Damjan Marionf0ca1e82020-12-13 23:26:56 +0100673 }
Florin Coras294afe22019-01-07 17:49:17 -0800674
675 si_bits_set = clib_bitmap_last_set (*vclb) + 1;
676 *si_bits = (si_bits_set > *si_bits) ? si_bits_set : *si_bits;
Florin Corascbce80a2020-04-20 01:32:38 +0000677 clib_bitmap_validate (*resultb, *si_bits);
Florin Coras294afe22019-01-07 17:49:17 -0800678
679 libc_bits_set = clib_bitmap_last_set (*libcb) + 1;
680 *libc_bits = (libc_bits_set > *libc_bits) ? libc_bits_set : *libc_bits;
681}
682
683always_inline int
684ldp_select_vcl_map_to_libc (clib_bitmap_t * vclb, fd_set * __restrict libcb)
685{
686 vls_handle_t vlsh;
687 uword si;
688 int fd;
689
690 if (!libcb)
691 return 0;
692
Damjan Marionf0ca1e82020-12-13 23:26:56 +0100693 clib_bitmap_foreach (si, vclb) {
Florin Coras294afe22019-01-07 17:49:17 -0800694 vlsh = vls_session_index_to_vlsh (si);
Florin Coras54140622020-02-04 19:04:34 +0000695 ASSERT (vlsh != VLS_INVALID_HANDLE);
Florin Coras294afe22019-01-07 17:49:17 -0800696 fd = ldp_vlsh_to_fd (vlsh);
697 if (PREDICT_FALSE (fd < 0))
698 {
699 errno = EBADFD;
700 return -1;
701 }
702 FD_SET (fd, libcb);
Damjan Marionf0ca1e82020-12-13 23:26:56 +0100703 }
Florin Coras294afe22019-01-07 17:49:17 -0800704
705 return 0;
706}
707
708always_inline void
709ldp_select_libc_map_merge (clib_bitmap_t * result, fd_set * __restrict libcb)
710{
711 uword fd;
712
Florin Coras78b5fa62019-02-21 20:04:15 -0800713 if (!libcb)
714 return;
715
Damjan Marionf0ca1e82020-12-13 23:26:56 +0100716 clib_bitmap_foreach (fd, result)
Florin Coras294afe22019-01-07 17:49:17 -0800717 FD_SET ((int)fd, libcb);
Florin Coras294afe22019-01-07 17:49:17 -0800718}
719
Dave Wallace048b1d62018-01-03 22:24:41 -0500720int
Dave Wallace2a865272018-02-07 21:00:42 -0500721ldp_pselect (int nfds, fd_set * __restrict readfds,
722 fd_set * __restrict writefds,
723 fd_set * __restrict exceptfds,
724 const struct timespec *__restrict timeout,
725 const __sigset_t * __restrict sigmask)
Dave Wallace048b1d62018-01-03 22:24:41 -0500726{
Florin Coras294afe22019-01-07 17:49:17 -0800727 u32 minbits = clib_max (nfds, BITS (uword)), n_bytes;
Florin Corasdfe4cf42018-11-28 22:13:45 -0800728 ldp_worker_ctx_t *ldpw = ldp_worker_get_current ();
Florin Coras294afe22019-01-07 17:49:17 -0800729 struct timespec libc_tspec = { 0 };
730 f64 time_out, vcl_timeout = 0;
731 uword si_bits, libc_bits;
732 int rv, bits_set = 0;
Dave Wallace048b1d62018-01-03 22:24:41 -0500733
734 if (nfds < 0)
735 {
736 errno = EINVAL;
737 return -1;
738 }
739
Florin Coras4dee8cd2019-01-29 21:28:16 -0800740 if (PREDICT_FALSE (ldpw->clib_time.init_cpu_time == 0))
741 clib_time_init (&ldpw->clib_time);
742
Dave Wallace3ee1fe12018-02-23 01:09:11 -0500743 if (timeout)
744 {
745 time_out = (timeout->tv_sec == 0 && timeout->tv_nsec == 0) ?
Florin Coras7baeb712019-01-04 17:05:43 -0800746 (f64) 0 : (f64) timeout->tv_sec + (f64) timeout->tv_nsec / (f64) 1e9;
Dave Wallace3ee1fe12018-02-23 01:09:11 -0500747
liuyacanf71796e2021-08-02 10:01:39 +0800748 time_out += clib_time_now (&ldpw->clib_time);
749
Dave Wallace3ee1fe12018-02-23 01:09:11 -0500750 /* select as fine grained sleep */
751 if (!nfds)
752 {
Florin Corasdfe4cf42018-11-28 22:13:45 -0800753 while (clib_time_now (&ldpw->clib_time) < time_out)
Dave Wallace3ee1fe12018-02-23 01:09:11 -0500754 ;
755 return 0;
756 }
757 }
758 else if (!nfds)
759 {
760 errno = EINVAL;
761 return -1;
762 }
763 else
764 time_out = -1;
765
Florin Coras7baeb712019-01-04 17:05:43 -0800766 if (nfds <= ldp->vlsh_bit_val)
Dave Wallace048b1d62018-01-03 22:24:41 -0500767 {
Dave Wallace048b1d62018-01-03 22:24:41 -0500768 rv = libc_pselect (nfds, readfds, writefds, exceptfds,
769 timeout, sigmask);
770 goto done;
771 }
772
Florin Coras294afe22019-01-07 17:49:17 -0800773 si_bits = libc_bits = 0;
774 n_bytes = nfds / 8 + ((nfds % 8) ? 1 : 0);
Florin Coras7baeb712019-01-04 17:05:43 -0800775
Dave Wallace048b1d62018-01-03 22:24:41 -0500776 if (readfds)
Florin Coras294afe22019-01-07 17:49:17 -0800777 ldp_select_init_maps (readfds, &ldpw->rd_bitmap, &ldpw->libc_rd_bitmap,
778 &ldpw->si_rd_bitmap, nfds, minbits, n_bytes,
779 &si_bits, &libc_bits);
Dave Wallace048b1d62018-01-03 22:24:41 -0500780 if (writefds)
Florin Coras294afe22019-01-07 17:49:17 -0800781 ldp_select_init_maps (writefds, &ldpw->wr_bitmap,
782 &ldpw->libc_wr_bitmap, &ldpw->si_wr_bitmap, nfds,
783 minbits, n_bytes, &si_bits, &libc_bits);
Dave Wallace048b1d62018-01-03 22:24:41 -0500784 if (exceptfds)
Florin Coras294afe22019-01-07 17:49:17 -0800785 ldp_select_init_maps (exceptfds, &ldpw->ex_bitmap,
786 &ldpw->libc_ex_bitmap, &ldpw->si_ex_bitmap, nfds,
787 minbits, n_bytes, &si_bits, &libc_bits);
Dave Wallace048b1d62018-01-03 22:24:41 -0500788
Florin Coras294afe22019-01-07 17:49:17 -0800789 if (PREDICT_FALSE (!si_bits && !libc_bits))
Dave Wallace048b1d62018-01-03 22:24:41 -0500790 {
791 errno = EINVAL;
792 rv = -1;
793 goto done;
794 }
795
Florin Coras78b5fa62019-02-21 20:04:15 -0800796 if (!si_bits)
797 libc_tspec = timeout ? *timeout : libc_tspec;
Florin Coras294afe22019-01-07 17:49:17 -0800798
Dave Wallace048b1d62018-01-03 22:24:41 -0500799 do
800 {
Florin Coras294afe22019-01-07 17:49:17 -0800801 if (si_bits)
Dave Wallace048b1d62018-01-03 22:24:41 -0500802 {
Dave Wallace048b1d62018-01-03 22:24:41 -0500803 if (readfds)
Florin Coras294afe22019-01-07 17:49:17 -0800804 clib_memcpy_fast (ldpw->rd_bitmap, ldpw->si_rd_bitmap,
Florin Corascbce80a2020-04-20 01:32:38 +0000805 vec_len (ldpw->si_rd_bitmap) *
Dave Barach178cf492018-11-13 16:34:13 -0500806 sizeof (clib_bitmap_t));
Dave Wallace048b1d62018-01-03 22:24:41 -0500807 if (writefds)
Florin Coras294afe22019-01-07 17:49:17 -0800808 clib_memcpy_fast (ldpw->wr_bitmap, ldpw->si_wr_bitmap,
Florin Corascbce80a2020-04-20 01:32:38 +0000809 vec_len (ldpw->si_wr_bitmap) *
Dave Barach178cf492018-11-13 16:34:13 -0500810 sizeof (clib_bitmap_t));
Dave Wallace048b1d62018-01-03 22:24:41 -0500811 if (exceptfds)
Florin Coras294afe22019-01-07 17:49:17 -0800812 clib_memcpy_fast (ldpw->ex_bitmap, ldpw->si_ex_bitmap,
Florin Corascbce80a2020-04-20 01:32:38 +0000813 vec_len (ldpw->si_ex_bitmap) *
Dave Barach178cf492018-11-13 16:34:13 -0500814 sizeof (clib_bitmap_t));
Florin Coras294afe22019-01-07 17:49:17 -0800815
Florin Coras0ef8ef22019-01-18 08:37:13 -0800816 rv = vls_select (si_bits, readfds ? ldpw->rd_bitmap : NULL,
817 writefds ? ldpw->wr_bitmap : NULL,
818 exceptfds ? ldpw->ex_bitmap : NULL, vcl_timeout);
Florin Coras294afe22019-01-07 17:49:17 -0800819 if (rv < 0)
820 {
821 errno = -rv;
822 rv = -1;
Florin Coras5e6222a2020-04-24 17:09:25 +0000823 goto done;
Florin Coras294afe22019-01-07 17:49:17 -0800824 }
825 else if (rv > 0)
826 {
827 if (ldp_select_vcl_map_to_libc (ldpw->rd_bitmap, readfds))
828 {
829 rv = -1;
830 goto done;
831 }
832
833 if (ldp_select_vcl_map_to_libc (ldpw->wr_bitmap, writefds))
834 {
835 rv = -1;
836 goto done;
837 }
838
839 if (ldp_select_vcl_map_to_libc (ldpw->ex_bitmap, exceptfds))
840 {
841 rv = -1;
842 goto done;
843 }
844 bits_set = rv;
845 }
846 }
847 if (libc_bits)
848 {
849 if (readfds)
850 clib_memcpy_fast (ldpw->rd_bitmap, ldpw->libc_rd_bitmap,
851 vec_len (ldpw->libc_rd_bitmap) *
852 sizeof (clib_bitmap_t));
853 if (writefds)
854 clib_memcpy_fast (ldpw->wr_bitmap, ldpw->libc_wr_bitmap,
855 vec_len (ldpw->libc_wr_bitmap) *
856 sizeof (clib_bitmap_t));
857 if (exceptfds)
858 clib_memcpy_fast (ldpw->ex_bitmap, ldpw->libc_ex_bitmap,
859 vec_len (ldpw->libc_ex_bitmap) *
860 sizeof (clib_bitmap_t));
861
Dave Wallace048b1d62018-01-03 22:24:41 -0500862 rv = libc_pselect (libc_bits,
Florin Coras294afe22019-01-07 17:49:17 -0800863 readfds ? (fd_set *) ldpw->rd_bitmap : NULL,
864 writefds ? (fd_set *) ldpw->wr_bitmap : NULL,
865 exceptfds ? (fd_set *) ldpw->ex_bitmap : NULL,
866 &libc_tspec, sigmask);
867 if (rv > 0)
868 {
869 ldp_select_libc_map_merge (ldpw->rd_bitmap, readfds);
870 ldp_select_libc_map_merge (ldpw->wr_bitmap, writefds);
871 ldp_select_libc_map_merge (ldpw->ex_bitmap, exceptfds);
872 bits_set += rv;
873 }
874 }
875
876 if (bits_set)
877 {
878 rv = bits_set;
879 goto done;
Dave Wallace048b1d62018-01-03 22:24:41 -0500880 }
881 }
Florin Corasdfe4cf42018-11-28 22:13:45 -0800882 while ((time_out == -1) || (clib_time_now (&ldpw->clib_time) < time_out));
Dave Wallace048b1d62018-01-03 22:24:41 -0500883 rv = 0;
884
885done:
886 /* TBD: set timeout to amount of time left */
Florin Corasdfe4cf42018-11-28 22:13:45 -0800887 clib_bitmap_zero (ldpw->rd_bitmap);
Florin Coras294afe22019-01-07 17:49:17 -0800888 clib_bitmap_zero (ldpw->si_rd_bitmap);
Florin Corasdfe4cf42018-11-28 22:13:45 -0800889 clib_bitmap_zero (ldpw->libc_rd_bitmap);
890 clib_bitmap_zero (ldpw->wr_bitmap);
Florin Coras294afe22019-01-07 17:49:17 -0800891 clib_bitmap_zero (ldpw->si_wr_bitmap);
Florin Corasdfe4cf42018-11-28 22:13:45 -0800892 clib_bitmap_zero (ldpw->libc_wr_bitmap);
893 clib_bitmap_zero (ldpw->ex_bitmap);
Florin Coras294afe22019-01-07 17:49:17 -0800894 clib_bitmap_zero (ldpw->si_ex_bitmap);
Florin Corasdfe4cf42018-11-28 22:13:45 -0800895 clib_bitmap_zero (ldpw->libc_ex_bitmap);
Dave Wallace048b1d62018-01-03 22:24:41 -0500896
Dave Wallace048b1d62018-01-03 22:24:41 -0500897 return rv;
898}
899
900int
901select (int nfds, fd_set * __restrict readfds,
902 fd_set * __restrict writefds,
903 fd_set * __restrict exceptfds, struct timeval *__restrict timeout)
904{
905 struct timespec tspec;
906
907 if (timeout)
908 {
909 tspec.tv_sec = timeout->tv_sec;
910 tspec.tv_nsec = timeout->tv_usec * 1000;
911 }
Dave Wallace2a865272018-02-07 21:00:42 -0500912 return ldp_pselect (nfds, readfds, writefds, exceptfds,
913 timeout ? &tspec : NULL, NULL);
Dave Wallace048b1d62018-01-03 22:24:41 -0500914}
915
916#ifdef __USE_XOPEN2K
917int
918pselect (int nfds, fd_set * __restrict readfds,
919 fd_set * __restrict writefds,
920 fd_set * __restrict exceptfds,
921 const struct timespec *__restrict timeout,
922 const __sigset_t * __restrict sigmask)
923{
Dave Wallace2a865272018-02-07 21:00:42 -0500924 return ldp_pselect (nfds, readfds, writefds, exceptfds, timeout, 0);
Dave Wallace048b1d62018-01-03 22:24:41 -0500925}
926#endif
927
Yu Ping7b74b072019-05-08 00:40:24 +0800928/* If transparent TLS mode is turned on, then ldp will load key and cert.
929 */
930static int
Florin Corasa5a9efd2021-01-05 17:03:29 -0800931load_cert_key_pair (void)
Yu Ping7b74b072019-05-08 00:40:24 +0800932{
Florin Corasa5a9efd2021-01-05 17:03:29 -0800933 char *cert_str = getenv (LDP_ENV_TLS_CERT);
934 char *key_str = getenv (LDP_ENV_TLS_KEY);
935 char cert_buf[4096], key_buf[4096];
936 int cert_size, key_size;
937 vppcom_cert_key_pair_t crypto;
938 int ckp_index;
Yu Ping7b74b072019-05-08 00:40:24 +0800939 FILE *fp;
940
Florin Corasa5a9efd2021-01-05 17:03:29 -0800941 if (!cert_str || !key_str)
Yu Ping7b74b072019-05-08 00:40:24 +0800942 {
943 LDBG (0, "ERROR: failed to read LDP environment %s\n",
944 LDP_ENV_TLS_CERT);
945 return -1;
946 }
Florin Corasa5a9efd2021-01-05 17:03:29 -0800947
948 fp = fopen (cert_str, "r");
949 if (fp == NULL)
950 {
951 LDBG (0, "ERROR: failed to open cert file %s \n", cert_str);
952 return -1;
953 }
954 cert_size = fread (cert_buf, sizeof (char), sizeof (cert_buf), fp);
955 fclose (fp);
956
957 fp = fopen (key_str, "r");
958 if (fp == NULL)
959 {
960 LDBG (0, "ERROR: failed to open key file %s \n", key_str);
961 return -1;
962 }
963 key_size = fread (key_buf, sizeof (char), sizeof (key_buf), fp);
964 fclose (fp);
965
966 crypto.cert = cert_buf;
967 crypto.key = key_buf;
968 crypto.cert_len = cert_size;
969 crypto.key_len = key_size;
970 ckp_index = vppcom_add_cert_key_pair (&crypto);
971 if (ckp_index < 0)
972 {
973 LDBG (0, "ERROR: failed to add cert key pair\n");
974 return -1;
975 }
976
977 ldp->ckpair_index = ckp_index;
978
Yu Ping7b74b072019-05-08 00:40:24 +0800979 return 0;
980}
981
982static int
Florin Corasa5a9efd2021-01-05 17:03:29 -0800983assign_cert_key_pair (vls_handle_t vlsh)
Yu Ping7b74b072019-05-08 00:40:24 +0800984{
Florin Corasa5a9efd2021-01-05 17:03:29 -0800985 uint32_t ckp_len;
Yu Ping7b74b072019-05-08 00:40:24 +0800986
Florin Corasa5a9efd2021-01-05 17:03:29 -0800987 if (ldp->ckpair_index == ~0 && load_cert_key_pair () < 0)
988 return -1;
989
990 ckp_len = sizeof (ldp->ckpair_index);
liuyacan276675e2021-08-30 13:24:53 +0800991 return vls_attr (vlsh, VPPCOM_ATTR_SET_CKPAIR, &ldp->ckpair_index, &ckp_len);
Yu Ping7b74b072019-05-08 00:40:24 +0800992}
993
Dave Wallace048b1d62018-01-03 22:24:41 -0500994int
995socket (int domain, int type, int protocol)
996{
Florin Coras7baeb712019-01-04 17:05:43 -0800997 int rv, sock_type = type & ~(SOCK_CLOEXEC | SOCK_NONBLOCK);
Dave Wallace048b1d62018-01-03 22:24:41 -0500998 u8 is_nonblocking = type & SOCK_NONBLOCK ? 1 : 0;
Florin Coras7baeb712019-01-04 17:05:43 -0800999 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05001000
Florin Coras5f33d0d2021-06-02 21:22:21 -07001001 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001002
1003 if (((domain == AF_INET) || (domain == AF_INET6)) &&
1004 ((sock_type == SOCK_STREAM) || (sock_type == SOCK_DGRAM)))
1005 {
Yu Ping7b74b072019-05-08 00:40:24 +08001006 u8 proto;
1007 if (ldp->transparent_tls)
1008 {
1009 proto = VPPCOM_PROTO_TLS;
1010 }
1011 else
1012 proto = ((sock_type == SOCK_DGRAM) ?
1013 VPPCOM_PROTO_UDP : VPPCOM_PROTO_TCP);
Dave Wallace048b1d62018-01-03 22:24:41 -05001014
Florin Coras7baeb712019-01-04 17:05:43 -08001015 LDBG (0, "calling vls_create: proto %u (%s), is_nonblocking %u",
1016 proto, vppcom_proto_str (proto), is_nonblocking);
Dave Wallace048b1d62018-01-03 22:24:41 -05001017
Florin Coras7baeb712019-01-04 17:05:43 -08001018 vlsh = vls_create (proto, is_nonblocking);
1019 if (vlsh < 0)
Dave Wallace048b1d62018-01-03 22:24:41 -05001020 {
Florin Coras7baeb712019-01-04 17:05:43 -08001021 errno = -vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05001022 rv = -1;
1023 }
1024 else
1025 {
Yu Ping7b74b072019-05-08 00:40:24 +08001026 if (ldp->transparent_tls)
1027 {
Florin Corasa5a9efd2021-01-05 17:03:29 -08001028 if (assign_cert_key_pair (vlsh) < 0)
1029 return -1;
Yu Ping7b74b072019-05-08 00:40:24 +08001030 }
Florin Coras7baeb712019-01-04 17:05:43 -08001031 rv = ldp_vlsh_to_fd (vlsh);
Dave Wallace048b1d62018-01-03 22:24:41 -05001032 }
1033 }
1034 else
1035 {
Florin Coras7baeb712019-01-04 17:05:43 -08001036 LDBG (0, "calling libc_socket");
Dave Wallace048b1d62018-01-03 22:24:41 -05001037 rv = libc_socket (domain, type, protocol);
1038 }
1039
Dave Wallace048b1d62018-01-03 22:24:41 -05001040 return rv;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001041}
1042
1043/*
1044 * Create two new sockets, of type TYPE in domain DOMAIN and using
1045 * protocol PROTOCOL, which are connected to each other, and put file
1046 * descriptors for them in FDS[0] and FDS[1]. If PROTOCOL is zero,
1047 * one will be chosen automatically.
1048 * Returns 0 on success, -1 for errors.
1049 * */
1050int
Dave Wallace048b1d62018-01-03 22:24:41 -05001051socketpair (int domain, int type, int protocol, int fds[2])
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001052{
Florin Coras7baeb712019-01-04 17:05:43 -08001053 int rv, sock_type = type & ~(SOCK_CLOEXEC | SOCK_NONBLOCK);
Dave Wallace048b1d62018-01-03 22:24:41 -05001054
Florin Coras5f33d0d2021-06-02 21:22:21 -07001055 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001056
1057 if (((domain == AF_INET) || (domain == AF_INET6)) &&
1058 ((sock_type == SOCK_STREAM) || (sock_type == SOCK_DGRAM)))
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001059 {
Florin Coras7baeb712019-01-04 17:05:43 -08001060 LDBG (0, "LDP-TBD");
Dave Wallace048b1d62018-01-03 22:24:41 -05001061 errno = ENOSYS;
1062 rv = -1;
1063 }
1064 else
1065 {
Florin Coras7baeb712019-01-04 17:05:43 -08001066 LDBG (1, "calling libc_socketpair");
Florin Coras173bae32018-11-16 18:56:28 -08001067 rv = libc_socketpair (domain, type, protocol, fds);
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001068 }
1069
Dave Wallace048b1d62018-01-03 22:24:41 -05001070 return rv;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001071}
1072
1073int
Florin Coras36847942023-02-02 12:56:16 -08001074bind (int fd, __CONST_SOCKADDR_ARG _addr, socklen_t len)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001075{
Florin Coras36847942023-02-02 12:56:16 -08001076 const struct sockaddr *addr = SOCKADDR_GET_SA (_addr);
Florin Coras7baeb712019-01-04 17:05:43 -08001077 vls_handle_t vlsh;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001078 int rv;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001079
Florin Coras5f33d0d2021-06-02 21:22:21 -07001080 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001081
Florin Coras7baeb712019-01-04 17:05:43 -08001082 vlsh = ldp_fd_to_vlsh (fd);
1083 if (vlsh != VLS_INVALID_HANDLE)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001084 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001085 vppcom_endpt_t ep;
1086
Dave Wallace048b1d62018-01-03 22:24:41 -05001087 switch (addr->sa_family)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001088 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001089 case AF_INET:
1090 if (len != sizeof (struct sockaddr_in))
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001091 {
Florin Coras7baeb712019-01-04 17:05:43 -08001092 LDBG (0, "ERROR: fd %d: vlsh %u: Invalid AF_INET addr len %u!",
1093 fd, vlsh, len);
Dave Wallace048b1d62018-01-03 22:24:41 -05001094 errno = EINVAL;
1095 rv = -1;
1096 goto done;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001097 }
Dave Wallace048b1d62018-01-03 22:24:41 -05001098 ep.is_ip4 = VPPCOM_IS_IP4;
1099 ep.ip = (u8 *) & ((const struct sockaddr_in *) addr)->sin_addr;
1100 ep.port = (u16) ((const struct sockaddr_in *) addr)->sin_port;
1101 break;
1102
1103 case AF_INET6:
1104 if (len != sizeof (struct sockaddr_in6))
1105 {
Florin Coras7baeb712019-01-04 17:05:43 -08001106 LDBG (0, "ERROR: fd %d: vlsh %u: Invalid AF_INET6 addr len %u!",
1107 fd, vlsh, len);
Dave Wallace048b1d62018-01-03 22:24:41 -05001108 errno = EINVAL;
1109 rv = -1;
1110 goto done;
1111 }
1112 ep.is_ip4 = VPPCOM_IS_IP6;
1113 ep.ip = (u8 *) & ((const struct sockaddr_in6 *) addr)->sin6_addr;
1114 ep.port = (u16) ((const struct sockaddr_in6 *) addr)->sin6_port;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001115 break;
1116
1117 default:
Florin Coras7baeb712019-01-04 17:05:43 -08001118 LDBG (0, "ERROR: fd %d: vlsh %u: Unsupported address family %u!",
1119 fd, vlsh, addr->sa_family);
Dave Wallace048b1d62018-01-03 22:24:41 -05001120 errno = EAFNOSUPPORT;
1121 rv = -1;
1122 goto done;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001123 }
Florin Coras7baeb712019-01-04 17:05:43 -08001124 LDBG (0, "fd %d: calling vls_bind: vlsh %u, addr %p, len %u", fd, vlsh,
1125 addr, len);
Dave Wallace048b1d62018-01-03 22:24:41 -05001126
Florin Coras7baeb712019-01-04 17:05:43 -08001127 rv = vls_bind (vlsh, &ep);
Dave Wallace048b1d62018-01-03 22:24:41 -05001128 if (rv != VPPCOM_OK)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001129 {
1130 errno = -rv;
Dave Wallace048b1d62018-01-03 22:24:41 -05001131 rv = -1;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001132 }
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001133 }
Dave Wallace048b1d62018-01-03 22:24:41 -05001134 else
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001135 {
Florin Coras7baeb712019-01-04 17:05:43 -08001136 LDBG (0, "fd %d: calling libc_bind: addr %p, len %u", fd, addr, len);
Dave Wallace048b1d62018-01-03 22:24:41 -05001137 rv = libc_bind (fd, addr, len);
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001138 }
1139
Dave Wallace048b1d62018-01-03 22:24:41 -05001140done:
Florin Coras7baeb712019-01-04 17:05:43 -08001141 LDBG (1, "fd %d: returning %d", fd, rv);
Florin Coras05ecfcc2018-12-12 18:19:39 -08001142
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001143 return rv;
1144}
1145
1146static inline int
Florin Coras36847942023-02-02 12:56:16 -08001147ldp_copy_ep_to_sockaddr (struct sockaddr *addr, socklen_t *__restrict len,
1148 vppcom_endpt_t *ep)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001149{
Florin Coras36847942023-02-02 12:56:16 -08001150 int rv = 0, sa_len, copy_len;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001151
Florin Coras5f33d0d2021-06-02 21:22:21 -07001152 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001153
1154 if (addr && len && ep)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001155 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001156 addr->sa_family = (ep->is_ip4 == VPPCOM_IS_IP4) ? AF_INET : AF_INET6;
1157 switch (addr->sa_family)
1158 {
1159 case AF_INET:
1160 ((struct sockaddr_in *) addr)->sin_port = ep->port;
1161 if (*len > sizeof (struct sockaddr_in))
1162 *len = sizeof (struct sockaddr_in);
1163 sa_len = sizeof (struct sockaddr_in) - sizeof (struct in_addr);
1164 copy_len = *len - sa_len;
1165 if (copy_len > 0)
1166 memcpy (&((struct sockaddr_in *) addr)->sin_addr, ep->ip,
1167 copy_len);
1168 break;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001169
Dave Wallace048b1d62018-01-03 22:24:41 -05001170 case AF_INET6:
1171 ((struct sockaddr_in6 *) addr)->sin6_port = ep->port;
1172 if (*len > sizeof (struct sockaddr_in6))
1173 *len = sizeof (struct sockaddr_in6);
1174 sa_len = sizeof (struct sockaddr_in6) - sizeof (struct in6_addr);
1175 copy_len = *len - sa_len;
1176 if (copy_len > 0)
1177 memcpy (((struct sockaddr_in6 *) addr)->sin6_addr.
1178 __in6_u.__u6_addr8, ep->ip, copy_len);
1179 break;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001180
Dave Wallace048b1d62018-01-03 22:24:41 -05001181 default:
1182 /* Not possible */
1183 rv = -EAFNOSUPPORT;
1184 break;
1185 }
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001186 }
Dave Wallacee695cb42017-11-02 22:04:42 -04001187 return rv;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001188}
1189
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001190int
Florin Coras36847942023-02-02 12:56:16 -08001191getsockname (int fd, __SOCKADDR_ARG _addr, socklen_t *__restrict len)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001192{
Florin Coras36847942023-02-02 12:56:16 -08001193 struct sockaddr *addr = SOCKADDR_GET_SA (_addr);
Florin Coras7baeb712019-01-04 17:05:43 -08001194 vls_handle_t vlsh;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001195 int rv;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001196
Florin Coras5f33d0d2021-06-02 21:22:21 -07001197 ldp_init_check ();
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001198
Florin Coras7baeb712019-01-04 17:05:43 -08001199 vlsh = ldp_fd_to_vlsh (fd);
1200 if (vlsh != VLS_INVALID_HANDLE)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001201 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001202 vppcom_endpt_t ep;
1203 u8 addr_buf[sizeof (struct in6_addr)];
1204 u32 size = sizeof (ep);
1205
1206 ep.ip = addr_buf;
Dave Wallace048b1d62018-01-03 22:24:41 -05001207
Florin Coras7baeb712019-01-04 17:05:43 -08001208 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_LCL_ADDR, &ep, &size);
Dave Wallace048b1d62018-01-03 22:24:41 -05001209 if (rv != VPPCOM_OK)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001210 {
1211 errno = -rv;
Dave Wallace048b1d62018-01-03 22:24:41 -05001212 rv = -1;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001213 }
Dave Wallace048b1d62018-01-03 22:24:41 -05001214 else
1215 {
Dave Wallace2a865272018-02-07 21:00:42 -05001216 rv = ldp_copy_ep_to_sockaddr (addr, len, &ep);
Dave Wallace048b1d62018-01-03 22:24:41 -05001217 if (rv != VPPCOM_OK)
1218 {
1219 errno = -rv;
1220 rv = -1;
1221 }
1222 }
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001223 }
1224 else
1225 {
Florin Coras36847942023-02-02 12:56:16 -08001226 rv = libc_getsockname (fd, _addr, len);
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001227 }
1228
Dave Wallace048b1d62018-01-03 22:24:41 -05001229 return rv;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001230}
1231
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001232int
Florin Coras36847942023-02-02 12:56:16 -08001233connect (int fd, __CONST_SOCKADDR_ARG _addr, socklen_t len)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001234{
Florin Coras36847942023-02-02 12:56:16 -08001235 const struct sockaddr *addr = SOCKADDR_GET_SA (_addr);
Florin Coras7baeb712019-01-04 17:05:43 -08001236 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05001237 int rv;
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07001238
Florin Coras5f33d0d2021-06-02 21:22:21 -07001239 ldp_init_check ();
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07001240
Dave Wallace048b1d62018-01-03 22:24:41 -05001241 if (!addr)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001242 {
Florin Coras7baeb712019-01-04 17:05:43 -08001243 LDBG (0, "ERROR: fd %d: NULL addr, len %u", fd, len);
Dave Wallace048b1d62018-01-03 22:24:41 -05001244 errno = EINVAL;
1245 rv = -1;
1246 goto done;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001247 }
1248
Florin Coras7baeb712019-01-04 17:05:43 -08001249 vlsh = ldp_fd_to_vlsh (fd);
1250 if (vlsh != VLS_INVALID_HANDLE)
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07001251 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001252 vppcom_endpt_t ep;
1253
Dave Wallace048b1d62018-01-03 22:24:41 -05001254 switch (addr->sa_family)
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07001255 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001256 case AF_INET:
1257 if (len != sizeof (struct sockaddr_in))
1258 {
Florin Coras7baeb712019-01-04 17:05:43 -08001259 LDBG (0, "fd %d: ERROR vlsh %u: Invalid AF_INET addr len %u!",
1260 fd, vlsh, len);
Dave Wallace048b1d62018-01-03 22:24:41 -05001261 errno = EINVAL;
1262 rv = -1;
1263 goto done;
1264 }
1265 ep.is_ip4 = VPPCOM_IS_IP4;
1266 ep.ip = (u8 *) & ((const struct sockaddr_in *) addr)->sin_addr;
1267 ep.port = (u16) ((const struct sockaddr_in *) addr)->sin_port;
1268 break;
1269
1270 case AF_INET6:
1271 if (len != sizeof (struct sockaddr_in6))
1272 {
Florin Coras7baeb712019-01-04 17:05:43 -08001273 LDBG (0, "fd %d: ERROR vlsh %u: Invalid AF_INET6 addr len %u!",
1274 fd, vlsh, len);
Dave Wallace048b1d62018-01-03 22:24:41 -05001275 errno = EINVAL;
1276 rv = -1;
1277 goto done;
1278 }
1279 ep.is_ip4 = VPPCOM_IS_IP6;
1280 ep.ip = (u8 *) & ((const struct sockaddr_in6 *) addr)->sin6_addr;
1281 ep.port = (u16) ((const struct sockaddr_in6 *) addr)->sin6_port;
1282 break;
1283
1284 default:
Florin Coras7baeb712019-01-04 17:05:43 -08001285 LDBG (0, "fd %d: ERROR vlsh %u: Unsupported address family %u!",
1286 fd, vlsh, addr->sa_family);
Dave Wallace048b1d62018-01-03 22:24:41 -05001287 errno = EAFNOSUPPORT;
1288 rv = -1;
1289 goto done;
1290 }
Florin Coras7baeb712019-01-04 17:05:43 -08001291 LDBG (0, "fd %d: calling vls_connect(): vlsh %u addr %p len %u", fd,
1292 vlsh, addr, len);
Dave Wallace048b1d62018-01-03 22:24:41 -05001293
Florin Coras7baeb712019-01-04 17:05:43 -08001294 rv = vls_connect (vlsh, &ep);
Dave Wallace048b1d62018-01-03 22:24:41 -05001295 if (rv != VPPCOM_OK)
1296 {
1297 errno = -rv;
1298 rv = -1;
1299 }
1300 }
1301 else
1302 {
Florin Coras7baeb712019-01-04 17:05:43 -08001303 LDBG (0, "fd %d: calling libc_connect(): addr %p, len %u",
1304 fd, addr, len);
Dave Wallace048b1d62018-01-03 22:24:41 -05001305
1306 rv = libc_connect (fd, addr, len);
1307 }
1308
1309done:
Florin Coras7baeb712019-01-04 17:05:43 -08001310 LDBG (1, "fd %d: returning %d (0x%x)", fd, rv, rv);
Dave Wallace048b1d62018-01-03 22:24:41 -05001311 return rv;
1312}
1313
1314int
Florin Coras36847942023-02-02 12:56:16 -08001315getpeername (int fd, __SOCKADDR_ARG _addr, socklen_t *__restrict len)
Dave Wallace048b1d62018-01-03 22:24:41 -05001316{
Florin Coras36847942023-02-02 12:56:16 -08001317 struct sockaddr *addr = SOCKADDR_GET_SA (_addr);
Florin Coras7baeb712019-01-04 17:05:43 -08001318 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05001319 int rv;
Dave Wallace048b1d62018-01-03 22:24:41 -05001320
Florin Coras5f33d0d2021-06-02 21:22:21 -07001321 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001322
Florin Coras7baeb712019-01-04 17:05:43 -08001323 vlsh = ldp_fd_to_vlsh (fd);
1324 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05001325 {
1326 vppcom_endpt_t ep;
1327 u8 addr_buf[sizeof (struct in6_addr)];
1328 u32 size = sizeof (ep);
1329
1330 ep.ip = addr_buf;
Florin Coras7baeb712019-01-04 17:05:43 -08001331 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_PEER_ADDR, &ep, &size);
Dave Wallace048b1d62018-01-03 22:24:41 -05001332 if (rv != VPPCOM_OK)
1333 {
1334 errno = -rv;
1335 rv = -1;
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07001336 }
1337 else
1338 {
Dave Wallace2a865272018-02-07 21:00:42 -05001339 rv = ldp_copy_ep_to_sockaddr (addr, len, &ep);
Dave Wallace048b1d62018-01-03 22:24:41 -05001340 if (rv != VPPCOM_OK)
1341 {
1342 errno = -rv;
1343 rv = -1;
1344 }
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07001345 }
1346 }
Dave Wallace048b1d62018-01-03 22:24:41 -05001347 else
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07001348 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001349 rv = libc_getpeername (fd, addr, len);
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07001350 }
1351
Dave Wallace048b1d62018-01-03 22:24:41 -05001352 return rv;
1353}
1354
1355ssize_t
1356send (int fd, const void *buf, size_t n, int flags)
1357{
Florin Coras7baeb712019-01-04 17:05:43 -08001358 vls_handle_t vlsh = ldp_fd_to_vlsh (fd);
Dave Wallace048b1d62018-01-03 22:24:41 -05001359 ssize_t size;
Dave Wallace048b1d62018-01-03 22:24:41 -05001360
Florin Coras5f33d0d2021-06-02 21:22:21 -07001361 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001362
Florin Coras7baeb712019-01-04 17:05:43 -08001363 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05001364 {
Florin Coras7baeb712019-01-04 17:05:43 -08001365 size = vls_sendto (vlsh, (void *) buf, n, flags, NULL);
qchangaa8f63c2018-05-30 11:44:18 -07001366 if (size < VPPCOM_OK)
Dave Wallace048b1d62018-01-03 22:24:41 -05001367 {
1368 errno = -size;
1369 size = -1;
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07001370 }
1371 }
Dave Wallace048b1d62018-01-03 22:24:41 -05001372 else
1373 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001374 size = libc_send (fd, buf, n, flags);
1375 }
1376
Dave Wallace048b1d62018-01-03 22:24:41 -05001377 return size;
1378}
1379
1380ssize_t
1381sendfile (int out_fd, int in_fd, off_t * offset, size_t len)
1382{
Florin Corasdfe4cf42018-11-28 22:13:45 -08001383 ldp_worker_ctx_t *ldpw = ldp_worker_get_current ();
Florin Coras7baeb712019-01-04 17:05:43 -08001384 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05001385 ssize_t size = 0;
Dave Wallace048b1d62018-01-03 22:24:41 -05001386
Florin Coras5f33d0d2021-06-02 21:22:21 -07001387 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001388
Florin Coras7baeb712019-01-04 17:05:43 -08001389 vlsh = ldp_fd_to_vlsh (out_fd);
1390 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05001391 {
1392 int rv;
1393 ssize_t results = 0;
1394 size_t n_bytes_left = len;
1395 size_t bytes_to_read;
1396 int nbytes;
Dave Wallace048b1d62018-01-03 22:24:41 -05001397 u8 eagain = 0;
1398 u32 flags, flags_len = sizeof (flags);
1399
Florin Coras7baeb712019-01-04 17:05:43 -08001400 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_FLAGS, &flags, &flags_len);
Dave Wallace048b1d62018-01-03 22:24:41 -05001401 if (PREDICT_FALSE (rv != VPPCOM_OK))
1402 {
Florin Coras7baeb712019-01-04 17:05:43 -08001403 LDBG (0, "ERROR: out fd %d: vls_attr: vlsh %u, returned %d (%s)!",
1404 out_fd, vlsh, rv, vppcom_retval_str (rv));
Dave Wallace048b1d62018-01-03 22:24:41 -05001405
Florin Corasdfe4cf42018-11-28 22:13:45 -08001406 vec_reset_length (ldpw->io_buffer);
Dave Wallace048b1d62018-01-03 22:24:41 -05001407 errno = -rv;
1408 size = -1;
1409 goto done;
1410 }
1411
1412 if (offset)
1413 {
1414 off_t off = lseek (in_fd, *offset, SEEK_SET);
1415 if (PREDICT_FALSE (off == -1))
1416 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001417 size = -1;
1418 goto done;
1419 }
1420
1421 ASSERT (off == *offset);
1422 }
1423
1424 do
1425 {
Florin Coras7baeb712019-01-04 17:05:43 -08001426 size = vls_attr (vlsh, VPPCOM_ATTR_GET_NWRITE, 0, 0);
Dave Wallace048b1d62018-01-03 22:24:41 -05001427 if (size < 0)
1428 {
Florin Coraseb801d02020-09-16 17:44:58 -07001429 LDBG (0, "ERROR: fd %d: vls_attr: vlsh %u returned %ld (%s)!",
Florin Coras7baeb712019-01-04 17:05:43 -08001430 out_fd, vlsh, size, vppcom_retval_str (size));
Florin Corasdfe4cf42018-11-28 22:13:45 -08001431 vec_reset_length (ldpw->io_buffer);
Dave Wallace048b1d62018-01-03 22:24:41 -05001432 errno = -size;
1433 size = -1;
1434 goto done;
1435 }
1436
1437 bytes_to_read = size;
Dave Wallace048b1d62018-01-03 22:24:41 -05001438 if (bytes_to_read == 0)
1439 {
1440 if (flags & O_NONBLOCK)
1441 {
1442 if (!results)
Florin Coras7baeb712019-01-04 17:05:43 -08001443 eagain = 1;
Dave Wallace048b1d62018-01-03 22:24:41 -05001444 goto update_offset;
1445 }
1446 else
1447 continue;
1448 }
1449 bytes_to_read = clib_min (n_bytes_left, bytes_to_read);
Florin Corasdfe4cf42018-11-28 22:13:45 -08001450 vec_validate (ldpw->io_buffer, bytes_to_read);
1451 nbytes = libc_read (in_fd, ldpw->io_buffer, bytes_to_read);
Dave Wallace048b1d62018-01-03 22:24:41 -05001452 if (nbytes < 0)
1453 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001454 if (results == 0)
1455 {
Florin Corasdfe4cf42018-11-28 22:13:45 -08001456 vec_reset_length (ldpw->io_buffer);
Dave Wallace048b1d62018-01-03 22:24:41 -05001457 size = -1;
1458 goto done;
1459 }
1460 goto update_offset;
1461 }
Dave Wallace048b1d62018-01-03 22:24:41 -05001462
Florin Coras7baeb712019-01-04 17:05:43 -08001463 size = vls_write (vlsh, ldpw->io_buffer, nbytes);
Dave Wallace048b1d62018-01-03 22:24:41 -05001464 if (size < 0)
1465 {
1466 if (size == VPPCOM_EAGAIN)
1467 {
1468 if (flags & O_NONBLOCK)
1469 {
1470 if (!results)
Florin Coras7baeb712019-01-04 17:05:43 -08001471 eagain = 1;
Dave Wallace048b1d62018-01-03 22:24:41 -05001472 goto update_offset;
1473 }
1474 else
1475 continue;
1476 }
Dave Wallace048b1d62018-01-03 22:24:41 -05001477 if (results == 0)
1478 {
Florin Corasdfe4cf42018-11-28 22:13:45 -08001479 vec_reset_length (ldpw->io_buffer);
Dave Wallace048b1d62018-01-03 22:24:41 -05001480 errno = -size;
1481 size = -1;
1482 goto done;
1483 }
1484 goto update_offset;
1485 }
1486
1487 results += nbytes;
1488 ASSERT (n_bytes_left >= nbytes);
1489 n_bytes_left = n_bytes_left - nbytes;
1490 }
1491 while (n_bytes_left > 0);
1492
1493 update_offset:
Florin Corasdfe4cf42018-11-28 22:13:45 -08001494 vec_reset_length (ldpw->io_buffer);
Dave Wallace048b1d62018-01-03 22:24:41 -05001495 if (offset)
1496 {
1497 off_t off = lseek (in_fd, *offset, SEEK_SET);
1498 if (PREDICT_FALSE (off == -1))
1499 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001500 size = -1;
1501 goto done;
1502 }
1503
1504 ASSERT (off == *offset);
1505 *offset += results + 1;
1506 }
1507 if (eagain)
1508 {
1509 errno = EAGAIN;
1510 size = -1;
1511 }
1512 else
1513 size = results;
1514 }
1515 else
1516 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001517 size = libc_sendfile (out_fd, in_fd, offset, len);
1518 }
1519
1520done:
Dave Wallace048b1d62018-01-03 22:24:41 -05001521 return size;
1522}
1523
1524ssize_t
1525sendfile64 (int out_fd, int in_fd, off_t * offset, size_t len)
1526{
1527 return sendfile (out_fd, in_fd, offset, len);
1528}
1529
1530ssize_t
1531recv (int fd, void *buf, size_t n, int flags)
1532{
Florin Coras7baeb712019-01-04 17:05:43 -08001533 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05001534 ssize_t size;
Dave Wallace048b1d62018-01-03 22:24:41 -05001535
Florin Coras5f33d0d2021-06-02 21:22:21 -07001536 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001537
Florin Coras7baeb712019-01-04 17:05:43 -08001538 vlsh = ldp_fd_to_vlsh (fd);
1539 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05001540 {
Florin Coras7baeb712019-01-04 17:05:43 -08001541 size = vls_recvfrom (vlsh, buf, n, flags, NULL);
Dave Wallace048b1d62018-01-03 22:24:41 -05001542 if (size < 0)
Florin Coras2a6642e2020-03-24 15:24:29 +00001543 {
1544 errno = -size;
1545 size = -1;
1546 }
Dave Wallace048b1d62018-01-03 22:24:41 -05001547 }
1548 else
1549 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001550 size = libc_recv (fd, buf, n, flags);
1551 }
1552
Dave Wallace048b1d62018-01-03 22:24:41 -05001553 return size;
1554}
1555
Sivaprasad Tummalafdcbd382021-07-31 21:38:19 +05301556ssize_t
1557__recv_chk (int fd, void *buf, size_t n, size_t buflen, int flags)
1558{
1559 if (n > buflen)
1560 return -1;
1561
1562 return recv (fd, buf, n, flags);
1563}
1564
Dou Chao243a0432022-11-29 19:41:34 +08001565static inline int
1566ldp_vls_sendo (vls_handle_t vlsh, const void *buf, size_t n,
Florin Coraseff5f7a2023-02-07 17:36:17 -08001567 vppcom_endpt_tlv_t *app_tlvs, int flags,
Florin Coras36847942023-02-02 12:56:16 -08001568 __CONST_SOCKADDR_ARG _addr, socklen_t addr_len)
Florin Corasce17f462020-05-22 20:36:29 +00001569{
Florin Coras36847942023-02-02 12:56:16 -08001570 const struct sockaddr *addr = SOCKADDR_GET_SA (_addr);
Florin Corasce17f462020-05-22 20:36:29 +00001571 vppcom_endpt_t *ep = 0;
1572 vppcom_endpt_t _ep;
1573
Florin Coraseff5f7a2023-02-07 17:36:17 -08001574 _ep.app_tlvs = app_tlvs;
Dou Chao243a0432022-11-29 19:41:34 +08001575
Florin Corasce17f462020-05-22 20:36:29 +00001576 if (addr)
1577 {
1578 ep = &_ep;
1579 switch (addr->sa_family)
1580 {
1581 case AF_INET:
1582 ep->is_ip4 = VPPCOM_IS_IP4;
1583 ep->ip =
1584 (uint8_t *) & ((const struct sockaddr_in *) addr)->sin_addr;
1585 ep->port = (uint16_t) ((const struct sockaddr_in *) addr)->sin_port;
1586 break;
1587
1588 case AF_INET6:
1589 ep->is_ip4 = VPPCOM_IS_IP6;
1590 ep->ip =
1591 (uint8_t *) & ((const struct sockaddr_in6 *) addr)->sin6_addr;
1592 ep->port =
1593 (uint16_t) ((const struct sockaddr_in6 *) addr)->sin6_port;
1594 break;
1595
1596 default:
1597 return EAFNOSUPPORT;
1598 }
1599 }
1600
1601 return vls_sendto (vlsh, (void *) buf, n, flags, ep);
1602}
1603
1604static int
Florin Coras36847942023-02-02 12:56:16 -08001605ldp_vls_recvfrom (vls_handle_t vlsh, void *__restrict buf, size_t n, int flags,
1606 __SOCKADDR_ARG _addr, socklen_t *__restrict addr_len)
Florin Corasce17f462020-05-22 20:36:29 +00001607{
1608 u8 src_addr[sizeof (struct sockaddr_in6)];
Florin Coras36847942023-02-02 12:56:16 -08001609 struct sockaddr *addr = SOCKADDR_GET_SA (_addr);
Florin Corasce17f462020-05-22 20:36:29 +00001610 vppcom_endpt_t ep;
1611 ssize_t size;
1612 int rv;
1613
1614 if (addr)
1615 {
1616 ep.ip = src_addr;
1617 size = vls_recvfrom (vlsh, buf, n, flags, &ep);
1618
1619 if (size > 0)
1620 {
1621 rv = ldp_copy_ep_to_sockaddr (addr, addr_len, &ep);
1622 if (rv < 0)
1623 size = rv;
1624 }
1625 }
1626 else
1627 size = vls_recvfrom (vlsh, buf, n, flags, NULL);
1628
1629 return size;
1630}
1631
Dave Wallace048b1d62018-01-03 22:24:41 -05001632ssize_t
1633sendto (int fd, const void *buf, size_t n, int flags,
Florin Coras36847942023-02-02 12:56:16 -08001634 __CONST_SOCKADDR_ARG _addr, socklen_t addr_len)
Dave Wallace048b1d62018-01-03 22:24:41 -05001635{
Florin Coras36847942023-02-02 12:56:16 -08001636 const struct sockaddr *addr = SOCKADDR_GET_SA (_addr);
Florin Coras7baeb712019-01-04 17:05:43 -08001637 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05001638 ssize_t size;
Dave Wallace048b1d62018-01-03 22:24:41 -05001639
Florin Coras5f33d0d2021-06-02 21:22:21 -07001640 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001641
Florin Coras7baeb712019-01-04 17:05:43 -08001642 vlsh = ldp_fd_to_vlsh (fd);
wanghanlin97c6e0d2021-07-06 15:01:48 +08001643 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05001644 {
Dou Chao243a0432022-11-29 19:41:34 +08001645 size = ldp_vls_sendo (vlsh, buf, n, NULL, flags, addr, addr_len);
Dave Wallace048b1d62018-01-03 22:24:41 -05001646 if (size < 0)
1647 {
1648 errno = -size;
1649 size = -1;
1650 }
1651 }
1652 else
1653 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001654 size = libc_sendto (fd, buf, n, flags, addr, addr_len);
1655 }
1656
Dave Wallace048b1d62018-01-03 22:24:41 -05001657 return size;
1658}
1659
1660ssize_t
1661recvfrom (int fd, void *__restrict buf, size_t n, int flags,
1662 __SOCKADDR_ARG addr, socklen_t * __restrict addr_len)
1663{
Florin Corasce17f462020-05-22 20:36:29 +00001664 vls_handle_t vlsh;
1665 ssize_t size;
Dave Wallace048b1d62018-01-03 22:24:41 -05001666
Florin Coras5f33d0d2021-06-02 21:22:21 -07001667 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001668
Florin Corasce17f462020-05-22 20:36:29 +00001669 vlsh = ldp_fd_to_vlsh (fd);
1670 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05001671 {
Florin Corasce17f462020-05-22 20:36:29 +00001672 size = ldp_vls_recvfrom (vlsh, buf, n, flags, addr, addr_len);
Dave Wallace048b1d62018-01-03 22:24:41 -05001673 if (size < 0)
1674 {
1675 errno = -size;
1676 size = -1;
1677 }
1678 }
1679 else
1680 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001681 size = libc_recvfrom (fd, buf, n, flags, addr, addr_len);
1682 }
1683
Dave Wallace048b1d62018-01-03 22:24:41 -05001684 return size;
1685}
1686
Florin Coraseff5f7a2023-02-07 17:36:17 -08001687static int
1688ldp_parse_cmsg (vls_handle_t vlsh, const struct msghdr *msg,
1689 vppcom_endpt_tlv_t **app_tlvs)
1690{
1691 uint8_t *ad, *at = (uint8_t *) *app_tlvs;
1692 vppcom_endpt_tlv_t *adh;
1693 struct in_pktinfo *pi;
1694 struct cmsghdr *cmsg;
1695
1696 cmsg = CMSG_FIRSTHDR (msg);
1697
1698 while (cmsg != NULL)
1699 {
1700 switch (cmsg->cmsg_level)
1701 {
1702 case SOL_UDP:
1703 switch (cmsg->cmsg_type)
1704 {
1705 case UDP_SEGMENT:
1706 vec_add2 (at, adh, sizeof (*adh));
1707 adh->data_type = VCL_UDP_SEGMENT;
1708 adh->data_len = sizeof (uint16_t);
1709 vec_add2 (at, ad, sizeof (uint16_t));
1710 *(uint16_t *) ad = *(uint16_t *) CMSG_DATA (cmsg);
1711 break;
1712 default:
1713 LDBG (1, "SOL_UDP cmsg_type %u not supported", cmsg->cmsg_type);
1714 break;
1715 }
1716 break;
1717 case SOL_IP:
1718 switch (cmsg->cmsg_type)
1719 {
1720 case IP_PKTINFO:
1721 vec_add2 (at, adh, sizeof (*adh));
1722 adh->data_type = VCL_IP_PKTINFO;
1723 adh->data_len = sizeof (struct in_addr);
1724 vec_add2 (at, ad, sizeof (struct in_addr));
1725 pi = (void *) CMSG_DATA (cmsg);
1726 clib_memcpy_fast (ad, &pi->ipi_spec_dst,
1727 sizeof (struct in_addr));
1728 break;
1729 default:
1730 LDBG (1, "SOL_IP cmsg_type %u not supported", cmsg->cmsg_type);
1731 break;
1732 }
1733 break;
1734 default:
1735 LDBG (1, "cmsg_level %u not supported", cmsg->cmsg_level);
1736 break;
1737 }
1738 cmsg = CMSG_NXTHDR ((struct msghdr *) msg, cmsg);
1739 }
1740 *app_tlvs = (vppcom_endpt_tlv_t *) at;
1741 return 0;
1742}
1743
1744static int
1745ldp_make_cmsg (vls_handle_t vlsh, struct msghdr *msg)
1746{
1747 u32 optval, optlen = sizeof (optval);
1748 struct cmsghdr *cmsg;
1749
1750 cmsg = CMSG_FIRSTHDR (msg);
Steven Luong2da272e2023-07-18 23:25:15 -07001751 memset (cmsg, 0, sizeof (*cmsg));
Florin Coraseff5f7a2023-02-07 17:36:17 -08001752
1753 if (!vls_attr (vlsh, VPPCOM_ATTR_GET_IP_PKTINFO, (void *) &optval, &optlen))
1754 return 0;
1755
1756 if (optval)
1757 {
1758 vppcom_endpt_t ep;
1759 u8 addr_buf[sizeof (struct in_addr)];
1760 u32 size = sizeof (ep);
1761
1762 ep.ip = addr_buf;
1763
1764 if (!vls_attr (vlsh, VPPCOM_ATTR_GET_LCL_ADDR, &ep, &size))
1765 {
1766 struct in_pktinfo pi = {};
1767
1768 clib_memcpy (&pi.ipi_addr, ep.ip, sizeof (struct in_addr));
1769 cmsg->cmsg_level = SOL_IP;
1770 cmsg->cmsg_type = IP_PKTINFO;
1771 cmsg->cmsg_len = CMSG_LEN (sizeof (pi));
1772 clib_memcpy (CMSG_DATA (cmsg), &pi, sizeof (pi));
1773 }
1774 }
1775
1776 return 0;
1777}
1778
Dave Wallace048b1d62018-01-03 22:24:41 -05001779ssize_t
Florin Corasce17f462020-05-22 20:36:29 +00001780sendmsg (int fd, const struct msghdr * msg, int flags)
Dave Wallace048b1d62018-01-03 22:24:41 -05001781{
Florin Coras7baeb712019-01-04 17:05:43 -08001782 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05001783 ssize_t size;
Dave Wallace048b1d62018-01-03 22:24:41 -05001784
Florin Coras5f33d0d2021-06-02 21:22:21 -07001785 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001786
Florin Coras7baeb712019-01-04 17:05:43 -08001787 vlsh = ldp_fd_to_vlsh (fd);
1788 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05001789 {
Florin Coraseff5f7a2023-02-07 17:36:17 -08001790 vppcom_endpt_tlv_t *app_tlvs = 0;
Florin Corasce17f462020-05-22 20:36:29 +00001791 struct iovec *iov = msg->msg_iov;
1792 ssize_t total = 0;
Florin Corascba1c222021-11-29 08:12:27 -08001793 int i, rv = 0;
Dou Chao243a0432022-11-29 19:41:34 +08001794
Florin Coraseff5f7a2023-02-07 17:36:17 -08001795 ldp_parse_cmsg (vlsh, msg, &app_tlvs);
Florin Corasce17f462020-05-22 20:36:29 +00001796
1797 for (i = 0; i < msg->msg_iovlen; ++i)
1798 {
Florin Coraseff5f7a2023-02-07 17:36:17 -08001799 rv = ldp_vls_sendo (vlsh, iov[i].iov_base, iov[i].iov_len, app_tlvs,
1800 flags, msg->msg_name, msg->msg_namelen);
Florin Corasce17f462020-05-22 20:36:29 +00001801 if (rv < 0)
1802 break;
1803 else
1804 {
1805 total += rv;
1806 if (rv < iov[i].iov_len)
1807 break;
1808 }
1809 }
1810
Florin Coraseff5f7a2023-02-07 17:36:17 -08001811 vec_free (app_tlvs);
1812
Florin Corasce17f462020-05-22 20:36:29 +00001813 if (rv < 0 && total == 0)
1814 {
1815 errno = -rv;
1816 size = -1;
1817 }
1818 else
1819 size = total;
Dave Wallace048b1d62018-01-03 22:24:41 -05001820 }
1821 else
1822 {
Florin Corasce17f462020-05-22 20:36:29 +00001823 size = libc_sendmsg (fd, msg, flags);
Dave Wallace048b1d62018-01-03 22:24:41 -05001824 }
1825
Dave Wallace048b1d62018-01-03 22:24:41 -05001826 return size;
1827}
1828
Florin Coras36847942023-02-02 12:56:16 -08001829#ifdef _GNU_SOURCE
Dave Wallace048b1d62018-01-03 22:24:41 -05001830int
1831sendmmsg (int fd, struct mmsghdr *vmessages, unsigned int vlen, int flags)
1832{
1833 ssize_t size;
1834 const char *func_str;
Florin Coras7baeb712019-01-04 17:05:43 -08001835 u32 sh = ldp_fd_to_vlsh (fd);
Dave Wallace048b1d62018-01-03 22:24:41 -05001836
Florin Coras5f33d0d2021-06-02 21:22:21 -07001837 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001838
wanghanlin97c6e0d2021-07-06 15:01:48 +08001839 if (sh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05001840 {
1841 clib_warning ("LDP<%d>: LDP-TBD", getpid ());
1842 errno = ENOSYS;
1843 size = -1;
1844 }
1845 else
1846 {
1847 func_str = "libc_sendmmsg";
1848
Dave Wallace2a865272018-02-07 21:00:42 -05001849 if (LDP_DEBUG > 2)
Dave Wallace048b1d62018-01-03 22:24:41 -05001850 clib_warning ("LDP<%d>: fd %d (0x%x): calling %s(): "
1851 "vmessages %p, vlen %u, flags 0x%x",
1852 getpid (), fd, fd, func_str, vmessages, vlen, flags);
1853
1854 size = libc_sendmmsg (fd, vmessages, vlen, flags);
1855 }
1856
Dave Wallace2a865272018-02-07 21:00:42 -05001857 if (LDP_DEBUG > 2)
Dave Wallace048b1d62018-01-03 22:24:41 -05001858 {
1859 if (size < 0)
1860 {
1861 int errno_val = errno;
Dave Wallace048b1d62018-01-03 22:24:41 -05001862 clib_warning ("LDP<%d>: ERROR: fd %d (0x%x): %s() failed! "
1863 "rv %d, errno = %d", getpid (), fd, fd,
1864 func_str, size, errno_val);
1865 errno = errno_val;
1866 }
1867 else
1868 clib_warning ("LDP<%d>: fd %d (0x%x): returning %d (0x%x)",
1869 getpid (), fd, fd, size, size);
1870 }
1871 return size;
1872}
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07001873#endif
1874
Dave Wallace048b1d62018-01-03 22:24:41 -05001875ssize_t
Florin Corasce17f462020-05-22 20:36:29 +00001876recvmsg (int fd, struct msghdr * msg, int flags)
Dave Wallace048b1d62018-01-03 22:24:41 -05001877{
Florin Coras7baeb712019-01-04 17:05:43 -08001878 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05001879 ssize_t size;
Dave Wallace048b1d62018-01-03 22:24:41 -05001880
Florin Coras5f33d0d2021-06-02 21:22:21 -07001881 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001882
Florin Coras7baeb712019-01-04 17:05:43 -08001883 vlsh = ldp_fd_to_vlsh (fd);
1884 if (vlsh != VLS_INVALID_HANDLE)
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07001885 {
Florin Corasce17f462020-05-22 20:36:29 +00001886 struct iovec *iov = msg->msg_iov;
1887 ssize_t max_deq, total = 0;
Jieqiang Wang76d14b72023-07-24 16:52:06 +08001888 int i, rv = 0;
Florin Corasce17f462020-05-22 20:36:29 +00001889
1890 max_deq = vls_attr (vlsh, VPPCOM_ATTR_GET_NREAD, 0, 0);
1891 if (!max_deq)
1892 return 0;
1893
1894 for (i = 0; i < msg->msg_iovlen; i++)
1895 {
1896 rv = ldp_vls_recvfrom (vlsh, iov[i].iov_base, iov[i].iov_len, flags,
1897 (i == 0 ? msg->msg_name : NULL),
1898 (i == 0 ? &msg->msg_namelen : NULL));
1899 if (rv <= 0)
1900 break;
1901 else
1902 {
1903 total += rv;
1904 if (rv < iov[i].iov_len)
1905 break;
1906 }
1907 if (total >= max_deq)
1908 break;
1909 }
1910
1911 if (rv < 0 && total == 0)
1912 {
1913 errno = -rv;
1914 size = -1;
1915 }
1916 else
Florin Coraseff5f7a2023-02-07 17:36:17 -08001917 {
1918 if (msg->msg_controllen)
1919 ldp_make_cmsg (vlsh, msg);
1920 size = total;
1921 }
Dave Wallace048b1d62018-01-03 22:24:41 -05001922 }
1923 else
1924 {
Florin Corasce17f462020-05-22 20:36:29 +00001925 size = libc_recvmsg (fd, msg, flags);
Dave Wallace048b1d62018-01-03 22:24:41 -05001926 }
1927
Dave Wallace048b1d62018-01-03 22:24:41 -05001928 return size;
1929}
1930
Florin Coras36847942023-02-02 12:56:16 -08001931#ifdef _GNU_SOURCE
Dave Wallace048b1d62018-01-03 22:24:41 -05001932int
1933recvmmsg (int fd, struct mmsghdr *vmessages,
1934 unsigned int vlen, int flags, struct timespec *tmo)
1935{
Florin Corasf1a232f2023-02-02 22:56:03 -08001936 ldp_worker_ctx_t *ldpw = ldp_worker_get_current ();
1937 u32 sh;
Dave Wallace048b1d62018-01-03 22:24:41 -05001938
Florin Coras5f33d0d2021-06-02 21:22:21 -07001939 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001940
Florin Corasf1a232f2023-02-02 22:56:03 -08001941 sh = ldp_fd_to_vlsh (fd);
1942
wanghanlin97c6e0d2021-07-06 15:01:48 +08001943 if (sh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05001944 {
Florin Corasf1a232f2023-02-02 22:56:03 -08001945 struct mmsghdr *mh;
1946 ssize_t rv = 0;
1947 u32 nvecs = 0;
1948 f64 time_out;
1949
1950 if (PREDICT_FALSE (ldpw->clib_time.init_cpu_time == 0))
1951 clib_time_init (&ldpw->clib_time);
1952 if (tmo)
1953 {
1954 time_out = (f64) tmo->tv_sec + (f64) tmo->tv_nsec / (f64) 1e9;
1955 time_out += clib_time_now (&ldpw->clib_time);
1956 }
1957 else
1958 {
1959 time_out = (f64) ~0;
1960 }
1961
1962 while (nvecs < vlen)
1963 {
1964 mh = &vmessages[nvecs];
1965 rv = recvmsg (fd, &mh->msg_hdr, flags);
1966 if (rv > 0)
1967 {
1968 mh->msg_len = rv;
1969 nvecs += 1;
1970 continue;
1971 }
1972
1973 if (!time_out || clib_time_now (&ldpw->clib_time) >= time_out)
1974 break;
1975
1976 usleep (1);
1977 }
1978
1979 return nvecs > 0 ? nvecs : rv;
Dave Wallace048b1d62018-01-03 22:24:41 -05001980 }
1981 else
1982 {
Florin Corasf1a232f2023-02-02 22:56:03 -08001983 return libc_recvmmsg (fd, vmessages, vlen, flags, tmo);
Dave Wallace048b1d62018-01-03 22:24:41 -05001984 }
Dave Wallace048b1d62018-01-03 22:24:41 -05001985}
1986#endif
1987
1988int
1989getsockopt (int fd, int level, int optname,
1990 void *__restrict optval, socklen_t * __restrict optlen)
1991{
Florin Coras7baeb712019-01-04 17:05:43 -08001992 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05001993 int rv;
Dave Wallace048b1d62018-01-03 22:24:41 -05001994
Florin Coras5f33d0d2021-06-02 21:22:21 -07001995 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001996
Florin Coras7baeb712019-01-04 17:05:43 -08001997 vlsh = ldp_fd_to_vlsh (fd);
1998 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05001999 {
2000 rv = -EOPNOTSUPP;
2001
2002 switch (level)
2003 {
2004 case SOL_TCP:
2005 switch (optname)
2006 {
2007 case TCP_NODELAY:
Florin Coras7baeb712019-01-04 17:05:43 -08002008 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_TCP_NODELAY,
2009 optval, optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002010 break;
2011 case TCP_MAXSEG:
Florin Coras7baeb712019-01-04 17:05:43 -08002012 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_TCP_USER_MSS,
2013 optval, optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002014 break;
2015 case TCP_KEEPIDLE:
Florin Coras7baeb712019-01-04 17:05:43 -08002016 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_TCP_KEEPIDLE,
2017 optval, optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002018 break;
2019 case TCP_KEEPINTVL:
Florin Coras7baeb712019-01-04 17:05:43 -08002020 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_TCP_KEEPINTVL,
2021 optval, optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002022 break;
2023 case TCP_INFO:
2024 if (optval && optlen && (*optlen == sizeof (struct tcp_info)))
2025 {
Florin Coras7baeb712019-01-04 17:05:43 -08002026 LDBG (1, "fd %d: vlsh %u SOL_TCP, TCP_INFO, optval %p, "
2027 "optlen %d: #LDP-NOP#", fd, vlsh, optval, *optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002028 memset (optval, 0, *optlen);
2029 rv = VPPCOM_OK;
2030 }
2031 else
2032 rv = -EFAULT;
2033 break;
Florin Coras0ed24e92019-01-21 09:03:10 -08002034 case TCP_CONGESTION:
Florin Coras0ed24e92019-01-21 09:03:10 -08002035 *optlen = strlen ("cubic");
Dave Barach02500902020-04-04 18:34:41 -04002036 strncpy (optval, "cubic", *optlen + 1);
Florin Coras0ed24e92019-01-21 09:03:10 -08002037 rv = 0;
2038 break;
Dave Wallace048b1d62018-01-03 22:24:41 -05002039 default:
Florin Coras7baeb712019-01-04 17:05:43 -08002040 LDBG (0, "ERROR: fd %d: getsockopt SOL_TCP: sid %u, "
2041 "optname %d unsupported!", fd, vlsh, optname);
Dave Wallace048b1d62018-01-03 22:24:41 -05002042 break;
2043 }
2044 break;
qinyangaf9b7152023-06-27 01:11:53 -07002045 case SOL_IP:
2046 switch (optname)
2047 {
2048 case SO_ORIGINAL_DST:
2049 rv =
2050 vls_attr (vlsh, VPPCOM_ATTR_GET_ORIGINAL_DST, optval, optlen);
2051 break;
2052 default:
2053 LDBG (0,
2054 "ERROR: fd %d: getsockopt SOL_IP: vlsh %u "
2055 "optname %d unsupported!",
2056 fd, vlsh, optname);
2057 break;
2058 }
2059 break;
Dave Wallace048b1d62018-01-03 22:24:41 -05002060 case SOL_IPV6:
2061 switch (optname)
2062 {
2063 case IPV6_V6ONLY:
Florin Coras7baeb712019-01-04 17:05:43 -08002064 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_V6ONLY, optval, optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002065 break;
2066 default:
Florin Coras7baeb712019-01-04 17:05:43 -08002067 LDBG (0, "ERROR: fd %d: getsockopt SOL_IPV6: vlsh %u "
2068 "optname %d unsupported!", fd, vlsh, optname);
Dave Wallace048b1d62018-01-03 22:24:41 -05002069 break;
2070 }
2071 break;
2072 case SOL_SOCKET:
2073 switch (optname)
2074 {
2075 case SO_ACCEPTCONN:
Florin Coras7baeb712019-01-04 17:05:43 -08002076 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_LISTEN, optval, optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002077 break;
2078 case SO_KEEPALIVE:
Florin Coras7baeb712019-01-04 17:05:43 -08002079 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_KEEPALIVE, optval, optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002080 break;
2081 case SO_PROTOCOL:
Florin Coras7baeb712019-01-04 17:05:43 -08002082 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_PROTOCOL, optval, optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002083 *(int *) optval = *(int *) optval ? SOCK_DGRAM : SOCK_STREAM;
2084 break;
2085 case SO_SNDBUF:
Florin Coras7baeb712019-01-04 17:05:43 -08002086 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_TX_FIFO_LEN,
2087 optval, optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002088 break;
2089 case SO_RCVBUF:
Florin Coras7baeb712019-01-04 17:05:43 -08002090 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_RX_FIFO_LEN,
2091 optval, optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002092 break;
2093 case SO_REUSEADDR:
Florin Coras7baeb712019-01-04 17:05:43 -08002094 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_REUSEADDR, optval, optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002095 break;
wanghanlin0674f852021-02-22 10:38:36 +08002096 case SO_REUSEPORT:
2097 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_REUSEPORT, optval, optlen);
2098 break;
Dave Wallace048b1d62018-01-03 22:24:41 -05002099 case SO_BROADCAST:
Florin Coras7baeb712019-01-04 17:05:43 -08002100 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_BROADCAST, optval, optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002101 break;
wanghanlin0674f852021-02-22 10:38:36 +08002102 case SO_DOMAIN:
2103 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_DOMAIN, optval, optlen);
2104 break;
Dave Wallace048b1d62018-01-03 22:24:41 -05002105 case SO_ERROR:
Florin Coras7baeb712019-01-04 17:05:43 -08002106 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_ERROR, optval, optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002107 break;
Florin Coras8eb8d502021-06-16 14:46:57 -07002108 case SO_BINDTODEVICE:
2109 rv = 0;
2110 break;
Dave Wallace048b1d62018-01-03 22:24:41 -05002111 default:
Florin Coras7baeb712019-01-04 17:05:43 -08002112 LDBG (0, "ERROR: fd %d: getsockopt SOL_SOCKET: vlsh %u "
2113 "optname %d unsupported!", fd, vlsh, optname);
Dave Wallace048b1d62018-01-03 22:24:41 -05002114 break;
2115 }
2116 break;
2117 default:
2118 break;
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002119 }
2120
Dave Wallace048b1d62018-01-03 22:24:41 -05002121 if (rv != VPPCOM_OK)
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002122 {
Dave Wallace048b1d62018-01-03 22:24:41 -05002123 errno = -rv;
2124 rv = -1;
2125 }
2126 }
2127 else
2128 {
Dave Wallace048b1d62018-01-03 22:24:41 -05002129 rv = libc_getsockopt (fd, level, optname, optval, optlen);
2130 }
2131
Dave Wallace048b1d62018-01-03 22:24:41 -05002132 return rv;
2133}
2134
2135int
2136setsockopt (int fd, int level, int optname,
2137 const void *optval, socklen_t optlen)
2138{
Florin Coras7baeb712019-01-04 17:05:43 -08002139 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05002140 int rv;
Dave Wallace048b1d62018-01-03 22:24:41 -05002141
Florin Coras5f33d0d2021-06-02 21:22:21 -07002142 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05002143
Florin Coras7baeb712019-01-04 17:05:43 -08002144 vlsh = ldp_fd_to_vlsh (fd);
2145 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05002146 {
2147 rv = -EOPNOTSUPP;
2148
2149 switch (level)
2150 {
2151 case SOL_TCP:
2152 switch (optname)
2153 {
2154 case TCP_NODELAY:
Florin Coras7baeb712019-01-04 17:05:43 -08002155 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_TCP_NODELAY,
2156 (void *) optval, &optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002157 break;
2158 case TCP_MAXSEG:
Florin Coras7baeb712019-01-04 17:05:43 -08002159 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_TCP_USER_MSS,
2160 (void *) optval, &optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002161 break;
2162 case TCP_KEEPIDLE:
Florin Coras7baeb712019-01-04 17:05:43 -08002163 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_TCP_KEEPIDLE,
2164 (void *) optval, &optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002165 break;
2166 case TCP_KEEPINTVL:
Florin Coras7baeb712019-01-04 17:05:43 -08002167 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_TCP_KEEPINTVL,
2168 (void *) optval, &optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002169 break;
Florin Coras0ed24e92019-01-21 09:03:10 -08002170 case TCP_CONGESTION:
Florin Coras8509aa22019-04-04 12:55:30 -07002171 case TCP_CORK:
Florin Coras0ed24e92019-01-21 09:03:10 -08002172 /* Ignore */
2173 rv = 0;
2174 break;
Dave Wallace048b1d62018-01-03 22:24:41 -05002175 default:
Florin Coras7baeb712019-01-04 17:05:43 -08002176 LDBG (0, "ERROR: fd %d: setsockopt() SOL_TCP: vlsh %u"
2177 "optname %d unsupported!", fd, vlsh, optname);
Dave Wallace048b1d62018-01-03 22:24:41 -05002178 break;
2179 }
2180 break;
2181 case SOL_IPV6:
2182 switch (optname)
2183 {
2184 case IPV6_V6ONLY:
Florin Coras7baeb712019-01-04 17:05:43 -08002185 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_V6ONLY,
2186 (void *) optval, &optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002187 break;
2188 default:
Florin Coras7baeb712019-01-04 17:05:43 -08002189 LDBG (0, "ERROR: fd %d: setsockopt SOL_IPV6: vlsh %u"
2190 "optname %d unsupported!", fd, vlsh, optname);
Dave Wallace048b1d62018-01-03 22:24:41 -05002191 break;
2192 }
2193 break;
2194 case SOL_SOCKET:
2195 switch (optname)
2196 {
2197 case SO_KEEPALIVE:
Florin Coras7baeb712019-01-04 17:05:43 -08002198 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_KEEPALIVE,
2199 (void *) optval, &optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002200 break;
2201 case SO_REUSEADDR:
Florin Coras7baeb712019-01-04 17:05:43 -08002202 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_REUSEADDR,
2203 (void *) optval, &optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002204 break;
wanghanlin0674f852021-02-22 10:38:36 +08002205 case SO_REUSEPORT:
2206 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_REUSEPORT, (void *) optval,
2207 &optlen);
2208 break;
Dave Wallace048b1d62018-01-03 22:24:41 -05002209 case SO_BROADCAST:
Florin Coras7baeb712019-01-04 17:05:43 -08002210 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_BROADCAST,
2211 (void *) optval, &optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002212 break;
Florin Coras2f647902021-06-02 08:23:50 -07002213 case SO_LINGER:
2214 rv = 0;
2215 break;
Dave Wallace048b1d62018-01-03 22:24:41 -05002216 default:
Florin Coras7baeb712019-01-04 17:05:43 -08002217 LDBG (0, "ERROR: fd %d: setsockopt SOL_SOCKET: vlsh %u "
2218 "optname %d unsupported!", fd, vlsh, optname);
Dave Wallace048b1d62018-01-03 22:24:41 -05002219 break;
2220 }
2221 break;
Florin Coraseff5f7a2023-02-07 17:36:17 -08002222 case SOL_IP:
2223 switch (optname)
2224 {
2225 case IP_PKTINFO:
2226 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_IP_PKTINFO, (void *) optval,
2227 &optlen);
2228 break;
2229 default:
2230 LDBG (0,
2231 "ERROR: fd %d: setsockopt SOL_IP: vlsh %u optname %d"
2232 "unsupported!",
2233 fd, vlsh, optname);
2234 break;
2235 }
2236 break;
Dave Wallace048b1d62018-01-03 22:24:41 -05002237 default:
2238 break;
2239 }
2240
2241 if (rv != VPPCOM_OK)
2242 {
2243 errno = -rv;
2244 rv = -1;
2245 }
2246 }
2247 else
2248 {
Dave Wallace048b1d62018-01-03 22:24:41 -05002249 rv = libc_setsockopt (fd, level, optname, optval, optlen);
2250 }
2251
Dave Wallace048b1d62018-01-03 22:24:41 -05002252 return rv;
2253}
2254
2255int
2256listen (int fd, int n)
2257{
Florin Coras7baeb712019-01-04 17:05:43 -08002258 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05002259 int rv;
Dave Wallace048b1d62018-01-03 22:24:41 -05002260
Florin Coras5f33d0d2021-06-02 21:22:21 -07002261 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05002262
Florin Coras7baeb712019-01-04 17:05:43 -08002263 vlsh = ldp_fd_to_vlsh (fd);
2264 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05002265 {
Florin Coras7baeb712019-01-04 17:05:43 -08002266 LDBG (0, "fd %d: calling vls_listen: vlsh %u, n %d", fd, vlsh, n);
Dave Wallace048b1d62018-01-03 22:24:41 -05002267
Florin Coras7baeb712019-01-04 17:05:43 -08002268 rv = vls_listen (vlsh, n);
Dave Wallace048b1d62018-01-03 22:24:41 -05002269 if (rv != VPPCOM_OK)
2270 {
2271 errno = -rv;
2272 rv = -1;
2273 }
2274 }
2275 else
2276 {
Florin Coras7baeb712019-01-04 17:05:43 -08002277 LDBG (0, "fd %d: calling libc_listen(): n %d", fd, n);
Dave Wallace048b1d62018-01-03 22:24:41 -05002278 rv = libc_listen (fd, n);
2279 }
2280
Florin Coras7baeb712019-01-04 17:05:43 -08002281 LDBG (1, "fd %d: returning %d", fd, rv);
Dave Wallace048b1d62018-01-03 22:24:41 -05002282 return rv;
2283}
2284
2285static inline int
Florin Coras36847942023-02-02 12:56:16 -08002286ldp_accept4 (int listen_fd, __SOCKADDR_ARG _addr,
2287 socklen_t *__restrict addr_len, int flags)
Dave Wallace048b1d62018-01-03 22:24:41 -05002288{
Florin Coras36847942023-02-02 12:56:16 -08002289 struct sockaddr *addr = SOCKADDR_GET_SA (_addr);
Florin Coras7baeb712019-01-04 17:05:43 -08002290 vls_handle_t listen_vlsh, accept_vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05002291 int rv;
Dave Wallace048b1d62018-01-03 22:24:41 -05002292
Florin Coras5f33d0d2021-06-02 21:22:21 -07002293 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05002294
Florin Coras7baeb712019-01-04 17:05:43 -08002295 listen_vlsh = ldp_fd_to_vlsh (listen_fd);
2296 if (listen_vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05002297 {
2298 vppcom_endpt_t ep;
2299 u8 src_addr[sizeof (struct sockaddr_in6)];
Dave Wallace8aaba562018-01-18 17:21:19 -05002300 memset (&ep, 0, sizeof (ep));
Dave Wallace048b1d62018-01-03 22:24:41 -05002301 ep.ip = src_addr;
2302
Florin Coras7baeb712019-01-04 17:05:43 -08002303 LDBG (0, "listen fd %d: calling vppcom_session_accept: listen sid %u,"
Florin Coraseb801d02020-09-16 17:44:58 -07002304 " ep %p, flags 0x%x", listen_fd, listen_vlsh, &ep, flags);
Dave Wallace048b1d62018-01-03 22:24:41 -05002305
Florin Coras7baeb712019-01-04 17:05:43 -08002306 accept_vlsh = vls_accept (listen_vlsh, &ep, flags);
2307 if (accept_vlsh < 0)
Dave Wallace048b1d62018-01-03 22:24:41 -05002308 {
Florin Coras7baeb712019-01-04 17:05:43 -08002309 errno = -accept_vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05002310 rv = -1;
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002311 }
2312 else
2313 {
Dave Wallace2a865272018-02-07 21:00:42 -05002314 rv = ldp_copy_ep_to_sockaddr (addr, addr_len, &ep);
Dave Wallace048b1d62018-01-03 22:24:41 -05002315 if (rv != VPPCOM_OK)
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002316 {
Florin Coras7baeb712019-01-04 17:05:43 -08002317 (void) vls_close (accept_vlsh);
Dave Wallace048b1d62018-01-03 22:24:41 -05002318 errno = -rv;
2319 rv = -1;
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002320 }
Dave Wallace048b1d62018-01-03 22:24:41 -05002321 else
2322 {
Florin Coras7baeb712019-01-04 17:05:43 -08002323 rv = ldp_vlsh_to_fd (accept_vlsh);
Dave Wallace048b1d62018-01-03 22:24:41 -05002324 }
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002325 }
2326 }
Dave Wallace048b1d62018-01-03 22:24:41 -05002327 else
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002328 {
Florin Coras7baeb712019-01-04 17:05:43 -08002329 LDBG (0, "listen fd %d: calling libc_accept4(): addr %p, addr_len %p,"
2330 " flags 0x%x", listen_fd, addr, addr_len, flags);
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002331
Dave Wallace048b1d62018-01-03 22:24:41 -05002332 rv = libc_accept4 (listen_fd, addr, addr_len, flags);
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002333 }
2334
Florin Coras7baeb712019-01-04 17:05:43 -08002335 LDBG (1, "listen fd %d: accept returning %d", listen_fd, rv);
Florin Coras05ecfcc2018-12-12 18:19:39 -08002336
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002337 return rv;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002338}
2339
Dave Wallace048b1d62018-01-03 22:24:41 -05002340int
2341accept4 (int fd, __SOCKADDR_ARG addr, socklen_t * __restrict addr_len,
2342 int flags)
2343{
Dave Wallace2a865272018-02-07 21:00:42 -05002344 return ldp_accept4 (fd, addr, addr_len, flags);
Dave Wallace048b1d62018-01-03 22:24:41 -05002345}
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002346
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002347int
Dave Wallace048b1d62018-01-03 22:24:41 -05002348accept (int fd, __SOCKADDR_ARG addr, socklen_t * __restrict addr_len)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002349{
Dave Wallace2a865272018-02-07 21:00:42 -05002350 return ldp_accept4 (fd, addr, addr_len, 0);
Dave Wallace048b1d62018-01-03 22:24:41 -05002351}
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002352
Dave Wallace048b1d62018-01-03 22:24:41 -05002353int
2354shutdown (int fd, int how)
2355{
Florin Coras7baeb712019-01-04 17:05:43 -08002356 vls_handle_t vlsh;
liuyacan55c952e2021-06-13 14:54:55 +08002357 int rv = 0;
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002358
Florin Coras5f33d0d2021-06-02 21:22:21 -07002359 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05002360
Florin Coras7baeb712019-01-04 17:05:43 -08002361 vlsh = ldp_fd_to_vlsh (fd);
2362 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05002363 {
Florin Coras7baeb712019-01-04 17:05:43 -08002364 LDBG (0, "called shutdown: fd %u vlsh %u how %d", fd, vlsh, how);
liuyacan55c952e2021-06-13 14:54:55 +08002365 rv = vls_shutdown (vlsh, how);
Dave Wallace048b1d62018-01-03 22:24:41 -05002366 }
2367 else
2368 {
Florin Coras7baeb712019-01-04 17:05:43 -08002369 LDBG (0, "fd %d: calling libc_shutdown: how %d", fd, how);
Dave Wallace048b1d62018-01-03 22:24:41 -05002370 rv = libc_shutdown (fd, how);
2371 }
2372
Dave Wallace048b1d62018-01-03 22:24:41 -05002373 return rv;
2374}
2375
2376int
2377epoll_create1 (int flags)
2378{
Florin Corasdfe4cf42018-11-28 22:13:45 -08002379 ldp_worker_ctx_t *ldpw = ldp_worker_get_current ();
Florin Coras7baeb712019-01-04 17:05:43 -08002380 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05002381 int rv;
2382
Florin Coras5f33d0d2021-06-02 21:22:21 -07002383 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05002384
hanlina3a48962020-07-13 11:09:15 +08002385 if (ldp->vcl_needs_real_epoll || vls_use_real_epoll ())
Florin Coras99368312018-08-02 10:45:44 -07002386 {
Florin Coras2d9b4272019-03-11 10:14:37 -07002387 /* Make sure workers have been allocated */
2388 if (!ldp->workers)
2389 {
2390 ldp_alloc_workers ();
2391 ldpw = ldp_worker_get_current ();
2392 }
Florin Coras99368312018-08-02 10:45:44 -07002393 rv = libc_epoll_create1 (flags);
2394 ldp->vcl_needs_real_epoll = 0;
Florin Corasdfe4cf42018-11-28 22:13:45 -08002395 ldpw->vcl_mq_epfd = rv;
Florin Coras05ecfcc2018-12-12 18:19:39 -08002396 LDBG (0, "created vcl epfd %u", rv);
Florin Coras99368312018-08-02 10:45:44 -07002397 return rv;
2398 }
Dave Wallace048b1d62018-01-03 22:24:41 -05002399
Florin Coras7baeb712019-01-04 17:05:43 -08002400 vlsh = vls_epoll_create ();
2401 if (PREDICT_FALSE (vlsh == VLS_INVALID_HANDLE))
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002402 {
Florin Coras7baeb712019-01-04 17:05:43 -08002403 errno = -vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05002404 rv = -1;
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002405 }
Dave Wallace048b1d62018-01-03 22:24:41 -05002406 else
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002407 {
Florin Coras7baeb712019-01-04 17:05:43 -08002408 rv = ldp_vlsh_to_fd (vlsh);
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002409 }
Florin Coras7baeb712019-01-04 17:05:43 -08002410 LDBG (0, "epoll_create epfd %u vlsh %u", rv, vlsh);
Dave Wallace048b1d62018-01-03 22:24:41 -05002411 return rv;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002412}
2413
2414int
Dave Wallace048b1d62018-01-03 22:24:41 -05002415epoll_create (int size)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002416{
Dave Wallace048b1d62018-01-03 22:24:41 -05002417 return epoll_create1 (0);
2418}
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002419
Dave Wallace048b1d62018-01-03 22:24:41 -05002420int
2421epoll_ctl (int epfd, int op, int fd, struct epoll_event *event)
2422{
Florin Coras7baeb712019-01-04 17:05:43 -08002423 vls_handle_t vep_vlsh, vlsh;
Florin Coras99368312018-08-02 10:45:44 -07002424 int rv;
Dave Wallace048b1d62018-01-03 22:24:41 -05002425
Florin Coras5f33d0d2021-06-02 21:22:21 -07002426 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05002427
Florin Coras7baeb712019-01-04 17:05:43 -08002428 vep_vlsh = ldp_fd_to_vlsh (epfd);
2429 if (PREDICT_FALSE (vep_vlsh == VLS_INVALID_HANDLE))
Dave Wallace048b1d62018-01-03 22:24:41 -05002430 {
Dave Wallace3ee1fe12018-02-23 01:09:11 -05002431 /* The LDP epoll_create1 always creates VCL epfd's.
2432 * The app should never have a kernel base epoll fd unless it
2433 * was acquired outside of the LD_PRELOAD process context.
2434 * In any case, if we get one, punt it to libc_epoll_ctl.
2435 */
Florin Corasc86662a2023-03-05 11:45:38 -08002436 LDBG (1,
2437 "epfd %d: calling libc_epoll_ctl: op %d, fd %d"
2438 " events 0x%x",
2439 epfd, op, fd, event ? event->events : 0);
Dave Wallace048b1d62018-01-03 22:24:41 -05002440
2441 rv = libc_epoll_ctl (epfd, op, fd, event);
Florin Coras99368312018-08-02 10:45:44 -07002442 goto done;
2443 }
2444
Florin Coras7baeb712019-01-04 17:05:43 -08002445 vlsh = ldp_fd_to_vlsh (fd);
Florin Coras99368312018-08-02 10:45:44 -07002446
Florin Coras7baeb712019-01-04 17:05:43 -08002447 LDBG (0, "epfd %d ep_vlsh %d, fd %u vlsh %d, op %u", epfd, vep_vlsh, fd,
2448 vlsh, op);
Florin Coras99368312018-08-02 10:45:44 -07002449
Florin Coras7baeb712019-01-04 17:05:43 -08002450 if (vlsh != VLS_INVALID_HANDLE)
Florin Coras99368312018-08-02 10:45:44 -07002451 {
Florin Corasc86662a2023-03-05 11:45:38 -08002452 LDBG (1,
2453 "epfd %d: calling vls_epoll_ctl: ep_vlsh %d op %d, vlsh %u,"
2454 " events 0x%x",
2455 epfd, vep_vlsh, op, vlsh, event ? event->events : 0);
Florin Coras99368312018-08-02 10:45:44 -07002456
Florin Coras7baeb712019-01-04 17:05:43 -08002457 rv = vls_epoll_ctl (vep_vlsh, op, vlsh, event);
Florin Coras99368312018-08-02 10:45:44 -07002458 if (rv != VPPCOM_OK)
2459 {
2460 errno = -rv;
2461 rv = -1;
2462 }
2463 }
2464 else
2465 {
2466 int libc_epfd;
2467 u32 size = sizeof (epfd);
2468
Florin Coras7baeb712019-01-04 17:05:43 -08002469 libc_epfd = vls_attr (vep_vlsh, VPPCOM_ATTR_GET_LIBC_EPFD, 0, 0);
Florin Coras99368312018-08-02 10:45:44 -07002470 if (!libc_epfd)
2471 {
Florin Coras7baeb712019-01-04 17:05:43 -08002472 LDBG (1, "epfd %d, vep_vlsh %d calling libc_epoll_create1: "
2473 "EPOLL_CLOEXEC", epfd, vep_vlsh);
Florin Coras99368312018-08-02 10:45:44 -07002474
2475 libc_epfd = libc_epoll_create1 (EPOLL_CLOEXEC);
2476 if (libc_epfd < 0)
2477 {
2478 rv = libc_epfd;
2479 goto done;
2480 }
2481
Florin Coras7baeb712019-01-04 17:05:43 -08002482 rv = vls_attr (vep_vlsh, VPPCOM_ATTR_SET_LIBC_EPFD, &libc_epfd,
2483 &size);
Florin Coras99368312018-08-02 10:45:44 -07002484 if (rv < 0)
2485 {
2486 errno = -rv;
2487 rv = -1;
2488 goto done;
2489 }
2490 }
2491 else if (PREDICT_FALSE (libc_epfd < 0))
2492 {
2493 errno = -epfd;
2494 rv = -1;
2495 goto done;
2496 }
2497
Florin Coras7baeb712019-01-04 17:05:43 -08002498 LDBG (1, "epfd %d: calling libc_epoll_ctl: libc_epfd %d, op %d, fd %d,"
2499 " event %p", epfd, libc_epfd, op, fd, event);
Florin Coras99368312018-08-02 10:45:44 -07002500
2501 rv = libc_epoll_ctl (libc_epfd, op, fd, event);
Dave Wallace048b1d62018-01-03 22:24:41 -05002502 }
2503
2504done:
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002505 return rv;
2506}
Dave Wallace048b1d62018-01-03 22:24:41 -05002507
2508static inline int
Florin Coras99368312018-08-02 10:45:44 -07002509ldp_epoll_pwait (int epfd, struct epoll_event *events, int maxevents,
2510 int timeout, const sigset_t * sigmask)
Dave Wallace048b1d62018-01-03 22:24:41 -05002511{
Liangxing Wang7c7231f2023-02-16 09:31:01 +00002512 ldp_worker_ctx_t *ldpw;
Florin Coras72f77822019-01-22 19:05:52 -08002513 double time_to_wait = (double) 0, max_time;
Florin Coras99368312018-08-02 10:45:44 -07002514 int libc_epfd, rv = 0;
Florin Coras7baeb712019-01-04 17:05:43 -08002515 vls_handle_t ep_vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05002516
Florin Coras5f33d0d2021-06-02 21:22:21 -07002517 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05002518
2519 if (PREDICT_FALSE (!events || (timeout < -1)))
2520 {
2521 errno = EFAULT;
2522 return -1;
2523 }
2524
Liangxing Wang7c7231f2023-02-16 09:31:01 +00002525 if (PREDICT_FALSE (vppcom_worker_index () == ~0))
2526 vls_register_vcl_worker ();
2527
2528 ldpw = ldp_worker_get_current ();
Florin Corasdfe4cf42018-11-28 22:13:45 -08002529 if (epfd == ldpw->vcl_mq_epfd)
Florin Coras99368312018-08-02 10:45:44 -07002530 return libc_epoll_pwait (epfd, events, maxevents, timeout, sigmask);
2531
Florin Coras7baeb712019-01-04 17:05:43 -08002532 ep_vlsh = ldp_fd_to_vlsh (epfd);
2533 if (PREDICT_FALSE (ep_vlsh == VLS_INVALID_HANDLE))
Dave Wallace048b1d62018-01-03 22:24:41 -05002534 {
Florin Coras7baeb712019-01-04 17:05:43 -08002535 LDBG (0, "epfd %d: bad ep_vlsh %d!", epfd, ep_vlsh);
Dave Wallace048b1d62018-01-03 22:24:41 -05002536 errno = EBADFD;
2537 return -1;
2538 }
2539
Florin Coras4dee8cd2019-01-29 21:28:16 -08002540 if (PREDICT_FALSE (ldpw->clib_time.init_cpu_time == 0))
2541 clib_time_init (&ldpw->clib_time);
Florin Corasb0f662f2018-12-27 14:51:46 -08002542 time_to_wait = ((timeout >= 0) ? (double) timeout / 1000 : 0);
Florin Coras72f77822019-01-22 19:05:52 -08002543 max_time = clib_time_now (&ldpw->clib_time) + time_to_wait;
Dave Wallace048b1d62018-01-03 22:24:41 -05002544
Florin Coras7baeb712019-01-04 17:05:43 -08002545 libc_epfd = vls_attr (ep_vlsh, VPPCOM_ATTR_GET_LIBC_EPFD, 0, 0);
Dave Wallace048b1d62018-01-03 22:24:41 -05002546 if (PREDICT_FALSE (libc_epfd < 0))
2547 {
2548 errno = -libc_epfd;
2549 rv = -1;
2550 goto done;
2551 }
2552
Florin Coras7baeb712019-01-04 17:05:43 -08002553 LDBG (2, "epfd %d: vep_idx %d, libc_epfd %d, events %p, maxevents %d, "
2554 "timeout %d, sigmask %p: time_to_wait %.02f", epfd, ep_vlsh,
Florin Coras72f77822019-01-22 19:05:52 -08002555 libc_epfd, events, maxevents, timeout, sigmask, time_to_wait);
Dave Wallace048b1d62018-01-03 22:24:41 -05002556 do
2557 {
Florin Corasdfe4cf42018-11-28 22:13:45 -08002558 if (!ldpw->epoll_wait_vcl)
Dave Wallace048b1d62018-01-03 22:24:41 -05002559 {
Florin Coras7baeb712019-01-04 17:05:43 -08002560 rv = vls_epoll_wait (ep_vlsh, events, maxevents, 0);
Dave Wallace048b1d62018-01-03 22:24:41 -05002561 if (rv > 0)
2562 {
Florin Corasdfe4cf42018-11-28 22:13:45 -08002563 ldpw->epoll_wait_vcl = 1;
Dave Wallace048b1d62018-01-03 22:24:41 -05002564 goto done;
2565 }
2566 else if (rv < 0)
2567 {
2568 errno = -rv;
2569 rv = -1;
2570 goto done;
2571 }
2572 }
2573 else
Florin Corasdfe4cf42018-11-28 22:13:45 -08002574 ldpw->epoll_wait_vcl = 0;
Dave Wallace048b1d62018-01-03 22:24:41 -05002575
2576 if (libc_epfd > 0)
2577 {
Florin Corasb0f662f2018-12-27 14:51:46 -08002578 rv = libc_epoll_pwait (libc_epfd, events, maxevents, 0, sigmask);
Dave Wallace048b1d62018-01-03 22:24:41 -05002579 if (rv != 0)
2580 goto done;
2581 }
Dave Wallace048b1d62018-01-03 22:24:41 -05002582 }
Florin Coras72f77822019-01-22 19:05:52 -08002583 while ((timeout == -1) || (clib_time_now (&ldpw->clib_time) < max_time));
Dave Wallace048b1d62018-01-03 22:24:41 -05002584
2585done:
Dave Wallace048b1d62018-01-03 22:24:41 -05002586 return rv;
2587}
2588
hanlin4266d4d2020-05-19 17:34:17 +08002589static inline int
2590ldp_epoll_pwait_eventfd (int epfd, struct epoll_event *events,
2591 int maxevents, int timeout, const sigset_t * sigmask)
2592{
Florin Corasc86662a2023-03-05 11:45:38 -08002593 int libc_epfd, rv = 0, num_ev, libc_num_ev, vcl_wups = 0;
2594 struct epoll_event *libc_evts;
hanlina3a48962020-07-13 11:09:15 +08002595 ldp_worker_ctx_t *ldpw;
hanlin4266d4d2020-05-19 17:34:17 +08002596 vls_handle_t ep_vlsh;
2597
Florin Coras5f33d0d2021-06-02 21:22:21 -07002598 ldp_init_check ();
hanlin4266d4d2020-05-19 17:34:17 +08002599
2600 if (PREDICT_FALSE (!events || (timeout < -1)))
2601 {
2602 errno = EFAULT;
2603 return -1;
2604 }
2605
Florin Corasff40d8f2020-08-11 22:05:28 -07002606 /* Make sure the vcl worker is valid. Could be that epoll fd was created on
2607 * one thread but it is now used on another */
2608 if (PREDICT_FALSE (vppcom_worker_index () == ~0))
2609 vls_register_vcl_worker ();
hanlina3a48962020-07-13 11:09:15 +08002610
2611 ldpw = ldp_worker_get_current ();
hanlin4266d4d2020-05-19 17:34:17 +08002612 if (epfd == ldpw->vcl_mq_epfd)
2613 return libc_epoll_pwait (epfd, events, maxevents, timeout, sigmask);
2614
2615 ep_vlsh = ldp_fd_to_vlsh (epfd);
2616 if (PREDICT_FALSE (ep_vlsh == VLS_INVALID_HANDLE))
2617 {
2618 LDBG (0, "epfd %d: bad ep_vlsh %d!", epfd, ep_vlsh);
2619 errno = EBADFD;
2620 return -1;
2621 }
2622
2623 libc_epfd = vls_attr (ep_vlsh, VPPCOM_ATTR_GET_LIBC_EPFD, 0, 0);
2624 if (PREDICT_FALSE (!libc_epfd))
2625 {
2626 u32 size = sizeof (epfd);
2627
2628 LDBG (1, "epfd %d, vep_vlsh %d calling libc_epoll_create1: "
2629 "EPOLL_CLOEXEC", epfd, ep_vlsh);
2630 libc_epfd = libc_epoll_create1 (EPOLL_CLOEXEC);
2631 if (libc_epfd < 0)
2632 {
2633 rv = libc_epfd;
2634 goto done;
2635 }
2636
2637 rv = vls_attr (ep_vlsh, VPPCOM_ATTR_SET_LIBC_EPFD, &libc_epfd, &size);
2638 if (rv < 0)
2639 {
2640 errno = -rv;
2641 rv = -1;
2642 goto done;
2643 }
2644 }
2645 if (PREDICT_FALSE (libc_epfd <= 0))
2646 {
2647 errno = -libc_epfd;
2648 rv = -1;
2649 goto done;
2650 }
2651
2652 if (PREDICT_FALSE (!ldpw->mq_epfd_added))
2653 {
2654 struct epoll_event e = { 0 };
2655 e.events = EPOLLIN;
2656 e.data.fd = ldpw->vcl_mq_epfd;
2657 if (libc_epoll_ctl (libc_epfd, EPOLL_CTL_ADD, ldpw->vcl_mq_epfd, &e) <
2658 0)
2659 {
2660 LDBG (0, "epfd %d, add libc mq epoll fd %d to libc epoll fd %d",
2661 epfd, ldpw->vcl_mq_epfd, libc_epfd);
2662 rv = -1;
2663 goto done;
2664 }
2665 ldpw->mq_epfd_added = 1;
2666 }
2667
wanghanlin8919fec2021-03-18 20:00:41 +08002668 /* Request to only drain unhandled to prevent libc_epoll_wait starved */
2669 rv = vls_epoll_wait (ep_vlsh, events, maxevents, -2);
hanlin4266d4d2020-05-19 17:34:17 +08002670 if (rv > 0)
Florin Corasc86662a2023-03-05 11:45:38 -08002671 {
2672 timeout = 0;
2673 if (rv >= maxevents)
2674 goto done;
Florin Coras55c699e2023-08-15 12:11:50 -07002675 maxevents -= rv;
Florin Corasc86662a2023-03-05 11:45:38 -08002676 }
hanlina3a48962020-07-13 11:09:15 +08002677 else if (PREDICT_FALSE (rv < 0))
hanlin4266d4d2020-05-19 17:34:17 +08002678 {
2679 errno = -rv;
2680 rv = -1;
2681 goto done;
2682 }
2683
Florin Coras7a1e95a2023-03-01 00:45:31 -08002684epoll_again:
Florin Corasc86662a2023-03-05 11:45:38 -08002685
2686 libc_evts = &events[rv];
2687 libc_num_ev =
Florin Coras55c699e2023-08-15 12:11:50 -07002688 libc_epoll_pwait (libc_epfd, libc_evts, maxevents, timeout, sigmask);
Florin Corasc86662a2023-03-05 11:45:38 -08002689 if (libc_num_ev <= 0)
hanlin4266d4d2020-05-19 17:34:17 +08002690 {
Florin Corasc86662a2023-03-05 11:45:38 -08002691 rv = rv >= 0 ? rv : -1;
2692 goto done;
2693 }
2694
2695 for (int i = 0; i < libc_num_ev; i++)
2696 {
2697 if (libc_evts[i].data.fd == ldpw->vcl_mq_epfd)
hanlin4266d4d2020-05-19 17:34:17 +08002698 {
2699 /* We should remove mq epoll fd from events. */
Florin Corasc86662a2023-03-05 11:45:38 -08002700 libc_num_ev--;
2701 if (i != libc_num_ev)
hanlin4266d4d2020-05-19 17:34:17 +08002702 {
Florin Corasc86662a2023-03-05 11:45:38 -08002703 libc_evts[i].events = libc_evts[libc_num_ev].events;
2704 libc_evts[i].data.u64 = libc_evts[libc_num_ev].data.u64;
hanlin4266d4d2020-05-19 17:34:17 +08002705 }
Florin Corasc86662a2023-03-05 11:45:38 -08002706 num_ev = vls_epoll_wait (ep_vlsh, &libc_evts[libc_num_ev],
2707 maxevents - libc_num_ev, 0);
hanlin4266d4d2020-05-19 17:34:17 +08002708 if (PREDICT_TRUE (num_ev > 0))
2709 rv += num_ev;
Florin Coras7a1e95a2023-03-01 00:45:31 -08002710 /* Woken up by vcl but no events generated. Accept it once */
Florin Corasc86662a2023-03-05 11:45:38 -08002711 if (rv == 0 && libc_num_ev == 0 && timeout && vcl_wups++ < 1)
Florin Coras7a1e95a2023-03-01 00:45:31 -08002712 goto epoll_again;
hanlin4266d4d2020-05-19 17:34:17 +08002713 break;
2714 }
2715 }
2716
Florin Corasc86662a2023-03-05 11:45:38 -08002717 rv += libc_num_ev;
2718
hanlin4266d4d2020-05-19 17:34:17 +08002719done:
2720 return rv;
2721}
2722
Dave Wallace048b1d62018-01-03 22:24:41 -05002723int
2724epoll_pwait (int epfd, struct epoll_event *events,
2725 int maxevents, int timeout, const sigset_t * sigmask)
2726{
hanlin4266d4d2020-05-19 17:34:17 +08002727 if (vls_use_eventfd ())
2728 return ldp_epoll_pwait_eventfd (epfd, events, maxevents, timeout,
2729 sigmask);
2730 else
2731 return ldp_epoll_pwait (epfd, events, maxevents, timeout, sigmask);
Dave Wallace048b1d62018-01-03 22:24:41 -05002732}
2733
2734int
2735epoll_wait (int epfd, struct epoll_event *events, int maxevents, int timeout)
2736{
hanlin4266d4d2020-05-19 17:34:17 +08002737 if (vls_use_eventfd ())
2738 return ldp_epoll_pwait_eventfd (epfd, events, maxevents, timeout, NULL);
2739 else
2740 return ldp_epoll_pwait (epfd, events, maxevents, timeout, NULL);
Dave Wallace048b1d62018-01-03 22:24:41 -05002741}
2742
2743int
2744poll (struct pollfd *fds, nfds_t nfds, int timeout)
2745{
Florin Corasdfe4cf42018-11-28 22:13:45 -08002746 ldp_worker_ctx_t *ldpw = ldp_worker_get_current ();
Florin Coras6917b942018-11-13 22:44:54 -08002747 int rv, i, n_revents = 0;
Florin Coras7baeb712019-01-04 17:05:43 -08002748 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05002749 vcl_poll_t *vp;
Florin Coras4dee8cd2019-01-29 21:28:16 -08002750 double max_time;
Dave Wallace048b1d62018-01-03 22:24:41 -05002751
Florin Coraseb801d02020-09-16 17:44:58 -07002752 LDBG (3, "fds %p, nfds %ld, timeout %d", fds, nfds, timeout);
Dave Wallace048b1d62018-01-03 22:24:41 -05002753
Florin Coras4dee8cd2019-01-29 21:28:16 -08002754 if (PREDICT_FALSE (ldpw->clib_time.init_cpu_time == 0))
2755 clib_time_init (&ldpw->clib_time);
2756
2757 max_time = (timeout >= 0) ? (f64) timeout / 1000 : 0;
2758 max_time += clib_time_now (&ldpw->clib_time);
Dave Wallace048b1d62018-01-03 22:24:41 -05002759
Dave Wallace048b1d62018-01-03 22:24:41 -05002760 for (i = 0; i < nfds; i++)
2761 {
Florin Coras6917b942018-11-13 22:44:54 -08002762 if (fds[i].fd < 0)
2763 continue;
Dave Wallace048b1d62018-01-03 22:24:41 -05002764
Florin Coras7baeb712019-01-04 17:05:43 -08002765 vlsh = ldp_fd_to_vlsh (fds[i].fd);
2766 if (vlsh != VLS_INVALID_HANDLE)
Florin Coras6917b942018-11-13 22:44:54 -08002767 {
2768 fds[i].fd = -fds[i].fd;
Florin Corasdfe4cf42018-11-28 22:13:45 -08002769 vec_add2 (ldpw->vcl_poll, vp, 1);
Florin Coras6917b942018-11-13 22:44:54 -08002770 vp->fds_ndx = i;
Florin Coras7baeb712019-01-04 17:05:43 -08002771 vp->sh = vlsh_to_sh (vlsh);
Florin Coras6917b942018-11-13 22:44:54 -08002772 vp->events = fds[i].events;
Dave Wallace048b1d62018-01-03 22:24:41 -05002773#ifdef __USE_XOPEN2K
Florin Coras6917b942018-11-13 22:44:54 -08002774 if (fds[i].events & POLLRDNORM)
2775 vp->events |= POLLIN;
2776 if (fds[i].events & POLLWRNORM)
2777 vp->events |= POLLOUT;
Dave Wallace048b1d62018-01-03 22:24:41 -05002778#endif
Florin Coras6917b942018-11-13 22:44:54 -08002779 vp->revents = fds[i].revents;
2780 }
2781 else
2782 {
Florin Corasdfe4cf42018-11-28 22:13:45 -08002783 vec_add1 (ldpw->libc_poll, fds[i]);
2784 vec_add1 (ldpw->libc_poll_idxs, i);
Dave Wallace048b1d62018-01-03 22:24:41 -05002785 }
2786 }
2787
Dave Wallace048b1d62018-01-03 22:24:41 -05002788 do
2789 {
Florin Corasdfe4cf42018-11-28 22:13:45 -08002790 if (vec_len (ldpw->vcl_poll))
Dave Wallace048b1d62018-01-03 22:24:41 -05002791 {
Florin Corasdfe4cf42018-11-28 22:13:45 -08002792 rv = vppcom_poll (ldpw->vcl_poll, vec_len (ldpw->vcl_poll), 0);
Dave Wallace048b1d62018-01-03 22:24:41 -05002793 if (rv < 0)
2794 {
2795 errno = -rv;
2796 rv = -1;
2797 goto done;
2798 }
2799 else
2800 n_revents += rv;
2801 }
2802
Florin Corasdfe4cf42018-11-28 22:13:45 -08002803 if (vec_len (ldpw->libc_poll))
Dave Wallace048b1d62018-01-03 22:24:41 -05002804 {
Florin Corasdfe4cf42018-11-28 22:13:45 -08002805 rv = libc_poll (ldpw->libc_poll, vec_len (ldpw->libc_poll), 0);
Dave Wallace048b1d62018-01-03 22:24:41 -05002806 if (rv < 0)
2807 goto done;
2808 else
2809 n_revents += rv;
2810 }
2811
2812 if (n_revents)
2813 {
2814 rv = n_revents;
2815 goto done;
2816 }
2817 }
Florin Coras4dee8cd2019-01-29 21:28:16 -08002818 while ((timeout < 0) || (clib_time_now (&ldpw->clib_time) < max_time));
Dave Wallace048b1d62018-01-03 22:24:41 -05002819 rv = 0;
2820
2821done:
Florin Corasdfe4cf42018-11-28 22:13:45 -08002822 vec_foreach (vp, ldpw->vcl_poll)
Dave Wallace048b1d62018-01-03 22:24:41 -05002823 {
2824 fds[vp->fds_ndx].fd = -fds[vp->fds_ndx].fd;
Florin Coras6917b942018-11-13 22:44:54 -08002825 fds[vp->fds_ndx].revents = vp->revents;
Dave Wallace048b1d62018-01-03 22:24:41 -05002826#ifdef __USE_XOPEN2K
2827 if ((fds[vp->fds_ndx].revents & POLLIN) &&
2828 (fds[vp->fds_ndx].events & POLLRDNORM))
2829 fds[vp->fds_ndx].revents |= POLLRDNORM;
2830 if ((fds[vp->fds_ndx].revents & POLLOUT) &&
2831 (fds[vp->fds_ndx].events & POLLWRNORM))
2832 fds[vp->fds_ndx].revents |= POLLWRNORM;
2833#endif
2834 }
Florin Corasdfe4cf42018-11-28 22:13:45 -08002835 vec_reset_length (ldpw->vcl_poll);
Dave Wallace048b1d62018-01-03 22:24:41 -05002836
Florin Corasdfe4cf42018-11-28 22:13:45 -08002837 for (i = 0; i < vec_len (ldpw->libc_poll); i++)
Florin Coras6917b942018-11-13 22:44:54 -08002838 {
Florin Corasdfe4cf42018-11-28 22:13:45 -08002839 fds[ldpw->libc_poll_idxs[i]].revents = ldpw->libc_poll[i].revents;
Florin Coras6917b942018-11-13 22:44:54 -08002840 }
Florin Corasdfe4cf42018-11-28 22:13:45 -08002841 vec_reset_length (ldpw->libc_poll_idxs);
2842 vec_reset_length (ldpw->libc_poll);
Florin Coras6917b942018-11-13 22:44:54 -08002843
Dave Wallace048b1d62018-01-03 22:24:41 -05002844 return rv;
2845}
2846
Florin Coras36847942023-02-02 12:56:16 -08002847#ifdef _GNU_SOURCE
Dave Wallace048b1d62018-01-03 22:24:41 -05002848int
2849ppoll (struct pollfd *fds, nfds_t nfds,
2850 const struct timespec *timeout, const sigset_t * sigmask)
2851{
Florin Coras5f33d0d2021-06-02 21:22:21 -07002852 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05002853
2854 clib_warning ("LDP<%d>: LDP-TBD", getpid ());
2855 errno = ENOSYS;
2856
2857
2858 return -1;
2859}
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002860#endif
2861
Dave Wallace2a865272018-02-07 21:00:42 -05002862void CONSTRUCTOR_ATTRIBUTE ldp_constructor (void);
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002863
Dave Wallace2a865272018-02-07 21:00:42 -05002864void DESTRUCTOR_ATTRIBUTE ldp_destructor (void);
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002865
Dave Wallace048b1d62018-01-03 22:24:41 -05002866/*
2867 * This function is called when the library is loaded
2868 */
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002869void
Dave Wallace2a865272018-02-07 21:00:42 -05002870ldp_constructor (void)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002871{
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002872 swrap_constructor ();
Dave Wallace2a865272018-02-07 21:00:42 -05002873 if (ldp_init () != 0)
Florin Corasd89411e2019-03-19 19:44:51 -07002874 {
2875 fprintf (stderr, "\nLDP<%d>: ERROR: ldp_constructor: failed!\n",
2876 getpid ());
2877 _exit (1);
2878 }
Dave Wallace69d01192018-02-22 16:22:09 -05002879 else if (LDP_DEBUG > 0)
Dave Wallace2a865272018-02-07 21:00:42 -05002880 clib_warning ("LDP<%d>: LDP constructor: done!\n", getpid ());
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002881}
2882
2883/*
2884 * This function is called when the library is unloaded
2885 */
2886void
Dave Wallace2a865272018-02-07 21:00:42 -05002887ldp_destructor (void)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002888{
Florin Coras0ef8ef22019-01-18 08:37:13 -08002889 /*
2890 swrap_destructor ();
2891 if (ldp->init)
2892 ldp->init = 0;
2893 */
Dave Wallace048b1d62018-01-03 22:24:41 -05002894
2895 /* Don't use clib_warning() here because that calls writev()
Dave Wallace2a865272018-02-07 21:00:42 -05002896 * which will call ldp_init().
Dave Wallace048b1d62018-01-03 22:24:41 -05002897 */
Dave Wallace69d01192018-02-22 16:22:09 -05002898 if (LDP_DEBUG > 0)
Florin Coras0ef8ef22019-01-18 08:37:13 -08002899 fprintf (stderr, "%s:%d: LDP<%d>: LDP destructor: done!\n",
2900 __func__, __LINE__, getpid ());
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002901}
2902
2903
2904/*
2905 * fd.io coding-style-patch-verification: ON
2906 *
2907 * Local Variables:
2908 * eval: (c-set-style "gnu")
2909 * End:
2910 */