blob: 9e8858fb230d9e7daa005c7a40c466dc13258d4c [file] [log] [blame]
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001/*
Florin Coras5e062572019-03-14 19:07:51 -07002 * Copyright (c) 2016-2019 Cisco and/or its affiliates.
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07003 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at:
6 *
7 * http://www.apache.org/licenses/LICENSE-2.0
8 *
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
14 */
Florin Coras36847942023-02-02 12:56:16 -080015
16#ifdef HAVE_GNU_SOURCE
17#define _GNU_SOURCE
18#endif
19
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -070020#include <unistd.h>
21#include <stdio.h>
22#include <signal.h>
23#include <dlfcn.h>
24#include <pthread.h>
25#include <time.h>
26#include <stdarg.h>
shrinivasan ganapathy1d359632017-10-15 15:46:09 -070027#include <sys/resource.h>
Dave Wallace048b1d62018-01-03 22:24:41 -050028#include <netinet/tcp.h>
Florin Coraseff5f7a2023-02-07 17:36:17 -080029#include <netinet/udp.h>
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -070030
Dave Wallace2a865272018-02-07 21:00:42 -050031#include <vcl/ldp_socket_wrapper.h>
32#include <vcl/ldp.h>
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -070033#include <sys/time.h>
34
Florin Coras7baeb712019-01-04 17:05:43 -080035#include <vcl/vcl_locked.h>
Dave Wallace048b1d62018-01-03 22:24:41 -050036#include <vppinfra/time.h>
37#include <vppinfra/bitmap.h>
Florin Coras30e273b2018-11-27 00:04:59 -080038#include <vppinfra/lock.h>
39#include <vppinfra/pool.h>
40#include <vppinfra/hash.h>
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -070041
/*
 * Constructor/destructor attribute wrappers. Both feature switches are
 * defined unconditionally right here, so the attribute variants are always
 * the ones selected; the empty fallbacks are kept for toolchains where the
 * switches get removed.
 */
#define HAVE_CONSTRUCTOR_ATTRIBUTE
#ifdef HAVE_CONSTRUCTOR_ATTRIBUTE
#define CONSTRUCTOR_ATTRIBUTE __attribute__ ((constructor))
#else
#define CONSTRUCTOR_ATTRIBUTE
#endif /* HAVE_CONSTRUCTOR_ATTRIBUTE */

#define HAVE_DESTRUCTOR_ATTRIBUTE
#ifdef HAVE_DESTRUCTOR_ATTRIBUTE
#define DESTRUCTOR_ATTRIBUTE __attribute__ ((destructor))
#else
#define DESTRUCTOR_ATTRIBUTE
#endif /* HAVE_DESTRUCTOR_ATTRIBUTE */

/* Number of per-worker contexts reserved by ldp_alloc_workers () */
#define LDP_MAX_NWORKERS 32
59
/*
 * Extract the plain sockaddr from a socket-address argument. With
 * HAVE_GNU_SOURCE the argument is treated as an object exposing a
 * __sockaddr__ member; otherwise the argument itself is used.
 *
 * The non-GNU variant used to expand to the literal identifier `_addr`
 * instead of its parameter, so it only compiled when the caller's variable
 * happened to be called `_addr`. It now expands to the parameter.
 *
 * NOTE: the trailing ';' is part of the expansion and is kept on purpose so
 * existing call sites keep compiling unchanged.
 */
#ifdef HAVE_GNU_SOURCE
#define SOCKADDR_GET_SA(__addr) (__addr).__sockaddr__;
#else
#define SOCKADDR_GET_SA(__addr) (__addr);
#endif
65
Florin Corasdfe4cf42018-11-28 22:13:45 -080066typedef struct ldp_worker_ctx_
Dave Wallace048b1d62018-01-03 22:24:41 -050067{
Dave Wallace048b1d62018-01-03 22:24:41 -050068 u8 *io_buffer;
69 clib_time_t clib_time;
Florin Corasdfe4cf42018-11-28 22:13:45 -080070
71 /*
72 * Select state
73 */
Dave Wallace048b1d62018-01-03 22:24:41 -050074 clib_bitmap_t *rd_bitmap;
75 clib_bitmap_t *wr_bitmap;
76 clib_bitmap_t *ex_bitmap;
Florin Coras294afe22019-01-07 17:49:17 -080077 clib_bitmap_t *si_rd_bitmap;
78 clib_bitmap_t *si_wr_bitmap;
79 clib_bitmap_t *si_ex_bitmap;
Dave Wallace048b1d62018-01-03 22:24:41 -050080 clib_bitmap_t *libc_rd_bitmap;
81 clib_bitmap_t *libc_wr_bitmap;
82 clib_bitmap_t *libc_ex_bitmap;
Florin Corasdfe4cf42018-11-28 22:13:45 -080083
84 /*
85 * Poll state
86 */
Dave Wallace048b1d62018-01-03 22:24:41 -050087 vcl_poll_t *vcl_poll;
Florin Coras6917b942018-11-13 22:44:54 -080088 struct pollfd *libc_poll;
89 u16 *libc_poll_idxs;
Florin Corasdfe4cf42018-11-28 22:13:45 -080090
91 /*
92 * Epoll state
93 */
Dave Wallace048b1d62018-01-03 22:24:41 -050094 u8 epoll_wait_vcl;
hanlin4266d4d2020-05-19 17:34:17 +080095 u8 mq_epfd_added;
Florin Coras99368312018-08-02 10:45:44 -070096 int vcl_mq_epfd;
Florin Corasdfe4cf42018-11-28 22:13:45 -080097
98} ldp_worker_ctx_t;
99
Florin Coras294afe22019-01-07 17:49:17 -0800100/* clib_bitmap_t, fd_mask and vcl_si_set are used interchangeably. Make sure
101 * they are the same size */
102STATIC_ASSERT (sizeof (clib_bitmap_t) == sizeof (fd_mask),
103 "ldp bitmap size mismatch");
104STATIC_ASSERT (sizeof (vcl_si_set) == sizeof (fd_mask),
105 "ldp bitmap size mismatch");
106
Florin Corasdfe4cf42018-11-28 22:13:45 -0800107typedef struct
108{
109 ldp_worker_ctx_t *workers;
110 int init;
111 char app_name[LDP_APP_NAME_MAX];
Florin Coras7baeb712019-01-04 17:05:43 -0800112 u32 vlsh_bit_val;
113 u32 vlsh_bit_mask;
Florin Corasdfe4cf42018-11-28 22:13:45 -0800114 u32 debug;
Florin Corasdfe4cf42018-11-28 22:13:45 -0800115
116 /** vcl needs next epoll_create to go to libc_epoll */
117 u8 vcl_needs_real_epoll;
Florin Corasa5a9efd2021-01-05 17:03:29 -0800118
119 /**
120 * crypto state used only for testing
121 */
122 u8 transparent_tls;
123 u32 ckpair_index;
Dave Wallace2a865272018-02-07 21:00:42 -0500124} ldp_main_t;
Florin Corasdfe4cf42018-11-28 22:13:45 -0800125
/** Current LDP debug level */
#define LDP_DEBUG ldp->debug

/**
 * Print a debug message to stderr, prefixed with "ldp<pid>: ", when the
 * configured debug level is strictly greater than _lvl. errno is saved
 * and restored around the fprintf so logging never disturbs the errno the
 * interposed call is about to report.
 *
 * Wrapped in do { } while (0) so the macro expands to a single statement:
 * the previous bare `if { }` form broke (or silently re-bound the `else`)
 * when used as the unbraced body of an `if ... else`.
 */
#define LDBG(_lvl, _fmt, _args...)                                            \
  do                                                                          \
    {                                                                         \
      if (ldp->debug > (_lvl))                                                \
        {                                                                     \
          int errno_saved = errno;                                            \
          fprintf (stderr, "ldp<%d>: " _fmt "\n", getpid (), ##_args);        \
          errno = errno_saved;                                                \
        }                                                                     \
    }                                                                         \
  while (0)
Florin Coras99368312018-08-02 10:45:44 -0700135
Dave Wallace2a865272018-02-07 21:00:42 -0500136static ldp_main_t ldp_main = {
Florin Coras7baeb712019-01-04 17:05:43 -0800137 .vlsh_bit_val = (1 << LDP_SID_BIT_MIN),
138 .vlsh_bit_mask = (1 << LDP_SID_BIT_MIN) - 1,
Dave Wallace2a865272018-02-07 21:00:42 -0500139 .debug = LDP_DEBUG_INIT,
Yu Ping7b74b072019-05-08 00:40:24 +0800140 .transparent_tls = 0,
Florin Corasa5a9efd2021-01-05 17:03:29 -0800141 .ckpair_index = ~0,
Dave Wallace048b1d62018-01-03 22:24:41 -0500142};
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700143
Dave Wallace2a865272018-02-07 21:00:42 -0500144static ldp_main_t *ldp = &ldp_main;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700145
Florin Corasdfe4cf42018-11-28 22:13:45 -0800146static inline ldp_worker_ctx_t *
147ldp_worker_get_current (void)
148{
149 return (ldp->workers + vppcom_worker_index ());
150}
151
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700152/*
153 * RETURN: 0 on success or -1 on error.
154 * */
Dave Wallace048b1d62018-01-03 22:24:41 -0500155static inline void
Dave Wallace2a865272018-02-07 21:00:42 -0500156ldp_set_app_name (char *app_name)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700157{
Benoît Ganne747b3d82019-08-21 18:27:23 +0200158 snprintf (ldp->app_name, LDP_APP_NAME_MAX,
159 "ldp-%d-%s", getpid (), app_name);
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700160}
161
Dave Wallace048b1d62018-01-03 22:24:41 -0500162static inline char *
Dave Wallace2a865272018-02-07 21:00:42 -0500163ldp_get_app_name ()
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700164{
Dave Wallace2a865272018-02-07 21:00:42 -0500165 if (ldp->app_name[0] == '\0')
166 ldp_set_app_name ("app");
Dave Wallace048b1d62018-01-03 22:24:41 -0500167
Dave Wallace2a865272018-02-07 21:00:42 -0500168 return ldp->app_name;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700169}
170
Dave Wallace048b1d62018-01-03 22:24:41 -0500171static inline int
Florin Coras7baeb712019-01-04 17:05:43 -0800172ldp_vlsh_to_fd (vls_handle_t vlsh)
Dave Wallace048b1d62018-01-03 22:24:41 -0500173{
Florin Coras7baeb712019-01-04 17:05:43 -0800174 return (vlsh + ldp->vlsh_bit_val);
Dave Wallace048b1d62018-01-03 22:24:41 -0500175}
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700176
Florin Coras7baeb712019-01-04 17:05:43 -0800177static inline vls_handle_t
178ldp_fd_to_vlsh (int fd)
Dave Wallace048b1d62018-01-03 22:24:41 -0500179{
Florin Coras7baeb712019-01-04 17:05:43 -0800180 if (fd < ldp->vlsh_bit_val)
181 return VLS_INVALID_HANDLE;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700182
Florin Coras7baeb712019-01-04 17:05:43 -0800183 return (fd - ldp->vlsh_bit_val);
Dave Wallace048b1d62018-01-03 22:24:41 -0500184}
185
Florin Coras2d9b4272019-03-11 10:14:37 -0700186static void
187ldp_alloc_workers (void)
188{
189 if (ldp->workers)
190 return;
191 pool_alloc (ldp->workers, LDP_MAX_NWORKERS);
192}
193
Florin Coras5f33d0d2021-06-02 21:22:21 -0700194static int
Dave Wallace2a865272018-02-07 21:00:42 -0500195ldp_init (void)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700196{
Florin Corasdfe4cf42018-11-28 22:13:45 -0800197 ldp_worker_ctx_t *ldpw;
Florin Coras99368312018-08-02 10:45:44 -0700198 int rv;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700199
Florin Coras5f33d0d2021-06-02 21:22:21 -0700200 ASSERT (!ldp->init);
Florin Coras99368312018-08-02 10:45:44 -0700201
202 ldp->init = 1;
203 ldp->vcl_needs_real_epoll = 1;
Florin Coras7baeb712019-01-04 17:05:43 -0800204 rv = vls_app_create (ldp_get_app_name ());
Florin Coras99368312018-08-02 10:45:44 -0700205 if (rv != VPPCOM_OK)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700206 {
Florin Coras955bfbb2018-12-04 13:43:45 -0800207 ldp->vcl_needs_real_epoll = 0;
208 if (rv == VPPCOM_EEXIST)
209 return 0;
Florin Coras05ecfcc2018-12-12 18:19:39 -0800210 LDBG (2, "\nERROR: ldp_init: vppcom_app_create()"
211 " failed! rv = %d (%s)\n", rv, vppcom_retval_str (rv));
Florin Coras99368312018-08-02 10:45:44 -0700212 ldp->init = 0;
213 return rv;
214 }
215 ldp->vcl_needs_real_epoll = 0;
Florin Coras2d9b4272019-03-11 10:14:37 -0700216 ldp_alloc_workers ();
Florin Corasdfe4cf42018-11-28 22:13:45 -0800217 ldpw = ldp_worker_get_current ();
Florin Coras99368312018-08-02 10:45:44 -0700218
219 char *env_var_str = getenv (LDP_ENV_DEBUG);
220 if (env_var_str)
221 {
222 u32 tmp;
223 if (sscanf (env_var_str, "%u", &tmp) != 1)
224 clib_warning ("LDP<%d>: WARNING: Invalid LDP debug level specified in"
225 " the env var " LDP_ENV_DEBUG " (%s)!", getpid (),
226 env_var_str);
227 else
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700228 {
Florin Coras99368312018-08-02 10:45:44 -0700229 ldp->debug = tmp;
Florin Coras05ecfcc2018-12-12 18:19:39 -0800230 LDBG (0, "configured LDP debug level (%u) from env var "
231 LDP_ENV_DEBUG "!", ldp->debug);
Florin Coras99368312018-08-02 10:45:44 -0700232 }
233 }
Dave Wallace048b1d62018-01-03 22:24:41 -0500234
Florin Coras99368312018-08-02 10:45:44 -0700235 env_var_str = getenv (LDP_ENV_APP_NAME);
236 if (env_var_str)
237 {
238 ldp_set_app_name (env_var_str);
Florin Coras05ecfcc2018-12-12 18:19:39 -0800239 LDBG (0, "configured LDP app name (%s) from the env var "
240 LDP_ENV_APP_NAME "!", ldp->app_name);
Florin Coras99368312018-08-02 10:45:44 -0700241 }
Dave Wallace048b1d62018-01-03 22:24:41 -0500242
Florin Coras99368312018-08-02 10:45:44 -0700243 env_var_str = getenv (LDP_ENV_SID_BIT);
244 if (env_var_str)
245 {
246 u32 sb;
247 if (sscanf (env_var_str, "%u", &sb) != 1)
248 {
Florin Coras294afe22019-01-07 17:49:17 -0800249 LDBG (0, "WARNING: Invalid LDP sid bit specified in the env var "
250 LDP_ENV_SID_BIT " (%s)! sid bit value %d (0x%x)", env_var_str,
251 ldp->vlsh_bit_val, ldp->vlsh_bit_val);
Florin Coras99368312018-08-02 10:45:44 -0700252 }
253 else if (sb < LDP_SID_BIT_MIN)
254 {
Florin Coras7baeb712019-01-04 17:05:43 -0800255 ldp->vlsh_bit_val = (1 << LDP_SID_BIT_MIN);
256 ldp->vlsh_bit_mask = ldp->vlsh_bit_val - 1;
Dave Wallace048b1d62018-01-03 22:24:41 -0500257
Florin Coras294afe22019-01-07 17:49:17 -0800258 LDBG (0, "WARNING: LDP sid bit (%u) specified in the env var "
259 LDP_ENV_SID_BIT " (%s) is too small. Using LDP_SID_BIT_MIN"
260 " (%d)! sid bit value %d (0x%x)", sb, env_var_str,
261 LDP_SID_BIT_MIN, ldp->vlsh_bit_val, ldp->vlsh_bit_val);
Florin Coras99368312018-08-02 10:45:44 -0700262 }
263 else if (sb > LDP_SID_BIT_MAX)
264 {
Florin Coras7baeb712019-01-04 17:05:43 -0800265 ldp->vlsh_bit_val = (1 << LDP_SID_BIT_MAX);
266 ldp->vlsh_bit_mask = ldp->vlsh_bit_val - 1;
Dave Wallace048b1d62018-01-03 22:24:41 -0500267
Florin Coras294afe22019-01-07 17:49:17 -0800268 LDBG (0, "WARNING: LDP sid bit (%u) specified in the env var "
269 LDP_ENV_SID_BIT " (%s) is too big. Using LDP_SID_BIT_MAX"
270 " (%d)! sid bit value %d (0x%x)", sb, env_var_str,
271 LDP_SID_BIT_MAX, ldp->vlsh_bit_val, ldp->vlsh_bit_val);
Dave Wallace048b1d62018-01-03 22:24:41 -0500272 }
273 else
274 {
Florin Coras7baeb712019-01-04 17:05:43 -0800275 ldp->vlsh_bit_val = (1 << sb);
276 ldp->vlsh_bit_mask = ldp->vlsh_bit_val - 1;
Florin Coras99368312018-08-02 10:45:44 -0700277
Florin Coras05ecfcc2018-12-12 18:19:39 -0800278 LDBG (0, "configured LDP sid bit (%u) from "
279 LDP_ENV_SID_BIT "! sid bit value %d (0x%x)", sb,
Florin Coras7baeb712019-01-04 17:05:43 -0800280 ldp->vlsh_bit_val, ldp->vlsh_bit_val);
Dave Wallace048b1d62018-01-03 22:24:41 -0500281 }
Florin Coras294afe22019-01-07 17:49:17 -0800282
283 /* Make sure there are enough bits in the fd set for vcl sessions */
284 if (ldp->vlsh_bit_val > FD_SETSIZE / 2)
285 {
wanghanlin1eb8fea2021-10-14 11:10:26 +0800286 /* Only valid for select/pselect, so just WARNING and not exit */
287 LDBG (0,
288 "WARNING: LDP vlsh bit value %d > FD_SETSIZE/2 %d, "
289 "select/pselect not supported now!",
Florin Coras294afe22019-01-07 17:49:17 -0800290 ldp->vlsh_bit_val, FD_SETSIZE / 2);
Florin Coras294afe22019-01-07 17:49:17 -0800291 }
Dave Wallace048b1d62018-01-03 22:24:41 -0500292 }
Yu Ping7b74b072019-05-08 00:40:24 +0800293 env_var_str = getenv (LDP_ENV_TLS_TRANS);
294 if (env_var_str)
295 {
296 ldp->transparent_tls = 1;
297 }
Florin Coras99368312018-08-02 10:45:44 -0700298
Florin Coras4dee8cd2019-01-29 21:28:16 -0800299 /* *INDENT-OFF* */
Damjan Marionb2c31b62020-12-13 21:47:40 +0100300 pool_foreach (ldpw, ldp->workers) {
Florin Coras4dee8cd2019-01-29 21:28:16 -0800301 clib_memset (&ldpw->clib_time, 0, sizeof (ldpw->clib_time));
Damjan Marionb2c31b62020-12-13 21:47:40 +0100302 }
Florin Coras4dee8cd2019-01-29 21:28:16 -0800303 /* *INDENT-ON* */
304
Florin Coras05ecfcc2018-12-12 18:19:39 -0800305 LDBG (0, "LDP initialization: done!");
Florin Coras99368312018-08-02 10:45:44 -0700306
307 return 0;
Dave Wallace048b1d62018-01-03 22:24:41 -0500308}
309
/**
 * Lazily initialize LDP from an interposed call. If ldp_init () fails,
 * errno is set to the negated return value and the ENCLOSING function
 * returns -1, so this may only be used in functions returning an integer
 * type.
 *
 * Wrapped in do { } while (0) so the macro is a single statement and stays
 * safe as the unbraced body of an `if ... else`.
 */
#define ldp_init_check()                                                      \
  do                                                                          \
    {                                                                         \
      if (PREDICT_FALSE (!ldp->init))                                         \
        {                                                                     \
          if ((errno = -ldp_init ()))                                         \
            return -1;                                                        \
        }                                                                     \
    }                                                                         \
  while (0)
316
Dave Wallace048b1d62018-01-03 22:24:41 -0500317int
318close (int fd)
319{
Florin Coras7baeb712019-01-04 17:05:43 -0800320 vls_handle_t vlsh;
321 int rv, epfd;
Dave Wallace048b1d62018-01-03 22:24:41 -0500322
Florin Coras5f33d0d2021-06-02 21:22:21 -0700323 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -0500324
Florin Coras7baeb712019-01-04 17:05:43 -0800325 vlsh = ldp_fd_to_vlsh (fd);
326 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -0500327 {
Florin Coras7baeb712019-01-04 17:05:43 -0800328 epfd = vls_attr (vlsh, VPPCOM_ATTR_GET_LIBC_EPFD, 0, 0);
Dave Wallace048b1d62018-01-03 22:24:41 -0500329 if (epfd > 0)
330 {
Florin Coras7baeb712019-01-04 17:05:43 -0800331 LDBG (0, "fd %d: calling libc_close: epfd %u", fd, epfd);
Dave Wallace048b1d62018-01-03 22:24:41 -0500332
333 rv = libc_close (epfd);
334 if (rv < 0)
335 {
336 u32 size = sizeof (epfd);
337 epfd = 0;
338
Florin Coras7baeb712019-01-04 17:05:43 -0800339 (void) vls_attr (vlsh, VPPCOM_ATTR_SET_LIBC_EPFD, &epfd, &size);
Dave Wallace048b1d62018-01-03 22:24:41 -0500340 }
341 }
342 else if (PREDICT_FALSE (epfd < 0))
343 {
344 errno = -epfd;
345 rv = -1;
346 goto done;
347 }
348
Florin Coras7baeb712019-01-04 17:05:43 -0800349 LDBG (0, "fd %d: calling vls_close: vlsh %u", fd, vlsh);
Dave Wallace048b1d62018-01-03 22:24:41 -0500350
Florin Coras7baeb712019-01-04 17:05:43 -0800351 rv = vls_close (vlsh);
Dave Wallace048b1d62018-01-03 22:24:41 -0500352 if (rv != VPPCOM_OK)
353 {
354 errno = -rv;
355 rv = -1;
356 }
357 }
358 else
359 {
Florin Coras7baeb712019-01-04 17:05:43 -0800360 LDBG (0, "fd %d: calling libc_close", fd);
Dave Wallace048b1d62018-01-03 22:24:41 -0500361 rv = libc_close (fd);
362 }
363
364done:
Dave Wallace048b1d62018-01-03 22:24:41 -0500365 return rv;
366}
367
368ssize_t
369read (int fd, void *buf, size_t nbytes)
370{
Florin Coras7baeb712019-01-04 17:05:43 -0800371 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -0500372 ssize_t size;
Dave Wallace048b1d62018-01-03 22:24:41 -0500373
Florin Coras5f33d0d2021-06-02 21:22:21 -0700374 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -0500375
Florin Coras7baeb712019-01-04 17:05:43 -0800376 vlsh = ldp_fd_to_vlsh (fd);
377 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -0500378 {
Florin Coras7baeb712019-01-04 17:05:43 -0800379 size = vls_read (vlsh, buf, nbytes);
Dave Wallace048b1d62018-01-03 22:24:41 -0500380 if (size < 0)
381 {
382 errno = -size;
383 size = -1;
384 }
385 }
386 else
387 {
Dave Wallace048b1d62018-01-03 22:24:41 -0500388 size = libc_read (fd, buf, nbytes);
389 }
390
Dave Wallace048b1d62018-01-03 22:24:41 -0500391 return size;
392}
393
394ssize_t
395readv (int fd, const struct iovec * iov, int iovcnt)
396{
Dave Wallace8aaba562018-01-18 17:21:19 -0500397 int rv = 0, i, total = 0;
Florin Coras7baeb712019-01-04 17:05:43 -0800398 vls_handle_t vlsh;
399 ssize_t size = 0;
Dave Wallace048b1d62018-01-03 22:24:41 -0500400
Florin Coras5f33d0d2021-06-02 21:22:21 -0700401 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -0500402
Florin Coras7baeb712019-01-04 17:05:43 -0800403 vlsh = ldp_fd_to_vlsh (fd);
404 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -0500405 {
Florin Coras067f9542020-02-14 05:33:46 +0000406 for (i = 0; i < iovcnt; ++i)
Dave Wallace048b1d62018-01-03 22:24:41 -0500407 {
Florin Coras067f9542020-02-14 05:33:46 +0000408 rv = vls_read (vlsh, iov[i].iov_base, iov[i].iov_len);
409 if (rv <= 0)
410 break;
411 else
Dave Wallace048b1d62018-01-03 22:24:41 -0500412 {
Florin Coras067f9542020-02-14 05:33:46 +0000413 total += rv;
414 if (rv < iov[i].iov_len)
Dave Wallace048b1d62018-01-03 22:24:41 -0500415 break;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700416 }
417 }
Florin Coras067f9542020-02-14 05:33:46 +0000418 if (rv < 0 && total == 0)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700419 {
Dave Wallace048b1d62018-01-03 22:24:41 -0500420 errno = -rv;
421 size = -1;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700422 }
Dave Wallace048b1d62018-01-03 22:24:41 -0500423 else
424 size = total;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700425 }
426 else
427 {
Dave Wallace048b1d62018-01-03 22:24:41 -0500428 size = libc_readv (fd, iov, iovcnt);
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700429 }
430
Dave Wallace048b1d62018-01-03 22:24:41 -0500431 return size;
432}
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700433
Dave Wallace048b1d62018-01-03 22:24:41 -0500434ssize_t
435write (int fd, const void *buf, size_t nbytes)
436{
Florin Coras7baeb712019-01-04 17:05:43 -0800437 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -0500438 ssize_t size = 0;
Dave Wallace048b1d62018-01-03 22:24:41 -0500439
Florin Coras5f33d0d2021-06-02 21:22:21 -0700440 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -0500441
Florin Coras7baeb712019-01-04 17:05:43 -0800442 vlsh = ldp_fd_to_vlsh (fd);
443 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -0500444 {
Florin Coras7baeb712019-01-04 17:05:43 -0800445 size = vls_write_msg (vlsh, (void *) buf, nbytes);
Dave Wallace048b1d62018-01-03 22:24:41 -0500446 if (size < 0)
447 {
448 errno = -size;
449 size = -1;
450 }
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700451 }
452 else
453 {
Dave Wallace048b1d62018-01-03 22:24:41 -0500454 size = libc_write (fd, buf, nbytes);
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700455 }
456
Dave Wallace048b1d62018-01-03 22:24:41 -0500457 return size;
458}
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700459
Dave Wallace048b1d62018-01-03 22:24:41 -0500460ssize_t
461writev (int fd, const struct iovec * iov, int iovcnt)
462{
Dave Wallace048b1d62018-01-03 22:24:41 -0500463 ssize_t size = 0, total = 0;
Florin Coras7baeb712019-01-04 17:05:43 -0800464 vls_handle_t vlsh;
Dave Wallace8aaba562018-01-18 17:21:19 -0500465 int i, rv = 0;
Dave Wallace048b1d62018-01-03 22:24:41 -0500466
Florin Coras5f33d0d2021-06-02 21:22:21 -0700467 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -0500468
Florin Coras7baeb712019-01-04 17:05:43 -0800469 vlsh = ldp_fd_to_vlsh (fd);
470 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -0500471 {
Florin Coraseda1b8c2020-03-23 16:00:35 +0000472 for (i = 0; i < iovcnt; ++i)
Dave Wallace048b1d62018-01-03 22:24:41 -0500473 {
Florin Coraseda1b8c2020-03-23 16:00:35 +0000474 rv = vls_write_msg (vlsh, iov[i].iov_base, iov[i].iov_len);
475 if (rv < 0)
476 break;
477 else
Dave Wallace048b1d62018-01-03 22:24:41 -0500478 {
Florin Coraseda1b8c2020-03-23 16:00:35 +0000479 total += rv;
480 if (rv < iov[i].iov_len)
Dave Wallace048b1d62018-01-03 22:24:41 -0500481 break;
Dave Wallace048b1d62018-01-03 22:24:41 -0500482 }
483 }
Dave Wallace048b1d62018-01-03 22:24:41 -0500484
Florin Coraseda1b8c2020-03-23 16:00:35 +0000485 if (rv < 0 && total == 0)
Dave Wallace048b1d62018-01-03 22:24:41 -0500486 {
487 errno = -rv;
488 size = -1;
489 }
490 else
491 size = total;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700492 }
493 else
494 {
Dave Wallace048b1d62018-01-03 22:24:41 -0500495 size = libc_writev (fd, iov, iovcnt);
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700496 }
497
Dave Wallace048b1d62018-01-03 22:24:41 -0500498 return size;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700499}
500
Florin Coras0ab36f52020-05-26 19:45:45 +0000501static int
502fcntl_internal (int fd, int cmd, va_list ap)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700503{
Florin Coras7baeb712019-01-04 17:05:43 -0800504 vls_handle_t vlsh;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700505 int rv = 0;
Florin Coras7baeb712019-01-04 17:05:43 -0800506
507 vlsh = ldp_fd_to_vlsh (fd);
508 LDBG (0, "fd %u vlsh %d, cmd %u", fd, vlsh, cmd);
509 if (vlsh != VLS_INVALID_HANDLE)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700510 {
Dave Wallace048b1d62018-01-03 22:24:41 -0500511 int flags = va_arg (ap, int);
512 u32 size;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700513
Dave Wallace048b1d62018-01-03 22:24:41 -0500514 size = sizeof (flags);
515 rv = -EOPNOTSUPP;
516 switch (cmd)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700517 {
Dave Wallace048b1d62018-01-03 22:24:41 -0500518 case F_SETFL:
Florin Coras7baeb712019-01-04 17:05:43 -0800519 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_FLAGS, &flags, &size);
Dave Wallace048b1d62018-01-03 22:24:41 -0500520 break;
521
522 case F_GETFL:
Florin Coras7baeb712019-01-04 17:05:43 -0800523 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_FLAGS, &flags, &size);
Dave Wallace048b1d62018-01-03 22:24:41 -0500524 if (rv == VPPCOM_OK)
Florin Coras7baeb712019-01-04 17:05:43 -0800525 rv = flags;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700526 break;
Florin Coras173bae32018-11-16 18:56:28 -0800527 case F_SETFD:
528 /* TODO handle this */
529 LDBG (0, "F_SETFD ignored flags %u", flags);
530 rv = 0;
531 break;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700532 default:
Dave Wallace048b1d62018-01-03 22:24:41 -0500533 rv = -EOPNOTSUPP;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700534 break;
535 }
Dave Wallace048b1d62018-01-03 22:24:41 -0500536 if (rv < 0)
537 {
538 errno = -rv;
539 rv = -1;
540 }
541 }
542 else
543 {
Carl Smithe16707b2019-11-13 14:37:39 +1300544#ifdef HAVE_FCNTL64
545 rv = libc_vfcntl64 (fd, cmd, ap);
546#else
Dave Wallace048b1d62018-01-03 22:24:41 -0500547 rv = libc_vfcntl (fd, cmd, ap);
Carl Smithe16707b2019-11-13 14:37:39 +1300548#endif
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -0700549 }
550
Florin Coras0ab36f52020-05-26 19:45:45 +0000551 return rv;
552}
553
/**
 * Interposed fcntl(2): initializes LDP if needed and hands the variadic
 * arguments to fcntl_internal ().
 */
int
fcntl (int fd, int cmd, ...)
{
  va_list args;
  int result;

  ldp_init_check ();

  va_start (args, cmd);
  result = fcntl_internal (fd, cmd, args);
  va_end (args);

  return result;
}
568
/**
 * Interposed fcntl64: same handling as fcntl (), via fcntl_internal ().
 */
int
fcntl64 (int fd, int cmd, ...)
{
  va_list args;
  int result;

  ldp_init_check ();

  va_start (args, cmd);
  result = fcntl_internal (fd, cmd, args);
  va_end (args);

  return result;
}
582
583int
Dave Wallace048b1d62018-01-03 22:24:41 -0500584ioctl (int fd, unsigned long int cmd, ...)
585{
Florin Coras7baeb712019-01-04 17:05:43 -0800586 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -0500587 va_list ap;
Florin Coras7baeb712019-01-04 17:05:43 -0800588 int rv;
Dave Wallace048b1d62018-01-03 22:24:41 -0500589
Florin Coras5f33d0d2021-06-02 21:22:21 -0700590 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -0500591
592 va_start (ap, cmd);
Dave Wallace048b1d62018-01-03 22:24:41 -0500593
Florin Coras7baeb712019-01-04 17:05:43 -0800594 vlsh = ldp_fd_to_vlsh (fd);
595 if (vlsh != VLS_INVALID_HANDLE)
596 {
Dave Wallace048b1d62018-01-03 22:24:41 -0500597 switch (cmd)
598 {
599 case FIONREAD:
Florin Coras7baeb712019-01-04 17:05:43 -0800600 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_NREAD, 0, 0);
Dave Wallace048b1d62018-01-03 22:24:41 -0500601 break;
602
603 case FIONBIO:
604 {
605 u32 flags = va_arg (ap, int) ? O_NONBLOCK : 0;
606 u32 size = sizeof (flags);
607
608 /* TBD: When VPPCOM_ATTR_[GS]ET_FLAGS supports flags other than
609 * non-blocking, the flags should be read here and merged
610 * with O_NONBLOCK.
611 */
Florin Coras7baeb712019-01-04 17:05:43 -0800612 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_FLAGS, &flags, &size);
Dave Wallace048b1d62018-01-03 22:24:41 -0500613 }
614 break;
615
616 default:
617 rv = -EOPNOTSUPP;
618 break;
619 }
620 if (rv < 0)
621 {
622 errno = -rv;
623 rv = -1;
624 }
625 }
626 else
627 {
Dave Wallace048b1d62018-01-03 22:24:41 -0500628 rv = libc_vioctl (fd, cmd, ap);
629 }
630
Dave Wallace048b1d62018-01-03 22:24:41 -0500631 va_end (ap);
632 return rv;
633}
634
Florin Coras294afe22019-01-07 17:49:17 -0800635always_inline void
636ldp_select_init_maps (fd_set * __restrict original,
637 clib_bitmap_t ** resultb, clib_bitmap_t ** libcb,
638 clib_bitmap_t ** vclb, int nfds, u32 minbits,
639 u32 n_bytes, uword * si_bits, uword * libc_bits)
640{
641 uword si_bits_set, libc_bits_set;
642 vls_handle_t vlsh;
643 int fd;
644
645 clib_bitmap_validate (*vclb, minbits);
646 clib_bitmap_validate (*libcb, minbits);
647 clib_bitmap_validate (*resultb, minbits);
648 clib_memcpy_fast (*resultb, original, n_bytes);
649 memset (original, 0, n_bytes);
650
651 /* *INDENT-OFF* */
Damjan Marionf0ca1e82020-12-13 23:26:56 +0100652 clib_bitmap_foreach (fd, *resultb) {
Florin Coras294afe22019-01-07 17:49:17 -0800653 if (fd > nfds)
654 break;
655 vlsh = ldp_fd_to_vlsh (fd);
656 if (vlsh == VLS_INVALID_HANDLE)
657 clib_bitmap_set_no_check (*libcb, fd, 1);
658 else
Florin Corascbce80a2020-04-20 01:32:38 +0000659 *vclb = clib_bitmap_set (*vclb, vlsh_to_session_index (vlsh), 1);
Damjan Marionf0ca1e82020-12-13 23:26:56 +0100660 }
Florin Coras294afe22019-01-07 17:49:17 -0800661 /* *INDENT-ON* */
662
663 si_bits_set = clib_bitmap_last_set (*vclb) + 1;
664 *si_bits = (si_bits_set > *si_bits) ? si_bits_set : *si_bits;
Florin Corascbce80a2020-04-20 01:32:38 +0000665 clib_bitmap_validate (*resultb, *si_bits);
Florin Coras294afe22019-01-07 17:49:17 -0800666
667 libc_bits_set = clib_bitmap_last_set (*libcb) + 1;
668 *libc_bits = (libc_bits_set > *libc_bits) ? libc_bits_set : *libc_bits;
669}
670
671always_inline int
672ldp_select_vcl_map_to_libc (clib_bitmap_t * vclb, fd_set * __restrict libcb)
673{
674 vls_handle_t vlsh;
675 uword si;
676 int fd;
677
678 if (!libcb)
679 return 0;
680
681 /* *INDENT-OFF* */
Damjan Marionf0ca1e82020-12-13 23:26:56 +0100682 clib_bitmap_foreach (si, vclb) {
Florin Coras294afe22019-01-07 17:49:17 -0800683 vlsh = vls_session_index_to_vlsh (si);
Florin Coras54140622020-02-04 19:04:34 +0000684 ASSERT (vlsh != VLS_INVALID_HANDLE);
Florin Coras294afe22019-01-07 17:49:17 -0800685 fd = ldp_vlsh_to_fd (vlsh);
686 if (PREDICT_FALSE (fd < 0))
687 {
688 errno = EBADFD;
689 return -1;
690 }
691 FD_SET (fd, libcb);
Damjan Marionf0ca1e82020-12-13 23:26:56 +0100692 }
Florin Coras294afe22019-01-07 17:49:17 -0800693 /* *INDENT-ON* */
694
695 return 0;
696}
697
698always_inline void
699ldp_select_libc_map_merge (clib_bitmap_t * result, fd_set * __restrict libcb)
700{
701 uword fd;
702
Florin Coras78b5fa62019-02-21 20:04:15 -0800703 if (!libcb)
704 return;
705
Florin Coras294afe22019-01-07 17:49:17 -0800706 /* *INDENT-OFF* */
Damjan Marionf0ca1e82020-12-13 23:26:56 +0100707 clib_bitmap_foreach (fd, result)
Florin Coras294afe22019-01-07 17:49:17 -0800708 FD_SET ((int)fd, libcb);
Florin Coras294afe22019-01-07 17:49:17 -0800709 /* *INDENT-ON* */
710}
711
Dave Wallace048b1d62018-01-03 22:24:41 -0500712int
Dave Wallace2a865272018-02-07 21:00:42 -0500713ldp_pselect (int nfds, fd_set * __restrict readfds,
714 fd_set * __restrict writefds,
715 fd_set * __restrict exceptfds,
716 const struct timespec *__restrict timeout,
717 const __sigset_t * __restrict sigmask)
Dave Wallace048b1d62018-01-03 22:24:41 -0500718{
Florin Coras294afe22019-01-07 17:49:17 -0800719 u32 minbits = clib_max (nfds, BITS (uword)), n_bytes;
Florin Corasdfe4cf42018-11-28 22:13:45 -0800720 ldp_worker_ctx_t *ldpw = ldp_worker_get_current ();
Florin Coras294afe22019-01-07 17:49:17 -0800721 struct timespec libc_tspec = { 0 };
722 f64 time_out, vcl_timeout = 0;
723 uword si_bits, libc_bits;
724 int rv, bits_set = 0;
Dave Wallace048b1d62018-01-03 22:24:41 -0500725
726 if (nfds < 0)
727 {
728 errno = EINVAL;
729 return -1;
730 }
731
Florin Coras4dee8cd2019-01-29 21:28:16 -0800732 if (PREDICT_FALSE (ldpw->clib_time.init_cpu_time == 0))
733 clib_time_init (&ldpw->clib_time);
734
Dave Wallace3ee1fe12018-02-23 01:09:11 -0500735 if (timeout)
736 {
737 time_out = (timeout->tv_sec == 0 && timeout->tv_nsec == 0) ?
Florin Coras7baeb712019-01-04 17:05:43 -0800738 (f64) 0 : (f64) timeout->tv_sec + (f64) timeout->tv_nsec / (f64) 1e9;
Dave Wallace3ee1fe12018-02-23 01:09:11 -0500739
liuyacanf71796e2021-08-02 10:01:39 +0800740 time_out += clib_time_now (&ldpw->clib_time);
741
Dave Wallace3ee1fe12018-02-23 01:09:11 -0500742 /* select as fine grained sleep */
743 if (!nfds)
744 {
Florin Corasdfe4cf42018-11-28 22:13:45 -0800745 while (clib_time_now (&ldpw->clib_time) < time_out)
Dave Wallace3ee1fe12018-02-23 01:09:11 -0500746 ;
747 return 0;
748 }
749 }
750 else if (!nfds)
751 {
752 errno = EINVAL;
753 return -1;
754 }
755 else
756 time_out = -1;
757
Florin Coras7baeb712019-01-04 17:05:43 -0800758 if (nfds <= ldp->vlsh_bit_val)
Dave Wallace048b1d62018-01-03 22:24:41 -0500759 {
Dave Wallace048b1d62018-01-03 22:24:41 -0500760 rv = libc_pselect (nfds, readfds, writefds, exceptfds,
761 timeout, sigmask);
762 goto done;
763 }
764
Florin Coras294afe22019-01-07 17:49:17 -0800765 si_bits = libc_bits = 0;
766 n_bytes = nfds / 8 + ((nfds % 8) ? 1 : 0);
Florin Coras7baeb712019-01-04 17:05:43 -0800767
Dave Wallace048b1d62018-01-03 22:24:41 -0500768 if (readfds)
Florin Coras294afe22019-01-07 17:49:17 -0800769 ldp_select_init_maps (readfds, &ldpw->rd_bitmap, &ldpw->libc_rd_bitmap,
770 &ldpw->si_rd_bitmap, nfds, minbits, n_bytes,
771 &si_bits, &libc_bits);
Dave Wallace048b1d62018-01-03 22:24:41 -0500772 if (writefds)
Florin Coras294afe22019-01-07 17:49:17 -0800773 ldp_select_init_maps (writefds, &ldpw->wr_bitmap,
774 &ldpw->libc_wr_bitmap, &ldpw->si_wr_bitmap, nfds,
775 minbits, n_bytes, &si_bits, &libc_bits);
Dave Wallace048b1d62018-01-03 22:24:41 -0500776 if (exceptfds)
Florin Coras294afe22019-01-07 17:49:17 -0800777 ldp_select_init_maps (exceptfds, &ldpw->ex_bitmap,
778 &ldpw->libc_ex_bitmap, &ldpw->si_ex_bitmap, nfds,
779 minbits, n_bytes, &si_bits, &libc_bits);
Dave Wallace048b1d62018-01-03 22:24:41 -0500780
Florin Coras294afe22019-01-07 17:49:17 -0800781 if (PREDICT_FALSE (!si_bits && !libc_bits))
Dave Wallace048b1d62018-01-03 22:24:41 -0500782 {
783 errno = EINVAL;
784 rv = -1;
785 goto done;
786 }
787
Florin Coras78b5fa62019-02-21 20:04:15 -0800788 if (!si_bits)
789 libc_tspec = timeout ? *timeout : libc_tspec;
Florin Coras294afe22019-01-07 17:49:17 -0800790
Dave Wallace048b1d62018-01-03 22:24:41 -0500791 do
792 {
Florin Coras294afe22019-01-07 17:49:17 -0800793 if (si_bits)
Dave Wallace048b1d62018-01-03 22:24:41 -0500794 {
Dave Wallace048b1d62018-01-03 22:24:41 -0500795 if (readfds)
Florin Coras294afe22019-01-07 17:49:17 -0800796 clib_memcpy_fast (ldpw->rd_bitmap, ldpw->si_rd_bitmap,
Florin Corascbce80a2020-04-20 01:32:38 +0000797 vec_len (ldpw->si_rd_bitmap) *
Dave Barach178cf492018-11-13 16:34:13 -0500798 sizeof (clib_bitmap_t));
Dave Wallace048b1d62018-01-03 22:24:41 -0500799 if (writefds)
Florin Coras294afe22019-01-07 17:49:17 -0800800 clib_memcpy_fast (ldpw->wr_bitmap, ldpw->si_wr_bitmap,
Florin Corascbce80a2020-04-20 01:32:38 +0000801 vec_len (ldpw->si_wr_bitmap) *
Dave Barach178cf492018-11-13 16:34:13 -0500802 sizeof (clib_bitmap_t));
Dave Wallace048b1d62018-01-03 22:24:41 -0500803 if (exceptfds)
Florin Coras294afe22019-01-07 17:49:17 -0800804 clib_memcpy_fast (ldpw->ex_bitmap, ldpw->si_ex_bitmap,
Florin Corascbce80a2020-04-20 01:32:38 +0000805 vec_len (ldpw->si_ex_bitmap) *
Dave Barach178cf492018-11-13 16:34:13 -0500806 sizeof (clib_bitmap_t));
Florin Coras294afe22019-01-07 17:49:17 -0800807
Florin Coras0ef8ef22019-01-18 08:37:13 -0800808 rv = vls_select (si_bits, readfds ? ldpw->rd_bitmap : NULL,
809 writefds ? ldpw->wr_bitmap : NULL,
810 exceptfds ? ldpw->ex_bitmap : NULL, vcl_timeout);
Florin Coras294afe22019-01-07 17:49:17 -0800811 if (rv < 0)
812 {
813 errno = -rv;
814 rv = -1;
Florin Coras5e6222a2020-04-24 17:09:25 +0000815 goto done;
Florin Coras294afe22019-01-07 17:49:17 -0800816 }
817 else if (rv > 0)
818 {
819 if (ldp_select_vcl_map_to_libc (ldpw->rd_bitmap, readfds))
820 {
821 rv = -1;
822 goto done;
823 }
824
825 if (ldp_select_vcl_map_to_libc (ldpw->wr_bitmap, writefds))
826 {
827 rv = -1;
828 goto done;
829 }
830
831 if (ldp_select_vcl_map_to_libc (ldpw->ex_bitmap, exceptfds))
832 {
833 rv = -1;
834 goto done;
835 }
836 bits_set = rv;
837 }
838 }
839 if (libc_bits)
840 {
841 if (readfds)
842 clib_memcpy_fast (ldpw->rd_bitmap, ldpw->libc_rd_bitmap,
843 vec_len (ldpw->libc_rd_bitmap) *
844 sizeof (clib_bitmap_t));
845 if (writefds)
846 clib_memcpy_fast (ldpw->wr_bitmap, ldpw->libc_wr_bitmap,
847 vec_len (ldpw->libc_wr_bitmap) *
848 sizeof (clib_bitmap_t));
849 if (exceptfds)
850 clib_memcpy_fast (ldpw->ex_bitmap, ldpw->libc_ex_bitmap,
851 vec_len (ldpw->libc_ex_bitmap) *
852 sizeof (clib_bitmap_t));
853
Dave Wallace048b1d62018-01-03 22:24:41 -0500854 rv = libc_pselect (libc_bits,
Florin Coras294afe22019-01-07 17:49:17 -0800855 readfds ? (fd_set *) ldpw->rd_bitmap : NULL,
856 writefds ? (fd_set *) ldpw->wr_bitmap : NULL,
857 exceptfds ? (fd_set *) ldpw->ex_bitmap : NULL,
858 &libc_tspec, sigmask);
859 if (rv > 0)
860 {
861 ldp_select_libc_map_merge (ldpw->rd_bitmap, readfds);
862 ldp_select_libc_map_merge (ldpw->wr_bitmap, writefds);
863 ldp_select_libc_map_merge (ldpw->ex_bitmap, exceptfds);
864 bits_set += rv;
865 }
866 }
867
868 if (bits_set)
869 {
870 rv = bits_set;
871 goto done;
Dave Wallace048b1d62018-01-03 22:24:41 -0500872 }
873 }
Florin Corasdfe4cf42018-11-28 22:13:45 -0800874 while ((time_out == -1) || (clib_time_now (&ldpw->clib_time) < time_out));
Dave Wallace048b1d62018-01-03 22:24:41 -0500875 rv = 0;
876
877done:
878 /* TBD: set timeout to amount of time left */
Florin Corasdfe4cf42018-11-28 22:13:45 -0800879 clib_bitmap_zero (ldpw->rd_bitmap);
Florin Coras294afe22019-01-07 17:49:17 -0800880 clib_bitmap_zero (ldpw->si_rd_bitmap);
Florin Corasdfe4cf42018-11-28 22:13:45 -0800881 clib_bitmap_zero (ldpw->libc_rd_bitmap);
882 clib_bitmap_zero (ldpw->wr_bitmap);
Florin Coras294afe22019-01-07 17:49:17 -0800883 clib_bitmap_zero (ldpw->si_wr_bitmap);
Florin Corasdfe4cf42018-11-28 22:13:45 -0800884 clib_bitmap_zero (ldpw->libc_wr_bitmap);
885 clib_bitmap_zero (ldpw->ex_bitmap);
Florin Coras294afe22019-01-07 17:49:17 -0800886 clib_bitmap_zero (ldpw->si_ex_bitmap);
Florin Corasdfe4cf42018-11-28 22:13:45 -0800887 clib_bitmap_zero (ldpw->libc_ex_bitmap);
Dave Wallace048b1d62018-01-03 22:24:41 -0500888
Dave Wallace048b1d62018-01-03 22:24:41 -0500889 return rv;
890}
891
/*
 * select(2) interposer.
 *
 * Converts the optional microsecond-resolution timeval into a timespec and
 * hands the request to ldp_pselect() with a NULL signal mask. A NULL
 * timeout is passed through as NULL.
 */
int
select (int nfds, fd_set * __restrict readfds,
	fd_set * __restrict writefds,
	fd_set * __restrict exceptfds, struct timeval *__restrict timeout)
{
  struct timespec ts;
  struct timespec *tsp = NULL;

  if (timeout != NULL)
    {
      ts.tv_sec = timeout->tv_sec;
      /* microseconds -> nanoseconds */
      ts.tv_nsec = timeout->tv_usec * 1000;
      tsp = &ts;
    }

  return ldp_pselect (nfds, readfds, writefds, exceptfds, tsp, NULL);
}
907
#ifdef __USE_XOPEN2K
/*
 * pselect(2) interposer.
 *
 * Forwards all arguments, including the caller's signal mask, to
 * ldp_pselect(). The mask must be forwarded: ldp_pselect() hands it to
 * libc_pselect(), and dropping it would silently break callers that rely
 * on pselect() to atomically unblock signals while waiting.
 */
int
pselect (int nfds, fd_set * __restrict readfds,
	 fd_set * __restrict writefds,
	 fd_set * __restrict exceptfds,
	 const struct timespec *__restrict timeout,
	 const __sigset_t * __restrict sigmask)
{
  return ldp_pselect (nfds, readfds, writefds, exceptfds, timeout, sigmask);
}
#endif
919
Yu Ping7b74b072019-05-08 00:40:24 +0800920/* If transparent TLS mode is turned on, then ldp will load key and cert.
921 */
922static int
Florin Corasa5a9efd2021-01-05 17:03:29 -0800923load_cert_key_pair (void)
Yu Ping7b74b072019-05-08 00:40:24 +0800924{
Florin Corasa5a9efd2021-01-05 17:03:29 -0800925 char *cert_str = getenv (LDP_ENV_TLS_CERT);
926 char *key_str = getenv (LDP_ENV_TLS_KEY);
927 char cert_buf[4096], key_buf[4096];
928 int cert_size, key_size;
929 vppcom_cert_key_pair_t crypto;
930 int ckp_index;
Yu Ping7b74b072019-05-08 00:40:24 +0800931 FILE *fp;
932
Florin Corasa5a9efd2021-01-05 17:03:29 -0800933 if (!cert_str || !key_str)
Yu Ping7b74b072019-05-08 00:40:24 +0800934 {
935 LDBG (0, "ERROR: failed to read LDP environment %s\n",
936 LDP_ENV_TLS_CERT);
937 return -1;
938 }
Florin Corasa5a9efd2021-01-05 17:03:29 -0800939
940 fp = fopen (cert_str, "r");
941 if (fp == NULL)
942 {
943 LDBG (0, "ERROR: failed to open cert file %s \n", cert_str);
944 return -1;
945 }
946 cert_size = fread (cert_buf, sizeof (char), sizeof (cert_buf), fp);
947 fclose (fp);
948
949 fp = fopen (key_str, "r");
950 if (fp == NULL)
951 {
952 LDBG (0, "ERROR: failed to open key file %s \n", key_str);
953 return -1;
954 }
955 key_size = fread (key_buf, sizeof (char), sizeof (key_buf), fp);
956 fclose (fp);
957
958 crypto.cert = cert_buf;
959 crypto.key = key_buf;
960 crypto.cert_len = cert_size;
961 crypto.key_len = key_size;
962 ckp_index = vppcom_add_cert_key_pair (&crypto);
963 if (ckp_index < 0)
964 {
965 LDBG (0, "ERROR: failed to add cert key pair\n");
966 return -1;
967 }
968
969 ldp->ckpair_index = ckp_index;
970
Yu Ping7b74b072019-05-08 00:40:24 +0800971 return 0;
972}
973
974static int
Florin Corasa5a9efd2021-01-05 17:03:29 -0800975assign_cert_key_pair (vls_handle_t vlsh)
Yu Ping7b74b072019-05-08 00:40:24 +0800976{
Florin Corasa5a9efd2021-01-05 17:03:29 -0800977 uint32_t ckp_len;
Yu Ping7b74b072019-05-08 00:40:24 +0800978
Florin Corasa5a9efd2021-01-05 17:03:29 -0800979 if (ldp->ckpair_index == ~0 && load_cert_key_pair () < 0)
980 return -1;
981
982 ckp_len = sizeof (ldp->ckpair_index);
liuyacan276675e2021-08-30 13:24:53 +0800983 return vls_attr (vlsh, VPPCOM_ATTR_SET_CKPAIR, &ldp->ckpair_index, &ckp_len);
Yu Ping7b74b072019-05-08 00:40:24 +0800984}
985
Dave Wallace048b1d62018-01-03 22:24:41 -0500986int
987socket (int domain, int type, int protocol)
988{
Florin Coras7baeb712019-01-04 17:05:43 -0800989 int rv, sock_type = type & ~(SOCK_CLOEXEC | SOCK_NONBLOCK);
Dave Wallace048b1d62018-01-03 22:24:41 -0500990 u8 is_nonblocking = type & SOCK_NONBLOCK ? 1 : 0;
Florin Coras7baeb712019-01-04 17:05:43 -0800991 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -0500992
Florin Coras5f33d0d2021-06-02 21:22:21 -0700993 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -0500994
995 if (((domain == AF_INET) || (domain == AF_INET6)) &&
996 ((sock_type == SOCK_STREAM) || (sock_type == SOCK_DGRAM)))
997 {
Yu Ping7b74b072019-05-08 00:40:24 +0800998 u8 proto;
999 if (ldp->transparent_tls)
1000 {
1001 proto = VPPCOM_PROTO_TLS;
1002 }
1003 else
1004 proto = ((sock_type == SOCK_DGRAM) ?
1005 VPPCOM_PROTO_UDP : VPPCOM_PROTO_TCP);
Dave Wallace048b1d62018-01-03 22:24:41 -05001006
Florin Coras7baeb712019-01-04 17:05:43 -08001007 LDBG (0, "calling vls_create: proto %u (%s), is_nonblocking %u",
1008 proto, vppcom_proto_str (proto), is_nonblocking);
Dave Wallace048b1d62018-01-03 22:24:41 -05001009
Florin Coras7baeb712019-01-04 17:05:43 -08001010 vlsh = vls_create (proto, is_nonblocking);
1011 if (vlsh < 0)
Dave Wallace048b1d62018-01-03 22:24:41 -05001012 {
Florin Coras7baeb712019-01-04 17:05:43 -08001013 errno = -vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05001014 rv = -1;
1015 }
1016 else
1017 {
Yu Ping7b74b072019-05-08 00:40:24 +08001018 if (ldp->transparent_tls)
1019 {
Florin Corasa5a9efd2021-01-05 17:03:29 -08001020 if (assign_cert_key_pair (vlsh) < 0)
1021 return -1;
Yu Ping7b74b072019-05-08 00:40:24 +08001022 }
Florin Coras7baeb712019-01-04 17:05:43 -08001023 rv = ldp_vlsh_to_fd (vlsh);
Dave Wallace048b1d62018-01-03 22:24:41 -05001024 }
1025 }
1026 else
1027 {
Florin Coras7baeb712019-01-04 17:05:43 -08001028 LDBG (0, "calling libc_socket");
Dave Wallace048b1d62018-01-03 22:24:41 -05001029 rv = libc_socket (domain, type, protocol);
1030 }
1031
Dave Wallace048b1d62018-01-03 22:24:41 -05001032 return rv;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001033}
1034
/*
 * socketpair(2) interposer.
 *
 * Creates two connected sockets of type TYPE in domain DOMAIN using
 * protocol PROTOCOL and stores their descriptors in FDS[0] and FDS[1].
 * Requests for AF_INET/AF_INET6 stream or datagram pairs are not
 * implemented here and fail with ENOSYS; all other requests are passed to
 * libc_socketpair().
 * Returns 0 on success, -1 for errors.
 */
int
socketpair (int domain, int type, int protocol, int fds[2])
{
  int sock_type = type & ~(SOCK_CLOEXEC | SOCK_NONBLOCK);
  int is_inet, is_vcl_type;

  ldp_init_check ();

  is_inet = (domain == AF_INET) || (domain == AF_INET6);
  is_vcl_type = (sock_type == SOCK_STREAM) || (sock_type == SOCK_DGRAM);

  if (!(is_inet && is_vcl_type))
    {
      LDBG (1, "calling libc_socketpair");
      return libc_socketpair (domain, type, protocol, fds);
    }

  LDBG (0, "LDP-TBD");
  errno = ENOSYS;
  return -1;
}
1064
1065int
Florin Coras36847942023-02-02 12:56:16 -08001066bind (int fd, __CONST_SOCKADDR_ARG _addr, socklen_t len)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001067{
Florin Coras36847942023-02-02 12:56:16 -08001068 const struct sockaddr *addr = SOCKADDR_GET_SA (_addr);
Florin Coras7baeb712019-01-04 17:05:43 -08001069 vls_handle_t vlsh;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001070 int rv;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001071
Florin Coras5f33d0d2021-06-02 21:22:21 -07001072 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001073
Florin Coras7baeb712019-01-04 17:05:43 -08001074 vlsh = ldp_fd_to_vlsh (fd);
1075 if (vlsh != VLS_INVALID_HANDLE)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001076 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001077 vppcom_endpt_t ep;
1078
Dave Wallace048b1d62018-01-03 22:24:41 -05001079 switch (addr->sa_family)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001080 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001081 case AF_INET:
1082 if (len != sizeof (struct sockaddr_in))
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001083 {
Florin Coras7baeb712019-01-04 17:05:43 -08001084 LDBG (0, "ERROR: fd %d: vlsh %u: Invalid AF_INET addr len %u!",
1085 fd, vlsh, len);
Dave Wallace048b1d62018-01-03 22:24:41 -05001086 errno = EINVAL;
1087 rv = -1;
1088 goto done;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001089 }
Dave Wallace048b1d62018-01-03 22:24:41 -05001090 ep.is_ip4 = VPPCOM_IS_IP4;
1091 ep.ip = (u8 *) & ((const struct sockaddr_in *) addr)->sin_addr;
1092 ep.port = (u16) ((const struct sockaddr_in *) addr)->sin_port;
1093 break;
1094
1095 case AF_INET6:
1096 if (len != sizeof (struct sockaddr_in6))
1097 {
Florin Coras7baeb712019-01-04 17:05:43 -08001098 LDBG (0, "ERROR: fd %d: vlsh %u: Invalid AF_INET6 addr len %u!",
1099 fd, vlsh, len);
Dave Wallace048b1d62018-01-03 22:24:41 -05001100 errno = EINVAL;
1101 rv = -1;
1102 goto done;
1103 }
1104 ep.is_ip4 = VPPCOM_IS_IP6;
1105 ep.ip = (u8 *) & ((const struct sockaddr_in6 *) addr)->sin6_addr;
1106 ep.port = (u16) ((const struct sockaddr_in6 *) addr)->sin6_port;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001107 break;
1108
1109 default:
Florin Coras7baeb712019-01-04 17:05:43 -08001110 LDBG (0, "ERROR: fd %d: vlsh %u: Unsupported address family %u!",
1111 fd, vlsh, addr->sa_family);
Dave Wallace048b1d62018-01-03 22:24:41 -05001112 errno = EAFNOSUPPORT;
1113 rv = -1;
1114 goto done;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001115 }
Florin Coras7baeb712019-01-04 17:05:43 -08001116 LDBG (0, "fd %d: calling vls_bind: vlsh %u, addr %p, len %u", fd, vlsh,
1117 addr, len);
Dave Wallace048b1d62018-01-03 22:24:41 -05001118
Florin Coras7baeb712019-01-04 17:05:43 -08001119 rv = vls_bind (vlsh, &ep);
Dave Wallace048b1d62018-01-03 22:24:41 -05001120 if (rv != VPPCOM_OK)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001121 {
1122 errno = -rv;
Dave Wallace048b1d62018-01-03 22:24:41 -05001123 rv = -1;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001124 }
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001125 }
Dave Wallace048b1d62018-01-03 22:24:41 -05001126 else
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001127 {
Florin Coras7baeb712019-01-04 17:05:43 -08001128 LDBG (0, "fd %d: calling libc_bind: addr %p, len %u", fd, addr, len);
Dave Wallace048b1d62018-01-03 22:24:41 -05001129 rv = libc_bind (fd, addr, len);
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001130 }
1131
Dave Wallace048b1d62018-01-03 22:24:41 -05001132done:
Florin Coras7baeb712019-01-04 17:05:43 -08001133 LDBG (1, "fd %d: returning %d", fd, rv);
Florin Coras05ecfcc2018-12-12 18:19:39 -08001134
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001135 return rv;
1136}
1137
1138static inline int
Florin Coras36847942023-02-02 12:56:16 -08001139ldp_copy_ep_to_sockaddr (struct sockaddr *addr, socklen_t *__restrict len,
1140 vppcom_endpt_t *ep)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001141{
Florin Coras36847942023-02-02 12:56:16 -08001142 int rv = 0, sa_len, copy_len;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001143
Florin Coras5f33d0d2021-06-02 21:22:21 -07001144 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001145
1146 if (addr && len && ep)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001147 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001148 addr->sa_family = (ep->is_ip4 == VPPCOM_IS_IP4) ? AF_INET : AF_INET6;
1149 switch (addr->sa_family)
1150 {
1151 case AF_INET:
1152 ((struct sockaddr_in *) addr)->sin_port = ep->port;
1153 if (*len > sizeof (struct sockaddr_in))
1154 *len = sizeof (struct sockaddr_in);
1155 sa_len = sizeof (struct sockaddr_in) - sizeof (struct in_addr);
1156 copy_len = *len - sa_len;
1157 if (copy_len > 0)
1158 memcpy (&((struct sockaddr_in *) addr)->sin_addr, ep->ip,
1159 copy_len);
1160 break;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001161
Dave Wallace048b1d62018-01-03 22:24:41 -05001162 case AF_INET6:
1163 ((struct sockaddr_in6 *) addr)->sin6_port = ep->port;
1164 if (*len > sizeof (struct sockaddr_in6))
1165 *len = sizeof (struct sockaddr_in6);
1166 sa_len = sizeof (struct sockaddr_in6) - sizeof (struct in6_addr);
1167 copy_len = *len - sa_len;
1168 if (copy_len > 0)
1169 memcpy (((struct sockaddr_in6 *) addr)->sin6_addr.
1170 __in6_u.__u6_addr8, ep->ip, copy_len);
1171 break;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001172
Dave Wallace048b1d62018-01-03 22:24:41 -05001173 default:
1174 /* Not possible */
1175 rv = -EAFNOSUPPORT;
1176 break;
1177 }
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001178 }
Dave Wallacee695cb42017-11-02 22:04:42 -04001179 return rv;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001180}
1181
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001182int
Florin Coras36847942023-02-02 12:56:16 -08001183getsockname (int fd, __SOCKADDR_ARG _addr, socklen_t *__restrict len)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001184{
Florin Coras36847942023-02-02 12:56:16 -08001185 struct sockaddr *addr = SOCKADDR_GET_SA (_addr);
Florin Coras7baeb712019-01-04 17:05:43 -08001186 vls_handle_t vlsh;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001187 int rv;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001188
Florin Coras5f33d0d2021-06-02 21:22:21 -07001189 ldp_init_check ();
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001190
Florin Coras7baeb712019-01-04 17:05:43 -08001191 vlsh = ldp_fd_to_vlsh (fd);
1192 if (vlsh != VLS_INVALID_HANDLE)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001193 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001194 vppcom_endpt_t ep;
1195 u8 addr_buf[sizeof (struct in6_addr)];
1196 u32 size = sizeof (ep);
1197
1198 ep.ip = addr_buf;
Dave Wallace048b1d62018-01-03 22:24:41 -05001199
Florin Coras7baeb712019-01-04 17:05:43 -08001200 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_LCL_ADDR, &ep, &size);
Dave Wallace048b1d62018-01-03 22:24:41 -05001201 if (rv != VPPCOM_OK)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001202 {
1203 errno = -rv;
Dave Wallace048b1d62018-01-03 22:24:41 -05001204 rv = -1;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001205 }
Dave Wallace048b1d62018-01-03 22:24:41 -05001206 else
1207 {
Dave Wallace2a865272018-02-07 21:00:42 -05001208 rv = ldp_copy_ep_to_sockaddr (addr, len, &ep);
Dave Wallace048b1d62018-01-03 22:24:41 -05001209 if (rv != VPPCOM_OK)
1210 {
1211 errno = -rv;
1212 rv = -1;
1213 }
1214 }
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001215 }
1216 else
1217 {
Florin Coras36847942023-02-02 12:56:16 -08001218 rv = libc_getsockname (fd, _addr, len);
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001219 }
1220
Dave Wallace048b1d62018-01-03 22:24:41 -05001221 return rv;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001222}
1223
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001224int
Florin Coras36847942023-02-02 12:56:16 -08001225connect (int fd, __CONST_SOCKADDR_ARG _addr, socklen_t len)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001226{
Florin Coras36847942023-02-02 12:56:16 -08001227 const struct sockaddr *addr = SOCKADDR_GET_SA (_addr);
Florin Coras7baeb712019-01-04 17:05:43 -08001228 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05001229 int rv;
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07001230
Florin Coras5f33d0d2021-06-02 21:22:21 -07001231 ldp_init_check ();
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07001232
Dave Wallace048b1d62018-01-03 22:24:41 -05001233 if (!addr)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001234 {
Florin Coras7baeb712019-01-04 17:05:43 -08001235 LDBG (0, "ERROR: fd %d: NULL addr, len %u", fd, len);
Dave Wallace048b1d62018-01-03 22:24:41 -05001236 errno = EINVAL;
1237 rv = -1;
1238 goto done;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07001239 }
1240
Florin Coras7baeb712019-01-04 17:05:43 -08001241 vlsh = ldp_fd_to_vlsh (fd);
1242 if (vlsh != VLS_INVALID_HANDLE)
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07001243 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001244 vppcom_endpt_t ep;
1245
Dave Wallace048b1d62018-01-03 22:24:41 -05001246 switch (addr->sa_family)
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07001247 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001248 case AF_INET:
1249 if (len != sizeof (struct sockaddr_in))
1250 {
Florin Coras7baeb712019-01-04 17:05:43 -08001251 LDBG (0, "fd %d: ERROR vlsh %u: Invalid AF_INET addr len %u!",
1252 fd, vlsh, len);
Dave Wallace048b1d62018-01-03 22:24:41 -05001253 errno = EINVAL;
1254 rv = -1;
1255 goto done;
1256 }
1257 ep.is_ip4 = VPPCOM_IS_IP4;
1258 ep.ip = (u8 *) & ((const struct sockaddr_in *) addr)->sin_addr;
1259 ep.port = (u16) ((const struct sockaddr_in *) addr)->sin_port;
1260 break;
1261
1262 case AF_INET6:
1263 if (len != sizeof (struct sockaddr_in6))
1264 {
Florin Coras7baeb712019-01-04 17:05:43 -08001265 LDBG (0, "fd %d: ERROR vlsh %u: Invalid AF_INET6 addr len %u!",
1266 fd, vlsh, len);
Dave Wallace048b1d62018-01-03 22:24:41 -05001267 errno = EINVAL;
1268 rv = -1;
1269 goto done;
1270 }
1271 ep.is_ip4 = VPPCOM_IS_IP6;
1272 ep.ip = (u8 *) & ((const struct sockaddr_in6 *) addr)->sin6_addr;
1273 ep.port = (u16) ((const struct sockaddr_in6 *) addr)->sin6_port;
1274 break;
1275
1276 default:
Florin Coras7baeb712019-01-04 17:05:43 -08001277 LDBG (0, "fd %d: ERROR vlsh %u: Unsupported address family %u!",
1278 fd, vlsh, addr->sa_family);
Dave Wallace048b1d62018-01-03 22:24:41 -05001279 errno = EAFNOSUPPORT;
1280 rv = -1;
1281 goto done;
1282 }
Florin Coras7baeb712019-01-04 17:05:43 -08001283 LDBG (0, "fd %d: calling vls_connect(): vlsh %u addr %p len %u", fd,
1284 vlsh, addr, len);
Dave Wallace048b1d62018-01-03 22:24:41 -05001285
Florin Coras7baeb712019-01-04 17:05:43 -08001286 rv = vls_connect (vlsh, &ep);
Dave Wallace048b1d62018-01-03 22:24:41 -05001287 if (rv != VPPCOM_OK)
1288 {
1289 errno = -rv;
1290 rv = -1;
1291 }
1292 }
1293 else
1294 {
Florin Coras7baeb712019-01-04 17:05:43 -08001295 LDBG (0, "fd %d: calling libc_connect(): addr %p, len %u",
1296 fd, addr, len);
Dave Wallace048b1d62018-01-03 22:24:41 -05001297
1298 rv = libc_connect (fd, addr, len);
1299 }
1300
1301done:
Florin Coras7baeb712019-01-04 17:05:43 -08001302 LDBG (1, "fd %d: returning %d (0x%x)", fd, rv, rv);
Dave Wallace048b1d62018-01-03 22:24:41 -05001303 return rv;
1304}
1305
1306int
Florin Coras36847942023-02-02 12:56:16 -08001307getpeername (int fd, __SOCKADDR_ARG _addr, socklen_t *__restrict len)
Dave Wallace048b1d62018-01-03 22:24:41 -05001308{
Florin Coras36847942023-02-02 12:56:16 -08001309 struct sockaddr *addr = SOCKADDR_GET_SA (_addr);
Florin Coras7baeb712019-01-04 17:05:43 -08001310 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05001311 int rv;
Dave Wallace048b1d62018-01-03 22:24:41 -05001312
Florin Coras5f33d0d2021-06-02 21:22:21 -07001313 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001314
Florin Coras7baeb712019-01-04 17:05:43 -08001315 vlsh = ldp_fd_to_vlsh (fd);
1316 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05001317 {
1318 vppcom_endpt_t ep;
1319 u8 addr_buf[sizeof (struct in6_addr)];
1320 u32 size = sizeof (ep);
1321
1322 ep.ip = addr_buf;
Florin Coras7baeb712019-01-04 17:05:43 -08001323 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_PEER_ADDR, &ep, &size);
Dave Wallace048b1d62018-01-03 22:24:41 -05001324 if (rv != VPPCOM_OK)
1325 {
1326 errno = -rv;
1327 rv = -1;
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07001328 }
1329 else
1330 {
Dave Wallace2a865272018-02-07 21:00:42 -05001331 rv = ldp_copy_ep_to_sockaddr (addr, len, &ep);
Dave Wallace048b1d62018-01-03 22:24:41 -05001332 if (rv != VPPCOM_OK)
1333 {
1334 errno = -rv;
1335 rv = -1;
1336 }
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07001337 }
1338 }
Dave Wallace048b1d62018-01-03 22:24:41 -05001339 else
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07001340 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001341 rv = libc_getpeername (fd, addr, len);
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07001342 }
1343
Dave Wallace048b1d62018-01-03 22:24:41 -05001344 return rv;
1345}
1346
1347ssize_t
1348send (int fd, const void *buf, size_t n, int flags)
1349{
Florin Coras7baeb712019-01-04 17:05:43 -08001350 vls_handle_t vlsh = ldp_fd_to_vlsh (fd);
Dave Wallace048b1d62018-01-03 22:24:41 -05001351 ssize_t size;
Dave Wallace048b1d62018-01-03 22:24:41 -05001352
Florin Coras5f33d0d2021-06-02 21:22:21 -07001353 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001354
Florin Coras7baeb712019-01-04 17:05:43 -08001355 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05001356 {
Florin Coras7baeb712019-01-04 17:05:43 -08001357 size = vls_sendto (vlsh, (void *) buf, n, flags, NULL);
qchangaa8f63c2018-05-30 11:44:18 -07001358 if (size < VPPCOM_OK)
Dave Wallace048b1d62018-01-03 22:24:41 -05001359 {
1360 errno = -size;
1361 size = -1;
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07001362 }
1363 }
Dave Wallace048b1d62018-01-03 22:24:41 -05001364 else
1365 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001366 size = libc_send (fd, buf, n, flags);
1367 }
1368
Dave Wallace048b1d62018-01-03 22:24:41 -05001369 return size;
1370}
1371
1372ssize_t
1373sendfile (int out_fd, int in_fd, off_t * offset, size_t len)
1374{
Florin Corasdfe4cf42018-11-28 22:13:45 -08001375 ldp_worker_ctx_t *ldpw = ldp_worker_get_current ();
Florin Coras7baeb712019-01-04 17:05:43 -08001376 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05001377 ssize_t size = 0;
Dave Wallace048b1d62018-01-03 22:24:41 -05001378
Florin Coras5f33d0d2021-06-02 21:22:21 -07001379 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001380
Florin Coras7baeb712019-01-04 17:05:43 -08001381 vlsh = ldp_fd_to_vlsh (out_fd);
1382 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05001383 {
1384 int rv;
1385 ssize_t results = 0;
1386 size_t n_bytes_left = len;
1387 size_t bytes_to_read;
1388 int nbytes;
Dave Wallace048b1d62018-01-03 22:24:41 -05001389 u8 eagain = 0;
1390 u32 flags, flags_len = sizeof (flags);
1391
Florin Coras7baeb712019-01-04 17:05:43 -08001392 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_FLAGS, &flags, &flags_len);
Dave Wallace048b1d62018-01-03 22:24:41 -05001393 if (PREDICT_FALSE (rv != VPPCOM_OK))
1394 {
Florin Coras7baeb712019-01-04 17:05:43 -08001395 LDBG (0, "ERROR: out fd %d: vls_attr: vlsh %u, returned %d (%s)!",
1396 out_fd, vlsh, rv, vppcom_retval_str (rv));
Dave Wallace048b1d62018-01-03 22:24:41 -05001397
Florin Corasdfe4cf42018-11-28 22:13:45 -08001398 vec_reset_length (ldpw->io_buffer);
Dave Wallace048b1d62018-01-03 22:24:41 -05001399 errno = -rv;
1400 size = -1;
1401 goto done;
1402 }
1403
1404 if (offset)
1405 {
1406 off_t off = lseek (in_fd, *offset, SEEK_SET);
1407 if (PREDICT_FALSE (off == -1))
1408 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001409 size = -1;
1410 goto done;
1411 }
1412
1413 ASSERT (off == *offset);
1414 }
1415
1416 do
1417 {
Florin Coras7baeb712019-01-04 17:05:43 -08001418 size = vls_attr (vlsh, VPPCOM_ATTR_GET_NWRITE, 0, 0);
Dave Wallace048b1d62018-01-03 22:24:41 -05001419 if (size < 0)
1420 {
Florin Coraseb801d02020-09-16 17:44:58 -07001421 LDBG (0, "ERROR: fd %d: vls_attr: vlsh %u returned %ld (%s)!",
Florin Coras7baeb712019-01-04 17:05:43 -08001422 out_fd, vlsh, size, vppcom_retval_str (size));
Florin Corasdfe4cf42018-11-28 22:13:45 -08001423 vec_reset_length (ldpw->io_buffer);
Dave Wallace048b1d62018-01-03 22:24:41 -05001424 errno = -size;
1425 size = -1;
1426 goto done;
1427 }
1428
1429 bytes_to_read = size;
Dave Wallace048b1d62018-01-03 22:24:41 -05001430 if (bytes_to_read == 0)
1431 {
1432 if (flags & O_NONBLOCK)
1433 {
1434 if (!results)
Florin Coras7baeb712019-01-04 17:05:43 -08001435 eagain = 1;
Dave Wallace048b1d62018-01-03 22:24:41 -05001436 goto update_offset;
1437 }
1438 else
1439 continue;
1440 }
1441 bytes_to_read = clib_min (n_bytes_left, bytes_to_read);
Florin Corasdfe4cf42018-11-28 22:13:45 -08001442 vec_validate (ldpw->io_buffer, bytes_to_read);
1443 nbytes = libc_read (in_fd, ldpw->io_buffer, bytes_to_read);
Dave Wallace048b1d62018-01-03 22:24:41 -05001444 if (nbytes < 0)
1445 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001446 if (results == 0)
1447 {
Florin Corasdfe4cf42018-11-28 22:13:45 -08001448 vec_reset_length (ldpw->io_buffer);
Dave Wallace048b1d62018-01-03 22:24:41 -05001449 size = -1;
1450 goto done;
1451 }
1452 goto update_offset;
1453 }
Dave Wallace048b1d62018-01-03 22:24:41 -05001454
Florin Coras7baeb712019-01-04 17:05:43 -08001455 size = vls_write (vlsh, ldpw->io_buffer, nbytes);
Dave Wallace048b1d62018-01-03 22:24:41 -05001456 if (size < 0)
1457 {
1458 if (size == VPPCOM_EAGAIN)
1459 {
1460 if (flags & O_NONBLOCK)
1461 {
1462 if (!results)
Florin Coras7baeb712019-01-04 17:05:43 -08001463 eagain = 1;
Dave Wallace048b1d62018-01-03 22:24:41 -05001464 goto update_offset;
1465 }
1466 else
1467 continue;
1468 }
Dave Wallace048b1d62018-01-03 22:24:41 -05001469 if (results == 0)
1470 {
Florin Corasdfe4cf42018-11-28 22:13:45 -08001471 vec_reset_length (ldpw->io_buffer);
Dave Wallace048b1d62018-01-03 22:24:41 -05001472 errno = -size;
1473 size = -1;
1474 goto done;
1475 }
1476 goto update_offset;
1477 }
1478
1479 results += nbytes;
1480 ASSERT (n_bytes_left >= nbytes);
1481 n_bytes_left = n_bytes_left - nbytes;
1482 }
1483 while (n_bytes_left > 0);
1484
1485 update_offset:
Florin Corasdfe4cf42018-11-28 22:13:45 -08001486 vec_reset_length (ldpw->io_buffer);
Dave Wallace048b1d62018-01-03 22:24:41 -05001487 if (offset)
1488 {
1489 off_t off = lseek (in_fd, *offset, SEEK_SET);
1490 if (PREDICT_FALSE (off == -1))
1491 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001492 size = -1;
1493 goto done;
1494 }
1495
1496 ASSERT (off == *offset);
1497 *offset += results + 1;
1498 }
1499 if (eagain)
1500 {
1501 errno = EAGAIN;
1502 size = -1;
1503 }
1504 else
1505 size = results;
1506 }
1507 else
1508 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001509 size = libc_sendfile (out_fd, in_fd, offset, len);
1510 }
1511
1512done:
Dave Wallace048b1d62018-01-03 22:24:41 -05001513 return size;
1514}
1515
/*
 * sendfile64() interposer: identical to sendfile(), to which it delegates
 * with unchanged arguments.
 */
ssize_t
sendfile64 (int out_fd, int in_fd, off_t * offset, size_t len)
{
  ssize_t n_sent = sendfile (out_fd, in_fd, offset, len);

  return n_sent;
}
1521
1522ssize_t
1523recv (int fd, void *buf, size_t n, int flags)
1524{
Florin Coras7baeb712019-01-04 17:05:43 -08001525 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05001526 ssize_t size;
Dave Wallace048b1d62018-01-03 22:24:41 -05001527
Florin Coras5f33d0d2021-06-02 21:22:21 -07001528 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001529
Florin Coras7baeb712019-01-04 17:05:43 -08001530 vlsh = ldp_fd_to_vlsh (fd);
1531 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05001532 {
Florin Coras7baeb712019-01-04 17:05:43 -08001533 size = vls_recvfrom (vlsh, buf, n, flags, NULL);
Dave Wallace048b1d62018-01-03 22:24:41 -05001534 if (size < 0)
Florin Coras2a6642e2020-03-24 15:24:29 +00001535 {
1536 errno = -size;
1537 size = -1;
1538 }
Dave Wallace048b1d62018-01-03 22:24:41 -05001539 }
1540 else
1541 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001542 size = libc_recv (fd, buf, n, flags);
1543 }
1544
Dave Wallace048b1d62018-01-03 22:24:41 -05001545 return size;
1546}
1547
/*
 * Buffer-size-checked recv() entry point.
 *
 * Returns -1 without reading anything when the requested length n exceeds
 * the destination size buflen; otherwise behaves exactly like recv().
 */
ssize_t
__recv_chk (int fd, void *buf, size_t n, size_t buflen, int flags)
{
  return (n <= buflen) ? recv (fd, buf, n, flags) : -1;
}
1556
Dou Chao243a0432022-11-29 19:41:34 +08001557static inline int
1558ldp_vls_sendo (vls_handle_t vlsh, const void *buf, size_t n,
Florin Coraseff5f7a2023-02-07 17:36:17 -08001559 vppcom_endpt_tlv_t *app_tlvs, int flags,
Florin Coras36847942023-02-02 12:56:16 -08001560 __CONST_SOCKADDR_ARG _addr, socklen_t addr_len)
Florin Corasce17f462020-05-22 20:36:29 +00001561{
Florin Coras36847942023-02-02 12:56:16 -08001562 const struct sockaddr *addr = SOCKADDR_GET_SA (_addr);
Florin Corasce17f462020-05-22 20:36:29 +00001563 vppcom_endpt_t *ep = 0;
1564 vppcom_endpt_t _ep;
1565
Florin Coraseff5f7a2023-02-07 17:36:17 -08001566 _ep.app_tlvs = app_tlvs;
Dou Chao243a0432022-11-29 19:41:34 +08001567
Florin Corasce17f462020-05-22 20:36:29 +00001568 if (addr)
1569 {
1570 ep = &_ep;
1571 switch (addr->sa_family)
1572 {
1573 case AF_INET:
1574 ep->is_ip4 = VPPCOM_IS_IP4;
1575 ep->ip =
1576 (uint8_t *) & ((const struct sockaddr_in *) addr)->sin_addr;
1577 ep->port = (uint16_t) ((const struct sockaddr_in *) addr)->sin_port;
1578 break;
1579
1580 case AF_INET6:
1581 ep->is_ip4 = VPPCOM_IS_IP6;
1582 ep->ip =
1583 (uint8_t *) & ((const struct sockaddr_in6 *) addr)->sin6_addr;
1584 ep->port =
1585 (uint16_t) ((const struct sockaddr_in6 *) addr)->sin6_port;
1586 break;
1587
1588 default:
1589 return EAFNOSUPPORT;
1590 }
1591 }
1592
1593 return vls_sendto (vlsh, (void *) buf, n, flags, ep);
1594}
1595
1596static int
Florin Coras36847942023-02-02 12:56:16 -08001597ldp_vls_recvfrom (vls_handle_t vlsh, void *__restrict buf, size_t n, int flags,
1598 __SOCKADDR_ARG _addr, socklen_t *__restrict addr_len)
Florin Corasce17f462020-05-22 20:36:29 +00001599{
1600 u8 src_addr[sizeof (struct sockaddr_in6)];
Florin Coras36847942023-02-02 12:56:16 -08001601 struct sockaddr *addr = SOCKADDR_GET_SA (_addr);
Florin Corasce17f462020-05-22 20:36:29 +00001602 vppcom_endpt_t ep;
1603 ssize_t size;
1604 int rv;
1605
1606 if (addr)
1607 {
1608 ep.ip = src_addr;
1609 size = vls_recvfrom (vlsh, buf, n, flags, &ep);
1610
1611 if (size > 0)
1612 {
1613 rv = ldp_copy_ep_to_sockaddr (addr, addr_len, &ep);
1614 if (rv < 0)
1615 size = rv;
1616 }
1617 }
1618 else
1619 size = vls_recvfrom (vlsh, buf, n, flags, NULL);
1620
1621 return size;
1622}
1623
Dave Wallace048b1d62018-01-03 22:24:41 -05001624ssize_t
1625sendto (int fd, const void *buf, size_t n, int flags,
Florin Coras36847942023-02-02 12:56:16 -08001626 __CONST_SOCKADDR_ARG _addr, socklen_t addr_len)
Dave Wallace048b1d62018-01-03 22:24:41 -05001627{
Florin Coras36847942023-02-02 12:56:16 -08001628 const struct sockaddr *addr = SOCKADDR_GET_SA (_addr);
Florin Coras7baeb712019-01-04 17:05:43 -08001629 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05001630 ssize_t size;
Dave Wallace048b1d62018-01-03 22:24:41 -05001631
Florin Coras5f33d0d2021-06-02 21:22:21 -07001632 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001633
Florin Coras7baeb712019-01-04 17:05:43 -08001634 vlsh = ldp_fd_to_vlsh (fd);
wanghanlin97c6e0d2021-07-06 15:01:48 +08001635 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05001636 {
Dou Chao243a0432022-11-29 19:41:34 +08001637 size = ldp_vls_sendo (vlsh, buf, n, NULL, flags, addr, addr_len);
Dave Wallace048b1d62018-01-03 22:24:41 -05001638 if (size < 0)
1639 {
1640 errno = -size;
1641 size = -1;
1642 }
1643 }
1644 else
1645 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001646 size = libc_sendto (fd, buf, n, flags, addr, addr_len);
1647 }
1648
Dave Wallace048b1d62018-01-03 22:24:41 -05001649 return size;
1650}
1651
1652ssize_t
1653recvfrom (int fd, void *__restrict buf, size_t n, int flags,
1654 __SOCKADDR_ARG addr, socklen_t * __restrict addr_len)
1655{
Florin Corasce17f462020-05-22 20:36:29 +00001656 vls_handle_t vlsh;
1657 ssize_t size;
Dave Wallace048b1d62018-01-03 22:24:41 -05001658
Florin Coras5f33d0d2021-06-02 21:22:21 -07001659 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001660
Florin Corasce17f462020-05-22 20:36:29 +00001661 vlsh = ldp_fd_to_vlsh (fd);
1662 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05001663 {
Florin Corasce17f462020-05-22 20:36:29 +00001664 size = ldp_vls_recvfrom (vlsh, buf, n, flags, addr, addr_len);
Dave Wallace048b1d62018-01-03 22:24:41 -05001665 if (size < 0)
1666 {
1667 errno = -size;
1668 size = -1;
1669 }
1670 }
1671 else
1672 {
Dave Wallace048b1d62018-01-03 22:24:41 -05001673 size = libc_recvfrom (fd, buf, n, flags, addr, addr_len);
1674 }
1675
Dave Wallace048b1d62018-01-03 22:24:41 -05001676 return size;
1677}
1678
Florin Coraseff5f7a2023-02-07 17:36:17 -08001679static int
1680ldp_parse_cmsg (vls_handle_t vlsh, const struct msghdr *msg,
1681 vppcom_endpt_tlv_t **app_tlvs)
1682{
1683 uint8_t *ad, *at = (uint8_t *) *app_tlvs;
1684 vppcom_endpt_tlv_t *adh;
1685 struct in_pktinfo *pi;
1686 struct cmsghdr *cmsg;
1687
1688 cmsg = CMSG_FIRSTHDR (msg);
1689
1690 while (cmsg != NULL)
1691 {
1692 switch (cmsg->cmsg_level)
1693 {
1694 case SOL_UDP:
1695 switch (cmsg->cmsg_type)
1696 {
1697 case UDP_SEGMENT:
1698 vec_add2 (at, adh, sizeof (*adh));
1699 adh->data_type = VCL_UDP_SEGMENT;
1700 adh->data_len = sizeof (uint16_t);
1701 vec_add2 (at, ad, sizeof (uint16_t));
1702 *(uint16_t *) ad = *(uint16_t *) CMSG_DATA (cmsg);
1703 break;
1704 default:
1705 LDBG (1, "SOL_UDP cmsg_type %u not supported", cmsg->cmsg_type);
1706 break;
1707 }
1708 break;
1709 case SOL_IP:
1710 switch (cmsg->cmsg_type)
1711 {
1712 case IP_PKTINFO:
1713 vec_add2 (at, adh, sizeof (*adh));
1714 adh->data_type = VCL_IP_PKTINFO;
1715 adh->data_len = sizeof (struct in_addr);
1716 vec_add2 (at, ad, sizeof (struct in_addr));
1717 pi = (void *) CMSG_DATA (cmsg);
1718 clib_memcpy_fast (ad, &pi->ipi_spec_dst,
1719 sizeof (struct in_addr));
1720 break;
1721 default:
1722 LDBG (1, "SOL_IP cmsg_type %u not supported", cmsg->cmsg_type);
1723 break;
1724 }
1725 break;
1726 default:
1727 LDBG (1, "cmsg_level %u not supported", cmsg->cmsg_level);
1728 break;
1729 }
1730 cmsg = CMSG_NXTHDR ((struct msghdr *) msg, cmsg);
1731 }
1732 *app_tlvs = (vppcom_endpt_tlv_t *) at;
1733 return 0;
1734}
1735
1736static int
1737ldp_make_cmsg (vls_handle_t vlsh, struct msghdr *msg)
1738{
1739 u32 optval, optlen = sizeof (optval);
1740 struct cmsghdr *cmsg;
1741
1742 cmsg = CMSG_FIRSTHDR (msg);
1743
1744 if (!vls_attr (vlsh, VPPCOM_ATTR_GET_IP_PKTINFO, (void *) &optval, &optlen))
1745 return 0;
1746
1747 if (optval)
1748 {
1749 vppcom_endpt_t ep;
1750 u8 addr_buf[sizeof (struct in_addr)];
1751 u32 size = sizeof (ep);
1752
1753 ep.ip = addr_buf;
1754
1755 if (!vls_attr (vlsh, VPPCOM_ATTR_GET_LCL_ADDR, &ep, &size))
1756 {
1757 struct in_pktinfo pi = {};
1758
1759 clib_memcpy (&pi.ipi_addr, ep.ip, sizeof (struct in_addr));
1760 cmsg->cmsg_level = SOL_IP;
1761 cmsg->cmsg_type = IP_PKTINFO;
1762 cmsg->cmsg_len = CMSG_LEN (sizeof (pi));
1763 clib_memcpy (CMSG_DATA (cmsg), &pi, sizeof (pi));
1764 }
1765 }
1766
1767 return 0;
1768}
1769
Dave Wallace048b1d62018-01-03 22:24:41 -05001770ssize_t
Florin Corasce17f462020-05-22 20:36:29 +00001771sendmsg (int fd, const struct msghdr * msg, int flags)
Dave Wallace048b1d62018-01-03 22:24:41 -05001772{
Florin Coras7baeb712019-01-04 17:05:43 -08001773 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05001774 ssize_t size;
Dave Wallace048b1d62018-01-03 22:24:41 -05001775
Florin Coras5f33d0d2021-06-02 21:22:21 -07001776 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001777
Florin Coras7baeb712019-01-04 17:05:43 -08001778 vlsh = ldp_fd_to_vlsh (fd);
1779 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05001780 {
Florin Coraseff5f7a2023-02-07 17:36:17 -08001781 vppcom_endpt_tlv_t *app_tlvs = 0;
Florin Corasce17f462020-05-22 20:36:29 +00001782 struct iovec *iov = msg->msg_iov;
1783 ssize_t total = 0;
Florin Corascba1c222021-11-29 08:12:27 -08001784 int i, rv = 0;
Dou Chao243a0432022-11-29 19:41:34 +08001785
Florin Coraseff5f7a2023-02-07 17:36:17 -08001786 ldp_parse_cmsg (vlsh, msg, &app_tlvs);
Florin Corasce17f462020-05-22 20:36:29 +00001787
1788 for (i = 0; i < msg->msg_iovlen; ++i)
1789 {
Florin Coraseff5f7a2023-02-07 17:36:17 -08001790 rv = ldp_vls_sendo (vlsh, iov[i].iov_base, iov[i].iov_len, app_tlvs,
1791 flags, msg->msg_name, msg->msg_namelen);
Florin Corasce17f462020-05-22 20:36:29 +00001792 if (rv < 0)
1793 break;
1794 else
1795 {
1796 total += rv;
1797 if (rv < iov[i].iov_len)
1798 break;
1799 }
1800 }
1801
Florin Coraseff5f7a2023-02-07 17:36:17 -08001802 vec_free (app_tlvs);
1803
Florin Corasce17f462020-05-22 20:36:29 +00001804 if (rv < 0 && total == 0)
1805 {
1806 errno = -rv;
1807 size = -1;
1808 }
1809 else
1810 size = total;
Dave Wallace048b1d62018-01-03 22:24:41 -05001811 }
1812 else
1813 {
Florin Corasce17f462020-05-22 20:36:29 +00001814 size = libc_sendmsg (fd, msg, flags);
Dave Wallace048b1d62018-01-03 22:24:41 -05001815 }
1816
Dave Wallace048b1d62018-01-03 22:24:41 -05001817 return size;
1818}
1819
Florin Coras36847942023-02-02 12:56:16 -08001820#ifdef _GNU_SOURCE
Dave Wallace048b1d62018-01-03 22:24:41 -05001821int
1822sendmmsg (int fd, struct mmsghdr *vmessages, unsigned int vlen, int flags)
1823{
1824 ssize_t size;
1825 const char *func_str;
Florin Coras7baeb712019-01-04 17:05:43 -08001826 u32 sh = ldp_fd_to_vlsh (fd);
Dave Wallace048b1d62018-01-03 22:24:41 -05001827
Florin Coras5f33d0d2021-06-02 21:22:21 -07001828 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001829
wanghanlin97c6e0d2021-07-06 15:01:48 +08001830 if (sh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05001831 {
1832 clib_warning ("LDP<%d>: LDP-TBD", getpid ());
1833 errno = ENOSYS;
1834 size = -1;
1835 }
1836 else
1837 {
1838 func_str = "libc_sendmmsg";
1839
Dave Wallace2a865272018-02-07 21:00:42 -05001840 if (LDP_DEBUG > 2)
Dave Wallace048b1d62018-01-03 22:24:41 -05001841 clib_warning ("LDP<%d>: fd %d (0x%x): calling %s(): "
1842 "vmessages %p, vlen %u, flags 0x%x",
1843 getpid (), fd, fd, func_str, vmessages, vlen, flags);
1844
1845 size = libc_sendmmsg (fd, vmessages, vlen, flags);
1846 }
1847
Dave Wallace2a865272018-02-07 21:00:42 -05001848 if (LDP_DEBUG > 2)
Dave Wallace048b1d62018-01-03 22:24:41 -05001849 {
1850 if (size < 0)
1851 {
1852 int errno_val = errno;
1853 perror (func_str);
1854 clib_warning ("LDP<%d>: ERROR: fd %d (0x%x): %s() failed! "
1855 "rv %d, errno = %d", getpid (), fd, fd,
1856 func_str, size, errno_val);
1857 errno = errno_val;
1858 }
1859 else
1860 clib_warning ("LDP<%d>: fd %d (0x%x): returning %d (0x%x)",
1861 getpid (), fd, fd, size, size);
1862 }
1863 return size;
1864}
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07001865#endif
1866
Dave Wallace048b1d62018-01-03 22:24:41 -05001867ssize_t
Florin Corasce17f462020-05-22 20:36:29 +00001868recvmsg (int fd, struct msghdr * msg, int flags)
Dave Wallace048b1d62018-01-03 22:24:41 -05001869{
Florin Coras7baeb712019-01-04 17:05:43 -08001870 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05001871 ssize_t size;
Dave Wallace048b1d62018-01-03 22:24:41 -05001872
Florin Coras5f33d0d2021-06-02 21:22:21 -07001873 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001874
Florin Coras7baeb712019-01-04 17:05:43 -08001875 vlsh = ldp_fd_to_vlsh (fd);
1876 if (vlsh != VLS_INVALID_HANDLE)
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07001877 {
Florin Corasce17f462020-05-22 20:36:29 +00001878 struct iovec *iov = msg->msg_iov;
1879 ssize_t max_deq, total = 0;
1880 int i, rv;
1881
1882 max_deq = vls_attr (vlsh, VPPCOM_ATTR_GET_NREAD, 0, 0);
1883 if (!max_deq)
1884 return 0;
1885
1886 for (i = 0; i < msg->msg_iovlen; i++)
1887 {
1888 rv = ldp_vls_recvfrom (vlsh, iov[i].iov_base, iov[i].iov_len, flags,
1889 (i == 0 ? msg->msg_name : NULL),
1890 (i == 0 ? &msg->msg_namelen : NULL));
1891 if (rv <= 0)
1892 break;
1893 else
1894 {
1895 total += rv;
1896 if (rv < iov[i].iov_len)
1897 break;
1898 }
1899 if (total >= max_deq)
1900 break;
1901 }
1902
1903 if (rv < 0 && total == 0)
1904 {
1905 errno = -rv;
1906 size = -1;
1907 }
1908 else
Florin Coraseff5f7a2023-02-07 17:36:17 -08001909 {
1910 if (msg->msg_controllen)
1911 ldp_make_cmsg (vlsh, msg);
1912 size = total;
1913 }
Dave Wallace048b1d62018-01-03 22:24:41 -05001914 }
1915 else
1916 {
Florin Corasce17f462020-05-22 20:36:29 +00001917 size = libc_recvmsg (fd, msg, flags);
Dave Wallace048b1d62018-01-03 22:24:41 -05001918 }
1919
Dave Wallace048b1d62018-01-03 22:24:41 -05001920 return size;
1921}
1922
Florin Coras36847942023-02-02 12:56:16 -08001923#ifdef _GNU_SOURCE
Dave Wallace048b1d62018-01-03 22:24:41 -05001924int
1925recvmmsg (int fd, struct mmsghdr *vmessages,
1926 unsigned int vlen, int flags, struct timespec *tmo)
1927{
Florin Corasf1a232f2023-02-02 22:56:03 -08001928 ldp_worker_ctx_t *ldpw = ldp_worker_get_current ();
1929 u32 sh;
Dave Wallace048b1d62018-01-03 22:24:41 -05001930
Florin Coras5f33d0d2021-06-02 21:22:21 -07001931 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001932
Florin Corasf1a232f2023-02-02 22:56:03 -08001933 sh = ldp_fd_to_vlsh (fd);
1934
wanghanlin97c6e0d2021-07-06 15:01:48 +08001935 if (sh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05001936 {
Florin Corasf1a232f2023-02-02 22:56:03 -08001937 struct mmsghdr *mh;
1938 ssize_t rv = 0;
1939 u32 nvecs = 0;
1940 f64 time_out;
1941
1942 if (PREDICT_FALSE (ldpw->clib_time.init_cpu_time == 0))
1943 clib_time_init (&ldpw->clib_time);
1944 if (tmo)
1945 {
1946 time_out = (f64) tmo->tv_sec + (f64) tmo->tv_nsec / (f64) 1e9;
1947 time_out += clib_time_now (&ldpw->clib_time);
1948 }
1949 else
1950 {
1951 time_out = (f64) ~0;
1952 }
1953
1954 while (nvecs < vlen)
1955 {
1956 mh = &vmessages[nvecs];
1957 rv = recvmsg (fd, &mh->msg_hdr, flags);
1958 if (rv > 0)
1959 {
1960 mh->msg_len = rv;
1961 nvecs += 1;
1962 continue;
1963 }
1964
1965 if (!time_out || clib_time_now (&ldpw->clib_time) >= time_out)
1966 break;
1967
1968 usleep (1);
1969 }
1970
1971 return nvecs > 0 ? nvecs : rv;
Dave Wallace048b1d62018-01-03 22:24:41 -05001972 }
1973 else
1974 {
Florin Corasf1a232f2023-02-02 22:56:03 -08001975 return libc_recvmmsg (fd, vmessages, vlen, flags, tmo);
Dave Wallace048b1d62018-01-03 22:24:41 -05001976 }
Dave Wallace048b1d62018-01-03 22:24:41 -05001977}
1978#endif
1979
1980int
1981getsockopt (int fd, int level, int optname,
1982 void *__restrict optval, socklen_t * __restrict optlen)
1983{
Florin Coras7baeb712019-01-04 17:05:43 -08001984 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05001985 int rv;
Dave Wallace048b1d62018-01-03 22:24:41 -05001986
Florin Coras5f33d0d2021-06-02 21:22:21 -07001987 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05001988
Florin Coras7baeb712019-01-04 17:05:43 -08001989 vlsh = ldp_fd_to_vlsh (fd);
1990 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05001991 {
1992 rv = -EOPNOTSUPP;
1993
1994 switch (level)
1995 {
1996 case SOL_TCP:
1997 switch (optname)
1998 {
1999 case TCP_NODELAY:
Florin Coras7baeb712019-01-04 17:05:43 -08002000 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_TCP_NODELAY,
2001 optval, optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002002 break;
2003 case TCP_MAXSEG:
Florin Coras7baeb712019-01-04 17:05:43 -08002004 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_TCP_USER_MSS,
2005 optval, optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002006 break;
2007 case TCP_KEEPIDLE:
Florin Coras7baeb712019-01-04 17:05:43 -08002008 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_TCP_KEEPIDLE,
2009 optval, optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002010 break;
2011 case TCP_KEEPINTVL:
Florin Coras7baeb712019-01-04 17:05:43 -08002012 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_TCP_KEEPINTVL,
2013 optval, optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002014 break;
2015 case TCP_INFO:
2016 if (optval && optlen && (*optlen == sizeof (struct tcp_info)))
2017 {
Florin Coras7baeb712019-01-04 17:05:43 -08002018 LDBG (1, "fd %d: vlsh %u SOL_TCP, TCP_INFO, optval %p, "
2019 "optlen %d: #LDP-NOP#", fd, vlsh, optval, *optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002020 memset (optval, 0, *optlen);
2021 rv = VPPCOM_OK;
2022 }
2023 else
2024 rv = -EFAULT;
2025 break;
Florin Coras0ed24e92019-01-21 09:03:10 -08002026 case TCP_CONGESTION:
Florin Coras0ed24e92019-01-21 09:03:10 -08002027 *optlen = strlen ("cubic");
Dave Barach02500902020-04-04 18:34:41 -04002028 strncpy (optval, "cubic", *optlen + 1);
Florin Coras0ed24e92019-01-21 09:03:10 -08002029 rv = 0;
2030 break;
Dave Wallace048b1d62018-01-03 22:24:41 -05002031 default:
Florin Coras7baeb712019-01-04 17:05:43 -08002032 LDBG (0, "ERROR: fd %d: getsockopt SOL_TCP: sid %u, "
2033 "optname %d unsupported!", fd, vlsh, optname);
Dave Wallace048b1d62018-01-03 22:24:41 -05002034 break;
2035 }
2036 break;
2037 case SOL_IPV6:
2038 switch (optname)
2039 {
2040 case IPV6_V6ONLY:
Florin Coras7baeb712019-01-04 17:05:43 -08002041 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_V6ONLY, optval, optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002042 break;
2043 default:
Florin Coras7baeb712019-01-04 17:05:43 -08002044 LDBG (0, "ERROR: fd %d: getsockopt SOL_IPV6: vlsh %u "
2045 "optname %d unsupported!", fd, vlsh, optname);
Dave Wallace048b1d62018-01-03 22:24:41 -05002046 break;
2047 }
2048 break;
2049 case SOL_SOCKET:
2050 switch (optname)
2051 {
2052 case SO_ACCEPTCONN:
Florin Coras7baeb712019-01-04 17:05:43 -08002053 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_LISTEN, optval, optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002054 break;
2055 case SO_KEEPALIVE:
Florin Coras7baeb712019-01-04 17:05:43 -08002056 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_KEEPALIVE, optval, optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002057 break;
2058 case SO_PROTOCOL:
Florin Coras7baeb712019-01-04 17:05:43 -08002059 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_PROTOCOL, optval, optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002060 *(int *) optval = *(int *) optval ? SOCK_DGRAM : SOCK_STREAM;
2061 break;
2062 case SO_SNDBUF:
Florin Coras7baeb712019-01-04 17:05:43 -08002063 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_TX_FIFO_LEN,
2064 optval, optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002065 break;
2066 case SO_RCVBUF:
Florin Coras7baeb712019-01-04 17:05:43 -08002067 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_RX_FIFO_LEN,
2068 optval, optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002069 break;
2070 case SO_REUSEADDR:
Florin Coras7baeb712019-01-04 17:05:43 -08002071 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_REUSEADDR, optval, optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002072 break;
wanghanlin0674f852021-02-22 10:38:36 +08002073 case SO_REUSEPORT:
2074 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_REUSEPORT, optval, optlen);
2075 break;
Dave Wallace048b1d62018-01-03 22:24:41 -05002076 case SO_BROADCAST:
Florin Coras7baeb712019-01-04 17:05:43 -08002077 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_BROADCAST, optval, optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002078 break;
wanghanlin0674f852021-02-22 10:38:36 +08002079 case SO_DOMAIN:
2080 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_DOMAIN, optval, optlen);
2081 break;
Dave Wallace048b1d62018-01-03 22:24:41 -05002082 case SO_ERROR:
Florin Coras7baeb712019-01-04 17:05:43 -08002083 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_ERROR, optval, optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002084 break;
Florin Coras8eb8d502021-06-16 14:46:57 -07002085 case SO_BINDTODEVICE:
2086 rv = 0;
2087 break;
Dave Wallace048b1d62018-01-03 22:24:41 -05002088 default:
Florin Coras7baeb712019-01-04 17:05:43 -08002089 LDBG (0, "ERROR: fd %d: getsockopt SOL_SOCKET: vlsh %u "
2090 "optname %d unsupported!", fd, vlsh, optname);
Dave Wallace048b1d62018-01-03 22:24:41 -05002091 break;
2092 }
2093 break;
2094 default:
2095 break;
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002096 }
2097
Dave Wallace048b1d62018-01-03 22:24:41 -05002098 if (rv != VPPCOM_OK)
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002099 {
Dave Wallace048b1d62018-01-03 22:24:41 -05002100 errno = -rv;
2101 rv = -1;
2102 }
2103 }
2104 else
2105 {
Dave Wallace048b1d62018-01-03 22:24:41 -05002106 rv = libc_getsockopt (fd, level, optname, optval, optlen);
2107 }
2108
Dave Wallace048b1d62018-01-03 22:24:41 -05002109 return rv;
2110}
2111
2112int
2113setsockopt (int fd, int level, int optname,
2114 const void *optval, socklen_t optlen)
2115{
Florin Coras7baeb712019-01-04 17:05:43 -08002116 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05002117 int rv;
Dave Wallace048b1d62018-01-03 22:24:41 -05002118
Florin Coras5f33d0d2021-06-02 21:22:21 -07002119 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05002120
Florin Coras7baeb712019-01-04 17:05:43 -08002121 vlsh = ldp_fd_to_vlsh (fd);
2122 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05002123 {
2124 rv = -EOPNOTSUPP;
2125
2126 switch (level)
2127 {
2128 case SOL_TCP:
2129 switch (optname)
2130 {
2131 case TCP_NODELAY:
Florin Coras7baeb712019-01-04 17:05:43 -08002132 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_TCP_NODELAY,
2133 (void *) optval, &optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002134 break;
2135 case TCP_MAXSEG:
Florin Coras7baeb712019-01-04 17:05:43 -08002136 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_TCP_USER_MSS,
2137 (void *) optval, &optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002138 break;
2139 case TCP_KEEPIDLE:
Florin Coras7baeb712019-01-04 17:05:43 -08002140 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_TCP_KEEPIDLE,
2141 (void *) optval, &optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002142 break;
2143 case TCP_KEEPINTVL:
Florin Coras7baeb712019-01-04 17:05:43 -08002144 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_TCP_KEEPINTVL,
2145 (void *) optval, &optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002146 break;
Florin Coras0ed24e92019-01-21 09:03:10 -08002147 case TCP_CONGESTION:
Florin Coras8509aa22019-04-04 12:55:30 -07002148 case TCP_CORK:
Florin Coras0ed24e92019-01-21 09:03:10 -08002149 /* Ignore */
2150 rv = 0;
2151 break;
Dave Wallace048b1d62018-01-03 22:24:41 -05002152 default:
Florin Coras7baeb712019-01-04 17:05:43 -08002153 LDBG (0, "ERROR: fd %d: setsockopt() SOL_TCP: vlsh %u"
2154 "optname %d unsupported!", fd, vlsh, optname);
Dave Wallace048b1d62018-01-03 22:24:41 -05002155 break;
2156 }
2157 break;
2158 case SOL_IPV6:
2159 switch (optname)
2160 {
2161 case IPV6_V6ONLY:
Florin Coras7baeb712019-01-04 17:05:43 -08002162 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_V6ONLY,
2163 (void *) optval, &optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002164 break;
2165 default:
Florin Coras7baeb712019-01-04 17:05:43 -08002166 LDBG (0, "ERROR: fd %d: setsockopt SOL_IPV6: vlsh %u"
2167 "optname %d unsupported!", fd, vlsh, optname);
Dave Wallace048b1d62018-01-03 22:24:41 -05002168 break;
2169 }
2170 break;
2171 case SOL_SOCKET:
2172 switch (optname)
2173 {
2174 case SO_KEEPALIVE:
Florin Coras7baeb712019-01-04 17:05:43 -08002175 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_KEEPALIVE,
2176 (void *) optval, &optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002177 break;
2178 case SO_REUSEADDR:
Florin Coras7baeb712019-01-04 17:05:43 -08002179 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_REUSEADDR,
2180 (void *) optval, &optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002181 break;
wanghanlin0674f852021-02-22 10:38:36 +08002182 case SO_REUSEPORT:
2183 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_REUSEPORT, (void *) optval,
2184 &optlen);
2185 break;
Dave Wallace048b1d62018-01-03 22:24:41 -05002186 case SO_BROADCAST:
Florin Coras7baeb712019-01-04 17:05:43 -08002187 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_BROADCAST,
2188 (void *) optval, &optlen);
Dave Wallace048b1d62018-01-03 22:24:41 -05002189 break;
Florin Coras2f647902021-06-02 08:23:50 -07002190 case SO_LINGER:
2191 rv = 0;
2192 break;
Dave Wallace048b1d62018-01-03 22:24:41 -05002193 default:
Florin Coras7baeb712019-01-04 17:05:43 -08002194 LDBG (0, "ERROR: fd %d: setsockopt SOL_SOCKET: vlsh %u "
2195 "optname %d unsupported!", fd, vlsh, optname);
Dave Wallace048b1d62018-01-03 22:24:41 -05002196 break;
2197 }
2198 break;
Florin Coraseff5f7a2023-02-07 17:36:17 -08002199 case SOL_IP:
2200 switch (optname)
2201 {
2202 case IP_PKTINFO:
2203 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_IP_PKTINFO, (void *) optval,
2204 &optlen);
2205 break;
2206 default:
2207 LDBG (0,
2208 "ERROR: fd %d: setsockopt SOL_IP: vlsh %u optname %d"
2209 "unsupported!",
2210 fd, vlsh, optname);
2211 break;
2212 }
2213 break;
Dave Wallace048b1d62018-01-03 22:24:41 -05002214 default:
2215 break;
2216 }
2217
2218 if (rv != VPPCOM_OK)
2219 {
2220 errno = -rv;
2221 rv = -1;
2222 }
2223 }
2224 else
2225 {
Dave Wallace048b1d62018-01-03 22:24:41 -05002226 rv = libc_setsockopt (fd, level, optname, optval, optlen);
2227 }
2228
Dave Wallace048b1d62018-01-03 22:24:41 -05002229 return rv;
2230}
2231
2232int
2233listen (int fd, int n)
2234{
Florin Coras7baeb712019-01-04 17:05:43 -08002235 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05002236 int rv;
Dave Wallace048b1d62018-01-03 22:24:41 -05002237
Florin Coras5f33d0d2021-06-02 21:22:21 -07002238 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05002239
Florin Coras7baeb712019-01-04 17:05:43 -08002240 vlsh = ldp_fd_to_vlsh (fd);
2241 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05002242 {
Florin Coras7baeb712019-01-04 17:05:43 -08002243 LDBG (0, "fd %d: calling vls_listen: vlsh %u, n %d", fd, vlsh, n);
Dave Wallace048b1d62018-01-03 22:24:41 -05002244
Florin Coras7baeb712019-01-04 17:05:43 -08002245 rv = vls_listen (vlsh, n);
Dave Wallace048b1d62018-01-03 22:24:41 -05002246 if (rv != VPPCOM_OK)
2247 {
2248 errno = -rv;
2249 rv = -1;
2250 }
2251 }
2252 else
2253 {
Florin Coras7baeb712019-01-04 17:05:43 -08002254 LDBG (0, "fd %d: calling libc_listen(): n %d", fd, n);
Dave Wallace048b1d62018-01-03 22:24:41 -05002255 rv = libc_listen (fd, n);
2256 }
2257
Florin Coras7baeb712019-01-04 17:05:43 -08002258 LDBG (1, "fd %d: returning %d", fd, rv);
Dave Wallace048b1d62018-01-03 22:24:41 -05002259 return rv;
2260}
2261
2262static inline int
Florin Coras36847942023-02-02 12:56:16 -08002263ldp_accept4 (int listen_fd, __SOCKADDR_ARG _addr,
2264 socklen_t *__restrict addr_len, int flags)
Dave Wallace048b1d62018-01-03 22:24:41 -05002265{
Florin Coras36847942023-02-02 12:56:16 -08002266 struct sockaddr *addr = SOCKADDR_GET_SA (_addr);
Florin Coras7baeb712019-01-04 17:05:43 -08002267 vls_handle_t listen_vlsh, accept_vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05002268 int rv;
Dave Wallace048b1d62018-01-03 22:24:41 -05002269
Florin Coras5f33d0d2021-06-02 21:22:21 -07002270 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05002271
Florin Coras7baeb712019-01-04 17:05:43 -08002272 listen_vlsh = ldp_fd_to_vlsh (listen_fd);
2273 if (listen_vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05002274 {
2275 vppcom_endpt_t ep;
2276 u8 src_addr[sizeof (struct sockaddr_in6)];
Dave Wallace8aaba562018-01-18 17:21:19 -05002277 memset (&ep, 0, sizeof (ep));
Dave Wallace048b1d62018-01-03 22:24:41 -05002278 ep.ip = src_addr;
2279
Florin Coras7baeb712019-01-04 17:05:43 -08002280 LDBG (0, "listen fd %d: calling vppcom_session_accept: listen sid %u,"
Florin Coraseb801d02020-09-16 17:44:58 -07002281 " ep %p, flags 0x%x", listen_fd, listen_vlsh, &ep, flags);
Dave Wallace048b1d62018-01-03 22:24:41 -05002282
Florin Coras7baeb712019-01-04 17:05:43 -08002283 accept_vlsh = vls_accept (listen_vlsh, &ep, flags);
2284 if (accept_vlsh < 0)
Dave Wallace048b1d62018-01-03 22:24:41 -05002285 {
Florin Coras7baeb712019-01-04 17:05:43 -08002286 errno = -accept_vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05002287 rv = -1;
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002288 }
2289 else
2290 {
Dave Wallace2a865272018-02-07 21:00:42 -05002291 rv = ldp_copy_ep_to_sockaddr (addr, addr_len, &ep);
Dave Wallace048b1d62018-01-03 22:24:41 -05002292 if (rv != VPPCOM_OK)
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002293 {
Florin Coras7baeb712019-01-04 17:05:43 -08002294 (void) vls_close (accept_vlsh);
Dave Wallace048b1d62018-01-03 22:24:41 -05002295 errno = -rv;
2296 rv = -1;
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002297 }
Dave Wallace048b1d62018-01-03 22:24:41 -05002298 else
2299 {
Florin Coras7baeb712019-01-04 17:05:43 -08002300 rv = ldp_vlsh_to_fd (accept_vlsh);
Dave Wallace048b1d62018-01-03 22:24:41 -05002301 }
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002302 }
2303 }
Dave Wallace048b1d62018-01-03 22:24:41 -05002304 else
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002305 {
Florin Coras7baeb712019-01-04 17:05:43 -08002306 LDBG (0, "listen fd %d: calling libc_accept4(): addr %p, addr_len %p,"
2307 " flags 0x%x", listen_fd, addr, addr_len, flags);
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002308
Dave Wallace048b1d62018-01-03 22:24:41 -05002309 rv = libc_accept4 (listen_fd, addr, addr_len, flags);
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002310 }
2311
Florin Coras7baeb712019-01-04 17:05:43 -08002312 LDBG (1, "listen fd %d: accept returning %d", listen_fd, rv);
Florin Coras05ecfcc2018-12-12 18:19:39 -08002313
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002314 return rv;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002315}
2316
/*
 * accept4() interposer: delegates to ldp_accept4 with the caller's flags.
 */
int
accept4 (int fd, __SOCKADDR_ARG addr, socklen_t * __restrict addr_len,
         int flags)
{
  int new_fd = ldp_accept4 (fd, addr, addr_len, flags);

  return new_fd;
}
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002323
/*
 * accept() interposer: delegates to ldp_accept4 with flags set to 0.
 */
int
accept (int fd, __SOCKADDR_ARG addr, socklen_t * __restrict addr_len)
{
  int new_fd = ldp_accept4 (fd, addr, addr_len, 0);

  return new_fd;
}
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002329
Dave Wallace048b1d62018-01-03 22:24:41 -05002330int
2331shutdown (int fd, int how)
2332{
Florin Coras7baeb712019-01-04 17:05:43 -08002333 vls_handle_t vlsh;
liuyacan55c952e2021-06-13 14:54:55 +08002334 int rv = 0;
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002335
Florin Coras5f33d0d2021-06-02 21:22:21 -07002336 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05002337
Florin Coras7baeb712019-01-04 17:05:43 -08002338 vlsh = ldp_fd_to_vlsh (fd);
2339 if (vlsh != VLS_INVALID_HANDLE)
Dave Wallace048b1d62018-01-03 22:24:41 -05002340 {
Florin Coras7baeb712019-01-04 17:05:43 -08002341 LDBG (0, "called shutdown: fd %u vlsh %u how %d", fd, vlsh, how);
liuyacan55c952e2021-06-13 14:54:55 +08002342 rv = vls_shutdown (vlsh, how);
Dave Wallace048b1d62018-01-03 22:24:41 -05002343 }
2344 else
2345 {
Florin Coras7baeb712019-01-04 17:05:43 -08002346 LDBG (0, "fd %d: calling libc_shutdown: how %d", fd, how);
Dave Wallace048b1d62018-01-03 22:24:41 -05002347 rv = libc_shutdown (fd, how);
2348 }
2349
Dave Wallace048b1d62018-01-03 22:24:41 -05002350 return rv;
2351}
2352
2353int
2354epoll_create1 (int flags)
2355{
Florin Corasdfe4cf42018-11-28 22:13:45 -08002356 ldp_worker_ctx_t *ldpw = ldp_worker_get_current ();
Florin Coras7baeb712019-01-04 17:05:43 -08002357 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05002358 int rv;
2359
Florin Coras5f33d0d2021-06-02 21:22:21 -07002360 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05002361
hanlina3a48962020-07-13 11:09:15 +08002362 if (ldp->vcl_needs_real_epoll || vls_use_real_epoll ())
Florin Coras99368312018-08-02 10:45:44 -07002363 {
Florin Coras2d9b4272019-03-11 10:14:37 -07002364 /* Make sure workers have been allocated */
2365 if (!ldp->workers)
2366 {
2367 ldp_alloc_workers ();
2368 ldpw = ldp_worker_get_current ();
2369 }
Florin Coras99368312018-08-02 10:45:44 -07002370 rv = libc_epoll_create1 (flags);
2371 ldp->vcl_needs_real_epoll = 0;
Florin Corasdfe4cf42018-11-28 22:13:45 -08002372 ldpw->vcl_mq_epfd = rv;
Florin Coras05ecfcc2018-12-12 18:19:39 -08002373 LDBG (0, "created vcl epfd %u", rv);
Florin Coras99368312018-08-02 10:45:44 -07002374 return rv;
2375 }
Dave Wallace048b1d62018-01-03 22:24:41 -05002376
Florin Coras7baeb712019-01-04 17:05:43 -08002377 vlsh = vls_epoll_create ();
2378 if (PREDICT_FALSE (vlsh == VLS_INVALID_HANDLE))
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002379 {
Florin Coras7baeb712019-01-04 17:05:43 -08002380 errno = -vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05002381 rv = -1;
shrinivasan ganapathy1d359632017-10-15 15:46:09 -07002382 }
Dave Wallace048b1d62018-01-03 22:24:41 -05002383 else
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002384 {
Florin Coras7baeb712019-01-04 17:05:43 -08002385 rv = ldp_vlsh_to_fd (vlsh);
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002386 }
Florin Coras7baeb712019-01-04 17:05:43 -08002387 LDBG (0, "epoll_create epfd %u vlsh %u", rv, vlsh);
Dave Wallace048b1d62018-01-03 22:24:41 -05002388 return rv;
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002389}
2390
/*
 * Interposed epoll_create(2).
 *
 * The size hint itself is unused, but as with the kernel implementation it
 * must be greater than zero; otherwise the call fails with EINVAL.  Valid
 * requests are forwarded to epoll_create1 (0).
 */
int
epoll_create (int size)
{
  if (size <= 0)
    {
      errno = EINVAL;
      return -1;
    }

  return epoll_create1 (0);
}
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002396
Dave Wallace048b1d62018-01-03 22:24:41 -05002397int
2398epoll_ctl (int epfd, int op, int fd, struct epoll_event *event)
2399{
Florin Coras7baeb712019-01-04 17:05:43 -08002400 vls_handle_t vep_vlsh, vlsh;
Florin Coras99368312018-08-02 10:45:44 -07002401 int rv;
Dave Wallace048b1d62018-01-03 22:24:41 -05002402
Florin Coras5f33d0d2021-06-02 21:22:21 -07002403 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05002404
Florin Coras7baeb712019-01-04 17:05:43 -08002405 vep_vlsh = ldp_fd_to_vlsh (epfd);
2406 if (PREDICT_FALSE (vep_vlsh == VLS_INVALID_HANDLE))
Dave Wallace048b1d62018-01-03 22:24:41 -05002407 {
Dave Wallace3ee1fe12018-02-23 01:09:11 -05002408 /* The LDP epoll_create1 always creates VCL epfd's.
2409 * The app should never have a kernel base epoll fd unless it
2410 * was acquired outside of the LD_PRELOAD process context.
2411 * In any case, if we get one, punt it to libc_epoll_ctl.
2412 */
Florin Coras7baeb712019-01-04 17:05:43 -08002413 LDBG (1, "epfd %d: calling libc_epoll_ctl: op %d, fd %d"
2414 " event %p", epfd, op, fd, event);
Dave Wallace048b1d62018-01-03 22:24:41 -05002415
2416 rv = libc_epoll_ctl (epfd, op, fd, event);
Florin Coras99368312018-08-02 10:45:44 -07002417 goto done;
2418 }
2419
Florin Coras7baeb712019-01-04 17:05:43 -08002420 vlsh = ldp_fd_to_vlsh (fd);
Florin Coras99368312018-08-02 10:45:44 -07002421
Florin Coras7baeb712019-01-04 17:05:43 -08002422 LDBG (0, "epfd %d ep_vlsh %d, fd %u vlsh %d, op %u", epfd, vep_vlsh, fd,
2423 vlsh, op);
Florin Coras99368312018-08-02 10:45:44 -07002424
Florin Coras7baeb712019-01-04 17:05:43 -08002425 if (vlsh != VLS_INVALID_HANDLE)
Florin Coras99368312018-08-02 10:45:44 -07002426 {
Florin Coras7baeb712019-01-04 17:05:43 -08002427 LDBG (1, "epfd %d: calling vls_epoll_ctl: ep_vlsh %d op %d, vlsh %u,"
Florin Coraseb801d02020-09-16 17:44:58 -07002428 " event %p", epfd, vep_vlsh, op, vlsh, event);
Florin Coras99368312018-08-02 10:45:44 -07002429
Florin Coras7baeb712019-01-04 17:05:43 -08002430 rv = vls_epoll_ctl (vep_vlsh, op, vlsh, event);
Florin Coras99368312018-08-02 10:45:44 -07002431 if (rv != VPPCOM_OK)
2432 {
2433 errno = -rv;
2434 rv = -1;
2435 }
2436 }
2437 else
2438 {
2439 int libc_epfd;
2440 u32 size = sizeof (epfd);
2441
Florin Coras7baeb712019-01-04 17:05:43 -08002442 libc_epfd = vls_attr (vep_vlsh, VPPCOM_ATTR_GET_LIBC_EPFD, 0, 0);
Florin Coras99368312018-08-02 10:45:44 -07002443 if (!libc_epfd)
2444 {
Florin Coras7baeb712019-01-04 17:05:43 -08002445 LDBG (1, "epfd %d, vep_vlsh %d calling libc_epoll_create1: "
2446 "EPOLL_CLOEXEC", epfd, vep_vlsh);
Florin Coras99368312018-08-02 10:45:44 -07002447
2448 libc_epfd = libc_epoll_create1 (EPOLL_CLOEXEC);
2449 if (libc_epfd < 0)
2450 {
2451 rv = libc_epfd;
2452 goto done;
2453 }
2454
Florin Coras7baeb712019-01-04 17:05:43 -08002455 rv = vls_attr (vep_vlsh, VPPCOM_ATTR_SET_LIBC_EPFD, &libc_epfd,
2456 &size);
Florin Coras99368312018-08-02 10:45:44 -07002457 if (rv < 0)
2458 {
2459 errno = -rv;
2460 rv = -1;
2461 goto done;
2462 }
2463 }
2464 else if (PREDICT_FALSE (libc_epfd < 0))
2465 {
2466 errno = -epfd;
2467 rv = -1;
2468 goto done;
2469 }
2470
Florin Coras7baeb712019-01-04 17:05:43 -08002471 LDBG (1, "epfd %d: calling libc_epoll_ctl: libc_epfd %d, op %d, fd %d,"
2472 " event %p", epfd, libc_epfd, op, fd, event);
Florin Coras99368312018-08-02 10:45:44 -07002473
2474 rv = libc_epoll_ctl (libc_epfd, op, fd, event);
Dave Wallace048b1d62018-01-03 22:24:41 -05002475 }
2476
2477done:
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002478 return rv;
2479}
Dave Wallace048b1d62018-01-03 22:24:41 -05002480
2481static inline int
Florin Coras99368312018-08-02 10:45:44 -07002482ldp_epoll_pwait (int epfd, struct epoll_event *events, int maxevents,
2483 int timeout, const sigset_t * sigmask)
Dave Wallace048b1d62018-01-03 22:24:41 -05002484{
Liangxing Wang7c7231f2023-02-16 09:31:01 +00002485 ldp_worker_ctx_t *ldpw;
Florin Coras72f77822019-01-22 19:05:52 -08002486 double time_to_wait = (double) 0, max_time;
Florin Coras99368312018-08-02 10:45:44 -07002487 int libc_epfd, rv = 0;
Florin Coras7baeb712019-01-04 17:05:43 -08002488 vls_handle_t ep_vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05002489
Florin Coras5f33d0d2021-06-02 21:22:21 -07002490 ldp_init_check ();
Dave Wallace048b1d62018-01-03 22:24:41 -05002491
2492 if (PREDICT_FALSE (!events || (timeout < -1)))
2493 {
2494 errno = EFAULT;
2495 return -1;
2496 }
2497
Liangxing Wang7c7231f2023-02-16 09:31:01 +00002498 if (PREDICT_FALSE (vppcom_worker_index () == ~0))
2499 vls_register_vcl_worker ();
2500
2501 ldpw = ldp_worker_get_current ();
Florin Corasdfe4cf42018-11-28 22:13:45 -08002502 if (epfd == ldpw->vcl_mq_epfd)
Florin Coras99368312018-08-02 10:45:44 -07002503 return libc_epoll_pwait (epfd, events, maxevents, timeout, sigmask);
2504
Florin Coras7baeb712019-01-04 17:05:43 -08002505 ep_vlsh = ldp_fd_to_vlsh (epfd);
2506 if (PREDICT_FALSE (ep_vlsh == VLS_INVALID_HANDLE))
Dave Wallace048b1d62018-01-03 22:24:41 -05002507 {
Florin Coras7baeb712019-01-04 17:05:43 -08002508 LDBG (0, "epfd %d: bad ep_vlsh %d!", epfd, ep_vlsh);
Dave Wallace048b1d62018-01-03 22:24:41 -05002509 errno = EBADFD;
2510 return -1;
2511 }
2512
Florin Coras4dee8cd2019-01-29 21:28:16 -08002513 if (PREDICT_FALSE (ldpw->clib_time.init_cpu_time == 0))
2514 clib_time_init (&ldpw->clib_time);
Florin Corasb0f662f2018-12-27 14:51:46 -08002515 time_to_wait = ((timeout >= 0) ? (double) timeout / 1000 : 0);
Florin Coras72f77822019-01-22 19:05:52 -08002516 max_time = clib_time_now (&ldpw->clib_time) + time_to_wait;
Dave Wallace048b1d62018-01-03 22:24:41 -05002517
Florin Coras7baeb712019-01-04 17:05:43 -08002518 libc_epfd = vls_attr (ep_vlsh, VPPCOM_ATTR_GET_LIBC_EPFD, 0, 0);
Dave Wallace048b1d62018-01-03 22:24:41 -05002519 if (PREDICT_FALSE (libc_epfd < 0))
2520 {
2521 errno = -libc_epfd;
2522 rv = -1;
2523 goto done;
2524 }
2525
Florin Coras7baeb712019-01-04 17:05:43 -08002526 LDBG (2, "epfd %d: vep_idx %d, libc_epfd %d, events %p, maxevents %d, "
2527 "timeout %d, sigmask %p: time_to_wait %.02f", epfd, ep_vlsh,
Florin Coras72f77822019-01-22 19:05:52 -08002528 libc_epfd, events, maxevents, timeout, sigmask, time_to_wait);
Dave Wallace048b1d62018-01-03 22:24:41 -05002529 do
2530 {
Florin Corasdfe4cf42018-11-28 22:13:45 -08002531 if (!ldpw->epoll_wait_vcl)
Dave Wallace048b1d62018-01-03 22:24:41 -05002532 {
Florin Coras7baeb712019-01-04 17:05:43 -08002533 rv = vls_epoll_wait (ep_vlsh, events, maxevents, 0);
Dave Wallace048b1d62018-01-03 22:24:41 -05002534 if (rv > 0)
2535 {
Florin Corasdfe4cf42018-11-28 22:13:45 -08002536 ldpw->epoll_wait_vcl = 1;
Dave Wallace048b1d62018-01-03 22:24:41 -05002537 goto done;
2538 }
2539 else if (rv < 0)
2540 {
2541 errno = -rv;
2542 rv = -1;
2543 goto done;
2544 }
2545 }
2546 else
Florin Corasdfe4cf42018-11-28 22:13:45 -08002547 ldpw->epoll_wait_vcl = 0;
Dave Wallace048b1d62018-01-03 22:24:41 -05002548
2549 if (libc_epfd > 0)
2550 {
Florin Corasb0f662f2018-12-27 14:51:46 -08002551 rv = libc_epoll_pwait (libc_epfd, events, maxevents, 0, sigmask);
Dave Wallace048b1d62018-01-03 22:24:41 -05002552 if (rv != 0)
2553 goto done;
2554 }
Dave Wallace048b1d62018-01-03 22:24:41 -05002555 }
Florin Coras72f77822019-01-22 19:05:52 -08002556 while ((timeout == -1) || (clib_time_now (&ldpw->clib_time) < max_time));
Dave Wallace048b1d62018-01-03 22:24:41 -05002557
2558done:
Dave Wallace048b1d62018-01-03 22:24:41 -05002559 return rv;
2560}
2561
hanlin4266d4d2020-05-19 17:34:17 +08002562static inline int
2563ldp_epoll_pwait_eventfd (int epfd, struct epoll_event *events,
2564 int maxevents, int timeout, const sigset_t * sigmask)
2565{
hanlina3a48962020-07-13 11:09:15 +08002566 ldp_worker_ctx_t *ldpw;
hanlin4266d4d2020-05-19 17:34:17 +08002567 int libc_epfd, rv = 0, num_ev;
2568 vls_handle_t ep_vlsh;
2569
Florin Coras5f33d0d2021-06-02 21:22:21 -07002570 ldp_init_check ();
hanlin4266d4d2020-05-19 17:34:17 +08002571
2572 if (PREDICT_FALSE (!events || (timeout < -1)))
2573 {
2574 errno = EFAULT;
2575 return -1;
2576 }
2577
Florin Corasff40d8f2020-08-11 22:05:28 -07002578 /* Make sure the vcl worker is valid. Could be that epoll fd was created on
2579 * one thread but it is now used on another */
2580 if (PREDICT_FALSE (vppcom_worker_index () == ~0))
2581 vls_register_vcl_worker ();
hanlina3a48962020-07-13 11:09:15 +08002582
2583 ldpw = ldp_worker_get_current ();
hanlin4266d4d2020-05-19 17:34:17 +08002584 if (epfd == ldpw->vcl_mq_epfd)
2585 return libc_epoll_pwait (epfd, events, maxevents, timeout, sigmask);
2586
2587 ep_vlsh = ldp_fd_to_vlsh (epfd);
2588 if (PREDICT_FALSE (ep_vlsh == VLS_INVALID_HANDLE))
2589 {
2590 LDBG (0, "epfd %d: bad ep_vlsh %d!", epfd, ep_vlsh);
2591 errno = EBADFD;
2592 return -1;
2593 }
2594
2595 libc_epfd = vls_attr (ep_vlsh, VPPCOM_ATTR_GET_LIBC_EPFD, 0, 0);
2596 if (PREDICT_FALSE (!libc_epfd))
2597 {
2598 u32 size = sizeof (epfd);
2599
2600 LDBG (1, "epfd %d, vep_vlsh %d calling libc_epoll_create1: "
2601 "EPOLL_CLOEXEC", epfd, ep_vlsh);
2602 libc_epfd = libc_epoll_create1 (EPOLL_CLOEXEC);
2603 if (libc_epfd < 0)
2604 {
2605 rv = libc_epfd;
2606 goto done;
2607 }
2608
2609 rv = vls_attr (ep_vlsh, VPPCOM_ATTR_SET_LIBC_EPFD, &libc_epfd, &size);
2610 if (rv < 0)
2611 {
2612 errno = -rv;
2613 rv = -1;
2614 goto done;
2615 }
2616 }
2617 if (PREDICT_FALSE (libc_epfd <= 0))
2618 {
2619 errno = -libc_epfd;
2620 rv = -1;
2621 goto done;
2622 }
2623
2624 if (PREDICT_FALSE (!ldpw->mq_epfd_added))
2625 {
2626 struct epoll_event e = { 0 };
2627 e.events = EPOLLIN;
2628 e.data.fd = ldpw->vcl_mq_epfd;
2629 if (libc_epoll_ctl (libc_epfd, EPOLL_CTL_ADD, ldpw->vcl_mq_epfd, &e) <
2630 0)
2631 {
2632 LDBG (0, "epfd %d, add libc mq epoll fd %d to libc epoll fd %d",
2633 epfd, ldpw->vcl_mq_epfd, libc_epfd);
2634 rv = -1;
2635 goto done;
2636 }
2637 ldpw->mq_epfd_added = 1;
2638 }
2639
wanghanlin8919fec2021-03-18 20:00:41 +08002640 /* Request to only drain unhandled to prevent libc_epoll_wait starved */
2641 rv = vls_epoll_wait (ep_vlsh, events, maxevents, -2);
hanlin4266d4d2020-05-19 17:34:17 +08002642 if (rv > 0)
2643 goto done;
hanlina3a48962020-07-13 11:09:15 +08002644 else if (PREDICT_FALSE (rv < 0))
hanlin4266d4d2020-05-19 17:34:17 +08002645 {
2646 errno = -rv;
2647 rv = -1;
2648 goto done;
2649 }
2650
2651 rv = libc_epoll_pwait (libc_epfd, events, maxevents, timeout, sigmask);
2652 if (rv <= 0)
2653 goto done;
2654 for (int i = 0; i < rv; i++)
2655 {
2656 if (events[i].data.fd == ldpw->vcl_mq_epfd)
2657 {
2658 /* We should remove mq epoll fd from events. */
2659 rv--;
2660 if (i != rv)
2661 {
2662 events[i].events = events[rv].events;
2663 events[i].data.u64 = events[rv].data.u64;
2664 }
2665 num_ev = vls_epoll_wait (ep_vlsh, &events[rv], maxevents - rv, 0);
2666 if (PREDICT_TRUE (num_ev > 0))
2667 rv += num_ev;
2668 break;
2669 }
2670 }
2671
2672done:
2673 return rv;
2674}
2675
/*
 * Interposed epoll_pwait(2): dispatches to the eventfd based implementation
 * when vls_use_eventfd() is true, otherwise to the polling implementation.
 */
int
epoll_pwait (int epfd, struct epoll_event *events,
             int maxevents, int timeout, const sigset_t * sigmask)
{
  if (!vls_use_eventfd ())
    return ldp_epoll_pwait (epfd, events, maxevents, timeout, sigmask);

  return ldp_epoll_pwait_eventfd (epfd, events, maxevents, timeout, sigmask);
}
2686
/*
 * Interposed epoll_wait(2): same dispatch as epoll_pwait() but with no
 * signal mask.
 */
int
epoll_wait (int epfd, struct epoll_event *events, int maxevents, int timeout)
{
  if (!vls_use_eventfd ())
    return ldp_epoll_pwait (epfd, events, maxevents, timeout, NULL);

  return ldp_epoll_pwait_eventfd (epfd, events, maxevents, timeout, NULL);
}
2695
2696int
2697poll (struct pollfd *fds, nfds_t nfds, int timeout)
2698{
Florin Corasdfe4cf42018-11-28 22:13:45 -08002699 ldp_worker_ctx_t *ldpw = ldp_worker_get_current ();
Florin Coras6917b942018-11-13 22:44:54 -08002700 int rv, i, n_revents = 0;
Florin Coras7baeb712019-01-04 17:05:43 -08002701 vls_handle_t vlsh;
Dave Wallace048b1d62018-01-03 22:24:41 -05002702 vcl_poll_t *vp;
Florin Coras4dee8cd2019-01-29 21:28:16 -08002703 double max_time;
Dave Wallace048b1d62018-01-03 22:24:41 -05002704
Florin Coraseb801d02020-09-16 17:44:58 -07002705 LDBG (3, "fds %p, nfds %ld, timeout %d", fds, nfds, timeout);
Dave Wallace048b1d62018-01-03 22:24:41 -05002706
Florin Coras4dee8cd2019-01-29 21:28:16 -08002707 if (PREDICT_FALSE (ldpw->clib_time.init_cpu_time == 0))
2708 clib_time_init (&ldpw->clib_time);
2709
2710 max_time = (timeout >= 0) ? (f64) timeout / 1000 : 0;
2711 max_time += clib_time_now (&ldpw->clib_time);
Dave Wallace048b1d62018-01-03 22:24:41 -05002712
Dave Wallace048b1d62018-01-03 22:24:41 -05002713 for (i = 0; i < nfds; i++)
2714 {
Florin Coras6917b942018-11-13 22:44:54 -08002715 if (fds[i].fd < 0)
2716 continue;
Dave Wallace048b1d62018-01-03 22:24:41 -05002717
Florin Coras7baeb712019-01-04 17:05:43 -08002718 vlsh = ldp_fd_to_vlsh (fds[i].fd);
2719 if (vlsh != VLS_INVALID_HANDLE)
Florin Coras6917b942018-11-13 22:44:54 -08002720 {
2721 fds[i].fd = -fds[i].fd;
Florin Corasdfe4cf42018-11-28 22:13:45 -08002722 vec_add2 (ldpw->vcl_poll, vp, 1);
Florin Coras6917b942018-11-13 22:44:54 -08002723 vp->fds_ndx = i;
Florin Coras7baeb712019-01-04 17:05:43 -08002724 vp->sh = vlsh_to_sh (vlsh);
Florin Coras6917b942018-11-13 22:44:54 -08002725 vp->events = fds[i].events;
Dave Wallace048b1d62018-01-03 22:24:41 -05002726#ifdef __USE_XOPEN2K
Florin Coras6917b942018-11-13 22:44:54 -08002727 if (fds[i].events & POLLRDNORM)
2728 vp->events |= POLLIN;
2729 if (fds[i].events & POLLWRNORM)
2730 vp->events |= POLLOUT;
Dave Wallace048b1d62018-01-03 22:24:41 -05002731#endif
Florin Coras6917b942018-11-13 22:44:54 -08002732 vp->revents = fds[i].revents;
2733 }
2734 else
2735 {
Florin Corasdfe4cf42018-11-28 22:13:45 -08002736 vec_add1 (ldpw->libc_poll, fds[i]);
2737 vec_add1 (ldpw->libc_poll_idxs, i);
Dave Wallace048b1d62018-01-03 22:24:41 -05002738 }
2739 }
2740
Dave Wallace048b1d62018-01-03 22:24:41 -05002741 do
2742 {
Florin Corasdfe4cf42018-11-28 22:13:45 -08002743 if (vec_len (ldpw->vcl_poll))
Dave Wallace048b1d62018-01-03 22:24:41 -05002744 {
Florin Corasdfe4cf42018-11-28 22:13:45 -08002745 rv = vppcom_poll (ldpw->vcl_poll, vec_len (ldpw->vcl_poll), 0);
Dave Wallace048b1d62018-01-03 22:24:41 -05002746 if (rv < 0)
2747 {
2748 errno = -rv;
2749 rv = -1;
2750 goto done;
2751 }
2752 else
2753 n_revents += rv;
2754 }
2755
Florin Corasdfe4cf42018-11-28 22:13:45 -08002756 if (vec_len (ldpw->libc_poll))
Dave Wallace048b1d62018-01-03 22:24:41 -05002757 {
Florin Corasdfe4cf42018-11-28 22:13:45 -08002758 rv = libc_poll (ldpw->libc_poll, vec_len (ldpw->libc_poll), 0);
Dave Wallace048b1d62018-01-03 22:24:41 -05002759 if (rv < 0)
2760 goto done;
2761 else
2762 n_revents += rv;
2763 }
2764
2765 if (n_revents)
2766 {
2767 rv = n_revents;
2768 goto done;
2769 }
2770 }
Florin Coras4dee8cd2019-01-29 21:28:16 -08002771 while ((timeout < 0) || (clib_time_now (&ldpw->clib_time) < max_time));
Dave Wallace048b1d62018-01-03 22:24:41 -05002772 rv = 0;
2773
2774done:
Florin Corasdfe4cf42018-11-28 22:13:45 -08002775 vec_foreach (vp, ldpw->vcl_poll)
Dave Wallace048b1d62018-01-03 22:24:41 -05002776 {
2777 fds[vp->fds_ndx].fd = -fds[vp->fds_ndx].fd;
Florin Coras6917b942018-11-13 22:44:54 -08002778 fds[vp->fds_ndx].revents = vp->revents;
Dave Wallace048b1d62018-01-03 22:24:41 -05002779#ifdef __USE_XOPEN2K
2780 if ((fds[vp->fds_ndx].revents & POLLIN) &&
2781 (fds[vp->fds_ndx].events & POLLRDNORM))
2782 fds[vp->fds_ndx].revents |= POLLRDNORM;
2783 if ((fds[vp->fds_ndx].revents & POLLOUT) &&
2784 (fds[vp->fds_ndx].events & POLLWRNORM))
2785 fds[vp->fds_ndx].revents |= POLLWRNORM;
2786#endif
2787 }
Florin Corasdfe4cf42018-11-28 22:13:45 -08002788 vec_reset_length (ldpw->vcl_poll);
Dave Wallace048b1d62018-01-03 22:24:41 -05002789
Florin Corasdfe4cf42018-11-28 22:13:45 -08002790 for (i = 0; i < vec_len (ldpw->libc_poll); i++)
Florin Coras6917b942018-11-13 22:44:54 -08002791 {
Florin Corasdfe4cf42018-11-28 22:13:45 -08002792 fds[ldpw->libc_poll_idxs[i]].revents = ldpw->libc_poll[i].revents;
Florin Coras6917b942018-11-13 22:44:54 -08002793 }
Florin Corasdfe4cf42018-11-28 22:13:45 -08002794 vec_reset_length (ldpw->libc_poll_idxs);
2795 vec_reset_length (ldpw->libc_poll);
Florin Coras6917b942018-11-13 22:44:54 -08002796
Dave Wallace048b1d62018-01-03 22:24:41 -05002797 return rv;
2798}
2799
#ifdef _GNU_SOURCE
/*
 * Interposed ppoll(2).
 *
 * Not implemented yet: logs a warning and fails with ENOSYS regardless of
 * the arguments.
 */
int
ppoll (struct pollfd *fds, nfds_t nfds,
       const struct timespec *timeout, const sigset_t * sigmask)
{
  ldp_init_check ();

  clib_warning ("LDP<%d>: LDP-TBD", getpid ());

  /* Set errno only after logging, so it is the last thing written */
  errno = ENOSYS;
  return -1;
}
#endif
2814
Dave Wallace2a865272018-02-07 21:00:42 -05002815void CONSTRUCTOR_ATTRIBUTE ldp_constructor (void);
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002816
Dave Wallace2a865272018-02-07 21:00:42 -05002817void DESTRUCTOR_ATTRIBUTE ldp_destructor (void);
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002818
Dave Wallace048b1d62018-01-03 22:24:41 -05002819/*
2820 * This function is called when the library is loaded
2821 */
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002822void
Dave Wallace2a865272018-02-07 21:00:42 -05002823ldp_constructor (void)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002824{
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002825 swrap_constructor ();
Dave Wallace2a865272018-02-07 21:00:42 -05002826 if (ldp_init () != 0)
Florin Corasd89411e2019-03-19 19:44:51 -07002827 {
2828 fprintf (stderr, "\nLDP<%d>: ERROR: ldp_constructor: failed!\n",
2829 getpid ());
2830 _exit (1);
2831 }
Dave Wallace69d01192018-02-22 16:22:09 -05002832 else if (LDP_DEBUG > 0)
Dave Wallace2a865272018-02-07 21:00:42 -05002833 clib_warning ("LDP<%d>: LDP constructor: done!\n", getpid ());
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002834}
2835
2836/*
2837 * This function is called when the library is unloaded
2838 */
2839void
Dave Wallace2a865272018-02-07 21:00:42 -05002840ldp_destructor (void)
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002841{
Florin Coras0ef8ef22019-01-18 08:37:13 -08002842 /*
2843 swrap_destructor ();
2844 if (ldp->init)
2845 ldp->init = 0;
2846 */
Dave Wallace048b1d62018-01-03 22:24:41 -05002847
2848 /* Don't use clib_warning() here because that calls writev()
Dave Wallace2a865272018-02-07 21:00:42 -05002849 * which will call ldp_init().
Dave Wallace048b1d62018-01-03 22:24:41 -05002850 */
Dave Wallace69d01192018-02-22 16:22:09 -05002851 if (LDP_DEBUG > 0)
Florin Coras0ef8ef22019-01-18 08:37:13 -08002852 fprintf (stderr, "%s:%d: LDP<%d>: LDP destructor: done!\n",
2853 __func__, __LINE__, getpid ());
Keith Burns (alagalah)b327c2b2017-10-09 08:52:59 -07002854}
2855
2856
2857/*
2858 * fd.io coding-style-patch-verification: ON
2859 *
2860 * Local Variables:
2861 * eval: (c-set-style "gnu")
2862 * End:
2863 */