2 * Copyright (c) 2016-2019 Cisco and/or its affiliates.
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at:
7 * http://www.apache.org/licenses/LICENSE-2.0
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
22 #include <sys/resource.h>
23 #include <netinet/tcp.h>
25 #include <vcl/ldp_socket_wrapper.h>
29 #include <vcl/vcl_locked.h>
30 #include <vppinfra/time.h>
31 #include <vppinfra/bitmap.h>
32 #include <vppinfra/lock.h>
33 #include <vppinfra/pool.h>
34 #include <vppinfra/hash.h>
36 #define HAVE_CONSTRUCTOR_ATTRIBUTE
37 #ifdef HAVE_CONSTRUCTOR_ATTRIBUTE
38 #define CONSTRUCTOR_ATTRIBUTE \
39 __attribute__ ((constructor))
41 #define CONSTRUCTOR_ATTRIBUTE
42 #endif /* HAVE_CONSTRUCTOR_ATTRIBUTE */
44 #define HAVE_DESTRUCTOR_ATTRIBUTE
45 #ifdef HAVE_DESTRUCTOR_ATTRIBUTE
46 #define DESTRUCTOR_ATTRIBUTE \
47 __attribute__ ((destructor))
49 #define DESTRUCTOR_ATTRIBUTE
52 #define LDP_MAX_NWORKERS 32
54 typedef struct ldp_worker_ctx_
57 clib_time_t clib_time;
62 clib_bitmap_t *rd_bitmap;
63 clib_bitmap_t *wr_bitmap;
64 clib_bitmap_t *ex_bitmap;
65 clib_bitmap_t *si_rd_bitmap;
66 clib_bitmap_t *si_wr_bitmap;
67 clib_bitmap_t *si_ex_bitmap;
68 clib_bitmap_t *libc_rd_bitmap;
69 clib_bitmap_t *libc_wr_bitmap;
70 clib_bitmap_t *libc_ex_bitmap;
76 struct pollfd *libc_poll;
87 /* clib_bitmap_t, fd_mask and vcl_si_set are used interchangeably. Make sure
88 * they are the same size */
89 STATIC_ASSERT (sizeof (clib_bitmap_t) == sizeof (fd_mask),
90 "ldp bitmap size mismatch");
91 STATIC_ASSERT (sizeof (vcl_si_set) == sizeof (fd_mask),
92 "ldp bitmap size mismatch");
96 ldp_worker_ctx_t *workers;
98 char app_name[LDP_APP_NAME_MAX];
104 /** vcl needs next epoll_create to go to libc_epoll */
105 u8 vcl_needs_real_epoll;
108 #define LDP_DEBUG ldp->debug
110 #define LDBG(_lvl, _fmt, _args...) \
111 if (ldp->debug > _lvl) \
113 int errno_saved = errno; \
114 clib_warning ("ldp<%d>: " _fmt, getpid(), ##_args); \
115 errno = errno_saved; \
118 static ldp_main_t ldp_main = {
119 .vlsh_bit_val = (1 << LDP_SID_BIT_MIN),
120 .vlsh_bit_mask = (1 << LDP_SID_BIT_MIN) - 1,
121 .debug = LDP_DEBUG_INIT,
122 .transparent_tls = 0,
125 static ldp_main_t *ldp = &ldp_main;
127 static inline ldp_worker_ctx_t *
128 ldp_worker_get_current (void)
130 return (ldp->workers + vppcom_worker_index ());
134 * RETURN: 0 on success or -1 on error.
137 ldp_set_app_name (char *app_name)
139 snprintf (ldp->app_name, LDP_APP_NAME_MAX,
140 "ldp-%d-%s", getpid (), app_name);
146 if (ldp->app_name[0] == '\0')
147 ldp_set_app_name ("app");
149 return ldp->app_name;
153 ldp_vlsh_to_fd (vls_handle_t vlsh)
155 return (vlsh + ldp->vlsh_bit_val);
158 static inline vls_handle_t
159 ldp_fd_to_vlsh (int fd)
161 if (fd < ldp->vlsh_bit_val)
162 return VLS_INVALID_HANDLE;
164 return (fd - ldp->vlsh_bit_val);
168 ldp_alloc_workers (void)
172 pool_alloc (ldp->workers, LDP_MAX_NWORKERS);
178 ldp_worker_ctx_t *ldpw;
181 if (PREDICT_TRUE (ldp->init))
185 ldp->vcl_needs_real_epoll = 1;
186 rv = vls_app_create (ldp_get_app_name ());
189 ldp->vcl_needs_real_epoll = 0;
190 if (rv == VPPCOM_EEXIST)
192 LDBG (2, "\nERROR: ldp_init: vppcom_app_create()"
193 " failed! rv = %d (%s)\n", rv, vppcom_retval_str (rv));
197 ldp->vcl_needs_real_epoll = 0;
198 ldp_alloc_workers ();
199 ldpw = ldp_worker_get_current ();
201 char *env_var_str = getenv (LDP_ENV_DEBUG);
205 if (sscanf (env_var_str, "%u", &tmp) != 1)
206 clib_warning ("LDP<%d>: WARNING: Invalid LDP debug level specified in"
207 " the env var " LDP_ENV_DEBUG " (%s)!", getpid (),
212 LDBG (0, "configured LDP debug level (%u) from env var "
213 LDP_ENV_DEBUG "!", ldp->debug);
217 env_var_str = getenv (LDP_ENV_APP_NAME);
220 ldp_set_app_name (env_var_str);
221 LDBG (0, "configured LDP app name (%s) from the env var "
222 LDP_ENV_APP_NAME "!", ldp->app_name);
225 env_var_str = getenv (LDP_ENV_SID_BIT);
229 if (sscanf (env_var_str, "%u", &sb) != 1)
231 LDBG (0, "WARNING: Invalid LDP sid bit specified in the env var "
232 LDP_ENV_SID_BIT " (%s)! sid bit value %d (0x%x)", env_var_str,
233 ldp->vlsh_bit_val, ldp->vlsh_bit_val);
235 else if (sb < LDP_SID_BIT_MIN)
237 ldp->vlsh_bit_val = (1 << LDP_SID_BIT_MIN);
238 ldp->vlsh_bit_mask = ldp->vlsh_bit_val - 1;
240 LDBG (0, "WARNING: LDP sid bit (%u) specified in the env var "
241 LDP_ENV_SID_BIT " (%s) is too small. Using LDP_SID_BIT_MIN"
242 " (%d)! sid bit value %d (0x%x)", sb, env_var_str,
243 LDP_SID_BIT_MIN, ldp->vlsh_bit_val, ldp->vlsh_bit_val);
245 else if (sb > LDP_SID_BIT_MAX)
247 ldp->vlsh_bit_val = (1 << LDP_SID_BIT_MAX);
248 ldp->vlsh_bit_mask = ldp->vlsh_bit_val - 1;
250 LDBG (0, "WARNING: LDP sid bit (%u) specified in the env var "
251 LDP_ENV_SID_BIT " (%s) is too big. Using LDP_SID_BIT_MAX"
252 " (%d)! sid bit value %d (0x%x)", sb, env_var_str,
253 LDP_SID_BIT_MAX, ldp->vlsh_bit_val, ldp->vlsh_bit_val);
257 ldp->vlsh_bit_val = (1 << sb);
258 ldp->vlsh_bit_mask = ldp->vlsh_bit_val - 1;
260 LDBG (0, "configured LDP sid bit (%u) from "
261 LDP_ENV_SID_BIT "! sid bit value %d (0x%x)", sb,
262 ldp->vlsh_bit_val, ldp->vlsh_bit_val);
265 /* Make sure there are enough bits in the fd set for vcl sessions */
266 if (ldp->vlsh_bit_val > FD_SETSIZE / 2)
268 LDBG (0, "ERROR: LDP vlsh bit value %d > FD_SETSIZE/2 %d!",
269 ldp->vlsh_bit_val, FD_SETSIZE / 2);
274 env_var_str = getenv (LDP_ENV_TLS_TRANS);
277 ldp->transparent_tls = 1;
281 pool_foreach (ldpw, ldp->workers, ({
282 clib_memset (&ldpw->clib_time, 0, sizeof (ldpw->clib_time));
286 LDBG (0, "LDP initialization: done!");
297 if ((errno = -ldp_init ()))
300 vlsh = ldp_fd_to_vlsh (fd);
301 if (vlsh != VLS_INVALID_HANDLE)
303 epfd = vls_attr (vlsh, VPPCOM_ATTR_GET_LIBC_EPFD, 0, 0);
306 LDBG (0, "fd %d: calling libc_close: epfd %u", fd, epfd);
308 rv = libc_close (epfd);
311 u32 size = sizeof (epfd);
314 (void) vls_attr (vlsh, VPPCOM_ATTR_SET_LIBC_EPFD, &epfd, &size);
317 else if (PREDICT_FALSE (epfd < 0))
324 LDBG (0, "fd %d: calling vls_close: vlsh %u", fd, vlsh);
326 rv = vls_close (vlsh);
335 LDBG (0, "fd %d: calling libc_close", fd);
336 rv = libc_close (fd);
344 read (int fd, void *buf, size_t nbytes)
349 if ((errno = -ldp_init ()))
352 vlsh = ldp_fd_to_vlsh (fd);
353 if (vlsh != VLS_INVALID_HANDLE)
355 size = vls_read (vlsh, buf, nbytes);
364 size = libc_read (fd, buf, nbytes);
371 readv (int fd, const struct iovec * iov, int iovcnt)
373 int rv = 0, i, total = 0;
377 if ((errno = -ldp_init ()))
380 vlsh = ldp_fd_to_vlsh (fd);
381 if (vlsh != VLS_INVALID_HANDLE)
383 for (i = 0; i < iovcnt; ++i)
385 rv = vls_read (vlsh, iov[i].iov_base, iov[i].iov_len);
391 if (rv < iov[i].iov_len)
395 if (rv < 0 && total == 0)
405 size = libc_readv (fd, iov, iovcnt);
412 write (int fd, const void *buf, size_t nbytes)
417 if ((errno = -ldp_init ()))
420 vlsh = ldp_fd_to_vlsh (fd);
421 if (vlsh != VLS_INVALID_HANDLE)
423 size = vls_write_msg (vlsh, (void *) buf, nbytes);
432 size = libc_write (fd, buf, nbytes);
439 writev (int fd, const struct iovec * iov, int iovcnt)
441 ssize_t size = 0, total = 0;
445 if ((errno = -ldp_init ()))
448 vlsh = ldp_fd_to_vlsh (fd);
449 if (vlsh != VLS_INVALID_HANDLE)
453 for (i = 0; i < iovcnt; ++i)
455 rv = vls_write_msg (vlsh, iov[i].iov_base, iov[i].iov_len);
461 if (rv < iov[i].iov_len)
466 while ((rv >= 0) && (total == 0));
478 size = libc_writev (fd, iov, iovcnt);
486 fcntl64 (int fd, int cmd, ...)
489 fcntl (int fd, int cmd, ...)
496 if ((errno = -ldp_init ()))
501 vlsh = ldp_fd_to_vlsh (fd);
502 LDBG (0, "fd %u vlsh %d, cmd %u", fd, vlsh, cmd);
503 if (vlsh != VLS_INVALID_HANDLE)
505 int flags = va_arg (ap, int);
508 size = sizeof (flags);
513 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_FLAGS, &flags, &size);
517 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_FLAGS, &flags, &size);
522 /* TODO handle this */
523 LDBG (0, "F_SETFD ignored flags %u", flags);
539 rv = libc_vfcntl64 (fd, cmd, ap);
541 rv = libc_vfcntl (fd, cmd, ap);
551 ioctl (int fd, unsigned long int cmd, ...)
557 if ((errno = -ldp_init ()))
562 vlsh = ldp_fd_to_vlsh (fd);
563 if (vlsh != VLS_INVALID_HANDLE)
568 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_NREAD, 0, 0);
573 u32 flags = va_arg (ap, int) ? O_NONBLOCK : 0;
574 u32 size = sizeof (flags);
576 /* TBD: When VPPCOM_ATTR_[GS]ET_FLAGS supports flags other than
577 * non-blocking, the flags should be read here and merged
580 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_FLAGS, &flags, &size);
596 rv = libc_vioctl (fd, cmd, ap);
604 ldp_select_init_maps (fd_set * __restrict original,
605 clib_bitmap_t ** resultb, clib_bitmap_t ** libcb,
606 clib_bitmap_t ** vclb, int nfds, u32 minbits,
607 u32 n_bytes, uword * si_bits, uword * libc_bits)
609 uword si_bits_set, libc_bits_set;
613 clib_bitmap_validate (*vclb, minbits);
614 clib_bitmap_validate (*libcb, minbits);
615 clib_bitmap_validate (*resultb, minbits);
616 clib_memcpy_fast (*resultb, original, n_bytes);
617 memset (original, 0, n_bytes);
620 clib_bitmap_foreach (fd, *resultb, ({
623 vlsh = ldp_fd_to_vlsh (fd);
624 if (vlsh == VLS_INVALID_HANDLE)
625 clib_bitmap_set_no_check (*libcb, fd, 1);
627 clib_bitmap_set_no_check (*vclb, vlsh_to_session_index (vlsh), 1);
631 si_bits_set = clib_bitmap_last_set (*vclb) + 1;
632 *si_bits = (si_bits_set > *si_bits) ? si_bits_set : *si_bits;
634 libc_bits_set = clib_bitmap_last_set (*libcb) + 1;
635 *libc_bits = (libc_bits_set > *libc_bits) ? libc_bits_set : *libc_bits;
639 ldp_select_vcl_map_to_libc (clib_bitmap_t * vclb, fd_set * __restrict libcb)
649 clib_bitmap_foreach (si, vclb, ({
650 vlsh = vls_session_index_to_vlsh (si);
651 ASSERT (vlsh != VLS_INVALID_HANDLE);
652 fd = ldp_vlsh_to_fd (vlsh);
653 if (PREDICT_FALSE (fd < 0))
666 ldp_select_libc_map_merge (clib_bitmap_t * result, fd_set * __restrict libcb)
674 clib_bitmap_foreach (fd, result, ({
675 FD_SET ((int)fd, libcb);
681 ldp_pselect (int nfds, fd_set * __restrict readfds,
682 fd_set * __restrict writefds,
683 fd_set * __restrict exceptfds,
684 const struct timespec *__restrict timeout,
685 const __sigset_t * __restrict sigmask)
687 u32 minbits = clib_max (nfds, BITS (uword)), n_bytes;
688 ldp_worker_ctx_t *ldpw = ldp_worker_get_current ();
689 struct timespec libc_tspec = { 0 };
690 f64 time_out, vcl_timeout = 0;
691 uword si_bits, libc_bits;
692 int rv, bits_set = 0;
700 if (PREDICT_FALSE (ldpw->clib_time.init_cpu_time == 0))
701 clib_time_init (&ldpw->clib_time);
705 time_out = (timeout->tv_sec == 0 && timeout->tv_nsec == 0) ?
706 (f64) 0 : (f64) timeout->tv_sec + (f64) timeout->tv_nsec / (f64) 1e9;
708 /* select as fine grained sleep */
711 time_out += clib_time_now (&ldpw->clib_time);
712 while (clib_time_now (&ldpw->clib_time) < time_out)
725 if (nfds <= ldp->vlsh_bit_val)
727 rv = libc_pselect (nfds, readfds, writefds, exceptfds,
732 si_bits = libc_bits = 0;
733 n_bytes = nfds / 8 + ((nfds % 8) ? 1 : 0);
736 ldp_select_init_maps (readfds, &ldpw->rd_bitmap, &ldpw->libc_rd_bitmap,
737 &ldpw->si_rd_bitmap, nfds, minbits, n_bytes,
738 &si_bits, &libc_bits);
740 ldp_select_init_maps (writefds, &ldpw->wr_bitmap,
741 &ldpw->libc_wr_bitmap, &ldpw->si_wr_bitmap, nfds,
742 minbits, n_bytes, &si_bits, &libc_bits);
744 ldp_select_init_maps (exceptfds, &ldpw->ex_bitmap,
745 &ldpw->libc_ex_bitmap, &ldpw->si_ex_bitmap, nfds,
746 minbits, n_bytes, &si_bits, &libc_bits);
748 if (PREDICT_FALSE (!si_bits && !libc_bits))
756 libc_tspec = timeout ? *timeout : libc_tspec;
763 clib_memcpy_fast (ldpw->rd_bitmap, ldpw->si_rd_bitmap,
764 vec_len (ldpw->rd_bitmap) *
765 sizeof (clib_bitmap_t));
767 clib_memcpy_fast (ldpw->wr_bitmap, ldpw->si_wr_bitmap,
768 vec_len (ldpw->wr_bitmap) *
769 sizeof (clib_bitmap_t));
771 clib_memcpy_fast (ldpw->ex_bitmap, ldpw->si_ex_bitmap,
772 vec_len (ldpw->ex_bitmap) *
773 sizeof (clib_bitmap_t));
775 rv = vls_select (si_bits, readfds ? ldpw->rd_bitmap : NULL,
776 writefds ? ldpw->wr_bitmap : NULL,
777 exceptfds ? ldpw->ex_bitmap : NULL, vcl_timeout);
785 if (ldp_select_vcl_map_to_libc (ldpw->rd_bitmap, readfds))
791 if (ldp_select_vcl_map_to_libc (ldpw->wr_bitmap, writefds))
797 if (ldp_select_vcl_map_to_libc (ldpw->ex_bitmap, exceptfds))
808 clib_memcpy_fast (ldpw->rd_bitmap, ldpw->libc_rd_bitmap,
809 vec_len (ldpw->libc_rd_bitmap) *
810 sizeof (clib_bitmap_t));
812 clib_memcpy_fast (ldpw->wr_bitmap, ldpw->libc_wr_bitmap,
813 vec_len (ldpw->libc_wr_bitmap) *
814 sizeof (clib_bitmap_t));
816 clib_memcpy_fast (ldpw->ex_bitmap, ldpw->libc_ex_bitmap,
817 vec_len (ldpw->libc_ex_bitmap) *
818 sizeof (clib_bitmap_t));
820 rv = libc_pselect (libc_bits,
821 readfds ? (fd_set *) ldpw->rd_bitmap : NULL,
822 writefds ? (fd_set *) ldpw->wr_bitmap : NULL,
823 exceptfds ? (fd_set *) ldpw->ex_bitmap : NULL,
824 &libc_tspec, sigmask);
827 ldp_select_libc_map_merge (ldpw->rd_bitmap, readfds);
828 ldp_select_libc_map_merge (ldpw->wr_bitmap, writefds);
829 ldp_select_libc_map_merge (ldpw->ex_bitmap, exceptfds);
840 while ((time_out == -1) || (clib_time_now (&ldpw->clib_time) < time_out));
844 /* TBD: set timeout to amount of time left */
845 clib_bitmap_zero (ldpw->rd_bitmap);
846 clib_bitmap_zero (ldpw->si_rd_bitmap);
847 clib_bitmap_zero (ldpw->libc_rd_bitmap);
848 clib_bitmap_zero (ldpw->wr_bitmap);
849 clib_bitmap_zero (ldpw->si_wr_bitmap);
850 clib_bitmap_zero (ldpw->libc_wr_bitmap);
851 clib_bitmap_zero (ldpw->ex_bitmap);
852 clib_bitmap_zero (ldpw->si_ex_bitmap);
853 clib_bitmap_zero (ldpw->libc_ex_bitmap);
/*
 * select () interposer.
 *
 * Converts the optional struct timeval timeout into a struct timespec and
 * hands the request to ldp_pselect () with a NULL signal mask.  The timeval
 * is only read when it is non-NULL; a NULL timeout is forwarded as NULL.
 *
 * Returns whatever ldp_pselect () returns.
 */
int
select (int nfds, fd_set * __restrict readfds,
	fd_set * __restrict writefds,
	fd_set * __restrict exceptfds, struct timeval *__restrict timeout)
{
  struct timespec tspec = { 0 };
  struct timespec *tspec_p = NULL;

  if (timeout)
    {
      tspec.tv_sec = timeout->tv_sec;
      /* timeval carries microseconds, timespec wants nanoseconds */
      tspec.tv_nsec = timeout->tv_usec * 1000;
      tspec_p = &tspec;
    }

  return ldp_pselect (nfds, readfds, writefds, exceptfds, tspec_p, NULL);
}
/*
 * pselect () interposer.
 *
 * Forwards every argument to ldp_pselect (), including the caller's signal
 * mask, so that the mask reaches the libc_pselect () calls made there
 * instead of being silently replaced by a NULL mask.
 *
 * Returns whatever ldp_pselect () returns.
 */
int
pselect (int nfds, fd_set * __restrict readfds,
	 fd_set * __restrict writefds,
	 fd_set * __restrict exceptfds,
	 const struct timespec *__restrict timeout,
	 const __sigset_t * __restrict sigmask)
{
  return ldp_pselect (nfds, readfds, writefds, exceptfds, timeout, sigmask);
}
886 /* If transparent TLS mode is turned on, then ldp will load key and cert.
889 load_tls_cert (vls_handle_t vlsh)
891 char *env_var_str = getenv (LDP_ENV_TLS_CERT);
899 fp = fopen (env_var_str, "r");
902 LDBG (0, "ERROR: failed to open cert file %s \n", env_var_str);
905 cert_size = fread (inbuf, sizeof (char), sizeof (inbuf), fp);
907 vppcom_session_tls_add_cert (vlsh_to_session_index (vlsh), tls_cert,
913 LDBG (0, "ERROR: failed to read LDP environment %s\n",
921 load_tls_key (vls_handle_t vlsh)
923 char *env_var_str = getenv (LDP_ENV_TLS_KEY);
931 fp = fopen (env_var_str, "r");
934 LDBG (0, "ERROR: failed to open key file %s \n", env_var_str);
937 key_size = fread (inbuf, sizeof (char), sizeof (inbuf), fp);
939 vppcom_session_tls_add_key (vlsh_to_session_index (vlsh), tls_key,
945 LDBG (0, "ERROR: failed to read LDP environment %s\n", LDP_ENV_TLS_KEY);
952 socket (int domain, int type, int protocol)
954 int rv, sock_type = type & ~(SOCK_CLOEXEC | SOCK_NONBLOCK);
955 u8 is_nonblocking = type & SOCK_NONBLOCK ? 1 : 0;
958 if ((errno = -ldp_init ()))
961 if (((domain == AF_INET) || (domain == AF_INET6)) &&
962 ((sock_type == SOCK_STREAM) || (sock_type == SOCK_DGRAM)))
965 if (ldp->transparent_tls)
967 proto = VPPCOM_PROTO_TLS;
970 proto = ((sock_type == SOCK_DGRAM) ?
971 VPPCOM_PROTO_UDP : VPPCOM_PROTO_TCP);
973 LDBG (0, "calling vls_create: proto %u (%s), is_nonblocking %u",
974 proto, vppcom_proto_str (proto), is_nonblocking);
976 vlsh = vls_create (proto, is_nonblocking);
984 if (ldp->transparent_tls)
986 if (load_tls_cert (vlsh) < 0 || load_tls_key (vlsh) < 0)
991 rv = ldp_vlsh_to_fd (vlsh);
996 LDBG (0, "calling libc_socket");
997 rv = libc_socket (domain, type, protocol);
1004 * Create two new sockets, of type TYPE in domain DOMAIN and using
1005 * protocol PROTOCOL, which are connected to each other, and put file
1006 * descriptors for them in FDS[0] and FDS[1]. If PROTOCOL is zero,
1007 * one will be chosen automatically.
1008 * Returns 0 on success, -1 for errors.
1011 socketpair (int domain, int type, int protocol, int fds[2])
1013 int rv, sock_type = type & ~(SOCK_CLOEXEC | SOCK_NONBLOCK);
1015 if ((errno = -ldp_init ()))
1018 if (((domain == AF_INET) || (domain == AF_INET6)) &&
1019 ((sock_type == SOCK_STREAM) || (sock_type == SOCK_DGRAM)))
1021 LDBG (0, "LDP-TBD");
1027 LDBG (1, "calling libc_socketpair");
1028 rv = libc_socketpair (domain, type, protocol, fds);
1035 bind (int fd, __CONST_SOCKADDR_ARG addr, socklen_t len)
1040 if ((errno = -ldp_init ()))
1043 vlsh = ldp_fd_to_vlsh (fd);
1044 if (vlsh != VLS_INVALID_HANDLE)
1048 switch (addr->sa_family)
1051 if (len != sizeof (struct sockaddr_in))
1053 LDBG (0, "ERROR: fd %d: vlsh %u: Invalid AF_INET addr len %u!",
1059 ep.is_ip4 = VPPCOM_IS_IP4;
1060 ep.ip = (u8 *) & ((const struct sockaddr_in *) addr)->sin_addr;
1061 ep.port = (u16) ((const struct sockaddr_in *) addr)->sin_port;
1065 if (len != sizeof (struct sockaddr_in6))
1067 LDBG (0, "ERROR: fd %d: vlsh %u: Invalid AF_INET6 addr len %u!",
1073 ep.is_ip4 = VPPCOM_IS_IP6;
1074 ep.ip = (u8 *) & ((const struct sockaddr_in6 *) addr)->sin6_addr;
1075 ep.port = (u16) ((const struct sockaddr_in6 *) addr)->sin6_port;
1079 LDBG (0, "ERROR: fd %d: vlsh %u: Unsupported address family %u!",
1080 fd, vlsh, addr->sa_family);
1081 errno = EAFNOSUPPORT;
1085 LDBG (0, "fd %d: calling vls_bind: vlsh %u, addr %p, len %u", fd, vlsh,
1088 rv = vls_bind (vlsh, &ep);
1089 if (rv != VPPCOM_OK)
1097 LDBG (0, "fd %d: calling libc_bind: addr %p, len %u", fd, addr, len);
1098 rv = libc_bind (fd, addr, len);
1102 LDBG (1, "fd %d: returning %d", fd, rv);
1108 ldp_copy_ep_to_sockaddr (__SOCKADDR_ARG addr, socklen_t * __restrict len,
1109 vppcom_endpt_t * ep)
1112 int sa_len, copy_len;
1114 if ((errno = -ldp_init ()))
1117 if (addr && len && ep)
1119 addr->sa_family = (ep->is_ip4 == VPPCOM_IS_IP4) ? AF_INET : AF_INET6;
1120 switch (addr->sa_family)
1123 ((struct sockaddr_in *) addr)->sin_port = ep->port;
1124 if (*len > sizeof (struct sockaddr_in))
1125 *len = sizeof (struct sockaddr_in);
1126 sa_len = sizeof (struct sockaddr_in) - sizeof (struct in_addr);
1127 copy_len = *len - sa_len;
1129 memcpy (&((struct sockaddr_in *) addr)->sin_addr, ep->ip,
1134 ((struct sockaddr_in6 *) addr)->sin6_port = ep->port;
1135 if (*len > sizeof (struct sockaddr_in6))
1136 *len = sizeof (struct sockaddr_in6);
1137 sa_len = sizeof (struct sockaddr_in6) - sizeof (struct in6_addr);
1138 copy_len = *len - sa_len;
1140 memcpy (((struct sockaddr_in6 *) addr)->sin6_addr.
1141 __in6_u.__u6_addr8, ep->ip, copy_len);
1154 getsockname (int fd, __SOCKADDR_ARG addr, socklen_t * __restrict len)
1159 if ((errno = -ldp_init ()))
1162 vlsh = ldp_fd_to_vlsh (fd);
1163 if (vlsh != VLS_INVALID_HANDLE)
1166 u8 addr_buf[sizeof (struct in6_addr)];
1167 u32 size = sizeof (ep);
1171 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_LCL_ADDR, &ep, &size);
1172 if (rv != VPPCOM_OK)
1179 rv = ldp_copy_ep_to_sockaddr (addr, len, &ep);
1180 if (rv != VPPCOM_OK)
1189 rv = libc_getsockname (fd, addr, len);
1196 connect (int fd, __CONST_SOCKADDR_ARG addr, socklen_t len)
1201 if ((errno = -ldp_init ()))
1206 LDBG (0, "ERROR: fd %d: NULL addr, len %u", fd, len);
1212 vlsh = ldp_fd_to_vlsh (fd);
1213 if (vlsh != VLS_INVALID_HANDLE)
1217 switch (addr->sa_family)
1220 if (len != sizeof (struct sockaddr_in))
1222 LDBG (0, "fd %d: ERROR vlsh %u: Invalid AF_INET addr len %u!",
1228 ep.is_ip4 = VPPCOM_IS_IP4;
1229 ep.ip = (u8 *) & ((const struct sockaddr_in *) addr)->sin_addr;
1230 ep.port = (u16) ((const struct sockaddr_in *) addr)->sin_port;
1234 if (len != sizeof (struct sockaddr_in6))
1236 LDBG (0, "fd %d: ERROR vlsh %u: Invalid AF_INET6 addr len %u!",
1242 ep.is_ip4 = VPPCOM_IS_IP6;
1243 ep.ip = (u8 *) & ((const struct sockaddr_in6 *) addr)->sin6_addr;
1244 ep.port = (u16) ((const struct sockaddr_in6 *) addr)->sin6_port;
1248 LDBG (0, "fd %d: ERROR vlsh %u: Unsupported address family %u!",
1249 fd, vlsh, addr->sa_family);
1250 errno = EAFNOSUPPORT;
1254 LDBG (0, "fd %d: calling vls_connect(): vlsh %u addr %p len %u", fd,
1257 rv = vls_connect (vlsh, &ep);
1258 if (rv != VPPCOM_OK)
1266 LDBG (0, "fd %d: calling libc_connect(): addr %p, len %u",
1269 rv = libc_connect (fd, addr, len);
1273 LDBG (1, "fd %d: returning %d (0x%x)", fd, rv, rv);
1278 getpeername (int fd, __SOCKADDR_ARG addr, socklen_t * __restrict len)
1283 if ((errno = -ldp_init ()))
1286 vlsh = ldp_fd_to_vlsh (fd);
1287 if (vlsh != VLS_INVALID_HANDLE)
1290 u8 addr_buf[sizeof (struct in6_addr)];
1291 u32 size = sizeof (ep);
1294 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_PEER_ADDR, &ep, &size);
1295 if (rv != VPPCOM_OK)
1302 rv = ldp_copy_ep_to_sockaddr (addr, len, &ep);
1303 if (rv != VPPCOM_OK)
1312 rv = libc_getpeername (fd, addr, len);
1319 send (int fd, const void *buf, size_t n, int flags)
1321 vls_handle_t vlsh = ldp_fd_to_vlsh (fd);
1324 if ((errno = -ldp_init ()))
1327 if (vlsh != VLS_INVALID_HANDLE)
1329 size = vls_sendto (vlsh, (void *) buf, n, flags, NULL);
1330 if (size < VPPCOM_OK)
1338 size = libc_send (fd, buf, n, flags);
1345 sendfile (int out_fd, int in_fd, off_t * offset, size_t len)
1347 ldp_worker_ctx_t *ldpw = ldp_worker_get_current ();
1351 if ((errno = -ldp_init ()))
1354 vlsh = ldp_fd_to_vlsh (out_fd);
1355 if (vlsh != VLS_INVALID_HANDLE)
1358 ssize_t results = 0;
1359 size_t n_bytes_left = len;
1360 size_t bytes_to_read;
1363 u32 flags, flags_len = sizeof (flags);
1365 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_FLAGS, &flags, &flags_len);
1366 if (PREDICT_FALSE (rv != VPPCOM_OK))
1368 LDBG (0, "ERROR: out fd %d: vls_attr: vlsh %u, returned %d (%s)!",
1369 out_fd, vlsh, rv, vppcom_retval_str (rv));
1371 vec_reset_length (ldpw->io_buffer);
1379 off_t off = lseek (in_fd, *offset, SEEK_SET);
1380 if (PREDICT_FALSE (off == -1))
1386 ASSERT (off == *offset);
1391 size = vls_attr (vlsh, VPPCOM_ATTR_GET_NWRITE, 0, 0);
1394 LDBG (0, "ERROR: fd %d: vls_attr: vlsh %u returned %d (%s)!",
1395 out_fd, vlsh, size, vppcom_retval_str (size));
1396 vec_reset_length (ldpw->io_buffer);
1402 bytes_to_read = size;
1403 if (bytes_to_read == 0)
1405 if (flags & O_NONBLOCK)
1414 bytes_to_read = clib_min (n_bytes_left, bytes_to_read);
1415 vec_validate (ldpw->io_buffer, bytes_to_read);
1416 nbytes = libc_read (in_fd, ldpw->io_buffer, bytes_to_read);
1421 vec_reset_length (ldpw->io_buffer);
1428 size = vls_write (vlsh, ldpw->io_buffer, nbytes);
1431 if (size == VPPCOM_EAGAIN)
1433 if (flags & O_NONBLOCK)
1444 vec_reset_length (ldpw->io_buffer);
1453 ASSERT (n_bytes_left >= nbytes);
1454 n_bytes_left = n_bytes_left - nbytes;
1456 while (n_bytes_left > 0);
1459 vec_reset_length (ldpw->io_buffer);
1462 off_t off = lseek (in_fd, *offset, SEEK_SET);
1463 if (PREDICT_FALSE (off == -1))
1469 ASSERT (off == *offset);
1470 *offset += results + 1;
1482 size = libc_sendfile (out_fd, in_fd, offset, len);
/*
 * sendfile64 () interposer: delegates unchanged to this file's sendfile ()
 * and returns its result.
 */
ssize_t
sendfile64 (int out_fd, int in_fd, off_t * offset, size_t len)
{
  ssize_t n_sent = sendfile (out_fd, in_fd, offset, len);

  return n_sent;
}
1496 recv (int fd, void *buf, size_t n, int flags)
1501 if ((errno = -ldp_init ()))
1504 vlsh = ldp_fd_to_vlsh (fd);
1505 if (vlsh != VLS_INVALID_HANDLE)
1507 size = vls_recvfrom (vlsh, buf, n, flags, NULL);
1513 size = libc_recv (fd, buf, n, flags);
1520 sendto (int fd, const void *buf, size_t n, int flags,
1521 __CONST_SOCKADDR_ARG addr, socklen_t addr_len)
1526 if ((errno = -ldp_init ()))
1529 vlsh = ldp_fd_to_vlsh (fd);
1530 if (vlsh != INVALID_SESSION_ID)
1532 vppcom_endpt_t *ep = 0;
1538 switch (addr->sa_family)
1541 ep->is_ip4 = VPPCOM_IS_IP4;
1543 (uint8_t *) & ((const struct sockaddr_in *) addr)->sin_addr;
1545 (uint16_t) ((const struct sockaddr_in *) addr)->sin_port;
1549 ep->is_ip4 = VPPCOM_IS_IP6;
1551 (uint8_t *) & ((const struct sockaddr_in6 *) addr)->sin6_addr;
1553 (uint16_t) ((const struct sockaddr_in6 *) addr)->sin6_port;
1557 errno = EAFNOSUPPORT;
1563 size = vls_sendto (vlsh, (void *) buf, n, flags, ep);
1572 size = libc_sendto (fd, buf, n, flags, addr, addr_len);
1580 recvfrom (int fd, void *__restrict buf, size_t n, int flags,
1581 __SOCKADDR_ARG addr, socklen_t * __restrict addr_len)
1586 if ((errno = -ldp_init ()))
1589 sid = ldp_fd_to_vlsh (fd);
1590 if (sid != VLS_INVALID_HANDLE)
1593 u8 src_addr[sizeof (struct sockaddr_in6)];
1598 size = vls_recvfrom (sid, buf, n, flags, &ep);
1602 rv = ldp_copy_ep_to_sockaddr (addr, addr_len, &ep);
1608 size = vls_recvfrom (sid, buf, n, flags, NULL);
1618 size = libc_recvfrom (fd, buf, n, flags, addr, addr_len);
1625 sendmsg (int fd, const struct msghdr * message, int flags)
1630 if ((errno = -ldp_init ()))
1633 vlsh = ldp_fd_to_vlsh (fd);
1634 if (vlsh != VLS_INVALID_HANDLE)
1636 LDBG (0, "LDP-TBD");
1642 size = libc_sendmsg (fd, message, flags);
1650 sendmmsg (int fd, struct mmsghdr *vmessages, unsigned int vlen, int flags)
1653 const char *func_str;
1654 u32 sh = ldp_fd_to_vlsh (fd);
1656 if ((errno = -ldp_init ()))
1659 if (sh != INVALID_SESSION_ID)
1661 clib_warning ("LDP<%d>: LDP-TBD", getpid ());
1667 func_str = "libc_sendmmsg";
1670 clib_warning ("LDP<%d>: fd %d (0x%x): calling %s(): "
1671 "vmessages %p, vlen %u, flags 0x%x",
1672 getpid (), fd, fd, func_str, vmessages, vlen, flags);
1674 size = libc_sendmmsg (fd, vmessages, vlen, flags);
1681 int errno_val = errno;
1683 clib_warning ("LDP<%d>: ERROR: fd %d (0x%x): %s() failed! "
1684 "rv %d, errno = %d", getpid (), fd, fd,
1685 func_str, size, errno_val);
1689 clib_warning ("LDP<%d>: fd %d (0x%x): returning %d (0x%x)",
1690 getpid (), fd, fd, size, size);
1697 recvmsg (int fd, struct msghdr * message, int flags)
1702 if ((errno = -ldp_init ()))
1705 vlsh = ldp_fd_to_vlsh (fd);
1706 if (vlsh != VLS_INVALID_HANDLE)
1708 LDBG (0, "LDP-TBD");
1714 size = libc_recvmsg (fd, message, flags);
1722 recvmmsg (int fd, struct mmsghdr *vmessages,
1723 unsigned int vlen, int flags, struct timespec *tmo)
1726 const char *func_str;
1727 u32 sh = ldp_fd_to_vlsh (fd);
1729 if ((errno = -ldp_init ()))
1732 if (sh != INVALID_SESSION_ID)
1734 clib_warning ("LDP<%d>: LDP-TBD", getpid ());
1740 func_str = "libc_recvmmsg";
1743 clib_warning ("LDP<%d>: fd %d (0x%x): calling %s(): "
1744 "vmessages %p, vlen %u, flags 0x%x, tmo %p",
1745 getpid (), fd, fd, func_str, vmessages, vlen,
1748 size = libc_recvmmsg (fd, vmessages, vlen, flags, tmo);
1755 int errno_val = errno;
1757 clib_warning ("LDP<%d>: ERROR: fd %d (0x%x): %s() failed! "
1758 "rv %d, errno = %d", getpid (), fd, fd,
1759 func_str, size, errno_val);
1763 clib_warning ("LDP<%d>: fd %d (0x%x): returning %d (0x%x)",
1764 getpid (), fd, fd, size, size);
1771 getsockopt (int fd, int level, int optname,
1772 void *__restrict optval, socklen_t * __restrict optlen)
1777 if ((errno = -ldp_init ()))
1780 vlsh = ldp_fd_to_vlsh (fd);
1781 if (vlsh != VLS_INVALID_HANDLE)
1791 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_TCP_NODELAY,
1795 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_TCP_USER_MSS,
1799 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_TCP_KEEPIDLE,
1803 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_TCP_KEEPINTVL,
1807 if (optval && optlen && (*optlen == sizeof (struct tcp_info)))
1809 LDBG (1, "fd %d: vlsh %u SOL_TCP, TCP_INFO, optval %p, "
1810 "optlen %d: #LDP-NOP#", fd, vlsh, optval, *optlen);
1811 memset (optval, 0, *optlen);
1817 case TCP_CONGESTION:
1818 strcpy (optval, "cubic");
1819 *optlen = strlen ("cubic");
1823 LDBG (0, "ERROR: fd %d: getsockopt SOL_TCP: sid %u, "
1824 "optname %d unsupported!", fd, vlsh, optname);
1832 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_V6ONLY, optval, optlen);
1835 LDBG (0, "ERROR: fd %d: getsockopt SOL_IPV6: vlsh %u "
1836 "optname %d unsupported!", fd, vlsh, optname);
1844 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_LISTEN, optval, optlen);
1847 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_KEEPALIVE, optval, optlen);
1850 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_PROTOCOL, optval, optlen);
1851 *(int *) optval = *(int *) optval ? SOCK_DGRAM : SOCK_STREAM;
1854 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_TX_FIFO_LEN,
1858 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_RX_FIFO_LEN,
1862 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_REUSEADDR, optval, optlen);
1865 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_BROADCAST, optval, optlen);
1868 rv = vls_attr (vlsh, VPPCOM_ATTR_GET_ERROR, optval, optlen);
1871 LDBG (0, "ERROR: fd %d: getsockopt SOL_SOCKET: vlsh %u "
1872 "optname %d unsupported!", fd, vlsh, optname);
1880 if (rv != VPPCOM_OK)
1888 rv = libc_getsockopt (fd, level, optname, optval, optlen);
1895 setsockopt (int fd, int level, int optname,
1896 const void *optval, socklen_t optlen)
1901 if ((errno = -ldp_init ()))
1904 vlsh = ldp_fd_to_vlsh (fd);
1905 if (vlsh != VLS_INVALID_HANDLE)
1915 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_TCP_NODELAY,
1916 (void *) optval, &optlen);
1919 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_TCP_USER_MSS,
1920 (void *) optval, &optlen);
1923 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_TCP_KEEPIDLE,
1924 (void *) optval, &optlen);
1927 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_TCP_KEEPINTVL,
1928 (void *) optval, &optlen);
1930 case TCP_CONGESTION:
1936 LDBG (0, "ERROR: fd %d: setsockopt() SOL_TCP: vlsh %u"
1937 "optname %d unsupported!", fd, vlsh, optname);
1945 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_V6ONLY,
1946 (void *) optval, &optlen);
1949 LDBG (0, "ERROR: fd %d: setsockopt SOL_IPV6: vlsh %u"
1950 "optname %d unsupported!", fd, vlsh, optname);
1958 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_KEEPALIVE,
1959 (void *) optval, &optlen);
1962 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_REUSEADDR,
1963 (void *) optval, &optlen);
1966 rv = vls_attr (vlsh, VPPCOM_ATTR_SET_BROADCAST,
1967 (void *) optval, &optlen);
1970 LDBG (0, "ERROR: fd %d: setsockopt SOL_SOCKET: vlsh %u "
1971 "optname %d unsupported!", fd, vlsh, optname);
1979 if (rv != VPPCOM_OK)
1987 rv = libc_setsockopt (fd, level, optname, optval, optlen);
1994 listen (int fd, int n)
1999 if ((errno = -ldp_init ()))
2002 vlsh = ldp_fd_to_vlsh (fd);
2003 if (vlsh != VLS_INVALID_HANDLE)
2005 LDBG (0, "fd %d: calling vls_listen: vlsh %u, n %d", fd, vlsh, n);
2007 rv = vls_listen (vlsh, n);
2008 if (rv != VPPCOM_OK)
2016 LDBG (0, "fd %d: calling libc_listen(): n %d", fd, n);
2017 rv = libc_listen (fd, n);
2020 LDBG (1, "fd %d: returning %d", fd, rv);
2025 ldp_accept4 (int listen_fd, __SOCKADDR_ARG addr,
2026 socklen_t * __restrict addr_len, int flags)
2028 vls_handle_t listen_vlsh, accept_vlsh;
2031 if ((errno = -ldp_init ()))
2034 listen_vlsh = ldp_fd_to_vlsh (listen_fd);
2035 if (listen_vlsh != VLS_INVALID_HANDLE)
2038 u8 src_addr[sizeof (struct sockaddr_in6)];
2039 memset (&ep, 0, sizeof (ep));
2042 LDBG (0, "listen fd %d: calling vppcom_session_accept: listen sid %u,"
2043 " ep %p, flags 0x%x", listen_fd, listen_vlsh, ep, flags);
2045 accept_vlsh = vls_accept (listen_vlsh, &ep, flags);
2046 if (accept_vlsh < 0)
2048 errno = -accept_vlsh;
2053 rv = ldp_copy_ep_to_sockaddr (addr, addr_len, &ep);
2054 if (rv != VPPCOM_OK)
2056 (void) vls_close (accept_vlsh);
2062 rv = ldp_vlsh_to_fd (accept_vlsh);
2068 LDBG (0, "listen fd %d: calling libc_accept4(): addr %p, addr_len %p,"
2069 " flags 0x%x", listen_fd, addr, addr_len, flags);
2071 rv = libc_accept4 (listen_fd, addr, addr_len, flags);
2074 LDBG (1, "listen fd %d: accept returning %d", listen_fd, rv);
/*
 * accept4 () interposer: passes the listening fd, the peer address buffer
 * and the caller's flags straight through to ldp_accept4 ().
 */
int
accept4 (int fd, __SOCKADDR_ARG addr, socklen_t * __restrict addr_len,
	 int flags)
{
  int accepted_fd = ldp_accept4 (fd, addr, addr_len, flags);

  return accepted_fd;
}
/*
 * accept () interposer: same as accept4 () with no flags, i.e. it calls
 * ldp_accept4 () with flags set to 0.
 */
int
accept (int fd, __SOCKADDR_ARG addr, socklen_t * __restrict addr_len)
{
  int accepted_fd = ldp_accept4 (fd, addr, addr_len, 0);

  return accepted_fd;
}
/*
 * shutdown() interposer.
 *
 * errno is loaded with the negated ldp_init() result, then the fd is
 * translated with ldp_fd_to_vlsh(). For a valid VLS handle, `how` is written
 * through vls_attr (VPPCOM_ATTR_SET_SHUT), the resulting state is read back
 * into `flags` through vls_attr (VPPCOM_ATTR_GET_SHUT) and compared with
 * SHUT_RDWR. The debug text names libc_shutdown() as the path for fds that
 * have no VLS handle.
 *
 * NOTE(review): what happens when either vls_attr() call fails, and what is
 * done once flags equals SHUT_RDWR, is not part of this excerpt - confirm.
 */
2093 shutdown (int fd, int how)
/* Size argument shared by both vls_attr() calls below. */
2097 u32 flags_len = sizeof (flags);
2099 if ((errno = -ldp_init ()))
2102 vlsh = ldp_fd_to_vlsh (fd);
2103 if (vlsh != VLS_INVALID_HANDLE)
2105 LDBG (0, "called shutdown: fd %u vlsh %u how %d", fd, vlsh, how);
2107 if (vls_attr (vlsh, VPPCOM_ATTR_SET_SHUT, &how, &flags_len))
2113 if (vls_attr (vlsh, VPPCOM_ATTR_GET_SHUT, &flags, &flags_len))
2119 if (flags == SHUT_RDWR)
2124 LDBG (0, "fd %d: calling libc_shutdown: how %d", fd, how);
2125 rv = libc_shutdown (fd, how);
/*
 * epoll_create1() interposer.
 *
 * When ldp->vcl_needs_real_epoll is set, a kernel epoll fd is created with
 * libc_epoll_create1 (flags), the flag is cleared and the fd is recorded in
 * the current worker's vcl_mq_epfd. The other visible path creates a VLS
 * epoll session with vls_epoll_create() and converts its handle to an fd
 * with ldp_vlsh_to_fd(); `flags` is not passed on that path.
 *
 * NOTE(review): braces and return statements are not part of this excerpt,
 * so the exact boundary between the two paths, and whether the
 * libc_epoll_create1() result is checked before it is stored, should be
 * confirmed against the full file.
 */
2132 epoll_create1 (int flags)
2134 ldp_worker_ctx_t *ldpw = ldp_worker_get_current ();
2138 if ((errno = -ldp_init ()))
2141 if (ldp->vcl_needs_real_epoll)
2143 /* Make sure workers have been allocated */
2146 ldp_alloc_workers ();
/* Fetch the worker again after the allocation call above. */
2147 ldpw = ldp_worker_get_current ();
2149 rv = libc_epoll_create1 (flags);
2150 ldp->vcl_needs_real_epoll = 0;
2151 ldpw->vcl_mq_epfd = rv;
2152 LDBG (0, "created vcl epfd %u", rv);
2156 vlsh = vls_epoll_create ();
2157 if (PREDICT_FALSE (vlsh == VLS_INVALID_HANDLE))
2164 rv = ldp_vlsh_to_fd (vlsh);
2166 LDBG (0, "epoll_create epfd %u vlsh %u", rv, vlsh);
/*
 * epoll_create() interposer: `size` is not used; the call is forwarded to
 * epoll_create1() with flags 0.
 */
2171 epoll_create (int size)
2173 return epoll_create1 (0);
/*
 * epoll_ctl() interposer.
 *
 * errno is loaded with the negated ldp_init() result, then epfd is
 * translated with ldp_fd_to_vlsh():
 *  - epfd has no VLS handle: the request is passed to libc_epoll_ctl()
 *    unchanged.
 *  - fd has a VLS handle: the request goes to vls_epoll_ctl() using the two
 *    handles.
 *  - fd has no VLS handle: the libc epoll fd stored on the VLS epoll session
 *    is fetched with VPPCOM_ATTR_GET_LIBC_EPFD; one is created with
 *    libc_epoll_create1 (EPOLL_CLOEXEC) and stored with
 *    VPPCOM_ATTR_SET_LIBC_EPFD when needed (the exact test is outside this
 *    excerpt), and libc_epoll_ctl() is applied to that fd.
 *
 * NOTE(review): braces, error handling and return statements are not part
 * of this excerpt; confirm the branch layout against the full file.
 */
2177 epoll_ctl (int epfd, int op, int fd, struct epoll_event *event)
2179 vls_handle_t vep_vlsh, vlsh;
2182 if ((errno = -ldp_init ()))
2185 vep_vlsh = ldp_fd_to_vlsh (epfd);
2186 if (PREDICT_FALSE (vep_vlsh == VLS_INVALID_HANDLE))
2188 /* The LDP epoll_create1 always creates VCL epfd's.
2189 * The app should never have a kernel-based epoll fd unless it
2190 * was acquired outside of the LD_PRELOAD process context.
2191 * In any case, if we get one, punt it to libc_epoll_ctl.
 */
2193 LDBG (1, "epfd %d: calling libc_epoll_ctl: op %d, fd %d"
2194 " event %p", epfd, op, fd, event);
2196 rv = libc_epoll_ctl (epfd, op, fd, event);
2200 vlsh = ldp_fd_to_vlsh (fd);
2202 LDBG (0, "epfd %d ep_vlsh %d, fd %u vlsh %d, op %u", epfd, vep_vlsh, fd,
2205 if (vlsh != VLS_INVALID_HANDLE)
/* One argument per conversion: epfd, ep_vlsh, op, vlsh, event. */
2207 LDBG (1, "epfd %d: calling vls_epoll_ctl: ep_vlsh %d op %d, vlsh %u,"
2208 " event %p", epfd, vep_vlsh, op, vlsh, event);
2210 rv = vls_epoll_ctl (vep_vlsh, op, vlsh, event);
2211 if (rv != VPPCOM_OK)
2220 u32 size = sizeof (epfd);
/* Look up the libc epoll fd stored on the VLS epoll session. */
2222 libc_epfd = vls_attr (vep_vlsh, VPPCOM_ATTR_GET_LIBC_EPFD, 0, 0);
2225 LDBG (1, "epfd %d, vep_vlsh %d calling libc_epoll_create1: "
2226 "EPOLL_CLOEXEC", epfd, vep_vlsh);
2228 libc_epfd = libc_epoll_create1 (EPOLL_CLOEXEC);
2235 rv = vls_attr (vep_vlsh, VPPCOM_ATTR_SET_LIBC_EPFD, &libc_epfd,
2244 else if (PREDICT_FALSE (libc_epfd < 0))
2251 LDBG (1, "epfd %d: calling libc_epoll_ctl: libc_epfd %d, op %d, fd %d,"
2252 " event %p", epfd, libc_epfd, op, fd, event);
2254 rv = libc_epoll_ctl (libc_epfd, op, fd, event);
/*
 * Shared implementation of epoll_wait() and epoll_pwait().
 *
 * errno is loaded with the negated ldp_init() result. A NULL events pointer
 * or a timeout below -1 is treated as an error case. If epfd is the current
 * worker's vcl_mq_epfd the call is handed straight to libc_epoll_pwait().
 * Otherwise epfd is translated to a VLS handle and the function alternates
 * between vls_epoll_wait() and libc_epoll_pwait() on the session's libc
 * epoll fd, both with a zero timeout, until the trailing while condition
 * fails: timeout is not -1 and the deadline max_time has been reached.
 *
 * NOTE(review): the loop opening, the handling of rv inside the loop and
 * all return statements are not part of this excerpt; the role of
 * ldpw->epoll_wait_vcl (set to 1 and reset to 0 below) should be confirmed
 * against the full file.
 */
2262 ldp_epoll_pwait (int epfd, struct epoll_event *events, int maxevents,
2263 int timeout, const sigset_t * sigmask)
2265 ldp_worker_ctx_t *ldpw = ldp_worker_get_current ();
2266 double time_to_wait = (double) 0, max_time;
2267 int libc_epfd, rv = 0;
2268 vls_handle_t ep_vlsh;
2270 if ((errno = -ldp_init ()))
2273 if (PREDICT_FALSE (!events || (timeout < -1)))
2279 if (epfd == ldpw->vcl_mq_epfd)
2280 return libc_epoll_pwait (epfd, events, maxevents, timeout, sigmask);
2282 ep_vlsh = ldp_fd_to_vlsh (epfd);
2283 if (PREDICT_FALSE (ep_vlsh == VLS_INVALID_HANDLE))
2285 LDBG (0, "epfd %d: bad ep_vlsh %d!", epfd, ep_vlsh);
/* The per-worker clock is initialized on first use. */
2290 if (PREDICT_FALSE (ldpw->clib_time.init_cpu_time == 0))
2291 clib_time_init (&ldpw->clib_time);
/* timeout / 1000: presumably milliseconds to seconds, matching the unit of
 * clib_time_now() - confirm. A negative timeout yields 0 here. */
2292 time_to_wait = ((timeout >= 0) ? (double) timeout / 1000 : 0);
2293 max_time = clib_time_now (&ldpw->clib_time) + time_to_wait;
2295 libc_epfd = vls_attr (ep_vlsh, VPPCOM_ATTR_GET_LIBC_EPFD, 0, 0);
2296 if (PREDICT_FALSE (libc_epfd < 0))
2303 LDBG (2, "epfd %d: vep_idx %d, libc_epfd %d, events %p, maxevents %d, "
2304 "timeout %d, sigmask %p: time_to_wait %.02f", epfd, ep_vlsh,
2305 libc_epfd, events, maxevents, timeout, sigmask, time_to_wait);
2308 if (!ldpw->epoll_wait_vcl)
/* Zero timeout: the surrounding loop enforces the deadline instead. */
2310 rv = vls_epoll_wait (ep_vlsh, events, maxevents, 0);
2313 ldpw->epoll_wait_vcl = 1;
2324 ldpw->epoll_wait_vcl = 0;
/* Zero timeout here as well; sigmask is only passed to the libc call. */
2328 rv = libc_epoll_pwait (libc_epfd, events, maxevents, 0, sigmask);
2333 while ((timeout == -1) || (clib_time_now (&ldpw->clib_time) < max_time));
/*
 * epoll_pwait() interposer: forwards all arguments, including sigmask,
 * to ldp_epoll_pwait() and returns its result.
 */
2340 epoll_pwait (int epfd, struct epoll_event *events,
2341 int maxevents, int timeout, const sigset_t * sigmask)
2343 return ldp_epoll_pwait (epfd, events, maxevents, timeout, sigmask);
/*
 * epoll_wait() interposer: calls ldp_epoll_pwait() with a NULL sigmask and
 * returns its result.
 */
2347 epoll_wait (int epfd, struct epoll_event *events, int maxevents, int timeout)
2349 return ldp_epoll_pwait (epfd, events, maxevents, timeout, NULL);
/*
 * poll() interposer.
 *
 * The caller's array is split into two worker-local vectors: entries whose
 * fd maps to a VLS handle are appended to ldpw->vcl_poll, all others are
 * copied to ldpw->libc_poll with their index in fds[] kept in
 * ldpw->libc_poll_idxs. Both vectors are polled with a zero timeout
 * (vppcom_poll() and libc_poll()) until the trailing while condition fails,
 * i.e. timeout is non-negative and the deadline max_time has been reached.
 * Afterwards revents are written back into fds[] and the three vectors are
 * reset to length 0 so they can be reused by the next call.
 *
 * NOTE(review): some declarations, the loop opening, the handling of rv and
 * n_revents inside the loop and the return statements are not part of this
 * excerpt; confirm them against the full file.
 */
2353 poll (struct pollfd *fds, nfds_t nfds, int timeout)
2355 ldp_worker_ctx_t *ldpw = ldp_worker_get_current ();
2356 int rv, i, n_revents = 0;
/* nfds_t is an unsigned type that is wider than int on LP64 targets, so it
 * is cast and printed with %lu rather than %d. */
2361 LDBG (3, "fds %p, nfds %lu, timeout %d", fds, (unsigned long) nfds, timeout);
/* The per-worker clock is initialized on first use. */
2363 if (PREDICT_FALSE (ldpw->clib_time.init_cpu_time == 0))
2364 clib_time_init (&ldpw->clib_time);
/* timeout / 1000: presumably milliseconds to seconds, matching the unit of
 * clib_time_now() - confirm. A negative timeout adds nothing. */
2366 max_time = (timeout >= 0) ? (f64) timeout / 1000 : 0;
2367 max_time += clib_time_now (&ldpw->clib_time);
2369 for (i = 0; i < nfds; i++)
2374 vlsh = ldp_fd_to_vlsh (fds[i].fd);
2375 if (vlsh != VLS_INVALID_HANDLE)
/* The fd is negated while the call is in progress and restored in the
 * write-back loop further down. */
2377 fds[i].fd = -fds[i].fd;
2378 vec_add2 (ldpw->vcl_poll, vp, 1);
2380 vp->sh = vlsh_to_sh (vlsh);
2381 vp->events = fds[i].events;
2382 #ifdef __USE_XOPEN2K
/* Requests for POLLRDNORM / POLLWRNORM are also polled as POLLIN / POLLOUT. */
2383 if (fds[i].events & POLLRDNORM)
2384 vp->events |= POLLIN;
2385 if (fds[i].events & POLLWRNORM)
2386 vp->events |= POLLOUT;
2388 vp->revents = fds[i].revents;
/* Entries without a VLS handle are copied for libc, remembering their
 * position in fds[]. */
2392 vec_add1 (ldpw->libc_poll, fds[i]);
2393 vec_add1 (ldpw->libc_poll_idxs, i);
2399 if (vec_len (ldpw->vcl_poll))
/* Zero timeout: the surrounding loop enforces the deadline instead. */
2401 rv = vppcom_poll (ldpw->vcl_poll, vec_len (ldpw->vcl_poll), 0);
2412 if (vec_len (ldpw->libc_poll))
2414 rv = libc_poll (ldpw->libc_poll, vec_len (ldpw->libc_poll), 0);
2427 while ((timeout < 0) || (clib_time_now (&ldpw->clib_time) < max_time));
/* Write the VCL results back and undo the fd negation. */
2431 vec_foreach (vp, ldpw->vcl_poll)
2433 fds[vp->fds_ndx].fd = -fds[vp->fds_ndx].fd;
2434 fds[vp->fds_ndx].revents = vp->revents;
2435 #ifdef __USE_XOPEN2K
/* Report POLLRDNORM / POLLWRNORM only when the caller asked for them. */
2436 if ((fds[vp->fds_ndx].revents & POLLIN) &&
2437 (fds[vp->fds_ndx].events & POLLRDNORM))
2438 fds[vp->fds_ndx].revents |= POLLRDNORM;
2439 if ((fds[vp->fds_ndx].revents & POLLOUT) &&
2440 (fds[vp->fds_ndx].events & POLLWRNORM))
2441 fds[vp->fds_ndx].revents |= POLLWRNORM;
2444 vec_reset_length (ldpw->vcl_poll);
/* Copy the libc results back to their original positions in fds[]. */
2446 for (i = 0; i < vec_len (ldpw->libc_poll); i++)
2448 fds[ldpw->libc_poll_idxs[i]].revents = ldpw->libc_poll[i].revents;
2450 vec_reset_length (ldpw->libc_poll_idxs);
2451 vec_reset_length (ldpw->libc_poll);
/*
 * ppoll() interposer.
 *
 * The visible body loads errno with the negated ldp_init() result and emits
 * an "LDP-TBD" warning; none of the arguments is used on these lines.
 *
 * NOTE(review): this looks like a placeholder; the return statements are
 * not part of this excerpt - confirm what callers receive.
 */
2458 ppoll (struct pollfd *fds, nfds_t nfds,
2459 const struct timespec *timeout, const sigset_t * sigmask)
2461 if ((errno = -ldp_init ()))
2464 clib_warning ("LDP<%d>: LDP-TBD", getpid ());
/*
 * Prototypes for the library load/unload hooks. CONSTRUCTOR_ATTRIBUTE and
 * DESTRUCTOR_ATTRIBUTE expand to __attribute__ ((constructor)) and
 * __attribute__ ((destructor)) when the matching HAVE_*_ATTRIBUTE macro is
 * defined, as it is at the top of this file.
 */
2472 void CONSTRUCTOR_ATTRIBUTE ldp_constructor (void);
2474 void DESTRUCTOR_ATTRIBUTE ldp_destructor (void);
2477 * This function is called when the library is loaded
/*
 * Load hook: runs swrap_constructor() and then ldp_init(). A non-zero
 * ldp_init() result is reported on stderr; otherwise a "done" message is
 * logged with clib_warning() when LDP_DEBUG is greater than 0.
 *
 * NOTE(review): the remainder of the failure branch is not part of this
 * excerpt - confirm what happens after the error message is printed.
 */
2480 ldp_constructor (void)
2482 swrap_constructor ();
2483 if (ldp_init () != 0)
2485 fprintf (stderr, "\nLDP<%d>: ERROR: ldp_constructor: failed!\n",
2489 else if (LDP_DEBUG > 0)
2490 clib_warning ("LDP<%d>: LDP constructor: done!\n", getpid ());
2494 * This function is called when the library is unloaded
/*
 * Unload hook. The completion message is written with fprintf (stderr, ...)
 * rather than clib_warning(), for the reason given in the comment inside
 * the body.
 *
 * NOTE(review): the lines surrounding the swrap_destructor () statement and
 * the condition guarding the fprintf() are not part of this excerpt;
 * confirm whether that call is live code and when the message is printed.
 */
2497 ldp_destructor (void)
2500 swrap_destructor ();
2505 /* Don't use clib_warning() here because that calls writev()
2506 * which will call ldp_init().
2509 fprintf (stderr, "%s:%d: LDP<%d>: LDP destructor: done!\n",
2510 __func__, __LINE__, getpid ());
2515 * fd.io coding-style-patch-verification: ON
2518 * eval: (c-set-style "gnu")