2 * Copyright (c) 2015 Cisco and/or its affiliates.
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at:
7 * http://www.apache.org/licenses/LICENSE-2.0
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
16 * input.c: Unix file input
18 * Copyright (c) 2008 Eliot Dresselhaus
20 * Permission is hereby granted, free of charge, to any person obtaining
21 * a copy of this software and associated documentation files (the
22 * "Software"), to deal in the Software without restriction, including
23 * without limitation the rights to use, copy, modify, merge, publish,
24 * distribute, sublicense, and/or sell copies of the Software, and to
25 * permit persons to whom the Software is furnished to do so, subject to
26 * the following conditions:
28 * The above copyright notice and this permission notice shall be
29 * included in all copies or substantial portions of the Software.
31 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
32 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
33 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
34 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
35 * LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
36 * OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
37 * WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
40 #include <vlib/vlib.h>
41 #include <vlib/unix/unix.h>
45 #define HAVE_LINUX_EPOLL
47 #ifdef HAVE_LINUX_EPOLL
49 #include <sys/epoll.h>
/* NOTE(review): the two member lines below look like the surviving part of
 * the linux_epoll_main_t type definition; the lines that open and close the
 * type are not present in this view, so the full member list cannot be
 * confirmed from here.
 *
 *   epoll_events      - event array; linux_epoll_input_init calls vec_resize
 *                       on it with VLIB_FRAME_SIZE, and its vec_len is the
 *                       event count handed to epoll_pwait / epoll_wait.
 *   epoll_files_ready - statistic; linux_epoll_input adds the number of
 *                       ready descriptors to it after every successful wait.
 *
 * linux_epoll_main is the file-scope (static) instance that the functions
 * in this file reach through a local pointer named em. */
53 struct epoll_event * epoll_events;
56 u64 epoll_files_ready;
60 static linux_epoll_main_t linux_epoll_main;
/* Applies a change in the registration of file f to the epoll descriptor
 * held in linux_epoll_main.
 *
 * linux_epoll_input_init stores this function in um->file_update.
 *
 *   f           - file being updated.  Its index inside um->file_pool
 *                 (f - um->file_pool) is stored in the event user data
 *                 (e.data.u32); linux_epoll_input uses that index to find
 *                 the file again when an event fires.
 *   update_type - compared against UNIX_FILE_UPDATE_ADD and
 *                 UNIX_FILE_UPDATE_MODIFY to choose the epoll_ctl operation.
 *
 * The event structure is zeroed with memset before it is filled in.
 * f->flags is tested for UNIX_FILE_DATA_AVAILABLE_TO_WRITE and
 * UNIX_FILE_EVENT_EDGE_TRIGGERED.
 *
 * NOTE(review): the return type, the braces, the declaration of e, the
 * statements guarded by the two flag tests, the epoll_ctl operation
 * constants and the remaining epoll_ctl arguments are missing from this
 * view.  Presumably the flag tests add EPOLLOUT and EPOLLET to e.events and
 * the clib_warning call runs when epoll_ctl fails - confirm against the
 * complete file.
 * NOTE(review): clib_warning is given only a fixed string here, so errno
 * does not appear to be part of the message - verify whether an
 * errno-aware warning helper should be used instead. */
63 linux_epoll_file_update (unix_file_t * f,
64 unix_file_update_type_t update_type)
66 unix_main_t * um = &unix_main;
67 linux_epoll_main_t * em = &linux_epoll_main;
70 memset (&e, 0, sizeof (e));
73 if (f->flags & UNIX_FILE_DATA_AVAILABLE_TO_WRITE)
75 if (f->flags & UNIX_FILE_EVENT_EDGE_TRIGGERED)
77 e.data.u32 = f - um->file_pool;
79 if (epoll_ctl (em->epoll_fd,
80 (update_type == UNIX_FILE_UPDATE_ADD
82 : (update_type == UNIX_FILE_UPDATE_MODIFY
87 clib_warning ("epoll_ctl");
/* Node function of the epoll input node (see the VLIB_REGISTER_NODE entry
 * that points .function at it): waits on the epoll descriptor and hands
 * every ready file to its callbacks.
 *
 *   vm   - vlib main; supplies node_main, clib_time.seconds_per_clock and
 *          api_queue_nonempty, and is passed to vlib_panic_with_error.
 *   node - runtime of this node; input_main_loops_per_call is written here.
 *   NOTE(review): the line carrying the remaining parameter(s), the return
 *   type and the return statements are missing from this view.
 *
 * What the visible lines do, in order:
 *
 *  1. Timeout.  timeout is the distance from the current cpu time
 *     (clib_cpu_time_now) to nm->cpu_time_next_process_ready, scaled by
 *     seconds_per_clock, minus 50e-6 seconds of slop.  timeout_ms is that
 *     value times 1e3, clamped to at least 1 and at most max_timeout_ms
 *     (10).  Another path assigns max_timeout_ms directly; its guarding
 *     condition is not visible.
 *
 *  2. Load adaptation.  When vector_rate
 *     (vlib_last_vectors_per_main_loop) is above 1 or vm->api_queue_nonempty
 *     is set, input_main_loops_per_call becomes 1024; the other visible
 *     assignment sets it to 0.  There is also a test on the count of input
 *     nodes in VLIB_NODE_STATE_POLLING whose body is missing.
 *     NOTE(review): presumably both the busy case and the polling case
 *     force timeout_ms to 0 - confirm.
 *
 *  3. Wait.  epoll_pwait is called on em->epoll_fd for up to
 *     vec_len (em->epoll_events) events, with the address of a
 *     function-local static sigset_t that no visible line writes to.  If
 *     it fails with errno ENOSYS the code retries with epoll_wait.
 *
 *  4. Errors.  When unix_error_is_fatal (errno) holds, the function panics
 *     through vlib_panic_with_error with a unix error built from the
 *     string epoll_wait.  The existing comment marks the remaining case as
 *     non fatal (for example EINTR).
 *     NOTE(review): the enclosing test, presumably n_fds_ready < 0, is
 *     missing from this view.
 *
 *  5. Statistics.  em->epoll_waits is incremented and n_fds_ready is added
 *     to em->epoll_files_ready.
 *
 *  6. Dispatch.  For each of the first n_fds_ready entries of
 *     em->epoll_events the file is fetched from um->file_pool by index i.
 *     If EPOLLERR is not set, EPOLLIN calls f->read_function and EPOLLOUT
 *     calls f->write_function.  f->error_function is called when it is
 *     non-null, and close (f->file_descriptor) also appears.
 *     NOTE(review): the else lines are missing; presumably error_function
 *     and close form the EPOLLERR branch, with close as the fallback when
 *     no error_function is installed - confirm.
 *     Each callback result is written to errors[n_errors], and n_errors
 *     advances only when that result is non-null.  The ASSERT checks
 *     n_errors against ARRAY_LEN (errors), which is 4, after the callbacks
 *     have run.  Every collected error is then passed to unix_save_error.
 *     NOTE(review): the declarations of i and n_errors are missing;
 *     presumably i is read from e->data.u32, the slot that
 *     linux_epoll_file_update fills with the pool index - confirm. */
91 linux_epoll_input (vlib_main_t * vm,
92 vlib_node_runtime_t * node,
95 unix_main_t * um = &unix_main;
96 linux_epoll_main_t * em = &linux_epoll_main;
97 struct epoll_event * e;
101 vlib_node_main_t * nm = &vm->node_main;
102 u64 t = nm->cpu_time_next_process_ready;
104 int timeout_ms, max_timeout_ms = 10;
105 f64 vector_rate = vlib_last_vectors_per_main_loop (vm);
110 timeout_ms = max_timeout_ms;
115 (((i64) t - (i64) clib_cpu_time_now ())
116 * vm->clib_time.seconds_per_clock)
117 /* subtract off some slop time */ - 50e-6;
118 timeout_ms = timeout * 1e3;
120 /* Must be between 1 and 10 ms. */
121 timeout_ms = clib_max (1, timeout_ms);
122 timeout_ms = clib_min (max_timeout_ms, timeout_ms);
125 /* If we still have input nodes polling (e.g. vnet packet generator)
127 if (nm->input_node_counts_by_state[VLIB_NODE_STATE_POLLING] > 0)
131 * When busy: don't wait & only epoll for input
132 * every 1024 times through main loop.
134 if (vector_rate > 1 || vm->api_queue_nonempty)
137 node->input_main_loops_per_call = 1024;
140 /* We're not busy; go to sleep for a while. */
141 node->input_main_loops_per_call = 0;
143 /* Allow any signal to wakeup our sleep. */
145 static sigset_t unblock_all_signals;
146 n_fds_ready = epoll_pwait (em->epoll_fd,
148 vec_len (em->epoll_events),
150 &unblock_all_signals);
152 /* This kludge is necessary to run over absurdly old kernels */
153 if (n_fds_ready < 0 && errno == ENOSYS)
155 n_fds_ready = epoll_wait (em->epoll_fd,
157 vec_len (em->epoll_events),
165 if (unix_error_is_fatal (errno))
166 vlib_panic_with_error (vm, clib_error_return_unix (0, "epoll_wait"));
168 /* non fatal error (e.g. EINTR). */
172 em->epoll_waits += 1;
173 em->epoll_files_ready += n_fds_ready;
175 for (e = em->epoll_events; e < em->epoll_events + n_fds_ready; e++)
178 unix_file_t * f = pool_elt_at_index (um->file_pool, i);
179 clib_error_t * errors[4];
182 if (PREDICT_TRUE (! (e->events & EPOLLERR)))
184 if (e->events & EPOLLIN)
186 errors[n_errors] = f->read_function (f);
187 n_errors += errors[n_errors] != 0;
189 if (e->events & EPOLLOUT)
191 errors[n_errors] = f->write_function (f);
192 n_errors += errors[n_errors] != 0;
197 if (f->error_function)
199 errors[n_errors] = f->error_function (f);
200 n_errors += errors[n_errors] != 0;
203 close(f->file_descriptor);
206 ASSERT (n_errors < ARRAY_LEN (errors));
207 for (i = 0; i < n_errors; i++)
209 unix_save_error (um, errors[i]);
/* Node registration for the epoll poller: a static node whose function is
 * linux_epoll_input, whose type is VLIB_NODE_TYPE_PRE_INPUT and whose name
 * is unix-epoll-input.
 * NOTE(review): the line that closes this initializer is not present in
 * this view. */
216 VLIB_REGISTER_NODE (linux_epoll_input_node,static) = {
217 .function = linux_epoll_input,
218 .type = VLIB_NODE_TYPE_PRE_INPUT,
219 .name = "unix-epoll-input",
/* Init function for the epoll input machinery.
 *
 * Steps visible here:
 *   - calls vec_resize on em->epoll_events with VLIB_FRAME_SIZE, so the
 *     event array is allocated before the first wait;
 *   - creates the epoll descriptor with epoll_create, passing the length of
 *     that array, and stores it in em->epoll_fd;
 *   - installs linux_epoll_file_update as um->file_update.
 *
 *   vm - vlib main; not referenced by any line visible in this view.
 *
 * Returns a unix error built by clib_error_return_unix when epoll_create
 * yields a negative descriptor.
 * NOTE(review): the return type, the braces and the success return are
 * missing from this view; presumably success returns 0 (no error) - confirm.
 * NOTE(review): per epoll_create(2) the size argument is only a hint on
 * current Linux kernels and merely has to be greater than zero.
 *
 * The VLIB_INIT_FUNCTION line names this function; presumably that adds it
 * to the set of init functions run at startup - verify against the macro. */
223 linux_epoll_input_init (vlib_main_t * vm)
225 linux_epoll_main_t * em = &linux_epoll_main;
226 unix_main_t * um = &unix_main;
228 /* Allocate some events. */
229 vec_resize (em->epoll_events, VLIB_FRAME_SIZE);
231 em->epoll_fd = epoll_create (vec_len (em->epoll_events));
232 if (em->epoll_fd < 0)
233 return clib_error_return_unix (0, "epoll_create");
235 um->file_update = linux_epoll_file_update;
240 VLIB_INIT_FUNCTION (linux_epoll_input_init);
242 #endif /* HAVE_LINUX_EPOLL */
/* Init function for Unix input as a whole: it runs linux_epoll_input_init
 * through vlib_call_init_function and returns whatever that call yields.
 *
 *   vm - vlib main, forwarded to vlib_call_init_function.
 *
 * NOTE(review): this function sits after the #endif that closes the
 * HAVE_LINUX_EPOLL conditional, yet it names linux_epoll_input_init, which
 * is defined inside that conditional.  The file defines HAVE_LINUX_EPOLL
 * unconditionally, so this builds today, but it would stop building if the
 * define were ever removed.
 * NOTE(review): the braces of the function body are missing from this
 * view. */
244 static clib_error_t *
245 unix_input_init (vlib_main_t * vm)
247 return vlib_call_init_function (vm, linux_epoll_input_init);
250 VLIB_INIT_FUNCTION (unix_input_init);