FD.io VPP  v16.12-rc0-308-g931be3a
Vector Packet Processing
input.c
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2015 Cisco and/or its affiliates.
3  * Licensed under the Apache License, Version 2.0 (the "License");
4  * you may not use this file except in compliance with the License.
5  * You may obtain a copy of the License at:
6  *
7  * http://www.apache.org/licenses/LICENSE-2.0
8  *
9  * Unless required by applicable law or agreed to in writing, software
10  * distributed under the License is distributed on an "AS IS" BASIS,
11  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12  * See the License for the specific language governing permissions and
13  * limitations under the License.
14  */
15 /*
16  * input.c: Unix file input
17  *
18  * Copyright (c) 2008 Eliot Dresselhaus
19  *
20  * Permission is hereby granted, free of charge, to any person obtaining
21  * a copy of this software and associated documentation files (the
22  * "Software"), to deal in the Software without restriction, including
23  * without limitation the rights to use, copy, modify, merge, publish,
24  * distribute, sublicense, and/or sell copies of the Software, and to
25  * permit persons to whom the Software is furnished to do so, subject to
26  * the following conditions:
27  *
28  * The above copyright notice and this permission notice shall be
29  * included in all copies or substantial portions of the Software.
30  *
31  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
32  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
33  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
34  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
35  * LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
36  * OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
37  * WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
38  */
39 
40 #include <vlib/vlib.h>
41 #include <vlib/unix/unix.h>
42 #include <signal.h>
43 
44 /* FIXME autoconf */
45 #define HAVE_LINUX_EPOLL
46 
47 #ifdef HAVE_LINUX_EPOLL
48 
49 #include <sys/epoll.h>
50 
51 typedef struct
52 {
53  int epoll_fd;
54  struct epoll_event *epoll_events;
55 
56  /* Statistics. */
60 
62 
63 static void
65 {
66  unix_main_t *um = &unix_main;
68  struct epoll_event e;
69 
70  memset (&e, 0, sizeof (e));
71 
72  e.events = EPOLLIN;
74  e.events |= EPOLLOUT;
76  e.events |= EPOLLET;
77  e.data.u32 = f - um->file_pool;
78 
79  if (epoll_ctl (em->epoll_fd,
80  (update_type == UNIX_FILE_UPDATE_ADD
81  ? EPOLL_CTL_ADD
82  : (update_type == UNIX_FILE_UPDATE_MODIFY
83  ? EPOLL_CTL_MOD
84  : EPOLL_CTL_DEL)), f->file_descriptor, &e) < 0)
85  clib_warning ("epoll_ctl");
86 }
87 
88 static uword
90  vlib_node_runtime_t * node, vlib_frame_t * frame)
91 {
92  unix_main_t *um = &unix_main;
94  struct epoll_event *e;
95  int n_fds_ready;
96 
97  {
98  vlib_node_main_t *nm = &vm->node_main;
100  f64 timeout;
101  int timeout_ms, max_timeout_ms = 10;
102  f64 vector_rate = vlib_last_vectors_per_main_loop (vm);
103 
104  if (t == ~0ULL)
105  {
106  timeout = 10e-3;
107  timeout_ms = max_timeout_ms;
108  }
109  else
110  {
111  timeout =
112  (((i64) t - (i64) clib_cpu_time_now ())
114  /* subtract off some slop time */ - 50e-6;
115  timeout_ms = timeout * 1e3;
116 
117  /* Must be between 1 and 10 ms. */
118  timeout_ms = clib_max (1, timeout_ms);
119  timeout_ms = clib_min (max_timeout_ms, timeout_ms);
120  }
121 
122  /* If we still have input nodes polling (e.g. vnet packet generator)
123  don't sleep. */
124  if (nm->input_node_counts_by_state[VLIB_NODE_STATE_POLLING] > 0)
125  timeout_ms = 0;
126 
127  /*
128  * When busy: don't wait & only epoll for input
129  * every 1024 times through main loop.
130  */
131  if (vector_rate > 1 || vm->api_queue_nonempty)
132  {
133  timeout_ms = 0;
134  node->input_main_loops_per_call = 1024;
135  }
136  else
137  /* We're not busy; go to sleep for a while. */
138  node->input_main_loops_per_call = 0;
139 
140  /* Allow any signal to wakeup our sleep. */
141  {
142  static sigset_t unblock_all_signals;
143  n_fds_ready = epoll_pwait (em->epoll_fd,
144  em->epoll_events,
145  vec_len (em->epoll_events),
146  timeout_ms, &unblock_all_signals);
147 
148  /* This kludge is necessary to run over absurdly old kernels */
149  if (n_fds_ready < 0 && errno == ENOSYS)
150  {
151  n_fds_ready = epoll_wait (em->epoll_fd,
152  em->epoll_events,
153  vec_len (em->epoll_events), timeout_ms);
154  }
155  }
156  }
157 
158  if (n_fds_ready < 0)
159  {
160  if (unix_error_is_fatal (errno))
161  vlib_panic_with_error (vm, clib_error_return_unix (0, "epoll_wait"));
162 
163  /* non fatal error (e.g. EINTR). */
164  return 0;
165  }
166 
167  em->epoll_waits += 1;
168  em->epoll_files_ready += n_fds_ready;
169 
170  for (e = em->epoll_events; e < em->epoll_events + n_fds_ready; e++)
171  {
172  u32 i = e->data.u32;
174  clib_error_t *errors[4];
175  int n_errors = 0;
176 
177  if (PREDICT_TRUE (!(e->events & EPOLLERR)))
178  {
179  if (e->events & EPOLLIN)
180  {
181  errors[n_errors] = f->read_function (f);
182  n_errors += errors[n_errors] != 0;
183  }
184  if (e->events & EPOLLOUT)
185  {
186  errors[n_errors] = f->write_function (f);
187  n_errors += errors[n_errors] != 0;
188  }
189  }
190  else
191  {
192  if (f->error_function)
193  {
194  errors[n_errors] = f->error_function (f);
195  n_errors += errors[n_errors] != 0;
196  }
197  else
198  close (f->file_descriptor);
199  }
200 
201  ASSERT (n_errors < ARRAY_LEN (errors));
202  for (i = 0; i < n_errors; i++)
203  {
204  unix_save_error (um, errors[i]);
205  }
206  }
207 
208  return 0;
209 }
210 
211 /* *INDENT-OFF* */
213  .function = linux_epoll_input,
214  .type = VLIB_NODE_TYPE_PRE_INPUT,
215  .name = "unix-epoll-input",
216 };
217 /* *INDENT-ON* */
218 
219 clib_error_t *
221 {
223  unix_main_t *um = &unix_main;
224 
225  /* Allocate some events. */
227 
228  em->epoll_fd = epoll_create (vec_len (em->epoll_events));
229  if (em->epoll_fd < 0)
230  return clib_error_return_unix (0, "epoll_create");
231 
233 
234  return 0;
235 }
236 
238 
239 #endif /* HAVE_LINUX_EPOLL */
240 
241 static clib_error_t *
243 {
245 }
246 
248 
249 /*
250  * fd.io coding-style-patch-verification: ON
251  *
252  * Local Variables:
253  * eval: (c-set-style "gnu")
254  * End:
255  */
unix_file_t * file_pool
Definition: unix.h:89
sll srl srl sll sra u16x4 i
Definition: vector_sse2.h:343
#define clib_min(x, y)
Definition: clib.h:326
static void vlib_panic_with_error(vlib_main_t *vm, clib_error_t *error)
Definition: main.h:227
u32 flags
Definition: unix.h:54
unix_file_function_t * read_function
Definition: unix.h:62
#define PREDICT_TRUE(x)
Definition: clib.h:98
static uword linux_epoll_input(vlib_main_t *vm, vlib_node_runtime_t *node, vlib_frame_t *frame)
Definition: input.c:89
u64 cpu_time_next_process_ready
Definition: node.h:669
static u64 clib_cpu_time_now(void)
Definition: time.h:73
clib_time_t clib_time
Definition: main.h:62
static u32 vlib_last_vectors_per_main_loop(vlib_main_t *vm)
Definition: main.h:255
u32 input_main_loops_per_call
Definition: node.h:445
#define VLIB_INIT_FUNCTION(x)
Definition: init.h:111
static vlib_node_registration_t linux_epoll_input_node
(constructor) VLIB_REGISTER_NODE (linux_epoll_input_node)
Definition: input.c:212
#define clib_warning(format, args...)
Definition: error.h:59
unsigned long u64
Definition: types.h:89
#define vec_resize(V, N)
Resize a vector (no header, unspecified alignment) Add N elements to end of given vector V...
Definition: vec.h:201
#define vlib_call_init_function(vm, x)
Definition: init.h:161
#define pool_elt_at_index(p, i)
Returns pointer to element at given index.
Definition: pool.h:369
u32 file_descriptor
Definition: unix.h:52
static void unix_save_error(unix_main_t *um, clib_error_t *error)
Definition: unix.h:169
unix_file_function_t * error_function
Definition: unix.h:62
#define UNIX_FILE_EVENT_EDGE_TRIGGERED
Definition: unix.h:56
#define clib_error_return_unix(e, args...)
Definition: error.h:114
#define VLIB_FRAME_SIZE
Definition: node.h:328
f64 seconds_per_clock
Definition: time.h:57
long i64
Definition: types.h:82
clib_error_t * linux_epoll_input_init(vlib_main_t *vm)
Definition: input.c:220
static clib_error_t * unix_input_init(vlib_main_t *vm)
Definition: input.c:242
#define ARRAY_LEN(x)
Definition: clib.h:59
#define ASSERT(truth)
static word unix_error_is_fatal(word error)
Definition: error.h:130
unsigned int u32
Definition: types.h:88
unix_main_t unix_main
Definition: main.c:57
#define clib_max(x, y)
Definition: clib.h:319
u64 uword
Definition: types.h:112
struct epoll_event * epoll_events
Definition: input.c:54
static linux_epoll_main_t linux_epoll_main
Definition: input.c:61
void(* file_update)(unix_file_t *file, unix_file_update_type_t update_type)
Definition: unix.h:94
unix_file_function_t * write_function
Definition: unix.h:62
#define UNIX_FILE_DATA_AVAILABLE_TO_WRITE
Definition: unix.h:55
#define vec_len(v)
Number of elements in vector (rvalue-only, NULL tolerant)
double f64
Definition: types.h:142
u32 input_node_counts_by_state[VLIB_N_NODE_STATE]
Definition: node.h:685
vlib_node_main_t node_main
Definition: main.h:115
Definition: unix.h:49
u64 epoll_files_ready
Definition: input.c:57
volatile u32 api_queue_nonempty
Definition: main.h:173
#define VLIB_REGISTER_NODE(x,...)
Definition: node.h:143
static void linux_epoll_file_update(unix_file_t *f, unix_file_update_type_t update_type)
Definition: input.c:64
unix_file_update_type_t
Definition: unix.h:71