|
1 /* |
|
2 * Copyright 2000-2009 Niels Provos <provos@citi.umich.edu> |
|
3 * Copyright 2009-2012 Niels Provos and Nick Mathewson |
|
4 * |
|
5 * Redistribution and use in source and binary forms, with or without |
|
6 * modification, are permitted provided that the following conditions |
|
7 * are met: |
|
8 * 1. Redistributions of source code must retain the above copyright |
|
9 * notice, this list of conditions and the following disclaimer. |
|
10 * 2. Redistributions in binary form must reproduce the above copyright |
|
11 * notice, this list of conditions and the following disclaimer in the |
|
12 * documentation and/or other materials provided with the distribution. |
|
13 * 3. The name of the author may not be used to endorse or promote products |
|
14 * derived from this software without specific prior written permission. |
|
15 * |
|
16 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR |
|
17 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES |
|
18 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. |
|
19 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, |
|
20 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT |
|
21 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, |
|
22 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY |
|
23 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
|
24 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF |
|
25 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
|
26 */ |
|
27 #include "event2/event-config.h" |
|
28 |
|
29 #include <sys/types.h> |
|
30 #include <sys/resource.h> |
|
31 #ifdef _EVENT_HAVE_SYS_TIME_H |
|
32 #include <sys/time.h> |
|
33 #endif |
|
34 #include <sys/queue.h> |
|
35 #include <sys/devpoll.h> |
|
36 #include <signal.h> |
|
37 #include <stdio.h> |
|
38 #include <stdlib.h> |
|
39 #include <string.h> |
|
40 #include <unistd.h> |
|
41 #include <fcntl.h> |
|
42 #include <errno.h> |
|
43 |
|
44 #include "event2/event.h" |
|
45 #include "event2/event_struct.h" |
|
46 #include "event2/thread.h" |
|
47 #include "event-internal.h" |
|
48 #include "evsignal-internal.h" |
|
49 #include "log-internal.h" |
|
50 #include "evmap-internal.h" |
|
51 #include "evthread-internal.h" |
|
52 |
|
/* Per-base bookkeeping for the /dev/poll backend. */
struct devpollop {
	/* Result array handed to the DP_POLL ioctl. */
	struct pollfd *events;
	/* Number of entries allocated for events (and for changes). */
	int nevents;
	/* File descriptor of the opened /dev/poll device. */
	int dpfd;
	/* Queued change records that have not been written to dpfd yet. */
	struct pollfd *changes;
	/* Number of records currently queued in changes. */
	int nchanges;
};
|
60 |
|
/* Forward declarations of the backend entry points referenced by devpollops. */
static void *devpoll_init(struct event_base *base);
static int devpoll_add(struct event_base *base, int fd, short old,
    short events, void *p);
static int devpoll_del(struct event_base *base, int fd, short old,
    short events, void *p);
static int devpoll_dispatch(struct event_base *base, struct timeval *tv);
static void devpoll_dealloc(struct event_base *base);
|
66 |
|
67 const struct eventop devpollops = { |
|
68 "devpoll", |
|
69 devpoll_init, |
|
70 devpoll_add, |
|
71 devpoll_del, |
|
72 devpoll_dispatch, |
|
73 devpoll_dealloc, |
|
74 1, /* need reinit */ |
|
75 EV_FEATURE_FDS|EV_FEATURE_O1, |
|
76 0 |
|
77 }; |
|
78 |
|
/*
 * Fallback size for the event and change arrays, used by devpoll_init()
 * when RLIMIT_NOFILE cannot be queried or is reported as unlimited.
 */
#define NEVENT 32000
|
80 |
|
81 static int |
|
82 devpoll_commit(struct devpollop *devpollop) |
|
83 { |
|
84 /* |
|
85 * Due to a bug in Solaris, we have to use pwrite with an offset of 0. |
|
86 * Write is limited to 2GB of data, until it will fail. |
|
87 */ |
|
88 if (pwrite(devpollop->dpfd, devpollop->changes, |
|
89 sizeof(struct pollfd) * devpollop->nchanges, 0) == -1) |
|
90 return (-1); |
|
91 |
|
92 devpollop->nchanges = 0; |
|
93 return (0); |
|
94 } |
|
95 |
|
96 static int |
|
97 devpoll_queue(struct devpollop *devpollop, int fd, int events) { |
|
98 struct pollfd *pfd; |
|
99 |
|
100 if (devpollop->nchanges >= devpollop->nevents) { |
|
101 /* |
|
102 * Change buffer is full, must commit it to /dev/poll before |
|
103 * adding more |
|
104 */ |
|
105 if (devpoll_commit(devpollop) != 0) |
|
106 return (-1); |
|
107 } |
|
108 |
|
109 pfd = &devpollop->changes[devpollop->nchanges++]; |
|
110 pfd->fd = fd; |
|
111 pfd->events = events; |
|
112 pfd->revents = 0; |
|
113 |
|
114 return (0); |
|
115 } |
|
116 |
|
117 static void * |
|
118 devpoll_init(struct event_base *base) |
|
119 { |
|
120 int dpfd, nfiles = NEVENT; |
|
121 struct rlimit rl; |
|
122 struct devpollop *devpollop; |
|
123 |
|
124 if (!(devpollop = mm_calloc(1, sizeof(struct devpollop)))) |
|
125 return (NULL); |
|
126 |
|
127 if (getrlimit(RLIMIT_NOFILE, &rl) == 0 && |
|
128 rl.rlim_cur != RLIM_INFINITY) |
|
129 nfiles = rl.rlim_cur; |
|
130 |
|
131 /* Initialize the kernel queue */ |
|
132 if ((dpfd = evutil_open_closeonexec("/dev/poll", O_RDWR, 0)) == -1) { |
|
133 event_warn("open: /dev/poll"); |
|
134 mm_free(devpollop); |
|
135 return (NULL); |
|
136 } |
|
137 |
|
138 devpollop->dpfd = dpfd; |
|
139 |
|
140 /* Initialize fields */ |
|
141 /* FIXME: allocating 'nfiles' worth of space here can be |
|
142 * expensive and unnecessary. See how epoll.c does it instead. */ |
|
143 devpollop->events = mm_calloc(nfiles, sizeof(struct pollfd)); |
|
144 if (devpollop->events == NULL) { |
|
145 mm_free(devpollop); |
|
146 close(dpfd); |
|
147 return (NULL); |
|
148 } |
|
149 devpollop->nevents = nfiles; |
|
150 |
|
151 devpollop->changes = mm_calloc(nfiles, sizeof(struct pollfd)); |
|
152 if (devpollop->changes == NULL) { |
|
153 mm_free(devpollop->events); |
|
154 mm_free(devpollop); |
|
155 close(dpfd); |
|
156 return (NULL); |
|
157 } |
|
158 |
|
159 evsig_init(base); |
|
160 |
|
161 return (devpollop); |
|
162 } |
|
163 |
|
164 static int |
|
165 devpoll_dispatch(struct event_base *base, struct timeval *tv) |
|
166 { |
|
167 struct devpollop *devpollop = base->evbase; |
|
168 struct pollfd *events = devpollop->events; |
|
169 struct dvpoll dvp; |
|
170 int i, res, timeout = -1; |
|
171 |
|
172 if (devpollop->nchanges) |
|
173 devpoll_commit(devpollop); |
|
174 |
|
175 if (tv != NULL) |
|
176 timeout = tv->tv_sec * 1000 + (tv->tv_usec + 999) / 1000; |
|
177 |
|
178 dvp.dp_fds = devpollop->events; |
|
179 dvp.dp_nfds = devpollop->nevents; |
|
180 dvp.dp_timeout = timeout; |
|
181 |
|
182 EVBASE_RELEASE_LOCK(base, th_base_lock); |
|
183 |
|
184 res = ioctl(devpollop->dpfd, DP_POLL, &dvp); |
|
185 |
|
186 EVBASE_ACQUIRE_LOCK(base, th_base_lock); |
|
187 |
|
188 if (res == -1) { |
|
189 if (errno != EINTR) { |
|
190 event_warn("ioctl: DP_POLL"); |
|
191 return (-1); |
|
192 } |
|
193 |
|
194 return (0); |
|
195 } |
|
196 |
|
197 event_debug(("%s: devpoll_wait reports %d", __func__, res)); |
|
198 |
|
199 for (i = 0; i < res; i++) { |
|
200 int which = 0; |
|
201 int what = events[i].revents; |
|
202 |
|
203 if (what & POLLHUP) |
|
204 what |= POLLIN | POLLOUT; |
|
205 else if (what & POLLERR) |
|
206 what |= POLLIN | POLLOUT; |
|
207 |
|
208 if (what & POLLIN) |
|
209 which |= EV_READ; |
|
210 if (what & POLLOUT) |
|
211 which |= EV_WRITE; |
|
212 |
|
213 if (!which) |
|
214 continue; |
|
215 |
|
216 /* XXX(niels): not sure if this works for devpoll */ |
|
217 evmap_io_active(base, events[i].fd, which); |
|
218 } |
|
219 |
|
220 return (0); |
|
221 } |
|
222 |
|
223 |
|
224 static int |
|
225 devpoll_add(struct event_base *base, int fd, short old, short events, void *p) |
|
226 { |
|
227 struct devpollop *devpollop = base->evbase; |
|
228 int res; |
|
229 (void)p; |
|
230 |
|
231 /* |
|
232 * It's not necessary to OR the existing read/write events that we |
|
233 * are currently interested in with the new event we are adding. |
|
234 * The /dev/poll driver ORs any new events with the existing events |
|
235 * that it has cached for the fd. |
|
236 */ |
|
237 |
|
238 res = 0; |
|
239 if (events & EV_READ) |
|
240 res |= POLLIN; |
|
241 if (events & EV_WRITE) |
|
242 res |= POLLOUT; |
|
243 |
|
244 if (devpoll_queue(devpollop, fd, res) != 0) |
|
245 return (-1); |
|
246 |
|
247 return (0); |
|
248 } |
|
249 |
|
250 static int |
|
251 devpoll_del(struct event_base *base, int fd, short old, short events, void *p) |
|
252 { |
|
253 struct devpollop *devpollop = base->evbase; |
|
254 int res; |
|
255 (void)p; |
|
256 |
|
257 res = 0; |
|
258 if (events & EV_READ) |
|
259 res |= POLLIN; |
|
260 if (events & EV_WRITE) |
|
261 res |= POLLOUT; |
|
262 |
|
263 /* |
|
264 * The only way to remove an fd from the /dev/poll monitored set is |
|
265 * to use POLLREMOVE by itself. This removes ALL events for the fd |
|
266 * provided so if we care about two events and are only removing one |
|
267 * we must re-add the other event after POLLREMOVE. |
|
268 */ |
|
269 |
|
270 if (devpoll_queue(devpollop, fd, POLLREMOVE) != 0) |
|
271 return (-1); |
|
272 |
|
273 if ((res & (POLLIN|POLLOUT)) != (POLLIN|POLLOUT)) { |
|
274 /* |
|
275 * We're not deleting all events, so we must resubmit the |
|
276 * event that we are still interested in if one exists. |
|
277 */ |
|
278 |
|
279 if ((res & POLLIN) && (old & EV_WRITE)) { |
|
280 /* Deleting read, still care about write */ |
|
281 devpoll_queue(devpollop, fd, POLLOUT); |
|
282 } else if ((res & POLLOUT) && (old & EV_READ)) { |
|
283 /* Deleting write, still care about read */ |
|
284 devpoll_queue(devpollop, fd, POLLIN); |
|
285 } |
|
286 } |
|
287 |
|
288 return (0); |
|
289 } |
|
290 |
|
291 static void |
|
292 devpoll_dealloc(struct event_base *base) |
|
293 { |
|
294 struct devpollop *devpollop = base->evbase; |
|
295 |
|
296 evsig_dealloc(base); |
|
297 if (devpollop->events) |
|
298 mm_free(devpollop->events); |
|
299 if (devpollop->changes) |
|
300 mm_free(devpollop->changes); |
|
301 if (devpollop->dpfd >= 0) |
|
302 close(devpollop->dpfd); |
|
303 |
|
304 memset(devpollop, 0, sizeof(struct devpollop)); |
|
305 mm_free(devpollop); |
|
306 } |