1 /* 2 * Submitted by David Pacheco (dp.spambait (at) gmail.com) 3 * 4 * Redistribution and use in source and binary forms, with or without 5 * modification, are permitted provided that the following conditions 6 * are met: 7 * 1. Redistributions of source code must retain the above copyright 8 * notice, this list of conditions and the following disclaimer. 9 * 2. Redistributions in binary form must reproduce the above copyright 10 * notice, this list of conditions and the following disclaimer in the 11 * documentation and/or other materials provided with the distribution. 12 * 3. The name of the author may not be used to endorse or promote products 13 * derived from this software without specific prior written permission. 14 * 15 * THIS SOFTWARE IS PROVIDED BY SUN MICROSYSTEMS, INC. ``AS IS'' AND ANY 16 * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED 17 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE 18 * DISCLAIMED. IN NO EVENT SHALL SUN MICROSYSTEMS, INC. BE LIABLE FOR ANY 19 * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES 20 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; 21 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND 22 * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 23 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS 24 * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 25 */ 26 27 /* 28 * Copyright (c) 2007 Sun Microsystems. All rights reserved. 29 * Use is subject to license terms. 30 */ 31 32 /* 33 * evport.c: event backend using Solaris 10 event ports. See port_create(3C). 34 * This implementation is loosely modeled after the one used for select(2) (in 35 * select.c). 36 * 37 * The outstanding events are tracked in a data structure called evport_data. 38 * Each entry in the ed_fds array corresponds to a file descriptor, and contains 39 * pointers to the read and write events that correspond to that fd. (That is, 40 * when the file is readable, the "read" event should handle it, etc.) 41 * 42 * evport_add and evport_del update this data structure. evport_dispatch uses it 43 * to determine where to callback when an event occurs (which it gets from 44 * port_getn). 45 * 46 * Helper functions are used: grow() grows the file descriptor array as 47 * necessary when large fd's come in. reassociate() takes care of maintaining 48 * the proper file-descriptor/event-port associations. 49 * 50 * As in the select(2) implementation, signals are handled by evsignal. 51 */ 52 53 #ifdef HAVE_CONFIG_H 54 #include "config.h" 55 #endif 56 57 #include <sys/time.h> 58 #include <assert.h> 59 #include <sys/queue.h> 60 #include <errno.h> 61 #include <poll.h> 62 #include <port.h> 63 #include <signal.h> 64 #include <stdio.h> 65 #include <stdlib.h> 66 #include <string.h> 67 #include <time.h> 68 #include <unistd.h> 69 #ifdef CHECK_INVARIANTS 70 #include <assert.h> 71 #endif 72 73 #include "event.h" 74 #include "event-internal.h" 75 #include "log.h" 76 #include "evsignal.h" 77 78 79 /* 80 * Default value for ed_nevents, which is the maximum file descriptor number we 81 * can handle. If an event comes in for a file descriptor F > nevents, we will 82 * grow the array of file descriptors, doubling its size. 83 */ 84 #define DEFAULT_NFDS 16 85 86 87 /* 88 * EVENTS_PER_GETN is the maximum number of events to retrieve from port_getn on 89 * any particular call. You can speed things up by increasing this, but it will 90 * (obviously) require more memory. 91 */ 92 #define EVENTS_PER_GETN 8 93 94 /* 95 * Per-file-descriptor information about what events we're subscribed to. These 96 * fields are NULL if no event is subscribed to either of them. 97 */ 98 99 struct fd_info { 100 struct event* fdi_revt; /* the event responsible for the "read" */ 101 struct event* fdi_wevt; /* the event responsible for the "write" */ 102 }; 103 104 #define FDI_HAS_READ(fdi) ((fdi)->fdi_revt != NULL) 105 #define FDI_HAS_WRITE(fdi) ((fdi)->fdi_wevt != NULL) 106 #define FDI_HAS_EVENTS(fdi) (FDI_HAS_READ(fdi) || FDI_HAS_WRITE(fdi)) 107 #define FDI_TO_SYSEVENTS(fdi) (FDI_HAS_READ(fdi) ? POLLIN : 0) | \ 108 (FDI_HAS_WRITE(fdi) ? POLLOUT : 0) 109 110 struct evport_data { 111 int ed_port; /* event port for system events */ 112 int ed_nevents; /* number of allocated fdi's */ 113 struct fd_info *ed_fds; /* allocated fdi table */ 114 /* fdi's that we need to reassoc */ 115 int ed_pending[EVENTS_PER_GETN]; /* fd's with pending events */ 116 }; 117 118 static void* evport_init (struct event_base *); 119 static int evport_add (void *, struct event *); 120 static int evport_del (void *, struct event *); 121 static int evport_dispatch (struct event_base *, void *, struct timeval *); 122 static void evport_dealloc (struct event_base *, void *); 123 124 const struct eventop evportops = { 125 "evport", 126 evport_init, 127 evport_add, 128 evport_del, 129 evport_dispatch, 130 evport_dealloc, 131 1 /* need reinit */ 132 }; 133 134 /* 135 * Initialize the event port implementation. 136 */ 137 138 static void* 139 evport_init(struct event_base *base) 140 { 141 struct evport_data *evpd; 142 int i; 143 /* 144 * Disable event ports when this environment variable is set 145 */ 146 if (evutil_getenv("EVENT_NOEVPORT")) 147 return (NULL); 148 149 if (!(evpd = calloc(1, sizeof(struct evport_data)))) 150 return (NULL); 151 152 if ((evpd->ed_port = port_create()) == -1) { 153 free(evpd); 154 return (NULL); 155 } 156 157 /* 158 * Initialize file descriptor structure 159 */ 160 evpd->ed_fds = calloc(DEFAULT_NFDS, sizeof(struct fd_info)); 161 if (evpd->ed_fds == NULL) { 162 close(evpd->ed_port); 163 free(evpd); 164 return (NULL); 165 } 166 evpd->ed_nevents = DEFAULT_NFDS; 167 for (i = 0; i < EVENTS_PER_GETN; i++) 168 evpd->ed_pending[i] = -1; 169 170 evsignal_init(base); 171 172 return (evpd); 173 } 174 175 #ifdef CHECK_INVARIANTS 176 /* 177 * Checks some basic properties about the evport_data structure. Because it 178 * checks all file descriptors, this function can be expensive when the maximum 179 * file descriptor ever used is rather large. 180 */ 181 182 static void 183 check_evportop(struct evport_data *evpd) 184 { 185 assert(evpd); 186 assert(evpd->ed_nevents > 0); 187 assert(evpd->ed_port > 0); 188 assert(evpd->ed_fds > 0); 189 190 /* 191 * Verify the integrity of the fd_info struct as well as the events to 192 * which it points (at least, that they're valid references and correct 193 * for their position in the structure). 194 */ 195 int i; 196 for (i = 0; i < evpd->ed_nevents; ++i) { 197 struct event *ev; 198 struct fd_info *fdi; 199 200 fdi = &evpd->ed_fds[i]; 201 if ((ev = fdi->fdi_revt) != NULL) { 202 assert(ev->ev_fd == i); 203 } 204 if ((ev = fdi->fdi_wevt) != NULL) { 205 assert(ev->ev_fd == i); 206 } 207 } 208 } 209 210 /* 211 * Verifies very basic integrity of a given port_event. 212 */ 213 static void 214 check_event(port_event_t* pevt) 215 { 216 /* 217 * We've only registered for PORT_SOURCE_FD events. The only 218 * other thing we can legitimately receive is PORT_SOURCE_ALERT, 219 * but since we're not using port_alert either, we can assume 220 * PORT_SOURCE_FD. 221 */ 222 assert(pevt->portev_source == PORT_SOURCE_FD); 223 assert(pevt->portev_user == NULL); 224 } 225 226 #else 227 #define check_evportop(epop) 228 #define check_event(pevt) 229 #endif /* CHECK_INVARIANTS */ 230 231 /* 232 * Doubles the size of the allocated file descriptor array. 233 */ 234 static int 235 grow(struct evport_data *epdp, int factor) 236 { 237 struct fd_info *tmp; 238 int oldsize = epdp->ed_nevents; 239 int newsize = factor * oldsize; 240 assert(factor > 1); 241 242 check_evportop(epdp); 243 244 tmp = realloc(epdp->ed_fds, sizeof(struct fd_info) * newsize); 245 if (NULL == tmp) 246 return -1; 247 epdp->ed_fds = tmp; 248 memset((char*) (epdp->ed_fds + oldsize), 0, 249 (newsize - oldsize)*sizeof(struct fd_info)); 250 epdp->ed_nevents = newsize; 251 252 check_evportop(epdp); 253 254 return 0; 255 } 256 257 258 /* 259 * (Re)associates the given file descriptor with the event port. The OS events 260 * are specified (implicitly) from the fd_info struct. 261 */ 262 static int 263 reassociate(struct evport_data *epdp, struct fd_info *fdip, int fd) 264 { 265 int sysevents = FDI_TO_SYSEVENTS(fdip); 266 267 if (sysevents != 0) { 268 if (port_associate(epdp->ed_port, PORT_SOURCE_FD, 269 fd, sysevents, NULL) == -1) { 270 event_warn("port_associate"); 271 return (-1); 272 } 273 } 274 275 check_evportop(epdp); 276 277 return (0); 278 } 279 280 /* 281 * Main event loop - polls port_getn for some number of events, and processes 282 * them. 283 */ 284 285 static int 286 evport_dispatch(struct event_base *base, void *arg, struct timeval *tv) 287 { 288 int i, res; 289 struct evport_data *epdp = arg; 290 port_event_t pevtlist[EVENTS_PER_GETN]; 291 292 /* 293 * port_getn will block until it has at least nevents events. It will 294 * also return how many it's given us (which may be more than we asked 295 * for, as long as it's less than our maximum (EVENTS_PER_GETN)) in 296 * nevents. 297 */ 298 int nevents = 1; 299 300 /* 301 * We have to convert a struct timeval to a struct timespec 302 * (only difference is nanoseconds vs. microseconds). If no time-based 303 * events are active, we should wait for I/O (and tv == NULL). 304 */ 305 struct timespec ts; 306 struct timespec *ts_p = NULL; 307 if (tv != NULL) { 308 ts.tv_sec = tv->tv_sec; 309 ts.tv_nsec = tv->tv_usec * 1000; 310 ts_p = &ts; 311 } 312 313 /* 314 * Before doing anything else, we need to reassociate the events we hit 315 * last time which need reassociation. See comment at the end of the 316 * loop below. 317 */ 318 for (i = 0; i < EVENTS_PER_GETN; ++i) { 319 struct fd_info *fdi = NULL; 320 if (epdp->ed_pending[i] != -1) { 321 fdi = &(epdp->ed_fds[epdp->ed_pending[i]]); 322 } 323 324 if (fdi != NULL && FDI_HAS_EVENTS(fdi)) { 325 int fd = FDI_HAS_READ(fdi) ? fdi->fdi_revt->ev_fd : 326 fdi->fdi_wevt->ev_fd; 327 reassociate(epdp, fdi, fd); 328 epdp->ed_pending[i] = -1; 329 } 330 } 331 332 if ((res = port_getn(epdp->ed_port, pevtlist, EVENTS_PER_GETN, 333 (unsigned int *) &nevents, ts_p)) == -1) { 334 if (errno == EINTR || errno == EAGAIN) { 335 evsignal_process(base); 336 return (0); 337 } else if (errno == ETIME) { 338 if (nevents == 0) 339 return (0); 340 } else { 341 event_warn("port_getn"); 342 return (-1); 343 } 344 } else if (base->sig.evsignal_caught) { 345 evsignal_process(base); 346 } 347 348 event_debug(("%s: port_getn reports %d events", __func__, nevents)); 349 350 for (i = 0; i < nevents; ++i) { 351 struct event *ev; 352 struct fd_info *fdi; 353 port_event_t *pevt = &pevtlist[i]; 354 int fd = (int) pevt->portev_object; 355 356 check_evportop(epdp); 357 check_event(pevt); 358 epdp->ed_pending[i] = fd; 359 360 /* 361 * Figure out what kind of event it was 362 * (because we have to pass this to the callback) 363 */ 364 res = 0; 365 if (pevt->portev_events & POLLIN) 366 res |= EV_READ; 367 if (pevt->portev_events & POLLOUT) 368 res |= EV_WRITE; 369 370 assert(epdp->ed_nevents > fd); 371 fdi = &(epdp->ed_fds[fd]); 372 373 /* 374 * We now check for each of the possible events (READ 375 * or WRITE). Then, we activate the event (which will 376 * cause its callback to be executed). 377 */ 378 379 if ((res & EV_READ) && ((ev = fdi->fdi_revt) != NULL)) { 380 event_active(ev, res, 1); 381 } 382 383 if ((res & EV_WRITE) && ((ev = fdi->fdi_wevt) != NULL)) { 384 event_active(ev, res, 1); 385 } 386 } /* end of all events gotten */ 387 388 check_evportop(epdp); 389 390 return (0); 391 } 392 393 394 /* 395 * Adds the given event (so that you will be notified when it happens via 396 * the callback function). 397 */ 398 399 static int 400 evport_add(void *arg, struct event *ev) 401 { 402 struct evport_data *evpd = arg; 403 struct fd_info *fdi; 404 int factor; 405 406 check_evportop(evpd); 407 408 /* 409 * Delegate, if it's not ours to handle. 410 */ 411 if (ev->ev_events & EV_SIGNAL) 412 return (evsignal_add(ev)); 413 414 /* 415 * If necessary, grow the file descriptor info table 416 */ 417 418 factor = 1; 419 while (ev->ev_fd >= factor * evpd->ed_nevents) 420 factor *= 2; 421 422 if (factor > 1) { 423 if (-1 == grow(evpd, factor)) { 424 return (-1); 425 } 426 } 427 428 fdi = &evpd->ed_fds[ev->ev_fd]; 429 if (ev->ev_events & EV_READ) 430 fdi->fdi_revt = ev; 431 if (ev->ev_events & EV_WRITE) 432 fdi->fdi_wevt = ev; 433 434 return reassociate(evpd, fdi, ev->ev_fd); 435 } 436 437 /* 438 * Removes the given event from the list of events to wait for. 439 */ 440 441 static int 442 evport_del(void *arg, struct event *ev) 443 { 444 struct evport_data *evpd = arg; 445 struct fd_info *fdi; 446 int i; 447 int associated = 1; 448 449 check_evportop(evpd); 450 451 /* 452 * Delegate, if it's not ours to handle 453 */ 454 if (ev->ev_events & EV_SIGNAL) { 455 return (evsignal_del(ev)); 456 } 457 458 if (evpd->ed_nevents < ev->ev_fd) { 459 return (-1); 460 } 461 462 for (i = 0; i < EVENTS_PER_GETN; ++i) { 463 if (evpd->ed_pending[i] == ev->ev_fd) { 464 associated = 0; 465 break; 466 } 467 } 468 469 fdi = &evpd->ed_fds[ev->ev_fd]; 470 if (ev->ev_events & EV_READ) 471 fdi->fdi_revt = NULL; 472 if (ev->ev_events & EV_WRITE) 473 fdi->fdi_wevt = NULL; 474 475 if (associated) { 476 if (!FDI_HAS_EVENTS(fdi) && 477 port_dissociate(evpd->ed_port, PORT_SOURCE_FD, 478 ev->ev_fd) == -1) { 479 /* 480 * Ignre EBADFD error the fd could have been closed 481 * before event_del() was called. 482 */ 483 if (errno != EBADFD) { 484 event_warn("port_dissociate"); 485 return (-1); 486 } 487 } else { 488 if (FDI_HAS_EVENTS(fdi)) { 489 return (reassociate(evpd, fdi, ev->ev_fd)); 490 } 491 } 492 } else { 493 if (fdi->fdi_revt == NULL && fdi->fdi_wevt == NULL) { 494 evpd->ed_pending[i] = -1; 495 } 496 } 497 return 0; 498 } 499 500 501 static void 502 evport_dealloc(struct event_base *base, void *arg) 503 { 504 struct evport_data *evpd = arg; 505 506 evsignal_dealloc(base); 507 508 close(evpd->ed_port); 509 510 if (evpd->ed_fds) 511 free(evpd->ed_fds); 512 free(evpd); 513 } 514